diff --git "a/checkpoint-51552/trainer_state.json" "b/checkpoint-51552/trainer_state.json" new file mode 100644--- /dev/null +++ "b/checkpoint-51552/trainer_state.json" @@ -0,0 +1,309340 @@ +{ + "best_metric": 0.07964583486318588, + "best_model_checkpoint": "ai-generated-essay-detection-distilbert/checkpoint-51552", + "epoch": 1.0, + "eval_steps": 1, + "global_step": 51552, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 4e-09, + "loss": 0.6852, + "step": 1 + }, + { + "epoch": 0.0, + "learning_rate": 8e-09, + "loss": 0.6837, + "step": 2 + }, + { + "epoch": 0.0, + "learning_rate": 1.1999999999999998e-08, + "loss": 0.7127, + "step": 3 + }, + { + "epoch": 0.0, + "learning_rate": 1.6e-08, + "loss": 0.6631, + "step": 4 + }, + { + "epoch": 0.0, + "learning_rate": 2e-08, + "loss": 0.6651, + "step": 5 + }, + { + "epoch": 0.0, + "learning_rate": 2.3999999999999997e-08, + "loss": 0.6342, + "step": 6 + }, + { + "epoch": 0.0, + "learning_rate": 2.8000000000000003e-08, + "loss": 0.6956, + "step": 7 + }, + { + "epoch": 0.0, + "learning_rate": 3.2e-08, + "loss": 0.6923, + "step": 8 + }, + { + "epoch": 0.0, + "learning_rate": 3.6e-08, + "loss": 0.7301, + "step": 9 + }, + { + "epoch": 0.0, + "learning_rate": 4e-08, + "loss": 0.6653, + "step": 10 + }, + { + "epoch": 0.0, + "learning_rate": 4.4e-08, + "loss": 0.698, + "step": 11 + }, + { + "epoch": 0.0, + "learning_rate": 4.799999999999999e-08, + "loss": 0.7004, + "step": 12 + }, + { + "epoch": 0.0, + "learning_rate": 5.2e-08, + "loss": 0.7007, + "step": 13 + }, + { + "epoch": 0.0, + "learning_rate": 5.6000000000000005e-08, + "loss": 0.6826, + "step": 14 + }, + { + "epoch": 0.0, + "learning_rate": 6e-08, + "loss": 0.7321, + "step": 15 + }, + { + "epoch": 0.0, + "learning_rate": 6.4e-08, + "loss": 0.733, + "step": 16 + }, + { + "epoch": 0.0, + "learning_rate": 6.8e-08, + "loss": 0.6876, + "step": 17 + }, + { + "epoch": 0.0, + "learning_rate": 7.2e-08, + "loss": 0.7111, + "step": 18 + }, + { + "epoch": 0.0, + "learning_rate": 7.599999999999999e-08, + "loss": 0.6828, + "step": 19 + }, + { + "epoch": 0.0, + "learning_rate": 8e-08, + "loss": 0.6964, + "step": 20 + }, + { + "epoch": 0.0, + "learning_rate": 8.4e-08, + "loss": 0.6948, + "step": 21 + }, + { + "epoch": 0.0, + "learning_rate": 8.8e-08, + "loss": 0.7185, + "step": 22 + }, + { + "epoch": 0.0, + "learning_rate": 9.2e-08, + "loss": 0.6787, + "step": 23 + }, + { + "epoch": 0.0, + "learning_rate": 9.599999999999999e-08, + "loss": 0.7321, + "step": 24 + }, + { + "epoch": 0.0, + "learning_rate": 1e-07, + "loss": 0.6783, + "step": 25 + }, + { + "epoch": 0.0, + "learning_rate": 1.04e-07, + "loss": 0.6877, + "step": 26 + }, + { + "epoch": 0.0, + "learning_rate": 1.08e-07, + "loss": 0.7226, + "step": 27 + }, + { + "epoch": 0.0, + "learning_rate": 1.1200000000000001e-07, + "loss": 0.7366, + "step": 28 + }, + { + "epoch": 0.0, + "learning_rate": 1.1599999999999999e-07, + "loss": 0.6531, + "step": 29 + }, + { + "epoch": 0.0, + "learning_rate": 1.2e-07, + "loss": 0.7434, + "step": 30 + }, + { + "epoch": 0.0, + "learning_rate": 1.24e-07, + "loss": 0.6896, + "step": 31 + }, + { + "epoch": 0.0, + "learning_rate": 1.28e-07, + "loss": 0.6965, + "step": 32 + }, + { + "epoch": 0.0, + "learning_rate": 1.32e-07, + "loss": 0.7109, + "step": 33 + }, + { + "epoch": 0.0, + "learning_rate": 1.36e-07, + "loss": 0.6843, + "step": 34 + }, + { + "epoch": 0.0, + "learning_rate": 1.3999999999999998e-07, + "loss": 0.6918, + "step": 35 + }, + { + "epoch": 0.0, + "learning_rate": 1.44e-07, + "loss": 0.7564, + "step": 36 + }, + { + "epoch": 0.0, + "learning_rate": 1.48e-07, + "loss": 0.6649, + "step": 37 + }, + { + "epoch": 0.0, + "learning_rate": 1.5199999999999998e-07, + "loss": 0.7083, + "step": 38 + }, + { + "epoch": 0.0, + "learning_rate": 1.56e-07, + "loss": 0.7115, + "step": 39 + }, + { + "epoch": 0.0, + "learning_rate": 1.6e-07, + "loss": 0.7091, + "step": 40 + }, + { + "epoch": 0.0, + "learning_rate": 1.6399999999999999e-07, + "loss": 0.6793, + "step": 41 + }, + { + "epoch": 0.0, + "learning_rate": 1.68e-07, + "loss": 0.7116, + "step": 42 + }, + { + "epoch": 0.0, + "learning_rate": 1.7199999999999998e-07, + "loss": 0.6707, + "step": 43 + }, + { + "epoch": 0.0, + "learning_rate": 1.76e-07, + "loss": 0.6488, + "step": 44 + }, + { + "epoch": 0.0, + "learning_rate": 1.8e-07, + "loss": 0.7046, + "step": 45 + }, + { + "epoch": 0.0, + "learning_rate": 1.84e-07, + "loss": 0.7179, + "step": 46 + }, + { + "epoch": 0.0, + "learning_rate": 1.88e-07, + "loss": 0.6768, + "step": 47 + }, + { + "epoch": 0.0, + "learning_rate": 1.9199999999999997e-07, + "loss": 0.7096, + "step": 48 + }, + { + "epoch": 0.0, + "learning_rate": 1.9599999999999998e-07, + "loss": 0.6562, + "step": 49 + }, + { + "epoch": 0.0, + "learning_rate": 2e-07, + "loss": 0.739, + "step": 50 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999611665566384e-07, + "loss": 0.6793, + "step": 51 + }, + { + "epoch": 0.0, + "learning_rate": 1.999922333113277e-07, + "loss": 0.7034, + "step": 52 + }, + { + "epoch": 0.0, + "learning_rate": 1.9998834996699155e-07, + "loss": 0.6697, + "step": 53 + }, + { + "epoch": 0.0, + "learning_rate": 1.9998446662265542e-07, + "loss": 0.6863, + "step": 54 + }, + { + "epoch": 0.0, + "learning_rate": 1.9998058327831927e-07, + "loss": 0.7083, + "step": 55 + }, + { + "epoch": 0.0, + "learning_rate": 1.9997669993398314e-07, + "loss": 0.6704, + "step": 56 + }, + { + "epoch": 0.0, + "learning_rate": 1.9997281658964699e-07, + "loss": 0.6917, + "step": 57 + }, + { + "epoch": 0.0, + "learning_rate": 1.9996893324531086e-07, + "loss": 0.6942, + "step": 58 + }, + { + "epoch": 0.0, + "learning_rate": 1.999650499009747e-07, + "loss": 0.6823, + "step": 59 + }, + { + "epoch": 0.0, + "learning_rate": 1.9996116655663857e-07, + "loss": 0.6454, + "step": 60 + }, + { + "epoch": 0.0, + "learning_rate": 1.9995728321230242e-07, + "loss": 0.7098, + "step": 61 + }, + { + "epoch": 0.0, + "learning_rate": 1.999533998679663e-07, + "loss": 0.6726, + "step": 62 + }, + { + "epoch": 0.0, + "learning_rate": 1.9994951652363013e-07, + "loss": 0.704, + "step": 63 + }, + { + "epoch": 0.0, + "learning_rate": 1.99945633179294e-07, + "loss": 0.7149, + "step": 64 + }, + { + "epoch": 0.0, + "learning_rate": 1.9994174983495785e-07, + "loss": 0.6567, + "step": 65 + }, + { + "epoch": 0.0, + "learning_rate": 1.9993786649062172e-07, + "loss": 0.7054, + "step": 66 + }, + { + "epoch": 0.0, + "learning_rate": 1.9993398314628557e-07, + "loss": 0.683, + "step": 67 + }, + { + "epoch": 0.0, + "learning_rate": 1.9993009980194944e-07, + "loss": 0.6622, + "step": 68 + }, + { + "epoch": 0.0, + "learning_rate": 1.9992621645761328e-07, + "loss": 0.7106, + "step": 69 + }, + { + "epoch": 0.0, + "learning_rate": 1.9992233311327716e-07, + "loss": 0.7072, + "step": 70 + }, + { + "epoch": 0.0, + "learning_rate": 1.99918449768941e-07, + "loss": 0.7089, + "step": 71 + }, + { + "epoch": 0.0, + "learning_rate": 1.9991456642460487e-07, + "loss": 0.6781, + "step": 72 + }, + { + "epoch": 0.0, + "learning_rate": 1.9991068308026872e-07, + "loss": 0.7118, + "step": 73 + }, + { + "epoch": 0.0, + "learning_rate": 1.999067997359326e-07, + "loss": 0.6799, + "step": 74 + }, + { + "epoch": 0.0, + "learning_rate": 1.9990291639159643e-07, + "loss": 0.6756, + "step": 75 + }, + { + "epoch": 0.0, + "learning_rate": 1.998990330472603e-07, + "loss": 0.6864, + "step": 76 + }, + { + "epoch": 0.0, + "learning_rate": 1.9989514970292415e-07, + "loss": 0.7018, + "step": 77 + }, + { + "epoch": 0.0, + "learning_rate": 1.9989126635858802e-07, + "loss": 0.7007, + "step": 78 + }, + { + "epoch": 0.0, + "learning_rate": 1.9988738301425187e-07, + "loss": 0.6794, + "step": 79 + }, + { + "epoch": 0.0, + "learning_rate": 1.998834996699157e-07, + "loss": 0.6965, + "step": 80 + }, + { + "epoch": 0.0, + "learning_rate": 1.9987961632557956e-07, + "loss": 0.6964, + "step": 81 + }, + { + "epoch": 0.0, + "learning_rate": 1.9987573298124343e-07, + "loss": 0.6991, + "step": 82 + }, + { + "epoch": 0.0, + "learning_rate": 1.9987184963690727e-07, + "loss": 0.6695, + "step": 83 + }, + { + "epoch": 0.0, + "learning_rate": 1.9986796629257114e-07, + "loss": 0.6967, + "step": 84 + }, + { + "epoch": 0.0, + "learning_rate": 1.99864082948235e-07, + "loss": 0.6752, + "step": 85 + }, + { + "epoch": 0.0, + "learning_rate": 1.9986019960389886e-07, + "loss": 0.6634, + "step": 86 + }, + { + "epoch": 0.0, + "learning_rate": 1.998563162595627e-07, + "loss": 0.7069, + "step": 87 + }, + { + "epoch": 0.0, + "learning_rate": 1.9985243291522658e-07, + "loss": 0.6953, + "step": 88 + }, + { + "epoch": 0.0, + "learning_rate": 1.9984854957089042e-07, + "loss": 0.7234, + "step": 89 + }, + { + "epoch": 0.0, + "learning_rate": 1.998446662265543e-07, + "loss": 0.7092, + "step": 90 + }, + { + "epoch": 0.0, + "learning_rate": 1.9984078288221814e-07, + "loss": 0.7124, + "step": 91 + }, + { + "epoch": 0.0, + "learning_rate": 1.99836899537882e-07, + "loss": 0.7118, + "step": 92 + }, + { + "epoch": 0.0, + "learning_rate": 1.9983301619354586e-07, + "loss": 0.7095, + "step": 93 + }, + { + "epoch": 0.0, + "learning_rate": 1.9982913284920973e-07, + "loss": 0.7064, + "step": 94 + }, + { + "epoch": 0.0, + "learning_rate": 1.9982524950487357e-07, + "loss": 0.7093, + "step": 95 + }, + { + "epoch": 0.0, + "learning_rate": 1.9982136616053744e-07, + "loss": 0.6593, + "step": 96 + }, + { + "epoch": 0.0, + "learning_rate": 1.998174828162013e-07, + "loss": 0.6608, + "step": 97 + }, + { + "epoch": 0.0, + "learning_rate": 1.9981359947186516e-07, + "loss": 0.739, + "step": 98 + }, + { + "epoch": 0.0, + "learning_rate": 1.99809716127529e-07, + "loss": 0.6991, + "step": 99 + }, + { + "epoch": 0.0, + "learning_rate": 1.9980583278319288e-07, + "loss": 0.7095, + "step": 100 + }, + { + "epoch": 0.0, + "learning_rate": 1.9980194943885672e-07, + "loss": 0.7309, + "step": 101 + }, + { + "epoch": 0.0, + "learning_rate": 1.997980660945206e-07, + "loss": 0.7522, + "step": 102 + }, + { + "epoch": 0.0, + "learning_rate": 1.9979418275018444e-07, + "loss": 0.7019, + "step": 103 + }, + { + "epoch": 0.0, + "learning_rate": 1.997902994058483e-07, + "loss": 0.7333, + "step": 104 + }, + { + "epoch": 0.0, + "learning_rate": 1.9978641606151215e-07, + "loss": 0.6566, + "step": 105 + }, + { + "epoch": 0.0, + "learning_rate": 1.9978253271717603e-07, + "loss": 0.6811, + "step": 106 + }, + { + "epoch": 0.0, + "learning_rate": 1.9977864937283987e-07, + "loss": 0.693, + "step": 107 + }, + { + "epoch": 0.0, + "learning_rate": 1.9977476602850374e-07, + "loss": 0.6807, + "step": 108 + }, + { + "epoch": 0.0, + "learning_rate": 1.997708826841676e-07, + "loss": 0.6804, + "step": 109 + }, + { + "epoch": 0.0, + "learning_rate": 1.9976699933983146e-07, + "loss": 0.6959, + "step": 110 + }, + { + "epoch": 0.0, + "learning_rate": 1.997631159954953e-07, + "loss": 0.7436, + "step": 111 + }, + { + "epoch": 0.0, + "learning_rate": 1.9975923265115918e-07, + "loss": 0.6751, + "step": 112 + }, + { + "epoch": 0.0, + "learning_rate": 1.9975534930682302e-07, + "loss": 0.675, + "step": 113 + }, + { + "epoch": 0.0, + "learning_rate": 1.997514659624869e-07, + "loss": 0.7194, + "step": 114 + }, + { + "epoch": 0.0, + "learning_rate": 1.9974758261815074e-07, + "loss": 0.6736, + "step": 115 + }, + { + "epoch": 0.0, + "learning_rate": 1.997436992738146e-07, + "loss": 0.7027, + "step": 116 + }, + { + "epoch": 0.0, + "learning_rate": 1.9973981592947845e-07, + "loss": 0.682, + "step": 117 + }, + { + "epoch": 0.0, + "learning_rate": 1.9973593258514233e-07, + "loss": 0.6794, + "step": 118 + }, + { + "epoch": 0.0, + "learning_rate": 1.9973204924080617e-07, + "loss": 0.7128, + "step": 119 + }, + { + "epoch": 0.0, + "learning_rate": 1.9972816589647004e-07, + "loss": 0.7336, + "step": 120 + }, + { + "epoch": 0.0, + "learning_rate": 1.9972428255213389e-07, + "loss": 0.7125, + "step": 121 + }, + { + "epoch": 0.0, + "learning_rate": 1.9972039920779776e-07, + "loss": 0.6851, + "step": 122 + }, + { + "epoch": 0.0, + "learning_rate": 1.997165158634616e-07, + "loss": 0.7091, + "step": 123 + }, + { + "epoch": 0.0, + "learning_rate": 1.9971263251912547e-07, + "loss": 0.7094, + "step": 124 + }, + { + "epoch": 0.0, + "learning_rate": 1.9970874917478932e-07, + "loss": 0.6762, + "step": 125 + }, + { + "epoch": 0.0, + "learning_rate": 1.997048658304532e-07, + "loss": 0.7009, + "step": 126 + }, + { + "epoch": 0.0, + "learning_rate": 1.9970098248611704e-07, + "loss": 0.7062, + "step": 127 + }, + { + "epoch": 0.0, + "learning_rate": 1.996970991417809e-07, + "loss": 0.6912, + "step": 128 + }, + { + "epoch": 0.0, + "learning_rate": 1.9969321579744475e-07, + "loss": 0.6762, + "step": 129 + }, + { + "epoch": 0.0, + "learning_rate": 1.9968933245310862e-07, + "loss": 0.6589, + "step": 130 + }, + { + "epoch": 0.0, + "learning_rate": 1.9968544910877247e-07, + "loss": 0.7004, + "step": 131 + }, + { + "epoch": 0.0, + "learning_rate": 1.9968156576443634e-07, + "loss": 0.6398, + "step": 132 + }, + { + "epoch": 0.0, + "learning_rate": 1.9967768242010019e-07, + "loss": 0.6841, + "step": 133 + }, + { + "epoch": 0.0, + "learning_rate": 1.9967379907576406e-07, + "loss": 0.6676, + "step": 134 + }, + { + "epoch": 0.0, + "learning_rate": 1.996699157314279e-07, + "loss": 0.6738, + "step": 135 + }, + { + "epoch": 0.0, + "learning_rate": 1.9966603238709177e-07, + "loss": 0.6615, + "step": 136 + }, + { + "epoch": 0.0, + "learning_rate": 1.996621490427556e-07, + "loss": 0.7092, + "step": 137 + }, + { + "epoch": 0.0, + "learning_rate": 1.9965826569841946e-07, + "loss": 0.6873, + "step": 138 + }, + { + "epoch": 0.0, + "learning_rate": 1.996543823540833e-07, + "loss": 0.7105, + "step": 139 + }, + { + "epoch": 0.0, + "learning_rate": 1.9965049900974718e-07, + "loss": 0.6527, + "step": 140 + }, + { + "epoch": 0.0, + "learning_rate": 1.9964661566541103e-07, + "loss": 0.7059, + "step": 141 + }, + { + "epoch": 0.0, + "learning_rate": 1.996427323210749e-07, + "loss": 0.6763, + "step": 142 + }, + { + "epoch": 0.0, + "learning_rate": 1.9963884897673874e-07, + "loss": 0.708, + "step": 143 + }, + { + "epoch": 0.0, + "learning_rate": 1.996349656324026e-07, + "loss": 0.6434, + "step": 144 + }, + { + "epoch": 0.0, + "learning_rate": 1.9963108228806646e-07, + "loss": 0.6414, + "step": 145 + }, + { + "epoch": 0.0, + "learning_rate": 1.9962719894373033e-07, + "loss": 0.7145, + "step": 146 + }, + { + "epoch": 0.0, + "learning_rate": 1.9962331559939417e-07, + "loss": 0.7042, + "step": 147 + }, + { + "epoch": 0.0, + "learning_rate": 1.9961943225505805e-07, + "loss": 0.6945, + "step": 148 + }, + { + "epoch": 0.0, + "learning_rate": 1.996155489107219e-07, + "loss": 0.7062, + "step": 149 + }, + { + "epoch": 0.0, + "learning_rate": 1.9961166556638576e-07, + "loss": 0.7245, + "step": 150 + }, + { + "epoch": 0.0, + "learning_rate": 1.996077822220496e-07, + "loss": 0.7067, + "step": 151 + }, + { + "epoch": 0.0, + "learning_rate": 1.9960389887771348e-07, + "loss": 0.6664, + "step": 152 + }, + { + "epoch": 0.0, + "learning_rate": 1.9960001553337732e-07, + "loss": 0.7122, + "step": 153 + }, + { + "epoch": 0.0, + "learning_rate": 1.995961321890412e-07, + "loss": 0.7133, + "step": 154 + }, + { + "epoch": 0.0, + "learning_rate": 1.9959224884470504e-07, + "loss": 0.6898, + "step": 155 + }, + { + "epoch": 0.0, + "learning_rate": 1.995883655003689e-07, + "loss": 0.6929, + "step": 156 + }, + { + "epoch": 0.0, + "learning_rate": 1.9958448215603276e-07, + "loss": 0.6905, + "step": 157 + }, + { + "epoch": 0.0, + "learning_rate": 1.9958059881169663e-07, + "loss": 0.6711, + "step": 158 + }, + { + "epoch": 0.0, + "learning_rate": 1.9957671546736047e-07, + "loss": 0.7527, + "step": 159 + }, + { + "epoch": 0.0, + "learning_rate": 1.9957283212302434e-07, + "loss": 0.6915, + "step": 160 + }, + { + "epoch": 0.0, + "learning_rate": 1.995689487786882e-07, + "loss": 0.6825, + "step": 161 + }, + { + "epoch": 0.0, + "learning_rate": 1.9956506543435206e-07, + "loss": 0.6854, + "step": 162 + }, + { + "epoch": 0.0, + "learning_rate": 1.995611820900159e-07, + "loss": 0.7082, + "step": 163 + }, + { + "epoch": 0.0, + "learning_rate": 1.9955729874567978e-07, + "loss": 0.7232, + "step": 164 + }, + { + "epoch": 0.0, + "learning_rate": 1.9955341540134362e-07, + "loss": 0.7193, + "step": 165 + }, + { + "epoch": 0.0, + "learning_rate": 1.995495320570075e-07, + "loss": 0.6968, + "step": 166 + }, + { + "epoch": 0.0, + "learning_rate": 1.9954564871267134e-07, + "loss": 0.6939, + "step": 167 + }, + { + "epoch": 0.0, + "learning_rate": 1.995417653683352e-07, + "loss": 0.6854, + "step": 168 + }, + { + "epoch": 0.0, + "learning_rate": 1.9953788202399906e-07, + "loss": 0.6959, + "step": 169 + }, + { + "epoch": 0.0, + "learning_rate": 1.9953399867966293e-07, + "loss": 0.6771, + "step": 170 + }, + { + "epoch": 0.0, + "learning_rate": 1.9953011533532677e-07, + "loss": 0.6557, + "step": 171 + }, + { + "epoch": 0.0, + "learning_rate": 1.9952623199099064e-07, + "loss": 0.676, + "step": 172 + }, + { + "epoch": 0.0, + "learning_rate": 1.995223486466545e-07, + "loss": 0.6864, + "step": 173 + }, + { + "epoch": 0.0, + "learning_rate": 1.9951846530231836e-07, + "loss": 0.7083, + "step": 174 + }, + { + "epoch": 0.0, + "learning_rate": 1.995145819579822e-07, + "loss": 0.6518, + "step": 175 + }, + { + "epoch": 0.0, + "learning_rate": 1.9951069861364608e-07, + "loss": 0.6958, + "step": 176 + }, + { + "epoch": 0.0, + "learning_rate": 1.9950681526930992e-07, + "loss": 0.6922, + "step": 177 + }, + { + "epoch": 0.0, + "learning_rate": 1.995029319249738e-07, + "loss": 0.6448, + "step": 178 + }, + { + "epoch": 0.0, + "learning_rate": 1.9949904858063764e-07, + "loss": 0.7177, + "step": 179 + }, + { + "epoch": 0.0, + "learning_rate": 1.994951652363015e-07, + "loss": 0.7101, + "step": 180 + }, + { + "epoch": 0.0, + "learning_rate": 1.9949128189196535e-07, + "loss": 0.6845, + "step": 181 + }, + { + "epoch": 0.0, + "learning_rate": 1.9948739854762923e-07, + "loss": 0.6757, + "step": 182 + }, + { + "epoch": 0.0, + "learning_rate": 1.9948351520329307e-07, + "loss": 0.695, + "step": 183 + }, + { + "epoch": 0.0, + "learning_rate": 1.9947963185895694e-07, + "loss": 0.6643, + "step": 184 + }, + { + "epoch": 0.0, + "learning_rate": 1.994757485146208e-07, + "loss": 0.6981, + "step": 185 + }, + { + "epoch": 0.0, + "learning_rate": 1.9947186517028466e-07, + "loss": 0.7226, + "step": 186 + }, + { + "epoch": 0.0, + "learning_rate": 1.994679818259485e-07, + "loss": 0.6775, + "step": 187 + }, + { + "epoch": 0.0, + "learning_rate": 1.9946409848161238e-07, + "loss": 0.6818, + "step": 188 + }, + { + "epoch": 0.0, + "learning_rate": 1.9946021513727622e-07, + "loss": 0.6887, + "step": 189 + }, + { + "epoch": 0.0, + "learning_rate": 1.994563317929401e-07, + "loss": 0.6317, + "step": 190 + }, + { + "epoch": 0.0, + "learning_rate": 1.9945244844860394e-07, + "loss": 0.6409, + "step": 191 + }, + { + "epoch": 0.0, + "learning_rate": 1.994485651042678e-07, + "loss": 0.7115, + "step": 192 + }, + { + "epoch": 0.0, + "learning_rate": 1.9944468175993165e-07, + "loss": 0.682, + "step": 193 + }, + { + "epoch": 0.0, + "learning_rate": 1.9944079841559553e-07, + "loss": 0.6878, + "step": 194 + }, + { + "epoch": 0.0, + "learning_rate": 1.9943691507125934e-07, + "loss": 0.7184, + "step": 195 + }, + { + "epoch": 0.0, + "learning_rate": 1.9943303172692322e-07, + "loss": 0.6619, + "step": 196 + }, + { + "epoch": 0.0, + "learning_rate": 1.9942914838258706e-07, + "loss": 0.6289, + "step": 197 + }, + { + "epoch": 0.0, + "learning_rate": 1.9942526503825093e-07, + "loss": 0.6642, + "step": 198 + }, + { + "epoch": 0.0, + "learning_rate": 1.9942138169391478e-07, + "loss": 0.6913, + "step": 199 + }, + { + "epoch": 0.0, + "learning_rate": 1.9941749834957865e-07, + "loss": 0.6848, + "step": 200 + }, + { + "epoch": 0.0, + "learning_rate": 1.994136150052425e-07, + "loss": 0.7376, + "step": 201 + }, + { + "epoch": 0.0, + "learning_rate": 1.9940973166090636e-07, + "loss": 0.7036, + "step": 202 + }, + { + "epoch": 0.0, + "learning_rate": 1.994058483165702e-07, + "loss": 0.6882, + "step": 203 + }, + { + "epoch": 0.0, + "learning_rate": 1.9940196497223408e-07, + "loss": 0.686, + "step": 204 + }, + { + "epoch": 0.0, + "learning_rate": 1.9939808162789793e-07, + "loss": 0.7051, + "step": 205 + }, + { + "epoch": 0.0, + "learning_rate": 1.993941982835618e-07, + "loss": 0.6514, + "step": 206 + }, + { + "epoch": 0.0, + "learning_rate": 1.9939031493922564e-07, + "loss": 0.712, + "step": 207 + }, + { + "epoch": 0.0, + "learning_rate": 1.9938643159488951e-07, + "loss": 0.6678, + "step": 208 + }, + { + "epoch": 0.0, + "learning_rate": 1.9938254825055336e-07, + "loss": 0.6996, + "step": 209 + }, + { + "epoch": 0.0, + "learning_rate": 1.9937866490621723e-07, + "loss": 0.6678, + "step": 210 + }, + { + "epoch": 0.0, + "learning_rate": 1.9937478156188108e-07, + "loss": 0.6977, + "step": 211 + }, + { + "epoch": 0.0, + "learning_rate": 1.9937089821754495e-07, + "loss": 0.7309, + "step": 212 + }, + { + "epoch": 0.0, + "learning_rate": 1.993670148732088e-07, + "loss": 0.7209, + "step": 213 + }, + { + "epoch": 0.0, + "learning_rate": 1.9936313152887266e-07, + "loss": 0.6938, + "step": 214 + }, + { + "epoch": 0.0, + "learning_rate": 1.993592481845365e-07, + "loss": 0.6762, + "step": 215 + }, + { + "epoch": 0.0, + "learning_rate": 1.9935536484020038e-07, + "loss": 0.6601, + "step": 216 + }, + { + "epoch": 0.0, + "learning_rate": 1.9935148149586423e-07, + "loss": 0.686, + "step": 217 + }, + { + "epoch": 0.0, + "learning_rate": 1.993475981515281e-07, + "loss": 0.6836, + "step": 218 + }, + { + "epoch": 0.0, + "learning_rate": 1.9934371480719194e-07, + "loss": 0.6699, + "step": 219 + }, + { + "epoch": 0.0, + "learning_rate": 1.993398314628558e-07, + "loss": 0.6932, + "step": 220 + }, + { + "epoch": 0.0, + "learning_rate": 1.9933594811851966e-07, + "loss": 0.6842, + "step": 221 + }, + { + "epoch": 0.0, + "learning_rate": 1.9933206477418353e-07, + "loss": 0.6932, + "step": 222 + }, + { + "epoch": 0.0, + "learning_rate": 1.9932818142984737e-07, + "loss": 0.7408, + "step": 223 + }, + { + "epoch": 0.0, + "learning_rate": 1.9932429808551125e-07, + "loss": 0.6942, + "step": 224 + }, + { + "epoch": 0.0, + "learning_rate": 1.993204147411751e-07, + "loss": 0.6876, + "step": 225 + }, + { + "epoch": 0.0, + "learning_rate": 1.9931653139683896e-07, + "loss": 0.6725, + "step": 226 + }, + { + "epoch": 0.0, + "learning_rate": 1.993126480525028e-07, + "loss": 0.7284, + "step": 227 + }, + { + "epoch": 0.0, + "learning_rate": 1.9930876470816665e-07, + "loss": 0.727, + "step": 228 + }, + { + "epoch": 0.0, + "learning_rate": 1.9930488136383052e-07, + "loss": 0.7043, + "step": 229 + }, + { + "epoch": 0.0, + "learning_rate": 1.9930099801949437e-07, + "loss": 0.6693, + "step": 230 + }, + { + "epoch": 0.0, + "learning_rate": 1.9929711467515824e-07, + "loss": 0.7216, + "step": 231 + }, + { + "epoch": 0.0, + "learning_rate": 1.9929323133082209e-07, + "loss": 0.7015, + "step": 232 + }, + { + "epoch": 0.0, + "learning_rate": 1.9928934798648596e-07, + "loss": 0.7108, + "step": 233 + }, + { + "epoch": 0.0, + "learning_rate": 1.992854646421498e-07, + "loss": 0.6939, + "step": 234 + }, + { + "epoch": 0.0, + "learning_rate": 1.9928158129781367e-07, + "loss": 0.658, + "step": 235 + }, + { + "epoch": 0.0, + "learning_rate": 1.9927769795347752e-07, + "loss": 0.706, + "step": 236 + }, + { + "epoch": 0.0, + "learning_rate": 1.992738146091414e-07, + "loss": 0.6943, + "step": 237 + }, + { + "epoch": 0.0, + "learning_rate": 1.9926993126480524e-07, + "loss": 0.6775, + "step": 238 + }, + { + "epoch": 0.0, + "learning_rate": 1.992660479204691e-07, + "loss": 0.6653, + "step": 239 + }, + { + "epoch": 0.0, + "learning_rate": 1.9926216457613295e-07, + "loss": 0.692, + "step": 240 + }, + { + "epoch": 0.0, + "learning_rate": 1.9925828123179682e-07, + "loss": 0.7289, + "step": 241 + }, + { + "epoch": 0.0, + "learning_rate": 1.9925439788746067e-07, + "loss": 0.67, + "step": 242 + }, + { + "epoch": 0.0, + "learning_rate": 1.9925051454312454e-07, + "loss": 0.6877, + "step": 243 + }, + { + "epoch": 0.0, + "learning_rate": 1.9924663119878838e-07, + "loss": 0.6714, + "step": 244 + }, + { + "epoch": 0.0, + "learning_rate": 1.9924274785445226e-07, + "loss": 0.7108, + "step": 245 + }, + { + "epoch": 0.0, + "learning_rate": 1.992388645101161e-07, + "loss": 0.6822, + "step": 246 + }, + { + "epoch": 0.0, + "learning_rate": 1.9923498116577997e-07, + "loss": 0.6994, + "step": 247 + }, + { + "epoch": 0.0, + "learning_rate": 1.9923109782144382e-07, + "loss": 0.6621, + "step": 248 + }, + { + "epoch": 0.0, + "learning_rate": 1.992272144771077e-07, + "loss": 0.7121, + "step": 249 + }, + { + "epoch": 0.0, + "learning_rate": 1.9922333113277153e-07, + "loss": 0.6367, + "step": 250 + }, + { + "epoch": 0.0, + "learning_rate": 1.992194477884354e-07, + "loss": 0.6793, + "step": 251 + }, + { + "epoch": 0.0, + "learning_rate": 1.9921556444409925e-07, + "loss": 0.6622, + "step": 252 + }, + { + "epoch": 0.0, + "learning_rate": 1.992116810997631e-07, + "loss": 0.7114, + "step": 253 + }, + { + "epoch": 0.0, + "learning_rate": 1.9920779775542697e-07, + "loss": 0.7091, + "step": 254 + }, + { + "epoch": 0.0, + "learning_rate": 1.992039144110908e-07, + "loss": 0.6959, + "step": 255 + }, + { + "epoch": 0.0, + "learning_rate": 1.9920003106675468e-07, + "loss": 0.7315, + "step": 256 + }, + { + "epoch": 0.0, + "learning_rate": 1.9919614772241853e-07, + "loss": 0.6697, + "step": 257 + }, + { + "epoch": 0.01, + "learning_rate": 1.9919226437808237e-07, + "loss": 0.7179, + "step": 258 + }, + { + "epoch": 0.01, + "learning_rate": 1.9918838103374624e-07, + "loss": 0.6931, + "step": 259 + }, + { + "epoch": 0.01, + "learning_rate": 1.991844976894101e-07, + "loss": 0.6796, + "step": 260 + }, + { + "epoch": 0.01, + "learning_rate": 1.9918061434507396e-07, + "loss": 0.6925, + "step": 261 + }, + { + "epoch": 0.01, + "learning_rate": 1.991767310007378e-07, + "loss": 0.7331, + "step": 262 + }, + { + "epoch": 0.01, + "learning_rate": 1.9917284765640168e-07, + "loss": 0.6842, + "step": 263 + }, + { + "epoch": 0.01, + "learning_rate": 1.9916896431206552e-07, + "loss": 0.6821, + "step": 264 + }, + { + "epoch": 0.01, + "learning_rate": 1.991650809677294e-07, + "loss": 0.6873, + "step": 265 + }, + { + "epoch": 0.01, + "learning_rate": 1.9916119762339324e-07, + "loss": 0.6526, + "step": 266 + }, + { + "epoch": 0.01, + "learning_rate": 1.991573142790571e-07, + "loss": 0.6838, + "step": 267 + }, + { + "epoch": 0.01, + "learning_rate": 1.9915343093472096e-07, + "loss": 0.684, + "step": 268 + }, + { + "epoch": 0.01, + "learning_rate": 1.9914954759038483e-07, + "loss": 0.6976, + "step": 269 + }, + { + "epoch": 0.01, + "learning_rate": 1.9914566424604867e-07, + "loss": 0.6604, + "step": 270 + }, + { + "epoch": 0.01, + "learning_rate": 1.9914178090171254e-07, + "loss": 0.6683, + "step": 271 + }, + { + "epoch": 0.01, + "learning_rate": 1.991378975573764e-07, + "loss": 0.6755, + "step": 272 + }, + { + "epoch": 0.01, + "learning_rate": 1.9913401421304026e-07, + "loss": 0.7025, + "step": 273 + }, + { + "epoch": 0.01, + "learning_rate": 1.991301308687041e-07, + "loss": 0.6816, + "step": 274 + }, + { + "epoch": 0.01, + "learning_rate": 1.9912624752436798e-07, + "loss": 0.6488, + "step": 275 + }, + { + "epoch": 0.01, + "learning_rate": 1.9912236418003182e-07, + "loss": 0.6731, + "step": 276 + }, + { + "epoch": 0.01, + "learning_rate": 1.991184808356957e-07, + "loss": 0.6688, + "step": 277 + }, + { + "epoch": 0.01, + "learning_rate": 1.9911459749135954e-07, + "loss": 0.6776, + "step": 278 + }, + { + "epoch": 0.01, + "learning_rate": 1.991107141470234e-07, + "loss": 0.6764, + "step": 279 + }, + { + "epoch": 0.01, + "learning_rate": 1.9910683080268725e-07, + "loss": 0.6772, + "step": 280 + }, + { + "epoch": 0.01, + "learning_rate": 1.9910294745835113e-07, + "loss": 0.7063, + "step": 281 + }, + { + "epoch": 0.01, + "learning_rate": 1.9909906411401497e-07, + "loss": 0.7019, + "step": 282 + }, + { + "epoch": 0.01, + "learning_rate": 1.9909518076967884e-07, + "loss": 0.689, + "step": 283 + }, + { + "epoch": 0.01, + "learning_rate": 1.990912974253427e-07, + "loss": 0.7191, + "step": 284 + }, + { + "epoch": 0.01, + "learning_rate": 1.9908741408100656e-07, + "loss": 0.6809, + "step": 285 + }, + { + "epoch": 0.01, + "learning_rate": 1.990835307366704e-07, + "loss": 0.69, + "step": 286 + }, + { + "epoch": 0.01, + "learning_rate": 1.9907964739233428e-07, + "loss": 0.6688, + "step": 287 + }, + { + "epoch": 0.01, + "learning_rate": 1.9907576404799812e-07, + "loss": 0.7188, + "step": 288 + }, + { + "epoch": 0.01, + "learning_rate": 1.99071880703662e-07, + "loss": 0.7268, + "step": 289 + }, + { + "epoch": 0.01, + "learning_rate": 1.9906799735932584e-07, + "loss": 0.692, + "step": 290 + }, + { + "epoch": 0.01, + "learning_rate": 1.990641140149897e-07, + "loss": 0.6473, + "step": 291 + }, + { + "epoch": 0.01, + "learning_rate": 1.9906023067065355e-07, + "loss": 0.7034, + "step": 292 + }, + { + "epoch": 0.01, + "learning_rate": 1.9905634732631743e-07, + "loss": 0.7199, + "step": 293 + }, + { + "epoch": 0.01, + "learning_rate": 1.9905246398198127e-07, + "loss": 0.6769, + "step": 294 + }, + { + "epoch": 0.01, + "learning_rate": 1.9904858063764514e-07, + "loss": 0.7043, + "step": 295 + }, + { + "epoch": 0.01, + "learning_rate": 1.9904469729330899e-07, + "loss": 0.7345, + "step": 296 + }, + { + "epoch": 0.01, + "learning_rate": 1.9904081394897286e-07, + "loss": 0.6691, + "step": 297 + }, + { + "epoch": 0.01, + "learning_rate": 1.990369306046367e-07, + "loss": 0.6874, + "step": 298 + }, + { + "epoch": 0.01, + "learning_rate": 1.9903304726030057e-07, + "loss": 0.7031, + "step": 299 + }, + { + "epoch": 0.01, + "learning_rate": 1.9902916391596442e-07, + "loss": 0.6744, + "step": 300 + }, + { + "epoch": 0.01, + "learning_rate": 1.990252805716283e-07, + "loss": 0.6685, + "step": 301 + }, + { + "epoch": 0.01, + "learning_rate": 1.9902139722729214e-07, + "loss": 0.7247, + "step": 302 + }, + { + "epoch": 0.01, + "learning_rate": 1.99017513882956e-07, + "loss": 0.7111, + "step": 303 + }, + { + "epoch": 0.01, + "learning_rate": 1.9901363053861985e-07, + "loss": 0.6992, + "step": 304 + }, + { + "epoch": 0.01, + "learning_rate": 1.9900974719428372e-07, + "loss": 0.7175, + "step": 305 + }, + { + "epoch": 0.01, + "learning_rate": 1.9900586384994757e-07, + "loss": 0.6876, + "step": 306 + }, + { + "epoch": 0.01, + "learning_rate": 1.9900198050561144e-07, + "loss": 0.6823, + "step": 307 + }, + { + "epoch": 0.01, + "learning_rate": 1.9899809716127529e-07, + "loss": 0.672, + "step": 308 + }, + { + "epoch": 0.01, + "learning_rate": 1.9899421381693916e-07, + "loss": 0.6881, + "step": 309 + }, + { + "epoch": 0.01, + "learning_rate": 1.98990330472603e-07, + "loss": 0.6455, + "step": 310 + }, + { + "epoch": 0.01, + "learning_rate": 1.9898644712826685e-07, + "loss": 0.6885, + "step": 311 + }, + { + "epoch": 0.01, + "learning_rate": 1.989825637839307e-07, + "loss": 0.6476, + "step": 312 + }, + { + "epoch": 0.01, + "learning_rate": 1.9897868043959456e-07, + "loss": 0.6654, + "step": 313 + }, + { + "epoch": 0.01, + "learning_rate": 1.989747970952584e-07, + "loss": 0.6604, + "step": 314 + }, + { + "epoch": 0.01, + "learning_rate": 1.9897091375092228e-07, + "loss": 0.6976, + "step": 315 + }, + { + "epoch": 0.01, + "learning_rate": 1.9896703040658613e-07, + "loss": 0.7105, + "step": 316 + }, + { + "epoch": 0.01, + "learning_rate": 1.9896314706225e-07, + "loss": 0.7011, + "step": 317 + }, + { + "epoch": 0.01, + "learning_rate": 1.9895926371791384e-07, + "loss": 0.6945, + "step": 318 + }, + { + "epoch": 0.01, + "learning_rate": 1.989553803735777e-07, + "loss": 0.7114, + "step": 319 + }, + { + "epoch": 0.01, + "learning_rate": 1.9895149702924156e-07, + "loss": 0.7013, + "step": 320 + }, + { + "epoch": 0.01, + "learning_rate": 1.9894761368490543e-07, + "loss": 0.6888, + "step": 321 + }, + { + "epoch": 0.01, + "learning_rate": 1.9894373034056927e-07, + "loss": 0.6721, + "step": 322 + }, + { + "epoch": 0.01, + "learning_rate": 1.9893984699623315e-07, + "loss": 0.6665, + "step": 323 + }, + { + "epoch": 0.01, + "learning_rate": 1.98935963651897e-07, + "loss": 0.718, + "step": 324 + }, + { + "epoch": 0.01, + "learning_rate": 1.9893208030756086e-07, + "loss": 0.7019, + "step": 325 + }, + { + "epoch": 0.01, + "learning_rate": 1.989281969632247e-07, + "loss": 0.7457, + "step": 326 + }, + { + "epoch": 0.01, + "learning_rate": 1.9892431361888858e-07, + "loss": 0.7055, + "step": 327 + }, + { + "epoch": 0.01, + "learning_rate": 1.9892043027455242e-07, + "loss": 0.6514, + "step": 328 + }, + { + "epoch": 0.01, + "learning_rate": 1.989165469302163e-07, + "loss": 0.6575, + "step": 329 + }, + { + "epoch": 0.01, + "learning_rate": 1.9891266358588014e-07, + "loss": 0.7107, + "step": 330 + }, + { + "epoch": 0.01, + "learning_rate": 1.98908780241544e-07, + "loss": 0.7087, + "step": 331 + }, + { + "epoch": 0.01, + "learning_rate": 1.9890489689720786e-07, + "loss": 0.6725, + "step": 332 + }, + { + "epoch": 0.01, + "learning_rate": 1.9890101355287173e-07, + "loss": 0.7237, + "step": 333 + }, + { + "epoch": 0.01, + "learning_rate": 1.9889713020853557e-07, + "loss": 0.6757, + "step": 334 + }, + { + "epoch": 0.01, + "learning_rate": 1.9889324686419944e-07, + "loss": 0.691, + "step": 335 + }, + { + "epoch": 0.01, + "learning_rate": 1.988893635198633e-07, + "loss": 0.6707, + "step": 336 + }, + { + "epoch": 0.01, + "learning_rate": 1.9888548017552716e-07, + "loss": 0.6471, + "step": 337 + }, + { + "epoch": 0.01, + "learning_rate": 1.98881596831191e-07, + "loss": 0.7175, + "step": 338 + }, + { + "epoch": 0.01, + "learning_rate": 1.9887771348685488e-07, + "loss": 0.6856, + "step": 339 + }, + { + "epoch": 0.01, + "learning_rate": 1.9887383014251872e-07, + "loss": 0.7305, + "step": 340 + }, + { + "epoch": 0.01, + "learning_rate": 1.988699467981826e-07, + "loss": 0.7088, + "step": 341 + }, + { + "epoch": 0.01, + "learning_rate": 1.9886606345384644e-07, + "loss": 0.6848, + "step": 342 + }, + { + "epoch": 0.01, + "learning_rate": 1.988621801095103e-07, + "loss": 0.6596, + "step": 343 + }, + { + "epoch": 0.01, + "learning_rate": 1.9885829676517416e-07, + "loss": 0.7154, + "step": 344 + }, + { + "epoch": 0.01, + "learning_rate": 1.9885441342083803e-07, + "loss": 0.7355, + "step": 345 + }, + { + "epoch": 0.01, + "learning_rate": 1.9885053007650187e-07, + "loss": 0.7066, + "step": 346 + }, + { + "epoch": 0.01, + "learning_rate": 1.9884664673216574e-07, + "loss": 0.6556, + "step": 347 + }, + { + "epoch": 0.01, + "learning_rate": 1.988427633878296e-07, + "loss": 0.6806, + "step": 348 + }, + { + "epoch": 0.01, + "learning_rate": 1.9883888004349346e-07, + "loss": 0.6847, + "step": 349 + }, + { + "epoch": 0.01, + "learning_rate": 1.988349966991573e-07, + "loss": 0.6645, + "step": 350 + }, + { + "epoch": 0.01, + "learning_rate": 1.9883111335482118e-07, + "loss": 0.6736, + "step": 351 + }, + { + "epoch": 0.01, + "learning_rate": 1.9882723001048502e-07, + "loss": 0.6633, + "step": 352 + }, + { + "epoch": 0.01, + "learning_rate": 1.988233466661489e-07, + "loss": 0.7268, + "step": 353 + }, + { + "epoch": 0.01, + "learning_rate": 1.9881946332181274e-07, + "loss": 0.6798, + "step": 354 + }, + { + "epoch": 0.01, + "learning_rate": 1.988155799774766e-07, + "loss": 0.6698, + "step": 355 + }, + { + "epoch": 0.01, + "learning_rate": 1.9881169663314045e-07, + "loss": 0.6683, + "step": 356 + }, + { + "epoch": 0.01, + "learning_rate": 1.9880781328880433e-07, + "loss": 0.666, + "step": 357 + }, + { + "epoch": 0.01, + "learning_rate": 1.9880392994446817e-07, + "loss": 0.7177, + "step": 358 + }, + { + "epoch": 0.01, + "learning_rate": 1.9880004660013204e-07, + "loss": 0.6809, + "step": 359 + }, + { + "epoch": 0.01, + "learning_rate": 1.987961632557959e-07, + "loss": 0.6691, + "step": 360 + }, + { + "epoch": 0.01, + "learning_rate": 1.9879227991145976e-07, + "loss": 0.6887, + "step": 361 + }, + { + "epoch": 0.01, + "learning_rate": 1.987883965671236e-07, + "loss": 0.6992, + "step": 362 + }, + { + "epoch": 0.01, + "learning_rate": 1.9878451322278748e-07, + "loss": 0.6974, + "step": 363 + }, + { + "epoch": 0.01, + "learning_rate": 1.9878062987845132e-07, + "loss": 0.7599, + "step": 364 + }, + { + "epoch": 0.01, + "learning_rate": 1.987767465341152e-07, + "loss": 0.7045, + "step": 365 + }, + { + "epoch": 0.01, + "learning_rate": 1.9877286318977904e-07, + "loss": 0.6927, + "step": 366 + }, + { + "epoch": 0.01, + "learning_rate": 1.987689798454429e-07, + "loss": 0.6815, + "step": 367 + }, + { + "epoch": 0.01, + "learning_rate": 1.9876509650110675e-07, + "loss": 0.6332, + "step": 368 + }, + { + "epoch": 0.01, + "learning_rate": 1.987612131567706e-07, + "loss": 0.6887, + "step": 369 + }, + { + "epoch": 0.01, + "learning_rate": 1.9875732981243444e-07, + "loss": 0.6514, + "step": 370 + }, + { + "epoch": 0.01, + "learning_rate": 1.9875344646809832e-07, + "loss": 0.6516, + "step": 371 + }, + { + "epoch": 0.01, + "learning_rate": 1.9874956312376216e-07, + "loss": 0.6896, + "step": 372 + }, + { + "epoch": 0.01, + "learning_rate": 1.9874567977942603e-07, + "loss": 0.6666, + "step": 373 + }, + { + "epoch": 0.01, + "learning_rate": 1.9874179643508988e-07, + "loss": 0.6585, + "step": 374 + }, + { + "epoch": 0.01, + "learning_rate": 1.9873791309075375e-07, + "loss": 0.7133, + "step": 375 + }, + { + "epoch": 0.01, + "learning_rate": 1.987340297464176e-07, + "loss": 0.6771, + "step": 376 + }, + { + "epoch": 0.01, + "learning_rate": 1.9873014640208146e-07, + "loss": 0.7141, + "step": 377 + }, + { + "epoch": 0.01, + "learning_rate": 1.987262630577453e-07, + "loss": 0.6209, + "step": 378 + }, + { + "epoch": 0.01, + "learning_rate": 1.9872237971340918e-07, + "loss": 0.6658, + "step": 379 + }, + { + "epoch": 0.01, + "learning_rate": 1.9871849636907303e-07, + "loss": 0.6755, + "step": 380 + }, + { + "epoch": 0.01, + "learning_rate": 1.987146130247369e-07, + "loss": 0.6953, + "step": 381 + }, + { + "epoch": 0.01, + "learning_rate": 1.9871072968040074e-07, + "loss": 0.6789, + "step": 382 + }, + { + "epoch": 0.01, + "learning_rate": 1.9870684633606461e-07, + "loss": 0.6889, + "step": 383 + }, + { + "epoch": 0.01, + "learning_rate": 1.9870296299172846e-07, + "loss": 0.6958, + "step": 384 + }, + { + "epoch": 0.01, + "learning_rate": 1.9869907964739233e-07, + "loss": 0.6832, + "step": 385 + }, + { + "epoch": 0.01, + "learning_rate": 1.9869519630305618e-07, + "loss": 0.6439, + "step": 386 + }, + { + "epoch": 0.01, + "learning_rate": 1.9869131295872005e-07, + "loss": 0.7204, + "step": 387 + }, + { + "epoch": 0.01, + "learning_rate": 1.986874296143839e-07, + "loss": 0.6974, + "step": 388 + }, + { + "epoch": 0.01, + "learning_rate": 1.9868354627004776e-07, + "loss": 0.6469, + "step": 389 + }, + { + "epoch": 0.01, + "learning_rate": 1.986796629257116e-07, + "loss": 0.6966, + "step": 390 + }, + { + "epoch": 0.01, + "learning_rate": 1.9867577958137548e-07, + "loss": 0.6797, + "step": 391 + }, + { + "epoch": 0.01, + "learning_rate": 1.9867189623703933e-07, + "loss": 0.6646, + "step": 392 + }, + { + "epoch": 0.01, + "learning_rate": 1.986680128927032e-07, + "loss": 0.7152, + "step": 393 + }, + { + "epoch": 0.01, + "learning_rate": 1.9866412954836704e-07, + "loss": 0.6675, + "step": 394 + }, + { + "epoch": 0.01, + "learning_rate": 1.986602462040309e-07, + "loss": 0.6988, + "step": 395 + }, + { + "epoch": 0.01, + "learning_rate": 1.9865636285969476e-07, + "loss": 0.6714, + "step": 396 + }, + { + "epoch": 0.01, + "learning_rate": 1.9865247951535863e-07, + "loss": 0.7094, + "step": 397 + }, + { + "epoch": 0.01, + "learning_rate": 1.9864859617102247e-07, + "loss": 0.6636, + "step": 398 + }, + { + "epoch": 0.01, + "learning_rate": 1.9864471282668635e-07, + "loss": 0.7196, + "step": 399 + }, + { + "epoch": 0.01, + "learning_rate": 1.986408294823502e-07, + "loss": 0.6757, + "step": 400 + }, + { + "epoch": 0.01, + "learning_rate": 1.9863694613801406e-07, + "loss": 0.6777, + "step": 401 + }, + { + "epoch": 0.01, + "learning_rate": 1.986330627936779e-07, + "loss": 0.7273, + "step": 402 + }, + { + "epoch": 0.01, + "learning_rate": 1.9862917944934178e-07, + "loss": 0.656, + "step": 403 + }, + { + "epoch": 0.01, + "learning_rate": 1.9862529610500562e-07, + "loss": 0.68, + "step": 404 + }, + { + "epoch": 0.01, + "learning_rate": 1.9862141276066947e-07, + "loss": 0.6845, + "step": 405 + }, + { + "epoch": 0.01, + "learning_rate": 1.9861752941633334e-07, + "loss": 0.6629, + "step": 406 + }, + { + "epoch": 0.01, + "learning_rate": 1.9861364607199719e-07, + "loss": 0.654, + "step": 407 + }, + { + "epoch": 0.01, + "learning_rate": 1.9860976272766106e-07, + "loss": 0.6942, + "step": 408 + }, + { + "epoch": 0.01, + "learning_rate": 1.986058793833249e-07, + "loss": 0.6935, + "step": 409 + }, + { + "epoch": 0.01, + "learning_rate": 1.9860199603898877e-07, + "loss": 0.6991, + "step": 410 + }, + { + "epoch": 0.01, + "learning_rate": 1.9859811269465262e-07, + "loss": 0.677, + "step": 411 + }, + { + "epoch": 0.01, + "learning_rate": 1.985942293503165e-07, + "loss": 0.6868, + "step": 412 + }, + { + "epoch": 0.01, + "learning_rate": 1.9859034600598034e-07, + "loss": 0.7343, + "step": 413 + }, + { + "epoch": 0.01, + "learning_rate": 1.985864626616442e-07, + "loss": 0.677, + "step": 414 + }, + { + "epoch": 0.01, + "learning_rate": 1.9858257931730805e-07, + "loss": 0.6512, + "step": 415 + }, + { + "epoch": 0.01, + "learning_rate": 1.9857869597297192e-07, + "loss": 0.7189, + "step": 416 + }, + { + "epoch": 0.01, + "learning_rate": 1.9857481262863577e-07, + "loss": 0.731, + "step": 417 + }, + { + "epoch": 0.01, + "learning_rate": 1.9857092928429964e-07, + "loss": 0.6794, + "step": 418 + }, + { + "epoch": 0.01, + "learning_rate": 1.9856704593996348e-07, + "loss": 0.6826, + "step": 419 + }, + { + "epoch": 0.01, + "learning_rate": 1.9856316259562736e-07, + "loss": 0.6664, + "step": 420 + }, + { + "epoch": 0.01, + "learning_rate": 1.985592792512912e-07, + "loss": 0.6823, + "step": 421 + }, + { + "epoch": 0.01, + "learning_rate": 1.9855539590695507e-07, + "loss": 0.6517, + "step": 422 + }, + { + "epoch": 0.01, + "learning_rate": 1.9855151256261892e-07, + "loss": 0.6518, + "step": 423 + }, + { + "epoch": 0.01, + "learning_rate": 1.985476292182828e-07, + "loss": 0.7128, + "step": 424 + }, + { + "epoch": 0.01, + "learning_rate": 1.9854374587394663e-07, + "loss": 0.6933, + "step": 425 + }, + { + "epoch": 0.01, + "learning_rate": 1.985398625296105e-07, + "loss": 0.6683, + "step": 426 + }, + { + "epoch": 0.01, + "learning_rate": 1.9853597918527435e-07, + "loss": 0.62, + "step": 427 + }, + { + "epoch": 0.01, + "learning_rate": 1.985320958409382e-07, + "loss": 0.6711, + "step": 428 + }, + { + "epoch": 0.01, + "learning_rate": 1.9852821249660207e-07, + "loss": 0.6779, + "step": 429 + }, + { + "epoch": 0.01, + "learning_rate": 1.985243291522659e-07, + "loss": 0.6881, + "step": 430 + }, + { + "epoch": 0.01, + "learning_rate": 1.9852044580792978e-07, + "loss": 0.6647, + "step": 431 + }, + { + "epoch": 0.01, + "learning_rate": 1.9851656246359363e-07, + "loss": 0.6516, + "step": 432 + }, + { + "epoch": 0.01, + "learning_rate": 1.985126791192575e-07, + "loss": 0.6959, + "step": 433 + }, + { + "epoch": 0.01, + "learning_rate": 1.9850879577492135e-07, + "loss": 0.6792, + "step": 434 + }, + { + "epoch": 0.01, + "learning_rate": 1.985049124305852e-07, + "loss": 0.6845, + "step": 435 + }, + { + "epoch": 0.01, + "learning_rate": 1.9850102908624906e-07, + "loss": 0.6662, + "step": 436 + }, + { + "epoch": 0.01, + "learning_rate": 1.984971457419129e-07, + "loss": 0.6947, + "step": 437 + }, + { + "epoch": 0.01, + "learning_rate": 1.9849326239757678e-07, + "loss": 0.7235, + "step": 438 + }, + { + "epoch": 0.01, + "learning_rate": 1.9848937905324062e-07, + "loss": 0.6395, + "step": 439 + }, + { + "epoch": 0.01, + "learning_rate": 1.984854957089045e-07, + "loss": 0.6768, + "step": 440 + }, + { + "epoch": 0.01, + "learning_rate": 1.9848161236456834e-07, + "loss": 0.693, + "step": 441 + }, + { + "epoch": 0.01, + "learning_rate": 1.984777290202322e-07, + "loss": 0.6855, + "step": 442 + }, + { + "epoch": 0.01, + "learning_rate": 1.9847384567589606e-07, + "loss": 0.6852, + "step": 443 + }, + { + "epoch": 0.01, + "learning_rate": 1.9846996233155993e-07, + "loss": 0.6581, + "step": 444 + }, + { + "epoch": 0.01, + "learning_rate": 1.9846607898722377e-07, + "loss": 0.6467, + "step": 445 + }, + { + "epoch": 0.01, + "learning_rate": 1.9846219564288764e-07, + "loss": 0.6587, + "step": 446 + }, + { + "epoch": 0.01, + "learning_rate": 1.984583122985515e-07, + "loss": 0.6867, + "step": 447 + }, + { + "epoch": 0.01, + "learning_rate": 1.9845442895421536e-07, + "loss": 0.7054, + "step": 448 + }, + { + "epoch": 0.01, + "learning_rate": 1.984505456098792e-07, + "loss": 0.6679, + "step": 449 + }, + { + "epoch": 0.01, + "learning_rate": 1.9844666226554308e-07, + "loss": 0.6685, + "step": 450 + }, + { + "epoch": 0.01, + "learning_rate": 1.9844277892120692e-07, + "loss": 0.6879, + "step": 451 + }, + { + "epoch": 0.01, + "learning_rate": 1.984388955768708e-07, + "loss": 0.6546, + "step": 452 + }, + { + "epoch": 0.01, + "learning_rate": 1.9843501223253464e-07, + "loss": 0.7108, + "step": 453 + }, + { + "epoch": 0.01, + "learning_rate": 1.984311288881985e-07, + "loss": 0.7092, + "step": 454 + }, + { + "epoch": 0.01, + "learning_rate": 1.9842724554386235e-07, + "loss": 0.6677, + "step": 455 + }, + { + "epoch": 0.01, + "learning_rate": 1.9842336219952623e-07, + "loss": 0.6316, + "step": 456 + }, + { + "epoch": 0.01, + "learning_rate": 1.9841947885519007e-07, + "loss": 0.6848, + "step": 457 + }, + { + "epoch": 0.01, + "learning_rate": 1.9841559551085394e-07, + "loss": 0.6459, + "step": 458 + }, + { + "epoch": 0.01, + "learning_rate": 1.984117121665178e-07, + "loss": 0.6748, + "step": 459 + }, + { + "epoch": 0.01, + "learning_rate": 1.9840782882218166e-07, + "loss": 0.6927, + "step": 460 + }, + { + "epoch": 0.01, + "learning_rate": 1.984039454778455e-07, + "loss": 0.6884, + "step": 461 + }, + { + "epoch": 0.01, + "learning_rate": 1.9840006213350938e-07, + "loss": 0.6334, + "step": 462 + }, + { + "epoch": 0.01, + "learning_rate": 1.9839617878917322e-07, + "loss": 0.6456, + "step": 463 + }, + { + "epoch": 0.01, + "learning_rate": 1.983922954448371e-07, + "loss": 0.7365, + "step": 464 + }, + { + "epoch": 0.01, + "learning_rate": 1.9838841210050094e-07, + "loss": 0.6665, + "step": 465 + }, + { + "epoch": 0.01, + "learning_rate": 1.983845287561648e-07, + "loss": 0.6292, + "step": 466 + }, + { + "epoch": 0.01, + "learning_rate": 1.9838064541182865e-07, + "loss": 0.6746, + "step": 467 + }, + { + "epoch": 0.01, + "learning_rate": 1.9837676206749253e-07, + "loss": 0.7065, + "step": 468 + }, + { + "epoch": 0.01, + "learning_rate": 1.9837287872315637e-07, + "loss": 0.6914, + "step": 469 + }, + { + "epoch": 0.01, + "learning_rate": 1.9836899537882024e-07, + "loss": 0.6573, + "step": 470 + }, + { + "epoch": 0.01, + "learning_rate": 1.983651120344841e-07, + "loss": 0.65, + "step": 471 + }, + { + "epoch": 0.01, + "learning_rate": 1.9836122869014796e-07, + "loss": 0.7067, + "step": 472 + }, + { + "epoch": 0.01, + "learning_rate": 1.983573453458118e-07, + "loss": 0.7273, + "step": 473 + }, + { + "epoch": 0.01, + "learning_rate": 1.9835346200147567e-07, + "loss": 0.6993, + "step": 474 + }, + { + "epoch": 0.01, + "learning_rate": 1.9834957865713952e-07, + "loss": 0.6974, + "step": 475 + }, + { + "epoch": 0.01, + "learning_rate": 1.983456953128034e-07, + "loss": 0.6355, + "step": 476 + }, + { + "epoch": 0.01, + "learning_rate": 1.9834181196846724e-07, + "loss": 0.6988, + "step": 477 + }, + { + "epoch": 0.01, + "learning_rate": 1.983379286241311e-07, + "loss": 0.6168, + "step": 478 + }, + { + "epoch": 0.01, + "learning_rate": 1.9833404527979495e-07, + "loss": 0.6646, + "step": 479 + }, + { + "epoch": 0.01, + "learning_rate": 1.9833016193545882e-07, + "loss": 0.6896, + "step": 480 + }, + { + "epoch": 0.01, + "learning_rate": 1.9832627859112267e-07, + "loss": 0.7079, + "step": 481 + }, + { + "epoch": 0.01, + "learning_rate": 1.9832239524678654e-07, + "loss": 0.6668, + "step": 482 + }, + { + "epoch": 0.01, + "learning_rate": 1.9831851190245039e-07, + "loss": 0.6901, + "step": 483 + }, + { + "epoch": 0.01, + "learning_rate": 1.9831462855811426e-07, + "loss": 0.6925, + "step": 484 + }, + { + "epoch": 0.01, + "learning_rate": 1.9831074521377808e-07, + "loss": 0.6563, + "step": 485 + }, + { + "epoch": 0.01, + "learning_rate": 1.9830686186944195e-07, + "loss": 0.6806, + "step": 486 + }, + { + "epoch": 0.01, + "learning_rate": 1.983029785251058e-07, + "loss": 0.6579, + "step": 487 + }, + { + "epoch": 0.01, + "learning_rate": 1.9829909518076966e-07, + "loss": 0.7482, + "step": 488 + }, + { + "epoch": 0.01, + "learning_rate": 1.982952118364335e-07, + "loss": 0.6904, + "step": 489 + }, + { + "epoch": 0.01, + "learning_rate": 1.9829132849209738e-07, + "loss": 0.6862, + "step": 490 + }, + { + "epoch": 0.01, + "learning_rate": 1.9828744514776123e-07, + "loss": 0.6707, + "step": 491 + }, + { + "epoch": 0.01, + "learning_rate": 1.982835618034251e-07, + "loss": 0.6876, + "step": 492 + }, + { + "epoch": 0.01, + "learning_rate": 1.9827967845908894e-07, + "loss": 0.7012, + "step": 493 + }, + { + "epoch": 0.01, + "learning_rate": 1.982757951147528e-07, + "loss": 0.7018, + "step": 494 + }, + { + "epoch": 0.01, + "learning_rate": 1.9827191177041666e-07, + "loss": 0.6625, + "step": 495 + }, + { + "epoch": 0.01, + "learning_rate": 1.9826802842608053e-07, + "loss": 0.6668, + "step": 496 + }, + { + "epoch": 0.01, + "learning_rate": 1.9826414508174437e-07, + "loss": 0.6613, + "step": 497 + }, + { + "epoch": 0.01, + "learning_rate": 1.9826026173740825e-07, + "loss": 0.6842, + "step": 498 + }, + { + "epoch": 0.01, + "learning_rate": 1.982563783930721e-07, + "loss": 0.6907, + "step": 499 + }, + { + "epoch": 0.01, + "learning_rate": 1.9825249504873596e-07, + "loss": 0.6977, + "step": 500 + }, + { + "epoch": 0.01, + "learning_rate": 1.982486117043998e-07, + "loss": 0.635, + "step": 501 + }, + { + "epoch": 0.01, + "learning_rate": 1.9824472836006368e-07, + "loss": 0.6891, + "step": 502 + }, + { + "epoch": 0.01, + "learning_rate": 1.9824084501572752e-07, + "loss": 0.7293, + "step": 503 + }, + { + "epoch": 0.01, + "learning_rate": 1.982369616713914e-07, + "loss": 0.7054, + "step": 504 + }, + { + "epoch": 0.01, + "learning_rate": 1.9823307832705524e-07, + "loss": 0.6607, + "step": 505 + }, + { + "epoch": 0.01, + "learning_rate": 1.982291949827191e-07, + "loss": 0.6763, + "step": 506 + }, + { + "epoch": 0.01, + "learning_rate": 1.9822531163838296e-07, + "loss": 0.6761, + "step": 507 + }, + { + "epoch": 0.01, + "learning_rate": 1.9822142829404683e-07, + "loss": 0.6872, + "step": 508 + }, + { + "epoch": 0.01, + "learning_rate": 1.9821754494971067e-07, + "loss": 0.6605, + "step": 509 + }, + { + "epoch": 0.01, + "learning_rate": 1.9821366160537455e-07, + "loss": 0.6654, + "step": 510 + }, + { + "epoch": 0.01, + "learning_rate": 1.982097782610384e-07, + "loss": 0.686, + "step": 511 + }, + { + "epoch": 0.01, + "learning_rate": 1.9820589491670226e-07, + "loss": 0.6354, + "step": 512 + }, + { + "epoch": 0.01, + "learning_rate": 1.982020115723661e-07, + "loss": 0.6214, + "step": 513 + }, + { + "epoch": 0.01, + "learning_rate": 1.9819812822802998e-07, + "loss": 0.6796, + "step": 514 + }, + { + "epoch": 0.01, + "learning_rate": 1.9819424488369382e-07, + "loss": 0.715, + "step": 515 + }, + { + "epoch": 0.01, + "learning_rate": 1.981903615393577e-07, + "loss": 0.6675, + "step": 516 + }, + { + "epoch": 0.01, + "learning_rate": 1.9818647819502154e-07, + "loss": 0.6731, + "step": 517 + }, + { + "epoch": 0.01, + "learning_rate": 1.981825948506854e-07, + "loss": 0.661, + "step": 518 + }, + { + "epoch": 0.01, + "learning_rate": 1.9817871150634926e-07, + "loss": 0.7083, + "step": 519 + }, + { + "epoch": 0.01, + "learning_rate": 1.9817482816201313e-07, + "loss": 0.6675, + "step": 520 + }, + { + "epoch": 0.01, + "learning_rate": 1.9817094481767697e-07, + "loss": 0.6914, + "step": 521 + }, + { + "epoch": 0.01, + "learning_rate": 1.9816706147334084e-07, + "loss": 0.6735, + "step": 522 + }, + { + "epoch": 0.01, + "learning_rate": 1.981631781290047e-07, + "loss": 0.6644, + "step": 523 + }, + { + "epoch": 0.01, + "learning_rate": 1.9815929478466856e-07, + "loss": 0.6243, + "step": 524 + }, + { + "epoch": 0.01, + "learning_rate": 1.981554114403324e-07, + "loss": 0.6721, + "step": 525 + }, + { + "epoch": 0.01, + "learning_rate": 1.9815152809599628e-07, + "loss": 0.6882, + "step": 526 + }, + { + "epoch": 0.01, + "learning_rate": 1.9814764475166012e-07, + "loss": 0.6888, + "step": 527 + }, + { + "epoch": 0.01, + "learning_rate": 1.98143761407324e-07, + "loss": 0.669, + "step": 528 + }, + { + "epoch": 0.01, + "learning_rate": 1.9813987806298784e-07, + "loss": 0.734, + "step": 529 + }, + { + "epoch": 0.01, + "learning_rate": 1.981359947186517e-07, + "loss": 0.6941, + "step": 530 + }, + { + "epoch": 0.01, + "learning_rate": 1.9813211137431556e-07, + "loss": 0.6824, + "step": 531 + }, + { + "epoch": 0.01, + "learning_rate": 1.9812822802997943e-07, + "loss": 0.7194, + "step": 532 + }, + { + "epoch": 0.01, + "learning_rate": 1.9812434468564327e-07, + "loss": 0.6247, + "step": 533 + }, + { + "epoch": 0.01, + "learning_rate": 1.9812046134130714e-07, + "loss": 0.6504, + "step": 534 + }, + { + "epoch": 0.01, + "learning_rate": 1.98116577996971e-07, + "loss": 0.6895, + "step": 535 + }, + { + "epoch": 0.01, + "learning_rate": 1.9811269465263486e-07, + "loss": 0.7036, + "step": 536 + }, + { + "epoch": 0.01, + "learning_rate": 1.981088113082987e-07, + "loss": 0.6674, + "step": 537 + }, + { + "epoch": 0.01, + "learning_rate": 1.9810492796396258e-07, + "loss": 0.687, + "step": 538 + }, + { + "epoch": 0.01, + "learning_rate": 1.9810104461962642e-07, + "loss": 0.6735, + "step": 539 + }, + { + "epoch": 0.01, + "learning_rate": 1.980971612752903e-07, + "loss": 0.6704, + "step": 540 + }, + { + "epoch": 0.01, + "learning_rate": 1.9809327793095414e-07, + "loss": 0.658, + "step": 541 + }, + { + "epoch": 0.01, + "learning_rate": 1.98089394586618e-07, + "loss": 0.7265, + "step": 542 + }, + { + "epoch": 0.01, + "learning_rate": 1.9808551124228183e-07, + "loss": 0.7272, + "step": 543 + }, + { + "epoch": 0.01, + "learning_rate": 1.980816278979457e-07, + "loss": 0.6444, + "step": 544 + }, + { + "epoch": 0.01, + "learning_rate": 1.9807774455360954e-07, + "loss": 0.6574, + "step": 545 + }, + { + "epoch": 0.01, + "learning_rate": 1.9807386120927342e-07, + "loss": 0.6246, + "step": 546 + }, + { + "epoch": 0.01, + "learning_rate": 1.9806997786493726e-07, + "loss": 0.6875, + "step": 547 + }, + { + "epoch": 0.01, + "learning_rate": 1.9806609452060113e-07, + "loss": 0.6885, + "step": 548 + }, + { + "epoch": 0.01, + "learning_rate": 1.9806221117626498e-07, + "loss": 0.6728, + "step": 549 + }, + { + "epoch": 0.01, + "learning_rate": 1.9805832783192885e-07, + "loss": 0.663, + "step": 550 + }, + { + "epoch": 0.01, + "learning_rate": 1.980544444875927e-07, + "loss": 0.6305, + "step": 551 + }, + { + "epoch": 0.01, + "learning_rate": 1.9805056114325656e-07, + "loss": 0.6639, + "step": 552 + }, + { + "epoch": 0.01, + "learning_rate": 1.980466777989204e-07, + "loss": 0.6565, + "step": 553 + }, + { + "epoch": 0.01, + "learning_rate": 1.9804279445458428e-07, + "loss": 0.6569, + "step": 554 + }, + { + "epoch": 0.01, + "learning_rate": 1.9803891111024813e-07, + "loss": 0.657, + "step": 555 + }, + { + "epoch": 0.01, + "learning_rate": 1.98035027765912e-07, + "loss": 0.6189, + "step": 556 + }, + { + "epoch": 0.01, + "learning_rate": 1.9803114442157584e-07, + "loss": 0.6527, + "step": 557 + }, + { + "epoch": 0.01, + "learning_rate": 1.9802726107723971e-07, + "loss": 0.6723, + "step": 558 + }, + { + "epoch": 0.01, + "learning_rate": 1.9802337773290356e-07, + "loss": 0.6819, + "step": 559 + }, + { + "epoch": 0.01, + "learning_rate": 1.9801949438856743e-07, + "loss": 0.6669, + "step": 560 + }, + { + "epoch": 0.01, + "learning_rate": 1.9801561104423128e-07, + "loss": 0.691, + "step": 561 + }, + { + "epoch": 0.01, + "learning_rate": 1.9801172769989515e-07, + "loss": 0.6804, + "step": 562 + }, + { + "epoch": 0.01, + "learning_rate": 1.98007844355559e-07, + "loss": 0.6848, + "step": 563 + }, + { + "epoch": 0.01, + "learning_rate": 1.9800396101122286e-07, + "loss": 0.6873, + "step": 564 + }, + { + "epoch": 0.01, + "learning_rate": 1.980000776668867e-07, + "loss": 0.6366, + "step": 565 + }, + { + "epoch": 0.01, + "learning_rate": 1.9799619432255058e-07, + "loss": 0.6746, + "step": 566 + }, + { + "epoch": 0.01, + "learning_rate": 1.9799231097821443e-07, + "loss": 0.6991, + "step": 567 + }, + { + "epoch": 0.01, + "learning_rate": 1.979884276338783e-07, + "loss": 0.6383, + "step": 568 + }, + { + "epoch": 0.01, + "learning_rate": 1.9798454428954214e-07, + "loss": 0.6209, + "step": 569 + }, + { + "epoch": 0.01, + "learning_rate": 1.9798066094520601e-07, + "loss": 0.6143, + "step": 570 + }, + { + "epoch": 0.01, + "learning_rate": 1.9797677760086986e-07, + "loss": 0.6539, + "step": 571 + }, + { + "epoch": 0.01, + "learning_rate": 1.9797289425653373e-07, + "loss": 0.679, + "step": 572 + }, + { + "epoch": 0.01, + "learning_rate": 1.9796901091219757e-07, + "loss": 0.6696, + "step": 573 + }, + { + "epoch": 0.01, + "learning_rate": 1.9796512756786145e-07, + "loss": 0.6744, + "step": 574 + }, + { + "epoch": 0.01, + "learning_rate": 1.979612442235253e-07, + "loss": 0.7208, + "step": 575 + }, + { + "epoch": 0.01, + "learning_rate": 1.9795736087918916e-07, + "loss": 0.6493, + "step": 576 + }, + { + "epoch": 0.01, + "learning_rate": 1.97953477534853e-07, + "loss": 0.6788, + "step": 577 + }, + { + "epoch": 0.01, + "learning_rate": 1.9794959419051688e-07, + "loss": 0.6517, + "step": 578 + }, + { + "epoch": 0.01, + "learning_rate": 1.9794571084618072e-07, + "loss": 0.7357, + "step": 579 + }, + { + "epoch": 0.01, + "learning_rate": 1.979418275018446e-07, + "loss": 0.6893, + "step": 580 + }, + { + "epoch": 0.01, + "learning_rate": 1.9793794415750844e-07, + "loss": 0.6509, + "step": 581 + }, + { + "epoch": 0.01, + "learning_rate": 1.9793406081317229e-07, + "loss": 0.6653, + "step": 582 + }, + { + "epoch": 0.01, + "learning_rate": 1.9793017746883616e-07, + "loss": 0.6862, + "step": 583 + }, + { + "epoch": 0.01, + "learning_rate": 1.979262941245e-07, + "loss": 0.6435, + "step": 584 + }, + { + "epoch": 0.01, + "learning_rate": 1.9792241078016387e-07, + "loss": 0.7067, + "step": 585 + }, + { + "epoch": 0.01, + "learning_rate": 1.9791852743582772e-07, + "loss": 0.6578, + "step": 586 + }, + { + "epoch": 0.01, + "learning_rate": 1.979146440914916e-07, + "loss": 0.6315, + "step": 587 + }, + { + "epoch": 0.01, + "learning_rate": 1.9791076074715544e-07, + "loss": 0.695, + "step": 588 + }, + { + "epoch": 0.01, + "learning_rate": 1.979068774028193e-07, + "loss": 0.6952, + "step": 589 + }, + { + "epoch": 0.01, + "learning_rate": 1.9790299405848315e-07, + "loss": 0.5991, + "step": 590 + }, + { + "epoch": 0.01, + "learning_rate": 1.9789911071414702e-07, + "loss": 0.696, + "step": 591 + }, + { + "epoch": 0.01, + "learning_rate": 1.9789522736981087e-07, + "loss": 0.6901, + "step": 592 + }, + { + "epoch": 0.01, + "learning_rate": 1.9789134402547474e-07, + "loss": 0.7512, + "step": 593 + }, + { + "epoch": 0.01, + "learning_rate": 1.9788746068113858e-07, + "loss": 0.691, + "step": 594 + }, + { + "epoch": 0.01, + "learning_rate": 1.9788357733680246e-07, + "loss": 0.6766, + "step": 595 + }, + { + "epoch": 0.01, + "learning_rate": 1.978796939924663e-07, + "loss": 0.6448, + "step": 596 + }, + { + "epoch": 0.01, + "learning_rate": 1.9787581064813017e-07, + "loss": 0.6309, + "step": 597 + }, + { + "epoch": 0.01, + "learning_rate": 1.9787192730379402e-07, + "loss": 0.7199, + "step": 598 + }, + { + "epoch": 0.01, + "learning_rate": 1.978680439594579e-07, + "loss": 0.6953, + "step": 599 + }, + { + "epoch": 0.01, + "learning_rate": 1.9786416061512173e-07, + "loss": 0.6663, + "step": 600 + }, + { + "epoch": 0.01, + "learning_rate": 1.9786027727078558e-07, + "loss": 0.6427, + "step": 601 + }, + { + "epoch": 0.01, + "learning_rate": 1.9785639392644945e-07, + "loss": 0.6907, + "step": 602 + }, + { + "epoch": 0.01, + "learning_rate": 1.978525105821133e-07, + "loss": 0.6779, + "step": 603 + }, + { + "epoch": 0.01, + "learning_rate": 1.9784862723777717e-07, + "loss": 0.6948, + "step": 604 + }, + { + "epoch": 0.01, + "learning_rate": 1.97844743893441e-07, + "loss": 0.6449, + "step": 605 + }, + { + "epoch": 0.01, + "learning_rate": 1.9784086054910488e-07, + "loss": 0.6737, + "step": 606 + }, + { + "epoch": 0.01, + "learning_rate": 1.9783697720476873e-07, + "loss": 0.6655, + "step": 607 + }, + { + "epoch": 0.01, + "learning_rate": 1.978330938604326e-07, + "loss": 0.7, + "step": 608 + }, + { + "epoch": 0.01, + "learning_rate": 1.9782921051609645e-07, + "loss": 0.7121, + "step": 609 + }, + { + "epoch": 0.01, + "learning_rate": 1.9782532717176032e-07, + "loss": 0.7207, + "step": 610 + }, + { + "epoch": 0.01, + "learning_rate": 1.9782144382742416e-07, + "loss": 0.6938, + "step": 611 + }, + { + "epoch": 0.01, + "learning_rate": 1.97817560483088e-07, + "loss": 0.6717, + "step": 612 + }, + { + "epoch": 0.01, + "learning_rate": 1.9781367713875188e-07, + "loss": 0.6728, + "step": 613 + }, + { + "epoch": 0.01, + "learning_rate": 1.9780979379441572e-07, + "loss": 0.636, + "step": 614 + }, + { + "epoch": 0.01, + "learning_rate": 1.978059104500796e-07, + "loss": 0.6316, + "step": 615 + }, + { + "epoch": 0.01, + "learning_rate": 1.9780202710574344e-07, + "loss": 0.6303, + "step": 616 + }, + { + "epoch": 0.01, + "learning_rate": 1.977981437614073e-07, + "loss": 0.6406, + "step": 617 + }, + { + "epoch": 0.01, + "learning_rate": 1.9779426041707116e-07, + "loss": 0.6896, + "step": 618 + }, + { + "epoch": 0.01, + "learning_rate": 1.9779037707273503e-07, + "loss": 0.6544, + "step": 619 + }, + { + "epoch": 0.01, + "learning_rate": 1.9778649372839887e-07, + "loss": 0.6628, + "step": 620 + }, + { + "epoch": 0.01, + "learning_rate": 1.9778261038406274e-07, + "loss": 0.6818, + "step": 621 + }, + { + "epoch": 0.01, + "learning_rate": 1.977787270397266e-07, + "loss": 0.703, + "step": 622 + }, + { + "epoch": 0.01, + "learning_rate": 1.9777484369539046e-07, + "loss": 0.656, + "step": 623 + }, + { + "epoch": 0.01, + "learning_rate": 1.977709603510543e-07, + "loss": 0.6765, + "step": 624 + }, + { + "epoch": 0.01, + "learning_rate": 1.9776707700671818e-07, + "loss": 0.6627, + "step": 625 + }, + { + "epoch": 0.01, + "learning_rate": 1.9776319366238202e-07, + "loss": 0.6602, + "step": 626 + }, + { + "epoch": 0.01, + "learning_rate": 1.977593103180459e-07, + "loss": 0.6866, + "step": 627 + }, + { + "epoch": 0.01, + "learning_rate": 1.9775542697370974e-07, + "loss": 0.6795, + "step": 628 + }, + { + "epoch": 0.01, + "learning_rate": 1.977515436293736e-07, + "loss": 0.6517, + "step": 629 + }, + { + "epoch": 0.01, + "learning_rate": 1.9774766028503746e-07, + "loss": 0.6529, + "step": 630 + }, + { + "epoch": 0.01, + "learning_rate": 1.9774377694070133e-07, + "loss": 0.5939, + "step": 631 + }, + { + "epoch": 0.01, + "learning_rate": 1.9773989359636517e-07, + "loss": 0.6936, + "step": 632 + }, + { + "epoch": 0.01, + "learning_rate": 1.9773601025202904e-07, + "loss": 0.6555, + "step": 633 + }, + { + "epoch": 0.01, + "learning_rate": 1.977321269076929e-07, + "loss": 0.6712, + "step": 634 + }, + { + "epoch": 0.01, + "learning_rate": 1.9772824356335676e-07, + "loss": 0.6787, + "step": 635 + }, + { + "epoch": 0.01, + "learning_rate": 1.977243602190206e-07, + "loss": 0.6335, + "step": 636 + }, + { + "epoch": 0.01, + "learning_rate": 1.9772047687468448e-07, + "loss": 0.6389, + "step": 637 + }, + { + "epoch": 0.01, + "learning_rate": 1.9771659353034832e-07, + "loss": 0.6718, + "step": 638 + }, + { + "epoch": 0.01, + "learning_rate": 1.977127101860122e-07, + "loss": 0.6714, + "step": 639 + }, + { + "epoch": 0.01, + "learning_rate": 1.9770882684167604e-07, + "loss": 0.6568, + "step": 640 + }, + { + "epoch": 0.01, + "learning_rate": 1.977049434973399e-07, + "loss": 0.6776, + "step": 641 + }, + { + "epoch": 0.01, + "learning_rate": 1.9770106015300375e-07, + "loss": 0.7428, + "step": 642 + }, + { + "epoch": 0.01, + "learning_rate": 1.9769717680866763e-07, + "loss": 0.6695, + "step": 643 + }, + { + "epoch": 0.01, + "learning_rate": 1.9769329346433147e-07, + "loss": 0.6371, + "step": 644 + }, + { + "epoch": 0.01, + "learning_rate": 1.9768941011999534e-07, + "loss": 0.6273, + "step": 645 + }, + { + "epoch": 0.01, + "learning_rate": 1.976855267756592e-07, + "loss": 0.6241, + "step": 646 + }, + { + "epoch": 0.01, + "learning_rate": 1.9768164343132306e-07, + "loss": 0.6837, + "step": 647 + }, + { + "epoch": 0.01, + "learning_rate": 1.976777600869869e-07, + "loss": 0.5847, + "step": 648 + }, + { + "epoch": 0.01, + "learning_rate": 1.9767387674265077e-07, + "loss": 0.6752, + "step": 649 + }, + { + "epoch": 0.01, + "learning_rate": 1.9766999339831462e-07, + "loss": 0.6488, + "step": 650 + }, + { + "epoch": 0.01, + "learning_rate": 1.976661100539785e-07, + "loss": 0.6895, + "step": 651 + }, + { + "epoch": 0.01, + "learning_rate": 1.9766222670964234e-07, + "loss": 0.6778, + "step": 652 + }, + { + "epoch": 0.01, + "learning_rate": 1.976583433653062e-07, + "loss": 0.6592, + "step": 653 + }, + { + "epoch": 0.01, + "learning_rate": 1.9765446002097005e-07, + "loss": 0.6579, + "step": 654 + }, + { + "epoch": 0.01, + "learning_rate": 1.9765057667663392e-07, + "loss": 0.6779, + "step": 655 + }, + { + "epoch": 0.01, + "learning_rate": 1.9764669333229777e-07, + "loss": 0.635, + "step": 656 + }, + { + "epoch": 0.01, + "learning_rate": 1.9764280998796164e-07, + "loss": 0.6182, + "step": 657 + }, + { + "epoch": 0.01, + "learning_rate": 1.9763892664362549e-07, + "loss": 0.6409, + "step": 658 + }, + { + "epoch": 0.01, + "learning_rate": 1.9763504329928933e-07, + "loss": 0.6494, + "step": 659 + }, + { + "epoch": 0.01, + "learning_rate": 1.9763115995495318e-07, + "loss": 0.6747, + "step": 660 + }, + { + "epoch": 0.01, + "learning_rate": 1.9762727661061705e-07, + "loss": 0.6283, + "step": 661 + }, + { + "epoch": 0.01, + "learning_rate": 1.976233932662809e-07, + "loss": 0.6681, + "step": 662 + }, + { + "epoch": 0.01, + "learning_rate": 1.9761950992194476e-07, + "loss": 0.6799, + "step": 663 + }, + { + "epoch": 0.01, + "learning_rate": 1.976156265776086e-07, + "loss": 0.6511, + "step": 664 + }, + { + "epoch": 0.01, + "learning_rate": 1.9761174323327248e-07, + "loss": 0.6689, + "step": 665 + }, + { + "epoch": 0.01, + "learning_rate": 1.9760785988893633e-07, + "loss": 0.6415, + "step": 666 + }, + { + "epoch": 0.01, + "learning_rate": 1.976039765446002e-07, + "loss": 0.7374, + "step": 667 + }, + { + "epoch": 0.01, + "learning_rate": 1.9760009320026404e-07, + "loss": 0.693, + "step": 668 + }, + { + "epoch": 0.01, + "learning_rate": 1.9759620985592791e-07, + "loss": 0.6558, + "step": 669 + }, + { + "epoch": 0.01, + "learning_rate": 1.9759232651159176e-07, + "loss": 0.6855, + "step": 670 + }, + { + "epoch": 0.01, + "learning_rate": 1.9758844316725563e-07, + "loss": 0.63, + "step": 671 + }, + { + "epoch": 0.01, + "learning_rate": 1.9758455982291947e-07, + "loss": 0.6225, + "step": 672 + }, + { + "epoch": 0.01, + "learning_rate": 1.9758067647858335e-07, + "loss": 0.6574, + "step": 673 + }, + { + "epoch": 0.01, + "learning_rate": 1.975767931342472e-07, + "loss": 0.7026, + "step": 674 + }, + { + "epoch": 0.01, + "learning_rate": 1.9757290978991106e-07, + "loss": 0.6773, + "step": 675 + }, + { + "epoch": 0.01, + "learning_rate": 1.975690264455749e-07, + "loss": 0.6029, + "step": 676 + }, + { + "epoch": 0.01, + "learning_rate": 1.9756514310123878e-07, + "loss": 0.6803, + "step": 677 + }, + { + "epoch": 0.01, + "learning_rate": 1.9756125975690262e-07, + "loss": 0.6694, + "step": 678 + }, + { + "epoch": 0.01, + "learning_rate": 1.975573764125665e-07, + "loss": 0.6552, + "step": 679 + }, + { + "epoch": 0.01, + "learning_rate": 1.9755349306823034e-07, + "loss": 0.654, + "step": 680 + }, + { + "epoch": 0.01, + "learning_rate": 1.975496097238942e-07, + "loss": 0.6491, + "step": 681 + }, + { + "epoch": 0.01, + "learning_rate": 1.9754572637955806e-07, + "loss": 0.7227, + "step": 682 + }, + { + "epoch": 0.01, + "learning_rate": 1.9754184303522193e-07, + "loss": 0.6385, + "step": 683 + }, + { + "epoch": 0.01, + "learning_rate": 1.9753795969088577e-07, + "loss": 0.6445, + "step": 684 + }, + { + "epoch": 0.01, + "learning_rate": 1.9753407634654965e-07, + "loss": 0.7154, + "step": 685 + }, + { + "epoch": 0.01, + "learning_rate": 1.975301930022135e-07, + "loss": 0.6376, + "step": 686 + }, + { + "epoch": 0.01, + "learning_rate": 1.9752630965787736e-07, + "loss": 0.7111, + "step": 687 + }, + { + "epoch": 0.01, + "learning_rate": 1.975224263135412e-07, + "loss": 0.7268, + "step": 688 + }, + { + "epoch": 0.01, + "learning_rate": 1.9751854296920508e-07, + "loss": 0.6643, + "step": 689 + }, + { + "epoch": 0.01, + "learning_rate": 1.9751465962486892e-07, + "loss": 0.6843, + "step": 690 + }, + { + "epoch": 0.01, + "learning_rate": 1.975107762805328e-07, + "loss": 0.6708, + "step": 691 + }, + { + "epoch": 0.01, + "learning_rate": 1.9750689293619664e-07, + "loss": 0.6653, + "step": 692 + }, + { + "epoch": 0.01, + "learning_rate": 1.975030095918605e-07, + "loss": 0.6706, + "step": 693 + }, + { + "epoch": 0.01, + "learning_rate": 1.9749912624752436e-07, + "loss": 0.7087, + "step": 694 + }, + { + "epoch": 0.01, + "learning_rate": 1.9749524290318823e-07, + "loss": 0.7395, + "step": 695 + }, + { + "epoch": 0.01, + "learning_rate": 1.9749135955885207e-07, + "loss": 0.6546, + "step": 696 + }, + { + "epoch": 0.01, + "learning_rate": 1.9748747621451594e-07, + "loss": 0.6716, + "step": 697 + }, + { + "epoch": 0.01, + "learning_rate": 1.974835928701798e-07, + "loss": 0.6621, + "step": 698 + }, + { + "epoch": 0.01, + "learning_rate": 1.9747970952584366e-07, + "loss": 0.6607, + "step": 699 + }, + { + "epoch": 0.01, + "learning_rate": 1.974758261815075e-07, + "loss": 0.6793, + "step": 700 + }, + { + "epoch": 0.01, + "learning_rate": 1.9747194283717138e-07, + "loss": 0.7129, + "step": 701 + }, + { + "epoch": 0.01, + "learning_rate": 1.9746805949283522e-07, + "loss": 0.7121, + "step": 702 + }, + { + "epoch": 0.01, + "learning_rate": 1.974641761484991e-07, + "loss": 0.6568, + "step": 703 + }, + { + "epoch": 0.01, + "learning_rate": 1.9746029280416294e-07, + "loss": 0.5816, + "step": 704 + }, + { + "epoch": 0.01, + "learning_rate": 1.974564094598268e-07, + "loss": 0.6845, + "step": 705 + }, + { + "epoch": 0.01, + "learning_rate": 1.9745252611549066e-07, + "loss": 0.6815, + "step": 706 + }, + { + "epoch": 0.01, + "learning_rate": 1.9744864277115453e-07, + "loss": 0.6426, + "step": 707 + }, + { + "epoch": 0.01, + "learning_rate": 1.9744475942681837e-07, + "loss": 0.6584, + "step": 708 + }, + { + "epoch": 0.01, + "learning_rate": 1.9744087608248224e-07, + "loss": 0.6352, + "step": 709 + }, + { + "epoch": 0.01, + "learning_rate": 1.974369927381461e-07, + "loss": 0.6495, + "step": 710 + }, + { + "epoch": 0.01, + "learning_rate": 1.9743310939380996e-07, + "loss": 0.6458, + "step": 711 + }, + { + "epoch": 0.01, + "learning_rate": 1.974292260494738e-07, + "loss": 0.6532, + "step": 712 + }, + { + "epoch": 0.01, + "learning_rate": 1.9742534270513768e-07, + "loss": 0.5996, + "step": 713 + }, + { + "epoch": 0.01, + "learning_rate": 1.9742145936080152e-07, + "loss": 0.6346, + "step": 714 + }, + { + "epoch": 0.01, + "learning_rate": 1.974175760164654e-07, + "loss": 0.69, + "step": 715 + }, + { + "epoch": 0.01, + "learning_rate": 1.9741369267212924e-07, + "loss": 0.6381, + "step": 716 + }, + { + "epoch": 0.01, + "learning_rate": 1.9740980932779308e-07, + "loss": 0.672, + "step": 717 + }, + { + "epoch": 0.01, + "learning_rate": 1.9740592598345693e-07, + "loss": 0.6469, + "step": 718 + }, + { + "epoch": 0.01, + "learning_rate": 1.974020426391208e-07, + "loss": 0.6679, + "step": 719 + }, + { + "epoch": 0.01, + "learning_rate": 1.9739815929478464e-07, + "loss": 0.642, + "step": 720 + }, + { + "epoch": 0.01, + "learning_rate": 1.9739427595044852e-07, + "loss": 0.6555, + "step": 721 + }, + { + "epoch": 0.01, + "learning_rate": 1.9739039260611236e-07, + "loss": 0.59, + "step": 722 + }, + { + "epoch": 0.01, + "learning_rate": 1.9738650926177623e-07, + "loss": 0.6499, + "step": 723 + }, + { + "epoch": 0.01, + "learning_rate": 1.9738262591744008e-07, + "loss": 0.7141, + "step": 724 + }, + { + "epoch": 0.01, + "learning_rate": 1.9737874257310395e-07, + "loss": 0.6774, + "step": 725 + }, + { + "epoch": 0.01, + "learning_rate": 1.973748592287678e-07, + "loss": 0.6493, + "step": 726 + }, + { + "epoch": 0.01, + "learning_rate": 1.9737097588443167e-07, + "loss": 0.6525, + "step": 727 + }, + { + "epoch": 0.01, + "learning_rate": 1.973670925400955e-07, + "loss": 0.6243, + "step": 728 + }, + { + "epoch": 0.01, + "learning_rate": 1.9736320919575938e-07, + "loss": 0.6781, + "step": 729 + }, + { + "epoch": 0.01, + "learning_rate": 1.9735932585142323e-07, + "loss": 0.6807, + "step": 730 + }, + { + "epoch": 0.01, + "learning_rate": 1.973554425070871e-07, + "loss": 0.6667, + "step": 731 + }, + { + "epoch": 0.01, + "learning_rate": 1.9735155916275094e-07, + "loss": 0.6561, + "step": 732 + }, + { + "epoch": 0.01, + "learning_rate": 1.9734767581841481e-07, + "loss": 0.7187, + "step": 733 + }, + { + "epoch": 0.01, + "learning_rate": 1.9734379247407866e-07, + "loss": 0.666, + "step": 734 + }, + { + "epoch": 0.01, + "learning_rate": 1.9733990912974253e-07, + "loss": 0.7042, + "step": 735 + }, + { + "epoch": 0.01, + "learning_rate": 1.9733602578540638e-07, + "loss": 0.6126, + "step": 736 + }, + { + "epoch": 0.01, + "learning_rate": 1.9733214244107025e-07, + "loss": 0.6436, + "step": 737 + }, + { + "epoch": 0.01, + "learning_rate": 1.973282590967341e-07, + "loss": 0.6622, + "step": 738 + }, + { + "epoch": 0.01, + "learning_rate": 1.9732437575239796e-07, + "loss": 0.6353, + "step": 739 + }, + { + "epoch": 0.01, + "learning_rate": 1.973204924080618e-07, + "loss": 0.6484, + "step": 740 + }, + { + "epoch": 0.01, + "learning_rate": 1.9731660906372568e-07, + "loss": 0.668, + "step": 741 + }, + { + "epoch": 0.01, + "learning_rate": 1.9731272571938953e-07, + "loss": 0.6155, + "step": 742 + }, + { + "epoch": 0.01, + "learning_rate": 1.973088423750534e-07, + "loss": 0.7053, + "step": 743 + }, + { + "epoch": 0.01, + "learning_rate": 1.9730495903071724e-07, + "loss": 0.6879, + "step": 744 + }, + { + "epoch": 0.01, + "learning_rate": 1.9730107568638111e-07, + "loss": 0.6334, + "step": 745 + }, + { + "epoch": 0.01, + "learning_rate": 1.9729719234204496e-07, + "loss": 0.6524, + "step": 746 + }, + { + "epoch": 0.01, + "learning_rate": 1.9729330899770883e-07, + "loss": 0.6308, + "step": 747 + }, + { + "epoch": 0.01, + "learning_rate": 1.9728942565337267e-07, + "loss": 0.6647, + "step": 748 + }, + { + "epoch": 0.01, + "learning_rate": 1.9728554230903655e-07, + "loss": 0.6154, + "step": 749 + }, + { + "epoch": 0.01, + "learning_rate": 1.972816589647004e-07, + "loss": 0.6081, + "step": 750 + }, + { + "epoch": 0.01, + "learning_rate": 1.9727777562036426e-07, + "loss": 0.6475, + "step": 751 + }, + { + "epoch": 0.01, + "learning_rate": 1.972738922760281e-07, + "loss": 0.6805, + "step": 752 + }, + { + "epoch": 0.01, + "learning_rate": 1.9727000893169198e-07, + "loss": 0.7127, + "step": 753 + }, + { + "epoch": 0.01, + "learning_rate": 1.9726612558735582e-07, + "loss": 0.6291, + "step": 754 + }, + { + "epoch": 0.01, + "learning_rate": 1.972622422430197e-07, + "loss": 0.6512, + "step": 755 + }, + { + "epoch": 0.01, + "learning_rate": 1.9725835889868354e-07, + "loss": 0.6541, + "step": 756 + }, + { + "epoch": 0.01, + "learning_rate": 1.972544755543474e-07, + "loss": 0.6361, + "step": 757 + }, + { + "epoch": 0.01, + "learning_rate": 1.9725059221001126e-07, + "loss": 0.7104, + "step": 758 + }, + { + "epoch": 0.01, + "learning_rate": 1.972467088656751e-07, + "loss": 0.6245, + "step": 759 + }, + { + "epoch": 0.01, + "learning_rate": 1.9724282552133897e-07, + "loss": 0.6024, + "step": 760 + }, + { + "epoch": 0.01, + "learning_rate": 1.9723894217700282e-07, + "loss": 0.6813, + "step": 761 + }, + { + "epoch": 0.01, + "learning_rate": 1.972350588326667e-07, + "loss": 0.6638, + "step": 762 + }, + { + "epoch": 0.01, + "learning_rate": 1.9723117548833054e-07, + "loss": 0.6563, + "step": 763 + }, + { + "epoch": 0.01, + "learning_rate": 1.972272921439944e-07, + "loss": 0.6381, + "step": 764 + }, + { + "epoch": 0.01, + "learning_rate": 1.9722340879965825e-07, + "loss": 0.66, + "step": 765 + }, + { + "epoch": 0.01, + "learning_rate": 1.9721952545532212e-07, + "loss": 0.6366, + "step": 766 + }, + { + "epoch": 0.01, + "learning_rate": 1.9721564211098597e-07, + "loss": 0.6688, + "step": 767 + }, + { + "epoch": 0.01, + "learning_rate": 1.9721175876664984e-07, + "loss": 0.6305, + "step": 768 + }, + { + "epoch": 0.01, + "learning_rate": 1.9720787542231368e-07, + "loss": 0.6876, + "step": 769 + }, + { + "epoch": 0.01, + "learning_rate": 1.9720399207797756e-07, + "loss": 0.6321, + "step": 770 + }, + { + "epoch": 0.01, + "learning_rate": 1.972001087336414e-07, + "loss": 0.6281, + "step": 771 + }, + { + "epoch": 0.01, + "learning_rate": 1.9719622538930527e-07, + "loss": 0.6832, + "step": 772 + }, + { + "epoch": 0.01, + "learning_rate": 1.9719234204496912e-07, + "loss": 0.6484, + "step": 773 + }, + { + "epoch": 0.02, + "learning_rate": 1.97188458700633e-07, + "loss": 0.6676, + "step": 774 + }, + { + "epoch": 0.02, + "learning_rate": 1.9718457535629683e-07, + "loss": 0.6521, + "step": 775 + }, + { + "epoch": 0.02, + "learning_rate": 1.9718069201196068e-07, + "loss": 0.618, + "step": 776 + }, + { + "epoch": 0.02, + "learning_rate": 1.9717680866762455e-07, + "loss": 0.65, + "step": 777 + }, + { + "epoch": 0.02, + "learning_rate": 1.971729253232884e-07, + "loss": 0.666, + "step": 778 + }, + { + "epoch": 0.02, + "learning_rate": 1.9716904197895227e-07, + "loss": 0.7003, + "step": 779 + }, + { + "epoch": 0.02, + "learning_rate": 1.971651586346161e-07, + "loss": 0.5724, + "step": 780 + }, + { + "epoch": 0.02, + "learning_rate": 1.9716127529027998e-07, + "loss": 0.6608, + "step": 781 + }, + { + "epoch": 0.02, + "learning_rate": 1.9715739194594383e-07, + "loss": 0.7361, + "step": 782 + }, + { + "epoch": 0.02, + "learning_rate": 1.971535086016077e-07, + "loss": 0.6389, + "step": 783 + }, + { + "epoch": 0.02, + "learning_rate": 1.9714962525727155e-07, + "loss": 0.6384, + "step": 784 + }, + { + "epoch": 0.02, + "learning_rate": 1.9714574191293542e-07, + "loss": 0.7203, + "step": 785 + }, + { + "epoch": 0.02, + "learning_rate": 1.9714185856859926e-07, + "loss": 0.6001, + "step": 786 + }, + { + "epoch": 0.02, + "learning_rate": 1.9713797522426313e-07, + "loss": 0.6302, + "step": 787 + }, + { + "epoch": 0.02, + "learning_rate": 1.9713409187992698e-07, + "loss": 0.665, + "step": 788 + }, + { + "epoch": 0.02, + "learning_rate": 1.9713020853559082e-07, + "loss": 0.6689, + "step": 789 + }, + { + "epoch": 0.02, + "learning_rate": 1.971263251912547e-07, + "loss": 0.6776, + "step": 790 + }, + { + "epoch": 0.02, + "learning_rate": 1.9712244184691854e-07, + "loss": 0.6153, + "step": 791 + }, + { + "epoch": 0.02, + "learning_rate": 1.971185585025824e-07, + "loss": 0.6426, + "step": 792 + }, + { + "epoch": 0.02, + "learning_rate": 1.9711467515824626e-07, + "loss": 0.6557, + "step": 793 + }, + { + "epoch": 0.02, + "learning_rate": 1.9711079181391013e-07, + "loss": 0.6168, + "step": 794 + }, + { + "epoch": 0.02, + "learning_rate": 1.9710690846957397e-07, + "loss": 0.651, + "step": 795 + }, + { + "epoch": 0.02, + "learning_rate": 1.9710302512523784e-07, + "loss": 0.6148, + "step": 796 + }, + { + "epoch": 0.02, + "learning_rate": 1.970991417809017e-07, + "loss": 0.5882, + "step": 797 + }, + { + "epoch": 0.02, + "learning_rate": 1.9709525843656556e-07, + "loss": 0.6436, + "step": 798 + }, + { + "epoch": 0.02, + "learning_rate": 1.970913750922294e-07, + "loss": 0.6298, + "step": 799 + }, + { + "epoch": 0.02, + "learning_rate": 1.9708749174789328e-07, + "loss": 0.6041, + "step": 800 + }, + { + "epoch": 0.02, + "learning_rate": 1.9708360840355712e-07, + "loss": 0.653, + "step": 801 + }, + { + "epoch": 0.02, + "learning_rate": 1.97079725059221e-07, + "loss": 0.6717, + "step": 802 + }, + { + "epoch": 0.02, + "learning_rate": 1.9707584171488484e-07, + "loss": 0.6903, + "step": 803 + }, + { + "epoch": 0.02, + "learning_rate": 1.970719583705487e-07, + "loss": 0.6463, + "step": 804 + }, + { + "epoch": 0.02, + "learning_rate": 1.9706807502621256e-07, + "loss": 0.7157, + "step": 805 + }, + { + "epoch": 0.02, + "learning_rate": 1.9706419168187643e-07, + "loss": 0.6893, + "step": 806 + }, + { + "epoch": 0.02, + "learning_rate": 1.9706030833754027e-07, + "loss": 0.6428, + "step": 807 + }, + { + "epoch": 0.02, + "learning_rate": 1.9705642499320414e-07, + "loss": 0.6242, + "step": 808 + }, + { + "epoch": 0.02, + "learning_rate": 1.97052541648868e-07, + "loss": 0.6309, + "step": 809 + }, + { + "epoch": 0.02, + "learning_rate": 1.9704865830453186e-07, + "loss": 0.6588, + "step": 810 + }, + { + "epoch": 0.02, + "learning_rate": 1.970447749601957e-07, + "loss": 0.5859, + "step": 811 + }, + { + "epoch": 0.02, + "learning_rate": 1.9704089161585958e-07, + "loss": 0.7223, + "step": 812 + }, + { + "epoch": 0.02, + "learning_rate": 1.9703700827152342e-07, + "loss": 0.6133, + "step": 813 + }, + { + "epoch": 0.02, + "learning_rate": 1.970331249271873e-07, + "loss": 0.6376, + "step": 814 + }, + { + "epoch": 0.02, + "learning_rate": 1.9702924158285114e-07, + "loss": 0.7113, + "step": 815 + }, + { + "epoch": 0.02, + "learning_rate": 1.97025358238515e-07, + "loss": 0.7169, + "step": 816 + }, + { + "epoch": 0.02, + "learning_rate": 1.9702147489417885e-07, + "loss": 0.6586, + "step": 817 + }, + { + "epoch": 0.02, + "learning_rate": 1.9701759154984273e-07, + "loss": 0.6743, + "step": 818 + }, + { + "epoch": 0.02, + "learning_rate": 1.9701370820550657e-07, + "loss": 0.7031, + "step": 819 + }, + { + "epoch": 0.02, + "learning_rate": 1.9700982486117044e-07, + "loss": 0.6776, + "step": 820 + }, + { + "epoch": 0.02, + "learning_rate": 1.970059415168343e-07, + "loss": 0.6812, + "step": 821 + }, + { + "epoch": 0.02, + "learning_rate": 1.9700205817249816e-07, + "loss": 0.6628, + "step": 822 + }, + { + "epoch": 0.02, + "learning_rate": 1.96998174828162e-07, + "loss": 0.7094, + "step": 823 + }, + { + "epoch": 0.02, + "learning_rate": 1.9699429148382588e-07, + "loss": 0.6307, + "step": 824 + }, + { + "epoch": 0.02, + "learning_rate": 1.9699040813948972e-07, + "loss": 0.6866, + "step": 825 + }, + { + "epoch": 0.02, + "learning_rate": 1.969865247951536e-07, + "loss": 0.634, + "step": 826 + }, + { + "epoch": 0.02, + "learning_rate": 1.9698264145081744e-07, + "loss": 0.6137, + "step": 827 + }, + { + "epoch": 0.02, + "learning_rate": 1.969787581064813e-07, + "loss": 0.6534, + "step": 828 + }, + { + "epoch": 0.02, + "learning_rate": 1.9697487476214515e-07, + "loss": 0.6536, + "step": 829 + }, + { + "epoch": 0.02, + "learning_rate": 1.9697099141780902e-07, + "loss": 0.6064, + "step": 830 + }, + { + "epoch": 0.02, + "learning_rate": 1.9696710807347287e-07, + "loss": 0.6537, + "step": 831 + }, + { + "epoch": 0.02, + "learning_rate": 1.9696322472913674e-07, + "loss": 0.6503, + "step": 832 + }, + { + "epoch": 0.02, + "learning_rate": 1.9695934138480056e-07, + "loss": 0.7168, + "step": 833 + }, + { + "epoch": 0.02, + "learning_rate": 1.9695545804046443e-07, + "loss": 0.6682, + "step": 834 + }, + { + "epoch": 0.02, + "learning_rate": 1.9695157469612828e-07, + "loss": 0.6622, + "step": 835 + }, + { + "epoch": 0.02, + "learning_rate": 1.9694769135179215e-07, + "loss": 0.6829, + "step": 836 + }, + { + "epoch": 0.02, + "learning_rate": 1.96943808007456e-07, + "loss": 0.6353, + "step": 837 + }, + { + "epoch": 0.02, + "learning_rate": 1.9693992466311986e-07, + "loss": 0.7498, + "step": 838 + }, + { + "epoch": 0.02, + "learning_rate": 1.969360413187837e-07, + "loss": 0.6458, + "step": 839 + }, + { + "epoch": 0.02, + "learning_rate": 1.9693215797444758e-07, + "loss": 0.6468, + "step": 840 + }, + { + "epoch": 0.02, + "learning_rate": 1.9692827463011143e-07, + "loss": 0.5845, + "step": 841 + }, + { + "epoch": 0.02, + "learning_rate": 1.969243912857753e-07, + "loss": 0.6455, + "step": 842 + }, + { + "epoch": 0.02, + "learning_rate": 1.9692050794143914e-07, + "loss": 0.6987, + "step": 843 + }, + { + "epoch": 0.02, + "learning_rate": 1.9691662459710301e-07, + "loss": 0.6254, + "step": 844 + }, + { + "epoch": 0.02, + "learning_rate": 1.9691274125276686e-07, + "loss": 0.6455, + "step": 845 + }, + { + "epoch": 0.02, + "learning_rate": 1.9690885790843073e-07, + "loss": 0.6591, + "step": 846 + }, + { + "epoch": 0.02, + "learning_rate": 1.9690497456409457e-07, + "loss": 0.6848, + "step": 847 + }, + { + "epoch": 0.02, + "learning_rate": 1.9690109121975845e-07, + "loss": 0.6217, + "step": 848 + }, + { + "epoch": 0.02, + "learning_rate": 1.968972078754223e-07, + "loss": 0.6651, + "step": 849 + }, + { + "epoch": 0.02, + "learning_rate": 1.9689332453108616e-07, + "loss": 0.6115, + "step": 850 + }, + { + "epoch": 0.02, + "learning_rate": 1.9688944118675e-07, + "loss": 0.6085, + "step": 851 + }, + { + "epoch": 0.02, + "learning_rate": 1.9688555784241388e-07, + "loss": 0.6147, + "step": 852 + }, + { + "epoch": 0.02, + "learning_rate": 1.9688167449807772e-07, + "loss": 0.5774, + "step": 853 + }, + { + "epoch": 0.02, + "learning_rate": 1.968777911537416e-07, + "loss": 0.6796, + "step": 854 + }, + { + "epoch": 0.02, + "learning_rate": 1.9687390780940544e-07, + "loss": 0.6045, + "step": 855 + }, + { + "epoch": 0.02, + "learning_rate": 1.968700244650693e-07, + "loss": 0.6892, + "step": 856 + }, + { + "epoch": 0.02, + "learning_rate": 1.9686614112073316e-07, + "loss": 0.6296, + "step": 857 + }, + { + "epoch": 0.02, + "learning_rate": 1.9686225777639703e-07, + "loss": 0.624, + "step": 858 + }, + { + "epoch": 0.02, + "learning_rate": 1.9685837443206087e-07, + "loss": 0.6611, + "step": 859 + }, + { + "epoch": 0.02, + "learning_rate": 1.9685449108772475e-07, + "loss": 0.6267, + "step": 860 + }, + { + "epoch": 0.02, + "learning_rate": 1.968506077433886e-07, + "loss": 0.6595, + "step": 861 + }, + { + "epoch": 0.02, + "learning_rate": 1.9684672439905246e-07, + "loss": 0.6222, + "step": 862 + }, + { + "epoch": 0.02, + "learning_rate": 1.968428410547163e-07, + "loss": 0.7085, + "step": 863 + }, + { + "epoch": 0.02, + "learning_rate": 1.9683895771038018e-07, + "loss": 0.5916, + "step": 864 + }, + { + "epoch": 0.02, + "learning_rate": 1.9683507436604402e-07, + "loss": 0.5902, + "step": 865 + }, + { + "epoch": 0.02, + "learning_rate": 1.968311910217079e-07, + "loss": 0.6149, + "step": 866 + }, + { + "epoch": 0.02, + "learning_rate": 1.9682730767737174e-07, + "loss": 0.6321, + "step": 867 + }, + { + "epoch": 0.02, + "learning_rate": 1.968234243330356e-07, + "loss": 0.5982, + "step": 868 + }, + { + "epoch": 0.02, + "learning_rate": 1.9681954098869946e-07, + "loss": 0.6784, + "step": 869 + }, + { + "epoch": 0.02, + "learning_rate": 1.9681565764436333e-07, + "loss": 0.6697, + "step": 870 + }, + { + "epoch": 0.02, + "learning_rate": 1.9681177430002717e-07, + "loss": 0.7077, + "step": 871 + }, + { + "epoch": 0.02, + "learning_rate": 1.9680789095569104e-07, + "loss": 0.602, + "step": 872 + }, + { + "epoch": 0.02, + "learning_rate": 1.968040076113549e-07, + "loss": 0.5915, + "step": 873 + }, + { + "epoch": 0.02, + "learning_rate": 1.9680012426701876e-07, + "loss": 0.545, + "step": 874 + }, + { + "epoch": 0.02, + "learning_rate": 1.967962409226826e-07, + "loss": 0.6807, + "step": 875 + }, + { + "epoch": 0.02, + "learning_rate": 1.9679235757834648e-07, + "loss": 0.6678, + "step": 876 + }, + { + "epoch": 0.02, + "learning_rate": 1.9678847423401032e-07, + "loss": 0.5949, + "step": 877 + }, + { + "epoch": 0.02, + "learning_rate": 1.967845908896742e-07, + "loss": 0.641, + "step": 878 + }, + { + "epoch": 0.02, + "learning_rate": 1.9678070754533804e-07, + "loss": 0.665, + "step": 879 + }, + { + "epoch": 0.02, + "learning_rate": 1.967768242010019e-07, + "loss": 0.6753, + "step": 880 + }, + { + "epoch": 0.02, + "learning_rate": 1.9677294085666576e-07, + "loss": 0.6405, + "step": 881 + }, + { + "epoch": 0.02, + "learning_rate": 1.9676905751232963e-07, + "loss": 0.6008, + "step": 882 + }, + { + "epoch": 0.02, + "learning_rate": 1.9676517416799347e-07, + "loss": 0.573, + "step": 883 + }, + { + "epoch": 0.02, + "learning_rate": 1.9676129082365734e-07, + "loss": 0.5645, + "step": 884 + }, + { + "epoch": 0.02, + "learning_rate": 1.967574074793212e-07, + "loss": 0.6251, + "step": 885 + }, + { + "epoch": 0.02, + "learning_rate": 1.9675352413498506e-07, + "loss": 0.6412, + "step": 886 + }, + { + "epoch": 0.02, + "learning_rate": 1.967496407906489e-07, + "loss": 0.6893, + "step": 887 + }, + { + "epoch": 0.02, + "learning_rate": 1.9674575744631278e-07, + "loss": 0.673, + "step": 888 + }, + { + "epoch": 0.02, + "learning_rate": 1.9674187410197662e-07, + "loss": 0.6608, + "step": 889 + }, + { + "epoch": 0.02, + "learning_rate": 1.967379907576405e-07, + "loss": 0.6429, + "step": 890 + }, + { + "epoch": 0.02, + "learning_rate": 1.967341074133043e-07, + "loss": 0.5909, + "step": 891 + }, + { + "epoch": 0.02, + "learning_rate": 1.9673022406896818e-07, + "loss": 0.6906, + "step": 892 + }, + { + "epoch": 0.02, + "learning_rate": 1.9672634072463203e-07, + "loss": 0.6329, + "step": 893 + }, + { + "epoch": 0.02, + "learning_rate": 1.967224573802959e-07, + "loss": 0.5862, + "step": 894 + }, + { + "epoch": 0.02, + "learning_rate": 1.9671857403595974e-07, + "loss": 0.6024, + "step": 895 + }, + { + "epoch": 0.02, + "learning_rate": 1.9671469069162362e-07, + "loss": 0.6184, + "step": 896 + }, + { + "epoch": 0.02, + "learning_rate": 1.9671080734728746e-07, + "loss": 0.658, + "step": 897 + }, + { + "epoch": 0.02, + "learning_rate": 1.9670692400295133e-07, + "loss": 0.6225, + "step": 898 + }, + { + "epoch": 0.02, + "learning_rate": 1.9670304065861518e-07, + "loss": 0.5927, + "step": 899 + }, + { + "epoch": 0.02, + "learning_rate": 1.9669915731427905e-07, + "loss": 0.6781, + "step": 900 + }, + { + "epoch": 0.02, + "learning_rate": 1.966952739699429e-07, + "loss": 0.6956, + "step": 901 + }, + { + "epoch": 0.02, + "learning_rate": 1.9669139062560677e-07, + "loss": 0.6246, + "step": 902 + }, + { + "epoch": 0.02, + "learning_rate": 1.966875072812706e-07, + "loss": 0.5935, + "step": 903 + }, + { + "epoch": 0.02, + "learning_rate": 1.9668362393693448e-07, + "loss": 0.601, + "step": 904 + }, + { + "epoch": 0.02, + "learning_rate": 1.9667974059259833e-07, + "loss": 0.643, + "step": 905 + }, + { + "epoch": 0.02, + "learning_rate": 1.966758572482622e-07, + "loss": 0.6324, + "step": 906 + }, + { + "epoch": 0.02, + "learning_rate": 1.9667197390392604e-07, + "loss": 0.6415, + "step": 907 + }, + { + "epoch": 0.02, + "learning_rate": 1.9666809055958991e-07, + "loss": 0.5989, + "step": 908 + }, + { + "epoch": 0.02, + "learning_rate": 1.9666420721525376e-07, + "loss": 0.562, + "step": 909 + }, + { + "epoch": 0.02, + "learning_rate": 1.9666032387091763e-07, + "loss": 0.6721, + "step": 910 + }, + { + "epoch": 0.02, + "learning_rate": 1.9665644052658148e-07, + "loss": 0.6525, + "step": 911 + }, + { + "epoch": 0.02, + "learning_rate": 1.9665255718224535e-07, + "loss": 0.6714, + "step": 912 + }, + { + "epoch": 0.02, + "learning_rate": 1.966486738379092e-07, + "loss": 0.6933, + "step": 913 + }, + { + "epoch": 0.02, + "learning_rate": 1.9664479049357306e-07, + "loss": 0.6379, + "step": 914 + }, + { + "epoch": 0.02, + "learning_rate": 1.966409071492369e-07, + "loss": 0.5707, + "step": 915 + }, + { + "epoch": 0.02, + "learning_rate": 1.9663702380490078e-07, + "loss": 0.5396, + "step": 916 + }, + { + "epoch": 0.02, + "learning_rate": 1.9663314046056463e-07, + "loss": 0.5959, + "step": 917 + }, + { + "epoch": 0.02, + "learning_rate": 1.966292571162285e-07, + "loss": 0.6215, + "step": 918 + }, + { + "epoch": 0.02, + "learning_rate": 1.9662537377189234e-07, + "loss": 0.6427, + "step": 919 + }, + { + "epoch": 0.02, + "learning_rate": 1.9662149042755621e-07, + "loss": 0.6299, + "step": 920 + }, + { + "epoch": 0.02, + "learning_rate": 1.9661760708322006e-07, + "loss": 0.6528, + "step": 921 + }, + { + "epoch": 0.02, + "learning_rate": 1.9661372373888393e-07, + "loss": 0.6093, + "step": 922 + }, + { + "epoch": 0.02, + "learning_rate": 1.9660984039454778e-07, + "loss": 0.6489, + "step": 923 + }, + { + "epoch": 0.02, + "learning_rate": 1.9660595705021165e-07, + "loss": 0.5914, + "step": 924 + }, + { + "epoch": 0.02, + "learning_rate": 1.966020737058755e-07, + "loss": 0.6459, + "step": 925 + }, + { + "epoch": 0.02, + "learning_rate": 1.9659819036153936e-07, + "loss": 0.6637, + "step": 926 + }, + { + "epoch": 0.02, + "learning_rate": 1.965943070172032e-07, + "loss": 0.5611, + "step": 927 + }, + { + "epoch": 0.02, + "learning_rate": 1.9659042367286708e-07, + "loss": 0.5957, + "step": 928 + }, + { + "epoch": 0.02, + "learning_rate": 1.9658654032853092e-07, + "loss": 0.6195, + "step": 929 + }, + { + "epoch": 0.02, + "learning_rate": 1.965826569841948e-07, + "loss": 0.5524, + "step": 930 + }, + { + "epoch": 0.02, + "learning_rate": 1.9657877363985864e-07, + "loss": 0.6204, + "step": 931 + }, + { + "epoch": 0.02, + "learning_rate": 1.965748902955225e-07, + "loss": 0.5971, + "step": 932 + }, + { + "epoch": 0.02, + "learning_rate": 1.9657100695118636e-07, + "loss": 0.6876, + "step": 933 + }, + { + "epoch": 0.02, + "learning_rate": 1.9656712360685023e-07, + "loss": 0.71, + "step": 934 + }, + { + "epoch": 0.02, + "learning_rate": 1.9656324026251407e-07, + "loss": 0.6028, + "step": 935 + }, + { + "epoch": 0.02, + "learning_rate": 1.9655935691817792e-07, + "loss": 0.7023, + "step": 936 + }, + { + "epoch": 0.02, + "learning_rate": 1.965554735738418e-07, + "loss": 0.6125, + "step": 937 + }, + { + "epoch": 0.02, + "learning_rate": 1.9655159022950564e-07, + "loss": 0.6824, + "step": 938 + }, + { + "epoch": 0.02, + "learning_rate": 1.965477068851695e-07, + "loss": 0.7023, + "step": 939 + }, + { + "epoch": 0.02, + "learning_rate": 1.9654382354083335e-07, + "loss": 0.5964, + "step": 940 + }, + { + "epoch": 0.02, + "learning_rate": 1.9653994019649722e-07, + "loss": 0.6136, + "step": 941 + }, + { + "epoch": 0.02, + "learning_rate": 1.9653605685216107e-07, + "loss": 0.5546, + "step": 942 + }, + { + "epoch": 0.02, + "learning_rate": 1.9653217350782494e-07, + "loss": 0.5474, + "step": 943 + }, + { + "epoch": 0.02, + "learning_rate": 1.9652829016348878e-07, + "loss": 0.6701, + "step": 944 + }, + { + "epoch": 0.02, + "learning_rate": 1.9652440681915266e-07, + "loss": 0.651, + "step": 945 + }, + { + "epoch": 0.02, + "learning_rate": 1.965205234748165e-07, + "loss": 0.6968, + "step": 946 + }, + { + "epoch": 0.02, + "learning_rate": 1.9651664013048037e-07, + "loss": 0.5917, + "step": 947 + }, + { + "epoch": 0.02, + "learning_rate": 1.9651275678614422e-07, + "loss": 0.6348, + "step": 948 + }, + { + "epoch": 0.02, + "learning_rate": 1.9650887344180806e-07, + "loss": 0.6259, + "step": 949 + }, + { + "epoch": 0.02, + "learning_rate": 1.9650499009747193e-07, + "loss": 0.6077, + "step": 950 + }, + { + "epoch": 0.02, + "learning_rate": 1.9650110675313578e-07, + "loss": 0.6475, + "step": 951 + }, + { + "epoch": 0.02, + "learning_rate": 1.9649722340879965e-07, + "loss": 0.5661, + "step": 952 + }, + { + "epoch": 0.02, + "learning_rate": 1.964933400644635e-07, + "loss": 0.5653, + "step": 953 + }, + { + "epoch": 0.02, + "learning_rate": 1.9648945672012737e-07, + "loss": 0.6656, + "step": 954 + }, + { + "epoch": 0.02, + "learning_rate": 1.964855733757912e-07, + "loss": 0.669, + "step": 955 + }, + { + "epoch": 0.02, + "learning_rate": 1.9648169003145508e-07, + "loss": 0.5525, + "step": 956 + }, + { + "epoch": 0.02, + "learning_rate": 1.9647780668711893e-07, + "loss": 0.5899, + "step": 957 + }, + { + "epoch": 0.02, + "learning_rate": 1.964739233427828e-07, + "loss": 0.6861, + "step": 958 + }, + { + "epoch": 0.02, + "learning_rate": 1.9647003999844665e-07, + "loss": 0.5788, + "step": 959 + }, + { + "epoch": 0.02, + "learning_rate": 1.9646615665411052e-07, + "loss": 0.5749, + "step": 960 + }, + { + "epoch": 0.02, + "learning_rate": 1.9646227330977436e-07, + "loss": 0.5396, + "step": 961 + }, + { + "epoch": 0.02, + "learning_rate": 1.9645838996543823e-07, + "loss": 0.5698, + "step": 962 + }, + { + "epoch": 0.02, + "learning_rate": 1.9645450662110208e-07, + "loss": 0.6205, + "step": 963 + }, + { + "epoch": 0.02, + "learning_rate": 1.9645062327676595e-07, + "loss": 0.6473, + "step": 964 + }, + { + "epoch": 0.02, + "learning_rate": 1.964467399324298e-07, + "loss": 0.5636, + "step": 965 + }, + { + "epoch": 0.02, + "learning_rate": 1.9644285658809364e-07, + "loss": 0.7161, + "step": 966 + }, + { + "epoch": 0.02, + "learning_rate": 1.964389732437575e-07, + "loss": 0.5789, + "step": 967 + }, + { + "epoch": 0.02, + "learning_rate": 1.9643508989942136e-07, + "loss": 0.5924, + "step": 968 + }, + { + "epoch": 0.02, + "learning_rate": 1.9643120655508523e-07, + "loss": 0.6286, + "step": 969 + }, + { + "epoch": 0.02, + "learning_rate": 1.9642732321074907e-07, + "loss": 0.6186, + "step": 970 + }, + { + "epoch": 0.02, + "learning_rate": 1.9642343986641294e-07, + "loss": 0.5825, + "step": 971 + }, + { + "epoch": 0.02, + "learning_rate": 1.964195565220768e-07, + "loss": 0.6532, + "step": 972 + }, + { + "epoch": 0.02, + "learning_rate": 1.9641567317774066e-07, + "loss": 0.6537, + "step": 973 + }, + { + "epoch": 0.02, + "learning_rate": 1.964117898334045e-07, + "loss": 0.6449, + "step": 974 + }, + { + "epoch": 0.02, + "learning_rate": 1.9640790648906838e-07, + "loss": 0.5687, + "step": 975 + }, + { + "epoch": 0.02, + "learning_rate": 1.9640402314473222e-07, + "loss": 0.5985, + "step": 976 + }, + { + "epoch": 0.02, + "learning_rate": 1.964001398003961e-07, + "loss": 0.664, + "step": 977 + }, + { + "epoch": 0.02, + "learning_rate": 1.9639625645605994e-07, + "loss": 0.5035, + "step": 978 + }, + { + "epoch": 0.02, + "learning_rate": 1.963923731117238e-07, + "loss": 0.69, + "step": 979 + }, + { + "epoch": 0.02, + "learning_rate": 1.9638848976738766e-07, + "loss": 0.6388, + "step": 980 + }, + { + "epoch": 0.02, + "learning_rate": 1.9638460642305153e-07, + "loss": 0.6553, + "step": 981 + }, + { + "epoch": 0.02, + "learning_rate": 1.9638072307871537e-07, + "loss": 0.6879, + "step": 982 + }, + { + "epoch": 0.02, + "learning_rate": 1.9637683973437924e-07, + "loss": 0.6038, + "step": 983 + }, + { + "epoch": 0.02, + "learning_rate": 1.963729563900431e-07, + "loss": 0.6197, + "step": 984 + }, + { + "epoch": 0.02, + "learning_rate": 1.9636907304570696e-07, + "loss": 0.6183, + "step": 985 + }, + { + "epoch": 0.02, + "learning_rate": 1.963651897013708e-07, + "loss": 0.5915, + "step": 986 + }, + { + "epoch": 0.02, + "learning_rate": 1.9636130635703468e-07, + "loss": 0.5866, + "step": 987 + }, + { + "epoch": 0.02, + "learning_rate": 1.9635742301269852e-07, + "loss": 0.5544, + "step": 988 + }, + { + "epoch": 0.02, + "learning_rate": 1.963535396683624e-07, + "loss": 0.5554, + "step": 989 + }, + { + "epoch": 0.02, + "learning_rate": 1.9634965632402624e-07, + "loss": 0.6027, + "step": 990 + }, + { + "epoch": 0.02, + "learning_rate": 1.963457729796901e-07, + "loss": 0.5278, + "step": 991 + }, + { + "epoch": 0.02, + "learning_rate": 1.9634188963535395e-07, + "loss": 0.7128, + "step": 992 + }, + { + "epoch": 0.02, + "learning_rate": 1.9633800629101783e-07, + "loss": 0.6272, + "step": 993 + }, + { + "epoch": 0.02, + "learning_rate": 1.9633412294668167e-07, + "loss": 0.5687, + "step": 994 + }, + { + "epoch": 0.02, + "learning_rate": 1.9633023960234554e-07, + "loss": 0.6037, + "step": 995 + }, + { + "epoch": 0.02, + "learning_rate": 1.963263562580094e-07, + "loss": 0.5253, + "step": 996 + }, + { + "epoch": 0.02, + "learning_rate": 1.9632247291367326e-07, + "loss": 0.6947, + "step": 997 + }, + { + "epoch": 0.02, + "learning_rate": 1.963185895693371e-07, + "loss": 0.5688, + "step": 998 + }, + { + "epoch": 0.02, + "learning_rate": 1.9631470622500098e-07, + "loss": 0.6793, + "step": 999 + }, + { + "epoch": 0.02, + "learning_rate": 1.9631082288066482e-07, + "loss": 0.6297, + "step": 1000 + }, + { + "epoch": 0.02, + "learning_rate": 1.963069395363287e-07, + "loss": 0.5829, + "step": 1001 + }, + { + "epoch": 0.02, + "learning_rate": 1.9630305619199254e-07, + "loss": 0.5629, + "step": 1002 + }, + { + "epoch": 0.02, + "learning_rate": 1.962991728476564e-07, + "loss": 0.658, + "step": 1003 + }, + { + "epoch": 0.02, + "learning_rate": 1.9629528950332025e-07, + "loss": 0.6185, + "step": 1004 + }, + { + "epoch": 0.02, + "learning_rate": 1.9629140615898412e-07, + "loss": 0.5517, + "step": 1005 + }, + { + "epoch": 0.02, + "learning_rate": 1.9628752281464797e-07, + "loss": 0.6246, + "step": 1006 + }, + { + "epoch": 0.02, + "learning_rate": 1.9628363947031181e-07, + "loss": 0.5982, + "step": 1007 + }, + { + "epoch": 0.02, + "learning_rate": 1.9627975612597566e-07, + "loss": 0.6407, + "step": 1008 + }, + { + "epoch": 0.02, + "learning_rate": 1.9627587278163953e-07, + "loss": 0.6661, + "step": 1009 + }, + { + "epoch": 0.02, + "learning_rate": 1.9627198943730338e-07, + "loss": 0.7383, + "step": 1010 + }, + { + "epoch": 0.02, + "learning_rate": 1.9626810609296725e-07, + "loss": 0.5973, + "step": 1011 + }, + { + "epoch": 0.02, + "learning_rate": 1.962642227486311e-07, + "loss": 0.5588, + "step": 1012 + }, + { + "epoch": 0.02, + "learning_rate": 1.9626033940429496e-07, + "loss": 0.5558, + "step": 1013 + }, + { + "epoch": 0.02, + "learning_rate": 1.962564560599588e-07, + "loss": 0.5879, + "step": 1014 + }, + { + "epoch": 0.02, + "learning_rate": 1.9625257271562268e-07, + "loss": 0.6282, + "step": 1015 + }, + { + "epoch": 0.02, + "learning_rate": 1.9624868937128653e-07, + "loss": 0.6729, + "step": 1016 + }, + { + "epoch": 0.02, + "learning_rate": 1.962448060269504e-07, + "loss": 0.6281, + "step": 1017 + }, + { + "epoch": 0.02, + "learning_rate": 1.9624092268261424e-07, + "loss": 0.6199, + "step": 1018 + }, + { + "epoch": 0.02, + "learning_rate": 1.9623703933827811e-07, + "loss": 0.5513, + "step": 1019 + }, + { + "epoch": 0.02, + "learning_rate": 1.9623315599394196e-07, + "loss": 0.6335, + "step": 1020 + }, + { + "epoch": 0.02, + "learning_rate": 1.9622927264960583e-07, + "loss": 0.6213, + "step": 1021 + }, + { + "epoch": 0.02, + "learning_rate": 1.9622538930526968e-07, + "loss": 0.6606, + "step": 1022 + }, + { + "epoch": 0.02, + "learning_rate": 1.9622150596093355e-07, + "loss": 0.6325, + "step": 1023 + }, + { + "epoch": 0.02, + "learning_rate": 1.962176226165974e-07, + "loss": 0.5022, + "step": 1024 + }, + { + "epoch": 0.02, + "learning_rate": 1.9621373927226126e-07, + "loss": 0.5916, + "step": 1025 + }, + { + "epoch": 0.02, + "learning_rate": 1.962098559279251e-07, + "loss": 0.5915, + "step": 1026 + }, + { + "epoch": 0.02, + "learning_rate": 1.9620597258358898e-07, + "loss": 0.7067, + "step": 1027 + }, + { + "epoch": 0.02, + "learning_rate": 1.9620208923925282e-07, + "loss": 0.4858, + "step": 1028 + }, + { + "epoch": 0.02, + "learning_rate": 1.961982058949167e-07, + "loss": 0.7296, + "step": 1029 + }, + { + "epoch": 0.02, + "learning_rate": 1.9619432255058054e-07, + "loss": 0.6251, + "step": 1030 + }, + { + "epoch": 0.02, + "learning_rate": 1.961904392062444e-07, + "loss": 0.5529, + "step": 1031 + }, + { + "epoch": 0.02, + "learning_rate": 1.9618655586190826e-07, + "loss": 0.6482, + "step": 1032 + }, + { + "epoch": 0.02, + "learning_rate": 1.9618267251757213e-07, + "loss": 0.5543, + "step": 1033 + }, + { + "epoch": 0.02, + "learning_rate": 1.9617878917323597e-07, + "loss": 0.5329, + "step": 1034 + }, + { + "epoch": 0.02, + "learning_rate": 1.9617490582889985e-07, + "loss": 0.5668, + "step": 1035 + }, + { + "epoch": 0.02, + "learning_rate": 1.961710224845637e-07, + "loss": 0.611, + "step": 1036 + }, + { + "epoch": 0.02, + "learning_rate": 1.9616713914022756e-07, + "loss": 0.6065, + "step": 1037 + }, + { + "epoch": 0.02, + "learning_rate": 1.961632557958914e-07, + "loss": 0.5428, + "step": 1038 + }, + { + "epoch": 0.02, + "learning_rate": 1.9615937245155528e-07, + "loss": 0.5757, + "step": 1039 + }, + { + "epoch": 0.02, + "learning_rate": 1.9615548910721912e-07, + "loss": 0.6154, + "step": 1040 + }, + { + "epoch": 0.02, + "learning_rate": 1.96151605762883e-07, + "loss": 0.6035, + "step": 1041 + }, + { + "epoch": 0.02, + "learning_rate": 1.9614772241854684e-07, + "loss": 0.6039, + "step": 1042 + }, + { + "epoch": 0.02, + "learning_rate": 1.961438390742107e-07, + "loss": 0.6985, + "step": 1043 + }, + { + "epoch": 0.02, + "learning_rate": 1.9613995572987456e-07, + "loss": 0.4895, + "step": 1044 + }, + { + "epoch": 0.02, + "learning_rate": 1.9613607238553843e-07, + "loss": 0.6523, + "step": 1045 + }, + { + "epoch": 0.02, + "learning_rate": 1.9613218904120227e-07, + "loss": 0.5943, + "step": 1046 + }, + { + "epoch": 0.02, + "learning_rate": 1.9612830569686614e-07, + "loss": 0.5543, + "step": 1047 + }, + { + "epoch": 0.02, + "learning_rate": 1.9612442235253e-07, + "loss": 0.5409, + "step": 1048 + }, + { + "epoch": 0.02, + "learning_rate": 1.9612053900819386e-07, + "loss": 0.5295, + "step": 1049 + }, + { + "epoch": 0.02, + "learning_rate": 1.961166556638577e-07, + "loss": 0.6661, + "step": 1050 + }, + { + "epoch": 0.02, + "learning_rate": 1.9611277231952158e-07, + "loss": 0.5839, + "step": 1051 + }, + { + "epoch": 0.02, + "learning_rate": 1.9610888897518542e-07, + "loss": 0.5383, + "step": 1052 + }, + { + "epoch": 0.02, + "learning_rate": 1.961050056308493e-07, + "loss": 0.6183, + "step": 1053 + }, + { + "epoch": 0.02, + "learning_rate": 1.9610112228651314e-07, + "loss": 0.6186, + "step": 1054 + }, + { + "epoch": 0.02, + "learning_rate": 1.96097238942177e-07, + "loss": 0.6558, + "step": 1055 + }, + { + "epoch": 0.02, + "learning_rate": 1.9609335559784086e-07, + "loss": 0.6644, + "step": 1056 + }, + { + "epoch": 0.02, + "learning_rate": 1.9608947225350473e-07, + "loss": 0.5274, + "step": 1057 + }, + { + "epoch": 0.02, + "learning_rate": 1.9608558890916857e-07, + "loss": 0.6028, + "step": 1058 + }, + { + "epoch": 0.02, + "learning_rate": 1.9608170556483244e-07, + "loss": 0.6683, + "step": 1059 + }, + { + "epoch": 0.02, + "learning_rate": 1.960778222204963e-07, + "loss": 0.5463, + "step": 1060 + }, + { + "epoch": 0.02, + "learning_rate": 1.9607393887616016e-07, + "loss": 0.4945, + "step": 1061 + }, + { + "epoch": 0.02, + "learning_rate": 1.96070055531824e-07, + "loss": 0.4943, + "step": 1062 + }, + { + "epoch": 0.02, + "learning_rate": 1.9606617218748788e-07, + "loss": 0.7208, + "step": 1063 + }, + { + "epoch": 0.02, + "learning_rate": 1.9606228884315172e-07, + "loss": 0.7569, + "step": 1064 + }, + { + "epoch": 0.02, + "learning_rate": 1.9605840549881557e-07, + "loss": 0.6626, + "step": 1065 + }, + { + "epoch": 0.02, + "learning_rate": 1.960545221544794e-07, + "loss": 0.6508, + "step": 1066 + }, + { + "epoch": 0.02, + "learning_rate": 1.9605063881014328e-07, + "loss": 0.5627, + "step": 1067 + }, + { + "epoch": 0.02, + "learning_rate": 1.9604675546580713e-07, + "loss": 0.6829, + "step": 1068 + }, + { + "epoch": 0.02, + "learning_rate": 1.96042872121471e-07, + "loss": 0.6678, + "step": 1069 + }, + { + "epoch": 0.02, + "learning_rate": 1.9603898877713484e-07, + "loss": 0.6358, + "step": 1070 + }, + { + "epoch": 0.02, + "learning_rate": 1.9603510543279872e-07, + "loss": 0.5889, + "step": 1071 + }, + { + "epoch": 0.02, + "learning_rate": 1.9603122208846256e-07, + "loss": 0.4978, + "step": 1072 + }, + { + "epoch": 0.02, + "learning_rate": 1.9602733874412643e-07, + "loss": 0.5195, + "step": 1073 + }, + { + "epoch": 0.02, + "learning_rate": 1.9602345539979028e-07, + "loss": 0.5856, + "step": 1074 + }, + { + "epoch": 0.02, + "learning_rate": 1.9601957205545415e-07, + "loss": 0.5907, + "step": 1075 + }, + { + "epoch": 0.02, + "learning_rate": 1.96015688711118e-07, + "loss": 0.5659, + "step": 1076 + }, + { + "epoch": 0.02, + "learning_rate": 1.9601180536678187e-07, + "loss": 0.5851, + "step": 1077 + }, + { + "epoch": 0.02, + "learning_rate": 1.960079220224457e-07, + "loss": 0.5744, + "step": 1078 + }, + { + "epoch": 0.02, + "learning_rate": 1.9600403867810958e-07, + "loss": 0.5789, + "step": 1079 + }, + { + "epoch": 0.02, + "learning_rate": 1.9600015533377343e-07, + "loss": 0.5517, + "step": 1080 + }, + { + "epoch": 0.02, + "learning_rate": 1.959962719894373e-07, + "loss": 0.5443, + "step": 1081 + }, + { + "epoch": 0.02, + "learning_rate": 1.9599238864510114e-07, + "loss": 0.5636, + "step": 1082 + }, + { + "epoch": 0.02, + "learning_rate": 1.9598850530076501e-07, + "loss": 0.6291, + "step": 1083 + }, + { + "epoch": 0.02, + "learning_rate": 1.9598462195642886e-07, + "loss": 0.6094, + "step": 1084 + }, + { + "epoch": 0.02, + "learning_rate": 1.9598073861209273e-07, + "loss": 0.5609, + "step": 1085 + }, + { + "epoch": 0.02, + "learning_rate": 1.9597685526775658e-07, + "loss": 0.544, + "step": 1086 + }, + { + "epoch": 0.02, + "learning_rate": 1.9597297192342045e-07, + "loss": 0.6399, + "step": 1087 + }, + { + "epoch": 0.02, + "learning_rate": 1.959690885790843e-07, + "loss": 0.5276, + "step": 1088 + }, + { + "epoch": 0.02, + "learning_rate": 1.9596520523474816e-07, + "loss": 0.6434, + "step": 1089 + }, + { + "epoch": 0.02, + "learning_rate": 1.95961321890412e-07, + "loss": 0.6124, + "step": 1090 + }, + { + "epoch": 0.02, + "learning_rate": 1.9595743854607588e-07, + "loss": 0.5113, + "step": 1091 + }, + { + "epoch": 0.02, + "learning_rate": 1.9595355520173973e-07, + "loss": 0.5301, + "step": 1092 + }, + { + "epoch": 0.02, + "learning_rate": 1.959496718574036e-07, + "loss": 0.5334, + "step": 1093 + }, + { + "epoch": 0.02, + "learning_rate": 1.9594578851306744e-07, + "loss": 0.6016, + "step": 1094 + }, + { + "epoch": 0.02, + "learning_rate": 1.9594190516873131e-07, + "loss": 0.5698, + "step": 1095 + }, + { + "epoch": 0.02, + "learning_rate": 1.9593802182439516e-07, + "loss": 0.5657, + "step": 1096 + }, + { + "epoch": 0.02, + "learning_rate": 1.9593413848005903e-07, + "loss": 0.568, + "step": 1097 + }, + { + "epoch": 0.02, + "learning_rate": 1.9593025513572288e-07, + "loss": 0.5551, + "step": 1098 + }, + { + "epoch": 0.02, + "learning_rate": 1.9592637179138675e-07, + "loss": 0.6039, + "step": 1099 + }, + { + "epoch": 0.02, + "learning_rate": 1.959224884470506e-07, + "loss": 0.6194, + "step": 1100 + }, + { + "epoch": 0.02, + "learning_rate": 1.9591860510271446e-07, + "loss": 0.7669, + "step": 1101 + }, + { + "epoch": 0.02, + "learning_rate": 1.959147217583783e-07, + "loss": 0.5264, + "step": 1102 + }, + { + "epoch": 0.02, + "learning_rate": 1.9591083841404218e-07, + "loss": 0.5648, + "step": 1103 + }, + { + "epoch": 0.02, + "learning_rate": 1.9590695506970602e-07, + "loss": 0.5575, + "step": 1104 + }, + { + "epoch": 0.02, + "learning_rate": 1.959030717253699e-07, + "loss": 0.6209, + "step": 1105 + }, + { + "epoch": 0.02, + "learning_rate": 1.9589918838103374e-07, + "loss": 0.4894, + "step": 1106 + }, + { + "epoch": 0.02, + "learning_rate": 1.958953050366976e-07, + "loss": 0.6, + "step": 1107 + }, + { + "epoch": 0.02, + "learning_rate": 1.9589142169236146e-07, + "loss": 0.6555, + "step": 1108 + }, + { + "epoch": 0.02, + "learning_rate": 1.9588753834802533e-07, + "loss": 0.5194, + "step": 1109 + }, + { + "epoch": 0.02, + "learning_rate": 1.9588365500368917e-07, + "loss": 0.442, + "step": 1110 + }, + { + "epoch": 0.02, + "learning_rate": 1.9587977165935305e-07, + "loss": 0.4973, + "step": 1111 + }, + { + "epoch": 0.02, + "learning_rate": 1.958758883150169e-07, + "loss": 0.5446, + "step": 1112 + }, + { + "epoch": 0.02, + "learning_rate": 1.9587200497068074e-07, + "loss": 0.5716, + "step": 1113 + }, + { + "epoch": 0.02, + "learning_rate": 1.958681216263446e-07, + "loss": 0.5013, + "step": 1114 + }, + { + "epoch": 0.02, + "learning_rate": 1.9586423828200845e-07, + "loss": 0.6008, + "step": 1115 + }, + { + "epoch": 0.02, + "learning_rate": 1.9586035493767232e-07, + "loss": 0.5274, + "step": 1116 + }, + { + "epoch": 0.02, + "learning_rate": 1.9585647159333617e-07, + "loss": 0.5799, + "step": 1117 + }, + { + "epoch": 0.02, + "learning_rate": 1.9585258824900004e-07, + "loss": 0.4861, + "step": 1118 + }, + { + "epoch": 0.02, + "learning_rate": 1.9584870490466389e-07, + "loss": 0.5147, + "step": 1119 + }, + { + "epoch": 0.02, + "learning_rate": 1.9584482156032776e-07, + "loss": 0.6322, + "step": 1120 + }, + { + "epoch": 0.02, + "learning_rate": 1.958409382159916e-07, + "loss": 0.5919, + "step": 1121 + }, + { + "epoch": 0.02, + "learning_rate": 1.9583705487165547e-07, + "loss": 0.4783, + "step": 1122 + }, + { + "epoch": 0.02, + "learning_rate": 1.9583317152731932e-07, + "loss": 0.6555, + "step": 1123 + }, + { + "epoch": 0.02, + "learning_rate": 1.9582928818298316e-07, + "loss": 0.4693, + "step": 1124 + }, + { + "epoch": 0.02, + "learning_rate": 1.9582540483864703e-07, + "loss": 0.5443, + "step": 1125 + }, + { + "epoch": 0.02, + "learning_rate": 1.9582152149431088e-07, + "loss": 0.4811, + "step": 1126 + }, + { + "epoch": 0.02, + "learning_rate": 1.9581763814997475e-07, + "loss": 0.58, + "step": 1127 + }, + { + "epoch": 0.02, + "learning_rate": 1.958137548056386e-07, + "loss": 0.6363, + "step": 1128 + }, + { + "epoch": 0.02, + "learning_rate": 1.9580987146130247e-07, + "loss": 0.5795, + "step": 1129 + }, + { + "epoch": 0.02, + "learning_rate": 1.958059881169663e-07, + "loss": 0.6275, + "step": 1130 + }, + { + "epoch": 0.02, + "learning_rate": 1.9580210477263018e-07, + "loss": 0.6084, + "step": 1131 + }, + { + "epoch": 0.02, + "learning_rate": 1.9579822142829403e-07, + "loss": 0.5415, + "step": 1132 + }, + { + "epoch": 0.02, + "learning_rate": 1.957943380839579e-07, + "loss": 0.5306, + "step": 1133 + }, + { + "epoch": 0.02, + "learning_rate": 1.9579045473962175e-07, + "loss": 0.6143, + "step": 1134 + }, + { + "epoch": 0.02, + "learning_rate": 1.9578657139528562e-07, + "loss": 0.6389, + "step": 1135 + }, + { + "epoch": 0.02, + "learning_rate": 1.9578268805094946e-07, + "loss": 0.5535, + "step": 1136 + }, + { + "epoch": 0.02, + "learning_rate": 1.9577880470661333e-07, + "loss": 0.5886, + "step": 1137 + }, + { + "epoch": 0.02, + "learning_rate": 1.9577492136227718e-07, + "loss": 0.5227, + "step": 1138 + }, + { + "epoch": 0.02, + "learning_rate": 1.9577103801794105e-07, + "loss": 0.6129, + "step": 1139 + }, + { + "epoch": 0.02, + "learning_rate": 1.957671546736049e-07, + "loss": 0.5765, + "step": 1140 + }, + { + "epoch": 0.02, + "learning_rate": 1.9576327132926877e-07, + "loss": 0.5499, + "step": 1141 + }, + { + "epoch": 0.02, + "learning_rate": 1.957593879849326e-07, + "loss": 0.5496, + "step": 1142 + }, + { + "epoch": 0.02, + "learning_rate": 1.9575550464059646e-07, + "loss": 0.6292, + "step": 1143 + }, + { + "epoch": 0.02, + "learning_rate": 1.9575162129626033e-07, + "loss": 0.6451, + "step": 1144 + }, + { + "epoch": 0.02, + "learning_rate": 1.9574773795192417e-07, + "loss": 0.6346, + "step": 1145 + }, + { + "epoch": 0.02, + "learning_rate": 1.9574385460758804e-07, + "loss": 0.4696, + "step": 1146 + }, + { + "epoch": 0.02, + "learning_rate": 1.957399712632519e-07, + "loss": 0.4832, + "step": 1147 + }, + { + "epoch": 0.02, + "learning_rate": 1.9573608791891576e-07, + "loss": 0.6206, + "step": 1148 + }, + { + "epoch": 0.02, + "learning_rate": 1.957322045745796e-07, + "loss": 0.4448, + "step": 1149 + }, + { + "epoch": 0.02, + "learning_rate": 1.9572832123024348e-07, + "loss": 0.5954, + "step": 1150 + }, + { + "epoch": 0.02, + "learning_rate": 1.9572443788590732e-07, + "loss": 0.5967, + "step": 1151 + }, + { + "epoch": 0.02, + "learning_rate": 1.957205545415712e-07, + "loss": 0.5695, + "step": 1152 + }, + { + "epoch": 0.02, + "learning_rate": 1.9571667119723504e-07, + "loss": 0.6347, + "step": 1153 + }, + { + "epoch": 0.02, + "learning_rate": 1.957127878528989e-07, + "loss": 0.5643, + "step": 1154 + }, + { + "epoch": 0.02, + "learning_rate": 1.9570890450856276e-07, + "loss": 0.6014, + "step": 1155 + }, + { + "epoch": 0.02, + "learning_rate": 1.9570502116422663e-07, + "loss": 0.6664, + "step": 1156 + }, + { + "epoch": 0.02, + "learning_rate": 1.9570113781989047e-07, + "loss": 0.4595, + "step": 1157 + }, + { + "epoch": 0.02, + "learning_rate": 1.9569725447555434e-07, + "loss": 0.4972, + "step": 1158 + }, + { + "epoch": 0.02, + "learning_rate": 1.956933711312182e-07, + "loss": 0.6396, + "step": 1159 + }, + { + "epoch": 0.02, + "learning_rate": 1.9568948778688206e-07, + "loss": 0.4224, + "step": 1160 + }, + { + "epoch": 0.02, + "learning_rate": 1.956856044425459e-07, + "loss": 0.6182, + "step": 1161 + }, + { + "epoch": 0.02, + "learning_rate": 1.9568172109820978e-07, + "loss": 0.5678, + "step": 1162 + }, + { + "epoch": 0.02, + "learning_rate": 1.9567783775387362e-07, + "loss": 0.4623, + "step": 1163 + }, + { + "epoch": 0.02, + "learning_rate": 1.956739544095375e-07, + "loss": 0.4669, + "step": 1164 + }, + { + "epoch": 0.02, + "learning_rate": 1.9567007106520134e-07, + "loss": 0.6243, + "step": 1165 + }, + { + "epoch": 0.02, + "learning_rate": 1.956661877208652e-07, + "loss": 0.5934, + "step": 1166 + }, + { + "epoch": 0.02, + "learning_rate": 1.9566230437652905e-07, + "loss": 0.5395, + "step": 1167 + }, + { + "epoch": 0.02, + "learning_rate": 1.9565842103219293e-07, + "loss": 0.5308, + "step": 1168 + }, + { + "epoch": 0.02, + "learning_rate": 1.9565453768785677e-07, + "loss": 0.5827, + "step": 1169 + }, + { + "epoch": 0.02, + "learning_rate": 1.9565065434352064e-07, + "loss": 0.4766, + "step": 1170 + }, + { + "epoch": 0.02, + "learning_rate": 1.956467709991845e-07, + "loss": 0.5746, + "step": 1171 + }, + { + "epoch": 0.02, + "learning_rate": 1.9564288765484836e-07, + "loss": 0.562, + "step": 1172 + }, + { + "epoch": 0.02, + "learning_rate": 1.956390043105122e-07, + "loss": 0.6079, + "step": 1173 + }, + { + "epoch": 0.02, + "learning_rate": 1.9563512096617608e-07, + "loss": 0.5653, + "step": 1174 + }, + { + "epoch": 0.02, + "learning_rate": 1.9563123762183992e-07, + "loss": 0.5176, + "step": 1175 + }, + { + "epoch": 0.02, + "learning_rate": 1.956273542775038e-07, + "loss": 0.5444, + "step": 1176 + }, + { + "epoch": 0.02, + "learning_rate": 1.9562347093316764e-07, + "loss": 0.5631, + "step": 1177 + }, + { + "epoch": 0.02, + "learning_rate": 1.956195875888315e-07, + "loss": 0.5144, + "step": 1178 + }, + { + "epoch": 0.02, + "learning_rate": 1.9561570424449535e-07, + "loss": 0.4081, + "step": 1179 + }, + { + "epoch": 0.02, + "learning_rate": 1.9561182090015922e-07, + "loss": 0.505, + "step": 1180 + }, + { + "epoch": 0.02, + "learning_rate": 1.9560793755582304e-07, + "loss": 0.4751, + "step": 1181 + }, + { + "epoch": 0.02, + "learning_rate": 1.9560405421148691e-07, + "loss": 0.5481, + "step": 1182 + }, + { + "epoch": 0.02, + "learning_rate": 1.9560017086715076e-07, + "loss": 0.5768, + "step": 1183 + }, + { + "epoch": 0.02, + "learning_rate": 1.9559628752281463e-07, + "loss": 0.4796, + "step": 1184 + }, + { + "epoch": 0.02, + "learning_rate": 1.9559240417847848e-07, + "loss": 0.5584, + "step": 1185 + }, + { + "epoch": 0.02, + "learning_rate": 1.9558852083414235e-07, + "loss": 0.6131, + "step": 1186 + }, + { + "epoch": 0.02, + "learning_rate": 1.955846374898062e-07, + "loss": 0.483, + "step": 1187 + }, + { + "epoch": 0.02, + "learning_rate": 1.9558075414547006e-07, + "loss": 0.6189, + "step": 1188 + }, + { + "epoch": 0.02, + "learning_rate": 1.955768708011339e-07, + "loss": 0.4697, + "step": 1189 + }, + { + "epoch": 0.02, + "learning_rate": 1.9557298745679778e-07, + "loss": 0.6745, + "step": 1190 + }, + { + "epoch": 0.02, + "learning_rate": 1.9556910411246163e-07, + "loss": 0.5505, + "step": 1191 + }, + { + "epoch": 0.02, + "learning_rate": 1.955652207681255e-07, + "loss": 0.6005, + "step": 1192 + }, + { + "epoch": 0.02, + "learning_rate": 1.9556133742378934e-07, + "loss": 0.508, + "step": 1193 + }, + { + "epoch": 0.02, + "learning_rate": 1.9555745407945321e-07, + "loss": 0.6201, + "step": 1194 + }, + { + "epoch": 0.02, + "learning_rate": 1.9555357073511706e-07, + "loss": 0.7872, + "step": 1195 + }, + { + "epoch": 0.02, + "learning_rate": 1.9554968739078093e-07, + "loss": 0.5817, + "step": 1196 + }, + { + "epoch": 0.02, + "learning_rate": 1.9554580404644478e-07, + "loss": 0.5712, + "step": 1197 + }, + { + "epoch": 0.02, + "learning_rate": 1.9554192070210865e-07, + "loss": 0.4869, + "step": 1198 + }, + { + "epoch": 0.02, + "learning_rate": 1.955380373577725e-07, + "loss": 0.5601, + "step": 1199 + }, + { + "epoch": 0.02, + "learning_rate": 1.9553415401343636e-07, + "loss": 0.4847, + "step": 1200 + }, + { + "epoch": 0.02, + "learning_rate": 1.955302706691002e-07, + "loss": 0.5267, + "step": 1201 + }, + { + "epoch": 0.02, + "learning_rate": 1.9552638732476408e-07, + "loss": 0.5472, + "step": 1202 + }, + { + "epoch": 0.02, + "learning_rate": 1.9552250398042792e-07, + "loss": 0.5358, + "step": 1203 + }, + { + "epoch": 0.02, + "learning_rate": 1.955186206360918e-07, + "loss": 0.533, + "step": 1204 + }, + { + "epoch": 0.02, + "learning_rate": 1.9551473729175564e-07, + "loss": 0.3856, + "step": 1205 + }, + { + "epoch": 0.02, + "learning_rate": 1.955108539474195e-07, + "loss": 0.4928, + "step": 1206 + }, + { + "epoch": 0.02, + "learning_rate": 1.9550697060308336e-07, + "loss": 0.5801, + "step": 1207 + }, + { + "epoch": 0.02, + "learning_rate": 1.9550308725874723e-07, + "loss": 0.5113, + "step": 1208 + }, + { + "epoch": 0.02, + "learning_rate": 1.9549920391441107e-07, + "loss": 0.5366, + "step": 1209 + }, + { + "epoch": 0.02, + "learning_rate": 1.9549532057007495e-07, + "loss": 0.4881, + "step": 1210 + }, + { + "epoch": 0.02, + "learning_rate": 1.954914372257388e-07, + "loss": 0.511, + "step": 1211 + }, + { + "epoch": 0.02, + "learning_rate": 1.9548755388140266e-07, + "loss": 0.5413, + "step": 1212 + }, + { + "epoch": 0.02, + "learning_rate": 1.954836705370665e-07, + "loss": 0.4405, + "step": 1213 + }, + { + "epoch": 0.02, + "learning_rate": 1.9547978719273038e-07, + "loss": 0.4855, + "step": 1214 + }, + { + "epoch": 0.02, + "learning_rate": 1.9547590384839422e-07, + "loss": 0.5012, + "step": 1215 + }, + { + "epoch": 0.02, + "learning_rate": 1.954720205040581e-07, + "loss": 0.4589, + "step": 1216 + }, + { + "epoch": 0.02, + "learning_rate": 1.9546813715972194e-07, + "loss": 0.632, + "step": 1217 + }, + { + "epoch": 0.02, + "learning_rate": 1.954642538153858e-07, + "loss": 0.4607, + "step": 1218 + }, + { + "epoch": 0.02, + "learning_rate": 1.9546037047104966e-07, + "loss": 0.7469, + "step": 1219 + }, + { + "epoch": 0.02, + "learning_rate": 1.9545648712671353e-07, + "loss": 0.3406, + "step": 1220 + }, + { + "epoch": 0.02, + "learning_rate": 1.9545260378237737e-07, + "loss": 0.5921, + "step": 1221 + }, + { + "epoch": 0.02, + "learning_rate": 1.9544872043804124e-07, + "loss": 0.5116, + "step": 1222 + }, + { + "epoch": 0.02, + "learning_rate": 1.954448370937051e-07, + "loss": 0.5171, + "step": 1223 + }, + { + "epoch": 0.02, + "learning_rate": 1.9544095374936896e-07, + "loss": 0.5957, + "step": 1224 + }, + { + "epoch": 0.02, + "learning_rate": 1.954370704050328e-07, + "loss": 0.5217, + "step": 1225 + }, + { + "epoch": 0.02, + "learning_rate": 1.9543318706069668e-07, + "loss": 0.5134, + "step": 1226 + }, + { + "epoch": 0.02, + "learning_rate": 1.9542930371636052e-07, + "loss": 0.5206, + "step": 1227 + }, + { + "epoch": 0.02, + "learning_rate": 1.954254203720244e-07, + "loss": 0.5978, + "step": 1228 + }, + { + "epoch": 0.02, + "learning_rate": 1.9542153702768824e-07, + "loss": 0.5281, + "step": 1229 + }, + { + "epoch": 0.02, + "learning_rate": 1.954176536833521e-07, + "loss": 0.4691, + "step": 1230 + }, + { + "epoch": 0.02, + "learning_rate": 1.9541377033901596e-07, + "loss": 0.6706, + "step": 1231 + }, + { + "epoch": 0.02, + "learning_rate": 1.9540988699467983e-07, + "loss": 0.5207, + "step": 1232 + }, + { + "epoch": 0.02, + "learning_rate": 1.9540600365034367e-07, + "loss": 0.5839, + "step": 1233 + }, + { + "epoch": 0.02, + "learning_rate": 1.9540212030600754e-07, + "loss": 0.4831, + "step": 1234 + }, + { + "epoch": 0.02, + "learning_rate": 1.953982369616714e-07, + "loss": 0.4549, + "step": 1235 + }, + { + "epoch": 0.02, + "learning_rate": 1.9539435361733526e-07, + "loss": 0.6418, + "step": 1236 + }, + { + "epoch": 0.02, + "learning_rate": 1.953904702729991e-07, + "loss": 0.4934, + "step": 1237 + }, + { + "epoch": 0.02, + "learning_rate": 1.9538658692866298e-07, + "loss": 0.401, + "step": 1238 + }, + { + "epoch": 0.02, + "learning_rate": 1.953827035843268e-07, + "loss": 0.6183, + "step": 1239 + }, + { + "epoch": 0.02, + "learning_rate": 1.9537882023999067e-07, + "loss": 0.4597, + "step": 1240 + }, + { + "epoch": 0.02, + "learning_rate": 1.953749368956545e-07, + "loss": 0.637, + "step": 1241 + }, + { + "epoch": 0.02, + "learning_rate": 1.9537105355131838e-07, + "loss": 0.594, + "step": 1242 + }, + { + "epoch": 0.02, + "learning_rate": 1.9536717020698223e-07, + "loss": 0.5762, + "step": 1243 + }, + { + "epoch": 0.02, + "learning_rate": 1.953632868626461e-07, + "loss": 0.5967, + "step": 1244 + }, + { + "epoch": 0.02, + "learning_rate": 1.9535940351830994e-07, + "loss": 0.5533, + "step": 1245 + }, + { + "epoch": 0.02, + "learning_rate": 1.9535552017397382e-07, + "loss": 0.4135, + "step": 1246 + }, + { + "epoch": 0.02, + "learning_rate": 1.9535163682963766e-07, + "loss": 0.5858, + "step": 1247 + }, + { + "epoch": 0.02, + "learning_rate": 1.9534775348530153e-07, + "loss": 0.3802, + "step": 1248 + }, + { + "epoch": 0.02, + "learning_rate": 1.9534387014096538e-07, + "loss": 0.4803, + "step": 1249 + }, + { + "epoch": 0.02, + "learning_rate": 1.9533998679662925e-07, + "loss": 0.4329, + "step": 1250 + }, + { + "epoch": 0.02, + "learning_rate": 1.953361034522931e-07, + "loss": 0.494, + "step": 1251 + }, + { + "epoch": 0.02, + "learning_rate": 1.9533222010795697e-07, + "loss": 0.6552, + "step": 1252 + }, + { + "epoch": 0.02, + "learning_rate": 1.953283367636208e-07, + "loss": 0.4856, + "step": 1253 + }, + { + "epoch": 0.02, + "learning_rate": 1.9532445341928468e-07, + "loss": 0.5285, + "step": 1254 + }, + { + "epoch": 0.02, + "learning_rate": 1.9532057007494853e-07, + "loss": 0.4788, + "step": 1255 + }, + { + "epoch": 0.02, + "learning_rate": 1.953166867306124e-07, + "loss": 0.5472, + "step": 1256 + }, + { + "epoch": 0.02, + "learning_rate": 1.9531280338627624e-07, + "loss": 0.6273, + "step": 1257 + }, + { + "epoch": 0.02, + "learning_rate": 1.9530892004194011e-07, + "loss": 0.4935, + "step": 1258 + }, + { + "epoch": 0.02, + "learning_rate": 1.9530503669760396e-07, + "loss": 0.514, + "step": 1259 + }, + { + "epoch": 0.02, + "learning_rate": 1.9530115335326783e-07, + "loss": 0.4231, + "step": 1260 + }, + { + "epoch": 0.02, + "learning_rate": 1.9529727000893168e-07, + "loss": 0.5481, + "step": 1261 + }, + { + "epoch": 0.02, + "learning_rate": 1.9529338666459555e-07, + "loss": 0.597, + "step": 1262 + }, + { + "epoch": 0.02, + "learning_rate": 1.952895033202594e-07, + "loss": 0.419, + "step": 1263 + }, + { + "epoch": 0.02, + "learning_rate": 1.9528561997592326e-07, + "loss": 0.5739, + "step": 1264 + }, + { + "epoch": 0.02, + "learning_rate": 1.952817366315871e-07, + "loss": 0.4123, + "step": 1265 + }, + { + "epoch": 0.02, + "learning_rate": 1.9527785328725098e-07, + "loss": 0.5623, + "step": 1266 + }, + { + "epoch": 0.02, + "learning_rate": 1.9527396994291483e-07, + "loss": 0.5959, + "step": 1267 + }, + { + "epoch": 0.02, + "learning_rate": 1.952700865985787e-07, + "loss": 0.4732, + "step": 1268 + }, + { + "epoch": 0.02, + "learning_rate": 1.9526620325424254e-07, + "loss": 0.5172, + "step": 1269 + }, + { + "epoch": 0.02, + "learning_rate": 1.9526231990990641e-07, + "loss": 0.4691, + "step": 1270 + }, + { + "epoch": 0.02, + "learning_rate": 1.9525843656557026e-07, + "loss": 0.5564, + "step": 1271 + }, + { + "epoch": 0.02, + "learning_rate": 1.9525455322123413e-07, + "loss": 0.6489, + "step": 1272 + }, + { + "epoch": 0.02, + "learning_rate": 1.9525066987689798e-07, + "loss": 0.4726, + "step": 1273 + }, + { + "epoch": 0.02, + "learning_rate": 1.9524678653256185e-07, + "loss": 0.4096, + "step": 1274 + }, + { + "epoch": 0.02, + "learning_rate": 1.952429031882257e-07, + "loss": 0.7683, + "step": 1275 + }, + { + "epoch": 0.02, + "learning_rate": 1.9523901984388956e-07, + "loss": 0.5003, + "step": 1276 + }, + { + "epoch": 0.02, + "learning_rate": 1.952351364995534e-07, + "loss": 0.4839, + "step": 1277 + }, + { + "epoch": 0.02, + "learning_rate": 1.9523125315521728e-07, + "loss": 0.4727, + "step": 1278 + }, + { + "epoch": 0.02, + "learning_rate": 1.9522736981088112e-07, + "loss": 0.5791, + "step": 1279 + }, + { + "epoch": 0.02, + "learning_rate": 1.95223486466545e-07, + "loss": 0.5156, + "step": 1280 + }, + { + "epoch": 0.02, + "learning_rate": 1.9521960312220884e-07, + "loss": 0.4962, + "step": 1281 + }, + { + "epoch": 0.02, + "learning_rate": 1.952157197778727e-07, + "loss": 0.4269, + "step": 1282 + }, + { + "epoch": 0.02, + "learning_rate": 1.9521183643353656e-07, + "loss": 0.4781, + "step": 1283 + }, + { + "epoch": 0.02, + "learning_rate": 1.9520795308920043e-07, + "loss": 0.5362, + "step": 1284 + }, + { + "epoch": 0.02, + "learning_rate": 1.9520406974486427e-07, + "loss": 0.5826, + "step": 1285 + }, + { + "epoch": 0.02, + "learning_rate": 1.9520018640052815e-07, + "loss": 0.5519, + "step": 1286 + }, + { + "epoch": 0.02, + "learning_rate": 1.95196303056192e-07, + "loss": 0.4723, + "step": 1287 + }, + { + "epoch": 0.02, + "learning_rate": 1.9519241971185586e-07, + "loss": 0.5387, + "step": 1288 + }, + { + "epoch": 0.03, + "learning_rate": 1.951885363675197e-07, + "loss": 0.4941, + "step": 1289 + }, + { + "epoch": 0.03, + "learning_rate": 1.9518465302318355e-07, + "loss": 0.6409, + "step": 1290 + }, + { + "epoch": 0.03, + "learning_rate": 1.9518076967884742e-07, + "loss": 0.4445, + "step": 1291 + }, + { + "epoch": 0.03, + "learning_rate": 1.9517688633451127e-07, + "loss": 0.5846, + "step": 1292 + }, + { + "epoch": 0.03, + "learning_rate": 1.9517300299017514e-07, + "loss": 0.4093, + "step": 1293 + }, + { + "epoch": 0.03, + "learning_rate": 1.9516911964583899e-07, + "loss": 0.6023, + "step": 1294 + }, + { + "epoch": 0.03, + "learning_rate": 1.9516523630150286e-07, + "loss": 0.4843, + "step": 1295 + }, + { + "epoch": 0.03, + "learning_rate": 1.951613529571667e-07, + "loss": 0.6982, + "step": 1296 + }, + { + "epoch": 0.03, + "learning_rate": 1.9515746961283055e-07, + "loss": 0.453, + "step": 1297 + }, + { + "epoch": 0.03, + "learning_rate": 1.9515358626849442e-07, + "loss": 0.4869, + "step": 1298 + }, + { + "epoch": 0.03, + "learning_rate": 1.9514970292415826e-07, + "loss": 0.4412, + "step": 1299 + }, + { + "epoch": 0.03, + "learning_rate": 1.9514581957982213e-07, + "loss": 0.3838, + "step": 1300 + }, + { + "epoch": 0.03, + "learning_rate": 1.9514193623548598e-07, + "loss": 0.4944, + "step": 1301 + }, + { + "epoch": 0.03, + "learning_rate": 1.9513805289114985e-07, + "loss": 0.4932, + "step": 1302 + }, + { + "epoch": 0.03, + "learning_rate": 1.951341695468137e-07, + "loss": 0.5697, + "step": 1303 + }, + { + "epoch": 0.03, + "learning_rate": 1.9513028620247757e-07, + "loss": 0.4816, + "step": 1304 + }, + { + "epoch": 0.03, + "learning_rate": 1.951264028581414e-07, + "loss": 0.4931, + "step": 1305 + }, + { + "epoch": 0.03, + "learning_rate": 1.9512251951380528e-07, + "loss": 0.4175, + "step": 1306 + }, + { + "epoch": 0.03, + "learning_rate": 1.9511863616946913e-07, + "loss": 0.616, + "step": 1307 + }, + { + "epoch": 0.03, + "learning_rate": 1.95114752825133e-07, + "loss": 0.4516, + "step": 1308 + }, + { + "epoch": 0.03, + "learning_rate": 1.9511086948079685e-07, + "loss": 0.3801, + "step": 1309 + }, + { + "epoch": 0.03, + "learning_rate": 1.9510698613646072e-07, + "loss": 0.49, + "step": 1310 + }, + { + "epoch": 0.03, + "learning_rate": 1.9510310279212456e-07, + "loss": 0.4557, + "step": 1311 + }, + { + "epoch": 0.03, + "learning_rate": 1.9509921944778843e-07, + "loss": 0.4604, + "step": 1312 + }, + { + "epoch": 0.03, + "learning_rate": 1.9509533610345228e-07, + "loss": 0.5756, + "step": 1313 + }, + { + "epoch": 0.03, + "learning_rate": 1.9509145275911615e-07, + "loss": 0.4706, + "step": 1314 + }, + { + "epoch": 0.03, + "learning_rate": 1.9508756941478e-07, + "loss": 0.4356, + "step": 1315 + }, + { + "epoch": 0.03, + "learning_rate": 1.9508368607044387e-07, + "loss": 0.5231, + "step": 1316 + }, + { + "epoch": 0.03, + "learning_rate": 1.950798027261077e-07, + "loss": 0.6064, + "step": 1317 + }, + { + "epoch": 0.03, + "learning_rate": 1.9507591938177158e-07, + "loss": 0.4406, + "step": 1318 + }, + { + "epoch": 0.03, + "learning_rate": 1.9507203603743543e-07, + "loss": 0.6882, + "step": 1319 + }, + { + "epoch": 0.03, + "learning_rate": 1.9506815269309927e-07, + "loss": 0.4392, + "step": 1320 + }, + { + "epoch": 0.03, + "learning_rate": 1.9506426934876314e-07, + "loss": 0.4753, + "step": 1321 + }, + { + "epoch": 0.03, + "learning_rate": 1.95060386004427e-07, + "loss": 0.5321, + "step": 1322 + }, + { + "epoch": 0.03, + "learning_rate": 1.9505650266009086e-07, + "loss": 0.4829, + "step": 1323 + }, + { + "epoch": 0.03, + "learning_rate": 1.950526193157547e-07, + "loss": 0.6063, + "step": 1324 + }, + { + "epoch": 0.03, + "learning_rate": 1.9504873597141858e-07, + "loss": 0.4673, + "step": 1325 + }, + { + "epoch": 0.03, + "learning_rate": 1.9504485262708242e-07, + "loss": 0.5406, + "step": 1326 + }, + { + "epoch": 0.03, + "learning_rate": 1.950409692827463e-07, + "loss": 0.4116, + "step": 1327 + }, + { + "epoch": 0.03, + "learning_rate": 1.9503708593841014e-07, + "loss": 0.5152, + "step": 1328 + }, + { + "epoch": 0.03, + "learning_rate": 1.95033202594074e-07, + "loss": 0.4972, + "step": 1329 + }, + { + "epoch": 0.03, + "learning_rate": 1.9502931924973786e-07, + "loss": 0.5193, + "step": 1330 + }, + { + "epoch": 0.03, + "learning_rate": 1.9502543590540173e-07, + "loss": 0.4864, + "step": 1331 + }, + { + "epoch": 0.03, + "learning_rate": 1.9502155256106557e-07, + "loss": 0.487, + "step": 1332 + }, + { + "epoch": 0.03, + "learning_rate": 1.9501766921672944e-07, + "loss": 0.6797, + "step": 1333 + }, + { + "epoch": 0.03, + "learning_rate": 1.950137858723933e-07, + "loss": 0.4755, + "step": 1334 + }, + { + "epoch": 0.03, + "learning_rate": 1.9500990252805716e-07, + "loss": 0.4355, + "step": 1335 + }, + { + "epoch": 0.03, + "learning_rate": 1.95006019183721e-07, + "loss": 0.4819, + "step": 1336 + }, + { + "epoch": 0.03, + "learning_rate": 1.9500213583938488e-07, + "loss": 0.4219, + "step": 1337 + }, + { + "epoch": 0.03, + "learning_rate": 1.9499825249504872e-07, + "loss": 0.5625, + "step": 1338 + }, + { + "epoch": 0.03, + "learning_rate": 1.949943691507126e-07, + "loss": 0.368, + "step": 1339 + }, + { + "epoch": 0.03, + "learning_rate": 1.9499048580637644e-07, + "loss": 0.5515, + "step": 1340 + }, + { + "epoch": 0.03, + "learning_rate": 1.949866024620403e-07, + "loss": 0.5468, + "step": 1341 + }, + { + "epoch": 0.03, + "learning_rate": 1.9498271911770415e-07, + "loss": 0.3567, + "step": 1342 + }, + { + "epoch": 0.03, + "learning_rate": 1.9497883577336803e-07, + "loss": 0.3599, + "step": 1343 + }, + { + "epoch": 0.03, + "learning_rate": 1.9497495242903187e-07, + "loss": 0.5469, + "step": 1344 + }, + { + "epoch": 0.03, + "learning_rate": 1.9497106908469574e-07, + "loss": 0.5537, + "step": 1345 + }, + { + "epoch": 0.03, + "learning_rate": 1.949671857403596e-07, + "loss": 0.5301, + "step": 1346 + }, + { + "epoch": 0.03, + "learning_rate": 1.9496330239602346e-07, + "loss": 0.5285, + "step": 1347 + }, + { + "epoch": 0.03, + "learning_rate": 1.949594190516873e-07, + "loss": 0.5033, + "step": 1348 + }, + { + "epoch": 0.03, + "learning_rate": 1.9495553570735118e-07, + "loss": 0.4917, + "step": 1349 + }, + { + "epoch": 0.03, + "learning_rate": 1.9495165236301502e-07, + "loss": 0.5041, + "step": 1350 + }, + { + "epoch": 0.03, + "learning_rate": 1.949477690186789e-07, + "loss": 0.4531, + "step": 1351 + }, + { + "epoch": 0.03, + "learning_rate": 1.9494388567434274e-07, + "loss": 0.6302, + "step": 1352 + }, + { + "epoch": 0.03, + "learning_rate": 1.949400023300066e-07, + "loss": 0.7205, + "step": 1353 + }, + { + "epoch": 0.03, + "learning_rate": 1.9493611898567045e-07, + "loss": 0.4078, + "step": 1354 + }, + { + "epoch": 0.03, + "learning_rate": 1.949322356413343e-07, + "loss": 0.5355, + "step": 1355 + }, + { + "epoch": 0.03, + "learning_rate": 1.9492835229699814e-07, + "loss": 0.4743, + "step": 1356 + }, + { + "epoch": 0.03, + "learning_rate": 1.9492446895266201e-07, + "loss": 0.5083, + "step": 1357 + }, + { + "epoch": 0.03, + "learning_rate": 1.9492058560832586e-07, + "loss": 0.5488, + "step": 1358 + }, + { + "epoch": 0.03, + "learning_rate": 1.9491670226398973e-07, + "loss": 0.5242, + "step": 1359 + }, + { + "epoch": 0.03, + "learning_rate": 1.9491281891965358e-07, + "loss": 0.509, + "step": 1360 + }, + { + "epoch": 0.03, + "learning_rate": 1.9490893557531745e-07, + "loss": 0.3386, + "step": 1361 + }, + { + "epoch": 0.03, + "learning_rate": 1.949050522309813e-07, + "loss": 0.3598, + "step": 1362 + }, + { + "epoch": 0.03, + "learning_rate": 1.9490116888664516e-07, + "loss": 0.4801, + "step": 1363 + }, + { + "epoch": 0.03, + "learning_rate": 1.94897285542309e-07, + "loss": 0.4146, + "step": 1364 + }, + { + "epoch": 0.03, + "learning_rate": 1.9489340219797288e-07, + "loss": 0.5445, + "step": 1365 + }, + { + "epoch": 0.03, + "learning_rate": 1.9488951885363673e-07, + "loss": 0.4144, + "step": 1366 + }, + { + "epoch": 0.03, + "learning_rate": 1.948856355093006e-07, + "loss": 0.4396, + "step": 1367 + }, + { + "epoch": 0.03, + "learning_rate": 1.9488175216496444e-07, + "loss": 0.5975, + "step": 1368 + }, + { + "epoch": 0.03, + "learning_rate": 1.9487786882062831e-07, + "loss": 0.4926, + "step": 1369 + }, + { + "epoch": 0.03, + "learning_rate": 1.9487398547629216e-07, + "loss": 0.4556, + "step": 1370 + }, + { + "epoch": 0.03, + "learning_rate": 1.9487010213195603e-07, + "loss": 0.4376, + "step": 1371 + }, + { + "epoch": 0.03, + "learning_rate": 1.9486621878761988e-07, + "loss": 0.4303, + "step": 1372 + }, + { + "epoch": 0.03, + "learning_rate": 1.9486233544328375e-07, + "loss": 0.4019, + "step": 1373 + }, + { + "epoch": 0.03, + "learning_rate": 1.948584520989476e-07, + "loss": 0.4862, + "step": 1374 + }, + { + "epoch": 0.03, + "learning_rate": 1.9485456875461146e-07, + "loss": 0.4645, + "step": 1375 + }, + { + "epoch": 0.03, + "learning_rate": 1.948506854102753e-07, + "loss": 0.4393, + "step": 1376 + }, + { + "epoch": 0.03, + "learning_rate": 1.9484680206593918e-07, + "loss": 0.5865, + "step": 1377 + }, + { + "epoch": 0.03, + "learning_rate": 1.9484291872160302e-07, + "loss": 0.5321, + "step": 1378 + }, + { + "epoch": 0.03, + "learning_rate": 1.948390353772669e-07, + "loss": 0.5263, + "step": 1379 + }, + { + "epoch": 0.03, + "learning_rate": 1.9483515203293074e-07, + "loss": 0.443, + "step": 1380 + }, + { + "epoch": 0.03, + "learning_rate": 1.948312686885946e-07, + "loss": 0.4868, + "step": 1381 + }, + { + "epoch": 0.03, + "learning_rate": 1.9482738534425846e-07, + "loss": 0.5185, + "step": 1382 + }, + { + "epoch": 0.03, + "learning_rate": 1.9482350199992233e-07, + "loss": 0.471, + "step": 1383 + }, + { + "epoch": 0.03, + "learning_rate": 1.9481961865558617e-07, + "loss": 0.4928, + "step": 1384 + }, + { + "epoch": 0.03, + "learning_rate": 1.9481573531125005e-07, + "loss": 0.393, + "step": 1385 + }, + { + "epoch": 0.03, + "learning_rate": 1.948118519669139e-07, + "loss": 0.4293, + "step": 1386 + }, + { + "epoch": 0.03, + "learning_rate": 1.9480796862257776e-07, + "loss": 0.4046, + "step": 1387 + }, + { + "epoch": 0.03, + "learning_rate": 1.948040852782416e-07, + "loss": 0.3761, + "step": 1388 + }, + { + "epoch": 0.03, + "learning_rate": 1.9480020193390548e-07, + "loss": 0.5289, + "step": 1389 + }, + { + "epoch": 0.03, + "learning_rate": 1.9479631858956932e-07, + "loss": 0.5049, + "step": 1390 + }, + { + "epoch": 0.03, + "learning_rate": 1.947924352452332e-07, + "loss": 0.4915, + "step": 1391 + }, + { + "epoch": 0.03, + "learning_rate": 1.9478855190089704e-07, + "loss": 0.4658, + "step": 1392 + }, + { + "epoch": 0.03, + "learning_rate": 1.947846685565609e-07, + "loss": 0.6387, + "step": 1393 + }, + { + "epoch": 0.03, + "learning_rate": 1.9478078521222476e-07, + "loss": 0.4679, + "step": 1394 + }, + { + "epoch": 0.03, + "learning_rate": 1.9477690186788863e-07, + "loss": 0.577, + "step": 1395 + }, + { + "epoch": 0.03, + "learning_rate": 1.9477301852355247e-07, + "loss": 0.3215, + "step": 1396 + }, + { + "epoch": 0.03, + "learning_rate": 1.9476913517921634e-07, + "loss": 0.5174, + "step": 1397 + }, + { + "epoch": 0.03, + "learning_rate": 1.947652518348802e-07, + "loss": 0.3272, + "step": 1398 + }, + { + "epoch": 0.03, + "learning_rate": 1.9476136849054406e-07, + "loss": 0.3813, + "step": 1399 + }, + { + "epoch": 0.03, + "learning_rate": 1.947574851462079e-07, + "loss": 0.3463, + "step": 1400 + }, + { + "epoch": 0.03, + "learning_rate": 1.9475360180187178e-07, + "loss": 0.6955, + "step": 1401 + }, + { + "epoch": 0.03, + "learning_rate": 1.9474971845753562e-07, + "loss": 0.4513, + "step": 1402 + }, + { + "epoch": 0.03, + "learning_rate": 1.947458351131995e-07, + "loss": 0.5744, + "step": 1403 + }, + { + "epoch": 0.03, + "learning_rate": 1.9474195176886334e-07, + "loss": 0.4537, + "step": 1404 + }, + { + "epoch": 0.03, + "learning_rate": 1.947380684245272e-07, + "loss": 0.6525, + "step": 1405 + }, + { + "epoch": 0.03, + "learning_rate": 1.9473418508019106e-07, + "loss": 0.7161, + "step": 1406 + }, + { + "epoch": 0.03, + "learning_rate": 1.9473030173585493e-07, + "loss": 0.5045, + "step": 1407 + }, + { + "epoch": 0.03, + "learning_rate": 1.9472641839151877e-07, + "loss": 0.5484, + "step": 1408 + }, + { + "epoch": 0.03, + "learning_rate": 1.9472253504718264e-07, + "loss": 0.6113, + "step": 1409 + }, + { + "epoch": 0.03, + "learning_rate": 1.947186517028465e-07, + "loss": 0.4836, + "step": 1410 + }, + { + "epoch": 0.03, + "learning_rate": 1.9471476835851036e-07, + "loss": 0.493, + "step": 1411 + }, + { + "epoch": 0.03, + "learning_rate": 1.947108850141742e-07, + "loss": 0.5595, + "step": 1412 + }, + { + "epoch": 0.03, + "learning_rate": 1.9470700166983805e-07, + "loss": 0.4759, + "step": 1413 + }, + { + "epoch": 0.03, + "learning_rate": 1.947031183255019e-07, + "loss": 0.6388, + "step": 1414 + }, + { + "epoch": 0.03, + "learning_rate": 1.9469923498116577e-07, + "loss": 0.3944, + "step": 1415 + }, + { + "epoch": 0.03, + "learning_rate": 1.946953516368296e-07, + "loss": 0.6135, + "step": 1416 + }, + { + "epoch": 0.03, + "learning_rate": 1.9469146829249348e-07, + "loss": 0.5114, + "step": 1417 + }, + { + "epoch": 0.03, + "learning_rate": 1.9468758494815733e-07, + "loss": 0.4691, + "step": 1418 + }, + { + "epoch": 0.03, + "learning_rate": 1.946837016038212e-07, + "loss": 0.3361, + "step": 1419 + }, + { + "epoch": 0.03, + "learning_rate": 1.9467981825948504e-07, + "loss": 0.6139, + "step": 1420 + }, + { + "epoch": 0.03, + "learning_rate": 1.9467593491514892e-07, + "loss": 0.4751, + "step": 1421 + }, + { + "epoch": 0.03, + "learning_rate": 1.9467205157081276e-07, + "loss": 0.4495, + "step": 1422 + }, + { + "epoch": 0.03, + "learning_rate": 1.9466816822647663e-07, + "loss": 0.4608, + "step": 1423 + }, + { + "epoch": 0.03, + "learning_rate": 1.9466428488214048e-07, + "loss": 0.4894, + "step": 1424 + }, + { + "epoch": 0.03, + "learning_rate": 1.9466040153780435e-07, + "loss": 0.5037, + "step": 1425 + }, + { + "epoch": 0.03, + "learning_rate": 1.946565181934682e-07, + "loss": 0.4401, + "step": 1426 + }, + { + "epoch": 0.03, + "learning_rate": 1.9465263484913207e-07, + "loss": 0.5489, + "step": 1427 + }, + { + "epoch": 0.03, + "learning_rate": 1.946487515047959e-07, + "loss": 0.4041, + "step": 1428 + }, + { + "epoch": 0.03, + "learning_rate": 1.9464486816045978e-07, + "loss": 0.5544, + "step": 1429 + }, + { + "epoch": 0.03, + "learning_rate": 1.9464098481612363e-07, + "loss": 0.3802, + "step": 1430 + }, + { + "epoch": 0.03, + "learning_rate": 1.946371014717875e-07, + "loss": 0.5135, + "step": 1431 + }, + { + "epoch": 0.03, + "learning_rate": 1.9463321812745134e-07, + "loss": 0.5099, + "step": 1432 + }, + { + "epoch": 0.03, + "learning_rate": 1.9462933478311521e-07, + "loss": 0.4243, + "step": 1433 + }, + { + "epoch": 0.03, + "learning_rate": 1.9462545143877906e-07, + "loss": 0.4703, + "step": 1434 + }, + { + "epoch": 0.03, + "learning_rate": 1.9462156809444293e-07, + "loss": 0.3468, + "step": 1435 + }, + { + "epoch": 0.03, + "learning_rate": 1.9461768475010678e-07, + "loss": 0.5575, + "step": 1436 + }, + { + "epoch": 0.03, + "learning_rate": 1.9461380140577065e-07, + "loss": 0.4833, + "step": 1437 + }, + { + "epoch": 0.03, + "learning_rate": 1.946099180614345e-07, + "loss": 0.3783, + "step": 1438 + }, + { + "epoch": 0.03, + "learning_rate": 1.9460603471709836e-07, + "loss": 0.4582, + "step": 1439 + }, + { + "epoch": 0.03, + "learning_rate": 1.946021513727622e-07, + "loss": 0.3633, + "step": 1440 + }, + { + "epoch": 0.03, + "learning_rate": 1.9459826802842608e-07, + "loss": 0.504, + "step": 1441 + }, + { + "epoch": 0.03, + "learning_rate": 1.9459438468408993e-07, + "loss": 0.5173, + "step": 1442 + }, + { + "epoch": 0.03, + "learning_rate": 1.945905013397538e-07, + "loss": 0.5262, + "step": 1443 + }, + { + "epoch": 0.03, + "learning_rate": 1.9458661799541764e-07, + "loss": 0.6366, + "step": 1444 + }, + { + "epoch": 0.03, + "learning_rate": 1.9458273465108151e-07, + "loss": 0.3821, + "step": 1445 + }, + { + "epoch": 0.03, + "learning_rate": 1.9457885130674536e-07, + "loss": 0.4758, + "step": 1446 + }, + { + "epoch": 0.03, + "learning_rate": 1.9457496796240923e-07, + "loss": 0.3658, + "step": 1447 + }, + { + "epoch": 0.03, + "learning_rate": 1.9457108461807308e-07, + "loss": 0.3554, + "step": 1448 + }, + { + "epoch": 0.03, + "learning_rate": 1.9456720127373695e-07, + "loss": 0.3932, + "step": 1449 + }, + { + "epoch": 0.03, + "learning_rate": 1.945633179294008e-07, + "loss": 0.4, + "step": 1450 + }, + { + "epoch": 0.03, + "learning_rate": 1.9455943458506466e-07, + "loss": 0.4565, + "step": 1451 + }, + { + "epoch": 0.03, + "learning_rate": 1.945555512407285e-07, + "loss": 0.5167, + "step": 1452 + }, + { + "epoch": 0.03, + "learning_rate": 1.9455166789639238e-07, + "loss": 0.4866, + "step": 1453 + }, + { + "epoch": 0.03, + "learning_rate": 1.9454778455205622e-07, + "loss": 0.4408, + "step": 1454 + }, + { + "epoch": 0.03, + "learning_rate": 1.945439012077201e-07, + "loss": 0.3613, + "step": 1455 + }, + { + "epoch": 0.03, + "learning_rate": 1.9454001786338394e-07, + "loss": 0.3816, + "step": 1456 + }, + { + "epoch": 0.03, + "learning_rate": 1.945361345190478e-07, + "loss": 0.3316, + "step": 1457 + }, + { + "epoch": 0.03, + "learning_rate": 1.9453225117471166e-07, + "loss": 0.4781, + "step": 1458 + }, + { + "epoch": 0.03, + "learning_rate": 1.9452836783037553e-07, + "loss": 0.3132, + "step": 1459 + }, + { + "epoch": 0.03, + "learning_rate": 1.9452448448603937e-07, + "loss": 0.4569, + "step": 1460 + }, + { + "epoch": 0.03, + "learning_rate": 1.9452060114170325e-07, + "loss": 0.4729, + "step": 1461 + }, + { + "epoch": 0.03, + "learning_rate": 1.945167177973671e-07, + "loss": 0.5114, + "step": 1462 + }, + { + "epoch": 0.03, + "learning_rate": 1.9451283445303096e-07, + "loss": 0.3993, + "step": 1463 + }, + { + "epoch": 0.03, + "learning_rate": 1.945089511086948e-07, + "loss": 0.4348, + "step": 1464 + }, + { + "epoch": 0.03, + "learning_rate": 1.9450506776435868e-07, + "loss": 0.5791, + "step": 1465 + }, + { + "epoch": 0.03, + "learning_rate": 1.9450118442002252e-07, + "loss": 0.4479, + "step": 1466 + }, + { + "epoch": 0.03, + "learning_rate": 1.9449730107568637e-07, + "loss": 0.602, + "step": 1467 + }, + { + "epoch": 0.03, + "learning_rate": 1.9449341773135024e-07, + "loss": 0.4628, + "step": 1468 + }, + { + "epoch": 0.03, + "learning_rate": 1.9448953438701409e-07, + "loss": 0.349, + "step": 1469 + }, + { + "epoch": 0.03, + "learning_rate": 1.9448565104267796e-07, + "loss": 0.4019, + "step": 1470 + }, + { + "epoch": 0.03, + "learning_rate": 1.944817676983418e-07, + "loss": 0.441, + "step": 1471 + }, + { + "epoch": 0.03, + "learning_rate": 1.9447788435400565e-07, + "loss": 0.5835, + "step": 1472 + }, + { + "epoch": 0.03, + "learning_rate": 1.9447400100966952e-07, + "loss": 0.3525, + "step": 1473 + }, + { + "epoch": 0.03, + "learning_rate": 1.9447011766533336e-07, + "loss": 0.4284, + "step": 1474 + }, + { + "epoch": 0.03, + "learning_rate": 1.9446623432099723e-07, + "loss": 0.4467, + "step": 1475 + }, + { + "epoch": 0.03, + "learning_rate": 1.9446235097666108e-07, + "loss": 0.4956, + "step": 1476 + }, + { + "epoch": 0.03, + "learning_rate": 1.9445846763232495e-07, + "loss": 0.378, + "step": 1477 + }, + { + "epoch": 0.03, + "learning_rate": 1.944545842879888e-07, + "loss": 0.4717, + "step": 1478 + }, + { + "epoch": 0.03, + "learning_rate": 1.9445070094365267e-07, + "loss": 0.3454, + "step": 1479 + }, + { + "epoch": 0.03, + "learning_rate": 1.944468175993165e-07, + "loss": 0.3938, + "step": 1480 + }, + { + "epoch": 0.03, + "learning_rate": 1.9444293425498038e-07, + "loss": 0.5689, + "step": 1481 + }, + { + "epoch": 0.03, + "learning_rate": 1.9443905091064423e-07, + "loss": 0.4903, + "step": 1482 + }, + { + "epoch": 0.03, + "learning_rate": 1.944351675663081e-07, + "loss": 0.3594, + "step": 1483 + }, + { + "epoch": 0.03, + "learning_rate": 1.9443128422197195e-07, + "loss": 0.3595, + "step": 1484 + }, + { + "epoch": 0.03, + "learning_rate": 1.9442740087763582e-07, + "loss": 0.3915, + "step": 1485 + }, + { + "epoch": 0.03, + "learning_rate": 1.9442351753329966e-07, + "loss": 0.5502, + "step": 1486 + }, + { + "epoch": 0.03, + "learning_rate": 1.9441963418896353e-07, + "loss": 0.6624, + "step": 1487 + }, + { + "epoch": 0.03, + "learning_rate": 1.9441575084462738e-07, + "loss": 0.4093, + "step": 1488 + }, + { + "epoch": 0.03, + "learning_rate": 1.9441186750029125e-07, + "loss": 0.4459, + "step": 1489 + }, + { + "epoch": 0.03, + "learning_rate": 1.944079841559551e-07, + "loss": 0.4039, + "step": 1490 + }, + { + "epoch": 0.03, + "learning_rate": 1.9440410081161897e-07, + "loss": 0.3441, + "step": 1491 + }, + { + "epoch": 0.03, + "learning_rate": 1.944002174672828e-07, + "loss": 0.3744, + "step": 1492 + }, + { + "epoch": 0.03, + "learning_rate": 1.9439633412294668e-07, + "loss": 0.479, + "step": 1493 + }, + { + "epoch": 0.03, + "learning_rate": 1.9439245077861053e-07, + "loss": 0.4111, + "step": 1494 + }, + { + "epoch": 0.03, + "learning_rate": 1.943885674342744e-07, + "loss": 0.6126, + "step": 1495 + }, + { + "epoch": 0.03, + "learning_rate": 1.9438468408993824e-07, + "loss": 0.3914, + "step": 1496 + }, + { + "epoch": 0.03, + "learning_rate": 1.943808007456021e-07, + "loss": 0.4327, + "step": 1497 + }, + { + "epoch": 0.03, + "learning_rate": 1.9437691740126596e-07, + "loss": 0.4507, + "step": 1498 + }, + { + "epoch": 0.03, + "learning_rate": 1.943730340569298e-07, + "loss": 0.4256, + "step": 1499 + }, + { + "epoch": 0.03, + "learning_rate": 1.9436915071259368e-07, + "loss": 0.4196, + "step": 1500 + }, + { + "epoch": 0.03, + "learning_rate": 1.9436526736825752e-07, + "loss": 0.5146, + "step": 1501 + }, + { + "epoch": 0.03, + "learning_rate": 1.943613840239214e-07, + "loss": 0.4198, + "step": 1502 + }, + { + "epoch": 0.03, + "learning_rate": 1.9435750067958524e-07, + "loss": 0.4276, + "step": 1503 + }, + { + "epoch": 0.03, + "learning_rate": 1.943536173352491e-07, + "loss": 0.4694, + "step": 1504 + }, + { + "epoch": 0.03, + "learning_rate": 1.9434973399091296e-07, + "loss": 0.5142, + "step": 1505 + }, + { + "epoch": 0.03, + "learning_rate": 1.9434585064657683e-07, + "loss": 0.3929, + "step": 1506 + }, + { + "epoch": 0.03, + "learning_rate": 1.9434196730224067e-07, + "loss": 0.3882, + "step": 1507 + }, + { + "epoch": 0.03, + "learning_rate": 1.9433808395790454e-07, + "loss": 0.398, + "step": 1508 + }, + { + "epoch": 0.03, + "learning_rate": 1.943342006135684e-07, + "loss": 0.5004, + "step": 1509 + }, + { + "epoch": 0.03, + "learning_rate": 1.9433031726923226e-07, + "loss": 0.392, + "step": 1510 + }, + { + "epoch": 0.03, + "learning_rate": 1.943264339248961e-07, + "loss": 0.3121, + "step": 1511 + }, + { + "epoch": 0.03, + "learning_rate": 1.9432255058055998e-07, + "loss": 0.3403, + "step": 1512 + }, + { + "epoch": 0.03, + "learning_rate": 1.9431866723622382e-07, + "loss": 0.4014, + "step": 1513 + }, + { + "epoch": 0.03, + "learning_rate": 1.943147838918877e-07, + "loss": 0.4818, + "step": 1514 + }, + { + "epoch": 0.03, + "learning_rate": 1.9431090054755154e-07, + "loss": 0.3192, + "step": 1515 + }, + { + "epoch": 0.03, + "learning_rate": 1.943070172032154e-07, + "loss": 0.4422, + "step": 1516 + }, + { + "epoch": 0.03, + "learning_rate": 1.9430313385887925e-07, + "loss": 0.4032, + "step": 1517 + }, + { + "epoch": 0.03, + "learning_rate": 1.9429925051454313e-07, + "loss": 0.4861, + "step": 1518 + }, + { + "epoch": 0.03, + "learning_rate": 1.9429536717020697e-07, + "loss": 0.5126, + "step": 1519 + }, + { + "epoch": 0.03, + "learning_rate": 1.9429148382587084e-07, + "loss": 0.4194, + "step": 1520 + }, + { + "epoch": 0.03, + "learning_rate": 1.942876004815347e-07, + "loss": 0.5149, + "step": 1521 + }, + { + "epoch": 0.03, + "learning_rate": 1.9428371713719856e-07, + "loss": 0.3706, + "step": 1522 + }, + { + "epoch": 0.03, + "learning_rate": 1.942798337928624e-07, + "loss": 0.5176, + "step": 1523 + }, + { + "epoch": 0.03, + "learning_rate": 1.9427595044852628e-07, + "loss": 0.3841, + "step": 1524 + }, + { + "epoch": 0.03, + "learning_rate": 1.9427206710419012e-07, + "loss": 0.4202, + "step": 1525 + }, + { + "epoch": 0.03, + "learning_rate": 1.94268183759854e-07, + "loss": 0.5174, + "step": 1526 + }, + { + "epoch": 0.03, + "learning_rate": 1.9426430041551784e-07, + "loss": 0.4765, + "step": 1527 + }, + { + "epoch": 0.03, + "learning_rate": 1.942604170711817e-07, + "loss": 0.4282, + "step": 1528 + }, + { + "epoch": 0.03, + "learning_rate": 1.9425653372684553e-07, + "loss": 0.4054, + "step": 1529 + }, + { + "epoch": 0.03, + "learning_rate": 1.942526503825094e-07, + "loss": 0.5222, + "step": 1530 + }, + { + "epoch": 0.03, + "learning_rate": 1.9424876703817324e-07, + "loss": 0.4053, + "step": 1531 + }, + { + "epoch": 0.03, + "learning_rate": 1.9424488369383711e-07, + "loss": 0.4295, + "step": 1532 + }, + { + "epoch": 0.03, + "learning_rate": 1.9424100034950096e-07, + "loss": 0.4062, + "step": 1533 + }, + { + "epoch": 0.03, + "learning_rate": 1.9423711700516483e-07, + "loss": 0.4319, + "step": 1534 + }, + { + "epoch": 0.03, + "learning_rate": 1.9423323366082868e-07, + "loss": 0.3623, + "step": 1535 + }, + { + "epoch": 0.03, + "learning_rate": 1.9422935031649255e-07, + "loss": 0.3723, + "step": 1536 + }, + { + "epoch": 0.03, + "learning_rate": 1.942254669721564e-07, + "loss": 0.3854, + "step": 1537 + }, + { + "epoch": 0.03, + "learning_rate": 1.9422158362782026e-07, + "loss": 0.4036, + "step": 1538 + }, + { + "epoch": 0.03, + "learning_rate": 1.942177002834841e-07, + "loss": 0.4419, + "step": 1539 + }, + { + "epoch": 0.03, + "learning_rate": 1.9421381693914798e-07, + "loss": 0.4249, + "step": 1540 + }, + { + "epoch": 0.03, + "learning_rate": 1.9420993359481183e-07, + "loss": 0.6282, + "step": 1541 + }, + { + "epoch": 0.03, + "learning_rate": 1.942060502504757e-07, + "loss": 0.442, + "step": 1542 + }, + { + "epoch": 0.03, + "learning_rate": 1.9420216690613954e-07, + "loss": 0.3123, + "step": 1543 + }, + { + "epoch": 0.03, + "learning_rate": 1.9419828356180341e-07, + "loss": 0.4192, + "step": 1544 + }, + { + "epoch": 0.03, + "learning_rate": 1.9419440021746726e-07, + "loss": 0.5082, + "step": 1545 + }, + { + "epoch": 0.03, + "learning_rate": 1.9419051687313113e-07, + "loss": 0.4216, + "step": 1546 + }, + { + "epoch": 0.03, + "learning_rate": 1.9418663352879498e-07, + "loss": 0.3497, + "step": 1547 + }, + { + "epoch": 0.03, + "learning_rate": 1.9418275018445885e-07, + "loss": 0.3745, + "step": 1548 + }, + { + "epoch": 0.03, + "learning_rate": 1.941788668401227e-07, + "loss": 0.4252, + "step": 1549 + }, + { + "epoch": 0.03, + "learning_rate": 1.9417498349578656e-07, + "loss": 0.5255, + "step": 1550 + }, + { + "epoch": 0.03, + "learning_rate": 1.941711001514504e-07, + "loss": 0.5044, + "step": 1551 + }, + { + "epoch": 0.03, + "learning_rate": 1.9416721680711428e-07, + "loss": 0.4297, + "step": 1552 + }, + { + "epoch": 0.03, + "learning_rate": 1.9416333346277812e-07, + "loss": 0.4109, + "step": 1553 + }, + { + "epoch": 0.03, + "learning_rate": 1.94159450118442e-07, + "loss": 0.4676, + "step": 1554 + }, + { + "epoch": 0.03, + "learning_rate": 1.9415556677410584e-07, + "loss": 0.3936, + "step": 1555 + }, + { + "epoch": 0.03, + "learning_rate": 1.941516834297697e-07, + "loss": 0.4365, + "step": 1556 + }, + { + "epoch": 0.03, + "learning_rate": 1.9414780008543356e-07, + "loss": 0.3756, + "step": 1557 + }, + { + "epoch": 0.03, + "learning_rate": 1.9414391674109743e-07, + "loss": 0.4022, + "step": 1558 + }, + { + "epoch": 0.03, + "learning_rate": 1.9414003339676127e-07, + "loss": 0.3933, + "step": 1559 + }, + { + "epoch": 0.03, + "learning_rate": 1.9413615005242515e-07, + "loss": 0.3398, + "step": 1560 + }, + { + "epoch": 0.03, + "learning_rate": 1.94132266708089e-07, + "loss": 0.3683, + "step": 1561 + }, + { + "epoch": 0.03, + "learning_rate": 1.9412838336375286e-07, + "loss": 0.4896, + "step": 1562 + }, + { + "epoch": 0.03, + "learning_rate": 1.941245000194167e-07, + "loss": 0.4069, + "step": 1563 + }, + { + "epoch": 0.03, + "learning_rate": 1.9412061667508058e-07, + "loss": 0.4952, + "step": 1564 + }, + { + "epoch": 0.03, + "learning_rate": 1.9411673333074442e-07, + "loss": 0.3515, + "step": 1565 + }, + { + "epoch": 0.03, + "learning_rate": 1.941128499864083e-07, + "loss": 0.4927, + "step": 1566 + }, + { + "epoch": 0.03, + "learning_rate": 1.9410896664207214e-07, + "loss": 0.2887, + "step": 1567 + }, + { + "epoch": 0.03, + "learning_rate": 1.94105083297736e-07, + "loss": 0.3949, + "step": 1568 + }, + { + "epoch": 0.03, + "learning_rate": 1.9410119995339986e-07, + "loss": 0.3458, + "step": 1569 + }, + { + "epoch": 0.03, + "learning_rate": 1.9409731660906373e-07, + "loss": 0.388, + "step": 1570 + }, + { + "epoch": 0.03, + "learning_rate": 1.9409343326472757e-07, + "loss": 0.4257, + "step": 1571 + }, + { + "epoch": 0.03, + "learning_rate": 1.9408954992039144e-07, + "loss": 0.3789, + "step": 1572 + }, + { + "epoch": 0.03, + "learning_rate": 1.940856665760553e-07, + "loss": 0.7059, + "step": 1573 + }, + { + "epoch": 0.03, + "learning_rate": 1.9408178323171916e-07, + "loss": 0.3942, + "step": 1574 + }, + { + "epoch": 0.03, + "learning_rate": 1.94077899887383e-07, + "loss": 0.5262, + "step": 1575 + }, + { + "epoch": 0.03, + "learning_rate": 1.9407401654304688e-07, + "loss": 0.4621, + "step": 1576 + }, + { + "epoch": 0.03, + "learning_rate": 1.9407013319871072e-07, + "loss": 0.3889, + "step": 1577 + }, + { + "epoch": 0.03, + "learning_rate": 1.940662498543746e-07, + "loss": 0.4905, + "step": 1578 + }, + { + "epoch": 0.03, + "learning_rate": 1.9406236651003844e-07, + "loss": 0.475, + "step": 1579 + }, + { + "epoch": 0.03, + "learning_rate": 1.940584831657023e-07, + "loss": 0.4422, + "step": 1580 + }, + { + "epoch": 0.03, + "learning_rate": 1.9405459982136616e-07, + "loss": 0.4686, + "step": 1581 + }, + { + "epoch": 0.03, + "learning_rate": 1.9405071647703003e-07, + "loss": 0.7084, + "step": 1582 + }, + { + "epoch": 0.03, + "learning_rate": 1.9404683313269387e-07, + "loss": 0.3059, + "step": 1583 + }, + { + "epoch": 0.03, + "learning_rate": 1.9404294978835774e-07, + "loss": 0.4072, + "step": 1584 + }, + { + "epoch": 0.03, + "learning_rate": 1.940390664440216e-07, + "loss": 0.4274, + "step": 1585 + }, + { + "epoch": 0.03, + "learning_rate": 1.9403518309968546e-07, + "loss": 0.4987, + "step": 1586 + }, + { + "epoch": 0.03, + "learning_rate": 1.9403129975534928e-07, + "loss": 0.5136, + "step": 1587 + }, + { + "epoch": 0.03, + "learning_rate": 1.9402741641101315e-07, + "loss": 0.3309, + "step": 1588 + }, + { + "epoch": 0.03, + "learning_rate": 1.94023533066677e-07, + "loss": 0.3374, + "step": 1589 + }, + { + "epoch": 0.03, + "learning_rate": 1.9401964972234087e-07, + "loss": 0.3934, + "step": 1590 + }, + { + "epoch": 0.03, + "learning_rate": 1.940157663780047e-07, + "loss": 0.3911, + "step": 1591 + }, + { + "epoch": 0.03, + "learning_rate": 1.9401188303366858e-07, + "loss": 0.5697, + "step": 1592 + }, + { + "epoch": 0.03, + "learning_rate": 1.9400799968933243e-07, + "loss": 0.3852, + "step": 1593 + }, + { + "epoch": 0.03, + "learning_rate": 1.940041163449963e-07, + "loss": 0.4596, + "step": 1594 + }, + { + "epoch": 0.03, + "learning_rate": 1.9400023300066014e-07, + "loss": 0.3868, + "step": 1595 + }, + { + "epoch": 0.03, + "learning_rate": 1.9399634965632402e-07, + "loss": 0.4272, + "step": 1596 + }, + { + "epoch": 0.03, + "learning_rate": 1.9399246631198786e-07, + "loss": 0.3891, + "step": 1597 + }, + { + "epoch": 0.03, + "learning_rate": 1.9398858296765173e-07, + "loss": 0.549, + "step": 1598 + }, + { + "epoch": 0.03, + "learning_rate": 1.9398469962331558e-07, + "loss": 0.4672, + "step": 1599 + }, + { + "epoch": 0.03, + "learning_rate": 1.9398081627897945e-07, + "loss": 0.3168, + "step": 1600 + }, + { + "epoch": 0.03, + "learning_rate": 1.939769329346433e-07, + "loss": 0.5387, + "step": 1601 + }, + { + "epoch": 0.03, + "learning_rate": 1.9397304959030717e-07, + "loss": 0.4601, + "step": 1602 + }, + { + "epoch": 0.03, + "learning_rate": 1.93969166245971e-07, + "loss": 0.3387, + "step": 1603 + }, + { + "epoch": 0.03, + "learning_rate": 1.9396528290163488e-07, + "loss": 0.4156, + "step": 1604 + }, + { + "epoch": 0.03, + "learning_rate": 1.9396139955729873e-07, + "loss": 0.3552, + "step": 1605 + }, + { + "epoch": 0.03, + "learning_rate": 1.939575162129626e-07, + "loss": 0.4797, + "step": 1606 + }, + { + "epoch": 0.03, + "learning_rate": 1.9395363286862644e-07, + "loss": 0.5278, + "step": 1607 + }, + { + "epoch": 0.03, + "learning_rate": 1.9394974952429032e-07, + "loss": 0.3143, + "step": 1608 + }, + { + "epoch": 0.03, + "learning_rate": 1.9394586617995416e-07, + "loss": 0.4203, + "step": 1609 + }, + { + "epoch": 0.03, + "learning_rate": 1.9394198283561803e-07, + "loss": 0.3744, + "step": 1610 + }, + { + "epoch": 0.03, + "learning_rate": 1.9393809949128188e-07, + "loss": 0.5225, + "step": 1611 + }, + { + "epoch": 0.03, + "learning_rate": 1.9393421614694575e-07, + "loss": 0.5021, + "step": 1612 + }, + { + "epoch": 0.03, + "learning_rate": 1.939303328026096e-07, + "loss": 0.4721, + "step": 1613 + }, + { + "epoch": 0.03, + "learning_rate": 1.9392644945827346e-07, + "loss": 0.4341, + "step": 1614 + }, + { + "epoch": 0.03, + "learning_rate": 1.939225661139373e-07, + "loss": 0.4175, + "step": 1615 + }, + { + "epoch": 0.03, + "learning_rate": 1.9391868276960118e-07, + "loss": 0.3251, + "step": 1616 + }, + { + "epoch": 0.03, + "learning_rate": 1.9391479942526503e-07, + "loss": 0.5544, + "step": 1617 + }, + { + "epoch": 0.03, + "learning_rate": 1.939109160809289e-07, + "loss": 0.4453, + "step": 1618 + }, + { + "epoch": 0.03, + "learning_rate": 1.9390703273659274e-07, + "loss": 0.4414, + "step": 1619 + }, + { + "epoch": 0.03, + "learning_rate": 1.9390314939225661e-07, + "loss": 0.334, + "step": 1620 + }, + { + "epoch": 0.03, + "learning_rate": 1.9389926604792046e-07, + "loss": 0.2948, + "step": 1621 + }, + { + "epoch": 0.03, + "learning_rate": 1.9389538270358433e-07, + "loss": 0.292, + "step": 1622 + }, + { + "epoch": 0.03, + "learning_rate": 1.9389149935924818e-07, + "loss": 0.3911, + "step": 1623 + }, + { + "epoch": 0.03, + "learning_rate": 1.9388761601491205e-07, + "loss": 0.3403, + "step": 1624 + }, + { + "epoch": 0.03, + "learning_rate": 1.938837326705759e-07, + "loss": 0.5588, + "step": 1625 + }, + { + "epoch": 0.03, + "learning_rate": 1.9387984932623976e-07, + "loss": 0.3195, + "step": 1626 + }, + { + "epoch": 0.03, + "learning_rate": 1.938759659819036e-07, + "loss": 0.388, + "step": 1627 + }, + { + "epoch": 0.03, + "learning_rate": 1.9387208263756748e-07, + "loss": 0.2862, + "step": 1628 + }, + { + "epoch": 0.03, + "learning_rate": 1.9386819929323132e-07, + "loss": 0.5922, + "step": 1629 + }, + { + "epoch": 0.03, + "learning_rate": 1.938643159488952e-07, + "loss": 0.561, + "step": 1630 + }, + { + "epoch": 0.03, + "learning_rate": 1.9386043260455904e-07, + "loss": 0.5039, + "step": 1631 + }, + { + "epoch": 0.03, + "learning_rate": 1.938565492602229e-07, + "loss": 0.3245, + "step": 1632 + }, + { + "epoch": 0.03, + "learning_rate": 1.9385266591588676e-07, + "loss": 0.4432, + "step": 1633 + }, + { + "epoch": 0.03, + "learning_rate": 1.9384878257155063e-07, + "loss": 0.5509, + "step": 1634 + }, + { + "epoch": 0.03, + "learning_rate": 1.9384489922721447e-07, + "loss": 0.2912, + "step": 1635 + }, + { + "epoch": 0.03, + "learning_rate": 1.9384101588287835e-07, + "loss": 0.344, + "step": 1636 + }, + { + "epoch": 0.03, + "learning_rate": 1.938371325385422e-07, + "loss": 0.567, + "step": 1637 + }, + { + "epoch": 0.03, + "learning_rate": 1.9383324919420606e-07, + "loss": 0.4189, + "step": 1638 + }, + { + "epoch": 0.03, + "learning_rate": 1.938293658498699e-07, + "loss": 0.4371, + "step": 1639 + }, + { + "epoch": 0.03, + "learning_rate": 1.9382548250553378e-07, + "loss": 0.3149, + "step": 1640 + }, + { + "epoch": 0.03, + "learning_rate": 1.9382159916119762e-07, + "loss": 0.421, + "step": 1641 + }, + { + "epoch": 0.03, + "learning_rate": 1.938177158168615e-07, + "loss": 0.3706, + "step": 1642 + }, + { + "epoch": 0.03, + "learning_rate": 1.9381383247252534e-07, + "loss": 0.296, + "step": 1643 + }, + { + "epoch": 0.03, + "learning_rate": 1.9380994912818919e-07, + "loss": 0.3344, + "step": 1644 + }, + { + "epoch": 0.03, + "learning_rate": 1.9380606578385303e-07, + "loss": 0.8061, + "step": 1645 + }, + { + "epoch": 0.03, + "learning_rate": 1.938021824395169e-07, + "loss": 0.3853, + "step": 1646 + }, + { + "epoch": 0.03, + "learning_rate": 1.9379829909518075e-07, + "loss": 0.4314, + "step": 1647 + }, + { + "epoch": 0.03, + "learning_rate": 1.9379441575084462e-07, + "loss": 0.2652, + "step": 1648 + }, + { + "epoch": 0.03, + "learning_rate": 1.9379053240650846e-07, + "loss": 0.3214, + "step": 1649 + }, + { + "epoch": 0.03, + "learning_rate": 1.9378664906217233e-07, + "loss": 0.2968, + "step": 1650 + }, + { + "epoch": 0.03, + "learning_rate": 1.9378276571783618e-07, + "loss": 0.4708, + "step": 1651 + }, + { + "epoch": 0.03, + "learning_rate": 1.9377888237350005e-07, + "loss": 0.3921, + "step": 1652 + }, + { + "epoch": 0.03, + "learning_rate": 1.937749990291639e-07, + "loss": 0.3791, + "step": 1653 + }, + { + "epoch": 0.03, + "learning_rate": 1.9377111568482777e-07, + "loss": 0.2965, + "step": 1654 + }, + { + "epoch": 0.03, + "learning_rate": 1.937672323404916e-07, + "loss": 0.3287, + "step": 1655 + }, + { + "epoch": 0.03, + "learning_rate": 1.9376334899615548e-07, + "loss": 0.3656, + "step": 1656 + }, + { + "epoch": 0.03, + "learning_rate": 1.9375946565181933e-07, + "loss": 0.466, + "step": 1657 + }, + { + "epoch": 0.03, + "learning_rate": 1.937555823074832e-07, + "loss": 0.5535, + "step": 1658 + }, + { + "epoch": 0.03, + "learning_rate": 1.9375169896314705e-07, + "loss": 0.3353, + "step": 1659 + }, + { + "epoch": 0.03, + "learning_rate": 1.9374781561881092e-07, + "loss": 0.5806, + "step": 1660 + }, + { + "epoch": 0.03, + "learning_rate": 1.9374393227447476e-07, + "loss": 0.5623, + "step": 1661 + }, + { + "epoch": 0.03, + "learning_rate": 1.9374004893013863e-07, + "loss": 0.5744, + "step": 1662 + }, + { + "epoch": 0.03, + "learning_rate": 1.9373616558580248e-07, + "loss": 0.2913, + "step": 1663 + }, + { + "epoch": 0.03, + "learning_rate": 1.9373228224146635e-07, + "loss": 0.6455, + "step": 1664 + }, + { + "epoch": 0.03, + "learning_rate": 1.937283988971302e-07, + "loss": 0.3105, + "step": 1665 + }, + { + "epoch": 0.03, + "learning_rate": 1.9372451555279407e-07, + "loss": 0.3082, + "step": 1666 + }, + { + "epoch": 0.03, + "learning_rate": 1.937206322084579e-07, + "loss": 0.3167, + "step": 1667 + }, + { + "epoch": 0.03, + "learning_rate": 1.9371674886412178e-07, + "loss": 0.5256, + "step": 1668 + }, + { + "epoch": 0.03, + "learning_rate": 1.9371286551978563e-07, + "loss": 0.2735, + "step": 1669 + }, + { + "epoch": 0.03, + "learning_rate": 1.937089821754495e-07, + "loss": 0.298, + "step": 1670 + }, + { + "epoch": 0.03, + "learning_rate": 1.9370509883111334e-07, + "loss": 0.3712, + "step": 1671 + }, + { + "epoch": 0.03, + "learning_rate": 1.9370121548677722e-07, + "loss": 0.379, + "step": 1672 + }, + { + "epoch": 0.03, + "learning_rate": 1.9369733214244106e-07, + "loss": 0.3244, + "step": 1673 + }, + { + "epoch": 0.03, + "learning_rate": 1.936934487981049e-07, + "loss": 0.5201, + "step": 1674 + }, + { + "epoch": 0.03, + "learning_rate": 1.9368956545376878e-07, + "loss": 0.3778, + "step": 1675 + }, + { + "epoch": 0.03, + "learning_rate": 1.9368568210943262e-07, + "loss": 0.3779, + "step": 1676 + }, + { + "epoch": 0.03, + "learning_rate": 1.936817987650965e-07, + "loss": 0.4079, + "step": 1677 + }, + { + "epoch": 0.03, + "learning_rate": 1.9367791542076034e-07, + "loss": 0.3518, + "step": 1678 + }, + { + "epoch": 0.03, + "learning_rate": 1.936740320764242e-07, + "loss": 0.2731, + "step": 1679 + }, + { + "epoch": 0.03, + "learning_rate": 1.9367014873208806e-07, + "loss": 0.458, + "step": 1680 + }, + { + "epoch": 0.03, + "learning_rate": 1.9366626538775193e-07, + "loss": 0.5503, + "step": 1681 + }, + { + "epoch": 0.03, + "learning_rate": 1.9366238204341577e-07, + "loss": 0.2253, + "step": 1682 + }, + { + "epoch": 0.03, + "learning_rate": 1.9365849869907964e-07, + "loss": 0.2802, + "step": 1683 + }, + { + "epoch": 0.03, + "learning_rate": 1.936546153547435e-07, + "loss": 0.2822, + "step": 1684 + }, + { + "epoch": 0.03, + "learning_rate": 1.9365073201040736e-07, + "loss": 0.306, + "step": 1685 + }, + { + "epoch": 0.03, + "learning_rate": 1.936468486660712e-07, + "loss": 0.2405, + "step": 1686 + }, + { + "epoch": 0.03, + "learning_rate": 1.9364296532173508e-07, + "loss": 0.4175, + "step": 1687 + }, + { + "epoch": 0.03, + "learning_rate": 1.9363908197739892e-07, + "loss": 0.5027, + "step": 1688 + }, + { + "epoch": 0.03, + "learning_rate": 1.936351986330628e-07, + "loss": 0.2741, + "step": 1689 + }, + { + "epoch": 0.03, + "learning_rate": 1.9363131528872664e-07, + "loss": 0.407, + "step": 1690 + }, + { + "epoch": 0.03, + "learning_rate": 1.936274319443905e-07, + "loss": 0.4557, + "step": 1691 + }, + { + "epoch": 0.03, + "learning_rate": 1.9362354860005435e-07, + "loss": 0.5691, + "step": 1692 + }, + { + "epoch": 0.03, + "learning_rate": 1.9361966525571823e-07, + "loss": 0.3534, + "step": 1693 + }, + { + "epoch": 0.03, + "learning_rate": 1.9361578191138207e-07, + "loss": 0.3785, + "step": 1694 + }, + { + "epoch": 0.03, + "learning_rate": 1.9361189856704594e-07, + "loss": 0.5864, + "step": 1695 + }, + { + "epoch": 0.03, + "learning_rate": 1.936080152227098e-07, + "loss": 0.2426, + "step": 1696 + }, + { + "epoch": 0.03, + "learning_rate": 1.9360413187837366e-07, + "loss": 0.4424, + "step": 1697 + }, + { + "epoch": 0.03, + "learning_rate": 1.936002485340375e-07, + "loss": 0.5353, + "step": 1698 + }, + { + "epoch": 0.03, + "learning_rate": 1.9359636518970138e-07, + "loss": 0.3493, + "step": 1699 + }, + { + "epoch": 0.03, + "learning_rate": 1.9359248184536522e-07, + "loss": 0.4003, + "step": 1700 + }, + { + "epoch": 0.03, + "learning_rate": 1.935885985010291e-07, + "loss": 0.3368, + "step": 1701 + }, + { + "epoch": 0.03, + "learning_rate": 1.9358471515669294e-07, + "loss": 0.6129, + "step": 1702 + }, + { + "epoch": 0.03, + "learning_rate": 1.9358083181235678e-07, + "loss": 0.4693, + "step": 1703 + }, + { + "epoch": 0.03, + "learning_rate": 1.9357694846802063e-07, + "loss": 0.4501, + "step": 1704 + }, + { + "epoch": 0.03, + "learning_rate": 1.935730651236845e-07, + "loss": 0.3429, + "step": 1705 + }, + { + "epoch": 0.03, + "learning_rate": 1.9356918177934834e-07, + "loss": 0.3126, + "step": 1706 + }, + { + "epoch": 0.03, + "learning_rate": 1.9356529843501222e-07, + "loss": 0.248, + "step": 1707 + }, + { + "epoch": 0.03, + "learning_rate": 1.9356141509067606e-07, + "loss": 0.257, + "step": 1708 + }, + { + "epoch": 0.03, + "learning_rate": 1.9355753174633993e-07, + "loss": 0.4945, + "step": 1709 + }, + { + "epoch": 0.03, + "learning_rate": 1.9355364840200378e-07, + "loss": 0.4647, + "step": 1710 + }, + { + "epoch": 0.03, + "learning_rate": 1.9354976505766765e-07, + "loss": 0.3037, + "step": 1711 + }, + { + "epoch": 0.03, + "learning_rate": 1.935458817133315e-07, + "loss": 0.3989, + "step": 1712 + }, + { + "epoch": 0.03, + "learning_rate": 1.9354199836899536e-07, + "loss": 0.2684, + "step": 1713 + }, + { + "epoch": 0.03, + "learning_rate": 1.935381150246592e-07, + "loss": 0.6922, + "step": 1714 + }, + { + "epoch": 0.03, + "learning_rate": 1.9353423168032308e-07, + "loss": 0.4663, + "step": 1715 + }, + { + "epoch": 0.03, + "learning_rate": 1.9353034833598693e-07, + "loss": 0.5849, + "step": 1716 + }, + { + "epoch": 0.03, + "learning_rate": 1.935264649916508e-07, + "loss": 0.3119, + "step": 1717 + }, + { + "epoch": 0.03, + "learning_rate": 1.9352258164731464e-07, + "loss": 0.4248, + "step": 1718 + }, + { + "epoch": 0.03, + "learning_rate": 1.9351869830297851e-07, + "loss": 0.2485, + "step": 1719 + }, + { + "epoch": 0.03, + "learning_rate": 1.9351481495864236e-07, + "loss": 0.2187, + "step": 1720 + }, + { + "epoch": 0.03, + "learning_rate": 1.9351093161430623e-07, + "loss": 0.2315, + "step": 1721 + }, + { + "epoch": 0.03, + "learning_rate": 1.9350704826997008e-07, + "loss": 0.3628, + "step": 1722 + }, + { + "epoch": 0.03, + "learning_rate": 1.9350316492563395e-07, + "loss": 0.3768, + "step": 1723 + }, + { + "epoch": 0.03, + "learning_rate": 1.934992815812978e-07, + "loss": 0.4965, + "step": 1724 + }, + { + "epoch": 0.03, + "learning_rate": 1.9349539823696166e-07, + "loss": 0.4546, + "step": 1725 + }, + { + "epoch": 0.03, + "learning_rate": 1.934915148926255e-07, + "loss": 0.4596, + "step": 1726 + }, + { + "epoch": 0.03, + "learning_rate": 1.9348763154828938e-07, + "loss": 0.4546, + "step": 1727 + }, + { + "epoch": 0.03, + "learning_rate": 1.9348374820395322e-07, + "loss": 0.3376, + "step": 1728 + }, + { + "epoch": 0.03, + "learning_rate": 1.934798648596171e-07, + "loss": 0.4948, + "step": 1729 + }, + { + "epoch": 0.03, + "learning_rate": 1.9347598151528094e-07, + "loss": 0.3619, + "step": 1730 + }, + { + "epoch": 0.03, + "learning_rate": 1.934720981709448e-07, + "loss": 0.3794, + "step": 1731 + }, + { + "epoch": 0.03, + "learning_rate": 1.9346821482660866e-07, + "loss": 0.3545, + "step": 1732 + }, + { + "epoch": 0.03, + "learning_rate": 1.9346433148227253e-07, + "loss": 0.2853, + "step": 1733 + }, + { + "epoch": 0.03, + "learning_rate": 1.9346044813793637e-07, + "loss": 0.4494, + "step": 1734 + }, + { + "epoch": 0.03, + "learning_rate": 1.9345656479360025e-07, + "loss": 0.395, + "step": 1735 + }, + { + "epoch": 0.03, + "learning_rate": 1.934526814492641e-07, + "loss": 0.3445, + "step": 1736 + }, + { + "epoch": 0.03, + "learning_rate": 1.9344879810492796e-07, + "loss": 0.3449, + "step": 1737 + }, + { + "epoch": 0.03, + "learning_rate": 1.934449147605918e-07, + "loss": 0.2371, + "step": 1738 + }, + { + "epoch": 0.03, + "learning_rate": 1.9344103141625568e-07, + "loss": 0.2685, + "step": 1739 + }, + { + "epoch": 0.03, + "learning_rate": 1.9343714807191952e-07, + "loss": 0.2722, + "step": 1740 + }, + { + "epoch": 0.03, + "learning_rate": 1.934332647275834e-07, + "loss": 0.2871, + "step": 1741 + }, + { + "epoch": 0.03, + "learning_rate": 1.9342938138324724e-07, + "loss": 0.6552, + "step": 1742 + }, + { + "epoch": 0.03, + "learning_rate": 1.934254980389111e-07, + "loss": 0.3818, + "step": 1743 + }, + { + "epoch": 0.03, + "learning_rate": 1.9342161469457496e-07, + "loss": 0.363, + "step": 1744 + }, + { + "epoch": 0.03, + "learning_rate": 1.9341773135023883e-07, + "loss": 0.3466, + "step": 1745 + }, + { + "epoch": 0.03, + "learning_rate": 1.9341384800590267e-07, + "loss": 0.3085, + "step": 1746 + }, + { + "epoch": 0.03, + "learning_rate": 1.9340996466156654e-07, + "loss": 0.2756, + "step": 1747 + }, + { + "epoch": 0.03, + "learning_rate": 1.934060813172304e-07, + "loss": 0.3463, + "step": 1748 + }, + { + "epoch": 0.03, + "learning_rate": 1.9340219797289426e-07, + "loss": 0.4708, + "step": 1749 + }, + { + "epoch": 0.03, + "learning_rate": 1.933983146285581e-07, + "loss": 0.413, + "step": 1750 + }, + { + "epoch": 0.03, + "learning_rate": 1.9339443128422198e-07, + "loss": 0.5094, + "step": 1751 + }, + { + "epoch": 0.03, + "learning_rate": 1.9339054793988582e-07, + "loss": 0.2368, + "step": 1752 + }, + { + "epoch": 0.03, + "learning_rate": 1.933866645955497e-07, + "loss": 0.2949, + "step": 1753 + }, + { + "epoch": 0.03, + "learning_rate": 1.9338278125121354e-07, + "loss": 0.4935, + "step": 1754 + }, + { + "epoch": 0.03, + "learning_rate": 1.933788979068774e-07, + "loss": 0.4296, + "step": 1755 + }, + { + "epoch": 0.03, + "learning_rate": 1.9337501456254126e-07, + "loss": 0.4738, + "step": 1756 + }, + { + "epoch": 0.03, + "learning_rate": 1.9337113121820513e-07, + "loss": 0.4487, + "step": 1757 + }, + { + "epoch": 0.03, + "learning_rate": 1.9336724787386897e-07, + "loss": 0.4146, + "step": 1758 + }, + { + "epoch": 0.03, + "learning_rate": 1.9336336452953284e-07, + "loss": 0.4793, + "step": 1759 + }, + { + "epoch": 0.03, + "learning_rate": 1.933594811851967e-07, + "loss": 0.3278, + "step": 1760 + }, + { + "epoch": 0.03, + "learning_rate": 1.9335559784086053e-07, + "loss": 0.2398, + "step": 1761 + }, + { + "epoch": 0.03, + "learning_rate": 1.9335171449652438e-07, + "loss": 0.2486, + "step": 1762 + }, + { + "epoch": 0.03, + "learning_rate": 1.9334783115218825e-07, + "loss": 0.4199, + "step": 1763 + }, + { + "epoch": 0.03, + "learning_rate": 1.933439478078521e-07, + "loss": 0.2601, + "step": 1764 + }, + { + "epoch": 0.03, + "learning_rate": 1.9334006446351597e-07, + "loss": 0.5745, + "step": 1765 + }, + { + "epoch": 0.03, + "learning_rate": 1.933361811191798e-07, + "loss": 0.3294, + "step": 1766 + }, + { + "epoch": 0.03, + "learning_rate": 1.9333229777484368e-07, + "loss": 0.2569, + "step": 1767 + }, + { + "epoch": 0.03, + "learning_rate": 1.9332841443050753e-07, + "loss": 0.3959, + "step": 1768 + }, + { + "epoch": 0.03, + "learning_rate": 1.933245310861714e-07, + "loss": 0.3335, + "step": 1769 + }, + { + "epoch": 0.03, + "learning_rate": 1.9332064774183524e-07, + "loss": 0.5092, + "step": 1770 + }, + { + "epoch": 0.03, + "learning_rate": 1.9331676439749912e-07, + "loss": 0.3046, + "step": 1771 + }, + { + "epoch": 0.03, + "learning_rate": 1.9331288105316296e-07, + "loss": 0.2034, + "step": 1772 + }, + { + "epoch": 0.03, + "learning_rate": 1.9330899770882683e-07, + "loss": 0.3558, + "step": 1773 + }, + { + "epoch": 0.03, + "learning_rate": 1.9330511436449068e-07, + "loss": 0.5492, + "step": 1774 + }, + { + "epoch": 0.03, + "learning_rate": 1.9330123102015455e-07, + "loss": 0.4075, + "step": 1775 + }, + { + "epoch": 0.03, + "learning_rate": 1.932973476758184e-07, + "loss": 0.2816, + "step": 1776 + }, + { + "epoch": 0.03, + "learning_rate": 1.9329346433148227e-07, + "loss": 0.3718, + "step": 1777 + }, + { + "epoch": 0.03, + "learning_rate": 1.932895809871461e-07, + "loss": 0.3065, + "step": 1778 + }, + { + "epoch": 0.03, + "learning_rate": 1.9328569764280998e-07, + "loss": 0.373, + "step": 1779 + }, + { + "epoch": 0.03, + "learning_rate": 1.9328181429847383e-07, + "loss": 0.2641, + "step": 1780 + }, + { + "epoch": 0.03, + "learning_rate": 1.932779309541377e-07, + "loss": 0.6258, + "step": 1781 + }, + { + "epoch": 0.03, + "learning_rate": 1.9327404760980154e-07, + "loss": 0.2535, + "step": 1782 + }, + { + "epoch": 0.03, + "learning_rate": 1.9327016426546542e-07, + "loss": 0.2507, + "step": 1783 + }, + { + "epoch": 0.03, + "learning_rate": 1.9326628092112926e-07, + "loss": 0.3822, + "step": 1784 + }, + { + "epoch": 0.03, + "learning_rate": 1.9326239757679313e-07, + "loss": 0.3735, + "step": 1785 + }, + { + "epoch": 0.03, + "learning_rate": 1.9325851423245698e-07, + "loss": 0.3199, + "step": 1786 + }, + { + "epoch": 0.03, + "learning_rate": 1.9325463088812085e-07, + "loss": 0.4151, + "step": 1787 + }, + { + "epoch": 0.03, + "learning_rate": 1.932507475437847e-07, + "loss": 0.3442, + "step": 1788 + }, + { + "epoch": 0.03, + "learning_rate": 1.9324686419944856e-07, + "loss": 0.463, + "step": 1789 + }, + { + "epoch": 0.03, + "learning_rate": 1.932429808551124e-07, + "loss": 0.2227, + "step": 1790 + }, + { + "epoch": 0.03, + "learning_rate": 1.9323909751077628e-07, + "loss": 0.2563, + "step": 1791 + }, + { + "epoch": 0.03, + "learning_rate": 1.9323521416644013e-07, + "loss": 0.3446, + "step": 1792 + }, + { + "epoch": 0.03, + "learning_rate": 1.93231330822104e-07, + "loss": 0.3892, + "step": 1793 + }, + { + "epoch": 0.03, + "learning_rate": 1.9322744747776784e-07, + "loss": 0.4542, + "step": 1794 + }, + { + "epoch": 0.03, + "learning_rate": 1.9322356413343171e-07, + "loss": 0.3281, + "step": 1795 + }, + { + "epoch": 0.03, + "learning_rate": 1.9321968078909556e-07, + "loss": 0.322, + "step": 1796 + }, + { + "epoch": 0.03, + "learning_rate": 1.9321579744475943e-07, + "loss": 0.2692, + "step": 1797 + }, + { + "epoch": 0.03, + "learning_rate": 1.9321191410042328e-07, + "loss": 0.2931, + "step": 1798 + }, + { + "epoch": 0.03, + "learning_rate": 1.9320803075608715e-07, + "loss": 0.2748, + "step": 1799 + }, + { + "epoch": 0.03, + "learning_rate": 1.93204147411751e-07, + "loss": 0.2826, + "step": 1800 + }, + { + "epoch": 0.03, + "learning_rate": 1.9320026406741486e-07, + "loss": 0.3793, + "step": 1801 + }, + { + "epoch": 0.03, + "learning_rate": 1.931963807230787e-07, + "loss": 0.2702, + "step": 1802 + }, + { + "epoch": 0.03, + "learning_rate": 1.9319249737874258e-07, + "loss": 0.2915, + "step": 1803 + }, + { + "epoch": 0.03, + "learning_rate": 1.9318861403440643e-07, + "loss": 0.4175, + "step": 1804 + }, + { + "epoch": 0.04, + "learning_rate": 1.931847306900703e-07, + "loss": 0.4331, + "step": 1805 + }, + { + "epoch": 0.04, + "learning_rate": 1.9318084734573414e-07, + "loss": 0.4283, + "step": 1806 + }, + { + "epoch": 0.04, + "learning_rate": 1.93176964001398e-07, + "loss": 0.3778, + "step": 1807 + }, + { + "epoch": 0.04, + "learning_rate": 1.9317308065706186e-07, + "loss": 0.2722, + "step": 1808 + }, + { + "epoch": 0.04, + "learning_rate": 1.9316919731272573e-07, + "loss": 0.267, + "step": 1809 + }, + { + "epoch": 0.04, + "learning_rate": 1.9316531396838957e-07, + "loss": 0.2676, + "step": 1810 + }, + { + "epoch": 0.04, + "learning_rate": 1.9316143062405345e-07, + "loss": 0.2954, + "step": 1811 + }, + { + "epoch": 0.04, + "learning_rate": 1.931575472797173e-07, + "loss": 0.4044, + "step": 1812 + }, + { + "epoch": 0.04, + "learning_rate": 1.9315366393538116e-07, + "loss": 0.3778, + "step": 1813 + }, + { + "epoch": 0.04, + "learning_rate": 1.93149780591045e-07, + "loss": 0.4385, + "step": 1814 + }, + { + "epoch": 0.04, + "learning_rate": 1.9314589724670888e-07, + "loss": 0.4284, + "step": 1815 + }, + { + "epoch": 0.04, + "learning_rate": 1.9314201390237272e-07, + "loss": 0.3004, + "step": 1816 + }, + { + "epoch": 0.04, + "learning_rate": 1.931381305580366e-07, + "loss": 0.2736, + "step": 1817 + }, + { + "epoch": 0.04, + "learning_rate": 1.9313424721370044e-07, + "loss": 0.4952, + "step": 1818 + }, + { + "epoch": 0.04, + "learning_rate": 1.9313036386936429e-07, + "loss": 0.6012, + "step": 1819 + }, + { + "epoch": 0.04, + "learning_rate": 1.9312648052502813e-07, + "loss": 0.4044, + "step": 1820 + }, + { + "epoch": 0.04, + "learning_rate": 1.93122597180692e-07, + "loss": 0.3551, + "step": 1821 + }, + { + "epoch": 0.04, + "learning_rate": 1.9311871383635585e-07, + "loss": 0.3032, + "step": 1822 + }, + { + "epoch": 0.04, + "learning_rate": 1.9311483049201972e-07, + "loss": 0.4021, + "step": 1823 + }, + { + "epoch": 0.04, + "learning_rate": 1.9311094714768356e-07, + "loss": 0.3118, + "step": 1824 + }, + { + "epoch": 0.04, + "learning_rate": 1.9310706380334743e-07, + "loss": 0.3377, + "step": 1825 + }, + { + "epoch": 0.04, + "learning_rate": 1.9310318045901128e-07, + "loss": 0.2378, + "step": 1826 + }, + { + "epoch": 0.04, + "learning_rate": 1.9309929711467515e-07, + "loss": 0.305, + "step": 1827 + }, + { + "epoch": 0.04, + "learning_rate": 1.93095413770339e-07, + "loss": 0.7563, + "step": 1828 + }, + { + "epoch": 0.04, + "learning_rate": 1.9309153042600287e-07, + "loss": 0.6599, + "step": 1829 + }, + { + "epoch": 0.04, + "learning_rate": 1.930876470816667e-07, + "loss": 0.3261, + "step": 1830 + }, + { + "epoch": 0.04, + "learning_rate": 1.9308376373733058e-07, + "loss": 0.6185, + "step": 1831 + }, + { + "epoch": 0.04, + "learning_rate": 1.9307988039299443e-07, + "loss": 0.3424, + "step": 1832 + }, + { + "epoch": 0.04, + "learning_rate": 1.930759970486583e-07, + "loss": 0.3952, + "step": 1833 + }, + { + "epoch": 0.04, + "learning_rate": 1.9307211370432215e-07, + "loss": 0.3131, + "step": 1834 + }, + { + "epoch": 0.04, + "learning_rate": 1.9306823035998602e-07, + "loss": 0.2932, + "step": 1835 + }, + { + "epoch": 0.04, + "learning_rate": 1.9306434701564986e-07, + "loss": 0.537, + "step": 1836 + }, + { + "epoch": 0.04, + "learning_rate": 1.9306046367131373e-07, + "loss": 0.6991, + "step": 1837 + }, + { + "epoch": 0.04, + "learning_rate": 1.9305658032697758e-07, + "loss": 0.3839, + "step": 1838 + }, + { + "epoch": 0.04, + "learning_rate": 1.9305269698264145e-07, + "loss": 0.429, + "step": 1839 + }, + { + "epoch": 0.04, + "learning_rate": 1.930488136383053e-07, + "loss": 0.6514, + "step": 1840 + }, + { + "epoch": 0.04, + "learning_rate": 1.9304493029396917e-07, + "loss": 0.2944, + "step": 1841 + }, + { + "epoch": 0.04, + "learning_rate": 1.93041046949633e-07, + "loss": 0.2041, + "step": 1842 + }, + { + "epoch": 0.04, + "learning_rate": 1.9303716360529688e-07, + "loss": 0.5668, + "step": 1843 + }, + { + "epoch": 0.04, + "learning_rate": 1.9303328026096073e-07, + "loss": 0.2439, + "step": 1844 + }, + { + "epoch": 0.04, + "learning_rate": 1.930293969166246e-07, + "loss": 0.318, + "step": 1845 + }, + { + "epoch": 0.04, + "learning_rate": 1.9302551357228844e-07, + "loss": 0.3326, + "step": 1846 + }, + { + "epoch": 0.04, + "learning_rate": 1.9302163022795232e-07, + "loss": 0.2842, + "step": 1847 + }, + { + "epoch": 0.04, + "learning_rate": 1.9301774688361616e-07, + "loss": 0.3493, + "step": 1848 + }, + { + "epoch": 0.04, + "learning_rate": 1.9301386353928003e-07, + "loss": 0.3356, + "step": 1849 + }, + { + "epoch": 0.04, + "learning_rate": 1.9300998019494388e-07, + "loss": 0.2175, + "step": 1850 + }, + { + "epoch": 0.04, + "learning_rate": 1.9300609685060772e-07, + "loss": 0.3069, + "step": 1851 + }, + { + "epoch": 0.04, + "learning_rate": 1.930022135062716e-07, + "loss": 0.5014, + "step": 1852 + }, + { + "epoch": 0.04, + "learning_rate": 1.9299833016193544e-07, + "loss": 0.2845, + "step": 1853 + }, + { + "epoch": 0.04, + "learning_rate": 1.929944468175993e-07, + "loss": 0.256, + "step": 1854 + }, + { + "epoch": 0.04, + "learning_rate": 1.9299056347326316e-07, + "loss": 0.4956, + "step": 1855 + }, + { + "epoch": 0.04, + "learning_rate": 1.9298668012892703e-07, + "loss": 0.254, + "step": 1856 + }, + { + "epoch": 0.04, + "learning_rate": 1.9298279678459087e-07, + "loss": 0.3141, + "step": 1857 + }, + { + "epoch": 0.04, + "learning_rate": 1.9297891344025474e-07, + "loss": 0.3301, + "step": 1858 + }, + { + "epoch": 0.04, + "learning_rate": 1.929750300959186e-07, + "loss": 0.3385, + "step": 1859 + }, + { + "epoch": 0.04, + "learning_rate": 1.9297114675158246e-07, + "loss": 0.4955, + "step": 1860 + }, + { + "epoch": 0.04, + "learning_rate": 1.929672634072463e-07, + "loss": 0.4818, + "step": 1861 + }, + { + "epoch": 0.04, + "learning_rate": 1.9296338006291018e-07, + "loss": 0.345, + "step": 1862 + }, + { + "epoch": 0.04, + "learning_rate": 1.9295949671857402e-07, + "loss": 0.4295, + "step": 1863 + }, + { + "epoch": 0.04, + "learning_rate": 1.929556133742379e-07, + "loss": 0.2479, + "step": 1864 + }, + { + "epoch": 0.04, + "learning_rate": 1.9295173002990174e-07, + "loss": 0.2655, + "step": 1865 + }, + { + "epoch": 0.04, + "learning_rate": 1.929478466855656e-07, + "loss": 0.3026, + "step": 1866 + }, + { + "epoch": 0.04, + "learning_rate": 1.9294396334122945e-07, + "loss": 0.2876, + "step": 1867 + }, + { + "epoch": 0.04, + "learning_rate": 1.9294007999689333e-07, + "loss": 0.2574, + "step": 1868 + }, + { + "epoch": 0.04, + "learning_rate": 1.9293619665255717e-07, + "loss": 0.3196, + "step": 1869 + }, + { + "epoch": 0.04, + "learning_rate": 1.9293231330822104e-07, + "loss": 0.2729, + "step": 1870 + }, + { + "epoch": 0.04, + "learning_rate": 1.929284299638849e-07, + "loss": 0.2984, + "step": 1871 + }, + { + "epoch": 0.04, + "learning_rate": 1.9292454661954876e-07, + "loss": 0.2882, + "step": 1872 + }, + { + "epoch": 0.04, + "learning_rate": 1.929206632752126e-07, + "loss": 0.3088, + "step": 1873 + }, + { + "epoch": 0.04, + "learning_rate": 1.9291677993087648e-07, + "loss": 0.3047, + "step": 1874 + }, + { + "epoch": 0.04, + "learning_rate": 1.9291289658654032e-07, + "loss": 0.2856, + "step": 1875 + }, + { + "epoch": 0.04, + "learning_rate": 1.929090132422042e-07, + "loss": 0.4542, + "step": 1876 + }, + { + "epoch": 0.04, + "learning_rate": 1.9290512989786804e-07, + "loss": 0.3027, + "step": 1877 + }, + { + "epoch": 0.04, + "learning_rate": 1.9290124655353188e-07, + "loss": 0.3433, + "step": 1878 + }, + { + "epoch": 0.04, + "learning_rate": 1.9289736320919573e-07, + "loss": 0.512, + "step": 1879 + }, + { + "epoch": 0.04, + "learning_rate": 1.928934798648596e-07, + "loss": 0.327, + "step": 1880 + }, + { + "epoch": 0.04, + "learning_rate": 1.9288959652052344e-07, + "loss": 0.3231, + "step": 1881 + }, + { + "epoch": 0.04, + "learning_rate": 1.9288571317618732e-07, + "loss": 0.2323, + "step": 1882 + }, + { + "epoch": 0.04, + "learning_rate": 1.9288182983185116e-07, + "loss": 0.4093, + "step": 1883 + }, + { + "epoch": 0.04, + "learning_rate": 1.9287794648751503e-07, + "loss": 0.2973, + "step": 1884 + }, + { + "epoch": 0.04, + "learning_rate": 1.9287406314317888e-07, + "loss": 0.33, + "step": 1885 + }, + { + "epoch": 0.04, + "learning_rate": 1.9287017979884275e-07, + "loss": 0.3841, + "step": 1886 + }, + { + "epoch": 0.04, + "learning_rate": 1.928662964545066e-07, + "loss": 0.3823, + "step": 1887 + }, + { + "epoch": 0.04, + "learning_rate": 1.9286241311017046e-07, + "loss": 0.2643, + "step": 1888 + }, + { + "epoch": 0.04, + "learning_rate": 1.928585297658343e-07, + "loss": 0.3019, + "step": 1889 + }, + { + "epoch": 0.04, + "learning_rate": 1.9285464642149818e-07, + "loss": 0.2258, + "step": 1890 + }, + { + "epoch": 0.04, + "learning_rate": 1.9285076307716203e-07, + "loss": 0.4932, + "step": 1891 + }, + { + "epoch": 0.04, + "learning_rate": 1.928468797328259e-07, + "loss": 0.4053, + "step": 1892 + }, + { + "epoch": 0.04, + "learning_rate": 1.9284299638848974e-07, + "loss": 0.5971, + "step": 1893 + }, + { + "epoch": 0.04, + "learning_rate": 1.9283911304415361e-07, + "loss": 0.3011, + "step": 1894 + }, + { + "epoch": 0.04, + "learning_rate": 1.9283522969981746e-07, + "loss": 0.2189, + "step": 1895 + }, + { + "epoch": 0.04, + "learning_rate": 1.9283134635548133e-07, + "loss": 0.3877, + "step": 1896 + }, + { + "epoch": 0.04, + "learning_rate": 1.9282746301114518e-07, + "loss": 0.2419, + "step": 1897 + }, + { + "epoch": 0.04, + "learning_rate": 1.9282357966680905e-07, + "loss": 0.4591, + "step": 1898 + }, + { + "epoch": 0.04, + "learning_rate": 1.928196963224729e-07, + "loss": 0.2317, + "step": 1899 + }, + { + "epoch": 0.04, + "learning_rate": 1.9281581297813676e-07, + "loss": 0.3198, + "step": 1900 + }, + { + "epoch": 0.04, + "learning_rate": 1.928119296338006e-07, + "loss": 0.2834, + "step": 1901 + }, + { + "epoch": 0.04, + "learning_rate": 1.9280804628946448e-07, + "loss": 0.272, + "step": 1902 + }, + { + "epoch": 0.04, + "learning_rate": 1.9280416294512833e-07, + "loss": 0.286, + "step": 1903 + }, + { + "epoch": 0.04, + "learning_rate": 1.928002796007922e-07, + "loss": 0.3225, + "step": 1904 + }, + { + "epoch": 0.04, + "learning_rate": 1.9279639625645604e-07, + "loss": 0.3882, + "step": 1905 + }, + { + "epoch": 0.04, + "learning_rate": 1.927925129121199e-07, + "loss": 0.4501, + "step": 1906 + }, + { + "epoch": 0.04, + "learning_rate": 1.9278862956778376e-07, + "loss": 0.3854, + "step": 1907 + }, + { + "epoch": 0.04, + "learning_rate": 1.9278474622344763e-07, + "loss": 0.3102, + "step": 1908 + }, + { + "epoch": 0.04, + "learning_rate": 1.9278086287911147e-07, + "loss": 0.6939, + "step": 1909 + }, + { + "epoch": 0.04, + "learning_rate": 1.9277697953477535e-07, + "loss": 0.2929, + "step": 1910 + }, + { + "epoch": 0.04, + "learning_rate": 1.927730961904392e-07, + "loss": 0.2914, + "step": 1911 + }, + { + "epoch": 0.04, + "learning_rate": 1.9276921284610306e-07, + "loss": 0.3297, + "step": 1912 + }, + { + "epoch": 0.04, + "learning_rate": 1.927653295017669e-07, + "loss": 0.5926, + "step": 1913 + }, + { + "epoch": 0.04, + "learning_rate": 1.9276144615743078e-07, + "loss": 0.1951, + "step": 1914 + }, + { + "epoch": 0.04, + "learning_rate": 1.9275756281309462e-07, + "loss": 0.5432, + "step": 1915 + }, + { + "epoch": 0.04, + "learning_rate": 1.927536794687585e-07, + "loss": 0.2427, + "step": 1916 + }, + { + "epoch": 0.04, + "learning_rate": 1.9274979612442234e-07, + "loss": 0.342, + "step": 1917 + }, + { + "epoch": 0.04, + "learning_rate": 1.927459127800862e-07, + "loss": 0.2846, + "step": 1918 + }, + { + "epoch": 0.04, + "learning_rate": 1.9274202943575006e-07, + "loss": 0.2617, + "step": 1919 + }, + { + "epoch": 0.04, + "learning_rate": 1.9273814609141393e-07, + "loss": 0.2942, + "step": 1920 + }, + { + "epoch": 0.04, + "learning_rate": 1.9273426274707777e-07, + "loss": 0.2958, + "step": 1921 + }, + { + "epoch": 0.04, + "learning_rate": 1.9273037940274164e-07, + "loss": 0.3068, + "step": 1922 + }, + { + "epoch": 0.04, + "learning_rate": 1.927264960584055e-07, + "loss": 0.3729, + "step": 1923 + }, + { + "epoch": 0.04, + "learning_rate": 1.9272261271406936e-07, + "loss": 0.3711, + "step": 1924 + }, + { + "epoch": 0.04, + "learning_rate": 1.927187293697332e-07, + "loss": 0.6538, + "step": 1925 + }, + { + "epoch": 0.04, + "learning_rate": 1.9271484602539708e-07, + "loss": 0.4399, + "step": 1926 + }, + { + "epoch": 0.04, + "learning_rate": 1.9271096268106092e-07, + "loss": 0.2061, + "step": 1927 + }, + { + "epoch": 0.04, + "learning_rate": 1.927070793367248e-07, + "loss": 0.5157, + "step": 1928 + }, + { + "epoch": 0.04, + "learning_rate": 1.9270319599238864e-07, + "loss": 0.2807, + "step": 1929 + }, + { + "epoch": 0.04, + "learning_rate": 1.926993126480525e-07, + "loss": 0.4566, + "step": 1930 + }, + { + "epoch": 0.04, + "learning_rate": 1.9269542930371636e-07, + "loss": 0.481, + "step": 1931 + }, + { + "epoch": 0.04, + "learning_rate": 1.9269154595938023e-07, + "loss": 0.3284, + "step": 1932 + }, + { + "epoch": 0.04, + "learning_rate": 1.9268766261504407e-07, + "loss": 0.3945, + "step": 1933 + }, + { + "epoch": 0.04, + "learning_rate": 1.9268377927070794e-07, + "loss": 0.3886, + "step": 1934 + }, + { + "epoch": 0.04, + "learning_rate": 1.9267989592637176e-07, + "loss": 0.3881, + "step": 1935 + }, + { + "epoch": 0.04, + "learning_rate": 1.9267601258203563e-07, + "loss": 0.5136, + "step": 1936 + }, + { + "epoch": 0.04, + "learning_rate": 1.9267212923769948e-07, + "loss": 0.2928, + "step": 1937 + }, + { + "epoch": 0.04, + "learning_rate": 1.9266824589336335e-07, + "loss": 0.4786, + "step": 1938 + }, + { + "epoch": 0.04, + "learning_rate": 1.926643625490272e-07, + "loss": 0.2858, + "step": 1939 + }, + { + "epoch": 0.04, + "learning_rate": 1.9266047920469107e-07, + "loss": 0.3595, + "step": 1940 + }, + { + "epoch": 0.04, + "learning_rate": 1.926565958603549e-07, + "loss": 0.2321, + "step": 1941 + }, + { + "epoch": 0.04, + "learning_rate": 1.9265271251601878e-07, + "loss": 0.247, + "step": 1942 + }, + { + "epoch": 0.04, + "learning_rate": 1.9264882917168263e-07, + "loss": 0.2053, + "step": 1943 + }, + { + "epoch": 0.04, + "learning_rate": 1.926449458273465e-07, + "loss": 0.2667, + "step": 1944 + }, + { + "epoch": 0.04, + "learning_rate": 1.9264106248301034e-07, + "loss": 0.5025, + "step": 1945 + }, + { + "epoch": 0.04, + "learning_rate": 1.9263717913867422e-07, + "loss": 0.3271, + "step": 1946 + }, + { + "epoch": 0.04, + "learning_rate": 1.9263329579433806e-07, + "loss": 0.2376, + "step": 1947 + }, + { + "epoch": 0.04, + "learning_rate": 1.9262941245000193e-07, + "loss": 0.2468, + "step": 1948 + }, + { + "epoch": 0.04, + "learning_rate": 1.9262552910566578e-07, + "loss": 0.2141, + "step": 1949 + }, + { + "epoch": 0.04, + "learning_rate": 1.9262164576132965e-07, + "loss": 0.4381, + "step": 1950 + }, + { + "epoch": 0.04, + "learning_rate": 1.926177624169935e-07, + "loss": 0.2836, + "step": 1951 + }, + { + "epoch": 0.04, + "learning_rate": 1.9261387907265737e-07, + "loss": 0.5527, + "step": 1952 + }, + { + "epoch": 0.04, + "learning_rate": 1.926099957283212e-07, + "loss": 0.3346, + "step": 1953 + }, + { + "epoch": 0.04, + "learning_rate": 1.9260611238398508e-07, + "loss": 0.215, + "step": 1954 + }, + { + "epoch": 0.04, + "learning_rate": 1.9260222903964893e-07, + "loss": 0.4251, + "step": 1955 + }, + { + "epoch": 0.04, + "learning_rate": 1.925983456953128e-07, + "loss": 0.2849, + "step": 1956 + }, + { + "epoch": 0.04, + "learning_rate": 1.9259446235097664e-07, + "loss": 0.3089, + "step": 1957 + }, + { + "epoch": 0.04, + "learning_rate": 1.9259057900664052e-07, + "loss": 0.5037, + "step": 1958 + }, + { + "epoch": 0.04, + "learning_rate": 1.9258669566230436e-07, + "loss": 0.27, + "step": 1959 + }, + { + "epoch": 0.04, + "learning_rate": 1.9258281231796823e-07, + "loss": 0.3634, + "step": 1960 + }, + { + "epoch": 0.04, + "learning_rate": 1.9257892897363208e-07, + "loss": 0.2638, + "step": 1961 + }, + { + "epoch": 0.04, + "learning_rate": 1.9257504562929595e-07, + "loss": 0.598, + "step": 1962 + }, + { + "epoch": 0.04, + "learning_rate": 1.925711622849598e-07, + "loss": 0.3694, + "step": 1963 + }, + { + "epoch": 0.04, + "learning_rate": 1.9256727894062366e-07, + "loss": 0.3569, + "step": 1964 + }, + { + "epoch": 0.04, + "learning_rate": 1.925633955962875e-07, + "loss": 0.3125, + "step": 1965 + }, + { + "epoch": 0.04, + "learning_rate": 1.9255951225195138e-07, + "loss": 0.2432, + "step": 1966 + }, + { + "epoch": 0.04, + "learning_rate": 1.9255562890761523e-07, + "loss": 0.3424, + "step": 1967 + }, + { + "epoch": 0.04, + "learning_rate": 1.925517455632791e-07, + "loss": 0.5105, + "step": 1968 + }, + { + "epoch": 0.04, + "learning_rate": 1.9254786221894294e-07, + "loss": 0.2963, + "step": 1969 + }, + { + "epoch": 0.04, + "learning_rate": 1.9254397887460681e-07, + "loss": 0.2125, + "step": 1970 + }, + { + "epoch": 0.04, + "learning_rate": 1.9254009553027066e-07, + "loss": 0.234, + "step": 1971 + }, + { + "epoch": 0.04, + "learning_rate": 1.9253621218593453e-07, + "loss": 0.2824, + "step": 1972 + }, + { + "epoch": 0.04, + "learning_rate": 1.9253232884159838e-07, + "loss": 0.4151, + "step": 1973 + }, + { + "epoch": 0.04, + "learning_rate": 1.9252844549726225e-07, + "loss": 0.2051, + "step": 1974 + }, + { + "epoch": 0.04, + "learning_rate": 1.925245621529261e-07, + "loss": 0.2545, + "step": 1975 + }, + { + "epoch": 0.04, + "learning_rate": 1.9252067880858996e-07, + "loss": 0.2829, + "step": 1976 + }, + { + "epoch": 0.04, + "learning_rate": 1.925167954642538e-07, + "loss": 0.3514, + "step": 1977 + }, + { + "epoch": 0.04, + "learning_rate": 1.9251291211991768e-07, + "loss": 0.4905, + "step": 1978 + }, + { + "epoch": 0.04, + "learning_rate": 1.9250902877558153e-07, + "loss": 0.4551, + "step": 1979 + }, + { + "epoch": 0.04, + "learning_rate": 1.925051454312454e-07, + "loss": 0.3967, + "step": 1980 + }, + { + "epoch": 0.04, + "learning_rate": 1.9250126208690924e-07, + "loss": 0.6381, + "step": 1981 + }, + { + "epoch": 0.04, + "learning_rate": 1.924973787425731e-07, + "loss": 0.3923, + "step": 1982 + }, + { + "epoch": 0.04, + "learning_rate": 1.9249349539823696e-07, + "loss": 0.3029, + "step": 1983 + }, + { + "epoch": 0.04, + "learning_rate": 1.9248961205390083e-07, + "loss": 0.4454, + "step": 1984 + }, + { + "epoch": 0.04, + "learning_rate": 1.9248572870956467e-07, + "loss": 0.2274, + "step": 1985 + }, + { + "epoch": 0.04, + "learning_rate": 1.9248184536522855e-07, + "loss": 0.3112, + "step": 1986 + }, + { + "epoch": 0.04, + "learning_rate": 1.924779620208924e-07, + "loss": 0.3088, + "step": 1987 + }, + { + "epoch": 0.04, + "learning_rate": 1.9247407867655626e-07, + "loss": 0.2036, + "step": 1988 + }, + { + "epoch": 0.04, + "learning_rate": 1.924701953322201e-07, + "loss": 0.199, + "step": 1989 + }, + { + "epoch": 0.04, + "learning_rate": 1.9246631198788398e-07, + "loss": 0.1981, + "step": 1990 + }, + { + "epoch": 0.04, + "learning_rate": 1.9246242864354782e-07, + "loss": 0.1873, + "step": 1991 + }, + { + "epoch": 0.04, + "learning_rate": 1.924585452992117e-07, + "loss": 0.7788, + "step": 1992 + }, + { + "epoch": 0.04, + "learning_rate": 1.9245466195487551e-07, + "loss": 0.4571, + "step": 1993 + }, + { + "epoch": 0.04, + "learning_rate": 1.9245077861053939e-07, + "loss": 0.5966, + "step": 1994 + }, + { + "epoch": 0.04, + "learning_rate": 1.9244689526620323e-07, + "loss": 0.5057, + "step": 1995 + }, + { + "epoch": 0.04, + "learning_rate": 1.924430119218671e-07, + "loss": 0.4973, + "step": 1996 + }, + { + "epoch": 0.04, + "learning_rate": 1.9243912857753095e-07, + "loss": 0.2537, + "step": 1997 + }, + { + "epoch": 0.04, + "learning_rate": 1.9243524523319482e-07, + "loss": 0.1891, + "step": 1998 + }, + { + "epoch": 0.04, + "learning_rate": 1.9243136188885866e-07, + "loss": 0.2542, + "step": 1999 + }, + { + "epoch": 0.04, + "learning_rate": 1.9242747854452254e-07, + "loss": 0.3691, + "step": 2000 + }, + { + "epoch": 0.04, + "learning_rate": 1.9242359520018638e-07, + "loss": 0.6, + "step": 2001 + }, + { + "epoch": 0.04, + "learning_rate": 1.9241971185585025e-07, + "loss": 0.3878, + "step": 2002 + }, + { + "epoch": 0.04, + "learning_rate": 1.924158285115141e-07, + "loss": 0.2697, + "step": 2003 + }, + { + "epoch": 0.04, + "learning_rate": 1.9241194516717797e-07, + "loss": 0.4711, + "step": 2004 + }, + { + "epoch": 0.04, + "learning_rate": 1.924080618228418e-07, + "loss": 0.2745, + "step": 2005 + }, + { + "epoch": 0.04, + "learning_rate": 1.9240417847850568e-07, + "loss": 0.2472, + "step": 2006 + }, + { + "epoch": 0.04, + "learning_rate": 1.9240029513416953e-07, + "loss": 0.3686, + "step": 2007 + }, + { + "epoch": 0.04, + "learning_rate": 1.923964117898334e-07, + "loss": 0.4389, + "step": 2008 + }, + { + "epoch": 0.04, + "learning_rate": 1.9239252844549725e-07, + "loss": 0.3944, + "step": 2009 + }, + { + "epoch": 0.04, + "learning_rate": 1.9238864510116112e-07, + "loss": 0.2511, + "step": 2010 + }, + { + "epoch": 0.04, + "learning_rate": 1.9238476175682496e-07, + "loss": 0.2143, + "step": 2011 + }, + { + "epoch": 0.04, + "learning_rate": 1.9238087841248883e-07, + "loss": 0.4522, + "step": 2012 + }, + { + "epoch": 0.04, + "learning_rate": 1.9237699506815268e-07, + "loss": 0.3354, + "step": 2013 + }, + { + "epoch": 0.04, + "learning_rate": 1.9237311172381655e-07, + "loss": 0.2239, + "step": 2014 + }, + { + "epoch": 0.04, + "learning_rate": 1.923692283794804e-07, + "loss": 0.2651, + "step": 2015 + }, + { + "epoch": 0.04, + "learning_rate": 1.9236534503514427e-07, + "loss": 0.4428, + "step": 2016 + }, + { + "epoch": 0.04, + "learning_rate": 1.923614616908081e-07, + "loss": 0.2687, + "step": 2017 + }, + { + "epoch": 0.04, + "learning_rate": 1.9235757834647198e-07, + "loss": 0.406, + "step": 2018 + }, + { + "epoch": 0.04, + "learning_rate": 1.9235369500213583e-07, + "loss": 0.2749, + "step": 2019 + }, + { + "epoch": 0.04, + "learning_rate": 1.923498116577997e-07, + "loss": 0.326, + "step": 2020 + }, + { + "epoch": 0.04, + "learning_rate": 1.9234592831346354e-07, + "loss": 0.337, + "step": 2021 + }, + { + "epoch": 0.04, + "learning_rate": 1.9234204496912742e-07, + "loss": 0.2266, + "step": 2022 + }, + { + "epoch": 0.04, + "learning_rate": 1.9233816162479126e-07, + "loss": 0.2312, + "step": 2023 + }, + { + "epoch": 0.04, + "learning_rate": 1.9233427828045513e-07, + "loss": 0.3068, + "step": 2024 + }, + { + "epoch": 0.04, + "learning_rate": 1.9233039493611898e-07, + "loss": 0.2553, + "step": 2025 + }, + { + "epoch": 0.04, + "learning_rate": 1.9232651159178285e-07, + "loss": 0.2159, + "step": 2026 + }, + { + "epoch": 0.04, + "learning_rate": 1.923226282474467e-07, + "loss": 0.2785, + "step": 2027 + }, + { + "epoch": 0.04, + "learning_rate": 1.9231874490311054e-07, + "loss": 0.2451, + "step": 2028 + }, + { + "epoch": 0.04, + "learning_rate": 1.923148615587744e-07, + "loss": 0.2162, + "step": 2029 + }, + { + "epoch": 0.04, + "learning_rate": 1.9231097821443826e-07, + "loss": 0.5102, + "step": 2030 + }, + { + "epoch": 0.04, + "learning_rate": 1.9230709487010213e-07, + "loss": 0.3161, + "step": 2031 + }, + { + "epoch": 0.04, + "learning_rate": 1.9230321152576597e-07, + "loss": 0.2005, + "step": 2032 + }, + { + "epoch": 0.04, + "learning_rate": 1.9229932818142984e-07, + "loss": 0.3959, + "step": 2033 + }, + { + "epoch": 0.04, + "learning_rate": 1.922954448370937e-07, + "loss": 0.5131, + "step": 2034 + }, + { + "epoch": 0.04, + "learning_rate": 1.9229156149275756e-07, + "loss": 0.2642, + "step": 2035 + }, + { + "epoch": 0.04, + "learning_rate": 1.922876781484214e-07, + "loss": 0.2121, + "step": 2036 + }, + { + "epoch": 0.04, + "learning_rate": 1.9228379480408528e-07, + "loss": 0.3537, + "step": 2037 + }, + { + "epoch": 0.04, + "learning_rate": 1.9227991145974912e-07, + "loss": 0.1759, + "step": 2038 + }, + { + "epoch": 0.04, + "learning_rate": 1.92276028115413e-07, + "loss": 0.1992, + "step": 2039 + }, + { + "epoch": 0.04, + "learning_rate": 1.9227214477107684e-07, + "loss": 0.2122, + "step": 2040 + }, + { + "epoch": 0.04, + "learning_rate": 1.922682614267407e-07, + "loss": 0.3602, + "step": 2041 + }, + { + "epoch": 0.04, + "learning_rate": 1.9226437808240455e-07, + "loss": 0.1949, + "step": 2042 + }, + { + "epoch": 0.04, + "learning_rate": 1.9226049473806843e-07, + "loss": 0.4243, + "step": 2043 + }, + { + "epoch": 0.04, + "learning_rate": 1.9225661139373227e-07, + "loss": 0.2538, + "step": 2044 + }, + { + "epoch": 0.04, + "learning_rate": 1.9225272804939614e-07, + "loss": 0.327, + "step": 2045 + }, + { + "epoch": 0.04, + "learning_rate": 1.9224884470506e-07, + "loss": 0.1903, + "step": 2046 + }, + { + "epoch": 0.04, + "learning_rate": 1.9224496136072386e-07, + "loss": 0.4231, + "step": 2047 + }, + { + "epoch": 0.04, + "learning_rate": 1.922410780163877e-07, + "loss": 0.2831, + "step": 2048 + }, + { + "epoch": 0.04, + "learning_rate": 1.9223719467205158e-07, + "loss": 0.1947, + "step": 2049 + }, + { + "epoch": 0.04, + "learning_rate": 1.9223331132771542e-07, + "loss": 0.4156, + "step": 2050 + }, + { + "epoch": 0.04, + "learning_rate": 1.9222942798337927e-07, + "loss": 0.6674, + "step": 2051 + }, + { + "epoch": 0.04, + "learning_rate": 1.9222554463904314e-07, + "loss": 0.3858, + "step": 2052 + }, + { + "epoch": 0.04, + "learning_rate": 1.9222166129470698e-07, + "loss": 0.415, + "step": 2053 + }, + { + "epoch": 0.04, + "learning_rate": 1.9221777795037085e-07, + "loss": 0.45, + "step": 2054 + }, + { + "epoch": 0.04, + "learning_rate": 1.922138946060347e-07, + "loss": 0.2048, + "step": 2055 + }, + { + "epoch": 0.04, + "learning_rate": 1.9221001126169854e-07, + "loss": 0.1992, + "step": 2056 + }, + { + "epoch": 0.04, + "learning_rate": 1.9220612791736242e-07, + "loss": 0.3579, + "step": 2057 + }, + { + "epoch": 0.04, + "learning_rate": 1.9220224457302626e-07, + "loss": 0.2476, + "step": 2058 + }, + { + "epoch": 0.04, + "learning_rate": 1.9219836122869013e-07, + "loss": 0.3704, + "step": 2059 + }, + { + "epoch": 0.04, + "learning_rate": 1.9219447788435398e-07, + "loss": 0.1923, + "step": 2060 + }, + { + "epoch": 0.04, + "learning_rate": 1.9219059454001785e-07, + "loss": 0.1926, + "step": 2061 + }, + { + "epoch": 0.04, + "learning_rate": 1.921867111956817e-07, + "loss": 0.2448, + "step": 2062 + }, + { + "epoch": 0.04, + "learning_rate": 1.9218282785134556e-07, + "loss": 0.3345, + "step": 2063 + }, + { + "epoch": 0.04, + "learning_rate": 1.921789445070094e-07, + "loss": 0.2604, + "step": 2064 + }, + { + "epoch": 0.04, + "learning_rate": 1.9217506116267328e-07, + "loss": 0.2196, + "step": 2065 + }, + { + "epoch": 0.04, + "learning_rate": 1.9217117781833713e-07, + "loss": 0.3471, + "step": 2066 + }, + { + "epoch": 0.04, + "learning_rate": 1.92167294474001e-07, + "loss": 0.289, + "step": 2067 + }, + { + "epoch": 0.04, + "learning_rate": 1.9216341112966484e-07, + "loss": 0.2138, + "step": 2068 + }, + { + "epoch": 0.04, + "learning_rate": 1.9215952778532871e-07, + "loss": 0.2283, + "step": 2069 + }, + { + "epoch": 0.04, + "learning_rate": 1.9215564444099256e-07, + "loss": 0.3258, + "step": 2070 + }, + { + "epoch": 0.04, + "learning_rate": 1.9215176109665643e-07, + "loss": 0.7519, + "step": 2071 + }, + { + "epoch": 0.04, + "learning_rate": 1.9214787775232028e-07, + "loss": 0.3251, + "step": 2072 + }, + { + "epoch": 0.04, + "learning_rate": 1.9214399440798415e-07, + "loss": 0.2147, + "step": 2073 + }, + { + "epoch": 0.04, + "learning_rate": 1.92140111063648e-07, + "loss": 0.4046, + "step": 2074 + }, + { + "epoch": 0.04, + "learning_rate": 1.9213622771931186e-07, + "loss": 0.7641, + "step": 2075 + }, + { + "epoch": 0.04, + "learning_rate": 1.921323443749757e-07, + "loss": 0.3527, + "step": 2076 + }, + { + "epoch": 0.04, + "learning_rate": 1.9212846103063958e-07, + "loss": 0.4233, + "step": 2077 + }, + { + "epoch": 0.04, + "learning_rate": 1.9212457768630343e-07, + "loss": 0.4741, + "step": 2078 + }, + { + "epoch": 0.04, + "learning_rate": 1.921206943419673e-07, + "loss": 0.3561, + "step": 2079 + }, + { + "epoch": 0.04, + "learning_rate": 1.9211681099763114e-07, + "loss": 0.2997, + "step": 2080 + }, + { + "epoch": 0.04, + "learning_rate": 1.92112927653295e-07, + "loss": 0.3353, + "step": 2081 + }, + { + "epoch": 0.04, + "learning_rate": 1.9210904430895886e-07, + "loss": 0.3359, + "step": 2082 + }, + { + "epoch": 0.04, + "learning_rate": 1.9210516096462273e-07, + "loss": 0.3349, + "step": 2083 + }, + { + "epoch": 0.04, + "learning_rate": 1.9210127762028657e-07, + "loss": 0.3895, + "step": 2084 + }, + { + "epoch": 0.04, + "learning_rate": 1.9209739427595045e-07, + "loss": 0.1713, + "step": 2085 + }, + { + "epoch": 0.04, + "learning_rate": 1.920935109316143e-07, + "loss": 0.3574, + "step": 2086 + }, + { + "epoch": 0.04, + "learning_rate": 1.9208962758727816e-07, + "loss": 0.3035, + "step": 2087 + }, + { + "epoch": 0.04, + "learning_rate": 1.92085744242942e-07, + "loss": 0.1923, + "step": 2088 + }, + { + "epoch": 0.04, + "learning_rate": 1.9208186089860588e-07, + "loss": 0.2899, + "step": 2089 + }, + { + "epoch": 0.04, + "learning_rate": 1.9207797755426972e-07, + "loss": 0.2742, + "step": 2090 + }, + { + "epoch": 0.04, + "learning_rate": 1.920740942099336e-07, + "loss": 0.2082, + "step": 2091 + }, + { + "epoch": 0.04, + "learning_rate": 1.9207021086559744e-07, + "loss": 0.2923, + "step": 2092 + }, + { + "epoch": 0.04, + "learning_rate": 1.920663275212613e-07, + "loss": 0.3486, + "step": 2093 + }, + { + "epoch": 0.04, + "learning_rate": 1.9206244417692516e-07, + "loss": 0.3148, + "step": 2094 + }, + { + "epoch": 0.04, + "learning_rate": 1.9205856083258903e-07, + "loss": 0.2133, + "step": 2095 + }, + { + "epoch": 0.04, + "learning_rate": 1.9205467748825287e-07, + "loss": 0.1823, + "step": 2096 + }, + { + "epoch": 0.04, + "learning_rate": 1.9205079414391675e-07, + "loss": 0.368, + "step": 2097 + }, + { + "epoch": 0.04, + "learning_rate": 1.920469107995806e-07, + "loss": 0.3275, + "step": 2098 + }, + { + "epoch": 0.04, + "learning_rate": 1.9204302745524446e-07, + "loss": 0.3476, + "step": 2099 + }, + { + "epoch": 0.04, + "learning_rate": 1.920391441109083e-07, + "loss": 0.3229, + "step": 2100 + }, + { + "epoch": 0.04, + "learning_rate": 1.9203526076657218e-07, + "loss": 0.2084, + "step": 2101 + }, + { + "epoch": 0.04, + "learning_rate": 1.9203137742223602e-07, + "loss": 0.2382, + "step": 2102 + }, + { + "epoch": 0.04, + "learning_rate": 1.920274940778999e-07, + "loss": 0.2072, + "step": 2103 + }, + { + "epoch": 0.04, + "learning_rate": 1.9202361073356374e-07, + "loss": 0.218, + "step": 2104 + }, + { + "epoch": 0.04, + "learning_rate": 1.920197273892276e-07, + "loss": 0.2745, + "step": 2105 + }, + { + "epoch": 0.04, + "learning_rate": 1.9201584404489146e-07, + "loss": 0.4721, + "step": 2106 + }, + { + "epoch": 0.04, + "learning_rate": 1.9201196070055533e-07, + "loss": 0.7249, + "step": 2107 + }, + { + "epoch": 0.04, + "learning_rate": 1.9200807735621917e-07, + "loss": 0.2717, + "step": 2108 + }, + { + "epoch": 0.04, + "learning_rate": 1.9200419401188302e-07, + "loss": 0.1866, + "step": 2109 + }, + { + "epoch": 0.04, + "learning_rate": 1.9200031066754686e-07, + "loss": 0.1855, + "step": 2110 + }, + { + "epoch": 0.04, + "learning_rate": 1.9199642732321073e-07, + "loss": 0.2573, + "step": 2111 + }, + { + "epoch": 0.04, + "learning_rate": 1.9199254397887458e-07, + "loss": 0.4334, + "step": 2112 + }, + { + "epoch": 0.04, + "learning_rate": 1.9198866063453845e-07, + "loss": 0.2278, + "step": 2113 + }, + { + "epoch": 0.04, + "learning_rate": 1.919847772902023e-07, + "loss": 0.3346, + "step": 2114 + }, + { + "epoch": 0.04, + "learning_rate": 1.9198089394586617e-07, + "loss": 0.2275, + "step": 2115 + }, + { + "epoch": 0.04, + "learning_rate": 1.9197701060153e-07, + "loss": 0.3814, + "step": 2116 + }, + { + "epoch": 0.04, + "learning_rate": 1.9197312725719388e-07, + "loss": 0.2431, + "step": 2117 + }, + { + "epoch": 0.04, + "learning_rate": 1.9196924391285773e-07, + "loss": 0.27, + "step": 2118 + }, + { + "epoch": 0.04, + "learning_rate": 1.919653605685216e-07, + "loss": 0.5802, + "step": 2119 + }, + { + "epoch": 0.04, + "learning_rate": 1.9196147722418544e-07, + "loss": 0.3047, + "step": 2120 + }, + { + "epoch": 0.04, + "learning_rate": 1.9195759387984932e-07, + "loss": 0.347, + "step": 2121 + }, + { + "epoch": 0.04, + "learning_rate": 1.9195371053551316e-07, + "loss": 0.1833, + "step": 2122 + }, + { + "epoch": 0.04, + "learning_rate": 1.9194982719117703e-07, + "loss": 0.2504, + "step": 2123 + }, + { + "epoch": 0.04, + "learning_rate": 1.9194594384684088e-07, + "loss": 0.5121, + "step": 2124 + }, + { + "epoch": 0.04, + "learning_rate": 1.9194206050250475e-07, + "loss": 0.4186, + "step": 2125 + }, + { + "epoch": 0.04, + "learning_rate": 1.919381771581686e-07, + "loss": 0.1587, + "step": 2126 + }, + { + "epoch": 0.04, + "learning_rate": 1.9193429381383247e-07, + "loss": 0.1846, + "step": 2127 + }, + { + "epoch": 0.04, + "learning_rate": 1.919304104694963e-07, + "loss": 0.3872, + "step": 2128 + }, + { + "epoch": 0.04, + "learning_rate": 1.9192652712516018e-07, + "loss": 0.2652, + "step": 2129 + }, + { + "epoch": 0.04, + "learning_rate": 1.9192264378082403e-07, + "loss": 0.2256, + "step": 2130 + }, + { + "epoch": 0.04, + "learning_rate": 1.919187604364879e-07, + "loss": 0.2647, + "step": 2131 + }, + { + "epoch": 0.04, + "learning_rate": 1.9191487709215174e-07, + "loss": 0.3497, + "step": 2132 + }, + { + "epoch": 0.04, + "learning_rate": 1.9191099374781562e-07, + "loss": 0.2699, + "step": 2133 + }, + { + "epoch": 0.04, + "learning_rate": 1.9190711040347946e-07, + "loss": 0.2734, + "step": 2134 + }, + { + "epoch": 0.04, + "learning_rate": 1.9190322705914333e-07, + "loss": 0.402, + "step": 2135 + }, + { + "epoch": 0.04, + "learning_rate": 1.9189934371480718e-07, + "loss": 0.1927, + "step": 2136 + }, + { + "epoch": 0.04, + "learning_rate": 1.9189546037047105e-07, + "loss": 0.4533, + "step": 2137 + }, + { + "epoch": 0.04, + "learning_rate": 1.918915770261349e-07, + "loss": 0.2839, + "step": 2138 + }, + { + "epoch": 0.04, + "learning_rate": 1.9188769368179876e-07, + "loss": 0.2361, + "step": 2139 + }, + { + "epoch": 0.04, + "learning_rate": 1.918838103374626e-07, + "loss": 0.2413, + "step": 2140 + }, + { + "epoch": 0.04, + "learning_rate": 1.9187992699312648e-07, + "loss": 0.2814, + "step": 2141 + }, + { + "epoch": 0.04, + "learning_rate": 1.9187604364879033e-07, + "loss": 0.2902, + "step": 2142 + }, + { + "epoch": 0.04, + "learning_rate": 1.918721603044542e-07, + "loss": 0.3612, + "step": 2143 + }, + { + "epoch": 0.04, + "learning_rate": 1.9186827696011804e-07, + "loss": 0.2824, + "step": 2144 + }, + { + "epoch": 0.04, + "learning_rate": 1.9186439361578191e-07, + "loss": 0.3846, + "step": 2145 + }, + { + "epoch": 0.04, + "learning_rate": 1.9186051027144576e-07, + "loss": 0.4492, + "step": 2146 + }, + { + "epoch": 0.04, + "learning_rate": 1.9185662692710963e-07, + "loss": 0.1776, + "step": 2147 + }, + { + "epoch": 0.04, + "learning_rate": 1.9185274358277348e-07, + "loss": 0.2782, + "step": 2148 + }, + { + "epoch": 0.04, + "learning_rate": 1.9184886023843735e-07, + "loss": 0.197, + "step": 2149 + }, + { + "epoch": 0.04, + "learning_rate": 1.918449768941012e-07, + "loss": 0.5334, + "step": 2150 + }, + { + "epoch": 0.04, + "learning_rate": 1.9184109354976506e-07, + "loss": 0.4257, + "step": 2151 + }, + { + "epoch": 0.04, + "learning_rate": 1.918372102054289e-07, + "loss": 0.3681, + "step": 2152 + }, + { + "epoch": 0.04, + "learning_rate": 1.9183332686109278e-07, + "loss": 0.2532, + "step": 2153 + }, + { + "epoch": 0.04, + "learning_rate": 1.9182944351675663e-07, + "loss": 0.2274, + "step": 2154 + }, + { + "epoch": 0.04, + "learning_rate": 1.918255601724205e-07, + "loss": 0.1623, + "step": 2155 + }, + { + "epoch": 0.04, + "learning_rate": 1.9182167682808434e-07, + "loss": 0.319, + "step": 2156 + }, + { + "epoch": 0.04, + "learning_rate": 1.9181779348374821e-07, + "loss": 0.3165, + "step": 2157 + }, + { + "epoch": 0.04, + "learning_rate": 1.9181391013941206e-07, + "loss": 0.2486, + "step": 2158 + }, + { + "epoch": 0.04, + "learning_rate": 1.9181002679507593e-07, + "loss": 0.3074, + "step": 2159 + }, + { + "epoch": 0.04, + "learning_rate": 1.9180614345073977e-07, + "loss": 0.1712, + "step": 2160 + }, + { + "epoch": 0.04, + "learning_rate": 1.9180226010640365e-07, + "loss": 0.1842, + "step": 2161 + }, + { + "epoch": 0.04, + "learning_rate": 1.917983767620675e-07, + "loss": 0.2519, + "step": 2162 + }, + { + "epoch": 0.04, + "learning_rate": 1.9179449341773136e-07, + "loss": 0.2744, + "step": 2163 + }, + { + "epoch": 0.04, + "learning_rate": 1.917906100733952e-07, + "loss": 0.2562, + "step": 2164 + }, + { + "epoch": 0.04, + "learning_rate": 1.9178672672905908e-07, + "loss": 0.2781, + "step": 2165 + }, + { + "epoch": 0.04, + "learning_rate": 1.9178284338472292e-07, + "loss": 0.5022, + "step": 2166 + }, + { + "epoch": 0.04, + "learning_rate": 1.9177896004038677e-07, + "loss": 0.2277, + "step": 2167 + }, + { + "epoch": 0.04, + "learning_rate": 1.9177507669605061e-07, + "loss": 0.1975, + "step": 2168 + }, + { + "epoch": 0.04, + "learning_rate": 1.9177119335171449e-07, + "loss": 0.2463, + "step": 2169 + }, + { + "epoch": 0.04, + "learning_rate": 1.9176731000737833e-07, + "loss": 0.2725, + "step": 2170 + }, + { + "epoch": 0.04, + "learning_rate": 1.917634266630422e-07, + "loss": 0.3911, + "step": 2171 + }, + { + "epoch": 0.04, + "learning_rate": 1.9175954331870605e-07, + "loss": 0.3368, + "step": 2172 + }, + { + "epoch": 0.04, + "learning_rate": 1.9175565997436992e-07, + "loss": 0.2114, + "step": 2173 + }, + { + "epoch": 0.04, + "learning_rate": 1.9175177663003376e-07, + "loss": 0.3391, + "step": 2174 + }, + { + "epoch": 0.04, + "learning_rate": 1.9174789328569764e-07, + "loss": 0.2508, + "step": 2175 + }, + { + "epoch": 0.04, + "learning_rate": 1.9174400994136148e-07, + "loss": 0.378, + "step": 2176 + }, + { + "epoch": 0.04, + "learning_rate": 1.9174012659702535e-07, + "loss": 0.2328, + "step": 2177 + }, + { + "epoch": 0.04, + "learning_rate": 1.917362432526892e-07, + "loss": 0.182, + "step": 2178 + }, + { + "epoch": 0.04, + "learning_rate": 1.9173235990835307e-07, + "loss": 0.2911, + "step": 2179 + }, + { + "epoch": 0.04, + "learning_rate": 1.917284765640169e-07, + "loss": 0.2886, + "step": 2180 + }, + { + "epoch": 0.04, + "learning_rate": 1.9172459321968078e-07, + "loss": 0.4175, + "step": 2181 + }, + { + "epoch": 0.04, + "learning_rate": 1.9172070987534463e-07, + "loss": 0.2664, + "step": 2182 + }, + { + "epoch": 0.04, + "learning_rate": 1.917168265310085e-07, + "loss": 0.3492, + "step": 2183 + }, + { + "epoch": 0.04, + "learning_rate": 1.9171294318667235e-07, + "loss": 0.2306, + "step": 2184 + }, + { + "epoch": 0.04, + "learning_rate": 1.9170905984233622e-07, + "loss": 0.8515, + "step": 2185 + }, + { + "epoch": 0.04, + "learning_rate": 1.9170517649800006e-07, + "loss": 0.3685, + "step": 2186 + }, + { + "epoch": 0.04, + "learning_rate": 1.9170129315366393e-07, + "loss": 0.3298, + "step": 2187 + }, + { + "epoch": 0.04, + "learning_rate": 1.9169740980932778e-07, + "loss": 0.2202, + "step": 2188 + }, + { + "epoch": 0.04, + "learning_rate": 1.9169352646499165e-07, + "loss": 0.2672, + "step": 2189 + }, + { + "epoch": 0.04, + "learning_rate": 1.916896431206555e-07, + "loss": 0.2029, + "step": 2190 + }, + { + "epoch": 0.04, + "learning_rate": 1.9168575977631937e-07, + "loss": 0.1681, + "step": 2191 + }, + { + "epoch": 0.04, + "learning_rate": 1.916818764319832e-07, + "loss": 0.2962, + "step": 2192 + }, + { + "epoch": 0.04, + "learning_rate": 1.9167799308764708e-07, + "loss": 0.3191, + "step": 2193 + }, + { + "epoch": 0.04, + "learning_rate": 1.9167410974331093e-07, + "loss": 0.3428, + "step": 2194 + }, + { + "epoch": 0.04, + "learning_rate": 1.916702263989748e-07, + "loss": 0.4427, + "step": 2195 + }, + { + "epoch": 0.04, + "learning_rate": 1.9166634305463865e-07, + "loss": 0.2371, + "step": 2196 + }, + { + "epoch": 0.04, + "learning_rate": 1.9166245971030252e-07, + "loss": 0.1734, + "step": 2197 + }, + { + "epoch": 0.04, + "learning_rate": 1.9165857636596636e-07, + "loss": 0.1927, + "step": 2198 + }, + { + "epoch": 0.04, + "learning_rate": 1.9165469302163023e-07, + "loss": 0.3398, + "step": 2199 + }, + { + "epoch": 0.04, + "learning_rate": 1.9165080967729408e-07, + "loss": 0.2526, + "step": 2200 + }, + { + "epoch": 0.04, + "learning_rate": 1.9164692633295795e-07, + "loss": 0.1499, + "step": 2201 + }, + { + "epoch": 0.04, + "learning_rate": 1.916430429886218e-07, + "loss": 0.3828, + "step": 2202 + }, + { + "epoch": 0.04, + "learning_rate": 1.9163915964428567e-07, + "loss": 0.3988, + "step": 2203 + }, + { + "epoch": 0.04, + "learning_rate": 1.916352762999495e-07, + "loss": 0.3335, + "step": 2204 + }, + { + "epoch": 0.04, + "learning_rate": 1.9163139295561336e-07, + "loss": 0.2793, + "step": 2205 + }, + { + "epoch": 0.04, + "learning_rate": 1.9162750961127723e-07, + "loss": 0.2283, + "step": 2206 + }, + { + "epoch": 0.04, + "learning_rate": 1.9162362626694107e-07, + "loss": 0.2019, + "step": 2207 + }, + { + "epoch": 0.04, + "learning_rate": 1.9161974292260494e-07, + "loss": 0.2062, + "step": 2208 + }, + { + "epoch": 0.04, + "learning_rate": 1.916158595782688e-07, + "loss": 0.2914, + "step": 2209 + }, + { + "epoch": 0.04, + "learning_rate": 1.9161197623393266e-07, + "loss": 0.4644, + "step": 2210 + }, + { + "epoch": 0.04, + "learning_rate": 1.916080928895965e-07, + "loss": 0.2536, + "step": 2211 + }, + { + "epoch": 0.04, + "learning_rate": 1.9160420954526038e-07, + "loss": 0.2317, + "step": 2212 + }, + { + "epoch": 0.04, + "learning_rate": 1.9160032620092422e-07, + "loss": 0.2282, + "step": 2213 + }, + { + "epoch": 0.04, + "learning_rate": 1.915964428565881e-07, + "loss": 0.1992, + "step": 2214 + }, + { + "epoch": 0.04, + "learning_rate": 1.9159255951225194e-07, + "loss": 0.2032, + "step": 2215 + }, + { + "epoch": 0.04, + "learning_rate": 1.915886761679158e-07, + "loss": 0.2047, + "step": 2216 + }, + { + "epoch": 0.04, + "learning_rate": 1.9158479282357965e-07, + "loss": 0.159, + "step": 2217 + }, + { + "epoch": 0.04, + "learning_rate": 1.9158090947924353e-07, + "loss": 0.5209, + "step": 2218 + }, + { + "epoch": 0.04, + "learning_rate": 1.9157702613490737e-07, + "loss": 0.2439, + "step": 2219 + }, + { + "epoch": 0.04, + "learning_rate": 1.9157314279057124e-07, + "loss": 0.2339, + "step": 2220 + }, + { + "epoch": 0.04, + "learning_rate": 1.915692594462351e-07, + "loss": 0.2727, + "step": 2221 + }, + { + "epoch": 0.04, + "learning_rate": 1.9156537610189896e-07, + "loss": 0.1674, + "step": 2222 + }, + { + "epoch": 0.04, + "learning_rate": 1.915614927575628e-07, + "loss": 0.2353, + "step": 2223 + }, + { + "epoch": 0.04, + "learning_rate": 1.9155760941322668e-07, + "loss": 0.2964, + "step": 2224 + }, + { + "epoch": 0.04, + "learning_rate": 1.9155372606889052e-07, + "loss": 0.5196, + "step": 2225 + }, + { + "epoch": 0.04, + "learning_rate": 1.9154984272455437e-07, + "loss": 0.1842, + "step": 2226 + }, + { + "epoch": 0.04, + "learning_rate": 1.9154595938021824e-07, + "loss": 0.2809, + "step": 2227 + }, + { + "epoch": 0.04, + "learning_rate": 1.9154207603588208e-07, + "loss": 0.1912, + "step": 2228 + }, + { + "epoch": 0.04, + "learning_rate": 1.9153819269154595e-07, + "loss": 0.322, + "step": 2229 + }, + { + "epoch": 0.04, + "learning_rate": 1.915343093472098e-07, + "loss": 0.2779, + "step": 2230 + }, + { + "epoch": 0.04, + "learning_rate": 1.9153042600287367e-07, + "loss": 0.2983, + "step": 2231 + }, + { + "epoch": 0.04, + "learning_rate": 1.9152654265853752e-07, + "loss": 0.2722, + "step": 2232 + }, + { + "epoch": 0.04, + "learning_rate": 1.9152265931420136e-07, + "loss": 0.3027, + "step": 2233 + }, + { + "epoch": 0.04, + "learning_rate": 1.9151877596986523e-07, + "loss": 0.3169, + "step": 2234 + }, + { + "epoch": 0.04, + "learning_rate": 1.9151489262552908e-07, + "loss": 0.2037, + "step": 2235 + }, + { + "epoch": 0.04, + "learning_rate": 1.9151100928119295e-07, + "loss": 0.5432, + "step": 2236 + }, + { + "epoch": 0.04, + "learning_rate": 1.915071259368568e-07, + "loss": 0.2507, + "step": 2237 + }, + { + "epoch": 0.04, + "learning_rate": 1.9150324259252066e-07, + "loss": 0.2115, + "step": 2238 + }, + { + "epoch": 0.04, + "learning_rate": 1.914993592481845e-07, + "loss": 0.1781, + "step": 2239 + }, + { + "epoch": 0.04, + "learning_rate": 1.9149547590384838e-07, + "loss": 0.5975, + "step": 2240 + }, + { + "epoch": 0.04, + "learning_rate": 1.9149159255951223e-07, + "loss": 0.1992, + "step": 2241 + }, + { + "epoch": 0.04, + "learning_rate": 1.914877092151761e-07, + "loss": 0.2578, + "step": 2242 + }, + { + "epoch": 0.04, + "learning_rate": 1.9148382587083994e-07, + "loss": 0.1614, + "step": 2243 + }, + { + "epoch": 0.04, + "learning_rate": 1.9147994252650381e-07, + "loss": 0.2966, + "step": 2244 + }, + { + "epoch": 0.04, + "learning_rate": 1.9147605918216766e-07, + "loss": 0.3627, + "step": 2245 + }, + { + "epoch": 0.04, + "learning_rate": 1.9147217583783153e-07, + "loss": 0.3442, + "step": 2246 + }, + { + "epoch": 0.04, + "learning_rate": 1.9146829249349538e-07, + "loss": 0.2578, + "step": 2247 + }, + { + "epoch": 0.04, + "learning_rate": 1.9146440914915925e-07, + "loss": 0.3627, + "step": 2248 + }, + { + "epoch": 0.04, + "learning_rate": 1.914605258048231e-07, + "loss": 0.2467, + "step": 2249 + }, + { + "epoch": 0.04, + "learning_rate": 1.9145664246048696e-07, + "loss": 0.2069, + "step": 2250 + }, + { + "epoch": 0.04, + "learning_rate": 1.914527591161508e-07, + "loss": 0.4171, + "step": 2251 + }, + { + "epoch": 0.04, + "learning_rate": 1.9144887577181468e-07, + "loss": 0.2227, + "step": 2252 + }, + { + "epoch": 0.04, + "learning_rate": 1.9144499242747853e-07, + "loss": 0.3698, + "step": 2253 + }, + { + "epoch": 0.04, + "learning_rate": 1.914411090831424e-07, + "loss": 0.1696, + "step": 2254 + }, + { + "epoch": 0.04, + "learning_rate": 1.9143722573880624e-07, + "loss": 0.27, + "step": 2255 + }, + { + "epoch": 0.04, + "learning_rate": 1.9143334239447011e-07, + "loss": 0.2843, + "step": 2256 + }, + { + "epoch": 0.04, + "learning_rate": 1.9142945905013396e-07, + "loss": 0.1574, + "step": 2257 + }, + { + "epoch": 0.04, + "learning_rate": 1.9142557570579783e-07, + "loss": 0.3496, + "step": 2258 + }, + { + "epoch": 0.04, + "learning_rate": 1.9142169236146167e-07, + "loss": 0.2006, + "step": 2259 + }, + { + "epoch": 0.04, + "learning_rate": 1.9141780901712555e-07, + "loss": 0.1498, + "step": 2260 + }, + { + "epoch": 0.04, + "learning_rate": 1.914139256727894e-07, + "loss": 0.1976, + "step": 2261 + }, + { + "epoch": 0.04, + "learning_rate": 1.9141004232845326e-07, + "loss": 0.155, + "step": 2262 + }, + { + "epoch": 0.04, + "learning_rate": 1.914061589841171e-07, + "loss": 0.2906, + "step": 2263 + }, + { + "epoch": 0.04, + "learning_rate": 1.9140227563978098e-07, + "loss": 0.3436, + "step": 2264 + }, + { + "epoch": 0.04, + "learning_rate": 1.9139839229544482e-07, + "loss": 0.2845, + "step": 2265 + }, + { + "epoch": 0.04, + "learning_rate": 1.913945089511087e-07, + "loss": 0.2754, + "step": 2266 + }, + { + "epoch": 0.04, + "learning_rate": 1.9139062560677254e-07, + "loss": 0.187, + "step": 2267 + }, + { + "epoch": 0.04, + "learning_rate": 1.913867422624364e-07, + "loss": 0.2042, + "step": 2268 + }, + { + "epoch": 0.04, + "learning_rate": 1.9138285891810026e-07, + "loss": 0.44, + "step": 2269 + }, + { + "epoch": 0.04, + "learning_rate": 1.9137897557376413e-07, + "loss": 0.1663, + "step": 2270 + }, + { + "epoch": 0.04, + "learning_rate": 1.9137509222942797e-07, + "loss": 0.2594, + "step": 2271 + }, + { + "epoch": 0.04, + "learning_rate": 1.9137120888509185e-07, + "loss": 0.1794, + "step": 2272 + }, + { + "epoch": 0.04, + "learning_rate": 1.913673255407557e-07, + "loss": 0.2559, + "step": 2273 + }, + { + "epoch": 0.04, + "learning_rate": 1.9136344219641956e-07, + "loss": 0.1763, + "step": 2274 + }, + { + "epoch": 0.04, + "learning_rate": 1.913595588520834e-07, + "loss": 0.2008, + "step": 2275 + }, + { + "epoch": 0.04, + "learning_rate": 1.9135567550774728e-07, + "loss": 0.1704, + "step": 2276 + }, + { + "epoch": 0.04, + "learning_rate": 1.9135179216341112e-07, + "loss": 0.2927, + "step": 2277 + }, + { + "epoch": 0.04, + "learning_rate": 1.91347908819075e-07, + "loss": 0.2074, + "step": 2278 + }, + { + "epoch": 0.04, + "learning_rate": 1.9134402547473884e-07, + "loss": 0.2989, + "step": 2279 + }, + { + "epoch": 0.04, + "learning_rate": 1.913401421304027e-07, + "loss": 0.2197, + "step": 2280 + }, + { + "epoch": 0.04, + "learning_rate": 1.9133625878606656e-07, + "loss": 0.257, + "step": 2281 + }, + { + "epoch": 0.04, + "learning_rate": 1.9133237544173043e-07, + "loss": 0.2169, + "step": 2282 + }, + { + "epoch": 0.04, + "learning_rate": 1.9132849209739425e-07, + "loss": 0.2873, + "step": 2283 + }, + { + "epoch": 0.04, + "learning_rate": 1.9132460875305812e-07, + "loss": 0.3402, + "step": 2284 + }, + { + "epoch": 0.04, + "learning_rate": 1.9132072540872196e-07, + "loss": 0.548, + "step": 2285 + }, + { + "epoch": 0.04, + "learning_rate": 1.9131684206438583e-07, + "loss": 0.1624, + "step": 2286 + }, + { + "epoch": 0.04, + "learning_rate": 1.9131295872004968e-07, + "loss": 0.2218, + "step": 2287 + }, + { + "epoch": 0.04, + "learning_rate": 1.9130907537571355e-07, + "loss": 0.2516, + "step": 2288 + }, + { + "epoch": 0.04, + "learning_rate": 1.913051920313774e-07, + "loss": 0.3256, + "step": 2289 + }, + { + "epoch": 0.04, + "learning_rate": 1.9130130868704127e-07, + "loss": 0.1706, + "step": 2290 + }, + { + "epoch": 0.04, + "learning_rate": 1.912974253427051e-07, + "loss": 0.3039, + "step": 2291 + }, + { + "epoch": 0.04, + "learning_rate": 1.9129354199836898e-07, + "loss": 0.1612, + "step": 2292 + }, + { + "epoch": 0.04, + "learning_rate": 1.9128965865403283e-07, + "loss": 0.2315, + "step": 2293 + }, + { + "epoch": 0.04, + "learning_rate": 1.912857753096967e-07, + "loss": 0.2006, + "step": 2294 + }, + { + "epoch": 0.04, + "learning_rate": 1.9128189196536055e-07, + "loss": 0.1686, + "step": 2295 + }, + { + "epoch": 0.04, + "learning_rate": 1.9127800862102442e-07, + "loss": 0.368, + "step": 2296 + }, + { + "epoch": 0.04, + "learning_rate": 1.9127412527668826e-07, + "loss": 0.2219, + "step": 2297 + }, + { + "epoch": 0.04, + "learning_rate": 1.9127024193235213e-07, + "loss": 0.1682, + "step": 2298 + }, + { + "epoch": 0.04, + "learning_rate": 1.9126635858801598e-07, + "loss": 0.462, + "step": 2299 + }, + { + "epoch": 0.04, + "learning_rate": 1.9126247524367985e-07, + "loss": 0.2024, + "step": 2300 + }, + { + "epoch": 0.04, + "learning_rate": 1.912585918993437e-07, + "loss": 0.2592, + "step": 2301 + }, + { + "epoch": 0.04, + "learning_rate": 1.9125470855500757e-07, + "loss": 0.1733, + "step": 2302 + }, + { + "epoch": 0.04, + "learning_rate": 1.912508252106714e-07, + "loss": 0.3561, + "step": 2303 + }, + { + "epoch": 0.04, + "learning_rate": 1.9124694186633528e-07, + "loss": 0.2009, + "step": 2304 + }, + { + "epoch": 0.04, + "learning_rate": 1.9124305852199913e-07, + "loss": 0.2299, + "step": 2305 + }, + { + "epoch": 0.04, + "learning_rate": 1.91239175177663e-07, + "loss": 0.2888, + "step": 2306 + }, + { + "epoch": 0.04, + "learning_rate": 1.9123529183332684e-07, + "loss": 0.3529, + "step": 2307 + }, + { + "epoch": 0.04, + "learning_rate": 1.9123140848899072e-07, + "loss": 0.3019, + "step": 2308 + }, + { + "epoch": 0.04, + "learning_rate": 1.9122752514465456e-07, + "loss": 0.4809, + "step": 2309 + }, + { + "epoch": 0.04, + "learning_rate": 1.9122364180031843e-07, + "loss": 0.1778, + "step": 2310 + }, + { + "epoch": 0.04, + "learning_rate": 1.9121975845598228e-07, + "loss": 0.2203, + "step": 2311 + }, + { + "epoch": 0.04, + "learning_rate": 1.9121587511164615e-07, + "loss": 0.2867, + "step": 2312 + }, + { + "epoch": 0.04, + "learning_rate": 1.9121199176731e-07, + "loss": 0.2744, + "step": 2313 + }, + { + "epoch": 0.04, + "learning_rate": 1.9120810842297386e-07, + "loss": 0.1608, + "step": 2314 + }, + { + "epoch": 0.04, + "learning_rate": 1.912042250786377e-07, + "loss": 0.2975, + "step": 2315 + }, + { + "epoch": 0.04, + "learning_rate": 1.9120034173430158e-07, + "loss": 0.189, + "step": 2316 + }, + { + "epoch": 0.04, + "learning_rate": 1.9119645838996543e-07, + "loss": 0.3539, + "step": 2317 + }, + { + "epoch": 0.04, + "learning_rate": 1.911925750456293e-07, + "loss": 0.2595, + "step": 2318 + }, + { + "epoch": 0.04, + "learning_rate": 1.9118869170129314e-07, + "loss": 0.3809, + "step": 2319 + }, + { + "epoch": 0.05, + "learning_rate": 1.9118480835695701e-07, + "loss": 0.4166, + "step": 2320 + }, + { + "epoch": 0.05, + "learning_rate": 1.9118092501262086e-07, + "loss": 0.3286, + "step": 2321 + }, + { + "epoch": 0.05, + "learning_rate": 1.9117704166828473e-07, + "loss": 0.3565, + "step": 2322 + }, + { + "epoch": 0.05, + "learning_rate": 1.9117315832394858e-07, + "loss": 0.3996, + "step": 2323 + }, + { + "epoch": 0.05, + "learning_rate": 1.9116927497961245e-07, + "loss": 0.2639, + "step": 2324 + }, + { + "epoch": 0.05, + "learning_rate": 1.911653916352763e-07, + "loss": 0.1578, + "step": 2325 + }, + { + "epoch": 0.05, + "learning_rate": 1.9116150829094016e-07, + "loss": 0.314, + "step": 2326 + }, + { + "epoch": 0.05, + "learning_rate": 1.91157624946604e-07, + "loss": 0.2412, + "step": 2327 + }, + { + "epoch": 0.05, + "learning_rate": 1.9115374160226788e-07, + "loss": 0.2372, + "step": 2328 + }, + { + "epoch": 0.05, + "learning_rate": 1.9114985825793173e-07, + "loss": 0.1408, + "step": 2329 + }, + { + "epoch": 0.05, + "learning_rate": 1.911459749135956e-07, + "loss": 0.2258, + "step": 2330 + }, + { + "epoch": 0.05, + "learning_rate": 1.9114209156925944e-07, + "loss": 0.352, + "step": 2331 + }, + { + "epoch": 0.05, + "learning_rate": 1.9113820822492331e-07, + "loss": 0.3683, + "step": 2332 + }, + { + "epoch": 0.05, + "learning_rate": 1.9113432488058716e-07, + "loss": 0.1615, + "step": 2333 + }, + { + "epoch": 0.05, + "learning_rate": 1.9113044153625103e-07, + "loss": 0.2111, + "step": 2334 + }, + { + "epoch": 0.05, + "learning_rate": 1.9112655819191487e-07, + "loss": 0.5346, + "step": 2335 + }, + { + "epoch": 0.05, + "learning_rate": 1.9112267484757875e-07, + "loss": 0.4643, + "step": 2336 + }, + { + "epoch": 0.05, + "learning_rate": 1.911187915032426e-07, + "loss": 0.2474, + "step": 2337 + }, + { + "epoch": 0.05, + "learning_rate": 1.9111490815890646e-07, + "loss": 0.2657, + "step": 2338 + }, + { + "epoch": 0.05, + "learning_rate": 1.911110248145703e-07, + "loss": 0.2998, + "step": 2339 + }, + { + "epoch": 0.05, + "learning_rate": 1.9110714147023418e-07, + "loss": 0.3054, + "step": 2340 + }, + { + "epoch": 0.05, + "learning_rate": 1.91103258125898e-07, + "loss": 0.1431, + "step": 2341 + }, + { + "epoch": 0.05, + "learning_rate": 1.9109937478156187e-07, + "loss": 0.4043, + "step": 2342 + }, + { + "epoch": 0.05, + "learning_rate": 1.9109549143722571e-07, + "loss": 0.1776, + "step": 2343 + }, + { + "epoch": 0.05, + "learning_rate": 1.9109160809288959e-07, + "loss": 0.4256, + "step": 2344 + }, + { + "epoch": 0.05, + "learning_rate": 1.9108772474855343e-07, + "loss": 0.1989, + "step": 2345 + }, + { + "epoch": 0.05, + "learning_rate": 1.910838414042173e-07, + "loss": 0.2438, + "step": 2346 + }, + { + "epoch": 0.05, + "learning_rate": 1.9107995805988115e-07, + "loss": 0.2251, + "step": 2347 + }, + { + "epoch": 0.05, + "learning_rate": 1.9107607471554502e-07, + "loss": 0.2826, + "step": 2348 + }, + { + "epoch": 0.05, + "learning_rate": 1.9107219137120886e-07, + "loss": 0.1986, + "step": 2349 + }, + { + "epoch": 0.05, + "learning_rate": 1.9106830802687274e-07, + "loss": 0.2022, + "step": 2350 + }, + { + "epoch": 0.05, + "learning_rate": 1.9106442468253658e-07, + "loss": 0.2554, + "step": 2351 + }, + { + "epoch": 0.05, + "learning_rate": 1.9106054133820045e-07, + "loss": 0.2963, + "step": 2352 + }, + { + "epoch": 0.05, + "learning_rate": 1.910566579938643e-07, + "loss": 0.2262, + "step": 2353 + }, + { + "epoch": 0.05, + "learning_rate": 1.9105277464952817e-07, + "loss": 0.2764, + "step": 2354 + }, + { + "epoch": 0.05, + "learning_rate": 1.9104889130519201e-07, + "loss": 0.4382, + "step": 2355 + }, + { + "epoch": 0.05, + "learning_rate": 1.9104500796085588e-07, + "loss": 0.2115, + "step": 2356 + }, + { + "epoch": 0.05, + "learning_rate": 1.9104112461651973e-07, + "loss": 0.1676, + "step": 2357 + }, + { + "epoch": 0.05, + "learning_rate": 1.910372412721836e-07, + "loss": 0.1393, + "step": 2358 + }, + { + "epoch": 0.05, + "learning_rate": 1.9103335792784745e-07, + "loss": 0.225, + "step": 2359 + }, + { + "epoch": 0.05, + "learning_rate": 1.9102947458351132e-07, + "loss": 0.2223, + "step": 2360 + }, + { + "epoch": 0.05, + "learning_rate": 1.9102559123917516e-07, + "loss": 0.3581, + "step": 2361 + }, + { + "epoch": 0.05, + "learning_rate": 1.9102170789483903e-07, + "loss": 0.2221, + "step": 2362 + }, + { + "epoch": 0.05, + "learning_rate": 1.9101782455050288e-07, + "loss": 0.3571, + "step": 2363 + }, + { + "epoch": 0.05, + "learning_rate": 1.9101394120616675e-07, + "loss": 0.6683, + "step": 2364 + }, + { + "epoch": 0.05, + "learning_rate": 1.910100578618306e-07, + "loss": 0.4576, + "step": 2365 + }, + { + "epoch": 0.05, + "learning_rate": 1.9100617451749447e-07, + "loss": 0.3772, + "step": 2366 + }, + { + "epoch": 0.05, + "learning_rate": 1.910022911731583e-07, + "loss": 0.2739, + "step": 2367 + }, + { + "epoch": 0.05, + "learning_rate": 1.9099840782882218e-07, + "loss": 0.1272, + "step": 2368 + }, + { + "epoch": 0.05, + "learning_rate": 1.9099452448448603e-07, + "loss": 0.3451, + "step": 2369 + }, + { + "epoch": 0.05, + "learning_rate": 1.909906411401499e-07, + "loss": 0.2573, + "step": 2370 + }, + { + "epoch": 0.05, + "learning_rate": 1.9098675779581375e-07, + "loss": 0.1512, + "step": 2371 + }, + { + "epoch": 0.05, + "learning_rate": 1.9098287445147762e-07, + "loss": 0.1769, + "step": 2372 + }, + { + "epoch": 0.05, + "learning_rate": 1.9097899110714146e-07, + "loss": 0.2661, + "step": 2373 + }, + { + "epoch": 0.05, + "learning_rate": 1.9097510776280533e-07, + "loss": 0.2558, + "step": 2374 + }, + { + "epoch": 0.05, + "learning_rate": 1.9097122441846918e-07, + "loss": 0.1559, + "step": 2375 + }, + { + "epoch": 0.05, + "learning_rate": 1.9096734107413305e-07, + "loss": 0.3787, + "step": 2376 + }, + { + "epoch": 0.05, + "learning_rate": 1.909634577297969e-07, + "loss": 0.3078, + "step": 2377 + }, + { + "epoch": 0.05, + "learning_rate": 1.9095957438546077e-07, + "loss": 0.2799, + "step": 2378 + }, + { + "epoch": 0.05, + "learning_rate": 1.909556910411246e-07, + "loss": 0.3198, + "step": 2379 + }, + { + "epoch": 0.05, + "learning_rate": 1.9095180769678848e-07, + "loss": 0.2504, + "step": 2380 + }, + { + "epoch": 0.05, + "learning_rate": 1.9094792435245233e-07, + "loss": 0.2065, + "step": 2381 + }, + { + "epoch": 0.05, + "learning_rate": 1.9094404100811617e-07, + "loss": 0.4014, + "step": 2382 + }, + { + "epoch": 0.05, + "learning_rate": 1.9094015766378004e-07, + "loss": 0.3588, + "step": 2383 + }, + { + "epoch": 0.05, + "learning_rate": 1.909362743194439e-07, + "loss": 0.1405, + "step": 2384 + }, + { + "epoch": 0.05, + "learning_rate": 1.9093239097510776e-07, + "loss": 0.2483, + "step": 2385 + }, + { + "epoch": 0.05, + "learning_rate": 1.909285076307716e-07, + "loss": 0.415, + "step": 2386 + }, + { + "epoch": 0.05, + "learning_rate": 1.9092462428643548e-07, + "loss": 0.1872, + "step": 2387 + }, + { + "epoch": 0.05, + "learning_rate": 1.9092074094209932e-07, + "loss": 0.3174, + "step": 2388 + }, + { + "epoch": 0.05, + "learning_rate": 1.909168575977632e-07, + "loss": 0.1888, + "step": 2389 + }, + { + "epoch": 0.05, + "learning_rate": 1.9091297425342704e-07, + "loss": 0.3509, + "step": 2390 + }, + { + "epoch": 0.05, + "learning_rate": 1.909090909090909e-07, + "loss": 0.1428, + "step": 2391 + }, + { + "epoch": 0.05, + "learning_rate": 1.9090520756475476e-07, + "loss": 0.1967, + "step": 2392 + }, + { + "epoch": 0.05, + "learning_rate": 1.9090132422041863e-07, + "loss": 0.1942, + "step": 2393 + }, + { + "epoch": 0.05, + "learning_rate": 1.9089744087608247e-07, + "loss": 0.1163, + "step": 2394 + }, + { + "epoch": 0.05, + "learning_rate": 1.9089355753174634e-07, + "loss": 0.2068, + "step": 2395 + }, + { + "epoch": 0.05, + "learning_rate": 1.908896741874102e-07, + "loss": 0.3142, + "step": 2396 + }, + { + "epoch": 0.05, + "learning_rate": 1.9088579084307406e-07, + "loss": 0.1664, + "step": 2397 + }, + { + "epoch": 0.05, + "learning_rate": 1.908819074987379e-07, + "loss": 0.1995, + "step": 2398 + }, + { + "epoch": 0.05, + "learning_rate": 1.9087802415440175e-07, + "loss": 0.2065, + "step": 2399 + }, + { + "epoch": 0.05, + "learning_rate": 1.9087414081006562e-07, + "loss": 0.1884, + "step": 2400 + }, + { + "epoch": 0.05, + "learning_rate": 1.9087025746572947e-07, + "loss": 0.2002, + "step": 2401 + }, + { + "epoch": 0.05, + "learning_rate": 1.9086637412139334e-07, + "loss": 0.1856, + "step": 2402 + }, + { + "epoch": 0.05, + "learning_rate": 1.9086249077705718e-07, + "loss": 0.2214, + "step": 2403 + }, + { + "epoch": 0.05, + "learning_rate": 1.9085860743272105e-07, + "loss": 0.287, + "step": 2404 + }, + { + "epoch": 0.05, + "learning_rate": 1.908547240883849e-07, + "loss": 0.1896, + "step": 2405 + }, + { + "epoch": 0.05, + "learning_rate": 1.9085084074404877e-07, + "loss": 0.3342, + "step": 2406 + }, + { + "epoch": 0.05, + "learning_rate": 1.9084695739971262e-07, + "loss": 0.2604, + "step": 2407 + }, + { + "epoch": 0.05, + "learning_rate": 1.908430740553765e-07, + "loss": 0.2315, + "step": 2408 + }, + { + "epoch": 0.05, + "learning_rate": 1.9083919071104033e-07, + "loss": 0.4611, + "step": 2409 + }, + { + "epoch": 0.05, + "learning_rate": 1.9083530736670418e-07, + "loss": 0.3604, + "step": 2410 + }, + { + "epoch": 0.05, + "learning_rate": 1.9083142402236805e-07, + "loss": 0.2759, + "step": 2411 + }, + { + "epoch": 0.05, + "learning_rate": 1.908275406780319e-07, + "loss": 0.289, + "step": 2412 + }, + { + "epoch": 0.05, + "learning_rate": 1.9082365733369576e-07, + "loss": 0.4046, + "step": 2413 + }, + { + "epoch": 0.05, + "learning_rate": 1.908197739893596e-07, + "loss": 0.2203, + "step": 2414 + }, + { + "epoch": 0.05, + "learning_rate": 1.9081589064502348e-07, + "loss": 0.3456, + "step": 2415 + }, + { + "epoch": 0.05, + "learning_rate": 1.9081200730068733e-07, + "loss": 0.1729, + "step": 2416 + }, + { + "epoch": 0.05, + "learning_rate": 1.908081239563512e-07, + "loss": 0.3744, + "step": 2417 + }, + { + "epoch": 0.05, + "learning_rate": 1.9080424061201504e-07, + "loss": 0.2528, + "step": 2418 + }, + { + "epoch": 0.05, + "learning_rate": 1.9080035726767891e-07, + "loss": 0.1425, + "step": 2419 + }, + { + "epoch": 0.05, + "learning_rate": 1.9079647392334276e-07, + "loss": 0.3701, + "step": 2420 + }, + { + "epoch": 0.05, + "learning_rate": 1.9079259057900663e-07, + "loss": 0.2337, + "step": 2421 + }, + { + "epoch": 0.05, + "learning_rate": 1.9078870723467048e-07, + "loss": 0.1394, + "step": 2422 + }, + { + "epoch": 0.05, + "learning_rate": 1.9078482389033435e-07, + "loss": 0.3445, + "step": 2423 + }, + { + "epoch": 0.05, + "learning_rate": 1.907809405459982e-07, + "loss": 0.2567, + "step": 2424 + }, + { + "epoch": 0.05, + "learning_rate": 1.9077705720166206e-07, + "loss": 0.1419, + "step": 2425 + }, + { + "epoch": 0.05, + "learning_rate": 1.907731738573259e-07, + "loss": 0.2003, + "step": 2426 + }, + { + "epoch": 0.05, + "learning_rate": 1.9076929051298978e-07, + "loss": 0.2664, + "step": 2427 + }, + { + "epoch": 0.05, + "learning_rate": 1.9076540716865363e-07, + "loss": 0.2637, + "step": 2428 + }, + { + "epoch": 0.05, + "learning_rate": 1.907615238243175e-07, + "loss": 0.1255, + "step": 2429 + }, + { + "epoch": 0.05, + "learning_rate": 1.9075764047998134e-07, + "loss": 0.3851, + "step": 2430 + }, + { + "epoch": 0.05, + "learning_rate": 1.9075375713564521e-07, + "loss": 0.1555, + "step": 2431 + }, + { + "epoch": 0.05, + "learning_rate": 1.9074987379130906e-07, + "loss": 0.2373, + "step": 2432 + }, + { + "epoch": 0.05, + "learning_rate": 1.9074599044697293e-07, + "loss": 0.3298, + "step": 2433 + }, + { + "epoch": 0.05, + "learning_rate": 1.9074210710263677e-07, + "loss": 0.2117, + "step": 2434 + }, + { + "epoch": 0.05, + "learning_rate": 1.9073822375830065e-07, + "loss": 0.3456, + "step": 2435 + }, + { + "epoch": 0.05, + "learning_rate": 1.907343404139645e-07, + "loss": 0.2137, + "step": 2436 + }, + { + "epoch": 0.05, + "learning_rate": 1.9073045706962836e-07, + "loss": 0.1209, + "step": 2437 + }, + { + "epoch": 0.05, + "learning_rate": 1.907265737252922e-07, + "loss": 0.1882, + "step": 2438 + }, + { + "epoch": 0.05, + "learning_rate": 1.9072269038095608e-07, + "loss": 0.1786, + "step": 2439 + }, + { + "epoch": 0.05, + "learning_rate": 1.9071880703661992e-07, + "loss": 0.3191, + "step": 2440 + }, + { + "epoch": 0.05, + "learning_rate": 1.907149236922838e-07, + "loss": 0.2005, + "step": 2441 + }, + { + "epoch": 0.05, + "learning_rate": 1.9071104034794764e-07, + "loss": 0.2364, + "step": 2442 + }, + { + "epoch": 0.05, + "learning_rate": 1.907071570036115e-07, + "loss": 0.3457, + "step": 2443 + }, + { + "epoch": 0.05, + "learning_rate": 1.9070327365927536e-07, + "loss": 0.4505, + "step": 2444 + }, + { + "epoch": 0.05, + "learning_rate": 1.9069939031493923e-07, + "loss": 0.2651, + "step": 2445 + }, + { + "epoch": 0.05, + "learning_rate": 1.9069550697060307e-07, + "loss": 0.1697, + "step": 2446 + }, + { + "epoch": 0.05, + "learning_rate": 1.9069162362626695e-07, + "loss": 0.1255, + "step": 2447 + }, + { + "epoch": 0.05, + "learning_rate": 1.906877402819308e-07, + "loss": 0.1559, + "step": 2448 + }, + { + "epoch": 0.05, + "learning_rate": 1.9068385693759466e-07, + "loss": 0.6893, + "step": 2449 + }, + { + "epoch": 0.05, + "learning_rate": 1.906799735932585e-07, + "loss": 0.2785, + "step": 2450 + }, + { + "epoch": 0.05, + "learning_rate": 1.9067609024892238e-07, + "loss": 0.3125, + "step": 2451 + }, + { + "epoch": 0.05, + "learning_rate": 1.9067220690458622e-07, + "loss": 0.1261, + "step": 2452 + }, + { + "epoch": 0.05, + "learning_rate": 1.906683235602501e-07, + "loss": 0.2379, + "step": 2453 + }, + { + "epoch": 0.05, + "learning_rate": 1.9066444021591394e-07, + "loss": 0.2362, + "step": 2454 + }, + { + "epoch": 0.05, + "learning_rate": 1.906605568715778e-07, + "loss": 0.1936, + "step": 2455 + }, + { + "epoch": 0.05, + "learning_rate": 1.9065667352724166e-07, + "loss": 0.1631, + "step": 2456 + }, + { + "epoch": 0.05, + "learning_rate": 1.906527901829055e-07, + "loss": 0.188, + "step": 2457 + }, + { + "epoch": 0.05, + "learning_rate": 1.9064890683856935e-07, + "loss": 0.3968, + "step": 2458 + }, + { + "epoch": 0.05, + "learning_rate": 1.9064502349423322e-07, + "loss": 0.1181, + "step": 2459 + }, + { + "epoch": 0.05, + "learning_rate": 1.9064114014989706e-07, + "loss": 0.2192, + "step": 2460 + }, + { + "epoch": 0.05, + "learning_rate": 1.9063725680556093e-07, + "loss": 0.2684, + "step": 2461 + }, + { + "epoch": 0.05, + "learning_rate": 1.9063337346122478e-07, + "loss": 0.3971, + "step": 2462 + }, + { + "epoch": 0.05, + "learning_rate": 1.9062949011688865e-07, + "loss": 0.214, + "step": 2463 + }, + { + "epoch": 0.05, + "learning_rate": 1.906256067725525e-07, + "loss": 0.1586, + "step": 2464 + }, + { + "epoch": 0.05, + "learning_rate": 1.9062172342821637e-07, + "loss": 0.3444, + "step": 2465 + }, + { + "epoch": 0.05, + "learning_rate": 1.906178400838802e-07, + "loss": 0.1959, + "step": 2466 + }, + { + "epoch": 0.05, + "learning_rate": 1.9061395673954408e-07, + "loss": 0.4102, + "step": 2467 + }, + { + "epoch": 0.05, + "learning_rate": 1.9061007339520793e-07, + "loss": 0.2105, + "step": 2468 + }, + { + "epoch": 0.05, + "learning_rate": 1.906061900508718e-07, + "loss": 0.6629, + "step": 2469 + }, + { + "epoch": 0.05, + "learning_rate": 1.9060230670653565e-07, + "loss": 0.1177, + "step": 2470 + }, + { + "epoch": 0.05, + "learning_rate": 1.9059842336219952e-07, + "loss": 0.1598, + "step": 2471 + }, + { + "epoch": 0.05, + "learning_rate": 1.9059454001786336e-07, + "loss": 0.1655, + "step": 2472 + }, + { + "epoch": 0.05, + "learning_rate": 1.9059065667352723e-07, + "loss": 0.322, + "step": 2473 + }, + { + "epoch": 0.05, + "learning_rate": 1.9058677332919108e-07, + "loss": 0.2725, + "step": 2474 + }, + { + "epoch": 0.05, + "learning_rate": 1.9058288998485495e-07, + "loss": 0.2149, + "step": 2475 + }, + { + "epoch": 0.05, + "learning_rate": 1.905790066405188e-07, + "loss": 0.1387, + "step": 2476 + }, + { + "epoch": 0.05, + "learning_rate": 1.9057512329618267e-07, + "loss": 0.1486, + "step": 2477 + }, + { + "epoch": 0.05, + "learning_rate": 1.905712399518465e-07, + "loss": 0.1384, + "step": 2478 + }, + { + "epoch": 0.05, + "learning_rate": 1.9056735660751038e-07, + "loss": 0.2245, + "step": 2479 + }, + { + "epoch": 0.05, + "learning_rate": 1.9056347326317423e-07, + "loss": 0.1956, + "step": 2480 + }, + { + "epoch": 0.05, + "learning_rate": 1.905595899188381e-07, + "loss": 0.1646, + "step": 2481 + }, + { + "epoch": 0.05, + "learning_rate": 1.9055570657450194e-07, + "loss": 0.2318, + "step": 2482 + }, + { + "epoch": 0.05, + "learning_rate": 1.9055182323016582e-07, + "loss": 0.4493, + "step": 2483 + }, + { + "epoch": 0.05, + "learning_rate": 1.9054793988582966e-07, + "loss": 0.2622, + "step": 2484 + }, + { + "epoch": 0.05, + "learning_rate": 1.9054405654149353e-07, + "loss": 0.372, + "step": 2485 + }, + { + "epoch": 0.05, + "learning_rate": 1.9054017319715738e-07, + "loss": 0.1582, + "step": 2486 + }, + { + "epoch": 0.05, + "learning_rate": 1.9053628985282125e-07, + "loss": 0.1537, + "step": 2487 + }, + { + "epoch": 0.05, + "learning_rate": 1.905324065084851e-07, + "loss": 0.3603, + "step": 2488 + }, + { + "epoch": 0.05, + "learning_rate": 1.9052852316414897e-07, + "loss": 0.5594, + "step": 2489 + }, + { + "epoch": 0.05, + "learning_rate": 1.905246398198128e-07, + "loss": 0.2588, + "step": 2490 + }, + { + "epoch": 0.05, + "learning_rate": 1.9052075647547668e-07, + "loss": 0.2197, + "step": 2491 + }, + { + "epoch": 0.05, + "learning_rate": 1.9051687313114053e-07, + "loss": 0.2655, + "step": 2492 + }, + { + "epoch": 0.05, + "learning_rate": 1.905129897868044e-07, + "loss": 0.2299, + "step": 2493 + }, + { + "epoch": 0.05, + "learning_rate": 1.9050910644246824e-07, + "loss": 0.3857, + "step": 2494 + }, + { + "epoch": 0.05, + "learning_rate": 1.9050522309813211e-07, + "loss": 0.1678, + "step": 2495 + }, + { + "epoch": 0.05, + "learning_rate": 1.9050133975379596e-07, + "loss": 0.2246, + "step": 2496 + }, + { + "epoch": 0.05, + "learning_rate": 1.9049745640945983e-07, + "loss": 0.2539, + "step": 2497 + }, + { + "epoch": 0.05, + "learning_rate": 1.9049357306512368e-07, + "loss": 0.1627, + "step": 2498 + }, + { + "epoch": 0.05, + "learning_rate": 1.9048968972078755e-07, + "loss": 0.2282, + "step": 2499 + }, + { + "epoch": 0.05, + "learning_rate": 1.904858063764514e-07, + "loss": 0.1457, + "step": 2500 + }, + { + "epoch": 0.05, + "learning_rate": 1.9048192303211526e-07, + "loss": 0.1847, + "step": 2501 + }, + { + "epoch": 0.05, + "learning_rate": 1.904780396877791e-07, + "loss": 0.1322, + "step": 2502 + }, + { + "epoch": 0.05, + "learning_rate": 1.9047415634344298e-07, + "loss": 0.3504, + "step": 2503 + }, + { + "epoch": 0.05, + "learning_rate": 1.9047027299910683e-07, + "loss": 0.3734, + "step": 2504 + }, + { + "epoch": 0.05, + "learning_rate": 1.904663896547707e-07, + "loss": 0.1468, + "step": 2505 + }, + { + "epoch": 0.05, + "learning_rate": 1.9046250631043454e-07, + "loss": 0.3473, + "step": 2506 + }, + { + "epoch": 0.05, + "learning_rate": 1.9045862296609841e-07, + "loss": 0.1369, + "step": 2507 + }, + { + "epoch": 0.05, + "learning_rate": 1.9045473962176226e-07, + "loss": 0.4465, + "step": 2508 + }, + { + "epoch": 0.05, + "learning_rate": 1.9045085627742613e-07, + "loss": 0.3414, + "step": 2509 + }, + { + "epoch": 0.05, + "learning_rate": 1.9044697293308997e-07, + "loss": 0.099, + "step": 2510 + }, + { + "epoch": 0.05, + "learning_rate": 1.9044308958875385e-07, + "loss": 0.1679, + "step": 2511 + }, + { + "epoch": 0.05, + "learning_rate": 1.904392062444177e-07, + "loss": 0.1479, + "step": 2512 + }, + { + "epoch": 0.05, + "learning_rate": 1.9043532290008156e-07, + "loss": 0.3301, + "step": 2513 + }, + { + "epoch": 0.05, + "learning_rate": 1.904314395557454e-07, + "loss": 0.3721, + "step": 2514 + }, + { + "epoch": 0.05, + "learning_rate": 1.9042755621140925e-07, + "loss": 0.4788, + "step": 2515 + }, + { + "epoch": 0.05, + "learning_rate": 1.904236728670731e-07, + "loss": 0.3848, + "step": 2516 + }, + { + "epoch": 0.05, + "learning_rate": 1.9041978952273697e-07, + "loss": 0.33, + "step": 2517 + }, + { + "epoch": 0.05, + "learning_rate": 1.9041590617840081e-07, + "loss": 0.2374, + "step": 2518 + }, + { + "epoch": 0.05, + "learning_rate": 1.9041202283406469e-07, + "loss": 0.1771, + "step": 2519 + }, + { + "epoch": 0.05, + "learning_rate": 1.9040813948972853e-07, + "loss": 0.2146, + "step": 2520 + }, + { + "epoch": 0.05, + "learning_rate": 1.904042561453924e-07, + "loss": 0.1238, + "step": 2521 + }, + { + "epoch": 0.05, + "learning_rate": 1.9040037280105625e-07, + "loss": 0.1201, + "step": 2522 + }, + { + "epoch": 0.05, + "learning_rate": 1.9039648945672012e-07, + "loss": 0.3529, + "step": 2523 + }, + { + "epoch": 0.05, + "learning_rate": 1.9039260611238396e-07, + "loss": 0.3091, + "step": 2524 + }, + { + "epoch": 0.05, + "learning_rate": 1.9038872276804784e-07, + "loss": 0.5155, + "step": 2525 + }, + { + "epoch": 0.05, + "learning_rate": 1.9038483942371168e-07, + "loss": 0.1845, + "step": 2526 + }, + { + "epoch": 0.05, + "learning_rate": 1.9038095607937555e-07, + "loss": 0.1902, + "step": 2527 + }, + { + "epoch": 0.05, + "learning_rate": 1.903770727350394e-07, + "loss": 0.8458, + "step": 2528 + }, + { + "epoch": 0.05, + "learning_rate": 1.9037318939070327e-07, + "loss": 0.253, + "step": 2529 + }, + { + "epoch": 0.05, + "learning_rate": 1.9036930604636711e-07, + "loss": 0.3169, + "step": 2530 + }, + { + "epoch": 0.05, + "learning_rate": 1.9036542270203098e-07, + "loss": 0.2409, + "step": 2531 + }, + { + "epoch": 0.05, + "learning_rate": 1.9036153935769483e-07, + "loss": 0.2936, + "step": 2532 + }, + { + "epoch": 0.05, + "learning_rate": 1.903576560133587e-07, + "loss": 0.1178, + "step": 2533 + }, + { + "epoch": 0.05, + "learning_rate": 1.9035377266902255e-07, + "loss": 0.1612, + "step": 2534 + }, + { + "epoch": 0.05, + "learning_rate": 1.9034988932468642e-07, + "loss": 0.181, + "step": 2535 + }, + { + "epoch": 0.05, + "learning_rate": 1.9034600598035026e-07, + "loss": 0.2128, + "step": 2536 + }, + { + "epoch": 0.05, + "learning_rate": 1.9034212263601413e-07, + "loss": 0.1588, + "step": 2537 + }, + { + "epoch": 0.05, + "learning_rate": 1.9033823929167798e-07, + "loss": 0.1387, + "step": 2538 + }, + { + "epoch": 0.05, + "learning_rate": 1.9033435594734185e-07, + "loss": 0.4409, + "step": 2539 + }, + { + "epoch": 0.05, + "learning_rate": 1.903304726030057e-07, + "loss": 0.4654, + "step": 2540 + }, + { + "epoch": 0.05, + "learning_rate": 1.9032658925866957e-07, + "loss": 0.2465, + "step": 2541 + }, + { + "epoch": 0.05, + "learning_rate": 1.903227059143334e-07, + "loss": 0.4964, + "step": 2542 + }, + { + "epoch": 0.05, + "learning_rate": 1.9031882256999728e-07, + "loss": 0.2776, + "step": 2543 + }, + { + "epoch": 0.05, + "learning_rate": 1.9031493922566113e-07, + "loss": 0.1954, + "step": 2544 + }, + { + "epoch": 0.05, + "learning_rate": 1.90311055881325e-07, + "loss": 0.2242, + "step": 2545 + }, + { + "epoch": 0.05, + "learning_rate": 1.9030717253698885e-07, + "loss": 0.1876, + "step": 2546 + }, + { + "epoch": 0.05, + "learning_rate": 1.9030328919265272e-07, + "loss": 0.1833, + "step": 2547 + }, + { + "epoch": 0.05, + "learning_rate": 1.9029940584831656e-07, + "loss": 0.1601, + "step": 2548 + }, + { + "epoch": 0.05, + "learning_rate": 1.9029552250398043e-07, + "loss": 0.1387, + "step": 2549 + }, + { + "epoch": 0.05, + "learning_rate": 1.9029163915964428e-07, + "loss": 0.2615, + "step": 2550 + }, + { + "epoch": 0.05, + "learning_rate": 1.9028775581530815e-07, + "loss": 0.1158, + "step": 2551 + }, + { + "epoch": 0.05, + "learning_rate": 1.90283872470972e-07, + "loss": 0.193, + "step": 2552 + }, + { + "epoch": 0.05, + "learning_rate": 1.9027998912663587e-07, + "loss": 0.2354, + "step": 2553 + }, + { + "epoch": 0.05, + "learning_rate": 1.902761057822997e-07, + "loss": 0.362, + "step": 2554 + }, + { + "epoch": 0.05, + "learning_rate": 1.9027222243796358e-07, + "loss": 0.1555, + "step": 2555 + }, + { + "epoch": 0.05, + "learning_rate": 1.9026833909362743e-07, + "loss": 0.1505, + "step": 2556 + }, + { + "epoch": 0.05, + "learning_rate": 1.902644557492913e-07, + "loss": 0.1849, + "step": 2557 + }, + { + "epoch": 0.05, + "learning_rate": 1.9026057240495514e-07, + "loss": 0.1663, + "step": 2558 + }, + { + "epoch": 0.05, + "learning_rate": 1.90256689060619e-07, + "loss": 0.2912, + "step": 2559 + }, + { + "epoch": 0.05, + "learning_rate": 1.9025280571628286e-07, + "loss": 0.1402, + "step": 2560 + }, + { + "epoch": 0.05, + "learning_rate": 1.902489223719467e-07, + "loss": 0.2088, + "step": 2561 + }, + { + "epoch": 0.05, + "learning_rate": 1.9024503902761058e-07, + "loss": 0.1452, + "step": 2562 + }, + { + "epoch": 0.05, + "learning_rate": 1.9024115568327442e-07, + "loss": 0.1448, + "step": 2563 + }, + { + "epoch": 0.05, + "learning_rate": 1.902372723389383e-07, + "loss": 0.1464, + "step": 2564 + }, + { + "epoch": 0.05, + "learning_rate": 1.9023338899460214e-07, + "loss": 0.1439, + "step": 2565 + }, + { + "epoch": 0.05, + "learning_rate": 1.90229505650266e-07, + "loss": 0.1752, + "step": 2566 + }, + { + "epoch": 0.05, + "learning_rate": 1.9022562230592986e-07, + "loss": 0.247, + "step": 2567 + }, + { + "epoch": 0.05, + "learning_rate": 1.9022173896159373e-07, + "loss": 0.1581, + "step": 2568 + }, + { + "epoch": 0.05, + "learning_rate": 1.9021785561725757e-07, + "loss": 0.2937, + "step": 2569 + }, + { + "epoch": 0.05, + "learning_rate": 1.9021397227292144e-07, + "loss": 0.1505, + "step": 2570 + }, + { + "epoch": 0.05, + "learning_rate": 1.902100889285853e-07, + "loss": 0.2561, + "step": 2571 + }, + { + "epoch": 0.05, + "learning_rate": 1.9020620558424916e-07, + "loss": 0.1729, + "step": 2572 + }, + { + "epoch": 0.05, + "learning_rate": 1.90202322239913e-07, + "loss": 0.1922, + "step": 2573 + }, + { + "epoch": 0.05, + "learning_rate": 1.9019843889557685e-07, + "loss": 0.2659, + "step": 2574 + }, + { + "epoch": 0.05, + "learning_rate": 1.9019455555124072e-07, + "loss": 0.1622, + "step": 2575 + }, + { + "epoch": 0.05, + "learning_rate": 1.9019067220690457e-07, + "loss": 0.2441, + "step": 2576 + }, + { + "epoch": 0.05, + "learning_rate": 1.9018678886256844e-07, + "loss": 0.2902, + "step": 2577 + }, + { + "epoch": 0.05, + "learning_rate": 1.9018290551823228e-07, + "loss": 0.2204, + "step": 2578 + }, + { + "epoch": 0.05, + "learning_rate": 1.9017902217389615e-07, + "loss": 0.1094, + "step": 2579 + }, + { + "epoch": 0.05, + "learning_rate": 1.9017513882956e-07, + "loss": 0.176, + "step": 2580 + }, + { + "epoch": 0.05, + "learning_rate": 1.9017125548522387e-07, + "loss": 0.2263, + "step": 2581 + }, + { + "epoch": 0.05, + "learning_rate": 1.9016737214088772e-07, + "loss": 0.2864, + "step": 2582 + }, + { + "epoch": 0.05, + "learning_rate": 1.901634887965516e-07, + "loss": 0.1555, + "step": 2583 + }, + { + "epoch": 0.05, + "learning_rate": 1.9015960545221543e-07, + "loss": 0.1981, + "step": 2584 + }, + { + "epoch": 0.05, + "learning_rate": 1.901557221078793e-07, + "loss": 0.1469, + "step": 2585 + }, + { + "epoch": 0.05, + "learning_rate": 1.9015183876354315e-07, + "loss": 0.4968, + "step": 2586 + }, + { + "epoch": 0.05, + "learning_rate": 1.90147955419207e-07, + "loss": 0.1618, + "step": 2587 + }, + { + "epoch": 0.05, + "learning_rate": 1.9014407207487087e-07, + "loss": 0.1075, + "step": 2588 + }, + { + "epoch": 0.05, + "learning_rate": 1.901401887305347e-07, + "loss": 0.3492, + "step": 2589 + }, + { + "epoch": 0.05, + "learning_rate": 1.9013630538619858e-07, + "loss": 0.1295, + "step": 2590 + }, + { + "epoch": 0.05, + "learning_rate": 1.9013242204186243e-07, + "loss": 0.2164, + "step": 2591 + }, + { + "epoch": 0.05, + "learning_rate": 1.901285386975263e-07, + "loss": 0.2745, + "step": 2592 + }, + { + "epoch": 0.05, + "learning_rate": 1.9012465535319014e-07, + "loss": 0.1581, + "step": 2593 + }, + { + "epoch": 0.05, + "learning_rate": 1.9012077200885401e-07, + "loss": 0.3198, + "step": 2594 + }, + { + "epoch": 0.05, + "learning_rate": 1.9011688866451786e-07, + "loss": 0.2672, + "step": 2595 + }, + { + "epoch": 0.05, + "learning_rate": 1.9011300532018173e-07, + "loss": 0.1188, + "step": 2596 + }, + { + "epoch": 0.05, + "learning_rate": 1.9010912197584558e-07, + "loss": 0.5858, + "step": 2597 + }, + { + "epoch": 0.05, + "learning_rate": 1.9010523863150945e-07, + "loss": 0.1923, + "step": 2598 + }, + { + "epoch": 0.05, + "learning_rate": 1.901013552871733e-07, + "loss": 0.4581, + "step": 2599 + }, + { + "epoch": 0.05, + "learning_rate": 1.9009747194283716e-07, + "loss": 0.1433, + "step": 2600 + }, + { + "epoch": 0.05, + "learning_rate": 1.90093588598501e-07, + "loss": 0.3314, + "step": 2601 + }, + { + "epoch": 0.05, + "learning_rate": 1.9008970525416488e-07, + "loss": 0.3607, + "step": 2602 + }, + { + "epoch": 0.05, + "learning_rate": 1.9008582190982873e-07, + "loss": 0.2444, + "step": 2603 + }, + { + "epoch": 0.05, + "learning_rate": 1.900819385654926e-07, + "loss": 0.291, + "step": 2604 + }, + { + "epoch": 0.05, + "learning_rate": 1.9007805522115644e-07, + "loss": 0.1593, + "step": 2605 + }, + { + "epoch": 0.05, + "learning_rate": 1.9007417187682031e-07, + "loss": 0.2575, + "step": 2606 + }, + { + "epoch": 0.05, + "learning_rate": 1.9007028853248416e-07, + "loss": 0.1207, + "step": 2607 + }, + { + "epoch": 0.05, + "learning_rate": 1.9006640518814803e-07, + "loss": 0.2285, + "step": 2608 + }, + { + "epoch": 0.05, + "learning_rate": 1.9006252184381187e-07, + "loss": 0.1683, + "step": 2609 + }, + { + "epoch": 0.05, + "learning_rate": 1.9005863849947575e-07, + "loss": 0.5142, + "step": 2610 + }, + { + "epoch": 0.05, + "learning_rate": 1.900547551551396e-07, + "loss": 0.16, + "step": 2611 + }, + { + "epoch": 0.05, + "learning_rate": 1.9005087181080346e-07, + "loss": 0.2913, + "step": 2612 + }, + { + "epoch": 0.05, + "learning_rate": 1.900469884664673e-07, + "loss": 0.1727, + "step": 2613 + }, + { + "epoch": 0.05, + "learning_rate": 1.9004310512213118e-07, + "loss": 0.1434, + "step": 2614 + }, + { + "epoch": 0.05, + "learning_rate": 1.9003922177779502e-07, + "loss": 0.6163, + "step": 2615 + }, + { + "epoch": 0.05, + "learning_rate": 1.900353384334589e-07, + "loss": 0.1575, + "step": 2616 + }, + { + "epoch": 0.05, + "learning_rate": 1.9003145508912274e-07, + "loss": 0.1638, + "step": 2617 + }, + { + "epoch": 0.05, + "learning_rate": 1.900275717447866e-07, + "loss": 0.2826, + "step": 2618 + }, + { + "epoch": 0.05, + "learning_rate": 1.9002368840045046e-07, + "loss": 0.1396, + "step": 2619 + }, + { + "epoch": 0.05, + "learning_rate": 1.9001980505611433e-07, + "loss": 0.2166, + "step": 2620 + }, + { + "epoch": 0.05, + "learning_rate": 1.9001592171177817e-07, + "loss": 0.2486, + "step": 2621 + }, + { + "epoch": 0.05, + "learning_rate": 1.9001203836744205e-07, + "loss": 0.3613, + "step": 2622 + }, + { + "epoch": 0.05, + "learning_rate": 1.900081550231059e-07, + "loss": 0.1056, + "step": 2623 + }, + { + "epoch": 0.05, + "learning_rate": 1.9000427167876976e-07, + "loss": 0.1373, + "step": 2624 + }, + { + "epoch": 0.05, + "learning_rate": 1.900003883344336e-07, + "loss": 0.1717, + "step": 2625 + }, + { + "epoch": 0.05, + "learning_rate": 1.8999650499009748e-07, + "loss": 0.186, + "step": 2626 + }, + { + "epoch": 0.05, + "learning_rate": 1.8999262164576132e-07, + "loss": 0.2276, + "step": 2627 + }, + { + "epoch": 0.05, + "learning_rate": 1.899887383014252e-07, + "loss": 0.3492, + "step": 2628 + }, + { + "epoch": 0.05, + "learning_rate": 1.8998485495708904e-07, + "loss": 0.351, + "step": 2629 + }, + { + "epoch": 0.05, + "learning_rate": 1.899809716127529e-07, + "loss": 0.2114, + "step": 2630 + }, + { + "epoch": 0.05, + "learning_rate": 1.8997708826841673e-07, + "loss": 0.1275, + "step": 2631 + }, + { + "epoch": 0.05, + "learning_rate": 1.899732049240806e-07, + "loss": 0.2021, + "step": 2632 + }, + { + "epoch": 0.05, + "learning_rate": 1.8996932157974445e-07, + "loss": 0.1614, + "step": 2633 + }, + { + "epoch": 0.05, + "learning_rate": 1.8996543823540832e-07, + "loss": 0.302, + "step": 2634 + }, + { + "epoch": 0.05, + "learning_rate": 1.8996155489107216e-07, + "loss": 0.1897, + "step": 2635 + }, + { + "epoch": 0.05, + "learning_rate": 1.8995767154673603e-07, + "loss": 0.1714, + "step": 2636 + }, + { + "epoch": 0.05, + "learning_rate": 1.8995378820239988e-07, + "loss": 0.1335, + "step": 2637 + }, + { + "epoch": 0.05, + "learning_rate": 1.8994990485806375e-07, + "loss": 0.3304, + "step": 2638 + }, + { + "epoch": 0.05, + "learning_rate": 1.899460215137276e-07, + "loss": 0.1166, + "step": 2639 + }, + { + "epoch": 0.05, + "learning_rate": 1.8994213816939147e-07, + "loss": 0.176, + "step": 2640 + }, + { + "epoch": 0.05, + "learning_rate": 1.899382548250553e-07, + "loss": 0.2803, + "step": 2641 + }, + { + "epoch": 0.05, + "learning_rate": 1.8993437148071918e-07, + "loss": 0.2046, + "step": 2642 + }, + { + "epoch": 0.05, + "learning_rate": 1.8993048813638303e-07, + "loss": 0.2573, + "step": 2643 + }, + { + "epoch": 0.05, + "learning_rate": 1.899266047920469e-07, + "loss": 0.1585, + "step": 2644 + }, + { + "epoch": 0.05, + "learning_rate": 1.8992272144771075e-07, + "loss": 0.1275, + "step": 2645 + }, + { + "epoch": 0.05, + "learning_rate": 1.8991883810337462e-07, + "loss": 0.2535, + "step": 2646 + }, + { + "epoch": 0.05, + "learning_rate": 1.8991495475903846e-07, + "loss": 0.5557, + "step": 2647 + }, + { + "epoch": 0.05, + "learning_rate": 1.8991107141470233e-07, + "loss": 0.127, + "step": 2648 + }, + { + "epoch": 0.05, + "learning_rate": 1.8990718807036618e-07, + "loss": 0.2997, + "step": 2649 + }, + { + "epoch": 0.05, + "learning_rate": 1.8990330472603005e-07, + "loss": 0.2238, + "step": 2650 + }, + { + "epoch": 0.05, + "learning_rate": 1.898994213816939e-07, + "loss": 0.2437, + "step": 2651 + }, + { + "epoch": 0.05, + "learning_rate": 1.8989553803735777e-07, + "loss": 0.1836, + "step": 2652 + }, + { + "epoch": 0.05, + "learning_rate": 1.898916546930216e-07, + "loss": 0.2629, + "step": 2653 + }, + { + "epoch": 0.05, + "learning_rate": 1.8988777134868548e-07, + "loss": 0.1704, + "step": 2654 + }, + { + "epoch": 0.05, + "learning_rate": 1.8988388800434933e-07, + "loss": 0.1391, + "step": 2655 + }, + { + "epoch": 0.05, + "learning_rate": 1.898800046600132e-07, + "loss": 0.1748, + "step": 2656 + }, + { + "epoch": 0.05, + "learning_rate": 1.8987612131567704e-07, + "loss": 0.4239, + "step": 2657 + }, + { + "epoch": 0.05, + "learning_rate": 1.8987223797134092e-07, + "loss": 0.138, + "step": 2658 + }, + { + "epoch": 0.05, + "learning_rate": 1.8986835462700476e-07, + "loss": 0.2657, + "step": 2659 + }, + { + "epoch": 0.05, + "learning_rate": 1.8986447128266863e-07, + "loss": 0.1383, + "step": 2660 + }, + { + "epoch": 0.05, + "learning_rate": 1.8986058793833248e-07, + "loss": 0.4647, + "step": 2661 + }, + { + "epoch": 0.05, + "learning_rate": 1.8985670459399635e-07, + "loss": 0.5005, + "step": 2662 + }, + { + "epoch": 0.05, + "learning_rate": 1.898528212496602e-07, + "loss": 0.1225, + "step": 2663 + }, + { + "epoch": 0.05, + "learning_rate": 1.8984893790532407e-07, + "loss": 0.2018, + "step": 2664 + }, + { + "epoch": 0.05, + "learning_rate": 1.898450545609879e-07, + "loss": 0.1799, + "step": 2665 + }, + { + "epoch": 0.05, + "learning_rate": 1.8984117121665178e-07, + "loss": 0.1546, + "step": 2666 + }, + { + "epoch": 0.05, + "learning_rate": 1.8983728787231563e-07, + "loss": 0.1137, + "step": 2667 + }, + { + "epoch": 0.05, + "learning_rate": 1.898334045279795e-07, + "loss": 0.3578, + "step": 2668 + }, + { + "epoch": 0.05, + "learning_rate": 1.8982952118364334e-07, + "loss": 0.1687, + "step": 2669 + }, + { + "epoch": 0.05, + "learning_rate": 1.8982563783930721e-07, + "loss": 0.2303, + "step": 2670 + }, + { + "epoch": 0.05, + "learning_rate": 1.8982175449497106e-07, + "loss": 0.27, + "step": 2671 + }, + { + "epoch": 0.05, + "learning_rate": 1.8981787115063493e-07, + "loss": 0.1705, + "step": 2672 + }, + { + "epoch": 0.05, + "learning_rate": 1.8981398780629878e-07, + "loss": 0.1331, + "step": 2673 + }, + { + "epoch": 0.05, + "learning_rate": 1.8981010446196265e-07, + "loss": 0.108, + "step": 2674 + }, + { + "epoch": 0.05, + "learning_rate": 1.898062211176265e-07, + "loss": 0.184, + "step": 2675 + }, + { + "epoch": 0.05, + "learning_rate": 1.8980233777329036e-07, + "loss": 0.1556, + "step": 2676 + }, + { + "epoch": 0.05, + "learning_rate": 1.897984544289542e-07, + "loss": 0.1123, + "step": 2677 + }, + { + "epoch": 0.05, + "learning_rate": 1.8979457108461808e-07, + "loss": 0.2431, + "step": 2678 + }, + { + "epoch": 0.05, + "learning_rate": 1.8979068774028193e-07, + "loss": 0.0914, + "step": 2679 + }, + { + "epoch": 0.05, + "learning_rate": 1.897868043959458e-07, + "loss": 0.1802, + "step": 2680 + }, + { + "epoch": 0.05, + "learning_rate": 1.8978292105160964e-07, + "loss": 0.3212, + "step": 2681 + }, + { + "epoch": 0.05, + "learning_rate": 1.8977903770727351e-07, + "loss": 0.3154, + "step": 2682 + }, + { + "epoch": 0.05, + "learning_rate": 1.8977515436293736e-07, + "loss": 0.349, + "step": 2683 + }, + { + "epoch": 0.05, + "learning_rate": 1.8977127101860123e-07, + "loss": 0.1684, + "step": 2684 + }, + { + "epoch": 0.05, + "learning_rate": 1.8976738767426508e-07, + "loss": 0.1422, + "step": 2685 + }, + { + "epoch": 0.05, + "learning_rate": 1.8976350432992895e-07, + "loss": 0.3716, + "step": 2686 + }, + { + "epoch": 0.05, + "learning_rate": 1.897596209855928e-07, + "loss": 0.197, + "step": 2687 + }, + { + "epoch": 0.05, + "learning_rate": 1.8975573764125666e-07, + "loss": 0.1085, + "step": 2688 + }, + { + "epoch": 0.05, + "learning_rate": 1.8975185429692048e-07, + "loss": 0.4093, + "step": 2689 + }, + { + "epoch": 0.05, + "learning_rate": 1.8974797095258435e-07, + "loss": 0.3114, + "step": 2690 + }, + { + "epoch": 0.05, + "learning_rate": 1.897440876082482e-07, + "loss": 0.118, + "step": 2691 + }, + { + "epoch": 0.05, + "learning_rate": 1.8974020426391207e-07, + "loss": 0.1268, + "step": 2692 + }, + { + "epoch": 0.05, + "learning_rate": 1.8973632091957591e-07, + "loss": 0.1819, + "step": 2693 + }, + { + "epoch": 0.05, + "learning_rate": 1.8973243757523979e-07, + "loss": 0.2477, + "step": 2694 + }, + { + "epoch": 0.05, + "learning_rate": 1.8972855423090363e-07, + "loss": 0.1398, + "step": 2695 + }, + { + "epoch": 0.05, + "learning_rate": 1.897246708865675e-07, + "loss": 0.2083, + "step": 2696 + }, + { + "epoch": 0.05, + "learning_rate": 1.8972078754223135e-07, + "loss": 0.153, + "step": 2697 + }, + { + "epoch": 0.05, + "learning_rate": 1.8971690419789522e-07, + "loss": 0.5899, + "step": 2698 + }, + { + "epoch": 0.05, + "learning_rate": 1.8971302085355906e-07, + "loss": 0.117, + "step": 2699 + }, + { + "epoch": 0.05, + "learning_rate": 1.8970913750922294e-07, + "loss": 0.292, + "step": 2700 + }, + { + "epoch": 0.05, + "learning_rate": 1.8970525416488678e-07, + "loss": 0.1226, + "step": 2701 + }, + { + "epoch": 0.05, + "learning_rate": 1.8970137082055065e-07, + "loss": 0.3845, + "step": 2702 + }, + { + "epoch": 0.05, + "learning_rate": 1.896974874762145e-07, + "loss": 0.2994, + "step": 2703 + }, + { + "epoch": 0.05, + "learning_rate": 1.8969360413187837e-07, + "loss": 0.4882, + "step": 2704 + }, + { + "epoch": 0.05, + "learning_rate": 1.8968972078754221e-07, + "loss": 0.512, + "step": 2705 + }, + { + "epoch": 0.05, + "learning_rate": 1.8968583744320608e-07, + "loss": 0.1265, + "step": 2706 + }, + { + "epoch": 0.05, + "learning_rate": 1.8968195409886993e-07, + "loss": 0.1068, + "step": 2707 + }, + { + "epoch": 0.05, + "learning_rate": 1.896780707545338e-07, + "loss": 0.314, + "step": 2708 + }, + { + "epoch": 0.05, + "learning_rate": 1.8967418741019765e-07, + "loss": 0.122, + "step": 2709 + }, + { + "epoch": 0.05, + "learning_rate": 1.8967030406586152e-07, + "loss": 0.1779, + "step": 2710 + }, + { + "epoch": 0.05, + "learning_rate": 1.8966642072152536e-07, + "loss": 0.2064, + "step": 2711 + }, + { + "epoch": 0.05, + "learning_rate": 1.8966253737718923e-07, + "loss": 0.1074, + "step": 2712 + }, + { + "epoch": 0.05, + "learning_rate": 1.8965865403285308e-07, + "loss": 0.2594, + "step": 2713 + }, + { + "epoch": 0.05, + "learning_rate": 1.8965477068851695e-07, + "loss": 0.2161, + "step": 2714 + }, + { + "epoch": 0.05, + "learning_rate": 1.896508873441808e-07, + "loss": 0.1099, + "step": 2715 + }, + { + "epoch": 0.05, + "learning_rate": 1.8964700399984467e-07, + "loss": 0.135, + "step": 2716 + }, + { + "epoch": 0.05, + "learning_rate": 1.896431206555085e-07, + "loss": 0.1193, + "step": 2717 + }, + { + "epoch": 0.05, + "learning_rate": 1.8963923731117238e-07, + "loss": 0.1396, + "step": 2718 + }, + { + "epoch": 0.05, + "learning_rate": 1.8963535396683623e-07, + "loss": 0.1453, + "step": 2719 + }, + { + "epoch": 0.05, + "learning_rate": 1.896314706225001e-07, + "loss": 0.115, + "step": 2720 + }, + { + "epoch": 0.05, + "learning_rate": 1.8962758727816395e-07, + "loss": 0.1354, + "step": 2721 + }, + { + "epoch": 0.05, + "learning_rate": 1.8962370393382782e-07, + "loss": 0.2079, + "step": 2722 + }, + { + "epoch": 0.05, + "learning_rate": 1.8961982058949166e-07, + "loss": 0.2878, + "step": 2723 + }, + { + "epoch": 0.05, + "learning_rate": 1.8961593724515553e-07, + "loss": 0.1522, + "step": 2724 + }, + { + "epoch": 0.05, + "learning_rate": 1.8961205390081938e-07, + "loss": 0.1053, + "step": 2725 + }, + { + "epoch": 0.05, + "learning_rate": 1.8960817055648325e-07, + "loss": 0.2306, + "step": 2726 + }, + { + "epoch": 0.05, + "learning_rate": 1.896042872121471e-07, + "loss": 0.0994, + "step": 2727 + }, + { + "epoch": 0.05, + "learning_rate": 1.8960040386781097e-07, + "loss": 0.2324, + "step": 2728 + }, + { + "epoch": 0.05, + "learning_rate": 1.895965205234748e-07, + "loss": 0.3254, + "step": 2729 + }, + { + "epoch": 0.05, + "learning_rate": 1.8959263717913868e-07, + "loss": 0.1147, + "step": 2730 + }, + { + "epoch": 0.05, + "learning_rate": 1.8958875383480253e-07, + "loss": 0.1397, + "step": 2731 + }, + { + "epoch": 0.05, + "learning_rate": 1.895848704904664e-07, + "loss": 0.2856, + "step": 2732 + }, + { + "epoch": 0.05, + "learning_rate": 1.8958098714613024e-07, + "loss": 0.1602, + "step": 2733 + }, + { + "epoch": 0.05, + "learning_rate": 1.8957710380179412e-07, + "loss": 0.1274, + "step": 2734 + }, + { + "epoch": 0.05, + "learning_rate": 1.8957322045745796e-07, + "loss": 0.1233, + "step": 2735 + }, + { + "epoch": 0.05, + "learning_rate": 1.895693371131218e-07, + "loss": 0.1967, + "step": 2736 + }, + { + "epoch": 0.05, + "learning_rate": 1.8956545376878568e-07, + "loss": 0.1497, + "step": 2737 + }, + { + "epoch": 0.05, + "learning_rate": 1.8956157042444952e-07, + "loss": 0.1703, + "step": 2738 + }, + { + "epoch": 0.05, + "learning_rate": 1.895576870801134e-07, + "loss": 0.1101, + "step": 2739 + }, + { + "epoch": 0.05, + "learning_rate": 1.8955380373577724e-07, + "loss": 0.1545, + "step": 2740 + }, + { + "epoch": 0.05, + "learning_rate": 1.895499203914411e-07, + "loss": 0.1641, + "step": 2741 + }, + { + "epoch": 0.05, + "learning_rate": 1.8954603704710496e-07, + "loss": 0.156, + "step": 2742 + }, + { + "epoch": 0.05, + "learning_rate": 1.8954215370276883e-07, + "loss": 0.1151, + "step": 2743 + }, + { + "epoch": 0.05, + "learning_rate": 1.8953827035843267e-07, + "loss": 0.1952, + "step": 2744 + }, + { + "epoch": 0.05, + "learning_rate": 1.8953438701409654e-07, + "loss": 0.2595, + "step": 2745 + }, + { + "epoch": 0.05, + "learning_rate": 1.895305036697604e-07, + "loss": 0.2114, + "step": 2746 + }, + { + "epoch": 0.05, + "learning_rate": 1.8952662032542423e-07, + "loss": 0.0946, + "step": 2747 + }, + { + "epoch": 0.05, + "learning_rate": 1.895227369810881e-07, + "loss": 0.2572, + "step": 2748 + }, + { + "epoch": 0.05, + "learning_rate": 1.8951885363675195e-07, + "loss": 0.2217, + "step": 2749 + }, + { + "epoch": 0.05, + "learning_rate": 1.8951497029241582e-07, + "loss": 0.1415, + "step": 2750 + }, + { + "epoch": 0.05, + "learning_rate": 1.8951108694807967e-07, + "loss": 0.1832, + "step": 2751 + }, + { + "epoch": 0.05, + "learning_rate": 1.8950720360374354e-07, + "loss": 0.4894, + "step": 2752 + }, + { + "epoch": 0.05, + "learning_rate": 1.8950332025940738e-07, + "loss": 0.5951, + "step": 2753 + }, + { + "epoch": 0.05, + "learning_rate": 1.8949943691507125e-07, + "loss": 0.1472, + "step": 2754 + }, + { + "epoch": 0.05, + "learning_rate": 1.894955535707351e-07, + "loss": 0.1349, + "step": 2755 + }, + { + "epoch": 0.05, + "learning_rate": 1.8949167022639897e-07, + "loss": 0.1558, + "step": 2756 + }, + { + "epoch": 0.05, + "learning_rate": 1.8948778688206282e-07, + "loss": 0.1326, + "step": 2757 + }, + { + "epoch": 0.05, + "learning_rate": 1.894839035377267e-07, + "loss": 0.3135, + "step": 2758 + }, + { + "epoch": 0.05, + "learning_rate": 1.8948002019339053e-07, + "loss": 0.3438, + "step": 2759 + }, + { + "epoch": 0.05, + "learning_rate": 1.894761368490544e-07, + "loss": 0.1029, + "step": 2760 + }, + { + "epoch": 0.05, + "learning_rate": 1.8947225350471825e-07, + "loss": 0.3178, + "step": 2761 + }, + { + "epoch": 0.05, + "learning_rate": 1.8946837016038212e-07, + "loss": 0.1632, + "step": 2762 + }, + { + "epoch": 0.05, + "learning_rate": 1.8946448681604597e-07, + "loss": 0.1037, + "step": 2763 + }, + { + "epoch": 0.05, + "learning_rate": 1.894606034717098e-07, + "loss": 0.3542, + "step": 2764 + }, + { + "epoch": 0.05, + "learning_rate": 1.8945672012737368e-07, + "loss": 0.3151, + "step": 2765 + }, + { + "epoch": 0.05, + "learning_rate": 1.8945283678303753e-07, + "loss": 0.1327, + "step": 2766 + }, + { + "epoch": 0.05, + "learning_rate": 1.894489534387014e-07, + "loss": 0.1856, + "step": 2767 + }, + { + "epoch": 0.05, + "learning_rate": 1.8944507009436524e-07, + "loss": 0.1373, + "step": 2768 + }, + { + "epoch": 0.05, + "learning_rate": 1.8944118675002911e-07, + "loss": 0.0973, + "step": 2769 + }, + { + "epoch": 0.05, + "learning_rate": 1.8943730340569296e-07, + "loss": 0.6031, + "step": 2770 + }, + { + "epoch": 0.05, + "learning_rate": 1.8943342006135683e-07, + "loss": 0.1231, + "step": 2771 + }, + { + "epoch": 0.05, + "learning_rate": 1.8942953671702068e-07, + "loss": 0.1242, + "step": 2772 + }, + { + "epoch": 0.05, + "learning_rate": 1.8942565337268455e-07, + "loss": 0.1295, + "step": 2773 + }, + { + "epoch": 0.05, + "learning_rate": 1.894217700283484e-07, + "loss": 0.0863, + "step": 2774 + }, + { + "epoch": 0.05, + "learning_rate": 1.8941788668401226e-07, + "loss": 0.1011, + "step": 2775 + }, + { + "epoch": 0.05, + "learning_rate": 1.894140033396761e-07, + "loss": 0.161, + "step": 2776 + }, + { + "epoch": 0.05, + "learning_rate": 1.8941011999533998e-07, + "loss": 0.2257, + "step": 2777 + }, + { + "epoch": 0.05, + "learning_rate": 1.8940623665100383e-07, + "loss": 0.1808, + "step": 2778 + }, + { + "epoch": 0.05, + "learning_rate": 1.894023533066677e-07, + "loss": 0.5393, + "step": 2779 + }, + { + "epoch": 0.05, + "learning_rate": 1.8939846996233154e-07, + "loss": 0.1828, + "step": 2780 + }, + { + "epoch": 0.05, + "learning_rate": 1.8939458661799541e-07, + "loss": 0.1372, + "step": 2781 + }, + { + "epoch": 0.05, + "learning_rate": 1.8939070327365926e-07, + "loss": 0.344, + "step": 2782 + }, + { + "epoch": 0.05, + "learning_rate": 1.8938681992932313e-07, + "loss": 0.1716, + "step": 2783 + }, + { + "epoch": 0.05, + "learning_rate": 1.8938293658498698e-07, + "loss": 0.1557, + "step": 2784 + }, + { + "epoch": 0.05, + "learning_rate": 1.8937905324065085e-07, + "loss": 0.2552, + "step": 2785 + }, + { + "epoch": 0.05, + "learning_rate": 1.893751698963147e-07, + "loss": 0.1155, + "step": 2786 + }, + { + "epoch": 0.05, + "learning_rate": 1.8937128655197856e-07, + "loss": 0.1577, + "step": 2787 + }, + { + "epoch": 0.05, + "learning_rate": 1.893674032076424e-07, + "loss": 0.1825, + "step": 2788 + }, + { + "epoch": 0.05, + "learning_rate": 1.8936351986330628e-07, + "loss": 0.151, + "step": 2789 + }, + { + "epoch": 0.05, + "learning_rate": 1.8935963651897012e-07, + "loss": 0.189, + "step": 2790 + }, + { + "epoch": 0.05, + "learning_rate": 1.89355753174634e-07, + "loss": 0.1805, + "step": 2791 + }, + { + "epoch": 0.05, + "learning_rate": 1.8935186983029784e-07, + "loss": 0.0939, + "step": 2792 + }, + { + "epoch": 0.05, + "learning_rate": 1.893479864859617e-07, + "loss": 0.2233, + "step": 2793 + }, + { + "epoch": 0.05, + "learning_rate": 1.8934410314162556e-07, + "loss": 0.1237, + "step": 2794 + }, + { + "epoch": 0.05, + "learning_rate": 1.8934021979728943e-07, + "loss": 0.284, + "step": 2795 + }, + { + "epoch": 0.05, + "learning_rate": 1.8933633645295327e-07, + "loss": 0.3264, + "step": 2796 + }, + { + "epoch": 0.05, + "learning_rate": 1.8933245310861715e-07, + "loss": 0.2116, + "step": 2797 + }, + { + "epoch": 0.05, + "learning_rate": 1.89328569764281e-07, + "loss": 0.1665, + "step": 2798 + }, + { + "epoch": 0.05, + "learning_rate": 1.8932468641994486e-07, + "loss": 0.1088, + "step": 2799 + }, + { + "epoch": 0.05, + "learning_rate": 1.893208030756087e-07, + "loss": 0.401, + "step": 2800 + }, + { + "epoch": 0.05, + "learning_rate": 1.8931691973127258e-07, + "loss": 0.2969, + "step": 2801 + }, + { + "epoch": 0.05, + "learning_rate": 1.8931303638693642e-07, + "loss": 0.1172, + "step": 2802 + }, + { + "epoch": 0.05, + "learning_rate": 1.893091530426003e-07, + "loss": 0.1061, + "step": 2803 + }, + { + "epoch": 0.05, + "learning_rate": 1.8930526969826414e-07, + "loss": 0.1521, + "step": 2804 + }, + { + "epoch": 0.05, + "learning_rate": 1.8930138635392799e-07, + "loss": 0.1181, + "step": 2805 + }, + { + "epoch": 0.05, + "learning_rate": 1.8929750300959183e-07, + "loss": 0.1522, + "step": 2806 + }, + { + "epoch": 0.05, + "learning_rate": 1.892936196652557e-07, + "loss": 0.2051, + "step": 2807 + }, + { + "epoch": 0.05, + "learning_rate": 1.8928973632091955e-07, + "loss": 0.2378, + "step": 2808 + }, + { + "epoch": 0.05, + "learning_rate": 1.8928585297658342e-07, + "loss": 0.0865, + "step": 2809 + }, + { + "epoch": 0.05, + "learning_rate": 1.8928196963224726e-07, + "loss": 0.1307, + "step": 2810 + }, + { + "epoch": 0.05, + "learning_rate": 1.8927808628791113e-07, + "loss": 0.595, + "step": 2811 + }, + { + "epoch": 0.05, + "learning_rate": 1.8927420294357498e-07, + "loss": 0.4112, + "step": 2812 + }, + { + "epoch": 0.05, + "learning_rate": 1.8927031959923885e-07, + "loss": 0.1851, + "step": 2813 + }, + { + "epoch": 0.05, + "learning_rate": 1.892664362549027e-07, + "loss": 0.1043, + "step": 2814 + }, + { + "epoch": 0.05, + "learning_rate": 1.8926255291056657e-07, + "loss": 0.2735, + "step": 2815 + }, + { + "epoch": 0.05, + "learning_rate": 1.892586695662304e-07, + "loss": 0.1865, + "step": 2816 + }, + { + "epoch": 0.05, + "learning_rate": 1.8925478622189428e-07, + "loss": 0.2062, + "step": 2817 + }, + { + "epoch": 0.05, + "learning_rate": 1.8925090287755813e-07, + "loss": 0.1746, + "step": 2818 + }, + { + "epoch": 0.05, + "learning_rate": 1.89247019533222e-07, + "loss": 0.1089, + "step": 2819 + }, + { + "epoch": 0.05, + "learning_rate": 1.8924313618888585e-07, + "loss": 0.1302, + "step": 2820 + }, + { + "epoch": 0.05, + "learning_rate": 1.8923925284454972e-07, + "loss": 0.175, + "step": 2821 + }, + { + "epoch": 0.05, + "learning_rate": 1.8923536950021356e-07, + "loss": 0.1708, + "step": 2822 + }, + { + "epoch": 0.05, + "learning_rate": 1.8923148615587743e-07, + "loss": 0.2291, + "step": 2823 + }, + { + "epoch": 0.05, + "learning_rate": 1.8922760281154128e-07, + "loss": 0.2026, + "step": 2824 + }, + { + "epoch": 0.05, + "learning_rate": 1.8922371946720515e-07, + "loss": 0.3696, + "step": 2825 + }, + { + "epoch": 0.05, + "learning_rate": 1.89219836122869e-07, + "loss": 0.3535, + "step": 2826 + }, + { + "epoch": 0.05, + "learning_rate": 1.8921595277853287e-07, + "loss": 0.2432, + "step": 2827 + }, + { + "epoch": 0.05, + "learning_rate": 1.892120694341967e-07, + "loss": 0.0975, + "step": 2828 + }, + { + "epoch": 0.05, + "learning_rate": 1.8920818608986058e-07, + "loss": 0.1947, + "step": 2829 + }, + { + "epoch": 0.05, + "learning_rate": 1.8920430274552443e-07, + "loss": 0.2951, + "step": 2830 + }, + { + "epoch": 0.05, + "learning_rate": 1.892004194011883e-07, + "loss": 0.1278, + "step": 2831 + }, + { + "epoch": 0.05, + "learning_rate": 1.8919653605685214e-07, + "loss": 0.4063, + "step": 2832 + }, + { + "epoch": 0.05, + "learning_rate": 1.8919265271251602e-07, + "loss": 0.1542, + "step": 2833 + }, + { + "epoch": 0.05, + "learning_rate": 1.8918876936817986e-07, + "loss": 0.1851, + "step": 2834 + }, + { + "epoch": 0.05, + "learning_rate": 1.8918488602384373e-07, + "loss": 0.1223, + "step": 2835 + }, + { + "epoch": 0.06, + "learning_rate": 1.8918100267950758e-07, + "loss": 0.3741, + "step": 2836 + }, + { + "epoch": 0.06, + "learning_rate": 1.8917711933517145e-07, + "loss": 0.142, + "step": 2837 + }, + { + "epoch": 0.06, + "learning_rate": 1.891732359908353e-07, + "loss": 0.2065, + "step": 2838 + }, + { + "epoch": 0.06, + "learning_rate": 1.8916935264649917e-07, + "loss": 0.1114, + "step": 2839 + }, + { + "epoch": 0.06, + "learning_rate": 1.89165469302163e-07, + "loss": 0.1111, + "step": 2840 + }, + { + "epoch": 0.06, + "learning_rate": 1.8916158595782688e-07, + "loss": 0.2647, + "step": 2841 + }, + { + "epoch": 0.06, + "learning_rate": 1.8915770261349073e-07, + "loss": 0.1636, + "step": 2842 + }, + { + "epoch": 0.06, + "learning_rate": 1.891538192691546e-07, + "loss": 0.1013, + "step": 2843 + }, + { + "epoch": 0.06, + "learning_rate": 1.8914993592481844e-07, + "loss": 0.2527, + "step": 2844 + }, + { + "epoch": 0.06, + "learning_rate": 1.8914605258048231e-07, + "loss": 0.1815, + "step": 2845 + }, + { + "epoch": 0.06, + "learning_rate": 1.8914216923614616e-07, + "loss": 0.528, + "step": 2846 + }, + { + "epoch": 0.06, + "learning_rate": 1.8913828589181003e-07, + "loss": 0.2486, + "step": 2847 + }, + { + "epoch": 0.06, + "learning_rate": 1.8913440254747388e-07, + "loss": 0.1732, + "step": 2848 + }, + { + "epoch": 0.06, + "learning_rate": 1.8913051920313775e-07, + "loss": 0.1214, + "step": 2849 + }, + { + "epoch": 0.06, + "learning_rate": 1.891266358588016e-07, + "loss": 0.1564, + "step": 2850 + }, + { + "epoch": 0.06, + "learning_rate": 1.8912275251446546e-07, + "loss": 0.149, + "step": 2851 + }, + { + "epoch": 0.06, + "learning_rate": 1.891188691701293e-07, + "loss": 0.0958, + "step": 2852 + }, + { + "epoch": 0.06, + "learning_rate": 1.8911498582579318e-07, + "loss": 0.2299, + "step": 2853 + }, + { + "epoch": 0.06, + "learning_rate": 1.8911110248145703e-07, + "loss": 0.138, + "step": 2854 + }, + { + "epoch": 0.06, + "learning_rate": 1.891072191371209e-07, + "loss": 0.1394, + "step": 2855 + }, + { + "epoch": 0.06, + "learning_rate": 1.8910333579278474e-07, + "loss": 0.1232, + "step": 2856 + }, + { + "epoch": 0.06, + "learning_rate": 1.8909945244844861e-07, + "loss": 0.3692, + "step": 2857 + }, + { + "epoch": 0.06, + "learning_rate": 1.8909556910411246e-07, + "loss": 0.2166, + "step": 2858 + }, + { + "epoch": 0.06, + "learning_rate": 1.8909168575977633e-07, + "loss": 0.1249, + "step": 2859 + }, + { + "epoch": 0.06, + "learning_rate": 1.8908780241544018e-07, + "loss": 0.4641, + "step": 2860 + }, + { + "epoch": 0.06, + "learning_rate": 1.8908391907110405e-07, + "loss": 0.1985, + "step": 2861 + }, + { + "epoch": 0.06, + "learning_rate": 1.890800357267679e-07, + "loss": 0.2808, + "step": 2862 + }, + { + "epoch": 0.06, + "learning_rate": 1.8907615238243174e-07, + "loss": 0.3188, + "step": 2863 + }, + { + "epoch": 0.06, + "learning_rate": 1.8907226903809558e-07, + "loss": 0.1693, + "step": 2864 + }, + { + "epoch": 0.06, + "learning_rate": 1.8906838569375945e-07, + "loss": 0.1595, + "step": 2865 + }, + { + "epoch": 0.06, + "learning_rate": 1.890645023494233e-07, + "loss": 0.1422, + "step": 2866 + }, + { + "epoch": 0.06, + "learning_rate": 1.8906061900508717e-07, + "loss": 0.1565, + "step": 2867 + }, + { + "epoch": 0.06, + "learning_rate": 1.8905673566075101e-07, + "loss": 0.2071, + "step": 2868 + }, + { + "epoch": 0.06, + "learning_rate": 1.8905285231641489e-07, + "loss": 0.1995, + "step": 2869 + }, + { + "epoch": 0.06, + "learning_rate": 1.8904896897207873e-07, + "loss": 0.0994, + "step": 2870 + }, + { + "epoch": 0.06, + "learning_rate": 1.890450856277426e-07, + "loss": 0.2244, + "step": 2871 + }, + { + "epoch": 0.06, + "learning_rate": 1.8904120228340645e-07, + "loss": 0.1355, + "step": 2872 + }, + { + "epoch": 0.06, + "learning_rate": 1.8903731893907032e-07, + "loss": 0.1522, + "step": 2873 + }, + { + "epoch": 0.06, + "learning_rate": 1.8903343559473416e-07, + "loss": 0.3276, + "step": 2874 + }, + { + "epoch": 0.06, + "learning_rate": 1.8902955225039804e-07, + "loss": 0.1234, + "step": 2875 + }, + { + "epoch": 0.06, + "learning_rate": 1.8902566890606188e-07, + "loss": 0.1381, + "step": 2876 + }, + { + "epoch": 0.06, + "learning_rate": 1.8902178556172575e-07, + "loss": 0.1639, + "step": 2877 + }, + { + "epoch": 0.06, + "learning_rate": 1.890179022173896e-07, + "loss": 0.1526, + "step": 2878 + }, + { + "epoch": 0.06, + "learning_rate": 1.8901401887305347e-07, + "loss": 0.1041, + "step": 2879 + }, + { + "epoch": 0.06, + "learning_rate": 1.8901013552871731e-07, + "loss": 0.2819, + "step": 2880 + }, + { + "epoch": 0.06, + "learning_rate": 1.8900625218438119e-07, + "loss": 0.1571, + "step": 2881 + }, + { + "epoch": 0.06, + "learning_rate": 1.8900236884004503e-07, + "loss": 0.4148, + "step": 2882 + }, + { + "epoch": 0.06, + "learning_rate": 1.889984854957089e-07, + "loss": 0.0985, + "step": 2883 + }, + { + "epoch": 0.06, + "learning_rate": 1.8899460215137275e-07, + "loss": 0.2068, + "step": 2884 + }, + { + "epoch": 0.06, + "learning_rate": 1.8899071880703662e-07, + "loss": 0.2454, + "step": 2885 + }, + { + "epoch": 0.06, + "learning_rate": 1.8898683546270046e-07, + "loss": 0.1485, + "step": 2886 + }, + { + "epoch": 0.06, + "learning_rate": 1.8898295211836433e-07, + "loss": 0.2061, + "step": 2887 + }, + { + "epoch": 0.06, + "learning_rate": 1.8897906877402818e-07, + "loss": 0.1393, + "step": 2888 + }, + { + "epoch": 0.06, + "learning_rate": 1.8897518542969205e-07, + "loss": 0.1917, + "step": 2889 + }, + { + "epoch": 0.06, + "learning_rate": 1.889713020853559e-07, + "loss": 0.1136, + "step": 2890 + }, + { + "epoch": 0.06, + "learning_rate": 1.8896741874101977e-07, + "loss": 0.1689, + "step": 2891 + }, + { + "epoch": 0.06, + "learning_rate": 1.889635353966836e-07, + "loss": 0.3541, + "step": 2892 + }, + { + "epoch": 0.06, + "learning_rate": 1.8895965205234748e-07, + "loss": 0.2043, + "step": 2893 + }, + { + "epoch": 0.06, + "learning_rate": 1.8895576870801133e-07, + "loss": 0.1272, + "step": 2894 + }, + { + "epoch": 0.06, + "learning_rate": 1.889518853636752e-07, + "loss": 0.1018, + "step": 2895 + }, + { + "epoch": 0.06, + "learning_rate": 1.8894800201933905e-07, + "loss": 0.1061, + "step": 2896 + }, + { + "epoch": 0.06, + "learning_rate": 1.8894411867500292e-07, + "loss": 0.1072, + "step": 2897 + }, + { + "epoch": 0.06, + "learning_rate": 1.8894023533066676e-07, + "loss": 0.1128, + "step": 2898 + }, + { + "epoch": 0.06, + "learning_rate": 1.8893635198633063e-07, + "loss": 0.1144, + "step": 2899 + }, + { + "epoch": 0.06, + "learning_rate": 1.8893246864199448e-07, + "loss": 0.3085, + "step": 2900 + }, + { + "epoch": 0.06, + "learning_rate": 1.8892858529765835e-07, + "loss": 0.1656, + "step": 2901 + }, + { + "epoch": 0.06, + "learning_rate": 1.889247019533222e-07, + "loss": 0.078, + "step": 2902 + }, + { + "epoch": 0.06, + "learning_rate": 1.8892081860898607e-07, + "loss": 0.1027, + "step": 2903 + }, + { + "epoch": 0.06, + "learning_rate": 1.889169352646499e-07, + "loss": 0.4506, + "step": 2904 + }, + { + "epoch": 0.06, + "learning_rate": 1.8891305192031378e-07, + "loss": 0.1909, + "step": 2905 + }, + { + "epoch": 0.06, + "learning_rate": 1.8890916857597763e-07, + "loss": 0.0958, + "step": 2906 + }, + { + "epoch": 0.06, + "learning_rate": 1.889052852316415e-07, + "loss": 0.1442, + "step": 2907 + }, + { + "epoch": 0.06, + "learning_rate": 1.8890140188730534e-07, + "loss": 0.6319, + "step": 2908 + }, + { + "epoch": 0.06, + "learning_rate": 1.8889751854296922e-07, + "loss": 0.1374, + "step": 2909 + }, + { + "epoch": 0.06, + "learning_rate": 1.8889363519863306e-07, + "loss": 0.1479, + "step": 2910 + }, + { + "epoch": 0.06, + "learning_rate": 1.8888975185429693e-07, + "loss": 0.2206, + "step": 2911 + }, + { + "epoch": 0.06, + "learning_rate": 1.8888586850996078e-07, + "loss": 0.2623, + "step": 2912 + }, + { + "epoch": 0.06, + "learning_rate": 1.8888198516562462e-07, + "loss": 0.2644, + "step": 2913 + }, + { + "epoch": 0.06, + "learning_rate": 1.888781018212885e-07, + "loss": 0.1317, + "step": 2914 + }, + { + "epoch": 0.06, + "learning_rate": 1.8887421847695234e-07, + "loss": 0.1139, + "step": 2915 + }, + { + "epoch": 0.06, + "learning_rate": 1.888703351326162e-07, + "loss": 0.1508, + "step": 2916 + }, + { + "epoch": 0.06, + "learning_rate": 1.8886645178828006e-07, + "loss": 0.2959, + "step": 2917 + }, + { + "epoch": 0.06, + "learning_rate": 1.8886256844394393e-07, + "loss": 0.1589, + "step": 2918 + }, + { + "epoch": 0.06, + "learning_rate": 1.8885868509960777e-07, + "loss": 0.1913, + "step": 2919 + }, + { + "epoch": 0.06, + "learning_rate": 1.8885480175527164e-07, + "loss": 0.3656, + "step": 2920 + }, + { + "epoch": 0.06, + "learning_rate": 1.888509184109355e-07, + "loss": 0.3892, + "step": 2921 + }, + { + "epoch": 0.06, + "learning_rate": 1.8884703506659933e-07, + "loss": 0.3143, + "step": 2922 + }, + { + "epoch": 0.06, + "learning_rate": 1.888431517222632e-07, + "loss": 0.0821, + "step": 2923 + }, + { + "epoch": 0.06, + "learning_rate": 1.8883926837792705e-07, + "loss": 0.3372, + "step": 2924 + }, + { + "epoch": 0.06, + "learning_rate": 1.8883538503359092e-07, + "loss": 0.1944, + "step": 2925 + }, + { + "epoch": 0.06, + "learning_rate": 1.8883150168925477e-07, + "loss": 0.1673, + "step": 2926 + }, + { + "epoch": 0.06, + "learning_rate": 1.8882761834491864e-07, + "loss": 0.1015, + "step": 2927 + }, + { + "epoch": 0.06, + "learning_rate": 1.8882373500058248e-07, + "loss": 0.3881, + "step": 2928 + }, + { + "epoch": 0.06, + "learning_rate": 1.8881985165624635e-07, + "loss": 0.2198, + "step": 2929 + }, + { + "epoch": 0.06, + "learning_rate": 1.888159683119102e-07, + "loss": 0.0914, + "step": 2930 + }, + { + "epoch": 0.06, + "learning_rate": 1.8881208496757407e-07, + "loss": 0.5108, + "step": 2931 + }, + { + "epoch": 0.06, + "learning_rate": 1.8880820162323792e-07, + "loss": 0.2918, + "step": 2932 + }, + { + "epoch": 0.06, + "learning_rate": 1.888043182789018e-07, + "loss": 0.2353, + "step": 2933 + }, + { + "epoch": 0.06, + "learning_rate": 1.8880043493456563e-07, + "loss": 0.1479, + "step": 2934 + }, + { + "epoch": 0.06, + "learning_rate": 1.887965515902295e-07, + "loss": 0.1841, + "step": 2935 + }, + { + "epoch": 0.06, + "learning_rate": 1.8879266824589335e-07, + "loss": 0.127, + "step": 2936 + }, + { + "epoch": 0.06, + "learning_rate": 1.8878878490155722e-07, + "loss": 0.1608, + "step": 2937 + }, + { + "epoch": 0.06, + "learning_rate": 1.8878490155722107e-07, + "loss": 0.0974, + "step": 2938 + }, + { + "epoch": 0.06, + "learning_rate": 1.8878101821288494e-07, + "loss": 0.1115, + "step": 2939 + }, + { + "epoch": 0.06, + "learning_rate": 1.8877713486854878e-07, + "loss": 0.218, + "step": 2940 + }, + { + "epoch": 0.06, + "learning_rate": 1.8877325152421263e-07, + "loss": 0.4355, + "step": 2941 + }, + { + "epoch": 0.06, + "learning_rate": 1.887693681798765e-07, + "loss": 0.1583, + "step": 2942 + }, + { + "epoch": 0.06, + "learning_rate": 1.8876548483554034e-07, + "loss": 0.4285, + "step": 2943 + }, + { + "epoch": 0.06, + "learning_rate": 1.8876160149120421e-07, + "loss": 0.2206, + "step": 2944 + }, + { + "epoch": 0.06, + "learning_rate": 1.8875771814686806e-07, + "loss": 0.111, + "step": 2945 + }, + { + "epoch": 0.06, + "learning_rate": 1.8875383480253193e-07, + "loss": 0.1147, + "step": 2946 + }, + { + "epoch": 0.06, + "learning_rate": 1.8874995145819578e-07, + "loss": 0.139, + "step": 2947 + }, + { + "epoch": 0.06, + "learning_rate": 1.8874606811385965e-07, + "loss": 0.618, + "step": 2948 + }, + { + "epoch": 0.06, + "learning_rate": 1.887421847695235e-07, + "loss": 0.1398, + "step": 2949 + }, + { + "epoch": 0.06, + "learning_rate": 1.8873830142518736e-07, + "loss": 0.2784, + "step": 2950 + }, + { + "epoch": 0.06, + "learning_rate": 1.887344180808512e-07, + "loss": 0.1391, + "step": 2951 + }, + { + "epoch": 0.06, + "learning_rate": 1.8873053473651508e-07, + "loss": 0.1751, + "step": 2952 + }, + { + "epoch": 0.06, + "learning_rate": 1.8872665139217893e-07, + "loss": 0.4198, + "step": 2953 + }, + { + "epoch": 0.06, + "learning_rate": 1.887227680478428e-07, + "loss": 0.1406, + "step": 2954 + }, + { + "epoch": 0.06, + "learning_rate": 1.8871888470350664e-07, + "loss": 0.2129, + "step": 2955 + }, + { + "epoch": 0.06, + "learning_rate": 1.8871500135917051e-07, + "loss": 0.1893, + "step": 2956 + }, + { + "epoch": 0.06, + "learning_rate": 1.8871111801483436e-07, + "loss": 0.3923, + "step": 2957 + }, + { + "epoch": 0.06, + "learning_rate": 1.8870723467049823e-07, + "loss": 0.1471, + "step": 2958 + }, + { + "epoch": 0.06, + "learning_rate": 1.8870335132616208e-07, + "loss": 0.1337, + "step": 2959 + }, + { + "epoch": 0.06, + "learning_rate": 1.8869946798182595e-07, + "loss": 0.2688, + "step": 2960 + }, + { + "epoch": 0.06, + "learning_rate": 1.886955846374898e-07, + "loss": 0.0847, + "step": 2961 + }, + { + "epoch": 0.06, + "learning_rate": 1.8869170129315366e-07, + "loss": 0.2424, + "step": 2962 + }, + { + "epoch": 0.06, + "learning_rate": 1.886878179488175e-07, + "loss": 0.1594, + "step": 2963 + }, + { + "epoch": 0.06, + "learning_rate": 1.8868393460448138e-07, + "loss": 0.1444, + "step": 2964 + }, + { + "epoch": 0.06, + "learning_rate": 1.8868005126014522e-07, + "loss": 0.1098, + "step": 2965 + }, + { + "epoch": 0.06, + "learning_rate": 1.886761679158091e-07, + "loss": 0.3066, + "step": 2966 + }, + { + "epoch": 0.06, + "learning_rate": 1.8867228457147294e-07, + "loss": 0.1046, + "step": 2967 + }, + { + "epoch": 0.06, + "learning_rate": 1.886684012271368e-07, + "loss": 0.3869, + "step": 2968 + }, + { + "epoch": 0.06, + "learning_rate": 1.8866451788280066e-07, + "loss": 0.3739, + "step": 2969 + }, + { + "epoch": 0.06, + "learning_rate": 1.8866063453846453e-07, + "loss": 0.4221, + "step": 2970 + }, + { + "epoch": 0.06, + "learning_rate": 1.8865675119412837e-07, + "loss": 0.158, + "step": 2971 + }, + { + "epoch": 0.06, + "learning_rate": 1.8865286784979225e-07, + "loss": 0.1243, + "step": 2972 + }, + { + "epoch": 0.06, + "learning_rate": 1.886489845054561e-07, + "loss": 0.302, + "step": 2973 + }, + { + "epoch": 0.06, + "learning_rate": 1.8864510116111996e-07, + "loss": 0.2284, + "step": 2974 + }, + { + "epoch": 0.06, + "learning_rate": 1.886412178167838e-07, + "loss": 0.3221, + "step": 2975 + }, + { + "epoch": 0.06, + "learning_rate": 1.8863733447244768e-07, + "loss": 0.1646, + "step": 2976 + }, + { + "epoch": 0.06, + "learning_rate": 1.8863345112811152e-07, + "loss": 0.1416, + "step": 2977 + }, + { + "epoch": 0.06, + "learning_rate": 1.886295677837754e-07, + "loss": 0.1755, + "step": 2978 + }, + { + "epoch": 0.06, + "learning_rate": 1.8862568443943921e-07, + "loss": 0.1739, + "step": 2979 + }, + { + "epoch": 0.06, + "learning_rate": 1.8862180109510309e-07, + "loss": 0.2627, + "step": 2980 + }, + { + "epoch": 0.06, + "learning_rate": 1.8861791775076693e-07, + "loss": 0.3225, + "step": 2981 + }, + { + "epoch": 0.06, + "learning_rate": 1.886140344064308e-07, + "loss": 0.3799, + "step": 2982 + }, + { + "epoch": 0.06, + "learning_rate": 1.8861015106209465e-07, + "loss": 0.3943, + "step": 2983 + }, + { + "epoch": 0.06, + "learning_rate": 1.8860626771775852e-07, + "loss": 0.1212, + "step": 2984 + }, + { + "epoch": 0.06, + "learning_rate": 1.8860238437342236e-07, + "loss": 0.1162, + "step": 2985 + }, + { + "epoch": 0.06, + "learning_rate": 1.8859850102908623e-07, + "loss": 0.3709, + "step": 2986 + }, + { + "epoch": 0.06, + "learning_rate": 1.8859461768475008e-07, + "loss": 0.108, + "step": 2987 + }, + { + "epoch": 0.06, + "learning_rate": 1.8859073434041395e-07, + "loss": 0.168, + "step": 2988 + }, + { + "epoch": 0.06, + "learning_rate": 1.885868509960778e-07, + "loss": 0.2576, + "step": 2989 + }, + { + "epoch": 0.06, + "learning_rate": 1.8858296765174167e-07, + "loss": 0.1279, + "step": 2990 + }, + { + "epoch": 0.06, + "learning_rate": 1.885790843074055e-07, + "loss": 0.3338, + "step": 2991 + }, + { + "epoch": 0.06, + "learning_rate": 1.8857520096306938e-07, + "loss": 0.1923, + "step": 2992 + }, + { + "epoch": 0.06, + "learning_rate": 1.8857131761873323e-07, + "loss": 0.118, + "step": 2993 + }, + { + "epoch": 0.06, + "learning_rate": 1.885674342743971e-07, + "loss": 0.1027, + "step": 2994 + }, + { + "epoch": 0.06, + "learning_rate": 1.8856355093006095e-07, + "loss": 0.1532, + "step": 2995 + }, + { + "epoch": 0.06, + "learning_rate": 1.8855966758572482e-07, + "loss": 0.3923, + "step": 2996 + }, + { + "epoch": 0.06, + "learning_rate": 1.8855578424138866e-07, + "loss": 0.1016, + "step": 2997 + }, + { + "epoch": 0.06, + "learning_rate": 1.8855190089705253e-07, + "loss": 0.0925, + "step": 2998 + }, + { + "epoch": 0.06, + "learning_rate": 1.8854801755271638e-07, + "loss": 0.1045, + "step": 2999 + }, + { + "epoch": 0.06, + "learning_rate": 1.8854413420838025e-07, + "loss": 0.7688, + "step": 3000 + }, + { + "epoch": 0.06, + "learning_rate": 1.885402508640441e-07, + "loss": 0.2316, + "step": 3001 + }, + { + "epoch": 0.06, + "learning_rate": 1.8853636751970797e-07, + "loss": 0.4154, + "step": 3002 + }, + { + "epoch": 0.06, + "learning_rate": 1.885324841753718e-07, + "loss": 0.1126, + "step": 3003 + }, + { + "epoch": 0.06, + "learning_rate": 1.8852860083103568e-07, + "loss": 0.0691, + "step": 3004 + }, + { + "epoch": 0.06, + "learning_rate": 1.8852471748669953e-07, + "loss": 0.1416, + "step": 3005 + }, + { + "epoch": 0.06, + "learning_rate": 1.885208341423634e-07, + "loss": 0.19, + "step": 3006 + }, + { + "epoch": 0.06, + "learning_rate": 1.8851695079802724e-07, + "loss": 0.3576, + "step": 3007 + }, + { + "epoch": 0.06, + "learning_rate": 1.8851306745369112e-07, + "loss": 0.4459, + "step": 3008 + }, + { + "epoch": 0.06, + "learning_rate": 1.8850918410935496e-07, + "loss": 0.1282, + "step": 3009 + }, + { + "epoch": 0.06, + "learning_rate": 1.8850530076501883e-07, + "loss": 0.1269, + "step": 3010 + }, + { + "epoch": 0.06, + "learning_rate": 1.8850141742068268e-07, + "loss": 0.313, + "step": 3011 + }, + { + "epoch": 0.06, + "learning_rate": 1.8849753407634655e-07, + "loss": 0.1859, + "step": 3012 + }, + { + "epoch": 0.06, + "learning_rate": 1.884936507320104e-07, + "loss": 0.079, + "step": 3013 + }, + { + "epoch": 0.06, + "learning_rate": 1.8848976738767427e-07, + "loss": 0.1342, + "step": 3014 + }, + { + "epoch": 0.06, + "learning_rate": 1.884858840433381e-07, + "loss": 0.3347, + "step": 3015 + }, + { + "epoch": 0.06, + "learning_rate": 1.8848200069900198e-07, + "loss": 0.1003, + "step": 3016 + }, + { + "epoch": 0.06, + "learning_rate": 1.8847811735466583e-07, + "loss": 0.2421, + "step": 3017 + }, + { + "epoch": 0.06, + "learning_rate": 1.884742340103297e-07, + "loss": 0.1394, + "step": 3018 + }, + { + "epoch": 0.06, + "learning_rate": 1.8847035066599354e-07, + "loss": 0.1479, + "step": 3019 + }, + { + "epoch": 0.06, + "learning_rate": 1.8846646732165741e-07, + "loss": 0.1955, + "step": 3020 + }, + { + "epoch": 0.06, + "learning_rate": 1.8846258397732126e-07, + "loss": 0.2836, + "step": 3021 + }, + { + "epoch": 0.06, + "learning_rate": 1.8845870063298513e-07, + "loss": 0.3213, + "step": 3022 + }, + { + "epoch": 0.06, + "learning_rate": 1.8845481728864898e-07, + "loss": 0.2401, + "step": 3023 + }, + { + "epoch": 0.06, + "learning_rate": 1.8845093394431285e-07, + "loss": 0.1514, + "step": 3024 + }, + { + "epoch": 0.06, + "learning_rate": 1.884470505999767e-07, + "loss": 0.1449, + "step": 3025 + }, + { + "epoch": 0.06, + "learning_rate": 1.8844316725564056e-07, + "loss": 0.3272, + "step": 3026 + }, + { + "epoch": 0.06, + "learning_rate": 1.884392839113044e-07, + "loss": 0.1776, + "step": 3027 + }, + { + "epoch": 0.06, + "learning_rate": 1.8843540056696828e-07, + "loss": 0.0686, + "step": 3028 + }, + { + "epoch": 0.06, + "learning_rate": 1.8843151722263213e-07, + "loss": 0.3128, + "step": 3029 + }, + { + "epoch": 0.06, + "learning_rate": 1.88427633878296e-07, + "loss": 0.3259, + "step": 3030 + }, + { + "epoch": 0.06, + "learning_rate": 1.8842375053395984e-07, + "loss": 0.0957, + "step": 3031 + }, + { + "epoch": 0.06, + "learning_rate": 1.8841986718962371e-07, + "loss": 0.1353, + "step": 3032 + }, + { + "epoch": 0.06, + "learning_rate": 1.8841598384528756e-07, + "loss": 0.1181, + "step": 3033 + }, + { + "epoch": 0.06, + "learning_rate": 1.8841210050095143e-07, + "loss": 0.0874, + "step": 3034 + }, + { + "epoch": 0.06, + "learning_rate": 1.8840821715661528e-07, + "loss": 0.0704, + "step": 3035 + }, + { + "epoch": 0.06, + "learning_rate": 1.8840433381227915e-07, + "loss": 0.1904, + "step": 3036 + }, + { + "epoch": 0.06, + "learning_rate": 1.8840045046794297e-07, + "loss": 0.389, + "step": 3037 + }, + { + "epoch": 0.06, + "learning_rate": 1.8839656712360684e-07, + "loss": 0.2212, + "step": 3038 + }, + { + "epoch": 0.06, + "learning_rate": 1.8839268377927068e-07, + "loss": 0.118, + "step": 3039 + }, + { + "epoch": 0.06, + "learning_rate": 1.8838880043493455e-07, + "loss": 0.3867, + "step": 3040 + }, + { + "epoch": 0.06, + "learning_rate": 1.883849170905984e-07, + "loss": 0.1094, + "step": 3041 + }, + { + "epoch": 0.06, + "learning_rate": 1.8838103374626227e-07, + "loss": 0.0842, + "step": 3042 + }, + { + "epoch": 0.06, + "learning_rate": 1.8837715040192611e-07, + "loss": 0.4206, + "step": 3043 + }, + { + "epoch": 0.06, + "learning_rate": 1.8837326705758999e-07, + "loss": 0.0766, + "step": 3044 + }, + { + "epoch": 0.06, + "learning_rate": 1.8836938371325383e-07, + "loss": 0.2034, + "step": 3045 + }, + { + "epoch": 0.06, + "learning_rate": 1.883655003689177e-07, + "loss": 0.2908, + "step": 3046 + }, + { + "epoch": 0.06, + "learning_rate": 1.8836161702458155e-07, + "loss": 0.3439, + "step": 3047 + }, + { + "epoch": 0.06, + "learning_rate": 1.8835773368024542e-07, + "loss": 0.0766, + "step": 3048 + }, + { + "epoch": 0.06, + "learning_rate": 1.8835385033590926e-07, + "loss": 0.1085, + "step": 3049 + }, + { + "epoch": 0.06, + "learning_rate": 1.8834996699157314e-07, + "loss": 0.2548, + "step": 3050 + }, + { + "epoch": 0.06, + "learning_rate": 1.8834608364723698e-07, + "loss": 0.2557, + "step": 3051 + }, + { + "epoch": 0.06, + "learning_rate": 1.8834220030290085e-07, + "loss": 0.5004, + "step": 3052 + }, + { + "epoch": 0.06, + "learning_rate": 1.883383169585647e-07, + "loss": 0.2176, + "step": 3053 + }, + { + "epoch": 0.06, + "learning_rate": 1.8833443361422857e-07, + "loss": 0.1399, + "step": 3054 + }, + { + "epoch": 0.06, + "learning_rate": 1.8833055026989241e-07, + "loss": 0.1375, + "step": 3055 + }, + { + "epoch": 0.06, + "learning_rate": 1.8832666692555629e-07, + "loss": 0.105, + "step": 3056 + }, + { + "epoch": 0.06, + "learning_rate": 1.8832278358122013e-07, + "loss": 0.0908, + "step": 3057 + }, + { + "epoch": 0.06, + "learning_rate": 1.88318900236884e-07, + "loss": 0.1602, + "step": 3058 + }, + { + "epoch": 0.06, + "learning_rate": 1.8831501689254785e-07, + "loss": 0.2304, + "step": 3059 + }, + { + "epoch": 0.06, + "learning_rate": 1.8831113354821172e-07, + "loss": 0.2533, + "step": 3060 + }, + { + "epoch": 0.06, + "learning_rate": 1.8830725020387556e-07, + "loss": 0.5064, + "step": 3061 + }, + { + "epoch": 0.06, + "learning_rate": 1.8830336685953943e-07, + "loss": 0.1609, + "step": 3062 + }, + { + "epoch": 0.06, + "learning_rate": 1.8829948351520328e-07, + "loss": 0.1482, + "step": 3063 + }, + { + "epoch": 0.06, + "learning_rate": 1.8829560017086715e-07, + "loss": 0.1193, + "step": 3064 + }, + { + "epoch": 0.06, + "learning_rate": 1.88291716826531e-07, + "loss": 0.1756, + "step": 3065 + }, + { + "epoch": 0.06, + "learning_rate": 1.8828783348219487e-07, + "loss": 0.0826, + "step": 3066 + }, + { + "epoch": 0.06, + "learning_rate": 1.882839501378587e-07, + "loss": 0.193, + "step": 3067 + }, + { + "epoch": 0.06, + "learning_rate": 1.8828006679352258e-07, + "loss": 0.1359, + "step": 3068 + }, + { + "epoch": 0.06, + "learning_rate": 1.8827618344918643e-07, + "loss": 0.2907, + "step": 3069 + }, + { + "epoch": 0.06, + "learning_rate": 1.882723001048503e-07, + "loss": 0.0713, + "step": 3070 + }, + { + "epoch": 0.06, + "learning_rate": 1.8826841676051415e-07, + "loss": 0.23, + "step": 3071 + }, + { + "epoch": 0.06, + "learning_rate": 1.8826453341617802e-07, + "loss": 0.1043, + "step": 3072 + }, + { + "epoch": 0.06, + "learning_rate": 1.8826065007184186e-07, + "loss": 0.1384, + "step": 3073 + }, + { + "epoch": 0.06, + "learning_rate": 1.8825676672750573e-07, + "loss": 0.4132, + "step": 3074 + }, + { + "epoch": 0.06, + "learning_rate": 1.8825288338316958e-07, + "loss": 0.2896, + "step": 3075 + }, + { + "epoch": 0.06, + "learning_rate": 1.8824900003883345e-07, + "loss": 0.3434, + "step": 3076 + }, + { + "epoch": 0.06, + "learning_rate": 1.882451166944973e-07, + "loss": 0.4388, + "step": 3077 + }, + { + "epoch": 0.06, + "learning_rate": 1.8824123335016117e-07, + "loss": 0.1011, + "step": 3078 + }, + { + "epoch": 0.06, + "learning_rate": 1.88237350005825e-07, + "loss": 0.0898, + "step": 3079 + }, + { + "epoch": 0.06, + "learning_rate": 1.8823346666148888e-07, + "loss": 0.1012, + "step": 3080 + }, + { + "epoch": 0.06, + "learning_rate": 1.8822958331715273e-07, + "loss": 0.083, + "step": 3081 + }, + { + "epoch": 0.06, + "learning_rate": 1.882256999728166e-07, + "loss": 0.0974, + "step": 3082 + }, + { + "epoch": 0.06, + "learning_rate": 1.8822181662848044e-07, + "loss": 0.2261, + "step": 3083 + }, + { + "epoch": 0.06, + "learning_rate": 1.8821793328414432e-07, + "loss": 0.2631, + "step": 3084 + }, + { + "epoch": 0.06, + "learning_rate": 1.8821404993980816e-07, + "loss": 0.223, + "step": 3085 + }, + { + "epoch": 0.06, + "learning_rate": 1.8821016659547203e-07, + "loss": 0.118, + "step": 3086 + }, + { + "epoch": 0.06, + "learning_rate": 1.8820628325113588e-07, + "loss": 0.3796, + "step": 3087 + }, + { + "epoch": 0.06, + "learning_rate": 1.8820239990679975e-07, + "loss": 0.3296, + "step": 3088 + }, + { + "epoch": 0.06, + "learning_rate": 1.881985165624636e-07, + "loss": 0.1453, + "step": 3089 + }, + { + "epoch": 0.06, + "learning_rate": 1.8819463321812744e-07, + "loss": 0.0885, + "step": 3090 + }, + { + "epoch": 0.06, + "learning_rate": 1.881907498737913e-07, + "loss": 0.1879, + "step": 3091 + }, + { + "epoch": 0.06, + "learning_rate": 1.8818686652945516e-07, + "loss": 0.2683, + "step": 3092 + }, + { + "epoch": 0.06, + "learning_rate": 1.8818298318511903e-07, + "loss": 0.1004, + "step": 3093 + }, + { + "epoch": 0.06, + "learning_rate": 1.8817909984078287e-07, + "loss": 0.5719, + "step": 3094 + }, + { + "epoch": 0.06, + "learning_rate": 1.8817521649644672e-07, + "loss": 0.2544, + "step": 3095 + }, + { + "epoch": 0.06, + "learning_rate": 1.881713331521106e-07, + "loss": 0.1556, + "step": 3096 + }, + { + "epoch": 0.06, + "learning_rate": 1.8816744980777443e-07, + "loss": 0.4712, + "step": 3097 + }, + { + "epoch": 0.06, + "learning_rate": 1.881635664634383e-07, + "loss": 0.1095, + "step": 3098 + }, + { + "epoch": 0.06, + "learning_rate": 1.8815968311910215e-07, + "loss": 0.6021, + "step": 3099 + }, + { + "epoch": 0.06, + "learning_rate": 1.8815579977476602e-07, + "loss": 0.0952, + "step": 3100 + }, + { + "epoch": 0.06, + "learning_rate": 1.8815191643042987e-07, + "loss": 0.1982, + "step": 3101 + }, + { + "epoch": 0.06, + "learning_rate": 1.8814803308609374e-07, + "loss": 0.5736, + "step": 3102 + }, + { + "epoch": 0.06, + "learning_rate": 1.8814414974175758e-07, + "loss": 0.1327, + "step": 3103 + }, + { + "epoch": 0.06, + "learning_rate": 1.8814026639742145e-07, + "loss": 0.0939, + "step": 3104 + }, + { + "epoch": 0.06, + "learning_rate": 1.881363830530853e-07, + "loss": 0.3941, + "step": 3105 + }, + { + "epoch": 0.06, + "learning_rate": 1.8813249970874917e-07, + "loss": 0.1068, + "step": 3106 + }, + { + "epoch": 0.06, + "learning_rate": 1.8812861636441302e-07, + "loss": 0.115, + "step": 3107 + }, + { + "epoch": 0.06, + "learning_rate": 1.881247330200769e-07, + "loss": 0.1925, + "step": 3108 + }, + { + "epoch": 0.06, + "learning_rate": 1.8812084967574073e-07, + "loss": 0.1829, + "step": 3109 + }, + { + "epoch": 0.06, + "learning_rate": 1.881169663314046e-07, + "loss": 0.1459, + "step": 3110 + }, + { + "epoch": 0.06, + "learning_rate": 1.8811308298706845e-07, + "loss": 0.0873, + "step": 3111 + }, + { + "epoch": 0.06, + "learning_rate": 1.8810919964273232e-07, + "loss": 0.3023, + "step": 3112 + }, + { + "epoch": 0.06, + "learning_rate": 1.8810531629839617e-07, + "loss": 0.104, + "step": 3113 + }, + { + "epoch": 0.06, + "learning_rate": 1.8810143295406004e-07, + "loss": 0.1072, + "step": 3114 + }, + { + "epoch": 0.06, + "learning_rate": 1.8809754960972388e-07, + "loss": 0.2681, + "step": 3115 + }, + { + "epoch": 0.06, + "learning_rate": 1.8809366626538775e-07, + "loss": 0.5631, + "step": 3116 + }, + { + "epoch": 0.06, + "learning_rate": 1.880897829210516e-07, + "loss": 0.0967, + "step": 3117 + }, + { + "epoch": 0.06, + "learning_rate": 1.8808589957671544e-07, + "loss": 0.1946, + "step": 3118 + }, + { + "epoch": 0.06, + "learning_rate": 1.8808201623237931e-07, + "loss": 0.1119, + "step": 3119 + }, + { + "epoch": 0.06, + "learning_rate": 1.8807813288804316e-07, + "loss": 0.0937, + "step": 3120 + }, + { + "epoch": 0.06, + "learning_rate": 1.8807424954370703e-07, + "loss": 0.0683, + "step": 3121 + }, + { + "epoch": 0.06, + "learning_rate": 1.8807036619937088e-07, + "loss": 0.1645, + "step": 3122 + }, + { + "epoch": 0.06, + "learning_rate": 1.8806648285503475e-07, + "loss": 0.4883, + "step": 3123 + }, + { + "epoch": 0.06, + "learning_rate": 1.880625995106986e-07, + "loss": 0.0929, + "step": 3124 + }, + { + "epoch": 0.06, + "learning_rate": 1.8805871616636246e-07, + "loss": 0.0815, + "step": 3125 + }, + { + "epoch": 0.06, + "learning_rate": 1.880548328220263e-07, + "loss": 0.1325, + "step": 3126 + }, + { + "epoch": 0.06, + "learning_rate": 1.8805094947769018e-07, + "loss": 0.1196, + "step": 3127 + }, + { + "epoch": 0.06, + "learning_rate": 1.8804706613335403e-07, + "loss": 0.133, + "step": 3128 + }, + { + "epoch": 0.06, + "learning_rate": 1.880431827890179e-07, + "loss": 0.3177, + "step": 3129 + }, + { + "epoch": 0.06, + "learning_rate": 1.8803929944468174e-07, + "loss": 0.0977, + "step": 3130 + }, + { + "epoch": 0.06, + "learning_rate": 1.8803541610034561e-07, + "loss": 0.2323, + "step": 3131 + }, + { + "epoch": 0.06, + "learning_rate": 1.8803153275600946e-07, + "loss": 0.466, + "step": 3132 + }, + { + "epoch": 0.06, + "learning_rate": 1.8802764941167333e-07, + "loss": 0.0829, + "step": 3133 + }, + { + "epoch": 0.06, + "learning_rate": 1.8802376606733718e-07, + "loss": 0.298, + "step": 3134 + }, + { + "epoch": 0.06, + "learning_rate": 1.8801988272300105e-07, + "loss": 0.1916, + "step": 3135 + }, + { + "epoch": 0.06, + "learning_rate": 1.880159993786649e-07, + "loss": 0.1371, + "step": 3136 + }, + { + "epoch": 0.06, + "learning_rate": 1.8801211603432876e-07, + "loss": 0.1473, + "step": 3137 + }, + { + "epoch": 0.06, + "learning_rate": 1.880082326899926e-07, + "loss": 0.0778, + "step": 3138 + }, + { + "epoch": 0.06, + "learning_rate": 1.8800434934565648e-07, + "loss": 0.1443, + "step": 3139 + }, + { + "epoch": 0.06, + "learning_rate": 1.8800046600132032e-07, + "loss": 0.3117, + "step": 3140 + }, + { + "epoch": 0.06, + "learning_rate": 1.879965826569842e-07, + "loss": 0.0749, + "step": 3141 + }, + { + "epoch": 0.06, + "learning_rate": 1.8799269931264804e-07, + "loss": 0.0728, + "step": 3142 + }, + { + "epoch": 0.06, + "learning_rate": 1.879888159683119e-07, + "loss": 0.4896, + "step": 3143 + }, + { + "epoch": 0.06, + "learning_rate": 1.8798493262397576e-07, + "loss": 0.4375, + "step": 3144 + }, + { + "epoch": 0.06, + "learning_rate": 1.8798104927963963e-07, + "loss": 0.1481, + "step": 3145 + }, + { + "epoch": 0.06, + "learning_rate": 1.8797716593530347e-07, + "loss": 0.1587, + "step": 3146 + }, + { + "epoch": 0.06, + "learning_rate": 1.8797328259096735e-07, + "loss": 0.0649, + "step": 3147 + }, + { + "epoch": 0.06, + "learning_rate": 1.879693992466312e-07, + "loss": 0.1101, + "step": 3148 + }, + { + "epoch": 0.06, + "learning_rate": 1.8796551590229506e-07, + "loss": 0.1076, + "step": 3149 + }, + { + "epoch": 0.06, + "learning_rate": 1.879616325579589e-07, + "loss": 0.1147, + "step": 3150 + }, + { + "epoch": 0.06, + "learning_rate": 1.8795774921362278e-07, + "loss": 0.4988, + "step": 3151 + }, + { + "epoch": 0.06, + "learning_rate": 1.8795386586928662e-07, + "loss": 0.1557, + "step": 3152 + }, + { + "epoch": 0.06, + "learning_rate": 1.8794998252495047e-07, + "loss": 0.094, + "step": 3153 + }, + { + "epoch": 0.06, + "learning_rate": 1.8794609918061431e-07, + "loss": 0.0937, + "step": 3154 + }, + { + "epoch": 0.06, + "learning_rate": 1.8794221583627819e-07, + "loss": 0.2896, + "step": 3155 + }, + { + "epoch": 0.06, + "learning_rate": 1.8793833249194203e-07, + "loss": 0.1063, + "step": 3156 + }, + { + "epoch": 0.06, + "learning_rate": 1.879344491476059e-07, + "loss": 0.1266, + "step": 3157 + }, + { + "epoch": 0.06, + "learning_rate": 1.8793056580326975e-07, + "loss": 0.0929, + "step": 3158 + }, + { + "epoch": 0.06, + "learning_rate": 1.8792668245893362e-07, + "loss": 0.0909, + "step": 3159 + }, + { + "epoch": 0.06, + "learning_rate": 1.8792279911459746e-07, + "loss": 0.2363, + "step": 3160 + }, + { + "epoch": 0.06, + "learning_rate": 1.8791891577026133e-07, + "loss": 0.1298, + "step": 3161 + }, + { + "epoch": 0.06, + "learning_rate": 1.8791503242592518e-07, + "loss": 0.193, + "step": 3162 + }, + { + "epoch": 0.06, + "learning_rate": 1.8791114908158905e-07, + "loss": 0.0798, + "step": 3163 + }, + { + "epoch": 0.06, + "learning_rate": 1.879072657372529e-07, + "loss": 0.1053, + "step": 3164 + }, + { + "epoch": 0.06, + "learning_rate": 1.8790338239291677e-07, + "loss": 0.1962, + "step": 3165 + }, + { + "epoch": 0.06, + "learning_rate": 1.878994990485806e-07, + "loss": 0.1833, + "step": 3166 + }, + { + "epoch": 0.06, + "learning_rate": 1.8789561570424448e-07, + "loss": 0.1096, + "step": 3167 + }, + { + "epoch": 0.06, + "learning_rate": 1.8789173235990833e-07, + "loss": 0.2051, + "step": 3168 + }, + { + "epoch": 0.06, + "learning_rate": 1.878878490155722e-07, + "loss": 0.1741, + "step": 3169 + }, + { + "epoch": 0.06, + "learning_rate": 1.8788396567123605e-07, + "loss": 0.2122, + "step": 3170 + }, + { + "epoch": 0.06, + "learning_rate": 1.8788008232689992e-07, + "loss": 0.2212, + "step": 3171 + }, + { + "epoch": 0.06, + "learning_rate": 1.8787619898256376e-07, + "loss": 0.1053, + "step": 3172 + }, + { + "epoch": 0.06, + "learning_rate": 1.8787231563822763e-07, + "loss": 0.1552, + "step": 3173 + }, + { + "epoch": 0.06, + "learning_rate": 1.8786843229389148e-07, + "loss": 0.0895, + "step": 3174 + }, + { + "epoch": 0.06, + "learning_rate": 1.8786454894955535e-07, + "loss": 0.4573, + "step": 3175 + }, + { + "epoch": 0.06, + "learning_rate": 1.878606656052192e-07, + "loss": 0.095, + "step": 3176 + }, + { + "epoch": 0.06, + "learning_rate": 1.8785678226088307e-07, + "loss": 0.0923, + "step": 3177 + }, + { + "epoch": 0.06, + "learning_rate": 1.878528989165469e-07, + "loss": 0.0789, + "step": 3178 + }, + { + "epoch": 0.06, + "learning_rate": 1.8784901557221078e-07, + "loss": 0.1388, + "step": 3179 + }, + { + "epoch": 0.06, + "learning_rate": 1.8784513222787463e-07, + "loss": 0.2813, + "step": 3180 + }, + { + "epoch": 0.06, + "learning_rate": 1.878412488835385e-07, + "loss": 0.0858, + "step": 3181 + }, + { + "epoch": 0.06, + "learning_rate": 1.8783736553920234e-07, + "loss": 0.0641, + "step": 3182 + }, + { + "epoch": 0.06, + "learning_rate": 1.8783348219486622e-07, + "loss": 0.3844, + "step": 3183 + }, + { + "epoch": 0.06, + "learning_rate": 1.8782959885053006e-07, + "loss": 0.2071, + "step": 3184 + }, + { + "epoch": 0.06, + "learning_rate": 1.8782571550619393e-07, + "loss": 0.0912, + "step": 3185 + }, + { + "epoch": 0.06, + "learning_rate": 1.8782183216185778e-07, + "loss": 0.1107, + "step": 3186 + }, + { + "epoch": 0.06, + "learning_rate": 1.8781794881752165e-07, + "loss": 0.2358, + "step": 3187 + }, + { + "epoch": 0.06, + "learning_rate": 1.878140654731855e-07, + "loss": 0.5258, + "step": 3188 + }, + { + "epoch": 0.06, + "learning_rate": 1.8781018212884937e-07, + "loss": 0.2658, + "step": 3189 + }, + { + "epoch": 0.06, + "learning_rate": 1.878062987845132e-07, + "loss": 0.2975, + "step": 3190 + }, + { + "epoch": 0.06, + "learning_rate": 1.8780241544017708e-07, + "loss": 0.1324, + "step": 3191 + }, + { + "epoch": 0.06, + "learning_rate": 1.8779853209584093e-07, + "loss": 0.1968, + "step": 3192 + }, + { + "epoch": 0.06, + "learning_rate": 1.877946487515048e-07, + "loss": 0.2722, + "step": 3193 + }, + { + "epoch": 0.06, + "learning_rate": 1.8779076540716864e-07, + "loss": 0.1557, + "step": 3194 + }, + { + "epoch": 0.06, + "learning_rate": 1.8778688206283252e-07, + "loss": 0.0929, + "step": 3195 + }, + { + "epoch": 0.06, + "learning_rate": 1.8778299871849636e-07, + "loss": 0.3466, + "step": 3196 + }, + { + "epoch": 0.06, + "learning_rate": 1.8777911537416023e-07, + "loss": 0.0896, + "step": 3197 + }, + { + "epoch": 0.06, + "learning_rate": 1.8777523202982408e-07, + "loss": 0.0756, + "step": 3198 + }, + { + "epoch": 0.06, + "learning_rate": 1.8777134868548795e-07, + "loss": 0.1055, + "step": 3199 + }, + { + "epoch": 0.06, + "learning_rate": 1.877674653411518e-07, + "loss": 0.0789, + "step": 3200 + }, + { + "epoch": 0.06, + "learning_rate": 1.8776358199681566e-07, + "loss": 0.1519, + "step": 3201 + }, + { + "epoch": 0.06, + "learning_rate": 1.877596986524795e-07, + "loss": 0.0724, + "step": 3202 + }, + { + "epoch": 0.06, + "learning_rate": 1.8775581530814338e-07, + "loss": 0.0812, + "step": 3203 + }, + { + "epoch": 0.06, + "learning_rate": 1.8775193196380723e-07, + "loss": 0.3179, + "step": 3204 + }, + { + "epoch": 0.06, + "learning_rate": 1.877480486194711e-07, + "loss": 0.2049, + "step": 3205 + }, + { + "epoch": 0.06, + "learning_rate": 1.8774416527513494e-07, + "loss": 0.411, + "step": 3206 + }, + { + "epoch": 0.06, + "learning_rate": 1.8774028193079881e-07, + "loss": 0.2282, + "step": 3207 + }, + { + "epoch": 0.06, + "learning_rate": 1.8773639858646266e-07, + "loss": 0.3989, + "step": 3208 + }, + { + "epoch": 0.06, + "learning_rate": 1.8773251524212653e-07, + "loss": 0.0765, + "step": 3209 + }, + { + "epoch": 0.06, + "learning_rate": 1.8772863189779038e-07, + "loss": 0.0905, + "step": 3210 + }, + { + "epoch": 0.06, + "learning_rate": 1.8772474855345422e-07, + "loss": 0.0707, + "step": 3211 + }, + { + "epoch": 0.06, + "learning_rate": 1.8772086520911807e-07, + "loss": 0.1121, + "step": 3212 + }, + { + "epoch": 0.06, + "learning_rate": 1.8771698186478194e-07, + "loss": 0.2812, + "step": 3213 + }, + { + "epoch": 0.06, + "learning_rate": 1.8771309852044578e-07, + "loss": 0.0828, + "step": 3214 + }, + { + "epoch": 0.06, + "learning_rate": 1.8770921517610965e-07, + "loss": 0.1205, + "step": 3215 + }, + { + "epoch": 0.06, + "learning_rate": 1.877053318317735e-07, + "loss": 0.2535, + "step": 3216 + }, + { + "epoch": 0.06, + "learning_rate": 1.8770144848743737e-07, + "loss": 0.0992, + "step": 3217 + }, + { + "epoch": 0.06, + "learning_rate": 1.8769756514310121e-07, + "loss": 0.2881, + "step": 3218 + }, + { + "epoch": 0.06, + "learning_rate": 1.8769368179876509e-07, + "loss": 0.1521, + "step": 3219 + }, + { + "epoch": 0.06, + "learning_rate": 1.8768979845442893e-07, + "loss": 0.1334, + "step": 3220 + }, + { + "epoch": 0.06, + "learning_rate": 1.876859151100928e-07, + "loss": 0.1535, + "step": 3221 + }, + { + "epoch": 0.06, + "learning_rate": 1.8768203176575665e-07, + "loss": 0.3093, + "step": 3222 + }, + { + "epoch": 0.06, + "learning_rate": 1.8767814842142052e-07, + "loss": 0.2888, + "step": 3223 + }, + { + "epoch": 0.06, + "learning_rate": 1.8767426507708436e-07, + "loss": 0.1063, + "step": 3224 + }, + { + "epoch": 0.06, + "learning_rate": 1.8767038173274824e-07, + "loss": 0.2347, + "step": 3225 + }, + { + "epoch": 0.06, + "learning_rate": 1.8766649838841208e-07, + "loss": 0.0635, + "step": 3226 + }, + { + "epoch": 0.06, + "learning_rate": 1.8766261504407595e-07, + "loss": 0.168, + "step": 3227 + }, + { + "epoch": 0.06, + "learning_rate": 1.876587316997398e-07, + "loss": 0.2388, + "step": 3228 + }, + { + "epoch": 0.06, + "learning_rate": 1.8765484835540367e-07, + "loss": 0.1397, + "step": 3229 + }, + { + "epoch": 0.06, + "learning_rate": 1.8765096501106751e-07, + "loss": 0.1368, + "step": 3230 + }, + { + "epoch": 0.06, + "learning_rate": 1.8764708166673139e-07, + "loss": 0.062, + "step": 3231 + }, + { + "epoch": 0.06, + "learning_rate": 1.8764319832239523e-07, + "loss": 0.1082, + "step": 3232 + }, + { + "epoch": 0.06, + "learning_rate": 1.876393149780591e-07, + "loss": 0.1448, + "step": 3233 + }, + { + "epoch": 0.06, + "learning_rate": 1.8763543163372295e-07, + "loss": 0.1929, + "step": 3234 + }, + { + "epoch": 0.06, + "learning_rate": 1.8763154828938682e-07, + "loss": 0.127, + "step": 3235 + }, + { + "epoch": 0.06, + "learning_rate": 1.8762766494505066e-07, + "loss": 0.3802, + "step": 3236 + }, + { + "epoch": 0.06, + "learning_rate": 1.8762378160071453e-07, + "loss": 0.1154, + "step": 3237 + }, + { + "epoch": 0.06, + "learning_rate": 1.8761989825637838e-07, + "loss": 0.0815, + "step": 3238 + }, + { + "epoch": 0.06, + "learning_rate": 1.8761601491204225e-07, + "loss": 0.1805, + "step": 3239 + }, + { + "epoch": 0.06, + "learning_rate": 1.876121315677061e-07, + "loss": 0.4075, + "step": 3240 + }, + { + "epoch": 0.06, + "learning_rate": 1.8760824822336997e-07, + "loss": 0.1249, + "step": 3241 + }, + { + "epoch": 0.06, + "learning_rate": 1.876043648790338e-07, + "loss": 0.0713, + "step": 3242 + }, + { + "epoch": 0.06, + "learning_rate": 1.8760048153469768e-07, + "loss": 0.1286, + "step": 3243 + }, + { + "epoch": 0.06, + "learning_rate": 1.8759659819036153e-07, + "loss": 0.3401, + "step": 3244 + }, + { + "epoch": 0.06, + "learning_rate": 1.875927148460254e-07, + "loss": 0.4296, + "step": 3245 + }, + { + "epoch": 0.06, + "learning_rate": 1.8758883150168925e-07, + "loss": 0.2302, + "step": 3246 + }, + { + "epoch": 0.06, + "learning_rate": 1.8758494815735312e-07, + "loss": 0.585, + "step": 3247 + }, + { + "epoch": 0.06, + "learning_rate": 1.8758106481301696e-07, + "loss": 0.2177, + "step": 3248 + }, + { + "epoch": 0.06, + "learning_rate": 1.8757718146868083e-07, + "loss": 0.5155, + "step": 3249 + }, + { + "epoch": 0.06, + "learning_rate": 1.8757329812434468e-07, + "loss": 0.068, + "step": 3250 + }, + { + "epoch": 0.06, + "learning_rate": 1.8756941478000855e-07, + "loss": 0.129, + "step": 3251 + }, + { + "epoch": 0.06, + "learning_rate": 1.875655314356724e-07, + "loss": 0.1142, + "step": 3252 + }, + { + "epoch": 0.06, + "learning_rate": 1.8756164809133627e-07, + "loss": 0.0728, + "step": 3253 + }, + { + "epoch": 0.06, + "learning_rate": 1.875577647470001e-07, + "loss": 0.2538, + "step": 3254 + }, + { + "epoch": 0.06, + "learning_rate": 1.8755388140266398e-07, + "loss": 0.2616, + "step": 3255 + }, + { + "epoch": 0.06, + "learning_rate": 1.8754999805832783e-07, + "loss": 0.1015, + "step": 3256 + }, + { + "epoch": 0.06, + "learning_rate": 1.875461147139917e-07, + "loss": 0.0872, + "step": 3257 + }, + { + "epoch": 0.06, + "learning_rate": 1.8754223136965554e-07, + "loss": 0.0686, + "step": 3258 + }, + { + "epoch": 0.06, + "learning_rate": 1.8753834802531942e-07, + "loss": 0.2832, + "step": 3259 + }, + { + "epoch": 0.06, + "learning_rate": 1.8753446468098326e-07, + "loss": 0.2518, + "step": 3260 + }, + { + "epoch": 0.06, + "learning_rate": 1.8753058133664713e-07, + "loss": 0.2768, + "step": 3261 + }, + { + "epoch": 0.06, + "learning_rate": 1.8752669799231098e-07, + "loss": 0.1516, + "step": 3262 + }, + { + "epoch": 0.06, + "learning_rate": 1.8752281464797485e-07, + "loss": 0.2138, + "step": 3263 + }, + { + "epoch": 0.06, + "learning_rate": 1.875189313036387e-07, + "loss": 0.2187, + "step": 3264 + }, + { + "epoch": 0.06, + "learning_rate": 1.8751504795930257e-07, + "loss": 0.1147, + "step": 3265 + }, + { + "epoch": 0.06, + "learning_rate": 1.875111646149664e-07, + "loss": 0.078, + "step": 3266 + }, + { + "epoch": 0.06, + "learning_rate": 1.8750728127063026e-07, + "loss": 0.1509, + "step": 3267 + }, + { + "epoch": 0.06, + "learning_rate": 1.8750339792629413e-07, + "loss": 0.0743, + "step": 3268 + }, + { + "epoch": 0.06, + "learning_rate": 1.8749951458195797e-07, + "loss": 0.0723, + "step": 3269 + }, + { + "epoch": 0.06, + "learning_rate": 1.8749563123762182e-07, + "loss": 0.0694, + "step": 3270 + }, + { + "epoch": 0.06, + "learning_rate": 1.874917478932857e-07, + "loss": 0.3428, + "step": 3271 + }, + { + "epoch": 0.06, + "learning_rate": 1.8748786454894953e-07, + "loss": 0.1249, + "step": 3272 + }, + { + "epoch": 0.06, + "learning_rate": 1.874839812046134e-07, + "loss": 0.0777, + "step": 3273 + }, + { + "epoch": 0.06, + "learning_rate": 1.8748009786027725e-07, + "loss": 0.1994, + "step": 3274 + }, + { + "epoch": 0.06, + "learning_rate": 1.8747621451594112e-07, + "loss": 0.0963, + "step": 3275 + }, + { + "epoch": 0.06, + "learning_rate": 1.8747233117160497e-07, + "loss": 0.066, + "step": 3276 + }, + { + "epoch": 0.06, + "learning_rate": 1.8746844782726884e-07, + "loss": 0.0866, + "step": 3277 + }, + { + "epoch": 0.06, + "learning_rate": 1.8746456448293268e-07, + "loss": 0.061, + "step": 3278 + }, + { + "epoch": 0.06, + "learning_rate": 1.8746068113859655e-07, + "loss": 0.151, + "step": 3279 + }, + { + "epoch": 0.06, + "learning_rate": 1.874567977942604e-07, + "loss": 0.2189, + "step": 3280 + }, + { + "epoch": 0.06, + "learning_rate": 1.8745291444992427e-07, + "loss": 0.1768, + "step": 3281 + }, + { + "epoch": 0.06, + "learning_rate": 1.8744903110558812e-07, + "loss": 0.071, + "step": 3282 + }, + { + "epoch": 0.06, + "learning_rate": 1.87445147761252e-07, + "loss": 0.4664, + "step": 3283 + }, + { + "epoch": 0.06, + "learning_rate": 1.8744126441691583e-07, + "loss": 0.0681, + "step": 3284 + }, + { + "epoch": 0.06, + "learning_rate": 1.874373810725797e-07, + "loss": 0.0581, + "step": 3285 + }, + { + "epoch": 0.06, + "learning_rate": 1.8743349772824355e-07, + "loss": 0.1667, + "step": 3286 + }, + { + "epoch": 0.06, + "learning_rate": 1.8742961438390742e-07, + "loss": 0.078, + "step": 3287 + }, + { + "epoch": 0.06, + "learning_rate": 1.8742573103957127e-07, + "loss": 0.1583, + "step": 3288 + }, + { + "epoch": 0.06, + "learning_rate": 1.8742184769523514e-07, + "loss": 0.0584, + "step": 3289 + }, + { + "epoch": 0.06, + "learning_rate": 1.8741796435089898e-07, + "loss": 0.4857, + "step": 3290 + }, + { + "epoch": 0.06, + "learning_rate": 1.8741408100656285e-07, + "loss": 0.0749, + "step": 3291 + }, + { + "epoch": 0.06, + "learning_rate": 1.874101976622267e-07, + "loss": 0.4819, + "step": 3292 + }, + { + "epoch": 0.06, + "learning_rate": 1.8740631431789057e-07, + "loss": 0.3429, + "step": 3293 + }, + { + "epoch": 0.06, + "learning_rate": 1.8740243097355442e-07, + "loss": 0.3681, + "step": 3294 + }, + { + "epoch": 0.06, + "learning_rate": 1.8739854762921826e-07, + "loss": 0.061, + "step": 3295 + }, + { + "epoch": 0.06, + "learning_rate": 1.8739466428488213e-07, + "loss": 0.1361, + "step": 3296 + }, + { + "epoch": 0.06, + "learning_rate": 1.8739078094054598e-07, + "loss": 0.1636, + "step": 3297 + }, + { + "epoch": 0.06, + "learning_rate": 1.8738689759620985e-07, + "loss": 0.0704, + "step": 3298 + }, + { + "epoch": 0.06, + "learning_rate": 1.873830142518737e-07, + "loss": 0.0984, + "step": 3299 + }, + { + "epoch": 0.06, + "learning_rate": 1.8737913090753756e-07, + "loss": 0.0725, + "step": 3300 + }, + { + "epoch": 0.06, + "learning_rate": 1.873752475632014e-07, + "loss": 0.0622, + "step": 3301 + }, + { + "epoch": 0.06, + "learning_rate": 1.8737136421886528e-07, + "loss": 0.0622, + "step": 3302 + }, + { + "epoch": 0.06, + "learning_rate": 1.8736748087452913e-07, + "loss": 0.1184, + "step": 3303 + }, + { + "epoch": 0.06, + "learning_rate": 1.87363597530193e-07, + "loss": 0.0836, + "step": 3304 + }, + { + "epoch": 0.06, + "learning_rate": 1.8735971418585684e-07, + "loss": 0.1036, + "step": 3305 + }, + { + "epoch": 0.06, + "learning_rate": 1.8735583084152071e-07, + "loss": 0.2913, + "step": 3306 + }, + { + "epoch": 0.06, + "learning_rate": 1.8735194749718456e-07, + "loss": 0.2999, + "step": 3307 + }, + { + "epoch": 0.06, + "learning_rate": 1.8734806415284843e-07, + "loss": 0.0851, + "step": 3308 + }, + { + "epoch": 0.06, + "learning_rate": 1.8734418080851228e-07, + "loss": 0.1978, + "step": 3309 + }, + { + "epoch": 0.06, + "learning_rate": 1.8734029746417615e-07, + "loss": 0.0618, + "step": 3310 + }, + { + "epoch": 0.06, + "learning_rate": 1.8733641411984e-07, + "loss": 0.0645, + "step": 3311 + }, + { + "epoch": 0.06, + "learning_rate": 1.8733253077550386e-07, + "loss": 0.1252, + "step": 3312 + }, + { + "epoch": 0.06, + "learning_rate": 1.873286474311677e-07, + "loss": 0.1035, + "step": 3313 + }, + { + "epoch": 0.06, + "learning_rate": 1.8732476408683158e-07, + "loss": 0.319, + "step": 3314 + }, + { + "epoch": 0.06, + "learning_rate": 1.8732088074249542e-07, + "loss": 0.1318, + "step": 3315 + }, + { + "epoch": 0.06, + "learning_rate": 1.873169973981593e-07, + "loss": 0.4282, + "step": 3316 + }, + { + "epoch": 0.06, + "learning_rate": 1.8731311405382314e-07, + "loss": 0.0858, + "step": 3317 + }, + { + "epoch": 0.06, + "learning_rate": 1.87309230709487e-07, + "loss": 0.5269, + "step": 3318 + }, + { + "epoch": 0.06, + "learning_rate": 1.8730534736515086e-07, + "loss": 0.1485, + "step": 3319 + }, + { + "epoch": 0.06, + "learning_rate": 1.8730146402081473e-07, + "loss": 0.395, + "step": 3320 + }, + { + "epoch": 0.06, + "learning_rate": 1.8729758067647857e-07, + "loss": 0.0757, + "step": 3321 + }, + { + "epoch": 0.06, + "learning_rate": 1.8729369733214245e-07, + "loss": 0.2004, + "step": 3322 + }, + { + "epoch": 0.06, + "learning_rate": 1.872898139878063e-07, + "loss": 0.1329, + "step": 3323 + }, + { + "epoch": 0.06, + "learning_rate": 1.8728593064347016e-07, + "loss": 0.1711, + "step": 3324 + }, + { + "epoch": 0.06, + "learning_rate": 1.87282047299134e-07, + "loss": 0.116, + "step": 3325 + }, + { + "epoch": 0.06, + "learning_rate": 1.8727816395479788e-07, + "loss": 0.593, + "step": 3326 + }, + { + "epoch": 0.06, + "learning_rate": 1.872742806104617e-07, + "loss": 0.1308, + "step": 3327 + }, + { + "epoch": 0.06, + "learning_rate": 1.8727039726612557e-07, + "loss": 0.1408, + "step": 3328 + }, + { + "epoch": 0.06, + "learning_rate": 1.8726651392178941e-07, + "loss": 0.1086, + "step": 3329 + }, + { + "epoch": 0.06, + "learning_rate": 1.8726263057745329e-07, + "loss": 0.1001, + "step": 3330 + }, + { + "epoch": 0.06, + "learning_rate": 1.8725874723311713e-07, + "loss": 0.3113, + "step": 3331 + }, + { + "epoch": 0.06, + "learning_rate": 1.87254863888781e-07, + "loss": 0.0881, + "step": 3332 + }, + { + "epoch": 0.06, + "learning_rate": 1.8725098054444485e-07, + "loss": 0.0677, + "step": 3333 + }, + { + "epoch": 0.06, + "learning_rate": 1.8724709720010872e-07, + "loss": 0.2823, + "step": 3334 + }, + { + "epoch": 0.06, + "learning_rate": 1.8724321385577256e-07, + "loss": 0.1154, + "step": 3335 + }, + { + "epoch": 0.06, + "learning_rate": 1.8723933051143643e-07, + "loss": 0.3386, + "step": 3336 + }, + { + "epoch": 0.06, + "learning_rate": 1.8723544716710028e-07, + "loss": 0.1164, + "step": 3337 + }, + { + "epoch": 0.06, + "learning_rate": 1.8723156382276415e-07, + "loss": 0.1746, + "step": 3338 + }, + { + "epoch": 0.06, + "learning_rate": 1.87227680478428e-07, + "loss": 0.1086, + "step": 3339 + }, + { + "epoch": 0.06, + "learning_rate": 1.8722379713409187e-07, + "loss": 0.0553, + "step": 3340 + }, + { + "epoch": 0.06, + "learning_rate": 1.872199137897557e-07, + "loss": 0.316, + "step": 3341 + }, + { + "epoch": 0.06, + "learning_rate": 1.8721603044541958e-07, + "loss": 0.2806, + "step": 3342 + }, + { + "epoch": 0.06, + "learning_rate": 1.8721214710108343e-07, + "loss": 0.1125, + "step": 3343 + }, + { + "epoch": 0.06, + "learning_rate": 1.872082637567473e-07, + "loss": 0.1555, + "step": 3344 + }, + { + "epoch": 0.06, + "learning_rate": 1.8720438041241115e-07, + "loss": 0.1279, + "step": 3345 + }, + { + "epoch": 0.06, + "learning_rate": 1.8720049706807502e-07, + "loss": 0.099, + "step": 3346 + }, + { + "epoch": 0.06, + "learning_rate": 1.8719661372373886e-07, + "loss": 0.1342, + "step": 3347 + }, + { + "epoch": 0.06, + "learning_rate": 1.8719273037940273e-07, + "loss": 0.2234, + "step": 3348 + }, + { + "epoch": 0.06, + "learning_rate": 1.8718884703506658e-07, + "loss": 0.3212, + "step": 3349 + }, + { + "epoch": 0.06, + "learning_rate": 1.8718496369073045e-07, + "loss": 0.0884, + "step": 3350 + }, + { + "epoch": 0.07, + "learning_rate": 1.871810803463943e-07, + "loss": 0.3374, + "step": 3351 + }, + { + "epoch": 0.07, + "learning_rate": 1.8717719700205817e-07, + "loss": 0.1354, + "step": 3352 + }, + { + "epoch": 0.07, + "learning_rate": 1.87173313657722e-07, + "loss": 0.1478, + "step": 3353 + }, + { + "epoch": 0.07, + "learning_rate": 1.8716943031338588e-07, + "loss": 0.1121, + "step": 3354 + }, + { + "epoch": 0.07, + "learning_rate": 1.8716554696904973e-07, + "loss": 0.1284, + "step": 3355 + }, + { + "epoch": 0.07, + "learning_rate": 1.871616636247136e-07, + "loss": 0.0814, + "step": 3356 + }, + { + "epoch": 0.07, + "learning_rate": 1.8715778028037744e-07, + "loss": 0.6071, + "step": 3357 + }, + { + "epoch": 0.07, + "learning_rate": 1.8715389693604132e-07, + "loss": 0.5472, + "step": 3358 + }, + { + "epoch": 0.07, + "learning_rate": 1.8715001359170516e-07, + "loss": 0.0836, + "step": 3359 + }, + { + "epoch": 0.07, + "learning_rate": 1.8714613024736903e-07, + "loss": 0.2032, + "step": 3360 + }, + { + "epoch": 0.07, + "learning_rate": 1.8714224690303288e-07, + "loss": 0.2834, + "step": 3361 + }, + { + "epoch": 0.07, + "learning_rate": 1.8713836355869675e-07, + "loss": 0.0831, + "step": 3362 + }, + { + "epoch": 0.07, + "learning_rate": 1.871344802143606e-07, + "loss": 0.1037, + "step": 3363 + }, + { + "epoch": 0.07, + "learning_rate": 1.8713059687002447e-07, + "loss": 0.077, + "step": 3364 + }, + { + "epoch": 0.07, + "learning_rate": 1.871267135256883e-07, + "loss": 0.2716, + "step": 3365 + }, + { + "epoch": 0.07, + "learning_rate": 1.8712283018135218e-07, + "loss": 0.3076, + "step": 3366 + }, + { + "epoch": 0.07, + "learning_rate": 1.8711894683701603e-07, + "loss": 0.0588, + "step": 3367 + }, + { + "epoch": 0.07, + "learning_rate": 1.871150634926799e-07, + "loss": 0.2464, + "step": 3368 + }, + { + "epoch": 0.07, + "learning_rate": 1.8711118014834374e-07, + "loss": 0.1105, + "step": 3369 + }, + { + "epoch": 0.07, + "learning_rate": 1.8710729680400762e-07, + "loss": 0.0929, + "step": 3370 + }, + { + "epoch": 0.07, + "learning_rate": 1.8710341345967146e-07, + "loss": 0.0982, + "step": 3371 + }, + { + "epoch": 0.07, + "learning_rate": 1.8709953011533533e-07, + "loss": 0.5228, + "step": 3372 + }, + { + "epoch": 0.07, + "learning_rate": 1.8709564677099918e-07, + "loss": 0.1509, + "step": 3373 + }, + { + "epoch": 0.07, + "learning_rate": 1.8709176342666305e-07, + "loss": 0.1083, + "step": 3374 + }, + { + "epoch": 0.07, + "learning_rate": 1.870878800823269e-07, + "loss": 0.1377, + "step": 3375 + }, + { + "epoch": 0.07, + "learning_rate": 1.8708399673799076e-07, + "loss": 0.3102, + "step": 3376 + }, + { + "epoch": 0.07, + "learning_rate": 1.870801133936546e-07, + "loss": 0.2222, + "step": 3377 + }, + { + "epoch": 0.07, + "learning_rate": 1.8707623004931848e-07, + "loss": 0.269, + "step": 3378 + }, + { + "epoch": 0.07, + "learning_rate": 1.8707234670498233e-07, + "loss": 0.2406, + "step": 3379 + }, + { + "epoch": 0.07, + "learning_rate": 1.870684633606462e-07, + "loss": 0.2984, + "step": 3380 + }, + { + "epoch": 0.07, + "learning_rate": 1.8706458001631004e-07, + "loss": 0.1889, + "step": 3381 + }, + { + "epoch": 0.07, + "learning_rate": 1.8706069667197391e-07, + "loss": 0.0844, + "step": 3382 + }, + { + "epoch": 0.07, + "learning_rate": 1.8705681332763776e-07, + "loss": 0.1058, + "step": 3383 + }, + { + "epoch": 0.07, + "learning_rate": 1.8705292998330163e-07, + "loss": 0.1648, + "step": 3384 + }, + { + "epoch": 0.07, + "learning_rate": 1.8704904663896545e-07, + "loss": 0.1199, + "step": 3385 + }, + { + "epoch": 0.07, + "learning_rate": 1.8704516329462932e-07, + "loss": 0.0656, + "step": 3386 + }, + { + "epoch": 0.07, + "learning_rate": 1.8704127995029317e-07, + "loss": 0.0854, + "step": 3387 + }, + { + "epoch": 0.07, + "learning_rate": 1.8703739660595704e-07, + "loss": 0.0792, + "step": 3388 + }, + { + "epoch": 0.07, + "learning_rate": 1.8703351326162088e-07, + "loss": 0.0737, + "step": 3389 + }, + { + "epoch": 0.07, + "learning_rate": 1.8702962991728475e-07, + "loss": 0.1312, + "step": 3390 + }, + { + "epoch": 0.07, + "learning_rate": 1.870257465729486e-07, + "loss": 0.0857, + "step": 3391 + }, + { + "epoch": 0.07, + "learning_rate": 1.8702186322861247e-07, + "loss": 0.1193, + "step": 3392 + }, + { + "epoch": 0.07, + "learning_rate": 1.8701797988427632e-07, + "loss": 0.237, + "step": 3393 + }, + { + "epoch": 0.07, + "learning_rate": 1.8701409653994019e-07, + "loss": 0.0933, + "step": 3394 + }, + { + "epoch": 0.07, + "learning_rate": 1.8701021319560403e-07, + "loss": 0.1594, + "step": 3395 + }, + { + "epoch": 0.07, + "learning_rate": 1.870063298512679e-07, + "loss": 0.3317, + "step": 3396 + }, + { + "epoch": 0.07, + "learning_rate": 1.8700244650693175e-07, + "loss": 0.1123, + "step": 3397 + }, + { + "epoch": 0.07, + "learning_rate": 1.8699856316259562e-07, + "loss": 0.8583, + "step": 3398 + }, + { + "epoch": 0.07, + "learning_rate": 1.8699467981825946e-07, + "loss": 0.0598, + "step": 3399 + }, + { + "epoch": 0.07, + "learning_rate": 1.8699079647392334e-07, + "loss": 0.0889, + "step": 3400 + }, + { + "epoch": 0.07, + "learning_rate": 1.8698691312958718e-07, + "loss": 0.1931, + "step": 3401 + }, + { + "epoch": 0.07, + "learning_rate": 1.8698302978525105e-07, + "loss": 0.123, + "step": 3402 + }, + { + "epoch": 0.07, + "learning_rate": 1.869791464409149e-07, + "loss": 0.0644, + "step": 3403 + }, + { + "epoch": 0.07, + "learning_rate": 1.8697526309657877e-07, + "loss": 0.4035, + "step": 3404 + }, + { + "epoch": 0.07, + "learning_rate": 1.8697137975224261e-07, + "loss": 0.2028, + "step": 3405 + }, + { + "epoch": 0.07, + "learning_rate": 1.8696749640790649e-07, + "loss": 0.0736, + "step": 3406 + }, + { + "epoch": 0.07, + "learning_rate": 1.8696361306357033e-07, + "loss": 0.117, + "step": 3407 + }, + { + "epoch": 0.07, + "learning_rate": 1.869597297192342e-07, + "loss": 0.0539, + "step": 3408 + }, + { + "epoch": 0.07, + "learning_rate": 1.8695584637489805e-07, + "loss": 0.2308, + "step": 3409 + }, + { + "epoch": 0.07, + "learning_rate": 1.8695196303056192e-07, + "loss": 0.1057, + "step": 3410 + }, + { + "epoch": 0.07, + "learning_rate": 1.8694807968622576e-07, + "loss": 0.1008, + "step": 3411 + }, + { + "epoch": 0.07, + "learning_rate": 1.8694419634188963e-07, + "loss": 0.1065, + "step": 3412 + }, + { + "epoch": 0.07, + "learning_rate": 1.8694031299755348e-07, + "loss": 0.049, + "step": 3413 + }, + { + "epoch": 0.07, + "learning_rate": 1.8693642965321735e-07, + "loss": 0.2372, + "step": 3414 + }, + { + "epoch": 0.07, + "learning_rate": 1.869325463088812e-07, + "loss": 0.3085, + "step": 3415 + }, + { + "epoch": 0.07, + "learning_rate": 1.8692866296454507e-07, + "loss": 0.0747, + "step": 3416 + }, + { + "epoch": 0.07, + "learning_rate": 1.869247796202089e-07, + "loss": 0.0631, + "step": 3417 + }, + { + "epoch": 0.07, + "learning_rate": 1.8692089627587278e-07, + "loss": 0.3999, + "step": 3418 + }, + { + "epoch": 0.07, + "learning_rate": 1.8691701293153663e-07, + "loss": 0.0621, + "step": 3419 + }, + { + "epoch": 0.07, + "learning_rate": 1.869131295872005e-07, + "loss": 0.0714, + "step": 3420 + }, + { + "epoch": 0.07, + "learning_rate": 1.8690924624286435e-07, + "loss": 0.2441, + "step": 3421 + }, + { + "epoch": 0.07, + "learning_rate": 1.8690536289852822e-07, + "loss": 0.1027, + "step": 3422 + }, + { + "epoch": 0.07, + "learning_rate": 1.8690147955419206e-07, + "loss": 0.0998, + "step": 3423 + }, + { + "epoch": 0.07, + "learning_rate": 1.8689759620985593e-07, + "loss": 0.0632, + "step": 3424 + }, + { + "epoch": 0.07, + "learning_rate": 1.8689371286551978e-07, + "loss": 0.1353, + "step": 3425 + }, + { + "epoch": 0.07, + "learning_rate": 1.8688982952118365e-07, + "loss": 0.1209, + "step": 3426 + }, + { + "epoch": 0.07, + "learning_rate": 1.868859461768475e-07, + "loss": 0.1823, + "step": 3427 + }, + { + "epoch": 0.07, + "learning_rate": 1.8688206283251137e-07, + "loss": 0.1988, + "step": 3428 + }, + { + "epoch": 0.07, + "learning_rate": 1.868781794881752e-07, + "loss": 0.1067, + "step": 3429 + }, + { + "epoch": 0.07, + "learning_rate": 1.8687429614383908e-07, + "loss": 0.0994, + "step": 3430 + }, + { + "epoch": 0.07, + "learning_rate": 1.8687041279950293e-07, + "loss": 0.4647, + "step": 3431 + }, + { + "epoch": 0.07, + "learning_rate": 1.868665294551668e-07, + "loss": 0.1788, + "step": 3432 + }, + { + "epoch": 0.07, + "learning_rate": 1.8686264611083064e-07, + "loss": 0.0629, + "step": 3433 + }, + { + "epoch": 0.07, + "learning_rate": 1.8685876276649452e-07, + "loss": 0.0945, + "step": 3434 + }, + { + "epoch": 0.07, + "learning_rate": 1.8685487942215836e-07, + "loss": 0.2109, + "step": 3435 + }, + { + "epoch": 0.07, + "learning_rate": 1.8685099607782223e-07, + "loss": 0.0535, + "step": 3436 + }, + { + "epoch": 0.07, + "learning_rate": 1.8684711273348608e-07, + "loss": 0.4127, + "step": 3437 + }, + { + "epoch": 0.07, + "learning_rate": 1.8684322938914995e-07, + "loss": 0.0687, + "step": 3438 + }, + { + "epoch": 0.07, + "learning_rate": 1.868393460448138e-07, + "loss": 0.1477, + "step": 3439 + }, + { + "epoch": 0.07, + "learning_rate": 1.8683546270047767e-07, + "loss": 0.259, + "step": 3440 + }, + { + "epoch": 0.07, + "learning_rate": 1.868315793561415e-07, + "loss": 0.136, + "step": 3441 + }, + { + "epoch": 0.07, + "learning_rate": 1.8682769601180538e-07, + "loss": 0.0752, + "step": 3442 + }, + { + "epoch": 0.07, + "learning_rate": 1.868238126674692e-07, + "loss": 0.0765, + "step": 3443 + }, + { + "epoch": 0.07, + "learning_rate": 1.8681992932313307e-07, + "loss": 0.2696, + "step": 3444 + }, + { + "epoch": 0.07, + "learning_rate": 1.8681604597879692e-07, + "loss": 0.099, + "step": 3445 + }, + { + "epoch": 0.07, + "learning_rate": 1.868121626344608e-07, + "loss": 0.0906, + "step": 3446 + }, + { + "epoch": 0.07, + "learning_rate": 1.8680827929012463e-07, + "loss": 0.1512, + "step": 3447 + }, + { + "epoch": 0.07, + "learning_rate": 1.868043959457885e-07, + "loss": 0.0819, + "step": 3448 + }, + { + "epoch": 0.07, + "learning_rate": 1.8680051260145235e-07, + "loss": 0.1283, + "step": 3449 + }, + { + "epoch": 0.07, + "learning_rate": 1.8679662925711622e-07, + "loss": 0.18, + "step": 3450 + }, + { + "epoch": 0.07, + "learning_rate": 1.8679274591278007e-07, + "loss": 0.1069, + "step": 3451 + }, + { + "epoch": 0.07, + "learning_rate": 1.8678886256844394e-07, + "loss": 0.0709, + "step": 3452 + }, + { + "epoch": 0.07, + "learning_rate": 1.8678497922410778e-07, + "loss": 0.3422, + "step": 3453 + }, + { + "epoch": 0.07, + "learning_rate": 1.8678109587977165e-07, + "loss": 0.1861, + "step": 3454 + }, + { + "epoch": 0.07, + "learning_rate": 1.867772125354355e-07, + "loss": 0.0491, + "step": 3455 + }, + { + "epoch": 0.07, + "learning_rate": 1.8677332919109937e-07, + "loss": 0.0694, + "step": 3456 + }, + { + "epoch": 0.07, + "learning_rate": 1.8676944584676322e-07, + "loss": 0.0756, + "step": 3457 + }, + { + "epoch": 0.07, + "learning_rate": 1.867655625024271e-07, + "loss": 0.2156, + "step": 3458 + }, + { + "epoch": 0.07, + "learning_rate": 1.8676167915809093e-07, + "loss": 0.2199, + "step": 3459 + }, + { + "epoch": 0.07, + "learning_rate": 1.867577958137548e-07, + "loss": 0.1753, + "step": 3460 + }, + { + "epoch": 0.07, + "learning_rate": 1.8675391246941865e-07, + "loss": 0.0775, + "step": 3461 + }, + { + "epoch": 0.07, + "learning_rate": 1.8675002912508252e-07, + "loss": 0.2471, + "step": 3462 + }, + { + "epoch": 0.07, + "learning_rate": 1.8674614578074637e-07, + "loss": 0.0785, + "step": 3463 + }, + { + "epoch": 0.07, + "learning_rate": 1.8674226243641024e-07, + "loss": 0.1977, + "step": 3464 + }, + { + "epoch": 0.07, + "learning_rate": 1.8673837909207408e-07, + "loss": 0.416, + "step": 3465 + }, + { + "epoch": 0.07, + "learning_rate": 1.8673449574773795e-07, + "loss": 0.3087, + "step": 3466 + }, + { + "epoch": 0.07, + "learning_rate": 1.867306124034018e-07, + "loss": 0.1056, + "step": 3467 + }, + { + "epoch": 0.07, + "learning_rate": 1.8672672905906567e-07, + "loss": 0.0565, + "step": 3468 + }, + { + "epoch": 0.07, + "learning_rate": 1.8672284571472952e-07, + "loss": 0.0877, + "step": 3469 + }, + { + "epoch": 0.07, + "learning_rate": 1.8671896237039339e-07, + "loss": 0.0739, + "step": 3470 + }, + { + "epoch": 0.07, + "learning_rate": 1.8671507902605723e-07, + "loss": 0.0758, + "step": 3471 + }, + { + "epoch": 0.07, + "learning_rate": 1.8671119568172108e-07, + "loss": 0.4427, + "step": 3472 + }, + { + "epoch": 0.07, + "learning_rate": 1.8670731233738495e-07, + "loss": 0.2685, + "step": 3473 + }, + { + "epoch": 0.07, + "learning_rate": 1.867034289930488e-07, + "loss": 0.1687, + "step": 3474 + }, + { + "epoch": 0.07, + "learning_rate": 1.8669954564871266e-07, + "loss": 0.3374, + "step": 3475 + }, + { + "epoch": 0.07, + "learning_rate": 1.866956623043765e-07, + "loss": 0.0621, + "step": 3476 + }, + { + "epoch": 0.07, + "learning_rate": 1.8669177896004038e-07, + "loss": 0.0592, + "step": 3477 + }, + { + "epoch": 0.07, + "learning_rate": 1.8668789561570423e-07, + "loss": 0.1716, + "step": 3478 + }, + { + "epoch": 0.07, + "learning_rate": 1.866840122713681e-07, + "loss": 0.2508, + "step": 3479 + }, + { + "epoch": 0.07, + "learning_rate": 1.8668012892703194e-07, + "loss": 0.1292, + "step": 3480 + }, + { + "epoch": 0.07, + "learning_rate": 1.8667624558269581e-07, + "loss": 0.1562, + "step": 3481 + }, + { + "epoch": 0.07, + "learning_rate": 1.8667236223835966e-07, + "loss": 0.134, + "step": 3482 + }, + { + "epoch": 0.07, + "learning_rate": 1.8666847889402353e-07, + "loss": 0.2371, + "step": 3483 + }, + { + "epoch": 0.07, + "learning_rate": 1.8666459554968738e-07, + "loss": 0.1478, + "step": 3484 + }, + { + "epoch": 0.07, + "learning_rate": 1.8666071220535125e-07, + "loss": 0.0598, + "step": 3485 + }, + { + "epoch": 0.07, + "learning_rate": 1.866568288610151e-07, + "loss": 0.0728, + "step": 3486 + }, + { + "epoch": 0.07, + "learning_rate": 1.8665294551667896e-07, + "loss": 0.0912, + "step": 3487 + }, + { + "epoch": 0.07, + "learning_rate": 1.866490621723428e-07, + "loss": 0.2239, + "step": 3488 + }, + { + "epoch": 0.07, + "learning_rate": 1.8664517882800668e-07, + "loss": 0.4617, + "step": 3489 + }, + { + "epoch": 0.07, + "learning_rate": 1.8664129548367053e-07, + "loss": 0.1173, + "step": 3490 + }, + { + "epoch": 0.07, + "learning_rate": 1.866374121393344e-07, + "loss": 0.2345, + "step": 3491 + }, + { + "epoch": 0.07, + "learning_rate": 1.8663352879499824e-07, + "loss": 0.0673, + "step": 3492 + }, + { + "epoch": 0.07, + "learning_rate": 1.866296454506621e-07, + "loss": 0.0594, + "step": 3493 + }, + { + "epoch": 0.07, + "learning_rate": 1.8662576210632596e-07, + "loss": 0.0603, + "step": 3494 + }, + { + "epoch": 0.07, + "learning_rate": 1.8662187876198983e-07, + "loss": 0.1201, + "step": 3495 + }, + { + "epoch": 0.07, + "learning_rate": 1.8661799541765367e-07, + "loss": 0.1883, + "step": 3496 + }, + { + "epoch": 0.07, + "learning_rate": 1.8661411207331755e-07, + "loss": 0.4301, + "step": 3497 + }, + { + "epoch": 0.07, + "learning_rate": 1.866102287289814e-07, + "loss": 0.3212, + "step": 3498 + }, + { + "epoch": 0.07, + "learning_rate": 1.8660634538464526e-07, + "loss": 0.2501, + "step": 3499 + }, + { + "epoch": 0.07, + "learning_rate": 1.866024620403091e-07, + "loss": 0.0703, + "step": 3500 + }, + { + "epoch": 0.07, + "learning_rate": 1.8659857869597295e-07, + "loss": 0.2103, + "step": 3501 + }, + { + "epoch": 0.07, + "learning_rate": 1.865946953516368e-07, + "loss": 0.3132, + "step": 3502 + }, + { + "epoch": 0.07, + "learning_rate": 1.8659081200730067e-07, + "loss": 0.0519, + "step": 3503 + }, + { + "epoch": 0.07, + "learning_rate": 1.8658692866296451e-07, + "loss": 0.1658, + "step": 3504 + }, + { + "epoch": 0.07, + "learning_rate": 1.8658304531862839e-07, + "loss": 0.2148, + "step": 3505 + }, + { + "epoch": 0.07, + "learning_rate": 1.8657916197429223e-07, + "loss": 0.1096, + "step": 3506 + }, + { + "epoch": 0.07, + "learning_rate": 1.865752786299561e-07, + "loss": 0.0563, + "step": 3507 + }, + { + "epoch": 0.07, + "learning_rate": 1.8657139528561995e-07, + "loss": 0.0851, + "step": 3508 + }, + { + "epoch": 0.07, + "learning_rate": 1.8656751194128382e-07, + "loss": 0.1134, + "step": 3509 + }, + { + "epoch": 0.07, + "learning_rate": 1.8656362859694766e-07, + "loss": 0.1187, + "step": 3510 + }, + { + "epoch": 0.07, + "learning_rate": 1.8655974525261153e-07, + "loss": 0.1101, + "step": 3511 + }, + { + "epoch": 0.07, + "learning_rate": 1.8655586190827538e-07, + "loss": 0.0974, + "step": 3512 + }, + { + "epoch": 0.07, + "learning_rate": 1.8655197856393925e-07, + "loss": 0.1254, + "step": 3513 + }, + { + "epoch": 0.07, + "learning_rate": 1.865480952196031e-07, + "loss": 0.1104, + "step": 3514 + }, + { + "epoch": 0.07, + "learning_rate": 1.8654421187526697e-07, + "loss": 0.1019, + "step": 3515 + }, + { + "epoch": 0.07, + "learning_rate": 1.865403285309308e-07, + "loss": 0.0838, + "step": 3516 + }, + { + "epoch": 0.07, + "learning_rate": 1.8653644518659468e-07, + "loss": 0.1236, + "step": 3517 + }, + { + "epoch": 0.07, + "learning_rate": 1.8653256184225853e-07, + "loss": 0.3047, + "step": 3518 + }, + { + "epoch": 0.07, + "learning_rate": 1.865286784979224e-07, + "loss": 0.0565, + "step": 3519 + }, + { + "epoch": 0.07, + "learning_rate": 1.8652479515358625e-07, + "loss": 0.1578, + "step": 3520 + }, + { + "epoch": 0.07, + "learning_rate": 1.8652091180925012e-07, + "loss": 0.0926, + "step": 3521 + }, + { + "epoch": 0.07, + "learning_rate": 1.8651702846491396e-07, + "loss": 0.3036, + "step": 3522 + }, + { + "epoch": 0.07, + "learning_rate": 1.8651314512057783e-07, + "loss": 0.162, + "step": 3523 + }, + { + "epoch": 0.07, + "learning_rate": 1.8650926177624168e-07, + "loss": 0.5417, + "step": 3524 + }, + { + "epoch": 0.07, + "learning_rate": 1.8650537843190555e-07, + "loss": 0.0603, + "step": 3525 + }, + { + "epoch": 0.07, + "learning_rate": 1.865014950875694e-07, + "loss": 0.2213, + "step": 3526 + }, + { + "epoch": 0.07, + "learning_rate": 1.8649761174323327e-07, + "loss": 0.0834, + "step": 3527 + }, + { + "epoch": 0.07, + "learning_rate": 1.864937283988971e-07, + "loss": 0.066, + "step": 3528 + }, + { + "epoch": 0.07, + "learning_rate": 1.8648984505456098e-07, + "loss": 0.3758, + "step": 3529 + }, + { + "epoch": 0.07, + "learning_rate": 1.8648596171022483e-07, + "loss": 0.0969, + "step": 3530 + }, + { + "epoch": 0.07, + "learning_rate": 1.864820783658887e-07, + "loss": 0.3901, + "step": 3531 + }, + { + "epoch": 0.07, + "learning_rate": 1.8647819502155254e-07, + "loss": 0.2711, + "step": 3532 + }, + { + "epoch": 0.07, + "learning_rate": 1.8647431167721642e-07, + "loss": 0.1873, + "step": 3533 + }, + { + "epoch": 0.07, + "learning_rate": 1.8647042833288026e-07, + "loss": 0.0683, + "step": 3534 + }, + { + "epoch": 0.07, + "learning_rate": 1.8646654498854413e-07, + "loss": 0.0758, + "step": 3535 + }, + { + "epoch": 0.07, + "learning_rate": 1.8646266164420798e-07, + "loss": 0.5206, + "step": 3536 + }, + { + "epoch": 0.07, + "learning_rate": 1.8645877829987185e-07, + "loss": 0.2935, + "step": 3537 + }, + { + "epoch": 0.07, + "learning_rate": 1.864548949555357e-07, + "loss": 0.0904, + "step": 3538 + }, + { + "epoch": 0.07, + "learning_rate": 1.8645101161119957e-07, + "loss": 0.0578, + "step": 3539 + }, + { + "epoch": 0.07, + "learning_rate": 1.864471282668634e-07, + "loss": 0.1235, + "step": 3540 + }, + { + "epoch": 0.07, + "learning_rate": 1.8644324492252728e-07, + "loss": 0.0668, + "step": 3541 + }, + { + "epoch": 0.07, + "learning_rate": 1.8643936157819113e-07, + "loss": 0.0658, + "step": 3542 + }, + { + "epoch": 0.07, + "learning_rate": 1.86435478233855e-07, + "loss": 0.0959, + "step": 3543 + }, + { + "epoch": 0.07, + "learning_rate": 1.8643159488951884e-07, + "loss": 0.0932, + "step": 3544 + }, + { + "epoch": 0.07, + "learning_rate": 1.8642771154518272e-07, + "loss": 0.0575, + "step": 3545 + }, + { + "epoch": 0.07, + "learning_rate": 1.8642382820084656e-07, + "loss": 0.0499, + "step": 3546 + }, + { + "epoch": 0.07, + "learning_rate": 1.8641994485651043e-07, + "loss": 0.2024, + "step": 3547 + }, + { + "epoch": 0.07, + "learning_rate": 1.8641606151217428e-07, + "loss": 0.0744, + "step": 3548 + }, + { + "epoch": 0.07, + "learning_rate": 1.8641217816783815e-07, + "loss": 0.1474, + "step": 3549 + }, + { + "epoch": 0.07, + "learning_rate": 1.86408294823502e-07, + "loss": 0.35, + "step": 3550 + }, + { + "epoch": 0.07, + "learning_rate": 1.8640441147916586e-07, + "loss": 0.1468, + "step": 3551 + }, + { + "epoch": 0.07, + "learning_rate": 1.864005281348297e-07, + "loss": 0.0522, + "step": 3552 + }, + { + "epoch": 0.07, + "learning_rate": 1.8639664479049358e-07, + "loss": 0.3921, + "step": 3553 + }, + { + "epoch": 0.07, + "learning_rate": 1.8639276144615743e-07, + "loss": 0.0628, + "step": 3554 + }, + { + "epoch": 0.07, + "learning_rate": 1.863888781018213e-07, + "loss": 0.1006, + "step": 3555 + }, + { + "epoch": 0.07, + "learning_rate": 1.8638499475748514e-07, + "loss": 0.0535, + "step": 3556 + }, + { + "epoch": 0.07, + "learning_rate": 1.8638111141314901e-07, + "loss": 0.1101, + "step": 3557 + }, + { + "epoch": 0.07, + "learning_rate": 1.8637722806881286e-07, + "loss": 0.1054, + "step": 3558 + }, + { + "epoch": 0.07, + "learning_rate": 1.863733447244767e-07, + "loss": 0.1099, + "step": 3559 + }, + { + "epoch": 0.07, + "learning_rate": 1.8636946138014055e-07, + "loss": 0.0728, + "step": 3560 + }, + { + "epoch": 0.07, + "learning_rate": 1.8636557803580442e-07, + "loss": 0.1853, + "step": 3561 + }, + { + "epoch": 0.07, + "learning_rate": 1.8636169469146827e-07, + "loss": 0.1149, + "step": 3562 + }, + { + "epoch": 0.07, + "learning_rate": 1.8635781134713214e-07, + "loss": 0.1667, + "step": 3563 + }, + { + "epoch": 0.07, + "learning_rate": 1.8635392800279598e-07, + "loss": 0.1444, + "step": 3564 + }, + { + "epoch": 0.07, + "learning_rate": 1.8635004465845985e-07, + "loss": 0.0508, + "step": 3565 + }, + { + "epoch": 0.07, + "learning_rate": 1.863461613141237e-07, + "loss": 0.275, + "step": 3566 + }, + { + "epoch": 0.07, + "learning_rate": 1.8634227796978757e-07, + "loss": 0.1098, + "step": 3567 + }, + { + "epoch": 0.07, + "learning_rate": 1.8633839462545142e-07, + "loss": 0.0794, + "step": 3568 + }, + { + "epoch": 0.07, + "learning_rate": 1.8633451128111529e-07, + "loss": 0.0752, + "step": 3569 + }, + { + "epoch": 0.07, + "learning_rate": 1.8633062793677913e-07, + "loss": 0.0683, + "step": 3570 + }, + { + "epoch": 0.07, + "learning_rate": 1.86326744592443e-07, + "loss": 0.1222, + "step": 3571 + }, + { + "epoch": 0.07, + "learning_rate": 1.8632286124810685e-07, + "loss": 0.2338, + "step": 3572 + }, + { + "epoch": 0.07, + "learning_rate": 1.8631897790377072e-07, + "loss": 0.1202, + "step": 3573 + }, + { + "epoch": 0.07, + "learning_rate": 1.8631509455943456e-07, + "loss": 0.0845, + "step": 3574 + }, + { + "epoch": 0.07, + "learning_rate": 1.8631121121509844e-07, + "loss": 0.1493, + "step": 3575 + }, + { + "epoch": 0.07, + "learning_rate": 1.8630732787076228e-07, + "loss": 0.103, + "step": 3576 + }, + { + "epoch": 0.07, + "learning_rate": 1.8630344452642615e-07, + "loss": 0.1456, + "step": 3577 + }, + { + "epoch": 0.07, + "learning_rate": 1.8629956118209e-07, + "loss": 0.0764, + "step": 3578 + }, + { + "epoch": 0.07, + "learning_rate": 1.8629567783775387e-07, + "loss": 0.2098, + "step": 3579 + }, + { + "epoch": 0.07, + "learning_rate": 1.8629179449341771e-07, + "loss": 0.0885, + "step": 3580 + }, + { + "epoch": 0.07, + "learning_rate": 1.8628791114908159e-07, + "loss": 0.0685, + "step": 3581 + }, + { + "epoch": 0.07, + "learning_rate": 1.8628402780474543e-07, + "loss": 0.576, + "step": 3582 + }, + { + "epoch": 0.07, + "learning_rate": 1.862801444604093e-07, + "loss": 0.1851, + "step": 3583 + }, + { + "epoch": 0.07, + "learning_rate": 1.8627626111607315e-07, + "loss": 0.0949, + "step": 3584 + }, + { + "epoch": 0.07, + "learning_rate": 1.8627237777173702e-07, + "loss": 0.2711, + "step": 3585 + }, + { + "epoch": 0.07, + "learning_rate": 1.8626849442740086e-07, + "loss": 0.0765, + "step": 3586 + }, + { + "epoch": 0.07, + "learning_rate": 1.8626461108306474e-07, + "loss": 0.1178, + "step": 3587 + }, + { + "epoch": 0.07, + "learning_rate": 1.8626072773872858e-07, + "loss": 0.0531, + "step": 3588 + }, + { + "epoch": 0.07, + "learning_rate": 1.8625684439439245e-07, + "loss": 0.0487, + "step": 3589 + }, + { + "epoch": 0.07, + "learning_rate": 1.862529610500563e-07, + "loss": 0.1575, + "step": 3590 + }, + { + "epoch": 0.07, + "learning_rate": 1.8624907770572017e-07, + "loss": 0.5407, + "step": 3591 + }, + { + "epoch": 0.07, + "learning_rate": 1.86245194361384e-07, + "loss": 0.0581, + "step": 3592 + }, + { + "epoch": 0.07, + "learning_rate": 1.8624131101704788e-07, + "loss": 0.1301, + "step": 3593 + }, + { + "epoch": 0.07, + "learning_rate": 1.8623742767271173e-07, + "loss": 0.0676, + "step": 3594 + }, + { + "epoch": 0.07, + "learning_rate": 1.862335443283756e-07, + "loss": 0.0554, + "step": 3595 + }, + { + "epoch": 0.07, + "learning_rate": 1.8622966098403945e-07, + "loss": 0.084, + "step": 3596 + }, + { + "epoch": 0.07, + "learning_rate": 1.8622577763970332e-07, + "loss": 0.1039, + "step": 3597 + }, + { + "epoch": 0.07, + "learning_rate": 1.8622189429536716e-07, + "loss": 0.1824, + "step": 3598 + }, + { + "epoch": 0.07, + "learning_rate": 1.8621801095103103e-07, + "loss": 0.0781, + "step": 3599 + }, + { + "epoch": 0.07, + "learning_rate": 1.8621412760669488e-07, + "loss": 0.0665, + "step": 3600 + }, + { + "epoch": 0.07, + "learning_rate": 1.8621024426235875e-07, + "loss": 0.5113, + "step": 3601 + }, + { + "epoch": 0.07, + "learning_rate": 1.862063609180226e-07, + "loss": 0.2439, + "step": 3602 + }, + { + "epoch": 0.07, + "learning_rate": 1.8620247757368647e-07, + "loss": 0.1469, + "step": 3603 + }, + { + "epoch": 0.07, + "learning_rate": 1.861985942293503e-07, + "loss": 0.0674, + "step": 3604 + }, + { + "epoch": 0.07, + "learning_rate": 1.8619471088501418e-07, + "loss": 0.2941, + "step": 3605 + }, + { + "epoch": 0.07, + "learning_rate": 1.8619082754067803e-07, + "loss": 0.1247, + "step": 3606 + }, + { + "epoch": 0.07, + "learning_rate": 1.861869441963419e-07, + "loss": 0.1848, + "step": 3607 + }, + { + "epoch": 0.07, + "learning_rate": 1.8618306085200574e-07, + "loss": 0.0893, + "step": 3608 + }, + { + "epoch": 0.07, + "learning_rate": 1.8617917750766962e-07, + "loss": 0.0816, + "step": 3609 + }, + { + "epoch": 0.07, + "learning_rate": 1.8617529416333346e-07, + "loss": 0.107, + "step": 3610 + }, + { + "epoch": 0.07, + "learning_rate": 1.8617141081899733e-07, + "loss": 0.0795, + "step": 3611 + }, + { + "epoch": 0.07, + "learning_rate": 1.8616752747466118e-07, + "loss": 0.2899, + "step": 3612 + }, + { + "epoch": 0.07, + "learning_rate": 1.8616364413032505e-07, + "loss": 0.2184, + "step": 3613 + }, + { + "epoch": 0.07, + "learning_rate": 1.861597607859889e-07, + "loss": 0.2107, + "step": 3614 + }, + { + "epoch": 0.07, + "learning_rate": 1.8615587744165277e-07, + "loss": 0.1106, + "step": 3615 + }, + { + "epoch": 0.07, + "learning_rate": 1.861519940973166e-07, + "loss": 0.0477, + "step": 3616 + }, + { + "epoch": 0.07, + "learning_rate": 1.8614811075298046e-07, + "loss": 0.1324, + "step": 3617 + }, + { + "epoch": 0.07, + "learning_rate": 1.861442274086443e-07, + "loss": 0.1308, + "step": 3618 + }, + { + "epoch": 0.07, + "learning_rate": 1.8614034406430817e-07, + "loss": 0.5082, + "step": 3619 + }, + { + "epoch": 0.07, + "learning_rate": 1.8613646071997202e-07, + "loss": 0.4196, + "step": 3620 + }, + { + "epoch": 0.07, + "learning_rate": 1.861325773756359e-07, + "loss": 0.3454, + "step": 3621 + }, + { + "epoch": 0.07, + "learning_rate": 1.8612869403129973e-07, + "loss": 0.2434, + "step": 3622 + }, + { + "epoch": 0.07, + "learning_rate": 1.861248106869636e-07, + "loss": 0.1739, + "step": 3623 + }, + { + "epoch": 0.07, + "learning_rate": 1.8612092734262745e-07, + "loss": 0.6074, + "step": 3624 + }, + { + "epoch": 0.07, + "learning_rate": 1.8611704399829132e-07, + "loss": 0.1308, + "step": 3625 + }, + { + "epoch": 0.07, + "learning_rate": 1.8611316065395517e-07, + "loss": 0.101, + "step": 3626 + }, + { + "epoch": 0.07, + "learning_rate": 1.8610927730961904e-07, + "loss": 0.3465, + "step": 3627 + }, + { + "epoch": 0.07, + "learning_rate": 1.8610539396528288e-07, + "loss": 0.0761, + "step": 3628 + }, + { + "epoch": 0.07, + "learning_rate": 1.8610151062094675e-07, + "loss": 0.285, + "step": 3629 + }, + { + "epoch": 0.07, + "learning_rate": 1.860976272766106e-07, + "loss": 0.0592, + "step": 3630 + }, + { + "epoch": 0.07, + "learning_rate": 1.8609374393227447e-07, + "loss": 0.4291, + "step": 3631 + }, + { + "epoch": 0.07, + "learning_rate": 1.8608986058793832e-07, + "loss": 0.0674, + "step": 3632 + }, + { + "epoch": 0.07, + "learning_rate": 1.860859772436022e-07, + "loss": 0.0947, + "step": 3633 + }, + { + "epoch": 0.07, + "learning_rate": 1.8608209389926603e-07, + "loss": 0.0566, + "step": 3634 + }, + { + "epoch": 0.07, + "learning_rate": 1.860782105549299e-07, + "loss": 0.1396, + "step": 3635 + }, + { + "epoch": 0.07, + "learning_rate": 1.8607432721059375e-07, + "loss": 0.0571, + "step": 3636 + }, + { + "epoch": 0.07, + "learning_rate": 1.8607044386625762e-07, + "loss": 0.0518, + "step": 3637 + }, + { + "epoch": 0.07, + "learning_rate": 1.8606656052192147e-07, + "loss": 0.0633, + "step": 3638 + }, + { + "epoch": 0.07, + "learning_rate": 1.8606267717758534e-07, + "loss": 0.1888, + "step": 3639 + }, + { + "epoch": 0.07, + "learning_rate": 1.8605879383324918e-07, + "loss": 0.1332, + "step": 3640 + }, + { + "epoch": 0.07, + "learning_rate": 1.8605491048891305e-07, + "loss": 0.1228, + "step": 3641 + }, + { + "epoch": 0.07, + "learning_rate": 1.860510271445769e-07, + "loss": 0.0633, + "step": 3642 + }, + { + "epoch": 0.07, + "learning_rate": 1.8604714380024077e-07, + "loss": 0.2938, + "step": 3643 + }, + { + "epoch": 0.07, + "learning_rate": 1.8604326045590462e-07, + "loss": 0.0938, + "step": 3644 + }, + { + "epoch": 0.07, + "learning_rate": 1.8603937711156849e-07, + "loss": 0.0899, + "step": 3645 + }, + { + "epoch": 0.07, + "learning_rate": 1.8603549376723233e-07, + "loss": 0.0543, + "step": 3646 + }, + { + "epoch": 0.07, + "learning_rate": 1.860316104228962e-07, + "loss": 0.0494, + "step": 3647 + }, + { + "epoch": 0.07, + "learning_rate": 1.8602772707856005e-07, + "loss": 0.1834, + "step": 3648 + }, + { + "epoch": 0.07, + "learning_rate": 1.860238437342239e-07, + "loss": 0.434, + "step": 3649 + }, + { + "epoch": 0.07, + "learning_rate": 1.8601996038988776e-07, + "loss": 0.0698, + "step": 3650 + }, + { + "epoch": 0.07, + "learning_rate": 1.860160770455516e-07, + "loss": 0.5246, + "step": 3651 + }, + { + "epoch": 0.07, + "learning_rate": 1.8601219370121548e-07, + "loss": 0.1163, + "step": 3652 + }, + { + "epoch": 0.07, + "learning_rate": 1.8600831035687933e-07, + "loss": 0.1237, + "step": 3653 + }, + { + "epoch": 0.07, + "learning_rate": 1.860044270125432e-07, + "loss": 0.0927, + "step": 3654 + }, + { + "epoch": 0.07, + "learning_rate": 1.8600054366820704e-07, + "loss": 0.062, + "step": 3655 + }, + { + "epoch": 0.07, + "learning_rate": 1.8599666032387091e-07, + "loss": 0.1964, + "step": 3656 + }, + { + "epoch": 0.07, + "learning_rate": 1.8599277697953476e-07, + "loss": 0.3474, + "step": 3657 + }, + { + "epoch": 0.07, + "learning_rate": 1.8598889363519863e-07, + "loss": 0.2656, + "step": 3658 + }, + { + "epoch": 0.07, + "learning_rate": 1.8598501029086248e-07, + "loss": 0.4381, + "step": 3659 + }, + { + "epoch": 0.07, + "learning_rate": 1.8598112694652635e-07, + "loss": 0.0637, + "step": 3660 + }, + { + "epoch": 0.07, + "learning_rate": 1.859772436021902e-07, + "loss": 0.2483, + "step": 3661 + }, + { + "epoch": 0.07, + "learning_rate": 1.8597336025785406e-07, + "loss": 0.0587, + "step": 3662 + }, + { + "epoch": 0.07, + "learning_rate": 1.859694769135179e-07, + "loss": 0.1011, + "step": 3663 + }, + { + "epoch": 0.07, + "learning_rate": 1.8596559356918178e-07, + "loss": 0.1897, + "step": 3664 + }, + { + "epoch": 0.07, + "learning_rate": 1.8596171022484563e-07, + "loss": 0.1209, + "step": 3665 + }, + { + "epoch": 0.07, + "learning_rate": 1.859578268805095e-07, + "loss": 0.1359, + "step": 3666 + }, + { + "epoch": 0.07, + "learning_rate": 1.8595394353617334e-07, + "loss": 0.1705, + "step": 3667 + }, + { + "epoch": 0.07, + "learning_rate": 1.859500601918372e-07, + "loss": 0.2435, + "step": 3668 + }, + { + "epoch": 0.07, + "learning_rate": 1.8594617684750106e-07, + "loss": 0.2894, + "step": 3669 + }, + { + "epoch": 0.07, + "learning_rate": 1.8594229350316493e-07, + "loss": 0.1332, + "step": 3670 + }, + { + "epoch": 0.07, + "learning_rate": 1.8593841015882877e-07, + "loss": 0.1137, + "step": 3671 + }, + { + "epoch": 0.07, + "learning_rate": 1.8593452681449265e-07, + "loss": 0.4843, + "step": 3672 + }, + { + "epoch": 0.07, + "learning_rate": 1.859306434701565e-07, + "loss": 0.2745, + "step": 3673 + }, + { + "epoch": 0.07, + "learning_rate": 1.8592676012582036e-07, + "loss": 0.0522, + "step": 3674 + }, + { + "epoch": 0.07, + "learning_rate": 1.859228767814842e-07, + "loss": 0.0511, + "step": 3675 + }, + { + "epoch": 0.07, + "learning_rate": 1.8591899343714805e-07, + "loss": 0.0651, + "step": 3676 + }, + { + "epoch": 0.07, + "learning_rate": 1.8591511009281192e-07, + "loss": 0.0497, + "step": 3677 + }, + { + "epoch": 0.07, + "learning_rate": 1.8591122674847577e-07, + "loss": 0.0982, + "step": 3678 + }, + { + "epoch": 0.07, + "learning_rate": 1.8590734340413961e-07, + "loss": 0.069, + "step": 3679 + }, + { + "epoch": 0.07, + "learning_rate": 1.8590346005980349e-07, + "loss": 0.2013, + "step": 3680 + }, + { + "epoch": 0.07, + "learning_rate": 1.8589957671546733e-07, + "loss": 0.1037, + "step": 3681 + }, + { + "epoch": 0.07, + "learning_rate": 1.858956933711312e-07, + "loss": 0.303, + "step": 3682 + }, + { + "epoch": 0.07, + "learning_rate": 1.8589181002679505e-07, + "loss": 0.562, + "step": 3683 + }, + { + "epoch": 0.07, + "learning_rate": 1.8588792668245892e-07, + "loss": 0.3589, + "step": 3684 + }, + { + "epoch": 0.07, + "learning_rate": 1.8588404333812276e-07, + "loss": 0.0766, + "step": 3685 + }, + { + "epoch": 0.07, + "learning_rate": 1.8588015999378664e-07, + "loss": 0.069, + "step": 3686 + }, + { + "epoch": 0.07, + "learning_rate": 1.8587627664945048e-07, + "loss": 0.0932, + "step": 3687 + }, + { + "epoch": 0.07, + "learning_rate": 1.8587239330511435e-07, + "loss": 0.0519, + "step": 3688 + }, + { + "epoch": 0.07, + "learning_rate": 1.858685099607782e-07, + "loss": 0.1566, + "step": 3689 + }, + { + "epoch": 0.07, + "learning_rate": 1.8586462661644207e-07, + "loss": 0.3116, + "step": 3690 + }, + { + "epoch": 0.07, + "learning_rate": 1.858607432721059e-07, + "loss": 0.0799, + "step": 3691 + }, + { + "epoch": 0.07, + "learning_rate": 1.8585685992776978e-07, + "loss": 0.4226, + "step": 3692 + }, + { + "epoch": 0.07, + "learning_rate": 1.8585297658343363e-07, + "loss": 0.0919, + "step": 3693 + }, + { + "epoch": 0.07, + "learning_rate": 1.858490932390975e-07, + "loss": 0.0429, + "step": 3694 + }, + { + "epoch": 0.07, + "learning_rate": 1.8584520989476135e-07, + "loss": 0.6374, + "step": 3695 + }, + { + "epoch": 0.07, + "learning_rate": 1.8584132655042522e-07, + "loss": 0.0439, + "step": 3696 + }, + { + "epoch": 0.07, + "learning_rate": 1.8583744320608906e-07, + "loss": 0.0524, + "step": 3697 + }, + { + "epoch": 0.07, + "learning_rate": 1.8583355986175293e-07, + "loss": 0.1015, + "step": 3698 + }, + { + "epoch": 0.07, + "learning_rate": 1.8582967651741678e-07, + "loss": 0.3063, + "step": 3699 + }, + { + "epoch": 0.07, + "learning_rate": 1.8582579317308065e-07, + "loss": 0.0627, + "step": 3700 + }, + { + "epoch": 0.07, + "learning_rate": 1.858219098287445e-07, + "loss": 0.0528, + "step": 3701 + }, + { + "epoch": 0.07, + "learning_rate": 1.8581802648440837e-07, + "loss": 0.0713, + "step": 3702 + }, + { + "epoch": 0.07, + "learning_rate": 1.858141431400722e-07, + "loss": 0.0565, + "step": 3703 + }, + { + "epoch": 0.07, + "learning_rate": 1.8581025979573608e-07, + "loss": 0.0608, + "step": 3704 + }, + { + "epoch": 0.07, + "learning_rate": 1.8580637645139993e-07, + "loss": 0.1048, + "step": 3705 + }, + { + "epoch": 0.07, + "learning_rate": 1.858024931070638e-07, + "loss": 0.6798, + "step": 3706 + }, + { + "epoch": 0.07, + "learning_rate": 1.8579860976272764e-07, + "loss": 0.5437, + "step": 3707 + }, + { + "epoch": 0.07, + "learning_rate": 1.8579472641839152e-07, + "loss": 0.1151, + "step": 3708 + }, + { + "epoch": 0.07, + "learning_rate": 1.8579084307405536e-07, + "loss": 0.1709, + "step": 3709 + }, + { + "epoch": 0.07, + "learning_rate": 1.8578695972971923e-07, + "loss": 0.0464, + "step": 3710 + }, + { + "epoch": 0.07, + "learning_rate": 1.8578307638538308e-07, + "loss": 0.0606, + "step": 3711 + }, + { + "epoch": 0.07, + "learning_rate": 1.8577919304104695e-07, + "loss": 0.0738, + "step": 3712 + }, + { + "epoch": 0.07, + "learning_rate": 1.857753096967108e-07, + "loss": 0.1337, + "step": 3713 + }, + { + "epoch": 0.07, + "learning_rate": 1.8577142635237467e-07, + "loss": 0.3659, + "step": 3714 + }, + { + "epoch": 0.07, + "learning_rate": 1.857675430080385e-07, + "loss": 0.126, + "step": 3715 + }, + { + "epoch": 0.07, + "learning_rate": 1.8576365966370238e-07, + "loss": 0.0626, + "step": 3716 + }, + { + "epoch": 0.07, + "learning_rate": 1.8575977631936623e-07, + "loss": 0.2596, + "step": 3717 + }, + { + "epoch": 0.07, + "learning_rate": 1.857558929750301e-07, + "loss": 0.1181, + "step": 3718 + }, + { + "epoch": 0.07, + "learning_rate": 1.8575200963069394e-07, + "loss": 0.1567, + "step": 3719 + }, + { + "epoch": 0.07, + "learning_rate": 1.8574812628635782e-07, + "loss": 0.1617, + "step": 3720 + }, + { + "epoch": 0.07, + "learning_rate": 1.8574424294202166e-07, + "loss": 0.0845, + "step": 3721 + }, + { + "epoch": 0.07, + "learning_rate": 1.8574035959768553e-07, + "loss": 0.084, + "step": 3722 + }, + { + "epoch": 0.07, + "learning_rate": 1.8573647625334938e-07, + "loss": 0.0948, + "step": 3723 + }, + { + "epoch": 0.07, + "learning_rate": 1.8573259290901325e-07, + "loss": 0.0838, + "step": 3724 + }, + { + "epoch": 0.07, + "learning_rate": 1.857287095646771e-07, + "loss": 0.0935, + "step": 3725 + }, + { + "epoch": 0.07, + "learning_rate": 1.8572482622034096e-07, + "loss": 0.3606, + "step": 3726 + }, + { + "epoch": 0.07, + "learning_rate": 1.857209428760048e-07, + "loss": 0.1158, + "step": 3727 + }, + { + "epoch": 0.07, + "learning_rate": 1.8571705953166868e-07, + "loss": 0.0846, + "step": 3728 + }, + { + "epoch": 0.07, + "learning_rate": 1.8571317618733253e-07, + "loss": 0.091, + "step": 3729 + }, + { + "epoch": 0.07, + "learning_rate": 1.857092928429964e-07, + "loss": 0.0665, + "step": 3730 + }, + { + "epoch": 0.07, + "learning_rate": 1.8570540949866024e-07, + "loss": 0.0812, + "step": 3731 + }, + { + "epoch": 0.07, + "learning_rate": 1.8570152615432411e-07, + "loss": 0.0503, + "step": 3732 + }, + { + "epoch": 0.07, + "learning_rate": 1.8569764280998793e-07, + "loss": 0.0549, + "step": 3733 + }, + { + "epoch": 0.07, + "learning_rate": 1.856937594656518e-07, + "loss": 0.0547, + "step": 3734 + }, + { + "epoch": 0.07, + "learning_rate": 1.8568987612131565e-07, + "loss": 0.0588, + "step": 3735 + }, + { + "epoch": 0.07, + "learning_rate": 1.8568599277697952e-07, + "loss": 0.2883, + "step": 3736 + }, + { + "epoch": 0.07, + "learning_rate": 1.8568210943264337e-07, + "loss": 0.0795, + "step": 3737 + }, + { + "epoch": 0.07, + "learning_rate": 1.8567822608830724e-07, + "loss": 0.0968, + "step": 3738 + }, + { + "epoch": 0.07, + "learning_rate": 1.8567434274397108e-07, + "loss": 0.1053, + "step": 3739 + }, + { + "epoch": 0.07, + "learning_rate": 1.8567045939963495e-07, + "loss": 0.0516, + "step": 3740 + }, + { + "epoch": 0.07, + "learning_rate": 1.856665760552988e-07, + "loss": 0.3675, + "step": 3741 + }, + { + "epoch": 0.07, + "learning_rate": 1.8566269271096267e-07, + "loss": 0.1905, + "step": 3742 + }, + { + "epoch": 0.07, + "learning_rate": 1.8565880936662652e-07, + "loss": 0.0761, + "step": 3743 + }, + { + "epoch": 0.07, + "learning_rate": 1.8565492602229039e-07, + "loss": 0.0551, + "step": 3744 + }, + { + "epoch": 0.07, + "learning_rate": 1.8565104267795423e-07, + "loss": 0.1383, + "step": 3745 + }, + { + "epoch": 0.07, + "learning_rate": 1.856471593336181e-07, + "loss": 0.6754, + "step": 3746 + }, + { + "epoch": 0.07, + "learning_rate": 1.8564327598928195e-07, + "loss": 0.0758, + "step": 3747 + }, + { + "epoch": 0.07, + "learning_rate": 1.8563939264494582e-07, + "loss": 0.0619, + "step": 3748 + }, + { + "epoch": 0.07, + "learning_rate": 1.8563550930060966e-07, + "loss": 0.2429, + "step": 3749 + }, + { + "epoch": 0.07, + "learning_rate": 1.8563162595627354e-07, + "loss": 0.2453, + "step": 3750 + }, + { + "epoch": 0.07, + "learning_rate": 1.8562774261193738e-07, + "loss": 0.0495, + "step": 3751 + }, + { + "epoch": 0.07, + "learning_rate": 1.8562385926760125e-07, + "loss": 0.1947, + "step": 3752 + }, + { + "epoch": 0.07, + "learning_rate": 1.856199759232651e-07, + "loss": 0.2636, + "step": 3753 + }, + { + "epoch": 0.07, + "learning_rate": 1.8561609257892897e-07, + "loss": 0.3491, + "step": 3754 + }, + { + "epoch": 0.07, + "learning_rate": 1.8561220923459281e-07, + "loss": 0.0746, + "step": 3755 + }, + { + "epoch": 0.07, + "learning_rate": 1.8560832589025669e-07, + "loss": 0.0703, + "step": 3756 + }, + { + "epoch": 0.07, + "learning_rate": 1.8560444254592053e-07, + "loss": 0.0368, + "step": 3757 + }, + { + "epoch": 0.07, + "learning_rate": 1.856005592015844e-07, + "loss": 0.2027, + "step": 3758 + }, + { + "epoch": 0.07, + "learning_rate": 1.8559667585724825e-07, + "loss": 0.1539, + "step": 3759 + }, + { + "epoch": 0.07, + "learning_rate": 1.8559279251291212e-07, + "loss": 0.0444, + "step": 3760 + }, + { + "epoch": 0.07, + "learning_rate": 1.8558890916857596e-07, + "loss": 0.2492, + "step": 3761 + }, + { + "epoch": 0.07, + "learning_rate": 1.8558502582423984e-07, + "loss": 0.0679, + "step": 3762 + }, + { + "epoch": 0.07, + "learning_rate": 1.8558114247990368e-07, + "loss": 0.3161, + "step": 3763 + }, + { + "epoch": 0.07, + "learning_rate": 1.8557725913556755e-07, + "loss": 0.1603, + "step": 3764 + }, + { + "epoch": 0.07, + "learning_rate": 1.855733757912314e-07, + "loss": 0.1233, + "step": 3765 + }, + { + "epoch": 0.07, + "learning_rate": 1.8556949244689527e-07, + "loss": 0.0438, + "step": 3766 + }, + { + "epoch": 0.07, + "learning_rate": 1.855656091025591e-07, + "loss": 0.0655, + "step": 3767 + }, + { + "epoch": 0.07, + "learning_rate": 1.8556172575822298e-07, + "loss": 0.3832, + "step": 3768 + }, + { + "epoch": 0.07, + "learning_rate": 1.8555784241388683e-07, + "loss": 0.2599, + "step": 3769 + }, + { + "epoch": 0.07, + "learning_rate": 1.855539590695507e-07, + "loss": 0.0913, + "step": 3770 + }, + { + "epoch": 0.07, + "learning_rate": 1.8555007572521455e-07, + "loss": 0.1473, + "step": 3771 + }, + { + "epoch": 0.07, + "learning_rate": 1.8554619238087842e-07, + "loss": 0.1548, + "step": 3772 + }, + { + "epoch": 0.07, + "learning_rate": 1.8554230903654226e-07, + "loss": 0.1042, + "step": 3773 + }, + { + "epoch": 0.07, + "learning_rate": 1.8553842569220613e-07, + "loss": 0.0735, + "step": 3774 + }, + { + "epoch": 0.07, + "learning_rate": 1.8553454234786998e-07, + "loss": 0.2356, + "step": 3775 + }, + { + "epoch": 0.07, + "learning_rate": 1.8553065900353385e-07, + "loss": 0.1997, + "step": 3776 + }, + { + "epoch": 0.07, + "learning_rate": 1.855267756591977e-07, + "loss": 0.0994, + "step": 3777 + }, + { + "epoch": 0.07, + "learning_rate": 1.8552289231486157e-07, + "loss": 0.2957, + "step": 3778 + }, + { + "epoch": 0.07, + "learning_rate": 1.855190089705254e-07, + "loss": 0.1992, + "step": 3779 + }, + { + "epoch": 0.07, + "learning_rate": 1.8551512562618928e-07, + "loss": 0.0679, + "step": 3780 + }, + { + "epoch": 0.07, + "learning_rate": 1.8551124228185313e-07, + "loss": 0.0703, + "step": 3781 + }, + { + "epoch": 0.07, + "learning_rate": 1.85507358937517e-07, + "loss": 0.2228, + "step": 3782 + }, + { + "epoch": 0.07, + "learning_rate": 1.8550347559318085e-07, + "loss": 0.2531, + "step": 3783 + }, + { + "epoch": 0.07, + "learning_rate": 1.8549959224884472e-07, + "loss": 0.1949, + "step": 3784 + }, + { + "epoch": 0.07, + "learning_rate": 1.8549570890450856e-07, + "loss": 0.0666, + "step": 3785 + }, + { + "epoch": 0.07, + "learning_rate": 1.8549182556017243e-07, + "loss": 0.08, + "step": 3786 + }, + { + "epoch": 0.07, + "learning_rate": 1.8548794221583628e-07, + "loss": 0.2846, + "step": 3787 + }, + { + "epoch": 0.07, + "learning_rate": 1.8548405887150015e-07, + "loss": 0.354, + "step": 3788 + }, + { + "epoch": 0.07, + "learning_rate": 1.85480175527164e-07, + "loss": 0.1043, + "step": 3789 + }, + { + "epoch": 0.07, + "learning_rate": 1.8547629218282787e-07, + "loss": 0.0773, + "step": 3790 + }, + { + "epoch": 0.07, + "learning_rate": 1.8547240883849168e-07, + "loss": 0.2554, + "step": 3791 + }, + { + "epoch": 0.07, + "learning_rate": 1.8546852549415556e-07, + "loss": 0.0692, + "step": 3792 + }, + { + "epoch": 0.07, + "learning_rate": 1.854646421498194e-07, + "loss": 0.3416, + "step": 3793 + }, + { + "epoch": 0.07, + "learning_rate": 1.8546075880548327e-07, + "loss": 0.298, + "step": 3794 + }, + { + "epoch": 0.07, + "learning_rate": 1.8545687546114712e-07, + "loss": 0.0547, + "step": 3795 + }, + { + "epoch": 0.07, + "learning_rate": 1.85452992116811e-07, + "loss": 0.0767, + "step": 3796 + }, + { + "epoch": 0.07, + "learning_rate": 1.8544910877247483e-07, + "loss": 0.0783, + "step": 3797 + }, + { + "epoch": 0.07, + "learning_rate": 1.854452254281387e-07, + "loss": 0.0585, + "step": 3798 + }, + { + "epoch": 0.07, + "learning_rate": 1.8544134208380255e-07, + "loss": 0.0927, + "step": 3799 + }, + { + "epoch": 0.07, + "learning_rate": 1.8543745873946642e-07, + "loss": 0.0743, + "step": 3800 + }, + { + "epoch": 0.07, + "learning_rate": 1.8543357539513027e-07, + "loss": 0.4671, + "step": 3801 + }, + { + "epoch": 0.07, + "learning_rate": 1.8542969205079414e-07, + "loss": 0.0532, + "step": 3802 + }, + { + "epoch": 0.07, + "learning_rate": 1.8542580870645798e-07, + "loss": 0.1302, + "step": 3803 + }, + { + "epoch": 0.07, + "learning_rate": 1.8542192536212185e-07, + "loss": 0.0535, + "step": 3804 + }, + { + "epoch": 0.07, + "learning_rate": 1.854180420177857e-07, + "loss": 0.0997, + "step": 3805 + }, + { + "epoch": 0.07, + "learning_rate": 1.8541415867344957e-07, + "loss": 0.0505, + "step": 3806 + }, + { + "epoch": 0.07, + "learning_rate": 1.8541027532911342e-07, + "loss": 0.0459, + "step": 3807 + }, + { + "epoch": 0.07, + "learning_rate": 1.854063919847773e-07, + "loss": 0.0744, + "step": 3808 + }, + { + "epoch": 0.07, + "learning_rate": 1.8540250864044113e-07, + "loss": 0.0403, + "step": 3809 + }, + { + "epoch": 0.07, + "learning_rate": 1.85398625296105e-07, + "loss": 0.1721, + "step": 3810 + }, + { + "epoch": 0.07, + "learning_rate": 1.8539474195176885e-07, + "loss": 0.0933, + "step": 3811 + }, + { + "epoch": 0.07, + "learning_rate": 1.8539085860743272e-07, + "loss": 0.0654, + "step": 3812 + }, + { + "epoch": 0.07, + "learning_rate": 1.8538697526309657e-07, + "loss": 0.1046, + "step": 3813 + }, + { + "epoch": 0.07, + "learning_rate": 1.8538309191876044e-07, + "loss": 0.406, + "step": 3814 + }, + { + "epoch": 0.07, + "learning_rate": 1.8537920857442428e-07, + "loss": 0.0439, + "step": 3815 + }, + { + "epoch": 0.07, + "learning_rate": 1.8537532523008815e-07, + "loss": 0.0601, + "step": 3816 + }, + { + "epoch": 0.07, + "learning_rate": 1.85371441885752e-07, + "loss": 0.1293, + "step": 3817 + }, + { + "epoch": 0.07, + "learning_rate": 1.8536755854141587e-07, + "loss": 0.317, + "step": 3818 + }, + { + "epoch": 0.07, + "learning_rate": 1.8536367519707972e-07, + "loss": 0.0486, + "step": 3819 + }, + { + "epoch": 0.07, + "learning_rate": 1.853597918527436e-07, + "loss": 0.3557, + "step": 3820 + }, + { + "epoch": 0.07, + "learning_rate": 1.8535590850840743e-07, + "loss": 0.0424, + "step": 3821 + }, + { + "epoch": 0.07, + "learning_rate": 1.853520251640713e-07, + "loss": 0.0833, + "step": 3822 + }, + { + "epoch": 0.07, + "learning_rate": 1.8534814181973515e-07, + "loss": 0.093, + "step": 3823 + }, + { + "epoch": 0.07, + "learning_rate": 1.8534425847539902e-07, + "loss": 0.0639, + "step": 3824 + }, + { + "epoch": 0.07, + "learning_rate": 1.8534037513106286e-07, + "loss": 0.1304, + "step": 3825 + }, + { + "epoch": 0.07, + "learning_rate": 1.853364917867267e-07, + "loss": 0.2327, + "step": 3826 + }, + { + "epoch": 0.07, + "learning_rate": 1.8533260844239058e-07, + "loss": 0.2347, + "step": 3827 + }, + { + "epoch": 0.07, + "learning_rate": 1.8532872509805443e-07, + "loss": 0.5184, + "step": 3828 + }, + { + "epoch": 0.07, + "learning_rate": 1.853248417537183e-07, + "loss": 0.2823, + "step": 3829 + }, + { + "epoch": 0.07, + "learning_rate": 1.8532095840938214e-07, + "loss": 0.3059, + "step": 3830 + }, + { + "epoch": 0.07, + "learning_rate": 1.8531707506504601e-07, + "loss": 0.0511, + "step": 3831 + }, + { + "epoch": 0.07, + "learning_rate": 1.8531319172070986e-07, + "loss": 0.0505, + "step": 3832 + }, + { + "epoch": 0.07, + "learning_rate": 1.8530930837637373e-07, + "loss": 0.0864, + "step": 3833 + }, + { + "epoch": 0.07, + "learning_rate": 1.8530542503203758e-07, + "loss": 0.5854, + "step": 3834 + }, + { + "epoch": 0.07, + "learning_rate": 1.8530154168770145e-07, + "loss": 0.0514, + "step": 3835 + }, + { + "epoch": 0.07, + "learning_rate": 1.852976583433653e-07, + "loss": 0.1429, + "step": 3836 + }, + { + "epoch": 0.07, + "learning_rate": 1.8529377499902916e-07, + "loss": 0.1117, + "step": 3837 + }, + { + "epoch": 0.07, + "learning_rate": 1.85289891654693e-07, + "loss": 0.1355, + "step": 3838 + }, + { + "epoch": 0.07, + "learning_rate": 1.8528600831035688e-07, + "loss": 0.1221, + "step": 3839 + }, + { + "epoch": 0.07, + "learning_rate": 1.8528212496602073e-07, + "loss": 0.0649, + "step": 3840 + }, + { + "epoch": 0.07, + "learning_rate": 1.852782416216846e-07, + "loss": 0.0621, + "step": 3841 + }, + { + "epoch": 0.07, + "learning_rate": 1.8527435827734844e-07, + "loss": 0.0817, + "step": 3842 + }, + { + "epoch": 0.07, + "learning_rate": 1.852704749330123e-07, + "loss": 0.077, + "step": 3843 + }, + { + "epoch": 0.07, + "learning_rate": 1.8526659158867616e-07, + "loss": 0.0719, + "step": 3844 + }, + { + "epoch": 0.07, + "learning_rate": 1.8526270824434003e-07, + "loss": 0.0953, + "step": 3845 + }, + { + "epoch": 0.07, + "learning_rate": 1.8525882490000387e-07, + "loss": 0.1136, + "step": 3846 + }, + { + "epoch": 0.07, + "learning_rate": 1.8525494155566775e-07, + "loss": 0.068, + "step": 3847 + }, + { + "epoch": 0.07, + "learning_rate": 1.852510582113316e-07, + "loss": 0.602, + "step": 3848 + }, + { + "epoch": 0.07, + "learning_rate": 1.8524717486699544e-07, + "loss": 0.3322, + "step": 3849 + }, + { + "epoch": 0.07, + "learning_rate": 1.852432915226593e-07, + "loss": 0.4865, + "step": 3850 + }, + { + "epoch": 0.07, + "learning_rate": 1.8523940817832315e-07, + "loss": 0.048, + "step": 3851 + }, + { + "epoch": 0.07, + "learning_rate": 1.8523552483398702e-07, + "loss": 0.083, + "step": 3852 + }, + { + "epoch": 0.07, + "learning_rate": 1.8523164148965087e-07, + "loss": 0.1473, + "step": 3853 + }, + { + "epoch": 0.07, + "learning_rate": 1.8522775814531474e-07, + "loss": 0.0664, + "step": 3854 + }, + { + "epoch": 0.07, + "learning_rate": 1.8522387480097859e-07, + "loss": 0.073, + "step": 3855 + }, + { + "epoch": 0.07, + "learning_rate": 1.8521999145664243e-07, + "loss": 0.0617, + "step": 3856 + }, + { + "epoch": 0.07, + "learning_rate": 1.852161081123063e-07, + "loss": 0.31, + "step": 3857 + }, + { + "epoch": 0.07, + "learning_rate": 1.8521222476797015e-07, + "loss": 0.0555, + "step": 3858 + }, + { + "epoch": 0.07, + "learning_rate": 1.8520834142363402e-07, + "loss": 0.3564, + "step": 3859 + }, + { + "epoch": 0.07, + "learning_rate": 1.8520445807929786e-07, + "loss": 0.0639, + "step": 3860 + }, + { + "epoch": 0.07, + "learning_rate": 1.8520057473496174e-07, + "loss": 0.066, + "step": 3861 + }, + { + "epoch": 0.07, + "learning_rate": 1.8519669139062558e-07, + "loss": 0.1939, + "step": 3862 + }, + { + "epoch": 0.07, + "learning_rate": 1.8519280804628945e-07, + "loss": 0.0729, + "step": 3863 + }, + { + "epoch": 0.07, + "learning_rate": 1.851889247019533e-07, + "loss": 0.5595, + "step": 3864 + }, + { + "epoch": 0.07, + "learning_rate": 1.8518504135761717e-07, + "loss": 0.0602, + "step": 3865 + }, + { + "epoch": 0.07, + "learning_rate": 1.85181158013281e-07, + "loss": 0.1928, + "step": 3866 + }, + { + "epoch": 0.08, + "learning_rate": 1.8517727466894488e-07, + "loss": 0.0989, + "step": 3867 + }, + { + "epoch": 0.08, + "learning_rate": 1.8517339132460873e-07, + "loss": 0.1012, + "step": 3868 + }, + { + "epoch": 0.08, + "learning_rate": 1.851695079802726e-07, + "loss": 0.3194, + "step": 3869 + }, + { + "epoch": 0.08, + "learning_rate": 1.8516562463593645e-07, + "loss": 0.5534, + "step": 3870 + }, + { + "epoch": 0.08, + "learning_rate": 1.8516174129160032e-07, + "loss": 0.5543, + "step": 3871 + }, + { + "epoch": 0.08, + "learning_rate": 1.8515785794726416e-07, + "loss": 0.2893, + "step": 3872 + }, + { + "epoch": 0.08, + "learning_rate": 1.8515397460292803e-07, + "loss": 0.0769, + "step": 3873 + }, + { + "epoch": 0.08, + "learning_rate": 1.8515009125859188e-07, + "loss": 0.0542, + "step": 3874 + }, + { + "epoch": 0.08, + "learning_rate": 1.8514620791425575e-07, + "loss": 0.4114, + "step": 3875 + }, + { + "epoch": 0.08, + "learning_rate": 1.851423245699196e-07, + "loss": 0.0705, + "step": 3876 + }, + { + "epoch": 0.08, + "learning_rate": 1.8513844122558347e-07, + "loss": 0.0533, + "step": 3877 + }, + { + "epoch": 0.08, + "learning_rate": 1.851345578812473e-07, + "loss": 0.1169, + "step": 3878 + }, + { + "epoch": 0.08, + "learning_rate": 1.8513067453691118e-07, + "loss": 0.0778, + "step": 3879 + }, + { + "epoch": 0.08, + "learning_rate": 1.8512679119257503e-07, + "loss": 0.1161, + "step": 3880 + }, + { + "epoch": 0.08, + "learning_rate": 1.851229078482389e-07, + "loss": 0.0844, + "step": 3881 + }, + { + "epoch": 0.08, + "learning_rate": 1.8511902450390275e-07, + "loss": 0.211, + "step": 3882 + }, + { + "epoch": 0.08, + "learning_rate": 1.8511514115956662e-07, + "loss": 0.1291, + "step": 3883 + }, + { + "epoch": 0.08, + "learning_rate": 1.8511125781523046e-07, + "loss": 0.103, + "step": 3884 + }, + { + "epoch": 0.08, + "learning_rate": 1.8510737447089433e-07, + "loss": 0.0737, + "step": 3885 + }, + { + "epoch": 0.08, + "learning_rate": 1.8510349112655818e-07, + "loss": 0.0747, + "step": 3886 + }, + { + "epoch": 0.08, + "learning_rate": 1.8509960778222205e-07, + "loss": 0.2548, + "step": 3887 + }, + { + "epoch": 0.08, + "learning_rate": 1.850957244378859e-07, + "loss": 0.2425, + "step": 3888 + }, + { + "epoch": 0.08, + "learning_rate": 1.8509184109354977e-07, + "loss": 0.1299, + "step": 3889 + }, + { + "epoch": 0.08, + "learning_rate": 1.850879577492136e-07, + "loss": 0.0836, + "step": 3890 + }, + { + "epoch": 0.08, + "learning_rate": 1.8508407440487748e-07, + "loss": 0.0572, + "step": 3891 + }, + { + "epoch": 0.08, + "learning_rate": 1.8508019106054133e-07, + "loss": 0.2853, + "step": 3892 + }, + { + "epoch": 0.08, + "learning_rate": 1.850763077162052e-07, + "loss": 0.0908, + "step": 3893 + }, + { + "epoch": 0.08, + "learning_rate": 1.8507242437186904e-07, + "loss": 0.0749, + "step": 3894 + }, + { + "epoch": 0.08, + "learning_rate": 1.8506854102753292e-07, + "loss": 0.0625, + "step": 3895 + }, + { + "epoch": 0.08, + "learning_rate": 1.8506465768319676e-07, + "loss": 0.0619, + "step": 3896 + }, + { + "epoch": 0.08, + "learning_rate": 1.8506077433886063e-07, + "loss": 0.0865, + "step": 3897 + }, + { + "epoch": 0.08, + "learning_rate": 1.8505689099452448e-07, + "loss": 0.1022, + "step": 3898 + }, + { + "epoch": 0.08, + "learning_rate": 1.8505300765018835e-07, + "loss": 0.1581, + "step": 3899 + }, + { + "epoch": 0.08, + "learning_rate": 1.850491243058522e-07, + "loss": 0.1223, + "step": 3900 + }, + { + "epoch": 0.08, + "learning_rate": 1.8504524096151606e-07, + "loss": 0.1911, + "step": 3901 + }, + { + "epoch": 0.08, + "learning_rate": 1.850413576171799e-07, + "loss": 0.1102, + "step": 3902 + }, + { + "epoch": 0.08, + "learning_rate": 1.8503747427284378e-07, + "loss": 0.0431, + "step": 3903 + }, + { + "epoch": 0.08, + "learning_rate": 1.8503359092850763e-07, + "loss": 0.291, + "step": 3904 + }, + { + "epoch": 0.08, + "learning_rate": 1.850297075841715e-07, + "loss": 0.0953, + "step": 3905 + }, + { + "epoch": 0.08, + "learning_rate": 1.8502582423983534e-07, + "loss": 0.0512, + "step": 3906 + }, + { + "epoch": 0.08, + "learning_rate": 1.850219408954992e-07, + "loss": 0.0674, + "step": 3907 + }, + { + "epoch": 0.08, + "learning_rate": 1.8501805755116303e-07, + "loss": 0.1433, + "step": 3908 + }, + { + "epoch": 0.08, + "learning_rate": 1.850141742068269e-07, + "loss": 0.0784, + "step": 3909 + }, + { + "epoch": 0.08, + "learning_rate": 1.8501029086249075e-07, + "loss": 0.4043, + "step": 3910 + }, + { + "epoch": 0.08, + "learning_rate": 1.8500640751815462e-07, + "loss": 0.1766, + "step": 3911 + }, + { + "epoch": 0.08, + "learning_rate": 1.8500252417381847e-07, + "loss": 0.0488, + "step": 3912 + }, + { + "epoch": 0.08, + "learning_rate": 1.8499864082948234e-07, + "loss": 0.0485, + "step": 3913 + }, + { + "epoch": 0.08, + "learning_rate": 1.8499475748514618e-07, + "loss": 0.0419, + "step": 3914 + }, + { + "epoch": 0.08, + "learning_rate": 1.8499087414081005e-07, + "loss": 0.0606, + "step": 3915 + }, + { + "epoch": 0.08, + "learning_rate": 1.849869907964739e-07, + "loss": 0.3248, + "step": 3916 + }, + { + "epoch": 0.08, + "learning_rate": 1.8498310745213777e-07, + "loss": 0.3597, + "step": 3917 + }, + { + "epoch": 0.08, + "learning_rate": 1.8497922410780162e-07, + "loss": 0.0713, + "step": 3918 + }, + { + "epoch": 0.08, + "learning_rate": 1.849753407634655e-07, + "loss": 0.2372, + "step": 3919 + }, + { + "epoch": 0.08, + "learning_rate": 1.8497145741912933e-07, + "loss": 0.0405, + "step": 3920 + }, + { + "epoch": 0.08, + "learning_rate": 1.849675740747932e-07, + "loss": 0.0487, + "step": 3921 + }, + { + "epoch": 0.08, + "learning_rate": 1.8496369073045705e-07, + "loss": 0.0983, + "step": 3922 + }, + { + "epoch": 0.08, + "learning_rate": 1.8495980738612092e-07, + "loss": 0.1824, + "step": 3923 + }, + { + "epoch": 0.08, + "learning_rate": 1.8495592404178476e-07, + "loss": 0.0486, + "step": 3924 + }, + { + "epoch": 0.08, + "learning_rate": 1.8495204069744864e-07, + "loss": 0.399, + "step": 3925 + }, + { + "epoch": 0.08, + "learning_rate": 1.8494815735311248e-07, + "loss": 0.0553, + "step": 3926 + }, + { + "epoch": 0.08, + "learning_rate": 1.8494427400877635e-07, + "loss": 0.0488, + "step": 3927 + }, + { + "epoch": 0.08, + "learning_rate": 1.849403906644402e-07, + "loss": 0.1803, + "step": 3928 + }, + { + "epoch": 0.08, + "learning_rate": 1.8493650732010407e-07, + "loss": 0.272, + "step": 3929 + }, + { + "epoch": 0.08, + "learning_rate": 1.8493262397576791e-07, + "loss": 0.1328, + "step": 3930 + }, + { + "epoch": 0.08, + "learning_rate": 1.8492874063143179e-07, + "loss": 0.09, + "step": 3931 + }, + { + "epoch": 0.08, + "learning_rate": 1.8492485728709563e-07, + "loss": 0.0464, + "step": 3932 + }, + { + "epoch": 0.08, + "learning_rate": 1.849209739427595e-07, + "loss": 0.0718, + "step": 3933 + }, + { + "epoch": 0.08, + "learning_rate": 1.8491709059842335e-07, + "loss": 0.0926, + "step": 3934 + }, + { + "epoch": 0.08, + "learning_rate": 1.8491320725408722e-07, + "loss": 0.1584, + "step": 3935 + }, + { + "epoch": 0.08, + "learning_rate": 1.8490932390975106e-07, + "loss": 0.0481, + "step": 3936 + }, + { + "epoch": 0.08, + "learning_rate": 1.8490544056541494e-07, + "loss": 0.529, + "step": 3937 + }, + { + "epoch": 0.08, + "learning_rate": 1.8490155722107878e-07, + "loss": 0.0529, + "step": 3938 + }, + { + "epoch": 0.08, + "learning_rate": 1.8489767387674265e-07, + "loss": 0.0619, + "step": 3939 + }, + { + "epoch": 0.08, + "learning_rate": 1.848937905324065e-07, + "loss": 0.4439, + "step": 3940 + }, + { + "epoch": 0.08, + "learning_rate": 1.8488990718807037e-07, + "loss": 0.0467, + "step": 3941 + }, + { + "epoch": 0.08, + "learning_rate": 1.848860238437342e-07, + "loss": 0.2219, + "step": 3942 + }, + { + "epoch": 0.08, + "learning_rate": 1.8488214049939808e-07, + "loss": 0.2818, + "step": 3943 + }, + { + "epoch": 0.08, + "learning_rate": 1.8487825715506193e-07, + "loss": 0.5155, + "step": 3944 + }, + { + "epoch": 0.08, + "learning_rate": 1.848743738107258e-07, + "loss": 0.6509, + "step": 3945 + }, + { + "epoch": 0.08, + "learning_rate": 1.8487049046638965e-07, + "loss": 0.3586, + "step": 3946 + }, + { + "epoch": 0.08, + "learning_rate": 1.8486660712205352e-07, + "loss": 0.0544, + "step": 3947 + }, + { + "epoch": 0.08, + "learning_rate": 1.8486272377771736e-07, + "loss": 0.5545, + "step": 3948 + }, + { + "epoch": 0.08, + "learning_rate": 1.8485884043338123e-07, + "loss": 0.1714, + "step": 3949 + }, + { + "epoch": 0.08, + "learning_rate": 1.8485495708904508e-07, + "loss": 0.0829, + "step": 3950 + }, + { + "epoch": 0.08, + "learning_rate": 1.8485107374470895e-07, + "loss": 0.2577, + "step": 3951 + }, + { + "epoch": 0.08, + "learning_rate": 1.848471904003728e-07, + "loss": 0.5738, + "step": 3952 + }, + { + "epoch": 0.08, + "learning_rate": 1.8484330705603667e-07, + "loss": 0.0466, + "step": 3953 + }, + { + "epoch": 0.08, + "learning_rate": 1.848394237117005e-07, + "loss": 0.0373, + "step": 3954 + }, + { + "epoch": 0.08, + "learning_rate": 1.8483554036736438e-07, + "loss": 0.0456, + "step": 3955 + }, + { + "epoch": 0.08, + "learning_rate": 1.8483165702302823e-07, + "loss": 0.0484, + "step": 3956 + }, + { + "epoch": 0.08, + "learning_rate": 1.848277736786921e-07, + "loss": 0.0519, + "step": 3957 + }, + { + "epoch": 0.08, + "learning_rate": 1.8482389033435595e-07, + "loss": 0.122, + "step": 3958 + }, + { + "epoch": 0.08, + "learning_rate": 1.8482000699001982e-07, + "loss": 0.2802, + "step": 3959 + }, + { + "epoch": 0.08, + "learning_rate": 1.8481612364568366e-07, + "loss": 0.3189, + "step": 3960 + }, + { + "epoch": 0.08, + "learning_rate": 1.8481224030134753e-07, + "loss": 0.11, + "step": 3961 + }, + { + "epoch": 0.08, + "learning_rate": 1.8480835695701138e-07, + "loss": 0.0464, + "step": 3962 + }, + { + "epoch": 0.08, + "learning_rate": 1.8480447361267525e-07, + "loss": 0.0665, + "step": 3963 + }, + { + "epoch": 0.08, + "learning_rate": 1.848005902683391e-07, + "loss": 0.0556, + "step": 3964 + }, + { + "epoch": 0.08, + "learning_rate": 1.8479670692400294e-07, + "loss": 0.0698, + "step": 3965 + }, + { + "epoch": 0.08, + "learning_rate": 1.8479282357966678e-07, + "loss": 0.0675, + "step": 3966 + }, + { + "epoch": 0.08, + "learning_rate": 1.8478894023533066e-07, + "loss": 0.076, + "step": 3967 + }, + { + "epoch": 0.08, + "learning_rate": 1.847850568909945e-07, + "loss": 0.0615, + "step": 3968 + }, + { + "epoch": 0.08, + "learning_rate": 1.8478117354665837e-07, + "loss": 0.1589, + "step": 3969 + }, + { + "epoch": 0.08, + "learning_rate": 1.8477729020232222e-07, + "loss": 0.0997, + "step": 3970 + }, + { + "epoch": 0.08, + "learning_rate": 1.847734068579861e-07, + "loss": 0.0469, + "step": 3971 + }, + { + "epoch": 0.08, + "learning_rate": 1.8476952351364993e-07, + "loss": 0.2078, + "step": 3972 + }, + { + "epoch": 0.08, + "learning_rate": 1.847656401693138e-07, + "loss": 0.1151, + "step": 3973 + }, + { + "epoch": 0.08, + "learning_rate": 1.8476175682497765e-07, + "loss": 0.3096, + "step": 3974 + }, + { + "epoch": 0.08, + "learning_rate": 1.8475787348064152e-07, + "loss": 0.1868, + "step": 3975 + }, + { + "epoch": 0.08, + "learning_rate": 1.8475399013630537e-07, + "loss": 0.0471, + "step": 3976 + }, + { + "epoch": 0.08, + "learning_rate": 1.8475010679196924e-07, + "loss": 0.0568, + "step": 3977 + }, + { + "epoch": 0.08, + "learning_rate": 1.8474622344763308e-07, + "loss": 0.0387, + "step": 3978 + }, + { + "epoch": 0.08, + "learning_rate": 1.8474234010329696e-07, + "loss": 0.2708, + "step": 3979 + }, + { + "epoch": 0.08, + "learning_rate": 1.847384567589608e-07, + "loss": 0.4803, + "step": 3980 + }, + { + "epoch": 0.08, + "learning_rate": 1.8473457341462467e-07, + "loss": 0.049, + "step": 3981 + }, + { + "epoch": 0.08, + "learning_rate": 1.8473069007028852e-07, + "loss": 0.2609, + "step": 3982 + }, + { + "epoch": 0.08, + "learning_rate": 1.847268067259524e-07, + "loss": 0.0454, + "step": 3983 + }, + { + "epoch": 0.08, + "learning_rate": 1.8472292338161623e-07, + "loss": 0.093, + "step": 3984 + }, + { + "epoch": 0.08, + "learning_rate": 1.847190400372801e-07, + "loss": 0.0379, + "step": 3985 + }, + { + "epoch": 0.08, + "learning_rate": 1.8471515669294395e-07, + "loss": 0.114, + "step": 3986 + }, + { + "epoch": 0.08, + "learning_rate": 1.8471127334860782e-07, + "loss": 0.0988, + "step": 3987 + }, + { + "epoch": 0.08, + "learning_rate": 1.8470739000427167e-07, + "loss": 0.238, + "step": 3988 + }, + { + "epoch": 0.08, + "learning_rate": 1.8470350665993554e-07, + "loss": 0.123, + "step": 3989 + }, + { + "epoch": 0.08, + "learning_rate": 1.8469962331559938e-07, + "loss": 0.294, + "step": 3990 + }, + { + "epoch": 0.08, + "learning_rate": 1.8469573997126325e-07, + "loss": 0.4788, + "step": 3991 + }, + { + "epoch": 0.08, + "learning_rate": 1.846918566269271e-07, + "loss": 0.1493, + "step": 3992 + }, + { + "epoch": 0.08, + "learning_rate": 1.8468797328259097e-07, + "loss": 0.0985, + "step": 3993 + }, + { + "epoch": 0.08, + "learning_rate": 1.8468408993825482e-07, + "loss": 0.0932, + "step": 3994 + }, + { + "epoch": 0.08, + "learning_rate": 1.846802065939187e-07, + "loss": 0.0508, + "step": 3995 + }, + { + "epoch": 0.08, + "learning_rate": 1.8467632324958253e-07, + "loss": 0.0644, + "step": 3996 + }, + { + "epoch": 0.08, + "learning_rate": 1.846724399052464e-07, + "loss": 0.0505, + "step": 3997 + }, + { + "epoch": 0.08, + "learning_rate": 1.8466855656091025e-07, + "loss": 0.1542, + "step": 3998 + }, + { + "epoch": 0.08, + "learning_rate": 1.8466467321657412e-07, + "loss": 0.2926, + "step": 3999 + }, + { + "epoch": 0.08, + "learning_rate": 1.8466078987223796e-07, + "loss": 0.0517, + "step": 4000 + }, + { + "epoch": 0.08, + "learning_rate": 1.8465690652790184e-07, + "loss": 0.0446, + "step": 4001 + }, + { + "epoch": 0.08, + "learning_rate": 1.8465302318356568e-07, + "loss": 0.5218, + "step": 4002 + }, + { + "epoch": 0.08, + "learning_rate": 1.8464913983922953e-07, + "loss": 0.7758, + "step": 4003 + }, + { + "epoch": 0.08, + "learning_rate": 1.846452564948934e-07, + "loss": 0.0405, + "step": 4004 + }, + { + "epoch": 0.08, + "learning_rate": 1.8464137315055724e-07, + "loss": 0.4113, + "step": 4005 + }, + { + "epoch": 0.08, + "learning_rate": 1.8463748980622111e-07, + "loss": 0.0748, + "step": 4006 + }, + { + "epoch": 0.08, + "learning_rate": 1.8463360646188496e-07, + "loss": 0.2508, + "step": 4007 + }, + { + "epoch": 0.08, + "learning_rate": 1.8462972311754883e-07, + "loss": 0.2445, + "step": 4008 + }, + { + "epoch": 0.08, + "learning_rate": 1.8462583977321268e-07, + "loss": 0.0379, + "step": 4009 + }, + { + "epoch": 0.08, + "learning_rate": 1.8462195642887655e-07, + "loss": 0.0449, + "step": 4010 + }, + { + "epoch": 0.08, + "learning_rate": 1.846180730845404e-07, + "loss": 0.3015, + "step": 4011 + }, + { + "epoch": 0.08, + "learning_rate": 1.8461418974020426e-07, + "loss": 0.0413, + "step": 4012 + }, + { + "epoch": 0.08, + "learning_rate": 1.846103063958681e-07, + "loss": 0.1001, + "step": 4013 + }, + { + "epoch": 0.08, + "learning_rate": 1.8460642305153198e-07, + "loss": 0.0931, + "step": 4014 + }, + { + "epoch": 0.08, + "learning_rate": 1.8460253970719583e-07, + "loss": 0.0616, + "step": 4015 + }, + { + "epoch": 0.08, + "learning_rate": 1.845986563628597e-07, + "loss": 0.1241, + "step": 4016 + }, + { + "epoch": 0.08, + "learning_rate": 1.8459477301852354e-07, + "loss": 0.0994, + "step": 4017 + }, + { + "epoch": 0.08, + "learning_rate": 1.8459088967418741e-07, + "loss": 0.0891, + "step": 4018 + }, + { + "epoch": 0.08, + "learning_rate": 1.8458700632985126e-07, + "loss": 0.2994, + "step": 4019 + }, + { + "epoch": 0.08, + "learning_rate": 1.8458312298551513e-07, + "loss": 0.0729, + "step": 4020 + }, + { + "epoch": 0.08, + "learning_rate": 1.8457923964117897e-07, + "loss": 0.0803, + "step": 4021 + }, + { + "epoch": 0.08, + "learning_rate": 1.8457535629684285e-07, + "loss": 0.1287, + "step": 4022 + }, + { + "epoch": 0.08, + "learning_rate": 1.845714729525067e-07, + "loss": 0.8665, + "step": 4023 + }, + { + "epoch": 0.08, + "learning_rate": 1.8456758960817054e-07, + "loss": 0.0814, + "step": 4024 + }, + { + "epoch": 0.08, + "learning_rate": 1.845637062638344e-07, + "loss": 0.0424, + "step": 4025 + }, + { + "epoch": 0.08, + "learning_rate": 1.8455982291949825e-07, + "loss": 0.2, + "step": 4026 + }, + { + "epoch": 0.08, + "learning_rate": 1.8455593957516212e-07, + "loss": 0.1788, + "step": 4027 + }, + { + "epoch": 0.08, + "learning_rate": 1.8455205623082597e-07, + "loss": 0.0443, + "step": 4028 + }, + { + "epoch": 0.08, + "learning_rate": 1.8454817288648984e-07, + "loss": 0.1043, + "step": 4029 + }, + { + "epoch": 0.08, + "learning_rate": 1.8454428954215369e-07, + "loss": 0.0551, + "step": 4030 + }, + { + "epoch": 0.08, + "learning_rate": 1.8454040619781756e-07, + "loss": 0.0516, + "step": 4031 + }, + { + "epoch": 0.08, + "learning_rate": 1.845365228534814e-07, + "loss": 0.0492, + "step": 4032 + }, + { + "epoch": 0.08, + "learning_rate": 1.8453263950914525e-07, + "loss": 0.1826, + "step": 4033 + }, + { + "epoch": 0.08, + "learning_rate": 1.8452875616480912e-07, + "loss": 0.0637, + "step": 4034 + }, + { + "epoch": 0.08, + "learning_rate": 1.8452487282047296e-07, + "loss": 0.0833, + "step": 4035 + }, + { + "epoch": 0.08, + "learning_rate": 1.8452098947613684e-07, + "loss": 0.0441, + "step": 4036 + }, + { + "epoch": 0.08, + "learning_rate": 1.8451710613180068e-07, + "loss": 0.3287, + "step": 4037 + }, + { + "epoch": 0.08, + "learning_rate": 1.8451322278746455e-07, + "loss": 0.5236, + "step": 4038 + }, + { + "epoch": 0.08, + "learning_rate": 1.845093394431284e-07, + "loss": 0.0371, + "step": 4039 + }, + { + "epoch": 0.08, + "learning_rate": 1.8450545609879227e-07, + "loss": 0.0631, + "step": 4040 + }, + { + "epoch": 0.08, + "learning_rate": 1.8450157275445611e-07, + "loss": 0.2685, + "step": 4041 + }, + { + "epoch": 0.08, + "learning_rate": 1.8449768941011998e-07, + "loss": 0.1595, + "step": 4042 + }, + { + "epoch": 0.08, + "learning_rate": 1.8449380606578383e-07, + "loss": 0.0732, + "step": 4043 + }, + { + "epoch": 0.08, + "learning_rate": 1.844899227214477e-07, + "loss": 0.0604, + "step": 4044 + }, + { + "epoch": 0.08, + "learning_rate": 1.8448603937711155e-07, + "loss": 0.4328, + "step": 4045 + }, + { + "epoch": 0.08, + "learning_rate": 1.8448215603277542e-07, + "loss": 0.0899, + "step": 4046 + }, + { + "epoch": 0.08, + "learning_rate": 1.8447827268843926e-07, + "loss": 0.0836, + "step": 4047 + }, + { + "epoch": 0.08, + "learning_rate": 1.8447438934410313e-07, + "loss": 0.0941, + "step": 4048 + }, + { + "epoch": 0.08, + "learning_rate": 1.8447050599976698e-07, + "loss": 0.0404, + "step": 4049 + }, + { + "epoch": 0.08, + "learning_rate": 1.8446662265543085e-07, + "loss": 0.0435, + "step": 4050 + }, + { + "epoch": 0.08, + "learning_rate": 1.844627393110947e-07, + "loss": 0.067, + "step": 4051 + }, + { + "epoch": 0.08, + "learning_rate": 1.8445885596675857e-07, + "loss": 0.7323, + "step": 4052 + }, + { + "epoch": 0.08, + "learning_rate": 1.844549726224224e-07, + "loss": 0.0664, + "step": 4053 + }, + { + "epoch": 0.08, + "learning_rate": 1.8445108927808628e-07, + "loss": 0.0361, + "step": 4054 + }, + { + "epoch": 0.08, + "learning_rate": 1.8444720593375013e-07, + "loss": 0.0619, + "step": 4055 + }, + { + "epoch": 0.08, + "learning_rate": 1.84443322589414e-07, + "loss": 0.1018, + "step": 4056 + }, + { + "epoch": 0.08, + "learning_rate": 1.8443943924507785e-07, + "loss": 0.0558, + "step": 4057 + }, + { + "epoch": 0.08, + "learning_rate": 1.8443555590074172e-07, + "loss": 0.0354, + "step": 4058 + }, + { + "epoch": 0.08, + "learning_rate": 1.8443167255640556e-07, + "loss": 0.0432, + "step": 4059 + }, + { + "epoch": 0.08, + "learning_rate": 1.8442778921206943e-07, + "loss": 0.058, + "step": 4060 + }, + { + "epoch": 0.08, + "learning_rate": 1.8442390586773328e-07, + "loss": 0.4319, + "step": 4061 + }, + { + "epoch": 0.08, + "learning_rate": 1.8442002252339715e-07, + "loss": 0.1256, + "step": 4062 + }, + { + "epoch": 0.08, + "learning_rate": 1.84416139179061e-07, + "loss": 0.0357, + "step": 4063 + }, + { + "epoch": 0.08, + "learning_rate": 1.8441225583472487e-07, + "loss": 0.1352, + "step": 4064 + }, + { + "epoch": 0.08, + "learning_rate": 1.844083724903887e-07, + "loss": 0.0653, + "step": 4065 + }, + { + "epoch": 0.08, + "learning_rate": 1.8440448914605258e-07, + "loss": 0.0342, + "step": 4066 + }, + { + "epoch": 0.08, + "learning_rate": 1.8440060580171643e-07, + "loss": 0.0374, + "step": 4067 + }, + { + "epoch": 0.08, + "learning_rate": 1.843967224573803e-07, + "loss": 0.3239, + "step": 4068 + }, + { + "epoch": 0.08, + "learning_rate": 1.8439283911304414e-07, + "loss": 0.0461, + "step": 4069 + }, + { + "epoch": 0.08, + "learning_rate": 1.8438895576870802e-07, + "loss": 0.4298, + "step": 4070 + }, + { + "epoch": 0.08, + "learning_rate": 1.8438507242437186e-07, + "loss": 0.13, + "step": 4071 + }, + { + "epoch": 0.08, + "learning_rate": 1.8438118908003573e-07, + "loss": 0.1471, + "step": 4072 + }, + { + "epoch": 0.08, + "learning_rate": 1.8437730573569958e-07, + "loss": 0.0464, + "step": 4073 + }, + { + "epoch": 0.08, + "learning_rate": 1.8437342239136345e-07, + "loss": 0.1025, + "step": 4074 + }, + { + "epoch": 0.08, + "learning_rate": 1.843695390470273e-07, + "loss": 0.0353, + "step": 4075 + }, + { + "epoch": 0.08, + "learning_rate": 1.8436565570269117e-07, + "loss": 0.1286, + "step": 4076 + }, + { + "epoch": 0.08, + "learning_rate": 1.84361772358355e-07, + "loss": 0.5532, + "step": 4077 + }, + { + "epoch": 0.08, + "learning_rate": 1.8435788901401888e-07, + "loss": 0.0472, + "step": 4078 + }, + { + "epoch": 0.08, + "learning_rate": 1.8435400566968273e-07, + "loss": 0.2578, + "step": 4079 + }, + { + "epoch": 0.08, + "learning_rate": 1.843501223253466e-07, + "loss": 0.0507, + "step": 4080 + }, + { + "epoch": 0.08, + "learning_rate": 1.8434623898101042e-07, + "loss": 0.062, + "step": 4081 + }, + { + "epoch": 0.08, + "learning_rate": 1.843423556366743e-07, + "loss": 0.041, + "step": 4082 + }, + { + "epoch": 0.08, + "learning_rate": 1.8433847229233813e-07, + "loss": 0.0511, + "step": 4083 + }, + { + "epoch": 0.08, + "learning_rate": 1.84334588948002e-07, + "loss": 0.0699, + "step": 4084 + }, + { + "epoch": 0.08, + "learning_rate": 1.8433070560366585e-07, + "loss": 0.0437, + "step": 4085 + }, + { + "epoch": 0.08, + "learning_rate": 1.8432682225932972e-07, + "loss": 0.0657, + "step": 4086 + }, + { + "epoch": 0.08, + "learning_rate": 1.8432293891499357e-07, + "loss": 0.0522, + "step": 4087 + }, + { + "epoch": 0.08, + "learning_rate": 1.8431905557065744e-07, + "loss": 0.0686, + "step": 4088 + }, + { + "epoch": 0.08, + "learning_rate": 1.8431517222632128e-07, + "loss": 0.0397, + "step": 4089 + }, + { + "epoch": 0.08, + "learning_rate": 1.8431128888198515e-07, + "loss": 0.2543, + "step": 4090 + }, + { + "epoch": 0.08, + "learning_rate": 1.84307405537649e-07, + "loss": 0.2334, + "step": 4091 + }, + { + "epoch": 0.08, + "learning_rate": 1.8430352219331287e-07, + "loss": 0.066, + "step": 4092 + }, + { + "epoch": 0.08, + "learning_rate": 1.8429963884897672e-07, + "loss": 0.2195, + "step": 4093 + }, + { + "epoch": 0.08, + "learning_rate": 1.842957555046406e-07, + "loss": 0.5811, + "step": 4094 + }, + { + "epoch": 0.08, + "learning_rate": 1.8429187216030443e-07, + "loss": 0.0552, + "step": 4095 + }, + { + "epoch": 0.08, + "learning_rate": 1.842879888159683e-07, + "loss": 0.1371, + "step": 4096 + }, + { + "epoch": 0.08, + "learning_rate": 1.8428410547163215e-07, + "loss": 0.0745, + "step": 4097 + }, + { + "epoch": 0.08, + "learning_rate": 1.8428022212729602e-07, + "loss": 0.1314, + "step": 4098 + }, + { + "epoch": 0.08, + "learning_rate": 1.8427633878295986e-07, + "loss": 0.0368, + "step": 4099 + }, + { + "epoch": 0.08, + "learning_rate": 1.8427245543862374e-07, + "loss": 0.1373, + "step": 4100 + }, + { + "epoch": 0.08, + "learning_rate": 1.8426857209428758e-07, + "loss": 0.0348, + "step": 4101 + }, + { + "epoch": 0.08, + "learning_rate": 1.8426468874995145e-07, + "loss": 0.391, + "step": 4102 + }, + { + "epoch": 0.08, + "learning_rate": 1.842608054056153e-07, + "loss": 0.1885, + "step": 4103 + }, + { + "epoch": 0.08, + "learning_rate": 1.8425692206127917e-07, + "loss": 0.0367, + "step": 4104 + }, + { + "epoch": 0.08, + "learning_rate": 1.8425303871694301e-07, + "loss": 0.2219, + "step": 4105 + }, + { + "epoch": 0.08, + "learning_rate": 1.8424915537260689e-07, + "loss": 0.0325, + "step": 4106 + }, + { + "epoch": 0.08, + "learning_rate": 1.8424527202827073e-07, + "loss": 0.1022, + "step": 4107 + }, + { + "epoch": 0.08, + "learning_rate": 1.842413886839346e-07, + "loss": 0.1106, + "step": 4108 + }, + { + "epoch": 0.08, + "learning_rate": 1.8423750533959845e-07, + "loss": 0.0516, + "step": 4109 + }, + { + "epoch": 0.08, + "learning_rate": 1.8423362199526232e-07, + "loss": 0.0339, + "step": 4110 + }, + { + "epoch": 0.08, + "learning_rate": 1.8422973865092616e-07, + "loss": 0.0357, + "step": 4111 + }, + { + "epoch": 0.08, + "learning_rate": 1.8422585530659004e-07, + "loss": 0.1516, + "step": 4112 + }, + { + "epoch": 0.08, + "learning_rate": 1.8422197196225388e-07, + "loss": 0.1725, + "step": 4113 + }, + { + "epoch": 0.08, + "learning_rate": 1.8421808861791775e-07, + "loss": 0.1325, + "step": 4114 + }, + { + "epoch": 0.08, + "learning_rate": 1.842142052735816e-07, + "loss": 0.0456, + "step": 4115 + }, + { + "epoch": 0.08, + "learning_rate": 1.8421032192924547e-07, + "loss": 0.0434, + "step": 4116 + }, + { + "epoch": 0.08, + "learning_rate": 1.8420643858490931e-07, + "loss": 0.2929, + "step": 4117 + }, + { + "epoch": 0.08, + "learning_rate": 1.8420255524057318e-07, + "loss": 0.0572, + "step": 4118 + }, + { + "epoch": 0.08, + "learning_rate": 1.8419867189623703e-07, + "loss": 0.0566, + "step": 4119 + }, + { + "epoch": 0.08, + "learning_rate": 1.841947885519009e-07, + "loss": 0.19, + "step": 4120 + }, + { + "epoch": 0.08, + "learning_rate": 1.8419090520756475e-07, + "loss": 0.0606, + "step": 4121 + }, + { + "epoch": 0.08, + "learning_rate": 1.8418702186322862e-07, + "loss": 0.0682, + "step": 4122 + }, + { + "epoch": 0.08, + "learning_rate": 1.8418313851889246e-07, + "loss": 0.0432, + "step": 4123 + }, + { + "epoch": 0.08, + "learning_rate": 1.8417925517455633e-07, + "loss": 0.0876, + "step": 4124 + }, + { + "epoch": 0.08, + "learning_rate": 1.8417537183022018e-07, + "loss": 0.0651, + "step": 4125 + }, + { + "epoch": 0.08, + "learning_rate": 1.8417148848588405e-07, + "loss": 0.1083, + "step": 4126 + }, + { + "epoch": 0.08, + "learning_rate": 1.841676051415479e-07, + "loss": 0.0755, + "step": 4127 + }, + { + "epoch": 0.08, + "learning_rate": 1.8416372179721177e-07, + "loss": 0.1544, + "step": 4128 + }, + { + "epoch": 0.08, + "learning_rate": 1.841598384528756e-07, + "loss": 0.0446, + "step": 4129 + }, + { + "epoch": 0.08, + "learning_rate": 1.8415595510853948e-07, + "loss": 0.2295, + "step": 4130 + }, + { + "epoch": 0.08, + "learning_rate": 1.8415207176420333e-07, + "loss": 0.1914, + "step": 4131 + }, + { + "epoch": 0.08, + "learning_rate": 1.841481884198672e-07, + "loss": 0.2042, + "step": 4132 + }, + { + "epoch": 0.08, + "learning_rate": 1.8414430507553105e-07, + "loss": 0.1019, + "step": 4133 + }, + { + "epoch": 0.08, + "learning_rate": 1.8414042173119492e-07, + "loss": 0.0745, + "step": 4134 + }, + { + "epoch": 0.08, + "learning_rate": 1.8413653838685876e-07, + "loss": 0.0404, + "step": 4135 + }, + { + "epoch": 0.08, + "learning_rate": 1.8413265504252263e-07, + "loss": 0.8586, + "step": 4136 + }, + { + "epoch": 0.08, + "learning_rate": 1.8412877169818648e-07, + "loss": 0.0655, + "step": 4137 + }, + { + "epoch": 0.08, + "learning_rate": 1.8412488835385035e-07, + "loss": 0.0425, + "step": 4138 + }, + { + "epoch": 0.08, + "learning_rate": 1.8412100500951417e-07, + "loss": 0.0494, + "step": 4139 + }, + { + "epoch": 0.08, + "learning_rate": 1.8411712166517804e-07, + "loss": 0.1939, + "step": 4140 + }, + { + "epoch": 0.08, + "learning_rate": 1.8411323832084188e-07, + "loss": 0.3398, + "step": 4141 + }, + { + "epoch": 0.08, + "learning_rate": 1.8410935497650576e-07, + "loss": 0.0462, + "step": 4142 + }, + { + "epoch": 0.08, + "learning_rate": 1.841054716321696e-07, + "loss": 0.0443, + "step": 4143 + }, + { + "epoch": 0.08, + "learning_rate": 1.8410158828783347e-07, + "loss": 0.0392, + "step": 4144 + }, + { + "epoch": 0.08, + "learning_rate": 1.8409770494349732e-07, + "loss": 0.0391, + "step": 4145 + }, + { + "epoch": 0.08, + "learning_rate": 1.840938215991612e-07, + "loss": 0.0403, + "step": 4146 + }, + { + "epoch": 0.08, + "learning_rate": 1.8408993825482503e-07, + "loss": 0.0443, + "step": 4147 + }, + { + "epoch": 0.08, + "learning_rate": 1.840860549104889e-07, + "loss": 0.1526, + "step": 4148 + }, + { + "epoch": 0.08, + "learning_rate": 1.8408217156615275e-07, + "loss": 0.0634, + "step": 4149 + }, + { + "epoch": 0.08, + "learning_rate": 1.8407828822181662e-07, + "loss": 0.1839, + "step": 4150 + }, + { + "epoch": 0.08, + "learning_rate": 1.8407440487748047e-07, + "loss": 0.0811, + "step": 4151 + }, + { + "epoch": 0.08, + "learning_rate": 1.8407052153314434e-07, + "loss": 0.0342, + "step": 4152 + }, + { + "epoch": 0.08, + "learning_rate": 1.8406663818880818e-07, + "loss": 0.3985, + "step": 4153 + }, + { + "epoch": 0.08, + "learning_rate": 1.8406275484447206e-07, + "loss": 0.0636, + "step": 4154 + }, + { + "epoch": 0.08, + "learning_rate": 1.840588715001359e-07, + "loss": 0.0505, + "step": 4155 + }, + { + "epoch": 0.08, + "learning_rate": 1.8405498815579977e-07, + "loss": 0.8534, + "step": 4156 + }, + { + "epoch": 0.08, + "learning_rate": 1.8405110481146362e-07, + "loss": 0.0757, + "step": 4157 + }, + { + "epoch": 0.08, + "learning_rate": 1.840472214671275e-07, + "loss": 0.4944, + "step": 4158 + }, + { + "epoch": 0.08, + "learning_rate": 1.8404333812279133e-07, + "loss": 0.5463, + "step": 4159 + }, + { + "epoch": 0.08, + "learning_rate": 1.840394547784552e-07, + "loss": 0.0473, + "step": 4160 + }, + { + "epoch": 0.08, + "learning_rate": 1.8403557143411905e-07, + "loss": 0.3594, + "step": 4161 + }, + { + "epoch": 0.08, + "learning_rate": 1.8403168808978292e-07, + "loss": 0.0824, + "step": 4162 + }, + { + "epoch": 0.08, + "learning_rate": 1.8402780474544677e-07, + "loss": 0.1185, + "step": 4163 + }, + { + "epoch": 0.08, + "learning_rate": 1.8402392140111064e-07, + "loss": 0.238, + "step": 4164 + }, + { + "epoch": 0.08, + "learning_rate": 1.8402003805677448e-07, + "loss": 0.2058, + "step": 4165 + }, + { + "epoch": 0.08, + "learning_rate": 1.8401615471243835e-07, + "loss": 0.044, + "step": 4166 + }, + { + "epoch": 0.08, + "learning_rate": 1.840122713681022e-07, + "loss": 0.1231, + "step": 4167 + }, + { + "epoch": 0.08, + "learning_rate": 1.8400838802376607e-07, + "loss": 0.0534, + "step": 4168 + }, + { + "epoch": 0.08, + "learning_rate": 1.8400450467942992e-07, + "loss": 0.0714, + "step": 4169 + }, + { + "epoch": 0.08, + "learning_rate": 1.840006213350938e-07, + "loss": 0.0688, + "step": 4170 + }, + { + "epoch": 0.08, + "learning_rate": 1.8399673799075763e-07, + "loss": 0.0351, + "step": 4171 + }, + { + "epoch": 0.08, + "learning_rate": 1.839928546464215e-07, + "loss": 0.1449, + "step": 4172 + }, + { + "epoch": 0.08, + "learning_rate": 1.8398897130208535e-07, + "loss": 0.0325, + "step": 4173 + }, + { + "epoch": 0.08, + "learning_rate": 1.8398508795774922e-07, + "loss": 0.1954, + "step": 4174 + }, + { + "epoch": 0.08, + "learning_rate": 1.8398120461341307e-07, + "loss": 0.0892, + "step": 4175 + }, + { + "epoch": 0.08, + "learning_rate": 1.8397732126907694e-07, + "loss": 0.0507, + "step": 4176 + }, + { + "epoch": 0.08, + "learning_rate": 1.8397343792474078e-07, + "loss": 0.1572, + "step": 4177 + }, + { + "epoch": 0.08, + "learning_rate": 1.8396955458040465e-07, + "loss": 0.2904, + "step": 4178 + }, + { + "epoch": 0.08, + "learning_rate": 1.839656712360685e-07, + "loss": 0.1083, + "step": 4179 + }, + { + "epoch": 0.08, + "learning_rate": 1.8396178789173234e-07, + "loss": 0.0992, + "step": 4180 + }, + { + "epoch": 0.08, + "learning_rate": 1.8395790454739621e-07, + "loss": 0.039, + "step": 4181 + }, + { + "epoch": 0.08, + "learning_rate": 1.8395402120306006e-07, + "loss": 0.2238, + "step": 4182 + }, + { + "epoch": 0.08, + "learning_rate": 1.8395013785872393e-07, + "loss": 0.2047, + "step": 4183 + }, + { + "epoch": 0.08, + "learning_rate": 1.8394625451438778e-07, + "loss": 0.036, + "step": 4184 + }, + { + "epoch": 0.08, + "learning_rate": 1.8394237117005165e-07, + "loss": 0.2027, + "step": 4185 + }, + { + "epoch": 0.08, + "learning_rate": 1.839384878257155e-07, + "loss": 0.0527, + "step": 4186 + }, + { + "epoch": 0.08, + "learning_rate": 1.8393460448137936e-07, + "loss": 0.0527, + "step": 4187 + }, + { + "epoch": 0.08, + "learning_rate": 1.839307211370432e-07, + "loss": 0.1912, + "step": 4188 + }, + { + "epoch": 0.08, + "learning_rate": 1.8392683779270708e-07, + "loss": 0.1119, + "step": 4189 + }, + { + "epoch": 0.08, + "learning_rate": 1.8392295444837093e-07, + "loss": 0.037, + "step": 4190 + }, + { + "epoch": 0.08, + "learning_rate": 1.839190711040348e-07, + "loss": 0.1457, + "step": 4191 + }, + { + "epoch": 0.08, + "learning_rate": 1.8391518775969864e-07, + "loss": 0.0276, + "step": 4192 + }, + { + "epoch": 0.08, + "learning_rate": 1.8391130441536251e-07, + "loss": 0.0364, + "step": 4193 + }, + { + "epoch": 0.08, + "learning_rate": 1.8390742107102636e-07, + "loss": 0.0744, + "step": 4194 + }, + { + "epoch": 0.08, + "learning_rate": 1.8390353772669023e-07, + "loss": 0.0277, + "step": 4195 + }, + { + "epoch": 0.08, + "learning_rate": 1.8389965438235407e-07, + "loss": 0.0316, + "step": 4196 + }, + { + "epoch": 0.08, + "learning_rate": 1.8389577103801792e-07, + "loss": 0.0317, + "step": 4197 + }, + { + "epoch": 0.08, + "learning_rate": 1.838918876936818e-07, + "loss": 0.2451, + "step": 4198 + }, + { + "epoch": 0.08, + "learning_rate": 1.8388800434934564e-07, + "loss": 0.0951, + "step": 4199 + }, + { + "epoch": 0.08, + "learning_rate": 1.838841210050095e-07, + "loss": 0.2608, + "step": 4200 + }, + { + "epoch": 0.08, + "learning_rate": 1.8388023766067335e-07, + "loss": 0.0716, + "step": 4201 + }, + { + "epoch": 0.08, + "learning_rate": 1.8387635431633722e-07, + "loss": 0.1359, + "step": 4202 + }, + { + "epoch": 0.08, + "learning_rate": 1.8387247097200107e-07, + "loss": 0.0266, + "step": 4203 + }, + { + "epoch": 0.08, + "learning_rate": 1.8386858762766494e-07, + "loss": 0.07, + "step": 4204 + }, + { + "epoch": 0.08, + "learning_rate": 1.8386470428332879e-07, + "loss": 0.2519, + "step": 4205 + }, + { + "epoch": 0.08, + "learning_rate": 1.8386082093899266e-07, + "loss": 0.0521, + "step": 4206 + }, + { + "epoch": 0.08, + "learning_rate": 1.838569375946565e-07, + "loss": 0.0351, + "step": 4207 + }, + { + "epoch": 0.08, + "learning_rate": 1.8385305425032037e-07, + "loss": 0.0855, + "step": 4208 + }, + { + "epoch": 0.08, + "learning_rate": 1.8384917090598422e-07, + "loss": 0.0894, + "step": 4209 + }, + { + "epoch": 0.08, + "learning_rate": 1.8384528756164806e-07, + "loss": 0.032, + "step": 4210 + }, + { + "epoch": 0.08, + "learning_rate": 1.8384140421731194e-07, + "loss": 0.0556, + "step": 4211 + }, + { + "epoch": 0.08, + "learning_rate": 1.8383752087297578e-07, + "loss": 0.7767, + "step": 4212 + }, + { + "epoch": 0.08, + "learning_rate": 1.8383363752863965e-07, + "loss": 0.0387, + "step": 4213 + }, + { + "epoch": 0.08, + "learning_rate": 1.838297541843035e-07, + "loss": 0.2363, + "step": 4214 + }, + { + "epoch": 0.08, + "learning_rate": 1.8382587083996737e-07, + "loss": 0.1525, + "step": 4215 + }, + { + "epoch": 0.08, + "learning_rate": 1.8382198749563121e-07, + "loss": 0.0784, + "step": 4216 + }, + { + "epoch": 0.08, + "learning_rate": 1.8381810415129508e-07, + "loss": 0.0388, + "step": 4217 + }, + { + "epoch": 0.08, + "learning_rate": 1.8381422080695893e-07, + "loss": 0.0345, + "step": 4218 + }, + { + "epoch": 0.08, + "learning_rate": 1.838103374626228e-07, + "loss": 0.0816, + "step": 4219 + }, + { + "epoch": 0.08, + "learning_rate": 1.8380645411828665e-07, + "loss": 0.2536, + "step": 4220 + }, + { + "epoch": 0.08, + "learning_rate": 1.8380257077395052e-07, + "loss": 0.6671, + "step": 4221 + }, + { + "epoch": 0.08, + "learning_rate": 1.8379868742961436e-07, + "loss": 0.5922, + "step": 4222 + }, + { + "epoch": 0.08, + "learning_rate": 1.8379480408527823e-07, + "loss": 0.1092, + "step": 4223 + }, + { + "epoch": 0.08, + "learning_rate": 1.8379092074094208e-07, + "loss": 0.0831, + "step": 4224 + }, + { + "epoch": 0.08, + "learning_rate": 1.8378703739660595e-07, + "loss": 0.0348, + "step": 4225 + }, + { + "epoch": 0.08, + "learning_rate": 1.837831540522698e-07, + "loss": 0.0407, + "step": 4226 + }, + { + "epoch": 0.08, + "learning_rate": 1.8377927070793367e-07, + "loss": 0.0625, + "step": 4227 + }, + { + "epoch": 0.08, + "learning_rate": 1.837753873635975e-07, + "loss": 0.0333, + "step": 4228 + }, + { + "epoch": 0.08, + "learning_rate": 1.8377150401926138e-07, + "loss": 0.037, + "step": 4229 + }, + { + "epoch": 0.08, + "learning_rate": 1.8376762067492523e-07, + "loss": 0.0662, + "step": 4230 + }, + { + "epoch": 0.08, + "learning_rate": 1.837637373305891e-07, + "loss": 0.0405, + "step": 4231 + }, + { + "epoch": 0.08, + "learning_rate": 1.8375985398625295e-07, + "loss": 0.0503, + "step": 4232 + }, + { + "epoch": 0.08, + "learning_rate": 1.8375597064191682e-07, + "loss": 0.3579, + "step": 4233 + }, + { + "epoch": 0.08, + "learning_rate": 1.8375208729758066e-07, + "loss": 0.0393, + "step": 4234 + }, + { + "epoch": 0.08, + "learning_rate": 1.8374820395324453e-07, + "loss": 0.0598, + "step": 4235 + }, + { + "epoch": 0.08, + "learning_rate": 1.8374432060890838e-07, + "loss": 0.2881, + "step": 4236 + }, + { + "epoch": 0.08, + "learning_rate": 1.8374043726457225e-07, + "loss": 0.1173, + "step": 4237 + }, + { + "epoch": 0.08, + "learning_rate": 1.837365539202361e-07, + "loss": 0.0454, + "step": 4238 + }, + { + "epoch": 0.08, + "learning_rate": 1.8373267057589997e-07, + "loss": 0.3008, + "step": 4239 + }, + { + "epoch": 0.08, + "learning_rate": 1.837287872315638e-07, + "loss": 0.0689, + "step": 4240 + }, + { + "epoch": 0.08, + "learning_rate": 1.8372490388722768e-07, + "loss": 0.6472, + "step": 4241 + }, + { + "epoch": 0.08, + "learning_rate": 1.8372102054289153e-07, + "loss": 0.0382, + "step": 4242 + }, + { + "epoch": 0.08, + "learning_rate": 1.837171371985554e-07, + "loss": 0.2397, + "step": 4243 + }, + { + "epoch": 0.08, + "learning_rate": 1.8371325385421924e-07, + "loss": 0.0776, + "step": 4244 + }, + { + "epoch": 0.08, + "learning_rate": 1.8370937050988312e-07, + "loss": 0.0485, + "step": 4245 + }, + { + "epoch": 0.08, + "learning_rate": 1.8370548716554696e-07, + "loss": 0.0329, + "step": 4246 + }, + { + "epoch": 0.08, + "learning_rate": 1.8370160382121083e-07, + "loss": 0.0637, + "step": 4247 + }, + { + "epoch": 0.08, + "learning_rate": 1.8369772047687468e-07, + "loss": 0.0338, + "step": 4248 + }, + { + "epoch": 0.08, + "learning_rate": 1.8369383713253855e-07, + "loss": 0.0655, + "step": 4249 + }, + { + "epoch": 0.08, + "learning_rate": 1.836899537882024e-07, + "loss": 0.2891, + "step": 4250 + }, + { + "epoch": 0.08, + "learning_rate": 1.8368607044386627e-07, + "loss": 0.1229, + "step": 4251 + }, + { + "epoch": 0.08, + "learning_rate": 1.836821870995301e-07, + "loss": 0.1044, + "step": 4252 + }, + { + "epoch": 0.08, + "learning_rate": 1.8367830375519398e-07, + "loss": 0.2579, + "step": 4253 + }, + { + "epoch": 0.08, + "learning_rate": 1.8367442041085783e-07, + "loss": 0.0283, + "step": 4254 + }, + { + "epoch": 0.08, + "learning_rate": 1.8367053706652167e-07, + "loss": 0.1496, + "step": 4255 + }, + { + "epoch": 0.08, + "learning_rate": 1.8366665372218552e-07, + "loss": 0.0585, + "step": 4256 + }, + { + "epoch": 0.08, + "learning_rate": 1.836627703778494e-07, + "loss": 0.132, + "step": 4257 + }, + { + "epoch": 0.08, + "learning_rate": 1.8365888703351323e-07, + "loss": 0.0334, + "step": 4258 + }, + { + "epoch": 0.08, + "learning_rate": 1.836550036891771e-07, + "loss": 0.0365, + "step": 4259 + }, + { + "epoch": 0.08, + "learning_rate": 1.8365112034484095e-07, + "loss": 0.0501, + "step": 4260 + }, + { + "epoch": 0.08, + "learning_rate": 1.8364723700050482e-07, + "loss": 0.0338, + "step": 4261 + }, + { + "epoch": 0.08, + "learning_rate": 1.8364335365616867e-07, + "loss": 0.1134, + "step": 4262 + }, + { + "epoch": 0.08, + "learning_rate": 1.8363947031183254e-07, + "loss": 0.1419, + "step": 4263 + }, + { + "epoch": 0.08, + "learning_rate": 1.8363558696749638e-07, + "loss": 0.0503, + "step": 4264 + }, + { + "epoch": 0.08, + "learning_rate": 1.8363170362316025e-07, + "loss": 0.0289, + "step": 4265 + }, + { + "epoch": 0.08, + "learning_rate": 1.836278202788241e-07, + "loss": 0.2861, + "step": 4266 + }, + { + "epoch": 0.08, + "learning_rate": 1.8362393693448797e-07, + "loss": 0.0717, + "step": 4267 + }, + { + "epoch": 0.08, + "learning_rate": 1.8362005359015182e-07, + "loss": 0.1115, + "step": 4268 + }, + { + "epoch": 0.08, + "learning_rate": 1.836161702458157e-07, + "loss": 0.1836, + "step": 4269 + }, + { + "epoch": 0.08, + "learning_rate": 1.8361228690147953e-07, + "loss": 0.0532, + "step": 4270 + }, + { + "epoch": 0.08, + "learning_rate": 1.836084035571434e-07, + "loss": 0.0364, + "step": 4271 + }, + { + "epoch": 0.08, + "learning_rate": 1.8360452021280725e-07, + "loss": 0.0428, + "step": 4272 + }, + { + "epoch": 0.08, + "learning_rate": 1.8360063686847112e-07, + "loss": 0.2939, + "step": 4273 + }, + { + "epoch": 0.08, + "learning_rate": 1.8359675352413497e-07, + "loss": 0.1784, + "step": 4274 + }, + { + "epoch": 0.08, + "learning_rate": 1.8359287017979884e-07, + "loss": 0.0379, + "step": 4275 + }, + { + "epoch": 0.08, + "learning_rate": 1.8358898683546268e-07, + "loss": 0.2482, + "step": 4276 + }, + { + "epoch": 0.08, + "learning_rate": 1.8358510349112655e-07, + "loss": 0.5474, + "step": 4277 + }, + { + "epoch": 0.08, + "learning_rate": 1.835812201467904e-07, + "loss": 0.0358, + "step": 4278 + }, + { + "epoch": 0.08, + "learning_rate": 1.8357733680245427e-07, + "loss": 0.1839, + "step": 4279 + }, + { + "epoch": 0.08, + "learning_rate": 1.8357345345811811e-07, + "loss": 0.6858, + "step": 4280 + }, + { + "epoch": 0.08, + "learning_rate": 1.8356957011378199e-07, + "loss": 0.0294, + "step": 4281 + }, + { + "epoch": 0.08, + "learning_rate": 1.8356568676944583e-07, + "loss": 0.0357, + "step": 4282 + }, + { + "epoch": 0.08, + "learning_rate": 1.835618034251097e-07, + "loss": 0.0298, + "step": 4283 + }, + { + "epoch": 0.08, + "learning_rate": 1.8355792008077355e-07, + "loss": 0.4153, + "step": 4284 + }, + { + "epoch": 0.08, + "learning_rate": 1.8355403673643742e-07, + "loss": 0.1333, + "step": 4285 + }, + { + "epoch": 0.08, + "learning_rate": 1.8355015339210126e-07, + "loss": 0.0354, + "step": 4286 + }, + { + "epoch": 0.08, + "learning_rate": 1.8354627004776514e-07, + "loss": 0.0331, + "step": 4287 + }, + { + "epoch": 0.08, + "learning_rate": 1.8354238670342898e-07, + "loss": 0.0307, + "step": 4288 + }, + { + "epoch": 0.08, + "learning_rate": 1.8353850335909285e-07, + "loss": 0.0942, + "step": 4289 + }, + { + "epoch": 0.08, + "learning_rate": 1.835346200147567e-07, + "loss": 0.0461, + "step": 4290 + }, + { + "epoch": 0.08, + "learning_rate": 1.8353073667042057e-07, + "loss": 0.135, + "step": 4291 + }, + { + "epoch": 0.08, + "learning_rate": 1.8352685332608441e-07, + "loss": 0.1232, + "step": 4292 + }, + { + "epoch": 0.08, + "learning_rate": 1.8352296998174828e-07, + "loss": 0.6687, + "step": 4293 + }, + { + "epoch": 0.08, + "learning_rate": 1.8351908663741213e-07, + "loss": 0.1263, + "step": 4294 + }, + { + "epoch": 0.08, + "learning_rate": 1.83515203293076e-07, + "loss": 0.0447, + "step": 4295 + }, + { + "epoch": 0.08, + "learning_rate": 1.8351131994873985e-07, + "loss": 0.0359, + "step": 4296 + }, + { + "epoch": 0.08, + "learning_rate": 1.8350743660440372e-07, + "loss": 0.0559, + "step": 4297 + }, + { + "epoch": 0.08, + "learning_rate": 1.8350355326006756e-07, + "loss": 0.0395, + "step": 4298 + }, + { + "epoch": 0.08, + "learning_rate": 1.8349966991573143e-07, + "loss": 0.0361, + "step": 4299 + }, + { + "epoch": 0.08, + "learning_rate": 1.8349578657139528e-07, + "loss": 0.128, + "step": 4300 + }, + { + "epoch": 0.08, + "learning_rate": 1.8349190322705915e-07, + "loss": 0.3197, + "step": 4301 + }, + { + "epoch": 0.08, + "learning_rate": 1.83488019882723e-07, + "loss": 0.0899, + "step": 4302 + }, + { + "epoch": 0.08, + "learning_rate": 1.8348413653838687e-07, + "loss": 0.0631, + "step": 4303 + }, + { + "epoch": 0.08, + "learning_rate": 1.834802531940507e-07, + "loss": 0.1038, + "step": 4304 + }, + { + "epoch": 0.08, + "learning_rate": 1.8347636984971458e-07, + "loss": 0.1044, + "step": 4305 + }, + { + "epoch": 0.08, + "learning_rate": 1.8347248650537843e-07, + "loss": 0.0434, + "step": 4306 + }, + { + "epoch": 0.08, + "learning_rate": 1.834686031610423e-07, + "loss": 0.0458, + "step": 4307 + }, + { + "epoch": 0.08, + "learning_rate": 1.8346471981670615e-07, + "loss": 0.3571, + "step": 4308 + }, + { + "epoch": 0.08, + "learning_rate": 1.8346083647237002e-07, + "loss": 0.6846, + "step": 4309 + }, + { + "epoch": 0.08, + "learning_rate": 1.8345695312803386e-07, + "loss": 0.0555, + "step": 4310 + }, + { + "epoch": 0.08, + "learning_rate": 1.8345306978369773e-07, + "loss": 0.0688, + "step": 4311 + }, + { + "epoch": 0.08, + "learning_rate": 1.8344918643936158e-07, + "loss": 0.1185, + "step": 4312 + }, + { + "epoch": 0.08, + "learning_rate": 1.8344530309502542e-07, + "loss": 0.1122, + "step": 4313 + }, + { + "epoch": 0.08, + "learning_rate": 1.8344141975068927e-07, + "loss": 0.028, + "step": 4314 + }, + { + "epoch": 0.08, + "learning_rate": 1.8343753640635314e-07, + "loss": 0.0519, + "step": 4315 + }, + { + "epoch": 0.08, + "learning_rate": 1.8343365306201698e-07, + "loss": 0.5947, + "step": 4316 + }, + { + "epoch": 0.08, + "learning_rate": 1.8342976971768086e-07, + "loss": 0.0637, + "step": 4317 + }, + { + "epoch": 0.08, + "learning_rate": 1.834258863733447e-07, + "loss": 0.0423, + "step": 4318 + }, + { + "epoch": 0.08, + "learning_rate": 1.8342200302900857e-07, + "loss": 0.0928, + "step": 4319 + }, + { + "epoch": 0.08, + "learning_rate": 1.8341811968467242e-07, + "loss": 0.1139, + "step": 4320 + }, + { + "epoch": 0.08, + "learning_rate": 1.834142363403363e-07, + "loss": 0.1837, + "step": 4321 + }, + { + "epoch": 0.08, + "learning_rate": 1.8341035299600013e-07, + "loss": 0.0338, + "step": 4322 + }, + { + "epoch": 0.08, + "learning_rate": 1.83406469651664e-07, + "loss": 0.031, + "step": 4323 + }, + { + "epoch": 0.08, + "learning_rate": 1.8340258630732785e-07, + "loss": 0.301, + "step": 4324 + }, + { + "epoch": 0.08, + "learning_rate": 1.8339870296299172e-07, + "loss": 0.3194, + "step": 4325 + }, + { + "epoch": 0.08, + "learning_rate": 1.8339481961865557e-07, + "loss": 0.0708, + "step": 4326 + }, + { + "epoch": 0.08, + "learning_rate": 1.8339093627431944e-07, + "loss": 0.6181, + "step": 4327 + }, + { + "epoch": 0.08, + "learning_rate": 1.8338705292998328e-07, + "loss": 0.0444, + "step": 4328 + }, + { + "epoch": 0.08, + "learning_rate": 1.8338316958564716e-07, + "loss": 0.2373, + "step": 4329 + }, + { + "epoch": 0.08, + "learning_rate": 1.83379286241311e-07, + "loss": 0.0732, + "step": 4330 + }, + { + "epoch": 0.08, + "learning_rate": 1.8337540289697487e-07, + "loss": 0.0335, + "step": 4331 + }, + { + "epoch": 0.08, + "learning_rate": 1.8337151955263872e-07, + "loss": 0.0285, + "step": 4332 + }, + { + "epoch": 0.08, + "learning_rate": 1.833676362083026e-07, + "loss": 0.0677, + "step": 4333 + }, + { + "epoch": 0.08, + "learning_rate": 1.8336375286396643e-07, + "loss": 0.2455, + "step": 4334 + }, + { + "epoch": 0.08, + "learning_rate": 1.833598695196303e-07, + "loss": 0.0357, + "step": 4335 + }, + { + "epoch": 0.08, + "learning_rate": 1.8335598617529415e-07, + "loss": 0.1557, + "step": 4336 + }, + { + "epoch": 0.08, + "learning_rate": 1.8335210283095802e-07, + "loss": 0.0959, + "step": 4337 + }, + { + "epoch": 0.08, + "learning_rate": 1.8334821948662187e-07, + "loss": 0.0561, + "step": 4338 + }, + { + "epoch": 0.08, + "learning_rate": 1.8334433614228574e-07, + "loss": 0.0309, + "step": 4339 + }, + { + "epoch": 0.08, + "learning_rate": 1.8334045279794958e-07, + "loss": 0.1175, + "step": 4340 + }, + { + "epoch": 0.08, + "learning_rate": 1.8333656945361345e-07, + "loss": 0.0503, + "step": 4341 + }, + { + "epoch": 0.08, + "learning_rate": 1.833326861092773e-07, + "loss": 0.3388, + "step": 4342 + }, + { + "epoch": 0.08, + "learning_rate": 1.8332880276494117e-07, + "loss": 0.0946, + "step": 4343 + }, + { + "epoch": 0.08, + "learning_rate": 1.8332491942060502e-07, + "loss": 0.0507, + "step": 4344 + }, + { + "epoch": 0.08, + "learning_rate": 1.833210360762689e-07, + "loss": 0.1987, + "step": 4345 + }, + { + "epoch": 0.08, + "learning_rate": 1.8331715273193273e-07, + "loss": 0.1497, + "step": 4346 + }, + { + "epoch": 0.08, + "learning_rate": 1.833132693875966e-07, + "loss": 0.0388, + "step": 4347 + }, + { + "epoch": 0.08, + "learning_rate": 1.8330938604326045e-07, + "loss": 0.0322, + "step": 4348 + }, + { + "epoch": 0.08, + "learning_rate": 1.8330550269892432e-07, + "loss": 0.1491, + "step": 4349 + }, + { + "epoch": 0.08, + "learning_rate": 1.8330161935458817e-07, + "loss": 0.0497, + "step": 4350 + }, + { + "epoch": 0.08, + "learning_rate": 1.8329773601025204e-07, + "loss": 0.1165, + "step": 4351 + }, + { + "epoch": 0.08, + "learning_rate": 1.8329385266591588e-07, + "loss": 0.0373, + "step": 4352 + }, + { + "epoch": 0.08, + "learning_rate": 1.8328996932157975e-07, + "loss": 0.0485, + "step": 4353 + }, + { + "epoch": 0.08, + "learning_rate": 1.832860859772436e-07, + "loss": 0.0294, + "step": 4354 + }, + { + "epoch": 0.08, + "learning_rate": 1.8328220263290747e-07, + "loss": 0.1306, + "step": 4355 + }, + { + "epoch": 0.08, + "learning_rate": 1.8327831928857131e-07, + "loss": 0.0905, + "step": 4356 + }, + { + "epoch": 0.08, + "learning_rate": 1.8327443594423516e-07, + "loss": 0.0364, + "step": 4357 + }, + { + "epoch": 0.08, + "learning_rate": 1.8327055259989903e-07, + "loss": 0.5504, + "step": 4358 + }, + { + "epoch": 0.08, + "learning_rate": 1.8326666925556288e-07, + "loss": 0.0394, + "step": 4359 + }, + { + "epoch": 0.08, + "learning_rate": 1.8326278591122675e-07, + "loss": 0.0607, + "step": 4360 + }, + { + "epoch": 0.08, + "learning_rate": 1.832589025668906e-07, + "loss": 0.034, + "step": 4361 + }, + { + "epoch": 0.08, + "learning_rate": 1.8325501922255446e-07, + "loss": 0.3957, + "step": 4362 + }, + { + "epoch": 0.08, + "learning_rate": 1.832511358782183e-07, + "loss": 0.031, + "step": 4363 + }, + { + "epoch": 0.08, + "learning_rate": 1.8324725253388218e-07, + "loss": 0.3924, + "step": 4364 + }, + { + "epoch": 0.08, + "learning_rate": 1.8324336918954603e-07, + "loss": 0.0795, + "step": 4365 + }, + { + "epoch": 0.08, + "learning_rate": 1.832394858452099e-07, + "loss": 0.0608, + "step": 4366 + }, + { + "epoch": 0.08, + "learning_rate": 1.8323560250087374e-07, + "loss": 0.0353, + "step": 4367 + }, + { + "epoch": 0.08, + "learning_rate": 1.8323171915653761e-07, + "loss": 0.0485, + "step": 4368 + }, + { + "epoch": 0.08, + "learning_rate": 1.8322783581220146e-07, + "loss": 0.5318, + "step": 4369 + }, + { + "epoch": 0.08, + "learning_rate": 1.8322395246786533e-07, + "loss": 0.0893, + "step": 4370 + }, + { + "epoch": 0.08, + "learning_rate": 1.8322006912352918e-07, + "loss": 0.0272, + "step": 4371 + }, + { + "epoch": 0.08, + "learning_rate": 1.8321618577919302e-07, + "loss": 0.1011, + "step": 4372 + }, + { + "epoch": 0.08, + "learning_rate": 1.832123024348569e-07, + "loss": 0.0518, + "step": 4373 + }, + { + "epoch": 0.08, + "learning_rate": 1.8320841909052074e-07, + "loss": 0.0281, + "step": 4374 + }, + { + "epoch": 0.08, + "learning_rate": 1.832045357461846e-07, + "loss": 0.0388, + "step": 4375 + }, + { + "epoch": 0.08, + "learning_rate": 1.8320065240184845e-07, + "loss": 0.0284, + "step": 4376 + }, + { + "epoch": 0.08, + "learning_rate": 1.8319676905751232e-07, + "loss": 0.1158, + "step": 4377 + }, + { + "epoch": 0.08, + "learning_rate": 1.8319288571317617e-07, + "loss": 0.5498, + "step": 4378 + }, + { + "epoch": 0.08, + "learning_rate": 1.8318900236884004e-07, + "loss": 0.0894, + "step": 4379 + }, + { + "epoch": 0.08, + "learning_rate": 1.8318511902450389e-07, + "loss": 0.7665, + "step": 4380 + }, + { + "epoch": 0.08, + "learning_rate": 1.8318123568016776e-07, + "loss": 0.0391, + "step": 4381 + }, + { + "epoch": 0.09, + "learning_rate": 1.831773523358316e-07, + "loss": 0.056, + "step": 4382 + }, + { + "epoch": 0.09, + "learning_rate": 1.8317346899149547e-07, + "loss": 0.5949, + "step": 4383 + }, + { + "epoch": 0.09, + "learning_rate": 1.8316958564715932e-07, + "loss": 0.0392, + "step": 4384 + }, + { + "epoch": 0.09, + "learning_rate": 1.831657023028232e-07, + "loss": 0.0333, + "step": 4385 + }, + { + "epoch": 0.09, + "learning_rate": 1.8316181895848704e-07, + "loss": 0.0483, + "step": 4386 + }, + { + "epoch": 0.09, + "learning_rate": 1.8315793561415088e-07, + "loss": 0.0996, + "step": 4387 + }, + { + "epoch": 0.09, + "learning_rate": 1.8315405226981475e-07, + "loss": 0.2081, + "step": 4388 + }, + { + "epoch": 0.09, + "learning_rate": 1.831501689254786e-07, + "loss": 0.7311, + "step": 4389 + }, + { + "epoch": 0.09, + "learning_rate": 1.8314628558114247e-07, + "loss": 0.064, + "step": 4390 + }, + { + "epoch": 0.09, + "learning_rate": 1.8314240223680631e-07, + "loss": 0.3242, + "step": 4391 + }, + { + "epoch": 0.09, + "learning_rate": 1.8313851889247018e-07, + "loss": 0.0294, + "step": 4392 + }, + { + "epoch": 0.09, + "learning_rate": 1.8313463554813403e-07, + "loss": 0.2124, + "step": 4393 + }, + { + "epoch": 0.09, + "learning_rate": 1.831307522037979e-07, + "loss": 0.2129, + "step": 4394 + }, + { + "epoch": 0.09, + "learning_rate": 1.8312686885946175e-07, + "loss": 0.0284, + "step": 4395 + }, + { + "epoch": 0.09, + "learning_rate": 1.8312298551512562e-07, + "loss": 0.0378, + "step": 4396 + }, + { + "epoch": 0.09, + "learning_rate": 1.8311910217078946e-07, + "loss": 0.0281, + "step": 4397 + }, + { + "epoch": 0.09, + "learning_rate": 1.8311521882645333e-07, + "loss": 0.234, + "step": 4398 + }, + { + "epoch": 0.09, + "learning_rate": 1.8311133548211718e-07, + "loss": 0.0491, + "step": 4399 + }, + { + "epoch": 0.09, + "learning_rate": 1.8310745213778105e-07, + "loss": 0.2981, + "step": 4400 + }, + { + "epoch": 0.09, + "learning_rate": 1.831035687934449e-07, + "loss": 0.5063, + "step": 4401 + }, + { + "epoch": 0.09, + "learning_rate": 1.8309968544910877e-07, + "loss": 0.0446, + "step": 4402 + }, + { + "epoch": 0.09, + "learning_rate": 1.830958021047726e-07, + "loss": 0.0703, + "step": 4403 + }, + { + "epoch": 0.09, + "learning_rate": 1.8309191876043648e-07, + "loss": 0.2923, + "step": 4404 + }, + { + "epoch": 0.09, + "learning_rate": 1.8308803541610033e-07, + "loss": 0.0336, + "step": 4405 + }, + { + "epoch": 0.09, + "learning_rate": 1.830841520717642e-07, + "loss": 0.0281, + "step": 4406 + }, + { + "epoch": 0.09, + "learning_rate": 1.8308026872742805e-07, + "loss": 0.0317, + "step": 4407 + }, + { + "epoch": 0.09, + "learning_rate": 1.8307638538309192e-07, + "loss": 0.0627, + "step": 4408 + }, + { + "epoch": 0.09, + "learning_rate": 1.8307250203875576e-07, + "loss": 0.0563, + "step": 4409 + }, + { + "epoch": 0.09, + "learning_rate": 1.8306861869441963e-07, + "loss": 0.0336, + "step": 4410 + }, + { + "epoch": 0.09, + "learning_rate": 1.8306473535008348e-07, + "loss": 0.4656, + "step": 4411 + }, + { + "epoch": 0.09, + "learning_rate": 1.8306085200574735e-07, + "loss": 0.0276, + "step": 4412 + }, + { + "epoch": 0.09, + "learning_rate": 1.830569686614112e-07, + "loss": 0.0307, + "step": 4413 + }, + { + "epoch": 0.09, + "learning_rate": 1.8305308531707507e-07, + "loss": 0.0305, + "step": 4414 + }, + { + "epoch": 0.09, + "learning_rate": 1.830492019727389e-07, + "loss": 0.0499, + "step": 4415 + }, + { + "epoch": 0.09, + "learning_rate": 1.8304531862840278e-07, + "loss": 0.0689, + "step": 4416 + }, + { + "epoch": 0.09, + "learning_rate": 1.8304143528406663e-07, + "loss": 0.0495, + "step": 4417 + }, + { + "epoch": 0.09, + "learning_rate": 1.830375519397305e-07, + "loss": 0.0688, + "step": 4418 + }, + { + "epoch": 0.09, + "learning_rate": 1.8303366859539434e-07, + "loss": 0.0291, + "step": 4419 + }, + { + "epoch": 0.09, + "learning_rate": 1.8302978525105822e-07, + "loss": 0.2637, + "step": 4420 + }, + { + "epoch": 0.09, + "learning_rate": 1.8302590190672206e-07, + "loss": 0.6745, + "step": 4421 + }, + { + "epoch": 0.09, + "learning_rate": 1.8302201856238593e-07, + "loss": 0.0637, + "step": 4422 + }, + { + "epoch": 0.09, + "learning_rate": 1.8301813521804978e-07, + "loss": 0.4861, + "step": 4423 + }, + { + "epoch": 0.09, + "learning_rate": 1.8301425187371365e-07, + "loss": 0.0315, + "step": 4424 + }, + { + "epoch": 0.09, + "learning_rate": 1.830103685293775e-07, + "loss": 0.19, + "step": 4425 + }, + { + "epoch": 0.09, + "learning_rate": 1.8300648518504137e-07, + "loss": 0.0884, + "step": 4426 + }, + { + "epoch": 0.09, + "learning_rate": 1.830026018407052e-07, + "loss": 0.0936, + "step": 4427 + }, + { + "epoch": 0.09, + "learning_rate": 1.8299871849636908e-07, + "loss": 0.5574, + "step": 4428 + }, + { + "epoch": 0.09, + "learning_rate": 1.829948351520329e-07, + "loss": 0.0271, + "step": 4429 + }, + { + "epoch": 0.09, + "learning_rate": 1.8299095180769677e-07, + "loss": 0.0326, + "step": 4430 + }, + { + "epoch": 0.09, + "learning_rate": 1.8298706846336062e-07, + "loss": 0.0281, + "step": 4431 + }, + { + "epoch": 0.09, + "learning_rate": 1.829831851190245e-07, + "loss": 0.0413, + "step": 4432 + }, + { + "epoch": 0.09, + "learning_rate": 1.8297930177468833e-07, + "loss": 0.0263, + "step": 4433 + }, + { + "epoch": 0.09, + "learning_rate": 1.829754184303522e-07, + "loss": 0.0483, + "step": 4434 + }, + { + "epoch": 0.09, + "learning_rate": 1.8297153508601605e-07, + "loss": 0.0374, + "step": 4435 + }, + { + "epoch": 0.09, + "learning_rate": 1.8296765174167992e-07, + "loss": 0.4284, + "step": 4436 + }, + { + "epoch": 0.09, + "learning_rate": 1.8296376839734377e-07, + "loss": 0.3221, + "step": 4437 + }, + { + "epoch": 0.09, + "learning_rate": 1.8295988505300764e-07, + "loss": 0.2325, + "step": 4438 + }, + { + "epoch": 0.09, + "learning_rate": 1.8295600170867148e-07, + "loss": 0.0807, + "step": 4439 + }, + { + "epoch": 0.09, + "learning_rate": 1.8295211836433535e-07, + "loss": 0.0328, + "step": 4440 + }, + { + "epoch": 0.09, + "learning_rate": 1.829482350199992e-07, + "loss": 0.3195, + "step": 4441 + }, + { + "epoch": 0.09, + "learning_rate": 1.8294435167566307e-07, + "loss": 0.0649, + "step": 4442 + }, + { + "epoch": 0.09, + "learning_rate": 1.8294046833132692e-07, + "loss": 0.1269, + "step": 4443 + }, + { + "epoch": 0.09, + "learning_rate": 1.829365849869908e-07, + "loss": 0.0326, + "step": 4444 + }, + { + "epoch": 0.09, + "learning_rate": 1.8293270164265463e-07, + "loss": 0.3951, + "step": 4445 + }, + { + "epoch": 0.09, + "learning_rate": 1.829288182983185e-07, + "loss": 0.1191, + "step": 4446 + }, + { + "epoch": 0.09, + "learning_rate": 1.8292493495398235e-07, + "loss": 0.0939, + "step": 4447 + }, + { + "epoch": 0.09, + "learning_rate": 1.8292105160964622e-07, + "loss": 0.2653, + "step": 4448 + }, + { + "epoch": 0.09, + "learning_rate": 1.8291716826531007e-07, + "loss": 0.0386, + "step": 4449 + }, + { + "epoch": 0.09, + "learning_rate": 1.8291328492097394e-07, + "loss": 0.1378, + "step": 4450 + }, + { + "epoch": 0.09, + "learning_rate": 1.8290940157663778e-07, + "loss": 0.1649, + "step": 4451 + }, + { + "epoch": 0.09, + "learning_rate": 1.8290551823230165e-07, + "loss": 0.0897, + "step": 4452 + }, + { + "epoch": 0.09, + "learning_rate": 1.829016348879655e-07, + "loss": 0.0418, + "step": 4453 + }, + { + "epoch": 0.09, + "learning_rate": 1.8289775154362937e-07, + "loss": 0.0608, + "step": 4454 + }, + { + "epoch": 0.09, + "learning_rate": 1.8289386819929321e-07, + "loss": 0.0507, + "step": 4455 + }, + { + "epoch": 0.09, + "learning_rate": 1.8288998485495709e-07, + "loss": 0.5465, + "step": 4456 + }, + { + "epoch": 0.09, + "learning_rate": 1.8288610151062093e-07, + "loss": 0.1512, + "step": 4457 + }, + { + "epoch": 0.09, + "learning_rate": 1.828822181662848e-07, + "loss": 0.0701, + "step": 4458 + }, + { + "epoch": 0.09, + "learning_rate": 1.8287833482194865e-07, + "loss": 0.0478, + "step": 4459 + }, + { + "epoch": 0.09, + "learning_rate": 1.8287445147761252e-07, + "loss": 0.072, + "step": 4460 + }, + { + "epoch": 0.09, + "learning_rate": 1.8287056813327636e-07, + "loss": 0.3015, + "step": 4461 + }, + { + "epoch": 0.09, + "learning_rate": 1.8286668478894024e-07, + "loss": 0.0311, + "step": 4462 + }, + { + "epoch": 0.09, + "learning_rate": 1.8286280144460408e-07, + "loss": 0.1687, + "step": 4463 + }, + { + "epoch": 0.09, + "learning_rate": 1.8285891810026795e-07, + "loss": 0.0607, + "step": 4464 + }, + { + "epoch": 0.09, + "learning_rate": 1.828550347559318e-07, + "loss": 0.0377, + "step": 4465 + }, + { + "epoch": 0.09, + "learning_rate": 1.8285115141159567e-07, + "loss": 0.0487, + "step": 4466 + }, + { + "epoch": 0.09, + "learning_rate": 1.8284726806725951e-07, + "loss": 0.1077, + "step": 4467 + }, + { + "epoch": 0.09, + "learning_rate": 1.8284338472292339e-07, + "loss": 0.0281, + "step": 4468 + }, + { + "epoch": 0.09, + "learning_rate": 1.8283950137858723e-07, + "loss": 0.036, + "step": 4469 + }, + { + "epoch": 0.09, + "learning_rate": 1.828356180342511e-07, + "loss": 0.0387, + "step": 4470 + }, + { + "epoch": 0.09, + "learning_rate": 1.8283173468991495e-07, + "loss": 0.225, + "step": 4471 + }, + { + "epoch": 0.09, + "learning_rate": 1.8282785134557882e-07, + "loss": 0.033, + "step": 4472 + }, + { + "epoch": 0.09, + "learning_rate": 1.8282396800124266e-07, + "loss": 0.0539, + "step": 4473 + }, + { + "epoch": 0.09, + "learning_rate": 1.8282008465690653e-07, + "loss": 0.1069, + "step": 4474 + }, + { + "epoch": 0.09, + "learning_rate": 1.8281620131257038e-07, + "loss": 0.0618, + "step": 4475 + }, + { + "epoch": 0.09, + "learning_rate": 1.8281231796823425e-07, + "loss": 0.0356, + "step": 4476 + }, + { + "epoch": 0.09, + "learning_rate": 1.828084346238981e-07, + "loss": 0.1927, + "step": 4477 + }, + { + "epoch": 0.09, + "learning_rate": 1.8280455127956197e-07, + "loss": 0.0258, + "step": 4478 + }, + { + "epoch": 0.09, + "learning_rate": 1.828006679352258e-07, + "loss": 0.034, + "step": 4479 + }, + { + "epoch": 0.09, + "learning_rate": 1.8279678459088968e-07, + "loss": 0.0327, + "step": 4480 + }, + { + "epoch": 0.09, + "learning_rate": 1.8279290124655353e-07, + "loss": 0.2564, + "step": 4481 + }, + { + "epoch": 0.09, + "learning_rate": 1.827890179022174e-07, + "loss": 0.2247, + "step": 4482 + }, + { + "epoch": 0.09, + "learning_rate": 1.8278513455788125e-07, + "loss": 0.2795, + "step": 4483 + }, + { + "epoch": 0.09, + "learning_rate": 1.8278125121354512e-07, + "loss": 0.0578, + "step": 4484 + }, + { + "epoch": 0.09, + "learning_rate": 1.8277736786920896e-07, + "loss": 0.0651, + "step": 4485 + }, + { + "epoch": 0.09, + "learning_rate": 1.8277348452487283e-07, + "loss": 0.0339, + "step": 4486 + }, + { + "epoch": 0.09, + "learning_rate": 1.8276960118053665e-07, + "loss": 0.1425, + "step": 4487 + }, + { + "epoch": 0.09, + "learning_rate": 1.8276571783620052e-07, + "loss": 0.0357, + "step": 4488 + }, + { + "epoch": 0.09, + "learning_rate": 1.8276183449186437e-07, + "loss": 0.0518, + "step": 4489 + }, + { + "epoch": 0.09, + "learning_rate": 1.8275795114752824e-07, + "loss": 0.574, + "step": 4490 + }, + { + "epoch": 0.09, + "learning_rate": 1.8275406780319208e-07, + "loss": 0.1085, + "step": 4491 + }, + { + "epoch": 0.09, + "learning_rate": 1.8275018445885596e-07, + "loss": 0.0755, + "step": 4492 + }, + { + "epoch": 0.09, + "learning_rate": 1.827463011145198e-07, + "loss": 0.0728, + "step": 4493 + }, + { + "epoch": 0.09, + "learning_rate": 1.8274241777018367e-07, + "loss": 0.1267, + "step": 4494 + }, + { + "epoch": 0.09, + "learning_rate": 1.8273853442584752e-07, + "loss": 0.0928, + "step": 4495 + }, + { + "epoch": 0.09, + "learning_rate": 1.827346510815114e-07, + "loss": 0.252, + "step": 4496 + }, + { + "epoch": 0.09, + "learning_rate": 1.8273076773717523e-07, + "loss": 0.0409, + "step": 4497 + }, + { + "epoch": 0.09, + "learning_rate": 1.827268843928391e-07, + "loss": 0.0761, + "step": 4498 + }, + { + "epoch": 0.09, + "learning_rate": 1.8272300104850295e-07, + "loss": 0.3559, + "step": 4499 + }, + { + "epoch": 0.09, + "learning_rate": 1.8271911770416682e-07, + "loss": 0.2663, + "step": 4500 + }, + { + "epoch": 0.09, + "learning_rate": 1.8271523435983067e-07, + "loss": 0.0423, + "step": 4501 + }, + { + "epoch": 0.09, + "learning_rate": 1.8271135101549454e-07, + "loss": 0.0915, + "step": 4502 + }, + { + "epoch": 0.09, + "learning_rate": 1.8270746767115838e-07, + "loss": 0.1545, + "step": 4503 + }, + { + "epoch": 0.09, + "learning_rate": 1.8270358432682226e-07, + "loss": 0.059, + "step": 4504 + }, + { + "epoch": 0.09, + "learning_rate": 1.826997009824861e-07, + "loss": 0.0227, + "step": 4505 + }, + { + "epoch": 0.09, + "learning_rate": 1.8269581763814997e-07, + "loss": 0.1099, + "step": 4506 + }, + { + "epoch": 0.09, + "learning_rate": 1.8269193429381382e-07, + "loss": 0.2298, + "step": 4507 + }, + { + "epoch": 0.09, + "learning_rate": 1.826880509494777e-07, + "loss": 0.034, + "step": 4508 + }, + { + "epoch": 0.09, + "learning_rate": 1.8268416760514153e-07, + "loss": 0.0419, + "step": 4509 + }, + { + "epoch": 0.09, + "learning_rate": 1.826802842608054e-07, + "loss": 0.0594, + "step": 4510 + }, + { + "epoch": 0.09, + "learning_rate": 1.8267640091646925e-07, + "loss": 0.033, + "step": 4511 + }, + { + "epoch": 0.09, + "learning_rate": 1.8267251757213312e-07, + "loss": 0.1022, + "step": 4512 + }, + { + "epoch": 0.09, + "learning_rate": 1.8266863422779697e-07, + "loss": 0.0616, + "step": 4513 + }, + { + "epoch": 0.09, + "learning_rate": 1.8266475088346084e-07, + "loss": 0.0383, + "step": 4514 + }, + { + "epoch": 0.09, + "learning_rate": 1.8266086753912468e-07, + "loss": 0.0443, + "step": 4515 + }, + { + "epoch": 0.09, + "learning_rate": 1.8265698419478855e-07, + "loss": 0.1239, + "step": 4516 + }, + { + "epoch": 0.09, + "learning_rate": 1.826531008504524e-07, + "loss": 0.0471, + "step": 4517 + }, + { + "epoch": 0.09, + "learning_rate": 1.8264921750611627e-07, + "loss": 0.0283, + "step": 4518 + }, + { + "epoch": 0.09, + "learning_rate": 1.8264533416178012e-07, + "loss": 0.1194, + "step": 4519 + }, + { + "epoch": 0.09, + "learning_rate": 1.82641450817444e-07, + "loss": 0.0287, + "step": 4520 + }, + { + "epoch": 0.09, + "learning_rate": 1.8263756747310783e-07, + "loss": 0.0633, + "step": 4521 + }, + { + "epoch": 0.09, + "learning_rate": 1.826336841287717e-07, + "loss": 0.0396, + "step": 4522 + }, + { + "epoch": 0.09, + "learning_rate": 1.8262980078443555e-07, + "loss": 0.2294, + "step": 4523 + }, + { + "epoch": 0.09, + "learning_rate": 1.8262591744009942e-07, + "loss": 0.083, + "step": 4524 + }, + { + "epoch": 0.09, + "learning_rate": 1.8262203409576327e-07, + "loss": 0.0273, + "step": 4525 + }, + { + "epoch": 0.09, + "learning_rate": 1.8261815075142714e-07, + "loss": 0.0862, + "step": 4526 + }, + { + "epoch": 0.09, + "learning_rate": 1.8261426740709098e-07, + "loss": 0.3926, + "step": 4527 + }, + { + "epoch": 0.09, + "learning_rate": 1.8261038406275485e-07, + "loss": 0.3108, + "step": 4528 + }, + { + "epoch": 0.09, + "learning_rate": 1.826065007184187e-07, + "loss": 0.3425, + "step": 4529 + }, + { + "epoch": 0.09, + "learning_rate": 1.8260261737408257e-07, + "loss": 0.0638, + "step": 4530 + }, + { + "epoch": 0.09, + "learning_rate": 1.8259873402974641e-07, + "loss": 0.0263, + "step": 4531 + }, + { + "epoch": 0.09, + "learning_rate": 1.8259485068541029e-07, + "loss": 0.0439, + "step": 4532 + }, + { + "epoch": 0.09, + "learning_rate": 1.8259096734107413e-07, + "loss": 0.089, + "step": 4533 + }, + { + "epoch": 0.09, + "learning_rate": 1.8258708399673798e-07, + "loss": 0.0256, + "step": 4534 + }, + { + "epoch": 0.09, + "learning_rate": 1.8258320065240185e-07, + "loss": 0.1322, + "step": 4535 + }, + { + "epoch": 0.09, + "learning_rate": 1.825793173080657e-07, + "loss": 0.0385, + "step": 4536 + }, + { + "epoch": 0.09, + "learning_rate": 1.8257543396372956e-07, + "loss": 0.0301, + "step": 4537 + }, + { + "epoch": 0.09, + "learning_rate": 1.825715506193934e-07, + "loss": 0.1081, + "step": 4538 + }, + { + "epoch": 0.09, + "learning_rate": 1.8256766727505728e-07, + "loss": 0.2152, + "step": 4539 + }, + { + "epoch": 0.09, + "learning_rate": 1.8256378393072113e-07, + "loss": 0.0282, + "step": 4540 + }, + { + "epoch": 0.09, + "learning_rate": 1.82559900586385e-07, + "loss": 0.0288, + "step": 4541 + }, + { + "epoch": 0.09, + "learning_rate": 1.8255601724204884e-07, + "loss": 0.0597, + "step": 4542 + }, + { + "epoch": 0.09, + "learning_rate": 1.8255213389771271e-07, + "loss": 0.3629, + "step": 4543 + }, + { + "epoch": 0.09, + "learning_rate": 1.8254825055337656e-07, + "loss": 0.081, + "step": 4544 + }, + { + "epoch": 0.09, + "learning_rate": 1.825443672090404e-07, + "loss": 0.0749, + "step": 4545 + }, + { + "epoch": 0.09, + "learning_rate": 1.8254048386470428e-07, + "loss": 0.0322, + "step": 4546 + }, + { + "epoch": 0.09, + "learning_rate": 1.8253660052036812e-07, + "loss": 0.0255, + "step": 4547 + }, + { + "epoch": 0.09, + "learning_rate": 1.82532717176032e-07, + "loss": 0.0214, + "step": 4548 + }, + { + "epoch": 0.09, + "learning_rate": 1.8252883383169584e-07, + "loss": 0.044, + "step": 4549 + }, + { + "epoch": 0.09, + "learning_rate": 1.825249504873597e-07, + "loss": 0.0284, + "step": 4550 + }, + { + "epoch": 0.09, + "learning_rate": 1.8252106714302355e-07, + "loss": 0.1422, + "step": 4551 + }, + { + "epoch": 0.09, + "learning_rate": 1.8251718379868742e-07, + "loss": 0.3879, + "step": 4552 + }, + { + "epoch": 0.09, + "learning_rate": 1.8251330045435127e-07, + "loss": 0.0975, + "step": 4553 + }, + { + "epoch": 0.09, + "learning_rate": 1.8250941711001514e-07, + "loss": 0.1936, + "step": 4554 + }, + { + "epoch": 0.09, + "learning_rate": 1.8250553376567899e-07, + "loss": 0.5717, + "step": 4555 + }, + { + "epoch": 0.09, + "learning_rate": 1.8250165042134286e-07, + "loss": 0.0645, + "step": 4556 + }, + { + "epoch": 0.09, + "learning_rate": 1.824977670770067e-07, + "loss": 0.0467, + "step": 4557 + }, + { + "epoch": 0.09, + "learning_rate": 1.8249388373267057e-07, + "loss": 0.0388, + "step": 4558 + }, + { + "epoch": 0.09, + "learning_rate": 1.8249000038833442e-07, + "loss": 0.0399, + "step": 4559 + }, + { + "epoch": 0.09, + "learning_rate": 1.824861170439983e-07, + "loss": 0.3401, + "step": 4560 + }, + { + "epoch": 0.09, + "learning_rate": 1.8248223369966214e-07, + "loss": 0.0548, + "step": 4561 + }, + { + "epoch": 0.09, + "learning_rate": 1.82478350355326e-07, + "loss": 0.0297, + "step": 4562 + }, + { + "epoch": 0.09, + "learning_rate": 1.8247446701098985e-07, + "loss": 0.1108, + "step": 4563 + }, + { + "epoch": 0.09, + "learning_rate": 1.824705836666537e-07, + "loss": 0.0207, + "step": 4564 + }, + { + "epoch": 0.09, + "learning_rate": 1.8246670032231757e-07, + "loss": 0.0413, + "step": 4565 + }, + { + "epoch": 0.09, + "learning_rate": 1.8246281697798141e-07, + "loss": 0.0327, + "step": 4566 + }, + { + "epoch": 0.09, + "learning_rate": 1.8245893363364529e-07, + "loss": 0.0313, + "step": 4567 + }, + { + "epoch": 0.09, + "learning_rate": 1.8245505028930913e-07, + "loss": 0.0967, + "step": 4568 + }, + { + "epoch": 0.09, + "learning_rate": 1.82451166944973e-07, + "loss": 0.0267, + "step": 4569 + }, + { + "epoch": 0.09, + "learning_rate": 1.8244728360063685e-07, + "loss": 0.0249, + "step": 4570 + }, + { + "epoch": 0.09, + "learning_rate": 1.8244340025630072e-07, + "loss": 0.4374, + "step": 4571 + }, + { + "epoch": 0.09, + "learning_rate": 1.8243951691196456e-07, + "loss": 0.0512, + "step": 4572 + }, + { + "epoch": 0.09, + "learning_rate": 1.8243563356762843e-07, + "loss": 0.2154, + "step": 4573 + }, + { + "epoch": 0.09, + "learning_rate": 1.8243175022329228e-07, + "loss": 0.0473, + "step": 4574 + }, + { + "epoch": 0.09, + "learning_rate": 1.8242786687895615e-07, + "loss": 0.0761, + "step": 4575 + }, + { + "epoch": 0.09, + "learning_rate": 1.8242398353462e-07, + "loss": 0.1032, + "step": 4576 + }, + { + "epoch": 0.09, + "learning_rate": 1.8242010019028387e-07, + "loss": 0.0416, + "step": 4577 + }, + { + "epoch": 0.09, + "learning_rate": 1.824162168459477e-07, + "loss": 0.3899, + "step": 4578 + }, + { + "epoch": 0.09, + "learning_rate": 1.8241233350161158e-07, + "loss": 0.0579, + "step": 4579 + }, + { + "epoch": 0.09, + "learning_rate": 1.8240845015727543e-07, + "loss": 0.0554, + "step": 4580 + }, + { + "epoch": 0.09, + "learning_rate": 1.824045668129393e-07, + "loss": 0.3372, + "step": 4581 + }, + { + "epoch": 0.09, + "learning_rate": 1.8240068346860315e-07, + "loss": 0.0263, + "step": 4582 + }, + { + "epoch": 0.09, + "learning_rate": 1.8239680012426702e-07, + "loss": 0.0483, + "step": 4583 + }, + { + "epoch": 0.09, + "learning_rate": 1.8239291677993086e-07, + "loss": 0.0289, + "step": 4584 + }, + { + "epoch": 0.09, + "learning_rate": 1.8238903343559473e-07, + "loss": 0.0312, + "step": 4585 + }, + { + "epoch": 0.09, + "learning_rate": 1.8238515009125858e-07, + "loss": 0.175, + "step": 4586 + }, + { + "epoch": 0.09, + "learning_rate": 1.8238126674692245e-07, + "loss": 0.0229, + "step": 4587 + }, + { + "epoch": 0.09, + "learning_rate": 1.823773834025863e-07, + "loss": 0.0993, + "step": 4588 + }, + { + "epoch": 0.09, + "learning_rate": 1.8237350005825017e-07, + "loss": 0.0377, + "step": 4589 + }, + { + "epoch": 0.09, + "learning_rate": 1.82369616713914e-07, + "loss": 0.2264, + "step": 4590 + }, + { + "epoch": 0.09, + "learning_rate": 1.8236573336957788e-07, + "loss": 0.0272, + "step": 4591 + }, + { + "epoch": 0.09, + "learning_rate": 1.8236185002524173e-07, + "loss": 0.0299, + "step": 4592 + }, + { + "epoch": 0.09, + "learning_rate": 1.823579666809056e-07, + "loss": 0.047, + "step": 4593 + }, + { + "epoch": 0.09, + "learning_rate": 1.8235408333656944e-07, + "loss": 0.0446, + "step": 4594 + }, + { + "epoch": 0.09, + "learning_rate": 1.8235019999223332e-07, + "loss": 0.0811, + "step": 4595 + }, + { + "epoch": 0.09, + "learning_rate": 1.8234631664789716e-07, + "loss": 0.0213, + "step": 4596 + }, + { + "epoch": 0.09, + "learning_rate": 1.8234243330356103e-07, + "loss": 0.0357, + "step": 4597 + }, + { + "epoch": 0.09, + "learning_rate": 1.8233854995922488e-07, + "loss": 0.1067, + "step": 4598 + }, + { + "epoch": 0.09, + "learning_rate": 1.8233466661488875e-07, + "loss": 0.1227, + "step": 4599 + }, + { + "epoch": 0.09, + "learning_rate": 1.823307832705526e-07, + "loss": 0.0379, + "step": 4600 + }, + { + "epoch": 0.09, + "learning_rate": 1.8232689992621647e-07, + "loss": 0.1266, + "step": 4601 + }, + { + "epoch": 0.09, + "learning_rate": 1.823230165818803e-07, + "loss": 0.2195, + "step": 4602 + }, + { + "epoch": 0.09, + "learning_rate": 1.8231913323754416e-07, + "loss": 0.0257, + "step": 4603 + }, + { + "epoch": 0.09, + "learning_rate": 1.82315249893208e-07, + "loss": 0.0385, + "step": 4604 + }, + { + "epoch": 0.09, + "learning_rate": 1.8231136654887187e-07, + "loss": 0.0276, + "step": 4605 + }, + { + "epoch": 0.09, + "learning_rate": 1.8230748320453572e-07, + "loss": 0.0237, + "step": 4606 + }, + { + "epoch": 0.09, + "learning_rate": 1.823035998601996e-07, + "loss": 0.1603, + "step": 4607 + }, + { + "epoch": 0.09, + "learning_rate": 1.8229971651586343e-07, + "loss": 0.0406, + "step": 4608 + }, + { + "epoch": 0.09, + "learning_rate": 1.822958331715273e-07, + "loss": 0.0293, + "step": 4609 + }, + { + "epoch": 0.09, + "learning_rate": 1.8229194982719115e-07, + "loss": 0.5943, + "step": 4610 + }, + { + "epoch": 0.09, + "learning_rate": 1.8228806648285502e-07, + "loss": 0.0724, + "step": 4611 + }, + { + "epoch": 0.09, + "learning_rate": 1.8228418313851887e-07, + "loss": 0.0352, + "step": 4612 + }, + { + "epoch": 0.09, + "learning_rate": 1.8228029979418274e-07, + "loss": 0.0209, + "step": 4613 + }, + { + "epoch": 0.09, + "learning_rate": 1.8227641644984658e-07, + "loss": 0.0237, + "step": 4614 + }, + { + "epoch": 0.09, + "learning_rate": 1.8227253310551045e-07, + "loss": 0.0235, + "step": 4615 + }, + { + "epoch": 0.09, + "learning_rate": 1.822686497611743e-07, + "loss": 0.0539, + "step": 4616 + }, + { + "epoch": 0.09, + "learning_rate": 1.8226476641683817e-07, + "loss": 0.0409, + "step": 4617 + }, + { + "epoch": 0.09, + "learning_rate": 1.8226088307250202e-07, + "loss": 0.1244, + "step": 4618 + }, + { + "epoch": 0.09, + "learning_rate": 1.822569997281659e-07, + "loss": 0.0317, + "step": 4619 + }, + { + "epoch": 0.09, + "learning_rate": 1.8225311638382973e-07, + "loss": 0.044, + "step": 4620 + }, + { + "epoch": 0.09, + "learning_rate": 1.822492330394936e-07, + "loss": 0.0248, + "step": 4621 + }, + { + "epoch": 0.09, + "learning_rate": 1.8224534969515745e-07, + "loss": 0.0224, + "step": 4622 + }, + { + "epoch": 0.09, + "learning_rate": 1.8224146635082132e-07, + "loss": 0.064, + "step": 4623 + }, + { + "epoch": 0.09, + "learning_rate": 1.8223758300648517e-07, + "loss": 0.0276, + "step": 4624 + }, + { + "epoch": 0.09, + "learning_rate": 1.8223369966214904e-07, + "loss": 0.048, + "step": 4625 + }, + { + "epoch": 0.09, + "learning_rate": 1.8222981631781288e-07, + "loss": 0.1869, + "step": 4626 + }, + { + "epoch": 0.09, + "learning_rate": 1.8222593297347675e-07, + "loss": 0.0222, + "step": 4627 + }, + { + "epoch": 0.09, + "learning_rate": 1.822220496291406e-07, + "loss": 0.0389, + "step": 4628 + }, + { + "epoch": 0.09, + "learning_rate": 1.8221816628480447e-07, + "loss": 0.2159, + "step": 4629 + }, + { + "epoch": 0.09, + "learning_rate": 1.8221428294046831e-07, + "loss": 0.5829, + "step": 4630 + }, + { + "epoch": 0.09, + "learning_rate": 1.8221039959613219e-07, + "loss": 0.0326, + "step": 4631 + }, + { + "epoch": 0.09, + "learning_rate": 1.8220651625179603e-07, + "loss": 0.5127, + "step": 4632 + }, + { + "epoch": 0.09, + "learning_rate": 1.822026329074599e-07, + "loss": 0.072, + "step": 4633 + }, + { + "epoch": 0.09, + "learning_rate": 1.8219874956312375e-07, + "loss": 0.532, + "step": 4634 + }, + { + "epoch": 0.09, + "learning_rate": 1.8219486621878762e-07, + "loss": 0.0347, + "step": 4635 + }, + { + "epoch": 0.09, + "learning_rate": 1.8219098287445146e-07, + "loss": 0.0522, + "step": 4636 + }, + { + "epoch": 0.09, + "learning_rate": 1.8218709953011534e-07, + "loss": 0.0214, + "step": 4637 + }, + { + "epoch": 0.09, + "learning_rate": 1.8218321618577918e-07, + "loss": 0.0403, + "step": 4638 + }, + { + "epoch": 0.09, + "learning_rate": 1.8217933284144305e-07, + "loss": 0.2504, + "step": 4639 + }, + { + "epoch": 0.09, + "learning_rate": 1.821754494971069e-07, + "loss": 0.0256, + "step": 4640 + }, + { + "epoch": 0.09, + "learning_rate": 1.8217156615277077e-07, + "loss": 0.0249, + "step": 4641 + }, + { + "epoch": 0.09, + "learning_rate": 1.8216768280843461e-07, + "loss": 0.0652, + "step": 4642 + }, + { + "epoch": 0.09, + "learning_rate": 1.8216379946409849e-07, + "loss": 0.8233, + "step": 4643 + }, + { + "epoch": 0.09, + "learning_rate": 1.8215991611976233e-07, + "loss": 0.0404, + "step": 4644 + }, + { + "epoch": 0.09, + "learning_rate": 1.821560327754262e-07, + "loss": 0.5501, + "step": 4645 + }, + { + "epoch": 0.09, + "learning_rate": 1.8215214943109005e-07, + "loss": 0.0287, + "step": 4646 + }, + { + "epoch": 0.09, + "learning_rate": 1.8214826608675392e-07, + "loss": 0.3936, + "step": 4647 + }, + { + "epoch": 0.09, + "learning_rate": 1.8214438274241776e-07, + "loss": 0.0227, + "step": 4648 + }, + { + "epoch": 0.09, + "learning_rate": 1.8214049939808163e-07, + "loss": 0.0241, + "step": 4649 + }, + { + "epoch": 0.09, + "learning_rate": 1.8213661605374548e-07, + "loss": 0.03, + "step": 4650 + }, + { + "epoch": 0.09, + "learning_rate": 1.8213273270940935e-07, + "loss": 0.139, + "step": 4651 + }, + { + "epoch": 0.09, + "learning_rate": 1.821288493650732e-07, + "loss": 0.1859, + "step": 4652 + }, + { + "epoch": 0.09, + "learning_rate": 1.8212496602073707e-07, + "loss": 0.0201, + "step": 4653 + }, + { + "epoch": 0.09, + "learning_rate": 1.821210826764009e-07, + "loss": 0.2687, + "step": 4654 + }, + { + "epoch": 0.09, + "learning_rate": 1.8211719933206478e-07, + "loss": 0.0618, + "step": 4655 + }, + { + "epoch": 0.09, + "learning_rate": 1.8211331598772863e-07, + "loss": 0.037, + "step": 4656 + }, + { + "epoch": 0.09, + "learning_rate": 1.821094326433925e-07, + "loss": 0.0233, + "step": 4657 + }, + { + "epoch": 0.09, + "learning_rate": 1.8210554929905635e-07, + "loss": 0.0243, + "step": 4658 + }, + { + "epoch": 0.09, + "learning_rate": 1.8210166595472022e-07, + "loss": 0.0262, + "step": 4659 + }, + { + "epoch": 0.09, + "learning_rate": 1.8209778261038406e-07, + "loss": 0.1087, + "step": 4660 + }, + { + "epoch": 0.09, + "learning_rate": 1.820938992660479e-07, + "loss": 0.0298, + "step": 4661 + }, + { + "epoch": 0.09, + "learning_rate": 1.8209001592171175e-07, + "loss": 0.037, + "step": 4662 + }, + { + "epoch": 0.09, + "learning_rate": 1.8208613257737562e-07, + "loss": 0.1793, + "step": 4663 + }, + { + "epoch": 0.09, + "learning_rate": 1.8208224923303947e-07, + "loss": 0.0489, + "step": 4664 + }, + { + "epoch": 0.09, + "learning_rate": 1.8207836588870334e-07, + "loss": 0.0454, + "step": 4665 + }, + { + "epoch": 0.09, + "learning_rate": 1.8207448254436719e-07, + "loss": 0.8105, + "step": 4666 + }, + { + "epoch": 0.09, + "learning_rate": 1.8207059920003106e-07, + "loss": 0.0291, + "step": 4667 + }, + { + "epoch": 0.09, + "learning_rate": 1.820667158556949e-07, + "loss": 0.0404, + "step": 4668 + }, + { + "epoch": 0.09, + "learning_rate": 1.8206283251135877e-07, + "loss": 0.4487, + "step": 4669 + }, + { + "epoch": 0.09, + "learning_rate": 1.8205894916702262e-07, + "loss": 0.0538, + "step": 4670 + }, + { + "epoch": 0.09, + "learning_rate": 1.820550658226865e-07, + "loss": 0.1304, + "step": 4671 + }, + { + "epoch": 0.09, + "learning_rate": 1.8205118247835033e-07, + "loss": 0.1293, + "step": 4672 + }, + { + "epoch": 0.09, + "learning_rate": 1.820472991340142e-07, + "loss": 0.6434, + "step": 4673 + }, + { + "epoch": 0.09, + "learning_rate": 1.8204341578967805e-07, + "loss": 0.0326, + "step": 4674 + }, + { + "epoch": 0.09, + "learning_rate": 1.8203953244534192e-07, + "loss": 0.0506, + "step": 4675 + }, + { + "epoch": 0.09, + "learning_rate": 1.8203564910100577e-07, + "loss": 0.5465, + "step": 4676 + }, + { + "epoch": 0.09, + "learning_rate": 1.8203176575666964e-07, + "loss": 0.4044, + "step": 4677 + }, + { + "epoch": 0.09, + "learning_rate": 1.8202788241233348e-07, + "loss": 0.1847, + "step": 4678 + }, + { + "epoch": 0.09, + "learning_rate": 1.8202399906799736e-07, + "loss": 0.0533, + "step": 4679 + }, + { + "epoch": 0.09, + "learning_rate": 1.820201157236612e-07, + "loss": 0.126, + "step": 4680 + }, + { + "epoch": 0.09, + "learning_rate": 1.8201623237932507e-07, + "loss": 0.0233, + "step": 4681 + }, + { + "epoch": 0.09, + "learning_rate": 1.8201234903498892e-07, + "loss": 0.4034, + "step": 4682 + }, + { + "epoch": 0.09, + "learning_rate": 1.820084656906528e-07, + "loss": 0.0309, + "step": 4683 + }, + { + "epoch": 0.09, + "learning_rate": 1.8200458234631663e-07, + "loss": 0.36, + "step": 4684 + }, + { + "epoch": 0.09, + "learning_rate": 1.820006990019805e-07, + "loss": 0.0992, + "step": 4685 + }, + { + "epoch": 0.09, + "learning_rate": 1.8199681565764435e-07, + "loss": 0.0922, + "step": 4686 + }, + { + "epoch": 0.09, + "learning_rate": 1.8199293231330822e-07, + "loss": 0.1675, + "step": 4687 + }, + { + "epoch": 0.09, + "learning_rate": 1.8198904896897207e-07, + "loss": 0.0502, + "step": 4688 + }, + { + "epoch": 0.09, + "learning_rate": 1.8198516562463594e-07, + "loss": 0.0245, + "step": 4689 + }, + { + "epoch": 0.09, + "learning_rate": 1.8198128228029978e-07, + "loss": 0.0258, + "step": 4690 + }, + { + "epoch": 0.09, + "learning_rate": 1.8197739893596365e-07, + "loss": 0.1751, + "step": 4691 + }, + { + "epoch": 0.09, + "learning_rate": 1.819735155916275e-07, + "loss": 0.1374, + "step": 4692 + }, + { + "epoch": 0.09, + "learning_rate": 1.8196963224729137e-07, + "loss": 0.2436, + "step": 4693 + }, + { + "epoch": 0.09, + "learning_rate": 1.8196574890295522e-07, + "loss": 0.0505, + "step": 4694 + }, + { + "epoch": 0.09, + "learning_rate": 1.819618655586191e-07, + "loss": 0.0241, + "step": 4695 + }, + { + "epoch": 0.09, + "learning_rate": 1.8195798221428293e-07, + "loss": 0.07, + "step": 4696 + }, + { + "epoch": 0.09, + "learning_rate": 1.819540988699468e-07, + "loss": 0.5174, + "step": 4697 + }, + { + "epoch": 0.09, + "learning_rate": 1.8195021552561065e-07, + "loss": 0.0607, + "step": 4698 + }, + { + "epoch": 0.09, + "learning_rate": 1.8194633218127452e-07, + "loss": 0.1547, + "step": 4699 + }, + { + "epoch": 0.09, + "learning_rate": 1.8194244883693837e-07, + "loss": 0.0297, + "step": 4700 + }, + { + "epoch": 0.09, + "learning_rate": 1.8193856549260224e-07, + "loss": 0.1303, + "step": 4701 + }, + { + "epoch": 0.09, + "learning_rate": 1.8193468214826608e-07, + "loss": 0.3082, + "step": 4702 + }, + { + "epoch": 0.09, + "learning_rate": 1.8193079880392995e-07, + "loss": 0.0795, + "step": 4703 + }, + { + "epoch": 0.09, + "learning_rate": 1.819269154595938e-07, + "loss": 0.0404, + "step": 4704 + }, + { + "epoch": 0.09, + "learning_rate": 1.8192303211525767e-07, + "loss": 0.0651, + "step": 4705 + }, + { + "epoch": 0.09, + "learning_rate": 1.8191914877092151e-07, + "loss": 0.0873, + "step": 4706 + }, + { + "epoch": 0.09, + "learning_rate": 1.8191526542658539e-07, + "loss": 0.0686, + "step": 4707 + }, + { + "epoch": 0.09, + "learning_rate": 1.8191138208224923e-07, + "loss": 0.0427, + "step": 4708 + }, + { + "epoch": 0.09, + "learning_rate": 1.819074987379131e-07, + "loss": 0.0847, + "step": 4709 + }, + { + "epoch": 0.09, + "learning_rate": 1.8190361539357695e-07, + "loss": 0.226, + "step": 4710 + }, + { + "epoch": 0.09, + "learning_rate": 1.818997320492408e-07, + "loss": 0.1018, + "step": 4711 + }, + { + "epoch": 0.09, + "learning_rate": 1.8189584870490466e-07, + "loss": 0.2413, + "step": 4712 + }, + { + "epoch": 0.09, + "learning_rate": 1.818919653605685e-07, + "loss": 0.0382, + "step": 4713 + }, + { + "epoch": 0.09, + "learning_rate": 1.8188808201623238e-07, + "loss": 0.0242, + "step": 4714 + }, + { + "epoch": 0.09, + "learning_rate": 1.8188419867189623e-07, + "loss": 0.1202, + "step": 4715 + }, + { + "epoch": 0.09, + "learning_rate": 1.818803153275601e-07, + "loss": 0.3067, + "step": 4716 + }, + { + "epoch": 0.09, + "learning_rate": 1.8187643198322394e-07, + "loss": 0.3275, + "step": 4717 + }, + { + "epoch": 0.09, + "learning_rate": 1.8187254863888781e-07, + "loss": 0.0817, + "step": 4718 + }, + { + "epoch": 0.09, + "learning_rate": 1.8186866529455166e-07, + "loss": 0.0273, + "step": 4719 + }, + { + "epoch": 0.09, + "learning_rate": 1.818647819502155e-07, + "loss": 0.0692, + "step": 4720 + }, + { + "epoch": 0.09, + "learning_rate": 1.8186089860587938e-07, + "loss": 0.0328, + "step": 4721 + }, + { + "epoch": 0.09, + "learning_rate": 1.8185701526154322e-07, + "loss": 0.0261, + "step": 4722 + }, + { + "epoch": 0.09, + "learning_rate": 1.818531319172071e-07, + "loss": 0.0448, + "step": 4723 + }, + { + "epoch": 0.09, + "learning_rate": 1.8184924857287094e-07, + "loss": 0.0327, + "step": 4724 + }, + { + "epoch": 0.09, + "learning_rate": 1.818453652285348e-07, + "loss": 0.1214, + "step": 4725 + }, + { + "epoch": 0.09, + "learning_rate": 1.8184148188419865e-07, + "loss": 0.0556, + "step": 4726 + }, + { + "epoch": 0.09, + "learning_rate": 1.8183759853986252e-07, + "loss": 0.2132, + "step": 4727 + }, + { + "epoch": 0.09, + "learning_rate": 1.8183371519552637e-07, + "loss": 0.0251, + "step": 4728 + }, + { + "epoch": 0.09, + "learning_rate": 1.8182983185119024e-07, + "loss": 0.0215, + "step": 4729 + }, + { + "epoch": 0.09, + "learning_rate": 1.8182594850685409e-07, + "loss": 0.4635, + "step": 4730 + }, + { + "epoch": 0.09, + "learning_rate": 1.8182206516251796e-07, + "loss": 0.0432, + "step": 4731 + }, + { + "epoch": 0.09, + "learning_rate": 1.818181818181818e-07, + "loss": 0.0408, + "step": 4732 + }, + { + "epoch": 0.09, + "learning_rate": 1.8181429847384567e-07, + "loss": 0.031, + "step": 4733 + }, + { + "epoch": 0.09, + "learning_rate": 1.8181041512950952e-07, + "loss": 0.2978, + "step": 4734 + }, + { + "epoch": 0.09, + "learning_rate": 1.818065317851734e-07, + "loss": 0.0644, + "step": 4735 + }, + { + "epoch": 0.09, + "learning_rate": 1.8180264844083724e-07, + "loss": 0.0819, + "step": 4736 + }, + { + "epoch": 0.09, + "learning_rate": 1.817987650965011e-07, + "loss": 0.0885, + "step": 4737 + }, + { + "epoch": 0.09, + "learning_rate": 1.8179488175216495e-07, + "loss": 0.3917, + "step": 4738 + }, + { + "epoch": 0.09, + "learning_rate": 1.8179099840782882e-07, + "loss": 0.1254, + "step": 4739 + }, + { + "epoch": 0.09, + "learning_rate": 1.8178711506349267e-07, + "loss": 0.0204, + "step": 4740 + }, + { + "epoch": 0.09, + "learning_rate": 1.8178323171915651e-07, + "loss": 0.0315, + "step": 4741 + }, + { + "epoch": 0.09, + "learning_rate": 1.8177934837482039e-07, + "loss": 0.1548, + "step": 4742 + }, + { + "epoch": 0.09, + "learning_rate": 1.8177546503048423e-07, + "loss": 0.0354, + "step": 4743 + }, + { + "epoch": 0.09, + "learning_rate": 1.817715816861481e-07, + "loss": 0.0524, + "step": 4744 + }, + { + "epoch": 0.09, + "learning_rate": 1.8176769834181195e-07, + "loss": 0.033, + "step": 4745 + }, + { + "epoch": 0.09, + "learning_rate": 1.8176381499747582e-07, + "loss": 0.0675, + "step": 4746 + }, + { + "epoch": 0.09, + "learning_rate": 1.8175993165313966e-07, + "loss": 0.1015, + "step": 4747 + }, + { + "epoch": 0.09, + "learning_rate": 1.8175604830880353e-07, + "loss": 0.2698, + "step": 4748 + }, + { + "epoch": 0.09, + "learning_rate": 1.8175216496446738e-07, + "loss": 0.0383, + "step": 4749 + }, + { + "epoch": 0.09, + "learning_rate": 1.8174828162013125e-07, + "loss": 0.0824, + "step": 4750 + }, + { + "epoch": 0.09, + "learning_rate": 1.817443982757951e-07, + "loss": 0.1921, + "step": 4751 + }, + { + "epoch": 0.09, + "learning_rate": 1.8174051493145897e-07, + "loss": 0.0512, + "step": 4752 + }, + { + "epoch": 0.09, + "learning_rate": 1.817366315871228e-07, + "loss": 0.0647, + "step": 4753 + }, + { + "epoch": 0.09, + "learning_rate": 1.8173274824278668e-07, + "loss": 0.0221, + "step": 4754 + }, + { + "epoch": 0.09, + "learning_rate": 1.8172886489845053e-07, + "loss": 0.1255, + "step": 4755 + }, + { + "epoch": 0.09, + "learning_rate": 1.817249815541144e-07, + "loss": 0.3372, + "step": 4756 + }, + { + "epoch": 0.09, + "learning_rate": 1.8172109820977825e-07, + "loss": 0.0256, + "step": 4757 + }, + { + "epoch": 0.09, + "learning_rate": 1.8171721486544212e-07, + "loss": 0.2686, + "step": 4758 + }, + { + "epoch": 0.09, + "learning_rate": 1.8171333152110596e-07, + "loss": 0.038, + "step": 4759 + }, + { + "epoch": 0.09, + "learning_rate": 1.8170944817676983e-07, + "loss": 0.0537, + "step": 4760 + }, + { + "epoch": 0.09, + "learning_rate": 1.8170556483243368e-07, + "loss": 0.0509, + "step": 4761 + }, + { + "epoch": 0.09, + "learning_rate": 1.8170168148809755e-07, + "loss": 0.0491, + "step": 4762 + }, + { + "epoch": 0.09, + "learning_rate": 1.816977981437614e-07, + "loss": 0.0767, + "step": 4763 + }, + { + "epoch": 0.09, + "learning_rate": 1.8169391479942527e-07, + "loss": 0.0271, + "step": 4764 + }, + { + "epoch": 0.09, + "learning_rate": 1.816900314550891e-07, + "loss": 0.0415, + "step": 4765 + }, + { + "epoch": 0.09, + "learning_rate": 1.8168614811075298e-07, + "loss": 0.054, + "step": 4766 + }, + { + "epoch": 0.09, + "learning_rate": 1.8168226476641683e-07, + "loss": 0.0875, + "step": 4767 + }, + { + "epoch": 0.09, + "learning_rate": 1.816783814220807e-07, + "loss": 0.4302, + "step": 4768 + }, + { + "epoch": 0.09, + "learning_rate": 1.8167449807774454e-07, + "loss": 0.0519, + "step": 4769 + }, + { + "epoch": 0.09, + "learning_rate": 1.8167061473340842e-07, + "loss": 0.6301, + "step": 4770 + }, + { + "epoch": 0.09, + "learning_rate": 1.8166673138907226e-07, + "loss": 0.0526, + "step": 4771 + }, + { + "epoch": 0.09, + "learning_rate": 1.8166284804473613e-07, + "loss": 0.3687, + "step": 4772 + }, + { + "epoch": 0.09, + "learning_rate": 1.8165896470039998e-07, + "loss": 0.103, + "step": 4773 + }, + { + "epoch": 0.09, + "learning_rate": 1.8165508135606385e-07, + "loss": 0.0298, + "step": 4774 + }, + { + "epoch": 0.09, + "learning_rate": 1.816511980117277e-07, + "loss": 0.1157, + "step": 4775 + }, + { + "epoch": 0.09, + "learning_rate": 1.8164731466739157e-07, + "loss": 0.084, + "step": 4776 + }, + { + "epoch": 0.09, + "learning_rate": 1.8164343132305538e-07, + "loss": 0.6936, + "step": 4777 + }, + { + "epoch": 0.09, + "learning_rate": 1.8163954797871926e-07, + "loss": 0.0636, + "step": 4778 + }, + { + "epoch": 0.09, + "learning_rate": 1.816356646343831e-07, + "loss": 0.024, + "step": 4779 + }, + { + "epoch": 0.09, + "learning_rate": 1.8163178129004697e-07, + "loss": 0.039, + "step": 4780 + }, + { + "epoch": 0.09, + "learning_rate": 1.8162789794571082e-07, + "loss": 0.0208, + "step": 4781 + }, + { + "epoch": 0.09, + "learning_rate": 1.816240146013747e-07, + "loss": 0.0387, + "step": 4782 + }, + { + "epoch": 0.09, + "learning_rate": 1.8162013125703853e-07, + "loss": 0.3349, + "step": 4783 + }, + { + "epoch": 0.09, + "learning_rate": 1.816162479127024e-07, + "loss": 0.5702, + "step": 4784 + }, + { + "epoch": 0.09, + "learning_rate": 1.8161236456836625e-07, + "loss": 0.024, + "step": 4785 + }, + { + "epoch": 0.09, + "learning_rate": 1.8160848122403012e-07, + "loss": 0.184, + "step": 4786 + }, + { + "epoch": 0.09, + "learning_rate": 1.8160459787969397e-07, + "loss": 0.038, + "step": 4787 + }, + { + "epoch": 0.09, + "learning_rate": 1.8160071453535784e-07, + "loss": 0.4071, + "step": 4788 + }, + { + "epoch": 0.09, + "learning_rate": 1.8159683119102168e-07, + "loss": 0.4058, + "step": 4789 + }, + { + "epoch": 0.09, + "learning_rate": 1.8159294784668555e-07, + "loss": 0.0302, + "step": 4790 + }, + { + "epoch": 0.09, + "learning_rate": 1.815890645023494e-07, + "loss": 0.0331, + "step": 4791 + }, + { + "epoch": 0.09, + "learning_rate": 1.8158518115801327e-07, + "loss": 0.0219, + "step": 4792 + }, + { + "epoch": 0.09, + "learning_rate": 1.8158129781367712e-07, + "loss": 0.207, + "step": 4793 + }, + { + "epoch": 0.09, + "learning_rate": 1.81577414469341e-07, + "loss": 0.1326, + "step": 4794 + }, + { + "epoch": 0.09, + "learning_rate": 1.8157353112500483e-07, + "loss": 0.4832, + "step": 4795 + }, + { + "epoch": 0.09, + "learning_rate": 1.815696477806687e-07, + "loss": 0.0222, + "step": 4796 + }, + { + "epoch": 0.09, + "learning_rate": 1.8156576443633255e-07, + "loss": 0.0788, + "step": 4797 + }, + { + "epoch": 0.09, + "learning_rate": 1.8156188109199642e-07, + "loss": 0.0399, + "step": 4798 + }, + { + "epoch": 0.09, + "learning_rate": 1.8155799774766027e-07, + "loss": 0.0232, + "step": 4799 + }, + { + "epoch": 0.09, + "learning_rate": 1.8155411440332414e-07, + "loss": 0.1443, + "step": 4800 + }, + { + "epoch": 0.09, + "learning_rate": 1.8155023105898798e-07, + "loss": 0.0259, + "step": 4801 + }, + { + "epoch": 0.09, + "learning_rate": 1.8154634771465185e-07, + "loss": 0.0301, + "step": 4802 + }, + { + "epoch": 0.09, + "learning_rate": 1.815424643703157e-07, + "loss": 0.0223, + "step": 4803 + }, + { + "epoch": 0.09, + "learning_rate": 1.8153858102597957e-07, + "loss": 0.0252, + "step": 4804 + }, + { + "epoch": 0.09, + "learning_rate": 1.8153469768164341e-07, + "loss": 0.1941, + "step": 4805 + }, + { + "epoch": 0.09, + "learning_rate": 1.8153081433730729e-07, + "loss": 0.5963, + "step": 4806 + }, + { + "epoch": 0.09, + "learning_rate": 1.8152693099297113e-07, + "loss": 0.2663, + "step": 4807 + }, + { + "epoch": 0.09, + "learning_rate": 1.81523047648635e-07, + "loss": 0.0431, + "step": 4808 + }, + { + "epoch": 0.09, + "learning_rate": 1.8151916430429885e-07, + "loss": 0.0248, + "step": 4809 + }, + { + "epoch": 0.09, + "learning_rate": 1.8151528095996272e-07, + "loss": 0.0259, + "step": 4810 + }, + { + "epoch": 0.09, + "learning_rate": 1.8151139761562656e-07, + "loss": 0.0282, + "step": 4811 + }, + { + "epoch": 0.09, + "learning_rate": 1.8150751427129044e-07, + "loss": 0.0414, + "step": 4812 + }, + { + "epoch": 0.09, + "learning_rate": 1.8150363092695428e-07, + "loss": 0.1377, + "step": 4813 + }, + { + "epoch": 0.09, + "learning_rate": 1.8149974758261815e-07, + "loss": 0.1056, + "step": 4814 + }, + { + "epoch": 0.09, + "learning_rate": 1.81495864238282e-07, + "loss": 0.0393, + "step": 4815 + }, + { + "epoch": 0.09, + "learning_rate": 1.8149198089394587e-07, + "loss": 0.2233, + "step": 4816 + }, + { + "epoch": 0.09, + "learning_rate": 1.8148809754960971e-07, + "loss": 0.0846, + "step": 4817 + }, + { + "epoch": 0.09, + "learning_rate": 1.8148421420527359e-07, + "loss": 0.0214, + "step": 4818 + }, + { + "epoch": 0.09, + "learning_rate": 1.8148033086093743e-07, + "loss": 0.4032, + "step": 4819 + }, + { + "epoch": 0.09, + "learning_rate": 1.814764475166013e-07, + "loss": 0.0439, + "step": 4820 + }, + { + "epoch": 0.09, + "learning_rate": 1.8147256417226515e-07, + "loss": 0.812, + "step": 4821 + }, + { + "epoch": 0.09, + "learning_rate": 1.8146868082792902e-07, + "loss": 0.0313, + "step": 4822 + }, + { + "epoch": 0.09, + "learning_rate": 1.8146479748359286e-07, + "loss": 0.0801, + "step": 4823 + }, + { + "epoch": 0.09, + "learning_rate": 1.8146091413925673e-07, + "loss": 0.0433, + "step": 4824 + }, + { + "epoch": 0.09, + "learning_rate": 1.8145703079492058e-07, + "loss": 0.1429, + "step": 4825 + }, + { + "epoch": 0.09, + "learning_rate": 1.8145314745058445e-07, + "loss": 0.1757, + "step": 4826 + }, + { + "epoch": 0.09, + "learning_rate": 1.814492641062483e-07, + "loss": 0.0366, + "step": 4827 + }, + { + "epoch": 0.09, + "learning_rate": 1.8144538076191217e-07, + "loss": 0.3882, + "step": 4828 + }, + { + "epoch": 0.09, + "learning_rate": 1.81441497417576e-07, + "loss": 0.0246, + "step": 4829 + }, + { + "epoch": 0.09, + "learning_rate": 1.8143761407323988e-07, + "loss": 0.5582, + "step": 4830 + }, + { + "epoch": 0.09, + "learning_rate": 1.8143373072890373e-07, + "loss": 0.0348, + "step": 4831 + }, + { + "epoch": 0.09, + "learning_rate": 1.814298473845676e-07, + "loss": 0.0494, + "step": 4832 + }, + { + "epoch": 0.09, + "learning_rate": 1.8142596404023145e-07, + "loss": 0.2206, + "step": 4833 + }, + { + "epoch": 0.09, + "learning_rate": 1.8142208069589532e-07, + "loss": 0.0304, + "step": 4834 + }, + { + "epoch": 0.09, + "learning_rate": 1.8141819735155914e-07, + "loss": 0.3786, + "step": 4835 + }, + { + "epoch": 0.09, + "learning_rate": 1.81414314007223e-07, + "loss": 0.0281, + "step": 4836 + }, + { + "epoch": 0.09, + "learning_rate": 1.8141043066288685e-07, + "loss": 0.0198, + "step": 4837 + }, + { + "epoch": 0.09, + "learning_rate": 1.8140654731855072e-07, + "loss": 0.0327, + "step": 4838 + }, + { + "epoch": 0.09, + "learning_rate": 1.8140266397421457e-07, + "loss": 0.0339, + "step": 4839 + }, + { + "epoch": 0.09, + "learning_rate": 1.8139878062987844e-07, + "loss": 0.0284, + "step": 4840 + }, + { + "epoch": 0.09, + "learning_rate": 1.8139489728554229e-07, + "loss": 0.0221, + "step": 4841 + }, + { + "epoch": 0.09, + "learning_rate": 1.8139101394120616e-07, + "loss": 0.3204, + "step": 4842 + }, + { + "epoch": 0.09, + "learning_rate": 1.8138713059687e-07, + "loss": 0.4986, + "step": 4843 + }, + { + "epoch": 0.09, + "learning_rate": 1.8138324725253387e-07, + "loss": 0.0284, + "step": 4844 + }, + { + "epoch": 0.09, + "learning_rate": 1.8137936390819772e-07, + "loss": 0.0159, + "step": 4845 + }, + { + "epoch": 0.09, + "learning_rate": 1.813754805638616e-07, + "loss": 0.6054, + "step": 4846 + }, + { + "epoch": 0.09, + "learning_rate": 1.8137159721952543e-07, + "loss": 0.0684, + "step": 4847 + }, + { + "epoch": 0.09, + "learning_rate": 1.813677138751893e-07, + "loss": 0.3894, + "step": 4848 + }, + { + "epoch": 0.09, + "learning_rate": 1.8136383053085315e-07, + "loss": 0.0228, + "step": 4849 + }, + { + "epoch": 0.09, + "learning_rate": 1.8135994718651702e-07, + "loss": 0.0641, + "step": 4850 + }, + { + "epoch": 0.09, + "learning_rate": 1.8135606384218087e-07, + "loss": 0.046, + "step": 4851 + }, + { + "epoch": 0.09, + "learning_rate": 1.8135218049784474e-07, + "loss": 0.046, + "step": 4852 + }, + { + "epoch": 0.09, + "learning_rate": 1.8134829715350858e-07, + "loss": 0.0289, + "step": 4853 + }, + { + "epoch": 0.09, + "learning_rate": 1.8134441380917246e-07, + "loss": 0.3122, + "step": 4854 + }, + { + "epoch": 0.09, + "learning_rate": 1.813405304648363e-07, + "loss": 0.0204, + "step": 4855 + }, + { + "epoch": 0.09, + "learning_rate": 1.8133664712050017e-07, + "loss": 0.3171, + "step": 4856 + }, + { + "epoch": 0.09, + "learning_rate": 1.8133276377616402e-07, + "loss": 0.0571, + "step": 4857 + }, + { + "epoch": 0.09, + "learning_rate": 1.813288804318279e-07, + "loss": 0.0667, + "step": 4858 + }, + { + "epoch": 0.09, + "learning_rate": 1.8132499708749173e-07, + "loss": 0.2799, + "step": 4859 + }, + { + "epoch": 0.09, + "learning_rate": 1.813211137431556e-07, + "loss": 0.0363, + "step": 4860 + }, + { + "epoch": 0.09, + "learning_rate": 1.8131723039881945e-07, + "loss": 0.6913, + "step": 4861 + }, + { + "epoch": 0.09, + "learning_rate": 1.8131334705448332e-07, + "loss": 0.2587, + "step": 4862 + }, + { + "epoch": 0.09, + "learning_rate": 1.8130946371014717e-07, + "loss": 0.2215, + "step": 4863 + }, + { + "epoch": 0.09, + "learning_rate": 1.8130558036581104e-07, + "loss": 0.1414, + "step": 4864 + }, + { + "epoch": 0.09, + "learning_rate": 1.8130169702147488e-07, + "loss": 0.0263, + "step": 4865 + }, + { + "epoch": 0.09, + "learning_rate": 1.8129781367713875e-07, + "loss": 0.1954, + "step": 4866 + }, + { + "epoch": 0.09, + "learning_rate": 1.812939303328026e-07, + "loss": 0.0765, + "step": 4867 + }, + { + "epoch": 0.09, + "learning_rate": 1.8129004698846647e-07, + "loss": 0.2128, + "step": 4868 + }, + { + "epoch": 0.09, + "learning_rate": 1.8128616364413032e-07, + "loss": 0.0212, + "step": 4869 + }, + { + "epoch": 0.09, + "learning_rate": 1.812822802997942e-07, + "loss": 0.1174, + "step": 4870 + }, + { + "epoch": 0.09, + "learning_rate": 1.8127839695545803e-07, + "loss": 0.0452, + "step": 4871 + }, + { + "epoch": 0.09, + "learning_rate": 1.812745136111219e-07, + "loss": 0.0245, + "step": 4872 + }, + { + "epoch": 0.09, + "learning_rate": 1.8127063026678575e-07, + "loss": 0.0673, + "step": 4873 + }, + { + "epoch": 0.09, + "learning_rate": 1.8126674692244962e-07, + "loss": 0.3497, + "step": 4874 + }, + { + "epoch": 0.09, + "learning_rate": 1.8126286357811347e-07, + "loss": 0.022, + "step": 4875 + }, + { + "epoch": 0.09, + "learning_rate": 1.8125898023377734e-07, + "loss": 0.0307, + "step": 4876 + }, + { + "epoch": 0.09, + "learning_rate": 1.8125509688944118e-07, + "loss": 0.025, + "step": 4877 + }, + { + "epoch": 0.09, + "learning_rate": 1.8125121354510505e-07, + "loss": 0.027, + "step": 4878 + }, + { + "epoch": 0.09, + "learning_rate": 1.812473302007689e-07, + "loss": 0.26, + "step": 4879 + }, + { + "epoch": 0.09, + "learning_rate": 1.8124344685643277e-07, + "loss": 0.0307, + "step": 4880 + }, + { + "epoch": 0.09, + "learning_rate": 1.8123956351209661e-07, + "loss": 0.0326, + "step": 4881 + }, + { + "epoch": 0.09, + "learning_rate": 1.8123568016776049e-07, + "loss": 0.1124, + "step": 4882 + }, + { + "epoch": 0.09, + "learning_rate": 1.8123179682342433e-07, + "loss": 0.0407, + "step": 4883 + }, + { + "epoch": 0.09, + "learning_rate": 1.812279134790882e-07, + "loss": 0.0265, + "step": 4884 + }, + { + "epoch": 0.09, + "learning_rate": 1.8122403013475205e-07, + "loss": 0.0563, + "step": 4885 + }, + { + "epoch": 0.09, + "learning_rate": 1.8122014679041592e-07, + "loss": 0.5884, + "step": 4886 + }, + { + "epoch": 0.09, + "learning_rate": 1.8121626344607976e-07, + "loss": 0.031, + "step": 4887 + }, + { + "epoch": 0.09, + "learning_rate": 1.812123801017436e-07, + "loss": 0.6323, + "step": 4888 + }, + { + "epoch": 0.09, + "learning_rate": 1.8120849675740748e-07, + "loss": 0.043, + "step": 4889 + }, + { + "epoch": 0.09, + "learning_rate": 1.8120461341307133e-07, + "loss": 0.0301, + "step": 4890 + }, + { + "epoch": 0.09, + "learning_rate": 1.812007300687352e-07, + "loss": 0.0356, + "step": 4891 + }, + { + "epoch": 0.09, + "learning_rate": 1.8119684672439904e-07, + "loss": 0.074, + "step": 4892 + }, + { + "epoch": 0.09, + "learning_rate": 1.811929633800629e-07, + "loss": 0.494, + "step": 4893 + }, + { + "epoch": 0.09, + "learning_rate": 1.8118908003572676e-07, + "loss": 0.0342, + "step": 4894 + }, + { + "epoch": 0.09, + "learning_rate": 1.811851966913906e-07, + "loss": 0.0299, + "step": 4895 + }, + { + "epoch": 0.09, + "learning_rate": 1.8118131334705448e-07, + "loss": 0.0362, + "step": 4896 + }, + { + "epoch": 0.09, + "learning_rate": 1.8117743000271832e-07, + "loss": 0.0272, + "step": 4897 + }, + { + "epoch": 0.1, + "learning_rate": 1.811735466583822e-07, + "loss": 0.039, + "step": 4898 + }, + { + "epoch": 0.1, + "learning_rate": 1.8116966331404604e-07, + "loss": 0.0366, + "step": 4899 + }, + { + "epoch": 0.1, + "learning_rate": 1.811657799697099e-07, + "loss": 0.1042, + "step": 4900 + }, + { + "epoch": 0.1, + "learning_rate": 1.8116189662537375e-07, + "loss": 0.6064, + "step": 4901 + }, + { + "epoch": 0.1, + "learning_rate": 1.8115801328103762e-07, + "loss": 0.0201, + "step": 4902 + }, + { + "epoch": 0.1, + "learning_rate": 1.8115412993670147e-07, + "loss": 0.0249, + "step": 4903 + }, + { + "epoch": 0.1, + "learning_rate": 1.8115024659236534e-07, + "loss": 0.0571, + "step": 4904 + }, + { + "epoch": 0.1, + "learning_rate": 1.8114636324802919e-07, + "loss": 0.0694, + "step": 4905 + }, + { + "epoch": 0.1, + "learning_rate": 1.8114247990369306e-07, + "loss": 0.042, + "step": 4906 + }, + { + "epoch": 0.1, + "learning_rate": 1.811385965593569e-07, + "loss": 0.0228, + "step": 4907 + }, + { + "epoch": 0.1, + "learning_rate": 1.8113471321502077e-07, + "loss": 0.086, + "step": 4908 + }, + { + "epoch": 0.1, + "learning_rate": 1.8113082987068462e-07, + "loss": 0.1006, + "step": 4909 + }, + { + "epoch": 0.1, + "learning_rate": 1.811269465263485e-07, + "loss": 0.0265, + "step": 4910 + }, + { + "epoch": 0.1, + "learning_rate": 1.8112306318201234e-07, + "loss": 0.0236, + "step": 4911 + }, + { + "epoch": 0.1, + "learning_rate": 1.811191798376762e-07, + "loss": 0.0489, + "step": 4912 + }, + { + "epoch": 0.1, + "learning_rate": 1.8111529649334005e-07, + "loss": 0.138, + "step": 4913 + }, + { + "epoch": 0.1, + "learning_rate": 1.8111141314900392e-07, + "loss": 0.0667, + "step": 4914 + }, + { + "epoch": 0.1, + "learning_rate": 1.8110752980466777e-07, + "loss": 0.0222, + "step": 4915 + }, + { + "epoch": 0.1, + "learning_rate": 1.8110364646033164e-07, + "loss": 0.031, + "step": 4916 + }, + { + "epoch": 0.1, + "learning_rate": 1.8109976311599549e-07, + "loss": 0.3833, + "step": 4917 + }, + { + "epoch": 0.1, + "learning_rate": 1.8109587977165933e-07, + "loss": 0.308, + "step": 4918 + }, + { + "epoch": 0.1, + "learning_rate": 1.810919964273232e-07, + "loss": 0.0311, + "step": 4919 + }, + { + "epoch": 0.1, + "learning_rate": 1.8108811308298705e-07, + "loss": 0.0241, + "step": 4920 + }, + { + "epoch": 0.1, + "learning_rate": 1.8108422973865092e-07, + "loss": 0.049, + "step": 4921 + }, + { + "epoch": 0.1, + "learning_rate": 1.8108034639431476e-07, + "loss": 0.0492, + "step": 4922 + }, + { + "epoch": 0.1, + "learning_rate": 1.8107646304997863e-07, + "loss": 0.1574, + "step": 4923 + }, + { + "epoch": 0.1, + "learning_rate": 1.8107257970564248e-07, + "loss": 0.0246, + "step": 4924 + }, + { + "epoch": 0.1, + "learning_rate": 1.8106869636130635e-07, + "loss": 0.0209, + "step": 4925 + }, + { + "epoch": 0.1, + "learning_rate": 1.810648130169702e-07, + "loss": 0.0235, + "step": 4926 + }, + { + "epoch": 0.1, + "learning_rate": 1.8106092967263407e-07, + "loss": 0.3312, + "step": 4927 + }, + { + "epoch": 0.1, + "learning_rate": 1.810570463282979e-07, + "loss": 0.0465, + "step": 4928 + }, + { + "epoch": 0.1, + "learning_rate": 1.8105316298396178e-07, + "loss": 0.0288, + "step": 4929 + }, + { + "epoch": 0.1, + "learning_rate": 1.8104927963962563e-07, + "loss": 0.4109, + "step": 4930 + }, + { + "epoch": 0.1, + "learning_rate": 1.810453962952895e-07, + "loss": 0.0451, + "step": 4931 + }, + { + "epoch": 0.1, + "learning_rate": 1.8104151295095335e-07, + "loss": 0.066, + "step": 4932 + }, + { + "epoch": 0.1, + "learning_rate": 1.8103762960661722e-07, + "loss": 0.017, + "step": 4933 + }, + { + "epoch": 0.1, + "learning_rate": 1.8103374626228106e-07, + "loss": 0.0286, + "step": 4934 + }, + { + "epoch": 0.1, + "learning_rate": 1.8102986291794493e-07, + "loss": 0.0237, + "step": 4935 + }, + { + "epoch": 0.1, + "learning_rate": 1.8102597957360878e-07, + "loss": 0.549, + "step": 4936 + }, + { + "epoch": 0.1, + "learning_rate": 1.8102209622927265e-07, + "loss": 0.0641, + "step": 4937 + }, + { + "epoch": 0.1, + "learning_rate": 1.810182128849365e-07, + "loss": 0.0294, + "step": 4938 + }, + { + "epoch": 0.1, + "learning_rate": 1.8101432954060037e-07, + "loss": 0.0412, + "step": 4939 + }, + { + "epoch": 0.1, + "learning_rate": 1.810104461962642e-07, + "loss": 0.0341, + "step": 4940 + }, + { + "epoch": 0.1, + "learning_rate": 1.8100656285192808e-07, + "loss": 0.0352, + "step": 4941 + }, + { + "epoch": 0.1, + "learning_rate": 1.8100267950759193e-07, + "loss": 0.0289, + "step": 4942 + }, + { + "epoch": 0.1, + "learning_rate": 1.809987961632558e-07, + "loss": 0.0361, + "step": 4943 + }, + { + "epoch": 0.1, + "learning_rate": 1.8099491281891964e-07, + "loss": 0.0298, + "step": 4944 + }, + { + "epoch": 0.1, + "learning_rate": 1.8099102947458352e-07, + "loss": 0.0646, + "step": 4945 + }, + { + "epoch": 0.1, + "learning_rate": 1.8098714613024736e-07, + "loss": 0.02, + "step": 4946 + }, + { + "epoch": 0.1, + "learning_rate": 1.8098326278591123e-07, + "loss": 0.7732, + "step": 4947 + }, + { + "epoch": 0.1, + "learning_rate": 1.8097937944157508e-07, + "loss": 0.0309, + "step": 4948 + }, + { + "epoch": 0.1, + "learning_rate": 1.8097549609723895e-07, + "loss": 0.0966, + "step": 4949 + }, + { + "epoch": 0.1, + "learning_rate": 1.809716127529028e-07, + "loss": 0.0262, + "step": 4950 + }, + { + "epoch": 0.1, + "learning_rate": 1.8096772940856664e-07, + "loss": 0.0402, + "step": 4951 + }, + { + "epoch": 0.1, + "learning_rate": 1.8096384606423048e-07, + "loss": 0.0796, + "step": 4952 + }, + { + "epoch": 0.1, + "learning_rate": 1.8095996271989436e-07, + "loss": 0.0215, + "step": 4953 + }, + { + "epoch": 0.1, + "learning_rate": 1.809560793755582e-07, + "loss": 0.0425, + "step": 4954 + }, + { + "epoch": 0.1, + "learning_rate": 1.8095219603122207e-07, + "loss": 0.037, + "step": 4955 + }, + { + "epoch": 0.1, + "learning_rate": 1.8094831268688592e-07, + "loss": 0.0195, + "step": 4956 + }, + { + "epoch": 0.1, + "learning_rate": 1.809444293425498e-07, + "loss": 0.021, + "step": 4957 + }, + { + "epoch": 0.1, + "learning_rate": 1.8094054599821363e-07, + "loss": 0.094, + "step": 4958 + }, + { + "epoch": 0.1, + "learning_rate": 1.809366626538775e-07, + "loss": 0.4687, + "step": 4959 + }, + { + "epoch": 0.1, + "learning_rate": 1.8093277930954135e-07, + "loss": 0.102, + "step": 4960 + }, + { + "epoch": 0.1, + "learning_rate": 1.8092889596520522e-07, + "loss": 0.0391, + "step": 4961 + }, + { + "epoch": 0.1, + "learning_rate": 1.8092501262086907e-07, + "loss": 0.1455, + "step": 4962 + }, + { + "epoch": 0.1, + "learning_rate": 1.8092112927653294e-07, + "loss": 0.0191, + "step": 4963 + }, + { + "epoch": 0.1, + "learning_rate": 1.8091724593219678e-07, + "loss": 0.0601, + "step": 4964 + }, + { + "epoch": 0.1, + "learning_rate": 1.8091336258786065e-07, + "loss": 0.0225, + "step": 4965 + }, + { + "epoch": 0.1, + "learning_rate": 1.809094792435245e-07, + "loss": 0.0533, + "step": 4966 + }, + { + "epoch": 0.1, + "learning_rate": 1.8090559589918837e-07, + "loss": 0.805, + "step": 4967 + }, + { + "epoch": 0.1, + "learning_rate": 1.8090171255485222e-07, + "loss": 0.104, + "step": 4968 + }, + { + "epoch": 0.1, + "learning_rate": 1.808978292105161e-07, + "loss": 0.0351, + "step": 4969 + }, + { + "epoch": 0.1, + "learning_rate": 1.8089394586617993e-07, + "loss": 0.026, + "step": 4970 + }, + { + "epoch": 0.1, + "learning_rate": 1.808900625218438e-07, + "loss": 0.056, + "step": 4971 + }, + { + "epoch": 0.1, + "learning_rate": 1.8088617917750765e-07, + "loss": 0.0305, + "step": 4972 + }, + { + "epoch": 0.1, + "learning_rate": 1.8088229583317152e-07, + "loss": 0.0472, + "step": 4973 + }, + { + "epoch": 0.1, + "learning_rate": 1.8087841248883537e-07, + "loss": 0.028, + "step": 4974 + }, + { + "epoch": 0.1, + "learning_rate": 1.8087452914449924e-07, + "loss": 0.031, + "step": 4975 + }, + { + "epoch": 0.1, + "learning_rate": 1.8087064580016308e-07, + "loss": 0.0251, + "step": 4976 + }, + { + "epoch": 0.1, + "learning_rate": 1.8086676245582695e-07, + "loss": 0.0391, + "step": 4977 + }, + { + "epoch": 0.1, + "learning_rate": 1.808628791114908e-07, + "loss": 0.0719, + "step": 4978 + }, + { + "epoch": 0.1, + "learning_rate": 1.8085899576715467e-07, + "loss": 0.0249, + "step": 4979 + }, + { + "epoch": 0.1, + "learning_rate": 1.8085511242281851e-07, + "loss": 0.1301, + "step": 4980 + }, + { + "epoch": 0.1, + "learning_rate": 1.8085122907848239e-07, + "loss": 0.0213, + "step": 4981 + }, + { + "epoch": 0.1, + "learning_rate": 1.8084734573414623e-07, + "loss": 0.0306, + "step": 4982 + }, + { + "epoch": 0.1, + "learning_rate": 1.808434623898101e-07, + "loss": 0.0364, + "step": 4983 + }, + { + "epoch": 0.1, + "learning_rate": 1.8083957904547395e-07, + "loss": 0.0177, + "step": 4984 + }, + { + "epoch": 0.1, + "learning_rate": 1.8083569570113782e-07, + "loss": 0.0252, + "step": 4985 + }, + { + "epoch": 0.1, + "learning_rate": 1.8083181235680166e-07, + "loss": 0.4466, + "step": 4986 + }, + { + "epoch": 0.1, + "learning_rate": 1.8082792901246554e-07, + "loss": 0.1054, + "step": 4987 + }, + { + "epoch": 0.1, + "learning_rate": 1.8082404566812938e-07, + "loss": 0.0268, + "step": 4988 + }, + { + "epoch": 0.1, + "learning_rate": 1.8082016232379325e-07, + "loss": 0.0891, + "step": 4989 + }, + { + "epoch": 0.1, + "learning_rate": 1.808162789794571e-07, + "loss": 0.0254, + "step": 4990 + }, + { + "epoch": 0.1, + "learning_rate": 1.8081239563512097e-07, + "loss": 0.0212, + "step": 4991 + }, + { + "epoch": 0.1, + "learning_rate": 1.8080851229078481e-07, + "loss": 0.4521, + "step": 4992 + }, + { + "epoch": 0.1, + "learning_rate": 1.8080462894644869e-07, + "loss": 0.3935, + "step": 4993 + }, + { + "epoch": 0.1, + "learning_rate": 1.8080074560211253e-07, + "loss": 0.0211, + "step": 4994 + }, + { + "epoch": 0.1, + "learning_rate": 1.807968622577764e-07, + "loss": 0.5774, + "step": 4995 + }, + { + "epoch": 0.1, + "learning_rate": 1.8079297891344025e-07, + "loss": 0.3617, + "step": 4996 + }, + { + "epoch": 0.1, + "learning_rate": 1.8078909556910412e-07, + "loss": 0.0955, + "step": 4997 + }, + { + "epoch": 0.1, + "learning_rate": 1.8078521222476796e-07, + "loss": 0.0691, + "step": 4998 + }, + { + "epoch": 0.1, + "learning_rate": 1.8078132888043183e-07, + "loss": 0.1584, + "step": 4999 + }, + { + "epoch": 0.1, + "learning_rate": 1.8077744553609568e-07, + "loss": 0.7926, + "step": 5000 + }, + { + "epoch": 0.1, + "learning_rate": 1.8077356219175955e-07, + "loss": 0.0743, + "step": 5001 + }, + { + "epoch": 0.1, + "learning_rate": 1.807696788474234e-07, + "loss": 0.0852, + "step": 5002 + }, + { + "epoch": 0.1, + "learning_rate": 1.8076579550308727e-07, + "loss": 0.0171, + "step": 5003 + }, + { + "epoch": 0.1, + "learning_rate": 1.807619121587511e-07, + "loss": 0.4645, + "step": 5004 + }, + { + "epoch": 0.1, + "learning_rate": 1.8075802881441498e-07, + "loss": 0.027, + "step": 5005 + }, + { + "epoch": 0.1, + "learning_rate": 1.8075414547007883e-07, + "loss": 0.0606, + "step": 5006 + }, + { + "epoch": 0.1, + "learning_rate": 1.807502621257427e-07, + "loss": 0.0456, + "step": 5007 + }, + { + "epoch": 0.1, + "learning_rate": 1.8074637878140655e-07, + "loss": 0.0428, + "step": 5008 + }, + { + "epoch": 0.1, + "learning_rate": 1.807424954370704e-07, + "loss": 0.0506, + "step": 5009 + }, + { + "epoch": 0.1, + "learning_rate": 1.8073861209273424e-07, + "loss": 0.0191, + "step": 5010 + }, + { + "epoch": 0.1, + "learning_rate": 1.807347287483981e-07, + "loss": 0.0477, + "step": 5011 + }, + { + "epoch": 0.1, + "learning_rate": 1.8073084540406195e-07, + "loss": 0.0294, + "step": 5012 + }, + { + "epoch": 0.1, + "learning_rate": 1.8072696205972582e-07, + "loss": 0.1972, + "step": 5013 + }, + { + "epoch": 0.1, + "learning_rate": 1.8072307871538967e-07, + "loss": 0.0283, + "step": 5014 + }, + { + "epoch": 0.1, + "learning_rate": 1.8071919537105354e-07, + "loss": 0.3909, + "step": 5015 + }, + { + "epoch": 0.1, + "learning_rate": 1.8071531202671739e-07, + "loss": 0.0277, + "step": 5016 + }, + { + "epoch": 0.1, + "learning_rate": 1.8071142868238126e-07, + "loss": 0.0356, + "step": 5017 + }, + { + "epoch": 0.1, + "learning_rate": 1.807075453380451e-07, + "loss": 0.0864, + "step": 5018 + }, + { + "epoch": 0.1, + "learning_rate": 1.8070366199370897e-07, + "loss": 0.1243, + "step": 5019 + }, + { + "epoch": 0.1, + "learning_rate": 1.8069977864937282e-07, + "loss": 0.0222, + "step": 5020 + }, + { + "epoch": 0.1, + "learning_rate": 1.806958953050367e-07, + "loss": 0.1804, + "step": 5021 + }, + { + "epoch": 0.1, + "learning_rate": 1.8069201196070053e-07, + "loss": 0.0195, + "step": 5022 + }, + { + "epoch": 0.1, + "learning_rate": 1.806881286163644e-07, + "loss": 0.1506, + "step": 5023 + }, + { + "epoch": 0.1, + "learning_rate": 1.8068424527202825e-07, + "loss": 0.0361, + "step": 5024 + }, + { + "epoch": 0.1, + "learning_rate": 1.8068036192769212e-07, + "loss": 0.0923, + "step": 5025 + }, + { + "epoch": 0.1, + "learning_rate": 1.8067647858335597e-07, + "loss": 0.1055, + "step": 5026 + }, + { + "epoch": 0.1, + "learning_rate": 1.8067259523901984e-07, + "loss": 0.0238, + "step": 5027 + }, + { + "epoch": 0.1, + "learning_rate": 1.8066871189468368e-07, + "loss": 0.0358, + "step": 5028 + }, + { + "epoch": 0.1, + "learning_rate": 1.8066482855034756e-07, + "loss": 0.0622, + "step": 5029 + }, + { + "epoch": 0.1, + "learning_rate": 1.806609452060114e-07, + "loss": 0.0203, + "step": 5030 + }, + { + "epoch": 0.1, + "learning_rate": 1.8065706186167527e-07, + "loss": 0.0422, + "step": 5031 + }, + { + "epoch": 0.1, + "learning_rate": 1.8065317851733912e-07, + "loss": 0.1435, + "step": 5032 + }, + { + "epoch": 0.1, + "learning_rate": 1.80649295173003e-07, + "loss": 0.0405, + "step": 5033 + }, + { + "epoch": 0.1, + "learning_rate": 1.8064541182866683e-07, + "loss": 0.0343, + "step": 5034 + }, + { + "epoch": 0.1, + "learning_rate": 1.806415284843307e-07, + "loss": 0.0211, + "step": 5035 + }, + { + "epoch": 0.1, + "learning_rate": 1.8063764513999455e-07, + "loss": 0.0185, + "step": 5036 + }, + { + "epoch": 0.1, + "learning_rate": 1.8063376179565842e-07, + "loss": 0.1989, + "step": 5037 + }, + { + "epoch": 0.1, + "learning_rate": 1.8062987845132227e-07, + "loss": 0.4358, + "step": 5038 + }, + { + "epoch": 0.1, + "learning_rate": 1.8062599510698614e-07, + "loss": 0.0231, + "step": 5039 + }, + { + "epoch": 0.1, + "learning_rate": 1.8062211176264998e-07, + "loss": 0.0213, + "step": 5040 + }, + { + "epoch": 0.1, + "learning_rate": 1.8061822841831385e-07, + "loss": 0.0195, + "step": 5041 + }, + { + "epoch": 0.1, + "learning_rate": 1.806143450739777e-07, + "loss": 0.049, + "step": 5042 + }, + { + "epoch": 0.1, + "learning_rate": 1.8061046172964157e-07, + "loss": 0.0259, + "step": 5043 + }, + { + "epoch": 0.1, + "learning_rate": 1.8060657838530542e-07, + "loss": 0.0353, + "step": 5044 + }, + { + "epoch": 0.1, + "learning_rate": 1.806026950409693e-07, + "loss": 0.0631, + "step": 5045 + }, + { + "epoch": 0.1, + "learning_rate": 1.8059881169663313e-07, + "loss": 0.7874, + "step": 5046 + }, + { + "epoch": 0.1, + "learning_rate": 1.80594928352297e-07, + "loss": 0.0478, + "step": 5047 + }, + { + "epoch": 0.1, + "learning_rate": 1.8059104500796085e-07, + "loss": 0.0545, + "step": 5048 + }, + { + "epoch": 0.1, + "learning_rate": 1.8058716166362472e-07, + "loss": 0.0539, + "step": 5049 + }, + { + "epoch": 0.1, + "learning_rate": 1.8058327831928857e-07, + "loss": 0.021, + "step": 5050 + }, + { + "epoch": 0.1, + "learning_rate": 1.8057939497495244e-07, + "loss": 0.0374, + "step": 5051 + }, + { + "epoch": 0.1, + "learning_rate": 1.8057551163061628e-07, + "loss": 0.191, + "step": 5052 + }, + { + "epoch": 0.1, + "learning_rate": 1.8057162828628015e-07, + "loss": 0.1322, + "step": 5053 + }, + { + "epoch": 0.1, + "learning_rate": 1.80567744941944e-07, + "loss": 0.6503, + "step": 5054 + }, + { + "epoch": 0.1, + "learning_rate": 1.8056386159760787e-07, + "loss": 0.0239, + "step": 5055 + }, + { + "epoch": 0.1, + "learning_rate": 1.8055997825327172e-07, + "loss": 0.0298, + "step": 5056 + }, + { + "epoch": 0.1, + "learning_rate": 1.8055609490893559e-07, + "loss": 0.7633, + "step": 5057 + }, + { + "epoch": 0.1, + "learning_rate": 1.8055221156459943e-07, + "loss": 0.0506, + "step": 5058 + }, + { + "epoch": 0.1, + "learning_rate": 1.805483282202633e-07, + "loss": 0.0314, + "step": 5059 + }, + { + "epoch": 0.1, + "learning_rate": 1.8054444487592715e-07, + "loss": 0.0318, + "step": 5060 + }, + { + "epoch": 0.1, + "learning_rate": 1.8054056153159102e-07, + "loss": 0.0263, + "step": 5061 + }, + { + "epoch": 0.1, + "learning_rate": 1.8053667818725486e-07, + "loss": 0.0164, + "step": 5062 + }, + { + "epoch": 0.1, + "learning_rate": 1.8053279484291874e-07, + "loss": 0.0267, + "step": 5063 + }, + { + "epoch": 0.1, + "learning_rate": 1.8052891149858258e-07, + "loss": 0.0291, + "step": 5064 + }, + { + "epoch": 0.1, + "learning_rate": 1.8052502815424643e-07, + "loss": 0.0316, + "step": 5065 + }, + { + "epoch": 0.1, + "learning_rate": 1.805211448099103e-07, + "loss": 0.4943, + "step": 5066 + }, + { + "epoch": 0.1, + "learning_rate": 1.8051726146557414e-07, + "loss": 0.2355, + "step": 5067 + }, + { + "epoch": 0.1, + "learning_rate": 1.80513378121238e-07, + "loss": 0.0375, + "step": 5068 + }, + { + "epoch": 0.1, + "learning_rate": 1.8050949477690186e-07, + "loss": 0.0418, + "step": 5069 + }, + { + "epoch": 0.1, + "learning_rate": 1.805056114325657e-07, + "loss": 0.6076, + "step": 5070 + }, + { + "epoch": 0.1, + "learning_rate": 1.8050172808822958e-07, + "loss": 0.021, + "step": 5071 + }, + { + "epoch": 0.1, + "learning_rate": 1.8049784474389342e-07, + "loss": 0.1597, + "step": 5072 + }, + { + "epoch": 0.1, + "learning_rate": 1.804939613995573e-07, + "loss": 0.021, + "step": 5073 + }, + { + "epoch": 0.1, + "learning_rate": 1.8049007805522114e-07, + "loss": 0.0447, + "step": 5074 + }, + { + "epoch": 0.1, + "learning_rate": 1.80486194710885e-07, + "loss": 0.0468, + "step": 5075 + }, + { + "epoch": 0.1, + "learning_rate": 1.8048231136654885e-07, + "loss": 0.4501, + "step": 5076 + }, + { + "epoch": 0.1, + "learning_rate": 1.8047842802221272e-07, + "loss": 0.0272, + "step": 5077 + }, + { + "epoch": 0.1, + "learning_rate": 1.8047454467787657e-07, + "loss": 0.0257, + "step": 5078 + }, + { + "epoch": 0.1, + "learning_rate": 1.8047066133354044e-07, + "loss": 0.0209, + "step": 5079 + }, + { + "epoch": 0.1, + "learning_rate": 1.8046677798920429e-07, + "loss": 0.0451, + "step": 5080 + }, + { + "epoch": 0.1, + "learning_rate": 1.8046289464486816e-07, + "loss": 0.0425, + "step": 5081 + }, + { + "epoch": 0.1, + "learning_rate": 1.80459011300532e-07, + "loss": 0.1203, + "step": 5082 + }, + { + "epoch": 0.1, + "learning_rate": 1.8045512795619587e-07, + "loss": 0.0426, + "step": 5083 + }, + { + "epoch": 0.1, + "learning_rate": 1.8045124461185972e-07, + "loss": 0.362, + "step": 5084 + }, + { + "epoch": 0.1, + "learning_rate": 1.804473612675236e-07, + "loss": 0.0274, + "step": 5085 + }, + { + "epoch": 0.1, + "learning_rate": 1.8044347792318744e-07, + "loss": 0.3792, + "step": 5086 + }, + { + "epoch": 0.1, + "learning_rate": 1.804395945788513e-07, + "loss": 0.0239, + "step": 5087 + }, + { + "epoch": 0.1, + "learning_rate": 1.8043571123451515e-07, + "loss": 0.0202, + "step": 5088 + }, + { + "epoch": 0.1, + "learning_rate": 1.8043182789017902e-07, + "loss": 0.0192, + "step": 5089 + }, + { + "epoch": 0.1, + "learning_rate": 1.8042794454584287e-07, + "loss": 0.1226, + "step": 5090 + }, + { + "epoch": 0.1, + "learning_rate": 1.8042406120150674e-07, + "loss": 0.324, + "step": 5091 + }, + { + "epoch": 0.1, + "learning_rate": 1.8042017785717059e-07, + "loss": 0.0794, + "step": 5092 + }, + { + "epoch": 0.1, + "learning_rate": 1.8041629451283446e-07, + "loss": 0.3728, + "step": 5093 + }, + { + "epoch": 0.1, + "learning_rate": 1.804124111684983e-07, + "loss": 0.3691, + "step": 5094 + }, + { + "epoch": 0.1, + "learning_rate": 1.8040852782416215e-07, + "loss": 0.0279, + "step": 5095 + }, + { + "epoch": 0.1, + "learning_rate": 1.8040464447982602e-07, + "loss": 0.0188, + "step": 5096 + }, + { + "epoch": 0.1, + "learning_rate": 1.8040076113548986e-07, + "loss": 0.0362, + "step": 5097 + }, + { + "epoch": 0.1, + "learning_rate": 1.8039687779115373e-07, + "loss": 0.0354, + "step": 5098 + }, + { + "epoch": 0.1, + "learning_rate": 1.8039299444681758e-07, + "loss": 0.0251, + "step": 5099 + }, + { + "epoch": 0.1, + "learning_rate": 1.8038911110248145e-07, + "loss": 0.0266, + "step": 5100 + }, + { + "epoch": 0.1, + "learning_rate": 1.803852277581453e-07, + "loss": 0.7854, + "step": 5101 + }, + { + "epoch": 0.1, + "learning_rate": 1.8038134441380917e-07, + "loss": 0.1445, + "step": 5102 + }, + { + "epoch": 0.1, + "learning_rate": 1.80377461069473e-07, + "loss": 0.4072, + "step": 5103 + }, + { + "epoch": 0.1, + "learning_rate": 1.8037357772513688e-07, + "loss": 0.2887, + "step": 5104 + }, + { + "epoch": 0.1, + "learning_rate": 1.8036969438080073e-07, + "loss": 0.044, + "step": 5105 + }, + { + "epoch": 0.1, + "learning_rate": 1.803658110364646e-07, + "loss": 0.0518, + "step": 5106 + }, + { + "epoch": 0.1, + "learning_rate": 1.8036192769212845e-07, + "loss": 0.4596, + "step": 5107 + }, + { + "epoch": 0.1, + "learning_rate": 1.8035804434779232e-07, + "loss": 0.1965, + "step": 5108 + }, + { + "epoch": 0.1, + "learning_rate": 1.8035416100345616e-07, + "loss": 0.0316, + "step": 5109 + }, + { + "epoch": 0.1, + "learning_rate": 1.8035027765912003e-07, + "loss": 0.0193, + "step": 5110 + }, + { + "epoch": 0.1, + "learning_rate": 1.8034639431478388e-07, + "loss": 0.1377, + "step": 5111 + }, + { + "epoch": 0.1, + "learning_rate": 1.8034251097044775e-07, + "loss": 0.0718, + "step": 5112 + }, + { + "epoch": 0.1, + "learning_rate": 1.803386276261116e-07, + "loss": 0.0711, + "step": 5113 + }, + { + "epoch": 0.1, + "learning_rate": 1.8033474428177547e-07, + "loss": 0.0218, + "step": 5114 + }, + { + "epoch": 0.1, + "learning_rate": 1.803308609374393e-07, + "loss": 0.0215, + "step": 5115 + }, + { + "epoch": 0.1, + "learning_rate": 1.8032697759310318e-07, + "loss": 0.0491, + "step": 5116 + }, + { + "epoch": 0.1, + "learning_rate": 1.8032309424876703e-07, + "loss": 0.0167, + "step": 5117 + }, + { + "epoch": 0.1, + "learning_rate": 1.803192109044309e-07, + "loss": 0.0436, + "step": 5118 + }, + { + "epoch": 0.1, + "learning_rate": 1.8031532756009474e-07, + "loss": 0.2283, + "step": 5119 + }, + { + "epoch": 0.1, + "learning_rate": 1.8031144421575862e-07, + "loss": 0.0513, + "step": 5120 + }, + { + "epoch": 0.1, + "learning_rate": 1.8030756087142246e-07, + "loss": 0.8165, + "step": 5121 + }, + { + "epoch": 0.1, + "learning_rate": 1.8030367752708633e-07, + "loss": 0.0354, + "step": 5122 + }, + { + "epoch": 0.1, + "learning_rate": 1.8029979418275018e-07, + "loss": 0.0328, + "step": 5123 + }, + { + "epoch": 0.1, + "learning_rate": 1.8029591083841405e-07, + "loss": 0.0273, + "step": 5124 + }, + { + "epoch": 0.1, + "learning_rate": 1.8029202749407787e-07, + "loss": 0.0256, + "step": 5125 + }, + { + "epoch": 0.1, + "learning_rate": 1.8028814414974174e-07, + "loss": 0.0181, + "step": 5126 + }, + { + "epoch": 0.1, + "learning_rate": 1.8028426080540558e-07, + "loss": 0.0272, + "step": 5127 + }, + { + "epoch": 0.1, + "learning_rate": 1.8028037746106946e-07, + "loss": 0.5069, + "step": 5128 + }, + { + "epoch": 0.1, + "learning_rate": 1.802764941167333e-07, + "loss": 0.1077, + "step": 5129 + }, + { + "epoch": 0.1, + "learning_rate": 1.8027261077239717e-07, + "loss": 0.0272, + "step": 5130 + }, + { + "epoch": 0.1, + "learning_rate": 1.8026872742806102e-07, + "loss": 0.3342, + "step": 5131 + }, + { + "epoch": 0.1, + "learning_rate": 1.802648440837249e-07, + "loss": 0.0955, + "step": 5132 + }, + { + "epoch": 0.1, + "learning_rate": 1.8026096073938873e-07, + "loss": 0.0192, + "step": 5133 + }, + { + "epoch": 0.1, + "learning_rate": 1.802570773950526e-07, + "loss": 0.1167, + "step": 5134 + }, + { + "epoch": 0.1, + "learning_rate": 1.8025319405071645e-07, + "loss": 0.0187, + "step": 5135 + }, + { + "epoch": 0.1, + "learning_rate": 1.8024931070638032e-07, + "loss": 0.0584, + "step": 5136 + }, + { + "epoch": 0.1, + "learning_rate": 1.8024542736204417e-07, + "loss": 0.3543, + "step": 5137 + }, + { + "epoch": 0.1, + "learning_rate": 1.8024154401770804e-07, + "loss": 0.0573, + "step": 5138 + }, + { + "epoch": 0.1, + "learning_rate": 1.8023766067337188e-07, + "loss": 0.0255, + "step": 5139 + }, + { + "epoch": 0.1, + "learning_rate": 1.8023377732903575e-07, + "loss": 0.0256, + "step": 5140 + }, + { + "epoch": 0.1, + "learning_rate": 1.802298939846996e-07, + "loss": 0.3414, + "step": 5141 + }, + { + "epoch": 0.1, + "learning_rate": 1.8022601064036347e-07, + "loss": 0.024, + "step": 5142 + }, + { + "epoch": 0.1, + "learning_rate": 1.8022212729602732e-07, + "loss": 0.255, + "step": 5143 + }, + { + "epoch": 0.1, + "learning_rate": 1.802182439516912e-07, + "loss": 0.3907, + "step": 5144 + }, + { + "epoch": 0.1, + "learning_rate": 1.8021436060735503e-07, + "loss": 0.0253, + "step": 5145 + }, + { + "epoch": 0.1, + "learning_rate": 1.802104772630189e-07, + "loss": 0.873, + "step": 5146 + }, + { + "epoch": 0.1, + "learning_rate": 1.8020659391868275e-07, + "loss": 0.0302, + "step": 5147 + }, + { + "epoch": 0.1, + "learning_rate": 1.8020271057434662e-07, + "loss": 0.038, + "step": 5148 + }, + { + "epoch": 0.1, + "learning_rate": 1.8019882723001047e-07, + "loss": 0.2714, + "step": 5149 + }, + { + "epoch": 0.1, + "learning_rate": 1.8019494388567434e-07, + "loss": 0.0232, + "step": 5150 + }, + { + "epoch": 0.1, + "learning_rate": 1.8019106054133818e-07, + "loss": 0.018, + "step": 5151 + }, + { + "epoch": 0.1, + "learning_rate": 1.8018717719700205e-07, + "loss": 0.033, + "step": 5152 + }, + { + "epoch": 0.1, + "learning_rate": 1.801832938526659e-07, + "loss": 0.0203, + "step": 5153 + }, + { + "epoch": 0.1, + "learning_rate": 1.8017941050832977e-07, + "loss": 0.121, + "step": 5154 + }, + { + "epoch": 0.1, + "learning_rate": 1.8017552716399362e-07, + "loss": 0.0184, + "step": 5155 + }, + { + "epoch": 0.1, + "learning_rate": 1.8017164381965749e-07, + "loss": 0.0948, + "step": 5156 + }, + { + "epoch": 0.1, + "learning_rate": 1.8016776047532133e-07, + "loss": 0.0295, + "step": 5157 + }, + { + "epoch": 0.1, + "learning_rate": 1.801638771309852e-07, + "loss": 0.0351, + "step": 5158 + }, + { + "epoch": 0.1, + "learning_rate": 1.8015999378664905e-07, + "loss": 0.0225, + "step": 5159 + }, + { + "epoch": 0.1, + "learning_rate": 1.8015611044231292e-07, + "loss": 0.161, + "step": 5160 + }, + { + "epoch": 0.1, + "learning_rate": 1.8015222709797676e-07, + "loss": 0.0246, + "step": 5161 + }, + { + "epoch": 0.1, + "learning_rate": 1.8014834375364064e-07, + "loss": 0.2324, + "step": 5162 + }, + { + "epoch": 0.1, + "learning_rate": 1.8014446040930448e-07, + "loss": 0.0221, + "step": 5163 + }, + { + "epoch": 0.1, + "learning_rate": 1.8014057706496835e-07, + "loss": 0.0227, + "step": 5164 + }, + { + "epoch": 0.1, + "learning_rate": 1.801366937206322e-07, + "loss": 0.0492, + "step": 5165 + }, + { + "epoch": 0.1, + "learning_rate": 1.8013281037629607e-07, + "loss": 0.2501, + "step": 5166 + }, + { + "epoch": 0.1, + "learning_rate": 1.8012892703195991e-07, + "loss": 0.0369, + "step": 5167 + }, + { + "epoch": 0.1, + "learning_rate": 1.8012504368762379e-07, + "loss": 0.0638, + "step": 5168 + }, + { + "epoch": 0.1, + "learning_rate": 1.8012116034328763e-07, + "loss": 0.0752, + "step": 5169 + }, + { + "epoch": 0.1, + "learning_rate": 1.801172769989515e-07, + "loss": 0.02, + "step": 5170 + }, + { + "epoch": 0.1, + "learning_rate": 1.8011339365461535e-07, + "loss": 0.5362, + "step": 5171 + }, + { + "epoch": 0.1, + "learning_rate": 1.8010951031027922e-07, + "loss": 0.0709, + "step": 5172 + }, + { + "epoch": 0.1, + "learning_rate": 1.8010562696594306e-07, + "loss": 0.05, + "step": 5173 + }, + { + "epoch": 0.1, + "learning_rate": 1.8010174362160693e-07, + "loss": 0.0339, + "step": 5174 + }, + { + "epoch": 0.1, + "learning_rate": 1.8009786027727078e-07, + "loss": 0.0381, + "step": 5175 + }, + { + "epoch": 0.1, + "learning_rate": 1.8009397693293465e-07, + "loss": 0.188, + "step": 5176 + }, + { + "epoch": 0.1, + "learning_rate": 1.800900935885985e-07, + "loss": 0.0412, + "step": 5177 + }, + { + "epoch": 0.1, + "learning_rate": 1.8008621024426237e-07, + "loss": 0.4903, + "step": 5178 + }, + { + "epoch": 0.1, + "learning_rate": 1.800823268999262e-07, + "loss": 0.3447, + "step": 5179 + }, + { + "epoch": 0.1, + "learning_rate": 1.8007844355559008e-07, + "loss": 0.0657, + "step": 5180 + }, + { + "epoch": 0.1, + "learning_rate": 1.8007456021125393e-07, + "loss": 0.0307, + "step": 5181 + }, + { + "epoch": 0.1, + "learning_rate": 1.800706768669178e-07, + "loss": 0.1436, + "step": 5182 + }, + { + "epoch": 0.1, + "learning_rate": 1.8006679352258162e-07, + "loss": 0.1504, + "step": 5183 + }, + { + "epoch": 0.1, + "learning_rate": 1.800629101782455e-07, + "loss": 0.021, + "step": 5184 + }, + { + "epoch": 0.1, + "learning_rate": 1.8005902683390934e-07, + "loss": 0.0523, + "step": 5185 + }, + { + "epoch": 0.1, + "learning_rate": 1.800551434895732e-07, + "loss": 0.0466, + "step": 5186 + }, + { + "epoch": 0.1, + "learning_rate": 1.8005126014523705e-07, + "loss": 0.0239, + "step": 5187 + }, + { + "epoch": 0.1, + "learning_rate": 1.8004737680090092e-07, + "loss": 0.138, + "step": 5188 + }, + { + "epoch": 0.1, + "learning_rate": 1.8004349345656477e-07, + "loss": 0.3479, + "step": 5189 + }, + { + "epoch": 0.1, + "learning_rate": 1.8003961011222864e-07, + "loss": 0.5006, + "step": 5190 + }, + { + "epoch": 0.1, + "learning_rate": 1.8003572676789249e-07, + "loss": 0.2161, + "step": 5191 + }, + { + "epoch": 0.1, + "learning_rate": 1.8003184342355636e-07, + "loss": 0.2292, + "step": 5192 + }, + { + "epoch": 0.1, + "learning_rate": 1.800279600792202e-07, + "loss": 0.1818, + "step": 5193 + }, + { + "epoch": 0.1, + "learning_rate": 1.8002407673488407e-07, + "loss": 0.2002, + "step": 5194 + }, + { + "epoch": 0.1, + "learning_rate": 1.8002019339054792e-07, + "loss": 0.0267, + "step": 5195 + }, + { + "epoch": 0.1, + "learning_rate": 1.800163100462118e-07, + "loss": 0.6349, + "step": 5196 + }, + { + "epoch": 0.1, + "learning_rate": 1.8001242670187563e-07, + "loss": 0.0209, + "step": 5197 + }, + { + "epoch": 0.1, + "learning_rate": 1.800085433575395e-07, + "loss": 0.3774, + "step": 5198 + }, + { + "epoch": 0.1, + "learning_rate": 1.8000466001320335e-07, + "loss": 0.0314, + "step": 5199 + }, + { + "epoch": 0.1, + "learning_rate": 1.8000077666886722e-07, + "loss": 0.4237, + "step": 5200 + }, + { + "epoch": 0.1, + "learning_rate": 1.7999689332453107e-07, + "loss": 0.0319, + "step": 5201 + }, + { + "epoch": 0.1, + "learning_rate": 1.7999300998019494e-07, + "loss": 0.3069, + "step": 5202 + }, + { + "epoch": 0.1, + "learning_rate": 1.7998912663585878e-07, + "loss": 0.046, + "step": 5203 + }, + { + "epoch": 0.1, + "learning_rate": 1.7998524329152266e-07, + "loss": 0.0302, + "step": 5204 + }, + { + "epoch": 0.1, + "learning_rate": 1.799813599471865e-07, + "loss": 0.3877, + "step": 5205 + }, + { + "epoch": 0.1, + "learning_rate": 1.7997747660285037e-07, + "loss": 0.0218, + "step": 5206 + }, + { + "epoch": 0.1, + "learning_rate": 1.7997359325851422e-07, + "loss": 0.0236, + "step": 5207 + }, + { + "epoch": 0.1, + "learning_rate": 1.799697099141781e-07, + "loss": 0.0374, + "step": 5208 + }, + { + "epoch": 0.1, + "learning_rate": 1.7996582656984193e-07, + "loss": 0.0171, + "step": 5209 + }, + { + "epoch": 0.1, + "learning_rate": 1.799619432255058e-07, + "loss": 0.1218, + "step": 5210 + }, + { + "epoch": 0.1, + "learning_rate": 1.7995805988116965e-07, + "loss": 0.054, + "step": 5211 + }, + { + "epoch": 0.1, + "learning_rate": 1.7995417653683352e-07, + "loss": 0.5518, + "step": 5212 + }, + { + "epoch": 0.1, + "learning_rate": 1.7995029319249737e-07, + "loss": 0.0197, + "step": 5213 + }, + { + "epoch": 0.1, + "learning_rate": 1.7994640984816124e-07, + "loss": 0.0174, + "step": 5214 + }, + { + "epoch": 0.1, + "learning_rate": 1.7994252650382508e-07, + "loss": 0.0302, + "step": 5215 + }, + { + "epoch": 0.1, + "learning_rate": 1.7993864315948895e-07, + "loss": 0.0299, + "step": 5216 + }, + { + "epoch": 0.1, + "learning_rate": 1.799347598151528e-07, + "loss": 0.304, + "step": 5217 + }, + { + "epoch": 0.1, + "learning_rate": 1.7993087647081667e-07, + "loss": 0.0209, + "step": 5218 + }, + { + "epoch": 0.1, + "learning_rate": 1.7992699312648052e-07, + "loss": 0.1976, + "step": 5219 + }, + { + "epoch": 0.1, + "learning_rate": 1.799231097821444e-07, + "loss": 0.0155, + "step": 5220 + }, + { + "epoch": 0.1, + "learning_rate": 1.7991922643780823e-07, + "loss": 0.0417, + "step": 5221 + }, + { + "epoch": 0.1, + "learning_rate": 1.799153430934721e-07, + "loss": 0.0373, + "step": 5222 + }, + { + "epoch": 0.1, + "learning_rate": 1.7991145974913595e-07, + "loss": 0.0726, + "step": 5223 + }, + { + "epoch": 0.1, + "learning_rate": 1.7990757640479982e-07, + "loss": 0.0737, + "step": 5224 + }, + { + "epoch": 0.1, + "learning_rate": 1.7990369306046367e-07, + "loss": 0.0535, + "step": 5225 + }, + { + "epoch": 0.1, + "learning_rate": 1.7989980971612754e-07, + "loss": 0.3343, + "step": 5226 + }, + { + "epoch": 0.1, + "learning_rate": 1.7989592637179138e-07, + "loss": 0.0237, + "step": 5227 + }, + { + "epoch": 0.1, + "learning_rate": 1.7989204302745525e-07, + "loss": 0.2126, + "step": 5228 + }, + { + "epoch": 0.1, + "learning_rate": 1.798881596831191e-07, + "loss": 0.0321, + "step": 5229 + }, + { + "epoch": 0.1, + "learning_rate": 1.7988427633878297e-07, + "loss": 0.0213, + "step": 5230 + }, + { + "epoch": 0.1, + "learning_rate": 1.7988039299444682e-07, + "loss": 0.0157, + "step": 5231 + }, + { + "epoch": 0.1, + "learning_rate": 1.7987650965011069e-07, + "loss": 0.0836, + "step": 5232 + }, + { + "epoch": 0.1, + "learning_rate": 1.7987262630577453e-07, + "loss": 0.0646, + "step": 5233 + }, + { + "epoch": 0.1, + "learning_rate": 1.798687429614384e-07, + "loss": 0.0401, + "step": 5234 + }, + { + "epoch": 0.1, + "learning_rate": 1.7986485961710225e-07, + "loss": 0.1473, + "step": 5235 + }, + { + "epoch": 0.1, + "learning_rate": 1.7986097627276612e-07, + "loss": 0.0174, + "step": 5236 + }, + { + "epoch": 0.1, + "learning_rate": 1.7985709292842996e-07, + "loss": 0.142, + "step": 5237 + }, + { + "epoch": 0.1, + "learning_rate": 1.7985320958409384e-07, + "loss": 0.0217, + "step": 5238 + }, + { + "epoch": 0.1, + "learning_rate": 1.7984932623975768e-07, + "loss": 0.0447, + "step": 5239 + }, + { + "epoch": 0.1, + "learning_rate": 1.7984544289542155e-07, + "loss": 0.0201, + "step": 5240 + }, + { + "epoch": 0.1, + "learning_rate": 1.7984155955108537e-07, + "loss": 0.0161, + "step": 5241 + }, + { + "epoch": 0.1, + "learning_rate": 1.7983767620674924e-07, + "loss": 0.157, + "step": 5242 + }, + { + "epoch": 0.1, + "learning_rate": 1.798337928624131e-07, + "loss": 0.0222, + "step": 5243 + }, + { + "epoch": 0.1, + "learning_rate": 1.7982990951807696e-07, + "loss": 0.0274, + "step": 5244 + }, + { + "epoch": 0.1, + "learning_rate": 1.798260261737408e-07, + "loss": 0.0186, + "step": 5245 + }, + { + "epoch": 0.1, + "learning_rate": 1.7982214282940468e-07, + "loss": 0.0191, + "step": 5246 + }, + { + "epoch": 0.1, + "learning_rate": 1.7981825948506852e-07, + "loss": 0.0941, + "step": 5247 + }, + { + "epoch": 0.1, + "learning_rate": 1.798143761407324e-07, + "loss": 0.0238, + "step": 5248 + }, + { + "epoch": 0.1, + "learning_rate": 1.7981049279639624e-07, + "loss": 0.0247, + "step": 5249 + }, + { + "epoch": 0.1, + "learning_rate": 1.798066094520601e-07, + "loss": 0.0383, + "step": 5250 + }, + { + "epoch": 0.1, + "learning_rate": 1.7980272610772395e-07, + "loss": 0.1223, + "step": 5251 + }, + { + "epoch": 0.1, + "learning_rate": 1.7979884276338783e-07, + "loss": 0.0279, + "step": 5252 + }, + { + "epoch": 0.1, + "learning_rate": 1.7979495941905167e-07, + "loss": 0.0256, + "step": 5253 + }, + { + "epoch": 0.1, + "learning_rate": 1.7979107607471554e-07, + "loss": 0.0477, + "step": 5254 + }, + { + "epoch": 0.1, + "learning_rate": 1.7978719273037939e-07, + "loss": 0.018, + "step": 5255 + }, + { + "epoch": 0.1, + "learning_rate": 1.7978330938604326e-07, + "loss": 0.0169, + "step": 5256 + }, + { + "epoch": 0.1, + "learning_rate": 1.797794260417071e-07, + "loss": 0.0906, + "step": 5257 + }, + { + "epoch": 0.1, + "learning_rate": 1.7977554269737097e-07, + "loss": 0.0828, + "step": 5258 + }, + { + "epoch": 0.1, + "learning_rate": 1.7977165935303482e-07, + "loss": 0.3514, + "step": 5259 + }, + { + "epoch": 0.1, + "learning_rate": 1.797677760086987e-07, + "loss": 0.0676, + "step": 5260 + }, + { + "epoch": 0.1, + "learning_rate": 1.7976389266436254e-07, + "loss": 0.4148, + "step": 5261 + }, + { + "epoch": 0.1, + "learning_rate": 1.797600093200264e-07, + "loss": 0.0188, + "step": 5262 + }, + { + "epoch": 0.1, + "learning_rate": 1.7975612597569025e-07, + "loss": 0.1141, + "step": 5263 + }, + { + "epoch": 0.1, + "learning_rate": 1.7975224263135412e-07, + "loss": 0.0234, + "step": 5264 + }, + { + "epoch": 0.1, + "learning_rate": 1.7974835928701797e-07, + "loss": 0.0751, + "step": 5265 + }, + { + "epoch": 0.1, + "learning_rate": 1.7974447594268184e-07, + "loss": 0.0353, + "step": 5266 + }, + { + "epoch": 0.1, + "learning_rate": 1.7974059259834569e-07, + "loss": 0.0172, + "step": 5267 + }, + { + "epoch": 0.1, + "learning_rate": 1.7973670925400956e-07, + "loss": 0.7702, + "step": 5268 + }, + { + "epoch": 0.1, + "learning_rate": 1.797328259096734e-07, + "loss": 0.0904, + "step": 5269 + }, + { + "epoch": 0.1, + "learning_rate": 1.7972894256533727e-07, + "loss": 0.0293, + "step": 5270 + }, + { + "epoch": 0.1, + "learning_rate": 1.7972505922100112e-07, + "loss": 0.0366, + "step": 5271 + }, + { + "epoch": 0.1, + "learning_rate": 1.7972117587666496e-07, + "loss": 0.0379, + "step": 5272 + }, + { + "epoch": 0.1, + "learning_rate": 1.7971729253232883e-07, + "loss": 0.0182, + "step": 5273 + }, + { + "epoch": 0.1, + "learning_rate": 1.7971340918799268e-07, + "loss": 0.0458, + "step": 5274 + }, + { + "epoch": 0.1, + "learning_rate": 1.7970952584365655e-07, + "loss": 0.1759, + "step": 5275 + }, + { + "epoch": 0.1, + "learning_rate": 1.797056424993204e-07, + "loss": 0.0322, + "step": 5276 + }, + { + "epoch": 0.1, + "learning_rate": 1.7970175915498427e-07, + "loss": 0.1323, + "step": 5277 + }, + { + "epoch": 0.1, + "learning_rate": 1.796978758106481e-07, + "loss": 0.0278, + "step": 5278 + }, + { + "epoch": 0.1, + "learning_rate": 1.7969399246631198e-07, + "loss": 0.0176, + "step": 5279 + }, + { + "epoch": 0.1, + "learning_rate": 1.7969010912197583e-07, + "loss": 0.0548, + "step": 5280 + }, + { + "epoch": 0.1, + "learning_rate": 1.796862257776397e-07, + "loss": 0.1758, + "step": 5281 + }, + { + "epoch": 0.1, + "learning_rate": 1.7968234243330355e-07, + "loss": 0.0181, + "step": 5282 + }, + { + "epoch": 0.1, + "learning_rate": 1.7967845908896742e-07, + "loss": 0.0176, + "step": 5283 + }, + { + "epoch": 0.1, + "learning_rate": 1.7967457574463126e-07, + "loss": 0.0592, + "step": 5284 + }, + { + "epoch": 0.1, + "learning_rate": 1.7967069240029513e-07, + "loss": 0.0219, + "step": 5285 + }, + { + "epoch": 0.1, + "learning_rate": 1.7966680905595898e-07, + "loss": 0.0257, + "step": 5286 + }, + { + "epoch": 0.1, + "learning_rate": 1.7966292571162285e-07, + "loss": 0.0351, + "step": 5287 + }, + { + "epoch": 0.1, + "learning_rate": 1.796590423672867e-07, + "loss": 0.0475, + "step": 5288 + }, + { + "epoch": 0.1, + "learning_rate": 1.7965515902295057e-07, + "loss": 0.0481, + "step": 5289 + }, + { + "epoch": 0.1, + "learning_rate": 1.796512756786144e-07, + "loss": 0.1664, + "step": 5290 + }, + { + "epoch": 0.1, + "learning_rate": 1.7964739233427828e-07, + "loss": 0.0162, + "step": 5291 + }, + { + "epoch": 0.1, + "learning_rate": 1.7964350898994213e-07, + "loss": 0.0797, + "step": 5292 + }, + { + "epoch": 0.1, + "learning_rate": 1.79639625645606e-07, + "loss": 0.022, + "step": 5293 + }, + { + "epoch": 0.1, + "learning_rate": 1.7963574230126984e-07, + "loss": 0.0234, + "step": 5294 + }, + { + "epoch": 0.1, + "learning_rate": 1.7963185895693372e-07, + "loss": 0.0185, + "step": 5295 + }, + { + "epoch": 0.1, + "learning_rate": 1.7962797561259756e-07, + "loss": 0.0396, + "step": 5296 + }, + { + "epoch": 0.1, + "learning_rate": 1.7962409226826143e-07, + "loss": 0.0164, + "step": 5297 + }, + { + "epoch": 0.1, + "learning_rate": 1.7962020892392528e-07, + "loss": 0.0225, + "step": 5298 + }, + { + "epoch": 0.1, + "learning_rate": 1.7961632557958912e-07, + "loss": 0.3087, + "step": 5299 + }, + { + "epoch": 0.1, + "learning_rate": 1.79612442235253e-07, + "loss": 0.0193, + "step": 5300 + }, + { + "epoch": 0.1, + "learning_rate": 1.7960855889091684e-07, + "loss": 0.6267, + "step": 5301 + }, + { + "epoch": 0.1, + "learning_rate": 1.7960467554658068e-07, + "loss": 0.0194, + "step": 5302 + }, + { + "epoch": 0.1, + "learning_rate": 1.7960079220224456e-07, + "loss": 0.0213, + "step": 5303 + }, + { + "epoch": 0.1, + "learning_rate": 1.795969088579084e-07, + "loss": 0.3249, + "step": 5304 + }, + { + "epoch": 0.1, + "learning_rate": 1.7959302551357227e-07, + "loss": 0.026, + "step": 5305 + }, + { + "epoch": 0.1, + "learning_rate": 1.7958914216923612e-07, + "loss": 0.0156, + "step": 5306 + }, + { + "epoch": 0.1, + "learning_rate": 1.795852588249e-07, + "loss": 0.0197, + "step": 5307 + }, + { + "epoch": 0.1, + "learning_rate": 1.7958137548056383e-07, + "loss": 0.0992, + "step": 5308 + }, + { + "epoch": 0.1, + "learning_rate": 1.795774921362277e-07, + "loss": 0.3882, + "step": 5309 + }, + { + "epoch": 0.1, + "learning_rate": 1.7957360879189155e-07, + "loss": 0.0278, + "step": 5310 + }, + { + "epoch": 0.1, + "learning_rate": 1.7956972544755542e-07, + "loss": 0.1365, + "step": 5311 + }, + { + "epoch": 0.1, + "learning_rate": 1.7956584210321927e-07, + "loss": 0.0914, + "step": 5312 + }, + { + "epoch": 0.1, + "learning_rate": 1.7956195875888314e-07, + "loss": 0.102, + "step": 5313 + }, + { + "epoch": 0.1, + "learning_rate": 1.7955807541454698e-07, + "loss": 0.0386, + "step": 5314 + }, + { + "epoch": 0.1, + "learning_rate": 1.7955419207021085e-07, + "loss": 0.0287, + "step": 5315 + }, + { + "epoch": 0.1, + "learning_rate": 1.795503087258747e-07, + "loss": 0.0275, + "step": 5316 + }, + { + "epoch": 0.1, + "learning_rate": 1.7954642538153857e-07, + "loss": 0.037, + "step": 5317 + }, + { + "epoch": 0.1, + "learning_rate": 1.7954254203720242e-07, + "loss": 0.0426, + "step": 5318 + }, + { + "epoch": 0.1, + "learning_rate": 1.795386586928663e-07, + "loss": 0.0971, + "step": 5319 + }, + { + "epoch": 0.1, + "learning_rate": 1.7953477534853013e-07, + "loss": 0.2699, + "step": 5320 + }, + { + "epoch": 0.1, + "learning_rate": 1.79530892004194e-07, + "loss": 0.0183, + "step": 5321 + }, + { + "epoch": 0.1, + "learning_rate": 1.7952700865985785e-07, + "loss": 0.0163, + "step": 5322 + }, + { + "epoch": 0.1, + "learning_rate": 1.7952312531552172e-07, + "loss": 0.1643, + "step": 5323 + }, + { + "epoch": 0.1, + "learning_rate": 1.7951924197118557e-07, + "loss": 0.0176, + "step": 5324 + }, + { + "epoch": 0.1, + "learning_rate": 1.7951535862684944e-07, + "loss": 0.0147, + "step": 5325 + }, + { + "epoch": 0.1, + "learning_rate": 1.7951147528251328e-07, + "loss": 0.03, + "step": 5326 + }, + { + "epoch": 0.1, + "learning_rate": 1.7950759193817715e-07, + "loss": 0.0167, + "step": 5327 + }, + { + "epoch": 0.1, + "learning_rate": 1.79503708593841e-07, + "loss": 0.0388, + "step": 5328 + }, + { + "epoch": 0.1, + "learning_rate": 1.7949982524950487e-07, + "loss": 0.0874, + "step": 5329 + }, + { + "epoch": 0.1, + "learning_rate": 1.7949594190516872e-07, + "loss": 0.0764, + "step": 5330 + }, + { + "epoch": 0.1, + "learning_rate": 1.7949205856083259e-07, + "loss": 0.0234, + "step": 5331 + }, + { + "epoch": 0.1, + "learning_rate": 1.7948817521649643e-07, + "loss": 0.2101, + "step": 5332 + }, + { + "epoch": 0.1, + "learning_rate": 1.794842918721603e-07, + "loss": 0.0218, + "step": 5333 + }, + { + "epoch": 0.1, + "learning_rate": 1.7948040852782415e-07, + "loss": 0.0218, + "step": 5334 + }, + { + "epoch": 0.1, + "learning_rate": 1.7947652518348802e-07, + "loss": 0.0138, + "step": 5335 + }, + { + "epoch": 0.1, + "learning_rate": 1.7947264183915186e-07, + "loss": 0.0467, + "step": 5336 + }, + { + "epoch": 0.1, + "learning_rate": 1.7946875849481574e-07, + "loss": 0.1404, + "step": 5337 + }, + { + "epoch": 0.1, + "learning_rate": 1.7946487515047958e-07, + "loss": 0.0565, + "step": 5338 + }, + { + "epoch": 0.1, + "learning_rate": 1.7946099180614345e-07, + "loss": 0.0226, + "step": 5339 + }, + { + "epoch": 0.1, + "learning_rate": 1.794571084618073e-07, + "loss": 0.0278, + "step": 5340 + }, + { + "epoch": 0.1, + "learning_rate": 1.7945322511747117e-07, + "loss": 0.0767, + "step": 5341 + }, + { + "epoch": 0.1, + "learning_rate": 1.7944934177313501e-07, + "loss": 0.0184, + "step": 5342 + }, + { + "epoch": 0.1, + "learning_rate": 1.7944545842879889e-07, + "loss": 0.0515, + "step": 5343 + }, + { + "epoch": 0.1, + "learning_rate": 1.7944157508446273e-07, + "loss": 0.375, + "step": 5344 + }, + { + "epoch": 0.1, + "learning_rate": 1.794376917401266e-07, + "loss": 0.0182, + "step": 5345 + }, + { + "epoch": 0.1, + "learning_rate": 1.7943380839579045e-07, + "loss": 0.3198, + "step": 5346 + }, + { + "epoch": 0.1, + "learning_rate": 1.7942992505145432e-07, + "loss": 0.0152, + "step": 5347 + }, + { + "epoch": 0.1, + "learning_rate": 1.7942604170711816e-07, + "loss": 0.0551, + "step": 5348 + }, + { + "epoch": 0.1, + "learning_rate": 1.7942215836278204e-07, + "loss": 0.3859, + "step": 5349 + }, + { + "epoch": 0.1, + "learning_rate": 1.7941827501844588e-07, + "loss": 0.041, + "step": 5350 + }, + { + "epoch": 0.1, + "learning_rate": 1.7941439167410975e-07, + "loss": 0.1498, + "step": 5351 + }, + { + "epoch": 0.1, + "learning_rate": 1.794105083297736e-07, + "loss": 0.032, + "step": 5352 + }, + { + "epoch": 0.1, + "learning_rate": 1.7940662498543747e-07, + "loss": 0.0155, + "step": 5353 + }, + { + "epoch": 0.1, + "learning_rate": 1.794027416411013e-07, + "loss": 0.0275, + "step": 5354 + }, + { + "epoch": 0.1, + "learning_rate": 1.7939885829676518e-07, + "loss": 0.0192, + "step": 5355 + }, + { + "epoch": 0.1, + "learning_rate": 1.7939497495242903e-07, + "loss": 0.0584, + "step": 5356 + }, + { + "epoch": 0.1, + "learning_rate": 1.7939109160809287e-07, + "loss": 0.0205, + "step": 5357 + }, + { + "epoch": 0.1, + "learning_rate": 1.7938720826375672e-07, + "loss": 0.0224, + "step": 5358 + }, + { + "epoch": 0.1, + "learning_rate": 1.793833249194206e-07, + "loss": 0.0298, + "step": 5359 + }, + { + "epoch": 0.1, + "learning_rate": 1.7937944157508444e-07, + "loss": 0.3227, + "step": 5360 + }, + { + "epoch": 0.1, + "learning_rate": 1.793755582307483e-07, + "loss": 0.0142, + "step": 5361 + }, + { + "epoch": 0.1, + "learning_rate": 1.7937167488641215e-07, + "loss": 0.022, + "step": 5362 + }, + { + "epoch": 0.1, + "learning_rate": 1.7936779154207602e-07, + "loss": 0.0484, + "step": 5363 + }, + { + "epoch": 0.1, + "learning_rate": 1.7936390819773987e-07, + "loss": 0.0188, + "step": 5364 + }, + { + "epoch": 0.1, + "learning_rate": 1.7936002485340374e-07, + "loss": 0.016, + "step": 5365 + }, + { + "epoch": 0.1, + "learning_rate": 1.7935614150906759e-07, + "loss": 0.4985, + "step": 5366 + }, + { + "epoch": 0.1, + "learning_rate": 1.7935225816473146e-07, + "loss": 0.0452, + "step": 5367 + }, + { + "epoch": 0.1, + "learning_rate": 1.793483748203953e-07, + "loss": 0.3824, + "step": 5368 + }, + { + "epoch": 0.1, + "learning_rate": 1.7934449147605917e-07, + "loss": 0.0175, + "step": 5369 + }, + { + "epoch": 0.1, + "learning_rate": 1.7934060813172302e-07, + "loss": 0.016, + "step": 5370 + }, + { + "epoch": 0.1, + "learning_rate": 1.793367247873869e-07, + "loss": 0.0375, + "step": 5371 + }, + { + "epoch": 0.1, + "learning_rate": 1.7933284144305073e-07, + "loss": 0.0777, + "step": 5372 + }, + { + "epoch": 0.1, + "learning_rate": 1.793289580987146e-07, + "loss": 0.0317, + "step": 5373 + }, + { + "epoch": 0.1, + "learning_rate": 1.7932507475437845e-07, + "loss": 0.0347, + "step": 5374 + }, + { + "epoch": 0.1, + "learning_rate": 1.7932119141004232e-07, + "loss": 0.0551, + "step": 5375 + }, + { + "epoch": 0.1, + "learning_rate": 1.7931730806570617e-07, + "loss": 0.0458, + "step": 5376 + }, + { + "epoch": 0.1, + "learning_rate": 1.7931342472137004e-07, + "loss": 0.0145, + "step": 5377 + }, + { + "epoch": 0.1, + "learning_rate": 1.7930954137703388e-07, + "loss": 0.0341, + "step": 5378 + }, + { + "epoch": 0.1, + "learning_rate": 1.7930565803269776e-07, + "loss": 0.0213, + "step": 5379 + }, + { + "epoch": 0.1, + "learning_rate": 1.793017746883616e-07, + "loss": 0.2344, + "step": 5380 + }, + { + "epoch": 0.1, + "learning_rate": 1.7929789134402547e-07, + "loss": 0.095, + "step": 5381 + }, + { + "epoch": 0.1, + "learning_rate": 1.7929400799968932e-07, + "loss": 0.016, + "step": 5382 + }, + { + "epoch": 0.1, + "learning_rate": 1.792901246553532e-07, + "loss": 0.594, + "step": 5383 + }, + { + "epoch": 0.1, + "learning_rate": 1.7928624131101703e-07, + "loss": 0.0186, + "step": 5384 + }, + { + "epoch": 0.1, + "learning_rate": 1.792823579666809e-07, + "loss": 0.0204, + "step": 5385 + }, + { + "epoch": 0.1, + "learning_rate": 1.7927847462234475e-07, + "loss": 0.0205, + "step": 5386 + }, + { + "epoch": 0.1, + "learning_rate": 1.7927459127800862e-07, + "loss": 0.4315, + "step": 5387 + }, + { + "epoch": 0.1, + "learning_rate": 1.7927070793367247e-07, + "loss": 0.0204, + "step": 5388 + }, + { + "epoch": 0.1, + "learning_rate": 1.7926682458933634e-07, + "loss": 0.021, + "step": 5389 + }, + { + "epoch": 0.1, + "learning_rate": 1.7926294124500018e-07, + "loss": 0.0633, + "step": 5390 + }, + { + "epoch": 0.1, + "learning_rate": 1.7925905790066405e-07, + "loss": 0.013, + "step": 5391 + }, + { + "epoch": 0.1, + "learning_rate": 1.792551745563279e-07, + "loss": 0.0484, + "step": 5392 + }, + { + "epoch": 0.1, + "learning_rate": 1.7925129121199177e-07, + "loss": 0.0162, + "step": 5393 + }, + { + "epoch": 0.1, + "learning_rate": 1.7924740786765562e-07, + "loss": 0.0543, + "step": 5394 + }, + { + "epoch": 0.1, + "learning_rate": 1.792435245233195e-07, + "loss": 0.0258, + "step": 5395 + }, + { + "epoch": 0.1, + "learning_rate": 1.7923964117898333e-07, + "loss": 0.0205, + "step": 5396 + }, + { + "epoch": 0.1, + "learning_rate": 1.792357578346472e-07, + "loss": 0.0199, + "step": 5397 + }, + { + "epoch": 0.1, + "learning_rate": 1.7923187449031105e-07, + "loss": 0.0197, + "step": 5398 + }, + { + "epoch": 0.1, + "learning_rate": 1.7922799114597492e-07, + "loss": 0.4645, + "step": 5399 + }, + { + "epoch": 0.1, + "learning_rate": 1.7922410780163877e-07, + "loss": 0.015, + "step": 5400 + }, + { + "epoch": 0.1, + "learning_rate": 1.7922022445730264e-07, + "loss": 0.0363, + "step": 5401 + }, + { + "epoch": 0.1, + "learning_rate": 1.7921634111296648e-07, + "loss": 0.0161, + "step": 5402 + }, + { + "epoch": 0.1, + "learning_rate": 1.7921245776863035e-07, + "loss": 0.0195, + "step": 5403 + }, + { + "epoch": 0.1, + "learning_rate": 1.792085744242942e-07, + "loss": 0.0156, + "step": 5404 + }, + { + "epoch": 0.1, + "learning_rate": 1.7920469107995807e-07, + "loss": 0.0363, + "step": 5405 + }, + { + "epoch": 0.1, + "learning_rate": 1.7920080773562192e-07, + "loss": 0.0133, + "step": 5406 + }, + { + "epoch": 0.1, + "learning_rate": 1.791969243912858e-07, + "loss": 0.3531, + "step": 5407 + }, + { + "epoch": 0.1, + "learning_rate": 1.7919304104694963e-07, + "loss": 0.0468, + "step": 5408 + }, + { + "epoch": 0.1, + "learning_rate": 1.791891577026135e-07, + "loss": 0.101, + "step": 5409 + }, + { + "epoch": 0.1, + "learning_rate": 1.7918527435827735e-07, + "loss": 0.026, + "step": 5410 + }, + { + "epoch": 0.1, + "learning_rate": 1.7918139101394122e-07, + "loss": 0.0441, + "step": 5411 + }, + { + "epoch": 0.1, + "learning_rate": 1.7917750766960506e-07, + "loss": 0.0328, + "step": 5412 + }, + { + "epoch": 0.11, + "learning_rate": 1.7917362432526894e-07, + "loss": 0.0176, + "step": 5413 + }, + { + "epoch": 0.11, + "learning_rate": 1.7916974098093278e-07, + "loss": 0.0164, + "step": 5414 + }, + { + "epoch": 0.11, + "learning_rate": 1.7916585763659663e-07, + "loss": 0.3397, + "step": 5415 + }, + { + "epoch": 0.11, + "learning_rate": 1.7916197429226047e-07, + "loss": 0.0169, + "step": 5416 + }, + { + "epoch": 0.11, + "learning_rate": 1.7915809094792434e-07, + "loss": 0.0342, + "step": 5417 + }, + { + "epoch": 0.11, + "learning_rate": 1.791542076035882e-07, + "loss": 0.7437, + "step": 5418 + }, + { + "epoch": 0.11, + "learning_rate": 1.7915032425925206e-07, + "loss": 0.1073, + "step": 5419 + }, + { + "epoch": 0.11, + "learning_rate": 1.791464409149159e-07, + "loss": 0.3623, + "step": 5420 + }, + { + "epoch": 0.11, + "learning_rate": 1.7914255757057978e-07, + "loss": 0.0335, + "step": 5421 + }, + { + "epoch": 0.11, + "learning_rate": 1.7913867422624362e-07, + "loss": 0.1068, + "step": 5422 + }, + { + "epoch": 0.11, + "learning_rate": 1.791347908819075e-07, + "loss": 0.0328, + "step": 5423 + }, + { + "epoch": 0.11, + "learning_rate": 1.7913090753757134e-07, + "loss": 0.1657, + "step": 5424 + }, + { + "epoch": 0.11, + "learning_rate": 1.791270241932352e-07, + "loss": 0.3978, + "step": 5425 + }, + { + "epoch": 0.11, + "learning_rate": 1.7912314084889905e-07, + "loss": 0.075, + "step": 5426 + }, + { + "epoch": 0.11, + "learning_rate": 1.7911925750456293e-07, + "loss": 0.0164, + "step": 5427 + }, + { + "epoch": 0.11, + "learning_rate": 1.7911537416022677e-07, + "loss": 0.023, + "step": 5428 + }, + { + "epoch": 0.11, + "learning_rate": 1.7911149081589064e-07, + "loss": 0.0426, + "step": 5429 + }, + { + "epoch": 0.11, + "learning_rate": 1.7910760747155449e-07, + "loss": 0.0328, + "step": 5430 + }, + { + "epoch": 0.11, + "learning_rate": 1.7910372412721836e-07, + "loss": 0.7346, + "step": 5431 + }, + { + "epoch": 0.11, + "learning_rate": 1.790998407828822e-07, + "loss": 0.0663, + "step": 5432 + }, + { + "epoch": 0.11, + "learning_rate": 1.7909595743854607e-07, + "loss": 0.0198, + "step": 5433 + }, + { + "epoch": 0.11, + "learning_rate": 1.7909207409420992e-07, + "loss": 0.6024, + "step": 5434 + }, + { + "epoch": 0.11, + "learning_rate": 1.790881907498738e-07, + "loss": 0.0147, + "step": 5435 + }, + { + "epoch": 0.11, + "learning_rate": 1.7908430740553764e-07, + "loss": 0.0176, + "step": 5436 + }, + { + "epoch": 0.11, + "learning_rate": 1.790804240612015e-07, + "loss": 0.1921, + "step": 5437 + }, + { + "epoch": 0.11, + "learning_rate": 1.7907654071686535e-07, + "loss": 0.0193, + "step": 5438 + }, + { + "epoch": 0.11, + "learning_rate": 1.7907265737252922e-07, + "loss": 0.1323, + "step": 5439 + }, + { + "epoch": 0.11, + "learning_rate": 1.7906877402819307e-07, + "loss": 0.0198, + "step": 5440 + }, + { + "epoch": 0.11, + "learning_rate": 1.7906489068385694e-07, + "loss": 0.0304, + "step": 5441 + }, + { + "epoch": 0.11, + "learning_rate": 1.7906100733952079e-07, + "loss": 0.0695, + "step": 5442 + }, + { + "epoch": 0.11, + "learning_rate": 1.7905712399518466e-07, + "loss": 0.0185, + "step": 5443 + }, + { + "epoch": 0.11, + "learning_rate": 1.790532406508485e-07, + "loss": 0.0153, + "step": 5444 + }, + { + "epoch": 0.11, + "learning_rate": 1.7904935730651237e-07, + "loss": 0.0533, + "step": 5445 + }, + { + "epoch": 0.11, + "learning_rate": 1.7904547396217622e-07, + "loss": 0.0292, + "step": 5446 + }, + { + "epoch": 0.11, + "learning_rate": 1.790415906178401e-07, + "loss": 0.0725, + "step": 5447 + }, + { + "epoch": 0.11, + "learning_rate": 1.7903770727350394e-07, + "loss": 0.0185, + "step": 5448 + }, + { + "epoch": 0.11, + "learning_rate": 1.7903382392916778e-07, + "loss": 1.196, + "step": 5449 + }, + { + "epoch": 0.11, + "learning_rate": 1.7902994058483165e-07, + "loss": 0.0152, + "step": 5450 + }, + { + "epoch": 0.11, + "learning_rate": 1.790260572404955e-07, + "loss": 0.7651, + "step": 5451 + }, + { + "epoch": 0.11, + "learning_rate": 1.7902217389615937e-07, + "loss": 0.0231, + "step": 5452 + }, + { + "epoch": 0.11, + "learning_rate": 1.790182905518232e-07, + "loss": 0.078, + "step": 5453 + }, + { + "epoch": 0.11, + "learning_rate": 1.7901440720748708e-07, + "loss": 0.0258, + "step": 5454 + }, + { + "epoch": 0.11, + "learning_rate": 1.7901052386315093e-07, + "loss": 0.2751, + "step": 5455 + }, + { + "epoch": 0.11, + "learning_rate": 1.790066405188148e-07, + "loss": 0.0285, + "step": 5456 + }, + { + "epoch": 0.11, + "learning_rate": 1.7900275717447865e-07, + "loss": 0.1992, + "step": 5457 + }, + { + "epoch": 0.11, + "learning_rate": 1.7899887383014252e-07, + "loss": 0.076, + "step": 5458 + }, + { + "epoch": 0.11, + "learning_rate": 1.7899499048580636e-07, + "loss": 0.0174, + "step": 5459 + }, + { + "epoch": 0.11, + "learning_rate": 1.7899110714147023e-07, + "loss": 0.4666, + "step": 5460 + }, + { + "epoch": 0.11, + "learning_rate": 1.7898722379713408e-07, + "loss": 0.0154, + "step": 5461 + }, + { + "epoch": 0.11, + "learning_rate": 1.7898334045279795e-07, + "loss": 0.0165, + "step": 5462 + }, + { + "epoch": 0.11, + "learning_rate": 1.789794571084618e-07, + "loss": 0.0284, + "step": 5463 + }, + { + "epoch": 0.11, + "learning_rate": 1.7897557376412567e-07, + "loss": 0.2825, + "step": 5464 + }, + { + "epoch": 0.11, + "learning_rate": 1.789716904197895e-07, + "loss": 0.0218, + "step": 5465 + }, + { + "epoch": 0.11, + "learning_rate": 1.7896780707545338e-07, + "loss": 0.1125, + "step": 5466 + }, + { + "epoch": 0.11, + "learning_rate": 1.7896392373111723e-07, + "loss": 0.339, + "step": 5467 + }, + { + "epoch": 0.11, + "learning_rate": 1.789600403867811e-07, + "loss": 0.0463, + "step": 5468 + }, + { + "epoch": 0.11, + "learning_rate": 1.7895615704244494e-07, + "loss": 0.835, + "step": 5469 + }, + { + "epoch": 0.11, + "learning_rate": 1.7895227369810882e-07, + "loss": 0.6671, + "step": 5470 + }, + { + "epoch": 0.11, + "learning_rate": 1.7894839035377266e-07, + "loss": 0.2264, + "step": 5471 + }, + { + "epoch": 0.11, + "learning_rate": 1.7894450700943653e-07, + "loss": 0.019, + "step": 5472 + }, + { + "epoch": 0.11, + "learning_rate": 1.7894062366510038e-07, + "loss": 0.0183, + "step": 5473 + }, + { + "epoch": 0.11, + "learning_rate": 1.7893674032076422e-07, + "loss": 0.1544, + "step": 5474 + }, + { + "epoch": 0.11, + "learning_rate": 1.789328569764281e-07, + "loss": 0.2506, + "step": 5475 + }, + { + "epoch": 0.11, + "learning_rate": 1.7892897363209194e-07, + "loss": 0.017, + "step": 5476 + }, + { + "epoch": 0.11, + "learning_rate": 1.789250902877558e-07, + "loss": 0.0919, + "step": 5477 + }, + { + "epoch": 0.11, + "learning_rate": 1.7892120694341966e-07, + "loss": 0.0336, + "step": 5478 + }, + { + "epoch": 0.11, + "learning_rate": 1.789173235990835e-07, + "loss": 0.0364, + "step": 5479 + }, + { + "epoch": 0.11, + "learning_rate": 1.7891344025474737e-07, + "loss": 0.0522, + "step": 5480 + }, + { + "epoch": 0.11, + "learning_rate": 1.7890955691041122e-07, + "loss": 0.5945, + "step": 5481 + }, + { + "epoch": 0.11, + "learning_rate": 1.789056735660751e-07, + "loss": 0.022, + "step": 5482 + }, + { + "epoch": 0.11, + "learning_rate": 1.7890179022173893e-07, + "loss": 0.0703, + "step": 5483 + }, + { + "epoch": 0.11, + "learning_rate": 1.788979068774028e-07, + "loss": 0.0299, + "step": 5484 + }, + { + "epoch": 0.11, + "learning_rate": 1.7889402353306665e-07, + "loss": 0.0321, + "step": 5485 + }, + { + "epoch": 0.11, + "learning_rate": 1.7889014018873052e-07, + "loss": 0.2215, + "step": 5486 + }, + { + "epoch": 0.11, + "learning_rate": 1.7888625684439437e-07, + "loss": 0.0137, + "step": 5487 + }, + { + "epoch": 0.11, + "learning_rate": 1.7888237350005824e-07, + "loss": 0.0171, + "step": 5488 + }, + { + "epoch": 0.11, + "learning_rate": 1.7887849015572208e-07, + "loss": 0.0375, + "step": 5489 + }, + { + "epoch": 0.11, + "learning_rate": 1.7887460681138595e-07, + "loss": 0.0216, + "step": 5490 + }, + { + "epoch": 0.11, + "learning_rate": 1.788707234670498e-07, + "loss": 0.0163, + "step": 5491 + }, + { + "epoch": 0.11, + "learning_rate": 1.7886684012271367e-07, + "loss": 0.3321, + "step": 5492 + }, + { + "epoch": 0.11, + "learning_rate": 1.7886295677837752e-07, + "loss": 0.1832, + "step": 5493 + }, + { + "epoch": 0.11, + "learning_rate": 1.788590734340414e-07, + "loss": 0.0339, + "step": 5494 + }, + { + "epoch": 0.11, + "learning_rate": 1.7885519008970523e-07, + "loss": 0.0215, + "step": 5495 + }, + { + "epoch": 0.11, + "learning_rate": 1.788513067453691e-07, + "loss": 0.0188, + "step": 5496 + }, + { + "epoch": 0.11, + "learning_rate": 1.7884742340103295e-07, + "loss": 0.0212, + "step": 5497 + }, + { + "epoch": 0.11, + "learning_rate": 1.7884354005669682e-07, + "loss": 0.0239, + "step": 5498 + }, + { + "epoch": 0.11, + "learning_rate": 1.7883965671236067e-07, + "loss": 0.0249, + "step": 5499 + }, + { + "epoch": 0.11, + "learning_rate": 1.7883577336802454e-07, + "loss": 0.0231, + "step": 5500 + }, + { + "epoch": 0.11, + "learning_rate": 1.7883189002368838e-07, + "loss": 0.7853, + "step": 5501 + }, + { + "epoch": 0.11, + "learning_rate": 1.7882800667935225e-07, + "loss": 0.1707, + "step": 5502 + }, + { + "epoch": 0.11, + "learning_rate": 1.788241233350161e-07, + "loss": 0.1677, + "step": 5503 + }, + { + "epoch": 0.11, + "learning_rate": 1.7882023999067997e-07, + "loss": 0.0142, + "step": 5504 + }, + { + "epoch": 0.11, + "learning_rate": 1.7881635664634382e-07, + "loss": 0.1995, + "step": 5505 + }, + { + "epoch": 0.11, + "learning_rate": 1.788124733020077e-07, + "loss": 0.0582, + "step": 5506 + }, + { + "epoch": 0.11, + "learning_rate": 1.7880858995767153e-07, + "loss": 0.5881, + "step": 5507 + }, + { + "epoch": 0.11, + "learning_rate": 1.788047066133354e-07, + "loss": 0.0398, + "step": 5508 + }, + { + "epoch": 0.11, + "learning_rate": 1.7880082326899925e-07, + "loss": 0.291, + "step": 5509 + }, + { + "epoch": 0.11, + "learning_rate": 1.7879693992466312e-07, + "loss": 0.1993, + "step": 5510 + }, + { + "epoch": 0.11, + "learning_rate": 1.7879305658032696e-07, + "loss": 0.016, + "step": 5511 + }, + { + "epoch": 0.11, + "learning_rate": 1.7878917323599084e-07, + "loss": 0.2459, + "step": 5512 + }, + { + "epoch": 0.11, + "learning_rate": 1.7878528989165468e-07, + "loss": 0.3861, + "step": 5513 + }, + { + "epoch": 0.11, + "learning_rate": 1.7878140654731855e-07, + "loss": 0.0296, + "step": 5514 + }, + { + "epoch": 0.11, + "learning_rate": 1.787775232029824e-07, + "loss": 0.2693, + "step": 5515 + }, + { + "epoch": 0.11, + "learning_rate": 1.7877363985864627e-07, + "loss": 0.0239, + "step": 5516 + }, + { + "epoch": 0.11, + "learning_rate": 1.7876975651431011e-07, + "loss": 0.0231, + "step": 5517 + }, + { + "epoch": 0.11, + "learning_rate": 1.7876587316997399e-07, + "loss": 0.1487, + "step": 5518 + }, + { + "epoch": 0.11, + "learning_rate": 1.7876198982563783e-07, + "loss": 0.8637, + "step": 5519 + }, + { + "epoch": 0.11, + "learning_rate": 1.787581064813017e-07, + "loss": 0.2356, + "step": 5520 + }, + { + "epoch": 0.11, + "learning_rate": 1.7875422313696555e-07, + "loss": 0.0279, + "step": 5521 + }, + { + "epoch": 0.11, + "learning_rate": 1.7875033979262942e-07, + "loss": 0.0847, + "step": 5522 + }, + { + "epoch": 0.11, + "learning_rate": 1.7874645644829326e-07, + "loss": 0.0185, + "step": 5523 + }, + { + "epoch": 0.11, + "learning_rate": 1.7874257310395714e-07, + "loss": 0.0185, + "step": 5524 + }, + { + "epoch": 0.11, + "learning_rate": 1.7873868975962098e-07, + "loss": 0.0284, + "step": 5525 + }, + { + "epoch": 0.11, + "learning_rate": 1.7873480641528485e-07, + "loss": 0.0313, + "step": 5526 + }, + { + "epoch": 0.11, + "learning_rate": 1.787309230709487e-07, + "loss": 0.0191, + "step": 5527 + }, + { + "epoch": 0.11, + "learning_rate": 1.7872703972661257e-07, + "loss": 0.0219, + "step": 5528 + }, + { + "epoch": 0.11, + "learning_rate": 1.787231563822764e-07, + "loss": 0.0155, + "step": 5529 + }, + { + "epoch": 0.11, + "learning_rate": 1.7871927303794028e-07, + "loss": 0.0145, + "step": 5530 + }, + { + "epoch": 0.11, + "learning_rate": 1.787153896936041e-07, + "loss": 0.081, + "step": 5531 + }, + { + "epoch": 0.11, + "learning_rate": 1.7871150634926797e-07, + "loss": 0.0946, + "step": 5532 + }, + { + "epoch": 0.11, + "learning_rate": 1.7870762300493182e-07, + "loss": 0.0683, + "step": 5533 + }, + { + "epoch": 0.11, + "learning_rate": 1.787037396605957e-07, + "loss": 0.2586, + "step": 5534 + }, + { + "epoch": 0.11, + "learning_rate": 1.7869985631625954e-07, + "loss": 0.0215, + "step": 5535 + }, + { + "epoch": 0.11, + "learning_rate": 1.786959729719234e-07, + "loss": 0.3631, + "step": 5536 + }, + { + "epoch": 0.11, + "learning_rate": 1.7869208962758725e-07, + "loss": 0.1091, + "step": 5537 + }, + { + "epoch": 0.11, + "learning_rate": 1.7868820628325112e-07, + "loss": 0.0161, + "step": 5538 + }, + { + "epoch": 0.11, + "learning_rate": 1.7868432293891497e-07, + "loss": 0.0204, + "step": 5539 + }, + { + "epoch": 0.11, + "learning_rate": 1.7868043959457884e-07, + "loss": 0.0235, + "step": 5540 + }, + { + "epoch": 0.11, + "learning_rate": 1.7867655625024269e-07, + "loss": 0.0131, + "step": 5541 + }, + { + "epoch": 0.11, + "learning_rate": 1.7867267290590656e-07, + "loss": 0.0607, + "step": 5542 + }, + { + "epoch": 0.11, + "learning_rate": 1.786687895615704e-07, + "loss": 0.0258, + "step": 5543 + }, + { + "epoch": 0.11, + "learning_rate": 1.7866490621723427e-07, + "loss": 0.0263, + "step": 5544 + }, + { + "epoch": 0.11, + "learning_rate": 1.7866102287289812e-07, + "loss": 0.0569, + "step": 5545 + }, + { + "epoch": 0.11, + "learning_rate": 1.78657139528562e-07, + "loss": 0.024, + "step": 5546 + }, + { + "epoch": 0.11, + "learning_rate": 1.7865325618422584e-07, + "loss": 0.014, + "step": 5547 + }, + { + "epoch": 0.11, + "learning_rate": 1.786493728398897e-07, + "loss": 0.0954, + "step": 5548 + }, + { + "epoch": 0.11, + "learning_rate": 1.7864548949555355e-07, + "loss": 0.0412, + "step": 5549 + }, + { + "epoch": 0.11, + "learning_rate": 1.7864160615121742e-07, + "loss": 0.0141, + "step": 5550 + }, + { + "epoch": 0.11, + "learning_rate": 1.7863772280688127e-07, + "loss": 0.0506, + "step": 5551 + }, + { + "epoch": 0.11, + "learning_rate": 1.7863383946254514e-07, + "loss": 0.02, + "step": 5552 + }, + { + "epoch": 0.11, + "learning_rate": 1.7862995611820898e-07, + "loss": 0.0121, + "step": 5553 + }, + { + "epoch": 0.11, + "learning_rate": 1.7862607277387286e-07, + "loss": 0.0285, + "step": 5554 + }, + { + "epoch": 0.11, + "learning_rate": 1.786221894295367e-07, + "loss": 0.0288, + "step": 5555 + }, + { + "epoch": 0.11, + "learning_rate": 1.7861830608520057e-07, + "loss": 0.2527, + "step": 5556 + }, + { + "epoch": 0.11, + "learning_rate": 1.7861442274086442e-07, + "loss": 0.3053, + "step": 5557 + }, + { + "epoch": 0.11, + "learning_rate": 1.786105393965283e-07, + "loss": 0.0411, + "step": 5558 + }, + { + "epoch": 0.11, + "learning_rate": 1.7860665605219213e-07, + "loss": 0.2078, + "step": 5559 + }, + { + "epoch": 0.11, + "learning_rate": 1.78602772707856e-07, + "loss": 0.0622, + "step": 5560 + }, + { + "epoch": 0.11, + "learning_rate": 1.7859888936351985e-07, + "loss": 0.0345, + "step": 5561 + }, + { + "epoch": 0.11, + "learning_rate": 1.7859500601918372e-07, + "loss": 0.0188, + "step": 5562 + }, + { + "epoch": 0.11, + "learning_rate": 1.7859112267484757e-07, + "loss": 0.0223, + "step": 5563 + }, + { + "epoch": 0.11, + "learning_rate": 1.7858723933051144e-07, + "loss": 0.6294, + "step": 5564 + }, + { + "epoch": 0.11, + "learning_rate": 1.7858335598617528e-07, + "loss": 0.0467, + "step": 5565 + }, + { + "epoch": 0.11, + "learning_rate": 1.7857947264183915e-07, + "loss": 0.6662, + "step": 5566 + }, + { + "epoch": 0.11, + "learning_rate": 1.78575589297503e-07, + "loss": 0.0196, + "step": 5567 + }, + { + "epoch": 0.11, + "learning_rate": 1.7857170595316687e-07, + "loss": 0.0701, + "step": 5568 + }, + { + "epoch": 0.11, + "learning_rate": 1.7856782260883072e-07, + "loss": 0.0187, + "step": 5569 + }, + { + "epoch": 0.11, + "learning_rate": 1.785639392644946e-07, + "loss": 0.0297, + "step": 5570 + }, + { + "epoch": 0.11, + "learning_rate": 1.7856005592015843e-07, + "loss": 0.6277, + "step": 5571 + }, + { + "epoch": 0.11, + "learning_rate": 1.785561725758223e-07, + "loss": 0.035, + "step": 5572 + }, + { + "epoch": 0.11, + "learning_rate": 1.7855228923148615e-07, + "loss": 0.1271, + "step": 5573 + }, + { + "epoch": 0.11, + "learning_rate": 1.7854840588715002e-07, + "loss": 0.0143, + "step": 5574 + }, + { + "epoch": 0.11, + "learning_rate": 1.7854452254281387e-07, + "loss": 0.0178, + "step": 5575 + }, + { + "epoch": 0.11, + "learning_rate": 1.7854063919847774e-07, + "loss": 0.0511, + "step": 5576 + }, + { + "epoch": 0.11, + "learning_rate": 1.7853675585414158e-07, + "loss": 0.0138, + "step": 5577 + }, + { + "epoch": 0.11, + "learning_rate": 1.7853287250980545e-07, + "loss": 0.1323, + "step": 5578 + }, + { + "epoch": 0.11, + "learning_rate": 1.785289891654693e-07, + "loss": 0.0162, + "step": 5579 + }, + { + "epoch": 0.11, + "learning_rate": 1.7852510582113317e-07, + "loss": 0.4473, + "step": 5580 + }, + { + "epoch": 0.11, + "learning_rate": 1.7852122247679702e-07, + "loss": 0.0541, + "step": 5581 + }, + { + "epoch": 0.11, + "learning_rate": 1.785173391324609e-07, + "loss": 0.0486, + "step": 5582 + }, + { + "epoch": 0.11, + "learning_rate": 1.7851345578812473e-07, + "loss": 0.2538, + "step": 5583 + }, + { + "epoch": 0.11, + "learning_rate": 1.785095724437886e-07, + "loss": 0.7385, + "step": 5584 + }, + { + "epoch": 0.11, + "learning_rate": 1.7850568909945245e-07, + "loss": 0.0249, + "step": 5585 + }, + { + "epoch": 0.11, + "learning_rate": 1.7850180575511632e-07, + "loss": 0.0856, + "step": 5586 + }, + { + "epoch": 0.11, + "learning_rate": 1.7849792241078016e-07, + "loss": 0.014, + "step": 5587 + }, + { + "epoch": 0.11, + "learning_rate": 1.7849403906644404e-07, + "loss": 0.014, + "step": 5588 + }, + { + "epoch": 0.11, + "learning_rate": 1.7849015572210785e-07, + "loss": 0.0222, + "step": 5589 + }, + { + "epoch": 0.11, + "learning_rate": 1.7848627237777173e-07, + "loss": 0.1134, + "step": 5590 + }, + { + "epoch": 0.11, + "learning_rate": 1.7848238903343557e-07, + "loss": 0.0161, + "step": 5591 + }, + { + "epoch": 0.11, + "learning_rate": 1.7847850568909944e-07, + "loss": 0.0625, + "step": 5592 + }, + { + "epoch": 0.11, + "learning_rate": 1.784746223447633e-07, + "loss": 0.0133, + "step": 5593 + }, + { + "epoch": 0.11, + "learning_rate": 1.7847073900042716e-07, + "loss": 0.016, + "step": 5594 + }, + { + "epoch": 0.11, + "learning_rate": 1.78466855656091e-07, + "loss": 0.1105, + "step": 5595 + }, + { + "epoch": 0.11, + "learning_rate": 1.7846297231175488e-07, + "loss": 0.021, + "step": 5596 + }, + { + "epoch": 0.11, + "learning_rate": 1.7845908896741872e-07, + "loss": 0.0238, + "step": 5597 + }, + { + "epoch": 0.11, + "learning_rate": 1.784552056230826e-07, + "loss": 0.0395, + "step": 5598 + }, + { + "epoch": 0.11, + "learning_rate": 1.7845132227874644e-07, + "loss": 0.0135, + "step": 5599 + }, + { + "epoch": 0.11, + "learning_rate": 1.784474389344103e-07, + "loss": 0.0165, + "step": 5600 + }, + { + "epoch": 0.11, + "learning_rate": 1.7844355559007415e-07, + "loss": 0.0321, + "step": 5601 + }, + { + "epoch": 0.11, + "learning_rate": 1.7843967224573803e-07, + "loss": 0.0129, + "step": 5602 + }, + { + "epoch": 0.11, + "learning_rate": 1.7843578890140187e-07, + "loss": 0.0129, + "step": 5603 + }, + { + "epoch": 0.11, + "learning_rate": 1.7843190555706574e-07, + "loss": 0.0912, + "step": 5604 + }, + { + "epoch": 0.11, + "learning_rate": 1.784280222127296e-07, + "loss": 0.598, + "step": 5605 + }, + { + "epoch": 0.11, + "learning_rate": 1.7842413886839346e-07, + "loss": 0.014, + "step": 5606 + }, + { + "epoch": 0.11, + "learning_rate": 1.784202555240573e-07, + "loss": 0.0209, + "step": 5607 + }, + { + "epoch": 0.11, + "learning_rate": 1.7841637217972117e-07, + "loss": 0.0275, + "step": 5608 + }, + { + "epoch": 0.11, + "learning_rate": 1.7841248883538502e-07, + "loss": 0.5172, + "step": 5609 + }, + { + "epoch": 0.11, + "learning_rate": 1.784086054910489e-07, + "loss": 0.0341, + "step": 5610 + }, + { + "epoch": 0.11, + "learning_rate": 1.7840472214671274e-07, + "loss": 0.6981, + "step": 5611 + }, + { + "epoch": 0.11, + "learning_rate": 1.784008388023766e-07, + "loss": 0.0167, + "step": 5612 + }, + { + "epoch": 0.11, + "learning_rate": 1.7839695545804045e-07, + "loss": 0.1112, + "step": 5613 + }, + { + "epoch": 0.11, + "learning_rate": 1.7839307211370432e-07, + "loss": 0.0173, + "step": 5614 + }, + { + "epoch": 0.11, + "learning_rate": 1.7838918876936817e-07, + "loss": 0.0163, + "step": 5615 + }, + { + "epoch": 0.11, + "learning_rate": 1.7838530542503204e-07, + "loss": 0.0451, + "step": 5616 + }, + { + "epoch": 0.11, + "learning_rate": 1.7838142208069589e-07, + "loss": 0.0826, + "step": 5617 + }, + { + "epoch": 0.11, + "learning_rate": 1.7837753873635976e-07, + "loss": 0.014, + "step": 5618 + }, + { + "epoch": 0.11, + "learning_rate": 1.783736553920236e-07, + "loss": 0.4234, + "step": 5619 + }, + { + "epoch": 0.11, + "learning_rate": 1.7836977204768747e-07, + "loss": 0.0129, + "step": 5620 + }, + { + "epoch": 0.11, + "learning_rate": 1.7836588870335132e-07, + "loss": 0.0317, + "step": 5621 + }, + { + "epoch": 0.11, + "learning_rate": 1.783620053590152e-07, + "loss": 0.2346, + "step": 5622 + }, + { + "epoch": 0.11, + "learning_rate": 1.7835812201467904e-07, + "loss": 0.0145, + "step": 5623 + }, + { + "epoch": 0.11, + "learning_rate": 1.783542386703429e-07, + "loss": 0.0196, + "step": 5624 + }, + { + "epoch": 0.11, + "learning_rate": 1.7835035532600675e-07, + "loss": 0.1729, + "step": 5625 + }, + { + "epoch": 0.11, + "learning_rate": 1.783464719816706e-07, + "loss": 0.0194, + "step": 5626 + }, + { + "epoch": 0.11, + "learning_rate": 1.7834258863733447e-07, + "loss": 0.0727, + "step": 5627 + }, + { + "epoch": 0.11, + "learning_rate": 1.783387052929983e-07, + "loss": 0.0137, + "step": 5628 + }, + { + "epoch": 0.11, + "learning_rate": 1.7833482194866218e-07, + "loss": 0.013, + "step": 5629 + }, + { + "epoch": 0.11, + "learning_rate": 1.7833093860432603e-07, + "loss": 0.0199, + "step": 5630 + }, + { + "epoch": 0.11, + "learning_rate": 1.783270552599899e-07, + "loss": 0.4102, + "step": 5631 + }, + { + "epoch": 0.11, + "learning_rate": 1.7832317191565375e-07, + "loss": 0.0494, + "step": 5632 + }, + { + "epoch": 0.11, + "learning_rate": 1.7831928857131762e-07, + "loss": 0.9695, + "step": 5633 + }, + { + "epoch": 0.11, + "learning_rate": 1.7831540522698146e-07, + "loss": 0.0819, + "step": 5634 + }, + { + "epoch": 0.11, + "learning_rate": 1.7831152188264533e-07, + "loss": 0.0452, + "step": 5635 + }, + { + "epoch": 0.11, + "learning_rate": 1.7830763853830918e-07, + "loss": 0.0576, + "step": 5636 + }, + { + "epoch": 0.11, + "learning_rate": 1.7830375519397305e-07, + "loss": 0.0451, + "step": 5637 + }, + { + "epoch": 0.11, + "learning_rate": 1.782998718496369e-07, + "loss": 0.0174, + "step": 5638 + }, + { + "epoch": 0.11, + "learning_rate": 1.7829598850530077e-07, + "loss": 0.0168, + "step": 5639 + }, + { + "epoch": 0.11, + "learning_rate": 1.782921051609646e-07, + "loss": 0.0337, + "step": 5640 + }, + { + "epoch": 0.11, + "learning_rate": 1.7828822181662848e-07, + "loss": 0.0219, + "step": 5641 + }, + { + "epoch": 0.11, + "learning_rate": 1.7828433847229233e-07, + "loss": 0.0178, + "step": 5642 + }, + { + "epoch": 0.11, + "learning_rate": 1.782804551279562e-07, + "loss": 0.0433, + "step": 5643 + }, + { + "epoch": 0.11, + "learning_rate": 1.7827657178362005e-07, + "loss": 0.2664, + "step": 5644 + }, + { + "epoch": 0.11, + "learning_rate": 1.7827268843928392e-07, + "loss": 0.0414, + "step": 5645 + }, + { + "epoch": 0.11, + "learning_rate": 1.7826880509494776e-07, + "loss": 0.0158, + "step": 5646 + }, + { + "epoch": 0.11, + "learning_rate": 1.782649217506116e-07, + "loss": 0.0138, + "step": 5647 + }, + { + "epoch": 0.11, + "learning_rate": 1.7826103840627548e-07, + "loss": 0.4269, + "step": 5648 + }, + { + "epoch": 0.11, + "learning_rate": 1.7825715506193932e-07, + "loss": 0.0155, + "step": 5649 + }, + { + "epoch": 0.11, + "learning_rate": 1.782532717176032e-07, + "loss": 0.024, + "step": 5650 + }, + { + "epoch": 0.11, + "learning_rate": 1.7824938837326704e-07, + "loss": 0.0161, + "step": 5651 + }, + { + "epoch": 0.11, + "learning_rate": 1.782455050289309e-07, + "loss": 0.0147, + "step": 5652 + }, + { + "epoch": 0.11, + "learning_rate": 1.7824162168459476e-07, + "loss": 0.3282, + "step": 5653 + }, + { + "epoch": 0.11, + "learning_rate": 1.7823773834025863e-07, + "loss": 0.0229, + "step": 5654 + }, + { + "epoch": 0.11, + "learning_rate": 1.7823385499592247e-07, + "loss": 0.0173, + "step": 5655 + }, + { + "epoch": 0.11, + "learning_rate": 1.7822997165158632e-07, + "loss": 0.018, + "step": 5656 + }, + { + "epoch": 0.11, + "learning_rate": 1.782260883072502e-07, + "loss": 0.0402, + "step": 5657 + }, + { + "epoch": 0.11, + "learning_rate": 1.7822220496291403e-07, + "loss": 0.0221, + "step": 5658 + }, + { + "epoch": 0.11, + "learning_rate": 1.782183216185779e-07, + "loss": 0.1076, + "step": 5659 + }, + { + "epoch": 0.11, + "learning_rate": 1.7821443827424175e-07, + "loss": 0.3347, + "step": 5660 + }, + { + "epoch": 0.11, + "learning_rate": 1.7821055492990562e-07, + "loss": 0.0186, + "step": 5661 + }, + { + "epoch": 0.11, + "learning_rate": 1.7820667158556947e-07, + "loss": 0.0221, + "step": 5662 + }, + { + "epoch": 0.11, + "learning_rate": 1.7820278824123334e-07, + "loss": 0.5257, + "step": 5663 + }, + { + "epoch": 0.11, + "learning_rate": 1.7819890489689718e-07, + "loss": 0.2963, + "step": 5664 + }, + { + "epoch": 0.11, + "learning_rate": 1.7819502155256106e-07, + "loss": 0.0234, + "step": 5665 + }, + { + "epoch": 0.11, + "learning_rate": 1.781911382082249e-07, + "loss": 0.292, + "step": 5666 + }, + { + "epoch": 0.11, + "learning_rate": 1.7818725486388877e-07, + "loss": 0.3233, + "step": 5667 + }, + { + "epoch": 0.11, + "learning_rate": 1.7818337151955262e-07, + "loss": 0.2135, + "step": 5668 + }, + { + "epoch": 0.11, + "learning_rate": 1.781794881752165e-07, + "loss": 0.0414, + "step": 5669 + }, + { + "epoch": 0.11, + "learning_rate": 1.7817560483088033e-07, + "loss": 0.1675, + "step": 5670 + }, + { + "epoch": 0.11, + "learning_rate": 1.781717214865442e-07, + "loss": 0.0175, + "step": 5671 + }, + { + "epoch": 0.11, + "learning_rate": 1.7816783814220805e-07, + "loss": 0.7262, + "step": 5672 + }, + { + "epoch": 0.11, + "learning_rate": 1.7816395479787192e-07, + "loss": 0.456, + "step": 5673 + }, + { + "epoch": 0.11, + "learning_rate": 1.7816007145353577e-07, + "loss": 0.027, + "step": 5674 + }, + { + "epoch": 0.11, + "learning_rate": 1.7815618810919964e-07, + "loss": 0.6224, + "step": 5675 + }, + { + "epoch": 0.11, + "learning_rate": 1.7815230476486348e-07, + "loss": 0.0403, + "step": 5676 + }, + { + "epoch": 0.11, + "learning_rate": 1.7814842142052735e-07, + "loss": 0.0197, + "step": 5677 + }, + { + "epoch": 0.11, + "learning_rate": 1.781445380761912e-07, + "loss": 0.0373, + "step": 5678 + }, + { + "epoch": 0.11, + "learning_rate": 1.7814065473185507e-07, + "loss": 0.0116, + "step": 5679 + }, + { + "epoch": 0.11, + "learning_rate": 1.7813677138751892e-07, + "loss": 0.027, + "step": 5680 + }, + { + "epoch": 0.11, + "learning_rate": 1.781328880431828e-07, + "loss": 0.0381, + "step": 5681 + }, + { + "epoch": 0.11, + "learning_rate": 1.7812900469884663e-07, + "loss": 0.0217, + "step": 5682 + }, + { + "epoch": 0.11, + "learning_rate": 1.781251213545105e-07, + "loss": 0.1511, + "step": 5683 + }, + { + "epoch": 0.11, + "learning_rate": 1.7812123801017435e-07, + "loss": 0.0139, + "step": 5684 + }, + { + "epoch": 0.11, + "learning_rate": 1.7811735466583822e-07, + "loss": 0.0787, + "step": 5685 + }, + { + "epoch": 0.11, + "learning_rate": 1.7811347132150206e-07, + "loss": 0.0207, + "step": 5686 + }, + { + "epoch": 0.11, + "learning_rate": 1.7810958797716594e-07, + "loss": 0.0226, + "step": 5687 + }, + { + "epoch": 0.11, + "learning_rate": 1.7810570463282978e-07, + "loss": 0.0316, + "step": 5688 + }, + { + "epoch": 0.11, + "learning_rate": 1.7810182128849365e-07, + "loss": 0.4381, + "step": 5689 + }, + { + "epoch": 0.11, + "learning_rate": 1.780979379441575e-07, + "loss": 0.0222, + "step": 5690 + }, + { + "epoch": 0.11, + "learning_rate": 1.7809405459982137e-07, + "loss": 0.0142, + "step": 5691 + }, + { + "epoch": 0.11, + "learning_rate": 1.7809017125548521e-07, + "loss": 0.0243, + "step": 5692 + }, + { + "epoch": 0.11, + "learning_rate": 1.7808628791114909e-07, + "loss": 0.0184, + "step": 5693 + }, + { + "epoch": 0.11, + "learning_rate": 1.7808240456681293e-07, + "loss": 0.032, + "step": 5694 + }, + { + "epoch": 0.11, + "learning_rate": 1.780785212224768e-07, + "loss": 0.0183, + "step": 5695 + }, + { + "epoch": 0.11, + "learning_rate": 1.7807463787814065e-07, + "loss": 0.0123, + "step": 5696 + }, + { + "epoch": 0.11, + "learning_rate": 1.7807075453380452e-07, + "loss": 0.0389, + "step": 5697 + }, + { + "epoch": 0.11, + "learning_rate": 1.7806687118946836e-07, + "loss": 0.0476, + "step": 5698 + }, + { + "epoch": 0.11, + "learning_rate": 1.7806298784513224e-07, + "loss": 0.584, + "step": 5699 + }, + { + "epoch": 0.11, + "learning_rate": 1.7805910450079608e-07, + "loss": 0.0179, + "step": 5700 + }, + { + "epoch": 0.11, + "learning_rate": 1.7805522115645995e-07, + "loss": 0.0235, + "step": 5701 + }, + { + "epoch": 0.11, + "learning_rate": 1.780513378121238e-07, + "loss": 0.0167, + "step": 5702 + }, + { + "epoch": 0.11, + "learning_rate": 1.7804745446778767e-07, + "loss": 0.0761, + "step": 5703 + }, + { + "epoch": 0.11, + "learning_rate": 1.7804357112345151e-07, + "loss": 0.015, + "step": 5704 + }, + { + "epoch": 0.11, + "learning_rate": 1.7803968777911536e-07, + "loss": 0.0287, + "step": 5705 + }, + { + "epoch": 0.11, + "learning_rate": 1.780358044347792e-07, + "loss": 0.0221, + "step": 5706 + }, + { + "epoch": 0.11, + "learning_rate": 1.7803192109044307e-07, + "loss": 0.0769, + "step": 5707 + }, + { + "epoch": 0.11, + "learning_rate": 1.7802803774610692e-07, + "loss": 0.0837, + "step": 5708 + }, + { + "epoch": 0.11, + "learning_rate": 1.780241544017708e-07, + "loss": 0.0148, + "step": 5709 + }, + { + "epoch": 0.11, + "learning_rate": 1.7802027105743464e-07, + "loss": 0.0884, + "step": 5710 + }, + { + "epoch": 0.11, + "learning_rate": 1.780163877130985e-07, + "loss": 0.0205, + "step": 5711 + }, + { + "epoch": 0.11, + "learning_rate": 1.7801250436876235e-07, + "loss": 0.0123, + "step": 5712 + }, + { + "epoch": 0.11, + "learning_rate": 1.7800862102442622e-07, + "loss": 0.0152, + "step": 5713 + }, + { + "epoch": 0.11, + "learning_rate": 1.7800473768009007e-07, + "loss": 0.014, + "step": 5714 + }, + { + "epoch": 0.11, + "learning_rate": 1.7800085433575394e-07, + "loss": 0.0234, + "step": 5715 + }, + { + "epoch": 0.11, + "learning_rate": 1.7799697099141779e-07, + "loss": 0.0396, + "step": 5716 + }, + { + "epoch": 0.11, + "learning_rate": 1.7799308764708166e-07, + "loss": 0.0627, + "step": 5717 + }, + { + "epoch": 0.11, + "learning_rate": 1.779892043027455e-07, + "loss": 0.0205, + "step": 5718 + }, + { + "epoch": 0.11, + "learning_rate": 1.7798532095840937e-07, + "loss": 0.0147, + "step": 5719 + }, + { + "epoch": 0.11, + "learning_rate": 1.7798143761407322e-07, + "loss": 0.0204, + "step": 5720 + }, + { + "epoch": 0.11, + "learning_rate": 1.779775542697371e-07, + "loss": 0.0113, + "step": 5721 + }, + { + "epoch": 0.11, + "learning_rate": 1.7797367092540094e-07, + "loss": 0.0147, + "step": 5722 + }, + { + "epoch": 0.11, + "learning_rate": 1.779697875810648e-07, + "loss": 0.159, + "step": 5723 + }, + { + "epoch": 0.11, + "learning_rate": 1.7796590423672865e-07, + "loss": 0.0211, + "step": 5724 + }, + { + "epoch": 0.11, + "learning_rate": 1.7796202089239252e-07, + "loss": 0.0552, + "step": 5725 + }, + { + "epoch": 0.11, + "learning_rate": 1.7795813754805637e-07, + "loss": 0.0158, + "step": 5726 + }, + { + "epoch": 0.11, + "learning_rate": 1.7795425420372024e-07, + "loss": 0.0688, + "step": 5727 + }, + { + "epoch": 0.11, + "learning_rate": 1.7795037085938408e-07, + "loss": 0.0174, + "step": 5728 + }, + { + "epoch": 0.11, + "learning_rate": 1.7794648751504796e-07, + "loss": 0.0895, + "step": 5729 + }, + { + "epoch": 0.11, + "learning_rate": 1.779426041707118e-07, + "loss": 0.0257, + "step": 5730 + }, + { + "epoch": 0.11, + "learning_rate": 1.7793872082637567e-07, + "loss": 0.0383, + "step": 5731 + }, + { + "epoch": 0.11, + "learning_rate": 1.7793483748203952e-07, + "loss": 0.2916, + "step": 5732 + }, + { + "epoch": 0.11, + "learning_rate": 1.779309541377034e-07, + "loss": 0.0229, + "step": 5733 + }, + { + "epoch": 0.11, + "learning_rate": 1.7792707079336723e-07, + "loss": 0.0293, + "step": 5734 + }, + { + "epoch": 0.11, + "learning_rate": 1.779231874490311e-07, + "loss": 0.0708, + "step": 5735 + }, + { + "epoch": 0.11, + "learning_rate": 1.7791930410469495e-07, + "loss": 0.2832, + "step": 5736 + }, + { + "epoch": 0.11, + "learning_rate": 1.7791542076035882e-07, + "loss": 0.0198, + "step": 5737 + }, + { + "epoch": 0.11, + "learning_rate": 1.7791153741602267e-07, + "loss": 0.0282, + "step": 5738 + }, + { + "epoch": 0.11, + "learning_rate": 1.7790765407168654e-07, + "loss": 0.0182, + "step": 5739 + }, + { + "epoch": 0.11, + "learning_rate": 1.7790377072735038e-07, + "loss": 0.1138, + "step": 5740 + }, + { + "epoch": 0.11, + "learning_rate": 1.7789988738301426e-07, + "loss": 0.0196, + "step": 5741 + }, + { + "epoch": 0.11, + "learning_rate": 1.778960040386781e-07, + "loss": 0.0146, + "step": 5742 + }, + { + "epoch": 0.11, + "learning_rate": 1.7789212069434197e-07, + "loss": 0.0672, + "step": 5743 + }, + { + "epoch": 0.11, + "learning_rate": 1.7788823735000582e-07, + "loss": 0.2332, + "step": 5744 + }, + { + "epoch": 0.11, + "learning_rate": 1.778843540056697e-07, + "loss": 0.0221, + "step": 5745 + }, + { + "epoch": 0.11, + "learning_rate": 1.7788047066133353e-07, + "loss": 0.0281, + "step": 5746 + }, + { + "epoch": 0.11, + "learning_rate": 1.778765873169974e-07, + "loss": 0.0254, + "step": 5747 + }, + { + "epoch": 0.11, + "learning_rate": 1.7787270397266125e-07, + "loss": 0.0136, + "step": 5748 + }, + { + "epoch": 0.11, + "learning_rate": 1.7786882062832512e-07, + "loss": 0.7018, + "step": 5749 + }, + { + "epoch": 0.11, + "learning_rate": 1.7786493728398897e-07, + "loss": 0.3211, + "step": 5750 + }, + { + "epoch": 0.11, + "learning_rate": 1.7786105393965284e-07, + "loss": 0.6105, + "step": 5751 + }, + { + "epoch": 0.11, + "learning_rate": 1.7785717059531668e-07, + "loss": 0.0138, + "step": 5752 + }, + { + "epoch": 0.11, + "learning_rate": 1.7785328725098055e-07, + "loss": 0.7331, + "step": 5753 + }, + { + "epoch": 0.11, + "learning_rate": 1.778494039066444e-07, + "loss": 0.6157, + "step": 5754 + }, + { + "epoch": 0.11, + "learning_rate": 1.7784552056230827e-07, + "loss": 0.0163, + "step": 5755 + }, + { + "epoch": 0.11, + "learning_rate": 1.7784163721797212e-07, + "loss": 0.0152, + "step": 5756 + }, + { + "epoch": 0.11, + "learning_rate": 1.77837753873636e-07, + "loss": 0.036, + "step": 5757 + }, + { + "epoch": 0.11, + "learning_rate": 1.7783387052929983e-07, + "loss": 0.055, + "step": 5758 + }, + { + "epoch": 0.11, + "learning_rate": 1.778299871849637e-07, + "loss": 0.0162, + "step": 5759 + }, + { + "epoch": 0.11, + "learning_rate": 1.7782610384062755e-07, + "loss": 0.0808, + "step": 5760 + }, + { + "epoch": 0.11, + "learning_rate": 1.7782222049629142e-07, + "loss": 0.587, + "step": 5761 + }, + { + "epoch": 0.11, + "learning_rate": 1.7781833715195526e-07, + "loss": 0.4887, + "step": 5762 + }, + { + "epoch": 0.11, + "learning_rate": 1.778144538076191e-07, + "loss": 0.0155, + "step": 5763 + }, + { + "epoch": 0.11, + "learning_rate": 1.7781057046328296e-07, + "loss": 0.0129, + "step": 5764 + }, + { + "epoch": 0.11, + "learning_rate": 1.7780668711894683e-07, + "loss": 0.0122, + "step": 5765 + }, + { + "epoch": 0.11, + "learning_rate": 1.7780280377461067e-07, + "loss": 0.0377, + "step": 5766 + }, + { + "epoch": 0.11, + "learning_rate": 1.7779892043027454e-07, + "loss": 0.0418, + "step": 5767 + }, + { + "epoch": 0.11, + "learning_rate": 1.777950370859384e-07, + "loss": 0.0153, + "step": 5768 + }, + { + "epoch": 0.11, + "learning_rate": 1.7779115374160226e-07, + "loss": 0.0253, + "step": 5769 + }, + { + "epoch": 0.11, + "learning_rate": 1.777872703972661e-07, + "loss": 0.0124, + "step": 5770 + }, + { + "epoch": 0.11, + "learning_rate": 1.7778338705292998e-07, + "loss": 0.0132, + "step": 5771 + }, + { + "epoch": 0.11, + "learning_rate": 1.7777950370859382e-07, + "loss": 0.0164, + "step": 5772 + }, + { + "epoch": 0.11, + "learning_rate": 1.777756203642577e-07, + "loss": 0.0178, + "step": 5773 + }, + { + "epoch": 0.11, + "learning_rate": 1.7777173701992154e-07, + "loss": 0.0698, + "step": 5774 + }, + { + "epoch": 0.11, + "learning_rate": 1.777678536755854e-07, + "loss": 0.0279, + "step": 5775 + }, + { + "epoch": 0.11, + "learning_rate": 1.7776397033124925e-07, + "loss": 0.0186, + "step": 5776 + }, + { + "epoch": 0.11, + "learning_rate": 1.7776008698691313e-07, + "loss": 0.0163, + "step": 5777 + }, + { + "epoch": 0.11, + "learning_rate": 1.7775620364257697e-07, + "loss": 0.0165, + "step": 5778 + }, + { + "epoch": 0.11, + "learning_rate": 1.7775232029824084e-07, + "loss": 0.4599, + "step": 5779 + }, + { + "epoch": 0.11, + "learning_rate": 1.777484369539047e-07, + "loss": 0.0132, + "step": 5780 + }, + { + "epoch": 0.11, + "learning_rate": 1.7774455360956856e-07, + "loss": 0.0168, + "step": 5781 + }, + { + "epoch": 0.11, + "learning_rate": 1.777406702652324e-07, + "loss": 0.1039, + "step": 5782 + }, + { + "epoch": 0.11, + "learning_rate": 1.7773678692089627e-07, + "loss": 0.0147, + "step": 5783 + }, + { + "epoch": 0.11, + "learning_rate": 1.7773290357656012e-07, + "loss": 0.014, + "step": 5784 + }, + { + "epoch": 0.11, + "learning_rate": 1.77729020232224e-07, + "loss": 0.0169, + "step": 5785 + }, + { + "epoch": 0.11, + "learning_rate": 1.7772513688788784e-07, + "loss": 0.0308, + "step": 5786 + }, + { + "epoch": 0.11, + "learning_rate": 1.777212535435517e-07, + "loss": 0.4304, + "step": 5787 + }, + { + "epoch": 0.11, + "learning_rate": 1.7771737019921555e-07, + "loss": 0.1235, + "step": 5788 + }, + { + "epoch": 0.11, + "learning_rate": 1.7771348685487942e-07, + "loss": 0.0172, + "step": 5789 + }, + { + "epoch": 0.11, + "learning_rate": 1.7770960351054327e-07, + "loss": 0.0193, + "step": 5790 + }, + { + "epoch": 0.11, + "learning_rate": 1.7770572016620714e-07, + "loss": 0.021, + "step": 5791 + }, + { + "epoch": 0.11, + "learning_rate": 1.7770183682187099e-07, + "loss": 0.0885, + "step": 5792 + }, + { + "epoch": 0.11, + "learning_rate": 1.7769795347753486e-07, + "loss": 0.0358, + "step": 5793 + }, + { + "epoch": 0.11, + "learning_rate": 1.776940701331987e-07, + "loss": 0.0354, + "step": 5794 + }, + { + "epoch": 0.11, + "learning_rate": 1.7769018678886257e-07, + "loss": 0.0822, + "step": 5795 + }, + { + "epoch": 0.11, + "learning_rate": 1.7768630344452642e-07, + "loss": 0.0113, + "step": 5796 + }, + { + "epoch": 0.11, + "learning_rate": 1.776824201001903e-07, + "loss": 0.6455, + "step": 5797 + }, + { + "epoch": 0.11, + "learning_rate": 1.7767853675585414e-07, + "loss": 0.6833, + "step": 5798 + }, + { + "epoch": 0.11, + "learning_rate": 1.77674653411518e-07, + "loss": 0.0122, + "step": 5799 + }, + { + "epoch": 0.11, + "learning_rate": 1.7767077006718185e-07, + "loss": 1.0878, + "step": 5800 + }, + { + "epoch": 0.11, + "learning_rate": 1.7766688672284572e-07, + "loss": 0.0134, + "step": 5801 + }, + { + "epoch": 0.11, + "learning_rate": 1.7766300337850957e-07, + "loss": 0.0495, + "step": 5802 + }, + { + "epoch": 0.11, + "learning_rate": 1.7765912003417341e-07, + "loss": 0.0207, + "step": 5803 + }, + { + "epoch": 0.11, + "learning_rate": 1.7765523668983728e-07, + "loss": 0.0219, + "step": 5804 + }, + { + "epoch": 0.11, + "learning_rate": 1.7765135334550113e-07, + "loss": 0.0695, + "step": 5805 + }, + { + "epoch": 0.11, + "learning_rate": 1.77647470001165e-07, + "loss": 0.0938, + "step": 5806 + }, + { + "epoch": 0.11, + "learning_rate": 1.7764358665682885e-07, + "loss": 0.0123, + "step": 5807 + }, + { + "epoch": 0.11, + "learning_rate": 1.7763970331249272e-07, + "loss": 0.0134, + "step": 5808 + }, + { + "epoch": 0.11, + "learning_rate": 1.7763581996815656e-07, + "loss": 0.6492, + "step": 5809 + }, + { + "epoch": 0.11, + "learning_rate": 1.7763193662382043e-07, + "loss": 0.0139, + "step": 5810 + }, + { + "epoch": 0.11, + "learning_rate": 1.7762805327948428e-07, + "loss": 0.0463, + "step": 5811 + }, + { + "epoch": 0.11, + "learning_rate": 1.7762416993514815e-07, + "loss": 0.0447, + "step": 5812 + }, + { + "epoch": 0.11, + "learning_rate": 1.77620286590812e-07, + "loss": 0.0317, + "step": 5813 + }, + { + "epoch": 0.11, + "learning_rate": 1.7761640324647587e-07, + "loss": 0.0165, + "step": 5814 + }, + { + "epoch": 0.11, + "learning_rate": 1.776125199021397e-07, + "loss": 0.0409, + "step": 5815 + }, + { + "epoch": 0.11, + "learning_rate": 1.7760863655780358e-07, + "loss": 0.1112, + "step": 5816 + }, + { + "epoch": 0.11, + "learning_rate": 1.7760475321346743e-07, + "loss": 0.2595, + "step": 5817 + }, + { + "epoch": 0.11, + "learning_rate": 1.776008698691313e-07, + "loss": 0.0169, + "step": 5818 + }, + { + "epoch": 0.11, + "learning_rate": 1.7759698652479515e-07, + "loss": 0.4023, + "step": 5819 + }, + { + "epoch": 0.11, + "learning_rate": 1.7759310318045902e-07, + "loss": 0.0166, + "step": 5820 + }, + { + "epoch": 0.11, + "learning_rate": 1.7758921983612286e-07, + "loss": 0.0362, + "step": 5821 + }, + { + "epoch": 0.11, + "learning_rate": 1.775853364917867e-07, + "loss": 0.016, + "step": 5822 + }, + { + "epoch": 0.11, + "learning_rate": 1.7758145314745058e-07, + "loss": 0.0154, + "step": 5823 + }, + { + "epoch": 0.11, + "learning_rate": 1.7757756980311442e-07, + "loss": 0.0444, + "step": 5824 + }, + { + "epoch": 0.11, + "learning_rate": 1.775736864587783e-07, + "loss": 0.0104, + "step": 5825 + }, + { + "epoch": 0.11, + "learning_rate": 1.7756980311444214e-07, + "loss": 0.0172, + "step": 5826 + }, + { + "epoch": 0.11, + "learning_rate": 1.77565919770106e-07, + "loss": 0.0153, + "step": 5827 + }, + { + "epoch": 0.11, + "learning_rate": 1.7756203642576986e-07, + "loss": 0.015, + "step": 5828 + }, + { + "epoch": 0.11, + "learning_rate": 1.7755815308143373e-07, + "loss": 0.0382, + "step": 5829 + }, + { + "epoch": 0.11, + "learning_rate": 1.7755426973709757e-07, + "loss": 0.0178, + "step": 5830 + }, + { + "epoch": 0.11, + "learning_rate": 1.7755038639276144e-07, + "loss": 0.0115, + "step": 5831 + }, + { + "epoch": 0.11, + "learning_rate": 1.775465030484253e-07, + "loss": 0.014, + "step": 5832 + }, + { + "epoch": 0.11, + "learning_rate": 1.7754261970408913e-07, + "loss": 0.0133, + "step": 5833 + }, + { + "epoch": 0.11, + "learning_rate": 1.77538736359753e-07, + "loss": 0.088, + "step": 5834 + }, + { + "epoch": 0.11, + "learning_rate": 1.7753485301541685e-07, + "loss": 0.0153, + "step": 5835 + }, + { + "epoch": 0.11, + "learning_rate": 1.7753096967108072e-07, + "loss": 0.021, + "step": 5836 + }, + { + "epoch": 0.11, + "learning_rate": 1.7752708632674457e-07, + "loss": 0.0267, + "step": 5837 + }, + { + "epoch": 0.11, + "learning_rate": 1.7752320298240844e-07, + "loss": 0.0107, + "step": 5838 + }, + { + "epoch": 0.11, + "learning_rate": 1.7751931963807228e-07, + "loss": 0.0939, + "step": 5839 + }, + { + "epoch": 0.11, + "learning_rate": 1.7751543629373616e-07, + "loss": 0.4859, + "step": 5840 + }, + { + "epoch": 0.11, + "learning_rate": 1.775115529494e-07, + "loss": 0.0121, + "step": 5841 + }, + { + "epoch": 0.11, + "learning_rate": 1.7750766960506387e-07, + "loss": 0.0169, + "step": 5842 + }, + { + "epoch": 0.11, + "learning_rate": 1.7750378626072772e-07, + "loss": 0.0121, + "step": 5843 + }, + { + "epoch": 0.11, + "learning_rate": 1.774999029163916e-07, + "loss": 0.0163, + "step": 5844 + }, + { + "epoch": 0.11, + "learning_rate": 1.7749601957205543e-07, + "loss": 0.0335, + "step": 5845 + }, + { + "epoch": 0.11, + "learning_rate": 1.774921362277193e-07, + "loss": 0.0155, + "step": 5846 + }, + { + "epoch": 0.11, + "learning_rate": 1.7748825288338315e-07, + "loss": 0.022, + "step": 5847 + }, + { + "epoch": 0.11, + "learning_rate": 1.7748436953904702e-07, + "loss": 0.0233, + "step": 5848 + }, + { + "epoch": 0.11, + "learning_rate": 1.7748048619471087e-07, + "loss": 0.0118, + "step": 5849 + }, + { + "epoch": 0.11, + "learning_rate": 1.7747660285037474e-07, + "loss": 0.0124, + "step": 5850 + }, + { + "epoch": 0.11, + "learning_rate": 1.7747271950603858e-07, + "loss": 0.0146, + "step": 5851 + }, + { + "epoch": 0.11, + "learning_rate": 1.7746883616170245e-07, + "loss": 0.0203, + "step": 5852 + }, + { + "epoch": 0.11, + "learning_rate": 1.774649528173663e-07, + "loss": 0.5751, + "step": 5853 + }, + { + "epoch": 0.11, + "learning_rate": 1.7746106947303017e-07, + "loss": 0.0153, + "step": 5854 + }, + { + "epoch": 0.11, + "learning_rate": 1.7745718612869402e-07, + "loss": 0.011, + "step": 5855 + }, + { + "epoch": 0.11, + "learning_rate": 1.774533027843579e-07, + "loss": 0.0314, + "step": 5856 + }, + { + "epoch": 0.11, + "learning_rate": 1.7744941944002173e-07, + "loss": 0.0163, + "step": 5857 + }, + { + "epoch": 0.11, + "learning_rate": 1.774455360956856e-07, + "loss": 0.0647, + "step": 5858 + }, + { + "epoch": 0.11, + "learning_rate": 1.7744165275134945e-07, + "loss": 0.0127, + "step": 5859 + }, + { + "epoch": 0.11, + "learning_rate": 1.7743776940701332e-07, + "loss": 0.5171, + "step": 5860 + }, + { + "epoch": 0.11, + "learning_rate": 1.7743388606267717e-07, + "loss": 0.013, + "step": 5861 + }, + { + "epoch": 0.11, + "learning_rate": 1.7743000271834104e-07, + "loss": 0.0114, + "step": 5862 + }, + { + "epoch": 0.11, + "learning_rate": 1.7742611937400488e-07, + "loss": 0.0138, + "step": 5863 + }, + { + "epoch": 0.11, + "learning_rate": 1.7742223602966875e-07, + "loss": 0.0189, + "step": 5864 + }, + { + "epoch": 0.11, + "learning_rate": 1.774183526853326e-07, + "loss": 0.0187, + "step": 5865 + }, + { + "epoch": 0.11, + "learning_rate": 1.7741446934099647e-07, + "loss": 0.0673, + "step": 5866 + }, + { + "epoch": 0.11, + "learning_rate": 1.7741058599666031e-07, + "loss": 0.0339, + "step": 5867 + }, + { + "epoch": 0.11, + "learning_rate": 1.7740670265232419e-07, + "loss": 0.0123, + "step": 5868 + }, + { + "epoch": 0.11, + "learning_rate": 1.7740281930798803e-07, + "loss": 0.0157, + "step": 5869 + }, + { + "epoch": 0.11, + "learning_rate": 1.773989359636519e-07, + "loss": 0.6022, + "step": 5870 + }, + { + "epoch": 0.11, + "learning_rate": 1.7739505261931575e-07, + "loss": 0.1753, + "step": 5871 + }, + { + "epoch": 0.11, + "learning_rate": 1.7739116927497962e-07, + "loss": 0.0677, + "step": 5872 + }, + { + "epoch": 0.11, + "learning_rate": 1.7738728593064346e-07, + "loss": 0.062, + "step": 5873 + }, + { + "epoch": 0.11, + "learning_rate": 1.7738340258630734e-07, + "loss": 0.0189, + "step": 5874 + }, + { + "epoch": 0.11, + "learning_rate": 1.7737951924197118e-07, + "loss": 0.1101, + "step": 5875 + }, + { + "epoch": 0.11, + "learning_rate": 1.7737563589763505e-07, + "loss": 0.0105, + "step": 5876 + }, + { + "epoch": 0.11, + "learning_rate": 1.773717525532989e-07, + "loss": 0.0116, + "step": 5877 + }, + { + "epoch": 0.11, + "learning_rate": 1.7736786920896277e-07, + "loss": 0.0169, + "step": 5878 + }, + { + "epoch": 0.11, + "learning_rate": 1.773639858646266e-07, + "loss": 0.0139, + "step": 5879 + }, + { + "epoch": 0.11, + "learning_rate": 1.7736010252029046e-07, + "loss": 0.0119, + "step": 5880 + }, + { + "epoch": 0.11, + "learning_rate": 1.773562191759543e-07, + "loss": 0.0132, + "step": 5881 + }, + { + "epoch": 0.11, + "learning_rate": 1.7735233583161817e-07, + "loss": 0.0125, + "step": 5882 + }, + { + "epoch": 0.11, + "learning_rate": 1.7734845248728202e-07, + "loss": 0.0163, + "step": 5883 + }, + { + "epoch": 0.11, + "learning_rate": 1.773445691429459e-07, + "loss": 0.4379, + "step": 5884 + }, + { + "epoch": 0.11, + "learning_rate": 1.7734068579860974e-07, + "loss": 0.0141, + "step": 5885 + }, + { + "epoch": 0.11, + "learning_rate": 1.773368024542736e-07, + "loss": 0.0182, + "step": 5886 + }, + { + "epoch": 0.11, + "learning_rate": 1.7733291910993745e-07, + "loss": 0.4202, + "step": 5887 + }, + { + "epoch": 0.11, + "learning_rate": 1.7732903576560132e-07, + "loss": 0.2955, + "step": 5888 + }, + { + "epoch": 0.11, + "learning_rate": 1.7732515242126517e-07, + "loss": 0.1289, + "step": 5889 + }, + { + "epoch": 0.11, + "learning_rate": 1.7732126907692904e-07, + "loss": 0.0142, + "step": 5890 + }, + { + "epoch": 0.11, + "learning_rate": 1.7731738573259289e-07, + "loss": 0.0109, + "step": 5891 + }, + { + "epoch": 0.11, + "learning_rate": 1.7731350238825676e-07, + "loss": 0.1348, + "step": 5892 + }, + { + "epoch": 0.11, + "learning_rate": 1.773096190439206e-07, + "loss": 0.036, + "step": 5893 + }, + { + "epoch": 0.11, + "learning_rate": 1.7730573569958447e-07, + "loss": 0.16, + "step": 5894 + }, + { + "epoch": 0.11, + "learning_rate": 1.7730185235524832e-07, + "loss": 0.0158, + "step": 5895 + }, + { + "epoch": 0.11, + "learning_rate": 1.772979690109122e-07, + "loss": 0.0469, + "step": 5896 + }, + { + "epoch": 0.11, + "learning_rate": 1.7729408566657604e-07, + "loss": 0.0126, + "step": 5897 + }, + { + "epoch": 0.11, + "learning_rate": 1.772902023222399e-07, + "loss": 0.0141, + "step": 5898 + }, + { + "epoch": 0.11, + "learning_rate": 1.7728631897790375e-07, + "loss": 0.7549, + "step": 5899 + }, + { + "epoch": 0.11, + "learning_rate": 1.7728243563356762e-07, + "loss": 0.1294, + "step": 5900 + }, + { + "epoch": 0.11, + "learning_rate": 1.7727855228923147e-07, + "loss": 0.2802, + "step": 5901 + }, + { + "epoch": 0.11, + "learning_rate": 1.7727466894489534e-07, + "loss": 0.0953, + "step": 5902 + }, + { + "epoch": 0.11, + "learning_rate": 1.7727078560055918e-07, + "loss": 0.0822, + "step": 5903 + }, + { + "epoch": 0.11, + "learning_rate": 1.7726690225622306e-07, + "loss": 0.023, + "step": 5904 + }, + { + "epoch": 0.11, + "learning_rate": 1.772630189118869e-07, + "loss": 0.0199, + "step": 5905 + }, + { + "epoch": 0.11, + "learning_rate": 1.7725913556755077e-07, + "loss": 0.4243, + "step": 5906 + }, + { + "epoch": 0.11, + "learning_rate": 1.7725525222321462e-07, + "loss": 0.0133, + "step": 5907 + }, + { + "epoch": 0.11, + "learning_rate": 1.772513688788785e-07, + "loss": 0.5047, + "step": 5908 + }, + { + "epoch": 0.11, + "learning_rate": 1.7724748553454233e-07, + "loss": 0.1288, + "step": 5909 + }, + { + "epoch": 0.11, + "learning_rate": 1.772436021902062e-07, + "loss": 0.4119, + "step": 5910 + }, + { + "epoch": 0.11, + "learning_rate": 1.7723971884587005e-07, + "loss": 0.1278, + "step": 5911 + }, + { + "epoch": 0.11, + "learning_rate": 1.7723583550153392e-07, + "loss": 0.0107, + "step": 5912 + }, + { + "epoch": 0.11, + "learning_rate": 1.7723195215719777e-07, + "loss": 0.0126, + "step": 5913 + }, + { + "epoch": 0.11, + "learning_rate": 1.7722806881286164e-07, + "loss": 0.0468, + "step": 5914 + }, + { + "epoch": 0.11, + "learning_rate": 1.7722418546852548e-07, + "loss": 0.0153, + "step": 5915 + }, + { + "epoch": 0.11, + "learning_rate": 1.7722030212418936e-07, + "loss": 0.5518, + "step": 5916 + }, + { + "epoch": 0.11, + "learning_rate": 1.772164187798532e-07, + "loss": 0.0463, + "step": 5917 + }, + { + "epoch": 0.11, + "learning_rate": 1.7721253543551707e-07, + "loss": 0.011, + "step": 5918 + }, + { + "epoch": 0.11, + "learning_rate": 1.7720865209118092e-07, + "loss": 0.1023, + "step": 5919 + }, + { + "epoch": 0.11, + "learning_rate": 1.772047687468448e-07, + "loss": 1.2189, + "step": 5920 + }, + { + "epoch": 0.11, + "learning_rate": 1.7720088540250863e-07, + "loss": 0.019, + "step": 5921 + }, + { + "epoch": 0.11, + "learning_rate": 1.771970020581725e-07, + "loss": 0.0145, + "step": 5922 + }, + { + "epoch": 0.11, + "learning_rate": 1.7719311871383635e-07, + "loss": 0.0212, + "step": 5923 + }, + { + "epoch": 0.11, + "learning_rate": 1.7718923536950022e-07, + "loss": 0.0216, + "step": 5924 + }, + { + "epoch": 0.11, + "learning_rate": 1.7718535202516407e-07, + "loss": 0.0135, + "step": 5925 + }, + { + "epoch": 0.11, + "learning_rate": 1.7718146868082794e-07, + "loss": 0.6036, + "step": 5926 + }, + { + "epoch": 0.11, + "learning_rate": 1.7717758533649178e-07, + "loss": 0.0218, + "step": 5927 + }, + { + "epoch": 0.11, + "learning_rate": 1.7717370199215565e-07, + "loss": 0.0263, + "step": 5928 + }, + { + "epoch": 0.12, + "learning_rate": 1.771698186478195e-07, + "loss": 0.0184, + "step": 5929 + }, + { + "epoch": 0.12, + "learning_rate": 1.7716593530348337e-07, + "loss": 0.0141, + "step": 5930 + }, + { + "epoch": 0.12, + "learning_rate": 1.7716205195914722e-07, + "loss": 0.0137, + "step": 5931 + }, + { + "epoch": 0.12, + "learning_rate": 1.771581686148111e-07, + "loss": 0.0156, + "step": 5932 + }, + { + "epoch": 0.12, + "learning_rate": 1.7715428527047493e-07, + "loss": 0.0427, + "step": 5933 + }, + { + "epoch": 0.12, + "learning_rate": 1.771504019261388e-07, + "loss": 0.0141, + "step": 5934 + }, + { + "epoch": 0.12, + "learning_rate": 1.7714651858180265e-07, + "loss": 0.0235, + "step": 5935 + }, + { + "epoch": 0.12, + "learning_rate": 1.7714263523746652e-07, + "loss": 0.0294, + "step": 5936 + }, + { + "epoch": 0.12, + "learning_rate": 1.7713875189313034e-07, + "loss": 0.0319, + "step": 5937 + }, + { + "epoch": 0.12, + "learning_rate": 1.771348685487942e-07, + "loss": 0.0109, + "step": 5938 + }, + { + "epoch": 0.12, + "learning_rate": 1.7713098520445806e-07, + "loss": 0.0137, + "step": 5939 + }, + { + "epoch": 0.12, + "learning_rate": 1.7712710186012193e-07, + "loss": 0.0087, + "step": 5940 + }, + { + "epoch": 0.12, + "learning_rate": 1.7712321851578577e-07, + "loss": 0.1937, + "step": 5941 + }, + { + "epoch": 0.12, + "learning_rate": 1.7711933517144964e-07, + "loss": 0.0134, + "step": 5942 + }, + { + "epoch": 0.12, + "learning_rate": 1.771154518271135e-07, + "loss": 0.1276, + "step": 5943 + }, + { + "epoch": 0.12, + "learning_rate": 1.7711156848277736e-07, + "loss": 0.0239, + "step": 5944 + }, + { + "epoch": 0.12, + "learning_rate": 1.771076851384412e-07, + "loss": 0.598, + "step": 5945 + }, + { + "epoch": 0.12, + "learning_rate": 1.7710380179410508e-07, + "loss": 0.0297, + "step": 5946 + }, + { + "epoch": 0.12, + "learning_rate": 1.7709991844976892e-07, + "loss": 0.0324, + "step": 5947 + }, + { + "epoch": 0.12, + "learning_rate": 1.770960351054328e-07, + "loss": 0.5592, + "step": 5948 + }, + { + "epoch": 0.12, + "learning_rate": 1.7709215176109664e-07, + "loss": 0.2522, + "step": 5949 + }, + { + "epoch": 0.12, + "learning_rate": 1.770882684167605e-07, + "loss": 0.0103, + "step": 5950 + }, + { + "epoch": 0.12, + "learning_rate": 1.7708438507242435e-07, + "loss": 0.043, + "step": 5951 + }, + { + "epoch": 0.12, + "learning_rate": 1.7708050172808823e-07, + "loss": 0.229, + "step": 5952 + }, + { + "epoch": 0.12, + "learning_rate": 1.7707661838375207e-07, + "loss": 0.0801, + "step": 5953 + }, + { + "epoch": 0.12, + "learning_rate": 1.7707273503941594e-07, + "loss": 0.0214, + "step": 5954 + }, + { + "epoch": 0.12, + "learning_rate": 1.770688516950798e-07, + "loss": 0.065, + "step": 5955 + }, + { + "epoch": 0.12, + "learning_rate": 1.7706496835074366e-07, + "loss": 0.0128, + "step": 5956 + }, + { + "epoch": 0.12, + "learning_rate": 1.770610850064075e-07, + "loss": 0.2705, + "step": 5957 + }, + { + "epoch": 0.12, + "learning_rate": 1.7705720166207138e-07, + "loss": 0.6734, + "step": 5958 + }, + { + "epoch": 0.12, + "learning_rate": 1.7705331831773522e-07, + "loss": 0.0143, + "step": 5959 + }, + { + "epoch": 0.12, + "learning_rate": 1.770494349733991e-07, + "loss": 0.0415, + "step": 5960 + }, + { + "epoch": 0.12, + "learning_rate": 1.7704555162906294e-07, + "loss": 0.0171, + "step": 5961 + }, + { + "epoch": 0.12, + "learning_rate": 1.770416682847268e-07, + "loss": 0.018, + "step": 5962 + }, + { + "epoch": 0.12, + "learning_rate": 1.7703778494039065e-07, + "loss": 0.0382, + "step": 5963 + }, + { + "epoch": 0.12, + "learning_rate": 1.7703390159605452e-07, + "loss": 0.0131, + "step": 5964 + }, + { + "epoch": 0.12, + "learning_rate": 1.7703001825171837e-07, + "loss": 0.0194, + "step": 5965 + }, + { + "epoch": 0.12, + "learning_rate": 1.7702613490738224e-07, + "loss": 0.0161, + "step": 5966 + }, + { + "epoch": 0.12, + "learning_rate": 1.7702225156304609e-07, + "loss": 0.0181, + "step": 5967 + }, + { + "epoch": 0.12, + "learning_rate": 1.7701836821870996e-07, + "loss": 0.0119, + "step": 5968 + }, + { + "epoch": 0.12, + "learning_rate": 1.770144848743738e-07, + "loss": 0.0129, + "step": 5969 + }, + { + "epoch": 0.12, + "learning_rate": 1.7701060153003767e-07, + "loss": 0.0188, + "step": 5970 + }, + { + "epoch": 0.12, + "learning_rate": 1.7700671818570152e-07, + "loss": 0.0104, + "step": 5971 + }, + { + "epoch": 0.12, + "learning_rate": 1.770028348413654e-07, + "loss": 0.2144, + "step": 5972 + }, + { + "epoch": 0.12, + "learning_rate": 1.7699895149702924e-07, + "loss": 0.3207, + "step": 5973 + }, + { + "epoch": 0.12, + "learning_rate": 1.769950681526931e-07, + "loss": 1.1012, + "step": 5974 + }, + { + "epoch": 0.12, + "learning_rate": 1.7699118480835695e-07, + "loss": 0.0114, + "step": 5975 + }, + { + "epoch": 0.12, + "learning_rate": 1.7698730146402082e-07, + "loss": 0.1925, + "step": 5976 + }, + { + "epoch": 0.12, + "learning_rate": 1.7698341811968467e-07, + "loss": 0.0564, + "step": 5977 + }, + { + "epoch": 0.12, + "learning_rate": 1.7697953477534854e-07, + "loss": 0.3001, + "step": 5978 + }, + { + "epoch": 0.12, + "learning_rate": 1.7697565143101238e-07, + "loss": 0.0168, + "step": 5979 + }, + { + "epoch": 0.12, + "learning_rate": 1.7697176808667623e-07, + "loss": 0.0614, + "step": 5980 + }, + { + "epoch": 0.12, + "learning_rate": 1.769678847423401e-07, + "loss": 0.7483, + "step": 5981 + }, + { + "epoch": 0.12, + "learning_rate": 1.7696400139800395e-07, + "loss": 0.0868, + "step": 5982 + }, + { + "epoch": 0.12, + "learning_rate": 1.7696011805366782e-07, + "loss": 0.0093, + "step": 5983 + }, + { + "epoch": 0.12, + "learning_rate": 1.7695623470933166e-07, + "loss": 0.0438, + "step": 5984 + }, + { + "epoch": 0.12, + "learning_rate": 1.7695235136499553e-07, + "loss": 0.0147, + "step": 5985 + }, + { + "epoch": 0.12, + "learning_rate": 1.7694846802065938e-07, + "loss": 0.0123, + "step": 5986 + }, + { + "epoch": 0.12, + "learning_rate": 1.7694458467632325e-07, + "loss": 0.1239, + "step": 5987 + }, + { + "epoch": 0.12, + "learning_rate": 1.769407013319871e-07, + "loss": 0.0105, + "step": 5988 + }, + { + "epoch": 0.12, + "learning_rate": 1.7693681798765097e-07, + "loss": 0.062, + "step": 5989 + }, + { + "epoch": 0.12, + "learning_rate": 1.769329346433148e-07, + "loss": 0.1148, + "step": 5990 + }, + { + "epoch": 0.12, + "learning_rate": 1.7692905129897868e-07, + "loss": 0.0142, + "step": 5991 + }, + { + "epoch": 0.12, + "learning_rate": 1.7692516795464253e-07, + "loss": 0.0146, + "step": 5992 + }, + { + "epoch": 0.12, + "learning_rate": 1.769212846103064e-07, + "loss": 0.0286, + "step": 5993 + }, + { + "epoch": 0.12, + "learning_rate": 1.7691740126597025e-07, + "loss": 0.0204, + "step": 5994 + }, + { + "epoch": 0.12, + "learning_rate": 1.769135179216341e-07, + "loss": 0.0123, + "step": 5995 + }, + { + "epoch": 0.12, + "learning_rate": 1.7690963457729796e-07, + "loss": 0.0129, + "step": 5996 + }, + { + "epoch": 0.12, + "learning_rate": 1.769057512329618e-07, + "loss": 0.019, + "step": 5997 + }, + { + "epoch": 0.12, + "learning_rate": 1.7690186788862568e-07, + "loss": 0.0243, + "step": 5998 + }, + { + "epoch": 0.12, + "learning_rate": 1.7689798454428952e-07, + "loss": 0.0604, + "step": 5999 + }, + { + "epoch": 0.12, + "learning_rate": 1.768941011999534e-07, + "loss": 0.0379, + "step": 6000 + }, + { + "epoch": 0.12, + "learning_rate": 1.7689021785561724e-07, + "loss": 0.1718, + "step": 6001 + }, + { + "epoch": 0.12, + "learning_rate": 1.768863345112811e-07, + "loss": 0.0714, + "step": 6002 + }, + { + "epoch": 0.12, + "learning_rate": 1.7688245116694496e-07, + "loss": 0.02, + "step": 6003 + }, + { + "epoch": 0.12, + "learning_rate": 1.7687856782260883e-07, + "loss": 0.0118, + "step": 6004 + }, + { + "epoch": 0.12, + "learning_rate": 1.7687468447827267e-07, + "loss": 0.0116, + "step": 6005 + }, + { + "epoch": 0.12, + "learning_rate": 1.7687080113393654e-07, + "loss": 0.0123, + "step": 6006 + }, + { + "epoch": 0.12, + "learning_rate": 1.768669177896004e-07, + "loss": 0.0088, + "step": 6007 + }, + { + "epoch": 0.12, + "learning_rate": 1.7686303444526426e-07, + "loss": 0.015, + "step": 6008 + }, + { + "epoch": 0.12, + "learning_rate": 1.768591511009281e-07, + "loss": 0.3419, + "step": 6009 + }, + { + "epoch": 0.12, + "learning_rate": 1.7685526775659195e-07, + "loss": 0.0209, + "step": 6010 + }, + { + "epoch": 0.12, + "learning_rate": 1.7685138441225582e-07, + "loss": 0.0393, + "step": 6011 + }, + { + "epoch": 0.12, + "learning_rate": 1.7684750106791967e-07, + "loss": 0.02, + "step": 6012 + }, + { + "epoch": 0.12, + "learning_rate": 1.7684361772358354e-07, + "loss": 0.7565, + "step": 6013 + }, + { + "epoch": 0.12, + "learning_rate": 1.7683973437924738e-07, + "loss": 0.075, + "step": 6014 + }, + { + "epoch": 0.12, + "learning_rate": 1.7683585103491126e-07, + "loss": 0.0158, + "step": 6015 + }, + { + "epoch": 0.12, + "learning_rate": 1.768319676905751e-07, + "loss": 0.0626, + "step": 6016 + }, + { + "epoch": 0.12, + "learning_rate": 1.7682808434623897e-07, + "loss": 0.0252, + "step": 6017 + }, + { + "epoch": 0.12, + "learning_rate": 1.7682420100190282e-07, + "loss": 0.0128, + "step": 6018 + }, + { + "epoch": 0.12, + "learning_rate": 1.768203176575667e-07, + "loss": 0.0804, + "step": 6019 + }, + { + "epoch": 0.12, + "learning_rate": 1.7681643431323053e-07, + "loss": 0.0117, + "step": 6020 + }, + { + "epoch": 0.12, + "learning_rate": 1.768125509688944e-07, + "loss": 0.0102, + "step": 6021 + }, + { + "epoch": 0.12, + "learning_rate": 1.7680866762455825e-07, + "loss": 0.0103, + "step": 6022 + }, + { + "epoch": 0.12, + "learning_rate": 1.7680478428022212e-07, + "loss": 0.0145, + "step": 6023 + }, + { + "epoch": 0.12, + "learning_rate": 1.7680090093588597e-07, + "loss": 0.4205, + "step": 6024 + }, + { + "epoch": 0.12, + "learning_rate": 1.7679701759154984e-07, + "loss": 0.0146, + "step": 6025 + }, + { + "epoch": 0.12, + "learning_rate": 1.7679313424721368e-07, + "loss": 0.0148, + "step": 6026 + }, + { + "epoch": 0.12, + "learning_rate": 1.7678925090287755e-07, + "loss": 0.0306, + "step": 6027 + }, + { + "epoch": 0.12, + "learning_rate": 1.767853675585414e-07, + "loss": 0.341, + "step": 6028 + }, + { + "epoch": 0.12, + "learning_rate": 1.7678148421420527e-07, + "loss": 0.0194, + "step": 6029 + }, + { + "epoch": 0.12, + "learning_rate": 1.7677760086986912e-07, + "loss": 0.2471, + "step": 6030 + }, + { + "epoch": 0.12, + "learning_rate": 1.76773717525533e-07, + "loss": 0.0494, + "step": 6031 + }, + { + "epoch": 0.12, + "learning_rate": 1.7676983418119683e-07, + "loss": 0.0224, + "step": 6032 + }, + { + "epoch": 0.12, + "learning_rate": 1.767659508368607e-07, + "loss": 0.069, + "step": 6033 + }, + { + "epoch": 0.12, + "learning_rate": 1.7676206749252455e-07, + "loss": 0.0139, + "step": 6034 + }, + { + "epoch": 0.12, + "learning_rate": 1.7675818414818842e-07, + "loss": 0.0158, + "step": 6035 + }, + { + "epoch": 0.12, + "learning_rate": 1.7675430080385227e-07, + "loss": 0.5509, + "step": 6036 + }, + { + "epoch": 0.12, + "learning_rate": 1.7675041745951614e-07, + "loss": 0.0213, + "step": 6037 + }, + { + "epoch": 0.12, + "learning_rate": 1.7674653411517998e-07, + "loss": 0.4241, + "step": 6038 + }, + { + "epoch": 0.12, + "learning_rate": 1.7674265077084385e-07, + "loss": 0.0146, + "step": 6039 + }, + { + "epoch": 0.12, + "learning_rate": 1.767387674265077e-07, + "loss": 0.2478, + "step": 6040 + }, + { + "epoch": 0.12, + "learning_rate": 1.7673488408217157e-07, + "loss": 0.0143, + "step": 6041 + }, + { + "epoch": 0.12, + "learning_rate": 1.7673100073783541e-07, + "loss": 0.0104, + "step": 6042 + }, + { + "epoch": 0.12, + "learning_rate": 1.7672711739349929e-07, + "loss": 0.014, + "step": 6043 + }, + { + "epoch": 0.12, + "learning_rate": 1.7672323404916313e-07, + "loss": 0.0365, + "step": 6044 + }, + { + "epoch": 0.12, + "learning_rate": 1.76719350704827e-07, + "loss": 0.6642, + "step": 6045 + }, + { + "epoch": 0.12, + "learning_rate": 1.7671546736049085e-07, + "loss": 0.0429, + "step": 6046 + }, + { + "epoch": 0.12, + "learning_rate": 1.7671158401615472e-07, + "loss": 0.0121, + "step": 6047 + }, + { + "epoch": 0.12, + "learning_rate": 1.7670770067181856e-07, + "loss": 0.7326, + "step": 6048 + }, + { + "epoch": 0.12, + "learning_rate": 1.7670381732748244e-07, + "loss": 0.0219, + "step": 6049 + }, + { + "epoch": 0.12, + "learning_rate": 1.7669993398314628e-07, + "loss": 0.1291, + "step": 6050 + }, + { + "epoch": 0.12, + "learning_rate": 1.7669605063881015e-07, + "loss": 0.1807, + "step": 6051 + }, + { + "epoch": 0.12, + "learning_rate": 1.76692167294474e-07, + "loss": 0.0124, + "step": 6052 + }, + { + "epoch": 0.12, + "learning_rate": 1.7668828395013784e-07, + "loss": 0.1581, + "step": 6053 + }, + { + "epoch": 0.12, + "learning_rate": 1.766844006058017e-07, + "loss": 0.0356, + "step": 6054 + }, + { + "epoch": 0.12, + "learning_rate": 1.7668051726146556e-07, + "loss": 0.0141, + "step": 6055 + }, + { + "epoch": 0.12, + "learning_rate": 1.766766339171294e-07, + "loss": 0.0124, + "step": 6056 + }, + { + "epoch": 0.12, + "learning_rate": 1.7667275057279328e-07, + "loss": 0.0231, + "step": 6057 + }, + { + "epoch": 0.12, + "learning_rate": 1.7666886722845712e-07, + "loss": 0.0779, + "step": 6058 + }, + { + "epoch": 0.12, + "learning_rate": 1.76664983884121e-07, + "loss": 0.0165, + "step": 6059 + }, + { + "epoch": 0.12, + "learning_rate": 1.7666110053978484e-07, + "loss": 0.1693, + "step": 6060 + }, + { + "epoch": 0.12, + "learning_rate": 1.766572171954487e-07, + "loss": 0.0125, + "step": 6061 + }, + { + "epoch": 0.12, + "learning_rate": 1.7665333385111255e-07, + "loss": 0.1682, + "step": 6062 + }, + { + "epoch": 0.12, + "learning_rate": 1.7664945050677642e-07, + "loss": 0.0109, + "step": 6063 + }, + { + "epoch": 0.12, + "learning_rate": 1.7664556716244027e-07, + "loss": 0.0303, + "step": 6064 + }, + { + "epoch": 0.12, + "learning_rate": 1.7664168381810414e-07, + "loss": 0.421, + "step": 6065 + }, + { + "epoch": 0.12, + "learning_rate": 1.7663780047376799e-07, + "loss": 0.0123, + "step": 6066 + }, + { + "epoch": 0.12, + "learning_rate": 1.7663391712943186e-07, + "loss": 0.0799, + "step": 6067 + }, + { + "epoch": 0.12, + "learning_rate": 1.766300337850957e-07, + "loss": 0.0244, + "step": 6068 + }, + { + "epoch": 0.12, + "learning_rate": 1.7662615044075957e-07, + "loss": 0.0149, + "step": 6069 + }, + { + "epoch": 0.12, + "learning_rate": 1.7662226709642342e-07, + "loss": 0.5627, + "step": 6070 + }, + { + "epoch": 0.12, + "learning_rate": 1.766183837520873e-07, + "loss": 0.0386, + "step": 6071 + }, + { + "epoch": 0.12, + "learning_rate": 1.7661450040775114e-07, + "loss": 0.0215, + "step": 6072 + }, + { + "epoch": 0.12, + "learning_rate": 1.76610617063415e-07, + "loss": 0.0256, + "step": 6073 + }, + { + "epoch": 0.12, + "learning_rate": 1.7660673371907885e-07, + "loss": 0.3825, + "step": 6074 + }, + { + "epoch": 0.12, + "learning_rate": 1.7660285037474272e-07, + "loss": 0.0121, + "step": 6075 + }, + { + "epoch": 0.12, + "learning_rate": 1.7659896703040657e-07, + "loss": 0.1095, + "step": 6076 + }, + { + "epoch": 0.12, + "learning_rate": 1.7659508368607044e-07, + "loss": 0.0102, + "step": 6077 + }, + { + "epoch": 0.12, + "learning_rate": 1.7659120034173428e-07, + "loss": 0.0448, + "step": 6078 + }, + { + "epoch": 0.12, + "learning_rate": 1.7658731699739816e-07, + "loss": 0.0165, + "step": 6079 + }, + { + "epoch": 0.12, + "learning_rate": 1.76583433653062e-07, + "loss": 0.1659, + "step": 6080 + }, + { + "epoch": 0.12, + "learning_rate": 1.7657955030872587e-07, + "loss": 0.0116, + "step": 6081 + }, + { + "epoch": 0.12, + "learning_rate": 1.7657566696438972e-07, + "loss": 0.0724, + "step": 6082 + }, + { + "epoch": 0.12, + "learning_rate": 1.765717836200536e-07, + "loss": 0.015, + "step": 6083 + }, + { + "epoch": 0.12, + "learning_rate": 1.7656790027571743e-07, + "loss": 0.0479, + "step": 6084 + }, + { + "epoch": 0.12, + "learning_rate": 1.765640169313813e-07, + "loss": 0.0192, + "step": 6085 + }, + { + "epoch": 0.12, + "learning_rate": 1.7656013358704515e-07, + "loss": 0.0251, + "step": 6086 + }, + { + "epoch": 0.12, + "learning_rate": 1.7655625024270902e-07, + "loss": 1.1619, + "step": 6087 + }, + { + "epoch": 0.12, + "learning_rate": 1.7655236689837287e-07, + "loss": 0.019, + "step": 6088 + }, + { + "epoch": 0.12, + "learning_rate": 1.7654848355403674e-07, + "loss": 0.0238, + "step": 6089 + }, + { + "epoch": 0.12, + "learning_rate": 1.7654460020970058e-07, + "loss": 0.0375, + "step": 6090 + }, + { + "epoch": 0.12, + "learning_rate": 1.7654071686536446e-07, + "loss": 0.0269, + "step": 6091 + }, + { + "epoch": 0.12, + "learning_rate": 1.765368335210283e-07, + "loss": 0.0546, + "step": 6092 + }, + { + "epoch": 0.12, + "learning_rate": 1.7653295017669217e-07, + "loss": 0.0144, + "step": 6093 + }, + { + "epoch": 0.12, + "learning_rate": 1.7652906683235602e-07, + "loss": 0.0099, + "step": 6094 + }, + { + "epoch": 0.12, + "learning_rate": 1.765251834880199e-07, + "loss": 0.0105, + "step": 6095 + }, + { + "epoch": 0.12, + "learning_rate": 1.7652130014368373e-07, + "loss": 0.01, + "step": 6096 + }, + { + "epoch": 0.12, + "learning_rate": 1.765174167993476e-07, + "loss": 0.0398, + "step": 6097 + }, + { + "epoch": 0.12, + "learning_rate": 1.7651353345501145e-07, + "loss": 0.0285, + "step": 6098 + }, + { + "epoch": 0.12, + "learning_rate": 1.7650965011067532e-07, + "loss": 0.0114, + "step": 6099 + }, + { + "epoch": 0.12, + "learning_rate": 1.7650576676633917e-07, + "loss": 0.2341, + "step": 6100 + }, + { + "epoch": 0.12, + "learning_rate": 1.7650188342200304e-07, + "loss": 0.0135, + "step": 6101 + }, + { + "epoch": 0.12, + "learning_rate": 1.7649800007766688e-07, + "loss": 0.0599, + "step": 6102 + }, + { + "epoch": 0.12, + "learning_rate": 1.7649411673333075e-07, + "loss": 0.0374, + "step": 6103 + }, + { + "epoch": 0.12, + "learning_rate": 1.764902333889946e-07, + "loss": 0.0123, + "step": 6104 + }, + { + "epoch": 0.12, + "learning_rate": 1.7648635004465847e-07, + "loss": 0.0162, + "step": 6105 + }, + { + "epoch": 0.12, + "learning_rate": 1.7648246670032232e-07, + "loss": 0.2015, + "step": 6106 + }, + { + "epoch": 0.12, + "learning_rate": 1.764785833559862e-07, + "loss": 0.0136, + "step": 6107 + }, + { + "epoch": 0.12, + "learning_rate": 1.7647470001165003e-07, + "loss": 0.0205, + "step": 6108 + }, + { + "epoch": 0.12, + "learning_rate": 1.764708166673139e-07, + "loss": 0.0136, + "step": 6109 + }, + { + "epoch": 0.12, + "learning_rate": 1.7646693332297775e-07, + "loss": 0.0111, + "step": 6110 + }, + { + "epoch": 0.12, + "learning_rate": 1.764630499786416e-07, + "loss": 0.0259, + "step": 6111 + }, + { + "epoch": 0.12, + "learning_rate": 1.7645916663430544e-07, + "loss": 0.0174, + "step": 6112 + }, + { + "epoch": 0.12, + "learning_rate": 1.764552832899693e-07, + "loss": 0.0214, + "step": 6113 + }, + { + "epoch": 0.12, + "learning_rate": 1.7645139994563316e-07, + "loss": 0.4588, + "step": 6114 + }, + { + "epoch": 0.12, + "learning_rate": 1.7644751660129703e-07, + "loss": 0.0546, + "step": 6115 + }, + { + "epoch": 0.12, + "learning_rate": 1.7644363325696087e-07, + "loss": 0.0139, + "step": 6116 + }, + { + "epoch": 0.12, + "learning_rate": 1.7643974991262474e-07, + "loss": 0.8498, + "step": 6117 + }, + { + "epoch": 0.12, + "learning_rate": 1.764358665682886e-07, + "loss": 0.1365, + "step": 6118 + }, + { + "epoch": 0.12, + "learning_rate": 1.7643198322395246e-07, + "loss": 0.0135, + "step": 6119 + }, + { + "epoch": 0.12, + "learning_rate": 1.764280998796163e-07, + "loss": 0.5514, + "step": 6120 + }, + { + "epoch": 0.12, + "learning_rate": 1.7642421653528018e-07, + "loss": 0.2581, + "step": 6121 + }, + { + "epoch": 0.12, + "learning_rate": 1.7642033319094402e-07, + "loss": 0.0147, + "step": 6122 + }, + { + "epoch": 0.12, + "learning_rate": 1.764164498466079e-07, + "loss": 0.0221, + "step": 6123 + }, + { + "epoch": 0.12, + "learning_rate": 1.7641256650227174e-07, + "loss": 0.3716, + "step": 6124 + }, + { + "epoch": 0.12, + "learning_rate": 1.764086831579356e-07, + "loss": 0.0212, + "step": 6125 + }, + { + "epoch": 0.12, + "learning_rate": 1.7640479981359945e-07, + "loss": 0.0169, + "step": 6126 + }, + { + "epoch": 0.12, + "learning_rate": 1.7640091646926333e-07, + "loss": 0.139, + "step": 6127 + }, + { + "epoch": 0.12, + "learning_rate": 1.7639703312492717e-07, + "loss": 0.6743, + "step": 6128 + }, + { + "epoch": 0.12, + "learning_rate": 1.7639314978059104e-07, + "loss": 0.0194, + "step": 6129 + }, + { + "epoch": 0.12, + "learning_rate": 1.763892664362549e-07, + "loss": 0.0222, + "step": 6130 + }, + { + "epoch": 0.12, + "learning_rate": 1.7638538309191876e-07, + "loss": 0.4131, + "step": 6131 + }, + { + "epoch": 0.12, + "learning_rate": 1.763814997475826e-07, + "loss": 0.0116, + "step": 6132 + }, + { + "epoch": 0.12, + "learning_rate": 1.7637761640324648e-07, + "loss": 0.063, + "step": 6133 + }, + { + "epoch": 0.12, + "learning_rate": 1.7637373305891032e-07, + "loss": 0.0121, + "step": 6134 + }, + { + "epoch": 0.12, + "learning_rate": 1.763698497145742e-07, + "loss": 0.0317, + "step": 6135 + }, + { + "epoch": 0.12, + "learning_rate": 1.7636596637023804e-07, + "loss": 0.0104, + "step": 6136 + }, + { + "epoch": 0.12, + "learning_rate": 1.763620830259019e-07, + "loss": 0.3065, + "step": 6137 + }, + { + "epoch": 0.12, + "learning_rate": 1.7635819968156575e-07, + "loss": 0.0141, + "step": 6138 + }, + { + "epoch": 0.12, + "learning_rate": 1.7635431633722962e-07, + "loss": 0.1287, + "step": 6139 + }, + { + "epoch": 0.12, + "learning_rate": 1.7635043299289347e-07, + "loss": 0.6124, + "step": 6140 + }, + { + "epoch": 0.12, + "learning_rate": 1.7634654964855734e-07, + "loss": 0.011, + "step": 6141 + }, + { + "epoch": 0.12, + "learning_rate": 1.7634266630422119e-07, + "loss": 0.0174, + "step": 6142 + }, + { + "epoch": 0.12, + "learning_rate": 1.7633878295988506e-07, + "loss": 0.0108, + "step": 6143 + }, + { + "epoch": 0.12, + "learning_rate": 1.763348996155489e-07, + "loss": 0.3062, + "step": 6144 + }, + { + "epoch": 0.12, + "learning_rate": 1.7633101627121277e-07, + "loss": 0.0104, + "step": 6145 + }, + { + "epoch": 0.12, + "learning_rate": 1.7632713292687662e-07, + "loss": 0.2516, + "step": 6146 + }, + { + "epoch": 0.12, + "learning_rate": 1.763232495825405e-07, + "loss": 0.0142, + "step": 6147 + }, + { + "epoch": 0.12, + "learning_rate": 1.7631936623820434e-07, + "loss": 0.0116, + "step": 6148 + }, + { + "epoch": 0.12, + "learning_rate": 1.763154828938682e-07, + "loss": 0.2509, + "step": 6149 + }, + { + "epoch": 0.12, + "learning_rate": 1.7631159954953205e-07, + "loss": 0.3776, + "step": 6150 + }, + { + "epoch": 0.12, + "learning_rate": 1.7630771620519592e-07, + "loss": 0.011, + "step": 6151 + }, + { + "epoch": 0.12, + "learning_rate": 1.7630383286085977e-07, + "loss": 0.0244, + "step": 6152 + }, + { + "epoch": 0.12, + "learning_rate": 1.7629994951652364e-07, + "loss": 0.012, + "step": 6153 + }, + { + "epoch": 0.12, + "learning_rate": 1.7629606617218749e-07, + "loss": 0.0141, + "step": 6154 + }, + { + "epoch": 0.12, + "learning_rate": 1.7629218282785136e-07, + "loss": 0.0554, + "step": 6155 + }, + { + "epoch": 0.12, + "learning_rate": 1.762882994835152e-07, + "loss": 0.0164, + "step": 6156 + }, + { + "epoch": 0.12, + "learning_rate": 1.7628441613917905e-07, + "loss": 0.0759, + "step": 6157 + }, + { + "epoch": 0.12, + "learning_rate": 1.7628053279484292e-07, + "loss": 0.0137, + "step": 6158 + }, + { + "epoch": 0.12, + "learning_rate": 1.7627664945050676e-07, + "loss": 0.0133, + "step": 6159 + }, + { + "epoch": 0.12, + "learning_rate": 1.7627276610617063e-07, + "loss": 0.016, + "step": 6160 + }, + { + "epoch": 0.12, + "learning_rate": 1.7626888276183448e-07, + "loss": 0.0494, + "step": 6161 + }, + { + "epoch": 0.12, + "learning_rate": 1.7626499941749835e-07, + "loss": 0.0099, + "step": 6162 + }, + { + "epoch": 0.12, + "learning_rate": 1.762611160731622e-07, + "loss": 0.0518, + "step": 6163 + }, + { + "epoch": 0.12, + "learning_rate": 1.7625723272882607e-07, + "loss": 0.1619, + "step": 6164 + }, + { + "epoch": 0.12, + "learning_rate": 1.762533493844899e-07, + "loss": 0.0171, + "step": 6165 + }, + { + "epoch": 0.12, + "learning_rate": 1.7624946604015378e-07, + "loss": 0.0363, + "step": 6166 + }, + { + "epoch": 0.12, + "learning_rate": 1.7624558269581763e-07, + "loss": 0.0129, + "step": 6167 + }, + { + "epoch": 0.12, + "learning_rate": 1.762416993514815e-07, + "loss": 0.014, + "step": 6168 + }, + { + "epoch": 0.12, + "learning_rate": 1.7623781600714535e-07, + "loss": 0.0433, + "step": 6169 + }, + { + "epoch": 0.12, + "learning_rate": 1.762339326628092e-07, + "loss": 0.0092, + "step": 6170 + }, + { + "epoch": 0.12, + "learning_rate": 1.7623004931847306e-07, + "loss": 0.0165, + "step": 6171 + }, + { + "epoch": 0.12, + "learning_rate": 1.762261659741369e-07, + "loss": 0.0117, + "step": 6172 + }, + { + "epoch": 0.12, + "learning_rate": 1.7622228262980078e-07, + "loss": 0.0748, + "step": 6173 + }, + { + "epoch": 0.12, + "learning_rate": 1.7621839928546462e-07, + "loss": 0.4686, + "step": 6174 + }, + { + "epoch": 0.12, + "learning_rate": 1.762145159411285e-07, + "loss": 0.0399, + "step": 6175 + }, + { + "epoch": 0.12, + "learning_rate": 1.7621063259679234e-07, + "loss": 0.0133, + "step": 6176 + }, + { + "epoch": 0.12, + "learning_rate": 1.762067492524562e-07, + "loss": 0.046, + "step": 6177 + }, + { + "epoch": 0.12, + "learning_rate": 1.7620286590812006e-07, + "loss": 0.0124, + "step": 6178 + }, + { + "epoch": 0.12, + "learning_rate": 1.7619898256378393e-07, + "loss": 0.0223, + "step": 6179 + }, + { + "epoch": 0.12, + "learning_rate": 1.7619509921944777e-07, + "loss": 0.0113, + "step": 6180 + }, + { + "epoch": 0.12, + "learning_rate": 1.7619121587511164e-07, + "loss": 0.0091, + "step": 6181 + }, + { + "epoch": 0.12, + "learning_rate": 1.761873325307755e-07, + "loss": 0.0096, + "step": 6182 + }, + { + "epoch": 0.12, + "learning_rate": 1.7618344918643936e-07, + "loss": 0.0241, + "step": 6183 + }, + { + "epoch": 0.12, + "learning_rate": 1.761795658421032e-07, + "loss": 0.0129, + "step": 6184 + }, + { + "epoch": 0.12, + "learning_rate": 1.7617568249776708e-07, + "loss": 0.0129, + "step": 6185 + }, + { + "epoch": 0.12, + "learning_rate": 1.7617179915343092e-07, + "loss": 0.2871, + "step": 6186 + }, + { + "epoch": 0.12, + "learning_rate": 1.7616791580909477e-07, + "loss": 0.418, + "step": 6187 + }, + { + "epoch": 0.12, + "learning_rate": 1.7616403246475864e-07, + "loss": 0.0127, + "step": 6188 + }, + { + "epoch": 0.12, + "learning_rate": 1.7616014912042248e-07, + "loss": 0.0366, + "step": 6189 + }, + { + "epoch": 0.12, + "learning_rate": 1.7615626577608636e-07, + "loss": 0.0162, + "step": 6190 + }, + { + "epoch": 0.12, + "learning_rate": 1.761523824317502e-07, + "loss": 0.0316, + "step": 6191 + }, + { + "epoch": 0.12, + "learning_rate": 1.7614849908741407e-07, + "loss": 0.0145, + "step": 6192 + }, + { + "epoch": 0.12, + "learning_rate": 1.7614461574307792e-07, + "loss": 0.0109, + "step": 6193 + }, + { + "epoch": 0.12, + "learning_rate": 1.761407323987418e-07, + "loss": 0.0149, + "step": 6194 + }, + { + "epoch": 0.12, + "learning_rate": 1.7613684905440563e-07, + "loss": 0.0359, + "step": 6195 + }, + { + "epoch": 0.12, + "learning_rate": 1.761329657100695e-07, + "loss": 0.011, + "step": 6196 + }, + { + "epoch": 0.12, + "learning_rate": 1.7612908236573335e-07, + "loss": 0.0463, + "step": 6197 + }, + { + "epoch": 0.12, + "learning_rate": 1.7612519902139722e-07, + "loss": 0.0219, + "step": 6198 + }, + { + "epoch": 0.12, + "learning_rate": 1.7612131567706107e-07, + "loss": 0.0106, + "step": 6199 + }, + { + "epoch": 0.12, + "learning_rate": 1.7611743233272494e-07, + "loss": 0.0158, + "step": 6200 + }, + { + "epoch": 0.12, + "learning_rate": 1.7611354898838878e-07, + "loss": 0.0391, + "step": 6201 + }, + { + "epoch": 0.12, + "learning_rate": 1.7610966564405265e-07, + "loss": 0.0201, + "step": 6202 + }, + { + "epoch": 0.12, + "learning_rate": 1.761057822997165e-07, + "loss": 0.0228, + "step": 6203 + }, + { + "epoch": 0.12, + "learning_rate": 1.7610189895538037e-07, + "loss": 0.0115, + "step": 6204 + }, + { + "epoch": 0.12, + "learning_rate": 1.7609801561104422e-07, + "loss": 0.5414, + "step": 6205 + }, + { + "epoch": 0.12, + "learning_rate": 1.760941322667081e-07, + "loss": 0.012, + "step": 6206 + }, + { + "epoch": 0.12, + "learning_rate": 1.7609024892237193e-07, + "loss": 0.0635, + "step": 6207 + }, + { + "epoch": 0.12, + "learning_rate": 1.760863655780358e-07, + "loss": 0.8994, + "step": 6208 + }, + { + "epoch": 0.12, + "learning_rate": 1.7608248223369965e-07, + "loss": 0.7657, + "step": 6209 + }, + { + "epoch": 0.12, + "learning_rate": 1.7607859888936352e-07, + "loss": 0.0126, + "step": 6210 + }, + { + "epoch": 0.12, + "learning_rate": 1.7607471554502737e-07, + "loss": 0.0325, + "step": 6211 + }, + { + "epoch": 0.12, + "learning_rate": 1.7607083220069124e-07, + "loss": 0.0131, + "step": 6212 + }, + { + "epoch": 0.12, + "learning_rate": 1.7606694885635508e-07, + "loss": 0.0788, + "step": 6213 + }, + { + "epoch": 0.12, + "learning_rate": 1.7606306551201895e-07, + "loss": 0.0162, + "step": 6214 + }, + { + "epoch": 0.12, + "learning_rate": 1.760591821676828e-07, + "loss": 0.0093, + "step": 6215 + }, + { + "epoch": 0.12, + "learning_rate": 1.7605529882334667e-07, + "loss": 0.0106, + "step": 6216 + }, + { + "epoch": 0.12, + "learning_rate": 1.7605141547901051e-07, + "loss": 0.0205, + "step": 6217 + }, + { + "epoch": 0.12, + "learning_rate": 1.7604753213467439e-07, + "loss": 0.0151, + "step": 6218 + }, + { + "epoch": 0.12, + "learning_rate": 1.7604364879033823e-07, + "loss": 0.1916, + "step": 6219 + }, + { + "epoch": 0.12, + "learning_rate": 1.760397654460021e-07, + "loss": 0.1324, + "step": 6220 + }, + { + "epoch": 0.12, + "learning_rate": 1.7603588210166595e-07, + "loss": 0.0191, + "step": 6221 + }, + { + "epoch": 0.12, + "learning_rate": 1.7603199875732982e-07, + "loss": 0.0101, + "step": 6222 + }, + { + "epoch": 0.12, + "learning_rate": 1.7602811541299366e-07, + "loss": 0.021, + "step": 6223 + }, + { + "epoch": 0.12, + "learning_rate": 1.7602423206865754e-07, + "loss": 0.1796, + "step": 6224 + }, + { + "epoch": 0.12, + "learning_rate": 1.7602034872432138e-07, + "loss": 0.0128, + "step": 6225 + }, + { + "epoch": 0.12, + "learning_rate": 1.7601646537998525e-07, + "loss": 0.6901, + "step": 6226 + }, + { + "epoch": 0.12, + "learning_rate": 1.7601258203564907e-07, + "loss": 0.0102, + "step": 6227 + }, + { + "epoch": 0.12, + "learning_rate": 1.7600869869131294e-07, + "loss": 0.0118, + "step": 6228 + }, + { + "epoch": 0.12, + "learning_rate": 1.760048153469768e-07, + "loss": 0.0179, + "step": 6229 + }, + { + "epoch": 0.12, + "learning_rate": 1.7600093200264066e-07, + "loss": 0.0116, + "step": 6230 + }, + { + "epoch": 0.12, + "learning_rate": 1.759970486583045e-07, + "loss": 0.017, + "step": 6231 + }, + { + "epoch": 0.12, + "learning_rate": 1.7599316531396838e-07, + "loss": 0.0126, + "step": 6232 + }, + { + "epoch": 0.12, + "learning_rate": 1.7598928196963222e-07, + "loss": 0.0163, + "step": 6233 + }, + { + "epoch": 0.12, + "learning_rate": 1.759853986252961e-07, + "loss": 0.0283, + "step": 6234 + }, + { + "epoch": 0.12, + "learning_rate": 1.7598151528095994e-07, + "loss": 0.0098, + "step": 6235 + }, + { + "epoch": 0.12, + "learning_rate": 1.759776319366238e-07, + "loss": 0.0841, + "step": 6236 + }, + { + "epoch": 0.12, + "learning_rate": 1.7597374859228765e-07, + "loss": 0.0111, + "step": 6237 + }, + { + "epoch": 0.12, + "learning_rate": 1.7596986524795152e-07, + "loss": 0.0101, + "step": 6238 + }, + { + "epoch": 0.12, + "learning_rate": 1.7596598190361537e-07, + "loss": 0.0488, + "step": 6239 + }, + { + "epoch": 0.12, + "learning_rate": 1.7596209855927924e-07, + "loss": 0.0692, + "step": 6240 + }, + { + "epoch": 0.12, + "learning_rate": 1.7595821521494309e-07, + "loss": 0.021, + "step": 6241 + }, + { + "epoch": 0.12, + "learning_rate": 1.7595433187060696e-07, + "loss": 0.338, + "step": 6242 + }, + { + "epoch": 0.12, + "learning_rate": 1.759504485262708e-07, + "loss": 0.0086, + "step": 6243 + }, + { + "epoch": 0.12, + "learning_rate": 1.7594656518193467e-07, + "loss": 0.0133, + "step": 6244 + }, + { + "epoch": 0.12, + "learning_rate": 1.7594268183759852e-07, + "loss": 0.0101, + "step": 6245 + }, + { + "epoch": 0.12, + "learning_rate": 1.759387984932624e-07, + "loss": 0.009, + "step": 6246 + }, + { + "epoch": 0.12, + "learning_rate": 1.7593491514892624e-07, + "loss": 0.1483, + "step": 6247 + }, + { + "epoch": 0.12, + "learning_rate": 1.759310318045901e-07, + "loss": 0.0137, + "step": 6248 + }, + { + "epoch": 0.12, + "learning_rate": 1.7592714846025395e-07, + "loss": 0.0114, + "step": 6249 + }, + { + "epoch": 0.12, + "learning_rate": 1.7592326511591782e-07, + "loss": 0.0094, + "step": 6250 + }, + { + "epoch": 0.12, + "learning_rate": 1.7591938177158167e-07, + "loss": 0.0116, + "step": 6251 + }, + { + "epoch": 0.12, + "learning_rate": 1.7591549842724554e-07, + "loss": 0.01, + "step": 6252 + }, + { + "epoch": 0.12, + "learning_rate": 1.7591161508290939e-07, + "loss": 0.0989, + "step": 6253 + }, + { + "epoch": 0.12, + "learning_rate": 1.7590773173857326e-07, + "loss": 0.0629, + "step": 6254 + }, + { + "epoch": 0.12, + "learning_rate": 1.759038483942371e-07, + "loss": 0.0099, + "step": 6255 + }, + { + "epoch": 0.12, + "learning_rate": 1.7589996504990097e-07, + "loss": 0.0187, + "step": 6256 + }, + { + "epoch": 0.12, + "learning_rate": 1.7589608170556482e-07, + "loss": 0.0099, + "step": 6257 + }, + { + "epoch": 0.12, + "learning_rate": 1.758921983612287e-07, + "loss": 0.0125, + "step": 6258 + }, + { + "epoch": 0.12, + "learning_rate": 1.7588831501689253e-07, + "loss": 0.0859, + "step": 6259 + }, + { + "epoch": 0.12, + "learning_rate": 1.758844316725564e-07, + "loss": 0.4273, + "step": 6260 + }, + { + "epoch": 0.12, + "learning_rate": 1.7588054832822025e-07, + "loss": 0.574, + "step": 6261 + }, + { + "epoch": 0.12, + "learning_rate": 1.7587666498388412e-07, + "loss": 0.0113, + "step": 6262 + }, + { + "epoch": 0.12, + "learning_rate": 1.7587278163954797e-07, + "loss": 0.0288, + "step": 6263 + }, + { + "epoch": 0.12, + "learning_rate": 1.7586889829521184e-07, + "loss": 0.0136, + "step": 6264 + }, + { + "epoch": 0.12, + "learning_rate": 1.7586501495087568e-07, + "loss": 0.0169, + "step": 6265 + }, + { + "epoch": 0.12, + "learning_rate": 1.7586113160653956e-07, + "loss": 0.0184, + "step": 6266 + }, + { + "epoch": 0.12, + "learning_rate": 1.758572482622034e-07, + "loss": 0.0128, + "step": 6267 + }, + { + "epoch": 0.12, + "learning_rate": 1.7585336491786727e-07, + "loss": 0.02, + "step": 6268 + }, + { + "epoch": 0.12, + "learning_rate": 1.7584948157353112e-07, + "loss": 0.0264, + "step": 6269 + }, + { + "epoch": 0.12, + "learning_rate": 1.75845598229195e-07, + "loss": 0.0312, + "step": 6270 + }, + { + "epoch": 0.12, + "learning_rate": 1.7584171488485883e-07, + "loss": 0.1934, + "step": 6271 + }, + { + "epoch": 0.12, + "learning_rate": 1.758378315405227e-07, + "loss": 0.0087, + "step": 6272 + }, + { + "epoch": 0.12, + "learning_rate": 1.7583394819618655e-07, + "loss": 0.0116, + "step": 6273 + }, + { + "epoch": 0.12, + "learning_rate": 1.7583006485185042e-07, + "loss": 0.519, + "step": 6274 + }, + { + "epoch": 0.12, + "learning_rate": 1.7582618150751427e-07, + "loss": 0.0142, + "step": 6275 + }, + { + "epoch": 0.12, + "learning_rate": 1.7582229816317814e-07, + "loss": 0.0122, + "step": 6276 + }, + { + "epoch": 0.12, + "learning_rate": 1.7581841481884198e-07, + "loss": 0.011, + "step": 6277 + }, + { + "epoch": 0.12, + "learning_rate": 1.7581453147450585e-07, + "loss": 0.181, + "step": 6278 + }, + { + "epoch": 0.12, + "learning_rate": 1.758106481301697e-07, + "loss": 0.3667, + "step": 6279 + }, + { + "epoch": 0.12, + "learning_rate": 1.7580676478583357e-07, + "loss": 0.0237, + "step": 6280 + }, + { + "epoch": 0.12, + "learning_rate": 1.7580288144149742e-07, + "loss": 0.3495, + "step": 6281 + }, + { + "epoch": 0.12, + "learning_rate": 1.757989980971613e-07, + "loss": 0.0132, + "step": 6282 + }, + { + "epoch": 0.12, + "learning_rate": 1.7579511475282513e-07, + "loss": 0.0339, + "step": 6283 + }, + { + "epoch": 0.12, + "learning_rate": 1.75791231408489e-07, + "loss": 0.0682, + "step": 6284 + }, + { + "epoch": 0.12, + "learning_rate": 1.7578734806415282e-07, + "loss": 0.0102, + "step": 6285 + }, + { + "epoch": 0.12, + "learning_rate": 1.757834647198167e-07, + "loss": 0.0138, + "step": 6286 + }, + { + "epoch": 0.12, + "learning_rate": 1.7577958137548054e-07, + "loss": 0.046, + "step": 6287 + }, + { + "epoch": 0.12, + "learning_rate": 1.757756980311444e-07, + "loss": 0.0168, + "step": 6288 + }, + { + "epoch": 0.12, + "learning_rate": 1.7577181468680826e-07, + "loss": 0.0287, + "step": 6289 + }, + { + "epoch": 0.12, + "learning_rate": 1.7576793134247213e-07, + "loss": 0.0939, + "step": 6290 + }, + { + "epoch": 0.12, + "learning_rate": 1.7576404799813597e-07, + "loss": 0.0107, + "step": 6291 + }, + { + "epoch": 0.12, + "learning_rate": 1.7576016465379984e-07, + "loss": 0.3071, + "step": 6292 + }, + { + "epoch": 0.12, + "learning_rate": 1.757562813094637e-07, + "loss": 0.0094, + "step": 6293 + }, + { + "epoch": 0.12, + "learning_rate": 1.7575239796512756e-07, + "loss": 0.0098, + "step": 6294 + }, + { + "epoch": 0.12, + "learning_rate": 1.757485146207914e-07, + "loss": 0.0259, + "step": 6295 + }, + { + "epoch": 0.12, + "learning_rate": 1.7574463127645528e-07, + "loss": 0.0088, + "step": 6296 + }, + { + "epoch": 0.12, + "learning_rate": 1.7574074793211912e-07, + "loss": 0.9533, + "step": 6297 + }, + { + "epoch": 0.12, + "learning_rate": 1.75736864587783e-07, + "loss": 0.0105, + "step": 6298 + }, + { + "epoch": 0.12, + "learning_rate": 1.7573298124344684e-07, + "loss": 0.0101, + "step": 6299 + }, + { + "epoch": 0.12, + "learning_rate": 1.757290978991107e-07, + "loss": 0.0122, + "step": 6300 + }, + { + "epoch": 0.12, + "learning_rate": 1.7572521455477455e-07, + "loss": 0.013, + "step": 6301 + }, + { + "epoch": 0.12, + "learning_rate": 1.7572133121043843e-07, + "loss": 0.1332, + "step": 6302 + }, + { + "epoch": 0.12, + "learning_rate": 1.7571744786610227e-07, + "loss": 0.0362, + "step": 6303 + }, + { + "epoch": 0.12, + "learning_rate": 1.7571356452176614e-07, + "loss": 0.0114, + "step": 6304 + }, + { + "epoch": 0.12, + "learning_rate": 1.7570968117743e-07, + "loss": 0.055, + "step": 6305 + }, + { + "epoch": 0.12, + "learning_rate": 1.7570579783309386e-07, + "loss": 0.0473, + "step": 6306 + }, + { + "epoch": 0.12, + "learning_rate": 1.757019144887577e-07, + "loss": 0.0106, + "step": 6307 + }, + { + "epoch": 0.12, + "learning_rate": 1.7569803114442158e-07, + "loss": 0.2482, + "step": 6308 + }, + { + "epoch": 0.12, + "learning_rate": 1.7569414780008542e-07, + "loss": 0.0175, + "step": 6309 + }, + { + "epoch": 0.12, + "learning_rate": 1.756902644557493e-07, + "loss": 0.0289, + "step": 6310 + }, + { + "epoch": 0.12, + "learning_rate": 1.7568638111141314e-07, + "loss": 0.0141, + "step": 6311 + }, + { + "epoch": 0.12, + "learning_rate": 1.75682497767077e-07, + "loss": 0.0197, + "step": 6312 + }, + { + "epoch": 0.12, + "learning_rate": 1.7567861442274085e-07, + "loss": 0.0116, + "step": 6313 + }, + { + "epoch": 0.12, + "learning_rate": 1.7567473107840472e-07, + "loss": 0.725, + "step": 6314 + }, + { + "epoch": 0.12, + "learning_rate": 1.7567084773406857e-07, + "loss": 0.0096, + "step": 6315 + }, + { + "epoch": 0.12, + "learning_rate": 1.7566696438973244e-07, + "loss": 0.0121, + "step": 6316 + }, + { + "epoch": 0.12, + "learning_rate": 1.7566308104539629e-07, + "loss": 0.0098, + "step": 6317 + }, + { + "epoch": 0.12, + "learning_rate": 1.7565919770106016e-07, + "loss": 0.0133, + "step": 6318 + }, + { + "epoch": 0.12, + "learning_rate": 1.75655314356724e-07, + "loss": 0.5857, + "step": 6319 + }, + { + "epoch": 0.12, + "learning_rate": 1.7565143101238787e-07, + "loss": 0.0355, + "step": 6320 + }, + { + "epoch": 0.12, + "learning_rate": 1.7564754766805172e-07, + "loss": 0.0094, + "step": 6321 + }, + { + "epoch": 0.12, + "learning_rate": 1.756436643237156e-07, + "loss": 0.0096, + "step": 6322 + }, + { + "epoch": 0.12, + "learning_rate": 1.7563978097937944e-07, + "loss": 0.0557, + "step": 6323 + }, + { + "epoch": 0.12, + "learning_rate": 1.756358976350433e-07, + "loss": 0.1503, + "step": 6324 + }, + { + "epoch": 0.12, + "learning_rate": 1.7563201429070715e-07, + "loss": 0.8494, + "step": 6325 + }, + { + "epoch": 0.12, + "learning_rate": 1.7562813094637102e-07, + "loss": 0.0391, + "step": 6326 + }, + { + "epoch": 0.12, + "learning_rate": 1.7562424760203487e-07, + "loss": 0.6987, + "step": 6327 + }, + { + "epoch": 0.12, + "learning_rate": 1.7562036425769874e-07, + "loss": 0.738, + "step": 6328 + }, + { + "epoch": 0.12, + "learning_rate": 1.7561648091336259e-07, + "loss": 0.0661, + "step": 6329 + }, + { + "epoch": 0.12, + "learning_rate": 1.7561259756902646e-07, + "loss": 0.0164, + "step": 6330 + }, + { + "epoch": 0.12, + "learning_rate": 1.756087142246903e-07, + "loss": 0.0138, + "step": 6331 + }, + { + "epoch": 0.12, + "learning_rate": 1.7560483088035417e-07, + "loss": 0.0239, + "step": 6332 + }, + { + "epoch": 0.12, + "learning_rate": 1.7560094753601802e-07, + "loss": 0.0247, + "step": 6333 + }, + { + "epoch": 0.12, + "learning_rate": 1.7559706419168186e-07, + "loss": 0.0437, + "step": 6334 + }, + { + "epoch": 0.12, + "learning_rate": 1.7559318084734573e-07, + "loss": 0.1349, + "step": 6335 + }, + { + "epoch": 0.12, + "learning_rate": 1.7558929750300958e-07, + "loss": 0.0103, + "step": 6336 + }, + { + "epoch": 0.12, + "learning_rate": 1.7558541415867345e-07, + "loss": 0.0106, + "step": 6337 + }, + { + "epoch": 0.12, + "learning_rate": 1.755815308143373e-07, + "loss": 0.12, + "step": 6338 + }, + { + "epoch": 0.12, + "learning_rate": 1.7557764747000117e-07, + "loss": 0.1303, + "step": 6339 + }, + { + "epoch": 0.12, + "learning_rate": 1.75573764125665e-07, + "loss": 0.0102, + "step": 6340 + }, + { + "epoch": 0.12, + "learning_rate": 1.7556988078132888e-07, + "loss": 0.439, + "step": 6341 + }, + { + "epoch": 0.12, + "learning_rate": 1.7556599743699273e-07, + "loss": 0.0108, + "step": 6342 + }, + { + "epoch": 0.12, + "learning_rate": 1.7556211409265657e-07, + "loss": 0.08, + "step": 6343 + }, + { + "epoch": 0.12, + "learning_rate": 1.7555823074832045e-07, + "loss": 0.0373, + "step": 6344 + }, + { + "epoch": 0.12, + "learning_rate": 1.755543474039843e-07, + "loss": 0.2001, + "step": 6345 + }, + { + "epoch": 0.12, + "learning_rate": 1.7555046405964816e-07, + "loss": 0.7773, + "step": 6346 + }, + { + "epoch": 0.12, + "learning_rate": 1.75546580715312e-07, + "loss": 0.0111, + "step": 6347 + }, + { + "epoch": 0.12, + "learning_rate": 1.7554269737097588e-07, + "loss": 0.0195, + "step": 6348 + }, + { + "epoch": 0.12, + "learning_rate": 1.7553881402663972e-07, + "loss": 0.0135, + "step": 6349 + }, + { + "epoch": 0.12, + "learning_rate": 1.755349306823036e-07, + "loss": 0.2821, + "step": 6350 + }, + { + "epoch": 0.12, + "learning_rate": 1.7553104733796744e-07, + "loss": 0.032, + "step": 6351 + }, + { + "epoch": 0.12, + "learning_rate": 1.755271639936313e-07, + "loss": 0.2858, + "step": 6352 + }, + { + "epoch": 0.12, + "learning_rate": 1.7552328064929516e-07, + "loss": 0.0834, + "step": 6353 + }, + { + "epoch": 0.12, + "learning_rate": 1.7551939730495903e-07, + "loss": 0.0119, + "step": 6354 + }, + { + "epoch": 0.12, + "learning_rate": 1.7551551396062287e-07, + "loss": 0.0292, + "step": 6355 + }, + { + "epoch": 0.12, + "learning_rate": 1.7551163061628674e-07, + "loss": 0.0108, + "step": 6356 + }, + { + "epoch": 0.12, + "learning_rate": 1.755077472719506e-07, + "loss": 0.2756, + "step": 6357 + }, + { + "epoch": 0.12, + "learning_rate": 1.7550386392761446e-07, + "loss": 0.0212, + "step": 6358 + }, + { + "epoch": 0.12, + "learning_rate": 1.754999805832783e-07, + "loss": 0.263, + "step": 6359 + }, + { + "epoch": 0.12, + "learning_rate": 1.7549609723894218e-07, + "loss": 0.135, + "step": 6360 + }, + { + "epoch": 0.12, + "learning_rate": 1.7549221389460602e-07, + "loss": 0.0159, + "step": 6361 + }, + { + "epoch": 0.12, + "learning_rate": 1.754883305502699e-07, + "loss": 0.3218, + "step": 6362 + }, + { + "epoch": 0.12, + "learning_rate": 1.7548444720593374e-07, + "loss": 0.0103, + "step": 6363 + }, + { + "epoch": 0.12, + "learning_rate": 1.7548056386159758e-07, + "loss": 0.5396, + "step": 6364 + }, + { + "epoch": 0.12, + "learning_rate": 1.7547668051726146e-07, + "loss": 0.0151, + "step": 6365 + }, + { + "epoch": 0.12, + "learning_rate": 1.754727971729253e-07, + "loss": 0.0708, + "step": 6366 + }, + { + "epoch": 0.12, + "learning_rate": 1.7546891382858917e-07, + "loss": 0.0133, + "step": 6367 + }, + { + "epoch": 0.12, + "learning_rate": 1.7546503048425302e-07, + "loss": 0.0099, + "step": 6368 + }, + { + "epoch": 0.12, + "learning_rate": 1.754611471399169e-07, + "loss": 0.6803, + "step": 6369 + }, + { + "epoch": 0.12, + "learning_rate": 1.7545726379558073e-07, + "loss": 0.9251, + "step": 6370 + }, + { + "epoch": 0.12, + "learning_rate": 1.754533804512446e-07, + "loss": 0.01, + "step": 6371 + }, + { + "epoch": 0.12, + "learning_rate": 1.7544949710690845e-07, + "loss": 0.0114, + "step": 6372 + }, + { + "epoch": 0.12, + "learning_rate": 1.7544561376257232e-07, + "loss": 0.0087, + "step": 6373 + }, + { + "epoch": 0.12, + "learning_rate": 1.7544173041823617e-07, + "loss": 0.0144, + "step": 6374 + }, + { + "epoch": 0.12, + "learning_rate": 1.7543784707390004e-07, + "loss": 0.0408, + "step": 6375 + }, + { + "epoch": 0.12, + "learning_rate": 1.7543396372956388e-07, + "loss": 0.0126, + "step": 6376 + }, + { + "epoch": 0.12, + "learning_rate": 1.7543008038522775e-07, + "loss": 0.032, + "step": 6377 + }, + { + "epoch": 0.12, + "learning_rate": 1.754261970408916e-07, + "loss": 0.016, + "step": 6378 + }, + { + "epoch": 0.12, + "learning_rate": 1.7542231369655547e-07, + "loss": 0.3392, + "step": 6379 + }, + { + "epoch": 0.12, + "learning_rate": 1.7541843035221932e-07, + "loss": 0.1461, + "step": 6380 + }, + { + "epoch": 0.12, + "learning_rate": 1.754145470078832e-07, + "loss": 0.0108, + "step": 6381 + }, + { + "epoch": 0.12, + "learning_rate": 1.7541066366354703e-07, + "loss": 0.0245, + "step": 6382 + }, + { + "epoch": 0.12, + "learning_rate": 1.754067803192109e-07, + "loss": 0.0088, + "step": 6383 + }, + { + "epoch": 0.12, + "learning_rate": 1.7540289697487475e-07, + "loss": 0.4318, + "step": 6384 + }, + { + "epoch": 0.12, + "learning_rate": 1.7539901363053862e-07, + "loss": 0.0618, + "step": 6385 + }, + { + "epoch": 0.12, + "learning_rate": 1.7539513028620247e-07, + "loss": 0.0098, + "step": 6386 + }, + { + "epoch": 0.12, + "learning_rate": 1.7539124694186634e-07, + "loss": 0.013, + "step": 6387 + }, + { + "epoch": 0.12, + "learning_rate": 1.7538736359753018e-07, + "loss": 0.0202, + "step": 6388 + }, + { + "epoch": 0.12, + "learning_rate": 1.7538348025319405e-07, + "loss": 0.0124, + "step": 6389 + }, + { + "epoch": 0.12, + "learning_rate": 1.753795969088579e-07, + "loss": 0.0707, + "step": 6390 + }, + { + "epoch": 0.12, + "learning_rate": 1.7537571356452177e-07, + "loss": 0.0477, + "step": 6391 + }, + { + "epoch": 0.12, + "learning_rate": 1.7537183022018561e-07, + "loss": 0.0118, + "step": 6392 + }, + { + "epoch": 0.12, + "learning_rate": 1.7536794687584949e-07, + "loss": 0.011, + "step": 6393 + }, + { + "epoch": 0.12, + "learning_rate": 1.7536406353151333e-07, + "loss": 0.0116, + "step": 6394 + }, + { + "epoch": 0.12, + "learning_rate": 1.753601801871772e-07, + "loss": 0.4516, + "step": 6395 + }, + { + "epoch": 0.12, + "learning_rate": 1.7535629684284105e-07, + "loss": 0.3194, + "step": 6396 + }, + { + "epoch": 0.12, + "learning_rate": 1.7535241349850492e-07, + "loss": 0.0156, + "step": 6397 + }, + { + "epoch": 0.12, + "learning_rate": 1.7534853015416876e-07, + "loss": 0.0231, + "step": 6398 + }, + { + "epoch": 0.12, + "learning_rate": 1.7534464680983264e-07, + "loss": 0.289, + "step": 6399 + }, + { + "epoch": 0.12, + "learning_rate": 1.7534076346549648e-07, + "loss": 0.0135, + "step": 6400 + }, + { + "epoch": 0.12, + "learning_rate": 1.7533688012116033e-07, + "loss": 0.0111, + "step": 6401 + }, + { + "epoch": 0.12, + "learning_rate": 1.7533299677682417e-07, + "loss": 0.0817, + "step": 6402 + }, + { + "epoch": 0.12, + "learning_rate": 1.7532911343248804e-07, + "loss": 0.0144, + "step": 6403 + }, + { + "epoch": 0.12, + "learning_rate": 1.753252300881519e-07, + "loss": 0.1266, + "step": 6404 + }, + { + "epoch": 0.12, + "learning_rate": 1.7532134674381576e-07, + "loss": 0.0117, + "step": 6405 + }, + { + "epoch": 0.12, + "learning_rate": 1.753174633994796e-07, + "loss": 0.2626, + "step": 6406 + }, + { + "epoch": 0.12, + "learning_rate": 1.7531358005514348e-07, + "loss": 0.0112, + "step": 6407 + }, + { + "epoch": 0.12, + "learning_rate": 1.7530969671080732e-07, + "loss": 0.0132, + "step": 6408 + }, + { + "epoch": 0.12, + "learning_rate": 1.753058133664712e-07, + "loss": 0.0125, + "step": 6409 + }, + { + "epoch": 0.12, + "learning_rate": 1.7530193002213504e-07, + "loss": 0.0089, + "step": 6410 + }, + { + "epoch": 0.12, + "learning_rate": 1.752980466777989e-07, + "loss": 0.0107, + "step": 6411 + }, + { + "epoch": 0.12, + "learning_rate": 1.7529416333346275e-07, + "loss": 0.0232, + "step": 6412 + }, + { + "epoch": 0.12, + "learning_rate": 1.7529027998912662e-07, + "loss": 0.0139, + "step": 6413 + }, + { + "epoch": 0.12, + "learning_rate": 1.7528639664479047e-07, + "loss": 0.0153, + "step": 6414 + }, + { + "epoch": 0.12, + "learning_rate": 1.7528251330045434e-07, + "loss": 0.0151, + "step": 6415 + }, + { + "epoch": 0.12, + "learning_rate": 1.7527862995611819e-07, + "loss": 0.11, + "step": 6416 + }, + { + "epoch": 0.12, + "learning_rate": 1.7527474661178206e-07, + "loss": 0.0103, + "step": 6417 + }, + { + "epoch": 0.12, + "learning_rate": 1.752708632674459e-07, + "loss": 0.0912, + "step": 6418 + }, + { + "epoch": 0.12, + "learning_rate": 1.7526697992310977e-07, + "loss": 0.1035, + "step": 6419 + }, + { + "epoch": 0.12, + "learning_rate": 1.7526309657877362e-07, + "loss": 0.0192, + "step": 6420 + }, + { + "epoch": 0.12, + "learning_rate": 1.752592132344375e-07, + "loss": 0.3451, + "step": 6421 + }, + { + "epoch": 0.12, + "learning_rate": 1.7525532989010134e-07, + "loss": 0.011, + "step": 6422 + }, + { + "epoch": 0.12, + "learning_rate": 1.752514465457652e-07, + "loss": 0.0155, + "step": 6423 + }, + { + "epoch": 0.12, + "learning_rate": 1.7524756320142905e-07, + "loss": 0.0463, + "step": 6424 + }, + { + "epoch": 0.12, + "learning_rate": 1.7524367985709292e-07, + "loss": 0.0089, + "step": 6425 + }, + { + "epoch": 0.12, + "learning_rate": 1.7523979651275677e-07, + "loss": 0.0095, + "step": 6426 + }, + { + "epoch": 0.12, + "learning_rate": 1.7523591316842064e-07, + "loss": 0.0171, + "step": 6427 + }, + { + "epoch": 0.12, + "learning_rate": 1.7523202982408449e-07, + "loss": 0.0118, + "step": 6428 + }, + { + "epoch": 0.12, + "learning_rate": 1.7522814647974836e-07, + "loss": 0.0621, + "step": 6429 + }, + { + "epoch": 0.12, + "learning_rate": 1.752242631354122e-07, + "loss": 0.0135, + "step": 6430 + }, + { + "epoch": 0.12, + "learning_rate": 1.7522037979107607e-07, + "loss": 0.0116, + "step": 6431 + }, + { + "epoch": 0.12, + "learning_rate": 1.7521649644673992e-07, + "loss": 0.0107, + "step": 6432 + }, + { + "epoch": 0.12, + "learning_rate": 1.752126131024038e-07, + "loss": 0.0193, + "step": 6433 + }, + { + "epoch": 0.12, + "learning_rate": 1.7520872975806763e-07, + "loss": 0.0097, + "step": 6434 + }, + { + "epoch": 0.12, + "learning_rate": 1.752048464137315e-07, + "loss": 0.0343, + "step": 6435 + }, + { + "epoch": 0.12, + "learning_rate": 1.7520096306939535e-07, + "loss": 0.5616, + "step": 6436 + }, + { + "epoch": 0.12, + "learning_rate": 1.7519707972505922e-07, + "loss": 0.0302, + "step": 6437 + }, + { + "epoch": 0.12, + "learning_rate": 1.7519319638072307e-07, + "loss": 0.0175, + "step": 6438 + }, + { + "epoch": 0.12, + "learning_rate": 1.7518931303638694e-07, + "loss": 0.0182, + "step": 6439 + }, + { + "epoch": 0.12, + "learning_rate": 1.7518542969205078e-07, + "loss": 0.0191, + "step": 6440 + }, + { + "epoch": 0.12, + "learning_rate": 1.7518154634771466e-07, + "loss": 0.1905, + "step": 6441 + }, + { + "epoch": 0.12, + "learning_rate": 1.751776630033785e-07, + "loss": 0.0098, + "step": 6442 + }, + { + "epoch": 0.12, + "learning_rate": 1.7517377965904237e-07, + "loss": 0.0453, + "step": 6443 + }, + { + "epoch": 0.12, + "learning_rate": 1.7516989631470622e-07, + "loss": 0.0172, + "step": 6444 + }, + { + "epoch": 0.13, + "learning_rate": 1.751660129703701e-07, + "loss": 0.0139, + "step": 6445 + }, + { + "epoch": 0.13, + "learning_rate": 1.7516212962603393e-07, + "loss": 0.2273, + "step": 6446 + }, + { + "epoch": 0.13, + "learning_rate": 1.751582462816978e-07, + "loss": 0.0155, + "step": 6447 + }, + { + "epoch": 0.13, + "learning_rate": 1.7515436293736165e-07, + "loss": 0.3171, + "step": 6448 + }, + { + "epoch": 0.13, + "learning_rate": 1.7515047959302552e-07, + "loss": 0.0136, + "step": 6449 + }, + { + "epoch": 0.13, + "learning_rate": 1.7514659624868937e-07, + "loss": 0.0368, + "step": 6450 + }, + { + "epoch": 0.13, + "learning_rate": 1.7514271290435324e-07, + "loss": 0.0173, + "step": 6451 + }, + { + "epoch": 0.13, + "learning_rate": 1.7513882956001708e-07, + "loss": 0.0155, + "step": 6452 + }, + { + "epoch": 0.13, + "learning_rate": 1.7513494621568095e-07, + "loss": 0.009, + "step": 6453 + }, + { + "epoch": 0.13, + "learning_rate": 1.751310628713448e-07, + "loss": 0.3654, + "step": 6454 + }, + { + "epoch": 0.13, + "learning_rate": 1.7512717952700867e-07, + "loss": 0.0097, + "step": 6455 + }, + { + "epoch": 0.13, + "learning_rate": 1.7512329618267252e-07, + "loss": 0.3692, + "step": 6456 + }, + { + "epoch": 0.13, + "learning_rate": 1.751194128383364e-07, + "loss": 0.1125, + "step": 6457 + }, + { + "epoch": 0.13, + "learning_rate": 1.7511552949400023e-07, + "loss": 0.0116, + "step": 6458 + }, + { + "epoch": 0.13, + "learning_rate": 1.7511164614966408e-07, + "loss": 0.013, + "step": 6459 + }, + { + "epoch": 0.13, + "learning_rate": 1.7510776280532792e-07, + "loss": 0.0205, + "step": 6460 + }, + { + "epoch": 0.13, + "learning_rate": 1.751038794609918e-07, + "loss": 0.0163, + "step": 6461 + }, + { + "epoch": 0.13, + "learning_rate": 1.7509999611665564e-07, + "loss": 0.01, + "step": 6462 + }, + { + "epoch": 0.13, + "learning_rate": 1.750961127723195e-07, + "loss": 0.018, + "step": 6463 + }, + { + "epoch": 0.13, + "learning_rate": 1.7509222942798336e-07, + "loss": 0.0195, + "step": 6464 + }, + { + "epoch": 0.13, + "learning_rate": 1.7508834608364723e-07, + "loss": 0.2023, + "step": 6465 + }, + { + "epoch": 0.13, + "learning_rate": 1.7508446273931107e-07, + "loss": 0.0131, + "step": 6466 + }, + { + "epoch": 0.13, + "learning_rate": 1.7508057939497494e-07, + "loss": 0.0698, + "step": 6467 + }, + { + "epoch": 0.13, + "learning_rate": 1.750766960506388e-07, + "loss": 0.0091, + "step": 6468 + }, + { + "epoch": 0.13, + "learning_rate": 1.7507281270630266e-07, + "loss": 0.0223, + "step": 6469 + }, + { + "epoch": 0.13, + "learning_rate": 1.750689293619665e-07, + "loss": 0.3064, + "step": 6470 + }, + { + "epoch": 0.13, + "learning_rate": 1.7506504601763038e-07, + "loss": 0.0273, + "step": 6471 + }, + { + "epoch": 0.13, + "learning_rate": 1.7506116267329422e-07, + "loss": 0.0847, + "step": 6472 + }, + { + "epoch": 0.13, + "learning_rate": 1.750572793289581e-07, + "loss": 0.0086, + "step": 6473 + }, + { + "epoch": 0.13, + "learning_rate": 1.7505339598462194e-07, + "loss": 0.0264, + "step": 6474 + }, + { + "epoch": 0.13, + "learning_rate": 1.750495126402858e-07, + "loss": 0.0361, + "step": 6475 + }, + { + "epoch": 0.13, + "learning_rate": 1.7504562929594965e-07, + "loss": 0.3567, + "step": 6476 + }, + { + "epoch": 0.13, + "learning_rate": 1.7504174595161353e-07, + "loss": 0.6148, + "step": 6477 + }, + { + "epoch": 0.13, + "learning_rate": 1.7503786260727737e-07, + "loss": 0.2819, + "step": 6478 + }, + { + "epoch": 0.13, + "learning_rate": 1.7503397926294124e-07, + "loss": 0.0108, + "step": 6479 + }, + { + "epoch": 0.13, + "learning_rate": 1.750300959186051e-07, + "loss": 0.0149, + "step": 6480 + }, + { + "epoch": 0.13, + "learning_rate": 1.7502621257426896e-07, + "loss": 0.3468, + "step": 6481 + }, + { + "epoch": 0.13, + "learning_rate": 1.750223292299328e-07, + "loss": 0.0257, + "step": 6482 + }, + { + "epoch": 0.13, + "learning_rate": 1.7501844588559668e-07, + "loss": 0.0153, + "step": 6483 + }, + { + "epoch": 0.13, + "learning_rate": 1.7501456254126052e-07, + "loss": 0.0083, + "step": 6484 + }, + { + "epoch": 0.13, + "learning_rate": 1.750106791969244e-07, + "loss": 0.5078, + "step": 6485 + }, + { + "epoch": 0.13, + "learning_rate": 1.7500679585258824e-07, + "loss": 0.008, + "step": 6486 + }, + { + "epoch": 0.13, + "learning_rate": 1.750029125082521e-07, + "loss": 0.0107, + "step": 6487 + }, + { + "epoch": 0.13, + "learning_rate": 1.7499902916391595e-07, + "loss": 0.0089, + "step": 6488 + }, + { + "epoch": 0.13, + "learning_rate": 1.7499514581957982e-07, + "loss": 0.009, + "step": 6489 + }, + { + "epoch": 0.13, + "learning_rate": 1.7499126247524367e-07, + "loss": 0.2038, + "step": 6490 + }, + { + "epoch": 0.13, + "learning_rate": 1.7498737913090754e-07, + "loss": 0.0334, + "step": 6491 + }, + { + "epoch": 0.13, + "learning_rate": 1.7498349578657139e-07, + "loss": 0.0086, + "step": 6492 + }, + { + "epoch": 0.13, + "learning_rate": 1.7497961244223526e-07, + "loss": 0.0339, + "step": 6493 + }, + { + "epoch": 0.13, + "learning_rate": 1.749757290978991e-07, + "loss": 0.0109, + "step": 6494 + }, + { + "epoch": 0.13, + "learning_rate": 1.7497184575356297e-07, + "loss": 0.0109, + "step": 6495 + }, + { + "epoch": 0.13, + "learning_rate": 1.7496796240922682e-07, + "loss": 0.0087, + "step": 6496 + }, + { + "epoch": 0.13, + "learning_rate": 1.749640790648907e-07, + "loss": 0.0469, + "step": 6497 + }, + { + "epoch": 0.13, + "learning_rate": 1.7496019572055454e-07, + "loss": 0.0083, + "step": 6498 + }, + { + "epoch": 0.13, + "learning_rate": 1.749563123762184e-07, + "loss": 0.0078, + "step": 6499 + }, + { + "epoch": 0.13, + "learning_rate": 1.7495242903188225e-07, + "loss": 0.0134, + "step": 6500 + }, + { + "epoch": 0.13, + "learning_rate": 1.7494854568754612e-07, + "loss": 0.1577, + "step": 6501 + }, + { + "epoch": 0.13, + "learning_rate": 1.7494466234320997e-07, + "loss": 0.0709, + "step": 6502 + }, + { + "epoch": 0.13, + "learning_rate": 1.7494077899887384e-07, + "loss": 0.0133, + "step": 6503 + }, + { + "epoch": 0.13, + "learning_rate": 1.7493689565453769e-07, + "loss": 0.689, + "step": 6504 + }, + { + "epoch": 0.13, + "learning_rate": 1.7493301231020156e-07, + "loss": 0.0116, + "step": 6505 + }, + { + "epoch": 0.13, + "learning_rate": 1.749291289658654e-07, + "loss": 0.0183, + "step": 6506 + }, + { + "epoch": 0.13, + "learning_rate": 1.7492524562152927e-07, + "loss": 0.0214, + "step": 6507 + }, + { + "epoch": 0.13, + "learning_rate": 1.7492136227719312e-07, + "loss": 0.0101, + "step": 6508 + }, + { + "epoch": 0.13, + "learning_rate": 1.74917478932857e-07, + "loss": 0.2196, + "step": 6509 + }, + { + "epoch": 0.13, + "learning_rate": 1.7491359558852083e-07, + "loss": 0.0114, + "step": 6510 + }, + { + "epoch": 0.13, + "learning_rate": 1.7490971224418468e-07, + "loss": 0.0095, + "step": 6511 + }, + { + "epoch": 0.13, + "learning_rate": 1.7490582889984855e-07, + "loss": 0.4677, + "step": 6512 + }, + { + "epoch": 0.13, + "learning_rate": 1.749019455555124e-07, + "loss": 0.0074, + "step": 6513 + }, + { + "epoch": 0.13, + "learning_rate": 1.7489806221117627e-07, + "loss": 0.0087, + "step": 6514 + }, + { + "epoch": 0.13, + "learning_rate": 1.748941788668401e-07, + "loss": 0.0104, + "step": 6515 + }, + { + "epoch": 0.13, + "learning_rate": 1.7489029552250398e-07, + "loss": 0.0122, + "step": 6516 + }, + { + "epoch": 0.13, + "learning_rate": 1.7488641217816783e-07, + "loss": 0.0139, + "step": 6517 + }, + { + "epoch": 0.13, + "learning_rate": 1.7488252883383167e-07, + "loss": 0.174, + "step": 6518 + }, + { + "epoch": 0.13, + "learning_rate": 1.7487864548949555e-07, + "loss": 0.2267, + "step": 6519 + }, + { + "epoch": 0.13, + "learning_rate": 1.748747621451594e-07, + "loss": 0.1158, + "step": 6520 + }, + { + "epoch": 0.13, + "learning_rate": 1.7487087880082326e-07, + "loss": 0.0147, + "step": 6521 + }, + { + "epoch": 0.13, + "learning_rate": 1.748669954564871e-07, + "loss": 0.0114, + "step": 6522 + }, + { + "epoch": 0.13, + "learning_rate": 1.7486311211215098e-07, + "loss": 0.0095, + "step": 6523 + }, + { + "epoch": 0.13, + "learning_rate": 1.7485922876781482e-07, + "loss": 0.5452, + "step": 6524 + }, + { + "epoch": 0.13, + "learning_rate": 1.748553454234787e-07, + "loss": 0.3057, + "step": 6525 + }, + { + "epoch": 0.13, + "learning_rate": 1.7485146207914254e-07, + "loss": 0.013, + "step": 6526 + }, + { + "epoch": 0.13, + "learning_rate": 1.748475787348064e-07, + "loss": 0.0468, + "step": 6527 + }, + { + "epoch": 0.13, + "learning_rate": 1.7484369539047026e-07, + "loss": 0.0417, + "step": 6528 + }, + { + "epoch": 0.13, + "learning_rate": 1.7483981204613413e-07, + "loss": 0.0152, + "step": 6529 + }, + { + "epoch": 0.13, + "learning_rate": 1.7483592870179797e-07, + "loss": 0.0084, + "step": 6530 + }, + { + "epoch": 0.13, + "learning_rate": 1.7483204535746184e-07, + "loss": 0.01, + "step": 6531 + }, + { + "epoch": 0.13, + "learning_rate": 1.748281620131257e-07, + "loss": 0.0078, + "step": 6532 + }, + { + "epoch": 0.13, + "learning_rate": 1.7482427866878956e-07, + "loss": 0.0338, + "step": 6533 + }, + { + "epoch": 0.13, + "learning_rate": 1.748203953244534e-07, + "loss": 0.0341, + "step": 6534 + }, + { + "epoch": 0.13, + "learning_rate": 1.7481651198011728e-07, + "loss": 0.0251, + "step": 6535 + }, + { + "epoch": 0.13, + "learning_rate": 1.7481262863578112e-07, + "loss": 0.013, + "step": 6536 + }, + { + "epoch": 0.13, + "learning_rate": 1.74808745291445e-07, + "loss": 0.0194, + "step": 6537 + }, + { + "epoch": 0.13, + "learning_rate": 1.7480486194710884e-07, + "loss": 0.0216, + "step": 6538 + }, + { + "epoch": 0.13, + "learning_rate": 1.748009786027727e-07, + "loss": 0.0104, + "step": 6539 + }, + { + "epoch": 0.13, + "learning_rate": 1.7479709525843656e-07, + "loss": 0.0126, + "step": 6540 + }, + { + "epoch": 0.13, + "learning_rate": 1.747932119141004e-07, + "loss": 0.0101, + "step": 6541 + }, + { + "epoch": 0.13, + "learning_rate": 1.7478932856976427e-07, + "loss": 0.0087, + "step": 6542 + }, + { + "epoch": 0.13, + "learning_rate": 1.7478544522542812e-07, + "loss": 0.0181, + "step": 6543 + }, + { + "epoch": 0.13, + "learning_rate": 1.74781561881092e-07, + "loss": 0.354, + "step": 6544 + }, + { + "epoch": 0.13, + "learning_rate": 1.7477767853675583e-07, + "loss": 0.0137, + "step": 6545 + }, + { + "epoch": 0.13, + "learning_rate": 1.747737951924197e-07, + "loss": 0.0114, + "step": 6546 + }, + { + "epoch": 0.13, + "learning_rate": 1.7476991184808355e-07, + "loss": 0.459, + "step": 6547 + }, + { + "epoch": 0.13, + "learning_rate": 1.7476602850374742e-07, + "loss": 0.4084, + "step": 6548 + }, + { + "epoch": 0.13, + "learning_rate": 1.7476214515941127e-07, + "loss": 0.0311, + "step": 6549 + }, + { + "epoch": 0.13, + "learning_rate": 1.7475826181507514e-07, + "loss": 0.1637, + "step": 6550 + }, + { + "epoch": 0.13, + "learning_rate": 1.7475437847073898e-07, + "loss": 0.0168, + "step": 6551 + }, + { + "epoch": 0.13, + "learning_rate": 1.7475049512640285e-07, + "loss": 0.9584, + "step": 6552 + }, + { + "epoch": 0.13, + "learning_rate": 1.747466117820667e-07, + "loss": 0.0147, + "step": 6553 + }, + { + "epoch": 0.13, + "learning_rate": 1.7474272843773057e-07, + "loss": 0.6492, + "step": 6554 + }, + { + "epoch": 0.13, + "learning_rate": 1.7473884509339442e-07, + "loss": 0.2539, + "step": 6555 + }, + { + "epoch": 0.13, + "learning_rate": 1.747349617490583e-07, + "loss": 0.0104, + "step": 6556 + }, + { + "epoch": 0.13, + "learning_rate": 1.7473107840472213e-07, + "loss": 0.0582, + "step": 6557 + }, + { + "epoch": 0.13, + "learning_rate": 1.74727195060386e-07, + "loss": 0.8099, + "step": 6558 + }, + { + "epoch": 0.13, + "learning_rate": 1.7472331171604985e-07, + "loss": 0.009, + "step": 6559 + }, + { + "epoch": 0.13, + "learning_rate": 1.7471942837171372e-07, + "loss": 0.3739, + "step": 6560 + }, + { + "epoch": 0.13, + "learning_rate": 1.7471554502737757e-07, + "loss": 0.0085, + "step": 6561 + }, + { + "epoch": 0.13, + "learning_rate": 1.7471166168304144e-07, + "loss": 0.0102, + "step": 6562 + }, + { + "epoch": 0.13, + "learning_rate": 1.7470777833870528e-07, + "loss": 0.0086, + "step": 6563 + }, + { + "epoch": 0.13, + "learning_rate": 1.7470389499436915e-07, + "loss": 0.6558, + "step": 6564 + }, + { + "epoch": 0.13, + "learning_rate": 1.74700011650033e-07, + "loss": 0.0137, + "step": 6565 + }, + { + "epoch": 0.13, + "learning_rate": 1.7469612830569687e-07, + "loss": 0.0261, + "step": 6566 + }, + { + "epoch": 0.13, + "learning_rate": 1.7469224496136071e-07, + "loss": 0.024, + "step": 6567 + }, + { + "epoch": 0.13, + "learning_rate": 1.7468836161702459e-07, + "loss": 0.4033, + "step": 6568 + }, + { + "epoch": 0.13, + "learning_rate": 1.7468447827268843e-07, + "loss": 0.0307, + "step": 6569 + }, + { + "epoch": 0.13, + "learning_rate": 1.746805949283523e-07, + "loss": 0.0092, + "step": 6570 + }, + { + "epoch": 0.13, + "learning_rate": 1.7467671158401615e-07, + "loss": 0.0306, + "step": 6571 + }, + { + "epoch": 0.13, + "learning_rate": 1.7467282823968002e-07, + "loss": 0.013, + "step": 6572 + }, + { + "epoch": 0.13, + "learning_rate": 1.7466894489534386e-07, + "loss": 0.014, + "step": 6573 + }, + { + "epoch": 0.13, + "learning_rate": 1.7466506155100774e-07, + "loss": 0.0084, + "step": 6574 + }, + { + "epoch": 0.13, + "learning_rate": 1.7466117820667155e-07, + "loss": 0.0118, + "step": 6575 + }, + { + "epoch": 0.13, + "learning_rate": 1.7465729486233543e-07, + "loss": 0.0152, + "step": 6576 + }, + { + "epoch": 0.13, + "learning_rate": 1.7465341151799927e-07, + "loss": 0.107, + "step": 6577 + }, + { + "epoch": 0.13, + "learning_rate": 1.7464952817366314e-07, + "loss": 0.0124, + "step": 6578 + }, + { + "epoch": 0.13, + "learning_rate": 1.74645644829327e-07, + "loss": 0.0624, + "step": 6579 + }, + { + "epoch": 0.13, + "learning_rate": 1.7464176148499086e-07, + "loss": 0.189, + "step": 6580 + }, + { + "epoch": 0.13, + "learning_rate": 1.746378781406547e-07, + "loss": 0.013, + "step": 6581 + }, + { + "epoch": 0.13, + "learning_rate": 1.7463399479631858e-07, + "loss": 0.0083, + "step": 6582 + }, + { + "epoch": 0.13, + "learning_rate": 1.7463011145198242e-07, + "loss": 0.016, + "step": 6583 + }, + { + "epoch": 0.13, + "learning_rate": 1.746262281076463e-07, + "loss": 0.0311, + "step": 6584 + }, + { + "epoch": 0.13, + "learning_rate": 1.7462234476331014e-07, + "loss": 0.0167, + "step": 6585 + }, + { + "epoch": 0.13, + "learning_rate": 1.74618461418974e-07, + "loss": 0.0103, + "step": 6586 + }, + { + "epoch": 0.13, + "learning_rate": 1.7461457807463785e-07, + "loss": 0.1736, + "step": 6587 + }, + { + "epoch": 0.13, + "learning_rate": 1.7461069473030172e-07, + "loss": 0.1922, + "step": 6588 + }, + { + "epoch": 0.13, + "learning_rate": 1.7460681138596557e-07, + "loss": 0.0079, + "step": 6589 + }, + { + "epoch": 0.13, + "learning_rate": 1.7460292804162944e-07, + "loss": 0.0208, + "step": 6590 + }, + { + "epoch": 0.13, + "learning_rate": 1.7459904469729329e-07, + "loss": 0.0095, + "step": 6591 + }, + { + "epoch": 0.13, + "learning_rate": 1.7459516135295716e-07, + "loss": 0.1006, + "step": 6592 + }, + { + "epoch": 0.13, + "learning_rate": 1.74591278008621e-07, + "loss": 0.0088, + "step": 6593 + }, + { + "epoch": 0.13, + "learning_rate": 1.7458739466428487e-07, + "loss": 0.0169, + "step": 6594 + }, + { + "epoch": 0.13, + "learning_rate": 1.7458351131994872e-07, + "loss": 0.386, + "step": 6595 + }, + { + "epoch": 0.13, + "learning_rate": 1.745796279756126e-07, + "loss": 0.0112, + "step": 6596 + }, + { + "epoch": 0.13, + "learning_rate": 1.7457574463127644e-07, + "loss": 0.0285, + "step": 6597 + }, + { + "epoch": 0.13, + "learning_rate": 1.745718612869403e-07, + "loss": 0.1305, + "step": 6598 + }, + { + "epoch": 0.13, + "learning_rate": 1.7456797794260415e-07, + "loss": 0.0115, + "step": 6599 + }, + { + "epoch": 0.13, + "learning_rate": 1.7456409459826802e-07, + "loss": 0.013, + "step": 6600 + }, + { + "epoch": 0.13, + "learning_rate": 1.7456021125393187e-07, + "loss": 0.0105, + "step": 6601 + }, + { + "epoch": 0.13, + "learning_rate": 1.7455632790959574e-07, + "loss": 0.0087, + "step": 6602 + }, + { + "epoch": 0.13, + "learning_rate": 1.7455244456525959e-07, + "loss": 0.012, + "step": 6603 + }, + { + "epoch": 0.13, + "learning_rate": 1.7454856122092346e-07, + "loss": 0.503, + "step": 6604 + }, + { + "epoch": 0.13, + "learning_rate": 1.745446778765873e-07, + "loss": 0.0089, + "step": 6605 + }, + { + "epoch": 0.13, + "learning_rate": 1.7454079453225117e-07, + "loss": 0.4335, + "step": 6606 + }, + { + "epoch": 0.13, + "learning_rate": 1.7453691118791502e-07, + "loss": 0.0727, + "step": 6607 + }, + { + "epoch": 0.13, + "learning_rate": 1.745330278435789e-07, + "loss": 0.0076, + "step": 6608 + }, + { + "epoch": 0.13, + "learning_rate": 1.7452914449924273e-07, + "loss": 0.358, + "step": 6609 + }, + { + "epoch": 0.13, + "learning_rate": 1.745252611549066e-07, + "loss": 0.0096, + "step": 6610 + }, + { + "epoch": 0.13, + "learning_rate": 1.7452137781057045e-07, + "loss": 0.0145, + "step": 6611 + }, + { + "epoch": 0.13, + "learning_rate": 1.7451749446623432e-07, + "loss": 0.011, + "step": 6612 + }, + { + "epoch": 0.13, + "learning_rate": 1.7451361112189817e-07, + "loss": 0.3889, + "step": 6613 + }, + { + "epoch": 0.13, + "learning_rate": 1.7450972777756204e-07, + "loss": 0.021, + "step": 6614 + }, + { + "epoch": 0.13, + "learning_rate": 1.7450584443322588e-07, + "loss": 0.0074, + "step": 6615 + }, + { + "epoch": 0.13, + "learning_rate": 1.7450196108888976e-07, + "loss": 0.66, + "step": 6616 + }, + { + "epoch": 0.13, + "learning_rate": 1.744980777445536e-07, + "loss": 0.0751, + "step": 6617 + }, + { + "epoch": 0.13, + "learning_rate": 1.7449419440021747e-07, + "loss": 0.0116, + "step": 6618 + }, + { + "epoch": 0.13, + "learning_rate": 1.7449031105588132e-07, + "loss": 0.0107, + "step": 6619 + }, + { + "epoch": 0.13, + "learning_rate": 1.744864277115452e-07, + "loss": 0.0148, + "step": 6620 + }, + { + "epoch": 0.13, + "learning_rate": 1.7448254436720903e-07, + "loss": 0.0091, + "step": 6621 + }, + { + "epoch": 0.13, + "learning_rate": 1.744786610228729e-07, + "loss": 0.0081, + "step": 6622 + }, + { + "epoch": 0.13, + "learning_rate": 1.7447477767853675e-07, + "loss": 0.2976, + "step": 6623 + }, + { + "epoch": 0.13, + "learning_rate": 1.7447089433420062e-07, + "loss": 0.0113, + "step": 6624 + }, + { + "epoch": 0.13, + "learning_rate": 1.7446701098986447e-07, + "loss": 0.4381, + "step": 6625 + }, + { + "epoch": 0.13, + "learning_rate": 1.7446312764552834e-07, + "loss": 0.0151, + "step": 6626 + }, + { + "epoch": 0.13, + "learning_rate": 1.7445924430119218e-07, + "loss": 0.0412, + "step": 6627 + }, + { + "epoch": 0.13, + "learning_rate": 1.7445536095685605e-07, + "loss": 0.1345, + "step": 6628 + }, + { + "epoch": 0.13, + "learning_rate": 1.744514776125199e-07, + "loss": 0.0475, + "step": 6629 + }, + { + "epoch": 0.13, + "learning_rate": 1.7444759426818377e-07, + "loss": 0.0957, + "step": 6630 + }, + { + "epoch": 0.13, + "learning_rate": 1.7444371092384762e-07, + "loss": 0.0127, + "step": 6631 + }, + { + "epoch": 0.13, + "learning_rate": 1.744398275795115e-07, + "loss": 0.008, + "step": 6632 + }, + { + "epoch": 0.13, + "learning_rate": 1.744359442351753e-07, + "loss": 0.0178, + "step": 6633 + }, + { + "epoch": 0.13, + "learning_rate": 1.7443206089083918e-07, + "loss": 0.0076, + "step": 6634 + }, + { + "epoch": 0.13, + "learning_rate": 1.7442817754650302e-07, + "loss": 0.0109, + "step": 6635 + }, + { + "epoch": 0.13, + "learning_rate": 1.744242942021669e-07, + "loss": 0.0116, + "step": 6636 + }, + { + "epoch": 0.13, + "learning_rate": 1.7442041085783074e-07, + "loss": 0.0092, + "step": 6637 + }, + { + "epoch": 0.13, + "learning_rate": 1.744165275134946e-07, + "loss": 0.0091, + "step": 6638 + }, + { + "epoch": 0.13, + "learning_rate": 1.7441264416915846e-07, + "loss": 0.0584, + "step": 6639 + }, + { + "epoch": 0.13, + "learning_rate": 1.7440876082482233e-07, + "loss": 0.0076, + "step": 6640 + }, + { + "epoch": 0.13, + "learning_rate": 1.7440487748048617e-07, + "loss": 0.0191, + "step": 6641 + }, + { + "epoch": 0.13, + "learning_rate": 1.7440099413615004e-07, + "loss": 0.0357, + "step": 6642 + }, + { + "epoch": 0.13, + "learning_rate": 1.743971107918139e-07, + "loss": 0.0103, + "step": 6643 + }, + { + "epoch": 0.13, + "learning_rate": 1.7439322744747776e-07, + "loss": 0.0118, + "step": 6644 + }, + { + "epoch": 0.13, + "learning_rate": 1.743893441031416e-07, + "loss": 0.551, + "step": 6645 + }, + { + "epoch": 0.13, + "learning_rate": 1.7438546075880548e-07, + "loss": 0.2221, + "step": 6646 + }, + { + "epoch": 0.13, + "learning_rate": 1.7438157741446932e-07, + "loss": 0.0391, + "step": 6647 + }, + { + "epoch": 0.13, + "learning_rate": 1.743776940701332e-07, + "loss": 0.0112, + "step": 6648 + }, + { + "epoch": 0.13, + "learning_rate": 1.7437381072579704e-07, + "loss": 0.01, + "step": 6649 + }, + { + "epoch": 0.13, + "learning_rate": 1.743699273814609e-07, + "loss": 0.3859, + "step": 6650 + }, + { + "epoch": 0.13, + "learning_rate": 1.7436604403712475e-07, + "loss": 0.0225, + "step": 6651 + }, + { + "epoch": 0.13, + "learning_rate": 1.7436216069278863e-07, + "loss": 0.2589, + "step": 6652 + }, + { + "epoch": 0.13, + "learning_rate": 1.7435827734845247e-07, + "loss": 0.0151, + "step": 6653 + }, + { + "epoch": 0.13, + "learning_rate": 1.7435439400411634e-07, + "loss": 0.0096, + "step": 6654 + }, + { + "epoch": 0.13, + "learning_rate": 1.743505106597802e-07, + "loss": 0.0102, + "step": 6655 + }, + { + "epoch": 0.13, + "learning_rate": 1.7434662731544406e-07, + "loss": 0.0115, + "step": 6656 + }, + { + "epoch": 0.13, + "learning_rate": 1.743427439711079e-07, + "loss": 0.0136, + "step": 6657 + }, + { + "epoch": 0.13, + "learning_rate": 1.7433886062677178e-07, + "loss": 0.0074, + "step": 6658 + }, + { + "epoch": 0.13, + "learning_rate": 1.7433497728243562e-07, + "loss": 0.0093, + "step": 6659 + }, + { + "epoch": 0.13, + "learning_rate": 1.743310939380995e-07, + "loss": 0.0105, + "step": 6660 + }, + { + "epoch": 0.13, + "learning_rate": 1.7432721059376334e-07, + "loss": 0.0229, + "step": 6661 + }, + { + "epoch": 0.13, + "learning_rate": 1.743233272494272e-07, + "loss": 0.009, + "step": 6662 + }, + { + "epoch": 0.13, + "learning_rate": 1.7431944390509105e-07, + "loss": 0.0081, + "step": 6663 + }, + { + "epoch": 0.13, + "learning_rate": 1.7431556056075492e-07, + "loss": 0.0086, + "step": 6664 + }, + { + "epoch": 0.13, + "learning_rate": 1.7431167721641877e-07, + "loss": 0.0229, + "step": 6665 + }, + { + "epoch": 0.13, + "learning_rate": 1.7430779387208264e-07, + "loss": 0.0124, + "step": 6666 + }, + { + "epoch": 0.13, + "learning_rate": 1.7430391052774649e-07, + "loss": 0.0181, + "step": 6667 + }, + { + "epoch": 0.13, + "learning_rate": 1.7430002718341036e-07, + "loss": 0.2136, + "step": 6668 + }, + { + "epoch": 0.13, + "learning_rate": 1.742961438390742e-07, + "loss": 0.0096, + "step": 6669 + }, + { + "epoch": 0.13, + "learning_rate": 1.7429226049473807e-07, + "loss": 0.0123, + "step": 6670 + }, + { + "epoch": 0.13, + "learning_rate": 1.7428837715040192e-07, + "loss": 0.0346, + "step": 6671 + }, + { + "epoch": 0.13, + "learning_rate": 1.742844938060658e-07, + "loss": 0.0205, + "step": 6672 + }, + { + "epoch": 0.13, + "learning_rate": 1.7428061046172964e-07, + "loss": 0.0077, + "step": 6673 + }, + { + "epoch": 0.13, + "learning_rate": 1.742767271173935e-07, + "loss": 0.007, + "step": 6674 + }, + { + "epoch": 0.13, + "learning_rate": 1.7427284377305735e-07, + "loss": 0.0115, + "step": 6675 + }, + { + "epoch": 0.13, + "learning_rate": 1.7426896042872122e-07, + "loss": 0.6768, + "step": 6676 + }, + { + "epoch": 0.13, + "learning_rate": 1.7426507708438507e-07, + "loss": 0.0148, + "step": 6677 + }, + { + "epoch": 0.13, + "learning_rate": 1.7426119374004894e-07, + "loss": 0.238, + "step": 6678 + }, + { + "epoch": 0.13, + "learning_rate": 1.7425731039571279e-07, + "loss": 0.7843, + "step": 6679 + }, + { + "epoch": 0.13, + "learning_rate": 1.7425342705137666e-07, + "loss": 0.0122, + "step": 6680 + }, + { + "epoch": 0.13, + "learning_rate": 1.742495437070405e-07, + "loss": 0.0153, + "step": 6681 + }, + { + "epoch": 0.13, + "learning_rate": 1.7424566036270437e-07, + "loss": 0.0085, + "step": 6682 + }, + { + "epoch": 0.13, + "learning_rate": 1.7424177701836822e-07, + "loss": 0.0788, + "step": 6683 + }, + { + "epoch": 0.13, + "learning_rate": 1.742378936740321e-07, + "loss": 0.376, + "step": 6684 + }, + { + "epoch": 0.13, + "learning_rate": 1.7423401032969593e-07, + "loss": 0.1975, + "step": 6685 + }, + { + "epoch": 0.13, + "learning_rate": 1.742301269853598e-07, + "loss": 0.0085, + "step": 6686 + }, + { + "epoch": 0.13, + "learning_rate": 1.7422624364102365e-07, + "loss": 0.0171, + "step": 6687 + }, + { + "epoch": 0.13, + "learning_rate": 1.742223602966875e-07, + "loss": 0.0272, + "step": 6688 + }, + { + "epoch": 0.13, + "learning_rate": 1.7421847695235137e-07, + "loss": 0.0123, + "step": 6689 + }, + { + "epoch": 0.13, + "learning_rate": 1.742145936080152e-07, + "loss": 0.0094, + "step": 6690 + }, + { + "epoch": 0.13, + "learning_rate": 1.7421071026367906e-07, + "loss": 0.0085, + "step": 6691 + }, + { + "epoch": 0.13, + "learning_rate": 1.7420682691934293e-07, + "loss": 0.0442, + "step": 6692 + }, + { + "epoch": 0.13, + "learning_rate": 1.7420294357500677e-07, + "loss": 0.0368, + "step": 6693 + }, + { + "epoch": 0.13, + "learning_rate": 1.7419906023067065e-07, + "loss": 0.009, + "step": 6694 + }, + { + "epoch": 0.13, + "learning_rate": 1.741951768863345e-07, + "loss": 0.0087, + "step": 6695 + }, + { + "epoch": 0.13, + "learning_rate": 1.7419129354199836e-07, + "loss": 0.0113, + "step": 6696 + }, + { + "epoch": 0.13, + "learning_rate": 1.741874101976622e-07, + "loss": 0.6524, + "step": 6697 + }, + { + "epoch": 0.13, + "learning_rate": 1.7418352685332608e-07, + "loss": 0.6469, + "step": 6698 + }, + { + "epoch": 0.13, + "learning_rate": 1.7417964350898992e-07, + "loss": 0.0655, + "step": 6699 + }, + { + "epoch": 0.13, + "learning_rate": 1.741757601646538e-07, + "loss": 0.1273, + "step": 6700 + }, + { + "epoch": 0.13, + "learning_rate": 1.7417187682031764e-07, + "loss": 0.0074, + "step": 6701 + }, + { + "epoch": 0.13, + "learning_rate": 1.741679934759815e-07, + "loss": 0.0083, + "step": 6702 + }, + { + "epoch": 0.13, + "learning_rate": 1.7416411013164536e-07, + "loss": 0.712, + "step": 6703 + }, + { + "epoch": 0.13, + "learning_rate": 1.7416022678730923e-07, + "loss": 0.1781, + "step": 6704 + }, + { + "epoch": 0.13, + "learning_rate": 1.7415634344297307e-07, + "loss": 0.0097, + "step": 6705 + }, + { + "epoch": 0.13, + "learning_rate": 1.7415246009863694e-07, + "loss": 0.0097, + "step": 6706 + }, + { + "epoch": 0.13, + "learning_rate": 1.741485767543008e-07, + "loss": 0.0149, + "step": 6707 + }, + { + "epoch": 0.13, + "learning_rate": 1.7414469340996466e-07, + "loss": 0.0071, + "step": 6708 + }, + { + "epoch": 0.13, + "learning_rate": 1.741408100656285e-07, + "loss": 0.0119, + "step": 6709 + }, + { + "epoch": 0.13, + "learning_rate": 1.7413692672129238e-07, + "loss": 0.0617, + "step": 6710 + }, + { + "epoch": 0.13, + "learning_rate": 1.7413304337695622e-07, + "loss": 0.8743, + "step": 6711 + }, + { + "epoch": 0.13, + "learning_rate": 1.741291600326201e-07, + "loss": 0.9823, + "step": 6712 + }, + { + "epoch": 0.13, + "learning_rate": 1.7412527668828394e-07, + "loss": 0.1373, + "step": 6713 + }, + { + "epoch": 0.13, + "learning_rate": 1.741213933439478e-07, + "loss": 0.0111, + "step": 6714 + }, + { + "epoch": 0.13, + "learning_rate": 1.7411750999961166e-07, + "loss": 0.032, + "step": 6715 + }, + { + "epoch": 0.13, + "learning_rate": 1.7411362665527553e-07, + "loss": 0.1189, + "step": 6716 + }, + { + "epoch": 0.13, + "learning_rate": 1.7410974331093937e-07, + "loss": 0.0074, + "step": 6717 + }, + { + "epoch": 0.13, + "learning_rate": 1.7410585996660322e-07, + "loss": 0.0083, + "step": 6718 + }, + { + "epoch": 0.13, + "learning_rate": 1.741019766222671e-07, + "loss": 0.0089, + "step": 6719 + }, + { + "epoch": 0.13, + "learning_rate": 1.7409809327793093e-07, + "loss": 0.0134, + "step": 6720 + }, + { + "epoch": 0.13, + "learning_rate": 1.740942099335948e-07, + "loss": 0.7335, + "step": 6721 + }, + { + "epoch": 0.13, + "learning_rate": 1.7409032658925865e-07, + "loss": 0.0088, + "step": 6722 + }, + { + "epoch": 0.13, + "learning_rate": 1.7408644324492252e-07, + "loss": 0.0095, + "step": 6723 + }, + { + "epoch": 0.13, + "learning_rate": 1.7408255990058637e-07, + "loss": 0.0161, + "step": 6724 + }, + { + "epoch": 0.13, + "learning_rate": 1.7407867655625024e-07, + "loss": 0.0386, + "step": 6725 + }, + { + "epoch": 0.13, + "learning_rate": 1.7407479321191408e-07, + "loss": 0.2399, + "step": 6726 + }, + { + "epoch": 0.13, + "learning_rate": 1.7407090986757795e-07, + "loss": 0.0089, + "step": 6727 + }, + { + "epoch": 0.13, + "learning_rate": 1.740670265232418e-07, + "loss": 0.5411, + "step": 6728 + }, + { + "epoch": 0.13, + "learning_rate": 1.7406314317890567e-07, + "loss": 0.0102, + "step": 6729 + }, + { + "epoch": 0.13, + "learning_rate": 1.7405925983456952e-07, + "loss": 0.0102, + "step": 6730 + }, + { + "epoch": 0.13, + "learning_rate": 1.740553764902334e-07, + "loss": 0.0377, + "step": 6731 + }, + { + "epoch": 0.13, + "learning_rate": 1.7405149314589723e-07, + "loss": 0.0978, + "step": 6732 + }, + { + "epoch": 0.13, + "learning_rate": 1.740476098015611e-07, + "loss": 0.0147, + "step": 6733 + }, + { + "epoch": 0.13, + "learning_rate": 1.7404372645722495e-07, + "loss": 0.4684, + "step": 6734 + }, + { + "epoch": 0.13, + "learning_rate": 1.7403984311288882e-07, + "loss": 0.8423, + "step": 6735 + }, + { + "epoch": 0.13, + "learning_rate": 1.7403595976855267e-07, + "loss": 0.0115, + "step": 6736 + }, + { + "epoch": 0.13, + "learning_rate": 1.7403207642421654e-07, + "loss": 0.4012, + "step": 6737 + }, + { + "epoch": 0.13, + "learning_rate": 1.7402819307988038e-07, + "loss": 0.0106, + "step": 6738 + }, + { + "epoch": 0.13, + "learning_rate": 1.7402430973554425e-07, + "loss": 0.0132, + "step": 6739 + }, + { + "epoch": 0.13, + "learning_rate": 1.740204263912081e-07, + "loss": 0.0123, + "step": 6740 + }, + { + "epoch": 0.13, + "learning_rate": 1.7401654304687197e-07, + "loss": 0.0084, + "step": 6741 + }, + { + "epoch": 0.13, + "learning_rate": 1.7401265970253582e-07, + "loss": 0.0096, + "step": 6742 + }, + { + "epoch": 0.13, + "learning_rate": 1.7400877635819969e-07, + "loss": 0.0214, + "step": 6743 + }, + { + "epoch": 0.13, + "learning_rate": 1.7400489301386353e-07, + "loss": 0.0095, + "step": 6744 + }, + { + "epoch": 0.13, + "learning_rate": 1.740010096695274e-07, + "loss": 0.0076, + "step": 6745 + }, + { + "epoch": 0.13, + "learning_rate": 1.7399712632519125e-07, + "loss": 0.0092, + "step": 6746 + }, + { + "epoch": 0.13, + "learning_rate": 1.7399324298085512e-07, + "loss": 0.0202, + "step": 6747 + }, + { + "epoch": 0.13, + "learning_rate": 1.7398935963651896e-07, + "loss": 0.7379, + "step": 6748 + }, + { + "epoch": 0.13, + "learning_rate": 1.739854762921828e-07, + "loss": 0.0161, + "step": 6749 + }, + { + "epoch": 0.13, + "learning_rate": 1.7398159294784665e-07, + "loss": 0.014, + "step": 6750 + }, + { + "epoch": 0.13, + "learning_rate": 1.7397770960351053e-07, + "loss": 0.01, + "step": 6751 + }, + { + "epoch": 0.13, + "learning_rate": 1.7397382625917437e-07, + "loss": 0.0106, + "step": 6752 + }, + { + "epoch": 0.13, + "learning_rate": 1.7396994291483824e-07, + "loss": 0.9766, + "step": 6753 + }, + { + "epoch": 0.13, + "learning_rate": 1.739660595705021e-07, + "loss": 0.5556, + "step": 6754 + }, + { + "epoch": 0.13, + "learning_rate": 1.7396217622616596e-07, + "loss": 0.0099, + "step": 6755 + }, + { + "epoch": 0.13, + "learning_rate": 1.739582928818298e-07, + "loss": 0.0086, + "step": 6756 + }, + { + "epoch": 0.13, + "learning_rate": 1.7395440953749368e-07, + "loss": 0.0285, + "step": 6757 + }, + { + "epoch": 0.13, + "learning_rate": 1.7395052619315752e-07, + "loss": 0.0116, + "step": 6758 + }, + { + "epoch": 0.13, + "learning_rate": 1.739466428488214e-07, + "loss": 0.0118, + "step": 6759 + }, + { + "epoch": 0.13, + "learning_rate": 1.7394275950448524e-07, + "loss": 0.0112, + "step": 6760 + }, + { + "epoch": 0.13, + "learning_rate": 1.739388761601491e-07, + "loss": 0.0345, + "step": 6761 + }, + { + "epoch": 0.13, + "learning_rate": 1.7393499281581295e-07, + "loss": 0.0104, + "step": 6762 + }, + { + "epoch": 0.13, + "learning_rate": 1.7393110947147682e-07, + "loss": 0.0076, + "step": 6763 + }, + { + "epoch": 0.13, + "learning_rate": 1.7392722612714067e-07, + "loss": 0.0165, + "step": 6764 + }, + { + "epoch": 0.13, + "learning_rate": 1.7392334278280454e-07, + "loss": 0.0308, + "step": 6765 + }, + { + "epoch": 0.13, + "learning_rate": 1.7391945943846839e-07, + "loss": 0.0191, + "step": 6766 + }, + { + "epoch": 0.13, + "learning_rate": 1.7391557609413226e-07, + "loss": 0.3519, + "step": 6767 + }, + { + "epoch": 0.13, + "learning_rate": 1.739116927497961e-07, + "loss": 0.0202, + "step": 6768 + }, + { + "epoch": 0.13, + "learning_rate": 1.7390780940545997e-07, + "loss": 0.0126, + "step": 6769 + }, + { + "epoch": 0.13, + "learning_rate": 1.7390392606112382e-07, + "loss": 0.0222, + "step": 6770 + }, + { + "epoch": 0.13, + "learning_rate": 1.739000427167877e-07, + "loss": 0.3231, + "step": 6771 + }, + { + "epoch": 0.13, + "learning_rate": 1.7389615937245154e-07, + "loss": 0.2726, + "step": 6772 + }, + { + "epoch": 0.13, + "learning_rate": 1.738922760281154e-07, + "loss": 0.0084, + "step": 6773 + }, + { + "epoch": 0.13, + "learning_rate": 1.7388839268377925e-07, + "loss": 0.0105, + "step": 6774 + }, + { + "epoch": 0.13, + "learning_rate": 1.7388450933944312e-07, + "loss": 0.0375, + "step": 6775 + }, + { + "epoch": 0.13, + "learning_rate": 1.7388062599510697e-07, + "loss": 0.0817, + "step": 6776 + }, + { + "epoch": 0.13, + "learning_rate": 1.7387674265077084e-07, + "loss": 0.0096, + "step": 6777 + }, + { + "epoch": 0.13, + "learning_rate": 1.7387285930643469e-07, + "loss": 0.0105, + "step": 6778 + }, + { + "epoch": 0.13, + "learning_rate": 1.7386897596209856e-07, + "loss": 0.0089, + "step": 6779 + }, + { + "epoch": 0.13, + "learning_rate": 1.738650926177624e-07, + "loss": 0.0083, + "step": 6780 + }, + { + "epoch": 0.13, + "learning_rate": 1.7386120927342627e-07, + "loss": 0.0092, + "step": 6781 + }, + { + "epoch": 0.13, + "learning_rate": 1.7385732592909012e-07, + "loss": 0.2207, + "step": 6782 + }, + { + "epoch": 0.13, + "learning_rate": 1.73853442584754e-07, + "loss": 0.0093, + "step": 6783 + }, + { + "epoch": 0.13, + "learning_rate": 1.7384955924041783e-07, + "loss": 0.0399, + "step": 6784 + }, + { + "epoch": 0.13, + "learning_rate": 1.738456758960817e-07, + "loss": 0.0074, + "step": 6785 + }, + { + "epoch": 0.13, + "learning_rate": 1.7384179255174555e-07, + "loss": 0.0077, + "step": 6786 + }, + { + "epoch": 0.13, + "learning_rate": 1.7383790920740942e-07, + "loss": 0.3671, + "step": 6787 + }, + { + "epoch": 0.13, + "learning_rate": 1.7383402586307327e-07, + "loss": 0.7469, + "step": 6788 + }, + { + "epoch": 0.13, + "learning_rate": 1.7383014251873714e-07, + "loss": 0.0098, + "step": 6789 + }, + { + "epoch": 0.13, + "learning_rate": 1.7382625917440098e-07, + "loss": 0.0107, + "step": 6790 + }, + { + "epoch": 0.13, + "learning_rate": 1.7382237583006486e-07, + "loss": 0.007, + "step": 6791 + }, + { + "epoch": 0.13, + "learning_rate": 1.738184924857287e-07, + "loss": 0.009, + "step": 6792 + }, + { + "epoch": 0.13, + "learning_rate": 1.7381460914139257e-07, + "loss": 0.0215, + "step": 6793 + }, + { + "epoch": 0.13, + "learning_rate": 1.7381072579705642e-07, + "loss": 0.0658, + "step": 6794 + }, + { + "epoch": 0.13, + "learning_rate": 1.738068424527203e-07, + "loss": 0.0089, + "step": 6795 + }, + { + "epoch": 0.13, + "learning_rate": 1.7380295910838413e-07, + "loss": 0.0094, + "step": 6796 + }, + { + "epoch": 0.13, + "learning_rate": 1.73799075764048e-07, + "loss": 0.0096, + "step": 6797 + }, + { + "epoch": 0.13, + "learning_rate": 1.7379519241971185e-07, + "loss": 0.413, + "step": 6798 + }, + { + "epoch": 0.13, + "learning_rate": 1.7379130907537572e-07, + "loss": 0.0079, + "step": 6799 + }, + { + "epoch": 0.13, + "learning_rate": 1.7378742573103957e-07, + "loss": 0.0078, + "step": 6800 + }, + { + "epoch": 0.13, + "learning_rate": 1.7378354238670344e-07, + "loss": 0.011, + "step": 6801 + }, + { + "epoch": 0.13, + "learning_rate": 1.7377965904236728e-07, + "loss": 0.0096, + "step": 6802 + }, + { + "epoch": 0.13, + "learning_rate": 1.7377577569803115e-07, + "loss": 0.0074, + "step": 6803 + }, + { + "epoch": 0.13, + "learning_rate": 1.73771892353695e-07, + "loss": 0.0184, + "step": 6804 + }, + { + "epoch": 0.13, + "learning_rate": 1.7376800900935887e-07, + "loss": 0.0136, + "step": 6805 + }, + { + "epoch": 0.13, + "learning_rate": 1.7376412566502272e-07, + "loss": 0.0164, + "step": 6806 + }, + { + "epoch": 0.13, + "learning_rate": 1.7376024232068656e-07, + "loss": 0.0133, + "step": 6807 + }, + { + "epoch": 0.13, + "learning_rate": 1.737563589763504e-07, + "loss": 0.047, + "step": 6808 + }, + { + "epoch": 0.13, + "learning_rate": 1.7375247563201428e-07, + "loss": 0.0121, + "step": 6809 + }, + { + "epoch": 0.13, + "learning_rate": 1.7374859228767812e-07, + "loss": 0.0122, + "step": 6810 + }, + { + "epoch": 0.13, + "learning_rate": 1.73744708943342e-07, + "loss": 0.0093, + "step": 6811 + }, + { + "epoch": 0.13, + "learning_rate": 1.7374082559900584e-07, + "loss": 0.0107, + "step": 6812 + }, + { + "epoch": 0.13, + "learning_rate": 1.737369422546697e-07, + "loss": 0.0195, + "step": 6813 + }, + { + "epoch": 0.13, + "learning_rate": 1.7373305891033356e-07, + "loss": 0.0079, + "step": 6814 + }, + { + "epoch": 0.13, + "learning_rate": 1.7372917556599743e-07, + "loss": 0.0284, + "step": 6815 + }, + { + "epoch": 0.13, + "learning_rate": 1.7372529222166127e-07, + "loss": 0.0078, + "step": 6816 + }, + { + "epoch": 0.13, + "learning_rate": 1.7372140887732514e-07, + "loss": 0.5195, + "step": 6817 + }, + { + "epoch": 0.13, + "learning_rate": 1.73717525532989e-07, + "loss": 0.0092, + "step": 6818 + }, + { + "epoch": 0.13, + "learning_rate": 1.7371364218865286e-07, + "loss": 0.1044, + "step": 6819 + }, + { + "epoch": 0.13, + "learning_rate": 1.737097588443167e-07, + "loss": 0.0148, + "step": 6820 + }, + { + "epoch": 0.13, + "learning_rate": 1.7370587549998058e-07, + "loss": 0.5377, + "step": 6821 + }, + { + "epoch": 0.13, + "learning_rate": 1.7370199215564442e-07, + "loss": 0.0119, + "step": 6822 + }, + { + "epoch": 0.13, + "learning_rate": 1.736981088113083e-07, + "loss": 0.4442, + "step": 6823 + }, + { + "epoch": 0.13, + "learning_rate": 1.7369422546697214e-07, + "loss": 0.0129, + "step": 6824 + }, + { + "epoch": 0.13, + "learning_rate": 1.73690342122636e-07, + "loss": 0.0808, + "step": 6825 + }, + { + "epoch": 0.13, + "learning_rate": 1.7368645877829985e-07, + "loss": 0.0094, + "step": 6826 + }, + { + "epoch": 0.13, + "learning_rate": 1.7368257543396373e-07, + "loss": 0.7581, + "step": 6827 + }, + { + "epoch": 0.13, + "learning_rate": 1.7367869208962757e-07, + "loss": 0.0086, + "step": 6828 + }, + { + "epoch": 0.13, + "learning_rate": 1.7367480874529144e-07, + "loss": 0.0098, + "step": 6829 + }, + { + "epoch": 0.13, + "learning_rate": 1.736709254009553e-07, + "loss": 0.024, + "step": 6830 + }, + { + "epoch": 0.13, + "learning_rate": 1.7366704205661916e-07, + "loss": 0.0081, + "step": 6831 + }, + { + "epoch": 0.13, + "learning_rate": 1.73663158712283e-07, + "loss": 0.0087, + "step": 6832 + }, + { + "epoch": 0.13, + "learning_rate": 1.7365927536794688e-07, + "loss": 0.5308, + "step": 6833 + }, + { + "epoch": 0.13, + "learning_rate": 1.7365539202361072e-07, + "loss": 0.0128, + "step": 6834 + }, + { + "epoch": 0.13, + "learning_rate": 1.736515086792746e-07, + "loss": 0.069, + "step": 6835 + }, + { + "epoch": 0.13, + "learning_rate": 1.7364762533493844e-07, + "loss": 0.0082, + "step": 6836 + }, + { + "epoch": 0.13, + "learning_rate": 1.736437419906023e-07, + "loss": 0.0175, + "step": 6837 + }, + { + "epoch": 0.13, + "learning_rate": 1.7363985864626615e-07, + "loss": 0.0123, + "step": 6838 + }, + { + "epoch": 0.13, + "learning_rate": 1.7363597530193003e-07, + "loss": 0.0084, + "step": 6839 + }, + { + "epoch": 0.13, + "learning_rate": 1.7363209195759387e-07, + "loss": 0.0078, + "step": 6840 + }, + { + "epoch": 0.13, + "learning_rate": 1.7362820861325774e-07, + "loss": 0.0087, + "step": 6841 + }, + { + "epoch": 0.13, + "learning_rate": 1.7362432526892159e-07, + "loss": 0.0269, + "step": 6842 + }, + { + "epoch": 0.13, + "learning_rate": 1.7362044192458546e-07, + "loss": 0.0094, + "step": 6843 + }, + { + "epoch": 0.13, + "learning_rate": 1.736165585802493e-07, + "loss": 0.3539, + "step": 6844 + }, + { + "epoch": 0.13, + "learning_rate": 1.7361267523591317e-07, + "loss": 0.0094, + "step": 6845 + }, + { + "epoch": 0.13, + "learning_rate": 1.7360879189157702e-07, + "loss": 0.0079, + "step": 6846 + }, + { + "epoch": 0.13, + "learning_rate": 1.736049085472409e-07, + "loss": 0.2294, + "step": 6847 + }, + { + "epoch": 0.13, + "learning_rate": 1.7360102520290474e-07, + "loss": 0.008, + "step": 6848 + }, + { + "epoch": 0.13, + "learning_rate": 1.735971418585686e-07, + "loss": 0.0215, + "step": 6849 + }, + { + "epoch": 0.13, + "learning_rate": 1.7359325851423245e-07, + "loss": 0.0156, + "step": 6850 + }, + { + "epoch": 0.13, + "learning_rate": 1.7358937516989632e-07, + "loss": 0.0083, + "step": 6851 + }, + { + "epoch": 0.13, + "learning_rate": 1.7358549182556017e-07, + "loss": 0.0116, + "step": 6852 + }, + { + "epoch": 0.13, + "learning_rate": 1.7358160848122404e-07, + "loss": 0.0118, + "step": 6853 + }, + { + "epoch": 0.13, + "learning_rate": 1.7357772513688789e-07, + "loss": 0.0082, + "step": 6854 + }, + { + "epoch": 0.13, + "learning_rate": 1.7357384179255176e-07, + "loss": 0.0081, + "step": 6855 + }, + { + "epoch": 0.13, + "learning_rate": 1.735699584482156e-07, + "loss": 0.0102, + "step": 6856 + }, + { + "epoch": 0.13, + "learning_rate": 1.7356607510387947e-07, + "loss": 0.377, + "step": 6857 + }, + { + "epoch": 0.13, + "learning_rate": 1.7356219175954332e-07, + "loss": 0.0083, + "step": 6858 + }, + { + "epoch": 0.13, + "learning_rate": 1.735583084152072e-07, + "loss": 0.0229, + "step": 6859 + }, + { + "epoch": 0.13, + "learning_rate": 1.7355442507087103e-07, + "loss": 0.0066, + "step": 6860 + }, + { + "epoch": 0.13, + "learning_rate": 1.735505417265349e-07, + "loss": 0.2533, + "step": 6861 + }, + { + "epoch": 0.13, + "learning_rate": 1.7354665838219875e-07, + "loss": 0.095, + "step": 6862 + }, + { + "epoch": 0.13, + "learning_rate": 1.7354277503786262e-07, + "loss": 0.0079, + "step": 6863 + }, + { + "epoch": 0.13, + "learning_rate": 1.7353889169352647e-07, + "loss": 0.0069, + "step": 6864 + }, + { + "epoch": 0.13, + "learning_rate": 1.735350083491903e-07, + "loss": 0.0084, + "step": 6865 + }, + { + "epoch": 0.13, + "learning_rate": 1.7353112500485416e-07, + "loss": 0.0107, + "step": 6866 + }, + { + "epoch": 0.13, + "learning_rate": 1.7352724166051803e-07, + "loss": 0.0085, + "step": 6867 + }, + { + "epoch": 0.13, + "learning_rate": 1.7352335831618187e-07, + "loss": 0.0143, + "step": 6868 + }, + { + "epoch": 0.13, + "learning_rate": 1.7351947497184575e-07, + "loss": 0.676, + "step": 6869 + }, + { + "epoch": 0.13, + "learning_rate": 1.735155916275096e-07, + "loss": 0.2128, + "step": 6870 + }, + { + "epoch": 0.13, + "learning_rate": 1.7351170828317346e-07, + "loss": 0.0095, + "step": 6871 + }, + { + "epoch": 0.13, + "learning_rate": 1.735078249388373e-07, + "loss": 0.0086, + "step": 6872 + }, + { + "epoch": 0.13, + "learning_rate": 1.7350394159450118e-07, + "loss": 0.0066, + "step": 6873 + }, + { + "epoch": 0.13, + "learning_rate": 1.7350005825016502e-07, + "loss": 0.0082, + "step": 6874 + }, + { + "epoch": 0.13, + "learning_rate": 1.734961749058289e-07, + "loss": 0.009, + "step": 6875 + }, + { + "epoch": 0.13, + "learning_rate": 1.7349229156149274e-07, + "loss": 0.0088, + "step": 6876 + }, + { + "epoch": 0.13, + "learning_rate": 1.734884082171566e-07, + "loss": 0.0141, + "step": 6877 + }, + { + "epoch": 0.13, + "learning_rate": 1.7348452487282046e-07, + "loss": 0.0122, + "step": 6878 + }, + { + "epoch": 0.13, + "learning_rate": 1.7348064152848433e-07, + "loss": 0.2513, + "step": 6879 + }, + { + "epoch": 0.13, + "learning_rate": 1.7347675818414817e-07, + "loss": 0.0118, + "step": 6880 + }, + { + "epoch": 0.13, + "learning_rate": 1.7347287483981204e-07, + "loss": 0.0115, + "step": 6881 + }, + { + "epoch": 0.13, + "learning_rate": 1.734689914954759e-07, + "loss": 0.0138, + "step": 6882 + }, + { + "epoch": 0.13, + "learning_rate": 1.7346510815113976e-07, + "loss": 0.0157, + "step": 6883 + }, + { + "epoch": 0.13, + "learning_rate": 1.734612248068036e-07, + "loss": 0.4653, + "step": 6884 + }, + { + "epoch": 0.13, + "learning_rate": 1.7345734146246748e-07, + "loss": 0.2052, + "step": 6885 + }, + { + "epoch": 0.13, + "learning_rate": 1.7345345811813132e-07, + "loss": 0.0098, + "step": 6886 + }, + { + "epoch": 0.13, + "learning_rate": 1.734495747737952e-07, + "loss": 0.0263, + "step": 6887 + }, + { + "epoch": 0.13, + "learning_rate": 1.7344569142945904e-07, + "loss": 0.0078, + "step": 6888 + }, + { + "epoch": 0.13, + "learning_rate": 1.734418080851229e-07, + "loss": 0.6769, + "step": 6889 + }, + { + "epoch": 0.13, + "learning_rate": 1.7343792474078676e-07, + "loss": 0.3524, + "step": 6890 + }, + { + "epoch": 0.13, + "learning_rate": 1.7343404139645063e-07, + "loss": 0.0107, + "step": 6891 + }, + { + "epoch": 0.13, + "learning_rate": 1.7343015805211447e-07, + "loss": 0.0113, + "step": 6892 + }, + { + "epoch": 0.13, + "learning_rate": 1.7342627470777834e-07, + "loss": 0.0084, + "step": 6893 + }, + { + "epoch": 0.13, + "learning_rate": 1.734223913634422e-07, + "loss": 0.1692, + "step": 6894 + }, + { + "epoch": 0.13, + "learning_rate": 1.7341850801910603e-07, + "loss": 0.0075, + "step": 6895 + }, + { + "epoch": 0.13, + "learning_rate": 1.734146246747699e-07, + "loss": 0.2742, + "step": 6896 + }, + { + "epoch": 0.13, + "learning_rate": 1.7341074133043375e-07, + "loss": 0.0615, + "step": 6897 + }, + { + "epoch": 0.13, + "learning_rate": 1.7340685798609762e-07, + "loss": 0.2487, + "step": 6898 + }, + { + "epoch": 0.13, + "learning_rate": 1.7340297464176147e-07, + "loss": 0.0169, + "step": 6899 + }, + { + "epoch": 0.13, + "learning_rate": 1.7339909129742534e-07, + "loss": 0.0132, + "step": 6900 + }, + { + "epoch": 0.13, + "learning_rate": 1.7339520795308918e-07, + "loss": 0.0099, + "step": 6901 + }, + { + "epoch": 0.13, + "learning_rate": 1.7339132460875305e-07, + "loss": 0.0113, + "step": 6902 + }, + { + "epoch": 0.13, + "learning_rate": 1.733874412644169e-07, + "loss": 0.1447, + "step": 6903 + }, + { + "epoch": 0.13, + "learning_rate": 1.7338355792008077e-07, + "loss": 0.0079, + "step": 6904 + }, + { + "epoch": 0.13, + "learning_rate": 1.7337967457574462e-07, + "loss": 0.0208, + "step": 6905 + }, + { + "epoch": 0.13, + "learning_rate": 1.733757912314085e-07, + "loss": 0.0308, + "step": 6906 + }, + { + "epoch": 0.13, + "learning_rate": 1.7337190788707233e-07, + "loss": 0.0194, + "step": 6907 + }, + { + "epoch": 0.13, + "learning_rate": 1.733680245427362e-07, + "loss": 0.3866, + "step": 6908 + }, + { + "epoch": 0.13, + "learning_rate": 1.7336414119840005e-07, + "loss": 0.0071, + "step": 6909 + }, + { + "epoch": 0.13, + "learning_rate": 1.7336025785406392e-07, + "loss": 0.0431, + "step": 6910 + }, + { + "epoch": 0.13, + "learning_rate": 1.7335637450972777e-07, + "loss": 0.0102, + "step": 6911 + }, + { + "epoch": 0.13, + "learning_rate": 1.7335249116539164e-07, + "loss": 0.3966, + "step": 6912 + }, + { + "epoch": 0.13, + "learning_rate": 1.7334860782105548e-07, + "loss": 0.2188, + "step": 6913 + }, + { + "epoch": 0.13, + "learning_rate": 1.7334472447671935e-07, + "loss": 0.0321, + "step": 6914 + }, + { + "epoch": 0.13, + "learning_rate": 1.733408411323832e-07, + "loss": 0.4262, + "step": 6915 + }, + { + "epoch": 0.13, + "learning_rate": 1.7333695778804707e-07, + "loss": 0.0133, + "step": 6916 + }, + { + "epoch": 0.13, + "learning_rate": 1.7333307444371092e-07, + "loss": 0.2034, + "step": 6917 + }, + { + "epoch": 0.13, + "learning_rate": 1.7332919109937479e-07, + "loss": 0.0086, + "step": 6918 + }, + { + "epoch": 0.13, + "learning_rate": 1.7332530775503863e-07, + "loss": 0.0132, + "step": 6919 + }, + { + "epoch": 0.13, + "learning_rate": 1.733214244107025e-07, + "loss": 0.6814, + "step": 6920 + }, + { + "epoch": 0.13, + "learning_rate": 1.7331754106636635e-07, + "loss": 0.0126, + "step": 6921 + }, + { + "epoch": 0.13, + "learning_rate": 1.7331365772203022e-07, + "loss": 0.7908, + "step": 6922 + }, + { + "epoch": 0.13, + "learning_rate": 1.7330977437769404e-07, + "loss": 0.8011, + "step": 6923 + }, + { + "epoch": 0.13, + "learning_rate": 1.733058910333579e-07, + "loss": 0.169, + "step": 6924 + }, + { + "epoch": 0.13, + "learning_rate": 1.7330200768902175e-07, + "loss": 0.0189, + "step": 6925 + }, + { + "epoch": 0.13, + "learning_rate": 1.7329812434468563e-07, + "loss": 0.0264, + "step": 6926 + }, + { + "epoch": 0.13, + "learning_rate": 1.7329424100034947e-07, + "loss": 0.0106, + "step": 6927 + }, + { + "epoch": 0.13, + "learning_rate": 1.7329035765601334e-07, + "loss": 0.0078, + "step": 6928 + }, + { + "epoch": 0.13, + "learning_rate": 1.732864743116772e-07, + "loss": 0.0208, + "step": 6929 + }, + { + "epoch": 0.13, + "learning_rate": 1.7328259096734106e-07, + "loss": 0.0079, + "step": 6930 + }, + { + "epoch": 0.13, + "learning_rate": 1.732787076230049e-07, + "loss": 0.0072, + "step": 6931 + }, + { + "epoch": 0.13, + "learning_rate": 1.7327482427866878e-07, + "loss": 0.0084, + "step": 6932 + }, + { + "epoch": 0.13, + "learning_rate": 1.7327094093433262e-07, + "loss": 0.9488, + "step": 6933 + }, + { + "epoch": 0.13, + "learning_rate": 1.732670575899965e-07, + "loss": 0.0257, + "step": 6934 + }, + { + "epoch": 0.13, + "learning_rate": 1.7326317424566034e-07, + "loss": 0.3595, + "step": 6935 + }, + { + "epoch": 0.13, + "learning_rate": 1.732592909013242e-07, + "loss": 0.0076, + "step": 6936 + }, + { + "epoch": 0.13, + "learning_rate": 1.7325540755698805e-07, + "loss": 0.0578, + "step": 6937 + }, + { + "epoch": 0.13, + "learning_rate": 1.7325152421265193e-07, + "loss": 0.0134, + "step": 6938 + }, + { + "epoch": 0.13, + "learning_rate": 1.7324764086831577e-07, + "loss": 0.0285, + "step": 6939 + }, + { + "epoch": 0.13, + "learning_rate": 1.7324375752397964e-07, + "loss": 0.3736, + "step": 6940 + }, + { + "epoch": 0.13, + "learning_rate": 1.7323987417964349e-07, + "loss": 0.0086, + "step": 6941 + }, + { + "epoch": 0.13, + "learning_rate": 1.7323599083530736e-07, + "loss": 0.664, + "step": 6942 + }, + { + "epoch": 0.13, + "learning_rate": 1.732321074909712e-07, + "loss": 0.0083, + "step": 6943 + }, + { + "epoch": 0.13, + "learning_rate": 1.7322822414663507e-07, + "loss": 0.0093, + "step": 6944 + }, + { + "epoch": 0.13, + "learning_rate": 1.7322434080229892e-07, + "loss": 0.1155, + "step": 6945 + }, + { + "epoch": 0.13, + "learning_rate": 1.732204574579628e-07, + "loss": 0.0177, + "step": 6946 + }, + { + "epoch": 0.13, + "learning_rate": 1.7321657411362664e-07, + "loss": 0.0334, + "step": 6947 + }, + { + "epoch": 0.13, + "learning_rate": 1.732126907692905e-07, + "loss": 0.0092, + "step": 6948 + }, + { + "epoch": 0.13, + "learning_rate": 1.7320880742495435e-07, + "loss": 0.0585, + "step": 6949 + }, + { + "epoch": 0.13, + "learning_rate": 1.7320492408061822e-07, + "loss": 0.3366, + "step": 6950 + }, + { + "epoch": 0.13, + "learning_rate": 1.7320104073628207e-07, + "loss": 0.0071, + "step": 6951 + }, + { + "epoch": 0.13, + "learning_rate": 1.7319715739194594e-07, + "loss": 0.2554, + "step": 6952 + }, + { + "epoch": 0.13, + "learning_rate": 1.7319327404760979e-07, + "loss": 0.0642, + "step": 6953 + }, + { + "epoch": 0.13, + "learning_rate": 1.7318939070327366e-07, + "loss": 0.485, + "step": 6954 + }, + { + "epoch": 0.13, + "learning_rate": 1.731855073589375e-07, + "loss": 0.4728, + "step": 6955 + }, + { + "epoch": 0.13, + "learning_rate": 1.7318162401460137e-07, + "loss": 0.0787, + "step": 6956 + }, + { + "epoch": 0.13, + "learning_rate": 1.7317774067026522e-07, + "loss": 0.0472, + "step": 6957 + }, + { + "epoch": 0.13, + "learning_rate": 1.731738573259291e-07, + "loss": 0.0219, + "step": 6958 + }, + { + "epoch": 0.13, + "learning_rate": 1.7316997398159293e-07, + "loss": 0.0087, + "step": 6959 + }, + { + "epoch": 0.14, + "learning_rate": 1.731660906372568e-07, + "loss": 0.0068, + "step": 6960 + }, + { + "epoch": 0.14, + "learning_rate": 1.7316220729292065e-07, + "loss": 0.0066, + "step": 6961 + }, + { + "epoch": 0.14, + "learning_rate": 1.7315832394858452e-07, + "loss": 0.0485, + "step": 6962 + }, + { + "epoch": 0.14, + "learning_rate": 1.7315444060424837e-07, + "loss": 0.0073, + "step": 6963 + }, + { + "epoch": 0.14, + "learning_rate": 1.7315055725991224e-07, + "loss": 0.0096, + "step": 6964 + }, + { + "epoch": 0.14, + "learning_rate": 1.7314667391557608e-07, + "loss": 0.0075, + "step": 6965 + }, + { + "epoch": 0.14, + "learning_rate": 1.7314279057123996e-07, + "loss": 0.0512, + "step": 6966 + }, + { + "epoch": 0.14, + "learning_rate": 1.731389072269038e-07, + "loss": 0.0138, + "step": 6967 + }, + { + "epoch": 0.14, + "learning_rate": 1.7313502388256767e-07, + "loss": 0.0085, + "step": 6968 + }, + { + "epoch": 0.14, + "learning_rate": 1.7313114053823152e-07, + "loss": 0.0298, + "step": 6969 + }, + { + "epoch": 0.14, + "learning_rate": 1.731272571938954e-07, + "loss": 0.0446, + "step": 6970 + }, + { + "epoch": 0.14, + "learning_rate": 1.7312337384955923e-07, + "loss": 1.0255, + "step": 6971 + }, + { + "epoch": 0.14, + "learning_rate": 1.731194905052231e-07, + "loss": 0.0735, + "step": 6972 + }, + { + "epoch": 0.14, + "learning_rate": 1.7311560716088695e-07, + "loss": 0.0084, + "step": 6973 + }, + { + "epoch": 0.14, + "learning_rate": 1.7311172381655082e-07, + "loss": 0.8122, + "step": 6974 + }, + { + "epoch": 0.14, + "learning_rate": 1.7310784047221467e-07, + "loss": 0.0169, + "step": 6975 + }, + { + "epoch": 0.14, + "learning_rate": 1.7310395712787854e-07, + "loss": 0.3592, + "step": 6976 + }, + { + "epoch": 0.14, + "learning_rate": 1.7310007378354238e-07, + "loss": 0.0083, + "step": 6977 + }, + { + "epoch": 0.14, + "learning_rate": 1.7309619043920625e-07, + "loss": 0.0217, + "step": 6978 + }, + { + "epoch": 0.14, + "learning_rate": 1.730923070948701e-07, + "loss": 0.0394, + "step": 6979 + }, + { + "epoch": 0.14, + "learning_rate": 1.7308842375053397e-07, + "loss": 0.0108, + "step": 6980 + }, + { + "epoch": 0.14, + "learning_rate": 1.730845404061978e-07, + "loss": 0.0476, + "step": 6981 + }, + { + "epoch": 0.14, + "learning_rate": 1.7308065706186166e-07, + "loss": 0.0061, + "step": 6982 + }, + { + "epoch": 0.14, + "learning_rate": 1.730767737175255e-07, + "loss": 0.0075, + "step": 6983 + }, + { + "epoch": 0.14, + "learning_rate": 1.7307289037318938e-07, + "loss": 0.1182, + "step": 6984 + }, + { + "epoch": 0.14, + "learning_rate": 1.7306900702885322e-07, + "loss": 0.2958, + "step": 6985 + }, + { + "epoch": 0.14, + "learning_rate": 1.730651236845171e-07, + "loss": 0.0088, + "step": 6986 + }, + { + "epoch": 0.14, + "learning_rate": 1.7306124034018094e-07, + "loss": 0.7757, + "step": 6987 + }, + { + "epoch": 0.14, + "learning_rate": 1.730573569958448e-07, + "loss": 0.1077, + "step": 6988 + }, + { + "epoch": 0.14, + "learning_rate": 1.7305347365150866e-07, + "loss": 0.0075, + "step": 6989 + }, + { + "epoch": 0.14, + "learning_rate": 1.7304959030717253e-07, + "loss": 0.1457, + "step": 6990 + }, + { + "epoch": 0.14, + "learning_rate": 1.7304570696283637e-07, + "loss": 0.0082, + "step": 6991 + }, + { + "epoch": 0.14, + "learning_rate": 1.7304182361850024e-07, + "loss": 0.0089, + "step": 6992 + }, + { + "epoch": 0.14, + "learning_rate": 1.730379402741641e-07, + "loss": 0.0081, + "step": 6993 + }, + { + "epoch": 0.14, + "learning_rate": 1.7303405692982796e-07, + "loss": 0.0098, + "step": 6994 + }, + { + "epoch": 0.14, + "learning_rate": 1.730301735854918e-07, + "loss": 0.015, + "step": 6995 + }, + { + "epoch": 0.14, + "learning_rate": 1.7302629024115568e-07, + "loss": 0.0089, + "step": 6996 + }, + { + "epoch": 0.14, + "learning_rate": 1.7302240689681952e-07, + "loss": 0.4328, + "step": 6997 + }, + { + "epoch": 0.14, + "learning_rate": 1.730185235524834e-07, + "loss": 0.0098, + "step": 6998 + }, + { + "epoch": 0.14, + "learning_rate": 1.7301464020814724e-07, + "loss": 0.0275, + "step": 6999 + }, + { + "epoch": 0.14, + "learning_rate": 1.730107568638111e-07, + "loss": 0.1673, + "step": 7000 + }, + { + "epoch": 0.14, + "learning_rate": 1.7300687351947495e-07, + "loss": 0.0073, + "step": 7001 + }, + { + "epoch": 0.14, + "learning_rate": 1.7300299017513883e-07, + "loss": 0.0989, + "step": 7002 + }, + { + "epoch": 0.14, + "learning_rate": 1.7299910683080267e-07, + "loss": 0.1152, + "step": 7003 + }, + { + "epoch": 0.14, + "learning_rate": 1.7299522348646654e-07, + "loss": 0.0234, + "step": 7004 + }, + { + "epoch": 0.14, + "learning_rate": 1.729913401421304e-07, + "loss": 0.5462, + "step": 7005 + }, + { + "epoch": 0.14, + "learning_rate": 1.7298745679779426e-07, + "loss": 0.1025, + "step": 7006 + }, + { + "epoch": 0.14, + "learning_rate": 1.729835734534581e-07, + "loss": 0.007, + "step": 7007 + }, + { + "epoch": 0.14, + "learning_rate": 1.7297969010912198e-07, + "loss": 0.0126, + "step": 7008 + }, + { + "epoch": 0.14, + "learning_rate": 1.7297580676478582e-07, + "loss": 0.0227, + "step": 7009 + }, + { + "epoch": 0.14, + "learning_rate": 1.729719234204497e-07, + "loss": 0.0095, + "step": 7010 + }, + { + "epoch": 0.14, + "learning_rate": 1.7296804007611354e-07, + "loss": 0.0062, + "step": 7011 + }, + { + "epoch": 0.14, + "learning_rate": 1.729641567317774e-07, + "loss": 0.0278, + "step": 7012 + }, + { + "epoch": 0.14, + "learning_rate": 1.7296027338744125e-07, + "loss": 0.1351, + "step": 7013 + }, + { + "epoch": 0.14, + "learning_rate": 1.7295639004310513e-07, + "loss": 0.0056, + "step": 7014 + }, + { + "epoch": 0.14, + "learning_rate": 1.7295250669876897e-07, + "loss": 0.4901, + "step": 7015 + }, + { + "epoch": 0.14, + "learning_rate": 1.7294862335443284e-07, + "loss": 0.014, + "step": 7016 + }, + { + "epoch": 0.14, + "learning_rate": 1.7294474001009669e-07, + "loss": 0.0344, + "step": 7017 + }, + { + "epoch": 0.14, + "learning_rate": 1.7294085666576056e-07, + "loss": 0.0491, + "step": 7018 + }, + { + "epoch": 0.14, + "learning_rate": 1.729369733214244e-07, + "loss": 0.1009, + "step": 7019 + }, + { + "epoch": 0.14, + "learning_rate": 1.7293308997708827e-07, + "loss": 0.0095, + "step": 7020 + }, + { + "epoch": 0.14, + "learning_rate": 1.7292920663275212e-07, + "loss": 0.0067, + "step": 7021 + }, + { + "epoch": 0.14, + "learning_rate": 1.72925323288416e-07, + "loss": 0.0113, + "step": 7022 + }, + { + "epoch": 0.14, + "learning_rate": 1.7292143994407984e-07, + "loss": 0.1764, + "step": 7023 + }, + { + "epoch": 0.14, + "learning_rate": 1.729175565997437e-07, + "loss": 0.0219, + "step": 7024 + }, + { + "epoch": 0.14, + "learning_rate": 1.7291367325540755e-07, + "loss": 0.0079, + "step": 7025 + }, + { + "epoch": 0.14, + "learning_rate": 1.7290978991107142e-07, + "loss": 0.009, + "step": 7026 + }, + { + "epoch": 0.14, + "learning_rate": 1.7290590656673527e-07, + "loss": 0.0183, + "step": 7027 + }, + { + "epoch": 0.14, + "learning_rate": 1.7290202322239914e-07, + "loss": 0.0077, + "step": 7028 + }, + { + "epoch": 0.14, + "learning_rate": 1.7289813987806299e-07, + "loss": 0.0201, + "step": 7029 + }, + { + "epoch": 0.14, + "learning_rate": 1.7289425653372686e-07, + "loss": 0.0136, + "step": 7030 + }, + { + "epoch": 0.14, + "learning_rate": 1.728903731893907e-07, + "loss": 0.4977, + "step": 7031 + }, + { + "epoch": 0.14, + "learning_rate": 1.7288648984505457e-07, + "loss": 0.0129, + "step": 7032 + }, + { + "epoch": 0.14, + "learning_rate": 1.7288260650071842e-07, + "loss": 0.0089, + "step": 7033 + }, + { + "epoch": 0.14, + "learning_rate": 1.728787231563823e-07, + "loss": 0.1121, + "step": 7034 + }, + { + "epoch": 0.14, + "learning_rate": 1.7287483981204614e-07, + "loss": 0.0115, + "step": 7035 + }, + { + "epoch": 0.14, + "learning_rate": 1.7287095646771e-07, + "loss": 0.0066, + "step": 7036 + }, + { + "epoch": 0.14, + "learning_rate": 1.7286707312337385e-07, + "loss": 0.836, + "step": 7037 + }, + { + "epoch": 0.14, + "learning_rate": 1.7286318977903772e-07, + "loss": 0.0086, + "step": 7038 + }, + { + "epoch": 0.14, + "learning_rate": 1.7285930643470154e-07, + "loss": 0.0121, + "step": 7039 + }, + { + "epoch": 0.14, + "learning_rate": 1.728554230903654e-07, + "loss": 0.0061, + "step": 7040 + }, + { + "epoch": 0.14, + "learning_rate": 1.7285153974602926e-07, + "loss": 0.0068, + "step": 7041 + }, + { + "epoch": 0.14, + "learning_rate": 1.7284765640169313e-07, + "loss": 0.0101, + "step": 7042 + }, + { + "epoch": 0.14, + "learning_rate": 1.7284377305735697e-07, + "loss": 0.7357, + "step": 7043 + }, + { + "epoch": 0.14, + "learning_rate": 1.7283988971302085e-07, + "loss": 0.0198, + "step": 7044 + }, + { + "epoch": 0.14, + "learning_rate": 1.728360063686847e-07, + "loss": 0.071, + "step": 7045 + }, + { + "epoch": 0.14, + "learning_rate": 1.7283212302434856e-07, + "loss": 0.0135, + "step": 7046 + }, + { + "epoch": 0.14, + "learning_rate": 1.728282396800124e-07, + "loss": 0.044, + "step": 7047 + }, + { + "epoch": 0.14, + "learning_rate": 1.7282435633567628e-07, + "loss": 0.0297, + "step": 7048 + }, + { + "epoch": 0.14, + "learning_rate": 1.7282047299134012e-07, + "loss": 0.0061, + "step": 7049 + }, + { + "epoch": 0.14, + "learning_rate": 1.72816589647004e-07, + "loss": 0.0206, + "step": 7050 + }, + { + "epoch": 0.14, + "learning_rate": 1.7281270630266784e-07, + "loss": 0.022, + "step": 7051 + }, + { + "epoch": 0.14, + "learning_rate": 1.728088229583317e-07, + "loss": 0.0116, + "step": 7052 + }, + { + "epoch": 0.14, + "learning_rate": 1.7280493961399556e-07, + "loss": 0.0076, + "step": 7053 + }, + { + "epoch": 0.14, + "learning_rate": 1.7280105626965943e-07, + "loss": 0.0183, + "step": 7054 + }, + { + "epoch": 0.14, + "learning_rate": 1.7279717292532327e-07, + "loss": 0.0068, + "step": 7055 + }, + { + "epoch": 0.14, + "learning_rate": 1.7279328958098714e-07, + "loss": 0.0161, + "step": 7056 + }, + { + "epoch": 0.14, + "learning_rate": 1.72789406236651e-07, + "loss": 0.2682, + "step": 7057 + }, + { + "epoch": 0.14, + "learning_rate": 1.7278552289231486e-07, + "loss": 0.0151, + "step": 7058 + }, + { + "epoch": 0.14, + "learning_rate": 1.727816395479787e-07, + "loss": 0.0058, + "step": 7059 + }, + { + "epoch": 0.14, + "learning_rate": 1.7277775620364258e-07, + "loss": 0.0086, + "step": 7060 + }, + { + "epoch": 0.14, + "learning_rate": 1.7277387285930642e-07, + "loss": 0.0388, + "step": 7061 + }, + { + "epoch": 0.14, + "learning_rate": 1.727699895149703e-07, + "loss": 0.0074, + "step": 7062 + }, + { + "epoch": 0.14, + "learning_rate": 1.7276610617063414e-07, + "loss": 0.1597, + "step": 7063 + }, + { + "epoch": 0.14, + "learning_rate": 1.72762222826298e-07, + "loss": 0.009, + "step": 7064 + }, + { + "epoch": 0.14, + "learning_rate": 1.7275833948196186e-07, + "loss": 0.0075, + "step": 7065 + }, + { + "epoch": 0.14, + "learning_rate": 1.7275445613762573e-07, + "loss": 0.0081, + "step": 7066 + }, + { + "epoch": 0.14, + "learning_rate": 1.7275057279328957e-07, + "loss": 0.0104, + "step": 7067 + }, + { + "epoch": 0.14, + "learning_rate": 1.7274668944895344e-07, + "loss": 0.0075, + "step": 7068 + }, + { + "epoch": 0.14, + "learning_rate": 1.727428061046173e-07, + "loss": 0.5612, + "step": 7069 + }, + { + "epoch": 0.14, + "learning_rate": 1.7273892276028116e-07, + "loss": 0.0882, + "step": 7070 + }, + { + "epoch": 0.14, + "learning_rate": 1.72735039415945e-07, + "loss": 0.1003, + "step": 7071 + }, + { + "epoch": 0.14, + "learning_rate": 1.7273115607160885e-07, + "loss": 0.0193, + "step": 7072 + }, + { + "epoch": 0.14, + "learning_rate": 1.7272727272727272e-07, + "loss": 0.1493, + "step": 7073 + }, + { + "epoch": 0.14, + "learning_rate": 1.7272338938293657e-07, + "loss": 0.0108, + "step": 7074 + }, + { + "epoch": 0.14, + "learning_rate": 1.7271950603860044e-07, + "loss": 0.0627, + "step": 7075 + }, + { + "epoch": 0.14, + "learning_rate": 1.7271562269426428e-07, + "loss": 0.0141, + "step": 7076 + }, + { + "epoch": 0.14, + "learning_rate": 1.7271173934992815e-07, + "loss": 0.0313, + "step": 7077 + }, + { + "epoch": 0.14, + "learning_rate": 1.72707856005592e-07, + "loss": 0.4014, + "step": 7078 + }, + { + "epoch": 0.14, + "learning_rate": 1.7270397266125587e-07, + "loss": 0.006, + "step": 7079 + }, + { + "epoch": 0.14, + "learning_rate": 1.7270008931691972e-07, + "loss": 0.0889, + "step": 7080 + }, + { + "epoch": 0.14, + "learning_rate": 1.726962059725836e-07, + "loss": 0.0059, + "step": 7081 + }, + { + "epoch": 0.14, + "learning_rate": 1.7269232262824743e-07, + "loss": 0.0085, + "step": 7082 + }, + { + "epoch": 0.14, + "learning_rate": 1.726884392839113e-07, + "loss": 0.0127, + "step": 7083 + }, + { + "epoch": 0.14, + "learning_rate": 1.7268455593957515e-07, + "loss": 0.0071, + "step": 7084 + }, + { + "epoch": 0.14, + "learning_rate": 1.7268067259523902e-07, + "loss": 0.3084, + "step": 7085 + }, + { + "epoch": 0.14, + "learning_rate": 1.7267678925090287e-07, + "loss": 0.0361, + "step": 7086 + }, + { + "epoch": 0.14, + "learning_rate": 1.7267290590656674e-07, + "loss": 0.0079, + "step": 7087 + }, + { + "epoch": 0.14, + "learning_rate": 1.7266902256223058e-07, + "loss": 0.0362, + "step": 7088 + }, + { + "epoch": 0.14, + "learning_rate": 1.7266513921789445e-07, + "loss": 0.0504, + "step": 7089 + }, + { + "epoch": 0.14, + "learning_rate": 1.726612558735583e-07, + "loss": 0.007, + "step": 7090 + }, + { + "epoch": 0.14, + "learning_rate": 1.7265737252922217e-07, + "loss": 0.0168, + "step": 7091 + }, + { + "epoch": 0.14, + "learning_rate": 1.7265348918488602e-07, + "loss": 0.6649, + "step": 7092 + }, + { + "epoch": 0.14, + "learning_rate": 1.7264960584054989e-07, + "loss": 0.8912, + "step": 7093 + }, + { + "epoch": 0.14, + "learning_rate": 1.7264572249621373e-07, + "loss": 0.0592, + "step": 7094 + }, + { + "epoch": 0.14, + "learning_rate": 1.726418391518776e-07, + "loss": 0.0069, + "step": 7095 + }, + { + "epoch": 0.14, + "learning_rate": 1.7263795580754145e-07, + "loss": 0.0072, + "step": 7096 + }, + { + "epoch": 0.14, + "learning_rate": 1.726340724632053e-07, + "loss": 0.2243, + "step": 7097 + }, + { + "epoch": 0.14, + "learning_rate": 1.7263018911886916e-07, + "loss": 0.12, + "step": 7098 + }, + { + "epoch": 0.14, + "learning_rate": 1.72626305774533e-07, + "loss": 0.0072, + "step": 7099 + }, + { + "epoch": 0.14, + "learning_rate": 1.7262242243019685e-07, + "loss": 0.6135, + "step": 7100 + }, + { + "epoch": 0.14, + "learning_rate": 1.7261853908586073e-07, + "loss": 0.0078, + "step": 7101 + }, + { + "epoch": 0.14, + "learning_rate": 1.7261465574152457e-07, + "loss": 0.0078, + "step": 7102 + }, + { + "epoch": 0.14, + "learning_rate": 1.7261077239718844e-07, + "loss": 0.0066, + "step": 7103 + }, + { + "epoch": 0.14, + "learning_rate": 1.726068890528523e-07, + "loss": 0.0085, + "step": 7104 + }, + { + "epoch": 0.14, + "learning_rate": 1.7260300570851616e-07, + "loss": 0.009, + "step": 7105 + }, + { + "epoch": 0.14, + "learning_rate": 1.7259912236418e-07, + "loss": 0.0637, + "step": 7106 + }, + { + "epoch": 0.14, + "learning_rate": 1.7259523901984388e-07, + "loss": 0.0101, + "step": 7107 + }, + { + "epoch": 0.14, + "learning_rate": 1.7259135567550772e-07, + "loss": 0.0529, + "step": 7108 + }, + { + "epoch": 0.14, + "learning_rate": 1.725874723311716e-07, + "loss": 0.0057, + "step": 7109 + }, + { + "epoch": 0.14, + "learning_rate": 1.7258358898683544e-07, + "loss": 0.0138, + "step": 7110 + }, + { + "epoch": 0.14, + "learning_rate": 1.725797056424993e-07, + "loss": 0.0068, + "step": 7111 + }, + { + "epoch": 0.14, + "learning_rate": 1.7257582229816315e-07, + "loss": 0.0119, + "step": 7112 + }, + { + "epoch": 0.14, + "learning_rate": 1.7257193895382703e-07, + "loss": 0.0067, + "step": 7113 + }, + { + "epoch": 0.14, + "learning_rate": 1.7256805560949087e-07, + "loss": 0.0126, + "step": 7114 + }, + { + "epoch": 0.14, + "learning_rate": 1.7256417226515474e-07, + "loss": 0.0121, + "step": 7115 + }, + { + "epoch": 0.14, + "learning_rate": 1.7256028892081859e-07, + "loss": 0.0121, + "step": 7116 + }, + { + "epoch": 0.14, + "learning_rate": 1.7255640557648246e-07, + "loss": 0.0095, + "step": 7117 + }, + { + "epoch": 0.14, + "learning_rate": 1.725525222321463e-07, + "loss": 0.0109, + "step": 7118 + }, + { + "epoch": 0.14, + "learning_rate": 1.7254863888781017e-07, + "loss": 0.0057, + "step": 7119 + }, + { + "epoch": 0.14, + "learning_rate": 1.7254475554347402e-07, + "loss": 0.0693, + "step": 7120 + }, + { + "epoch": 0.14, + "learning_rate": 1.725408721991379e-07, + "loss": 0.0086, + "step": 7121 + }, + { + "epoch": 0.14, + "learning_rate": 1.7253698885480174e-07, + "loss": 0.1581, + "step": 7122 + }, + { + "epoch": 0.14, + "learning_rate": 1.725331055104656e-07, + "loss": 0.8878, + "step": 7123 + }, + { + "epoch": 0.14, + "learning_rate": 1.7252922216612945e-07, + "loss": 0.0596, + "step": 7124 + }, + { + "epoch": 0.14, + "learning_rate": 1.7252533882179332e-07, + "loss": 0.0079, + "step": 7125 + }, + { + "epoch": 0.14, + "learning_rate": 1.7252145547745717e-07, + "loss": 0.0228, + "step": 7126 + }, + { + "epoch": 0.14, + "learning_rate": 1.7251757213312104e-07, + "loss": 0.259, + "step": 7127 + }, + { + "epoch": 0.14, + "learning_rate": 1.7251368878878489e-07, + "loss": 0.2764, + "step": 7128 + }, + { + "epoch": 0.14, + "learning_rate": 1.7250980544444876e-07, + "loss": 0.2259, + "step": 7129 + }, + { + "epoch": 0.14, + "learning_rate": 1.725059221001126e-07, + "loss": 0.0084, + "step": 7130 + }, + { + "epoch": 0.14, + "learning_rate": 1.7250203875577647e-07, + "loss": 0.0075, + "step": 7131 + }, + { + "epoch": 0.14, + "learning_rate": 1.7249815541144032e-07, + "loss": 0.0061, + "step": 7132 + }, + { + "epoch": 0.14, + "learning_rate": 1.724942720671042e-07, + "loss": 0.8628, + "step": 7133 + }, + { + "epoch": 0.14, + "learning_rate": 1.7249038872276804e-07, + "loss": 0.0285, + "step": 7134 + }, + { + "epoch": 0.14, + "learning_rate": 1.724865053784319e-07, + "loss": 0.0082, + "step": 7135 + }, + { + "epoch": 0.14, + "learning_rate": 1.7248262203409575e-07, + "loss": 0.0078, + "step": 7136 + }, + { + "epoch": 0.14, + "learning_rate": 1.7247873868975962e-07, + "loss": 0.1163, + "step": 7137 + }, + { + "epoch": 0.14, + "learning_rate": 1.7247485534542347e-07, + "loss": 0.0086, + "step": 7138 + }, + { + "epoch": 0.14, + "learning_rate": 1.7247097200108734e-07, + "loss": 0.1263, + "step": 7139 + }, + { + "epoch": 0.14, + "learning_rate": 1.7246708865675118e-07, + "loss": 0.0168, + "step": 7140 + }, + { + "epoch": 0.14, + "learning_rate": 1.7246320531241506e-07, + "loss": 0.0074, + "step": 7141 + }, + { + "epoch": 0.14, + "learning_rate": 1.724593219680789e-07, + "loss": 0.852, + "step": 7142 + }, + { + "epoch": 0.14, + "learning_rate": 1.7245543862374277e-07, + "loss": 0.4271, + "step": 7143 + }, + { + "epoch": 0.14, + "learning_rate": 1.7245155527940662e-07, + "loss": 0.0086, + "step": 7144 + }, + { + "epoch": 0.14, + "learning_rate": 1.724476719350705e-07, + "loss": 0.0077, + "step": 7145 + }, + { + "epoch": 0.14, + "learning_rate": 1.7244378859073433e-07, + "loss": 0.5195, + "step": 7146 + }, + { + "epoch": 0.14, + "learning_rate": 1.724399052463982e-07, + "loss": 0.0062, + "step": 7147 + }, + { + "epoch": 0.14, + "learning_rate": 1.7243602190206205e-07, + "loss": 0.5487, + "step": 7148 + }, + { + "epoch": 0.14, + "learning_rate": 1.7243213855772592e-07, + "loss": 0.0265, + "step": 7149 + }, + { + "epoch": 0.14, + "learning_rate": 1.7242825521338977e-07, + "loss": 0.5406, + "step": 7150 + }, + { + "epoch": 0.14, + "learning_rate": 1.7242437186905364e-07, + "loss": 0.4262, + "step": 7151 + }, + { + "epoch": 0.14, + "learning_rate": 1.7242048852471748e-07, + "loss": 0.0069, + "step": 7152 + }, + { + "epoch": 0.14, + "learning_rate": 1.7241660518038135e-07, + "loss": 0.0279, + "step": 7153 + }, + { + "epoch": 0.14, + "learning_rate": 1.724127218360452e-07, + "loss": 0.1621, + "step": 7154 + }, + { + "epoch": 0.14, + "learning_rate": 1.7240883849170904e-07, + "loss": 0.0083, + "step": 7155 + }, + { + "epoch": 0.14, + "learning_rate": 1.724049551473729e-07, + "loss": 0.0106, + "step": 7156 + }, + { + "epoch": 0.14, + "learning_rate": 1.7240107180303676e-07, + "loss": 0.1862, + "step": 7157 + }, + { + "epoch": 0.14, + "learning_rate": 1.723971884587006e-07, + "loss": 0.0059, + "step": 7158 + }, + { + "epoch": 0.14, + "learning_rate": 1.7239330511436448e-07, + "loss": 0.0061, + "step": 7159 + }, + { + "epoch": 0.14, + "learning_rate": 1.7238942177002832e-07, + "loss": 0.0248, + "step": 7160 + }, + { + "epoch": 0.14, + "learning_rate": 1.723855384256922e-07, + "loss": 0.1002, + "step": 7161 + }, + { + "epoch": 0.14, + "learning_rate": 1.7238165508135604e-07, + "loss": 0.0078, + "step": 7162 + }, + { + "epoch": 0.14, + "learning_rate": 1.723777717370199e-07, + "loss": 0.0818, + "step": 7163 + }, + { + "epoch": 0.14, + "learning_rate": 1.7237388839268376e-07, + "loss": 0.0091, + "step": 7164 + }, + { + "epoch": 0.14, + "learning_rate": 1.7237000504834763e-07, + "loss": 0.0109, + "step": 7165 + }, + { + "epoch": 0.14, + "learning_rate": 1.7236612170401147e-07, + "loss": 0.3689, + "step": 7166 + }, + { + "epoch": 0.14, + "learning_rate": 1.7236223835967534e-07, + "loss": 0.0112, + "step": 7167 + }, + { + "epoch": 0.14, + "learning_rate": 1.723583550153392e-07, + "loss": 0.0088, + "step": 7168 + }, + { + "epoch": 0.14, + "learning_rate": 1.7235447167100306e-07, + "loss": 0.0082, + "step": 7169 + }, + { + "epoch": 0.14, + "learning_rate": 1.723505883266669e-07, + "loss": 0.0079, + "step": 7170 + }, + { + "epoch": 0.14, + "learning_rate": 1.7234670498233078e-07, + "loss": 0.0065, + "step": 7171 + }, + { + "epoch": 0.14, + "learning_rate": 1.7234282163799462e-07, + "loss": 0.0112, + "step": 7172 + }, + { + "epoch": 0.14, + "learning_rate": 1.723389382936585e-07, + "loss": 0.0082, + "step": 7173 + }, + { + "epoch": 0.14, + "learning_rate": 1.7233505494932234e-07, + "loss": 0.129, + "step": 7174 + }, + { + "epoch": 0.14, + "learning_rate": 1.723311716049862e-07, + "loss": 0.0112, + "step": 7175 + }, + { + "epoch": 0.14, + "learning_rate": 1.7232728826065005e-07, + "loss": 0.0119, + "step": 7176 + }, + { + "epoch": 0.14, + "learning_rate": 1.7232340491631393e-07, + "loss": 0.0068, + "step": 7177 + }, + { + "epoch": 0.14, + "learning_rate": 1.7231952157197777e-07, + "loss": 0.0321, + "step": 7178 + }, + { + "epoch": 0.14, + "learning_rate": 1.7231563822764164e-07, + "loss": 0.008, + "step": 7179 + }, + { + "epoch": 0.14, + "learning_rate": 1.723117548833055e-07, + "loss": 0.021, + "step": 7180 + }, + { + "epoch": 0.14, + "learning_rate": 1.7230787153896936e-07, + "loss": 0.0105, + "step": 7181 + }, + { + "epoch": 0.14, + "learning_rate": 1.723039881946332e-07, + "loss": 0.0406, + "step": 7182 + }, + { + "epoch": 0.14, + "learning_rate": 1.7230010485029708e-07, + "loss": 0.0081, + "step": 7183 + }, + { + "epoch": 0.14, + "learning_rate": 1.7229622150596092e-07, + "loss": 0.0068, + "step": 7184 + }, + { + "epoch": 0.14, + "learning_rate": 1.722923381616248e-07, + "loss": 0.0155, + "step": 7185 + }, + { + "epoch": 0.14, + "learning_rate": 1.7228845481728864e-07, + "loss": 0.0074, + "step": 7186 + }, + { + "epoch": 0.14, + "learning_rate": 1.722845714729525e-07, + "loss": 0.016, + "step": 7187 + }, + { + "epoch": 0.14, + "learning_rate": 1.7228068812861635e-07, + "loss": 0.0919, + "step": 7188 + }, + { + "epoch": 0.14, + "learning_rate": 1.7227680478428023e-07, + "loss": 0.0263, + "step": 7189 + }, + { + "epoch": 0.14, + "learning_rate": 1.7227292143994407e-07, + "loss": 0.0088, + "step": 7190 + }, + { + "epoch": 0.14, + "learning_rate": 1.7226903809560794e-07, + "loss": 0.1792, + "step": 7191 + }, + { + "epoch": 0.14, + "learning_rate": 1.7226515475127179e-07, + "loss": 0.0101, + "step": 7192 + }, + { + "epoch": 0.14, + "learning_rate": 1.7226127140693566e-07, + "loss": 0.0069, + "step": 7193 + }, + { + "epoch": 0.14, + "learning_rate": 1.722573880625995e-07, + "loss": 0.0561, + "step": 7194 + }, + { + "epoch": 0.14, + "learning_rate": 1.7225350471826337e-07, + "loss": 0.0259, + "step": 7195 + }, + { + "epoch": 0.14, + "learning_rate": 1.7224962137392722e-07, + "loss": 0.0074, + "step": 7196 + }, + { + "epoch": 0.14, + "learning_rate": 1.722457380295911e-07, + "loss": 0.0135, + "step": 7197 + }, + { + "epoch": 0.14, + "learning_rate": 1.7224185468525494e-07, + "loss": 0.0145, + "step": 7198 + }, + { + "epoch": 0.14, + "learning_rate": 1.722379713409188e-07, + "loss": 0.0085, + "step": 7199 + }, + { + "epoch": 0.14, + "learning_rate": 1.7223408799658265e-07, + "loss": 0.0151, + "step": 7200 + }, + { + "epoch": 0.14, + "learning_rate": 1.7223020465224652e-07, + "loss": 0.047, + "step": 7201 + }, + { + "epoch": 0.14, + "learning_rate": 1.7222632130791037e-07, + "loss": 0.0064, + "step": 7202 + }, + { + "epoch": 0.14, + "learning_rate": 1.7222243796357424e-07, + "loss": 0.0062, + "step": 7203 + }, + { + "epoch": 0.14, + "learning_rate": 1.7221855461923809e-07, + "loss": 0.013, + "step": 7204 + }, + { + "epoch": 0.14, + "learning_rate": 1.7221467127490196e-07, + "loss": 0.1473, + "step": 7205 + }, + { + "epoch": 0.14, + "learning_rate": 1.722107879305658e-07, + "loss": 0.2283, + "step": 7206 + }, + { + "epoch": 0.14, + "learning_rate": 1.7220690458622967e-07, + "loss": 0.0095, + "step": 7207 + }, + { + "epoch": 0.14, + "learning_rate": 1.7220302124189352e-07, + "loss": 0.0085, + "step": 7208 + }, + { + "epoch": 0.14, + "learning_rate": 1.721991378975574e-07, + "loss": 0.6746, + "step": 7209 + }, + { + "epoch": 0.14, + "learning_rate": 1.7219525455322124e-07, + "loss": 0.8297, + "step": 7210 + }, + { + "epoch": 0.14, + "learning_rate": 1.721913712088851e-07, + "loss": 0.0234, + "step": 7211 + }, + { + "epoch": 0.14, + "learning_rate": 1.7218748786454895e-07, + "loss": 0.0074, + "step": 7212 + }, + { + "epoch": 0.14, + "learning_rate": 1.721836045202128e-07, + "loss": 0.0074, + "step": 7213 + }, + { + "epoch": 0.14, + "learning_rate": 1.7217972117587664e-07, + "loss": 0.0206, + "step": 7214 + }, + { + "epoch": 0.14, + "learning_rate": 1.721758378315405e-07, + "loss": 0.5057, + "step": 7215 + }, + { + "epoch": 0.14, + "learning_rate": 1.7217195448720436e-07, + "loss": 0.0127, + "step": 7216 + }, + { + "epoch": 0.14, + "learning_rate": 1.7216807114286823e-07, + "loss": 0.6102, + "step": 7217 + }, + { + "epoch": 0.14, + "learning_rate": 1.7216418779853207e-07, + "loss": 0.0359, + "step": 7218 + }, + { + "epoch": 0.14, + "learning_rate": 1.7216030445419595e-07, + "loss": 0.1397, + "step": 7219 + }, + { + "epoch": 0.14, + "learning_rate": 1.721564211098598e-07, + "loss": 0.2963, + "step": 7220 + }, + { + "epoch": 0.14, + "learning_rate": 1.7215253776552366e-07, + "loss": 0.3338, + "step": 7221 + }, + { + "epoch": 0.14, + "learning_rate": 1.721486544211875e-07, + "loss": 0.0161, + "step": 7222 + }, + { + "epoch": 0.14, + "learning_rate": 1.7214477107685138e-07, + "loss": 0.0077, + "step": 7223 + }, + { + "epoch": 0.14, + "learning_rate": 1.7214088773251522e-07, + "loss": 0.2834, + "step": 7224 + }, + { + "epoch": 0.14, + "learning_rate": 1.721370043881791e-07, + "loss": 0.0086, + "step": 7225 + }, + { + "epoch": 0.14, + "learning_rate": 1.7213312104384294e-07, + "loss": 0.0077, + "step": 7226 + }, + { + "epoch": 0.14, + "learning_rate": 1.721292376995068e-07, + "loss": 0.3021, + "step": 7227 + }, + { + "epoch": 0.14, + "learning_rate": 1.7212535435517066e-07, + "loss": 0.0076, + "step": 7228 + }, + { + "epoch": 0.14, + "learning_rate": 1.7212147101083453e-07, + "loss": 0.0059, + "step": 7229 + }, + { + "epoch": 0.14, + "learning_rate": 1.7211758766649837e-07, + "loss": 0.0119, + "step": 7230 + }, + { + "epoch": 0.14, + "learning_rate": 1.7211370432216225e-07, + "loss": 0.0058, + "step": 7231 + }, + { + "epoch": 0.14, + "learning_rate": 1.721098209778261e-07, + "loss": 0.0392, + "step": 7232 + }, + { + "epoch": 0.14, + "learning_rate": 1.7210593763348996e-07, + "loss": 0.0087, + "step": 7233 + }, + { + "epoch": 0.14, + "learning_rate": 1.721020542891538e-07, + "loss": 0.2995, + "step": 7234 + }, + { + "epoch": 0.14, + "learning_rate": 1.7209817094481768e-07, + "loss": 0.0105, + "step": 7235 + }, + { + "epoch": 0.14, + "learning_rate": 1.7209428760048152e-07, + "loss": 0.0077, + "step": 7236 + }, + { + "epoch": 0.14, + "learning_rate": 1.720904042561454e-07, + "loss": 0.6236, + "step": 7237 + }, + { + "epoch": 0.14, + "learning_rate": 1.7208652091180924e-07, + "loss": 0.4248, + "step": 7238 + }, + { + "epoch": 0.14, + "learning_rate": 1.720826375674731e-07, + "loss": 0.0351, + "step": 7239 + }, + { + "epoch": 0.14, + "learning_rate": 1.7207875422313696e-07, + "loss": 0.0314, + "step": 7240 + }, + { + "epoch": 0.14, + "learning_rate": 1.7207487087880083e-07, + "loss": 0.0239, + "step": 7241 + }, + { + "epoch": 0.14, + "learning_rate": 1.7207098753446467e-07, + "loss": 0.2893, + "step": 7242 + }, + { + "epoch": 0.14, + "learning_rate": 1.7206710419012854e-07, + "loss": 0.1764, + "step": 7243 + }, + { + "epoch": 0.14, + "learning_rate": 1.720632208457924e-07, + "loss": 0.0072, + "step": 7244 + }, + { + "epoch": 0.14, + "learning_rate": 1.7205933750145626e-07, + "loss": 0.0078, + "step": 7245 + }, + { + "epoch": 0.14, + "learning_rate": 1.720554541571201e-07, + "loss": 0.1865, + "step": 7246 + }, + { + "epoch": 0.14, + "learning_rate": 1.7205157081278398e-07, + "loss": 0.0578, + "step": 7247 + }, + { + "epoch": 0.14, + "learning_rate": 1.7204768746844782e-07, + "loss": 0.011, + "step": 7248 + }, + { + "epoch": 0.14, + "learning_rate": 1.7204380412411167e-07, + "loss": 0.8561, + "step": 7249 + }, + { + "epoch": 0.14, + "learning_rate": 1.7203992077977554e-07, + "loss": 0.0059, + "step": 7250 + }, + { + "epoch": 0.14, + "learning_rate": 1.7203603743543938e-07, + "loss": 0.12, + "step": 7251 + }, + { + "epoch": 0.14, + "learning_rate": 1.7203215409110325e-07, + "loss": 0.0161, + "step": 7252 + }, + { + "epoch": 0.14, + "learning_rate": 1.720282707467671e-07, + "loss": 0.0097, + "step": 7253 + }, + { + "epoch": 0.14, + "learning_rate": 1.7202438740243097e-07, + "loss": 0.0339, + "step": 7254 + }, + { + "epoch": 0.14, + "learning_rate": 1.7202050405809482e-07, + "loss": 0.0144, + "step": 7255 + }, + { + "epoch": 0.14, + "learning_rate": 1.720166207137587e-07, + "loss": 0.0061, + "step": 7256 + }, + { + "epoch": 0.14, + "learning_rate": 1.7201273736942253e-07, + "loss": 0.5444, + "step": 7257 + }, + { + "epoch": 0.14, + "learning_rate": 1.720088540250864e-07, + "loss": 0.0083, + "step": 7258 + }, + { + "epoch": 0.14, + "learning_rate": 1.7200497068075025e-07, + "loss": 0.0066, + "step": 7259 + }, + { + "epoch": 0.14, + "learning_rate": 1.7200108733641412e-07, + "loss": 0.0149, + "step": 7260 + }, + { + "epoch": 0.14, + "learning_rate": 1.7199720399207797e-07, + "loss": 0.0098, + "step": 7261 + }, + { + "epoch": 0.14, + "learning_rate": 1.7199332064774184e-07, + "loss": 0.0078, + "step": 7262 + }, + { + "epoch": 0.14, + "learning_rate": 1.7198943730340568e-07, + "loss": 0.0117, + "step": 7263 + }, + { + "epoch": 0.14, + "learning_rate": 1.7198555395906955e-07, + "loss": 0.3965, + "step": 7264 + }, + { + "epoch": 0.14, + "learning_rate": 1.719816706147334e-07, + "loss": 0.0077, + "step": 7265 + }, + { + "epoch": 0.14, + "learning_rate": 1.7197778727039727e-07, + "loss": 0.0701, + "step": 7266 + }, + { + "epoch": 0.14, + "learning_rate": 1.7197390392606112e-07, + "loss": 0.3937, + "step": 7267 + }, + { + "epoch": 0.14, + "learning_rate": 1.71970020581725e-07, + "loss": 0.0076, + "step": 7268 + }, + { + "epoch": 0.14, + "learning_rate": 1.7196613723738883e-07, + "loss": 0.008, + "step": 7269 + }, + { + "epoch": 0.14, + "learning_rate": 1.719622538930527e-07, + "loss": 0.0112, + "step": 7270 + }, + { + "epoch": 0.14, + "learning_rate": 1.7195837054871655e-07, + "loss": 0.0082, + "step": 7271 + }, + { + "epoch": 0.14, + "learning_rate": 1.719544872043804e-07, + "loss": 0.2938, + "step": 7272 + }, + { + "epoch": 0.14, + "learning_rate": 1.7195060386004426e-07, + "loss": 0.009, + "step": 7273 + }, + { + "epoch": 0.14, + "learning_rate": 1.719467205157081e-07, + "loss": 0.0867, + "step": 7274 + }, + { + "epoch": 0.14, + "learning_rate": 1.7194283717137198e-07, + "loss": 0.0213, + "step": 7275 + }, + { + "epoch": 0.14, + "learning_rate": 1.7193895382703583e-07, + "loss": 0.0069, + "step": 7276 + }, + { + "epoch": 0.14, + "learning_rate": 1.7193507048269967e-07, + "loss": 0.0085, + "step": 7277 + }, + { + "epoch": 0.14, + "learning_rate": 1.7193118713836354e-07, + "loss": 0.0897, + "step": 7278 + }, + { + "epoch": 0.14, + "learning_rate": 1.719273037940274e-07, + "loss": 0.423, + "step": 7279 + }, + { + "epoch": 0.14, + "learning_rate": 1.7192342044969126e-07, + "loss": 0.0064, + "step": 7280 + }, + { + "epoch": 0.14, + "learning_rate": 1.719195371053551e-07, + "loss": 0.0098, + "step": 7281 + }, + { + "epoch": 0.14, + "learning_rate": 1.7191565376101898e-07, + "loss": 0.0056, + "step": 7282 + }, + { + "epoch": 0.14, + "learning_rate": 1.7191177041668282e-07, + "loss": 0.1365, + "step": 7283 + }, + { + "epoch": 0.14, + "learning_rate": 1.719078870723467e-07, + "loss": 0.4633, + "step": 7284 + }, + { + "epoch": 0.14, + "learning_rate": 1.7190400372801054e-07, + "loss": 0.3594, + "step": 7285 + }, + { + "epoch": 0.14, + "learning_rate": 1.719001203836744e-07, + "loss": 0.0062, + "step": 7286 + }, + { + "epoch": 0.14, + "learning_rate": 1.7189623703933825e-07, + "loss": 0.0078, + "step": 7287 + }, + { + "epoch": 0.14, + "learning_rate": 1.7189235369500213e-07, + "loss": 0.01, + "step": 7288 + }, + { + "epoch": 0.14, + "learning_rate": 1.7188847035066597e-07, + "loss": 0.0081, + "step": 7289 + }, + { + "epoch": 0.14, + "learning_rate": 1.7188458700632984e-07, + "loss": 0.265, + "step": 7290 + }, + { + "epoch": 0.14, + "learning_rate": 1.718807036619937e-07, + "loss": 0.0069, + "step": 7291 + }, + { + "epoch": 0.14, + "learning_rate": 1.7187682031765756e-07, + "loss": 0.0061, + "step": 7292 + }, + { + "epoch": 0.14, + "learning_rate": 1.718729369733214e-07, + "loss": 0.0094, + "step": 7293 + }, + { + "epoch": 0.14, + "learning_rate": 1.7186905362898527e-07, + "loss": 0.0058, + "step": 7294 + }, + { + "epoch": 0.14, + "learning_rate": 1.7186517028464912e-07, + "loss": 0.1036, + "step": 7295 + }, + { + "epoch": 0.14, + "learning_rate": 1.71861286940313e-07, + "loss": 0.0295, + "step": 7296 + }, + { + "epoch": 0.14, + "learning_rate": 1.7185740359597684e-07, + "loss": 0.0108, + "step": 7297 + }, + { + "epoch": 0.14, + "learning_rate": 1.718535202516407e-07, + "loss": 0.0062, + "step": 7298 + }, + { + "epoch": 0.14, + "learning_rate": 1.7184963690730455e-07, + "loss": 0.0087, + "step": 7299 + }, + { + "epoch": 0.14, + "learning_rate": 1.7184575356296842e-07, + "loss": 0.0065, + "step": 7300 + }, + { + "epoch": 0.14, + "learning_rate": 1.7184187021863227e-07, + "loss": 0.0071, + "step": 7301 + }, + { + "epoch": 0.14, + "learning_rate": 1.7183798687429614e-07, + "loss": 0.0076, + "step": 7302 + }, + { + "epoch": 0.14, + "learning_rate": 1.7183410352995999e-07, + "loss": 0.0187, + "step": 7303 + }, + { + "epoch": 0.14, + "learning_rate": 1.7183022018562386e-07, + "loss": 0.0065, + "step": 7304 + }, + { + "epoch": 0.14, + "learning_rate": 1.718263368412877e-07, + "loss": 0.1876, + "step": 7305 + }, + { + "epoch": 0.14, + "learning_rate": 1.7182245349695157e-07, + "loss": 0.0126, + "step": 7306 + }, + { + "epoch": 0.14, + "learning_rate": 1.7181857015261542e-07, + "loss": 0.4027, + "step": 7307 + }, + { + "epoch": 0.14, + "learning_rate": 1.718146868082793e-07, + "loss": 0.0073, + "step": 7308 + }, + { + "epoch": 0.14, + "learning_rate": 1.7181080346394314e-07, + "loss": 0.0083, + "step": 7309 + }, + { + "epoch": 0.14, + "learning_rate": 1.71806920119607e-07, + "loss": 0.0061, + "step": 7310 + }, + { + "epoch": 0.14, + "learning_rate": 1.7180303677527085e-07, + "loss": 0.0199, + "step": 7311 + }, + { + "epoch": 0.14, + "learning_rate": 1.7179915343093472e-07, + "loss": 0.18, + "step": 7312 + }, + { + "epoch": 0.14, + "learning_rate": 1.7179527008659857e-07, + "loss": 0.3257, + "step": 7313 + }, + { + "epoch": 0.14, + "learning_rate": 1.7179138674226244e-07, + "loss": 0.3548, + "step": 7314 + }, + { + "epoch": 0.14, + "learning_rate": 1.7178750339792628e-07, + "loss": 0.0356, + "step": 7315 + }, + { + "epoch": 0.14, + "learning_rate": 1.7178362005359016e-07, + "loss": 0.2959, + "step": 7316 + }, + { + "epoch": 0.14, + "learning_rate": 1.71779736709254e-07, + "loss": 0.006, + "step": 7317 + }, + { + "epoch": 0.14, + "learning_rate": 1.7177585336491787e-07, + "loss": 0.0135, + "step": 7318 + }, + { + "epoch": 0.14, + "learning_rate": 1.7177197002058172e-07, + "loss": 0.0055, + "step": 7319 + }, + { + "epoch": 0.14, + "learning_rate": 1.717680866762456e-07, + "loss": 1.3694, + "step": 7320 + }, + { + "epoch": 0.14, + "learning_rate": 1.7176420333190943e-07, + "loss": 0.0056, + "step": 7321 + }, + { + "epoch": 0.14, + "learning_rate": 1.717603199875733e-07, + "loss": 0.0101, + "step": 7322 + }, + { + "epoch": 0.14, + "learning_rate": 1.7175643664323715e-07, + "loss": 0.0153, + "step": 7323 + }, + { + "epoch": 0.14, + "learning_rate": 1.7175255329890102e-07, + "loss": 0.1179, + "step": 7324 + }, + { + "epoch": 0.14, + "learning_rate": 1.7174866995456487e-07, + "loss": 0.3398, + "step": 7325 + }, + { + "epoch": 0.14, + "learning_rate": 1.7174478661022874e-07, + "loss": 0.2424, + "step": 7326 + }, + { + "epoch": 0.14, + "learning_rate": 1.7174090326589258e-07, + "loss": 0.0058, + "step": 7327 + }, + { + "epoch": 0.14, + "learning_rate": 1.7173701992155646e-07, + "loss": 0.9532, + "step": 7328 + }, + { + "epoch": 0.14, + "learning_rate": 1.7173313657722027e-07, + "loss": 0.6752, + "step": 7329 + }, + { + "epoch": 0.14, + "learning_rate": 1.7172925323288415e-07, + "loss": 0.3366, + "step": 7330 + }, + { + "epoch": 0.14, + "learning_rate": 1.71725369888548e-07, + "loss": 0.4784, + "step": 7331 + }, + { + "epoch": 0.14, + "learning_rate": 1.7172148654421186e-07, + "loss": 0.0113, + "step": 7332 + }, + { + "epoch": 0.14, + "learning_rate": 1.717176031998757e-07, + "loss": 0.0073, + "step": 7333 + }, + { + "epoch": 0.14, + "learning_rate": 1.7171371985553958e-07, + "loss": 0.0108, + "step": 7334 + }, + { + "epoch": 0.14, + "learning_rate": 1.7170983651120342e-07, + "loss": 0.0076, + "step": 7335 + }, + { + "epoch": 0.14, + "learning_rate": 1.717059531668673e-07, + "loss": 0.0075, + "step": 7336 + }, + { + "epoch": 0.14, + "learning_rate": 1.7170206982253114e-07, + "loss": 0.0078, + "step": 7337 + }, + { + "epoch": 0.14, + "learning_rate": 1.71698186478195e-07, + "loss": 0.0066, + "step": 7338 + }, + { + "epoch": 0.14, + "learning_rate": 1.7169430313385886e-07, + "loss": 0.0048, + "step": 7339 + }, + { + "epoch": 0.14, + "learning_rate": 1.7169041978952273e-07, + "loss": 0.02, + "step": 7340 + }, + { + "epoch": 0.14, + "learning_rate": 1.7168653644518657e-07, + "loss": 0.0068, + "step": 7341 + }, + { + "epoch": 0.14, + "learning_rate": 1.7168265310085044e-07, + "loss": 0.0076, + "step": 7342 + }, + { + "epoch": 0.14, + "learning_rate": 1.716787697565143e-07, + "loss": 0.0861, + "step": 7343 + }, + { + "epoch": 0.14, + "learning_rate": 1.7167488641217816e-07, + "loss": 0.0215, + "step": 7344 + }, + { + "epoch": 0.14, + "learning_rate": 1.71671003067842e-07, + "loss": 0.0065, + "step": 7345 + }, + { + "epoch": 0.14, + "learning_rate": 1.7166711972350588e-07, + "loss": 0.0221, + "step": 7346 + }, + { + "epoch": 0.14, + "learning_rate": 1.7166323637916972e-07, + "loss": 0.0091, + "step": 7347 + }, + { + "epoch": 0.14, + "learning_rate": 1.716593530348336e-07, + "loss": 0.0063, + "step": 7348 + }, + { + "epoch": 0.14, + "learning_rate": 1.7165546969049744e-07, + "loss": 0.0066, + "step": 7349 + }, + { + "epoch": 0.14, + "learning_rate": 1.716515863461613e-07, + "loss": 0.007, + "step": 7350 + }, + { + "epoch": 0.14, + "learning_rate": 1.7164770300182515e-07, + "loss": 0.0146, + "step": 7351 + }, + { + "epoch": 0.14, + "learning_rate": 1.7164381965748903e-07, + "loss": 0.0076, + "step": 7352 + }, + { + "epoch": 0.14, + "learning_rate": 1.7163993631315287e-07, + "loss": 0.0184, + "step": 7353 + }, + { + "epoch": 0.14, + "learning_rate": 1.7163605296881674e-07, + "loss": 0.0129, + "step": 7354 + }, + { + "epoch": 0.14, + "learning_rate": 1.716321696244806e-07, + "loss": 0.412, + "step": 7355 + }, + { + "epoch": 0.14, + "learning_rate": 1.7162828628014446e-07, + "loss": 0.0057, + "step": 7356 + }, + { + "epoch": 0.14, + "learning_rate": 1.716244029358083e-07, + "loss": 0.0073, + "step": 7357 + }, + { + "epoch": 0.14, + "learning_rate": 1.7162051959147218e-07, + "loss": 0.0083, + "step": 7358 + }, + { + "epoch": 0.14, + "learning_rate": 1.7161663624713602e-07, + "loss": 0.0059, + "step": 7359 + }, + { + "epoch": 0.14, + "learning_rate": 1.716127529027999e-07, + "loss": 0.0284, + "step": 7360 + }, + { + "epoch": 0.14, + "learning_rate": 1.7160886955846374e-07, + "loss": 0.3068, + "step": 7361 + }, + { + "epoch": 0.14, + "learning_rate": 1.716049862141276e-07, + "loss": 0.0239, + "step": 7362 + }, + { + "epoch": 0.14, + "learning_rate": 1.7160110286979145e-07, + "loss": 0.0059, + "step": 7363 + }, + { + "epoch": 0.14, + "learning_rate": 1.7159721952545533e-07, + "loss": 0.1067, + "step": 7364 + }, + { + "epoch": 0.14, + "learning_rate": 1.7159333618111917e-07, + "loss": 0.008, + "step": 7365 + }, + { + "epoch": 0.14, + "learning_rate": 1.7158945283678304e-07, + "loss": 0.0087, + "step": 7366 + }, + { + "epoch": 0.14, + "learning_rate": 1.715855694924469e-07, + "loss": 0.0069, + "step": 7367 + }, + { + "epoch": 0.14, + "learning_rate": 1.7158168614811076e-07, + "loss": 0.011, + "step": 7368 + }, + { + "epoch": 0.14, + "learning_rate": 1.715778028037746e-07, + "loss": 0.0058, + "step": 7369 + }, + { + "epoch": 0.14, + "learning_rate": 1.7157391945943847e-07, + "loss": 0.0129, + "step": 7370 + }, + { + "epoch": 0.14, + "learning_rate": 1.7157003611510232e-07, + "loss": 0.0114, + "step": 7371 + }, + { + "epoch": 0.14, + "learning_rate": 1.715661527707662e-07, + "loss": 0.0901, + "step": 7372 + }, + { + "epoch": 0.14, + "learning_rate": 1.7156226942643004e-07, + "loss": 0.0082, + "step": 7373 + }, + { + "epoch": 0.14, + "learning_rate": 1.715583860820939e-07, + "loss": 0.0066, + "step": 7374 + }, + { + "epoch": 0.14, + "learning_rate": 1.7155450273775775e-07, + "loss": 0.0069, + "step": 7375 + }, + { + "epoch": 0.14, + "learning_rate": 1.7155061939342162e-07, + "loss": 0.0066, + "step": 7376 + }, + { + "epoch": 0.14, + "learning_rate": 1.7154673604908547e-07, + "loss": 0.0064, + "step": 7377 + }, + { + "epoch": 0.14, + "learning_rate": 1.7154285270474934e-07, + "loss": 0.1136, + "step": 7378 + }, + { + "epoch": 0.14, + "learning_rate": 1.7153896936041319e-07, + "loss": 0.005, + "step": 7379 + }, + { + "epoch": 0.14, + "learning_rate": 1.7153508601607706e-07, + "loss": 0.0342, + "step": 7380 + }, + { + "epoch": 0.14, + "learning_rate": 1.715312026717409e-07, + "loss": 0.0122, + "step": 7381 + }, + { + "epoch": 0.14, + "learning_rate": 1.7152731932740477e-07, + "loss": 0.0087, + "step": 7382 + }, + { + "epoch": 0.14, + "learning_rate": 1.7152343598306862e-07, + "loss": 0.6147, + "step": 7383 + }, + { + "epoch": 0.14, + "learning_rate": 1.715195526387325e-07, + "loss": 0.0116, + "step": 7384 + }, + { + "epoch": 0.14, + "learning_rate": 1.7151566929439634e-07, + "loss": 0.0063, + "step": 7385 + }, + { + "epoch": 0.14, + "learning_rate": 1.715117859500602e-07, + "loss": 0.0068, + "step": 7386 + }, + { + "epoch": 0.14, + "learning_rate": 1.7150790260572403e-07, + "loss": 0.0069, + "step": 7387 + }, + { + "epoch": 0.14, + "learning_rate": 1.715040192613879e-07, + "loss": 0.0093, + "step": 7388 + }, + { + "epoch": 0.14, + "learning_rate": 1.7150013591705174e-07, + "loss": 0.1015, + "step": 7389 + }, + { + "epoch": 0.14, + "learning_rate": 1.7149625257271561e-07, + "loss": 0.0091, + "step": 7390 + }, + { + "epoch": 0.14, + "learning_rate": 1.7149236922837946e-07, + "loss": 0.1243, + "step": 7391 + }, + { + "epoch": 0.14, + "learning_rate": 1.7148848588404333e-07, + "loss": 0.0185, + "step": 7392 + }, + { + "epoch": 0.14, + "learning_rate": 1.7148460253970717e-07, + "loss": 0.0068, + "step": 7393 + }, + { + "epoch": 0.14, + "learning_rate": 1.7148071919537105e-07, + "loss": 0.0438, + "step": 7394 + }, + { + "epoch": 0.14, + "learning_rate": 1.714768358510349e-07, + "loss": 0.0085, + "step": 7395 + }, + { + "epoch": 0.14, + "learning_rate": 1.7147295250669876e-07, + "loss": 0.0062, + "step": 7396 + }, + { + "epoch": 0.14, + "learning_rate": 1.714690691623626e-07, + "loss": 0.0153, + "step": 7397 + }, + { + "epoch": 0.14, + "learning_rate": 1.7146518581802648e-07, + "loss": 0.8813, + "step": 7398 + }, + { + "epoch": 0.14, + "learning_rate": 1.7146130247369032e-07, + "loss": 0.0119, + "step": 7399 + }, + { + "epoch": 0.14, + "learning_rate": 1.714574191293542e-07, + "loss": 0.0208, + "step": 7400 + }, + { + "epoch": 0.14, + "learning_rate": 1.7145353578501804e-07, + "loss": 0.4582, + "step": 7401 + }, + { + "epoch": 0.14, + "learning_rate": 1.714496524406819e-07, + "loss": 0.0073, + "step": 7402 + }, + { + "epoch": 0.14, + "learning_rate": 1.7144576909634576e-07, + "loss": 0.0304, + "step": 7403 + }, + { + "epoch": 0.14, + "learning_rate": 1.7144188575200963e-07, + "loss": 0.0057, + "step": 7404 + }, + { + "epoch": 0.14, + "learning_rate": 1.7143800240767347e-07, + "loss": 0.0168, + "step": 7405 + }, + { + "epoch": 0.14, + "learning_rate": 1.7143411906333735e-07, + "loss": 0.0552, + "step": 7406 + }, + { + "epoch": 0.14, + "learning_rate": 1.714302357190012e-07, + "loss": 0.0218, + "step": 7407 + }, + { + "epoch": 0.14, + "learning_rate": 1.7142635237466506e-07, + "loss": 0.0065, + "step": 7408 + }, + { + "epoch": 0.14, + "learning_rate": 1.714224690303289e-07, + "loss": 0.376, + "step": 7409 + }, + { + "epoch": 0.14, + "learning_rate": 1.7141858568599278e-07, + "loss": 0.1396, + "step": 7410 + }, + { + "epoch": 0.14, + "learning_rate": 1.7141470234165662e-07, + "loss": 0.2576, + "step": 7411 + }, + { + "epoch": 0.14, + "learning_rate": 1.714108189973205e-07, + "loss": 0.0065, + "step": 7412 + }, + { + "epoch": 0.14, + "learning_rate": 1.7140693565298434e-07, + "loss": 0.3, + "step": 7413 + }, + { + "epoch": 0.14, + "learning_rate": 1.714030523086482e-07, + "loss": 0.0366, + "step": 7414 + }, + { + "epoch": 0.14, + "learning_rate": 1.7139916896431206e-07, + "loss": 0.0059, + "step": 7415 + }, + { + "epoch": 0.14, + "learning_rate": 1.7139528561997593e-07, + "loss": 0.0066, + "step": 7416 + }, + { + "epoch": 0.14, + "learning_rate": 1.7139140227563977e-07, + "loss": 0.0066, + "step": 7417 + }, + { + "epoch": 0.14, + "learning_rate": 1.7138751893130364e-07, + "loss": 0.2997, + "step": 7418 + }, + { + "epoch": 0.14, + "learning_rate": 1.713836355869675e-07, + "loss": 0.5133, + "step": 7419 + }, + { + "epoch": 0.14, + "learning_rate": 1.7137975224263136e-07, + "loss": 0.0059, + "step": 7420 + }, + { + "epoch": 0.14, + "learning_rate": 1.713758688982952e-07, + "loss": 0.0067, + "step": 7421 + }, + { + "epoch": 0.14, + "learning_rate": 1.7137198555395908e-07, + "loss": 0.0074, + "step": 7422 + }, + { + "epoch": 0.14, + "learning_rate": 1.7136810220962292e-07, + "loss": 0.0064, + "step": 7423 + }, + { + "epoch": 0.14, + "learning_rate": 1.713642188652868e-07, + "loss": 0.0085, + "step": 7424 + }, + { + "epoch": 0.14, + "learning_rate": 1.7136033552095064e-07, + "loss": 0.0079, + "step": 7425 + }, + { + "epoch": 0.14, + "learning_rate": 1.7135645217661448e-07, + "loss": 0.0063, + "step": 7426 + }, + { + "epoch": 0.14, + "learning_rate": 1.7135256883227836e-07, + "loss": 0.0139, + "step": 7427 + }, + { + "epoch": 0.14, + "learning_rate": 1.713486854879422e-07, + "loss": 0.0065, + "step": 7428 + }, + { + "epoch": 0.14, + "learning_rate": 1.7134480214360607e-07, + "loss": 0.2021, + "step": 7429 + }, + { + "epoch": 0.14, + "learning_rate": 1.7134091879926992e-07, + "loss": 0.2089, + "step": 7430 + }, + { + "epoch": 0.14, + "learning_rate": 1.713370354549338e-07, + "loss": 0.0071, + "step": 7431 + }, + { + "epoch": 0.14, + "learning_rate": 1.7133315211059763e-07, + "loss": 0.0094, + "step": 7432 + }, + { + "epoch": 0.14, + "learning_rate": 1.713292687662615e-07, + "loss": 0.041, + "step": 7433 + }, + { + "epoch": 0.14, + "learning_rate": 1.7132538542192535e-07, + "loss": 0.0723, + "step": 7434 + }, + { + "epoch": 0.14, + "learning_rate": 1.7132150207758922e-07, + "loss": 0.0152, + "step": 7435 + }, + { + "epoch": 0.14, + "learning_rate": 1.7131761873325307e-07, + "loss": 0.0099, + "step": 7436 + }, + { + "epoch": 0.14, + "learning_rate": 1.7131373538891694e-07, + "loss": 1.1, + "step": 7437 + }, + { + "epoch": 0.14, + "learning_rate": 1.7130985204458078e-07, + "loss": 0.0098, + "step": 7438 + }, + { + "epoch": 0.14, + "learning_rate": 1.7130596870024465e-07, + "loss": 0.0098, + "step": 7439 + }, + { + "epoch": 0.14, + "learning_rate": 1.713020853559085e-07, + "loss": 0.0422, + "step": 7440 + }, + { + "epoch": 0.14, + "learning_rate": 1.7129820201157237e-07, + "loss": 0.5059, + "step": 7441 + }, + { + "epoch": 0.14, + "learning_rate": 1.7129431866723622e-07, + "loss": 0.1998, + "step": 7442 + }, + { + "epoch": 0.14, + "learning_rate": 1.712904353229001e-07, + "loss": 0.012, + "step": 7443 + }, + { + "epoch": 0.14, + "learning_rate": 1.7128655197856393e-07, + "loss": 0.2335, + "step": 7444 + }, + { + "epoch": 0.14, + "learning_rate": 1.7128266863422778e-07, + "loss": 0.0205, + "step": 7445 + }, + { + "epoch": 0.14, + "learning_rate": 1.7127878528989165e-07, + "loss": 0.7916, + "step": 7446 + }, + { + "epoch": 0.14, + "learning_rate": 1.712749019455555e-07, + "loss": 0.0115, + "step": 7447 + }, + { + "epoch": 0.14, + "learning_rate": 1.7127101860121936e-07, + "loss": 0.0089, + "step": 7448 + }, + { + "epoch": 0.14, + "learning_rate": 1.712671352568832e-07, + "loss": 0.0055, + "step": 7449 + }, + { + "epoch": 0.14, + "learning_rate": 1.7126325191254708e-07, + "loss": 0.0115, + "step": 7450 + }, + { + "epoch": 0.14, + "learning_rate": 1.7125936856821093e-07, + "loss": 0.0103, + "step": 7451 + }, + { + "epoch": 0.14, + "learning_rate": 1.712554852238748e-07, + "loss": 0.0107, + "step": 7452 + }, + { + "epoch": 0.14, + "learning_rate": 1.7125160187953864e-07, + "loss": 0.0079, + "step": 7453 + }, + { + "epoch": 0.14, + "learning_rate": 1.712477185352025e-07, + "loss": 0.0139, + "step": 7454 + }, + { + "epoch": 0.14, + "learning_rate": 1.7124383519086636e-07, + "loss": 0.0076, + "step": 7455 + }, + { + "epoch": 0.14, + "learning_rate": 1.712399518465302e-07, + "loss": 0.252, + "step": 7456 + }, + { + "epoch": 0.14, + "learning_rate": 1.7123606850219408e-07, + "loss": 0.2393, + "step": 7457 + }, + { + "epoch": 0.14, + "learning_rate": 1.7123218515785792e-07, + "loss": 0.005, + "step": 7458 + }, + { + "epoch": 0.14, + "learning_rate": 1.712283018135218e-07, + "loss": 0.0106, + "step": 7459 + }, + { + "epoch": 0.14, + "learning_rate": 1.7122441846918564e-07, + "loss": 0.3203, + "step": 7460 + }, + { + "epoch": 0.14, + "learning_rate": 1.712205351248495e-07, + "loss": 0.0068, + "step": 7461 + }, + { + "epoch": 0.14, + "learning_rate": 1.7121665178051335e-07, + "loss": 0.0128, + "step": 7462 + }, + { + "epoch": 0.14, + "learning_rate": 1.7121276843617723e-07, + "loss": 0.1507, + "step": 7463 + }, + { + "epoch": 0.14, + "learning_rate": 1.7120888509184107e-07, + "loss": 0.0077, + "step": 7464 + }, + { + "epoch": 0.14, + "learning_rate": 1.7120500174750494e-07, + "loss": 0.0141, + "step": 7465 + }, + { + "epoch": 0.14, + "learning_rate": 1.712011184031688e-07, + "loss": 0.0053, + "step": 7466 + }, + { + "epoch": 0.14, + "learning_rate": 1.7119723505883266e-07, + "loss": 0.0111, + "step": 7467 + }, + { + "epoch": 0.14, + "learning_rate": 1.711933517144965e-07, + "loss": 0.0137, + "step": 7468 + }, + { + "epoch": 0.14, + "learning_rate": 1.7118946837016037e-07, + "loss": 0.4072, + "step": 7469 + }, + { + "epoch": 0.14, + "learning_rate": 1.7118558502582422e-07, + "loss": 0.0086, + "step": 7470 + }, + { + "epoch": 0.14, + "learning_rate": 1.711817016814881e-07, + "loss": 0.0065, + "step": 7471 + }, + { + "epoch": 0.14, + "learning_rate": 1.7117781833715194e-07, + "loss": 0.009, + "step": 7472 + }, + { + "epoch": 0.14, + "learning_rate": 1.711739349928158e-07, + "loss": 0.0184, + "step": 7473 + }, + { + "epoch": 0.14, + "learning_rate": 1.7117005164847965e-07, + "loss": 0.0147, + "step": 7474 + }, + { + "epoch": 0.14, + "learning_rate": 1.7116616830414352e-07, + "loss": 0.0072, + "step": 7475 + }, + { + "epoch": 0.15, + "learning_rate": 1.7116228495980737e-07, + "loss": 0.0065, + "step": 7476 + }, + { + "epoch": 0.15, + "learning_rate": 1.7115840161547124e-07, + "loss": 0.2186, + "step": 7477 + }, + { + "epoch": 0.15, + "learning_rate": 1.7115451827113509e-07, + "loss": 0.0094, + "step": 7478 + }, + { + "epoch": 0.15, + "learning_rate": 1.7115063492679896e-07, + "loss": 0.0082, + "step": 7479 + }, + { + "epoch": 0.15, + "learning_rate": 1.711467515824628e-07, + "loss": 0.2938, + "step": 7480 + }, + { + "epoch": 0.15, + "learning_rate": 1.7114286823812667e-07, + "loss": 0.0316, + "step": 7481 + }, + { + "epoch": 0.15, + "learning_rate": 1.7113898489379052e-07, + "loss": 0.0109, + "step": 7482 + }, + { + "epoch": 0.15, + "learning_rate": 1.711351015494544e-07, + "loss": 0.06, + "step": 7483 + }, + { + "epoch": 0.15, + "learning_rate": 1.7113121820511824e-07, + "loss": 0.0107, + "step": 7484 + }, + { + "epoch": 0.15, + "learning_rate": 1.711273348607821e-07, + "loss": 0.0067, + "step": 7485 + }, + { + "epoch": 0.15, + "learning_rate": 1.7112345151644595e-07, + "loss": 0.0075, + "step": 7486 + }, + { + "epoch": 0.15, + "learning_rate": 1.7111956817210982e-07, + "loss": 0.969, + "step": 7487 + }, + { + "epoch": 0.15, + "learning_rate": 1.7111568482777367e-07, + "loss": 0.0065, + "step": 7488 + }, + { + "epoch": 0.15, + "learning_rate": 1.7111180148343754e-07, + "loss": 0.1694, + "step": 7489 + }, + { + "epoch": 0.15, + "learning_rate": 1.7110791813910138e-07, + "loss": 0.0072, + "step": 7490 + }, + { + "epoch": 0.15, + "learning_rate": 1.7110403479476526e-07, + "loss": 0.3395, + "step": 7491 + }, + { + "epoch": 0.15, + "learning_rate": 1.711001514504291e-07, + "loss": 0.0059, + "step": 7492 + }, + { + "epoch": 0.15, + "learning_rate": 1.7109626810609297e-07, + "loss": 0.0063, + "step": 7493 + }, + { + "epoch": 0.15, + "learning_rate": 1.7109238476175682e-07, + "loss": 0.0066, + "step": 7494 + }, + { + "epoch": 0.15, + "learning_rate": 1.710885014174207e-07, + "loss": 0.1951, + "step": 7495 + }, + { + "epoch": 0.15, + "learning_rate": 1.7108461807308453e-07, + "loss": 0.0088, + "step": 7496 + }, + { + "epoch": 0.15, + "learning_rate": 1.710807347287484e-07, + "loss": 0.0295, + "step": 7497 + }, + { + "epoch": 0.15, + "learning_rate": 1.7107685138441225e-07, + "loss": 0.0364, + "step": 7498 + }, + { + "epoch": 0.15, + "learning_rate": 1.7107296804007612e-07, + "loss": 0.0079, + "step": 7499 + }, + { + "epoch": 0.15, + "learning_rate": 1.7106908469573997e-07, + "loss": 0.0064, + "step": 7500 + }, + { + "epoch": 0.15, + "learning_rate": 1.7106520135140384e-07, + "loss": 0.0054, + "step": 7501 + }, + { + "epoch": 0.15, + "learning_rate": 1.7106131800706768e-07, + "loss": 0.0114, + "step": 7502 + }, + { + "epoch": 0.15, + "learning_rate": 1.7105743466273153e-07, + "loss": 0.4131, + "step": 7503 + }, + { + "epoch": 0.15, + "learning_rate": 1.7105355131839537e-07, + "loss": 0.0064, + "step": 7504 + }, + { + "epoch": 0.15, + "learning_rate": 1.7104966797405925e-07, + "loss": 0.007, + "step": 7505 + }, + { + "epoch": 0.15, + "learning_rate": 1.710457846297231e-07, + "loss": 0.0769, + "step": 7506 + }, + { + "epoch": 0.15, + "learning_rate": 1.7104190128538696e-07, + "loss": 0.0051, + "step": 7507 + }, + { + "epoch": 0.15, + "learning_rate": 1.710380179410508e-07, + "loss": 0.0269, + "step": 7508 + }, + { + "epoch": 0.15, + "learning_rate": 1.7103413459671468e-07, + "loss": 0.0072, + "step": 7509 + }, + { + "epoch": 0.15, + "learning_rate": 1.7103025125237852e-07, + "loss": 0.0123, + "step": 7510 + }, + { + "epoch": 0.15, + "learning_rate": 1.710263679080424e-07, + "loss": 0.0062, + "step": 7511 + }, + { + "epoch": 0.15, + "learning_rate": 1.7102248456370624e-07, + "loss": 0.0072, + "step": 7512 + }, + { + "epoch": 0.15, + "learning_rate": 1.710186012193701e-07, + "loss": 0.0148, + "step": 7513 + }, + { + "epoch": 0.15, + "learning_rate": 1.7101471787503396e-07, + "loss": 0.0073, + "step": 7514 + }, + { + "epoch": 0.15, + "learning_rate": 1.7101083453069783e-07, + "loss": 0.0087, + "step": 7515 + }, + { + "epoch": 0.15, + "learning_rate": 1.7100695118636167e-07, + "loss": 0.0075, + "step": 7516 + }, + { + "epoch": 0.15, + "learning_rate": 1.7100306784202554e-07, + "loss": 0.2034, + "step": 7517 + }, + { + "epoch": 0.15, + "learning_rate": 1.709991844976894e-07, + "loss": 0.1231, + "step": 7518 + }, + { + "epoch": 0.15, + "learning_rate": 1.7099530115335326e-07, + "loss": 0.0056, + "step": 7519 + }, + { + "epoch": 0.15, + "learning_rate": 1.709914178090171e-07, + "loss": 0.0094, + "step": 7520 + }, + { + "epoch": 0.15, + "learning_rate": 1.7098753446468098e-07, + "loss": 0.0122, + "step": 7521 + }, + { + "epoch": 0.15, + "learning_rate": 1.7098365112034482e-07, + "loss": 0.0113, + "step": 7522 + }, + { + "epoch": 0.15, + "learning_rate": 1.709797677760087e-07, + "loss": 0.0617, + "step": 7523 + }, + { + "epoch": 0.15, + "learning_rate": 1.7097588443167254e-07, + "loss": 0.0229, + "step": 7524 + }, + { + "epoch": 0.15, + "learning_rate": 1.709720010873364e-07, + "loss": 0.4643, + "step": 7525 + }, + { + "epoch": 0.15, + "learning_rate": 1.7096811774300026e-07, + "loss": 0.0105, + "step": 7526 + }, + { + "epoch": 0.15, + "learning_rate": 1.7096423439866413e-07, + "loss": 0.0066, + "step": 7527 + }, + { + "epoch": 0.15, + "learning_rate": 1.7096035105432797e-07, + "loss": 0.2348, + "step": 7528 + }, + { + "epoch": 0.15, + "learning_rate": 1.7095646770999184e-07, + "loss": 0.2264, + "step": 7529 + }, + { + "epoch": 0.15, + "learning_rate": 1.709525843656557e-07, + "loss": 0.01, + "step": 7530 + }, + { + "epoch": 0.15, + "learning_rate": 1.7094870102131956e-07, + "loss": 0.0075, + "step": 7531 + }, + { + "epoch": 0.15, + "learning_rate": 1.709448176769834e-07, + "loss": 0.0059, + "step": 7532 + }, + { + "epoch": 0.15, + "learning_rate": 1.7094093433264728e-07, + "loss": 0.0054, + "step": 7533 + }, + { + "epoch": 0.15, + "learning_rate": 1.7093705098831112e-07, + "loss": 0.0131, + "step": 7534 + }, + { + "epoch": 0.15, + "learning_rate": 1.70933167643975e-07, + "loss": 0.772, + "step": 7535 + }, + { + "epoch": 0.15, + "learning_rate": 1.7092928429963884e-07, + "loss": 0.0093, + "step": 7536 + }, + { + "epoch": 0.15, + "learning_rate": 1.709254009553027e-07, + "loss": 0.0154, + "step": 7537 + }, + { + "epoch": 0.15, + "learning_rate": 1.7092151761096655e-07, + "loss": 0.006, + "step": 7538 + }, + { + "epoch": 0.15, + "learning_rate": 1.7091763426663043e-07, + "loss": 0.4642, + "step": 7539 + }, + { + "epoch": 0.15, + "learning_rate": 1.7091375092229427e-07, + "loss": 0.1034, + "step": 7540 + }, + { + "epoch": 0.15, + "learning_rate": 1.7090986757795814e-07, + "loss": 0.0099, + "step": 7541 + }, + { + "epoch": 0.15, + "learning_rate": 1.70905984233622e-07, + "loss": 0.0516, + "step": 7542 + }, + { + "epoch": 0.15, + "learning_rate": 1.7090210088928586e-07, + "loss": 0.0082, + "step": 7543 + }, + { + "epoch": 0.15, + "learning_rate": 1.708982175449497e-07, + "loss": 0.2002, + "step": 7544 + }, + { + "epoch": 0.15, + "learning_rate": 1.7089433420061357e-07, + "loss": 0.4014, + "step": 7545 + }, + { + "epoch": 0.15, + "learning_rate": 1.7089045085627742e-07, + "loss": 0.0091, + "step": 7546 + }, + { + "epoch": 0.15, + "learning_rate": 1.708865675119413e-07, + "loss": 0.0226, + "step": 7547 + }, + { + "epoch": 0.15, + "learning_rate": 1.7088268416760514e-07, + "loss": 0.0051, + "step": 7548 + }, + { + "epoch": 0.15, + "learning_rate": 1.70878800823269e-07, + "loss": 0.0097, + "step": 7549 + }, + { + "epoch": 0.15, + "learning_rate": 1.7087491747893285e-07, + "loss": 0.0087, + "step": 7550 + }, + { + "epoch": 0.15, + "learning_rate": 1.7087103413459672e-07, + "loss": 0.0095, + "step": 7551 + }, + { + "epoch": 0.15, + "learning_rate": 1.7086715079026057e-07, + "loss": 0.0061, + "step": 7552 + }, + { + "epoch": 0.15, + "learning_rate": 1.7086326744592444e-07, + "loss": 0.0276, + "step": 7553 + }, + { + "epoch": 0.15, + "learning_rate": 1.7085938410158829e-07, + "loss": 0.0066, + "step": 7554 + }, + { + "epoch": 0.15, + "learning_rate": 1.7085550075725216e-07, + "loss": 0.0053, + "step": 7555 + }, + { + "epoch": 0.15, + "learning_rate": 1.70851617412916e-07, + "loss": 0.0072, + "step": 7556 + }, + { + "epoch": 0.15, + "learning_rate": 1.7084773406857987e-07, + "loss": 0.0065, + "step": 7557 + }, + { + "epoch": 0.15, + "learning_rate": 1.7084385072424372e-07, + "loss": 0.0078, + "step": 7558 + }, + { + "epoch": 0.15, + "learning_rate": 1.708399673799076e-07, + "loss": 0.0072, + "step": 7559 + }, + { + "epoch": 0.15, + "learning_rate": 1.7083608403557144e-07, + "loss": 0.3681, + "step": 7560 + }, + { + "epoch": 0.15, + "learning_rate": 1.7083220069123528e-07, + "loss": 0.8505, + "step": 7561 + }, + { + "epoch": 0.15, + "learning_rate": 1.7082831734689913e-07, + "loss": 0.0055, + "step": 7562 + }, + { + "epoch": 0.15, + "learning_rate": 1.70824434002563e-07, + "loss": 0.0068, + "step": 7563 + }, + { + "epoch": 0.15, + "learning_rate": 1.7082055065822684e-07, + "loss": 0.0084, + "step": 7564 + }, + { + "epoch": 0.15, + "learning_rate": 1.7081666731389071e-07, + "loss": 0.0088, + "step": 7565 + }, + { + "epoch": 0.15, + "learning_rate": 1.7081278396955456e-07, + "loss": 0.083, + "step": 7566 + }, + { + "epoch": 0.15, + "learning_rate": 1.7080890062521843e-07, + "loss": 0.0114, + "step": 7567 + }, + { + "epoch": 0.15, + "learning_rate": 1.7080501728088227e-07, + "loss": 0.0056, + "step": 7568 + }, + { + "epoch": 0.15, + "learning_rate": 1.7080113393654615e-07, + "loss": 0.17, + "step": 7569 + }, + { + "epoch": 0.15, + "learning_rate": 1.7079725059221e-07, + "loss": 0.0066, + "step": 7570 + }, + { + "epoch": 0.15, + "learning_rate": 1.7079336724787386e-07, + "loss": 0.0068, + "step": 7571 + }, + { + "epoch": 0.15, + "learning_rate": 1.707894839035377e-07, + "loss": 0.022, + "step": 7572 + }, + { + "epoch": 0.15, + "learning_rate": 1.7078560055920158e-07, + "loss": 0.0062, + "step": 7573 + }, + { + "epoch": 0.15, + "learning_rate": 1.7078171721486542e-07, + "loss": 0.0064, + "step": 7574 + }, + { + "epoch": 0.15, + "learning_rate": 1.707778338705293e-07, + "loss": 0.0079, + "step": 7575 + }, + { + "epoch": 0.15, + "learning_rate": 1.7077395052619314e-07, + "loss": 0.4148, + "step": 7576 + }, + { + "epoch": 0.15, + "learning_rate": 1.70770067181857e-07, + "loss": 0.2178, + "step": 7577 + }, + { + "epoch": 0.15, + "learning_rate": 1.7076618383752086e-07, + "loss": 0.0063, + "step": 7578 + }, + { + "epoch": 0.15, + "learning_rate": 1.7076230049318473e-07, + "loss": 0.1888, + "step": 7579 + }, + { + "epoch": 0.15, + "learning_rate": 1.7075841714884857e-07, + "loss": 0.0053, + "step": 7580 + }, + { + "epoch": 0.15, + "learning_rate": 1.7075453380451245e-07, + "loss": 0.0104, + "step": 7581 + }, + { + "epoch": 0.15, + "learning_rate": 1.707506504601763e-07, + "loss": 0.0069, + "step": 7582 + }, + { + "epoch": 0.15, + "learning_rate": 1.7074676711584016e-07, + "loss": 0.0073, + "step": 7583 + }, + { + "epoch": 0.15, + "learning_rate": 1.70742883771504e-07, + "loss": 0.0113, + "step": 7584 + }, + { + "epoch": 0.15, + "learning_rate": 1.7073900042716788e-07, + "loss": 0.0048, + "step": 7585 + }, + { + "epoch": 0.15, + "learning_rate": 1.7073511708283172e-07, + "loss": 0.122, + "step": 7586 + }, + { + "epoch": 0.15, + "learning_rate": 1.707312337384956e-07, + "loss": 0.0088, + "step": 7587 + }, + { + "epoch": 0.15, + "learning_rate": 1.7072735039415944e-07, + "loss": 0.1522, + "step": 7588 + }, + { + "epoch": 0.15, + "learning_rate": 1.707234670498233e-07, + "loss": 0.1028, + "step": 7589 + }, + { + "epoch": 0.15, + "learning_rate": 1.7071958370548716e-07, + "loss": 0.0084, + "step": 7590 + }, + { + "epoch": 0.15, + "learning_rate": 1.7071570036115103e-07, + "loss": 0.8826, + "step": 7591 + }, + { + "epoch": 0.15, + "learning_rate": 1.7071181701681487e-07, + "loss": 0.0081, + "step": 7592 + }, + { + "epoch": 0.15, + "learning_rate": 1.7070793367247874e-07, + "loss": 0.0084, + "step": 7593 + }, + { + "epoch": 0.15, + "learning_rate": 1.707040503281426e-07, + "loss": 0.006, + "step": 7594 + }, + { + "epoch": 0.15, + "learning_rate": 1.7070016698380646e-07, + "loss": 0.0102, + "step": 7595 + }, + { + "epoch": 0.15, + "learning_rate": 1.706962836394703e-07, + "loss": 0.0081, + "step": 7596 + }, + { + "epoch": 0.15, + "learning_rate": 1.7069240029513418e-07, + "loss": 0.0072, + "step": 7597 + }, + { + "epoch": 0.15, + "learning_rate": 1.7068851695079802e-07, + "loss": 0.0051, + "step": 7598 + }, + { + "epoch": 0.15, + "learning_rate": 1.706846336064619e-07, + "loss": 0.017, + "step": 7599 + }, + { + "epoch": 0.15, + "learning_rate": 1.7068075026212574e-07, + "loss": 0.0124, + "step": 7600 + }, + { + "epoch": 0.15, + "learning_rate": 1.706768669177896e-07, + "loss": 0.0424, + "step": 7601 + }, + { + "epoch": 0.15, + "learning_rate": 1.7067298357345346e-07, + "loss": 0.6771, + "step": 7602 + }, + { + "epoch": 0.15, + "learning_rate": 1.706691002291173e-07, + "loss": 0.0207, + "step": 7603 + }, + { + "epoch": 0.15, + "learning_rate": 1.7066521688478117e-07, + "loss": 0.0061, + "step": 7604 + }, + { + "epoch": 0.15, + "learning_rate": 1.7066133354044502e-07, + "loss": 0.006, + "step": 7605 + }, + { + "epoch": 0.15, + "learning_rate": 1.706574501961089e-07, + "loss": 0.0055, + "step": 7606 + }, + { + "epoch": 0.15, + "learning_rate": 1.7065356685177273e-07, + "loss": 0.0077, + "step": 7607 + }, + { + "epoch": 0.15, + "learning_rate": 1.706496835074366e-07, + "loss": 0.0081, + "step": 7608 + }, + { + "epoch": 0.15, + "learning_rate": 1.7064580016310045e-07, + "loss": 0.0094, + "step": 7609 + }, + { + "epoch": 0.15, + "learning_rate": 1.7064191681876432e-07, + "loss": 0.0066, + "step": 7610 + }, + { + "epoch": 0.15, + "learning_rate": 1.7063803347442817e-07, + "loss": 0.0066, + "step": 7611 + }, + { + "epoch": 0.15, + "learning_rate": 1.7063415013009204e-07, + "loss": 0.3882, + "step": 7612 + }, + { + "epoch": 0.15, + "learning_rate": 1.7063026678575588e-07, + "loss": 0.0078, + "step": 7613 + }, + { + "epoch": 0.15, + "learning_rate": 1.7062638344141975e-07, + "loss": 0.0081, + "step": 7614 + }, + { + "epoch": 0.15, + "learning_rate": 1.706225000970836e-07, + "loss": 0.034, + "step": 7615 + }, + { + "epoch": 0.15, + "learning_rate": 1.7061861675274747e-07, + "loss": 0.0068, + "step": 7616 + }, + { + "epoch": 0.15, + "learning_rate": 1.7061473340841132e-07, + "loss": 0.2722, + "step": 7617 + }, + { + "epoch": 0.15, + "learning_rate": 1.706108500640752e-07, + "loss": 1.3197, + "step": 7618 + }, + { + "epoch": 0.15, + "learning_rate": 1.7060696671973903e-07, + "loss": 0.0054, + "step": 7619 + }, + { + "epoch": 0.15, + "learning_rate": 1.7060308337540288e-07, + "loss": 0.0076, + "step": 7620 + }, + { + "epoch": 0.15, + "learning_rate": 1.7059920003106675e-07, + "loss": 0.0498, + "step": 7621 + }, + { + "epoch": 0.15, + "learning_rate": 1.705953166867306e-07, + "loss": 0.0064, + "step": 7622 + }, + { + "epoch": 0.15, + "learning_rate": 1.7059143334239447e-07, + "loss": 0.006, + "step": 7623 + }, + { + "epoch": 0.15, + "learning_rate": 1.705875499980583e-07, + "loss": 0.0058, + "step": 7624 + }, + { + "epoch": 0.15, + "learning_rate": 1.7058366665372218e-07, + "loss": 0.0143, + "step": 7625 + }, + { + "epoch": 0.15, + "learning_rate": 1.7057978330938603e-07, + "loss": 0.1398, + "step": 7626 + }, + { + "epoch": 0.15, + "learning_rate": 1.705758999650499e-07, + "loss": 0.0082, + "step": 7627 + }, + { + "epoch": 0.15, + "learning_rate": 1.7057201662071374e-07, + "loss": 0.0502, + "step": 7628 + }, + { + "epoch": 0.15, + "learning_rate": 1.7056813327637761e-07, + "loss": 0.0058, + "step": 7629 + }, + { + "epoch": 0.15, + "learning_rate": 1.7056424993204146e-07, + "loss": 0.0056, + "step": 7630 + }, + { + "epoch": 0.15, + "learning_rate": 1.705603665877053e-07, + "loss": 0.0247, + "step": 7631 + }, + { + "epoch": 0.15, + "learning_rate": 1.7055648324336918e-07, + "loss": 0.0058, + "step": 7632 + }, + { + "epoch": 0.15, + "learning_rate": 1.7055259989903302e-07, + "loss": 0.2732, + "step": 7633 + }, + { + "epoch": 0.15, + "learning_rate": 1.705487165546969e-07, + "loss": 0.0067, + "step": 7634 + }, + { + "epoch": 0.15, + "learning_rate": 1.7054483321036074e-07, + "loss": 0.0661, + "step": 7635 + }, + { + "epoch": 0.15, + "learning_rate": 1.705409498660246e-07, + "loss": 0.0227, + "step": 7636 + }, + { + "epoch": 0.15, + "learning_rate": 1.7053706652168845e-07, + "loss": 0.0058, + "step": 7637 + }, + { + "epoch": 0.15, + "learning_rate": 1.7053318317735233e-07, + "loss": 0.0093, + "step": 7638 + }, + { + "epoch": 0.15, + "learning_rate": 1.7052929983301617e-07, + "loss": 0.0077, + "step": 7639 + }, + { + "epoch": 0.15, + "learning_rate": 1.7052541648868004e-07, + "loss": 0.0057, + "step": 7640 + }, + { + "epoch": 0.15, + "learning_rate": 1.705215331443439e-07, + "loss": 0.6401, + "step": 7641 + }, + { + "epoch": 0.15, + "learning_rate": 1.7051764980000776e-07, + "loss": 0.0077, + "step": 7642 + }, + { + "epoch": 0.15, + "learning_rate": 1.705137664556716e-07, + "loss": 0.4615, + "step": 7643 + }, + { + "epoch": 0.15, + "learning_rate": 1.7050988311133547e-07, + "loss": 0.1018, + "step": 7644 + }, + { + "epoch": 0.15, + "learning_rate": 1.7050599976699932e-07, + "loss": 0.3473, + "step": 7645 + }, + { + "epoch": 0.15, + "learning_rate": 1.705021164226632e-07, + "loss": 0.2262, + "step": 7646 + }, + { + "epoch": 0.15, + "learning_rate": 1.7049823307832704e-07, + "loss": 0.2537, + "step": 7647 + }, + { + "epoch": 0.15, + "learning_rate": 1.704943497339909e-07, + "loss": 0.4212, + "step": 7648 + }, + { + "epoch": 0.15, + "learning_rate": 1.7049046638965475e-07, + "loss": 0.0885, + "step": 7649 + }, + { + "epoch": 0.15, + "learning_rate": 1.7048658304531862e-07, + "loss": 0.0275, + "step": 7650 + }, + { + "epoch": 0.15, + "learning_rate": 1.7048269970098247e-07, + "loss": 0.0053, + "step": 7651 + }, + { + "epoch": 0.15, + "learning_rate": 1.7047881635664634e-07, + "loss": 0.0048, + "step": 7652 + }, + { + "epoch": 0.15, + "learning_rate": 1.7047493301231019e-07, + "loss": 0.0054, + "step": 7653 + }, + { + "epoch": 0.15, + "learning_rate": 1.7047104966797406e-07, + "loss": 0.0056, + "step": 7654 + }, + { + "epoch": 0.15, + "learning_rate": 1.704671663236379e-07, + "loss": 0.005, + "step": 7655 + }, + { + "epoch": 0.15, + "learning_rate": 1.7046328297930177e-07, + "loss": 0.0084, + "step": 7656 + }, + { + "epoch": 0.15, + "learning_rate": 1.7045939963496562e-07, + "loss": 0.0053, + "step": 7657 + }, + { + "epoch": 0.15, + "learning_rate": 1.704555162906295e-07, + "loss": 0.0498, + "step": 7658 + }, + { + "epoch": 0.15, + "learning_rate": 1.7045163294629334e-07, + "loss": 0.0096, + "step": 7659 + }, + { + "epoch": 0.15, + "learning_rate": 1.704477496019572e-07, + "loss": 0.0062, + "step": 7660 + }, + { + "epoch": 0.15, + "learning_rate": 1.7044386625762105e-07, + "loss": 0.0068, + "step": 7661 + }, + { + "epoch": 0.15, + "learning_rate": 1.7043998291328492e-07, + "loss": 0.0145, + "step": 7662 + }, + { + "epoch": 0.15, + "learning_rate": 1.7043609956894877e-07, + "loss": 0.0785, + "step": 7663 + }, + { + "epoch": 0.15, + "learning_rate": 1.7043221622461264e-07, + "loss": 0.0151, + "step": 7664 + }, + { + "epoch": 0.15, + "learning_rate": 1.7042833288027648e-07, + "loss": 0.2727, + "step": 7665 + }, + { + "epoch": 0.15, + "learning_rate": 1.7042444953594036e-07, + "loss": 0.3489, + "step": 7666 + }, + { + "epoch": 0.15, + "learning_rate": 1.704205661916042e-07, + "loss": 0.0075, + "step": 7667 + }, + { + "epoch": 0.15, + "learning_rate": 1.7041668284726807e-07, + "loss": 0.0083, + "step": 7668 + }, + { + "epoch": 0.15, + "learning_rate": 1.7041279950293192e-07, + "loss": 0.0129, + "step": 7669 + }, + { + "epoch": 0.15, + "learning_rate": 1.704089161585958e-07, + "loss": 0.4541, + "step": 7670 + }, + { + "epoch": 0.15, + "learning_rate": 1.7040503281425963e-07, + "loss": 0.0146, + "step": 7671 + }, + { + "epoch": 0.15, + "learning_rate": 1.704011494699235e-07, + "loss": 0.3553, + "step": 7672 + }, + { + "epoch": 0.15, + "learning_rate": 1.7039726612558735e-07, + "loss": 0.0153, + "step": 7673 + }, + { + "epoch": 0.15, + "learning_rate": 1.7039338278125122e-07, + "loss": 0.0633, + "step": 7674 + }, + { + "epoch": 0.15, + "learning_rate": 1.7038949943691507e-07, + "loss": 0.0056, + "step": 7675 + }, + { + "epoch": 0.15, + "learning_rate": 1.7038561609257894e-07, + "loss": 0.0089, + "step": 7676 + }, + { + "epoch": 0.15, + "learning_rate": 1.7038173274824276e-07, + "loss": 0.0157, + "step": 7677 + }, + { + "epoch": 0.15, + "learning_rate": 1.7037784940390663e-07, + "loss": 0.0291, + "step": 7678 + }, + { + "epoch": 0.15, + "learning_rate": 1.7037396605957047e-07, + "loss": 0.0076, + "step": 7679 + }, + { + "epoch": 0.15, + "learning_rate": 1.7037008271523435e-07, + "loss": 0.0071, + "step": 7680 + }, + { + "epoch": 0.15, + "learning_rate": 1.703661993708982e-07, + "loss": 0.0048, + "step": 7681 + }, + { + "epoch": 0.15, + "learning_rate": 1.7036231602656206e-07, + "loss": 0.0338, + "step": 7682 + }, + { + "epoch": 0.15, + "learning_rate": 1.703584326822259e-07, + "loss": 0.0698, + "step": 7683 + }, + { + "epoch": 0.15, + "learning_rate": 1.7035454933788978e-07, + "loss": 0.0092, + "step": 7684 + }, + { + "epoch": 0.15, + "learning_rate": 1.7035066599355362e-07, + "loss": 0.0088, + "step": 7685 + }, + { + "epoch": 0.15, + "learning_rate": 1.703467826492175e-07, + "loss": 0.0072, + "step": 7686 + }, + { + "epoch": 0.15, + "learning_rate": 1.7034289930488134e-07, + "loss": 0.0123, + "step": 7687 + }, + { + "epoch": 0.15, + "learning_rate": 1.703390159605452e-07, + "loss": 0.0253, + "step": 7688 + }, + { + "epoch": 0.15, + "learning_rate": 1.7033513261620906e-07, + "loss": 0.0066, + "step": 7689 + }, + { + "epoch": 0.15, + "learning_rate": 1.7033124927187293e-07, + "loss": 0.0063, + "step": 7690 + }, + { + "epoch": 0.15, + "learning_rate": 1.7032736592753677e-07, + "loss": 0.0049, + "step": 7691 + }, + { + "epoch": 0.15, + "learning_rate": 1.7032348258320064e-07, + "loss": 0.02, + "step": 7692 + }, + { + "epoch": 0.15, + "learning_rate": 1.703195992388645e-07, + "loss": 0.005, + "step": 7693 + }, + { + "epoch": 0.15, + "learning_rate": 1.7031571589452836e-07, + "loss": 0.0043, + "step": 7694 + }, + { + "epoch": 0.15, + "learning_rate": 1.703118325501922e-07, + "loss": 0.0081, + "step": 7695 + }, + { + "epoch": 0.15, + "learning_rate": 1.7030794920585608e-07, + "loss": 0.0067, + "step": 7696 + }, + { + "epoch": 0.15, + "learning_rate": 1.7030406586151992e-07, + "loss": 0.0085, + "step": 7697 + }, + { + "epoch": 0.15, + "learning_rate": 1.703001825171838e-07, + "loss": 0.0057, + "step": 7698 + }, + { + "epoch": 0.15, + "learning_rate": 1.7029629917284764e-07, + "loss": 0.0074, + "step": 7699 + }, + { + "epoch": 0.15, + "learning_rate": 1.702924158285115e-07, + "loss": 0.0833, + "step": 7700 + }, + { + "epoch": 0.15, + "learning_rate": 1.7028853248417536e-07, + "loss": 0.0161, + "step": 7701 + }, + { + "epoch": 0.15, + "learning_rate": 1.7028464913983923e-07, + "loss": 0.0049, + "step": 7702 + }, + { + "epoch": 0.15, + "learning_rate": 1.7028076579550307e-07, + "loss": 0.0052, + "step": 7703 + }, + { + "epoch": 0.15, + "learning_rate": 1.7027688245116694e-07, + "loss": 0.0546, + "step": 7704 + }, + { + "epoch": 0.15, + "learning_rate": 1.702729991068308e-07, + "loss": 0.0067, + "step": 7705 + }, + { + "epoch": 0.15, + "learning_rate": 1.7026911576249466e-07, + "loss": 0.6628, + "step": 7706 + }, + { + "epoch": 0.15, + "learning_rate": 1.702652324181585e-07, + "loss": 0.006, + "step": 7707 + }, + { + "epoch": 0.15, + "learning_rate": 1.7026134907382238e-07, + "loss": 0.0068, + "step": 7708 + }, + { + "epoch": 0.15, + "learning_rate": 1.7025746572948622e-07, + "loss": 0.0066, + "step": 7709 + }, + { + "epoch": 0.15, + "learning_rate": 1.702535823851501e-07, + "loss": 0.0067, + "step": 7710 + }, + { + "epoch": 0.15, + "learning_rate": 1.7024969904081394e-07, + "loss": 0.0068, + "step": 7711 + }, + { + "epoch": 0.15, + "learning_rate": 1.702458156964778e-07, + "loss": 0.0062, + "step": 7712 + }, + { + "epoch": 0.15, + "learning_rate": 1.7024193235214165e-07, + "loss": 0.0066, + "step": 7713 + }, + { + "epoch": 0.15, + "learning_rate": 1.7023804900780553e-07, + "loss": 0.0059, + "step": 7714 + }, + { + "epoch": 0.15, + "learning_rate": 1.7023416566346937e-07, + "loss": 0.0096, + "step": 7715 + }, + { + "epoch": 0.15, + "learning_rate": 1.7023028231913324e-07, + "loss": 0.006, + "step": 7716 + }, + { + "epoch": 0.15, + "learning_rate": 1.702263989747971e-07, + "loss": 0.0051, + "step": 7717 + }, + { + "epoch": 0.15, + "learning_rate": 1.7022251563046096e-07, + "loss": 0.0085, + "step": 7718 + }, + { + "epoch": 0.15, + "learning_rate": 1.702186322861248e-07, + "loss": 0.0075, + "step": 7719 + }, + { + "epoch": 0.15, + "learning_rate": 1.7021474894178868e-07, + "loss": 0.0069, + "step": 7720 + }, + { + "epoch": 0.15, + "learning_rate": 1.7021086559745252e-07, + "loss": 0.0103, + "step": 7721 + }, + { + "epoch": 0.15, + "learning_rate": 1.702069822531164e-07, + "loss": 0.1013, + "step": 7722 + }, + { + "epoch": 0.15, + "learning_rate": 1.7020309890878024e-07, + "loss": 0.0063, + "step": 7723 + }, + { + "epoch": 0.15, + "learning_rate": 1.701992155644441e-07, + "loss": 0.1955, + "step": 7724 + }, + { + "epoch": 0.15, + "learning_rate": 1.7019533222010795e-07, + "loss": 0.0091, + "step": 7725 + }, + { + "epoch": 0.15, + "learning_rate": 1.7019144887577182e-07, + "loss": 0.0078, + "step": 7726 + }, + { + "epoch": 0.15, + "learning_rate": 1.7018756553143567e-07, + "loss": 0.1122, + "step": 7727 + }, + { + "epoch": 0.15, + "learning_rate": 1.7018368218709954e-07, + "loss": 0.6039, + "step": 7728 + }, + { + "epoch": 0.15, + "learning_rate": 1.7017979884276339e-07, + "loss": 0.0056, + "step": 7729 + }, + { + "epoch": 0.15, + "learning_rate": 1.7017591549842726e-07, + "loss": 0.0147, + "step": 7730 + }, + { + "epoch": 0.15, + "learning_rate": 1.701720321540911e-07, + "loss": 0.0053, + "step": 7731 + }, + { + "epoch": 0.15, + "learning_rate": 1.7016814880975497e-07, + "loss": 0.5494, + "step": 7732 + }, + { + "epoch": 0.15, + "learning_rate": 1.7016426546541882e-07, + "loss": 0.0925, + "step": 7733 + }, + { + "epoch": 0.15, + "learning_rate": 1.701603821210827e-07, + "loss": 0.0062, + "step": 7734 + }, + { + "epoch": 0.15, + "learning_rate": 1.701564987767465e-07, + "loss": 0.7633, + "step": 7735 + }, + { + "epoch": 0.15, + "learning_rate": 1.7015261543241038e-07, + "loss": 0.0081, + "step": 7736 + }, + { + "epoch": 0.15, + "learning_rate": 1.7014873208807423e-07, + "loss": 0.9768, + "step": 7737 + }, + { + "epoch": 0.15, + "learning_rate": 1.701448487437381e-07, + "loss": 0.0558, + "step": 7738 + }, + { + "epoch": 0.15, + "learning_rate": 1.7014096539940194e-07, + "loss": 0.0065, + "step": 7739 + }, + { + "epoch": 0.15, + "learning_rate": 1.7013708205506581e-07, + "loss": 0.3522, + "step": 7740 + }, + { + "epoch": 0.15, + "learning_rate": 1.7013319871072966e-07, + "loss": 0.0052, + "step": 7741 + }, + { + "epoch": 0.15, + "learning_rate": 1.7012931536639353e-07, + "loss": 0.0043, + "step": 7742 + }, + { + "epoch": 0.15, + "learning_rate": 1.7012543202205737e-07, + "loss": 0.0105, + "step": 7743 + }, + { + "epoch": 0.15, + "learning_rate": 1.7012154867772125e-07, + "loss": 0.7886, + "step": 7744 + }, + { + "epoch": 0.15, + "learning_rate": 1.701176653333851e-07, + "loss": 0.0124, + "step": 7745 + }, + { + "epoch": 0.15, + "learning_rate": 1.7011378198904896e-07, + "loss": 0.0611, + "step": 7746 + }, + { + "epoch": 0.15, + "learning_rate": 1.701098986447128e-07, + "loss": 1.0281, + "step": 7747 + }, + { + "epoch": 0.15, + "learning_rate": 1.7010601530037668e-07, + "loss": 0.1419, + "step": 7748 + }, + { + "epoch": 0.15, + "learning_rate": 1.7010213195604052e-07, + "loss": 0.0175, + "step": 7749 + }, + { + "epoch": 0.15, + "learning_rate": 1.700982486117044e-07, + "loss": 0.0191, + "step": 7750 + }, + { + "epoch": 0.15, + "learning_rate": 1.7009436526736824e-07, + "loss": 0.0168, + "step": 7751 + }, + { + "epoch": 0.15, + "learning_rate": 1.700904819230321e-07, + "loss": 0.0077, + "step": 7752 + }, + { + "epoch": 0.15, + "learning_rate": 1.7008659857869596e-07, + "loss": 0.0084, + "step": 7753 + }, + { + "epoch": 0.15, + "learning_rate": 1.7008271523435983e-07, + "loss": 0.0054, + "step": 7754 + }, + { + "epoch": 0.15, + "learning_rate": 1.7007883189002367e-07, + "loss": 0.0048, + "step": 7755 + }, + { + "epoch": 0.15, + "learning_rate": 1.7007494854568755e-07, + "loss": 0.006, + "step": 7756 + }, + { + "epoch": 0.15, + "learning_rate": 1.700710652013514e-07, + "loss": 0.0346, + "step": 7757 + }, + { + "epoch": 0.15, + "learning_rate": 1.7006718185701526e-07, + "loss": 0.1125, + "step": 7758 + }, + { + "epoch": 0.15, + "learning_rate": 1.700632985126791e-07, + "loss": 0.0067, + "step": 7759 + }, + { + "epoch": 0.15, + "learning_rate": 1.7005941516834298e-07, + "loss": 0.4158, + "step": 7760 + }, + { + "epoch": 0.15, + "learning_rate": 1.7005553182400682e-07, + "loss": 0.0114, + "step": 7761 + }, + { + "epoch": 0.15, + "learning_rate": 1.700516484796707e-07, + "loss": 0.0233, + "step": 7762 + }, + { + "epoch": 0.15, + "learning_rate": 1.7004776513533454e-07, + "loss": 0.0361, + "step": 7763 + }, + { + "epoch": 0.15, + "learning_rate": 1.700438817909984e-07, + "loss": 0.0179, + "step": 7764 + }, + { + "epoch": 0.15, + "learning_rate": 1.7003999844666226e-07, + "loss": 0.0066, + "step": 7765 + }, + { + "epoch": 0.15, + "learning_rate": 1.7003611510232613e-07, + "loss": 0.0098, + "step": 7766 + }, + { + "epoch": 0.15, + "learning_rate": 1.7003223175798997e-07, + "loss": 0.0053, + "step": 7767 + }, + { + "epoch": 0.15, + "learning_rate": 1.7002834841365384e-07, + "loss": 0.0609, + "step": 7768 + }, + { + "epoch": 0.15, + "learning_rate": 1.700244650693177e-07, + "loss": 0.0051, + "step": 7769 + }, + { + "epoch": 0.15, + "learning_rate": 1.7002058172498156e-07, + "loss": 0.0101, + "step": 7770 + }, + { + "epoch": 0.15, + "learning_rate": 1.700166983806454e-07, + "loss": 0.0467, + "step": 7771 + }, + { + "epoch": 0.15, + "learning_rate": 1.7001281503630928e-07, + "loss": 0.2162, + "step": 7772 + }, + { + "epoch": 0.15, + "learning_rate": 1.7000893169197312e-07, + "loss": 0.0079, + "step": 7773 + }, + { + "epoch": 0.15, + "learning_rate": 1.70005048347637e-07, + "loss": 0.024, + "step": 7774 + }, + { + "epoch": 0.15, + "learning_rate": 1.7000116500330084e-07, + "loss": 0.0065, + "step": 7775 + }, + { + "epoch": 0.15, + "learning_rate": 1.699972816589647e-07, + "loss": 0.3503, + "step": 7776 + }, + { + "epoch": 0.15, + "learning_rate": 1.6999339831462856e-07, + "loss": 0.0389, + "step": 7777 + }, + { + "epoch": 0.15, + "learning_rate": 1.6998951497029243e-07, + "loss": 0.0063, + "step": 7778 + }, + { + "epoch": 0.15, + "learning_rate": 1.6998563162595627e-07, + "loss": 0.1007, + "step": 7779 + }, + { + "epoch": 0.15, + "learning_rate": 1.6998174828162012e-07, + "loss": 0.0536, + "step": 7780 + }, + { + "epoch": 0.15, + "learning_rate": 1.69977864937284e-07, + "loss": 0.1743, + "step": 7781 + }, + { + "epoch": 0.15, + "learning_rate": 1.6997398159294783e-07, + "loss": 0.019, + "step": 7782 + }, + { + "epoch": 0.15, + "learning_rate": 1.699700982486117e-07, + "loss": 0.0168, + "step": 7783 + }, + { + "epoch": 0.15, + "learning_rate": 1.6996621490427555e-07, + "loss": 0.2164, + "step": 7784 + }, + { + "epoch": 0.15, + "learning_rate": 1.6996233155993942e-07, + "loss": 0.025, + "step": 7785 + }, + { + "epoch": 0.15, + "learning_rate": 1.6995844821560327e-07, + "loss": 0.032, + "step": 7786 + }, + { + "epoch": 0.15, + "learning_rate": 1.6995456487126714e-07, + "loss": 0.0045, + "step": 7787 + }, + { + "epoch": 0.15, + "learning_rate": 1.6995068152693098e-07, + "loss": 0.0865, + "step": 7788 + }, + { + "epoch": 0.15, + "learning_rate": 1.6994679818259485e-07, + "loss": 0.0055, + "step": 7789 + }, + { + "epoch": 0.15, + "learning_rate": 1.699429148382587e-07, + "loss": 0.0151, + "step": 7790 + }, + { + "epoch": 0.15, + "learning_rate": 1.6993903149392257e-07, + "loss": 0.8009, + "step": 7791 + }, + { + "epoch": 0.15, + "learning_rate": 1.6993514814958642e-07, + "loss": 0.0064, + "step": 7792 + }, + { + "epoch": 0.15, + "learning_rate": 1.6993126480525026e-07, + "loss": 0.5423, + "step": 7793 + }, + { + "epoch": 0.15, + "learning_rate": 1.6992738146091413e-07, + "loss": 0.014, + "step": 7794 + }, + { + "epoch": 0.15, + "learning_rate": 1.6992349811657798e-07, + "loss": 0.0064, + "step": 7795 + }, + { + "epoch": 0.15, + "learning_rate": 1.6991961477224185e-07, + "loss": 0.0082, + "step": 7796 + }, + { + "epoch": 0.15, + "learning_rate": 1.699157314279057e-07, + "loss": 0.0082, + "step": 7797 + }, + { + "epoch": 0.15, + "learning_rate": 1.6991184808356957e-07, + "loss": 0.0049, + "step": 7798 + }, + { + "epoch": 0.15, + "learning_rate": 1.699079647392334e-07, + "loss": 0.0066, + "step": 7799 + }, + { + "epoch": 0.15, + "learning_rate": 1.6990408139489728e-07, + "loss": 0.0058, + "step": 7800 + }, + { + "epoch": 0.15, + "learning_rate": 1.6990019805056113e-07, + "loss": 0.038, + "step": 7801 + }, + { + "epoch": 0.15, + "learning_rate": 1.69896314706225e-07, + "loss": 0.0192, + "step": 7802 + }, + { + "epoch": 0.15, + "learning_rate": 1.6989243136188884e-07, + "loss": 0.0053, + "step": 7803 + }, + { + "epoch": 0.15, + "learning_rate": 1.6988854801755271e-07, + "loss": 0.0061, + "step": 7804 + }, + { + "epoch": 0.15, + "learning_rate": 1.6988466467321656e-07, + "loss": 0.0065, + "step": 7805 + }, + { + "epoch": 0.15, + "learning_rate": 1.6988078132888043e-07, + "loss": 0.0126, + "step": 7806 + }, + { + "epoch": 0.15, + "learning_rate": 1.6987689798454428e-07, + "loss": 0.0215, + "step": 7807 + }, + { + "epoch": 0.15, + "learning_rate": 1.6987301464020812e-07, + "loss": 0.0089, + "step": 7808 + }, + { + "epoch": 0.15, + "learning_rate": 1.69869131295872e-07, + "loss": 0.2447, + "step": 7809 + }, + { + "epoch": 0.15, + "learning_rate": 1.6986524795153584e-07, + "loss": 0.6016, + "step": 7810 + }, + { + "epoch": 0.15, + "learning_rate": 1.698613646071997e-07, + "loss": 0.27, + "step": 7811 + }, + { + "epoch": 0.15, + "learning_rate": 1.6985748126286355e-07, + "loss": 0.011, + "step": 7812 + }, + { + "epoch": 0.15, + "learning_rate": 1.6985359791852743e-07, + "loss": 0.0262, + "step": 7813 + }, + { + "epoch": 0.15, + "learning_rate": 1.6984971457419127e-07, + "loss": 0.3874, + "step": 7814 + }, + { + "epoch": 0.15, + "learning_rate": 1.6984583122985514e-07, + "loss": 0.2008, + "step": 7815 + }, + { + "epoch": 0.15, + "learning_rate": 1.69841947885519e-07, + "loss": 0.4913, + "step": 7816 + }, + { + "epoch": 0.15, + "learning_rate": 1.6983806454118286e-07, + "loss": 0.1395, + "step": 7817 + }, + { + "epoch": 0.15, + "learning_rate": 1.698341811968467e-07, + "loss": 0.1587, + "step": 7818 + }, + { + "epoch": 0.15, + "learning_rate": 1.6983029785251058e-07, + "loss": 0.0063, + "step": 7819 + }, + { + "epoch": 0.15, + "learning_rate": 1.6982641450817442e-07, + "loss": 0.0521, + "step": 7820 + }, + { + "epoch": 0.15, + "learning_rate": 1.698225311638383e-07, + "loss": 0.0056, + "step": 7821 + }, + { + "epoch": 0.15, + "learning_rate": 1.6981864781950214e-07, + "loss": 0.0436, + "step": 7822 + }, + { + "epoch": 0.15, + "learning_rate": 1.69814764475166e-07, + "loss": 0.0077, + "step": 7823 + }, + { + "epoch": 0.15, + "learning_rate": 1.6981088113082985e-07, + "loss": 0.005, + "step": 7824 + }, + { + "epoch": 0.15, + "learning_rate": 1.6980699778649372e-07, + "loss": 0.017, + "step": 7825 + }, + { + "epoch": 0.15, + "learning_rate": 1.6980311444215757e-07, + "loss": 0.036, + "step": 7826 + }, + { + "epoch": 0.15, + "learning_rate": 1.6979923109782144e-07, + "loss": 0.0615, + "step": 7827 + }, + { + "epoch": 0.15, + "learning_rate": 1.6979534775348529e-07, + "loss": 0.0062, + "step": 7828 + }, + { + "epoch": 0.15, + "learning_rate": 1.6979146440914916e-07, + "loss": 0.0053, + "step": 7829 + }, + { + "epoch": 0.15, + "learning_rate": 1.69787581064813e-07, + "loss": 0.0065, + "step": 7830 + }, + { + "epoch": 0.15, + "learning_rate": 1.6978369772047687e-07, + "loss": 0.0053, + "step": 7831 + }, + { + "epoch": 0.15, + "learning_rate": 1.6977981437614072e-07, + "loss": 0.0045, + "step": 7832 + }, + { + "epoch": 0.15, + "learning_rate": 1.697759310318046e-07, + "loss": 0.2369, + "step": 7833 + }, + { + "epoch": 0.15, + "learning_rate": 1.6977204768746844e-07, + "loss": 0.0056, + "step": 7834 + }, + { + "epoch": 0.15, + "learning_rate": 1.697681643431323e-07, + "loss": 0.4418, + "step": 7835 + }, + { + "epoch": 0.15, + "learning_rate": 1.6976428099879615e-07, + "loss": 0.6529, + "step": 7836 + }, + { + "epoch": 0.15, + "learning_rate": 1.6976039765446002e-07, + "loss": 0.3391, + "step": 7837 + }, + { + "epoch": 0.15, + "learning_rate": 1.6975651431012387e-07, + "loss": 0.0063, + "step": 7838 + }, + { + "epoch": 0.15, + "learning_rate": 1.6975263096578774e-07, + "loss": 0.0127, + "step": 7839 + }, + { + "epoch": 0.15, + "learning_rate": 1.6974874762145158e-07, + "loss": 0.0964, + "step": 7840 + }, + { + "epoch": 0.15, + "learning_rate": 1.6974486427711546e-07, + "loss": 0.3507, + "step": 7841 + }, + { + "epoch": 0.15, + "learning_rate": 1.697409809327793e-07, + "loss": 0.0672, + "step": 7842 + }, + { + "epoch": 0.15, + "learning_rate": 1.6973709758844317e-07, + "loss": 0.0084, + "step": 7843 + }, + { + "epoch": 0.15, + "learning_rate": 1.6973321424410702e-07, + "loss": 0.0128, + "step": 7844 + }, + { + "epoch": 0.15, + "learning_rate": 1.697293308997709e-07, + "loss": 0.007, + "step": 7845 + }, + { + "epoch": 0.15, + "learning_rate": 1.6972544755543473e-07, + "loss": 0.0052, + "step": 7846 + }, + { + "epoch": 0.15, + "learning_rate": 1.697215642110986e-07, + "loss": 0.7822, + "step": 7847 + }, + { + "epoch": 0.15, + "learning_rate": 1.6971768086676245e-07, + "loss": 0.2325, + "step": 7848 + }, + { + "epoch": 0.15, + "learning_rate": 1.6971379752242632e-07, + "loss": 0.0063, + "step": 7849 + }, + { + "epoch": 0.15, + "learning_rate": 1.6970991417809017e-07, + "loss": 0.0272, + "step": 7850 + }, + { + "epoch": 0.15, + "learning_rate": 1.69706030833754e-07, + "loss": 0.0101, + "step": 7851 + }, + { + "epoch": 0.15, + "learning_rate": 1.6970214748941786e-07, + "loss": 0.0056, + "step": 7852 + }, + { + "epoch": 0.15, + "learning_rate": 1.6969826414508173e-07, + "loss": 0.009, + "step": 7853 + }, + { + "epoch": 0.15, + "learning_rate": 1.6969438080074557e-07, + "loss": 0.0207, + "step": 7854 + }, + { + "epoch": 0.15, + "learning_rate": 1.6969049745640945e-07, + "loss": 0.0052, + "step": 7855 + }, + { + "epoch": 0.15, + "learning_rate": 1.696866141120733e-07, + "loss": 0.6485, + "step": 7856 + }, + { + "epoch": 0.15, + "learning_rate": 1.6968273076773716e-07, + "loss": 0.0052, + "step": 7857 + }, + { + "epoch": 0.15, + "learning_rate": 1.69678847423401e-07, + "loss": 0.0046, + "step": 7858 + }, + { + "epoch": 0.15, + "learning_rate": 1.6967496407906488e-07, + "loss": 0.0123, + "step": 7859 + }, + { + "epoch": 0.15, + "learning_rate": 1.6967108073472872e-07, + "loss": 0.0202, + "step": 7860 + }, + { + "epoch": 0.15, + "learning_rate": 1.696671973903926e-07, + "loss": 0.0051, + "step": 7861 + }, + { + "epoch": 0.15, + "learning_rate": 1.6966331404605644e-07, + "loss": 0.0095, + "step": 7862 + }, + { + "epoch": 0.15, + "learning_rate": 1.696594307017203e-07, + "loss": 0.1936, + "step": 7863 + }, + { + "epoch": 0.15, + "learning_rate": 1.6965554735738416e-07, + "loss": 0.0214, + "step": 7864 + }, + { + "epoch": 0.15, + "learning_rate": 1.6965166401304803e-07, + "loss": 0.5521, + "step": 7865 + }, + { + "epoch": 0.15, + "learning_rate": 1.6964778066871187e-07, + "loss": 0.1471, + "step": 7866 + }, + { + "epoch": 0.15, + "learning_rate": 1.6964389732437574e-07, + "loss": 0.0818, + "step": 7867 + }, + { + "epoch": 0.15, + "learning_rate": 1.696400139800396e-07, + "loss": 0.026, + "step": 7868 + }, + { + "epoch": 0.15, + "learning_rate": 1.6963613063570346e-07, + "loss": 0.0133, + "step": 7869 + }, + { + "epoch": 0.15, + "learning_rate": 1.696322472913673e-07, + "loss": 0.0065, + "step": 7870 + }, + { + "epoch": 0.15, + "learning_rate": 1.6962836394703118e-07, + "loss": 0.0051, + "step": 7871 + }, + { + "epoch": 0.15, + "learning_rate": 1.6962448060269502e-07, + "loss": 0.1031, + "step": 7872 + }, + { + "epoch": 0.15, + "learning_rate": 1.696205972583589e-07, + "loss": 0.005, + "step": 7873 + }, + { + "epoch": 0.15, + "learning_rate": 1.6961671391402274e-07, + "loss": 0.0061, + "step": 7874 + }, + { + "epoch": 0.15, + "learning_rate": 1.696128305696866e-07, + "loss": 0.0146, + "step": 7875 + }, + { + "epoch": 0.15, + "learning_rate": 1.6960894722535046e-07, + "loss": 0.8055, + "step": 7876 + }, + { + "epoch": 0.15, + "learning_rate": 1.6960506388101433e-07, + "loss": 0.0051, + "step": 7877 + }, + { + "epoch": 0.15, + "learning_rate": 1.6960118053667817e-07, + "loss": 0.0076, + "step": 7878 + }, + { + "epoch": 0.15, + "learning_rate": 1.6959729719234204e-07, + "loss": 0.0047, + "step": 7879 + }, + { + "epoch": 0.15, + "learning_rate": 1.695934138480059e-07, + "loss": 0.0051, + "step": 7880 + }, + { + "epoch": 0.15, + "learning_rate": 1.6958953050366976e-07, + "loss": 0.007, + "step": 7881 + }, + { + "epoch": 0.15, + "learning_rate": 1.695856471593336e-07, + "loss": 0.0086, + "step": 7882 + }, + { + "epoch": 0.15, + "learning_rate": 1.6958176381499748e-07, + "loss": 0.0061, + "step": 7883 + }, + { + "epoch": 0.15, + "learning_rate": 1.6957788047066132e-07, + "loss": 0.0058, + "step": 7884 + }, + { + "epoch": 0.15, + "learning_rate": 1.695739971263252e-07, + "loss": 0.0514, + "step": 7885 + }, + { + "epoch": 0.15, + "learning_rate": 1.6957011378198904e-07, + "loss": 0.0143, + "step": 7886 + }, + { + "epoch": 0.15, + "learning_rate": 1.695662304376529e-07, + "loss": 0.0069, + "step": 7887 + }, + { + "epoch": 0.15, + "learning_rate": 1.6956234709331675e-07, + "loss": 0.0074, + "step": 7888 + }, + { + "epoch": 0.15, + "learning_rate": 1.6955846374898063e-07, + "loss": 0.0058, + "step": 7889 + }, + { + "epoch": 0.15, + "learning_rate": 1.6955458040464447e-07, + "loss": 0.0054, + "step": 7890 + }, + { + "epoch": 0.15, + "learning_rate": 1.6955069706030834e-07, + "loss": 0.1555, + "step": 7891 + }, + { + "epoch": 0.15, + "learning_rate": 1.695468137159722e-07, + "loss": 0.0047, + "step": 7892 + }, + { + "epoch": 0.15, + "learning_rate": 1.6954293037163606e-07, + "loss": 0.0136, + "step": 7893 + }, + { + "epoch": 0.15, + "learning_rate": 1.695390470272999e-07, + "loss": 0.1352, + "step": 7894 + }, + { + "epoch": 0.15, + "learning_rate": 1.6953516368296378e-07, + "loss": 0.0109, + "step": 7895 + }, + { + "epoch": 0.15, + "learning_rate": 1.6953128033862762e-07, + "loss": 0.0081, + "step": 7896 + }, + { + "epoch": 0.15, + "learning_rate": 1.695273969942915e-07, + "loss": 0.0048, + "step": 7897 + }, + { + "epoch": 0.15, + "learning_rate": 1.6952351364995534e-07, + "loss": 0.0104, + "step": 7898 + }, + { + "epoch": 0.15, + "learning_rate": 1.695196303056192e-07, + "loss": 0.0062, + "step": 7899 + }, + { + "epoch": 0.15, + "learning_rate": 1.6951574696128305e-07, + "loss": 0.0061, + "step": 7900 + }, + { + "epoch": 0.15, + "learning_rate": 1.6951186361694692e-07, + "loss": 0.0047, + "step": 7901 + }, + { + "epoch": 0.15, + "learning_rate": 1.6950798027261077e-07, + "loss": 0.6541, + "step": 7902 + }, + { + "epoch": 0.15, + "learning_rate": 1.6950409692827464e-07, + "loss": 0.0047, + "step": 7903 + }, + { + "epoch": 0.15, + "learning_rate": 1.6950021358393849e-07, + "loss": 0.0066, + "step": 7904 + }, + { + "epoch": 0.15, + "learning_rate": 1.6949633023960236e-07, + "loss": 0.7701, + "step": 7905 + }, + { + "epoch": 0.15, + "learning_rate": 1.694924468952662e-07, + "loss": 0.3083, + "step": 7906 + }, + { + "epoch": 0.15, + "learning_rate": 1.6948856355093007e-07, + "loss": 0.0078, + "step": 7907 + }, + { + "epoch": 0.15, + "learning_rate": 1.6948468020659392e-07, + "loss": 0.0348, + "step": 7908 + }, + { + "epoch": 0.15, + "learning_rate": 1.6948079686225776e-07, + "loss": 0.0201, + "step": 7909 + }, + { + "epoch": 0.15, + "learning_rate": 1.694769135179216e-07, + "loss": 0.006, + "step": 7910 + }, + { + "epoch": 0.15, + "learning_rate": 1.6947303017358548e-07, + "loss": 0.0082, + "step": 7911 + }, + { + "epoch": 0.15, + "learning_rate": 1.6946914682924933e-07, + "loss": 0.0061, + "step": 7912 + }, + { + "epoch": 0.15, + "learning_rate": 1.694652634849132e-07, + "loss": 0.0105, + "step": 7913 + }, + { + "epoch": 0.15, + "learning_rate": 1.6946138014057704e-07, + "loss": 0.1951, + "step": 7914 + }, + { + "epoch": 0.15, + "learning_rate": 1.6945749679624091e-07, + "loss": 0.0056, + "step": 7915 + }, + { + "epoch": 0.15, + "learning_rate": 1.6945361345190476e-07, + "loss": 0.0092, + "step": 7916 + }, + { + "epoch": 0.15, + "learning_rate": 1.6944973010756863e-07, + "loss": 0.042, + "step": 7917 + }, + { + "epoch": 0.15, + "learning_rate": 1.6944584676323248e-07, + "loss": 0.0208, + "step": 7918 + }, + { + "epoch": 0.15, + "learning_rate": 1.6944196341889635e-07, + "loss": 0.2336, + "step": 7919 + }, + { + "epoch": 0.15, + "learning_rate": 1.694380800745602e-07, + "loss": 0.2778, + "step": 7920 + }, + { + "epoch": 0.15, + "learning_rate": 1.6943419673022406e-07, + "loss": 0.0236, + "step": 7921 + }, + { + "epoch": 0.15, + "learning_rate": 1.694303133858879e-07, + "loss": 0.0062, + "step": 7922 + }, + { + "epoch": 0.15, + "learning_rate": 1.6942643004155178e-07, + "loss": 0.0155, + "step": 7923 + }, + { + "epoch": 0.15, + "learning_rate": 1.6942254669721562e-07, + "loss": 0.0465, + "step": 7924 + }, + { + "epoch": 0.15, + "learning_rate": 1.694186633528795e-07, + "loss": 0.0082, + "step": 7925 + }, + { + "epoch": 0.15, + "learning_rate": 1.6941478000854334e-07, + "loss": 0.0123, + "step": 7926 + }, + { + "epoch": 0.15, + "learning_rate": 1.694108966642072e-07, + "loss": 0.0049, + "step": 7927 + }, + { + "epoch": 0.15, + "learning_rate": 1.6940701331987106e-07, + "loss": 0.0239, + "step": 7928 + }, + { + "epoch": 0.15, + "learning_rate": 1.6940312997553493e-07, + "loss": 0.0073, + "step": 7929 + }, + { + "epoch": 0.15, + "learning_rate": 1.6939924663119877e-07, + "loss": 0.0051, + "step": 7930 + }, + { + "epoch": 0.15, + "learning_rate": 1.6939536328686265e-07, + "loss": 0.0054, + "step": 7931 + }, + { + "epoch": 0.15, + "learning_rate": 1.693914799425265e-07, + "loss": 0.0044, + "step": 7932 + }, + { + "epoch": 0.15, + "learning_rate": 1.6938759659819036e-07, + "loss": 0.0062, + "step": 7933 + }, + { + "epoch": 0.15, + "learning_rate": 1.693837132538542e-07, + "loss": 0.0071, + "step": 7934 + }, + { + "epoch": 0.15, + "learning_rate": 1.6937982990951808e-07, + "loss": 0.018, + "step": 7935 + }, + { + "epoch": 0.15, + "learning_rate": 1.6937594656518192e-07, + "loss": 0.0076, + "step": 7936 + }, + { + "epoch": 0.15, + "learning_rate": 1.693720632208458e-07, + "loss": 0.0051, + "step": 7937 + }, + { + "epoch": 0.15, + "learning_rate": 1.6936817987650964e-07, + "loss": 0.0375, + "step": 7938 + }, + { + "epoch": 0.15, + "learning_rate": 1.693642965321735e-07, + "loss": 0.0131, + "step": 7939 + }, + { + "epoch": 0.15, + "learning_rate": 1.6936041318783736e-07, + "loss": 0.0062, + "step": 7940 + }, + { + "epoch": 0.15, + "learning_rate": 1.6935652984350123e-07, + "loss": 0.0065, + "step": 7941 + }, + { + "epoch": 0.15, + "learning_rate": 1.6935264649916507e-07, + "loss": 0.0562, + "step": 7942 + }, + { + "epoch": 0.15, + "learning_rate": 1.6934876315482894e-07, + "loss": 0.2, + "step": 7943 + }, + { + "epoch": 0.15, + "learning_rate": 1.693448798104928e-07, + "loss": 0.0105, + "step": 7944 + }, + { + "epoch": 0.15, + "learning_rate": 1.6934099646615666e-07, + "loss": 0.007, + "step": 7945 + }, + { + "epoch": 0.15, + "learning_rate": 1.693371131218205e-07, + "loss": 0.0057, + "step": 7946 + }, + { + "epoch": 0.15, + "learning_rate": 1.6933322977748438e-07, + "loss": 0.9158, + "step": 7947 + }, + { + "epoch": 0.15, + "learning_rate": 1.6932934643314822e-07, + "loss": 0.1046, + "step": 7948 + }, + { + "epoch": 0.15, + "learning_rate": 1.693254630888121e-07, + "loss": 0.0163, + "step": 7949 + }, + { + "epoch": 0.15, + "learning_rate": 1.6932157974447594e-07, + "loss": 0.0057, + "step": 7950 + }, + { + "epoch": 0.15, + "learning_rate": 1.693176964001398e-07, + "loss": 0.242, + "step": 7951 + }, + { + "epoch": 0.15, + "learning_rate": 1.6931381305580366e-07, + "loss": 0.0054, + "step": 7952 + }, + { + "epoch": 0.15, + "learning_rate": 1.6930992971146753e-07, + "loss": 0.0053, + "step": 7953 + }, + { + "epoch": 0.15, + "learning_rate": 1.6930604636713137e-07, + "loss": 0.2391, + "step": 7954 + }, + { + "epoch": 0.15, + "learning_rate": 1.6930216302279524e-07, + "loss": 0.0371, + "step": 7955 + }, + { + "epoch": 0.15, + "learning_rate": 1.692982796784591e-07, + "loss": 0.9063, + "step": 7956 + }, + { + "epoch": 0.15, + "learning_rate": 1.6929439633412293e-07, + "loss": 0.6996, + "step": 7957 + }, + { + "epoch": 0.15, + "learning_rate": 1.692905129897868e-07, + "loss": 0.0054, + "step": 7958 + }, + { + "epoch": 0.15, + "learning_rate": 1.6928662964545065e-07, + "loss": 1.0585, + "step": 7959 + }, + { + "epoch": 0.15, + "learning_rate": 1.6928274630111452e-07, + "loss": 0.2079, + "step": 7960 + }, + { + "epoch": 0.15, + "learning_rate": 1.6927886295677837e-07, + "loss": 0.0407, + "step": 7961 + }, + { + "epoch": 0.15, + "learning_rate": 1.6927497961244224e-07, + "loss": 0.0694, + "step": 7962 + }, + { + "epoch": 0.15, + "learning_rate": 1.6927109626810608e-07, + "loss": 0.0051, + "step": 7963 + }, + { + "epoch": 0.15, + "learning_rate": 1.6926721292376995e-07, + "loss": 0.0082, + "step": 7964 + }, + { + "epoch": 0.15, + "learning_rate": 1.692633295794338e-07, + "loss": 0.0097, + "step": 7965 + }, + { + "epoch": 0.15, + "learning_rate": 1.6925944623509767e-07, + "loss": 0.341, + "step": 7966 + }, + { + "epoch": 0.15, + "learning_rate": 1.6925556289076152e-07, + "loss": 0.0067, + "step": 7967 + }, + { + "epoch": 0.15, + "learning_rate": 1.6925167954642536e-07, + "loss": 0.0116, + "step": 7968 + }, + { + "epoch": 0.15, + "learning_rate": 1.6924779620208923e-07, + "loss": 0.0054, + "step": 7969 + }, + { + "epoch": 0.15, + "learning_rate": 1.6924391285775308e-07, + "loss": 0.0053, + "step": 7970 + }, + { + "epoch": 0.15, + "learning_rate": 1.6924002951341695e-07, + "loss": 0.0056, + "step": 7971 + }, + { + "epoch": 0.15, + "learning_rate": 1.692361461690808e-07, + "loss": 0.0069, + "step": 7972 + }, + { + "epoch": 0.15, + "learning_rate": 1.6923226282474467e-07, + "loss": 0.0066, + "step": 7973 + }, + { + "epoch": 0.15, + "learning_rate": 1.692283794804085e-07, + "loss": 0.0075, + "step": 7974 + }, + { + "epoch": 0.15, + "learning_rate": 1.6922449613607238e-07, + "loss": 0.1256, + "step": 7975 + }, + { + "epoch": 0.15, + "learning_rate": 1.6922061279173623e-07, + "loss": 0.7111, + "step": 7976 + }, + { + "epoch": 0.15, + "learning_rate": 1.692167294474001e-07, + "loss": 0.0519, + "step": 7977 + }, + { + "epoch": 0.15, + "learning_rate": 1.6921284610306394e-07, + "loss": 0.7552, + "step": 7978 + }, + { + "epoch": 0.15, + "learning_rate": 1.6920896275872781e-07, + "loss": 0.0064, + "step": 7979 + }, + { + "epoch": 0.15, + "learning_rate": 1.6920507941439166e-07, + "loss": 0.0091, + "step": 7980 + }, + { + "epoch": 0.15, + "learning_rate": 1.6920119607005553e-07, + "loss": 0.0056, + "step": 7981 + }, + { + "epoch": 0.15, + "learning_rate": 1.6919731272571938e-07, + "loss": 0.0121, + "step": 7982 + }, + { + "epoch": 0.15, + "learning_rate": 1.6919342938138325e-07, + "loss": 0.0083, + "step": 7983 + }, + { + "epoch": 0.15, + "learning_rate": 1.691895460370471e-07, + "loss": 0.0373, + "step": 7984 + }, + { + "epoch": 0.15, + "learning_rate": 1.6918566269271094e-07, + "loss": 0.061, + "step": 7985 + }, + { + "epoch": 0.15, + "learning_rate": 1.691817793483748e-07, + "loss": 0.7206, + "step": 7986 + }, + { + "epoch": 0.15, + "learning_rate": 1.6917789600403865e-07, + "loss": 0.0231, + "step": 7987 + }, + { + "epoch": 0.15, + "learning_rate": 1.6917401265970253e-07, + "loss": 0.0075, + "step": 7988 + }, + { + "epoch": 0.15, + "learning_rate": 1.6917012931536637e-07, + "loss": 0.6876, + "step": 7989 + }, + { + "epoch": 0.15, + "learning_rate": 1.6916624597103024e-07, + "loss": 0.0089, + "step": 7990 + }, + { + "epoch": 0.16, + "learning_rate": 1.691623626266941e-07, + "loss": 0.0064, + "step": 7991 + }, + { + "epoch": 0.16, + "learning_rate": 1.6915847928235796e-07, + "loss": 0.4747, + "step": 7992 + }, + { + "epoch": 0.16, + "learning_rate": 1.691545959380218e-07, + "loss": 0.0071, + "step": 7993 + }, + { + "epoch": 0.16, + "learning_rate": 1.6915071259368568e-07, + "loss": 0.0148, + "step": 7994 + }, + { + "epoch": 0.16, + "learning_rate": 1.6914682924934952e-07, + "loss": 0.0055, + "step": 7995 + }, + { + "epoch": 0.16, + "learning_rate": 1.691429459050134e-07, + "loss": 0.0048, + "step": 7996 + }, + { + "epoch": 0.16, + "learning_rate": 1.6913906256067724e-07, + "loss": 0.0065, + "step": 7997 + }, + { + "epoch": 0.16, + "learning_rate": 1.691351792163411e-07, + "loss": 0.4172, + "step": 7998 + }, + { + "epoch": 0.16, + "learning_rate": 1.6913129587200495e-07, + "loss": 0.0073, + "step": 7999 + }, + { + "epoch": 0.16, + "learning_rate": 1.6912741252766882e-07, + "loss": 0.0054, + "step": 8000 + }, + { + "epoch": 0.16, + "learning_rate": 1.6912352918333267e-07, + "loss": 0.0056, + "step": 8001 + }, + { + "epoch": 0.16, + "learning_rate": 1.6911964583899654e-07, + "loss": 0.0934, + "step": 8002 + }, + { + "epoch": 0.16, + "learning_rate": 1.6911576249466039e-07, + "loss": 0.442, + "step": 8003 + }, + { + "epoch": 0.16, + "learning_rate": 1.6911187915032426e-07, + "loss": 0.0065, + "step": 8004 + }, + { + "epoch": 0.16, + "learning_rate": 1.691079958059881e-07, + "loss": 0.1984, + "step": 8005 + }, + { + "epoch": 0.16, + "learning_rate": 1.6910411246165197e-07, + "loss": 0.0082, + "step": 8006 + }, + { + "epoch": 0.16, + "learning_rate": 1.6910022911731582e-07, + "loss": 0.007, + "step": 8007 + }, + { + "epoch": 0.16, + "learning_rate": 1.690963457729797e-07, + "loss": 0.0048, + "step": 8008 + }, + { + "epoch": 0.16, + "learning_rate": 1.6909246242864354e-07, + "loss": 0.0063, + "step": 8009 + }, + { + "epoch": 0.16, + "learning_rate": 1.690885790843074e-07, + "loss": 0.051, + "step": 8010 + }, + { + "epoch": 0.16, + "learning_rate": 1.6908469573997125e-07, + "loss": 0.0042, + "step": 8011 + }, + { + "epoch": 0.16, + "learning_rate": 1.6908081239563512e-07, + "loss": 0.0049, + "step": 8012 + }, + { + "epoch": 0.16, + "learning_rate": 1.6907692905129897e-07, + "loss": 0.0052, + "step": 8013 + }, + { + "epoch": 0.16, + "learning_rate": 1.6907304570696284e-07, + "loss": 0.0159, + "step": 8014 + }, + { + "epoch": 0.16, + "learning_rate": 1.6906916236262669e-07, + "loss": 0.1061, + "step": 8015 + }, + { + "epoch": 0.16, + "learning_rate": 1.6906527901829056e-07, + "loss": 0.0071, + "step": 8016 + }, + { + "epoch": 0.16, + "learning_rate": 1.690613956739544e-07, + "loss": 0.0117, + "step": 8017 + }, + { + "epoch": 0.16, + "learning_rate": 1.6905751232961827e-07, + "loss": 0.0083, + "step": 8018 + }, + { + "epoch": 0.16, + "learning_rate": 1.6905362898528212e-07, + "loss": 0.0042, + "step": 8019 + }, + { + "epoch": 0.16, + "learning_rate": 1.69049745640946e-07, + "loss": 0.018, + "step": 8020 + }, + { + "epoch": 0.16, + "learning_rate": 1.6904586229660983e-07, + "loss": 0.0056, + "step": 8021 + }, + { + "epoch": 0.16, + "learning_rate": 1.690419789522737e-07, + "loss": 1.0878, + "step": 8022 + }, + { + "epoch": 0.16, + "learning_rate": 1.6903809560793755e-07, + "loss": 0.0074, + "step": 8023 + }, + { + "epoch": 0.16, + "learning_rate": 1.6903421226360142e-07, + "loss": 0.0227, + "step": 8024 + }, + { + "epoch": 0.16, + "learning_rate": 1.6903032891926524e-07, + "loss": 0.7146, + "step": 8025 + }, + { + "epoch": 0.16, + "learning_rate": 1.690264455749291e-07, + "loss": 0.0064, + "step": 8026 + }, + { + "epoch": 0.16, + "learning_rate": 1.6902256223059296e-07, + "loss": 0.352, + "step": 8027 + }, + { + "epoch": 0.16, + "learning_rate": 1.6901867888625683e-07, + "loss": 0.092, + "step": 8028 + }, + { + "epoch": 0.16, + "learning_rate": 1.6901479554192067e-07, + "loss": 1.0337, + "step": 8029 + }, + { + "epoch": 0.16, + "learning_rate": 1.6901091219758455e-07, + "loss": 0.4523, + "step": 8030 + }, + { + "epoch": 0.16, + "learning_rate": 1.690070288532484e-07, + "loss": 0.0062, + "step": 8031 + }, + { + "epoch": 0.16, + "learning_rate": 1.6900314550891226e-07, + "loss": 0.0165, + "step": 8032 + }, + { + "epoch": 0.16, + "learning_rate": 1.689992621645761e-07, + "loss": 0.0066, + "step": 8033 + }, + { + "epoch": 0.16, + "learning_rate": 1.6899537882023998e-07, + "loss": 0.0055, + "step": 8034 + }, + { + "epoch": 0.16, + "learning_rate": 1.6899149547590382e-07, + "loss": 0.0064, + "step": 8035 + }, + { + "epoch": 0.16, + "learning_rate": 1.689876121315677e-07, + "loss": 0.0218, + "step": 8036 + }, + { + "epoch": 0.16, + "learning_rate": 1.6898372878723154e-07, + "loss": 0.0053, + "step": 8037 + }, + { + "epoch": 0.16, + "learning_rate": 1.689798454428954e-07, + "loss": 0.0071, + "step": 8038 + }, + { + "epoch": 0.16, + "learning_rate": 1.6897596209855926e-07, + "loss": 0.0082, + "step": 8039 + }, + { + "epoch": 0.16, + "learning_rate": 1.6897207875422313e-07, + "loss": 0.0227, + "step": 8040 + }, + { + "epoch": 0.16, + "learning_rate": 1.6896819540988697e-07, + "loss": 0.2932, + "step": 8041 + }, + { + "epoch": 0.16, + "learning_rate": 1.6896431206555084e-07, + "loss": 0.005, + "step": 8042 + }, + { + "epoch": 0.16, + "learning_rate": 1.689604287212147e-07, + "loss": 0.0056, + "step": 8043 + }, + { + "epoch": 0.16, + "learning_rate": 1.6895654537687856e-07, + "loss": 0.0071, + "step": 8044 + }, + { + "epoch": 0.16, + "learning_rate": 1.689526620325424e-07, + "loss": 0.0548, + "step": 8045 + }, + { + "epoch": 0.16, + "learning_rate": 1.6894877868820628e-07, + "loss": 0.3557, + "step": 8046 + }, + { + "epoch": 0.16, + "learning_rate": 1.6894489534387012e-07, + "loss": 0.0042, + "step": 8047 + }, + { + "epoch": 0.16, + "learning_rate": 1.68941011999534e-07, + "loss": 0.0063, + "step": 8048 + }, + { + "epoch": 0.16, + "learning_rate": 1.6893712865519784e-07, + "loss": 0.0055, + "step": 8049 + }, + { + "epoch": 0.16, + "learning_rate": 1.689332453108617e-07, + "loss": 0.1317, + "step": 8050 + }, + { + "epoch": 0.16, + "learning_rate": 1.6892936196652556e-07, + "loss": 0.011, + "step": 8051 + }, + { + "epoch": 0.16, + "learning_rate": 1.6892547862218943e-07, + "loss": 0.0472, + "step": 8052 + }, + { + "epoch": 0.16, + "learning_rate": 1.6892159527785327e-07, + "loss": 0.3208, + "step": 8053 + }, + { + "epoch": 0.16, + "learning_rate": 1.6891771193351714e-07, + "loss": 0.0062, + "step": 8054 + }, + { + "epoch": 0.16, + "learning_rate": 1.68913828589181e-07, + "loss": 0.3591, + "step": 8055 + }, + { + "epoch": 0.16, + "learning_rate": 1.6890994524484486e-07, + "loss": 0.0048, + "step": 8056 + }, + { + "epoch": 0.16, + "learning_rate": 1.689060619005087e-07, + "loss": 0.0847, + "step": 8057 + }, + { + "epoch": 0.16, + "learning_rate": 1.6890217855617258e-07, + "loss": 0.0968, + "step": 8058 + }, + { + "epoch": 0.16, + "learning_rate": 1.6889829521183642e-07, + "loss": 0.0067, + "step": 8059 + }, + { + "epoch": 0.16, + "learning_rate": 1.688944118675003e-07, + "loss": 0.3885, + "step": 8060 + }, + { + "epoch": 0.16, + "learning_rate": 1.6889052852316414e-07, + "loss": 0.4186, + "step": 8061 + }, + { + "epoch": 0.16, + "learning_rate": 1.68886645178828e-07, + "loss": 0.0143, + "step": 8062 + }, + { + "epoch": 0.16, + "learning_rate": 1.6888276183449185e-07, + "loss": 0.0173, + "step": 8063 + }, + { + "epoch": 0.16, + "learning_rate": 1.6887887849015573e-07, + "loss": 0.0113, + "step": 8064 + }, + { + "epoch": 0.16, + "learning_rate": 1.6887499514581957e-07, + "loss": 0.0061, + "step": 8065 + }, + { + "epoch": 0.16, + "learning_rate": 1.6887111180148344e-07, + "loss": 0.0384, + "step": 8066 + }, + { + "epoch": 0.16, + "learning_rate": 1.688672284571473e-07, + "loss": 0.2953, + "step": 8067 + }, + { + "epoch": 0.16, + "learning_rate": 1.6886334511281116e-07, + "loss": 0.0075, + "step": 8068 + }, + { + "epoch": 0.16, + "learning_rate": 1.68859461768475e-07, + "loss": 0.0051, + "step": 8069 + }, + { + "epoch": 0.16, + "learning_rate": 1.6885557842413888e-07, + "loss": 0.0058, + "step": 8070 + }, + { + "epoch": 0.16, + "learning_rate": 1.6885169507980272e-07, + "loss": 0.0068, + "step": 8071 + }, + { + "epoch": 0.16, + "learning_rate": 1.688478117354666e-07, + "loss": 0.0047, + "step": 8072 + }, + { + "epoch": 0.16, + "learning_rate": 1.6884392839113044e-07, + "loss": 0.0057, + "step": 8073 + }, + { + "epoch": 0.16, + "learning_rate": 1.688400450467943e-07, + "loss": 0.0053, + "step": 8074 + }, + { + "epoch": 0.16, + "learning_rate": 1.6883616170245815e-07, + "loss": 0.0123, + "step": 8075 + }, + { + "epoch": 0.16, + "learning_rate": 1.6883227835812202e-07, + "loss": 0.7576, + "step": 8076 + }, + { + "epoch": 0.16, + "learning_rate": 1.6882839501378587e-07, + "loss": 0.0054, + "step": 8077 + }, + { + "epoch": 0.16, + "learning_rate": 1.6882451166944974e-07, + "loss": 0.8549, + "step": 8078 + }, + { + "epoch": 0.16, + "learning_rate": 1.6882062832511359e-07, + "loss": 0.0425, + "step": 8079 + }, + { + "epoch": 0.16, + "learning_rate": 1.6881674498077746e-07, + "loss": 0.0178, + "step": 8080 + }, + { + "epoch": 0.16, + "learning_rate": 1.688128616364413e-07, + "loss": 0.0067, + "step": 8081 + }, + { + "epoch": 0.16, + "learning_rate": 1.6880897829210517e-07, + "loss": 0.0712, + "step": 8082 + }, + { + "epoch": 0.16, + "learning_rate": 1.68805094947769e-07, + "loss": 0.0064, + "step": 8083 + }, + { + "epoch": 0.16, + "learning_rate": 1.6880121160343286e-07, + "loss": 0.4617, + "step": 8084 + }, + { + "epoch": 0.16, + "learning_rate": 1.687973282590967e-07, + "loss": 0.0049, + "step": 8085 + }, + { + "epoch": 0.16, + "learning_rate": 1.6879344491476058e-07, + "loss": 0.0069, + "step": 8086 + }, + { + "epoch": 0.16, + "learning_rate": 1.6878956157042443e-07, + "loss": 0.004, + "step": 8087 + }, + { + "epoch": 0.16, + "learning_rate": 1.687856782260883e-07, + "loss": 0.0153, + "step": 8088 + }, + { + "epoch": 0.16, + "learning_rate": 1.6878179488175214e-07, + "loss": 0.0046, + "step": 8089 + }, + { + "epoch": 0.16, + "learning_rate": 1.6877791153741601e-07, + "loss": 0.4333, + "step": 8090 + }, + { + "epoch": 0.16, + "learning_rate": 1.6877402819307986e-07, + "loss": 0.1924, + "step": 8091 + }, + { + "epoch": 0.16, + "learning_rate": 1.6877014484874373e-07, + "loss": 0.005, + "step": 8092 + }, + { + "epoch": 0.16, + "learning_rate": 1.6876626150440758e-07, + "loss": 0.0089, + "step": 8093 + }, + { + "epoch": 0.16, + "learning_rate": 1.6876237816007145e-07, + "loss": 0.4348, + "step": 8094 + }, + { + "epoch": 0.16, + "learning_rate": 1.687584948157353e-07, + "loss": 0.0065, + "step": 8095 + }, + { + "epoch": 0.16, + "learning_rate": 1.6875461147139916e-07, + "loss": 0.0062, + "step": 8096 + }, + { + "epoch": 0.16, + "learning_rate": 1.68750728127063e-07, + "loss": 0.0062, + "step": 8097 + }, + { + "epoch": 0.16, + "learning_rate": 1.6874684478272688e-07, + "loss": 0.0097, + "step": 8098 + }, + { + "epoch": 0.16, + "learning_rate": 1.6874296143839072e-07, + "loss": 0.0052, + "step": 8099 + }, + { + "epoch": 0.16, + "learning_rate": 1.687390780940546e-07, + "loss": 0.0055, + "step": 8100 + }, + { + "epoch": 0.16, + "learning_rate": 1.6873519474971844e-07, + "loss": 0.0147, + "step": 8101 + }, + { + "epoch": 0.16, + "learning_rate": 1.687313114053823e-07, + "loss": 0.0096, + "step": 8102 + }, + { + "epoch": 0.16, + "learning_rate": 1.6872742806104616e-07, + "loss": 0.0067, + "step": 8103 + }, + { + "epoch": 0.16, + "learning_rate": 1.6872354471671003e-07, + "loss": 0.015, + "step": 8104 + }, + { + "epoch": 0.16, + "learning_rate": 1.6871966137237387e-07, + "loss": 0.0136, + "step": 8105 + }, + { + "epoch": 0.16, + "learning_rate": 1.6871577802803775e-07, + "loss": 0.0069, + "step": 8106 + }, + { + "epoch": 0.16, + "learning_rate": 1.687118946837016e-07, + "loss": 0.0054, + "step": 8107 + }, + { + "epoch": 0.16, + "learning_rate": 1.6870801133936546e-07, + "loss": 0.7385, + "step": 8108 + }, + { + "epoch": 0.16, + "learning_rate": 1.687041279950293e-07, + "loss": 0.0042, + "step": 8109 + }, + { + "epoch": 0.16, + "learning_rate": 1.6870024465069318e-07, + "loss": 0.51, + "step": 8110 + }, + { + "epoch": 0.16, + "learning_rate": 1.6869636130635702e-07, + "loss": 0.0064, + "step": 8111 + }, + { + "epoch": 0.16, + "learning_rate": 1.686924779620209e-07, + "loss": 0.1739, + "step": 8112 + }, + { + "epoch": 0.16, + "learning_rate": 1.6868859461768474e-07, + "loss": 0.0694, + "step": 8113 + }, + { + "epoch": 0.16, + "learning_rate": 1.686847112733486e-07, + "loss": 0.0058, + "step": 8114 + }, + { + "epoch": 0.16, + "learning_rate": 1.6868082792901246e-07, + "loss": 0.1952, + "step": 8115 + }, + { + "epoch": 0.16, + "learning_rate": 1.6867694458467633e-07, + "loss": 0.0354, + "step": 8116 + }, + { + "epoch": 0.16, + "learning_rate": 1.6867306124034017e-07, + "loss": 0.0048, + "step": 8117 + }, + { + "epoch": 0.16, + "learning_rate": 1.6866917789600404e-07, + "loss": 0.034, + "step": 8118 + }, + { + "epoch": 0.16, + "learning_rate": 1.686652945516679e-07, + "loss": 0.0076, + "step": 8119 + }, + { + "epoch": 0.16, + "learning_rate": 1.6866141120733176e-07, + "loss": 0.0384, + "step": 8120 + }, + { + "epoch": 0.16, + "learning_rate": 1.686575278629956e-07, + "loss": 0.01, + "step": 8121 + }, + { + "epoch": 0.16, + "learning_rate": 1.6865364451865948e-07, + "loss": 0.3032, + "step": 8122 + }, + { + "epoch": 0.16, + "learning_rate": 1.6864976117432332e-07, + "loss": 0.0081, + "step": 8123 + }, + { + "epoch": 0.16, + "learning_rate": 1.686458778299872e-07, + "loss": 0.0074, + "step": 8124 + }, + { + "epoch": 0.16, + "learning_rate": 1.6864199448565104e-07, + "loss": 0.0088, + "step": 8125 + }, + { + "epoch": 0.16, + "learning_rate": 1.686381111413149e-07, + "loss": 0.0117, + "step": 8126 + }, + { + "epoch": 0.16, + "learning_rate": 1.6863422779697876e-07, + "loss": 0.053, + "step": 8127 + }, + { + "epoch": 0.16, + "learning_rate": 1.6863034445264263e-07, + "loss": 0.0046, + "step": 8128 + }, + { + "epoch": 0.16, + "learning_rate": 1.6862646110830647e-07, + "loss": 0.3723, + "step": 8129 + }, + { + "epoch": 0.16, + "learning_rate": 1.6862257776397034e-07, + "loss": 0.4459, + "step": 8130 + }, + { + "epoch": 0.16, + "learning_rate": 1.686186944196342e-07, + "loss": 0.0365, + "step": 8131 + }, + { + "epoch": 0.16, + "learning_rate": 1.6861481107529806e-07, + "loss": 0.0136, + "step": 8132 + }, + { + "epoch": 0.16, + "learning_rate": 1.686109277309619e-07, + "loss": 0.0062, + "step": 8133 + }, + { + "epoch": 0.16, + "learning_rate": 1.6860704438662575e-07, + "loss": 0.0046, + "step": 8134 + }, + { + "epoch": 0.16, + "learning_rate": 1.6860316104228962e-07, + "loss": 0.0049, + "step": 8135 + }, + { + "epoch": 0.16, + "learning_rate": 1.6859927769795347e-07, + "loss": 0.0067, + "step": 8136 + }, + { + "epoch": 0.16, + "learning_rate": 1.6859539435361734e-07, + "loss": 0.0046, + "step": 8137 + }, + { + "epoch": 0.16, + "learning_rate": 1.6859151100928118e-07, + "loss": 0.2789, + "step": 8138 + }, + { + "epoch": 0.16, + "learning_rate": 1.6858762766494505e-07, + "loss": 0.0084, + "step": 8139 + }, + { + "epoch": 0.16, + "learning_rate": 1.685837443206089e-07, + "loss": 0.0039, + "step": 8140 + }, + { + "epoch": 0.16, + "learning_rate": 1.6857986097627274e-07, + "loss": 0.0285, + "step": 8141 + }, + { + "epoch": 0.16, + "learning_rate": 1.6857597763193662e-07, + "loss": 0.8619, + "step": 8142 + }, + { + "epoch": 0.16, + "learning_rate": 1.6857209428760046e-07, + "loss": 0.0037, + "step": 8143 + }, + { + "epoch": 0.16, + "learning_rate": 1.6856821094326433e-07, + "loss": 0.0459, + "step": 8144 + }, + { + "epoch": 0.16, + "learning_rate": 1.6856432759892818e-07, + "loss": 0.6613, + "step": 8145 + }, + { + "epoch": 0.16, + "learning_rate": 1.6856044425459205e-07, + "loss": 0.0058, + "step": 8146 + }, + { + "epoch": 0.16, + "learning_rate": 1.685565609102559e-07, + "loss": 0.0608, + "step": 8147 + }, + { + "epoch": 0.16, + "learning_rate": 1.6855267756591977e-07, + "loss": 0.0056, + "step": 8148 + }, + { + "epoch": 0.16, + "learning_rate": 1.685487942215836e-07, + "loss": 0.2741, + "step": 8149 + }, + { + "epoch": 0.16, + "learning_rate": 1.6854491087724748e-07, + "loss": 0.0448, + "step": 8150 + }, + { + "epoch": 0.16, + "learning_rate": 1.6854102753291133e-07, + "loss": 0.0049, + "step": 8151 + }, + { + "epoch": 0.16, + "learning_rate": 1.685371441885752e-07, + "loss": 0.0047, + "step": 8152 + }, + { + "epoch": 0.16, + "learning_rate": 1.6853326084423904e-07, + "loss": 0.005, + "step": 8153 + }, + { + "epoch": 0.16, + "learning_rate": 1.6852937749990291e-07, + "loss": 0.036, + "step": 8154 + }, + { + "epoch": 0.16, + "learning_rate": 1.6852549415556676e-07, + "loss": 0.3313, + "step": 8155 + }, + { + "epoch": 0.16, + "learning_rate": 1.6852161081123063e-07, + "loss": 0.0908, + "step": 8156 + }, + { + "epoch": 0.16, + "learning_rate": 1.6851772746689448e-07, + "loss": 0.4565, + "step": 8157 + }, + { + "epoch": 0.16, + "learning_rate": 1.6851384412255835e-07, + "loss": 0.0055, + "step": 8158 + }, + { + "epoch": 0.16, + "learning_rate": 1.685099607782222e-07, + "loss": 0.0157, + "step": 8159 + }, + { + "epoch": 0.16, + "learning_rate": 1.6850607743388606e-07, + "loss": 0.1351, + "step": 8160 + }, + { + "epoch": 0.16, + "learning_rate": 1.685021940895499e-07, + "loss": 0.0048, + "step": 8161 + }, + { + "epoch": 0.16, + "learning_rate": 1.6849831074521375e-07, + "loss": 0.0052, + "step": 8162 + }, + { + "epoch": 0.16, + "learning_rate": 1.6849442740087763e-07, + "loss": 0.0047, + "step": 8163 + }, + { + "epoch": 0.16, + "learning_rate": 1.6849054405654147e-07, + "loss": 0.0401, + "step": 8164 + }, + { + "epoch": 0.16, + "learning_rate": 1.6848666071220534e-07, + "loss": 0.0225, + "step": 8165 + }, + { + "epoch": 0.16, + "learning_rate": 1.684827773678692e-07, + "loss": 0.5143, + "step": 8166 + }, + { + "epoch": 0.16, + "learning_rate": 1.6847889402353306e-07, + "loss": 0.0049, + "step": 8167 + }, + { + "epoch": 0.16, + "learning_rate": 1.684750106791969e-07, + "loss": 0.0046, + "step": 8168 + }, + { + "epoch": 0.16, + "learning_rate": 1.6847112733486078e-07, + "loss": 0.3988, + "step": 8169 + }, + { + "epoch": 0.16, + "learning_rate": 1.6846724399052462e-07, + "loss": 0.0059, + "step": 8170 + }, + { + "epoch": 0.16, + "learning_rate": 1.684633606461885e-07, + "loss": 0.0057, + "step": 8171 + }, + { + "epoch": 0.16, + "learning_rate": 1.6845947730185234e-07, + "loss": 0.0256, + "step": 8172 + }, + { + "epoch": 0.16, + "learning_rate": 1.684555939575162e-07, + "loss": 0.0224, + "step": 8173 + }, + { + "epoch": 0.16, + "learning_rate": 1.6845171061318005e-07, + "loss": 0.0043, + "step": 8174 + }, + { + "epoch": 0.16, + "learning_rate": 1.6844782726884392e-07, + "loss": 0.1036, + "step": 8175 + }, + { + "epoch": 0.16, + "learning_rate": 1.6844394392450777e-07, + "loss": 0.0048, + "step": 8176 + }, + { + "epoch": 0.16, + "learning_rate": 1.6844006058017164e-07, + "loss": 0.0293, + "step": 8177 + }, + { + "epoch": 0.16, + "learning_rate": 1.6843617723583549e-07, + "loss": 0.0054, + "step": 8178 + }, + { + "epoch": 0.16, + "learning_rate": 1.6843229389149936e-07, + "loss": 0.832, + "step": 8179 + }, + { + "epoch": 0.16, + "learning_rate": 1.684284105471632e-07, + "loss": 0.0052, + "step": 8180 + }, + { + "epoch": 0.16, + "learning_rate": 1.6842452720282707e-07, + "loss": 0.0041, + "step": 8181 + }, + { + "epoch": 0.16, + "learning_rate": 1.6842064385849092e-07, + "loss": 0.0043, + "step": 8182 + }, + { + "epoch": 0.16, + "learning_rate": 1.684167605141548e-07, + "loss": 0.5408, + "step": 8183 + }, + { + "epoch": 0.16, + "learning_rate": 1.6841287716981864e-07, + "loss": 0.006, + "step": 8184 + }, + { + "epoch": 0.16, + "learning_rate": 1.684089938254825e-07, + "loss": 0.0044, + "step": 8185 + }, + { + "epoch": 0.16, + "learning_rate": 1.6840511048114635e-07, + "loss": 0.0254, + "step": 8186 + }, + { + "epoch": 0.16, + "learning_rate": 1.6840122713681022e-07, + "loss": 0.0083, + "step": 8187 + }, + { + "epoch": 0.16, + "learning_rate": 1.6839734379247407e-07, + "loss": 0.0055, + "step": 8188 + }, + { + "epoch": 0.16, + "learning_rate": 1.6839346044813794e-07, + "loss": 0.0106, + "step": 8189 + }, + { + "epoch": 0.16, + "learning_rate": 1.6838957710380179e-07, + "loss": 0.0164, + "step": 8190 + }, + { + "epoch": 0.16, + "learning_rate": 1.6838569375946566e-07, + "loss": 0.012, + "step": 8191 + }, + { + "epoch": 0.16, + "learning_rate": 1.683818104151295e-07, + "loss": 0.0224, + "step": 8192 + }, + { + "epoch": 0.16, + "learning_rate": 1.6837792707079337e-07, + "loss": 0.3991, + "step": 8193 + }, + { + "epoch": 0.16, + "learning_rate": 1.6837404372645722e-07, + "loss": 0.1268, + "step": 8194 + }, + { + "epoch": 0.16, + "learning_rate": 1.683701603821211e-07, + "loss": 0.0176, + "step": 8195 + }, + { + "epoch": 0.16, + "learning_rate": 1.6836627703778493e-07, + "loss": 0.2472, + "step": 8196 + }, + { + "epoch": 0.16, + "learning_rate": 1.683623936934488e-07, + "loss": 0.0047, + "step": 8197 + }, + { + "epoch": 0.16, + "learning_rate": 1.6835851034911265e-07, + "loss": 0.0049, + "step": 8198 + }, + { + "epoch": 0.16, + "learning_rate": 1.683546270047765e-07, + "loss": 0.0056, + "step": 8199 + }, + { + "epoch": 0.16, + "learning_rate": 1.6835074366044034e-07, + "loss": 0.0061, + "step": 8200 + }, + { + "epoch": 0.16, + "learning_rate": 1.683468603161042e-07, + "loss": 0.0325, + "step": 8201 + }, + { + "epoch": 0.16, + "learning_rate": 1.6834297697176806e-07, + "loss": 0.0229, + "step": 8202 + }, + { + "epoch": 0.16, + "learning_rate": 1.6833909362743193e-07, + "loss": 0.1145, + "step": 8203 + }, + { + "epoch": 0.16, + "learning_rate": 1.6833521028309577e-07, + "loss": 0.0085, + "step": 8204 + }, + { + "epoch": 0.16, + "learning_rate": 1.6833132693875965e-07, + "loss": 0.5964, + "step": 8205 + }, + { + "epoch": 0.16, + "learning_rate": 1.683274435944235e-07, + "loss": 0.7345, + "step": 8206 + }, + { + "epoch": 0.16, + "learning_rate": 1.6832356025008736e-07, + "loss": 0.1046, + "step": 8207 + }, + { + "epoch": 0.16, + "learning_rate": 1.683196769057512e-07, + "loss": 0.2189, + "step": 8208 + }, + { + "epoch": 0.16, + "learning_rate": 1.6831579356141508e-07, + "loss": 0.0141, + "step": 8209 + }, + { + "epoch": 0.16, + "learning_rate": 1.6831191021707892e-07, + "loss": 0.0046, + "step": 8210 + }, + { + "epoch": 0.16, + "learning_rate": 1.683080268727428e-07, + "loss": 0.0064, + "step": 8211 + }, + { + "epoch": 0.16, + "learning_rate": 1.6830414352840664e-07, + "loss": 0.0234, + "step": 8212 + }, + { + "epoch": 0.16, + "learning_rate": 1.683002601840705e-07, + "loss": 0.0071, + "step": 8213 + }, + { + "epoch": 0.16, + "learning_rate": 1.6829637683973436e-07, + "loss": 0.0047, + "step": 8214 + }, + { + "epoch": 0.16, + "learning_rate": 1.6829249349539823e-07, + "loss": 0.0059, + "step": 8215 + }, + { + "epoch": 0.16, + "learning_rate": 1.6828861015106207e-07, + "loss": 0.0086, + "step": 8216 + }, + { + "epoch": 0.16, + "learning_rate": 1.6828472680672594e-07, + "loss": 0.013, + "step": 8217 + }, + { + "epoch": 0.16, + "learning_rate": 1.682808434623898e-07, + "loss": 0.0926, + "step": 8218 + }, + { + "epoch": 0.16, + "learning_rate": 1.6827696011805366e-07, + "loss": 0.0056, + "step": 8219 + }, + { + "epoch": 0.16, + "learning_rate": 1.682730767737175e-07, + "loss": 0.0049, + "step": 8220 + }, + { + "epoch": 0.16, + "learning_rate": 1.6826919342938138e-07, + "loss": 0.0352, + "step": 8221 + }, + { + "epoch": 0.16, + "learning_rate": 1.6826531008504522e-07, + "loss": 0.0599, + "step": 8222 + }, + { + "epoch": 0.16, + "learning_rate": 1.682614267407091e-07, + "loss": 0.052, + "step": 8223 + }, + { + "epoch": 0.16, + "learning_rate": 1.6825754339637294e-07, + "loss": 0.0051, + "step": 8224 + }, + { + "epoch": 0.16, + "learning_rate": 1.682536600520368e-07, + "loss": 0.041, + "step": 8225 + }, + { + "epoch": 0.16, + "learning_rate": 1.6824977670770066e-07, + "loss": 0.0053, + "step": 8226 + }, + { + "epoch": 0.16, + "learning_rate": 1.6824589336336453e-07, + "loss": 0.0044, + "step": 8227 + }, + { + "epoch": 0.16, + "learning_rate": 1.6824201001902837e-07, + "loss": 1.0944, + "step": 8228 + }, + { + "epoch": 0.16, + "learning_rate": 1.6823812667469224e-07, + "loss": 0.0041, + "step": 8229 + }, + { + "epoch": 0.16, + "learning_rate": 1.682342433303561e-07, + "loss": 0.0047, + "step": 8230 + }, + { + "epoch": 0.16, + "learning_rate": 1.6823035998601996e-07, + "loss": 0.0048, + "step": 8231 + }, + { + "epoch": 0.16, + "learning_rate": 1.682264766416838e-07, + "loss": 0.0042, + "step": 8232 + }, + { + "epoch": 0.16, + "learning_rate": 1.6822259329734768e-07, + "loss": 0.0042, + "step": 8233 + }, + { + "epoch": 0.16, + "learning_rate": 1.6821870995301152e-07, + "loss": 0.0047, + "step": 8234 + }, + { + "epoch": 0.16, + "learning_rate": 1.682148266086754e-07, + "loss": 0.0053, + "step": 8235 + }, + { + "epoch": 0.16, + "learning_rate": 1.6821094326433924e-07, + "loss": 0.127, + "step": 8236 + }, + { + "epoch": 0.16, + "learning_rate": 1.682070599200031e-07, + "loss": 0.0711, + "step": 8237 + }, + { + "epoch": 0.16, + "learning_rate": 1.6820317657566695e-07, + "loss": 0.0068, + "step": 8238 + }, + { + "epoch": 0.16, + "learning_rate": 1.6819929323133083e-07, + "loss": 0.0069, + "step": 8239 + }, + { + "epoch": 0.16, + "learning_rate": 1.6819540988699467e-07, + "loss": 0.0047, + "step": 8240 + }, + { + "epoch": 0.16, + "learning_rate": 1.6819152654265854e-07, + "loss": 0.0054, + "step": 8241 + }, + { + "epoch": 0.16, + "learning_rate": 1.681876431983224e-07, + "loss": 0.0047, + "step": 8242 + }, + { + "epoch": 0.16, + "learning_rate": 1.6818375985398626e-07, + "loss": 1.109, + "step": 8243 + }, + { + "epoch": 0.16, + "learning_rate": 1.681798765096501e-07, + "loss": 0.0047, + "step": 8244 + }, + { + "epoch": 0.16, + "learning_rate": 1.6817599316531398e-07, + "loss": 0.0055, + "step": 8245 + }, + { + "epoch": 0.16, + "learning_rate": 1.6817210982097782e-07, + "loss": 0.3835, + "step": 8246 + }, + { + "epoch": 0.16, + "learning_rate": 1.681682264766417e-07, + "loss": 0.6795, + "step": 8247 + }, + { + "epoch": 0.16, + "learning_rate": 1.6816434313230554e-07, + "loss": 0.0046, + "step": 8248 + }, + { + "epoch": 0.16, + "learning_rate": 1.681604597879694e-07, + "loss": 0.0059, + "step": 8249 + }, + { + "epoch": 0.16, + "learning_rate": 1.6815657644363325e-07, + "loss": 0.6366, + "step": 8250 + }, + { + "epoch": 0.16, + "learning_rate": 1.6815269309929712e-07, + "loss": 0.0043, + "step": 8251 + }, + { + "epoch": 0.16, + "learning_rate": 1.6814880975496097e-07, + "loss": 0.0065, + "step": 8252 + }, + { + "epoch": 0.16, + "learning_rate": 1.6814492641062484e-07, + "loss": 0.085, + "step": 8253 + }, + { + "epoch": 0.16, + "learning_rate": 1.6814104306628869e-07, + "loss": 0.0311, + "step": 8254 + }, + { + "epoch": 0.16, + "learning_rate": 1.6813715972195256e-07, + "loss": 0.023, + "step": 8255 + }, + { + "epoch": 0.16, + "learning_rate": 1.681332763776164e-07, + "loss": 0.0202, + "step": 8256 + }, + { + "epoch": 0.16, + "learning_rate": 1.6812939303328025e-07, + "loss": 0.0054, + "step": 8257 + }, + { + "epoch": 0.16, + "learning_rate": 1.681255096889441e-07, + "loss": 0.0218, + "step": 8258 + }, + { + "epoch": 0.16, + "learning_rate": 1.6812162634460796e-07, + "loss": 0.2733, + "step": 8259 + }, + { + "epoch": 0.16, + "learning_rate": 1.681177430002718e-07, + "loss": 0.2279, + "step": 8260 + }, + { + "epoch": 0.16, + "learning_rate": 1.6811385965593568e-07, + "loss": 0.0856, + "step": 8261 + }, + { + "epoch": 0.16, + "learning_rate": 1.6810997631159953e-07, + "loss": 0.0629, + "step": 8262 + }, + { + "epoch": 0.16, + "learning_rate": 1.681060929672634e-07, + "loss": 0.0341, + "step": 8263 + }, + { + "epoch": 0.16, + "learning_rate": 1.6810220962292724e-07, + "loss": 0.009, + "step": 8264 + }, + { + "epoch": 0.16, + "learning_rate": 1.6809832627859111e-07, + "loss": 0.0048, + "step": 8265 + }, + { + "epoch": 0.16, + "learning_rate": 1.6809444293425496e-07, + "loss": 0.005, + "step": 8266 + }, + { + "epoch": 0.16, + "learning_rate": 1.6809055958991883e-07, + "loss": 0.007, + "step": 8267 + }, + { + "epoch": 0.16, + "learning_rate": 1.6808667624558268e-07, + "loss": 0.0062, + "step": 8268 + }, + { + "epoch": 0.16, + "learning_rate": 1.6808279290124655e-07, + "loss": 0.0057, + "step": 8269 + }, + { + "epoch": 0.16, + "learning_rate": 1.680789095569104e-07, + "loss": 0.0134, + "step": 8270 + }, + { + "epoch": 0.16, + "learning_rate": 1.6807502621257426e-07, + "loss": 0.0052, + "step": 8271 + }, + { + "epoch": 0.16, + "learning_rate": 1.680711428682381e-07, + "loss": 0.0045, + "step": 8272 + }, + { + "epoch": 0.16, + "learning_rate": 1.6806725952390198e-07, + "loss": 0.0042, + "step": 8273 + }, + { + "epoch": 0.16, + "learning_rate": 1.6806337617956582e-07, + "loss": 0.0051, + "step": 8274 + }, + { + "epoch": 0.16, + "learning_rate": 1.680594928352297e-07, + "loss": 0.0146, + "step": 8275 + }, + { + "epoch": 0.16, + "learning_rate": 1.6805560949089354e-07, + "loss": 0.0053, + "step": 8276 + }, + { + "epoch": 0.16, + "learning_rate": 1.680517261465574e-07, + "loss": 0.0076, + "step": 8277 + }, + { + "epoch": 0.16, + "learning_rate": 1.6804784280222126e-07, + "loss": 0.0236, + "step": 8278 + }, + { + "epoch": 0.16, + "learning_rate": 1.6804395945788513e-07, + "loss": 0.1758, + "step": 8279 + }, + { + "epoch": 0.16, + "learning_rate": 1.6804007611354897e-07, + "loss": 0.0052, + "step": 8280 + }, + { + "epoch": 0.16, + "learning_rate": 1.6803619276921285e-07, + "loss": 0.0127, + "step": 8281 + }, + { + "epoch": 0.16, + "learning_rate": 1.680323094248767e-07, + "loss": 0.0061, + "step": 8282 + }, + { + "epoch": 0.16, + "learning_rate": 1.6802842608054056e-07, + "loss": 0.0074, + "step": 8283 + }, + { + "epoch": 0.16, + "learning_rate": 1.680245427362044e-07, + "loss": 0.0056, + "step": 8284 + }, + { + "epoch": 0.16, + "learning_rate": 1.6802065939186828e-07, + "loss": 0.0044, + "step": 8285 + }, + { + "epoch": 0.16, + "learning_rate": 1.6801677604753212e-07, + "loss": 0.3521, + "step": 8286 + }, + { + "epoch": 0.16, + "learning_rate": 1.68012892703196e-07, + "loss": 0.008, + "step": 8287 + }, + { + "epoch": 0.16, + "learning_rate": 1.6800900935885984e-07, + "loss": 0.011, + "step": 8288 + }, + { + "epoch": 0.16, + "learning_rate": 1.680051260145237e-07, + "loss": 0.005, + "step": 8289 + }, + { + "epoch": 0.16, + "learning_rate": 1.6800124267018756e-07, + "loss": 0.0048, + "step": 8290 + }, + { + "epoch": 0.16, + "learning_rate": 1.6799735932585143e-07, + "loss": 0.0051, + "step": 8291 + }, + { + "epoch": 0.16, + "learning_rate": 1.6799347598151527e-07, + "loss": 0.0051, + "step": 8292 + }, + { + "epoch": 0.16, + "learning_rate": 1.6798959263717914e-07, + "loss": 0.0057, + "step": 8293 + }, + { + "epoch": 0.16, + "learning_rate": 1.67985709292843e-07, + "loss": 0.0076, + "step": 8294 + }, + { + "epoch": 0.16, + "learning_rate": 1.6798182594850686e-07, + "loss": 0.0189, + "step": 8295 + }, + { + "epoch": 0.16, + "learning_rate": 1.679779426041707e-07, + "loss": 0.1936, + "step": 8296 + }, + { + "epoch": 0.16, + "learning_rate": 1.6797405925983458e-07, + "loss": 0.007, + "step": 8297 + }, + { + "epoch": 0.16, + "learning_rate": 1.6797017591549842e-07, + "loss": 0.0061, + "step": 8298 + }, + { + "epoch": 0.16, + "learning_rate": 1.679662925711623e-07, + "loss": 0.0046, + "step": 8299 + }, + { + "epoch": 0.16, + "learning_rate": 1.6796240922682614e-07, + "loss": 0.0043, + "step": 8300 + }, + { + "epoch": 0.16, + "learning_rate": 1.6795852588249e-07, + "loss": 0.0547, + "step": 8301 + }, + { + "epoch": 0.16, + "learning_rate": 1.6795464253815386e-07, + "loss": 0.0064, + "step": 8302 + }, + { + "epoch": 0.16, + "learning_rate": 1.6795075919381773e-07, + "loss": 0.1079, + "step": 8303 + }, + { + "epoch": 0.16, + "learning_rate": 1.6794687584948157e-07, + "loss": 0.0038, + "step": 8304 + }, + { + "epoch": 0.16, + "learning_rate": 1.6794299250514544e-07, + "loss": 0.0054, + "step": 8305 + }, + { + "epoch": 0.16, + "learning_rate": 1.679391091608093e-07, + "loss": 0.0041, + "step": 8306 + }, + { + "epoch": 0.16, + "learning_rate": 1.6793522581647316e-07, + "loss": 0.0045, + "step": 8307 + }, + { + "epoch": 0.16, + "learning_rate": 1.67931342472137e-07, + "loss": 0.3554, + "step": 8308 + }, + { + "epoch": 0.16, + "learning_rate": 1.6792745912780088e-07, + "loss": 0.007, + "step": 8309 + }, + { + "epoch": 0.16, + "learning_rate": 1.6792357578346472e-07, + "loss": 0.0043, + "step": 8310 + }, + { + "epoch": 0.16, + "learning_rate": 1.6791969243912857e-07, + "loss": 0.0046, + "step": 8311 + }, + { + "epoch": 0.16, + "learning_rate": 1.6791580909479244e-07, + "loss": 0.0064, + "step": 8312 + }, + { + "epoch": 0.16, + "learning_rate": 1.6791192575045628e-07, + "loss": 0.1271, + "step": 8313 + }, + { + "epoch": 0.16, + "learning_rate": 1.6790804240612015e-07, + "loss": 0.0046, + "step": 8314 + }, + { + "epoch": 0.16, + "learning_rate": 1.67904159061784e-07, + "loss": 0.0075, + "step": 8315 + }, + { + "epoch": 0.16, + "learning_rate": 1.6790027571744784e-07, + "loss": 0.0088, + "step": 8316 + }, + { + "epoch": 0.16, + "learning_rate": 1.6789639237311172e-07, + "loss": 0.1689, + "step": 8317 + }, + { + "epoch": 0.16, + "learning_rate": 1.6789250902877556e-07, + "loss": 0.0063, + "step": 8318 + }, + { + "epoch": 0.16, + "learning_rate": 1.6788862568443943e-07, + "loss": 0.0048, + "step": 8319 + }, + { + "epoch": 0.16, + "learning_rate": 1.6788474234010328e-07, + "loss": 0.0037, + "step": 8320 + }, + { + "epoch": 0.16, + "learning_rate": 1.6788085899576715e-07, + "loss": 0.0065, + "step": 8321 + }, + { + "epoch": 0.16, + "learning_rate": 1.67876975651431e-07, + "loss": 0.0116, + "step": 8322 + }, + { + "epoch": 0.16, + "learning_rate": 1.6787309230709487e-07, + "loss": 0.0126, + "step": 8323 + }, + { + "epoch": 0.16, + "learning_rate": 1.678692089627587e-07, + "loss": 0.0054, + "step": 8324 + }, + { + "epoch": 0.16, + "learning_rate": 1.6786532561842258e-07, + "loss": 0.0411, + "step": 8325 + }, + { + "epoch": 0.16, + "learning_rate": 1.6786144227408643e-07, + "loss": 1.4718, + "step": 8326 + }, + { + "epoch": 0.16, + "learning_rate": 1.678575589297503e-07, + "loss": 1.0948, + "step": 8327 + }, + { + "epoch": 0.16, + "learning_rate": 1.6785367558541414e-07, + "loss": 0.0043, + "step": 8328 + }, + { + "epoch": 0.16, + "learning_rate": 1.6784979224107801e-07, + "loss": 0.2481, + "step": 8329 + }, + { + "epoch": 0.16, + "learning_rate": 1.6784590889674186e-07, + "loss": 0.0046, + "step": 8330 + }, + { + "epoch": 0.16, + "learning_rate": 1.6784202555240573e-07, + "loss": 0.0057, + "step": 8331 + }, + { + "epoch": 0.16, + "learning_rate": 1.6783814220806958e-07, + "loss": 0.6756, + "step": 8332 + }, + { + "epoch": 0.16, + "learning_rate": 1.6783425886373345e-07, + "loss": 0.005, + "step": 8333 + }, + { + "epoch": 0.16, + "learning_rate": 1.678303755193973e-07, + "loss": 0.0307, + "step": 8334 + }, + { + "epoch": 0.16, + "learning_rate": 1.6782649217506116e-07, + "loss": 0.8031, + "step": 8335 + }, + { + "epoch": 0.16, + "learning_rate": 1.67822608830725e-07, + "loss": 0.0039, + "step": 8336 + }, + { + "epoch": 0.16, + "learning_rate": 1.6781872548638888e-07, + "loss": 0.0048, + "step": 8337 + }, + { + "epoch": 0.16, + "learning_rate": 1.6781484214205273e-07, + "loss": 0.0044, + "step": 8338 + }, + { + "epoch": 0.16, + "learning_rate": 1.6781095879771657e-07, + "loss": 0.0041, + "step": 8339 + }, + { + "epoch": 0.16, + "learning_rate": 1.6780707545338044e-07, + "loss": 0.0059, + "step": 8340 + }, + { + "epoch": 0.16, + "learning_rate": 1.678031921090443e-07, + "loss": 0.004, + "step": 8341 + }, + { + "epoch": 0.16, + "learning_rate": 1.6779930876470816e-07, + "loss": 0.0053, + "step": 8342 + }, + { + "epoch": 0.16, + "learning_rate": 1.67795425420372e-07, + "loss": 0.0047, + "step": 8343 + }, + { + "epoch": 0.16, + "learning_rate": 1.6779154207603588e-07, + "loss": 0.0048, + "step": 8344 + }, + { + "epoch": 0.16, + "learning_rate": 1.6778765873169972e-07, + "loss": 0.0154, + "step": 8345 + }, + { + "epoch": 0.16, + "learning_rate": 1.677837753873636e-07, + "loss": 0.0046, + "step": 8346 + }, + { + "epoch": 0.16, + "learning_rate": 1.6777989204302744e-07, + "loss": 0.0129, + "step": 8347 + }, + { + "epoch": 0.16, + "learning_rate": 1.677760086986913e-07, + "loss": 0.0049, + "step": 8348 + }, + { + "epoch": 0.16, + "learning_rate": 1.6777212535435515e-07, + "loss": 0.0132, + "step": 8349 + }, + { + "epoch": 0.16, + "learning_rate": 1.6776824201001902e-07, + "loss": 0.0924, + "step": 8350 + }, + { + "epoch": 0.16, + "learning_rate": 1.6776435866568287e-07, + "loss": 0.0039, + "step": 8351 + }, + { + "epoch": 0.16, + "learning_rate": 1.6776047532134674e-07, + "loss": 0.0053, + "step": 8352 + }, + { + "epoch": 0.16, + "learning_rate": 1.6775659197701059e-07, + "loss": 0.0789, + "step": 8353 + }, + { + "epoch": 0.16, + "learning_rate": 1.6775270863267446e-07, + "loss": 0.0041, + "step": 8354 + }, + { + "epoch": 0.16, + "learning_rate": 1.677488252883383e-07, + "loss": 0.4654, + "step": 8355 + }, + { + "epoch": 0.16, + "learning_rate": 1.6774494194400217e-07, + "loss": 0.0084, + "step": 8356 + }, + { + "epoch": 0.16, + "learning_rate": 1.6774105859966602e-07, + "loss": 1.3252, + "step": 8357 + }, + { + "epoch": 0.16, + "learning_rate": 1.677371752553299e-07, + "loss": 0.0178, + "step": 8358 + }, + { + "epoch": 0.16, + "learning_rate": 1.6773329191099374e-07, + "loss": 0.007, + "step": 8359 + }, + { + "epoch": 0.16, + "learning_rate": 1.677294085666576e-07, + "loss": 0.0056, + "step": 8360 + }, + { + "epoch": 0.16, + "learning_rate": 1.6772552522232145e-07, + "loss": 0.005, + "step": 8361 + }, + { + "epoch": 0.16, + "learning_rate": 1.6772164187798532e-07, + "loss": 0.5107, + "step": 8362 + }, + { + "epoch": 0.16, + "learning_rate": 1.6771775853364917e-07, + "loss": 0.2565, + "step": 8363 + }, + { + "epoch": 0.16, + "learning_rate": 1.6771387518931304e-07, + "loss": 0.0045, + "step": 8364 + }, + { + "epoch": 0.16, + "learning_rate": 1.6770999184497689e-07, + "loss": 0.0943, + "step": 8365 + }, + { + "epoch": 0.16, + "learning_rate": 1.6770610850064076e-07, + "loss": 0.0043, + "step": 8366 + }, + { + "epoch": 0.16, + "learning_rate": 1.677022251563046e-07, + "loss": 0.8436, + "step": 8367 + }, + { + "epoch": 0.16, + "learning_rate": 1.6769834181196847e-07, + "loss": 0.0224, + "step": 8368 + }, + { + "epoch": 0.16, + "learning_rate": 1.6769445846763232e-07, + "loss": 0.0071, + "step": 8369 + }, + { + "epoch": 0.16, + "learning_rate": 1.676905751232962e-07, + "loss": 0.0076, + "step": 8370 + }, + { + "epoch": 0.16, + "learning_rate": 1.6768669177896003e-07, + "loss": 0.0049, + "step": 8371 + }, + { + "epoch": 0.16, + "learning_rate": 1.676828084346239e-07, + "loss": 0.0128, + "step": 8372 + }, + { + "epoch": 0.16, + "learning_rate": 1.6767892509028772e-07, + "loss": 0.0041, + "step": 8373 + }, + { + "epoch": 0.16, + "learning_rate": 1.676750417459516e-07, + "loss": 0.0049, + "step": 8374 + }, + { + "epoch": 0.16, + "learning_rate": 1.6767115840161544e-07, + "loss": 0.2801, + "step": 8375 + }, + { + "epoch": 0.16, + "learning_rate": 1.676672750572793e-07, + "loss": 0.0137, + "step": 8376 + }, + { + "epoch": 0.16, + "learning_rate": 1.6766339171294316e-07, + "loss": 0.0046, + "step": 8377 + }, + { + "epoch": 0.16, + "learning_rate": 1.6765950836860703e-07, + "loss": 0.0069, + "step": 8378 + }, + { + "epoch": 0.16, + "learning_rate": 1.6765562502427087e-07, + "loss": 0.0143, + "step": 8379 + }, + { + "epoch": 0.16, + "learning_rate": 1.6765174167993475e-07, + "loss": 0.0405, + "step": 8380 + }, + { + "epoch": 0.16, + "learning_rate": 1.676478583355986e-07, + "loss": 0.006, + "step": 8381 + }, + { + "epoch": 0.16, + "learning_rate": 1.6764397499126246e-07, + "loss": 0.0051, + "step": 8382 + }, + { + "epoch": 0.16, + "learning_rate": 1.676400916469263e-07, + "loss": 0.0052, + "step": 8383 + }, + { + "epoch": 0.16, + "learning_rate": 1.6763620830259018e-07, + "loss": 0.0191, + "step": 8384 + }, + { + "epoch": 0.16, + "learning_rate": 1.6763232495825402e-07, + "loss": 0.0062, + "step": 8385 + }, + { + "epoch": 0.16, + "learning_rate": 1.676284416139179e-07, + "loss": 0.004, + "step": 8386 + }, + { + "epoch": 0.16, + "learning_rate": 1.6762455826958174e-07, + "loss": 0.0438, + "step": 8387 + }, + { + "epoch": 0.16, + "learning_rate": 1.676206749252456e-07, + "loss": 0.3406, + "step": 8388 + }, + { + "epoch": 0.16, + "learning_rate": 1.6761679158090946e-07, + "loss": 0.0404, + "step": 8389 + }, + { + "epoch": 0.16, + "learning_rate": 1.6761290823657333e-07, + "loss": 0.0108, + "step": 8390 + }, + { + "epoch": 0.16, + "learning_rate": 1.6760902489223717e-07, + "loss": 0.2344, + "step": 8391 + }, + { + "epoch": 0.16, + "learning_rate": 1.6760514154790104e-07, + "loss": 0.0046, + "step": 8392 + }, + { + "epoch": 0.16, + "learning_rate": 1.676012582035649e-07, + "loss": 0.0049, + "step": 8393 + }, + { + "epoch": 0.16, + "learning_rate": 1.6759737485922876e-07, + "loss": 0.0047, + "step": 8394 + }, + { + "epoch": 0.16, + "learning_rate": 1.675934915148926e-07, + "loss": 0.1345, + "step": 8395 + }, + { + "epoch": 0.16, + "learning_rate": 1.6758960817055648e-07, + "loss": 0.0248, + "step": 8396 + }, + { + "epoch": 0.16, + "learning_rate": 1.6758572482622032e-07, + "loss": 0.0051, + "step": 8397 + }, + { + "epoch": 0.16, + "learning_rate": 1.675818414818842e-07, + "loss": 0.0041, + "step": 8398 + }, + { + "epoch": 0.16, + "learning_rate": 1.6757795813754804e-07, + "loss": 0.0046, + "step": 8399 + }, + { + "epoch": 0.16, + "learning_rate": 1.675740747932119e-07, + "loss": 0.0143, + "step": 8400 + }, + { + "epoch": 0.16, + "learning_rate": 1.6757019144887576e-07, + "loss": 0.491, + "step": 8401 + }, + { + "epoch": 0.16, + "learning_rate": 1.6756630810453963e-07, + "loss": 0.0051, + "step": 8402 + }, + { + "epoch": 0.16, + "learning_rate": 1.6756242476020347e-07, + "loss": 0.0073, + "step": 8403 + }, + { + "epoch": 0.16, + "learning_rate": 1.6755854141586734e-07, + "loss": 0.1092, + "step": 8404 + }, + { + "epoch": 0.16, + "learning_rate": 1.675546580715312e-07, + "loss": 0.2183, + "step": 8405 + }, + { + "epoch": 0.16, + "learning_rate": 1.6755077472719506e-07, + "loss": 0.0072, + "step": 8406 + }, + { + "epoch": 0.16, + "learning_rate": 1.675468913828589e-07, + "loss": 0.0045, + "step": 8407 + }, + { + "epoch": 0.16, + "learning_rate": 1.6754300803852278e-07, + "loss": 0.0075, + "step": 8408 + }, + { + "epoch": 0.16, + "learning_rate": 1.6753912469418662e-07, + "loss": 0.0034, + "step": 8409 + }, + { + "epoch": 0.16, + "learning_rate": 1.675352413498505e-07, + "loss": 0.052, + "step": 8410 + }, + { + "epoch": 0.16, + "learning_rate": 1.6753135800551434e-07, + "loss": 0.0045, + "step": 8411 + }, + { + "epoch": 0.16, + "learning_rate": 1.675274746611782e-07, + "loss": 0.0051, + "step": 8412 + }, + { + "epoch": 0.16, + "learning_rate": 1.6752359131684205e-07, + "loss": 0.1201, + "step": 8413 + }, + { + "epoch": 0.16, + "learning_rate": 1.6751970797250593e-07, + "loss": 0.5148, + "step": 8414 + }, + { + "epoch": 0.16, + "learning_rate": 1.6751582462816977e-07, + "loss": 0.005, + "step": 8415 + }, + { + "epoch": 0.16, + "learning_rate": 1.6751194128383364e-07, + "loss": 0.0047, + "step": 8416 + }, + { + "epoch": 0.16, + "learning_rate": 1.675080579394975e-07, + "loss": 0.02, + "step": 8417 + }, + { + "epoch": 0.16, + "learning_rate": 1.6750417459516136e-07, + "loss": 0.041, + "step": 8418 + }, + { + "epoch": 0.16, + "learning_rate": 1.675002912508252e-07, + "loss": 0.0422, + "step": 8419 + }, + { + "epoch": 0.16, + "learning_rate": 1.6749640790648908e-07, + "loss": 0.0045, + "step": 8420 + }, + { + "epoch": 0.16, + "learning_rate": 1.6749252456215292e-07, + "loss": 0.0078, + "step": 8421 + }, + { + "epoch": 0.16, + "learning_rate": 1.674886412178168e-07, + "loss": 0.2907, + "step": 8422 + }, + { + "epoch": 0.16, + "learning_rate": 1.6748475787348064e-07, + "loss": 0.0636, + "step": 8423 + }, + { + "epoch": 0.16, + "learning_rate": 1.674808745291445e-07, + "loss": 0.005, + "step": 8424 + }, + { + "epoch": 0.16, + "learning_rate": 1.6747699118480835e-07, + "loss": 0.1672, + "step": 8425 + }, + { + "epoch": 0.16, + "learning_rate": 1.6747310784047222e-07, + "loss": 0.0079, + "step": 8426 + }, + { + "epoch": 0.16, + "learning_rate": 1.6746922449613607e-07, + "loss": 0.0076, + "step": 8427 + }, + { + "epoch": 0.16, + "learning_rate": 1.6746534115179994e-07, + "loss": 0.0062, + "step": 8428 + }, + { + "epoch": 0.16, + "learning_rate": 1.6746145780746379e-07, + "loss": 0.0049, + "step": 8429 + }, + { + "epoch": 0.16, + "learning_rate": 1.6745757446312766e-07, + "loss": 0.0261, + "step": 8430 + }, + { + "epoch": 0.16, + "learning_rate": 1.6745369111879148e-07, + "loss": 0.004, + "step": 8431 + }, + { + "epoch": 0.16, + "learning_rate": 1.6744980777445535e-07, + "loss": 0.0672, + "step": 8432 + }, + { + "epoch": 0.16, + "learning_rate": 1.674459244301192e-07, + "loss": 0.0082, + "step": 8433 + }, + { + "epoch": 0.16, + "learning_rate": 1.6744204108578306e-07, + "loss": 1.1323, + "step": 8434 + }, + { + "epoch": 0.16, + "learning_rate": 1.674381577414469e-07, + "loss": 0.0107, + "step": 8435 + }, + { + "epoch": 0.16, + "learning_rate": 1.6743427439711078e-07, + "loss": 0.0052, + "step": 8436 + }, + { + "epoch": 0.16, + "learning_rate": 1.6743039105277463e-07, + "loss": 0.004, + "step": 8437 + }, + { + "epoch": 0.16, + "learning_rate": 1.674265077084385e-07, + "loss": 0.1706, + "step": 8438 + }, + { + "epoch": 0.16, + "learning_rate": 1.6742262436410234e-07, + "loss": 0.0048, + "step": 8439 + }, + { + "epoch": 0.16, + "learning_rate": 1.6741874101976621e-07, + "loss": 0.0048, + "step": 8440 + }, + { + "epoch": 0.16, + "learning_rate": 1.6741485767543006e-07, + "loss": 0.0215, + "step": 8441 + }, + { + "epoch": 0.16, + "learning_rate": 1.6741097433109393e-07, + "loss": 0.7435, + "step": 8442 + }, + { + "epoch": 0.16, + "learning_rate": 1.6740709098675778e-07, + "loss": 0.0047, + "step": 8443 + }, + { + "epoch": 0.16, + "learning_rate": 1.6740320764242165e-07, + "loss": 0.572, + "step": 8444 + }, + { + "epoch": 0.16, + "learning_rate": 1.673993242980855e-07, + "loss": 0.1864, + "step": 8445 + }, + { + "epoch": 0.16, + "learning_rate": 1.6739544095374936e-07, + "loss": 0.0067, + "step": 8446 + }, + { + "epoch": 0.16, + "learning_rate": 1.673915576094132e-07, + "loss": 0.004, + "step": 8447 + }, + { + "epoch": 0.16, + "learning_rate": 1.6738767426507708e-07, + "loss": 0.0048, + "step": 8448 + }, + { + "epoch": 0.16, + "learning_rate": 1.6738379092074092e-07, + "loss": 0.0158, + "step": 8449 + }, + { + "epoch": 0.16, + "learning_rate": 1.673799075764048e-07, + "loss": 0.0041, + "step": 8450 + }, + { + "epoch": 0.16, + "learning_rate": 1.6737602423206864e-07, + "loss": 0.0077, + "step": 8451 + }, + { + "epoch": 0.16, + "learning_rate": 1.673721408877325e-07, + "loss": 0.0064, + "step": 8452 + }, + { + "epoch": 0.16, + "learning_rate": 1.6736825754339636e-07, + "loss": 0.0298, + "step": 8453 + }, + { + "epoch": 0.16, + "learning_rate": 1.6736437419906023e-07, + "loss": 0.0347, + "step": 8454 + }, + { + "epoch": 0.16, + "learning_rate": 1.6736049085472407e-07, + "loss": 0.0043, + "step": 8455 + }, + { + "epoch": 0.16, + "learning_rate": 1.6735660751038795e-07, + "loss": 0.0043, + "step": 8456 + }, + { + "epoch": 0.16, + "learning_rate": 1.673527241660518e-07, + "loss": 0.0112, + "step": 8457 + }, + { + "epoch": 0.16, + "learning_rate": 1.6734884082171566e-07, + "loss": 0.4932, + "step": 8458 + }, + { + "epoch": 0.16, + "learning_rate": 1.673449574773795e-07, + "loss": 0.0043, + "step": 8459 + }, + { + "epoch": 0.16, + "learning_rate": 1.6734107413304338e-07, + "loss": 0.0231, + "step": 8460 + }, + { + "epoch": 0.16, + "learning_rate": 1.6733719078870722e-07, + "loss": 0.1819, + "step": 8461 + }, + { + "epoch": 0.16, + "learning_rate": 1.673333074443711e-07, + "loss": 0.0052, + "step": 8462 + }, + { + "epoch": 0.16, + "learning_rate": 1.6732942410003494e-07, + "loss": 0.3899, + "step": 8463 + }, + { + "epoch": 0.16, + "learning_rate": 1.673255407556988e-07, + "loss": 0.048, + "step": 8464 + }, + { + "epoch": 0.16, + "learning_rate": 1.6732165741136266e-07, + "loss": 0.0085, + "step": 8465 + }, + { + "epoch": 0.16, + "learning_rate": 1.6731777406702653e-07, + "loss": 0.0045, + "step": 8466 + }, + { + "epoch": 0.16, + "learning_rate": 1.6731389072269037e-07, + "loss": 0.0051, + "step": 8467 + }, + { + "epoch": 0.16, + "learning_rate": 1.6731000737835424e-07, + "loss": 0.0045, + "step": 8468 + }, + { + "epoch": 0.16, + "learning_rate": 1.673061240340181e-07, + "loss": 0.0037, + "step": 8469 + }, + { + "epoch": 0.16, + "learning_rate": 1.6730224068968196e-07, + "loss": 0.2064, + "step": 8470 + }, + { + "epoch": 0.16, + "learning_rate": 1.672983573453458e-07, + "loss": 0.005, + "step": 8471 + }, + { + "epoch": 0.16, + "learning_rate": 1.6729447400100968e-07, + "loss": 0.0097, + "step": 8472 + }, + { + "epoch": 0.16, + "learning_rate": 1.6729059065667352e-07, + "loss": 0.005, + "step": 8473 + }, + { + "epoch": 0.16, + "learning_rate": 1.672867073123374e-07, + "loss": 0.1066, + "step": 8474 + }, + { + "epoch": 0.16, + "learning_rate": 1.6728282396800124e-07, + "loss": 0.0055, + "step": 8475 + }, + { + "epoch": 0.16, + "learning_rate": 1.672789406236651e-07, + "loss": 0.0044, + "step": 8476 + }, + { + "epoch": 0.16, + "learning_rate": 1.6727505727932896e-07, + "loss": 1.0998, + "step": 8477 + }, + { + "epoch": 0.16, + "learning_rate": 1.6727117393499283e-07, + "loss": 0.0042, + "step": 8478 + }, + { + "epoch": 0.16, + "learning_rate": 1.6726729059065667e-07, + "loss": 0.0074, + "step": 8479 + }, + { + "epoch": 0.16, + "learning_rate": 1.6726340724632054e-07, + "loss": 0.0082, + "step": 8480 + }, + { + "epoch": 0.16, + "learning_rate": 1.672595239019844e-07, + "loss": 0.0054, + "step": 8481 + }, + { + "epoch": 0.16, + "learning_rate": 1.6725564055764826e-07, + "loss": 0.0035, + "step": 8482 + }, + { + "epoch": 0.16, + "learning_rate": 1.672517572133121e-07, + "loss": 0.0083, + "step": 8483 + }, + { + "epoch": 0.16, + "learning_rate": 1.6724787386897598e-07, + "loss": 0.0055, + "step": 8484 + }, + { + "epoch": 0.16, + "learning_rate": 1.6724399052463982e-07, + "loss": 0.0048, + "step": 8485 + }, + { + "epoch": 0.16, + "learning_rate": 1.672401071803037e-07, + "loss": 0.0038, + "step": 8486 + }, + { + "epoch": 0.16, + "learning_rate": 1.6723622383596754e-07, + "loss": 0.0068, + "step": 8487 + }, + { + "epoch": 0.16, + "learning_rate": 1.6723234049163138e-07, + "loss": 0.0046, + "step": 8488 + }, + { + "epoch": 0.16, + "learning_rate": 1.6722845714729523e-07, + "loss": 0.3937, + "step": 8489 + }, + { + "epoch": 0.16, + "learning_rate": 1.672245738029591e-07, + "loss": 0.3329, + "step": 8490 + }, + { + "epoch": 0.16, + "learning_rate": 1.6722069045862294e-07, + "loss": 0.0047, + "step": 8491 + }, + { + "epoch": 0.16, + "learning_rate": 1.6721680711428682e-07, + "loss": 0.0141, + "step": 8492 + }, + { + "epoch": 0.16, + "learning_rate": 1.6721292376995066e-07, + "loss": 0.0121, + "step": 8493 + }, + { + "epoch": 0.16, + "learning_rate": 1.6720904042561453e-07, + "loss": 0.0089, + "step": 8494 + }, + { + "epoch": 0.16, + "learning_rate": 1.6720515708127838e-07, + "loss": 0.0154, + "step": 8495 + }, + { + "epoch": 0.16, + "learning_rate": 1.6720127373694225e-07, + "loss": 0.0556, + "step": 8496 + }, + { + "epoch": 0.16, + "learning_rate": 1.671973903926061e-07, + "loss": 0.012, + "step": 8497 + }, + { + "epoch": 0.16, + "learning_rate": 1.6719350704826997e-07, + "loss": 0.0047, + "step": 8498 + }, + { + "epoch": 0.16, + "learning_rate": 1.671896237039338e-07, + "loss": 0.1592, + "step": 8499 + }, + { + "epoch": 0.16, + "learning_rate": 1.6718574035959768e-07, + "loss": 0.0062, + "step": 8500 + }, + { + "epoch": 0.16, + "learning_rate": 1.6718185701526153e-07, + "loss": 0.0042, + "step": 8501 + }, + { + "epoch": 0.16, + "learning_rate": 1.671779736709254e-07, + "loss": 0.0134, + "step": 8502 + }, + { + "epoch": 0.16, + "learning_rate": 1.6717409032658924e-07, + "loss": 0.0056, + "step": 8503 + }, + { + "epoch": 0.16, + "learning_rate": 1.6717020698225312e-07, + "loss": 0.0052, + "step": 8504 + }, + { + "epoch": 0.16, + "learning_rate": 1.6716632363791696e-07, + "loss": 0.0066, + "step": 8505 + }, + { + "epoch": 0.16, + "learning_rate": 1.6716244029358083e-07, + "loss": 0.0062, + "step": 8506 + }, + { + "epoch": 0.17, + "learning_rate": 1.6715855694924468e-07, + "loss": 0.0099, + "step": 8507 + }, + { + "epoch": 0.17, + "learning_rate": 1.6715467360490855e-07, + "loss": 0.0979, + "step": 8508 + }, + { + "epoch": 0.17, + "learning_rate": 1.671507902605724e-07, + "loss": 0.0351, + "step": 8509 + }, + { + "epoch": 0.17, + "learning_rate": 1.6714690691623626e-07, + "loss": 0.073, + "step": 8510 + }, + { + "epoch": 0.17, + "learning_rate": 1.671430235719001e-07, + "loss": 0.5627, + "step": 8511 + }, + { + "epoch": 0.17, + "learning_rate": 1.6713914022756398e-07, + "loss": 0.1394, + "step": 8512 + }, + { + "epoch": 0.17, + "learning_rate": 1.6713525688322783e-07, + "loss": 0.5067, + "step": 8513 + }, + { + "epoch": 0.17, + "learning_rate": 1.671313735388917e-07, + "loss": 0.1353, + "step": 8514 + }, + { + "epoch": 0.17, + "learning_rate": 1.6712749019455554e-07, + "loss": 0.004, + "step": 8515 + }, + { + "epoch": 0.17, + "learning_rate": 1.671236068502194e-07, + "loss": 0.0803, + "step": 8516 + }, + { + "epoch": 0.17, + "learning_rate": 1.6711972350588326e-07, + "loss": 0.0079, + "step": 8517 + }, + { + "epoch": 0.17, + "learning_rate": 1.671158401615471e-07, + "loss": 0.0041, + "step": 8518 + }, + { + "epoch": 0.17, + "learning_rate": 1.6711195681721098e-07, + "loss": 0.0046, + "step": 8519 + }, + { + "epoch": 0.17, + "learning_rate": 1.6710807347287482e-07, + "loss": 0.0072, + "step": 8520 + }, + { + "epoch": 0.17, + "learning_rate": 1.671041901285387e-07, + "loss": 0.0452, + "step": 8521 + }, + { + "epoch": 0.17, + "learning_rate": 1.6710030678420254e-07, + "loss": 0.4615, + "step": 8522 + }, + { + "epoch": 0.17, + "learning_rate": 1.670964234398664e-07, + "loss": 0.0071, + "step": 8523 + }, + { + "epoch": 0.17, + "learning_rate": 1.6709254009553025e-07, + "loss": 0.0092, + "step": 8524 + }, + { + "epoch": 0.17, + "learning_rate": 1.6708865675119413e-07, + "loss": 0.0068, + "step": 8525 + }, + { + "epoch": 0.17, + "learning_rate": 1.6708477340685797e-07, + "loss": 0.0048, + "step": 8526 + }, + { + "epoch": 0.17, + "learning_rate": 1.6708089006252184e-07, + "loss": 0.094, + "step": 8527 + }, + { + "epoch": 0.17, + "learning_rate": 1.6707700671818569e-07, + "loss": 0.1067, + "step": 8528 + }, + { + "epoch": 0.17, + "learning_rate": 1.6707312337384956e-07, + "loss": 0.0063, + "step": 8529 + }, + { + "epoch": 0.17, + "learning_rate": 1.670692400295134e-07, + "loss": 0.0335, + "step": 8530 + }, + { + "epoch": 0.17, + "learning_rate": 1.6706535668517727e-07, + "loss": 0.0044, + "step": 8531 + }, + { + "epoch": 0.17, + "learning_rate": 1.6706147334084112e-07, + "loss": 0.0404, + "step": 8532 + }, + { + "epoch": 0.17, + "learning_rate": 1.67057589996505e-07, + "loss": 0.0147, + "step": 8533 + }, + { + "epoch": 0.17, + "learning_rate": 1.6705370665216884e-07, + "loss": 0.0039, + "step": 8534 + }, + { + "epoch": 0.17, + "learning_rate": 1.670498233078327e-07, + "loss": 0.0079, + "step": 8535 + }, + { + "epoch": 0.17, + "learning_rate": 1.6704593996349655e-07, + "loss": 0.0347, + "step": 8536 + }, + { + "epoch": 0.17, + "learning_rate": 1.6704205661916042e-07, + "loss": 0.0305, + "step": 8537 + }, + { + "epoch": 0.17, + "learning_rate": 1.6703817327482427e-07, + "loss": 0.0073, + "step": 8538 + }, + { + "epoch": 0.17, + "learning_rate": 1.6703428993048814e-07, + "loss": 0.0034, + "step": 8539 + }, + { + "epoch": 0.17, + "learning_rate": 1.6703040658615199e-07, + "loss": 0.1654, + "step": 8540 + }, + { + "epoch": 0.17, + "learning_rate": 1.6702652324181586e-07, + "loss": 0.0071, + "step": 8541 + }, + { + "epoch": 0.17, + "learning_rate": 1.670226398974797e-07, + "loss": 0.0048, + "step": 8542 + }, + { + "epoch": 0.17, + "learning_rate": 1.6701875655314357e-07, + "loss": 0.0082, + "step": 8543 + }, + { + "epoch": 0.17, + "learning_rate": 1.6701487320880742e-07, + "loss": 0.0118, + "step": 8544 + }, + { + "epoch": 0.17, + "learning_rate": 1.670109898644713e-07, + "loss": 0.0417, + "step": 8545 + }, + { + "epoch": 0.17, + "learning_rate": 1.6700710652013513e-07, + "loss": 0.0051, + "step": 8546 + }, + { + "epoch": 0.17, + "learning_rate": 1.6700322317579898e-07, + "loss": 0.0051, + "step": 8547 + }, + { + "epoch": 0.17, + "learning_rate": 1.6699933983146282e-07, + "loss": 0.0041, + "step": 8548 + }, + { + "epoch": 0.17, + "learning_rate": 1.669954564871267e-07, + "loss": 0.0059, + "step": 8549 + }, + { + "epoch": 0.17, + "learning_rate": 1.6699157314279054e-07, + "loss": 0.005, + "step": 8550 + }, + { + "epoch": 0.17, + "learning_rate": 1.669876897984544e-07, + "loss": 0.0047, + "step": 8551 + }, + { + "epoch": 0.17, + "learning_rate": 1.6698380645411826e-07, + "loss": 0.0622, + "step": 8552 + }, + { + "epoch": 0.17, + "learning_rate": 1.6697992310978213e-07, + "loss": 0.1418, + "step": 8553 + }, + { + "epoch": 0.17, + "learning_rate": 1.6697603976544597e-07, + "loss": 0.0054, + "step": 8554 + }, + { + "epoch": 0.17, + "learning_rate": 1.6697215642110985e-07, + "loss": 0.4423, + "step": 8555 + }, + { + "epoch": 0.17, + "learning_rate": 1.669682730767737e-07, + "loss": 0.0946, + "step": 8556 + }, + { + "epoch": 0.17, + "learning_rate": 1.6696438973243756e-07, + "loss": 0.006, + "step": 8557 + }, + { + "epoch": 0.17, + "learning_rate": 1.669605063881014e-07, + "loss": 0.7213, + "step": 8558 + }, + { + "epoch": 0.17, + "learning_rate": 1.6695662304376528e-07, + "loss": 0.1656, + "step": 8559 + }, + { + "epoch": 0.17, + "learning_rate": 1.6695273969942912e-07, + "loss": 1.1189, + "step": 8560 + }, + { + "epoch": 0.17, + "learning_rate": 1.66948856355093e-07, + "loss": 0.005, + "step": 8561 + }, + { + "epoch": 0.17, + "learning_rate": 1.6694497301075684e-07, + "loss": 0.0065, + "step": 8562 + }, + { + "epoch": 0.17, + "learning_rate": 1.669410896664207e-07, + "loss": 0.0111, + "step": 8563 + }, + { + "epoch": 0.17, + "learning_rate": 1.6693720632208456e-07, + "loss": 0.0262, + "step": 8564 + }, + { + "epoch": 0.17, + "learning_rate": 1.6693332297774843e-07, + "loss": 0.014, + "step": 8565 + }, + { + "epoch": 0.17, + "learning_rate": 1.6692943963341227e-07, + "loss": 0.0083, + "step": 8566 + }, + { + "epoch": 0.17, + "learning_rate": 1.6692555628907614e-07, + "loss": 0.0038, + "step": 8567 + }, + { + "epoch": 0.17, + "learning_rate": 1.6692167294474e-07, + "loss": 0.0424, + "step": 8568 + }, + { + "epoch": 0.17, + "learning_rate": 1.6691778960040386e-07, + "loss": 0.004, + "step": 8569 + }, + { + "epoch": 0.17, + "learning_rate": 1.669139062560677e-07, + "loss": 0.3881, + "step": 8570 + }, + { + "epoch": 0.17, + "learning_rate": 1.6691002291173158e-07, + "loss": 0.0059, + "step": 8571 + }, + { + "epoch": 0.17, + "learning_rate": 1.6690613956739542e-07, + "loss": 0.004, + "step": 8572 + }, + { + "epoch": 0.17, + "learning_rate": 1.669022562230593e-07, + "loss": 0.3163, + "step": 8573 + }, + { + "epoch": 0.17, + "learning_rate": 1.6689837287872314e-07, + "loss": 0.0844, + "step": 8574 + }, + { + "epoch": 0.17, + "learning_rate": 1.66894489534387e-07, + "loss": 0.8678, + "step": 8575 + }, + { + "epoch": 0.17, + "learning_rate": 1.6689060619005086e-07, + "loss": 0.0046, + "step": 8576 + }, + { + "epoch": 0.17, + "learning_rate": 1.6688672284571473e-07, + "loss": 0.0065, + "step": 8577 + }, + { + "epoch": 0.17, + "learning_rate": 1.6688283950137857e-07, + "loss": 0.8526, + "step": 8578 + }, + { + "epoch": 0.17, + "learning_rate": 1.6687895615704244e-07, + "loss": 0.0958, + "step": 8579 + }, + { + "epoch": 0.17, + "learning_rate": 1.668750728127063e-07, + "loss": 0.004, + "step": 8580 + }, + { + "epoch": 0.17, + "learning_rate": 1.6687118946837016e-07, + "loss": 0.1499, + "step": 8581 + }, + { + "epoch": 0.17, + "learning_rate": 1.66867306124034e-07, + "loss": 0.0044, + "step": 8582 + }, + { + "epoch": 0.17, + "learning_rate": 1.6686342277969788e-07, + "loss": 0.0046, + "step": 8583 + }, + { + "epoch": 0.17, + "learning_rate": 1.6685953943536172e-07, + "loss": 0.0036, + "step": 8584 + }, + { + "epoch": 0.17, + "learning_rate": 1.668556560910256e-07, + "loss": 0.0066, + "step": 8585 + }, + { + "epoch": 0.17, + "learning_rate": 1.6685177274668944e-07, + "loss": 0.0074, + "step": 8586 + }, + { + "epoch": 0.17, + "learning_rate": 1.668478894023533e-07, + "loss": 0.0047, + "step": 8587 + }, + { + "epoch": 0.17, + "learning_rate": 1.6684400605801715e-07, + "loss": 0.0043, + "step": 8588 + }, + { + "epoch": 0.17, + "learning_rate": 1.6684012271368103e-07, + "loss": 0.0083, + "step": 8589 + }, + { + "epoch": 0.17, + "learning_rate": 1.6683623936934487e-07, + "loss": 0.0053, + "step": 8590 + }, + { + "epoch": 0.17, + "learning_rate": 1.6683235602500874e-07, + "loss": 0.0045, + "step": 8591 + }, + { + "epoch": 0.17, + "learning_rate": 1.668284726806726e-07, + "loss": 0.007, + "step": 8592 + }, + { + "epoch": 0.17, + "learning_rate": 1.6682458933633646e-07, + "loss": 0.0156, + "step": 8593 + }, + { + "epoch": 0.17, + "learning_rate": 1.668207059920003e-07, + "loss": 0.0042, + "step": 8594 + }, + { + "epoch": 0.17, + "learning_rate": 1.6681682264766418e-07, + "loss": 0.0056, + "step": 8595 + }, + { + "epoch": 0.17, + "learning_rate": 1.6681293930332802e-07, + "loss": 0.0116, + "step": 8596 + }, + { + "epoch": 0.17, + "learning_rate": 1.668090559589919e-07, + "loss": 0.0043, + "step": 8597 + }, + { + "epoch": 0.17, + "learning_rate": 1.6680517261465574e-07, + "loss": 0.8545, + "step": 8598 + }, + { + "epoch": 0.17, + "learning_rate": 1.668012892703196e-07, + "loss": 0.0038, + "step": 8599 + }, + { + "epoch": 0.17, + "learning_rate": 1.6679740592598345e-07, + "loss": 0.0042, + "step": 8600 + }, + { + "epoch": 0.17, + "learning_rate": 1.6679352258164733e-07, + "loss": 0.0052, + "step": 8601 + }, + { + "epoch": 0.17, + "learning_rate": 1.6678963923731117e-07, + "loss": 0.007, + "step": 8602 + }, + { + "epoch": 0.17, + "learning_rate": 1.6678575589297504e-07, + "loss": 0.0447, + "step": 8603 + }, + { + "epoch": 0.17, + "learning_rate": 1.6678187254863889e-07, + "loss": 0.9334, + "step": 8604 + }, + { + "epoch": 0.17, + "learning_rate": 1.6677798920430273e-07, + "loss": 0.0064, + "step": 8605 + }, + { + "epoch": 0.17, + "learning_rate": 1.6677410585996658e-07, + "loss": 0.4369, + "step": 8606 + }, + { + "epoch": 0.17, + "learning_rate": 1.6677022251563045e-07, + "loss": 0.554, + "step": 8607 + }, + { + "epoch": 0.17, + "learning_rate": 1.667663391712943e-07, + "loss": 0.3321, + "step": 8608 + }, + { + "epoch": 0.17, + "learning_rate": 1.6676245582695816e-07, + "loss": 0.0054, + "step": 8609 + }, + { + "epoch": 0.17, + "learning_rate": 1.66758572482622e-07, + "loss": 0.0109, + "step": 8610 + }, + { + "epoch": 0.17, + "learning_rate": 1.6675468913828588e-07, + "loss": 0.1194, + "step": 8611 + }, + { + "epoch": 0.17, + "learning_rate": 1.6675080579394973e-07, + "loss": 0.0038, + "step": 8612 + }, + { + "epoch": 0.17, + "learning_rate": 1.667469224496136e-07, + "loss": 0.1782, + "step": 8613 + }, + { + "epoch": 0.17, + "learning_rate": 1.6674303910527744e-07, + "loss": 0.0104, + "step": 8614 + }, + { + "epoch": 0.17, + "learning_rate": 1.6673915576094131e-07, + "loss": 0.0054, + "step": 8615 + }, + { + "epoch": 0.17, + "learning_rate": 1.6673527241660516e-07, + "loss": 0.0042, + "step": 8616 + }, + { + "epoch": 0.17, + "learning_rate": 1.6673138907226903e-07, + "loss": 0.0063, + "step": 8617 + }, + { + "epoch": 0.17, + "learning_rate": 1.6672750572793288e-07, + "loss": 0.1854, + "step": 8618 + }, + { + "epoch": 0.17, + "learning_rate": 1.6672362238359675e-07, + "loss": 0.0063, + "step": 8619 + }, + { + "epoch": 0.17, + "learning_rate": 1.667197390392606e-07, + "loss": 0.0045, + "step": 8620 + }, + { + "epoch": 0.17, + "learning_rate": 1.6671585569492446e-07, + "loss": 0.0305, + "step": 8621 + }, + { + "epoch": 0.17, + "learning_rate": 1.667119723505883e-07, + "loss": 0.0094, + "step": 8622 + }, + { + "epoch": 0.17, + "learning_rate": 1.6670808900625218e-07, + "loss": 0.0054, + "step": 8623 + }, + { + "epoch": 0.17, + "learning_rate": 1.6670420566191603e-07, + "loss": 0.0064, + "step": 8624 + }, + { + "epoch": 0.17, + "learning_rate": 1.667003223175799e-07, + "loss": 0.006, + "step": 8625 + }, + { + "epoch": 0.17, + "learning_rate": 1.6669643897324374e-07, + "loss": 0.0045, + "step": 8626 + }, + { + "epoch": 0.17, + "learning_rate": 1.666925556289076e-07, + "loss": 0.006, + "step": 8627 + }, + { + "epoch": 0.17, + "learning_rate": 1.6668867228457146e-07, + "loss": 0.0053, + "step": 8628 + }, + { + "epoch": 0.17, + "learning_rate": 1.6668478894023533e-07, + "loss": 0.9051, + "step": 8629 + }, + { + "epoch": 0.17, + "learning_rate": 1.6668090559589917e-07, + "loss": 0.0114, + "step": 8630 + }, + { + "epoch": 0.17, + "learning_rate": 1.6667702225156305e-07, + "loss": 0.0048, + "step": 8631 + }, + { + "epoch": 0.17, + "learning_rate": 1.666731389072269e-07, + "loss": 0.0045, + "step": 8632 + }, + { + "epoch": 0.17, + "learning_rate": 1.6666925556289076e-07, + "loss": 0.0105, + "step": 8633 + }, + { + "epoch": 0.17, + "learning_rate": 1.666653722185546e-07, + "loss": 0.7991, + "step": 8634 + }, + { + "epoch": 0.17, + "learning_rate": 1.6666148887421848e-07, + "loss": 0.0284, + "step": 8635 + }, + { + "epoch": 0.17, + "learning_rate": 1.6665760552988232e-07, + "loss": 0.007, + "step": 8636 + }, + { + "epoch": 0.17, + "learning_rate": 1.666537221855462e-07, + "loss": 0.0049, + "step": 8637 + }, + { + "epoch": 0.17, + "learning_rate": 1.6664983884121004e-07, + "loss": 0.0043, + "step": 8638 + }, + { + "epoch": 0.17, + "learning_rate": 1.666459554968739e-07, + "loss": 0.4357, + "step": 8639 + }, + { + "epoch": 0.17, + "learning_rate": 1.6664207215253776e-07, + "loss": 0.0031, + "step": 8640 + }, + { + "epoch": 0.17, + "learning_rate": 1.6663818880820163e-07, + "loss": 0.0102, + "step": 8641 + }, + { + "epoch": 0.17, + "learning_rate": 1.6663430546386547e-07, + "loss": 0.0056, + "step": 8642 + }, + { + "epoch": 0.17, + "learning_rate": 1.6663042211952934e-07, + "loss": 0.0731, + "step": 8643 + }, + { + "epoch": 0.17, + "learning_rate": 1.666265387751932e-07, + "loss": 0.0199, + "step": 8644 + }, + { + "epoch": 0.17, + "learning_rate": 1.6662265543085706e-07, + "loss": 0.0036, + "step": 8645 + }, + { + "epoch": 0.17, + "learning_rate": 1.666187720865209e-07, + "loss": 0.005, + "step": 8646 + }, + { + "epoch": 0.17, + "learning_rate": 1.6661488874218478e-07, + "loss": 0.0036, + "step": 8647 + }, + { + "epoch": 0.17, + "learning_rate": 1.6661100539784862e-07, + "loss": 0.0049, + "step": 8648 + }, + { + "epoch": 0.17, + "learning_rate": 1.666071220535125e-07, + "loss": 0.006, + "step": 8649 + }, + { + "epoch": 0.17, + "learning_rate": 1.6660323870917634e-07, + "loss": 0.0044, + "step": 8650 + }, + { + "epoch": 0.17, + "learning_rate": 1.665993553648402e-07, + "loss": 0.0037, + "step": 8651 + }, + { + "epoch": 0.17, + "learning_rate": 1.6659547202050406e-07, + "loss": 0.0055, + "step": 8652 + }, + { + "epoch": 0.17, + "learning_rate": 1.6659158867616793e-07, + "loss": 0.0039, + "step": 8653 + }, + { + "epoch": 0.17, + "learning_rate": 1.6658770533183177e-07, + "loss": 0.0042, + "step": 8654 + }, + { + "epoch": 0.17, + "learning_rate": 1.6658382198749564e-07, + "loss": 0.2695, + "step": 8655 + }, + { + "epoch": 0.17, + "learning_rate": 1.665799386431595e-07, + "loss": 0.0118, + "step": 8656 + }, + { + "epoch": 0.17, + "learning_rate": 1.6657605529882336e-07, + "loss": 0.0043, + "step": 8657 + }, + { + "epoch": 0.17, + "learning_rate": 1.665721719544872e-07, + "loss": 0.0042, + "step": 8658 + }, + { + "epoch": 0.17, + "learning_rate": 1.6656828861015108e-07, + "loss": 0.0044, + "step": 8659 + }, + { + "epoch": 0.17, + "learning_rate": 1.6656440526581492e-07, + "loss": 0.0046, + "step": 8660 + }, + { + "epoch": 0.17, + "learning_rate": 1.665605219214788e-07, + "loss": 0.0035, + "step": 8661 + }, + { + "epoch": 0.17, + "learning_rate": 1.6655663857714264e-07, + "loss": 0.0044, + "step": 8662 + }, + { + "epoch": 0.17, + "learning_rate": 1.6655275523280648e-07, + "loss": 0.1287, + "step": 8663 + }, + { + "epoch": 0.17, + "learning_rate": 1.6654887188847033e-07, + "loss": 0.0058, + "step": 8664 + }, + { + "epoch": 0.17, + "learning_rate": 1.665449885441342e-07, + "loss": 0.0048, + "step": 8665 + }, + { + "epoch": 0.17, + "learning_rate": 1.6654110519979804e-07, + "loss": 0.7793, + "step": 8666 + }, + { + "epoch": 0.17, + "learning_rate": 1.6653722185546192e-07, + "loss": 0.1371, + "step": 8667 + }, + { + "epoch": 0.17, + "learning_rate": 1.6653333851112576e-07, + "loss": 0.6332, + "step": 8668 + }, + { + "epoch": 0.17, + "learning_rate": 1.6652945516678963e-07, + "loss": 0.0058, + "step": 8669 + }, + { + "epoch": 0.17, + "learning_rate": 1.6652557182245348e-07, + "loss": 0.8261, + "step": 8670 + }, + { + "epoch": 0.17, + "learning_rate": 1.6652168847811735e-07, + "loss": 0.0101, + "step": 8671 + }, + { + "epoch": 0.17, + "learning_rate": 1.665178051337812e-07, + "loss": 0.0041, + "step": 8672 + }, + { + "epoch": 0.17, + "learning_rate": 1.6651392178944507e-07, + "loss": 0.004, + "step": 8673 + }, + { + "epoch": 0.17, + "learning_rate": 1.665100384451089e-07, + "loss": 0.0048, + "step": 8674 + }, + { + "epoch": 0.17, + "learning_rate": 1.6650615510077278e-07, + "loss": 0.0113, + "step": 8675 + }, + { + "epoch": 0.17, + "learning_rate": 1.6650227175643663e-07, + "loss": 0.2011, + "step": 8676 + }, + { + "epoch": 0.17, + "learning_rate": 1.664983884121005e-07, + "loss": 0.0052, + "step": 8677 + }, + { + "epoch": 0.17, + "learning_rate": 1.6649450506776434e-07, + "loss": 0.008, + "step": 8678 + }, + { + "epoch": 0.17, + "learning_rate": 1.6649062172342822e-07, + "loss": 0.0467, + "step": 8679 + }, + { + "epoch": 0.17, + "learning_rate": 1.6648673837909206e-07, + "loss": 0.8676, + "step": 8680 + }, + { + "epoch": 0.17, + "learning_rate": 1.6648285503475593e-07, + "loss": 0.0119, + "step": 8681 + }, + { + "epoch": 0.17, + "learning_rate": 1.6647897169041978e-07, + "loss": 0.0038, + "step": 8682 + }, + { + "epoch": 0.17, + "learning_rate": 1.6647508834608365e-07, + "loss": 0.0054, + "step": 8683 + }, + { + "epoch": 0.17, + "learning_rate": 1.664712050017475e-07, + "loss": 0.0048, + "step": 8684 + }, + { + "epoch": 0.17, + "learning_rate": 1.6646732165741136e-07, + "loss": 0.0059, + "step": 8685 + }, + { + "epoch": 0.17, + "learning_rate": 1.664634383130752e-07, + "loss": 0.0123, + "step": 8686 + }, + { + "epoch": 0.17, + "learning_rate": 1.6645955496873908e-07, + "loss": 0.0264, + "step": 8687 + }, + { + "epoch": 0.17, + "learning_rate": 1.6645567162440293e-07, + "loss": 0.0047, + "step": 8688 + }, + { + "epoch": 0.17, + "learning_rate": 1.664517882800668e-07, + "loss": 0.0044, + "step": 8689 + }, + { + "epoch": 0.17, + "learning_rate": 1.6644790493573064e-07, + "loss": 0.007, + "step": 8690 + }, + { + "epoch": 0.17, + "learning_rate": 1.6644402159139451e-07, + "loss": 0.0081, + "step": 8691 + }, + { + "epoch": 0.17, + "learning_rate": 1.6644013824705836e-07, + "loss": 0.0046, + "step": 8692 + }, + { + "epoch": 0.17, + "learning_rate": 1.664362549027222e-07, + "loss": 0.0046, + "step": 8693 + }, + { + "epoch": 0.17, + "learning_rate": 1.6643237155838608e-07, + "loss": 0.0051, + "step": 8694 + }, + { + "epoch": 0.17, + "learning_rate": 1.6642848821404992e-07, + "loss": 0.0063, + "step": 8695 + }, + { + "epoch": 0.17, + "learning_rate": 1.664246048697138e-07, + "loss": 0.0032, + "step": 8696 + }, + { + "epoch": 0.17, + "learning_rate": 1.6642072152537764e-07, + "loss": 0.0044, + "step": 8697 + }, + { + "epoch": 0.17, + "learning_rate": 1.664168381810415e-07, + "loss": 0.0691, + "step": 8698 + }, + { + "epoch": 0.17, + "learning_rate": 1.6641295483670535e-07, + "loss": 0.0189, + "step": 8699 + }, + { + "epoch": 0.17, + "learning_rate": 1.6640907149236923e-07, + "loss": 0.0048, + "step": 8700 + }, + { + "epoch": 0.17, + "learning_rate": 1.6640518814803307e-07, + "loss": 0.0123, + "step": 8701 + }, + { + "epoch": 0.17, + "learning_rate": 1.6640130480369694e-07, + "loss": 0.004, + "step": 8702 + }, + { + "epoch": 0.17, + "learning_rate": 1.6639742145936079e-07, + "loss": 1.0173, + "step": 8703 + }, + { + "epoch": 0.17, + "learning_rate": 1.6639353811502466e-07, + "loss": 0.0065, + "step": 8704 + }, + { + "epoch": 0.17, + "learning_rate": 1.663896547706885e-07, + "loss": 0.0048, + "step": 8705 + }, + { + "epoch": 0.17, + "learning_rate": 1.6638577142635237e-07, + "loss": 0.0052, + "step": 8706 + }, + { + "epoch": 0.17, + "learning_rate": 1.6638188808201622e-07, + "loss": 0.0041, + "step": 8707 + }, + { + "epoch": 0.17, + "learning_rate": 1.663780047376801e-07, + "loss": 0.3728, + "step": 8708 + }, + { + "epoch": 0.17, + "learning_rate": 1.6637412139334394e-07, + "loss": 0.0053, + "step": 8709 + }, + { + "epoch": 0.17, + "learning_rate": 1.663702380490078e-07, + "loss": 0.0031, + "step": 8710 + }, + { + "epoch": 0.17, + "learning_rate": 1.6636635470467165e-07, + "loss": 0.327, + "step": 8711 + }, + { + "epoch": 0.17, + "learning_rate": 1.6636247136033552e-07, + "loss": 0.0199, + "step": 8712 + }, + { + "epoch": 0.17, + "learning_rate": 1.6635858801599937e-07, + "loss": 0.8646, + "step": 8713 + }, + { + "epoch": 0.17, + "learning_rate": 1.6635470467166324e-07, + "loss": 0.0117, + "step": 8714 + }, + { + "epoch": 0.17, + "learning_rate": 1.6635082132732709e-07, + "loss": 0.6096, + "step": 8715 + }, + { + "epoch": 0.17, + "learning_rate": 1.6634693798299096e-07, + "loss": 0.0981, + "step": 8716 + }, + { + "epoch": 0.17, + "learning_rate": 1.663430546386548e-07, + "loss": 0.0058, + "step": 8717 + }, + { + "epoch": 0.17, + "learning_rate": 1.6633917129431867e-07, + "loss": 0.8821, + "step": 8718 + }, + { + "epoch": 0.17, + "learning_rate": 1.6633528794998252e-07, + "loss": 0.0244, + "step": 8719 + }, + { + "epoch": 0.17, + "learning_rate": 1.663314046056464e-07, + "loss": 0.0218, + "step": 8720 + }, + { + "epoch": 0.17, + "learning_rate": 1.6632752126131024e-07, + "loss": 0.0043, + "step": 8721 + }, + { + "epoch": 0.17, + "learning_rate": 1.6632363791697408e-07, + "loss": 0.0123, + "step": 8722 + }, + { + "epoch": 0.17, + "learning_rate": 1.6631975457263793e-07, + "loss": 0.0298, + "step": 8723 + }, + { + "epoch": 0.17, + "learning_rate": 1.663158712283018e-07, + "loss": 0.0067, + "step": 8724 + }, + { + "epoch": 0.17, + "learning_rate": 1.6631198788396564e-07, + "loss": 0.0036, + "step": 8725 + }, + { + "epoch": 0.17, + "learning_rate": 1.663081045396295e-07, + "loss": 0.039, + "step": 8726 + }, + { + "epoch": 0.17, + "learning_rate": 1.6630422119529336e-07, + "loss": 0.457, + "step": 8727 + }, + { + "epoch": 0.17, + "learning_rate": 1.6630033785095723e-07, + "loss": 0.0108, + "step": 8728 + }, + { + "epoch": 0.17, + "learning_rate": 1.6629645450662107e-07, + "loss": 0.0043, + "step": 8729 + }, + { + "epoch": 0.17, + "learning_rate": 1.6629257116228495e-07, + "loss": 0.0068, + "step": 8730 + }, + { + "epoch": 0.17, + "learning_rate": 1.662886878179488e-07, + "loss": 0.0038, + "step": 8731 + }, + { + "epoch": 0.17, + "learning_rate": 1.6628480447361266e-07, + "loss": 0.0039, + "step": 8732 + }, + { + "epoch": 0.17, + "learning_rate": 1.662809211292765e-07, + "loss": 0.0131, + "step": 8733 + }, + { + "epoch": 0.17, + "learning_rate": 1.6627703778494038e-07, + "loss": 0.0052, + "step": 8734 + }, + { + "epoch": 0.17, + "learning_rate": 1.6627315444060422e-07, + "loss": 0.0065, + "step": 8735 + }, + { + "epoch": 0.17, + "learning_rate": 1.662692710962681e-07, + "loss": 0.0045, + "step": 8736 + }, + { + "epoch": 0.17, + "learning_rate": 1.6626538775193194e-07, + "loss": 0.0504, + "step": 8737 + }, + { + "epoch": 0.17, + "learning_rate": 1.662615044075958e-07, + "loss": 0.0471, + "step": 8738 + }, + { + "epoch": 0.17, + "learning_rate": 1.6625762106325966e-07, + "loss": 0.0052, + "step": 8739 + }, + { + "epoch": 0.17, + "learning_rate": 1.6625373771892353e-07, + "loss": 0.5994, + "step": 8740 + }, + { + "epoch": 0.17, + "learning_rate": 1.6624985437458737e-07, + "loss": 0.0046, + "step": 8741 + }, + { + "epoch": 0.17, + "learning_rate": 1.6624597103025124e-07, + "loss": 0.0033, + "step": 8742 + }, + { + "epoch": 0.17, + "learning_rate": 1.662420876859151e-07, + "loss": 0.0228, + "step": 8743 + }, + { + "epoch": 0.17, + "learning_rate": 1.6623820434157896e-07, + "loss": 0.0043, + "step": 8744 + }, + { + "epoch": 0.17, + "learning_rate": 1.662343209972428e-07, + "loss": 0.004, + "step": 8745 + }, + { + "epoch": 0.17, + "learning_rate": 1.6623043765290668e-07, + "loss": 0.008, + "step": 8746 + }, + { + "epoch": 0.17, + "learning_rate": 1.6622655430857052e-07, + "loss": 0.005, + "step": 8747 + }, + { + "epoch": 0.17, + "learning_rate": 1.662226709642344e-07, + "loss": 0.0108, + "step": 8748 + }, + { + "epoch": 0.17, + "learning_rate": 1.6621878761989824e-07, + "loss": 0.0045, + "step": 8749 + }, + { + "epoch": 0.17, + "learning_rate": 1.662149042755621e-07, + "loss": 0.2306, + "step": 8750 + }, + { + "epoch": 0.17, + "learning_rate": 1.6621102093122596e-07, + "loss": 0.0049, + "step": 8751 + }, + { + "epoch": 0.17, + "learning_rate": 1.6620713758688983e-07, + "loss": 0.0041, + "step": 8752 + }, + { + "epoch": 0.17, + "learning_rate": 1.6620325424255367e-07, + "loss": 0.005, + "step": 8753 + }, + { + "epoch": 0.17, + "learning_rate": 1.6619937089821754e-07, + "loss": 0.007, + "step": 8754 + }, + { + "epoch": 0.17, + "learning_rate": 1.661954875538814e-07, + "loss": 0.0045, + "step": 8755 + }, + { + "epoch": 0.17, + "learning_rate": 1.6619160420954526e-07, + "loss": 0.0066, + "step": 8756 + }, + { + "epoch": 0.17, + "learning_rate": 1.661877208652091e-07, + "loss": 0.0046, + "step": 8757 + }, + { + "epoch": 0.17, + "learning_rate": 1.6618383752087298e-07, + "loss": 0.0038, + "step": 8758 + }, + { + "epoch": 0.17, + "learning_rate": 1.6617995417653682e-07, + "loss": 0.004, + "step": 8759 + }, + { + "epoch": 0.17, + "learning_rate": 1.661760708322007e-07, + "loss": 0.0041, + "step": 8760 + }, + { + "epoch": 0.17, + "learning_rate": 1.6617218748786454e-07, + "loss": 0.0164, + "step": 8761 + }, + { + "epoch": 0.17, + "learning_rate": 1.661683041435284e-07, + "loss": 0.0061, + "step": 8762 + }, + { + "epoch": 0.17, + "learning_rate": 1.6616442079919225e-07, + "loss": 0.0044, + "step": 8763 + }, + { + "epoch": 0.17, + "learning_rate": 1.6616053745485613e-07, + "loss": 0.0057, + "step": 8764 + }, + { + "epoch": 0.17, + "learning_rate": 1.6615665411051997e-07, + "loss": 0.0036, + "step": 8765 + }, + { + "epoch": 0.17, + "learning_rate": 1.6615277076618384e-07, + "loss": 0.004, + "step": 8766 + }, + { + "epoch": 0.17, + "learning_rate": 1.661488874218477e-07, + "loss": 0.314, + "step": 8767 + }, + { + "epoch": 0.17, + "learning_rate": 1.6614500407751156e-07, + "loss": 0.0047, + "step": 8768 + }, + { + "epoch": 0.17, + "learning_rate": 1.661411207331754e-07, + "loss": 0.0035, + "step": 8769 + }, + { + "epoch": 0.17, + "learning_rate": 1.6613723738883928e-07, + "loss": 0.7408, + "step": 8770 + }, + { + "epoch": 0.17, + "learning_rate": 1.6613335404450312e-07, + "loss": 0.4802, + "step": 8771 + }, + { + "epoch": 0.17, + "learning_rate": 1.66129470700167e-07, + "loss": 0.0136, + "step": 8772 + }, + { + "epoch": 0.17, + "learning_rate": 1.6612558735583084e-07, + "loss": 0.0689, + "step": 8773 + }, + { + "epoch": 0.17, + "learning_rate": 1.661217040114947e-07, + "loss": 0.0042, + "step": 8774 + }, + { + "epoch": 0.17, + "learning_rate": 1.6611782066715855e-07, + "loss": 0.16, + "step": 8775 + }, + { + "epoch": 0.17, + "learning_rate": 1.6611393732282243e-07, + "loss": 0.0178, + "step": 8776 + }, + { + "epoch": 0.17, + "learning_rate": 1.6611005397848627e-07, + "loss": 0.0046, + "step": 8777 + }, + { + "epoch": 0.17, + "learning_rate": 1.6610617063415014e-07, + "loss": 0.6484, + "step": 8778 + }, + { + "epoch": 0.17, + "learning_rate": 1.6610228728981396e-07, + "loss": 0.0057, + "step": 8779 + }, + { + "epoch": 0.17, + "learning_rate": 1.6609840394547783e-07, + "loss": 0.4284, + "step": 8780 + }, + { + "epoch": 0.17, + "learning_rate": 1.6609452060114168e-07, + "loss": 0.0057, + "step": 8781 + }, + { + "epoch": 0.17, + "learning_rate": 1.6609063725680555e-07, + "loss": 0.007, + "step": 8782 + }, + { + "epoch": 0.17, + "learning_rate": 1.660867539124694e-07, + "loss": 0.0053, + "step": 8783 + }, + { + "epoch": 0.17, + "learning_rate": 1.6608287056813326e-07, + "loss": 0.9269, + "step": 8784 + }, + { + "epoch": 0.17, + "learning_rate": 1.660789872237971e-07, + "loss": 0.0095, + "step": 8785 + }, + { + "epoch": 0.17, + "learning_rate": 1.6607510387946098e-07, + "loss": 0.0038, + "step": 8786 + }, + { + "epoch": 0.17, + "learning_rate": 1.6607122053512483e-07, + "loss": 0.0048, + "step": 8787 + }, + { + "epoch": 0.17, + "learning_rate": 1.660673371907887e-07, + "loss": 0.0039, + "step": 8788 + }, + { + "epoch": 0.17, + "learning_rate": 1.6606345384645254e-07, + "loss": 0.2481, + "step": 8789 + }, + { + "epoch": 0.17, + "learning_rate": 1.6605957050211641e-07, + "loss": 0.004, + "step": 8790 + }, + { + "epoch": 0.17, + "learning_rate": 1.6605568715778026e-07, + "loss": 0.0057, + "step": 8791 + }, + { + "epoch": 0.17, + "learning_rate": 1.6605180381344413e-07, + "loss": 0.0038, + "step": 8792 + }, + { + "epoch": 0.17, + "learning_rate": 1.6604792046910798e-07, + "loss": 0.6965, + "step": 8793 + }, + { + "epoch": 0.17, + "learning_rate": 1.6604403712477185e-07, + "loss": 0.0628, + "step": 8794 + }, + { + "epoch": 0.17, + "learning_rate": 1.660401537804357e-07, + "loss": 0.0034, + "step": 8795 + }, + { + "epoch": 0.17, + "learning_rate": 1.6603627043609956e-07, + "loss": 0.1295, + "step": 8796 + }, + { + "epoch": 0.17, + "learning_rate": 1.660323870917634e-07, + "loss": 0.0035, + "step": 8797 + }, + { + "epoch": 0.17, + "learning_rate": 1.6602850374742728e-07, + "loss": 0.0038, + "step": 8798 + }, + { + "epoch": 0.17, + "learning_rate": 1.6602462040309113e-07, + "loss": 0.0033, + "step": 8799 + }, + { + "epoch": 0.17, + "learning_rate": 1.66020737058755e-07, + "loss": 0.0336, + "step": 8800 + }, + { + "epoch": 0.17, + "learning_rate": 1.6601685371441884e-07, + "loss": 0.0195, + "step": 8801 + }, + { + "epoch": 0.17, + "learning_rate": 1.660129703700827e-07, + "loss": 0.0084, + "step": 8802 + }, + { + "epoch": 0.17, + "learning_rate": 1.6600908702574656e-07, + "loss": 1.073, + "step": 8803 + }, + { + "epoch": 0.17, + "learning_rate": 1.6600520368141043e-07, + "loss": 0.0078, + "step": 8804 + }, + { + "epoch": 0.17, + "learning_rate": 1.6600132033707427e-07, + "loss": 0.0053, + "step": 8805 + }, + { + "epoch": 0.17, + "learning_rate": 1.6599743699273815e-07, + "loss": 0.0091, + "step": 8806 + }, + { + "epoch": 0.17, + "learning_rate": 1.65993553648402e-07, + "loss": 0.0041, + "step": 8807 + }, + { + "epoch": 0.17, + "learning_rate": 1.6598967030406586e-07, + "loss": 0.3157, + "step": 8808 + }, + { + "epoch": 0.17, + "learning_rate": 1.659857869597297e-07, + "loss": 0.3041, + "step": 8809 + }, + { + "epoch": 0.17, + "learning_rate": 1.6598190361539358e-07, + "loss": 0.004, + "step": 8810 + }, + { + "epoch": 0.17, + "learning_rate": 1.6597802027105742e-07, + "loss": 0.004, + "step": 8811 + }, + { + "epoch": 0.17, + "learning_rate": 1.659741369267213e-07, + "loss": 0.0123, + "step": 8812 + }, + { + "epoch": 0.17, + "learning_rate": 1.6597025358238514e-07, + "loss": 0.0059, + "step": 8813 + }, + { + "epoch": 0.17, + "learning_rate": 1.65966370238049e-07, + "loss": 0.0038, + "step": 8814 + }, + { + "epoch": 0.17, + "learning_rate": 1.6596248689371286e-07, + "loss": 0.0112, + "step": 8815 + }, + { + "epoch": 0.17, + "learning_rate": 1.6595860354937673e-07, + "loss": 0.0044, + "step": 8816 + }, + { + "epoch": 0.17, + "learning_rate": 1.6595472020504057e-07, + "loss": 0.0041, + "step": 8817 + }, + { + "epoch": 0.17, + "learning_rate": 1.6595083686070445e-07, + "loss": 0.0045, + "step": 8818 + }, + { + "epoch": 0.17, + "learning_rate": 1.659469535163683e-07, + "loss": 0.0044, + "step": 8819 + }, + { + "epoch": 0.17, + "learning_rate": 1.6594307017203216e-07, + "loss": 0.0034, + "step": 8820 + }, + { + "epoch": 0.17, + "learning_rate": 1.65939186827696e-07, + "loss": 0.005, + "step": 8821 + }, + { + "epoch": 0.17, + "learning_rate": 1.6593530348335988e-07, + "loss": 0.0064, + "step": 8822 + }, + { + "epoch": 0.17, + "learning_rate": 1.6593142013902372e-07, + "loss": 0.0074, + "step": 8823 + }, + { + "epoch": 0.17, + "learning_rate": 1.659275367946876e-07, + "loss": 0.728, + "step": 8824 + }, + { + "epoch": 0.17, + "learning_rate": 1.6592365345035144e-07, + "loss": 0.5096, + "step": 8825 + }, + { + "epoch": 0.17, + "learning_rate": 1.659197701060153e-07, + "loss": 0.3799, + "step": 8826 + }, + { + "epoch": 0.17, + "learning_rate": 1.6591588676167916e-07, + "loss": 0.0039, + "step": 8827 + }, + { + "epoch": 0.17, + "learning_rate": 1.6591200341734303e-07, + "loss": 0.0188, + "step": 8828 + }, + { + "epoch": 0.17, + "learning_rate": 1.6590812007300687e-07, + "loss": 0.0072, + "step": 8829 + }, + { + "epoch": 0.17, + "learning_rate": 1.6590423672867074e-07, + "loss": 0.0166, + "step": 8830 + }, + { + "epoch": 0.17, + "learning_rate": 1.659003533843346e-07, + "loss": 0.0057, + "step": 8831 + }, + { + "epoch": 0.17, + "learning_rate": 1.6589647003999846e-07, + "loss": 0.3971, + "step": 8832 + }, + { + "epoch": 0.17, + "learning_rate": 1.658925866956623e-07, + "loss": 0.5273, + "step": 8833 + }, + { + "epoch": 0.17, + "learning_rate": 1.6588870335132618e-07, + "loss": 0.0053, + "step": 8834 + }, + { + "epoch": 0.17, + "learning_rate": 1.6588482000699002e-07, + "loss": 1.1674, + "step": 8835 + }, + { + "epoch": 0.17, + "learning_rate": 1.658809366626539e-07, + "loss": 0.0042, + "step": 8836 + }, + { + "epoch": 0.17, + "learning_rate": 1.658770533183177e-07, + "loss": 0.0082, + "step": 8837 + }, + { + "epoch": 0.17, + "learning_rate": 1.6587316997398158e-07, + "loss": 0.0045, + "step": 8838 + }, + { + "epoch": 0.17, + "learning_rate": 1.6586928662964543e-07, + "loss": 0.3361, + "step": 8839 + }, + { + "epoch": 0.17, + "learning_rate": 1.658654032853093e-07, + "loss": 0.0043, + "step": 8840 + }, + { + "epoch": 0.17, + "learning_rate": 1.6586151994097314e-07, + "loss": 0.6021, + "step": 8841 + }, + { + "epoch": 0.17, + "learning_rate": 1.6585763659663702e-07, + "loss": 0.0064, + "step": 8842 + }, + { + "epoch": 0.17, + "learning_rate": 1.6585375325230086e-07, + "loss": 0.0052, + "step": 8843 + }, + { + "epoch": 0.17, + "learning_rate": 1.6584986990796473e-07, + "loss": 0.0178, + "step": 8844 + }, + { + "epoch": 0.17, + "learning_rate": 1.6584598656362858e-07, + "loss": 0.352, + "step": 8845 + }, + { + "epoch": 0.17, + "learning_rate": 1.6584210321929245e-07, + "loss": 0.0039, + "step": 8846 + }, + { + "epoch": 0.17, + "learning_rate": 1.658382198749563e-07, + "loss": 0.0063, + "step": 8847 + }, + { + "epoch": 0.17, + "learning_rate": 1.6583433653062017e-07, + "loss": 0.0079, + "step": 8848 + }, + { + "epoch": 0.17, + "learning_rate": 1.65830453186284e-07, + "loss": 0.0454, + "step": 8849 + }, + { + "epoch": 0.17, + "learning_rate": 1.6582656984194788e-07, + "loss": 0.1841, + "step": 8850 + }, + { + "epoch": 0.17, + "learning_rate": 1.6582268649761173e-07, + "loss": 0.0059, + "step": 8851 + }, + { + "epoch": 0.17, + "learning_rate": 1.658188031532756e-07, + "loss": 0.4081, + "step": 8852 + }, + { + "epoch": 0.17, + "learning_rate": 1.6581491980893944e-07, + "loss": 0.0039, + "step": 8853 + }, + { + "epoch": 0.17, + "learning_rate": 1.6581103646460332e-07, + "loss": 0.0042, + "step": 8854 + }, + { + "epoch": 0.17, + "learning_rate": 1.6580715312026716e-07, + "loss": 0.037, + "step": 8855 + }, + { + "epoch": 0.17, + "learning_rate": 1.6580326977593103e-07, + "loss": 0.0674, + "step": 8856 + }, + { + "epoch": 0.17, + "learning_rate": 1.6579938643159488e-07, + "loss": 0.0078, + "step": 8857 + }, + { + "epoch": 0.17, + "learning_rate": 1.6579550308725875e-07, + "loss": 0.0032, + "step": 8858 + }, + { + "epoch": 0.17, + "learning_rate": 1.657916197429226e-07, + "loss": 0.3412, + "step": 8859 + }, + { + "epoch": 0.17, + "learning_rate": 1.6578773639858646e-07, + "loss": 0.015, + "step": 8860 + }, + { + "epoch": 0.17, + "learning_rate": 1.657838530542503e-07, + "loss": 0.0045, + "step": 8861 + }, + { + "epoch": 0.17, + "learning_rate": 1.6577996970991418e-07, + "loss": 0.004, + "step": 8862 + }, + { + "epoch": 0.17, + "learning_rate": 1.6577608636557803e-07, + "loss": 0.0037, + "step": 8863 + }, + { + "epoch": 0.17, + "learning_rate": 1.657722030212419e-07, + "loss": 0.0046, + "step": 8864 + }, + { + "epoch": 0.17, + "learning_rate": 1.6576831967690574e-07, + "loss": 0.0047, + "step": 8865 + }, + { + "epoch": 0.17, + "learning_rate": 1.6576443633256961e-07, + "loss": 0.0035, + "step": 8866 + }, + { + "epoch": 0.17, + "learning_rate": 1.6576055298823346e-07, + "loss": 0.0042, + "step": 8867 + }, + { + "epoch": 0.17, + "learning_rate": 1.6575666964389733e-07, + "loss": 0.0919, + "step": 8868 + }, + { + "epoch": 0.17, + "learning_rate": 1.6575278629956118e-07, + "loss": 0.0055, + "step": 8869 + }, + { + "epoch": 0.17, + "learning_rate": 1.6574890295522502e-07, + "loss": 0.2242, + "step": 8870 + }, + { + "epoch": 0.17, + "learning_rate": 1.657450196108889e-07, + "loss": 0.0108, + "step": 8871 + }, + { + "epoch": 0.17, + "learning_rate": 1.6574113626655274e-07, + "loss": 0.3549, + "step": 8872 + }, + { + "epoch": 0.17, + "learning_rate": 1.657372529222166e-07, + "loss": 0.0048, + "step": 8873 + }, + { + "epoch": 0.17, + "learning_rate": 1.6573336957788045e-07, + "loss": 0.0036, + "step": 8874 + }, + { + "epoch": 0.17, + "learning_rate": 1.6572948623354433e-07, + "loss": 0.0044, + "step": 8875 + }, + { + "epoch": 0.17, + "learning_rate": 1.6572560288920817e-07, + "loss": 0.0378, + "step": 8876 + }, + { + "epoch": 0.17, + "learning_rate": 1.6572171954487204e-07, + "loss": 0.2665, + "step": 8877 + }, + { + "epoch": 0.17, + "learning_rate": 1.6571783620053589e-07, + "loss": 0.1028, + "step": 8878 + }, + { + "epoch": 0.17, + "learning_rate": 1.6571395285619976e-07, + "loss": 0.0363, + "step": 8879 + }, + { + "epoch": 0.17, + "learning_rate": 1.657100695118636e-07, + "loss": 0.0032, + "step": 8880 + }, + { + "epoch": 0.17, + "learning_rate": 1.6570618616752747e-07, + "loss": 0.1357, + "step": 8881 + }, + { + "epoch": 0.17, + "learning_rate": 1.6570230282319132e-07, + "loss": 0.0037, + "step": 8882 + }, + { + "epoch": 0.17, + "learning_rate": 1.656984194788552e-07, + "loss": 0.3858, + "step": 8883 + }, + { + "epoch": 0.17, + "learning_rate": 1.6569453613451904e-07, + "loss": 0.3792, + "step": 8884 + }, + { + "epoch": 0.17, + "learning_rate": 1.656906527901829e-07, + "loss": 0.0043, + "step": 8885 + }, + { + "epoch": 0.17, + "learning_rate": 1.6568676944584675e-07, + "loss": 0.0211, + "step": 8886 + }, + { + "epoch": 0.17, + "learning_rate": 1.6568288610151062e-07, + "loss": 0.0039, + "step": 8887 + }, + { + "epoch": 0.17, + "learning_rate": 1.6567900275717447e-07, + "loss": 0.006, + "step": 8888 + }, + { + "epoch": 0.17, + "learning_rate": 1.6567511941283834e-07, + "loss": 0.0033, + "step": 8889 + }, + { + "epoch": 0.17, + "learning_rate": 1.6567123606850219e-07, + "loss": 0.0142, + "step": 8890 + }, + { + "epoch": 0.17, + "learning_rate": 1.6566735272416606e-07, + "loss": 1.0317, + "step": 8891 + }, + { + "epoch": 0.17, + "learning_rate": 1.656634693798299e-07, + "loss": 0.0167, + "step": 8892 + }, + { + "epoch": 0.17, + "learning_rate": 1.6565958603549377e-07, + "loss": 0.1639, + "step": 8893 + }, + { + "epoch": 0.17, + "learning_rate": 1.6565570269115762e-07, + "loss": 0.7624, + "step": 8894 + }, + { + "epoch": 0.17, + "learning_rate": 1.6565181934682146e-07, + "loss": 0.0036, + "step": 8895 + }, + { + "epoch": 0.17, + "learning_rate": 1.6564793600248534e-07, + "loss": 0.0059, + "step": 8896 + }, + { + "epoch": 0.17, + "learning_rate": 1.6564405265814918e-07, + "loss": 0.0035, + "step": 8897 + }, + { + "epoch": 0.17, + "learning_rate": 1.6564016931381305e-07, + "loss": 0.0031, + "step": 8898 + }, + { + "epoch": 0.17, + "learning_rate": 1.656362859694769e-07, + "loss": 0.0046, + "step": 8899 + }, + { + "epoch": 0.17, + "learning_rate": 1.6563240262514074e-07, + "loss": 0.0042, + "step": 8900 + }, + { + "epoch": 0.17, + "learning_rate": 1.656285192808046e-07, + "loss": 0.0175, + "step": 8901 + }, + { + "epoch": 0.17, + "learning_rate": 1.6562463593646846e-07, + "loss": 0.0034, + "step": 8902 + }, + { + "epoch": 0.17, + "learning_rate": 1.6562075259213233e-07, + "loss": 1.3125, + "step": 8903 + }, + { + "epoch": 0.17, + "learning_rate": 1.6561686924779617e-07, + "loss": 0.5802, + "step": 8904 + }, + { + "epoch": 0.17, + "learning_rate": 1.6561298590346005e-07, + "loss": 0.2805, + "step": 8905 + }, + { + "epoch": 0.17, + "learning_rate": 1.656091025591239e-07, + "loss": 0.7222, + "step": 8906 + }, + { + "epoch": 0.17, + "learning_rate": 1.6560521921478776e-07, + "loss": 0.0891, + "step": 8907 + }, + { + "epoch": 0.17, + "learning_rate": 1.656013358704516e-07, + "loss": 0.0035, + "step": 8908 + }, + { + "epoch": 0.17, + "learning_rate": 1.6559745252611548e-07, + "loss": 0.6785, + "step": 8909 + }, + { + "epoch": 0.17, + "learning_rate": 1.6559356918177932e-07, + "loss": 0.0042, + "step": 8910 + }, + { + "epoch": 0.17, + "learning_rate": 1.655896858374432e-07, + "loss": 0.8636, + "step": 8911 + }, + { + "epoch": 0.17, + "learning_rate": 1.6558580249310704e-07, + "loss": 0.0038, + "step": 8912 + }, + { + "epoch": 0.17, + "learning_rate": 1.655819191487709e-07, + "loss": 0.0129, + "step": 8913 + }, + { + "epoch": 0.17, + "learning_rate": 1.6557803580443476e-07, + "loss": 0.0267, + "step": 8914 + }, + { + "epoch": 0.17, + "learning_rate": 1.6557415246009863e-07, + "loss": 0.0108, + "step": 8915 + }, + { + "epoch": 0.17, + "learning_rate": 1.6557026911576247e-07, + "loss": 0.012, + "step": 8916 + }, + { + "epoch": 0.17, + "learning_rate": 1.6556638577142635e-07, + "loss": 0.7314, + "step": 8917 + }, + { + "epoch": 0.17, + "learning_rate": 1.655625024270902e-07, + "loss": 0.0044, + "step": 8918 + }, + { + "epoch": 0.17, + "learning_rate": 1.6555861908275406e-07, + "loss": 0.0088, + "step": 8919 + }, + { + "epoch": 0.17, + "learning_rate": 1.655547357384179e-07, + "loss": 0.0034, + "step": 8920 + }, + { + "epoch": 0.17, + "learning_rate": 1.6555085239408178e-07, + "loss": 0.0073, + "step": 8921 + }, + { + "epoch": 0.17, + "learning_rate": 1.6554696904974562e-07, + "loss": 0.0031, + "step": 8922 + }, + { + "epoch": 0.17, + "learning_rate": 1.655430857054095e-07, + "loss": 0.0041, + "step": 8923 + }, + { + "epoch": 0.17, + "learning_rate": 1.6553920236107334e-07, + "loss": 0.3588, + "step": 8924 + }, + { + "epoch": 0.17, + "learning_rate": 1.655353190167372e-07, + "loss": 0.007, + "step": 8925 + }, + { + "epoch": 0.17, + "learning_rate": 1.6553143567240106e-07, + "loss": 0.0048, + "step": 8926 + }, + { + "epoch": 0.17, + "learning_rate": 1.6552755232806493e-07, + "loss": 0.005, + "step": 8927 + }, + { + "epoch": 0.17, + "learning_rate": 1.6552366898372877e-07, + "loss": 0.7149, + "step": 8928 + }, + { + "epoch": 0.17, + "learning_rate": 1.6551978563939264e-07, + "loss": 0.2759, + "step": 8929 + }, + { + "epoch": 0.17, + "learning_rate": 1.655159022950565e-07, + "loss": 0.0034, + "step": 8930 + }, + { + "epoch": 0.17, + "learning_rate": 1.6551201895072036e-07, + "loss": 0.0043, + "step": 8931 + }, + { + "epoch": 0.17, + "learning_rate": 1.655081356063842e-07, + "loss": 0.0044, + "step": 8932 + }, + { + "epoch": 0.17, + "learning_rate": 1.6550425226204808e-07, + "loss": 0.0965, + "step": 8933 + }, + { + "epoch": 0.17, + "learning_rate": 1.6550036891771192e-07, + "loss": 0.0045, + "step": 8934 + }, + { + "epoch": 0.17, + "learning_rate": 1.654964855733758e-07, + "loss": 0.0053, + "step": 8935 + }, + { + "epoch": 0.17, + "learning_rate": 1.6549260222903964e-07, + "loss": 0.0082, + "step": 8936 + }, + { + "epoch": 0.17, + "learning_rate": 1.654887188847035e-07, + "loss": 0.0408, + "step": 8937 + }, + { + "epoch": 0.17, + "learning_rate": 1.6548483554036735e-07, + "loss": 0.7237, + "step": 8938 + }, + { + "epoch": 0.17, + "learning_rate": 1.6548095219603123e-07, + "loss": 0.0059, + "step": 8939 + }, + { + "epoch": 0.17, + "learning_rate": 1.6547706885169507e-07, + "loss": 0.0034, + "step": 8940 + }, + { + "epoch": 0.17, + "learning_rate": 1.6547318550735894e-07, + "loss": 0.0101, + "step": 8941 + }, + { + "epoch": 0.17, + "learning_rate": 1.654693021630228e-07, + "loss": 0.0063, + "step": 8942 + }, + { + "epoch": 0.17, + "learning_rate": 1.6546541881868666e-07, + "loss": 1.2163, + "step": 8943 + }, + { + "epoch": 0.17, + "learning_rate": 1.654615354743505e-07, + "loss": 0.004, + "step": 8944 + }, + { + "epoch": 0.17, + "learning_rate": 1.6545765213001438e-07, + "loss": 0.1986, + "step": 8945 + }, + { + "epoch": 0.17, + "learning_rate": 1.6545376878567822e-07, + "loss": 0.0047, + "step": 8946 + }, + { + "epoch": 0.17, + "learning_rate": 1.654498854413421e-07, + "loss": 0.0118, + "step": 8947 + }, + { + "epoch": 0.17, + "learning_rate": 1.6544600209700594e-07, + "loss": 0.0054, + "step": 8948 + }, + { + "epoch": 0.17, + "learning_rate": 1.654421187526698e-07, + "loss": 0.3778, + "step": 8949 + }, + { + "epoch": 0.17, + "learning_rate": 1.6543823540833365e-07, + "loss": 0.4527, + "step": 8950 + }, + { + "epoch": 0.17, + "learning_rate": 1.6543435206399753e-07, + "loss": 0.0284, + "step": 8951 + }, + { + "epoch": 0.17, + "learning_rate": 1.6543046871966137e-07, + "loss": 0.0053, + "step": 8952 + }, + { + "epoch": 0.17, + "learning_rate": 1.6542658537532522e-07, + "loss": 0.0045, + "step": 8953 + }, + { + "epoch": 0.17, + "learning_rate": 1.6542270203098906e-07, + "loss": 0.0047, + "step": 8954 + }, + { + "epoch": 0.17, + "learning_rate": 1.6541881868665293e-07, + "loss": 0.0157, + "step": 8955 + }, + { + "epoch": 0.17, + "learning_rate": 1.6541493534231678e-07, + "loss": 0.8256, + "step": 8956 + }, + { + "epoch": 0.17, + "learning_rate": 1.6541105199798065e-07, + "loss": 0.8518, + "step": 8957 + }, + { + "epoch": 0.17, + "learning_rate": 1.654071686536445e-07, + "loss": 0.0641, + "step": 8958 + }, + { + "epoch": 0.17, + "learning_rate": 1.6540328530930836e-07, + "loss": 0.0033, + "step": 8959 + }, + { + "epoch": 0.17, + "learning_rate": 1.653994019649722e-07, + "loss": 0.0048, + "step": 8960 + }, + { + "epoch": 0.17, + "learning_rate": 1.6539551862063608e-07, + "loss": 0.0235, + "step": 8961 + }, + { + "epoch": 0.17, + "learning_rate": 1.6539163527629993e-07, + "loss": 0.124, + "step": 8962 + }, + { + "epoch": 0.17, + "learning_rate": 1.653877519319638e-07, + "loss": 0.0034, + "step": 8963 + }, + { + "epoch": 0.17, + "learning_rate": 1.6538386858762764e-07, + "loss": 0.0054, + "step": 8964 + }, + { + "epoch": 0.17, + "learning_rate": 1.6537998524329151e-07, + "loss": 0.0039, + "step": 8965 + }, + { + "epoch": 0.17, + "learning_rate": 1.6537610189895536e-07, + "loss": 0.0042, + "step": 8966 + }, + { + "epoch": 0.17, + "learning_rate": 1.6537221855461923e-07, + "loss": 0.0096, + "step": 8967 + }, + { + "epoch": 0.17, + "learning_rate": 1.6536833521028308e-07, + "loss": 0.0039, + "step": 8968 + }, + { + "epoch": 0.17, + "learning_rate": 1.6536445186594695e-07, + "loss": 0.0051, + "step": 8969 + }, + { + "epoch": 0.17, + "learning_rate": 1.653605685216108e-07, + "loss": 0.0061, + "step": 8970 + }, + { + "epoch": 0.17, + "learning_rate": 1.6535668517727466e-07, + "loss": 0.0089, + "step": 8971 + }, + { + "epoch": 0.17, + "learning_rate": 1.653528018329385e-07, + "loss": 0.5515, + "step": 8972 + }, + { + "epoch": 0.17, + "learning_rate": 1.6534891848860238e-07, + "loss": 0.0032, + "step": 8973 + }, + { + "epoch": 0.17, + "learning_rate": 1.6534503514426623e-07, + "loss": 0.0066, + "step": 8974 + }, + { + "epoch": 0.17, + "learning_rate": 1.653411517999301e-07, + "loss": 0.0039, + "step": 8975 + }, + { + "epoch": 0.17, + "learning_rate": 1.6533726845559394e-07, + "loss": 0.0039, + "step": 8976 + }, + { + "epoch": 0.17, + "learning_rate": 1.653333851112578e-07, + "loss": 0.6616, + "step": 8977 + }, + { + "epoch": 0.17, + "learning_rate": 1.6532950176692166e-07, + "loss": 0.0034, + "step": 8978 + }, + { + "epoch": 0.17, + "learning_rate": 1.6532561842258553e-07, + "loss": 0.0064, + "step": 8979 + }, + { + "epoch": 0.17, + "learning_rate": 1.6532173507824937e-07, + "loss": 0.0042, + "step": 8980 + }, + { + "epoch": 0.17, + "learning_rate": 1.6531785173391325e-07, + "loss": 0.0928, + "step": 8981 + }, + { + "epoch": 0.17, + "learning_rate": 1.653139683895771e-07, + "loss": 0.0088, + "step": 8982 + }, + { + "epoch": 0.17, + "learning_rate": 1.6531008504524096e-07, + "loss": 0.0038, + "step": 8983 + }, + { + "epoch": 0.17, + "learning_rate": 1.653062017009048e-07, + "loss": 0.0231, + "step": 8984 + }, + { + "epoch": 0.17, + "learning_rate": 1.6530231835656868e-07, + "loss": 0.0035, + "step": 8985 + }, + { + "epoch": 0.17, + "learning_rate": 1.6529843501223252e-07, + "loss": 0.0787, + "step": 8986 + }, + { + "epoch": 0.17, + "learning_rate": 1.652945516678964e-07, + "loss": 0.012, + "step": 8987 + }, + { + "epoch": 0.17, + "learning_rate": 1.6529066832356024e-07, + "loss": 0.0044, + "step": 8988 + }, + { + "epoch": 0.17, + "learning_rate": 1.652867849792241e-07, + "loss": 0.0074, + "step": 8989 + }, + { + "epoch": 0.17, + "learning_rate": 1.6528290163488796e-07, + "loss": 0.0103, + "step": 8990 + }, + { + "epoch": 0.17, + "learning_rate": 1.6527901829055183e-07, + "loss": 0.0051, + "step": 8991 + }, + { + "epoch": 0.17, + "learning_rate": 1.6527513494621567e-07, + "loss": 0.0036, + "step": 8992 + }, + { + "epoch": 0.17, + "learning_rate": 1.6527125160187955e-07, + "loss": 0.004, + "step": 8993 + }, + { + "epoch": 0.17, + "learning_rate": 1.652673682575434e-07, + "loss": 0.0077, + "step": 8994 + }, + { + "epoch": 0.17, + "learning_rate": 1.6526348491320726e-07, + "loss": 0.0118, + "step": 8995 + }, + { + "epoch": 0.17, + "learning_rate": 1.652596015688711e-07, + "loss": 0.0036, + "step": 8996 + }, + { + "epoch": 0.17, + "learning_rate": 1.6525571822453498e-07, + "loss": 0.0031, + "step": 8997 + }, + { + "epoch": 0.17, + "learning_rate": 1.6525183488019882e-07, + "loss": 0.0051, + "step": 8998 + }, + { + "epoch": 0.17, + "learning_rate": 1.652479515358627e-07, + "loss": 0.032, + "step": 8999 + }, + { + "epoch": 0.17, + "learning_rate": 1.6524406819152654e-07, + "loss": 0.0075, + "step": 9000 + }, + { + "epoch": 0.17, + "learning_rate": 1.652401848471904e-07, + "loss": 0.0041, + "step": 9001 + }, + { + "epoch": 0.17, + "learning_rate": 1.6523630150285426e-07, + "loss": 0.3486, + "step": 9002 + }, + { + "epoch": 0.17, + "learning_rate": 1.6523241815851813e-07, + "loss": 0.0055, + "step": 9003 + }, + { + "epoch": 0.17, + "learning_rate": 1.6522853481418197e-07, + "loss": 0.0036, + "step": 9004 + }, + { + "epoch": 0.17, + "learning_rate": 1.6522465146984584e-07, + "loss": 0.0069, + "step": 9005 + }, + { + "epoch": 0.17, + "learning_rate": 1.652207681255097e-07, + "loss": 0.0232, + "step": 9006 + }, + { + "epoch": 0.17, + "learning_rate": 1.6521688478117356e-07, + "loss": 0.0042, + "step": 9007 + }, + { + "epoch": 0.17, + "learning_rate": 1.652130014368374e-07, + "loss": 0.0069, + "step": 9008 + }, + { + "epoch": 0.17, + "learning_rate": 1.6520911809250128e-07, + "loss": 0.0589, + "step": 9009 + }, + { + "epoch": 0.17, + "learning_rate": 1.6520523474816512e-07, + "loss": 0.0041, + "step": 9010 + }, + { + "epoch": 0.17, + "learning_rate": 1.6520135140382897e-07, + "loss": 0.0045, + "step": 9011 + }, + { + "epoch": 0.17, + "learning_rate": 1.651974680594928e-07, + "loss": 0.0045, + "step": 9012 + }, + { + "epoch": 0.17, + "learning_rate": 1.6519358471515668e-07, + "loss": 0.9258, + "step": 9013 + }, + { + "epoch": 0.17, + "learning_rate": 1.6518970137082053e-07, + "loss": 0.0033, + "step": 9014 + }, + { + "epoch": 0.17, + "learning_rate": 1.651858180264844e-07, + "loss": 0.7822, + "step": 9015 + }, + { + "epoch": 0.17, + "learning_rate": 1.6518193468214825e-07, + "loss": 0.0082, + "step": 9016 + }, + { + "epoch": 0.17, + "learning_rate": 1.6517805133781212e-07, + "loss": 0.3555, + "step": 9017 + }, + { + "epoch": 0.17, + "learning_rate": 1.6517416799347596e-07, + "loss": 0.0394, + "step": 9018 + }, + { + "epoch": 0.17, + "learning_rate": 1.6517028464913983e-07, + "loss": 0.0215, + "step": 9019 + }, + { + "epoch": 0.17, + "learning_rate": 1.6516640130480368e-07, + "loss": 0.0034, + "step": 9020 + }, + { + "epoch": 0.17, + "learning_rate": 1.6516251796046755e-07, + "loss": 0.5659, + "step": 9021 + }, + { + "epoch": 0.18, + "learning_rate": 1.651586346161314e-07, + "loss": 0.8136, + "step": 9022 + }, + { + "epoch": 0.18, + "learning_rate": 1.6515475127179527e-07, + "loss": 0.0031, + "step": 9023 + }, + { + "epoch": 0.18, + "learning_rate": 1.651508679274591e-07, + "loss": 0.0109, + "step": 9024 + }, + { + "epoch": 0.18, + "learning_rate": 1.6514698458312298e-07, + "loss": 0.6374, + "step": 9025 + }, + { + "epoch": 0.18, + "learning_rate": 1.6514310123878683e-07, + "loss": 0.0432, + "step": 9026 + }, + { + "epoch": 0.18, + "learning_rate": 1.651392178944507e-07, + "loss": 0.0417, + "step": 9027 + }, + { + "epoch": 0.18, + "learning_rate": 1.6513533455011454e-07, + "loss": 0.2875, + "step": 9028 + }, + { + "epoch": 0.18, + "learning_rate": 1.6513145120577842e-07, + "loss": 0.7064, + "step": 9029 + }, + { + "epoch": 0.18, + "learning_rate": 1.6512756786144226e-07, + "loss": 0.0037, + "step": 9030 + }, + { + "epoch": 0.18, + "learning_rate": 1.6512368451710613e-07, + "loss": 0.0047, + "step": 9031 + }, + { + "epoch": 0.18, + "learning_rate": 1.6511980117276998e-07, + "loss": 0.0903, + "step": 9032 + }, + { + "epoch": 0.18, + "learning_rate": 1.6511591782843385e-07, + "loss": 0.0064, + "step": 9033 + }, + { + "epoch": 0.18, + "learning_rate": 1.651120344840977e-07, + "loss": 0.0416, + "step": 9034 + }, + { + "epoch": 0.18, + "learning_rate": 1.6510815113976156e-07, + "loss": 0.4469, + "step": 9035 + }, + { + "epoch": 0.18, + "learning_rate": 1.651042677954254e-07, + "loss": 0.0134, + "step": 9036 + }, + { + "epoch": 0.18, + "learning_rate": 1.6510038445108928e-07, + "loss": 0.0267, + "step": 9037 + }, + { + "epoch": 0.18, + "learning_rate": 1.6509650110675313e-07, + "loss": 0.0037, + "step": 9038 + }, + { + "epoch": 0.18, + "learning_rate": 1.65092617762417e-07, + "loss": 0.0039, + "step": 9039 + }, + { + "epoch": 0.18, + "learning_rate": 1.6508873441808084e-07, + "loss": 0.0148, + "step": 9040 + }, + { + "epoch": 0.18, + "learning_rate": 1.6508485107374471e-07, + "loss": 0.0423, + "step": 9041 + }, + { + "epoch": 0.18, + "learning_rate": 1.6508096772940856e-07, + "loss": 0.2356, + "step": 9042 + }, + { + "epoch": 0.18, + "learning_rate": 1.6507708438507243e-07, + "loss": 0.0036, + "step": 9043 + }, + { + "epoch": 0.18, + "learning_rate": 1.6507320104073628e-07, + "loss": 0.0046, + "step": 9044 + }, + { + "epoch": 0.18, + "learning_rate": 1.6506931769640015e-07, + "loss": 0.003, + "step": 9045 + }, + { + "epoch": 0.18, + "learning_rate": 1.65065434352064e-07, + "loss": 0.0041, + "step": 9046 + }, + { + "epoch": 0.18, + "learning_rate": 1.6506155100772784e-07, + "loss": 0.0056, + "step": 9047 + }, + { + "epoch": 0.18, + "learning_rate": 1.650576676633917e-07, + "loss": 0.0067, + "step": 9048 + }, + { + "epoch": 0.18, + "learning_rate": 1.6505378431905555e-07, + "loss": 1.0129, + "step": 9049 + }, + { + "epoch": 0.18, + "learning_rate": 1.6504990097471943e-07, + "loss": 0.0034, + "step": 9050 + }, + { + "epoch": 0.18, + "learning_rate": 1.6504601763038327e-07, + "loss": 0.0074, + "step": 9051 + }, + { + "epoch": 0.18, + "learning_rate": 1.6504213428604714e-07, + "loss": 0.004, + "step": 9052 + }, + { + "epoch": 0.18, + "learning_rate": 1.65038250941711e-07, + "loss": 1.4958, + "step": 9053 + }, + { + "epoch": 0.18, + "learning_rate": 1.6503436759737486e-07, + "loss": 0.0036, + "step": 9054 + }, + { + "epoch": 0.18, + "learning_rate": 1.650304842530387e-07, + "loss": 0.3314, + "step": 9055 + }, + { + "epoch": 0.18, + "learning_rate": 1.6502660090870257e-07, + "loss": 0.1368, + "step": 9056 + }, + { + "epoch": 0.18, + "learning_rate": 1.6502271756436642e-07, + "loss": 0.2051, + "step": 9057 + }, + { + "epoch": 0.18, + "learning_rate": 1.650188342200303e-07, + "loss": 0.4314, + "step": 9058 + }, + { + "epoch": 0.18, + "learning_rate": 1.6501495087569414e-07, + "loss": 0.004, + "step": 9059 + }, + { + "epoch": 0.18, + "learning_rate": 1.65011067531358e-07, + "loss": 0.0697, + "step": 9060 + }, + { + "epoch": 0.18, + "learning_rate": 1.6500718418702185e-07, + "loss": 0.0037, + "step": 9061 + }, + { + "epoch": 0.18, + "learning_rate": 1.6500330084268572e-07, + "loss": 0.0041, + "step": 9062 + }, + { + "epoch": 0.18, + "learning_rate": 1.6499941749834957e-07, + "loss": 0.0674, + "step": 9063 + }, + { + "epoch": 0.18, + "learning_rate": 1.6499553415401344e-07, + "loss": 0.0092, + "step": 9064 + }, + { + "epoch": 0.18, + "learning_rate": 1.6499165080967729e-07, + "loss": 0.0041, + "step": 9065 + }, + { + "epoch": 0.18, + "learning_rate": 1.6498776746534116e-07, + "loss": 0.0037, + "step": 9066 + }, + { + "epoch": 0.18, + "learning_rate": 1.64983884121005e-07, + "loss": 0.0032, + "step": 9067 + }, + { + "epoch": 0.18, + "learning_rate": 1.6498000077666887e-07, + "loss": 0.0158, + "step": 9068 + }, + { + "epoch": 0.18, + "learning_rate": 1.6497611743233272e-07, + "loss": 0.292, + "step": 9069 + }, + { + "epoch": 0.18, + "learning_rate": 1.6497223408799656e-07, + "loss": 0.0044, + "step": 9070 + }, + { + "epoch": 0.18, + "learning_rate": 1.6496835074366044e-07, + "loss": 0.8096, + "step": 9071 + }, + { + "epoch": 0.18, + "learning_rate": 1.6496446739932428e-07, + "loss": 0.5931, + "step": 9072 + }, + { + "epoch": 0.18, + "learning_rate": 1.6496058405498815e-07, + "loss": 0.0044, + "step": 9073 + }, + { + "epoch": 0.18, + "learning_rate": 1.64956700710652e-07, + "loss": 0.0076, + "step": 9074 + }, + { + "epoch": 0.18, + "learning_rate": 1.6495281736631587e-07, + "loss": 0.0039, + "step": 9075 + }, + { + "epoch": 0.18, + "learning_rate": 1.649489340219797e-07, + "loss": 0.0031, + "step": 9076 + }, + { + "epoch": 0.18, + "learning_rate": 1.6494505067764356e-07, + "loss": 0.0073, + "step": 9077 + }, + { + "epoch": 0.18, + "learning_rate": 1.6494116733330743e-07, + "loss": 0.1823, + "step": 9078 + }, + { + "epoch": 0.18, + "learning_rate": 1.6493728398897127e-07, + "loss": 0.0042, + "step": 9079 + }, + { + "epoch": 0.18, + "learning_rate": 1.6493340064463515e-07, + "loss": 0.0068, + "step": 9080 + }, + { + "epoch": 0.18, + "learning_rate": 1.64929517300299e-07, + "loss": 0.0336, + "step": 9081 + }, + { + "epoch": 0.18, + "learning_rate": 1.6492563395596286e-07, + "loss": 0.0046, + "step": 9082 + }, + { + "epoch": 0.18, + "learning_rate": 1.649217506116267e-07, + "loss": 0.0056, + "step": 9083 + }, + { + "epoch": 0.18, + "learning_rate": 1.6491786726729058e-07, + "loss": 0.0045, + "step": 9084 + }, + { + "epoch": 0.18, + "learning_rate": 1.6491398392295442e-07, + "loss": 0.1296, + "step": 9085 + }, + { + "epoch": 0.18, + "learning_rate": 1.649101005786183e-07, + "loss": 0.0048, + "step": 9086 + }, + { + "epoch": 0.18, + "learning_rate": 1.6490621723428214e-07, + "loss": 0.0032, + "step": 9087 + }, + { + "epoch": 0.18, + "learning_rate": 1.64902333889946e-07, + "loss": 0.0033, + "step": 9088 + }, + { + "epoch": 0.18, + "learning_rate": 1.6489845054560986e-07, + "loss": 0.0036, + "step": 9089 + }, + { + "epoch": 0.18, + "learning_rate": 1.6489456720127373e-07, + "loss": 0.4022, + "step": 9090 + }, + { + "epoch": 0.18, + "learning_rate": 1.6489068385693757e-07, + "loss": 0.0038, + "step": 9091 + }, + { + "epoch": 0.18, + "learning_rate": 1.6488680051260145e-07, + "loss": 0.0798, + "step": 9092 + }, + { + "epoch": 0.18, + "learning_rate": 1.648829171682653e-07, + "loss": 0.0054, + "step": 9093 + }, + { + "epoch": 0.18, + "learning_rate": 1.6487903382392916e-07, + "loss": 0.0065, + "step": 9094 + }, + { + "epoch": 0.18, + "learning_rate": 1.64875150479593e-07, + "loss": 0.0042, + "step": 9095 + }, + { + "epoch": 0.18, + "learning_rate": 1.6487126713525688e-07, + "loss": 0.189, + "step": 9096 + }, + { + "epoch": 0.18, + "learning_rate": 1.6486738379092072e-07, + "loss": 0.0034, + "step": 9097 + }, + { + "epoch": 0.18, + "learning_rate": 1.648635004465846e-07, + "loss": 0.1857, + "step": 9098 + }, + { + "epoch": 0.18, + "learning_rate": 1.6485961710224844e-07, + "loss": 0.0054, + "step": 9099 + }, + { + "epoch": 0.18, + "learning_rate": 1.648557337579123e-07, + "loss": 0.0108, + "step": 9100 + }, + { + "epoch": 0.18, + "learning_rate": 1.6485185041357616e-07, + "loss": 0.0042, + "step": 9101 + }, + { + "epoch": 0.18, + "learning_rate": 1.6484796706924003e-07, + "loss": 0.0118, + "step": 9102 + }, + { + "epoch": 0.18, + "learning_rate": 1.6484408372490387e-07, + "loss": 0.282, + "step": 9103 + }, + { + "epoch": 0.18, + "learning_rate": 1.6484020038056774e-07, + "loss": 0.1325, + "step": 9104 + }, + { + "epoch": 0.18, + "learning_rate": 1.648363170362316e-07, + "loss": 0.007, + "step": 9105 + }, + { + "epoch": 0.18, + "learning_rate": 1.6483243369189546e-07, + "loss": 0.0047, + "step": 9106 + }, + { + "epoch": 0.18, + "learning_rate": 1.648285503475593e-07, + "loss": 0.0027, + "step": 9107 + }, + { + "epoch": 0.18, + "learning_rate": 1.6482466700322318e-07, + "loss": 0.0034, + "step": 9108 + }, + { + "epoch": 0.18, + "learning_rate": 1.6482078365888702e-07, + "loss": 0.0057, + "step": 9109 + }, + { + "epoch": 0.18, + "learning_rate": 1.648169003145509e-07, + "loss": 0.4383, + "step": 9110 + }, + { + "epoch": 0.18, + "learning_rate": 1.6481301697021474e-07, + "loss": 0.0207, + "step": 9111 + }, + { + "epoch": 0.18, + "learning_rate": 1.648091336258786e-07, + "loss": 1.3228, + "step": 9112 + }, + { + "epoch": 0.18, + "learning_rate": 1.6480525028154246e-07, + "loss": 0.0034, + "step": 9113 + }, + { + "epoch": 0.18, + "learning_rate": 1.6480136693720633e-07, + "loss": 0.0036, + "step": 9114 + }, + { + "epoch": 0.18, + "learning_rate": 1.6479748359287017e-07, + "loss": 0.152, + "step": 9115 + }, + { + "epoch": 0.18, + "learning_rate": 1.6479360024853404e-07, + "loss": 0.0046, + "step": 9116 + }, + { + "epoch": 0.18, + "learning_rate": 1.647897169041979e-07, + "loss": 0.012, + "step": 9117 + }, + { + "epoch": 0.18, + "learning_rate": 1.6478583355986176e-07, + "loss": 0.0032, + "step": 9118 + }, + { + "epoch": 0.18, + "learning_rate": 1.647819502155256e-07, + "loss": 0.0039, + "step": 9119 + }, + { + "epoch": 0.18, + "learning_rate": 1.6477806687118948e-07, + "loss": 0.0066, + "step": 9120 + }, + { + "epoch": 0.18, + "learning_rate": 1.6477418352685332e-07, + "loss": 0.0046, + "step": 9121 + }, + { + "epoch": 0.18, + "learning_rate": 1.647703001825172e-07, + "loss": 0.0089, + "step": 9122 + }, + { + "epoch": 0.18, + "learning_rate": 1.6476641683818104e-07, + "loss": 0.0035, + "step": 9123 + }, + { + "epoch": 0.18, + "learning_rate": 1.647625334938449e-07, + "loss": 0.0161, + "step": 9124 + }, + { + "epoch": 0.18, + "learning_rate": 1.6475865014950875e-07, + "loss": 0.0038, + "step": 9125 + }, + { + "epoch": 0.18, + "learning_rate": 1.6475476680517263e-07, + "loss": 0.4865, + "step": 9126 + }, + { + "epoch": 0.18, + "learning_rate": 1.6475088346083644e-07, + "loss": 0.0032, + "step": 9127 + }, + { + "epoch": 0.18, + "learning_rate": 1.6474700011650032e-07, + "loss": 0.0073, + "step": 9128 + }, + { + "epoch": 0.18, + "learning_rate": 1.6474311677216416e-07, + "loss": 0.3285, + "step": 9129 + }, + { + "epoch": 0.18, + "learning_rate": 1.6473923342782803e-07, + "loss": 0.0042, + "step": 9130 + }, + { + "epoch": 0.18, + "learning_rate": 1.6473535008349188e-07, + "loss": 0.0214, + "step": 9131 + }, + { + "epoch": 0.18, + "learning_rate": 1.6473146673915575e-07, + "loss": 0.0031, + "step": 9132 + }, + { + "epoch": 0.18, + "learning_rate": 1.647275833948196e-07, + "loss": 0.0038, + "step": 9133 + }, + { + "epoch": 0.18, + "learning_rate": 1.6472370005048346e-07, + "loss": 0.0416, + "step": 9134 + }, + { + "epoch": 0.18, + "learning_rate": 1.647198167061473e-07, + "loss": 0.0031, + "step": 9135 + }, + { + "epoch": 0.18, + "learning_rate": 1.6471593336181118e-07, + "loss": 0.0047, + "step": 9136 + }, + { + "epoch": 0.18, + "learning_rate": 1.6471205001747503e-07, + "loss": 0.3943, + "step": 9137 + }, + { + "epoch": 0.18, + "learning_rate": 1.647081666731389e-07, + "loss": 0.0035, + "step": 9138 + }, + { + "epoch": 0.18, + "learning_rate": 1.6470428332880274e-07, + "loss": 0.0036, + "step": 9139 + }, + { + "epoch": 0.18, + "learning_rate": 1.6470039998446661e-07, + "loss": 0.0052, + "step": 9140 + }, + { + "epoch": 0.18, + "learning_rate": 1.6469651664013046e-07, + "loss": 0.8627, + "step": 9141 + }, + { + "epoch": 0.18, + "learning_rate": 1.6469263329579433e-07, + "loss": 0.0036, + "step": 9142 + }, + { + "epoch": 0.18, + "learning_rate": 1.6468874995145818e-07, + "loss": 0.0111, + "step": 9143 + }, + { + "epoch": 0.18, + "learning_rate": 1.6468486660712205e-07, + "loss": 0.0071, + "step": 9144 + }, + { + "epoch": 0.18, + "learning_rate": 1.646809832627859e-07, + "loss": 0.0159, + "step": 9145 + }, + { + "epoch": 0.18, + "learning_rate": 1.6467709991844976e-07, + "loss": 0.0032, + "step": 9146 + }, + { + "epoch": 0.18, + "learning_rate": 1.646732165741136e-07, + "loss": 0.9481, + "step": 9147 + }, + { + "epoch": 0.18, + "learning_rate": 1.6466933322977748e-07, + "loss": 0.0054, + "step": 9148 + }, + { + "epoch": 0.18, + "learning_rate": 1.6466544988544133e-07, + "loss": 0.0048, + "step": 9149 + }, + { + "epoch": 0.18, + "learning_rate": 1.646615665411052e-07, + "loss": 0.0039, + "step": 9150 + }, + { + "epoch": 0.18, + "learning_rate": 1.6465768319676904e-07, + "loss": 0.0968, + "step": 9151 + }, + { + "epoch": 0.18, + "learning_rate": 1.6465379985243291e-07, + "loss": 0.0032, + "step": 9152 + }, + { + "epoch": 0.18, + "learning_rate": 1.6464991650809676e-07, + "loss": 0.0033, + "step": 9153 + }, + { + "epoch": 0.18, + "learning_rate": 1.6464603316376063e-07, + "loss": 0.0032, + "step": 9154 + }, + { + "epoch": 0.18, + "learning_rate": 1.6464214981942447e-07, + "loss": 0.0058, + "step": 9155 + }, + { + "epoch": 0.18, + "learning_rate": 1.6463826647508835e-07, + "loss": 0.0034, + "step": 9156 + }, + { + "epoch": 0.18, + "learning_rate": 1.646343831307522e-07, + "loss": 0.2597, + "step": 9157 + }, + { + "epoch": 0.18, + "learning_rate": 1.6463049978641606e-07, + "loss": 0.0116, + "step": 9158 + }, + { + "epoch": 0.18, + "learning_rate": 1.646266164420799e-07, + "loss": 0.0028, + "step": 9159 + }, + { + "epoch": 0.18, + "learning_rate": 1.6462273309774378e-07, + "loss": 0.0034, + "step": 9160 + }, + { + "epoch": 0.18, + "learning_rate": 1.6461884975340762e-07, + "loss": 0.0079, + "step": 9161 + }, + { + "epoch": 0.18, + "learning_rate": 1.646149664090715e-07, + "loss": 0.3955, + "step": 9162 + }, + { + "epoch": 0.18, + "learning_rate": 1.6461108306473534e-07, + "loss": 0.0029, + "step": 9163 + }, + { + "epoch": 0.18, + "learning_rate": 1.646071997203992e-07, + "loss": 0.005, + "step": 9164 + }, + { + "epoch": 0.18, + "learning_rate": 1.6460331637606306e-07, + "loss": 0.5702, + "step": 9165 + }, + { + "epoch": 0.18, + "learning_rate": 1.6459943303172693e-07, + "loss": 0.0269, + "step": 9166 + }, + { + "epoch": 0.18, + "learning_rate": 1.6459554968739077e-07, + "loss": 0.0036, + "step": 9167 + }, + { + "epoch": 0.18, + "learning_rate": 1.6459166634305465e-07, + "loss": 0.6221, + "step": 9168 + }, + { + "epoch": 0.18, + "learning_rate": 1.645877829987185e-07, + "loss": 0.0036, + "step": 9169 + }, + { + "epoch": 0.18, + "learning_rate": 1.6458389965438236e-07, + "loss": 0.0087, + "step": 9170 + }, + { + "epoch": 0.18, + "learning_rate": 1.645800163100462e-07, + "loss": 0.8732, + "step": 9171 + }, + { + "epoch": 0.18, + "learning_rate": 1.6457613296571008e-07, + "loss": 0.0147, + "step": 9172 + }, + { + "epoch": 0.18, + "learning_rate": 1.6457224962137392e-07, + "loss": 0.004, + "step": 9173 + }, + { + "epoch": 0.18, + "learning_rate": 1.645683662770378e-07, + "loss": 0.0868, + "step": 9174 + }, + { + "epoch": 0.18, + "learning_rate": 1.6456448293270164e-07, + "loss": 0.0059, + "step": 9175 + }, + { + "epoch": 0.18, + "learning_rate": 1.645605995883655e-07, + "loss": 0.0109, + "step": 9176 + }, + { + "epoch": 0.18, + "learning_rate": 1.6455671624402936e-07, + "loss": 0.0765, + "step": 9177 + }, + { + "epoch": 0.18, + "learning_rate": 1.6455283289969323e-07, + "loss": 0.0042, + "step": 9178 + }, + { + "epoch": 0.18, + "learning_rate": 1.6454894955535707e-07, + "loss": 0.1692, + "step": 9179 + }, + { + "epoch": 0.18, + "learning_rate": 1.6454506621102094e-07, + "loss": 0.0305, + "step": 9180 + }, + { + "epoch": 0.18, + "learning_rate": 1.645411828666848e-07, + "loss": 0.0258, + "step": 9181 + }, + { + "epoch": 0.18, + "learning_rate": 1.6453729952234866e-07, + "loss": 0.0039, + "step": 9182 + }, + { + "epoch": 0.18, + "learning_rate": 1.645334161780125e-07, + "loss": 0.0132, + "step": 9183 + }, + { + "epoch": 0.18, + "learning_rate": 1.6452953283367638e-07, + "loss": 0.0047, + "step": 9184 + }, + { + "epoch": 0.18, + "learning_rate": 1.645256494893402e-07, + "loss": 0.0033, + "step": 9185 + }, + { + "epoch": 0.18, + "learning_rate": 1.6452176614500407e-07, + "loss": 0.006, + "step": 9186 + }, + { + "epoch": 0.18, + "learning_rate": 1.645178828006679e-07, + "loss": 0.0149, + "step": 9187 + }, + { + "epoch": 0.18, + "learning_rate": 1.6451399945633178e-07, + "loss": 0.0039, + "step": 9188 + }, + { + "epoch": 0.18, + "learning_rate": 1.6451011611199563e-07, + "loss": 0.0042, + "step": 9189 + }, + { + "epoch": 0.18, + "learning_rate": 1.645062327676595e-07, + "loss": 0.0034, + "step": 9190 + }, + { + "epoch": 0.18, + "learning_rate": 1.6450234942332335e-07, + "loss": 0.0045, + "step": 9191 + }, + { + "epoch": 0.18, + "learning_rate": 1.6449846607898722e-07, + "loss": 0.0052, + "step": 9192 + }, + { + "epoch": 0.18, + "learning_rate": 1.6449458273465106e-07, + "loss": 0.0041, + "step": 9193 + }, + { + "epoch": 0.18, + "learning_rate": 1.6449069939031493e-07, + "loss": 0.005, + "step": 9194 + }, + { + "epoch": 0.18, + "learning_rate": 1.6448681604597878e-07, + "loss": 0.0035, + "step": 9195 + }, + { + "epoch": 0.18, + "learning_rate": 1.6448293270164265e-07, + "loss": 0.0046, + "step": 9196 + }, + { + "epoch": 0.18, + "learning_rate": 1.644790493573065e-07, + "loss": 0.0049, + "step": 9197 + }, + { + "epoch": 0.18, + "learning_rate": 1.6447516601297037e-07, + "loss": 0.0049, + "step": 9198 + }, + { + "epoch": 0.18, + "learning_rate": 1.644712826686342e-07, + "loss": 0.003, + "step": 9199 + }, + { + "epoch": 0.18, + "learning_rate": 1.6446739932429808e-07, + "loss": 0.0677, + "step": 9200 + }, + { + "epoch": 0.18, + "learning_rate": 1.6446351597996193e-07, + "loss": 0.357, + "step": 9201 + }, + { + "epoch": 0.18, + "learning_rate": 1.644596326356258e-07, + "loss": 0.0082, + "step": 9202 + }, + { + "epoch": 0.18, + "learning_rate": 1.6445574929128964e-07, + "loss": 0.0091, + "step": 9203 + }, + { + "epoch": 0.18, + "learning_rate": 1.6445186594695352e-07, + "loss": 0.0045, + "step": 9204 + }, + { + "epoch": 0.18, + "learning_rate": 1.6444798260261736e-07, + "loss": 0.0045, + "step": 9205 + }, + { + "epoch": 0.18, + "learning_rate": 1.6444409925828123e-07, + "loss": 0.0122, + "step": 9206 + }, + { + "epoch": 0.18, + "learning_rate": 1.6444021591394508e-07, + "loss": 0.0053, + "step": 9207 + }, + { + "epoch": 0.18, + "learning_rate": 1.6443633256960895e-07, + "loss": 0.0111, + "step": 9208 + }, + { + "epoch": 0.18, + "learning_rate": 1.644324492252728e-07, + "loss": 0.0037, + "step": 9209 + }, + { + "epoch": 0.18, + "learning_rate": 1.6442856588093667e-07, + "loss": 0.0134, + "step": 9210 + }, + { + "epoch": 0.18, + "learning_rate": 1.644246825366005e-07, + "loss": 0.0046, + "step": 9211 + }, + { + "epoch": 0.18, + "learning_rate": 1.6442079919226438e-07, + "loss": 0.0236, + "step": 9212 + }, + { + "epoch": 0.18, + "learning_rate": 1.6441691584792823e-07, + "loss": 0.0066, + "step": 9213 + }, + { + "epoch": 0.18, + "learning_rate": 1.644130325035921e-07, + "loss": 0.004, + "step": 9214 + }, + { + "epoch": 0.18, + "learning_rate": 1.6440914915925594e-07, + "loss": 0.0028, + "step": 9215 + }, + { + "epoch": 0.18, + "learning_rate": 1.6440526581491981e-07, + "loss": 0.0052, + "step": 9216 + }, + { + "epoch": 0.18, + "learning_rate": 1.6440138247058366e-07, + "loss": 0.006, + "step": 9217 + }, + { + "epoch": 0.18, + "learning_rate": 1.6439749912624753e-07, + "loss": 0.0034, + "step": 9218 + }, + { + "epoch": 0.18, + "learning_rate": 1.6439361578191138e-07, + "loss": 0.7472, + "step": 9219 + }, + { + "epoch": 0.18, + "learning_rate": 1.6438973243757525e-07, + "loss": 0.0088, + "step": 9220 + }, + { + "epoch": 0.18, + "learning_rate": 1.643858490932391e-07, + "loss": 0.0033, + "step": 9221 + }, + { + "epoch": 0.18, + "learning_rate": 1.6438196574890296e-07, + "loss": 0.0039, + "step": 9222 + }, + { + "epoch": 0.18, + "learning_rate": 1.643780824045668e-07, + "loss": 0.9141, + "step": 9223 + }, + { + "epoch": 0.18, + "learning_rate": 1.6437419906023065e-07, + "loss": 0.0041, + "step": 9224 + }, + { + "epoch": 0.18, + "learning_rate": 1.6437031571589453e-07, + "loss": 0.0115, + "step": 9225 + }, + { + "epoch": 0.18, + "learning_rate": 1.6436643237155837e-07, + "loss": 0.9171, + "step": 9226 + }, + { + "epoch": 0.18, + "learning_rate": 1.6436254902722224e-07, + "loss": 0.6978, + "step": 9227 + }, + { + "epoch": 0.18, + "learning_rate": 1.643586656828861e-07, + "loss": 0.1048, + "step": 9228 + }, + { + "epoch": 0.18, + "learning_rate": 1.6435478233854996e-07, + "loss": 0.0054, + "step": 9229 + }, + { + "epoch": 0.18, + "learning_rate": 1.643508989942138e-07, + "loss": 0.0032, + "step": 9230 + }, + { + "epoch": 0.18, + "learning_rate": 1.6434701564987767e-07, + "loss": 0.4631, + "step": 9231 + }, + { + "epoch": 0.18, + "learning_rate": 1.6434313230554152e-07, + "loss": 0.0046, + "step": 9232 + }, + { + "epoch": 0.18, + "learning_rate": 1.643392489612054e-07, + "loss": 0.004, + "step": 9233 + }, + { + "epoch": 0.18, + "learning_rate": 1.6433536561686924e-07, + "loss": 0.004, + "step": 9234 + }, + { + "epoch": 0.18, + "learning_rate": 1.643314822725331e-07, + "loss": 0.0049, + "step": 9235 + }, + { + "epoch": 0.18, + "learning_rate": 1.6432759892819695e-07, + "loss": 0.0067, + "step": 9236 + }, + { + "epoch": 0.18, + "learning_rate": 1.6432371558386082e-07, + "loss": 0.0027, + "step": 9237 + }, + { + "epoch": 0.18, + "learning_rate": 1.6431983223952467e-07, + "loss": 0.0037, + "step": 9238 + }, + { + "epoch": 0.18, + "learning_rate": 1.6431594889518854e-07, + "loss": 0.0047, + "step": 9239 + }, + { + "epoch": 0.18, + "learning_rate": 1.6431206555085239e-07, + "loss": 0.0041, + "step": 9240 + }, + { + "epoch": 0.18, + "learning_rate": 1.6430818220651626e-07, + "loss": 0.0039, + "step": 9241 + }, + { + "epoch": 0.18, + "learning_rate": 1.643042988621801e-07, + "loss": 0.003, + "step": 9242 + }, + { + "epoch": 0.18, + "learning_rate": 1.6430041551784395e-07, + "loss": 0.0033, + "step": 9243 + }, + { + "epoch": 0.18, + "learning_rate": 1.6429653217350782e-07, + "loss": 0.0528, + "step": 9244 + }, + { + "epoch": 0.18, + "learning_rate": 1.6429264882917166e-07, + "loss": 0.0042, + "step": 9245 + }, + { + "epoch": 0.18, + "learning_rate": 1.6428876548483554e-07, + "loss": 0.0043, + "step": 9246 + }, + { + "epoch": 0.18, + "learning_rate": 1.6428488214049938e-07, + "loss": 0.1051, + "step": 9247 + }, + { + "epoch": 0.18, + "learning_rate": 1.6428099879616325e-07, + "loss": 0.0048, + "step": 9248 + }, + { + "epoch": 0.18, + "learning_rate": 1.642771154518271e-07, + "loss": 0.0044, + "step": 9249 + }, + { + "epoch": 0.18, + "learning_rate": 1.6427323210749097e-07, + "loss": 0.0029, + "step": 9250 + }, + { + "epoch": 0.18, + "learning_rate": 1.6426934876315481e-07, + "loss": 0.01, + "step": 9251 + }, + { + "epoch": 0.18, + "learning_rate": 1.6426546541881868e-07, + "loss": 0.0091, + "step": 9252 + }, + { + "epoch": 0.18, + "learning_rate": 1.6426158207448253e-07, + "loss": 0.0359, + "step": 9253 + }, + { + "epoch": 0.18, + "learning_rate": 1.6425769873014637e-07, + "loss": 0.0042, + "step": 9254 + }, + { + "epoch": 0.18, + "learning_rate": 1.6425381538581025e-07, + "loss": 0.0077, + "step": 9255 + }, + { + "epoch": 0.18, + "learning_rate": 1.642499320414741e-07, + "loss": 0.0036, + "step": 9256 + }, + { + "epoch": 0.18, + "learning_rate": 1.6424604869713796e-07, + "loss": 0.0057, + "step": 9257 + }, + { + "epoch": 0.18, + "learning_rate": 1.642421653528018e-07, + "loss": 0.0057, + "step": 9258 + }, + { + "epoch": 0.18, + "learning_rate": 1.6423828200846568e-07, + "loss": 0.0034, + "step": 9259 + }, + { + "epoch": 0.18, + "learning_rate": 1.6423439866412952e-07, + "loss": 0.0034, + "step": 9260 + }, + { + "epoch": 0.18, + "learning_rate": 1.642305153197934e-07, + "loss": 0.6923, + "step": 9261 + }, + { + "epoch": 0.18, + "learning_rate": 1.6422663197545724e-07, + "loss": 0.0331, + "step": 9262 + }, + { + "epoch": 0.18, + "learning_rate": 1.642227486311211e-07, + "loss": 0.0076, + "step": 9263 + }, + { + "epoch": 0.18, + "learning_rate": 1.6421886528678496e-07, + "loss": 0.006, + "step": 9264 + }, + { + "epoch": 0.18, + "learning_rate": 1.6421498194244883e-07, + "loss": 0.4628, + "step": 9265 + }, + { + "epoch": 0.18, + "learning_rate": 1.6421109859811267e-07, + "loss": 0.0054, + "step": 9266 + }, + { + "epoch": 0.18, + "learning_rate": 1.6420721525377655e-07, + "loss": 0.0076, + "step": 9267 + }, + { + "epoch": 0.18, + "learning_rate": 1.642033319094404e-07, + "loss": 0.0056, + "step": 9268 + }, + { + "epoch": 0.18, + "learning_rate": 1.6419944856510426e-07, + "loss": 0.0031, + "step": 9269 + }, + { + "epoch": 0.18, + "learning_rate": 1.641955652207681e-07, + "loss": 0.0037, + "step": 9270 + }, + { + "epoch": 0.18, + "learning_rate": 1.6419168187643198e-07, + "loss": 0.7288, + "step": 9271 + }, + { + "epoch": 0.18, + "learning_rate": 1.6418779853209582e-07, + "loss": 0.006, + "step": 9272 + }, + { + "epoch": 0.18, + "learning_rate": 1.641839151877597e-07, + "loss": 0.0034, + "step": 9273 + }, + { + "epoch": 0.18, + "learning_rate": 1.6418003184342354e-07, + "loss": 0.0039, + "step": 9274 + }, + { + "epoch": 0.18, + "learning_rate": 1.641761484990874e-07, + "loss": 0.0035, + "step": 9275 + }, + { + "epoch": 0.18, + "learning_rate": 1.6417226515475126e-07, + "loss": 0.6078, + "step": 9276 + }, + { + "epoch": 0.18, + "learning_rate": 1.6416838181041513e-07, + "loss": 0.7962, + "step": 9277 + }, + { + "epoch": 0.18, + "learning_rate": 1.6416449846607897e-07, + "loss": 0.0071, + "step": 9278 + }, + { + "epoch": 0.18, + "learning_rate": 1.6416061512174284e-07, + "loss": 0.0674, + "step": 9279 + }, + { + "epoch": 0.18, + "learning_rate": 1.641567317774067e-07, + "loss": 0.0036, + "step": 9280 + }, + { + "epoch": 0.18, + "learning_rate": 1.6415284843307056e-07, + "loss": 0.0025, + "step": 9281 + }, + { + "epoch": 0.18, + "learning_rate": 1.641489650887344e-07, + "loss": 0.0795, + "step": 9282 + }, + { + "epoch": 0.18, + "learning_rate": 1.6414508174439828e-07, + "loss": 0.0101, + "step": 9283 + }, + { + "epoch": 0.18, + "learning_rate": 1.6414119840006212e-07, + "loss": 0.0061, + "step": 9284 + }, + { + "epoch": 0.18, + "learning_rate": 1.64137315055726e-07, + "loss": 0.0038, + "step": 9285 + }, + { + "epoch": 0.18, + "learning_rate": 1.6413343171138984e-07, + "loss": 0.0055, + "step": 9286 + }, + { + "epoch": 0.18, + "learning_rate": 1.641295483670537e-07, + "loss": 0.0053, + "step": 9287 + }, + { + "epoch": 0.18, + "learning_rate": 1.6412566502271756e-07, + "loss": 0.1536, + "step": 9288 + }, + { + "epoch": 0.18, + "learning_rate": 1.6412178167838143e-07, + "loss": 0.0067, + "step": 9289 + }, + { + "epoch": 0.18, + "learning_rate": 1.6411789833404527e-07, + "loss": 0.005, + "step": 9290 + }, + { + "epoch": 0.18, + "learning_rate": 1.6411401498970914e-07, + "loss": 0.0421, + "step": 9291 + }, + { + "epoch": 0.18, + "learning_rate": 1.64110131645373e-07, + "loss": 0.0033, + "step": 9292 + }, + { + "epoch": 0.18, + "learning_rate": 1.6410624830103686e-07, + "loss": 0.0031, + "step": 9293 + }, + { + "epoch": 0.18, + "learning_rate": 1.641023649567007e-07, + "loss": 0.0424, + "step": 9294 + }, + { + "epoch": 0.18, + "learning_rate": 1.6409848161236458e-07, + "loss": 0.0095, + "step": 9295 + }, + { + "epoch": 0.18, + "learning_rate": 1.6409459826802842e-07, + "loss": 0.0047, + "step": 9296 + }, + { + "epoch": 0.18, + "learning_rate": 1.640907149236923e-07, + "loss": 0.0044, + "step": 9297 + }, + { + "epoch": 0.18, + "learning_rate": 1.6408683157935614e-07, + "loss": 0.0056, + "step": 9298 + }, + { + "epoch": 0.18, + "learning_rate": 1.6408294823502e-07, + "loss": 0.006, + "step": 9299 + }, + { + "epoch": 0.18, + "learning_rate": 1.6407906489068385e-07, + "loss": 0.0044, + "step": 9300 + }, + { + "epoch": 0.18, + "learning_rate": 1.640751815463477e-07, + "loss": 0.0034, + "step": 9301 + }, + { + "epoch": 0.18, + "learning_rate": 1.6407129820201154e-07, + "loss": 0.0037, + "step": 9302 + }, + { + "epoch": 0.18, + "learning_rate": 1.6406741485767542e-07, + "loss": 0.0054, + "step": 9303 + }, + { + "epoch": 0.18, + "learning_rate": 1.6406353151333926e-07, + "loss": 0.2528, + "step": 9304 + }, + { + "epoch": 0.18, + "learning_rate": 1.6405964816900313e-07, + "loss": 0.0038, + "step": 9305 + }, + { + "epoch": 0.18, + "learning_rate": 1.6405576482466698e-07, + "loss": 0.0045, + "step": 9306 + }, + { + "epoch": 0.18, + "learning_rate": 1.6405188148033085e-07, + "loss": 0.3754, + "step": 9307 + }, + { + "epoch": 0.18, + "learning_rate": 1.640479981359947e-07, + "loss": 0.5016, + "step": 9308 + }, + { + "epoch": 0.18, + "learning_rate": 1.6404411479165857e-07, + "loss": 0.0826, + "step": 9309 + }, + { + "epoch": 0.18, + "learning_rate": 1.640402314473224e-07, + "loss": 0.0042, + "step": 9310 + }, + { + "epoch": 0.18, + "learning_rate": 1.6403634810298628e-07, + "loss": 0.0059, + "step": 9311 + }, + { + "epoch": 0.18, + "learning_rate": 1.6403246475865013e-07, + "loss": 0.0079, + "step": 9312 + }, + { + "epoch": 0.18, + "learning_rate": 1.64028581414314e-07, + "loss": 0.0057, + "step": 9313 + }, + { + "epoch": 0.18, + "learning_rate": 1.6402469806997784e-07, + "loss": 0.0037, + "step": 9314 + }, + { + "epoch": 0.18, + "learning_rate": 1.6402081472564171e-07, + "loss": 0.0041, + "step": 9315 + }, + { + "epoch": 0.18, + "learning_rate": 1.6401693138130556e-07, + "loss": 0.0031, + "step": 9316 + }, + { + "epoch": 0.18, + "learning_rate": 1.6401304803696943e-07, + "loss": 0.0031, + "step": 9317 + }, + { + "epoch": 0.18, + "learning_rate": 1.6400916469263328e-07, + "loss": 0.0039, + "step": 9318 + }, + { + "epoch": 0.18, + "learning_rate": 1.6400528134829715e-07, + "loss": 0.0047, + "step": 9319 + }, + { + "epoch": 0.18, + "learning_rate": 1.64001398003961e-07, + "loss": 0.0036, + "step": 9320 + }, + { + "epoch": 0.18, + "learning_rate": 1.6399751465962486e-07, + "loss": 0.0062, + "step": 9321 + }, + { + "epoch": 0.18, + "learning_rate": 1.639936313152887e-07, + "loss": 0.0041, + "step": 9322 + }, + { + "epoch": 0.18, + "learning_rate": 1.6398974797095258e-07, + "loss": 0.123, + "step": 9323 + }, + { + "epoch": 0.18, + "learning_rate": 1.6398586462661643e-07, + "loss": 0.392, + "step": 9324 + }, + { + "epoch": 0.18, + "learning_rate": 1.639819812822803e-07, + "loss": 0.5568, + "step": 9325 + }, + { + "epoch": 0.18, + "learning_rate": 1.6397809793794414e-07, + "loss": 0.0091, + "step": 9326 + }, + { + "epoch": 0.18, + "learning_rate": 1.6397421459360801e-07, + "loss": 0.1281, + "step": 9327 + }, + { + "epoch": 0.18, + "learning_rate": 1.6397033124927186e-07, + "loss": 0.0223, + "step": 9328 + }, + { + "epoch": 0.18, + "learning_rate": 1.6396644790493573e-07, + "loss": 0.0062, + "step": 9329 + }, + { + "epoch": 0.18, + "learning_rate": 1.6396256456059957e-07, + "loss": 0.0028, + "step": 9330 + }, + { + "epoch": 0.18, + "learning_rate": 1.6395868121626345e-07, + "loss": 0.004, + "step": 9331 + }, + { + "epoch": 0.18, + "learning_rate": 1.639547978719273e-07, + "loss": 0.0028, + "step": 9332 + }, + { + "epoch": 0.18, + "learning_rate": 1.6395091452759116e-07, + "loss": 0.5825, + "step": 9333 + }, + { + "epoch": 0.18, + "learning_rate": 1.63947031183255e-07, + "loss": 0.0035, + "step": 9334 + }, + { + "epoch": 0.18, + "learning_rate": 1.6394314783891888e-07, + "loss": 0.1111, + "step": 9335 + }, + { + "epoch": 0.18, + "learning_rate": 1.6393926449458272e-07, + "loss": 0.0221, + "step": 9336 + }, + { + "epoch": 0.18, + "learning_rate": 1.639353811502466e-07, + "loss": 0.0037, + "step": 9337 + }, + { + "epoch": 0.18, + "learning_rate": 1.6393149780591044e-07, + "loss": 0.0064, + "step": 9338 + }, + { + "epoch": 0.18, + "learning_rate": 1.639276144615743e-07, + "loss": 0.0033, + "step": 9339 + }, + { + "epoch": 0.18, + "learning_rate": 1.6392373111723816e-07, + "loss": 0.0379, + "step": 9340 + }, + { + "epoch": 0.18, + "learning_rate": 1.6391984777290203e-07, + "loss": 0.0169, + "step": 9341 + }, + { + "epoch": 0.18, + "learning_rate": 1.6391596442856587e-07, + "loss": 0.0029, + "step": 9342 + }, + { + "epoch": 0.18, + "learning_rate": 1.6391208108422975e-07, + "loss": 0.0039, + "step": 9343 + }, + { + "epoch": 0.18, + "learning_rate": 1.639081977398936e-07, + "loss": 0.0103, + "step": 9344 + }, + { + "epoch": 0.18, + "learning_rate": 1.6390431439555746e-07, + "loss": 0.0042, + "step": 9345 + }, + { + "epoch": 0.18, + "learning_rate": 1.639004310512213e-07, + "loss": 0.0881, + "step": 9346 + }, + { + "epoch": 0.18, + "learning_rate": 1.6389654770688518e-07, + "loss": 0.0151, + "step": 9347 + }, + { + "epoch": 0.18, + "learning_rate": 1.6389266436254902e-07, + "loss": 0.0045, + "step": 9348 + }, + { + "epoch": 0.18, + "learning_rate": 1.638887810182129e-07, + "loss": 0.5555, + "step": 9349 + }, + { + "epoch": 0.18, + "learning_rate": 1.6388489767387674e-07, + "loss": 0.0145, + "step": 9350 + }, + { + "epoch": 0.18, + "learning_rate": 1.638810143295406e-07, + "loss": 0.3816, + "step": 9351 + }, + { + "epoch": 0.18, + "learning_rate": 1.6387713098520446e-07, + "loss": 0.0036, + "step": 9352 + }, + { + "epoch": 0.18, + "learning_rate": 1.6387324764086833e-07, + "loss": 0.0071, + "step": 9353 + }, + { + "epoch": 0.18, + "learning_rate": 1.6386936429653217e-07, + "loss": 0.003, + "step": 9354 + }, + { + "epoch": 0.18, + "learning_rate": 1.6386548095219604e-07, + "loss": 0.2063, + "step": 9355 + }, + { + "epoch": 0.18, + "learning_rate": 1.638615976078599e-07, + "loss": 0.0634, + "step": 9356 + }, + { + "epoch": 0.18, + "learning_rate": 1.6385771426352376e-07, + "loss": 0.01, + "step": 9357 + }, + { + "epoch": 0.18, + "learning_rate": 1.638538309191876e-07, + "loss": 0.0046, + "step": 9358 + }, + { + "epoch": 0.18, + "learning_rate": 1.6384994757485145e-07, + "loss": 0.0041, + "step": 9359 + }, + { + "epoch": 0.18, + "learning_rate": 1.638460642305153e-07, + "loss": 0.0067, + "step": 9360 + }, + { + "epoch": 0.18, + "learning_rate": 1.6384218088617917e-07, + "loss": 0.0037, + "step": 9361 + }, + { + "epoch": 0.18, + "learning_rate": 1.63838297541843e-07, + "loss": 0.003, + "step": 9362 + }, + { + "epoch": 0.18, + "learning_rate": 1.6383441419750688e-07, + "loss": 0.0074, + "step": 9363 + }, + { + "epoch": 0.18, + "learning_rate": 1.6383053085317073e-07, + "loss": 0.4517, + "step": 9364 + }, + { + "epoch": 0.18, + "learning_rate": 1.638266475088346e-07, + "loss": 0.0033, + "step": 9365 + }, + { + "epoch": 0.18, + "learning_rate": 1.6382276416449845e-07, + "loss": 0.0041, + "step": 9366 + }, + { + "epoch": 0.18, + "learning_rate": 1.6381888082016232e-07, + "loss": 0.006, + "step": 9367 + }, + { + "epoch": 0.18, + "learning_rate": 1.6381499747582616e-07, + "loss": 0.0042, + "step": 9368 + }, + { + "epoch": 0.18, + "learning_rate": 1.6381111413149003e-07, + "loss": 0.7237, + "step": 9369 + }, + { + "epoch": 0.18, + "learning_rate": 1.6380723078715388e-07, + "loss": 0.9905, + "step": 9370 + }, + { + "epoch": 0.18, + "learning_rate": 1.6380334744281775e-07, + "loss": 0.0257, + "step": 9371 + }, + { + "epoch": 0.18, + "learning_rate": 1.637994640984816e-07, + "loss": 0.0034, + "step": 9372 + }, + { + "epoch": 0.18, + "learning_rate": 1.6379558075414547e-07, + "loss": 0.0097, + "step": 9373 + }, + { + "epoch": 0.18, + "learning_rate": 1.637916974098093e-07, + "loss": 0.0031, + "step": 9374 + }, + { + "epoch": 0.18, + "learning_rate": 1.6378781406547318e-07, + "loss": 0.7456, + "step": 9375 + }, + { + "epoch": 0.18, + "learning_rate": 1.6378393072113703e-07, + "loss": 0.0038, + "step": 9376 + }, + { + "epoch": 0.18, + "learning_rate": 1.637800473768009e-07, + "loss": 0.4205, + "step": 9377 + }, + { + "epoch": 0.18, + "learning_rate": 1.6377616403246474e-07, + "loss": 0.0032, + "step": 9378 + }, + { + "epoch": 0.18, + "learning_rate": 1.6377228068812862e-07, + "loss": 0.0048, + "step": 9379 + }, + { + "epoch": 0.18, + "learning_rate": 1.6376839734379246e-07, + "loss": 0.0053, + "step": 9380 + }, + { + "epoch": 0.18, + "learning_rate": 1.6376451399945633e-07, + "loss": 0.0049, + "step": 9381 + }, + { + "epoch": 0.18, + "learning_rate": 1.6376063065512018e-07, + "loss": 0.5458, + "step": 9382 + }, + { + "epoch": 0.18, + "learning_rate": 1.6375674731078405e-07, + "loss": 0.005, + "step": 9383 + }, + { + "epoch": 0.18, + "learning_rate": 1.637528639664479e-07, + "loss": 0.0062, + "step": 9384 + }, + { + "epoch": 0.18, + "learning_rate": 1.6374898062211177e-07, + "loss": 0.0057, + "step": 9385 + }, + { + "epoch": 0.18, + "learning_rate": 1.637450972777756e-07, + "loss": 0.0052, + "step": 9386 + }, + { + "epoch": 0.18, + "learning_rate": 1.6374121393343948e-07, + "loss": 0.0662, + "step": 9387 + }, + { + "epoch": 0.18, + "learning_rate": 1.6373733058910333e-07, + "loss": 0.0047, + "step": 9388 + }, + { + "epoch": 0.18, + "learning_rate": 1.637334472447672e-07, + "loss": 0.3061, + "step": 9389 + }, + { + "epoch": 0.18, + "learning_rate": 1.6372956390043104e-07, + "loss": 0.0055, + "step": 9390 + }, + { + "epoch": 0.18, + "learning_rate": 1.6372568055609491e-07, + "loss": 0.6117, + "step": 9391 + }, + { + "epoch": 0.18, + "learning_rate": 1.6372179721175876e-07, + "loss": 0.0034, + "step": 9392 + }, + { + "epoch": 0.18, + "learning_rate": 1.6371791386742263e-07, + "loss": 0.0031, + "step": 9393 + }, + { + "epoch": 0.18, + "learning_rate": 1.6371403052308648e-07, + "loss": 0.0056, + "step": 9394 + }, + { + "epoch": 0.18, + "learning_rate": 1.6371014717875035e-07, + "loss": 0.0528, + "step": 9395 + }, + { + "epoch": 0.18, + "learning_rate": 1.637062638344142e-07, + "loss": 0.0038, + "step": 9396 + }, + { + "epoch": 0.18, + "learning_rate": 1.6370238049007806e-07, + "loss": 0.0039, + "step": 9397 + }, + { + "epoch": 0.18, + "learning_rate": 1.636984971457419e-07, + "loss": 0.0037, + "step": 9398 + }, + { + "epoch": 0.18, + "learning_rate": 1.6369461380140578e-07, + "loss": 0.6812, + "step": 9399 + }, + { + "epoch": 0.18, + "learning_rate": 1.6369073045706963e-07, + "loss": 0.0029, + "step": 9400 + }, + { + "epoch": 0.18, + "learning_rate": 1.6368684711273347e-07, + "loss": 0.0075, + "step": 9401 + }, + { + "epoch": 0.18, + "learning_rate": 1.6368296376839734e-07, + "loss": 0.0035, + "step": 9402 + }, + { + "epoch": 0.18, + "learning_rate": 1.636790804240612e-07, + "loss": 0.0044, + "step": 9403 + }, + { + "epoch": 0.18, + "learning_rate": 1.6367519707972506e-07, + "loss": 0.5805, + "step": 9404 + }, + { + "epoch": 0.18, + "learning_rate": 1.636713137353889e-07, + "loss": 0.004, + "step": 9405 + }, + { + "epoch": 0.18, + "learning_rate": 1.6366743039105278e-07, + "loss": 0.003, + "step": 9406 + }, + { + "epoch": 0.18, + "learning_rate": 1.6366354704671662e-07, + "loss": 0.0525, + "step": 9407 + }, + { + "epoch": 0.18, + "learning_rate": 1.636596637023805e-07, + "loss": 0.0492, + "step": 9408 + }, + { + "epoch": 0.18, + "learning_rate": 1.6365578035804434e-07, + "loss": 0.0035, + "step": 9409 + }, + { + "epoch": 0.18, + "learning_rate": 1.636518970137082e-07, + "loss": 0.0035, + "step": 9410 + }, + { + "epoch": 0.18, + "learning_rate": 1.6364801366937205e-07, + "loss": 0.2707, + "step": 9411 + }, + { + "epoch": 0.18, + "learning_rate": 1.6364413032503592e-07, + "loss": 0.01, + "step": 9412 + }, + { + "epoch": 0.18, + "learning_rate": 1.6364024698069977e-07, + "loss": 0.006, + "step": 9413 + }, + { + "epoch": 0.18, + "learning_rate": 1.6363636363636364e-07, + "loss": 0.0049, + "step": 9414 + }, + { + "epoch": 0.18, + "learning_rate": 1.6363248029202749e-07, + "loss": 0.2358, + "step": 9415 + }, + { + "epoch": 0.18, + "learning_rate": 1.6362859694769136e-07, + "loss": 0.0408, + "step": 9416 + }, + { + "epoch": 0.18, + "learning_rate": 1.636247136033552e-07, + "loss": 0.5008, + "step": 9417 + }, + { + "epoch": 0.18, + "learning_rate": 1.6362083025901905e-07, + "loss": 0.0078, + "step": 9418 + }, + { + "epoch": 0.18, + "learning_rate": 1.6361694691468292e-07, + "loss": 0.5226, + "step": 9419 + }, + { + "epoch": 0.18, + "learning_rate": 1.6361306357034676e-07, + "loss": 0.0087, + "step": 9420 + }, + { + "epoch": 0.18, + "learning_rate": 1.6360918022601064e-07, + "loss": 0.5071, + "step": 9421 + }, + { + "epoch": 0.18, + "learning_rate": 1.6360529688167448e-07, + "loss": 0.2949, + "step": 9422 + }, + { + "epoch": 0.18, + "learning_rate": 1.6360141353733835e-07, + "loss": 0.9795, + "step": 9423 + }, + { + "epoch": 0.18, + "learning_rate": 1.635975301930022e-07, + "loss": 0.0602, + "step": 9424 + }, + { + "epoch": 0.18, + "learning_rate": 1.6359364684866607e-07, + "loss": 0.0031, + "step": 9425 + }, + { + "epoch": 0.18, + "learning_rate": 1.6358976350432991e-07, + "loss": 0.0043, + "step": 9426 + }, + { + "epoch": 0.18, + "learning_rate": 1.6358588015999378e-07, + "loss": 0.0071, + "step": 9427 + }, + { + "epoch": 0.18, + "learning_rate": 1.6358199681565763e-07, + "loss": 0.6269, + "step": 9428 + }, + { + "epoch": 0.18, + "learning_rate": 1.635781134713215e-07, + "loss": 0.0053, + "step": 9429 + }, + { + "epoch": 0.18, + "learning_rate": 1.6357423012698535e-07, + "loss": 0.0197, + "step": 9430 + }, + { + "epoch": 0.18, + "learning_rate": 1.635703467826492e-07, + "loss": 0.0034, + "step": 9431 + }, + { + "epoch": 0.18, + "learning_rate": 1.6356646343831306e-07, + "loss": 0.0246, + "step": 9432 + }, + { + "epoch": 0.18, + "learning_rate": 1.635625800939769e-07, + "loss": 0.0029, + "step": 9433 + }, + { + "epoch": 0.18, + "learning_rate": 1.6355869674964078e-07, + "loss": 0.2749, + "step": 9434 + }, + { + "epoch": 0.18, + "learning_rate": 1.6355481340530462e-07, + "loss": 0.069, + "step": 9435 + }, + { + "epoch": 0.18, + "learning_rate": 1.635509300609685e-07, + "loss": 0.0034, + "step": 9436 + }, + { + "epoch": 0.18, + "learning_rate": 1.6354704671663234e-07, + "loss": 0.0031, + "step": 9437 + }, + { + "epoch": 0.18, + "learning_rate": 1.635431633722962e-07, + "loss": 0.0038, + "step": 9438 + }, + { + "epoch": 0.18, + "learning_rate": 1.6353928002796006e-07, + "loss": 0.0048, + "step": 9439 + }, + { + "epoch": 0.18, + "learning_rate": 1.6353539668362393e-07, + "loss": 0.0055, + "step": 9440 + }, + { + "epoch": 0.18, + "learning_rate": 1.6353151333928777e-07, + "loss": 0.0123, + "step": 9441 + }, + { + "epoch": 0.18, + "learning_rate": 1.6352762999495165e-07, + "loss": 0.4982, + "step": 9442 + }, + { + "epoch": 0.18, + "learning_rate": 1.635237466506155e-07, + "loss": 0.0057, + "step": 9443 + }, + { + "epoch": 0.18, + "learning_rate": 1.6351986330627936e-07, + "loss": 0.0032, + "step": 9444 + }, + { + "epoch": 0.18, + "learning_rate": 1.635159799619432e-07, + "loss": 0.0037, + "step": 9445 + }, + { + "epoch": 0.18, + "learning_rate": 1.6351209661760708e-07, + "loss": 0.0027, + "step": 9446 + }, + { + "epoch": 0.18, + "learning_rate": 1.6350821327327092e-07, + "loss": 0.0553, + "step": 9447 + }, + { + "epoch": 0.18, + "learning_rate": 1.635043299289348e-07, + "loss": 0.3674, + "step": 9448 + }, + { + "epoch": 0.18, + "learning_rate": 1.6350044658459864e-07, + "loss": 0.009, + "step": 9449 + }, + { + "epoch": 0.18, + "learning_rate": 1.634965632402625e-07, + "loss": 0.0033, + "step": 9450 + }, + { + "epoch": 0.18, + "learning_rate": 1.6349267989592636e-07, + "loss": 0.0036, + "step": 9451 + }, + { + "epoch": 0.18, + "learning_rate": 1.6348879655159023e-07, + "loss": 0.0039, + "step": 9452 + }, + { + "epoch": 0.18, + "learning_rate": 1.6348491320725407e-07, + "loss": 0.7616, + "step": 9453 + }, + { + "epoch": 0.18, + "learning_rate": 1.6348102986291794e-07, + "loss": 0.006, + "step": 9454 + }, + { + "epoch": 0.18, + "learning_rate": 1.634771465185818e-07, + "loss": 0.0029, + "step": 9455 + }, + { + "epoch": 0.18, + "learning_rate": 1.6347326317424566e-07, + "loss": 0.0199, + "step": 9456 + }, + { + "epoch": 0.18, + "learning_rate": 1.634693798299095e-07, + "loss": 0.0919, + "step": 9457 + }, + { + "epoch": 0.18, + "learning_rate": 1.6346549648557338e-07, + "loss": 0.003, + "step": 9458 + }, + { + "epoch": 0.18, + "learning_rate": 1.6346161314123722e-07, + "loss": 0.222, + "step": 9459 + }, + { + "epoch": 0.18, + "learning_rate": 1.634577297969011e-07, + "loss": 0.0029, + "step": 9460 + }, + { + "epoch": 0.18, + "learning_rate": 1.6345384645256494e-07, + "loss": 0.0043, + "step": 9461 + }, + { + "epoch": 0.18, + "learning_rate": 1.634499631082288e-07, + "loss": 0.0054, + "step": 9462 + }, + { + "epoch": 0.18, + "learning_rate": 1.6344607976389266e-07, + "loss": 0.3648, + "step": 9463 + }, + { + "epoch": 0.18, + "learning_rate": 1.6344219641955653e-07, + "loss": 0.691, + "step": 9464 + }, + { + "epoch": 0.18, + "learning_rate": 1.6343831307522037e-07, + "loss": 0.0036, + "step": 9465 + }, + { + "epoch": 0.18, + "learning_rate": 1.6343442973088424e-07, + "loss": 0.0028, + "step": 9466 + }, + { + "epoch": 0.18, + "learning_rate": 1.634305463865481e-07, + "loss": 0.0047, + "step": 9467 + }, + { + "epoch": 0.18, + "learning_rate": 1.6342666304221196e-07, + "loss": 0.0049, + "step": 9468 + }, + { + "epoch": 0.18, + "learning_rate": 1.634227796978758e-07, + "loss": 0.0573, + "step": 9469 + }, + { + "epoch": 0.18, + "learning_rate": 1.6341889635353968e-07, + "loss": 0.0031, + "step": 9470 + }, + { + "epoch": 0.18, + "learning_rate": 1.6341501300920352e-07, + "loss": 0.0154, + "step": 9471 + }, + { + "epoch": 0.18, + "learning_rate": 1.634111296648674e-07, + "loss": 0.0033, + "step": 9472 + }, + { + "epoch": 0.18, + "learning_rate": 1.6340724632053124e-07, + "loss": 0.003, + "step": 9473 + }, + { + "epoch": 0.18, + "learning_rate": 1.634033629761951e-07, + "loss": 0.0026, + "step": 9474 + }, + { + "epoch": 0.18, + "learning_rate": 1.6339947963185893e-07, + "loss": 0.003, + "step": 9475 + }, + { + "epoch": 0.18, + "learning_rate": 1.633955962875228e-07, + "loss": 0.0035, + "step": 9476 + }, + { + "epoch": 0.18, + "learning_rate": 1.6339171294318664e-07, + "loss": 0.0042, + "step": 9477 + }, + { + "epoch": 0.18, + "learning_rate": 1.6338782959885052e-07, + "loss": 0.0171, + "step": 9478 + }, + { + "epoch": 0.18, + "learning_rate": 1.6338394625451436e-07, + "loss": 0.0055, + "step": 9479 + }, + { + "epoch": 0.18, + "learning_rate": 1.6338006291017823e-07, + "loss": 0.0038, + "step": 9480 + }, + { + "epoch": 0.18, + "learning_rate": 1.6337617956584208e-07, + "loss": 0.2462, + "step": 9481 + }, + { + "epoch": 0.18, + "learning_rate": 1.6337229622150595e-07, + "loss": 0.0027, + "step": 9482 + }, + { + "epoch": 0.18, + "learning_rate": 1.633684128771698e-07, + "loss": 0.0163, + "step": 9483 + }, + { + "epoch": 0.18, + "learning_rate": 1.6336452953283367e-07, + "loss": 0.0037, + "step": 9484 + }, + { + "epoch": 0.18, + "learning_rate": 1.633606461884975e-07, + "loss": 0.499, + "step": 9485 + }, + { + "epoch": 0.18, + "learning_rate": 1.6335676284416138e-07, + "loss": 0.0045, + "step": 9486 + }, + { + "epoch": 0.18, + "learning_rate": 1.6335287949982523e-07, + "loss": 0.0069, + "step": 9487 + }, + { + "epoch": 0.18, + "learning_rate": 1.633489961554891e-07, + "loss": 0.0033, + "step": 9488 + }, + { + "epoch": 0.18, + "learning_rate": 1.6334511281115294e-07, + "loss": 0.0046, + "step": 9489 + }, + { + "epoch": 0.18, + "learning_rate": 1.6334122946681681e-07, + "loss": 0.2284, + "step": 9490 + }, + { + "epoch": 0.18, + "learning_rate": 1.6333734612248066e-07, + "loss": 0.3992, + "step": 9491 + }, + { + "epoch": 0.18, + "learning_rate": 1.6333346277814453e-07, + "loss": 0.0031, + "step": 9492 + }, + { + "epoch": 0.18, + "learning_rate": 1.6332957943380838e-07, + "loss": 0.0558, + "step": 9493 + }, + { + "epoch": 0.18, + "learning_rate": 1.6332569608947225e-07, + "loss": 0.0032, + "step": 9494 + }, + { + "epoch": 0.18, + "learning_rate": 1.633218127451361e-07, + "loss": 0.0063, + "step": 9495 + }, + { + "epoch": 0.18, + "learning_rate": 1.6331792940079996e-07, + "loss": 0.2646, + "step": 9496 + }, + { + "epoch": 0.18, + "learning_rate": 1.633140460564638e-07, + "loss": 0.0058, + "step": 9497 + }, + { + "epoch": 0.18, + "learning_rate": 1.6331016271212768e-07, + "loss": 0.0059, + "step": 9498 + }, + { + "epoch": 0.18, + "learning_rate": 1.6330627936779153e-07, + "loss": 0.3412, + "step": 9499 + }, + { + "epoch": 0.18, + "learning_rate": 1.633023960234554e-07, + "loss": 0.1786, + "step": 9500 + }, + { + "epoch": 0.18, + "learning_rate": 1.6329851267911924e-07, + "loss": 0.0047, + "step": 9501 + }, + { + "epoch": 0.18, + "learning_rate": 1.6329462933478311e-07, + "loss": 0.0028, + "step": 9502 + }, + { + "epoch": 0.18, + "learning_rate": 1.6329074599044696e-07, + "loss": 0.0029, + "step": 9503 + }, + { + "epoch": 0.18, + "learning_rate": 1.6328686264611083e-07, + "loss": 0.4849, + "step": 9504 + }, + { + "epoch": 0.18, + "learning_rate": 1.6328297930177468e-07, + "loss": 0.005, + "step": 9505 + }, + { + "epoch": 0.18, + "learning_rate": 1.6327909595743855e-07, + "loss": 0.096, + "step": 9506 + }, + { + "epoch": 0.18, + "learning_rate": 1.632752126131024e-07, + "loss": 0.0034, + "step": 9507 + }, + { + "epoch": 0.18, + "learning_rate": 1.6327132926876626e-07, + "loss": 0.0043, + "step": 9508 + }, + { + "epoch": 0.18, + "learning_rate": 1.632674459244301e-07, + "loss": 0.0043, + "step": 9509 + }, + { + "epoch": 0.18, + "learning_rate": 1.6326356258009398e-07, + "loss": 0.0028, + "step": 9510 + }, + { + "epoch": 0.18, + "learning_rate": 1.6325967923575782e-07, + "loss": 0.0029, + "step": 9511 + }, + { + "epoch": 0.18, + "learning_rate": 1.632557958914217e-07, + "loss": 0.033, + "step": 9512 + }, + { + "epoch": 0.18, + "learning_rate": 1.6325191254708554e-07, + "loss": 0.0037, + "step": 9513 + }, + { + "epoch": 0.18, + "learning_rate": 1.632480292027494e-07, + "loss": 0.004, + "step": 9514 + }, + { + "epoch": 0.18, + "learning_rate": 1.6324414585841326e-07, + "loss": 0.0034, + "step": 9515 + }, + { + "epoch": 0.18, + "learning_rate": 1.6324026251407713e-07, + "loss": 0.0031, + "step": 9516 + }, + { + "epoch": 0.18, + "learning_rate": 1.6323637916974097e-07, + "loss": 0.0034, + "step": 9517 + }, + { + "epoch": 0.18, + "learning_rate": 1.6323249582540485e-07, + "loss": 0.0104, + "step": 9518 + }, + { + "epoch": 0.18, + "learning_rate": 1.632286124810687e-07, + "loss": 0.0036, + "step": 9519 + }, + { + "epoch": 0.18, + "learning_rate": 1.6322472913673256e-07, + "loss": 0.0034, + "step": 9520 + }, + { + "epoch": 0.18, + "learning_rate": 1.632208457923964e-07, + "loss": 0.017, + "step": 9521 + }, + { + "epoch": 0.18, + "learning_rate": 1.6321696244806028e-07, + "loss": 0.0149, + "step": 9522 + }, + { + "epoch": 0.18, + "learning_rate": 1.6321307910372412e-07, + "loss": 0.0035, + "step": 9523 + }, + { + "epoch": 0.18, + "learning_rate": 1.63209195759388e-07, + "loss": 0.0032, + "step": 9524 + }, + { + "epoch": 0.18, + "learning_rate": 1.6320531241505184e-07, + "loss": 0.004, + "step": 9525 + }, + { + "epoch": 0.18, + "learning_rate": 1.632014290707157e-07, + "loss": 0.0041, + "step": 9526 + }, + { + "epoch": 0.18, + "learning_rate": 1.6319754572637956e-07, + "loss": 0.2198, + "step": 9527 + }, + { + "epoch": 0.18, + "learning_rate": 1.6319366238204343e-07, + "loss": 0.0029, + "step": 9528 + }, + { + "epoch": 0.18, + "learning_rate": 1.6318977903770727e-07, + "loss": 0.0038, + "step": 9529 + }, + { + "epoch": 0.18, + "learning_rate": 1.6318589569337114e-07, + "loss": 0.7041, + "step": 9530 + }, + { + "epoch": 0.18, + "learning_rate": 1.63182012349035e-07, + "loss": 0.0038, + "step": 9531 + }, + { + "epoch": 0.18, + "learning_rate": 1.6317812900469886e-07, + "loss": 0.0047, + "step": 9532 + }, + { + "epoch": 0.18, + "learning_rate": 1.6317424566036268e-07, + "loss": 0.0037, + "step": 9533 + }, + { + "epoch": 0.18, + "learning_rate": 1.6317036231602655e-07, + "loss": 0.2821, + "step": 9534 + }, + { + "epoch": 0.18, + "learning_rate": 1.631664789716904e-07, + "loss": 0.0057, + "step": 9535 + }, + { + "epoch": 0.18, + "learning_rate": 1.6316259562735427e-07, + "loss": 0.0047, + "step": 9536 + }, + { + "epoch": 0.18, + "learning_rate": 1.631587122830181e-07, + "loss": 0.0041, + "step": 9537 + }, + { + "epoch": 0.19, + "learning_rate": 1.6315482893868198e-07, + "loss": 0.0056, + "step": 9538 + }, + { + "epoch": 0.19, + "learning_rate": 1.6315094559434583e-07, + "loss": 0.0117, + "step": 9539 + }, + { + "epoch": 0.19, + "learning_rate": 1.631470622500097e-07, + "loss": 0.0229, + "step": 9540 + }, + { + "epoch": 0.19, + "learning_rate": 1.6314317890567355e-07, + "loss": 0.0036, + "step": 9541 + }, + { + "epoch": 0.19, + "learning_rate": 1.6313929556133742e-07, + "loss": 0.0031, + "step": 9542 + }, + { + "epoch": 0.19, + "learning_rate": 1.6313541221700126e-07, + "loss": 0.0028, + "step": 9543 + }, + { + "epoch": 0.19, + "learning_rate": 1.6313152887266513e-07, + "loss": 0.0282, + "step": 9544 + }, + { + "epoch": 0.19, + "learning_rate": 1.6312764552832898e-07, + "loss": 0.0028, + "step": 9545 + }, + { + "epoch": 0.19, + "learning_rate": 1.6312376218399285e-07, + "loss": 0.0033, + "step": 9546 + }, + { + "epoch": 0.19, + "learning_rate": 1.631198788396567e-07, + "loss": 0.003, + "step": 9547 + }, + { + "epoch": 0.19, + "learning_rate": 1.6311599549532057e-07, + "loss": 0.0046, + "step": 9548 + }, + { + "epoch": 0.19, + "learning_rate": 1.631121121509844e-07, + "loss": 0.0032, + "step": 9549 + }, + { + "epoch": 0.19, + "learning_rate": 1.6310822880664828e-07, + "loss": 0.0201, + "step": 9550 + }, + { + "epoch": 0.19, + "learning_rate": 1.6310434546231213e-07, + "loss": 0.0063, + "step": 9551 + }, + { + "epoch": 0.19, + "learning_rate": 1.63100462117976e-07, + "loss": 0.0034, + "step": 9552 + }, + { + "epoch": 0.19, + "learning_rate": 1.6309657877363984e-07, + "loss": 0.0034, + "step": 9553 + }, + { + "epoch": 0.19, + "learning_rate": 1.6309269542930372e-07, + "loss": 0.1136, + "step": 9554 + }, + { + "epoch": 0.19, + "learning_rate": 1.6308881208496756e-07, + "loss": 0.0042, + "step": 9555 + }, + { + "epoch": 0.19, + "learning_rate": 1.6308492874063143e-07, + "loss": 0.005, + "step": 9556 + }, + { + "epoch": 0.19, + "learning_rate": 1.6308104539629528e-07, + "loss": 0.003, + "step": 9557 + }, + { + "epoch": 0.19, + "learning_rate": 1.6307716205195915e-07, + "loss": 0.2085, + "step": 9558 + }, + { + "epoch": 0.19, + "learning_rate": 1.63073278707623e-07, + "loss": 0.0173, + "step": 9559 + }, + { + "epoch": 0.19, + "learning_rate": 1.6306939536328687e-07, + "loss": 0.0045, + "step": 9560 + }, + { + "epoch": 0.19, + "learning_rate": 1.630655120189507e-07, + "loss": 0.004, + "step": 9561 + }, + { + "epoch": 0.19, + "learning_rate": 1.6306162867461458e-07, + "loss": 0.1319, + "step": 9562 + }, + { + "epoch": 0.19, + "learning_rate": 1.6305774533027843e-07, + "loss": 0.1214, + "step": 9563 + }, + { + "epoch": 0.19, + "learning_rate": 1.630538619859423e-07, + "loss": 0.7792, + "step": 9564 + }, + { + "epoch": 0.19, + "learning_rate": 1.6304997864160614e-07, + "loss": 0.0047, + "step": 9565 + }, + { + "epoch": 0.19, + "learning_rate": 1.6304609529727001e-07, + "loss": 0.0029, + "step": 9566 + }, + { + "epoch": 0.19, + "learning_rate": 1.6304221195293386e-07, + "loss": 0.003, + "step": 9567 + }, + { + "epoch": 0.19, + "learning_rate": 1.6303832860859773e-07, + "loss": 0.0032, + "step": 9568 + }, + { + "epoch": 0.19, + "learning_rate": 1.6303444526426158e-07, + "loss": 0.2368, + "step": 9569 + }, + { + "epoch": 0.19, + "learning_rate": 1.6303056191992545e-07, + "loss": 0.8521, + "step": 9570 + }, + { + "epoch": 0.19, + "learning_rate": 1.630266785755893e-07, + "loss": 0.0027, + "step": 9571 + }, + { + "epoch": 0.19, + "learning_rate": 1.6302279523125316e-07, + "loss": 0.8583, + "step": 9572 + }, + { + "epoch": 0.19, + "learning_rate": 1.63018911886917e-07, + "loss": 0.0112, + "step": 9573 + }, + { + "epoch": 0.19, + "learning_rate": 1.6301502854258088e-07, + "loss": 0.0078, + "step": 9574 + }, + { + "epoch": 0.19, + "learning_rate": 1.6301114519824473e-07, + "loss": 0.0117, + "step": 9575 + }, + { + "epoch": 0.19, + "learning_rate": 1.630072618539086e-07, + "loss": 0.4476, + "step": 9576 + }, + { + "epoch": 0.19, + "learning_rate": 1.6300337850957244e-07, + "loss": 0.0049, + "step": 9577 + }, + { + "epoch": 0.19, + "learning_rate": 1.629994951652363e-07, + "loss": 0.0044, + "step": 9578 + }, + { + "epoch": 0.19, + "learning_rate": 1.6299561182090016e-07, + "loss": 0.0166, + "step": 9579 + }, + { + "epoch": 0.19, + "learning_rate": 1.62991728476564e-07, + "loss": 0.003, + "step": 9580 + }, + { + "epoch": 0.19, + "learning_rate": 1.6298784513222788e-07, + "loss": 0.0029, + "step": 9581 + }, + { + "epoch": 0.19, + "learning_rate": 1.6298396178789172e-07, + "loss": 0.2925, + "step": 9582 + }, + { + "epoch": 0.19, + "learning_rate": 1.629800784435556e-07, + "loss": 0.0147, + "step": 9583 + }, + { + "epoch": 0.19, + "learning_rate": 1.6297619509921944e-07, + "loss": 0.2671, + "step": 9584 + }, + { + "epoch": 0.19, + "learning_rate": 1.629723117548833e-07, + "loss": 0.0217, + "step": 9585 + }, + { + "epoch": 0.19, + "learning_rate": 1.6296842841054715e-07, + "loss": 0.0032, + "step": 9586 + }, + { + "epoch": 0.19, + "learning_rate": 1.6296454506621102e-07, + "loss": 0.0034, + "step": 9587 + }, + { + "epoch": 0.19, + "learning_rate": 1.6296066172187487e-07, + "loss": 0.0083, + "step": 9588 + }, + { + "epoch": 0.19, + "learning_rate": 1.6295677837753874e-07, + "loss": 0.0055, + "step": 9589 + }, + { + "epoch": 0.19, + "learning_rate": 1.6295289503320259e-07, + "loss": 0.003, + "step": 9590 + }, + { + "epoch": 0.19, + "learning_rate": 1.6294901168886643e-07, + "loss": 0.0042, + "step": 9591 + }, + { + "epoch": 0.19, + "learning_rate": 1.629451283445303e-07, + "loss": 0.0034, + "step": 9592 + }, + { + "epoch": 0.19, + "learning_rate": 1.6294124500019415e-07, + "loss": 0.0039, + "step": 9593 + }, + { + "epoch": 0.19, + "learning_rate": 1.6293736165585802e-07, + "loss": 0.0024, + "step": 9594 + }, + { + "epoch": 0.19, + "learning_rate": 1.6293347831152186e-07, + "loss": 0.0155, + "step": 9595 + }, + { + "epoch": 0.19, + "learning_rate": 1.6292959496718574e-07, + "loss": 0.003, + "step": 9596 + }, + { + "epoch": 0.19, + "learning_rate": 1.6292571162284958e-07, + "loss": 0.007, + "step": 9597 + }, + { + "epoch": 0.19, + "learning_rate": 1.6292182827851345e-07, + "loss": 0.004, + "step": 9598 + }, + { + "epoch": 0.19, + "learning_rate": 1.629179449341773e-07, + "loss": 0.1848, + "step": 9599 + }, + { + "epoch": 0.19, + "learning_rate": 1.6291406158984117e-07, + "loss": 0.1028, + "step": 9600 + }, + { + "epoch": 0.19, + "learning_rate": 1.6291017824550501e-07, + "loss": 0.0048, + "step": 9601 + }, + { + "epoch": 0.19, + "learning_rate": 1.6290629490116889e-07, + "loss": 0.0033, + "step": 9602 + }, + { + "epoch": 0.19, + "learning_rate": 1.6290241155683273e-07, + "loss": 0.0041, + "step": 9603 + }, + { + "epoch": 0.19, + "learning_rate": 1.628985282124966e-07, + "loss": 0.004, + "step": 9604 + }, + { + "epoch": 0.19, + "learning_rate": 1.6289464486816045e-07, + "loss": 0.0975, + "step": 9605 + }, + { + "epoch": 0.19, + "learning_rate": 1.6289076152382432e-07, + "loss": 0.2599, + "step": 9606 + }, + { + "epoch": 0.19, + "learning_rate": 1.6288687817948816e-07, + "loss": 0.0024, + "step": 9607 + }, + { + "epoch": 0.19, + "learning_rate": 1.62882994835152e-07, + "loss": 0.0032, + "step": 9608 + }, + { + "epoch": 0.19, + "learning_rate": 1.6287911149081588e-07, + "loss": 0.0034, + "step": 9609 + }, + { + "epoch": 0.19, + "learning_rate": 1.6287522814647972e-07, + "loss": 0.0077, + "step": 9610 + }, + { + "epoch": 0.19, + "learning_rate": 1.628713448021436e-07, + "loss": 0.884, + "step": 9611 + }, + { + "epoch": 0.19, + "learning_rate": 1.6286746145780744e-07, + "loss": 0.008, + "step": 9612 + }, + { + "epoch": 0.19, + "learning_rate": 1.628635781134713e-07, + "loss": 0.0033, + "step": 9613 + }, + { + "epoch": 0.19, + "learning_rate": 1.6285969476913516e-07, + "loss": 0.0035, + "step": 9614 + }, + { + "epoch": 0.19, + "learning_rate": 1.6285581142479903e-07, + "loss": 0.0053, + "step": 9615 + }, + { + "epoch": 0.19, + "learning_rate": 1.6285192808046287e-07, + "loss": 0.0026, + "step": 9616 + }, + { + "epoch": 0.19, + "learning_rate": 1.6284804473612675e-07, + "loss": 0.0506, + "step": 9617 + }, + { + "epoch": 0.19, + "learning_rate": 1.628441613917906e-07, + "loss": 0.003, + "step": 9618 + }, + { + "epoch": 0.19, + "learning_rate": 1.6284027804745446e-07, + "loss": 0.0037, + "step": 9619 + }, + { + "epoch": 0.19, + "learning_rate": 1.628363947031183e-07, + "loss": 0.2579, + "step": 9620 + }, + { + "epoch": 0.19, + "learning_rate": 1.6283251135878218e-07, + "loss": 0.3896, + "step": 9621 + }, + { + "epoch": 0.19, + "learning_rate": 1.6282862801444602e-07, + "loss": 0.0968, + "step": 9622 + }, + { + "epoch": 0.19, + "learning_rate": 1.628247446701099e-07, + "loss": 0.0055, + "step": 9623 + }, + { + "epoch": 0.19, + "learning_rate": 1.6282086132577374e-07, + "loss": 0.0051, + "step": 9624 + }, + { + "epoch": 0.19, + "learning_rate": 1.628169779814376e-07, + "loss": 0.3224, + "step": 9625 + }, + { + "epoch": 0.19, + "learning_rate": 1.6281309463710146e-07, + "loss": 0.0031, + "step": 9626 + }, + { + "epoch": 0.19, + "learning_rate": 1.6280921129276533e-07, + "loss": 0.8622, + "step": 9627 + }, + { + "epoch": 0.19, + "learning_rate": 1.6280532794842917e-07, + "loss": 0.0042, + "step": 9628 + }, + { + "epoch": 0.19, + "learning_rate": 1.6280144460409304e-07, + "loss": 0.3471, + "step": 9629 + }, + { + "epoch": 0.19, + "learning_rate": 1.627975612597569e-07, + "loss": 0.6873, + "step": 9630 + }, + { + "epoch": 0.19, + "learning_rate": 1.6279367791542076e-07, + "loss": 0.0037, + "step": 9631 + }, + { + "epoch": 0.19, + "learning_rate": 1.627897945710846e-07, + "loss": 0.0048, + "step": 9632 + }, + { + "epoch": 0.19, + "learning_rate": 1.6278591122674848e-07, + "loss": 0.0598, + "step": 9633 + }, + { + "epoch": 0.19, + "learning_rate": 1.6278202788241232e-07, + "loss": 0.0029, + "step": 9634 + }, + { + "epoch": 0.19, + "learning_rate": 1.627781445380762e-07, + "loss": 0.0029, + "step": 9635 + }, + { + "epoch": 0.19, + "learning_rate": 1.6277426119374004e-07, + "loss": 0.0059, + "step": 9636 + }, + { + "epoch": 0.19, + "learning_rate": 1.627703778494039e-07, + "loss": 0.0038, + "step": 9637 + }, + { + "epoch": 0.19, + "learning_rate": 1.6276649450506776e-07, + "loss": 1.1455, + "step": 9638 + }, + { + "epoch": 0.19, + "learning_rate": 1.6276261116073163e-07, + "loss": 0.0045, + "step": 9639 + }, + { + "epoch": 0.19, + "learning_rate": 1.6275872781639547e-07, + "loss": 0.465, + "step": 9640 + }, + { + "epoch": 0.19, + "learning_rate": 1.6275484447205934e-07, + "loss": 0.0033, + "step": 9641 + }, + { + "epoch": 0.19, + "learning_rate": 1.627509611277232e-07, + "loss": 0.0045, + "step": 9642 + }, + { + "epoch": 0.19, + "learning_rate": 1.6274707778338706e-07, + "loss": 0.0103, + "step": 9643 + }, + { + "epoch": 0.19, + "learning_rate": 1.627431944390509e-07, + "loss": 0.0381, + "step": 9644 + }, + { + "epoch": 0.19, + "learning_rate": 1.6273931109471478e-07, + "loss": 0.0029, + "step": 9645 + }, + { + "epoch": 0.19, + "learning_rate": 1.6273542775037862e-07, + "loss": 0.0557, + "step": 9646 + }, + { + "epoch": 0.19, + "learning_rate": 1.627315444060425e-07, + "loss": 0.0246, + "step": 9647 + }, + { + "epoch": 0.19, + "learning_rate": 1.6272766106170634e-07, + "loss": 0.0395, + "step": 9648 + }, + { + "epoch": 0.19, + "learning_rate": 1.6272377771737018e-07, + "loss": 0.0033, + "step": 9649 + }, + { + "epoch": 0.19, + "learning_rate": 1.6271989437303403e-07, + "loss": 0.3787, + "step": 9650 + }, + { + "epoch": 0.19, + "learning_rate": 1.627160110286979e-07, + "loss": 0.0031, + "step": 9651 + }, + { + "epoch": 0.19, + "learning_rate": 1.6271212768436174e-07, + "loss": 0.0028, + "step": 9652 + }, + { + "epoch": 0.19, + "learning_rate": 1.6270824434002562e-07, + "loss": 0.0036, + "step": 9653 + }, + { + "epoch": 0.19, + "learning_rate": 1.6270436099568946e-07, + "loss": 0.0059, + "step": 9654 + }, + { + "epoch": 0.19, + "learning_rate": 1.6270047765135333e-07, + "loss": 0.0028, + "step": 9655 + }, + { + "epoch": 0.19, + "learning_rate": 1.6269659430701718e-07, + "loss": 0.0069, + "step": 9656 + }, + { + "epoch": 0.19, + "learning_rate": 1.6269271096268105e-07, + "loss": 0.0035, + "step": 9657 + }, + { + "epoch": 0.19, + "learning_rate": 1.626888276183449e-07, + "loss": 0.0031, + "step": 9658 + }, + { + "epoch": 0.19, + "learning_rate": 1.6268494427400877e-07, + "loss": 0.6808, + "step": 9659 + }, + { + "epoch": 0.19, + "learning_rate": 1.626810609296726e-07, + "loss": 0.1606, + "step": 9660 + }, + { + "epoch": 0.19, + "learning_rate": 1.6267717758533648e-07, + "loss": 0.7704, + "step": 9661 + }, + { + "epoch": 0.19, + "learning_rate": 1.6267329424100033e-07, + "loss": 0.35, + "step": 9662 + }, + { + "epoch": 0.19, + "learning_rate": 1.626694108966642e-07, + "loss": 0.0044, + "step": 9663 + }, + { + "epoch": 0.19, + "learning_rate": 1.6266552755232804e-07, + "loss": 0.005, + "step": 9664 + }, + { + "epoch": 0.19, + "learning_rate": 1.6266164420799191e-07, + "loss": 0.0219, + "step": 9665 + }, + { + "epoch": 0.19, + "learning_rate": 1.6265776086365576e-07, + "loss": 0.8458, + "step": 9666 + }, + { + "epoch": 0.19, + "learning_rate": 1.6265387751931963e-07, + "loss": 0.0033, + "step": 9667 + }, + { + "epoch": 0.19, + "learning_rate": 1.6264999417498348e-07, + "loss": 0.0079, + "step": 9668 + }, + { + "epoch": 0.19, + "learning_rate": 1.6264611083064735e-07, + "loss": 0.0038, + "step": 9669 + }, + { + "epoch": 0.19, + "learning_rate": 1.626422274863112e-07, + "loss": 0.0029, + "step": 9670 + }, + { + "epoch": 0.19, + "learning_rate": 1.6263834414197506e-07, + "loss": 0.0033, + "step": 9671 + }, + { + "epoch": 0.19, + "learning_rate": 1.626344607976389e-07, + "loss": 0.0049, + "step": 9672 + }, + { + "epoch": 0.19, + "learning_rate": 1.6263057745330278e-07, + "loss": 0.0038, + "step": 9673 + }, + { + "epoch": 0.19, + "learning_rate": 1.6262669410896663e-07, + "loss": 0.004, + "step": 9674 + }, + { + "epoch": 0.19, + "learning_rate": 1.626228107646305e-07, + "loss": 0.0084, + "step": 9675 + }, + { + "epoch": 0.19, + "learning_rate": 1.6261892742029434e-07, + "loss": 0.0066, + "step": 9676 + }, + { + "epoch": 0.19, + "learning_rate": 1.6261504407595821e-07, + "loss": 0.0045, + "step": 9677 + }, + { + "epoch": 0.19, + "learning_rate": 1.6261116073162206e-07, + "loss": 0.0077, + "step": 9678 + }, + { + "epoch": 0.19, + "learning_rate": 1.6260727738728593e-07, + "loss": 0.0028, + "step": 9679 + }, + { + "epoch": 0.19, + "learning_rate": 1.6260339404294978e-07, + "loss": 0.0081, + "step": 9680 + }, + { + "epoch": 0.19, + "learning_rate": 1.6259951069861365e-07, + "loss": 0.0021, + "step": 9681 + }, + { + "epoch": 0.19, + "learning_rate": 1.625956273542775e-07, + "loss": 0.0031, + "step": 9682 + }, + { + "epoch": 0.19, + "learning_rate": 1.6259174400994136e-07, + "loss": 0.0038, + "step": 9683 + }, + { + "epoch": 0.19, + "learning_rate": 1.625878606656052e-07, + "loss": 0.0029, + "step": 9684 + }, + { + "epoch": 0.19, + "learning_rate": 1.6258397732126908e-07, + "loss": 0.0033, + "step": 9685 + }, + { + "epoch": 0.19, + "learning_rate": 1.6258009397693292e-07, + "loss": 0.0086, + "step": 9686 + }, + { + "epoch": 0.19, + "learning_rate": 1.625762106325968e-07, + "loss": 0.0067, + "step": 9687 + }, + { + "epoch": 0.19, + "learning_rate": 1.6257232728826064e-07, + "loss": 0.0027, + "step": 9688 + }, + { + "epoch": 0.19, + "learning_rate": 1.625684439439245e-07, + "loss": 0.0034, + "step": 9689 + }, + { + "epoch": 0.19, + "learning_rate": 1.6256456059958836e-07, + "loss": 0.2835, + "step": 9690 + }, + { + "epoch": 0.19, + "learning_rate": 1.6256067725525223e-07, + "loss": 0.003, + "step": 9691 + }, + { + "epoch": 0.19, + "learning_rate": 1.6255679391091607e-07, + "loss": 0.0366, + "step": 9692 + }, + { + "epoch": 0.19, + "learning_rate": 1.6255291056657995e-07, + "loss": 0.0043, + "step": 9693 + }, + { + "epoch": 0.19, + "learning_rate": 1.625490272222438e-07, + "loss": 0.0022, + "step": 9694 + }, + { + "epoch": 0.19, + "learning_rate": 1.6254514387790766e-07, + "loss": 0.0031, + "step": 9695 + }, + { + "epoch": 0.19, + "learning_rate": 1.625412605335715e-07, + "loss": 0.0123, + "step": 9696 + }, + { + "epoch": 0.19, + "learning_rate": 1.6253737718923538e-07, + "loss": 0.0064, + "step": 9697 + }, + { + "epoch": 0.19, + "learning_rate": 1.6253349384489922e-07, + "loss": 0.0027, + "step": 9698 + }, + { + "epoch": 0.19, + "learning_rate": 1.625296105005631e-07, + "loss": 0.0031, + "step": 9699 + }, + { + "epoch": 0.19, + "learning_rate": 1.6252572715622694e-07, + "loss": 0.0026, + "step": 9700 + }, + { + "epoch": 0.19, + "learning_rate": 1.625218438118908e-07, + "loss": 0.0025, + "step": 9701 + }, + { + "epoch": 0.19, + "learning_rate": 1.6251796046755466e-07, + "loss": 0.0307, + "step": 9702 + }, + { + "epoch": 0.19, + "learning_rate": 1.6251407712321853e-07, + "loss": 0.1294, + "step": 9703 + }, + { + "epoch": 0.19, + "learning_rate": 1.6251019377888237e-07, + "loss": 0.0241, + "step": 9704 + }, + { + "epoch": 0.19, + "learning_rate": 1.6250631043454624e-07, + "loss": 0.0032, + "step": 9705 + }, + { + "epoch": 0.19, + "learning_rate": 1.625024270902101e-07, + "loss": 0.0029, + "step": 9706 + }, + { + "epoch": 0.19, + "learning_rate": 1.6249854374587393e-07, + "loss": 0.0025, + "step": 9707 + }, + { + "epoch": 0.19, + "learning_rate": 1.6249466040153778e-07, + "loss": 0.0184, + "step": 9708 + }, + { + "epoch": 0.19, + "learning_rate": 1.6249077705720165e-07, + "loss": 0.2658, + "step": 9709 + }, + { + "epoch": 0.19, + "learning_rate": 1.624868937128655e-07, + "loss": 0.0073, + "step": 9710 + }, + { + "epoch": 0.19, + "learning_rate": 1.6248301036852937e-07, + "loss": 0.6944, + "step": 9711 + }, + { + "epoch": 0.19, + "learning_rate": 1.624791270241932e-07, + "loss": 0.0035, + "step": 9712 + }, + { + "epoch": 0.19, + "learning_rate": 1.6247524367985708e-07, + "loss": 0.003, + "step": 9713 + }, + { + "epoch": 0.19, + "learning_rate": 1.6247136033552093e-07, + "loss": 0.0157, + "step": 9714 + }, + { + "epoch": 0.19, + "learning_rate": 1.624674769911848e-07, + "loss": 0.0285, + "step": 9715 + }, + { + "epoch": 0.19, + "learning_rate": 1.6246359364684865e-07, + "loss": 0.1998, + "step": 9716 + }, + { + "epoch": 0.19, + "learning_rate": 1.6245971030251252e-07, + "loss": 0.0029, + "step": 9717 + }, + { + "epoch": 0.19, + "learning_rate": 1.6245582695817636e-07, + "loss": 0.0036, + "step": 9718 + }, + { + "epoch": 0.19, + "learning_rate": 1.6245194361384023e-07, + "loss": 0.0026, + "step": 9719 + }, + { + "epoch": 0.19, + "learning_rate": 1.6244806026950408e-07, + "loss": 0.0027, + "step": 9720 + }, + { + "epoch": 0.19, + "learning_rate": 1.6244417692516795e-07, + "loss": 0.0084, + "step": 9721 + }, + { + "epoch": 0.19, + "learning_rate": 1.624402935808318e-07, + "loss": 0.2472, + "step": 9722 + }, + { + "epoch": 0.19, + "learning_rate": 1.6243641023649567e-07, + "loss": 0.0071, + "step": 9723 + }, + { + "epoch": 0.19, + "learning_rate": 1.624325268921595e-07, + "loss": 0.0305, + "step": 9724 + }, + { + "epoch": 0.19, + "learning_rate": 1.6242864354782338e-07, + "loss": 0.0031, + "step": 9725 + }, + { + "epoch": 0.19, + "learning_rate": 1.6242476020348723e-07, + "loss": 0.0033, + "step": 9726 + }, + { + "epoch": 0.19, + "learning_rate": 1.624208768591511e-07, + "loss": 0.0037, + "step": 9727 + }, + { + "epoch": 0.19, + "learning_rate": 1.6241699351481494e-07, + "loss": 0.0032, + "step": 9728 + }, + { + "epoch": 0.19, + "learning_rate": 1.6241311017047882e-07, + "loss": 0.4313, + "step": 9729 + }, + { + "epoch": 0.19, + "learning_rate": 1.6240922682614266e-07, + "loss": 0.1247, + "step": 9730 + }, + { + "epoch": 0.19, + "learning_rate": 1.6240534348180653e-07, + "loss": 0.5337, + "step": 9731 + }, + { + "epoch": 0.19, + "learning_rate": 1.6240146013747038e-07, + "loss": 0.0038, + "step": 9732 + }, + { + "epoch": 0.19, + "learning_rate": 1.6239757679313425e-07, + "loss": 0.5555, + "step": 9733 + }, + { + "epoch": 0.19, + "learning_rate": 1.623936934487981e-07, + "loss": 0.0304, + "step": 9734 + }, + { + "epoch": 0.19, + "learning_rate": 1.6238981010446197e-07, + "loss": 0.1312, + "step": 9735 + }, + { + "epoch": 0.19, + "learning_rate": 1.623859267601258e-07, + "loss": 0.0027, + "step": 9736 + }, + { + "epoch": 0.19, + "learning_rate": 1.6238204341578968e-07, + "loss": 0.0038, + "step": 9737 + }, + { + "epoch": 0.19, + "learning_rate": 1.6237816007145353e-07, + "loss": 0.0038, + "step": 9738 + }, + { + "epoch": 0.19, + "learning_rate": 1.623742767271174e-07, + "loss": 0.0062, + "step": 9739 + }, + { + "epoch": 0.19, + "learning_rate": 1.6237039338278124e-07, + "loss": 0.0032, + "step": 9740 + }, + { + "epoch": 0.19, + "learning_rate": 1.6236651003844511e-07, + "loss": 0.0037, + "step": 9741 + }, + { + "epoch": 0.19, + "learning_rate": 1.6236262669410896e-07, + "loss": 0.0032, + "step": 9742 + }, + { + "epoch": 0.19, + "learning_rate": 1.6235874334977283e-07, + "loss": 0.0032, + "step": 9743 + }, + { + "epoch": 0.19, + "learning_rate": 1.6235486000543668e-07, + "loss": 0.0103, + "step": 9744 + }, + { + "epoch": 0.19, + "learning_rate": 1.6235097666110055e-07, + "loss": 0.6732, + "step": 9745 + }, + { + "epoch": 0.19, + "learning_rate": 1.623470933167644e-07, + "loss": 0.0028, + "step": 9746 + }, + { + "epoch": 0.19, + "learning_rate": 1.6234320997242826e-07, + "loss": 0.0038, + "step": 9747 + }, + { + "epoch": 0.19, + "learning_rate": 1.623393266280921e-07, + "loss": 0.2097, + "step": 9748 + }, + { + "epoch": 0.19, + "learning_rate": 1.6233544328375598e-07, + "loss": 0.0033, + "step": 9749 + }, + { + "epoch": 0.19, + "learning_rate": 1.6233155993941983e-07, + "loss": 0.0056, + "step": 9750 + }, + { + "epoch": 0.19, + "learning_rate": 1.623276765950837e-07, + "loss": 0.1316, + "step": 9751 + }, + { + "epoch": 0.19, + "learning_rate": 1.6232379325074754e-07, + "loss": 0.0079, + "step": 9752 + }, + { + "epoch": 0.19, + "learning_rate": 1.6231990990641141e-07, + "loss": 0.0037, + "step": 9753 + }, + { + "epoch": 0.19, + "learning_rate": 1.6231602656207526e-07, + "loss": 0.0024, + "step": 9754 + }, + { + "epoch": 0.19, + "learning_rate": 1.623121432177391e-07, + "loss": 0.0034, + "step": 9755 + }, + { + "epoch": 0.19, + "learning_rate": 1.6230825987340298e-07, + "loss": 0.0029, + "step": 9756 + }, + { + "epoch": 0.19, + "learning_rate": 1.6230437652906682e-07, + "loss": 0.3204, + "step": 9757 + }, + { + "epoch": 0.19, + "learning_rate": 1.623004931847307e-07, + "loss": 0.0051, + "step": 9758 + }, + { + "epoch": 0.19, + "learning_rate": 1.6229660984039454e-07, + "loss": 0.7404, + "step": 9759 + }, + { + "epoch": 0.19, + "learning_rate": 1.622927264960584e-07, + "loss": 0.0089, + "step": 9760 + }, + { + "epoch": 0.19, + "learning_rate": 1.6228884315172225e-07, + "loss": 0.9019, + "step": 9761 + }, + { + "epoch": 0.19, + "learning_rate": 1.6228495980738612e-07, + "loss": 0.0029, + "step": 9762 + }, + { + "epoch": 0.19, + "learning_rate": 1.6228107646304997e-07, + "loss": 0.0415, + "step": 9763 + }, + { + "epoch": 0.19, + "learning_rate": 1.6227719311871384e-07, + "loss": 0.3045, + "step": 9764 + }, + { + "epoch": 0.19, + "learning_rate": 1.6227330977437769e-07, + "loss": 0.0046, + "step": 9765 + }, + { + "epoch": 0.19, + "learning_rate": 1.6226942643004153e-07, + "loss": 0.3507, + "step": 9766 + }, + { + "epoch": 0.19, + "learning_rate": 1.622655430857054e-07, + "loss": 1.4935, + "step": 9767 + }, + { + "epoch": 0.19, + "learning_rate": 1.6226165974136925e-07, + "loss": 0.009, + "step": 9768 + }, + { + "epoch": 0.19, + "learning_rate": 1.6225777639703312e-07, + "loss": 0.9282, + "step": 9769 + }, + { + "epoch": 0.19, + "learning_rate": 1.6225389305269696e-07, + "loss": 0.0071, + "step": 9770 + }, + { + "epoch": 0.19, + "learning_rate": 1.6225000970836084e-07, + "loss": 0.1182, + "step": 9771 + }, + { + "epoch": 0.19, + "learning_rate": 1.6224612636402468e-07, + "loss": 0.0027, + "step": 9772 + }, + { + "epoch": 0.19, + "learning_rate": 1.6224224301968855e-07, + "loss": 0.02, + "step": 9773 + }, + { + "epoch": 0.19, + "learning_rate": 1.622383596753524e-07, + "loss": 0.0033, + "step": 9774 + }, + { + "epoch": 0.19, + "learning_rate": 1.6223447633101627e-07, + "loss": 0.0037, + "step": 9775 + }, + { + "epoch": 0.19, + "learning_rate": 1.6223059298668011e-07, + "loss": 0.0125, + "step": 9776 + }, + { + "epoch": 0.19, + "learning_rate": 1.6222670964234399e-07, + "loss": 0.0026, + "step": 9777 + }, + { + "epoch": 0.19, + "learning_rate": 1.6222282629800783e-07, + "loss": 0.6122, + "step": 9778 + }, + { + "epoch": 0.19, + "learning_rate": 1.622189429536717e-07, + "loss": 0.0036, + "step": 9779 + }, + { + "epoch": 0.19, + "learning_rate": 1.6221505960933555e-07, + "loss": 0.0029, + "step": 9780 + }, + { + "epoch": 0.19, + "learning_rate": 1.6221117626499942e-07, + "loss": 0.0064, + "step": 9781 + }, + { + "epoch": 0.19, + "learning_rate": 1.6220729292066326e-07, + "loss": 0.0029, + "step": 9782 + }, + { + "epoch": 0.19, + "learning_rate": 1.6220340957632713e-07, + "loss": 0.5108, + "step": 9783 + }, + { + "epoch": 0.19, + "learning_rate": 1.6219952623199098e-07, + "loss": 0.003, + "step": 9784 + }, + { + "epoch": 0.19, + "learning_rate": 1.6219564288765482e-07, + "loss": 0.0065, + "step": 9785 + }, + { + "epoch": 0.19, + "learning_rate": 1.621917595433187e-07, + "loss": 0.0311, + "step": 9786 + }, + { + "epoch": 0.19, + "learning_rate": 1.6218787619898254e-07, + "loss": 0.0089, + "step": 9787 + }, + { + "epoch": 0.19, + "learning_rate": 1.621839928546464e-07, + "loss": 0.0124, + "step": 9788 + }, + { + "epoch": 0.19, + "learning_rate": 1.6218010951031026e-07, + "loss": 0.0075, + "step": 9789 + }, + { + "epoch": 0.19, + "learning_rate": 1.6217622616597413e-07, + "loss": 0.3551, + "step": 9790 + }, + { + "epoch": 0.19, + "learning_rate": 1.6217234282163797e-07, + "loss": 0.0027, + "step": 9791 + }, + { + "epoch": 0.19, + "learning_rate": 1.6216845947730185e-07, + "loss": 0.0026, + "step": 9792 + }, + { + "epoch": 0.19, + "learning_rate": 1.621645761329657e-07, + "loss": 0.0032, + "step": 9793 + }, + { + "epoch": 0.19, + "learning_rate": 1.6216069278862956e-07, + "loss": 0.3477, + "step": 9794 + }, + { + "epoch": 0.19, + "learning_rate": 1.621568094442934e-07, + "loss": 0.0033, + "step": 9795 + }, + { + "epoch": 0.19, + "learning_rate": 1.6215292609995728e-07, + "loss": 0.0027, + "step": 9796 + }, + { + "epoch": 0.19, + "learning_rate": 1.6214904275562112e-07, + "loss": 0.0031, + "step": 9797 + }, + { + "epoch": 0.19, + "learning_rate": 1.62145159411285e-07, + "loss": 0.0056, + "step": 9798 + }, + { + "epoch": 0.19, + "learning_rate": 1.6214127606694884e-07, + "loss": 0.0934, + "step": 9799 + }, + { + "epoch": 0.19, + "learning_rate": 1.621373927226127e-07, + "loss": 0.0032, + "step": 9800 + }, + { + "epoch": 0.19, + "learning_rate": 1.6213350937827656e-07, + "loss": 0.1915, + "step": 9801 + }, + { + "epoch": 0.19, + "learning_rate": 1.6212962603394043e-07, + "loss": 0.0055, + "step": 9802 + }, + { + "epoch": 0.19, + "learning_rate": 1.6212574268960427e-07, + "loss": 0.003, + "step": 9803 + }, + { + "epoch": 0.19, + "learning_rate": 1.6212185934526814e-07, + "loss": 0.0027, + "step": 9804 + }, + { + "epoch": 0.19, + "learning_rate": 1.62117976000932e-07, + "loss": 0.0038, + "step": 9805 + }, + { + "epoch": 0.19, + "learning_rate": 1.6211409265659586e-07, + "loss": 0.0045, + "step": 9806 + }, + { + "epoch": 0.19, + "learning_rate": 1.621102093122597e-07, + "loss": 0.1318, + "step": 9807 + }, + { + "epoch": 0.19, + "learning_rate": 1.6210632596792358e-07, + "loss": 0.0025, + "step": 9808 + }, + { + "epoch": 0.19, + "learning_rate": 1.6210244262358742e-07, + "loss": 0.0033, + "step": 9809 + }, + { + "epoch": 0.19, + "learning_rate": 1.620985592792513e-07, + "loss": 0.0036, + "step": 9810 + }, + { + "epoch": 0.19, + "learning_rate": 1.6209467593491514e-07, + "loss": 0.0054, + "step": 9811 + }, + { + "epoch": 0.19, + "learning_rate": 1.62090792590579e-07, + "loss": 0.0049, + "step": 9812 + }, + { + "epoch": 0.19, + "learning_rate": 1.6208690924624286e-07, + "loss": 0.0024, + "step": 9813 + }, + { + "epoch": 0.19, + "learning_rate": 1.6208302590190673e-07, + "loss": 0.0034, + "step": 9814 + }, + { + "epoch": 0.19, + "learning_rate": 1.6207914255757057e-07, + "loss": 0.0302, + "step": 9815 + }, + { + "epoch": 0.19, + "learning_rate": 1.6207525921323444e-07, + "loss": 0.0034, + "step": 9816 + }, + { + "epoch": 0.19, + "learning_rate": 1.620713758688983e-07, + "loss": 0.0031, + "step": 9817 + }, + { + "epoch": 0.19, + "learning_rate": 1.6206749252456216e-07, + "loss": 0.0034, + "step": 9818 + }, + { + "epoch": 0.19, + "learning_rate": 1.62063609180226e-07, + "loss": 0.018, + "step": 9819 + }, + { + "epoch": 0.19, + "learning_rate": 1.6205972583588988e-07, + "loss": 0.1895, + "step": 9820 + }, + { + "epoch": 0.19, + "learning_rate": 1.6205584249155372e-07, + "loss": 0.5124, + "step": 9821 + }, + { + "epoch": 0.19, + "learning_rate": 1.620519591472176e-07, + "loss": 0.1199, + "step": 9822 + }, + { + "epoch": 0.19, + "learning_rate": 1.620480758028814e-07, + "loss": 0.0033, + "step": 9823 + }, + { + "epoch": 0.19, + "learning_rate": 1.6204419245854528e-07, + "loss": 0.0032, + "step": 9824 + }, + { + "epoch": 0.19, + "learning_rate": 1.6204030911420913e-07, + "loss": 0.0025, + "step": 9825 + }, + { + "epoch": 0.19, + "learning_rate": 1.62036425769873e-07, + "loss": 0.5016, + "step": 9826 + }, + { + "epoch": 0.19, + "learning_rate": 1.6203254242553684e-07, + "loss": 0.0026, + "step": 9827 + }, + { + "epoch": 0.19, + "learning_rate": 1.6202865908120072e-07, + "loss": 0.3355, + "step": 9828 + }, + { + "epoch": 0.19, + "learning_rate": 1.6202477573686456e-07, + "loss": 0.0154, + "step": 9829 + }, + { + "epoch": 0.19, + "learning_rate": 1.6202089239252843e-07, + "loss": 0.5048, + "step": 9830 + }, + { + "epoch": 0.19, + "learning_rate": 1.6201700904819228e-07, + "loss": 0.0028, + "step": 9831 + }, + { + "epoch": 0.19, + "learning_rate": 1.6201312570385615e-07, + "loss": 0.0055, + "step": 9832 + }, + { + "epoch": 0.19, + "learning_rate": 1.6200924235952e-07, + "loss": 0.0035, + "step": 9833 + }, + { + "epoch": 0.19, + "learning_rate": 1.6200535901518387e-07, + "loss": 0.0085, + "step": 9834 + }, + { + "epoch": 0.19, + "learning_rate": 1.620014756708477e-07, + "loss": 0.0139, + "step": 9835 + }, + { + "epoch": 0.19, + "learning_rate": 1.6199759232651158e-07, + "loss": 0.0033, + "step": 9836 + }, + { + "epoch": 0.19, + "learning_rate": 1.6199370898217543e-07, + "loss": 0.0043, + "step": 9837 + }, + { + "epoch": 0.19, + "learning_rate": 1.619898256378393e-07, + "loss": 0.0055, + "step": 9838 + }, + { + "epoch": 0.19, + "learning_rate": 1.6198594229350314e-07, + "loss": 0.7462, + "step": 9839 + }, + { + "epoch": 0.19, + "learning_rate": 1.6198205894916701e-07, + "loss": 0.0032, + "step": 9840 + }, + { + "epoch": 0.19, + "learning_rate": 1.6197817560483086e-07, + "loss": 0.0037, + "step": 9841 + }, + { + "epoch": 0.19, + "learning_rate": 1.6197429226049473e-07, + "loss": 0.6033, + "step": 9842 + }, + { + "epoch": 0.19, + "learning_rate": 1.6197040891615858e-07, + "loss": 0.0057, + "step": 9843 + }, + { + "epoch": 0.19, + "learning_rate": 1.6196652557182245e-07, + "loss": 0.7092, + "step": 9844 + }, + { + "epoch": 0.19, + "learning_rate": 1.619626422274863e-07, + "loss": 0.3616, + "step": 9845 + }, + { + "epoch": 0.19, + "learning_rate": 1.6195875888315016e-07, + "loss": 0.003, + "step": 9846 + }, + { + "epoch": 0.19, + "learning_rate": 1.61954875538814e-07, + "loss": 0.0061, + "step": 9847 + }, + { + "epoch": 0.19, + "learning_rate": 1.6195099219447788e-07, + "loss": 0.5528, + "step": 9848 + }, + { + "epoch": 0.19, + "learning_rate": 1.6194710885014173e-07, + "loss": 0.0027, + "step": 9849 + }, + { + "epoch": 0.19, + "learning_rate": 1.619432255058056e-07, + "loss": 0.0035, + "step": 9850 + }, + { + "epoch": 0.19, + "learning_rate": 1.6193934216146944e-07, + "loss": 0.303, + "step": 9851 + }, + { + "epoch": 0.19, + "learning_rate": 1.6193545881713331e-07, + "loss": 0.0089, + "step": 9852 + }, + { + "epoch": 0.19, + "learning_rate": 1.6193157547279716e-07, + "loss": 0.0064, + "step": 9853 + }, + { + "epoch": 0.19, + "learning_rate": 1.6192769212846103e-07, + "loss": 0.0036, + "step": 9854 + }, + { + "epoch": 0.19, + "learning_rate": 1.6192380878412488e-07, + "loss": 0.0052, + "step": 9855 + }, + { + "epoch": 0.19, + "learning_rate": 1.6191992543978875e-07, + "loss": 0.0142, + "step": 9856 + }, + { + "epoch": 0.19, + "learning_rate": 1.619160420954526e-07, + "loss": 0.0129, + "step": 9857 + }, + { + "epoch": 0.19, + "learning_rate": 1.6191215875111646e-07, + "loss": 0.0057, + "step": 9858 + }, + { + "epoch": 0.19, + "learning_rate": 1.619082754067803e-07, + "loss": 0.003, + "step": 9859 + }, + { + "epoch": 0.19, + "learning_rate": 1.6190439206244418e-07, + "loss": 0.0042, + "step": 9860 + }, + { + "epoch": 0.19, + "learning_rate": 1.6190050871810802e-07, + "loss": 0.0038, + "step": 9861 + }, + { + "epoch": 0.19, + "learning_rate": 1.618966253737719e-07, + "loss": 0.0217, + "step": 9862 + }, + { + "epoch": 0.19, + "learning_rate": 1.6189274202943574e-07, + "loss": 0.0026, + "step": 9863 + }, + { + "epoch": 0.19, + "learning_rate": 1.618888586850996e-07, + "loss": 0.0025, + "step": 9864 + }, + { + "epoch": 0.19, + "learning_rate": 1.6188497534076346e-07, + "loss": 0.0606, + "step": 9865 + }, + { + "epoch": 0.19, + "learning_rate": 1.6188109199642733e-07, + "loss": 0.0053, + "step": 9866 + }, + { + "epoch": 0.19, + "learning_rate": 1.6187720865209117e-07, + "loss": 0.0033, + "step": 9867 + }, + { + "epoch": 0.19, + "learning_rate": 1.6187332530775505e-07, + "loss": 0.0033, + "step": 9868 + }, + { + "epoch": 0.19, + "learning_rate": 1.618694419634189e-07, + "loss": 0.0029, + "step": 9869 + }, + { + "epoch": 0.19, + "learning_rate": 1.6186555861908276e-07, + "loss": 0.0161, + "step": 9870 + }, + { + "epoch": 0.19, + "learning_rate": 1.618616752747466e-07, + "loss": 0.0031, + "step": 9871 + }, + { + "epoch": 0.19, + "learning_rate": 1.6185779193041048e-07, + "loss": 0.0033, + "step": 9872 + }, + { + "epoch": 0.19, + "learning_rate": 1.6185390858607432e-07, + "loss": 0.12, + "step": 9873 + }, + { + "epoch": 0.19, + "learning_rate": 1.618500252417382e-07, + "loss": 0.0032, + "step": 9874 + }, + { + "epoch": 0.19, + "learning_rate": 1.6184614189740204e-07, + "loss": 0.0048, + "step": 9875 + }, + { + "epoch": 0.19, + "learning_rate": 1.618422585530659e-07, + "loss": 0.0024, + "step": 9876 + }, + { + "epoch": 0.19, + "learning_rate": 1.6183837520872976e-07, + "loss": 0.0127, + "step": 9877 + }, + { + "epoch": 0.19, + "learning_rate": 1.6183449186439363e-07, + "loss": 0.0038, + "step": 9878 + }, + { + "epoch": 0.19, + "learning_rate": 1.6183060852005747e-07, + "loss": 0.0032, + "step": 9879 + }, + { + "epoch": 0.19, + "learning_rate": 1.6182672517572134e-07, + "loss": 0.0031, + "step": 9880 + }, + { + "epoch": 0.19, + "learning_rate": 1.6182284183138516e-07, + "loss": 0.0043, + "step": 9881 + }, + { + "epoch": 0.19, + "learning_rate": 1.6181895848704903e-07, + "loss": 0.0032, + "step": 9882 + }, + { + "epoch": 0.19, + "learning_rate": 1.6181507514271288e-07, + "loss": 0.0041, + "step": 9883 + }, + { + "epoch": 0.19, + "learning_rate": 1.6181119179837675e-07, + "loss": 0.0024, + "step": 9884 + }, + { + "epoch": 0.19, + "learning_rate": 1.618073084540406e-07, + "loss": 0.0029, + "step": 9885 + }, + { + "epoch": 0.19, + "learning_rate": 1.6180342510970447e-07, + "loss": 0.9854, + "step": 9886 + }, + { + "epoch": 0.19, + "learning_rate": 1.617995417653683e-07, + "loss": 0.0026, + "step": 9887 + }, + { + "epoch": 0.19, + "learning_rate": 1.6179565842103218e-07, + "loss": 0.0027, + "step": 9888 + }, + { + "epoch": 0.19, + "learning_rate": 1.6179177507669603e-07, + "loss": 0.5471, + "step": 9889 + }, + { + "epoch": 0.19, + "learning_rate": 1.617878917323599e-07, + "loss": 0.0033, + "step": 9890 + }, + { + "epoch": 0.19, + "learning_rate": 1.6178400838802375e-07, + "loss": 0.032, + "step": 9891 + }, + { + "epoch": 0.19, + "learning_rate": 1.6178012504368762e-07, + "loss": 0.0027, + "step": 9892 + }, + { + "epoch": 0.19, + "learning_rate": 1.6177624169935146e-07, + "loss": 0.0041, + "step": 9893 + }, + { + "epoch": 0.19, + "learning_rate": 1.6177235835501533e-07, + "loss": 0.003, + "step": 9894 + }, + { + "epoch": 0.19, + "learning_rate": 1.6176847501067918e-07, + "loss": 0.0278, + "step": 9895 + }, + { + "epoch": 0.19, + "learning_rate": 1.6176459166634305e-07, + "loss": 1.1081, + "step": 9896 + }, + { + "epoch": 0.19, + "learning_rate": 1.617607083220069e-07, + "loss": 0.3484, + "step": 9897 + }, + { + "epoch": 0.19, + "learning_rate": 1.6175682497767077e-07, + "loss": 0.0038, + "step": 9898 + }, + { + "epoch": 0.19, + "learning_rate": 1.617529416333346e-07, + "loss": 0.0031, + "step": 9899 + }, + { + "epoch": 0.19, + "learning_rate": 1.6174905828899848e-07, + "loss": 0.0128, + "step": 9900 + }, + { + "epoch": 0.19, + "learning_rate": 1.6174517494466233e-07, + "loss": 0.0041, + "step": 9901 + }, + { + "epoch": 0.19, + "learning_rate": 1.617412916003262e-07, + "loss": 0.0033, + "step": 9902 + }, + { + "epoch": 0.19, + "learning_rate": 1.6173740825599004e-07, + "loss": 0.0039, + "step": 9903 + }, + { + "epoch": 0.19, + "learning_rate": 1.6173352491165392e-07, + "loss": 0.1778, + "step": 9904 + }, + { + "epoch": 0.19, + "learning_rate": 1.6172964156731776e-07, + "loss": 0.01, + "step": 9905 + }, + { + "epoch": 0.19, + "learning_rate": 1.6172575822298163e-07, + "loss": 0.0039, + "step": 9906 + }, + { + "epoch": 0.19, + "learning_rate": 1.6172187487864548e-07, + "loss": 0.0025, + "step": 9907 + }, + { + "epoch": 0.19, + "learning_rate": 1.6171799153430935e-07, + "loss": 0.0033, + "step": 9908 + }, + { + "epoch": 0.19, + "learning_rate": 1.617141081899732e-07, + "loss": 0.6225, + "step": 9909 + }, + { + "epoch": 0.19, + "learning_rate": 1.6171022484563707e-07, + "loss": 0.7919, + "step": 9910 + }, + { + "epoch": 0.19, + "learning_rate": 1.617063415013009e-07, + "loss": 0.0036, + "step": 9911 + }, + { + "epoch": 0.19, + "learning_rate": 1.6170245815696478e-07, + "loss": 0.0153, + "step": 9912 + }, + { + "epoch": 0.19, + "learning_rate": 1.6169857481262863e-07, + "loss": 0.8834, + "step": 9913 + }, + { + "epoch": 0.19, + "learning_rate": 1.616946914682925e-07, + "loss": 0.0061, + "step": 9914 + }, + { + "epoch": 0.19, + "learning_rate": 1.6169080812395634e-07, + "loss": 0.0054, + "step": 9915 + }, + { + "epoch": 0.19, + "learning_rate": 1.6168692477962021e-07, + "loss": 0.0037, + "step": 9916 + }, + { + "epoch": 0.19, + "learning_rate": 1.6168304143528406e-07, + "loss": 1.3557, + "step": 9917 + }, + { + "epoch": 0.19, + "learning_rate": 1.6167915809094793e-07, + "loss": 0.0198, + "step": 9918 + }, + { + "epoch": 0.19, + "learning_rate": 1.6167527474661178e-07, + "loss": 0.0034, + "step": 9919 + }, + { + "epoch": 0.19, + "learning_rate": 1.6167139140227565e-07, + "loss": 0.0024, + "step": 9920 + }, + { + "epoch": 0.19, + "learning_rate": 1.616675080579395e-07, + "loss": 0.0052, + "step": 9921 + }, + { + "epoch": 0.19, + "learning_rate": 1.6166362471360336e-07, + "loss": 0.1755, + "step": 9922 + }, + { + "epoch": 0.19, + "learning_rate": 1.616597413692672e-07, + "loss": 0.0415, + "step": 9923 + }, + { + "epoch": 0.19, + "learning_rate": 1.6165585802493108e-07, + "loss": 0.0031, + "step": 9924 + }, + { + "epoch": 0.19, + "learning_rate": 1.6165197468059493e-07, + "loss": 0.0029, + "step": 9925 + }, + { + "epoch": 0.19, + "learning_rate": 1.616480913362588e-07, + "loss": 0.0031, + "step": 9926 + }, + { + "epoch": 0.19, + "learning_rate": 1.6164420799192264e-07, + "loss": 0.6326, + "step": 9927 + }, + { + "epoch": 0.19, + "learning_rate": 1.6164032464758651e-07, + "loss": 0.6845, + "step": 9928 + }, + { + "epoch": 0.19, + "learning_rate": 1.6163644130325036e-07, + "loss": 0.674, + "step": 9929 + }, + { + "epoch": 0.19, + "learning_rate": 1.6163255795891423e-07, + "loss": 0.0091, + "step": 9930 + }, + { + "epoch": 0.19, + "learning_rate": 1.6162867461457808e-07, + "loss": 0.0026, + "step": 9931 + }, + { + "epoch": 0.19, + "learning_rate": 1.6162479127024192e-07, + "loss": 0.0825, + "step": 9932 + }, + { + "epoch": 0.19, + "learning_rate": 1.616209079259058e-07, + "loss": 0.0072, + "step": 9933 + }, + { + "epoch": 0.19, + "learning_rate": 1.6161702458156964e-07, + "loss": 0.0717, + "step": 9934 + }, + { + "epoch": 0.19, + "learning_rate": 1.616131412372335e-07, + "loss": 0.0036, + "step": 9935 + }, + { + "epoch": 0.19, + "learning_rate": 1.6160925789289735e-07, + "loss": 0.0028, + "step": 9936 + }, + { + "epoch": 0.19, + "learning_rate": 1.6160537454856122e-07, + "loss": 0.003, + "step": 9937 + }, + { + "epoch": 0.19, + "learning_rate": 1.6160149120422507e-07, + "loss": 0.007, + "step": 9938 + }, + { + "epoch": 0.19, + "learning_rate": 1.6159760785988891e-07, + "loss": 0.0022, + "step": 9939 + }, + { + "epoch": 0.19, + "learning_rate": 1.6159372451555279e-07, + "loss": 0.0035, + "step": 9940 + }, + { + "epoch": 0.19, + "learning_rate": 1.6158984117121663e-07, + "loss": 0.9354, + "step": 9941 + }, + { + "epoch": 0.19, + "learning_rate": 1.615859578268805e-07, + "loss": 0.4805, + "step": 9942 + }, + { + "epoch": 0.19, + "learning_rate": 1.6158207448254435e-07, + "loss": 0.0086, + "step": 9943 + }, + { + "epoch": 0.19, + "learning_rate": 1.6157819113820822e-07, + "loss": 0.0027, + "step": 9944 + }, + { + "epoch": 0.19, + "learning_rate": 1.6157430779387206e-07, + "loss": 0.0044, + "step": 9945 + }, + { + "epoch": 0.19, + "learning_rate": 1.6157042444953594e-07, + "loss": 0.3069, + "step": 9946 + }, + { + "epoch": 0.19, + "learning_rate": 1.6156654110519978e-07, + "loss": 0.0049, + "step": 9947 + }, + { + "epoch": 0.19, + "learning_rate": 1.6156265776086365e-07, + "loss": 0.019, + "step": 9948 + }, + { + "epoch": 0.19, + "learning_rate": 1.615587744165275e-07, + "loss": 0.4794, + "step": 9949 + }, + { + "epoch": 0.19, + "learning_rate": 1.6155489107219137e-07, + "loss": 0.0038, + "step": 9950 + }, + { + "epoch": 0.19, + "learning_rate": 1.6155100772785521e-07, + "loss": 0.003, + "step": 9951 + }, + { + "epoch": 0.19, + "learning_rate": 1.6154712438351909e-07, + "loss": 0.0079, + "step": 9952 + }, + { + "epoch": 0.19, + "learning_rate": 1.6154324103918293e-07, + "loss": 0.0142, + "step": 9953 + }, + { + "epoch": 0.19, + "learning_rate": 1.615393576948468e-07, + "loss": 0.0477, + "step": 9954 + }, + { + "epoch": 0.19, + "learning_rate": 1.6153547435051065e-07, + "loss": 0.385, + "step": 9955 + }, + { + "epoch": 0.19, + "learning_rate": 1.6153159100617452e-07, + "loss": 0.0028, + "step": 9956 + }, + { + "epoch": 0.19, + "learning_rate": 1.6152770766183836e-07, + "loss": 0.003, + "step": 9957 + }, + { + "epoch": 0.19, + "learning_rate": 1.6152382431750223e-07, + "loss": 0.0037, + "step": 9958 + }, + { + "epoch": 0.19, + "learning_rate": 1.6151994097316608e-07, + "loss": 1.1594, + "step": 9959 + }, + { + "epoch": 0.19, + "learning_rate": 1.6151605762882995e-07, + "loss": 0.0024, + "step": 9960 + }, + { + "epoch": 0.19, + "learning_rate": 1.615121742844938e-07, + "loss": 0.0095, + "step": 9961 + }, + { + "epoch": 0.19, + "learning_rate": 1.6150829094015764e-07, + "loss": 0.0027, + "step": 9962 + }, + { + "epoch": 0.19, + "learning_rate": 1.615044075958215e-07, + "loss": 0.0029, + "step": 9963 + }, + { + "epoch": 0.19, + "learning_rate": 1.6150052425148536e-07, + "loss": 0.0035, + "step": 9964 + }, + { + "epoch": 0.19, + "learning_rate": 1.6149664090714923e-07, + "loss": 0.003, + "step": 9965 + }, + { + "epoch": 0.19, + "learning_rate": 1.6149275756281307e-07, + "loss": 0.0034, + "step": 9966 + }, + { + "epoch": 0.19, + "learning_rate": 1.6148887421847695e-07, + "loss": 0.0036, + "step": 9967 + }, + { + "epoch": 0.19, + "learning_rate": 1.614849908741408e-07, + "loss": 0.0051, + "step": 9968 + }, + { + "epoch": 0.19, + "learning_rate": 1.6148110752980466e-07, + "loss": 0.003, + "step": 9969 + }, + { + "epoch": 0.19, + "learning_rate": 1.614772241854685e-07, + "loss": 0.0097, + "step": 9970 + }, + { + "epoch": 0.19, + "learning_rate": 1.6147334084113238e-07, + "loss": 0.503, + "step": 9971 + }, + { + "epoch": 0.19, + "learning_rate": 1.6146945749679622e-07, + "loss": 0.0063, + "step": 9972 + }, + { + "epoch": 0.19, + "learning_rate": 1.614655741524601e-07, + "loss": 0.0043, + "step": 9973 + }, + { + "epoch": 0.19, + "learning_rate": 1.6146169080812394e-07, + "loss": 0.0077, + "step": 9974 + }, + { + "epoch": 0.19, + "learning_rate": 1.614578074637878e-07, + "loss": 0.5236, + "step": 9975 + }, + { + "epoch": 0.19, + "learning_rate": 1.6145392411945166e-07, + "loss": 0.3238, + "step": 9976 + }, + { + "epoch": 0.19, + "learning_rate": 1.6145004077511553e-07, + "loss": 0.0127, + "step": 9977 + }, + { + "epoch": 0.19, + "learning_rate": 1.6144615743077937e-07, + "loss": 0.0028, + "step": 9978 + }, + { + "epoch": 0.19, + "learning_rate": 1.6144227408644324e-07, + "loss": 0.0028, + "step": 9979 + }, + { + "epoch": 0.19, + "learning_rate": 1.614383907421071e-07, + "loss": 0.003, + "step": 9980 + }, + { + "epoch": 0.19, + "learning_rate": 1.6143450739777096e-07, + "loss": 0.004, + "step": 9981 + }, + { + "epoch": 0.19, + "learning_rate": 1.614306240534348e-07, + "loss": 0.0028, + "step": 9982 + }, + { + "epoch": 0.19, + "learning_rate": 1.6142674070909868e-07, + "loss": 0.0511, + "step": 9983 + }, + { + "epoch": 0.19, + "learning_rate": 1.6142285736476252e-07, + "loss": 0.009, + "step": 9984 + }, + { + "epoch": 0.19, + "learning_rate": 1.614189740204264e-07, + "loss": 0.0033, + "step": 9985 + }, + { + "epoch": 0.19, + "learning_rate": 1.6141509067609024e-07, + "loss": 0.5226, + "step": 9986 + }, + { + "epoch": 0.19, + "learning_rate": 1.614112073317541e-07, + "loss": 0.0839, + "step": 9987 + }, + { + "epoch": 0.19, + "learning_rate": 1.6140732398741796e-07, + "loss": 0.0038, + "step": 9988 + }, + { + "epoch": 0.19, + "learning_rate": 1.6140344064308183e-07, + "loss": 0.0029, + "step": 9989 + }, + { + "epoch": 0.19, + "learning_rate": 1.6139955729874567e-07, + "loss": 0.0144, + "step": 9990 + }, + { + "epoch": 0.19, + "learning_rate": 1.6139567395440954e-07, + "loss": 0.0039, + "step": 9991 + }, + { + "epoch": 0.19, + "learning_rate": 1.613917906100734e-07, + "loss": 0.4602, + "step": 9992 + }, + { + "epoch": 0.19, + "learning_rate": 1.6138790726573726e-07, + "loss": 0.0034, + "step": 9993 + }, + { + "epoch": 0.19, + "learning_rate": 1.613840239214011e-07, + "loss": 0.0026, + "step": 9994 + }, + { + "epoch": 0.19, + "learning_rate": 1.6138014057706498e-07, + "loss": 0.0164, + "step": 9995 + }, + { + "epoch": 0.19, + "learning_rate": 1.6137625723272882e-07, + "loss": 0.0084, + "step": 9996 + }, + { + "epoch": 0.19, + "learning_rate": 1.6137237388839267e-07, + "loss": 0.7321, + "step": 9997 + }, + { + "epoch": 0.19, + "learning_rate": 1.613684905440565e-07, + "loss": 0.1028, + "step": 9998 + }, + { + "epoch": 0.19, + "learning_rate": 1.6136460719972038e-07, + "loss": 0.0041, + "step": 9999 + }, + { + "epoch": 0.19, + "learning_rate": 1.6136072385538423e-07, + "loss": 0.0037, + "step": 10000 + }, + { + "epoch": 0.19, + "learning_rate": 1.613568405110481e-07, + "loss": 0.0038, + "step": 10001 + }, + { + "epoch": 0.19, + "learning_rate": 1.6135295716671194e-07, + "loss": 0.0023, + "step": 10002 + }, + { + "epoch": 0.19, + "learning_rate": 1.6134907382237582e-07, + "loss": 0.0029, + "step": 10003 + }, + { + "epoch": 0.19, + "learning_rate": 1.6134519047803966e-07, + "loss": 0.0106, + "step": 10004 + }, + { + "epoch": 0.19, + "learning_rate": 1.6134130713370353e-07, + "loss": 0.0023, + "step": 10005 + }, + { + "epoch": 0.19, + "learning_rate": 1.6133742378936738e-07, + "loss": 0.0044, + "step": 10006 + }, + { + "epoch": 0.19, + "learning_rate": 1.6133354044503125e-07, + "loss": 0.0032, + "step": 10007 + }, + { + "epoch": 0.19, + "learning_rate": 1.613296571006951e-07, + "loss": 0.0032, + "step": 10008 + }, + { + "epoch": 0.19, + "learning_rate": 1.6132577375635897e-07, + "loss": 0.3411, + "step": 10009 + }, + { + "epoch": 0.19, + "learning_rate": 1.613218904120228e-07, + "loss": 0.003, + "step": 10010 + }, + { + "epoch": 0.19, + "learning_rate": 1.6131800706768668e-07, + "loss": 0.0075, + "step": 10011 + }, + { + "epoch": 0.19, + "learning_rate": 1.6131412372335053e-07, + "loss": 0.0079, + "step": 10012 + }, + { + "epoch": 0.19, + "learning_rate": 1.613102403790144e-07, + "loss": 0.3893, + "step": 10013 + }, + { + "epoch": 0.19, + "learning_rate": 1.6130635703467824e-07, + "loss": 0.0028, + "step": 10014 + }, + { + "epoch": 0.19, + "learning_rate": 1.6130247369034211e-07, + "loss": 0.0036, + "step": 10015 + }, + { + "epoch": 0.19, + "learning_rate": 1.6129859034600596e-07, + "loss": 0.0025, + "step": 10016 + }, + { + "epoch": 0.19, + "learning_rate": 1.6129470700166983e-07, + "loss": 0.0031, + "step": 10017 + }, + { + "epoch": 0.19, + "learning_rate": 1.6129082365733368e-07, + "loss": 0.0033, + "step": 10018 + }, + { + "epoch": 0.19, + "learning_rate": 1.6128694031299755e-07, + "loss": 0.0029, + "step": 10019 + }, + { + "epoch": 0.19, + "learning_rate": 1.612830569686614e-07, + "loss": 0.0059, + "step": 10020 + }, + { + "epoch": 0.19, + "learning_rate": 1.6127917362432526e-07, + "loss": 0.2439, + "step": 10021 + }, + { + "epoch": 0.19, + "learning_rate": 1.612752902799891e-07, + "loss": 0.0039, + "step": 10022 + }, + { + "epoch": 0.19, + "learning_rate": 1.6127140693565298e-07, + "loss": 0.0105, + "step": 10023 + }, + { + "epoch": 0.19, + "learning_rate": 1.6126752359131683e-07, + "loss": 0.0026, + "step": 10024 + }, + { + "epoch": 0.19, + "learning_rate": 1.612636402469807e-07, + "loss": 0.0028, + "step": 10025 + }, + { + "epoch": 0.19, + "learning_rate": 1.6125975690264454e-07, + "loss": 0.0042, + "step": 10026 + }, + { + "epoch": 0.19, + "learning_rate": 1.6125587355830841e-07, + "loss": 0.4354, + "step": 10027 + }, + { + "epoch": 0.19, + "learning_rate": 1.6125199021397226e-07, + "loss": 0.0323, + "step": 10028 + }, + { + "epoch": 0.19, + "learning_rate": 1.6124810686963613e-07, + "loss": 0.0034, + "step": 10029 + }, + { + "epoch": 0.19, + "learning_rate": 1.6124422352529998e-07, + "loss": 0.0037, + "step": 10030 + }, + { + "epoch": 0.19, + "learning_rate": 1.6124034018096385e-07, + "loss": 0.0034, + "step": 10031 + }, + { + "epoch": 0.19, + "learning_rate": 1.612364568366277e-07, + "loss": 0.0031, + "step": 10032 + }, + { + "epoch": 0.19, + "learning_rate": 1.6123257349229156e-07, + "loss": 0.2292, + "step": 10033 + }, + { + "epoch": 0.19, + "learning_rate": 1.612286901479554e-07, + "loss": 0.0031, + "step": 10034 + }, + { + "epoch": 0.19, + "learning_rate": 1.6122480680361928e-07, + "loss": 0.4008, + "step": 10035 + }, + { + "epoch": 0.19, + "learning_rate": 1.6122092345928312e-07, + "loss": 0.5513, + "step": 10036 + }, + { + "epoch": 0.19, + "learning_rate": 1.61217040114947e-07, + "loss": 0.0473, + "step": 10037 + }, + { + "epoch": 0.19, + "learning_rate": 1.6121315677061084e-07, + "loss": 0.0038, + "step": 10038 + }, + { + "epoch": 0.19, + "learning_rate": 1.612092734262747e-07, + "loss": 0.0026, + "step": 10039 + }, + { + "epoch": 0.19, + "learning_rate": 1.6120539008193856e-07, + "loss": 0.0335, + "step": 10040 + }, + { + "epoch": 0.19, + "learning_rate": 1.6120150673760243e-07, + "loss": 0.2795, + "step": 10041 + }, + { + "epoch": 0.19, + "learning_rate": 1.6119762339326627e-07, + "loss": 0.0083, + "step": 10042 + }, + { + "epoch": 0.19, + "learning_rate": 1.6119374004893015e-07, + "loss": 0.0031, + "step": 10043 + }, + { + "epoch": 0.19, + "learning_rate": 1.61189856704594e-07, + "loss": 0.3624, + "step": 10044 + }, + { + "epoch": 0.19, + "learning_rate": 1.6118597336025786e-07, + "loss": 0.0033, + "step": 10045 + }, + { + "epoch": 0.19, + "learning_rate": 1.611820900159217e-07, + "loss": 0.0037, + "step": 10046 + }, + { + "epoch": 0.19, + "learning_rate": 1.6117820667158558e-07, + "loss": 0.0037, + "step": 10047 + }, + { + "epoch": 0.19, + "learning_rate": 1.6117432332724942e-07, + "loss": 0.0031, + "step": 10048 + }, + { + "epoch": 0.19, + "learning_rate": 1.611704399829133e-07, + "loss": 0.0025, + "step": 10049 + }, + { + "epoch": 0.19, + "learning_rate": 1.6116655663857714e-07, + "loss": 0.0071, + "step": 10050 + }, + { + "epoch": 0.19, + "learning_rate": 1.61162673294241e-07, + "loss": 0.0054, + "step": 10051 + }, + { + "epoch": 0.19, + "learning_rate": 1.6115878994990486e-07, + "loss": 0.0031, + "step": 10052 + }, + { + "epoch": 0.2, + "learning_rate": 1.6115490660556873e-07, + "loss": 0.0209, + "step": 10053 + }, + { + "epoch": 0.2, + "learning_rate": 1.6115102326123257e-07, + "loss": 0.0027, + "step": 10054 + }, + { + "epoch": 0.2, + "learning_rate": 1.6114713991689642e-07, + "loss": 0.2164, + "step": 10055 + }, + { + "epoch": 0.2, + "learning_rate": 1.6114325657256026e-07, + "loss": 0.0143, + "step": 10056 + }, + { + "epoch": 0.2, + "learning_rate": 1.6113937322822413e-07, + "loss": 0.0031, + "step": 10057 + }, + { + "epoch": 0.2, + "learning_rate": 1.6113548988388798e-07, + "loss": 0.0062, + "step": 10058 + }, + { + "epoch": 0.2, + "learning_rate": 1.6113160653955185e-07, + "loss": 0.0074, + "step": 10059 + }, + { + "epoch": 0.2, + "learning_rate": 1.611277231952157e-07, + "loss": 0.004, + "step": 10060 + }, + { + "epoch": 0.2, + "learning_rate": 1.6112383985087957e-07, + "loss": 0.003, + "step": 10061 + }, + { + "epoch": 0.2, + "learning_rate": 1.611199565065434e-07, + "loss": 0.0033, + "step": 10062 + }, + { + "epoch": 0.2, + "learning_rate": 1.6111607316220728e-07, + "loss": 0.0029, + "step": 10063 + }, + { + "epoch": 0.2, + "learning_rate": 1.6111218981787113e-07, + "loss": 0.0048, + "step": 10064 + }, + { + "epoch": 0.2, + "learning_rate": 1.61108306473535e-07, + "loss": 0.0031, + "step": 10065 + }, + { + "epoch": 0.2, + "learning_rate": 1.6110442312919885e-07, + "loss": 0.0028, + "step": 10066 + }, + { + "epoch": 0.2, + "learning_rate": 1.6110053978486272e-07, + "loss": 0.0028, + "step": 10067 + }, + { + "epoch": 0.2, + "learning_rate": 1.6109665644052656e-07, + "loss": 0.0131, + "step": 10068 + }, + { + "epoch": 0.2, + "learning_rate": 1.6109277309619043e-07, + "loss": 0.2325, + "step": 10069 + }, + { + "epoch": 0.2, + "learning_rate": 1.6108888975185428e-07, + "loss": 0.0029, + "step": 10070 + }, + { + "epoch": 0.2, + "learning_rate": 1.6108500640751815e-07, + "loss": 0.2966, + "step": 10071 + }, + { + "epoch": 0.2, + "learning_rate": 1.61081123063182e-07, + "loss": 0.0055, + "step": 10072 + }, + { + "epoch": 0.2, + "learning_rate": 1.6107723971884587e-07, + "loss": 0.0221, + "step": 10073 + }, + { + "epoch": 0.2, + "learning_rate": 1.610733563745097e-07, + "loss": 0.0027, + "step": 10074 + }, + { + "epoch": 0.2, + "learning_rate": 1.6106947303017358e-07, + "loss": 0.7918, + "step": 10075 + }, + { + "epoch": 0.2, + "learning_rate": 1.6106558968583743e-07, + "loss": 0.0029, + "step": 10076 + }, + { + "epoch": 0.2, + "learning_rate": 1.610617063415013e-07, + "loss": 0.0277, + "step": 10077 + }, + { + "epoch": 0.2, + "learning_rate": 1.6105782299716514e-07, + "loss": 0.1151, + "step": 10078 + }, + { + "epoch": 0.2, + "learning_rate": 1.6105393965282902e-07, + "loss": 0.0028, + "step": 10079 + }, + { + "epoch": 0.2, + "learning_rate": 1.6105005630849286e-07, + "loss": 0.3816, + "step": 10080 + }, + { + "epoch": 0.2, + "learning_rate": 1.6104617296415673e-07, + "loss": 0.003, + "step": 10081 + }, + { + "epoch": 0.2, + "learning_rate": 1.6104228961982058e-07, + "loss": 0.0034, + "step": 10082 + }, + { + "epoch": 0.2, + "learning_rate": 1.6103840627548445e-07, + "loss": 0.003, + "step": 10083 + }, + { + "epoch": 0.2, + "learning_rate": 1.610345229311483e-07, + "loss": 0.0029, + "step": 10084 + }, + { + "epoch": 0.2, + "learning_rate": 1.6103063958681217e-07, + "loss": 0.005, + "step": 10085 + }, + { + "epoch": 0.2, + "learning_rate": 1.61026756242476e-07, + "loss": 0.0484, + "step": 10086 + }, + { + "epoch": 0.2, + "learning_rate": 1.6102287289813988e-07, + "loss": 0.3285, + "step": 10087 + }, + { + "epoch": 0.2, + "learning_rate": 1.6101898955380373e-07, + "loss": 0.0029, + "step": 10088 + }, + { + "epoch": 0.2, + "learning_rate": 1.610151062094676e-07, + "loss": 0.0026, + "step": 10089 + }, + { + "epoch": 0.2, + "learning_rate": 1.6101122286513144e-07, + "loss": 0.0027, + "step": 10090 + }, + { + "epoch": 0.2, + "learning_rate": 1.6100733952079532e-07, + "loss": 0.2562, + "step": 10091 + }, + { + "epoch": 0.2, + "learning_rate": 1.6100345617645916e-07, + "loss": 0.0034, + "step": 10092 + }, + { + "epoch": 0.2, + "learning_rate": 1.6099957283212303e-07, + "loss": 0.0047, + "step": 10093 + }, + { + "epoch": 0.2, + "learning_rate": 1.6099568948778688e-07, + "loss": 0.0034, + "step": 10094 + }, + { + "epoch": 0.2, + "learning_rate": 1.6099180614345075e-07, + "loss": 0.0032, + "step": 10095 + }, + { + "epoch": 0.2, + "learning_rate": 1.609879227991146e-07, + "loss": 0.0028, + "step": 10096 + }, + { + "epoch": 0.2, + "learning_rate": 1.6098403945477846e-07, + "loss": 0.0028, + "step": 10097 + }, + { + "epoch": 0.2, + "learning_rate": 1.609801561104423e-07, + "loss": 0.8342, + "step": 10098 + }, + { + "epoch": 0.2, + "learning_rate": 1.6097627276610618e-07, + "loss": 0.0034, + "step": 10099 + }, + { + "epoch": 0.2, + "learning_rate": 1.6097238942177003e-07, + "loss": 0.0025, + "step": 10100 + }, + { + "epoch": 0.2, + "learning_rate": 1.609685060774339e-07, + "loss": 0.0037, + "step": 10101 + }, + { + "epoch": 0.2, + "learning_rate": 1.6096462273309774e-07, + "loss": 0.058, + "step": 10102 + }, + { + "epoch": 0.2, + "learning_rate": 1.6096073938876161e-07, + "loss": 0.003, + "step": 10103 + }, + { + "epoch": 0.2, + "learning_rate": 1.6095685604442546e-07, + "loss": 0.004, + "step": 10104 + }, + { + "epoch": 0.2, + "learning_rate": 1.6095297270008933e-07, + "loss": 0.0097, + "step": 10105 + }, + { + "epoch": 0.2, + "learning_rate": 1.6094908935575318e-07, + "loss": 0.0303, + "step": 10106 + }, + { + "epoch": 0.2, + "learning_rate": 1.6094520601141705e-07, + "loss": 0.0851, + "step": 10107 + }, + { + "epoch": 0.2, + "learning_rate": 1.609413226670809e-07, + "loss": 0.0133, + "step": 10108 + }, + { + "epoch": 0.2, + "learning_rate": 1.6093743932274474e-07, + "loss": 0.5569, + "step": 10109 + }, + { + "epoch": 0.2, + "learning_rate": 1.609335559784086e-07, + "loss": 0.1503, + "step": 10110 + }, + { + "epoch": 0.2, + "learning_rate": 1.6092967263407245e-07, + "loss": 0.0629, + "step": 10111 + }, + { + "epoch": 0.2, + "learning_rate": 1.6092578928973632e-07, + "loss": 0.4347, + "step": 10112 + }, + { + "epoch": 0.2, + "learning_rate": 1.6092190594540017e-07, + "loss": 0.0559, + "step": 10113 + }, + { + "epoch": 0.2, + "learning_rate": 1.6091802260106401e-07, + "loss": 0.0035, + "step": 10114 + }, + { + "epoch": 0.2, + "learning_rate": 1.6091413925672789e-07, + "loss": 0.0486, + "step": 10115 + }, + { + "epoch": 0.2, + "learning_rate": 1.6091025591239173e-07, + "loss": 0.0025, + "step": 10116 + }, + { + "epoch": 0.2, + "learning_rate": 1.609063725680556e-07, + "loss": 0.0041, + "step": 10117 + }, + { + "epoch": 0.2, + "learning_rate": 1.6090248922371945e-07, + "loss": 0.0469, + "step": 10118 + }, + { + "epoch": 0.2, + "learning_rate": 1.6089860587938332e-07, + "loss": 0.0133, + "step": 10119 + }, + { + "epoch": 0.2, + "learning_rate": 1.6089472253504716e-07, + "loss": 0.0022, + "step": 10120 + }, + { + "epoch": 0.2, + "learning_rate": 1.6089083919071104e-07, + "loss": 0.0024, + "step": 10121 + }, + { + "epoch": 0.2, + "learning_rate": 1.6088695584637488e-07, + "loss": 0.647, + "step": 10122 + }, + { + "epoch": 0.2, + "learning_rate": 1.6088307250203875e-07, + "loss": 0.0049, + "step": 10123 + }, + { + "epoch": 0.2, + "learning_rate": 1.608791891577026e-07, + "loss": 0.0028, + "step": 10124 + }, + { + "epoch": 0.2, + "learning_rate": 1.6087530581336647e-07, + "loss": 0.003, + "step": 10125 + }, + { + "epoch": 0.2, + "learning_rate": 1.6087142246903031e-07, + "loss": 0.1598, + "step": 10126 + }, + { + "epoch": 0.2, + "learning_rate": 1.6086753912469419e-07, + "loss": 0.0021, + "step": 10127 + }, + { + "epoch": 0.2, + "learning_rate": 1.6086365578035803e-07, + "loss": 0.0036, + "step": 10128 + }, + { + "epoch": 0.2, + "learning_rate": 1.608597724360219e-07, + "loss": 0.0028, + "step": 10129 + }, + { + "epoch": 0.2, + "learning_rate": 1.6085588909168575e-07, + "loss": 0.005, + "step": 10130 + }, + { + "epoch": 0.2, + "learning_rate": 1.6085200574734962e-07, + "loss": 0.0033, + "step": 10131 + }, + { + "epoch": 0.2, + "learning_rate": 1.6084812240301346e-07, + "loss": 0.0282, + "step": 10132 + }, + { + "epoch": 0.2, + "learning_rate": 1.6084423905867733e-07, + "loss": 0.0024, + "step": 10133 + }, + { + "epoch": 0.2, + "learning_rate": 1.6084035571434118e-07, + "loss": 0.1543, + "step": 10134 + }, + { + "epoch": 0.2, + "learning_rate": 1.6083647237000505e-07, + "loss": 0.0026, + "step": 10135 + }, + { + "epoch": 0.2, + "learning_rate": 1.608325890256689e-07, + "loss": 0.0077, + "step": 10136 + }, + { + "epoch": 0.2, + "learning_rate": 1.6082870568133277e-07, + "loss": 0.0049, + "step": 10137 + }, + { + "epoch": 0.2, + "learning_rate": 1.608248223369966e-07, + "loss": 0.0024, + "step": 10138 + }, + { + "epoch": 0.2, + "learning_rate": 1.6082093899266046e-07, + "loss": 0.0076, + "step": 10139 + }, + { + "epoch": 0.2, + "learning_rate": 1.6081705564832433e-07, + "loss": 0.0029, + "step": 10140 + }, + { + "epoch": 0.2, + "learning_rate": 1.6081317230398817e-07, + "loss": 0.0026, + "step": 10141 + }, + { + "epoch": 0.2, + "learning_rate": 1.6080928895965205e-07, + "loss": 0.0123, + "step": 10142 + }, + { + "epoch": 0.2, + "learning_rate": 1.608054056153159e-07, + "loss": 0.0027, + "step": 10143 + }, + { + "epoch": 0.2, + "learning_rate": 1.6080152227097976e-07, + "loss": 0.6531, + "step": 10144 + }, + { + "epoch": 0.2, + "learning_rate": 1.607976389266436e-07, + "loss": 1.5524, + "step": 10145 + }, + { + "epoch": 0.2, + "learning_rate": 1.6079375558230748e-07, + "loss": 0.4309, + "step": 10146 + }, + { + "epoch": 0.2, + "learning_rate": 1.6078987223797132e-07, + "loss": 0.0083, + "step": 10147 + }, + { + "epoch": 0.2, + "learning_rate": 1.607859888936352e-07, + "loss": 0.0029, + "step": 10148 + }, + { + "epoch": 0.2, + "learning_rate": 1.6078210554929904e-07, + "loss": 0.0115, + "step": 10149 + }, + { + "epoch": 0.2, + "learning_rate": 1.607782222049629e-07, + "loss": 0.0025, + "step": 10150 + }, + { + "epoch": 0.2, + "learning_rate": 1.6077433886062676e-07, + "loss": 0.0039, + "step": 10151 + }, + { + "epoch": 0.2, + "learning_rate": 1.6077045551629063e-07, + "loss": 0.003, + "step": 10152 + }, + { + "epoch": 0.2, + "learning_rate": 1.6076657217195447e-07, + "loss": 0.0031, + "step": 10153 + }, + { + "epoch": 0.2, + "learning_rate": 1.6076268882761834e-07, + "loss": 0.0119, + "step": 10154 + }, + { + "epoch": 0.2, + "learning_rate": 1.607588054832822e-07, + "loss": 0.0033, + "step": 10155 + }, + { + "epoch": 0.2, + "learning_rate": 1.6075492213894606e-07, + "loss": 0.0033, + "step": 10156 + }, + { + "epoch": 0.2, + "learning_rate": 1.607510387946099e-07, + "loss": 0.8918, + "step": 10157 + }, + { + "epoch": 0.2, + "learning_rate": 1.6074715545027378e-07, + "loss": 0.0024, + "step": 10158 + }, + { + "epoch": 0.2, + "learning_rate": 1.6074327210593762e-07, + "loss": 0.0031, + "step": 10159 + }, + { + "epoch": 0.2, + "learning_rate": 1.607393887616015e-07, + "loss": 0.9613, + "step": 10160 + }, + { + "epoch": 0.2, + "learning_rate": 1.6073550541726534e-07, + "loss": 0.519, + "step": 10161 + }, + { + "epoch": 0.2, + "learning_rate": 1.607316220729292e-07, + "loss": 0.029, + "step": 10162 + }, + { + "epoch": 0.2, + "learning_rate": 1.6072773872859306e-07, + "loss": 0.0026, + "step": 10163 + }, + { + "epoch": 0.2, + "learning_rate": 1.6072385538425693e-07, + "loss": 0.0261, + "step": 10164 + }, + { + "epoch": 0.2, + "learning_rate": 1.6071997203992077e-07, + "loss": 0.0586, + "step": 10165 + }, + { + "epoch": 0.2, + "learning_rate": 1.6071608869558464e-07, + "loss": 0.0104, + "step": 10166 + }, + { + "epoch": 0.2, + "learning_rate": 1.607122053512485e-07, + "loss": 0.0039, + "step": 10167 + }, + { + "epoch": 0.2, + "learning_rate": 1.6070832200691236e-07, + "loss": 0.0027, + "step": 10168 + }, + { + "epoch": 0.2, + "learning_rate": 1.607044386625762e-07, + "loss": 0.046, + "step": 10169 + }, + { + "epoch": 0.2, + "learning_rate": 1.6070055531824008e-07, + "loss": 0.0417, + "step": 10170 + }, + { + "epoch": 0.2, + "learning_rate": 1.606966719739039e-07, + "loss": 0.012, + "step": 10171 + }, + { + "epoch": 0.2, + "learning_rate": 1.6069278862956777e-07, + "loss": 0.0055, + "step": 10172 + }, + { + "epoch": 0.2, + "learning_rate": 1.606889052852316e-07, + "loss": 0.0027, + "step": 10173 + }, + { + "epoch": 0.2, + "learning_rate": 1.6068502194089548e-07, + "loss": 0.0039, + "step": 10174 + }, + { + "epoch": 0.2, + "learning_rate": 1.6068113859655933e-07, + "loss": 0.003, + "step": 10175 + }, + { + "epoch": 0.2, + "learning_rate": 1.606772552522232e-07, + "loss": 0.0028, + "step": 10176 + }, + { + "epoch": 0.2, + "learning_rate": 1.6067337190788704e-07, + "loss": 0.1325, + "step": 10177 + }, + { + "epoch": 0.2, + "learning_rate": 1.6066948856355092e-07, + "loss": 0.0028, + "step": 10178 + }, + { + "epoch": 0.2, + "learning_rate": 1.6066560521921476e-07, + "loss": 0.0026, + "step": 10179 + }, + { + "epoch": 0.2, + "learning_rate": 1.6066172187487863e-07, + "loss": 0.004, + "step": 10180 + }, + { + "epoch": 0.2, + "learning_rate": 1.6065783853054248e-07, + "loss": 0.0081, + "step": 10181 + }, + { + "epoch": 0.2, + "learning_rate": 1.6065395518620635e-07, + "loss": 0.0182, + "step": 10182 + }, + { + "epoch": 0.2, + "learning_rate": 1.606500718418702e-07, + "loss": 0.0083, + "step": 10183 + }, + { + "epoch": 0.2, + "learning_rate": 1.6064618849753407e-07, + "loss": 0.818, + "step": 10184 + }, + { + "epoch": 0.2, + "learning_rate": 1.606423051531979e-07, + "loss": 0.0061, + "step": 10185 + }, + { + "epoch": 0.2, + "learning_rate": 1.6063842180886178e-07, + "loss": 0.5577, + "step": 10186 + }, + { + "epoch": 0.2, + "learning_rate": 1.6063453846452563e-07, + "loss": 1.1387, + "step": 10187 + }, + { + "epoch": 0.2, + "learning_rate": 1.606306551201895e-07, + "loss": 0.0026, + "step": 10188 + }, + { + "epoch": 0.2, + "learning_rate": 1.6062677177585334e-07, + "loss": 0.0059, + "step": 10189 + }, + { + "epoch": 0.2, + "learning_rate": 1.6062288843151722e-07, + "loss": 0.0033, + "step": 10190 + }, + { + "epoch": 0.2, + "learning_rate": 1.6061900508718106e-07, + "loss": 0.0039, + "step": 10191 + }, + { + "epoch": 0.2, + "learning_rate": 1.6061512174284493e-07, + "loss": 0.0032, + "step": 10192 + }, + { + "epoch": 0.2, + "learning_rate": 1.6061123839850878e-07, + "loss": 0.0024, + "step": 10193 + }, + { + "epoch": 0.2, + "learning_rate": 1.6060735505417265e-07, + "loss": 0.0028, + "step": 10194 + }, + { + "epoch": 0.2, + "learning_rate": 1.606034717098365e-07, + "loss": 0.005, + "step": 10195 + }, + { + "epoch": 0.2, + "learning_rate": 1.6059958836550036e-07, + "loss": 0.0458, + "step": 10196 + }, + { + "epoch": 0.2, + "learning_rate": 1.605957050211642e-07, + "loss": 0.0037, + "step": 10197 + }, + { + "epoch": 0.2, + "learning_rate": 1.6059182167682808e-07, + "loss": 0.0054, + "step": 10198 + }, + { + "epoch": 0.2, + "learning_rate": 1.6058793833249193e-07, + "loss": 0.0027, + "step": 10199 + }, + { + "epoch": 0.2, + "learning_rate": 1.605840549881558e-07, + "loss": 0.4902, + "step": 10200 + }, + { + "epoch": 0.2, + "learning_rate": 1.6058017164381964e-07, + "loss": 0.2592, + "step": 10201 + }, + { + "epoch": 0.2, + "learning_rate": 1.6057628829948351e-07, + "loss": 0.0034, + "step": 10202 + }, + { + "epoch": 0.2, + "learning_rate": 1.6057240495514736e-07, + "loss": 0.0319, + "step": 10203 + }, + { + "epoch": 0.2, + "learning_rate": 1.6056852161081123e-07, + "loss": 0.4336, + "step": 10204 + }, + { + "epoch": 0.2, + "learning_rate": 1.6056463826647508e-07, + "loss": 0.1959, + "step": 10205 + }, + { + "epoch": 0.2, + "learning_rate": 1.6056075492213895e-07, + "loss": 0.1301, + "step": 10206 + }, + { + "epoch": 0.2, + "learning_rate": 1.605568715778028e-07, + "loss": 0.0033, + "step": 10207 + }, + { + "epoch": 0.2, + "learning_rate": 1.6055298823346666e-07, + "loss": 0.0023, + "step": 10208 + }, + { + "epoch": 0.2, + "learning_rate": 1.605491048891305e-07, + "loss": 0.0044, + "step": 10209 + }, + { + "epoch": 0.2, + "learning_rate": 1.6054522154479438e-07, + "loss": 0.0028, + "step": 10210 + }, + { + "epoch": 0.2, + "learning_rate": 1.6054133820045822e-07, + "loss": 0.0036, + "step": 10211 + }, + { + "epoch": 0.2, + "learning_rate": 1.605374548561221e-07, + "loss": 0.0049, + "step": 10212 + }, + { + "epoch": 0.2, + "learning_rate": 1.6053357151178594e-07, + "loss": 0.0034, + "step": 10213 + }, + { + "epoch": 0.2, + "learning_rate": 1.605296881674498e-07, + "loss": 0.2999, + "step": 10214 + }, + { + "epoch": 0.2, + "learning_rate": 1.6052580482311366e-07, + "loss": 0.0045, + "step": 10215 + }, + { + "epoch": 0.2, + "learning_rate": 1.6052192147877753e-07, + "loss": 0.5056, + "step": 10216 + }, + { + "epoch": 0.2, + "learning_rate": 1.6051803813444137e-07, + "loss": 0.0213, + "step": 10217 + }, + { + "epoch": 0.2, + "learning_rate": 1.6051415479010525e-07, + "loss": 0.2911, + "step": 10218 + }, + { + "epoch": 0.2, + "learning_rate": 1.605102714457691e-07, + "loss": 0.0025, + "step": 10219 + }, + { + "epoch": 0.2, + "learning_rate": 1.6050638810143296e-07, + "loss": 0.0038, + "step": 10220 + }, + { + "epoch": 0.2, + "learning_rate": 1.605025047570968e-07, + "loss": 0.003, + "step": 10221 + }, + { + "epoch": 0.2, + "learning_rate": 1.6049862141276068e-07, + "loss": 0.0026, + "step": 10222 + }, + { + "epoch": 0.2, + "learning_rate": 1.6049473806842452e-07, + "loss": 0.0035, + "step": 10223 + }, + { + "epoch": 0.2, + "learning_rate": 1.604908547240884e-07, + "loss": 0.003, + "step": 10224 + }, + { + "epoch": 0.2, + "learning_rate": 1.6048697137975224e-07, + "loss": 0.7929, + "step": 10225 + }, + { + "epoch": 0.2, + "learning_rate": 1.604830880354161e-07, + "loss": 0.0025, + "step": 10226 + }, + { + "epoch": 0.2, + "learning_rate": 1.6047920469107996e-07, + "loss": 0.004, + "step": 10227 + }, + { + "epoch": 0.2, + "learning_rate": 1.6047532134674383e-07, + "loss": 0.017, + "step": 10228 + }, + { + "epoch": 0.2, + "learning_rate": 1.6047143800240765e-07, + "loss": 0.0031, + "step": 10229 + }, + { + "epoch": 0.2, + "learning_rate": 1.6046755465807152e-07, + "loss": 0.0782, + "step": 10230 + }, + { + "epoch": 0.2, + "learning_rate": 1.6046367131373536e-07, + "loss": 0.04, + "step": 10231 + }, + { + "epoch": 0.2, + "learning_rate": 1.6045978796939923e-07, + "loss": 0.0056, + "step": 10232 + }, + { + "epoch": 0.2, + "learning_rate": 1.6045590462506308e-07, + "loss": 0.0385, + "step": 10233 + }, + { + "epoch": 0.2, + "learning_rate": 1.6045202128072695e-07, + "loss": 0.0047, + "step": 10234 + }, + { + "epoch": 0.2, + "learning_rate": 1.604481379363908e-07, + "loss": 0.8191, + "step": 10235 + }, + { + "epoch": 0.2, + "learning_rate": 1.6044425459205467e-07, + "loss": 0.0281, + "step": 10236 + }, + { + "epoch": 0.2, + "learning_rate": 1.604403712477185e-07, + "loss": 0.0025, + "step": 10237 + }, + { + "epoch": 0.2, + "learning_rate": 1.6043648790338238e-07, + "loss": 0.0024, + "step": 10238 + }, + { + "epoch": 0.2, + "learning_rate": 1.6043260455904623e-07, + "loss": 0.0031, + "step": 10239 + }, + { + "epoch": 0.2, + "learning_rate": 1.604287212147101e-07, + "loss": 0.0022, + "step": 10240 + }, + { + "epoch": 0.2, + "learning_rate": 1.6042483787037395e-07, + "loss": 0.0093, + "step": 10241 + }, + { + "epoch": 0.2, + "learning_rate": 1.6042095452603782e-07, + "loss": 0.0035, + "step": 10242 + }, + { + "epoch": 0.2, + "learning_rate": 1.6041707118170166e-07, + "loss": 0.0057, + "step": 10243 + }, + { + "epoch": 0.2, + "learning_rate": 1.6041318783736553e-07, + "loss": 0.0039, + "step": 10244 + }, + { + "epoch": 0.2, + "learning_rate": 1.6040930449302938e-07, + "loss": 0.0044, + "step": 10245 + }, + { + "epoch": 0.2, + "learning_rate": 1.6040542114869325e-07, + "loss": 0.0027, + "step": 10246 + }, + { + "epoch": 0.2, + "learning_rate": 1.604015378043571e-07, + "loss": 0.0045, + "step": 10247 + }, + { + "epoch": 0.2, + "learning_rate": 1.6039765446002097e-07, + "loss": 0.0026, + "step": 10248 + }, + { + "epoch": 0.2, + "learning_rate": 1.603937711156848e-07, + "loss": 0.0026, + "step": 10249 + }, + { + "epoch": 0.2, + "learning_rate": 1.6038988777134868e-07, + "loss": 0.0066, + "step": 10250 + }, + { + "epoch": 0.2, + "learning_rate": 1.6038600442701253e-07, + "loss": 0.0029, + "step": 10251 + }, + { + "epoch": 0.2, + "learning_rate": 1.603821210826764e-07, + "loss": 0.4145, + "step": 10252 + }, + { + "epoch": 0.2, + "learning_rate": 1.6037823773834024e-07, + "loss": 0.0026, + "step": 10253 + }, + { + "epoch": 0.2, + "learning_rate": 1.6037435439400412e-07, + "loss": 0.2838, + "step": 10254 + }, + { + "epoch": 0.2, + "learning_rate": 1.6037047104966796e-07, + "loss": 0.0031, + "step": 10255 + }, + { + "epoch": 0.2, + "learning_rate": 1.6036658770533183e-07, + "loss": 0.0023, + "step": 10256 + }, + { + "epoch": 0.2, + "learning_rate": 1.6036270436099568e-07, + "loss": 0.0023, + "step": 10257 + }, + { + "epoch": 0.2, + "learning_rate": 1.6035882101665955e-07, + "loss": 0.0161, + "step": 10258 + }, + { + "epoch": 0.2, + "learning_rate": 1.603549376723234e-07, + "loss": 0.0026, + "step": 10259 + }, + { + "epoch": 0.2, + "learning_rate": 1.6035105432798727e-07, + "loss": 0.0038, + "step": 10260 + }, + { + "epoch": 0.2, + "learning_rate": 1.603471709836511e-07, + "loss": 0.0024, + "step": 10261 + }, + { + "epoch": 0.2, + "learning_rate": 1.6034328763931498e-07, + "loss": 0.0031, + "step": 10262 + }, + { + "epoch": 0.2, + "learning_rate": 1.6033940429497883e-07, + "loss": 0.0031, + "step": 10263 + }, + { + "epoch": 0.2, + "learning_rate": 1.603355209506427e-07, + "loss": 0.0139, + "step": 10264 + }, + { + "epoch": 0.2, + "learning_rate": 1.6033163760630654e-07, + "loss": 0.0024, + "step": 10265 + }, + { + "epoch": 0.2, + "learning_rate": 1.6032775426197042e-07, + "loss": 0.0025, + "step": 10266 + }, + { + "epoch": 0.2, + "learning_rate": 1.6032387091763426e-07, + "loss": 0.0025, + "step": 10267 + }, + { + "epoch": 0.2, + "learning_rate": 1.6031998757329813e-07, + "loss": 0.0039, + "step": 10268 + }, + { + "epoch": 0.2, + "learning_rate": 1.6031610422896198e-07, + "loss": 0.0127, + "step": 10269 + }, + { + "epoch": 0.2, + "learning_rate": 1.6031222088462585e-07, + "loss": 0.0292, + "step": 10270 + }, + { + "epoch": 0.2, + "learning_rate": 1.603083375402897e-07, + "loss": 0.0028, + "step": 10271 + }, + { + "epoch": 0.2, + "learning_rate": 1.6030445419595356e-07, + "loss": 0.1263, + "step": 10272 + }, + { + "epoch": 0.2, + "learning_rate": 1.603005708516174e-07, + "loss": 0.005, + "step": 10273 + }, + { + "epoch": 0.2, + "learning_rate": 1.6029668750728128e-07, + "loss": 0.0027, + "step": 10274 + }, + { + "epoch": 0.2, + "learning_rate": 1.6029280416294513e-07, + "loss": 0.0028, + "step": 10275 + }, + { + "epoch": 0.2, + "learning_rate": 1.60288920818609e-07, + "loss": 0.0027, + "step": 10276 + }, + { + "epoch": 0.2, + "learning_rate": 1.6028503747427284e-07, + "loss": 0.3598, + "step": 10277 + }, + { + "epoch": 0.2, + "learning_rate": 1.6028115412993671e-07, + "loss": 0.4251, + "step": 10278 + }, + { + "epoch": 0.2, + "learning_rate": 1.6027727078560056e-07, + "loss": 0.525, + "step": 10279 + }, + { + "epoch": 0.2, + "learning_rate": 1.6027338744126443e-07, + "loss": 0.1358, + "step": 10280 + }, + { + "epoch": 0.2, + "learning_rate": 1.6026950409692828e-07, + "loss": 0.8001, + "step": 10281 + }, + { + "epoch": 0.2, + "learning_rate": 1.6026562075259215e-07, + "loss": 0.6008, + "step": 10282 + }, + { + "epoch": 0.2, + "learning_rate": 1.60261737408256e-07, + "loss": 0.003, + "step": 10283 + }, + { + "epoch": 0.2, + "learning_rate": 1.6025785406391986e-07, + "loss": 0.6361, + "step": 10284 + }, + { + "epoch": 0.2, + "learning_rate": 1.602539707195837e-07, + "loss": 0.015, + "step": 10285 + }, + { + "epoch": 0.2, + "learning_rate": 1.6025008737524755e-07, + "loss": 0.0198, + "step": 10286 + }, + { + "epoch": 0.2, + "learning_rate": 1.602462040309114e-07, + "loss": 0.0025, + "step": 10287 + }, + { + "epoch": 0.2, + "learning_rate": 1.6024232068657527e-07, + "loss": 0.004, + "step": 10288 + }, + { + "epoch": 0.2, + "learning_rate": 1.6023843734223912e-07, + "loss": 0.003, + "step": 10289 + }, + { + "epoch": 0.2, + "learning_rate": 1.6023455399790299e-07, + "loss": 0.0263, + "step": 10290 + }, + { + "epoch": 0.2, + "learning_rate": 1.6023067065356683e-07, + "loss": 0.0032, + "step": 10291 + }, + { + "epoch": 0.2, + "learning_rate": 1.602267873092307e-07, + "loss": 0.0032, + "step": 10292 + }, + { + "epoch": 0.2, + "learning_rate": 1.6022290396489455e-07, + "loss": 0.0029, + "step": 10293 + }, + { + "epoch": 0.2, + "learning_rate": 1.6021902062055842e-07, + "loss": 0.3577, + "step": 10294 + }, + { + "epoch": 0.2, + "learning_rate": 1.6021513727622226e-07, + "loss": 0.0036, + "step": 10295 + }, + { + "epoch": 0.2, + "learning_rate": 1.6021125393188614e-07, + "loss": 0.1294, + "step": 10296 + }, + { + "epoch": 0.2, + "learning_rate": 1.6020737058754998e-07, + "loss": 0.0027, + "step": 10297 + }, + { + "epoch": 0.2, + "learning_rate": 1.6020348724321385e-07, + "loss": 0.0026, + "step": 10298 + }, + { + "epoch": 0.2, + "learning_rate": 1.601996038988777e-07, + "loss": 0.8322, + "step": 10299 + }, + { + "epoch": 0.2, + "learning_rate": 1.6019572055454157e-07, + "loss": 0.0035, + "step": 10300 + }, + { + "epoch": 0.2, + "learning_rate": 1.6019183721020541e-07, + "loss": 0.0039, + "step": 10301 + }, + { + "epoch": 0.2, + "learning_rate": 1.6018795386586929e-07, + "loss": 0.0039, + "step": 10302 + }, + { + "epoch": 0.2, + "learning_rate": 1.6018407052153313e-07, + "loss": 0.0075, + "step": 10303 + }, + { + "epoch": 0.2, + "learning_rate": 1.60180187177197e-07, + "loss": 0.0066, + "step": 10304 + }, + { + "epoch": 0.2, + "learning_rate": 1.6017630383286085e-07, + "loss": 0.3046, + "step": 10305 + }, + { + "epoch": 0.2, + "learning_rate": 1.6017242048852472e-07, + "loss": 0.0029, + "step": 10306 + }, + { + "epoch": 0.2, + "learning_rate": 1.6016853714418856e-07, + "loss": 0.0036, + "step": 10307 + }, + { + "epoch": 0.2, + "learning_rate": 1.6016465379985243e-07, + "loss": 0.6599, + "step": 10308 + }, + { + "epoch": 0.2, + "learning_rate": 1.6016077045551628e-07, + "loss": 0.0037, + "step": 10309 + }, + { + "epoch": 0.2, + "learning_rate": 1.6015688711118015e-07, + "loss": 0.0023, + "step": 10310 + }, + { + "epoch": 0.2, + "learning_rate": 1.60153003766844e-07, + "loss": 0.6485, + "step": 10311 + }, + { + "epoch": 0.2, + "learning_rate": 1.6014912042250787e-07, + "loss": 0.003, + "step": 10312 + }, + { + "epoch": 0.2, + "learning_rate": 1.601452370781717e-07, + "loss": 0.0223, + "step": 10313 + }, + { + "epoch": 0.2, + "learning_rate": 1.6014135373383558e-07, + "loss": 0.0026, + "step": 10314 + }, + { + "epoch": 0.2, + "learning_rate": 1.6013747038949943e-07, + "loss": 0.0387, + "step": 10315 + }, + { + "epoch": 0.2, + "learning_rate": 1.6013358704516327e-07, + "loss": 0.0022, + "step": 10316 + }, + { + "epoch": 0.2, + "learning_rate": 1.6012970370082715e-07, + "loss": 0.0053, + "step": 10317 + }, + { + "epoch": 0.2, + "learning_rate": 1.60125820356491e-07, + "loss": 1.0585, + "step": 10318 + }, + { + "epoch": 0.2, + "learning_rate": 1.6012193701215486e-07, + "loss": 0.0032, + "step": 10319 + }, + { + "epoch": 0.2, + "learning_rate": 1.601180536678187e-07, + "loss": 0.0287, + "step": 10320 + }, + { + "epoch": 0.2, + "learning_rate": 1.6011417032348258e-07, + "loss": 0.0067, + "step": 10321 + }, + { + "epoch": 0.2, + "learning_rate": 1.6011028697914642e-07, + "loss": 0.0184, + "step": 10322 + }, + { + "epoch": 0.2, + "learning_rate": 1.601064036348103e-07, + "loss": 0.0037, + "step": 10323 + }, + { + "epoch": 0.2, + "learning_rate": 1.6010252029047414e-07, + "loss": 0.0041, + "step": 10324 + }, + { + "epoch": 0.2, + "learning_rate": 1.60098636946138e-07, + "loss": 0.0048, + "step": 10325 + }, + { + "epoch": 0.2, + "learning_rate": 1.6009475360180186e-07, + "loss": 0.0394, + "step": 10326 + }, + { + "epoch": 0.2, + "learning_rate": 1.6009087025746573e-07, + "loss": 0.0047, + "step": 10327 + }, + { + "epoch": 0.2, + "learning_rate": 1.6008698691312957e-07, + "loss": 0.0026, + "step": 10328 + }, + { + "epoch": 0.2, + "learning_rate": 1.6008310356879344e-07, + "loss": 0.0456, + "step": 10329 + }, + { + "epoch": 0.2, + "learning_rate": 1.600792202244573e-07, + "loss": 0.0033, + "step": 10330 + }, + { + "epoch": 0.2, + "learning_rate": 1.6007533688012116e-07, + "loss": 0.003, + "step": 10331 + }, + { + "epoch": 0.2, + "learning_rate": 1.60071453535785e-07, + "loss": 0.8175, + "step": 10332 + }, + { + "epoch": 0.2, + "learning_rate": 1.6006757019144888e-07, + "loss": 0.0033, + "step": 10333 + }, + { + "epoch": 0.2, + "learning_rate": 1.6006368684711272e-07, + "loss": 0.9631, + "step": 10334 + }, + { + "epoch": 0.2, + "learning_rate": 1.600598035027766e-07, + "loss": 0.0032, + "step": 10335 + }, + { + "epoch": 0.2, + "learning_rate": 1.6005592015844044e-07, + "loss": 0.0042, + "step": 10336 + }, + { + "epoch": 0.2, + "learning_rate": 1.600520368141043e-07, + "loss": 0.1222, + "step": 10337 + }, + { + "epoch": 0.2, + "learning_rate": 1.6004815346976816e-07, + "loss": 0.0031, + "step": 10338 + }, + { + "epoch": 0.2, + "learning_rate": 1.6004427012543203e-07, + "loss": 0.0023, + "step": 10339 + }, + { + "epoch": 0.2, + "learning_rate": 1.6004038678109587e-07, + "loss": 0.0242, + "step": 10340 + }, + { + "epoch": 0.2, + "learning_rate": 1.6003650343675974e-07, + "loss": 0.0027, + "step": 10341 + }, + { + "epoch": 0.2, + "learning_rate": 1.600326200924236e-07, + "loss": 0.0063, + "step": 10342 + }, + { + "epoch": 0.2, + "learning_rate": 1.6002873674808746e-07, + "loss": 0.0056, + "step": 10343 + }, + { + "epoch": 0.2, + "learning_rate": 1.600248534037513e-07, + "loss": 0.002, + "step": 10344 + }, + { + "epoch": 0.2, + "learning_rate": 1.6002097005941515e-07, + "loss": 0.0658, + "step": 10345 + }, + { + "epoch": 0.2, + "learning_rate": 1.60017086715079e-07, + "loss": 0.0558, + "step": 10346 + }, + { + "epoch": 0.2, + "learning_rate": 1.6001320337074287e-07, + "loss": 0.7246, + "step": 10347 + }, + { + "epoch": 0.2, + "learning_rate": 1.600093200264067e-07, + "loss": 0.3392, + "step": 10348 + }, + { + "epoch": 0.2, + "learning_rate": 1.6000543668207058e-07, + "loss": 0.0979, + "step": 10349 + }, + { + "epoch": 0.2, + "learning_rate": 1.6000155333773443e-07, + "loss": 0.0372, + "step": 10350 + }, + { + "epoch": 0.2, + "learning_rate": 1.599976699933983e-07, + "loss": 0.0037, + "step": 10351 + }, + { + "epoch": 0.2, + "learning_rate": 1.5999378664906214e-07, + "loss": 0.4228, + "step": 10352 + }, + { + "epoch": 0.2, + "learning_rate": 1.5998990330472602e-07, + "loss": 0.0024, + "step": 10353 + }, + { + "epoch": 0.2, + "learning_rate": 1.5998601996038986e-07, + "loss": 0.0093, + "step": 10354 + }, + { + "epoch": 0.2, + "learning_rate": 1.5998213661605373e-07, + "loss": 0.0048, + "step": 10355 + }, + { + "epoch": 0.2, + "learning_rate": 1.5997825327171758e-07, + "loss": 0.0031, + "step": 10356 + }, + { + "epoch": 0.2, + "learning_rate": 1.5997436992738145e-07, + "loss": 0.0029, + "step": 10357 + }, + { + "epoch": 0.2, + "learning_rate": 1.599704865830453e-07, + "loss": 0.1168, + "step": 10358 + }, + { + "epoch": 0.2, + "learning_rate": 1.5996660323870917e-07, + "loss": 0.0032, + "step": 10359 + }, + { + "epoch": 0.2, + "learning_rate": 1.59962719894373e-07, + "loss": 0.0038, + "step": 10360 + }, + { + "epoch": 0.2, + "learning_rate": 1.5995883655003688e-07, + "loss": 0.6441, + "step": 10361 + }, + { + "epoch": 0.2, + "learning_rate": 1.5995495320570073e-07, + "loss": 0.0306, + "step": 10362 + }, + { + "epoch": 0.2, + "learning_rate": 1.599510698613646e-07, + "loss": 0.0077, + "step": 10363 + }, + { + "epoch": 0.2, + "learning_rate": 1.5994718651702844e-07, + "loss": 0.0231, + "step": 10364 + }, + { + "epoch": 0.2, + "learning_rate": 1.5994330317269232e-07, + "loss": 0.0183, + "step": 10365 + }, + { + "epoch": 0.2, + "learning_rate": 1.5993941982835616e-07, + "loss": 0.4825, + "step": 10366 + }, + { + "epoch": 0.2, + "learning_rate": 1.5993553648402003e-07, + "loss": 0.0033, + "step": 10367 + }, + { + "epoch": 0.2, + "learning_rate": 1.5993165313968388e-07, + "loss": 0.0037, + "step": 10368 + }, + { + "epoch": 0.2, + "learning_rate": 1.5992776979534775e-07, + "loss": 0.923, + "step": 10369 + }, + { + "epoch": 0.2, + "learning_rate": 1.599238864510116e-07, + "loss": 0.003, + "step": 10370 + }, + { + "epoch": 0.2, + "learning_rate": 1.5992000310667546e-07, + "loss": 0.0025, + "step": 10371 + }, + { + "epoch": 0.2, + "learning_rate": 1.599161197623393e-07, + "loss": 0.36, + "step": 10372 + }, + { + "epoch": 0.2, + "learning_rate": 1.5991223641800318e-07, + "loss": 0.0029, + "step": 10373 + }, + { + "epoch": 0.2, + "learning_rate": 1.5990835307366703e-07, + "loss": 0.0027, + "step": 10374 + }, + { + "epoch": 0.2, + "learning_rate": 1.599044697293309e-07, + "loss": 0.0154, + "step": 10375 + }, + { + "epoch": 0.2, + "learning_rate": 1.5990058638499474e-07, + "loss": 0.0084, + "step": 10376 + }, + { + "epoch": 0.2, + "learning_rate": 1.5989670304065861e-07, + "loss": 0.0027, + "step": 10377 + }, + { + "epoch": 0.2, + "learning_rate": 1.5989281969632246e-07, + "loss": 0.0027, + "step": 10378 + }, + { + "epoch": 0.2, + "learning_rate": 1.5988893635198633e-07, + "loss": 0.0039, + "step": 10379 + }, + { + "epoch": 0.2, + "learning_rate": 1.5988505300765018e-07, + "loss": 0.0026, + "step": 10380 + }, + { + "epoch": 0.2, + "learning_rate": 1.5988116966331405e-07, + "loss": 0.0051, + "step": 10381 + }, + { + "epoch": 0.2, + "learning_rate": 1.598772863189779e-07, + "loss": 0.0026, + "step": 10382 + }, + { + "epoch": 0.2, + "learning_rate": 1.5987340297464176e-07, + "loss": 0.0027, + "step": 10383 + }, + { + "epoch": 0.2, + "learning_rate": 1.598695196303056e-07, + "loss": 0.0035, + "step": 10384 + }, + { + "epoch": 0.2, + "learning_rate": 1.5986563628596948e-07, + "loss": 0.0102, + "step": 10385 + }, + { + "epoch": 0.2, + "learning_rate": 1.5986175294163333e-07, + "loss": 0.0032, + "step": 10386 + }, + { + "epoch": 0.2, + "learning_rate": 1.598578695972972e-07, + "loss": 0.0045, + "step": 10387 + }, + { + "epoch": 0.2, + "learning_rate": 1.5985398625296104e-07, + "loss": 0.0022, + "step": 10388 + }, + { + "epoch": 0.2, + "learning_rate": 1.598501029086249e-07, + "loss": 0.0024, + "step": 10389 + }, + { + "epoch": 0.2, + "learning_rate": 1.5984621956428876e-07, + "loss": 0.0028, + "step": 10390 + }, + { + "epoch": 0.2, + "learning_rate": 1.5984233621995263e-07, + "loss": 0.0041, + "step": 10391 + }, + { + "epoch": 0.2, + "learning_rate": 1.5983845287561647e-07, + "loss": 0.003, + "step": 10392 + }, + { + "epoch": 0.2, + "learning_rate": 1.5983456953128035e-07, + "loss": 0.0037, + "step": 10393 + }, + { + "epoch": 0.2, + "learning_rate": 1.598306861869442e-07, + "loss": 0.1679, + "step": 10394 + }, + { + "epoch": 0.2, + "learning_rate": 1.5982680284260806e-07, + "loss": 0.0037, + "step": 10395 + }, + { + "epoch": 0.2, + "learning_rate": 1.598229194982719e-07, + "loss": 0.0547, + "step": 10396 + }, + { + "epoch": 0.2, + "learning_rate": 1.5981903615393578e-07, + "loss": 0.1493, + "step": 10397 + }, + { + "epoch": 0.2, + "learning_rate": 1.5981515280959962e-07, + "loss": 0.0046, + "step": 10398 + }, + { + "epoch": 0.2, + "learning_rate": 1.598112694652635e-07, + "loss": 0.3869, + "step": 10399 + }, + { + "epoch": 0.2, + "learning_rate": 1.5980738612092734e-07, + "loss": 0.0021, + "step": 10400 + }, + { + "epoch": 0.2, + "learning_rate": 1.598035027765912e-07, + "loss": 0.3492, + "step": 10401 + }, + { + "epoch": 0.2, + "learning_rate": 1.5979961943225506e-07, + "loss": 0.0048, + "step": 10402 + }, + { + "epoch": 0.2, + "learning_rate": 1.597957360879189e-07, + "loss": 0.0022, + "step": 10403 + }, + { + "epoch": 0.2, + "learning_rate": 1.5979185274358275e-07, + "loss": 0.2041, + "step": 10404 + }, + { + "epoch": 0.2, + "learning_rate": 1.5978796939924662e-07, + "loss": 0.0399, + "step": 10405 + }, + { + "epoch": 0.2, + "learning_rate": 1.5978408605491046e-07, + "loss": 0.0024, + "step": 10406 + }, + { + "epoch": 0.2, + "learning_rate": 1.5978020271057433e-07, + "loss": 0.0031, + "step": 10407 + }, + { + "epoch": 0.2, + "learning_rate": 1.5977631936623818e-07, + "loss": 0.2729, + "step": 10408 + }, + { + "epoch": 0.2, + "learning_rate": 1.5977243602190205e-07, + "loss": 0.0028, + "step": 10409 + }, + { + "epoch": 0.2, + "learning_rate": 1.597685526775659e-07, + "loss": 0.0057, + "step": 10410 + }, + { + "epoch": 0.2, + "learning_rate": 1.5976466933322977e-07, + "loss": 0.0035, + "step": 10411 + }, + { + "epoch": 0.2, + "learning_rate": 1.597607859888936e-07, + "loss": 0.008, + "step": 10412 + }, + { + "epoch": 0.2, + "learning_rate": 1.5975690264455748e-07, + "loss": 0.5966, + "step": 10413 + }, + { + "epoch": 0.2, + "learning_rate": 1.5975301930022133e-07, + "loss": 0.0029, + "step": 10414 + }, + { + "epoch": 0.2, + "learning_rate": 1.597491359558852e-07, + "loss": 0.621, + "step": 10415 + }, + { + "epoch": 0.2, + "learning_rate": 1.5974525261154905e-07, + "loss": 0.0032, + "step": 10416 + }, + { + "epoch": 0.2, + "learning_rate": 1.5974136926721292e-07, + "loss": 0.0024, + "step": 10417 + }, + { + "epoch": 0.2, + "learning_rate": 1.5973748592287676e-07, + "loss": 0.0035, + "step": 10418 + }, + { + "epoch": 0.2, + "learning_rate": 1.5973360257854063e-07, + "loss": 0.5038, + "step": 10419 + }, + { + "epoch": 0.2, + "learning_rate": 1.5972971923420448e-07, + "loss": 0.0024, + "step": 10420 + }, + { + "epoch": 0.2, + "learning_rate": 1.5972583588986835e-07, + "loss": 0.0024, + "step": 10421 + }, + { + "epoch": 0.2, + "learning_rate": 1.597219525455322e-07, + "loss": 0.0071, + "step": 10422 + }, + { + "epoch": 0.2, + "learning_rate": 1.5971806920119607e-07, + "loss": 0.0406, + "step": 10423 + }, + { + "epoch": 0.2, + "learning_rate": 1.597141858568599e-07, + "loss": 0.0029, + "step": 10424 + }, + { + "epoch": 0.2, + "learning_rate": 1.5971030251252378e-07, + "loss": 0.4216, + "step": 10425 + }, + { + "epoch": 0.2, + "learning_rate": 1.5970641916818763e-07, + "loss": 0.0029, + "step": 10426 + }, + { + "epoch": 0.2, + "learning_rate": 1.597025358238515e-07, + "loss": 0.0032, + "step": 10427 + }, + { + "epoch": 0.2, + "learning_rate": 1.5969865247951534e-07, + "loss": 0.5608, + "step": 10428 + }, + { + "epoch": 0.2, + "learning_rate": 1.5969476913517922e-07, + "loss": 0.4721, + "step": 10429 + }, + { + "epoch": 0.2, + "learning_rate": 1.5969088579084306e-07, + "loss": 0.0026, + "step": 10430 + }, + { + "epoch": 0.2, + "learning_rate": 1.5968700244650693e-07, + "loss": 0.003, + "step": 10431 + }, + { + "epoch": 0.2, + "learning_rate": 1.5968311910217078e-07, + "loss": 0.003, + "step": 10432 + }, + { + "epoch": 0.2, + "learning_rate": 1.5967923575783465e-07, + "loss": 0.0025, + "step": 10433 + }, + { + "epoch": 0.2, + "learning_rate": 1.596753524134985e-07, + "loss": 0.0304, + "step": 10434 + }, + { + "epoch": 0.2, + "learning_rate": 1.5967146906916237e-07, + "loss": 0.0027, + "step": 10435 + }, + { + "epoch": 0.2, + "learning_rate": 1.596675857248262e-07, + "loss": 0.0026, + "step": 10436 + }, + { + "epoch": 0.2, + "learning_rate": 1.5966370238049008e-07, + "loss": 0.489, + "step": 10437 + }, + { + "epoch": 0.2, + "learning_rate": 1.5965981903615393e-07, + "loss": 0.2219, + "step": 10438 + }, + { + "epoch": 0.2, + "learning_rate": 1.596559356918178e-07, + "loss": 0.247, + "step": 10439 + }, + { + "epoch": 0.2, + "learning_rate": 1.5965205234748164e-07, + "loss": 0.0021, + "step": 10440 + }, + { + "epoch": 0.2, + "learning_rate": 1.5964816900314552e-07, + "loss": 0.0047, + "step": 10441 + }, + { + "epoch": 0.2, + "learning_rate": 1.5964428565880936e-07, + "loss": 0.6343, + "step": 10442 + }, + { + "epoch": 0.2, + "learning_rate": 1.5964040231447323e-07, + "loss": 0.0036, + "step": 10443 + }, + { + "epoch": 0.2, + "learning_rate": 1.5963651897013708e-07, + "loss": 0.0401, + "step": 10444 + }, + { + "epoch": 0.2, + "learning_rate": 1.5963263562580095e-07, + "loss": 0.0024, + "step": 10445 + }, + { + "epoch": 0.2, + "learning_rate": 1.596287522814648e-07, + "loss": 0.0025, + "step": 10446 + }, + { + "epoch": 0.2, + "learning_rate": 1.5962486893712866e-07, + "loss": 0.0213, + "step": 10447 + }, + { + "epoch": 0.2, + "learning_rate": 1.596209855927925e-07, + "loss": 0.0063, + "step": 10448 + }, + { + "epoch": 0.2, + "learning_rate": 1.5961710224845638e-07, + "loss": 0.0154, + "step": 10449 + }, + { + "epoch": 0.2, + "learning_rate": 1.5961321890412023e-07, + "loss": 0.0023, + "step": 10450 + }, + { + "epoch": 0.2, + "learning_rate": 1.596093355597841e-07, + "loss": 0.003, + "step": 10451 + }, + { + "epoch": 0.2, + "learning_rate": 1.5960545221544794e-07, + "loss": 0.0043, + "step": 10452 + }, + { + "epoch": 0.2, + "learning_rate": 1.5960156887111181e-07, + "loss": 0.1434, + "step": 10453 + }, + { + "epoch": 0.2, + "learning_rate": 1.5959768552677566e-07, + "loss": 0.0023, + "step": 10454 + }, + { + "epoch": 0.2, + "learning_rate": 1.5959380218243953e-07, + "loss": 0.0711, + "step": 10455 + }, + { + "epoch": 0.2, + "learning_rate": 1.5958991883810338e-07, + "loss": 0.0033, + "step": 10456 + }, + { + "epoch": 0.2, + "learning_rate": 1.5958603549376725e-07, + "loss": 0.0025, + "step": 10457 + }, + { + "epoch": 0.2, + "learning_rate": 1.595821521494311e-07, + "loss": 0.0329, + "step": 10458 + }, + { + "epoch": 0.2, + "learning_rate": 1.5957826880509496e-07, + "loss": 0.0027, + "step": 10459 + }, + { + "epoch": 0.2, + "learning_rate": 1.595743854607588e-07, + "loss": 0.0023, + "step": 10460 + }, + { + "epoch": 0.2, + "learning_rate": 1.5957050211642265e-07, + "loss": 0.1185, + "step": 10461 + }, + { + "epoch": 0.2, + "learning_rate": 1.595666187720865e-07, + "loss": 0.2599, + "step": 10462 + }, + { + "epoch": 0.2, + "learning_rate": 1.5956273542775037e-07, + "loss": 0.0234, + "step": 10463 + }, + { + "epoch": 0.2, + "learning_rate": 1.5955885208341422e-07, + "loss": 0.5663, + "step": 10464 + }, + { + "epoch": 0.2, + "learning_rate": 1.5955496873907809e-07, + "loss": 0.0186, + "step": 10465 + }, + { + "epoch": 0.2, + "learning_rate": 1.5955108539474193e-07, + "loss": 0.003, + "step": 10466 + }, + { + "epoch": 0.2, + "learning_rate": 1.595472020504058e-07, + "loss": 0.0026, + "step": 10467 + }, + { + "epoch": 0.2, + "learning_rate": 1.5954331870606965e-07, + "loss": 0.003, + "step": 10468 + }, + { + "epoch": 0.2, + "learning_rate": 1.5953943536173352e-07, + "loss": 0.003, + "step": 10469 + }, + { + "epoch": 0.2, + "learning_rate": 1.5953555201739736e-07, + "loss": 0.0176, + "step": 10470 + }, + { + "epoch": 0.2, + "learning_rate": 1.5953166867306124e-07, + "loss": 0.7318, + "step": 10471 + }, + { + "epoch": 0.2, + "learning_rate": 1.5952778532872508e-07, + "loss": 0.0025, + "step": 10472 + }, + { + "epoch": 0.2, + "learning_rate": 1.5952390198438895e-07, + "loss": 0.9308, + "step": 10473 + }, + { + "epoch": 0.2, + "learning_rate": 1.595200186400528e-07, + "loss": 0.6667, + "step": 10474 + }, + { + "epoch": 0.2, + "learning_rate": 1.5951613529571667e-07, + "loss": 0.5631, + "step": 10475 + }, + { + "epoch": 0.2, + "learning_rate": 1.5951225195138051e-07, + "loss": 0.0022, + "step": 10476 + }, + { + "epoch": 0.2, + "learning_rate": 1.5950836860704439e-07, + "loss": 0.0073, + "step": 10477 + }, + { + "epoch": 0.2, + "learning_rate": 1.5950448526270823e-07, + "loss": 0.0054, + "step": 10478 + }, + { + "epoch": 0.2, + "learning_rate": 1.595006019183721e-07, + "loss": 0.0059, + "step": 10479 + }, + { + "epoch": 0.2, + "learning_rate": 1.5949671857403595e-07, + "loss": 0.0023, + "step": 10480 + }, + { + "epoch": 0.2, + "learning_rate": 1.5949283522969982e-07, + "loss": 0.0958, + "step": 10481 + }, + { + "epoch": 0.2, + "learning_rate": 1.5948895188536366e-07, + "loss": 0.0025, + "step": 10482 + }, + { + "epoch": 0.2, + "learning_rate": 1.5948506854102754e-07, + "loss": 0.0029, + "step": 10483 + }, + { + "epoch": 0.2, + "learning_rate": 1.5948118519669138e-07, + "loss": 0.0027, + "step": 10484 + }, + { + "epoch": 0.2, + "learning_rate": 1.5947730185235525e-07, + "loss": 0.0046, + "step": 10485 + }, + { + "epoch": 0.2, + "learning_rate": 1.594734185080191e-07, + "loss": 0.0037, + "step": 10486 + }, + { + "epoch": 0.2, + "learning_rate": 1.5946953516368297e-07, + "loss": 0.0029, + "step": 10487 + }, + { + "epoch": 0.2, + "learning_rate": 1.594656518193468e-07, + "loss": 0.0042, + "step": 10488 + }, + { + "epoch": 0.2, + "learning_rate": 1.5946176847501068e-07, + "loss": 0.0069, + "step": 10489 + }, + { + "epoch": 0.2, + "learning_rate": 1.5945788513067453e-07, + "loss": 0.2174, + "step": 10490 + }, + { + "epoch": 0.2, + "learning_rate": 1.594540017863384e-07, + "loss": 0.5594, + "step": 10491 + }, + { + "epoch": 0.2, + "learning_rate": 1.5945011844200225e-07, + "loss": 0.0216, + "step": 10492 + }, + { + "epoch": 0.2, + "learning_rate": 1.594462350976661e-07, + "loss": 0.0054, + "step": 10493 + }, + { + "epoch": 0.2, + "learning_rate": 1.5944235175332996e-07, + "loss": 0.0033, + "step": 10494 + }, + { + "epoch": 0.2, + "learning_rate": 1.594384684089938e-07, + "loss": 0.0474, + "step": 10495 + }, + { + "epoch": 0.2, + "learning_rate": 1.5943458506465768e-07, + "loss": 0.0031, + "step": 10496 + }, + { + "epoch": 0.2, + "learning_rate": 1.5943070172032152e-07, + "loss": 0.0024, + "step": 10497 + }, + { + "epoch": 0.2, + "learning_rate": 1.594268183759854e-07, + "loss": 0.0029, + "step": 10498 + }, + { + "epoch": 0.2, + "learning_rate": 1.5942293503164924e-07, + "loss": 0.0025, + "step": 10499 + }, + { + "epoch": 0.2, + "learning_rate": 1.594190516873131e-07, + "loss": 0.4274, + "step": 10500 + }, + { + "epoch": 0.2, + "learning_rate": 1.5941516834297696e-07, + "loss": 0.0024, + "step": 10501 + }, + { + "epoch": 0.2, + "learning_rate": 1.5941128499864083e-07, + "loss": 0.0029, + "step": 10502 + }, + { + "epoch": 0.2, + "learning_rate": 1.5940740165430467e-07, + "loss": 0.003, + "step": 10503 + }, + { + "epoch": 0.2, + "learning_rate": 1.5940351830996854e-07, + "loss": 0.0037, + "step": 10504 + }, + { + "epoch": 0.2, + "learning_rate": 1.593996349656324e-07, + "loss": 0.0023, + "step": 10505 + }, + { + "epoch": 0.2, + "learning_rate": 1.5939575162129626e-07, + "loss": 0.0029, + "step": 10506 + }, + { + "epoch": 0.2, + "learning_rate": 1.593918682769601e-07, + "loss": 0.0026, + "step": 10507 + }, + { + "epoch": 0.2, + "learning_rate": 1.5938798493262398e-07, + "loss": 0.0031, + "step": 10508 + }, + { + "epoch": 0.2, + "learning_rate": 1.5938410158828782e-07, + "loss": 0.0078, + "step": 10509 + }, + { + "epoch": 0.2, + "learning_rate": 1.593802182439517e-07, + "loss": 0.002, + "step": 10510 + }, + { + "epoch": 0.2, + "learning_rate": 1.5937633489961554e-07, + "loss": 0.0029, + "step": 10511 + }, + { + "epoch": 0.2, + "learning_rate": 1.593724515552794e-07, + "loss": 0.0028, + "step": 10512 + }, + { + "epoch": 0.2, + "learning_rate": 1.5936856821094326e-07, + "loss": 0.0083, + "step": 10513 + }, + { + "epoch": 0.2, + "learning_rate": 1.5936468486660713e-07, + "loss": 0.7784, + "step": 10514 + }, + { + "epoch": 0.2, + "learning_rate": 1.5936080152227097e-07, + "loss": 0.0025, + "step": 10515 + }, + { + "epoch": 0.2, + "learning_rate": 1.5935691817793484e-07, + "loss": 0.0204, + "step": 10516 + }, + { + "epoch": 0.2, + "learning_rate": 1.593530348335987e-07, + "loss": 0.0024, + "step": 10517 + }, + { + "epoch": 0.2, + "learning_rate": 1.5934915148926256e-07, + "loss": 0.003, + "step": 10518 + }, + { + "epoch": 0.2, + "learning_rate": 1.593452681449264e-07, + "loss": 0.6113, + "step": 10519 + }, + { + "epoch": 0.2, + "learning_rate": 1.5934138480059025e-07, + "loss": 0.0104, + "step": 10520 + }, + { + "epoch": 0.2, + "learning_rate": 1.5933750145625412e-07, + "loss": 0.028, + "step": 10521 + }, + { + "epoch": 0.2, + "learning_rate": 1.5933361811191797e-07, + "loss": 0.0144, + "step": 10522 + }, + { + "epoch": 0.2, + "learning_rate": 1.593297347675818e-07, + "loss": 0.0019, + "step": 10523 + }, + { + "epoch": 0.2, + "learning_rate": 1.5932585142324568e-07, + "loss": 0.0023, + "step": 10524 + }, + { + "epoch": 0.2, + "learning_rate": 1.5932196807890953e-07, + "loss": 0.0028, + "step": 10525 + }, + { + "epoch": 0.2, + "learning_rate": 1.593180847345734e-07, + "loss": 0.0025, + "step": 10526 + }, + { + "epoch": 0.2, + "learning_rate": 1.5931420139023724e-07, + "loss": 0.0039, + "step": 10527 + }, + { + "epoch": 0.2, + "learning_rate": 1.5931031804590112e-07, + "loss": 0.0035, + "step": 10528 + }, + { + "epoch": 0.2, + "learning_rate": 1.5930643470156496e-07, + "loss": 0.0117, + "step": 10529 + }, + { + "epoch": 0.2, + "learning_rate": 1.5930255135722883e-07, + "loss": 0.0033, + "step": 10530 + }, + { + "epoch": 0.2, + "learning_rate": 1.5929866801289268e-07, + "loss": 0.0024, + "step": 10531 + }, + { + "epoch": 0.2, + "learning_rate": 1.5929478466855655e-07, + "loss": 0.0237, + "step": 10532 + }, + { + "epoch": 0.2, + "learning_rate": 1.592909013242204e-07, + "loss": 0.0029, + "step": 10533 + }, + { + "epoch": 0.2, + "learning_rate": 1.5928701797988427e-07, + "loss": 0.0026, + "step": 10534 + }, + { + "epoch": 0.2, + "learning_rate": 1.592831346355481e-07, + "loss": 0.325, + "step": 10535 + }, + { + "epoch": 0.2, + "learning_rate": 1.5927925129121198e-07, + "loss": 0.0026, + "step": 10536 + }, + { + "epoch": 0.2, + "learning_rate": 1.5927536794687583e-07, + "loss": 0.0059, + "step": 10537 + }, + { + "epoch": 0.2, + "learning_rate": 1.592714846025397e-07, + "loss": 0.0031, + "step": 10538 + }, + { + "epoch": 0.2, + "learning_rate": 1.5926760125820354e-07, + "loss": 0.0027, + "step": 10539 + }, + { + "epoch": 0.2, + "learning_rate": 1.5926371791386742e-07, + "loss": 0.014, + "step": 10540 + }, + { + "epoch": 0.2, + "learning_rate": 1.5925983456953126e-07, + "loss": 0.0049, + "step": 10541 + }, + { + "epoch": 0.2, + "learning_rate": 1.5925595122519513e-07, + "loss": 0.039, + "step": 10542 + }, + { + "epoch": 0.2, + "learning_rate": 1.5925206788085898e-07, + "loss": 0.002, + "step": 10543 + }, + { + "epoch": 0.2, + "learning_rate": 1.5924818453652285e-07, + "loss": 0.0026, + "step": 10544 + }, + { + "epoch": 0.2, + "learning_rate": 1.592443011921867e-07, + "loss": 0.0111, + "step": 10545 + }, + { + "epoch": 0.2, + "learning_rate": 1.5924041784785056e-07, + "loss": 0.8764, + "step": 10546 + }, + { + "epoch": 0.2, + "learning_rate": 1.592365345035144e-07, + "loss": 0.003, + "step": 10547 + }, + { + "epoch": 0.2, + "learning_rate": 1.5923265115917828e-07, + "loss": 0.005, + "step": 10548 + }, + { + "epoch": 0.2, + "learning_rate": 1.5922876781484213e-07, + "loss": 0.0032, + "step": 10549 + }, + { + "epoch": 0.2, + "learning_rate": 1.59224884470506e-07, + "loss": 0.0043, + "step": 10550 + }, + { + "epoch": 0.2, + "learning_rate": 1.5922100112616984e-07, + "loss": 0.6082, + "step": 10551 + }, + { + "epoch": 0.2, + "learning_rate": 1.5921711778183371e-07, + "loss": 0.0057, + "step": 10552 + }, + { + "epoch": 0.2, + "learning_rate": 1.5921323443749756e-07, + "loss": 0.0019, + "step": 10553 + }, + { + "epoch": 0.2, + "learning_rate": 1.5920935109316143e-07, + "loss": 0.0019, + "step": 10554 + }, + { + "epoch": 0.2, + "learning_rate": 1.5920546774882528e-07, + "loss": 0.0022, + "step": 10555 + }, + { + "epoch": 0.2, + "learning_rate": 1.5920158440448915e-07, + "loss": 0.0026, + "step": 10556 + }, + { + "epoch": 0.2, + "learning_rate": 1.59197701060153e-07, + "loss": 0.0029, + "step": 10557 + }, + { + "epoch": 0.2, + "learning_rate": 1.5919381771581686e-07, + "loss": 0.0053, + "step": 10558 + }, + { + "epoch": 0.2, + "learning_rate": 1.591899343714807e-07, + "loss": 0.0024, + "step": 10559 + }, + { + "epoch": 0.2, + "learning_rate": 1.5918605102714458e-07, + "loss": 0.0025, + "step": 10560 + }, + { + "epoch": 0.2, + "learning_rate": 1.5918216768280843e-07, + "loss": 0.0018, + "step": 10561 + }, + { + "epoch": 0.2, + "learning_rate": 1.591782843384723e-07, + "loss": 0.0025, + "step": 10562 + }, + { + "epoch": 0.2, + "learning_rate": 1.5917440099413614e-07, + "loss": 0.0051, + "step": 10563 + }, + { + "epoch": 0.2, + "learning_rate": 1.591705176498e-07, + "loss": 0.0035, + "step": 10564 + }, + { + "epoch": 0.2, + "learning_rate": 1.5916663430546386e-07, + "loss": 0.3835, + "step": 10565 + }, + { + "epoch": 0.2, + "learning_rate": 1.5916275096112773e-07, + "loss": 0.0049, + "step": 10566 + }, + { + "epoch": 0.2, + "learning_rate": 1.5915886761679157e-07, + "loss": 0.0025, + "step": 10567 + }, + { + "epoch": 0.2, + "learning_rate": 1.5915498427245545e-07, + "loss": 0.0104, + "step": 10568 + }, + { + "epoch": 0.21, + "learning_rate": 1.591511009281193e-07, + "loss": 0.0021, + "step": 10569 + }, + { + "epoch": 0.21, + "learning_rate": 1.5914721758378316e-07, + "loss": 0.5294, + "step": 10570 + }, + { + "epoch": 0.21, + "learning_rate": 1.59143334239447e-07, + "loss": 0.0035, + "step": 10571 + }, + { + "epoch": 0.21, + "learning_rate": 1.5913945089511088e-07, + "loss": 0.0681, + "step": 10572 + }, + { + "epoch": 0.21, + "learning_rate": 1.5913556755077472e-07, + "loss": 0.6006, + "step": 10573 + }, + { + "epoch": 0.21, + "learning_rate": 1.591316842064386e-07, + "loss": 0.0021, + "step": 10574 + }, + { + "epoch": 0.21, + "learning_rate": 1.5912780086210244e-07, + "loss": 0.4172, + "step": 10575 + }, + { + "epoch": 0.21, + "learning_rate": 1.591239175177663e-07, + "loss": 0.0021, + "step": 10576 + }, + { + "epoch": 0.21, + "learning_rate": 1.5912003417343013e-07, + "loss": 0.0027, + "step": 10577 + }, + { + "epoch": 0.21, + "learning_rate": 1.59116150829094e-07, + "loss": 0.0025, + "step": 10578 + }, + { + "epoch": 0.21, + "learning_rate": 1.5911226748475785e-07, + "loss": 0.003, + "step": 10579 + }, + { + "epoch": 0.21, + "learning_rate": 1.5910838414042172e-07, + "loss": 0.0314, + "step": 10580 + }, + { + "epoch": 0.21, + "learning_rate": 1.5910450079608556e-07, + "loss": 0.0038, + "step": 10581 + }, + { + "epoch": 0.21, + "learning_rate": 1.5910061745174944e-07, + "loss": 0.0766, + "step": 10582 + }, + { + "epoch": 0.21, + "learning_rate": 1.5909673410741328e-07, + "loss": 0.0028, + "step": 10583 + }, + { + "epoch": 0.21, + "learning_rate": 1.5909285076307715e-07, + "loss": 0.0139, + "step": 10584 + }, + { + "epoch": 0.21, + "learning_rate": 1.59088967418741e-07, + "loss": 0.0025, + "step": 10585 + }, + { + "epoch": 0.21, + "learning_rate": 1.5908508407440487e-07, + "loss": 0.0029, + "step": 10586 + }, + { + "epoch": 0.21, + "learning_rate": 1.590812007300687e-07, + "loss": 0.0029, + "step": 10587 + }, + { + "epoch": 0.21, + "learning_rate": 1.5907731738573258e-07, + "loss": 0.8909, + "step": 10588 + }, + { + "epoch": 0.21, + "learning_rate": 1.5907343404139643e-07, + "loss": 0.0022, + "step": 10589 + }, + { + "epoch": 0.21, + "learning_rate": 1.590695506970603e-07, + "loss": 0.3159, + "step": 10590 + }, + { + "epoch": 0.21, + "learning_rate": 1.5906566735272415e-07, + "loss": 0.0046, + "step": 10591 + }, + { + "epoch": 0.21, + "learning_rate": 1.5906178400838802e-07, + "loss": 0.0052, + "step": 10592 + }, + { + "epoch": 0.21, + "learning_rate": 1.5905790066405186e-07, + "loss": 0.0034, + "step": 10593 + }, + { + "epoch": 0.21, + "learning_rate": 1.5905401731971573e-07, + "loss": 0.9261, + "step": 10594 + }, + { + "epoch": 0.21, + "learning_rate": 1.5905013397537958e-07, + "loss": 0.0036, + "step": 10595 + }, + { + "epoch": 0.21, + "learning_rate": 1.5904625063104345e-07, + "loss": 0.0028, + "step": 10596 + }, + { + "epoch": 0.21, + "learning_rate": 1.590423672867073e-07, + "loss": 0.4573, + "step": 10597 + }, + { + "epoch": 0.21, + "learning_rate": 1.5903848394237117e-07, + "loss": 0.0046, + "step": 10598 + }, + { + "epoch": 0.21, + "learning_rate": 1.59034600598035e-07, + "loss": 0.0035, + "step": 10599 + }, + { + "epoch": 0.21, + "learning_rate": 1.5903071725369888e-07, + "loss": 0.0029, + "step": 10600 + }, + { + "epoch": 0.21, + "learning_rate": 1.5902683390936273e-07, + "loss": 0.5205, + "step": 10601 + }, + { + "epoch": 0.21, + "learning_rate": 1.590229505650266e-07, + "loss": 0.0038, + "step": 10602 + }, + { + "epoch": 0.21, + "learning_rate": 1.5901906722069044e-07, + "loss": 0.3307, + "step": 10603 + }, + { + "epoch": 0.21, + "learning_rate": 1.5901518387635432e-07, + "loss": 0.0029, + "step": 10604 + }, + { + "epoch": 0.21, + "learning_rate": 1.5901130053201816e-07, + "loss": 0.0025, + "step": 10605 + }, + { + "epoch": 0.21, + "learning_rate": 1.5900741718768203e-07, + "loss": 0.0025, + "step": 10606 + }, + { + "epoch": 0.21, + "learning_rate": 1.5900353384334588e-07, + "loss": 0.0024, + "step": 10607 + }, + { + "epoch": 0.21, + "learning_rate": 1.5899965049900975e-07, + "loss": 0.0025, + "step": 10608 + }, + { + "epoch": 0.21, + "learning_rate": 1.589957671546736e-07, + "loss": 0.0054, + "step": 10609 + }, + { + "epoch": 0.21, + "learning_rate": 1.5899188381033747e-07, + "loss": 0.0045, + "step": 10610 + }, + { + "epoch": 0.21, + "learning_rate": 1.589880004660013e-07, + "loss": 0.0022, + "step": 10611 + }, + { + "epoch": 0.21, + "learning_rate": 1.5898411712166518e-07, + "loss": 0.5828, + "step": 10612 + }, + { + "epoch": 0.21, + "learning_rate": 1.5898023377732903e-07, + "loss": 0.788, + "step": 10613 + }, + { + "epoch": 0.21, + "learning_rate": 1.589763504329929e-07, + "loss": 0.0029, + "step": 10614 + }, + { + "epoch": 0.21, + "learning_rate": 1.5897246708865674e-07, + "loss": 0.0029, + "step": 10615 + }, + { + "epoch": 0.21, + "learning_rate": 1.5896858374432062e-07, + "loss": 0.533, + "step": 10616 + }, + { + "epoch": 0.21, + "learning_rate": 1.5896470039998446e-07, + "loss": 0.2795, + "step": 10617 + }, + { + "epoch": 0.21, + "learning_rate": 1.5896081705564833e-07, + "loss": 0.0067, + "step": 10618 + }, + { + "epoch": 0.21, + "learning_rate": 1.5895693371131218e-07, + "loss": 0.0022, + "step": 10619 + }, + { + "epoch": 0.21, + "learning_rate": 1.5895305036697605e-07, + "loss": 0.0031, + "step": 10620 + }, + { + "epoch": 0.21, + "learning_rate": 1.589491670226399e-07, + "loss": 0.1419, + "step": 10621 + }, + { + "epoch": 0.21, + "learning_rate": 1.5894528367830376e-07, + "loss": 0.0029, + "step": 10622 + }, + { + "epoch": 0.21, + "learning_rate": 1.589414003339676e-07, + "loss": 0.0034, + "step": 10623 + }, + { + "epoch": 0.21, + "learning_rate": 1.5893751698963148e-07, + "loss": 0.4442, + "step": 10624 + }, + { + "epoch": 0.21, + "learning_rate": 1.5893363364529533e-07, + "loss": 0.4976, + "step": 10625 + }, + { + "epoch": 0.21, + "learning_rate": 1.589297503009592e-07, + "loss": 0.3035, + "step": 10626 + }, + { + "epoch": 0.21, + "learning_rate": 1.5892586695662304e-07, + "loss": 0.0023, + "step": 10627 + }, + { + "epoch": 0.21, + "learning_rate": 1.5892198361228691e-07, + "loss": 0.0023, + "step": 10628 + }, + { + "epoch": 0.21, + "learning_rate": 1.5891810026795076e-07, + "loss": 0.0154, + "step": 10629 + }, + { + "epoch": 0.21, + "learning_rate": 1.5891421692361463e-07, + "loss": 0.0028, + "step": 10630 + }, + { + "epoch": 0.21, + "learning_rate": 1.5891033357927848e-07, + "loss": 0.0021, + "step": 10631 + }, + { + "epoch": 0.21, + "learning_rate": 1.5890645023494235e-07, + "loss": 0.0063, + "step": 10632 + }, + { + "epoch": 0.21, + "learning_rate": 1.589025668906062e-07, + "loss": 0.0026, + "step": 10633 + }, + { + "epoch": 0.21, + "learning_rate": 1.5889868354627006e-07, + "loss": 0.0105, + "step": 10634 + }, + { + "epoch": 0.21, + "learning_rate": 1.5889480020193388e-07, + "loss": 0.236, + "step": 10635 + }, + { + "epoch": 0.21, + "learning_rate": 1.5889091685759775e-07, + "loss": 0.3616, + "step": 10636 + }, + { + "epoch": 0.21, + "learning_rate": 1.588870335132616e-07, + "loss": 0.0027, + "step": 10637 + }, + { + "epoch": 0.21, + "learning_rate": 1.5888315016892547e-07, + "loss": 0.5995, + "step": 10638 + }, + { + "epoch": 0.21, + "learning_rate": 1.5887926682458932e-07, + "loss": 0.5922, + "step": 10639 + }, + { + "epoch": 0.21, + "learning_rate": 1.588753834802532e-07, + "loss": 0.0114, + "step": 10640 + }, + { + "epoch": 0.21, + "learning_rate": 1.5887150013591703e-07, + "loss": 0.0745, + "step": 10641 + }, + { + "epoch": 0.21, + "learning_rate": 1.588676167915809e-07, + "loss": 0.0026, + "step": 10642 + }, + { + "epoch": 0.21, + "learning_rate": 1.5886373344724475e-07, + "loss": 0.0031, + "step": 10643 + }, + { + "epoch": 0.21, + "learning_rate": 1.5885985010290862e-07, + "loss": 0.0049, + "step": 10644 + }, + { + "epoch": 0.21, + "learning_rate": 1.5885596675857246e-07, + "loss": 0.0025, + "step": 10645 + }, + { + "epoch": 0.21, + "learning_rate": 1.5885208341423634e-07, + "loss": 0.0023, + "step": 10646 + }, + { + "epoch": 0.21, + "learning_rate": 1.5884820006990018e-07, + "loss": 0.0026, + "step": 10647 + }, + { + "epoch": 0.21, + "learning_rate": 1.5884431672556405e-07, + "loss": 0.0021, + "step": 10648 + }, + { + "epoch": 0.21, + "learning_rate": 1.588404333812279e-07, + "loss": 0.0037, + "step": 10649 + }, + { + "epoch": 0.21, + "learning_rate": 1.5883655003689177e-07, + "loss": 0.004, + "step": 10650 + }, + { + "epoch": 0.21, + "learning_rate": 1.5883266669255561e-07, + "loss": 0.0025, + "step": 10651 + }, + { + "epoch": 0.21, + "learning_rate": 1.5882878334821949e-07, + "loss": 0.0028, + "step": 10652 + }, + { + "epoch": 0.21, + "learning_rate": 1.5882490000388333e-07, + "loss": 0.4326, + "step": 10653 + }, + { + "epoch": 0.21, + "learning_rate": 1.588210166595472e-07, + "loss": 0.0037, + "step": 10654 + }, + { + "epoch": 0.21, + "learning_rate": 1.5881713331521105e-07, + "loss": 0.0104, + "step": 10655 + }, + { + "epoch": 0.21, + "learning_rate": 1.5881324997087492e-07, + "loss": 0.0076, + "step": 10656 + }, + { + "epoch": 0.21, + "learning_rate": 1.5880936662653876e-07, + "loss": 0.0041, + "step": 10657 + }, + { + "epoch": 0.21, + "learning_rate": 1.5880548328220264e-07, + "loss": 0.0028, + "step": 10658 + }, + { + "epoch": 0.21, + "learning_rate": 1.5880159993786648e-07, + "loss": 0.6416, + "step": 10659 + }, + { + "epoch": 0.21, + "learning_rate": 1.5879771659353035e-07, + "loss": 0.0023, + "step": 10660 + }, + { + "epoch": 0.21, + "learning_rate": 1.587938332491942e-07, + "loss": 0.0032, + "step": 10661 + }, + { + "epoch": 0.21, + "learning_rate": 1.5878994990485807e-07, + "loss": 0.0041, + "step": 10662 + }, + { + "epoch": 0.21, + "learning_rate": 1.587860665605219e-07, + "loss": 0.2596, + "step": 10663 + }, + { + "epoch": 0.21, + "learning_rate": 1.5878218321618578e-07, + "loss": 0.0024, + "step": 10664 + }, + { + "epoch": 0.21, + "learning_rate": 1.5877829987184963e-07, + "loss": 0.0026, + "step": 10665 + }, + { + "epoch": 0.21, + "learning_rate": 1.587744165275135e-07, + "loss": 0.0043, + "step": 10666 + }, + { + "epoch": 0.21, + "learning_rate": 1.5877053318317735e-07, + "loss": 0.003, + "step": 10667 + }, + { + "epoch": 0.21, + "learning_rate": 1.5876664983884122e-07, + "loss": 0.0028, + "step": 10668 + }, + { + "epoch": 0.21, + "learning_rate": 1.5876276649450506e-07, + "loss": 0.0029, + "step": 10669 + }, + { + "epoch": 0.21, + "learning_rate": 1.587588831501689e-07, + "loss": 0.0037, + "step": 10670 + }, + { + "epoch": 0.21, + "learning_rate": 1.5875499980583278e-07, + "loss": 0.8298, + "step": 10671 + }, + { + "epoch": 0.21, + "learning_rate": 1.5875111646149662e-07, + "loss": 0.0165, + "step": 10672 + }, + { + "epoch": 0.21, + "learning_rate": 1.587472331171605e-07, + "loss": 0.5058, + "step": 10673 + }, + { + "epoch": 0.21, + "learning_rate": 1.5874334977282434e-07, + "loss": 0.0074, + "step": 10674 + }, + { + "epoch": 0.21, + "learning_rate": 1.587394664284882e-07, + "loss": 0.2163, + "step": 10675 + }, + { + "epoch": 0.21, + "learning_rate": 1.5873558308415206e-07, + "loss": 0.0033, + "step": 10676 + }, + { + "epoch": 0.21, + "learning_rate": 1.5873169973981593e-07, + "loss": 0.0047, + "step": 10677 + }, + { + "epoch": 0.21, + "learning_rate": 1.5872781639547977e-07, + "loss": 0.0281, + "step": 10678 + }, + { + "epoch": 0.21, + "learning_rate": 1.5872393305114365e-07, + "loss": 0.0155, + "step": 10679 + }, + { + "epoch": 0.21, + "learning_rate": 1.587200497068075e-07, + "loss": 0.0023, + "step": 10680 + }, + { + "epoch": 0.21, + "learning_rate": 1.5871616636247136e-07, + "loss": 0.0074, + "step": 10681 + }, + { + "epoch": 0.21, + "learning_rate": 1.587122830181352e-07, + "loss": 0.0054, + "step": 10682 + }, + { + "epoch": 0.21, + "learning_rate": 1.5870839967379908e-07, + "loss": 0.0032, + "step": 10683 + }, + { + "epoch": 0.21, + "learning_rate": 1.5870451632946292e-07, + "loss": 0.0029, + "step": 10684 + }, + { + "epoch": 0.21, + "learning_rate": 1.587006329851268e-07, + "loss": 0.0183, + "step": 10685 + }, + { + "epoch": 0.21, + "learning_rate": 1.5869674964079064e-07, + "loss": 0.005, + "step": 10686 + }, + { + "epoch": 0.21, + "learning_rate": 1.586928662964545e-07, + "loss": 0.0026, + "step": 10687 + }, + { + "epoch": 0.21, + "learning_rate": 1.5868898295211836e-07, + "loss": 0.5954, + "step": 10688 + }, + { + "epoch": 0.21, + "learning_rate": 1.5868509960778223e-07, + "loss": 0.0019, + "step": 10689 + }, + { + "epoch": 0.21, + "learning_rate": 1.5868121626344607e-07, + "loss": 0.0072, + "step": 10690 + }, + { + "epoch": 0.21, + "learning_rate": 1.5867733291910994e-07, + "loss": 0.0022, + "step": 10691 + }, + { + "epoch": 0.21, + "learning_rate": 1.586734495747738e-07, + "loss": 0.0032, + "step": 10692 + }, + { + "epoch": 0.21, + "learning_rate": 1.5866956623043763e-07, + "loss": 0.0027, + "step": 10693 + }, + { + "epoch": 0.21, + "learning_rate": 1.586656828861015e-07, + "loss": 0.0022, + "step": 10694 + }, + { + "epoch": 0.21, + "learning_rate": 1.5866179954176535e-07, + "loss": 0.831, + "step": 10695 + }, + { + "epoch": 0.21, + "learning_rate": 1.5865791619742922e-07, + "loss": 0.0023, + "step": 10696 + }, + { + "epoch": 0.21, + "learning_rate": 1.5865403285309307e-07, + "loss": 0.0022, + "step": 10697 + }, + { + "epoch": 0.21, + "learning_rate": 1.5865014950875694e-07, + "loss": 0.0027, + "step": 10698 + }, + { + "epoch": 0.21, + "learning_rate": 1.5864626616442078e-07, + "loss": 0.0067, + "step": 10699 + }, + { + "epoch": 0.21, + "learning_rate": 1.5864238282008463e-07, + "loss": 0.0312, + "step": 10700 + }, + { + "epoch": 0.21, + "learning_rate": 1.586384994757485e-07, + "loss": 0.0021, + "step": 10701 + }, + { + "epoch": 0.21, + "learning_rate": 1.5863461613141235e-07, + "loss": 0.0037, + "step": 10702 + }, + { + "epoch": 0.21, + "learning_rate": 1.5863073278707622e-07, + "loss": 0.003, + "step": 10703 + }, + { + "epoch": 0.21, + "learning_rate": 1.5862684944274006e-07, + "loss": 0.0118, + "step": 10704 + }, + { + "epoch": 0.21, + "learning_rate": 1.5862296609840393e-07, + "loss": 0.006, + "step": 10705 + }, + { + "epoch": 0.21, + "learning_rate": 1.5861908275406778e-07, + "loss": 0.0019, + "step": 10706 + }, + { + "epoch": 0.21, + "learning_rate": 1.5861519940973165e-07, + "loss": 0.0025, + "step": 10707 + }, + { + "epoch": 0.21, + "learning_rate": 1.586113160653955e-07, + "loss": 0.0023, + "step": 10708 + }, + { + "epoch": 0.21, + "learning_rate": 1.5860743272105937e-07, + "loss": 0.0034, + "step": 10709 + }, + { + "epoch": 0.21, + "learning_rate": 1.586035493767232e-07, + "loss": 0.2578, + "step": 10710 + }, + { + "epoch": 0.21, + "learning_rate": 1.5859966603238708e-07, + "loss": 0.029, + "step": 10711 + }, + { + "epoch": 0.21, + "learning_rate": 1.5859578268805093e-07, + "loss": 0.011, + "step": 10712 + }, + { + "epoch": 0.21, + "learning_rate": 1.585918993437148e-07, + "loss": 0.0033, + "step": 10713 + }, + { + "epoch": 0.21, + "learning_rate": 1.5858801599937864e-07, + "loss": 0.1483, + "step": 10714 + }, + { + "epoch": 0.21, + "learning_rate": 1.5858413265504252e-07, + "loss": 0.0076, + "step": 10715 + }, + { + "epoch": 0.21, + "learning_rate": 1.5858024931070636e-07, + "loss": 0.0027, + "step": 10716 + }, + { + "epoch": 0.21, + "learning_rate": 1.5857636596637023e-07, + "loss": 0.0028, + "step": 10717 + }, + { + "epoch": 0.21, + "learning_rate": 1.5857248262203408e-07, + "loss": 0.0023, + "step": 10718 + }, + { + "epoch": 0.21, + "learning_rate": 1.5856859927769795e-07, + "loss": 0.0022, + "step": 10719 + }, + { + "epoch": 0.21, + "learning_rate": 1.585647159333618e-07, + "loss": 0.4582, + "step": 10720 + }, + { + "epoch": 0.21, + "learning_rate": 1.5856083258902566e-07, + "loss": 0.011, + "step": 10721 + }, + { + "epoch": 0.21, + "learning_rate": 1.585569492446895e-07, + "loss": 0.0044, + "step": 10722 + }, + { + "epoch": 0.21, + "learning_rate": 1.5855306590035338e-07, + "loss": 0.3924, + "step": 10723 + }, + { + "epoch": 0.21, + "learning_rate": 1.5854918255601723e-07, + "loss": 0.3373, + "step": 10724 + }, + { + "epoch": 0.21, + "learning_rate": 1.585452992116811e-07, + "loss": 0.0024, + "step": 10725 + }, + { + "epoch": 0.21, + "learning_rate": 1.5854141586734494e-07, + "loss": 1.0438, + "step": 10726 + }, + { + "epoch": 0.21, + "learning_rate": 1.5853753252300881e-07, + "loss": 0.007, + "step": 10727 + }, + { + "epoch": 0.21, + "learning_rate": 1.5853364917867266e-07, + "loss": 0.0022, + "step": 10728 + }, + { + "epoch": 0.21, + "learning_rate": 1.5852976583433653e-07, + "loss": 0.0033, + "step": 10729 + }, + { + "epoch": 0.21, + "learning_rate": 1.5852588249000038e-07, + "loss": 0.0019, + "step": 10730 + }, + { + "epoch": 0.21, + "learning_rate": 1.5852199914566425e-07, + "loss": 0.0978, + "step": 10731 + }, + { + "epoch": 0.21, + "learning_rate": 1.585181158013281e-07, + "loss": 0.0027, + "step": 10732 + }, + { + "epoch": 0.21, + "learning_rate": 1.5851423245699196e-07, + "loss": 0.1463, + "step": 10733 + }, + { + "epoch": 0.21, + "learning_rate": 1.585103491126558e-07, + "loss": 0.0021, + "step": 10734 + }, + { + "epoch": 0.21, + "learning_rate": 1.5850646576831968e-07, + "loss": 0.0056, + "step": 10735 + }, + { + "epoch": 0.21, + "learning_rate": 1.5850258242398353e-07, + "loss": 0.0026, + "step": 10736 + }, + { + "epoch": 0.21, + "learning_rate": 1.584986990796474e-07, + "loss": 0.0027, + "step": 10737 + }, + { + "epoch": 0.21, + "learning_rate": 1.5849481573531124e-07, + "loss": 0.0661, + "step": 10738 + }, + { + "epoch": 0.21, + "learning_rate": 1.5849093239097511e-07, + "loss": 0.0017, + "step": 10739 + }, + { + "epoch": 0.21, + "learning_rate": 1.5848704904663896e-07, + "loss": 0.0047, + "step": 10740 + }, + { + "epoch": 0.21, + "learning_rate": 1.5848316570230283e-07, + "loss": 0.003, + "step": 10741 + }, + { + "epoch": 0.21, + "learning_rate": 1.5847928235796667e-07, + "loss": 0.0112, + "step": 10742 + }, + { + "epoch": 0.21, + "learning_rate": 1.5847539901363055e-07, + "loss": 0.0026, + "step": 10743 + }, + { + "epoch": 0.21, + "learning_rate": 1.584715156692944e-07, + "loss": 0.0024, + "step": 10744 + }, + { + "epoch": 0.21, + "learning_rate": 1.5846763232495826e-07, + "loss": 0.0024, + "step": 10745 + }, + { + "epoch": 0.21, + "learning_rate": 1.584637489806221e-07, + "loss": 0.0025, + "step": 10746 + }, + { + "epoch": 0.21, + "learning_rate": 1.5845986563628598e-07, + "loss": 0.0032, + "step": 10747 + }, + { + "epoch": 0.21, + "learning_rate": 1.5845598229194982e-07, + "loss": 0.0028, + "step": 10748 + }, + { + "epoch": 0.21, + "learning_rate": 1.584520989476137e-07, + "loss": 1.0712, + "step": 10749 + }, + { + "epoch": 0.21, + "learning_rate": 1.5844821560327754e-07, + "loss": 0.0052, + "step": 10750 + }, + { + "epoch": 0.21, + "learning_rate": 1.5844433225894139e-07, + "loss": 0.0479, + "step": 10751 + }, + { + "epoch": 0.21, + "learning_rate": 1.5844044891460523e-07, + "loss": 0.0023, + "step": 10752 + }, + { + "epoch": 0.21, + "learning_rate": 1.584365655702691e-07, + "loss": 0.5257, + "step": 10753 + }, + { + "epoch": 0.21, + "learning_rate": 1.5843268222593295e-07, + "loss": 0.3783, + "step": 10754 + }, + { + "epoch": 0.21, + "learning_rate": 1.5842879888159682e-07, + "loss": 0.0022, + "step": 10755 + }, + { + "epoch": 0.21, + "learning_rate": 1.5842491553726066e-07, + "loss": 0.0049, + "step": 10756 + }, + { + "epoch": 0.21, + "learning_rate": 1.5842103219292454e-07, + "loss": 0.3758, + "step": 10757 + }, + { + "epoch": 0.21, + "learning_rate": 1.5841714884858838e-07, + "loss": 0.0027, + "step": 10758 + }, + { + "epoch": 0.21, + "learning_rate": 1.5841326550425225e-07, + "loss": 0.0092, + "step": 10759 + }, + { + "epoch": 0.21, + "learning_rate": 1.584093821599161e-07, + "loss": 0.0046, + "step": 10760 + }, + { + "epoch": 0.21, + "learning_rate": 1.5840549881557997e-07, + "loss": 0.0661, + "step": 10761 + }, + { + "epoch": 0.21, + "learning_rate": 1.584016154712438e-07, + "loss": 0.0022, + "step": 10762 + }, + { + "epoch": 0.21, + "learning_rate": 1.5839773212690768e-07, + "loss": 0.0024, + "step": 10763 + }, + { + "epoch": 0.21, + "learning_rate": 1.5839384878257153e-07, + "loss": 0.0043, + "step": 10764 + }, + { + "epoch": 0.21, + "learning_rate": 1.583899654382354e-07, + "loss": 0.0031, + "step": 10765 + }, + { + "epoch": 0.21, + "learning_rate": 1.5838608209389925e-07, + "loss": 0.0019, + "step": 10766 + }, + { + "epoch": 0.21, + "learning_rate": 1.5838219874956312e-07, + "loss": 0.1114, + "step": 10767 + }, + { + "epoch": 0.21, + "learning_rate": 1.5837831540522696e-07, + "loss": 0.0047, + "step": 10768 + }, + { + "epoch": 0.21, + "learning_rate": 1.5837443206089083e-07, + "loss": 0.2666, + "step": 10769 + }, + { + "epoch": 0.21, + "learning_rate": 1.5837054871655468e-07, + "loss": 0.0074, + "step": 10770 + }, + { + "epoch": 0.21, + "learning_rate": 1.5836666537221855e-07, + "loss": 0.0032, + "step": 10771 + }, + { + "epoch": 0.21, + "learning_rate": 1.583627820278824e-07, + "loss": 0.0023, + "step": 10772 + }, + { + "epoch": 0.21, + "learning_rate": 1.5835889868354627e-07, + "loss": 0.0895, + "step": 10773 + }, + { + "epoch": 0.21, + "learning_rate": 1.583550153392101e-07, + "loss": 0.0018, + "step": 10774 + }, + { + "epoch": 0.21, + "learning_rate": 1.5835113199487398e-07, + "loss": 0.0025, + "step": 10775 + }, + { + "epoch": 0.21, + "learning_rate": 1.5834724865053783e-07, + "loss": 0.0033, + "step": 10776 + }, + { + "epoch": 0.21, + "learning_rate": 1.583433653062017e-07, + "loss": 0.0022, + "step": 10777 + }, + { + "epoch": 0.21, + "learning_rate": 1.5833948196186555e-07, + "loss": 0.0031, + "step": 10778 + }, + { + "epoch": 0.21, + "learning_rate": 1.5833559861752942e-07, + "loss": 0.0582, + "step": 10779 + }, + { + "epoch": 0.21, + "learning_rate": 1.5833171527319326e-07, + "loss": 0.003, + "step": 10780 + }, + { + "epoch": 0.21, + "learning_rate": 1.5832783192885713e-07, + "loss": 0.0046, + "step": 10781 + }, + { + "epoch": 0.21, + "learning_rate": 1.5832394858452098e-07, + "loss": 0.0027, + "step": 10782 + }, + { + "epoch": 0.21, + "learning_rate": 1.5832006524018485e-07, + "loss": 0.0038, + "step": 10783 + }, + { + "epoch": 0.21, + "learning_rate": 1.583161818958487e-07, + "loss": 0.0031, + "step": 10784 + }, + { + "epoch": 0.21, + "learning_rate": 1.5831229855151257e-07, + "loss": 0.0024, + "step": 10785 + }, + { + "epoch": 0.21, + "learning_rate": 1.583084152071764e-07, + "loss": 0.0103, + "step": 10786 + }, + { + "epoch": 0.21, + "learning_rate": 1.5830453186284028e-07, + "loss": 0.0025, + "step": 10787 + }, + { + "epoch": 0.21, + "learning_rate": 1.5830064851850413e-07, + "loss": 0.0031, + "step": 10788 + }, + { + "epoch": 0.21, + "learning_rate": 1.58296765174168e-07, + "loss": 0.0026, + "step": 10789 + }, + { + "epoch": 0.21, + "learning_rate": 1.5829288182983184e-07, + "loss": 0.0025, + "step": 10790 + }, + { + "epoch": 0.21, + "learning_rate": 1.5828899848549572e-07, + "loss": 0.0018, + "step": 10791 + }, + { + "epoch": 0.21, + "learning_rate": 1.5828511514115956e-07, + "loss": 0.0023, + "step": 10792 + }, + { + "epoch": 0.21, + "learning_rate": 1.5828123179682343e-07, + "loss": 0.0022, + "step": 10793 + }, + { + "epoch": 0.21, + "learning_rate": 1.5827734845248728e-07, + "loss": 0.0028, + "step": 10794 + }, + { + "epoch": 0.21, + "learning_rate": 1.5827346510815115e-07, + "loss": 0.0073, + "step": 10795 + }, + { + "epoch": 0.21, + "learning_rate": 1.58269581763815e-07, + "loss": 0.0022, + "step": 10796 + }, + { + "epoch": 0.21, + "learning_rate": 1.5826569841947886e-07, + "loss": 0.0023, + "step": 10797 + }, + { + "epoch": 0.21, + "learning_rate": 1.582618150751427e-07, + "loss": 0.0028, + "step": 10798 + }, + { + "epoch": 0.21, + "learning_rate": 1.5825793173080658e-07, + "loss": 0.1129, + "step": 10799 + }, + { + "epoch": 0.21, + "learning_rate": 1.5825404838647043e-07, + "loss": 0.0024, + "step": 10800 + }, + { + "epoch": 0.21, + "learning_rate": 1.582501650421343e-07, + "loss": 0.0027, + "step": 10801 + }, + { + "epoch": 0.21, + "learning_rate": 1.5824628169779814e-07, + "loss": 0.0024, + "step": 10802 + }, + { + "epoch": 0.21, + "learning_rate": 1.5824239835346201e-07, + "loss": 0.0024, + "step": 10803 + }, + { + "epoch": 0.21, + "learning_rate": 1.5823851500912586e-07, + "loss": 0.2715, + "step": 10804 + }, + { + "epoch": 0.21, + "learning_rate": 1.5823463166478973e-07, + "loss": 0.0602, + "step": 10805 + }, + { + "epoch": 0.21, + "learning_rate": 1.5823074832045358e-07, + "loss": 0.5392, + "step": 10806 + }, + { + "epoch": 0.21, + "learning_rate": 1.5822686497611745e-07, + "loss": 0.5059, + "step": 10807 + }, + { + "epoch": 0.21, + "learning_rate": 1.582229816317813e-07, + "loss": 0.0022, + "step": 10808 + }, + { + "epoch": 0.21, + "learning_rate": 1.5821909828744514e-07, + "loss": 0.0025, + "step": 10809 + }, + { + "epoch": 0.21, + "learning_rate": 1.5821521494310898e-07, + "loss": 0.005, + "step": 10810 + }, + { + "epoch": 0.21, + "learning_rate": 1.5821133159877285e-07, + "loss": 0.0029, + "step": 10811 + }, + { + "epoch": 0.21, + "learning_rate": 1.582074482544367e-07, + "loss": 0.0024, + "step": 10812 + }, + { + "epoch": 0.21, + "learning_rate": 1.5820356491010057e-07, + "loss": 0.0021, + "step": 10813 + }, + { + "epoch": 0.21, + "learning_rate": 1.5819968156576442e-07, + "loss": 0.5133, + "step": 10814 + }, + { + "epoch": 0.21, + "learning_rate": 1.581957982214283e-07, + "loss": 0.0021, + "step": 10815 + }, + { + "epoch": 0.21, + "learning_rate": 1.5819191487709213e-07, + "loss": 0.0034, + "step": 10816 + }, + { + "epoch": 0.21, + "learning_rate": 1.58188031532756e-07, + "loss": 0.2525, + "step": 10817 + }, + { + "epoch": 0.21, + "learning_rate": 1.5818414818841985e-07, + "loss": 0.003, + "step": 10818 + }, + { + "epoch": 0.21, + "learning_rate": 1.5818026484408372e-07, + "loss": 0.002, + "step": 10819 + }, + { + "epoch": 0.21, + "learning_rate": 1.5817638149974756e-07, + "loss": 0.002, + "step": 10820 + }, + { + "epoch": 0.21, + "learning_rate": 1.5817249815541144e-07, + "loss": 0.0068, + "step": 10821 + }, + { + "epoch": 0.21, + "learning_rate": 1.5816861481107528e-07, + "loss": 0.0091, + "step": 10822 + }, + { + "epoch": 0.21, + "learning_rate": 1.5816473146673915e-07, + "loss": 0.2088, + "step": 10823 + }, + { + "epoch": 0.21, + "learning_rate": 1.58160848122403e-07, + "loss": 0.002, + "step": 10824 + }, + { + "epoch": 0.21, + "learning_rate": 1.5815696477806687e-07, + "loss": 0.0026, + "step": 10825 + }, + { + "epoch": 0.21, + "learning_rate": 1.5815308143373071e-07, + "loss": 0.0058, + "step": 10826 + }, + { + "epoch": 0.21, + "learning_rate": 1.5814919808939459e-07, + "loss": 0.6875, + "step": 10827 + }, + { + "epoch": 0.21, + "learning_rate": 1.5814531474505843e-07, + "loss": 0.0025, + "step": 10828 + }, + { + "epoch": 0.21, + "learning_rate": 1.581414314007223e-07, + "loss": 0.0032, + "step": 10829 + }, + { + "epoch": 0.21, + "learning_rate": 1.5813754805638615e-07, + "loss": 0.0036, + "step": 10830 + }, + { + "epoch": 0.21, + "learning_rate": 1.5813366471205002e-07, + "loss": 0.5218, + "step": 10831 + }, + { + "epoch": 0.21, + "learning_rate": 1.5812978136771386e-07, + "loss": 0.0585, + "step": 10832 + }, + { + "epoch": 0.21, + "learning_rate": 1.5812589802337774e-07, + "loss": 0.0027, + "step": 10833 + }, + { + "epoch": 0.21, + "learning_rate": 1.5812201467904158e-07, + "loss": 0.0022, + "step": 10834 + }, + { + "epoch": 0.21, + "learning_rate": 1.5811813133470545e-07, + "loss": 0.0041, + "step": 10835 + }, + { + "epoch": 0.21, + "learning_rate": 1.581142479903693e-07, + "loss": 0.0091, + "step": 10836 + }, + { + "epoch": 0.21, + "learning_rate": 1.5811036464603317e-07, + "loss": 0.0319, + "step": 10837 + }, + { + "epoch": 0.21, + "learning_rate": 1.5810648130169701e-07, + "loss": 0.0039, + "step": 10838 + }, + { + "epoch": 0.21, + "learning_rate": 1.5810259795736088e-07, + "loss": 0.0026, + "step": 10839 + }, + { + "epoch": 0.21, + "learning_rate": 1.5809871461302473e-07, + "loss": 0.0018, + "step": 10840 + }, + { + "epoch": 0.21, + "learning_rate": 1.580948312686886e-07, + "loss": 0.0061, + "step": 10841 + }, + { + "epoch": 0.21, + "learning_rate": 1.5809094792435245e-07, + "loss": 0.0062, + "step": 10842 + }, + { + "epoch": 0.21, + "learning_rate": 1.5808706458001632e-07, + "loss": 0.0022, + "step": 10843 + }, + { + "epoch": 0.21, + "learning_rate": 1.5808318123568016e-07, + "loss": 0.0018, + "step": 10844 + }, + { + "epoch": 0.21, + "learning_rate": 1.5807929789134403e-07, + "loss": 0.4409, + "step": 10845 + }, + { + "epoch": 0.21, + "learning_rate": 1.5807541454700788e-07, + "loss": 0.0551, + "step": 10846 + }, + { + "epoch": 0.21, + "learning_rate": 1.5807153120267172e-07, + "loss": 0.0027, + "step": 10847 + }, + { + "epoch": 0.21, + "learning_rate": 1.580676478583356e-07, + "loss": 0.0024, + "step": 10848 + }, + { + "epoch": 0.21, + "learning_rate": 1.5806376451399944e-07, + "loss": 0.0077, + "step": 10849 + }, + { + "epoch": 0.21, + "learning_rate": 1.580598811696633e-07, + "loss": 0.0077, + "step": 10850 + }, + { + "epoch": 0.21, + "learning_rate": 1.5805599782532716e-07, + "loss": 0.0035, + "step": 10851 + }, + { + "epoch": 0.21, + "learning_rate": 1.5805211448099103e-07, + "loss": 0.0021, + "step": 10852 + }, + { + "epoch": 0.21, + "learning_rate": 1.5804823113665487e-07, + "loss": 0.0052, + "step": 10853 + }, + { + "epoch": 0.21, + "learning_rate": 1.5804434779231875e-07, + "loss": 0.3335, + "step": 10854 + }, + { + "epoch": 0.21, + "learning_rate": 1.580404644479826e-07, + "loss": 0.0024, + "step": 10855 + }, + { + "epoch": 0.21, + "learning_rate": 1.5803658110364646e-07, + "loss": 0.0044, + "step": 10856 + }, + { + "epoch": 0.21, + "learning_rate": 1.580326977593103e-07, + "loss": 0.0025, + "step": 10857 + }, + { + "epoch": 0.21, + "learning_rate": 1.5802881441497418e-07, + "loss": 0.0031, + "step": 10858 + }, + { + "epoch": 0.21, + "learning_rate": 1.5802493107063802e-07, + "loss": 0.7976, + "step": 10859 + }, + { + "epoch": 0.21, + "learning_rate": 1.580210477263019e-07, + "loss": 0.0055, + "step": 10860 + }, + { + "epoch": 0.21, + "learning_rate": 1.5801716438196574e-07, + "loss": 0.0019, + "step": 10861 + }, + { + "epoch": 0.21, + "learning_rate": 1.580132810376296e-07, + "loss": 0.002, + "step": 10862 + }, + { + "epoch": 0.21, + "learning_rate": 1.5800939769329346e-07, + "loss": 0.0146, + "step": 10863 + }, + { + "epoch": 0.21, + "learning_rate": 1.5800551434895733e-07, + "loss": 0.0373, + "step": 10864 + }, + { + "epoch": 0.21, + "learning_rate": 1.5800163100462117e-07, + "loss": 0.0048, + "step": 10865 + }, + { + "epoch": 0.21, + "learning_rate": 1.5799774766028504e-07, + "loss": 0.0323, + "step": 10866 + }, + { + "epoch": 0.21, + "learning_rate": 1.579938643159489e-07, + "loss": 0.0027, + "step": 10867 + }, + { + "epoch": 0.21, + "learning_rate": 1.5798998097161273e-07, + "loss": 0.003, + "step": 10868 + }, + { + "epoch": 0.21, + "learning_rate": 1.579860976272766e-07, + "loss": 0.024, + "step": 10869 + }, + { + "epoch": 0.21, + "learning_rate": 1.5798221428294045e-07, + "loss": 0.0067, + "step": 10870 + }, + { + "epoch": 0.21, + "learning_rate": 1.5797833093860432e-07, + "loss": 0.2546, + "step": 10871 + }, + { + "epoch": 0.21, + "learning_rate": 1.5797444759426817e-07, + "loss": 0.066, + "step": 10872 + }, + { + "epoch": 0.21, + "learning_rate": 1.5797056424993204e-07, + "loss": 0.0037, + "step": 10873 + }, + { + "epoch": 0.21, + "learning_rate": 1.5796668090559588e-07, + "loss": 0.8111, + "step": 10874 + }, + { + "epoch": 0.21, + "learning_rate": 1.5796279756125976e-07, + "loss": 0.0954, + "step": 10875 + }, + { + "epoch": 0.21, + "learning_rate": 1.579589142169236e-07, + "loss": 0.6376, + "step": 10876 + }, + { + "epoch": 0.21, + "learning_rate": 1.5795503087258745e-07, + "loss": 0.0046, + "step": 10877 + }, + { + "epoch": 0.21, + "learning_rate": 1.5795114752825132e-07, + "loss": 0.0101, + "step": 10878 + }, + { + "epoch": 0.21, + "learning_rate": 1.5794726418391516e-07, + "loss": 0.0203, + "step": 10879 + }, + { + "epoch": 0.21, + "learning_rate": 1.5794338083957903e-07, + "loss": 0.0025, + "step": 10880 + }, + { + "epoch": 0.21, + "learning_rate": 1.5793949749524288e-07, + "loss": 0.0044, + "step": 10881 + }, + { + "epoch": 0.21, + "learning_rate": 1.5793561415090675e-07, + "loss": 0.0021, + "step": 10882 + }, + { + "epoch": 0.21, + "learning_rate": 1.579317308065706e-07, + "loss": 0.0026, + "step": 10883 + }, + { + "epoch": 0.21, + "learning_rate": 1.5792784746223447e-07, + "loss": 0.0027, + "step": 10884 + }, + { + "epoch": 0.21, + "learning_rate": 1.579239641178983e-07, + "loss": 0.8478, + "step": 10885 + }, + { + "epoch": 0.21, + "learning_rate": 1.5792008077356218e-07, + "loss": 0.0021, + "step": 10886 + }, + { + "epoch": 0.21, + "learning_rate": 1.5791619742922603e-07, + "loss": 0.9719, + "step": 10887 + }, + { + "epoch": 0.21, + "learning_rate": 1.579123140848899e-07, + "loss": 0.0164, + "step": 10888 + }, + { + "epoch": 0.21, + "learning_rate": 1.5790843074055374e-07, + "loss": 0.0025, + "step": 10889 + }, + { + "epoch": 0.21, + "learning_rate": 1.5790454739621762e-07, + "loss": 0.0023, + "step": 10890 + }, + { + "epoch": 0.21, + "learning_rate": 1.5790066405188146e-07, + "loss": 0.005, + "step": 10891 + }, + { + "epoch": 0.21, + "learning_rate": 1.5789678070754533e-07, + "loss": 0.0024, + "step": 10892 + }, + { + "epoch": 0.21, + "learning_rate": 1.5789289736320918e-07, + "loss": 0.4978, + "step": 10893 + }, + { + "epoch": 0.21, + "learning_rate": 1.5788901401887305e-07, + "loss": 0.0943, + "step": 10894 + }, + { + "epoch": 0.21, + "learning_rate": 1.578851306745369e-07, + "loss": 0.0023, + "step": 10895 + }, + { + "epoch": 0.21, + "learning_rate": 1.5788124733020076e-07, + "loss": 0.0039, + "step": 10896 + }, + { + "epoch": 0.21, + "learning_rate": 1.578773639858646e-07, + "loss": 0.0025, + "step": 10897 + }, + { + "epoch": 0.21, + "learning_rate": 1.5787348064152848e-07, + "loss": 0.0936, + "step": 10898 + }, + { + "epoch": 0.21, + "learning_rate": 1.5786959729719233e-07, + "loss": 0.0021, + "step": 10899 + }, + { + "epoch": 0.21, + "learning_rate": 1.578657139528562e-07, + "loss": 0.4763, + "step": 10900 + }, + { + "epoch": 0.21, + "learning_rate": 1.5786183060852004e-07, + "loss": 0.0024, + "step": 10901 + }, + { + "epoch": 0.21, + "learning_rate": 1.5785794726418391e-07, + "loss": 0.0019, + "step": 10902 + }, + { + "epoch": 0.21, + "learning_rate": 1.5785406391984776e-07, + "loss": 0.8165, + "step": 10903 + }, + { + "epoch": 0.21, + "learning_rate": 1.5785018057551163e-07, + "loss": 0.0163, + "step": 10904 + }, + { + "epoch": 0.21, + "learning_rate": 1.5784629723117548e-07, + "loss": 0.0022, + "step": 10905 + }, + { + "epoch": 0.21, + "learning_rate": 1.5784241388683935e-07, + "loss": 0.0028, + "step": 10906 + }, + { + "epoch": 0.21, + "learning_rate": 1.578385305425032e-07, + "loss": 0.002, + "step": 10907 + }, + { + "epoch": 0.21, + "learning_rate": 1.5783464719816706e-07, + "loss": 0.0744, + "step": 10908 + }, + { + "epoch": 0.21, + "learning_rate": 1.578307638538309e-07, + "loss": 0.0054, + "step": 10909 + }, + { + "epoch": 0.21, + "learning_rate": 1.5782688050949478e-07, + "loss": 0.6141, + "step": 10910 + }, + { + "epoch": 0.21, + "learning_rate": 1.5782299716515863e-07, + "loss": 0.003, + "step": 10911 + }, + { + "epoch": 0.21, + "learning_rate": 1.578191138208225e-07, + "loss": 0.003, + "step": 10912 + }, + { + "epoch": 0.21, + "learning_rate": 1.5781523047648634e-07, + "loss": 0.0022, + "step": 10913 + }, + { + "epoch": 0.21, + "learning_rate": 1.5781134713215021e-07, + "loss": 0.002, + "step": 10914 + }, + { + "epoch": 0.21, + "learning_rate": 1.5780746378781406e-07, + "loss": 1.0324, + "step": 10915 + }, + { + "epoch": 0.21, + "learning_rate": 1.5780358044347793e-07, + "loss": 0.508, + "step": 10916 + }, + { + "epoch": 0.21, + "learning_rate": 1.5779969709914177e-07, + "loss": 0.0084, + "step": 10917 + }, + { + "epoch": 0.21, + "learning_rate": 1.5779581375480565e-07, + "loss": 0.0161, + "step": 10918 + }, + { + "epoch": 0.21, + "learning_rate": 1.577919304104695e-07, + "loss": 0.0033, + "step": 10919 + }, + { + "epoch": 0.21, + "learning_rate": 1.5778804706613336e-07, + "loss": 0.0035, + "step": 10920 + }, + { + "epoch": 0.21, + "learning_rate": 1.577841637217972e-07, + "loss": 0.002, + "step": 10921 + }, + { + "epoch": 0.21, + "learning_rate": 1.5778028037746108e-07, + "loss": 0.003, + "step": 10922 + }, + { + "epoch": 0.21, + "learning_rate": 1.5777639703312492e-07, + "loss": 0.0021, + "step": 10923 + }, + { + "epoch": 0.21, + "learning_rate": 1.577725136887888e-07, + "loss": 0.0049, + "step": 10924 + }, + { + "epoch": 0.21, + "learning_rate": 1.5776863034445261e-07, + "loss": 0.003, + "step": 10925 + }, + { + "epoch": 0.21, + "learning_rate": 1.5776474700011649e-07, + "loss": 0.0046, + "step": 10926 + }, + { + "epoch": 0.21, + "learning_rate": 1.5776086365578033e-07, + "loss": 0.0037, + "step": 10927 + }, + { + "epoch": 0.21, + "learning_rate": 1.577569803114442e-07, + "loss": 0.0047, + "step": 10928 + }, + { + "epoch": 0.21, + "learning_rate": 1.5775309696710805e-07, + "loss": 0.0028, + "step": 10929 + }, + { + "epoch": 0.21, + "learning_rate": 1.5774921362277192e-07, + "loss": 0.0594, + "step": 10930 + }, + { + "epoch": 0.21, + "learning_rate": 1.5774533027843576e-07, + "loss": 0.0026, + "step": 10931 + }, + { + "epoch": 0.21, + "learning_rate": 1.5774144693409964e-07, + "loss": 0.6812, + "step": 10932 + }, + { + "epoch": 0.21, + "learning_rate": 1.5773756358976348e-07, + "loss": 0.0024, + "step": 10933 + }, + { + "epoch": 0.21, + "learning_rate": 1.5773368024542735e-07, + "loss": 0.0034, + "step": 10934 + }, + { + "epoch": 0.21, + "learning_rate": 1.577297969010912e-07, + "loss": 0.0021, + "step": 10935 + }, + { + "epoch": 0.21, + "learning_rate": 1.5772591355675507e-07, + "loss": 0.0025, + "step": 10936 + }, + { + "epoch": 0.21, + "learning_rate": 1.5772203021241891e-07, + "loss": 0.0131, + "step": 10937 + }, + { + "epoch": 0.21, + "learning_rate": 1.5771814686808278e-07, + "loss": 0.0035, + "step": 10938 + }, + { + "epoch": 0.21, + "learning_rate": 1.5771426352374663e-07, + "loss": 0.002, + "step": 10939 + }, + { + "epoch": 0.21, + "learning_rate": 1.577103801794105e-07, + "loss": 0.1745, + "step": 10940 + }, + { + "epoch": 0.21, + "learning_rate": 1.5770649683507435e-07, + "loss": 0.0024, + "step": 10941 + }, + { + "epoch": 0.21, + "learning_rate": 1.5770261349073822e-07, + "loss": 0.0737, + "step": 10942 + }, + { + "epoch": 0.21, + "learning_rate": 1.5769873014640206e-07, + "loss": 0.0041, + "step": 10943 + }, + { + "epoch": 0.21, + "learning_rate": 1.5769484680206593e-07, + "loss": 0.0035, + "step": 10944 + }, + { + "epoch": 0.21, + "learning_rate": 1.5769096345772978e-07, + "loss": 0.0039, + "step": 10945 + }, + { + "epoch": 0.21, + "learning_rate": 1.5768708011339365e-07, + "loss": 0.0021, + "step": 10946 + }, + { + "epoch": 0.21, + "learning_rate": 1.576831967690575e-07, + "loss": 0.0021, + "step": 10947 + }, + { + "epoch": 0.21, + "learning_rate": 1.5767931342472137e-07, + "loss": 0.0037, + "step": 10948 + }, + { + "epoch": 0.21, + "learning_rate": 1.576754300803852e-07, + "loss": 0.0024, + "step": 10949 + }, + { + "epoch": 0.21, + "learning_rate": 1.5767154673604908e-07, + "loss": 0.0026, + "step": 10950 + }, + { + "epoch": 0.21, + "learning_rate": 1.5766766339171293e-07, + "loss": 0.0371, + "step": 10951 + }, + { + "epoch": 0.21, + "learning_rate": 1.576637800473768e-07, + "loss": 0.0023, + "step": 10952 + }, + { + "epoch": 0.21, + "learning_rate": 1.5765989670304065e-07, + "loss": 0.0031, + "step": 10953 + }, + { + "epoch": 0.21, + "learning_rate": 1.5765601335870452e-07, + "loss": 1.3422, + "step": 10954 + }, + { + "epoch": 0.21, + "learning_rate": 1.5765213001436836e-07, + "loss": 0.0296, + "step": 10955 + }, + { + "epoch": 0.21, + "learning_rate": 1.5764824667003223e-07, + "loss": 0.0786, + "step": 10956 + }, + { + "epoch": 0.21, + "learning_rate": 1.5764436332569608e-07, + "loss": 0.0047, + "step": 10957 + }, + { + "epoch": 0.21, + "learning_rate": 1.5764047998135995e-07, + "loss": 0.002, + "step": 10958 + }, + { + "epoch": 0.21, + "learning_rate": 1.576365966370238e-07, + "loss": 0.0075, + "step": 10959 + }, + { + "epoch": 0.21, + "learning_rate": 1.5763271329268767e-07, + "loss": 0.0025, + "step": 10960 + }, + { + "epoch": 0.21, + "learning_rate": 1.576288299483515e-07, + "loss": 0.0023, + "step": 10961 + }, + { + "epoch": 0.21, + "learning_rate": 1.5762494660401538e-07, + "loss": 0.003, + "step": 10962 + }, + { + "epoch": 0.21, + "learning_rate": 1.5762106325967923e-07, + "loss": 0.6939, + "step": 10963 + }, + { + "epoch": 0.21, + "learning_rate": 1.576171799153431e-07, + "loss": 0.0093, + "step": 10964 + }, + { + "epoch": 0.21, + "learning_rate": 1.5761329657100694e-07, + "loss": 0.0056, + "step": 10965 + }, + { + "epoch": 0.21, + "learning_rate": 1.5760941322667082e-07, + "loss": 0.0028, + "step": 10966 + }, + { + "epoch": 0.21, + "learning_rate": 1.5760552988233466e-07, + "loss": 0.0024, + "step": 10967 + }, + { + "epoch": 0.21, + "learning_rate": 1.5760164653799853e-07, + "loss": 0.4818, + "step": 10968 + }, + { + "epoch": 0.21, + "learning_rate": 1.5759776319366238e-07, + "loss": 0.1004, + "step": 10969 + }, + { + "epoch": 0.21, + "learning_rate": 1.5759387984932625e-07, + "loss": 0.0031, + "step": 10970 + }, + { + "epoch": 0.21, + "learning_rate": 1.575899965049901e-07, + "loss": 0.1272, + "step": 10971 + }, + { + "epoch": 0.21, + "learning_rate": 1.5758611316065397e-07, + "loss": 0.0103, + "step": 10972 + }, + { + "epoch": 0.21, + "learning_rate": 1.575822298163178e-07, + "loss": 0.006, + "step": 10973 + }, + { + "epoch": 0.21, + "learning_rate": 1.5757834647198168e-07, + "loss": 0.0385, + "step": 10974 + }, + { + "epoch": 0.21, + "learning_rate": 1.5757446312764553e-07, + "loss": 0.0023, + "step": 10975 + }, + { + "epoch": 0.21, + "learning_rate": 1.575705797833094e-07, + "loss": 0.0144, + "step": 10976 + }, + { + "epoch": 0.21, + "learning_rate": 1.5756669643897324e-07, + "loss": 0.1477, + "step": 10977 + }, + { + "epoch": 0.21, + "learning_rate": 1.5756281309463711e-07, + "loss": 0.0028, + "step": 10978 + }, + { + "epoch": 0.21, + "learning_rate": 1.5755892975030096e-07, + "loss": 0.006, + "step": 10979 + }, + { + "epoch": 0.21, + "learning_rate": 1.5755504640596483e-07, + "loss": 0.4453, + "step": 10980 + }, + { + "epoch": 0.21, + "learning_rate": 1.5755116306162868e-07, + "loss": 0.0024, + "step": 10981 + }, + { + "epoch": 0.21, + "learning_rate": 1.5754727971729255e-07, + "loss": 0.0021, + "step": 10982 + }, + { + "epoch": 0.21, + "learning_rate": 1.5754339637295637e-07, + "loss": 0.0024, + "step": 10983 + }, + { + "epoch": 0.21, + "learning_rate": 1.5753951302862024e-07, + "loss": 0.3012, + "step": 10984 + }, + { + "epoch": 0.21, + "learning_rate": 1.5753562968428408e-07, + "loss": 0.0028, + "step": 10985 + }, + { + "epoch": 0.21, + "learning_rate": 1.5753174633994795e-07, + "loss": 0.0065, + "step": 10986 + }, + { + "epoch": 0.21, + "learning_rate": 1.575278629956118e-07, + "loss": 0.0591, + "step": 10987 + }, + { + "epoch": 0.21, + "learning_rate": 1.5752397965127567e-07, + "loss": 0.0035, + "step": 10988 + }, + { + "epoch": 0.21, + "learning_rate": 1.5752009630693952e-07, + "loss": 0.002, + "step": 10989 + }, + { + "epoch": 0.21, + "learning_rate": 1.575162129626034e-07, + "loss": 0.0102, + "step": 10990 + }, + { + "epoch": 0.21, + "learning_rate": 1.5751232961826723e-07, + "loss": 0.0024, + "step": 10991 + }, + { + "epoch": 0.21, + "learning_rate": 1.575084462739311e-07, + "loss": 0.002, + "step": 10992 + }, + { + "epoch": 0.21, + "learning_rate": 1.5750456292959495e-07, + "loss": 0.1434, + "step": 10993 + }, + { + "epoch": 0.21, + "learning_rate": 1.5750067958525882e-07, + "loss": 0.0023, + "step": 10994 + }, + { + "epoch": 0.21, + "learning_rate": 1.5749679624092267e-07, + "loss": 0.0048, + "step": 10995 + }, + { + "epoch": 0.21, + "learning_rate": 1.5749291289658654e-07, + "loss": 0.0482, + "step": 10996 + }, + { + "epoch": 0.21, + "learning_rate": 1.5748902955225038e-07, + "loss": 0.0025, + "step": 10997 + }, + { + "epoch": 0.21, + "learning_rate": 1.5748514620791425e-07, + "loss": 0.0031, + "step": 10998 + }, + { + "epoch": 0.21, + "learning_rate": 1.574812628635781e-07, + "loss": 0.0052, + "step": 10999 + }, + { + "epoch": 0.21, + "learning_rate": 1.5747737951924197e-07, + "loss": 0.0022, + "step": 11000 + }, + { + "epoch": 0.21, + "learning_rate": 1.5747349617490581e-07, + "loss": 0.7342, + "step": 11001 + }, + { + "epoch": 0.21, + "learning_rate": 1.5746961283056969e-07, + "loss": 0.0029, + "step": 11002 + }, + { + "epoch": 0.21, + "learning_rate": 1.5746572948623353e-07, + "loss": 0.0736, + "step": 11003 + }, + { + "epoch": 0.21, + "learning_rate": 1.574618461418974e-07, + "loss": 0.7188, + "step": 11004 + }, + { + "epoch": 0.21, + "learning_rate": 1.5745796279756125e-07, + "loss": 0.0024, + "step": 11005 + }, + { + "epoch": 0.21, + "learning_rate": 1.5745407945322512e-07, + "loss": 0.0026, + "step": 11006 + }, + { + "epoch": 0.21, + "learning_rate": 1.5745019610888896e-07, + "loss": 0.0019, + "step": 11007 + }, + { + "epoch": 0.21, + "learning_rate": 1.5744631276455284e-07, + "loss": 0.0018, + "step": 11008 + }, + { + "epoch": 0.21, + "learning_rate": 1.5744242942021668e-07, + "loss": 0.0023, + "step": 11009 + }, + { + "epoch": 0.21, + "learning_rate": 1.5743854607588055e-07, + "loss": 0.0023, + "step": 11010 + }, + { + "epoch": 0.21, + "learning_rate": 1.574346627315444e-07, + "loss": 0.0028, + "step": 11011 + }, + { + "epoch": 0.21, + "learning_rate": 1.5743077938720827e-07, + "loss": 0.0172, + "step": 11012 + }, + { + "epoch": 0.21, + "learning_rate": 1.5742689604287211e-07, + "loss": 0.0029, + "step": 11013 + }, + { + "epoch": 0.21, + "learning_rate": 1.5742301269853598e-07, + "loss": 0.2886, + "step": 11014 + }, + { + "epoch": 0.21, + "learning_rate": 1.5741912935419983e-07, + "loss": 0.0033, + "step": 11015 + }, + { + "epoch": 0.21, + "learning_rate": 1.574152460098637e-07, + "loss": 0.004, + "step": 11016 + }, + { + "epoch": 0.21, + "learning_rate": 1.5741136266552755e-07, + "loss": 0.2845, + "step": 11017 + }, + { + "epoch": 0.21, + "learning_rate": 1.5740747932119142e-07, + "loss": 0.0019, + "step": 11018 + }, + { + "epoch": 0.21, + "learning_rate": 1.5740359597685526e-07, + "loss": 0.0026, + "step": 11019 + }, + { + "epoch": 0.21, + "learning_rate": 1.5739971263251913e-07, + "loss": 0.0022, + "step": 11020 + }, + { + "epoch": 0.21, + "learning_rate": 1.5739582928818298e-07, + "loss": 0.0175, + "step": 11021 + }, + { + "epoch": 0.21, + "learning_rate": 1.5739194594384685e-07, + "loss": 0.0092, + "step": 11022 + }, + { + "epoch": 0.21, + "learning_rate": 1.573880625995107e-07, + "loss": 0.0019, + "step": 11023 + }, + { + "epoch": 0.21, + "learning_rate": 1.5738417925517454e-07, + "loss": 0.0089, + "step": 11024 + }, + { + "epoch": 0.21, + "learning_rate": 1.573802959108384e-07, + "loss": 0.9006, + "step": 11025 + }, + { + "epoch": 0.21, + "learning_rate": 1.5737641256650226e-07, + "loss": 0.0027, + "step": 11026 + }, + { + "epoch": 0.21, + "learning_rate": 1.5737252922216613e-07, + "loss": 0.0027, + "step": 11027 + }, + { + "epoch": 0.21, + "learning_rate": 1.5736864587782997e-07, + "loss": 0.8297, + "step": 11028 + }, + { + "epoch": 0.21, + "learning_rate": 1.5736476253349385e-07, + "loss": 0.0347, + "step": 11029 + }, + { + "epoch": 0.21, + "learning_rate": 1.573608791891577e-07, + "loss": 0.0205, + "step": 11030 + }, + { + "epoch": 0.21, + "learning_rate": 1.5735699584482156e-07, + "loss": 0.453, + "step": 11031 + }, + { + "epoch": 0.21, + "learning_rate": 1.573531125004854e-07, + "loss": 0.2539, + "step": 11032 + }, + { + "epoch": 0.21, + "learning_rate": 1.5734922915614928e-07, + "loss": 0.746, + "step": 11033 + }, + { + "epoch": 0.21, + "learning_rate": 1.5734534581181312e-07, + "loss": 0.003, + "step": 11034 + }, + { + "epoch": 0.21, + "learning_rate": 1.57341462467477e-07, + "loss": 0.254, + "step": 11035 + }, + { + "epoch": 0.21, + "learning_rate": 1.5733757912314084e-07, + "loss": 0.0028, + "step": 11036 + }, + { + "epoch": 0.21, + "learning_rate": 1.573336957788047e-07, + "loss": 0.0035, + "step": 11037 + }, + { + "epoch": 0.21, + "learning_rate": 1.5732981243446856e-07, + "loss": 0.0193, + "step": 11038 + }, + { + "epoch": 0.21, + "learning_rate": 1.5732592909013243e-07, + "loss": 0.0232, + "step": 11039 + }, + { + "epoch": 0.21, + "learning_rate": 1.5732204574579627e-07, + "loss": 0.0024, + "step": 11040 + }, + { + "epoch": 0.21, + "learning_rate": 1.5731816240146012e-07, + "loss": 0.0024, + "step": 11041 + }, + { + "epoch": 0.21, + "learning_rate": 1.57314279057124e-07, + "loss": 0.0175, + "step": 11042 + }, + { + "epoch": 0.21, + "learning_rate": 1.5731039571278783e-07, + "loss": 0.002, + "step": 11043 + }, + { + "epoch": 0.21, + "learning_rate": 1.573065123684517e-07, + "loss": 0.0494, + "step": 11044 + }, + { + "epoch": 0.21, + "learning_rate": 1.5730262902411555e-07, + "loss": 0.003, + "step": 11045 + }, + { + "epoch": 0.21, + "learning_rate": 1.5729874567977942e-07, + "loss": 0.0034, + "step": 11046 + }, + { + "epoch": 0.21, + "learning_rate": 1.5729486233544327e-07, + "loss": 0.0026, + "step": 11047 + }, + { + "epoch": 0.21, + "learning_rate": 1.5729097899110714e-07, + "loss": 0.0077, + "step": 11048 + }, + { + "epoch": 0.21, + "learning_rate": 1.5728709564677098e-07, + "loss": 0.2774, + "step": 11049 + }, + { + "epoch": 0.21, + "learning_rate": 1.5728321230243486e-07, + "loss": 0.0029, + "step": 11050 + }, + { + "epoch": 0.21, + "learning_rate": 1.572793289580987e-07, + "loss": 0.2996, + "step": 11051 + }, + { + "epoch": 0.21, + "learning_rate": 1.5727544561376257e-07, + "loss": 0.002, + "step": 11052 + }, + { + "epoch": 0.21, + "learning_rate": 1.5727156226942642e-07, + "loss": 0.0201, + "step": 11053 + }, + { + "epoch": 0.21, + "learning_rate": 1.5726767892509026e-07, + "loss": 0.0029, + "step": 11054 + }, + { + "epoch": 0.21, + "learning_rate": 1.5726379558075413e-07, + "loss": 0.0036, + "step": 11055 + }, + { + "epoch": 0.21, + "learning_rate": 1.5725991223641798e-07, + "loss": 0.0028, + "step": 11056 + }, + { + "epoch": 0.21, + "learning_rate": 1.5725602889208185e-07, + "loss": 0.0016, + "step": 11057 + }, + { + "epoch": 0.21, + "learning_rate": 1.572521455477457e-07, + "loss": 0.0016, + "step": 11058 + }, + { + "epoch": 0.21, + "learning_rate": 1.5724826220340957e-07, + "loss": 0.0023, + "step": 11059 + }, + { + "epoch": 0.21, + "learning_rate": 1.572443788590734e-07, + "loss": 0.0027, + "step": 11060 + }, + { + "epoch": 0.21, + "learning_rate": 1.5724049551473728e-07, + "loss": 0.0033, + "step": 11061 + }, + { + "epoch": 0.21, + "learning_rate": 1.5723661217040113e-07, + "loss": 0.0022, + "step": 11062 + }, + { + "epoch": 0.21, + "learning_rate": 1.57232728826065e-07, + "loss": 0.0022, + "step": 11063 + }, + { + "epoch": 0.21, + "learning_rate": 1.5722884548172884e-07, + "loss": 0.0023, + "step": 11064 + }, + { + "epoch": 0.21, + "learning_rate": 1.5722496213739272e-07, + "loss": 0.0032, + "step": 11065 + }, + { + "epoch": 0.21, + "learning_rate": 1.5722107879305656e-07, + "loss": 0.0025, + "step": 11066 + }, + { + "epoch": 0.21, + "learning_rate": 1.5721719544872043e-07, + "loss": 0.0021, + "step": 11067 + }, + { + "epoch": 0.21, + "learning_rate": 1.5721331210438428e-07, + "loss": 0.0038, + "step": 11068 + }, + { + "epoch": 0.21, + "learning_rate": 1.5720942876004815e-07, + "loss": 0.0028, + "step": 11069 + }, + { + "epoch": 0.21, + "learning_rate": 1.57205545415712e-07, + "loss": 0.6457, + "step": 11070 + }, + { + "epoch": 0.21, + "learning_rate": 1.5720166207137587e-07, + "loss": 0.0019, + "step": 11071 + }, + { + "epoch": 0.21, + "learning_rate": 1.571977787270397e-07, + "loss": 0.0023, + "step": 11072 + }, + { + "epoch": 0.21, + "learning_rate": 1.5719389538270358e-07, + "loss": 0.0029, + "step": 11073 + }, + { + "epoch": 0.21, + "learning_rate": 1.5719001203836743e-07, + "loss": 0.0028, + "step": 11074 + }, + { + "epoch": 0.21, + "learning_rate": 1.571861286940313e-07, + "loss": 0.0028, + "step": 11075 + }, + { + "epoch": 0.21, + "learning_rate": 1.5718224534969514e-07, + "loss": 0.0226, + "step": 11076 + }, + { + "epoch": 0.21, + "learning_rate": 1.5717836200535901e-07, + "loss": 0.0029, + "step": 11077 + }, + { + "epoch": 0.21, + "learning_rate": 1.5717447866102286e-07, + "loss": 0.0033, + "step": 11078 + }, + { + "epoch": 0.21, + "learning_rate": 1.5717059531668673e-07, + "loss": 0.0073, + "step": 11079 + }, + { + "epoch": 0.21, + "learning_rate": 1.5716671197235058e-07, + "loss": 0.4729, + "step": 11080 + }, + { + "epoch": 0.21, + "learning_rate": 1.5716282862801445e-07, + "loss": 0.0022, + "step": 11081 + }, + { + "epoch": 0.21, + "learning_rate": 1.571589452836783e-07, + "loss": 0.0022, + "step": 11082 + }, + { + "epoch": 0.21, + "learning_rate": 1.5715506193934216e-07, + "loss": 0.0021, + "step": 11083 + }, + { + "epoch": 0.22, + "learning_rate": 1.57151178595006e-07, + "loss": 0.003, + "step": 11084 + }, + { + "epoch": 0.22, + "learning_rate": 1.5714729525066988e-07, + "loss": 0.0025, + "step": 11085 + }, + { + "epoch": 0.22, + "learning_rate": 1.5714341190633373e-07, + "loss": 0.0026, + "step": 11086 + }, + { + "epoch": 0.22, + "learning_rate": 1.571395285619976e-07, + "loss": 0.003, + "step": 11087 + }, + { + "epoch": 0.22, + "learning_rate": 1.5713564521766144e-07, + "loss": 1.2272, + "step": 11088 + }, + { + "epoch": 0.22, + "learning_rate": 1.5713176187332531e-07, + "loss": 0.0029, + "step": 11089 + }, + { + "epoch": 0.22, + "learning_rate": 1.5712787852898916e-07, + "loss": 0.0024, + "step": 11090 + }, + { + "epoch": 0.22, + "learning_rate": 1.5712399518465303e-07, + "loss": 0.0019, + "step": 11091 + }, + { + "epoch": 0.22, + "learning_rate": 1.5712011184031688e-07, + "loss": 0.9009, + "step": 11092 + }, + { + "epoch": 0.22, + "learning_rate": 1.5711622849598075e-07, + "loss": 0.0259, + "step": 11093 + }, + { + "epoch": 0.22, + "learning_rate": 1.571123451516446e-07, + "loss": 0.0019, + "step": 11094 + }, + { + "epoch": 0.22, + "learning_rate": 1.5710846180730846e-07, + "loss": 0.5571, + "step": 11095 + }, + { + "epoch": 0.22, + "learning_rate": 1.571045784629723e-07, + "loss": 0.0033, + "step": 11096 + }, + { + "epoch": 0.22, + "learning_rate": 1.5710069511863618e-07, + "loss": 0.0023, + "step": 11097 + }, + { + "epoch": 0.22, + "learning_rate": 1.5709681177430002e-07, + "loss": 0.0422, + "step": 11098 + }, + { + "epoch": 0.22, + "learning_rate": 1.5709292842996387e-07, + "loss": 0.0086, + "step": 11099 + }, + { + "epoch": 0.22, + "learning_rate": 1.5708904508562771e-07, + "loss": 0.0029, + "step": 11100 + }, + { + "epoch": 0.22, + "learning_rate": 1.5708516174129159e-07, + "loss": 0.0027, + "step": 11101 + }, + { + "epoch": 0.22, + "learning_rate": 1.5708127839695543e-07, + "loss": 0.0022, + "step": 11102 + }, + { + "epoch": 0.22, + "learning_rate": 1.570773950526193e-07, + "loss": 0.9295, + "step": 11103 + }, + { + "epoch": 0.22, + "learning_rate": 1.5707351170828315e-07, + "loss": 0.0025, + "step": 11104 + }, + { + "epoch": 0.22, + "learning_rate": 1.5706962836394702e-07, + "loss": 0.0299, + "step": 11105 + }, + { + "epoch": 0.22, + "learning_rate": 1.5706574501961086e-07, + "loss": 0.002, + "step": 11106 + }, + { + "epoch": 0.22, + "learning_rate": 1.5706186167527474e-07, + "loss": 0.034, + "step": 11107 + }, + { + "epoch": 0.22, + "learning_rate": 1.5705797833093858e-07, + "loss": 0.0021, + "step": 11108 + }, + { + "epoch": 0.22, + "learning_rate": 1.5705409498660245e-07, + "loss": 0.0257, + "step": 11109 + }, + { + "epoch": 0.22, + "learning_rate": 1.570502116422663e-07, + "loss": 0.0038, + "step": 11110 + }, + { + "epoch": 0.22, + "learning_rate": 1.5704632829793017e-07, + "loss": 0.1564, + "step": 11111 + }, + { + "epoch": 0.22, + "learning_rate": 1.5704244495359401e-07, + "loss": 0.0104, + "step": 11112 + }, + { + "epoch": 0.22, + "learning_rate": 1.5703856160925788e-07, + "loss": 0.01, + "step": 11113 + }, + { + "epoch": 0.22, + "learning_rate": 1.5703467826492173e-07, + "loss": 0.0023, + "step": 11114 + }, + { + "epoch": 0.22, + "learning_rate": 1.570307949205856e-07, + "loss": 0.0026, + "step": 11115 + }, + { + "epoch": 0.22, + "learning_rate": 1.5702691157624945e-07, + "loss": 0.0199, + "step": 11116 + }, + { + "epoch": 0.22, + "learning_rate": 1.5702302823191332e-07, + "loss": 0.0054, + "step": 11117 + }, + { + "epoch": 0.22, + "learning_rate": 1.5701914488757716e-07, + "loss": 0.2545, + "step": 11118 + }, + { + "epoch": 0.22, + "learning_rate": 1.5701526154324103e-07, + "loss": 0.0023, + "step": 11119 + }, + { + "epoch": 0.22, + "learning_rate": 1.5701137819890488e-07, + "loss": 0.0028, + "step": 11120 + }, + { + "epoch": 0.22, + "learning_rate": 1.5700749485456875e-07, + "loss": 0.0023, + "step": 11121 + }, + { + "epoch": 0.22, + "learning_rate": 1.570036115102326e-07, + "loss": 0.0974, + "step": 11122 + }, + { + "epoch": 0.22, + "learning_rate": 1.5699972816589647e-07, + "loss": 0.0376, + "step": 11123 + }, + { + "epoch": 0.22, + "learning_rate": 1.569958448215603e-07, + "loss": 0.0176, + "step": 11124 + }, + { + "epoch": 0.22, + "learning_rate": 1.5699196147722418e-07, + "loss": 0.0034, + "step": 11125 + }, + { + "epoch": 0.22, + "learning_rate": 1.5698807813288803e-07, + "loss": 0.0022, + "step": 11126 + }, + { + "epoch": 0.22, + "learning_rate": 1.569841947885519e-07, + "loss": 0.0041, + "step": 11127 + }, + { + "epoch": 0.22, + "learning_rate": 1.5698031144421575e-07, + "loss": 0.0042, + "step": 11128 + }, + { + "epoch": 0.22, + "learning_rate": 1.5697642809987962e-07, + "loss": 0.0045, + "step": 11129 + }, + { + "epoch": 0.22, + "learning_rate": 1.5697254475554346e-07, + "loss": 0.286, + "step": 11130 + }, + { + "epoch": 0.22, + "learning_rate": 1.5696866141120733e-07, + "loss": 0.0026, + "step": 11131 + }, + { + "epoch": 0.22, + "learning_rate": 1.5696477806687118e-07, + "loss": 0.005, + "step": 11132 + }, + { + "epoch": 0.22, + "learning_rate": 1.5696089472253505e-07, + "loss": 0.0034, + "step": 11133 + }, + { + "epoch": 0.22, + "learning_rate": 1.569570113781989e-07, + "loss": 0.0839, + "step": 11134 + }, + { + "epoch": 0.22, + "learning_rate": 1.5695312803386277e-07, + "loss": 0.0047, + "step": 11135 + }, + { + "epoch": 0.22, + "learning_rate": 1.569492446895266e-07, + "loss": 0.0028, + "step": 11136 + }, + { + "epoch": 0.22, + "learning_rate": 1.5694536134519048e-07, + "loss": 0.0024, + "step": 11137 + }, + { + "epoch": 0.22, + "learning_rate": 1.5694147800085433e-07, + "loss": 0.4645, + "step": 11138 + }, + { + "epoch": 0.22, + "learning_rate": 1.569375946565182e-07, + "loss": 0.004, + "step": 11139 + }, + { + "epoch": 0.22, + "learning_rate": 1.5693371131218204e-07, + "loss": 0.0022, + "step": 11140 + }, + { + "epoch": 0.22, + "learning_rate": 1.5692982796784592e-07, + "loss": 0.0026, + "step": 11141 + }, + { + "epoch": 0.22, + "learning_rate": 1.5692594462350976e-07, + "loss": 0.0057, + "step": 11142 + }, + { + "epoch": 0.22, + "learning_rate": 1.5692206127917363e-07, + "loss": 0.0028, + "step": 11143 + }, + { + "epoch": 0.22, + "learning_rate": 1.5691817793483748e-07, + "loss": 0.0024, + "step": 11144 + }, + { + "epoch": 0.22, + "learning_rate": 1.5691429459050135e-07, + "loss": 0.0019, + "step": 11145 + }, + { + "epoch": 0.22, + "learning_rate": 1.569104112461652e-07, + "loss": 0.0021, + "step": 11146 + }, + { + "epoch": 0.22, + "learning_rate": 1.5690652790182907e-07, + "loss": 0.0022, + "step": 11147 + }, + { + "epoch": 0.22, + "learning_rate": 1.569026445574929e-07, + "loss": 0.002, + "step": 11148 + }, + { + "epoch": 0.22, + "learning_rate": 1.5689876121315678e-07, + "loss": 0.0027, + "step": 11149 + }, + { + "epoch": 0.22, + "learning_rate": 1.5689487786882063e-07, + "loss": 0.002, + "step": 11150 + }, + { + "epoch": 0.22, + "learning_rate": 1.568909945244845e-07, + "loss": 0.4891, + "step": 11151 + }, + { + "epoch": 0.22, + "learning_rate": 1.5688711118014834e-07, + "loss": 0.0019, + "step": 11152 + }, + { + "epoch": 0.22, + "learning_rate": 1.5688322783581221e-07, + "loss": 0.4686, + "step": 11153 + }, + { + "epoch": 0.22, + "learning_rate": 1.5687934449147606e-07, + "loss": 0.203, + "step": 11154 + }, + { + "epoch": 0.22, + "learning_rate": 1.5687546114713993e-07, + "loss": 0.0028, + "step": 11155 + }, + { + "epoch": 0.22, + "learning_rate": 1.5687157780280378e-07, + "loss": 0.0021, + "step": 11156 + }, + { + "epoch": 0.22, + "learning_rate": 1.5686769445846762e-07, + "loss": 0.0047, + "step": 11157 + }, + { + "epoch": 0.22, + "learning_rate": 1.5686381111413147e-07, + "loss": 0.0024, + "step": 11158 + }, + { + "epoch": 0.22, + "learning_rate": 1.5685992776979534e-07, + "loss": 0.0024, + "step": 11159 + }, + { + "epoch": 0.22, + "learning_rate": 1.5685604442545918e-07, + "loss": 0.0027, + "step": 11160 + }, + { + "epoch": 0.22, + "learning_rate": 1.5685216108112305e-07, + "loss": 0.0018, + "step": 11161 + }, + { + "epoch": 0.22, + "learning_rate": 1.568482777367869e-07, + "loss": 0.0022, + "step": 11162 + }, + { + "epoch": 0.22, + "learning_rate": 1.5684439439245077e-07, + "loss": 0.0024, + "step": 11163 + }, + { + "epoch": 0.22, + "learning_rate": 1.5684051104811462e-07, + "loss": 0.0021, + "step": 11164 + }, + { + "epoch": 0.22, + "learning_rate": 1.568366277037785e-07, + "loss": 0.0018, + "step": 11165 + }, + { + "epoch": 0.22, + "learning_rate": 1.5683274435944233e-07, + "loss": 0.0027, + "step": 11166 + }, + { + "epoch": 0.22, + "learning_rate": 1.568288610151062e-07, + "loss": 0.0022, + "step": 11167 + }, + { + "epoch": 0.22, + "learning_rate": 1.5682497767077005e-07, + "loss": 0.0025, + "step": 11168 + }, + { + "epoch": 0.22, + "learning_rate": 1.5682109432643392e-07, + "loss": 0.0021, + "step": 11169 + }, + { + "epoch": 0.22, + "learning_rate": 1.5681721098209777e-07, + "loss": 0.0026, + "step": 11170 + }, + { + "epoch": 0.22, + "learning_rate": 1.5681332763776164e-07, + "loss": 0.0035, + "step": 11171 + }, + { + "epoch": 0.22, + "learning_rate": 1.5680944429342548e-07, + "loss": 0.002, + "step": 11172 + }, + { + "epoch": 0.22, + "learning_rate": 1.5680556094908935e-07, + "loss": 0.0021, + "step": 11173 + }, + { + "epoch": 0.22, + "learning_rate": 1.568016776047532e-07, + "loss": 0.0603, + "step": 11174 + }, + { + "epoch": 0.22, + "learning_rate": 1.5679779426041707e-07, + "loss": 0.0108, + "step": 11175 + }, + { + "epoch": 0.22, + "learning_rate": 1.5679391091608091e-07, + "loss": 0.0019, + "step": 11176 + }, + { + "epoch": 0.22, + "learning_rate": 1.5679002757174479e-07, + "loss": 0.5839, + "step": 11177 + }, + { + "epoch": 0.22, + "learning_rate": 1.5678614422740863e-07, + "loss": 0.9558, + "step": 11178 + }, + { + "epoch": 0.22, + "learning_rate": 1.567822608830725e-07, + "loss": 0.0021, + "step": 11179 + }, + { + "epoch": 0.22, + "learning_rate": 1.5677837753873635e-07, + "loss": 0.019, + "step": 11180 + }, + { + "epoch": 0.22, + "learning_rate": 1.5677449419440022e-07, + "loss": 0.0023, + "step": 11181 + }, + { + "epoch": 0.22, + "learning_rate": 1.5677061085006406e-07, + "loss": 0.0019, + "step": 11182 + }, + { + "epoch": 0.22, + "learning_rate": 1.5676672750572794e-07, + "loss": 0.003, + "step": 11183 + }, + { + "epoch": 0.22, + "learning_rate": 1.5676284416139178e-07, + "loss": 0.0029, + "step": 11184 + }, + { + "epoch": 0.22, + "learning_rate": 1.5675896081705565e-07, + "loss": 0.1073, + "step": 11185 + }, + { + "epoch": 0.22, + "learning_rate": 1.567550774727195e-07, + "loss": 0.0018, + "step": 11186 + }, + { + "epoch": 0.22, + "learning_rate": 1.5675119412838337e-07, + "loss": 0.0519, + "step": 11187 + }, + { + "epoch": 0.22, + "learning_rate": 1.5674731078404721e-07, + "loss": 0.0027, + "step": 11188 + }, + { + "epoch": 0.22, + "learning_rate": 1.5674342743971108e-07, + "loss": 0.0969, + "step": 11189 + }, + { + "epoch": 0.22, + "learning_rate": 1.5673954409537493e-07, + "loss": 0.4514, + "step": 11190 + }, + { + "epoch": 0.22, + "learning_rate": 1.567356607510388e-07, + "loss": 0.0026, + "step": 11191 + }, + { + "epoch": 0.22, + "learning_rate": 1.5673177740670265e-07, + "loss": 0.0024, + "step": 11192 + }, + { + "epoch": 0.22, + "learning_rate": 1.5672789406236652e-07, + "loss": 0.0023, + "step": 11193 + }, + { + "epoch": 0.22, + "learning_rate": 1.5672401071803036e-07, + "loss": 0.0023, + "step": 11194 + }, + { + "epoch": 0.22, + "learning_rate": 1.5672012737369423e-07, + "loss": 0.0022, + "step": 11195 + }, + { + "epoch": 0.22, + "learning_rate": 1.5671624402935808e-07, + "loss": 0.0019, + "step": 11196 + }, + { + "epoch": 0.22, + "learning_rate": 1.5671236068502195e-07, + "loss": 0.0026, + "step": 11197 + }, + { + "epoch": 0.22, + "learning_rate": 1.567084773406858e-07, + "loss": 0.0024, + "step": 11198 + }, + { + "epoch": 0.22, + "learning_rate": 1.5670459399634967e-07, + "loss": 0.0023, + "step": 11199 + }, + { + "epoch": 0.22, + "learning_rate": 1.567007106520135e-07, + "loss": 0.0033, + "step": 11200 + }, + { + "epoch": 0.22, + "learning_rate": 1.5669682730767736e-07, + "loss": 0.0049, + "step": 11201 + }, + { + "epoch": 0.22, + "learning_rate": 1.5669294396334123e-07, + "loss": 0.2756, + "step": 11202 + }, + { + "epoch": 0.22, + "learning_rate": 1.5668906061900507e-07, + "loss": 0.2114, + "step": 11203 + }, + { + "epoch": 0.22, + "learning_rate": 1.5668517727466895e-07, + "loss": 0.007, + "step": 11204 + }, + { + "epoch": 0.22, + "learning_rate": 1.566812939303328e-07, + "loss": 0.0047, + "step": 11205 + }, + { + "epoch": 0.22, + "learning_rate": 1.5667741058599666e-07, + "loss": 0.0069, + "step": 11206 + }, + { + "epoch": 0.22, + "learning_rate": 1.566735272416605e-07, + "loss": 0.0021, + "step": 11207 + }, + { + "epoch": 0.22, + "learning_rate": 1.5666964389732438e-07, + "loss": 0.0028, + "step": 11208 + }, + { + "epoch": 0.22, + "learning_rate": 1.5666576055298822e-07, + "loss": 0.0023, + "step": 11209 + }, + { + "epoch": 0.22, + "learning_rate": 1.566618772086521e-07, + "loss": 0.0024, + "step": 11210 + }, + { + "epoch": 0.22, + "learning_rate": 1.5665799386431594e-07, + "loss": 0.008, + "step": 11211 + }, + { + "epoch": 0.22, + "learning_rate": 1.566541105199798e-07, + "loss": 0.0272, + "step": 11212 + }, + { + "epoch": 0.22, + "learning_rate": 1.5665022717564366e-07, + "loss": 0.002, + "step": 11213 + }, + { + "epoch": 0.22, + "learning_rate": 1.5664634383130753e-07, + "loss": 0.0399, + "step": 11214 + }, + { + "epoch": 0.22, + "learning_rate": 1.5664246048697137e-07, + "loss": 0.0232, + "step": 11215 + }, + { + "epoch": 0.22, + "learning_rate": 1.5663857714263522e-07, + "loss": 0.003, + "step": 11216 + }, + { + "epoch": 0.22, + "learning_rate": 1.566346937982991e-07, + "loss": 0.0025, + "step": 11217 + }, + { + "epoch": 0.22, + "learning_rate": 1.5663081045396293e-07, + "loss": 0.0027, + "step": 11218 + }, + { + "epoch": 0.22, + "learning_rate": 1.566269271096268e-07, + "loss": 0.002, + "step": 11219 + }, + { + "epoch": 0.22, + "learning_rate": 1.5662304376529065e-07, + "loss": 0.0039, + "step": 11220 + }, + { + "epoch": 0.22, + "learning_rate": 1.5661916042095452e-07, + "loss": 0.0024, + "step": 11221 + }, + { + "epoch": 0.22, + "learning_rate": 1.5661527707661837e-07, + "loss": 0.0034, + "step": 11222 + }, + { + "epoch": 0.22, + "learning_rate": 1.5661139373228224e-07, + "loss": 0.0023, + "step": 11223 + }, + { + "epoch": 0.22, + "learning_rate": 1.5660751038794608e-07, + "loss": 0.0023, + "step": 11224 + }, + { + "epoch": 0.22, + "learning_rate": 1.5660362704360996e-07, + "loss": 0.27, + "step": 11225 + }, + { + "epoch": 0.22, + "learning_rate": 1.565997436992738e-07, + "loss": 0.0031, + "step": 11226 + }, + { + "epoch": 0.22, + "learning_rate": 1.5659586035493767e-07, + "loss": 0.002, + "step": 11227 + }, + { + "epoch": 0.22, + "learning_rate": 1.5659197701060152e-07, + "loss": 0.0015, + "step": 11228 + }, + { + "epoch": 0.22, + "learning_rate": 1.565880936662654e-07, + "loss": 0.0149, + "step": 11229 + }, + { + "epoch": 0.22, + "learning_rate": 1.5658421032192923e-07, + "loss": 0.0024, + "step": 11230 + }, + { + "epoch": 0.22, + "learning_rate": 1.5658032697759308e-07, + "loss": 0.0034, + "step": 11231 + }, + { + "epoch": 0.22, + "learning_rate": 1.5657644363325695e-07, + "loss": 0.0021, + "step": 11232 + }, + { + "epoch": 0.22, + "learning_rate": 1.565725602889208e-07, + "loss": 0.0034, + "step": 11233 + }, + { + "epoch": 0.22, + "learning_rate": 1.5656867694458467e-07, + "loss": 0.4727, + "step": 11234 + }, + { + "epoch": 0.22, + "learning_rate": 1.565647936002485e-07, + "loss": 0.0026, + "step": 11235 + }, + { + "epoch": 0.22, + "learning_rate": 1.5656091025591238e-07, + "loss": 0.0023, + "step": 11236 + }, + { + "epoch": 0.22, + "learning_rate": 1.5655702691157623e-07, + "loss": 0.0023, + "step": 11237 + }, + { + "epoch": 0.22, + "learning_rate": 1.565531435672401e-07, + "loss": 0.0027, + "step": 11238 + }, + { + "epoch": 0.22, + "learning_rate": 1.5654926022290394e-07, + "loss": 0.0062, + "step": 11239 + }, + { + "epoch": 0.22, + "learning_rate": 1.5654537687856782e-07, + "loss": 0.0039, + "step": 11240 + }, + { + "epoch": 0.22, + "learning_rate": 1.5654149353423166e-07, + "loss": 0.0019, + "step": 11241 + }, + { + "epoch": 0.22, + "learning_rate": 1.5653761018989553e-07, + "loss": 0.0021, + "step": 11242 + }, + { + "epoch": 0.22, + "learning_rate": 1.5653372684555938e-07, + "loss": 0.0024, + "step": 11243 + }, + { + "epoch": 0.22, + "learning_rate": 1.5652984350122325e-07, + "loss": 0.1667, + "step": 11244 + }, + { + "epoch": 0.22, + "learning_rate": 1.565259601568871e-07, + "loss": 0.2874, + "step": 11245 + }, + { + "epoch": 0.22, + "learning_rate": 1.5652207681255097e-07, + "loss": 0.0022, + "step": 11246 + }, + { + "epoch": 0.22, + "learning_rate": 1.565181934682148e-07, + "loss": 0.5379, + "step": 11247 + }, + { + "epoch": 0.22, + "learning_rate": 1.5651431012387868e-07, + "loss": 0.5872, + "step": 11248 + }, + { + "epoch": 0.22, + "learning_rate": 1.5651042677954253e-07, + "loss": 0.0024, + "step": 11249 + }, + { + "epoch": 0.22, + "learning_rate": 1.565065434352064e-07, + "loss": 0.0026, + "step": 11250 + }, + { + "epoch": 0.22, + "learning_rate": 1.5650266009087024e-07, + "loss": 0.003, + "step": 11251 + }, + { + "epoch": 0.22, + "learning_rate": 1.5649877674653411e-07, + "loss": 0.004, + "step": 11252 + }, + { + "epoch": 0.22, + "learning_rate": 1.5649489340219796e-07, + "loss": 0.0036, + "step": 11253 + }, + { + "epoch": 0.22, + "learning_rate": 1.5649101005786183e-07, + "loss": 0.015, + "step": 11254 + }, + { + "epoch": 0.22, + "learning_rate": 1.5648712671352568e-07, + "loss": 0.002, + "step": 11255 + }, + { + "epoch": 0.22, + "learning_rate": 1.5648324336918955e-07, + "loss": 0.3843, + "step": 11256 + }, + { + "epoch": 0.22, + "learning_rate": 1.564793600248534e-07, + "loss": 1.0566, + "step": 11257 + }, + { + "epoch": 0.22, + "learning_rate": 1.5647547668051726e-07, + "loss": 0.0037, + "step": 11258 + }, + { + "epoch": 0.22, + "learning_rate": 1.564715933361811e-07, + "loss": 0.0026, + "step": 11259 + }, + { + "epoch": 0.22, + "learning_rate": 1.5646770999184498e-07, + "loss": 0.0455, + "step": 11260 + }, + { + "epoch": 0.22, + "learning_rate": 1.5646382664750883e-07, + "loss": 0.0021, + "step": 11261 + }, + { + "epoch": 0.22, + "learning_rate": 1.564599433031727e-07, + "loss": 0.023, + "step": 11262 + }, + { + "epoch": 0.22, + "learning_rate": 1.5645605995883654e-07, + "loss": 0.0032, + "step": 11263 + }, + { + "epoch": 0.22, + "learning_rate": 1.5645217661450041e-07, + "loss": 0.0033, + "step": 11264 + }, + { + "epoch": 0.22, + "learning_rate": 1.5644829327016426e-07, + "loss": 0.0047, + "step": 11265 + }, + { + "epoch": 0.22, + "learning_rate": 1.5644440992582813e-07, + "loss": 0.0515, + "step": 11266 + }, + { + "epoch": 0.22, + "learning_rate": 1.5644052658149198e-07, + "loss": 0.0045, + "step": 11267 + }, + { + "epoch": 0.22, + "learning_rate": 1.5643664323715585e-07, + "loss": 0.7692, + "step": 11268 + }, + { + "epoch": 0.22, + "learning_rate": 1.564327598928197e-07, + "loss": 0.0025, + "step": 11269 + }, + { + "epoch": 0.22, + "learning_rate": 1.5642887654848356e-07, + "loss": 0.008, + "step": 11270 + }, + { + "epoch": 0.22, + "learning_rate": 1.564249932041474e-07, + "loss": 0.0131, + "step": 11271 + }, + { + "epoch": 0.22, + "learning_rate": 1.5642110985981128e-07, + "loss": 0.0131, + "step": 11272 + }, + { + "epoch": 0.22, + "learning_rate": 1.564172265154751e-07, + "loss": 0.0026, + "step": 11273 + }, + { + "epoch": 0.22, + "learning_rate": 1.5641334317113897e-07, + "loss": 0.003, + "step": 11274 + }, + { + "epoch": 0.22, + "learning_rate": 1.5640945982680281e-07, + "loss": 0.0021, + "step": 11275 + }, + { + "epoch": 0.22, + "learning_rate": 1.5640557648246669e-07, + "loss": 0.0037, + "step": 11276 + }, + { + "epoch": 0.22, + "learning_rate": 1.5640169313813053e-07, + "loss": 0.0033, + "step": 11277 + }, + { + "epoch": 0.22, + "learning_rate": 1.563978097937944e-07, + "loss": 0.0048, + "step": 11278 + }, + { + "epoch": 0.22, + "learning_rate": 1.5639392644945825e-07, + "loss": 0.0024, + "step": 11279 + }, + { + "epoch": 0.22, + "learning_rate": 1.5639004310512212e-07, + "loss": 0.0025, + "step": 11280 + }, + { + "epoch": 0.22, + "learning_rate": 1.5638615976078596e-07, + "loss": 0.0028, + "step": 11281 + }, + { + "epoch": 0.22, + "learning_rate": 1.5638227641644984e-07, + "loss": 0.0515, + "step": 11282 + }, + { + "epoch": 0.22, + "learning_rate": 1.5637839307211368e-07, + "loss": 0.0093, + "step": 11283 + }, + { + "epoch": 0.22, + "learning_rate": 1.5637450972777755e-07, + "loss": 0.0025, + "step": 11284 + }, + { + "epoch": 0.22, + "learning_rate": 1.563706263834414e-07, + "loss": 0.0177, + "step": 11285 + }, + { + "epoch": 0.22, + "learning_rate": 1.5636674303910527e-07, + "loss": 0.0049, + "step": 11286 + }, + { + "epoch": 0.22, + "learning_rate": 1.5636285969476911e-07, + "loss": 0.002, + "step": 11287 + }, + { + "epoch": 0.22, + "learning_rate": 1.5635897635043299e-07, + "loss": 0.0024, + "step": 11288 + }, + { + "epoch": 0.22, + "learning_rate": 1.5635509300609683e-07, + "loss": 0.874, + "step": 11289 + }, + { + "epoch": 0.22, + "learning_rate": 1.563512096617607e-07, + "loss": 0.0032, + "step": 11290 + }, + { + "epoch": 0.22, + "learning_rate": 1.5634732631742455e-07, + "loss": 0.0567, + "step": 11291 + }, + { + "epoch": 0.22, + "learning_rate": 1.5634344297308842e-07, + "loss": 0.0025, + "step": 11292 + }, + { + "epoch": 0.22, + "learning_rate": 1.5633955962875226e-07, + "loss": 0.3527, + "step": 11293 + }, + { + "epoch": 0.22, + "learning_rate": 1.5633567628441613e-07, + "loss": 0.0025, + "step": 11294 + }, + { + "epoch": 0.22, + "learning_rate": 1.5633179294007998e-07, + "loss": 0.1507, + "step": 11295 + }, + { + "epoch": 0.22, + "learning_rate": 1.5632790959574385e-07, + "loss": 0.0032, + "step": 11296 + }, + { + "epoch": 0.22, + "learning_rate": 1.563240262514077e-07, + "loss": 0.0053, + "step": 11297 + }, + { + "epoch": 0.22, + "learning_rate": 1.5632014290707157e-07, + "loss": 0.0024, + "step": 11298 + }, + { + "epoch": 0.22, + "learning_rate": 1.563162595627354e-07, + "loss": 0.1228, + "step": 11299 + }, + { + "epoch": 0.22, + "learning_rate": 1.5631237621839928e-07, + "loss": 0.0025, + "step": 11300 + }, + { + "epoch": 0.22, + "learning_rate": 1.5630849287406313e-07, + "loss": 0.0027, + "step": 11301 + }, + { + "epoch": 0.22, + "learning_rate": 1.56304609529727e-07, + "loss": 0.0018, + "step": 11302 + }, + { + "epoch": 0.22, + "learning_rate": 1.5630072618539085e-07, + "loss": 1.6418, + "step": 11303 + }, + { + "epoch": 0.22, + "learning_rate": 1.5629684284105472e-07, + "loss": 0.0018, + "step": 11304 + }, + { + "epoch": 0.22, + "learning_rate": 1.5629295949671856e-07, + "loss": 0.0059, + "step": 11305 + }, + { + "epoch": 0.22, + "learning_rate": 1.5628907615238243e-07, + "loss": 0.0039, + "step": 11306 + }, + { + "epoch": 0.22, + "learning_rate": 1.5628519280804628e-07, + "loss": 0.3225, + "step": 11307 + }, + { + "epoch": 0.22, + "learning_rate": 1.5628130946371015e-07, + "loss": 0.688, + "step": 11308 + }, + { + "epoch": 0.22, + "learning_rate": 1.56277426119374e-07, + "loss": 0.0021, + "step": 11309 + }, + { + "epoch": 0.22, + "learning_rate": 1.5627354277503787e-07, + "loss": 0.0074, + "step": 11310 + }, + { + "epoch": 0.22, + "learning_rate": 1.562696594307017e-07, + "loss": 0.0036, + "step": 11311 + }, + { + "epoch": 0.22, + "learning_rate": 1.5626577608636558e-07, + "loss": 0.4009, + "step": 11312 + }, + { + "epoch": 0.22, + "learning_rate": 1.5626189274202943e-07, + "loss": 0.9098, + "step": 11313 + }, + { + "epoch": 0.22, + "learning_rate": 1.562580093976933e-07, + "loss": 0.006, + "step": 11314 + }, + { + "epoch": 0.22, + "learning_rate": 1.5625412605335714e-07, + "loss": 0.004, + "step": 11315 + }, + { + "epoch": 0.22, + "learning_rate": 1.5625024270902102e-07, + "loss": 0.0178, + "step": 11316 + }, + { + "epoch": 0.22, + "learning_rate": 1.5624635936468486e-07, + "loss": 0.0017, + "step": 11317 + }, + { + "epoch": 0.22, + "learning_rate": 1.5624247602034873e-07, + "loss": 0.0074, + "step": 11318 + }, + { + "epoch": 0.22, + "learning_rate": 1.5623859267601258e-07, + "loss": 0.0215, + "step": 11319 + }, + { + "epoch": 0.22, + "learning_rate": 1.5623470933167645e-07, + "loss": 0.002, + "step": 11320 + }, + { + "epoch": 0.22, + "learning_rate": 1.562308259873403e-07, + "loss": 0.0031, + "step": 11321 + }, + { + "epoch": 0.22, + "learning_rate": 1.5622694264300417e-07, + "loss": 0.0022, + "step": 11322 + }, + { + "epoch": 0.22, + "learning_rate": 1.56223059298668e-07, + "loss": 0.0866, + "step": 11323 + }, + { + "epoch": 0.22, + "learning_rate": 1.5621917595433188e-07, + "loss": 0.2174, + "step": 11324 + }, + { + "epoch": 0.22, + "learning_rate": 1.5621529260999573e-07, + "loss": 0.0031, + "step": 11325 + }, + { + "epoch": 0.22, + "learning_rate": 1.562114092656596e-07, + "loss": 0.9088, + "step": 11326 + }, + { + "epoch": 0.22, + "learning_rate": 1.5620752592132344e-07, + "loss": 0.0018, + "step": 11327 + }, + { + "epoch": 0.22, + "learning_rate": 1.5620364257698731e-07, + "loss": 0.0028, + "step": 11328 + }, + { + "epoch": 0.22, + "learning_rate": 1.5619975923265116e-07, + "loss": 0.0032, + "step": 11329 + }, + { + "epoch": 0.22, + "learning_rate": 1.5619587588831503e-07, + "loss": 0.002, + "step": 11330 + }, + { + "epoch": 0.22, + "learning_rate": 1.5619199254397885e-07, + "loss": 0.0028, + "step": 11331 + }, + { + "epoch": 0.22, + "learning_rate": 1.5618810919964272e-07, + "loss": 0.3405, + "step": 11332 + }, + { + "epoch": 0.22, + "learning_rate": 1.5618422585530657e-07, + "loss": 0.002, + "step": 11333 + }, + { + "epoch": 0.22, + "learning_rate": 1.5618034251097044e-07, + "loss": 0.546, + "step": 11334 + }, + { + "epoch": 0.22, + "learning_rate": 1.5617645916663428e-07, + "loss": 0.0286, + "step": 11335 + }, + { + "epoch": 0.22, + "learning_rate": 1.5617257582229815e-07, + "loss": 0.0057, + "step": 11336 + }, + { + "epoch": 0.22, + "learning_rate": 1.56168692477962e-07, + "loss": 0.0033, + "step": 11337 + }, + { + "epoch": 0.22, + "learning_rate": 1.5616480913362587e-07, + "loss": 0.0031, + "step": 11338 + }, + { + "epoch": 0.22, + "learning_rate": 1.5616092578928972e-07, + "loss": 0.0045, + "step": 11339 + }, + { + "epoch": 0.22, + "learning_rate": 1.561570424449536e-07, + "loss": 0.0025, + "step": 11340 + }, + { + "epoch": 0.22, + "learning_rate": 1.5615315910061743e-07, + "loss": 0.1762, + "step": 11341 + }, + { + "epoch": 0.22, + "learning_rate": 1.561492757562813e-07, + "loss": 0.0027, + "step": 11342 + }, + { + "epoch": 0.22, + "learning_rate": 1.5614539241194515e-07, + "loss": 0.0146, + "step": 11343 + }, + { + "epoch": 0.22, + "learning_rate": 1.5614150906760902e-07, + "loss": 0.006, + "step": 11344 + }, + { + "epoch": 0.22, + "learning_rate": 1.5613762572327287e-07, + "loss": 0.0025, + "step": 11345 + }, + { + "epoch": 0.22, + "learning_rate": 1.5613374237893674e-07, + "loss": 0.0023, + "step": 11346 + }, + { + "epoch": 0.22, + "learning_rate": 1.5612985903460058e-07, + "loss": 0.5493, + "step": 11347 + }, + { + "epoch": 0.22, + "learning_rate": 1.5612597569026445e-07, + "loss": 0.002, + "step": 11348 + }, + { + "epoch": 0.22, + "learning_rate": 1.561220923459283e-07, + "loss": 0.0028, + "step": 11349 + }, + { + "epoch": 0.22, + "learning_rate": 1.5611820900159217e-07, + "loss": 0.0023, + "step": 11350 + }, + { + "epoch": 0.22, + "learning_rate": 1.5611432565725601e-07, + "loss": 0.002, + "step": 11351 + }, + { + "epoch": 0.22, + "learning_rate": 1.5611044231291989e-07, + "loss": 0.1907, + "step": 11352 + }, + { + "epoch": 0.22, + "learning_rate": 1.5610655896858373e-07, + "loss": 0.0018, + "step": 11353 + }, + { + "epoch": 0.22, + "learning_rate": 1.561026756242476e-07, + "loss": 0.0019, + "step": 11354 + }, + { + "epoch": 0.22, + "learning_rate": 1.5609879227991145e-07, + "loss": 0.4618, + "step": 11355 + }, + { + "epoch": 0.22, + "learning_rate": 1.5609490893557532e-07, + "loss": 0.0021, + "step": 11356 + }, + { + "epoch": 0.22, + "learning_rate": 1.5609102559123916e-07, + "loss": 0.002, + "step": 11357 + }, + { + "epoch": 0.22, + "learning_rate": 1.5608714224690304e-07, + "loss": 0.0023, + "step": 11358 + }, + { + "epoch": 0.22, + "learning_rate": 1.5608325890256688e-07, + "loss": 0.0021, + "step": 11359 + }, + { + "epoch": 0.22, + "learning_rate": 1.5607937555823075e-07, + "loss": 0.0031, + "step": 11360 + }, + { + "epoch": 0.22, + "learning_rate": 1.560754922138946e-07, + "loss": 0.0677, + "step": 11361 + }, + { + "epoch": 0.22, + "learning_rate": 1.5607160886955847e-07, + "loss": 0.0062, + "step": 11362 + }, + { + "epoch": 0.22, + "learning_rate": 1.5606772552522231e-07, + "loss": 0.0017, + "step": 11363 + }, + { + "epoch": 0.22, + "learning_rate": 1.5606384218088619e-07, + "loss": 0.0018, + "step": 11364 + }, + { + "epoch": 0.22, + "learning_rate": 1.5605995883655003e-07, + "loss": 0.0021, + "step": 11365 + }, + { + "epoch": 0.22, + "learning_rate": 1.560560754922139e-07, + "loss": 0.0023, + "step": 11366 + }, + { + "epoch": 0.22, + "learning_rate": 1.5605219214787775e-07, + "loss": 0.003, + "step": 11367 + }, + { + "epoch": 0.22, + "learning_rate": 1.5604830880354162e-07, + "loss": 0.0026, + "step": 11368 + }, + { + "epoch": 0.22, + "learning_rate": 1.5604442545920546e-07, + "loss": 0.002, + "step": 11369 + }, + { + "epoch": 0.22, + "learning_rate": 1.5604054211486933e-07, + "loss": 0.0019, + "step": 11370 + }, + { + "epoch": 0.22, + "learning_rate": 1.5603665877053318e-07, + "loss": 0.003, + "step": 11371 + }, + { + "epoch": 0.22, + "learning_rate": 1.5603277542619705e-07, + "loss": 0.2411, + "step": 11372 + }, + { + "epoch": 0.22, + "learning_rate": 1.560288920818609e-07, + "loss": 0.0019, + "step": 11373 + }, + { + "epoch": 0.22, + "learning_rate": 1.5602500873752477e-07, + "loss": 0.0021, + "step": 11374 + }, + { + "epoch": 0.22, + "learning_rate": 1.560211253931886e-07, + "loss": 0.004, + "step": 11375 + }, + { + "epoch": 0.22, + "learning_rate": 1.5601724204885248e-07, + "loss": 0.0043, + "step": 11376 + }, + { + "epoch": 0.22, + "learning_rate": 1.5601335870451633e-07, + "loss": 0.0021, + "step": 11377 + }, + { + "epoch": 0.22, + "learning_rate": 1.5600947536018017e-07, + "loss": 0.0017, + "step": 11378 + }, + { + "epoch": 0.22, + "learning_rate": 1.5600559201584405e-07, + "loss": 0.0024, + "step": 11379 + }, + { + "epoch": 0.22, + "learning_rate": 1.560017086715079e-07, + "loss": 0.0026, + "step": 11380 + }, + { + "epoch": 0.22, + "learning_rate": 1.5599782532717176e-07, + "loss": 0.221, + "step": 11381 + }, + { + "epoch": 0.22, + "learning_rate": 1.559939419828356e-07, + "loss": 0.5849, + "step": 11382 + }, + { + "epoch": 0.22, + "learning_rate": 1.5599005863849948e-07, + "loss": 0.0034, + "step": 11383 + }, + { + "epoch": 0.22, + "learning_rate": 1.5598617529416332e-07, + "loss": 0.0022, + "step": 11384 + }, + { + "epoch": 0.22, + "learning_rate": 1.559822919498272e-07, + "loss": 0.0026, + "step": 11385 + }, + { + "epoch": 0.22, + "learning_rate": 1.5597840860549104e-07, + "loss": 0.4094, + "step": 11386 + }, + { + "epoch": 0.22, + "learning_rate": 1.559745252611549e-07, + "loss": 0.0035, + "step": 11387 + }, + { + "epoch": 0.22, + "learning_rate": 1.5597064191681876e-07, + "loss": 0.0043, + "step": 11388 + }, + { + "epoch": 0.22, + "learning_rate": 1.559667585724826e-07, + "loss": 0.0018, + "step": 11389 + }, + { + "epoch": 0.22, + "learning_rate": 1.5596287522814647e-07, + "loss": 0.1209, + "step": 11390 + }, + { + "epoch": 0.22, + "learning_rate": 1.5595899188381032e-07, + "loss": 0.0023, + "step": 11391 + }, + { + "epoch": 0.22, + "learning_rate": 1.559551085394742e-07, + "loss": 0.0029, + "step": 11392 + }, + { + "epoch": 0.22, + "learning_rate": 1.5595122519513803e-07, + "loss": 1.0403, + "step": 11393 + }, + { + "epoch": 0.22, + "learning_rate": 1.559473418508019e-07, + "loss": 0.5223, + "step": 11394 + }, + { + "epoch": 0.22, + "learning_rate": 1.5594345850646575e-07, + "loss": 0.0042, + "step": 11395 + }, + { + "epoch": 0.22, + "learning_rate": 1.5593957516212962e-07, + "loss": 0.0024, + "step": 11396 + }, + { + "epoch": 0.22, + "learning_rate": 1.5593569181779347e-07, + "loss": 0.0076, + "step": 11397 + }, + { + "epoch": 0.22, + "learning_rate": 1.5593180847345734e-07, + "loss": 0.0023, + "step": 11398 + }, + { + "epoch": 0.22, + "learning_rate": 1.5592792512912118e-07, + "loss": 0.0041, + "step": 11399 + }, + { + "epoch": 0.22, + "learning_rate": 1.5592404178478506e-07, + "loss": 0.0469, + "step": 11400 + }, + { + "epoch": 0.22, + "learning_rate": 1.559201584404489e-07, + "loss": 0.0019, + "step": 11401 + }, + { + "epoch": 0.22, + "learning_rate": 1.5591627509611277e-07, + "loss": 0.0097, + "step": 11402 + }, + { + "epoch": 0.22, + "learning_rate": 1.5591239175177662e-07, + "loss": 0.8331, + "step": 11403 + }, + { + "epoch": 0.22, + "learning_rate": 1.559085084074405e-07, + "loss": 0.0145, + "step": 11404 + }, + { + "epoch": 0.22, + "learning_rate": 1.5590462506310433e-07, + "loss": 0.0027, + "step": 11405 + }, + { + "epoch": 0.22, + "learning_rate": 1.559007417187682e-07, + "loss": 0.0259, + "step": 11406 + }, + { + "epoch": 0.22, + "learning_rate": 1.5589685837443205e-07, + "loss": 0.0187, + "step": 11407 + }, + { + "epoch": 0.22, + "learning_rate": 1.558929750300959e-07, + "loss": 0.0022, + "step": 11408 + }, + { + "epoch": 0.22, + "learning_rate": 1.5588909168575977e-07, + "loss": 0.0033, + "step": 11409 + }, + { + "epoch": 0.22, + "learning_rate": 1.558852083414236e-07, + "loss": 0.0103, + "step": 11410 + }, + { + "epoch": 0.22, + "learning_rate": 1.5588132499708748e-07, + "loss": 0.0024, + "step": 11411 + }, + { + "epoch": 0.22, + "learning_rate": 1.5587744165275133e-07, + "loss": 0.0022, + "step": 11412 + }, + { + "epoch": 0.22, + "learning_rate": 1.558735583084152e-07, + "loss": 0.0091, + "step": 11413 + }, + { + "epoch": 0.22, + "learning_rate": 1.5586967496407904e-07, + "loss": 0.002, + "step": 11414 + }, + { + "epoch": 0.22, + "learning_rate": 1.5586579161974292e-07, + "loss": 0.0024, + "step": 11415 + }, + { + "epoch": 0.22, + "learning_rate": 1.5586190827540676e-07, + "loss": 0.0025, + "step": 11416 + }, + { + "epoch": 0.22, + "learning_rate": 1.5585802493107063e-07, + "loss": 0.0047, + "step": 11417 + }, + { + "epoch": 0.22, + "learning_rate": 1.5585414158673448e-07, + "loss": 0.0076, + "step": 11418 + }, + { + "epoch": 0.22, + "learning_rate": 1.5585025824239835e-07, + "loss": 0.0606, + "step": 11419 + }, + { + "epoch": 0.22, + "learning_rate": 1.558463748980622e-07, + "loss": 0.6909, + "step": 11420 + }, + { + "epoch": 0.22, + "learning_rate": 1.5584249155372607e-07, + "loss": 0.0076, + "step": 11421 + }, + { + "epoch": 0.22, + "learning_rate": 1.558386082093899e-07, + "loss": 0.7069, + "step": 11422 + }, + { + "epoch": 0.22, + "learning_rate": 1.5583472486505378e-07, + "loss": 0.0119, + "step": 11423 + }, + { + "epoch": 0.22, + "learning_rate": 1.5583084152071763e-07, + "loss": 0.0035, + "step": 11424 + }, + { + "epoch": 0.22, + "learning_rate": 1.558269581763815e-07, + "loss": 0.002, + "step": 11425 + }, + { + "epoch": 0.22, + "learning_rate": 1.5582307483204534e-07, + "loss": 0.3678, + "step": 11426 + }, + { + "epoch": 0.22, + "learning_rate": 1.5581919148770921e-07, + "loss": 0.0032, + "step": 11427 + }, + { + "epoch": 0.22, + "learning_rate": 1.5581530814337306e-07, + "loss": 0.0022, + "step": 11428 + }, + { + "epoch": 0.22, + "learning_rate": 1.5581142479903693e-07, + "loss": 0.0017, + "step": 11429 + }, + { + "epoch": 0.22, + "learning_rate": 1.5580754145470078e-07, + "loss": 0.0019, + "step": 11430 + }, + { + "epoch": 0.22, + "learning_rate": 1.5580365811036465e-07, + "loss": 0.8367, + "step": 11431 + }, + { + "epoch": 0.22, + "learning_rate": 1.557997747660285e-07, + "loss": 0.0038, + "step": 11432 + }, + { + "epoch": 0.22, + "learning_rate": 1.5579589142169236e-07, + "loss": 0.0021, + "step": 11433 + }, + { + "epoch": 0.22, + "learning_rate": 1.557920080773562e-07, + "loss": 0.0019, + "step": 11434 + }, + { + "epoch": 0.22, + "learning_rate": 1.5578812473302008e-07, + "loss": 0.0019, + "step": 11435 + }, + { + "epoch": 0.22, + "learning_rate": 1.5578424138868393e-07, + "loss": 0.0141, + "step": 11436 + }, + { + "epoch": 0.22, + "learning_rate": 1.557803580443478e-07, + "loss": 0.0045, + "step": 11437 + }, + { + "epoch": 0.22, + "learning_rate": 1.5577647470001164e-07, + "loss": 0.0028, + "step": 11438 + }, + { + "epoch": 0.22, + "learning_rate": 1.5577259135567551e-07, + "loss": 0.0019, + "step": 11439 + }, + { + "epoch": 0.22, + "learning_rate": 1.5576870801133936e-07, + "loss": 0.0024, + "step": 11440 + }, + { + "epoch": 0.22, + "learning_rate": 1.5576482466700323e-07, + "loss": 0.003, + "step": 11441 + }, + { + "epoch": 0.22, + "learning_rate": 1.5576094132266708e-07, + "loss": 0.0023, + "step": 11442 + }, + { + "epoch": 0.22, + "learning_rate": 1.5575705797833095e-07, + "loss": 0.0236, + "step": 11443 + }, + { + "epoch": 0.22, + "learning_rate": 1.557531746339948e-07, + "loss": 0.0043, + "step": 11444 + }, + { + "epoch": 0.22, + "learning_rate": 1.5574929128965866e-07, + "loss": 0.0022, + "step": 11445 + }, + { + "epoch": 0.22, + "learning_rate": 1.557454079453225e-07, + "loss": 0.0021, + "step": 11446 + }, + { + "epoch": 0.22, + "learning_rate": 1.5574152460098635e-07, + "loss": 0.0025, + "step": 11447 + }, + { + "epoch": 0.22, + "learning_rate": 1.557376412566502e-07, + "loss": 0.0018, + "step": 11448 + }, + { + "epoch": 0.22, + "learning_rate": 1.5573375791231407e-07, + "loss": 0.0041, + "step": 11449 + }, + { + "epoch": 0.22, + "learning_rate": 1.5572987456797791e-07, + "loss": 0.0022, + "step": 11450 + }, + { + "epoch": 0.22, + "learning_rate": 1.5572599122364179e-07, + "loss": 0.0029, + "step": 11451 + }, + { + "epoch": 0.22, + "learning_rate": 1.5572210787930563e-07, + "loss": 0.65, + "step": 11452 + }, + { + "epoch": 0.22, + "learning_rate": 1.557182245349695e-07, + "loss": 0.2982, + "step": 11453 + }, + { + "epoch": 0.22, + "learning_rate": 1.5571434119063335e-07, + "loss": 0.002, + "step": 11454 + }, + { + "epoch": 0.22, + "learning_rate": 1.5571045784629722e-07, + "loss": 0.003, + "step": 11455 + }, + { + "epoch": 0.22, + "learning_rate": 1.5570657450196106e-07, + "loss": 0.7271, + "step": 11456 + }, + { + "epoch": 0.22, + "learning_rate": 1.5570269115762494e-07, + "loss": 0.0022, + "step": 11457 + }, + { + "epoch": 0.22, + "learning_rate": 1.5569880781328878e-07, + "loss": 0.002, + "step": 11458 + }, + { + "epoch": 0.22, + "learning_rate": 1.5569492446895265e-07, + "loss": 0.0139, + "step": 11459 + }, + { + "epoch": 0.22, + "learning_rate": 1.556910411246165e-07, + "loss": 0.0157, + "step": 11460 + }, + { + "epoch": 0.22, + "learning_rate": 1.5568715778028037e-07, + "loss": 0.0022, + "step": 11461 + }, + { + "epoch": 0.22, + "learning_rate": 1.5568327443594421e-07, + "loss": 0.0021, + "step": 11462 + }, + { + "epoch": 0.22, + "learning_rate": 1.5567939109160809e-07, + "loss": 0.0018, + "step": 11463 + }, + { + "epoch": 0.22, + "learning_rate": 1.5567550774727193e-07, + "loss": 0.0019, + "step": 11464 + }, + { + "epoch": 0.22, + "learning_rate": 1.556716244029358e-07, + "loss": 0.0022, + "step": 11465 + }, + { + "epoch": 0.22, + "learning_rate": 1.5566774105859965e-07, + "loss": 0.0019, + "step": 11466 + }, + { + "epoch": 0.22, + "learning_rate": 1.5566385771426352e-07, + "loss": 0.0418, + "step": 11467 + }, + { + "epoch": 0.22, + "learning_rate": 1.5565997436992736e-07, + "loss": 0.0021, + "step": 11468 + }, + { + "epoch": 0.22, + "learning_rate": 1.5565609102559123e-07, + "loss": 0.0021, + "step": 11469 + }, + { + "epoch": 0.22, + "learning_rate": 1.5565220768125508e-07, + "loss": 0.0031, + "step": 11470 + }, + { + "epoch": 0.22, + "learning_rate": 1.5564832433691895e-07, + "loss": 0.002, + "step": 11471 + }, + { + "epoch": 0.22, + "learning_rate": 1.556444409925828e-07, + "loss": 0.0038, + "step": 11472 + }, + { + "epoch": 0.22, + "learning_rate": 1.5564055764824667e-07, + "loss": 0.002, + "step": 11473 + }, + { + "epoch": 0.22, + "learning_rate": 1.556366743039105e-07, + "loss": 0.0024, + "step": 11474 + }, + { + "epoch": 0.22, + "learning_rate": 1.5563279095957438e-07, + "loss": 0.0018, + "step": 11475 + }, + { + "epoch": 0.22, + "learning_rate": 1.5562890761523823e-07, + "loss": 0.0026, + "step": 11476 + }, + { + "epoch": 0.22, + "learning_rate": 1.556250242709021e-07, + "loss": 0.0033, + "step": 11477 + }, + { + "epoch": 0.22, + "learning_rate": 1.5562114092656595e-07, + "loss": 0.0019, + "step": 11478 + }, + { + "epoch": 0.22, + "learning_rate": 1.5561725758222982e-07, + "loss": 0.0022, + "step": 11479 + }, + { + "epoch": 0.22, + "learning_rate": 1.5561337423789366e-07, + "loss": 0.0033, + "step": 11480 + }, + { + "epoch": 0.22, + "learning_rate": 1.5560949089355753e-07, + "loss": 0.0014, + "step": 11481 + }, + { + "epoch": 0.22, + "learning_rate": 1.5560560754922138e-07, + "loss": 0.0031, + "step": 11482 + }, + { + "epoch": 0.22, + "learning_rate": 1.5560172420488525e-07, + "loss": 0.3323, + "step": 11483 + }, + { + "epoch": 0.22, + "learning_rate": 1.555978408605491e-07, + "loss": 1.0676, + "step": 11484 + }, + { + "epoch": 0.22, + "learning_rate": 1.5559395751621297e-07, + "loss": 0.0023, + "step": 11485 + }, + { + "epoch": 0.22, + "learning_rate": 1.555900741718768e-07, + "loss": 0.1098, + "step": 11486 + }, + { + "epoch": 0.22, + "learning_rate": 1.5558619082754068e-07, + "loss": 0.8976, + "step": 11487 + }, + { + "epoch": 0.22, + "learning_rate": 1.5558230748320453e-07, + "loss": 0.3303, + "step": 11488 + }, + { + "epoch": 0.22, + "learning_rate": 1.555784241388684e-07, + "loss": 0.0021, + "step": 11489 + }, + { + "epoch": 0.22, + "learning_rate": 1.5557454079453224e-07, + "loss": 0.0063, + "step": 11490 + }, + { + "epoch": 0.22, + "learning_rate": 1.5557065745019612e-07, + "loss": 0.0028, + "step": 11491 + }, + { + "epoch": 0.22, + "learning_rate": 1.5556677410585996e-07, + "loss": 0.0021, + "step": 11492 + }, + { + "epoch": 0.22, + "learning_rate": 1.5556289076152383e-07, + "loss": 0.5865, + "step": 11493 + }, + { + "epoch": 0.22, + "learning_rate": 1.5555900741718768e-07, + "loss": 0.5018, + "step": 11494 + }, + { + "epoch": 0.22, + "learning_rate": 1.5555512407285155e-07, + "loss": 0.0021, + "step": 11495 + }, + { + "epoch": 0.22, + "learning_rate": 1.555512407285154e-07, + "loss": 0.8844, + "step": 11496 + }, + { + "epoch": 0.22, + "learning_rate": 1.5554735738417927e-07, + "loss": 0.0019, + "step": 11497 + }, + { + "epoch": 0.22, + "learning_rate": 1.555434740398431e-07, + "loss": 0.0021, + "step": 11498 + }, + { + "epoch": 0.22, + "learning_rate": 1.5553959069550698e-07, + "loss": 0.003, + "step": 11499 + }, + { + "epoch": 0.22, + "learning_rate": 1.5553570735117083e-07, + "loss": 0.0055, + "step": 11500 + }, + { + "epoch": 0.22, + "learning_rate": 1.555318240068347e-07, + "loss": 0.023, + "step": 11501 + }, + { + "epoch": 0.22, + "learning_rate": 1.5552794066249854e-07, + "loss": 0.0067, + "step": 11502 + }, + { + "epoch": 0.22, + "learning_rate": 1.5552405731816241e-07, + "loss": 0.0021, + "step": 11503 + }, + { + "epoch": 0.22, + "learning_rate": 1.5552017397382626e-07, + "loss": 0.1687, + "step": 11504 + }, + { + "epoch": 0.22, + "learning_rate": 1.555162906294901e-07, + "loss": 0.0023, + "step": 11505 + }, + { + "epoch": 0.22, + "learning_rate": 1.5551240728515395e-07, + "loss": 0.0018, + "step": 11506 + }, + { + "epoch": 0.22, + "learning_rate": 1.5550852394081782e-07, + "loss": 0.0019, + "step": 11507 + }, + { + "epoch": 0.22, + "learning_rate": 1.5550464059648167e-07, + "loss": 0.0117, + "step": 11508 + }, + { + "epoch": 0.22, + "learning_rate": 1.5550075725214554e-07, + "loss": 0.0026, + "step": 11509 + }, + { + "epoch": 0.22, + "learning_rate": 1.5549687390780938e-07, + "loss": 0.0021, + "step": 11510 + }, + { + "epoch": 0.22, + "learning_rate": 1.5549299056347325e-07, + "loss": 0.0027, + "step": 11511 + }, + { + "epoch": 0.22, + "learning_rate": 1.554891072191371e-07, + "loss": 0.518, + "step": 11512 + }, + { + "epoch": 0.22, + "learning_rate": 1.5548522387480097e-07, + "loss": 0.9211, + "step": 11513 + }, + { + "epoch": 0.22, + "learning_rate": 1.5548134053046482e-07, + "loss": 0.0021, + "step": 11514 + }, + { + "epoch": 0.22, + "learning_rate": 1.554774571861287e-07, + "loss": 0.0021, + "step": 11515 + }, + { + "epoch": 0.22, + "learning_rate": 1.5547357384179253e-07, + "loss": 0.0076, + "step": 11516 + }, + { + "epoch": 0.22, + "learning_rate": 1.554696904974564e-07, + "loss": 0.0151, + "step": 11517 + }, + { + "epoch": 0.22, + "learning_rate": 1.5546580715312025e-07, + "loss": 0.0021, + "step": 11518 + }, + { + "epoch": 0.22, + "learning_rate": 1.5546192380878412e-07, + "loss": 0.1169, + "step": 11519 + }, + { + "epoch": 0.22, + "learning_rate": 1.5545804046444797e-07, + "loss": 0.0021, + "step": 11520 + }, + { + "epoch": 0.22, + "learning_rate": 1.5545415712011184e-07, + "loss": 0.0044, + "step": 11521 + }, + { + "epoch": 0.22, + "learning_rate": 1.5545027377577568e-07, + "loss": 0.0025, + "step": 11522 + }, + { + "epoch": 0.22, + "learning_rate": 1.5544639043143955e-07, + "loss": 0.0049, + "step": 11523 + }, + { + "epoch": 0.22, + "learning_rate": 1.554425070871034e-07, + "loss": 0.0033, + "step": 11524 + }, + { + "epoch": 0.22, + "learning_rate": 1.5543862374276727e-07, + "loss": 0.0022, + "step": 11525 + }, + { + "epoch": 0.22, + "learning_rate": 1.5543474039843111e-07, + "loss": 0.0019, + "step": 11526 + }, + { + "epoch": 0.22, + "learning_rate": 1.5543085705409499e-07, + "loss": 0.0027, + "step": 11527 + }, + { + "epoch": 0.22, + "learning_rate": 1.5542697370975883e-07, + "loss": 0.0019, + "step": 11528 + }, + { + "epoch": 0.22, + "learning_rate": 1.554230903654227e-07, + "loss": 0.0038, + "step": 11529 + }, + { + "epoch": 0.22, + "learning_rate": 1.5541920702108655e-07, + "loss": 0.002, + "step": 11530 + }, + { + "epoch": 0.22, + "learning_rate": 1.5541532367675042e-07, + "loss": 0.0024, + "step": 11531 + }, + { + "epoch": 0.22, + "learning_rate": 1.5541144033241426e-07, + "loss": 0.0019, + "step": 11532 + }, + { + "epoch": 0.22, + "learning_rate": 1.5540755698807814e-07, + "loss": 0.0022, + "step": 11533 + }, + { + "epoch": 0.22, + "learning_rate": 1.5540367364374198e-07, + "loss": 0.0034, + "step": 11534 + }, + { + "epoch": 0.22, + "learning_rate": 1.5539979029940585e-07, + "loss": 1.2333, + "step": 11535 + }, + { + "epoch": 0.22, + "learning_rate": 1.553959069550697e-07, + "loss": 0.7371, + "step": 11536 + }, + { + "epoch": 0.22, + "learning_rate": 1.5539202361073357e-07, + "loss": 0.0037, + "step": 11537 + }, + { + "epoch": 0.22, + "learning_rate": 1.5538814026639741e-07, + "loss": 0.0026, + "step": 11538 + }, + { + "epoch": 0.22, + "learning_rate": 1.5538425692206129e-07, + "loss": 0.0029, + "step": 11539 + }, + { + "epoch": 0.22, + "learning_rate": 1.5538037357772513e-07, + "loss": 0.0022, + "step": 11540 + }, + { + "epoch": 0.22, + "learning_rate": 1.55376490233389e-07, + "loss": 0.0027, + "step": 11541 + }, + { + "epoch": 0.22, + "learning_rate": 1.5537260688905285e-07, + "loss": 0.0021, + "step": 11542 + }, + { + "epoch": 0.22, + "learning_rate": 1.5536872354471672e-07, + "loss": 0.0019, + "step": 11543 + }, + { + "epoch": 0.22, + "learning_rate": 1.5536484020038056e-07, + "loss": 0.0025, + "step": 11544 + }, + { + "epoch": 0.22, + "learning_rate": 1.5536095685604443e-07, + "loss": 0.0023, + "step": 11545 + }, + { + "epoch": 0.22, + "learning_rate": 1.5535707351170828e-07, + "loss": 0.0024, + "step": 11546 + }, + { + "epoch": 0.22, + "learning_rate": 1.5535319016737215e-07, + "loss": 0.0209, + "step": 11547 + }, + { + "epoch": 0.22, + "learning_rate": 1.55349306823036e-07, + "loss": 0.0173, + "step": 11548 + }, + { + "epoch": 0.22, + "learning_rate": 1.5534542347869987e-07, + "loss": 0.4893, + "step": 11549 + }, + { + "epoch": 0.22, + "learning_rate": 1.553415401343637e-07, + "loss": 0.0334, + "step": 11550 + }, + { + "epoch": 0.22, + "learning_rate": 1.5533765679002758e-07, + "loss": 0.0025, + "step": 11551 + }, + { + "epoch": 0.22, + "learning_rate": 1.5533377344569143e-07, + "loss": 0.0021, + "step": 11552 + }, + { + "epoch": 0.22, + "learning_rate": 1.553298901013553e-07, + "loss": 0.0022, + "step": 11553 + }, + { + "epoch": 0.22, + "learning_rate": 1.5532600675701915e-07, + "loss": 0.003, + "step": 11554 + }, + { + "epoch": 0.22, + "learning_rate": 1.55322123412683e-07, + "loss": 0.0051, + "step": 11555 + }, + { + "epoch": 0.22, + "learning_rate": 1.5531824006834686e-07, + "loss": 0.5967, + "step": 11556 + }, + { + "epoch": 0.22, + "learning_rate": 1.553143567240107e-07, + "loss": 0.0025, + "step": 11557 + }, + { + "epoch": 0.22, + "learning_rate": 1.5531047337967458e-07, + "loss": 0.0107, + "step": 11558 + }, + { + "epoch": 0.22, + "learning_rate": 1.5530659003533842e-07, + "loss": 0.0046, + "step": 11559 + }, + { + "epoch": 0.22, + "learning_rate": 1.553027066910023e-07, + "loss": 0.0033, + "step": 11560 + }, + { + "epoch": 0.22, + "learning_rate": 1.5529882334666614e-07, + "loss": 0.9409, + "step": 11561 + }, + { + "epoch": 0.22, + "learning_rate": 1.5529494000233e-07, + "loss": 0.0023, + "step": 11562 + }, + { + "epoch": 0.22, + "learning_rate": 1.5529105665799386e-07, + "loss": 0.1169, + "step": 11563 + }, + { + "epoch": 0.22, + "learning_rate": 1.552871733136577e-07, + "loss": 0.0017, + "step": 11564 + }, + { + "epoch": 0.22, + "learning_rate": 1.5528328996932157e-07, + "loss": 0.0022, + "step": 11565 + }, + { + "epoch": 0.22, + "learning_rate": 1.5527940662498542e-07, + "loss": 0.0025, + "step": 11566 + }, + { + "epoch": 0.22, + "learning_rate": 1.552755232806493e-07, + "loss": 0.0581, + "step": 11567 + }, + { + "epoch": 0.22, + "learning_rate": 1.5527163993631313e-07, + "loss": 0.0032, + "step": 11568 + }, + { + "epoch": 0.22, + "learning_rate": 1.55267756591977e-07, + "loss": 0.0022, + "step": 11569 + }, + { + "epoch": 0.22, + "learning_rate": 1.5526387324764085e-07, + "loss": 0.002, + "step": 11570 + }, + { + "epoch": 0.22, + "learning_rate": 1.5525998990330472e-07, + "loss": 0.0018, + "step": 11571 + }, + { + "epoch": 0.22, + "learning_rate": 1.5525610655896857e-07, + "loss": 0.0021, + "step": 11572 + }, + { + "epoch": 0.22, + "learning_rate": 1.5525222321463244e-07, + "loss": 0.002, + "step": 11573 + }, + { + "epoch": 0.22, + "learning_rate": 1.5524833987029628e-07, + "loss": 0.0022, + "step": 11574 + }, + { + "epoch": 0.22, + "learning_rate": 1.5524445652596016e-07, + "loss": 0.0033, + "step": 11575 + }, + { + "epoch": 0.22, + "learning_rate": 1.55240573181624e-07, + "loss": 0.4003, + "step": 11576 + }, + { + "epoch": 0.22, + "learning_rate": 1.5523668983728787e-07, + "loss": 0.0023, + "step": 11577 + }, + { + "epoch": 0.22, + "learning_rate": 1.5523280649295172e-07, + "loss": 0.0031, + "step": 11578 + }, + { + "epoch": 0.22, + "learning_rate": 1.552289231486156e-07, + "loss": 0.0064, + "step": 11579 + }, + { + "epoch": 0.22, + "learning_rate": 1.5522503980427943e-07, + "loss": 0.0022, + "step": 11580 + }, + { + "epoch": 0.22, + "learning_rate": 1.552211564599433e-07, + "loss": 0.0246, + "step": 11581 + }, + { + "epoch": 0.22, + "learning_rate": 1.5521727311560715e-07, + "loss": 0.0022, + "step": 11582 + }, + { + "epoch": 0.22, + "learning_rate": 1.5521338977127102e-07, + "loss": 0.0182, + "step": 11583 + }, + { + "epoch": 0.22, + "learning_rate": 1.5520950642693487e-07, + "loss": 0.0094, + "step": 11584 + }, + { + "epoch": 0.22, + "learning_rate": 1.552056230825987e-07, + "loss": 0.0029, + "step": 11585 + }, + { + "epoch": 0.22, + "learning_rate": 1.5520173973826258e-07, + "loss": 0.0031, + "step": 11586 + }, + { + "epoch": 0.22, + "learning_rate": 1.5519785639392643e-07, + "loss": 0.0104, + "step": 11587 + }, + { + "epoch": 0.22, + "learning_rate": 1.551939730495903e-07, + "loss": 0.2497, + "step": 11588 + }, + { + "epoch": 0.22, + "learning_rate": 1.5519008970525414e-07, + "loss": 0.0034, + "step": 11589 + }, + { + "epoch": 0.22, + "learning_rate": 1.5518620636091802e-07, + "loss": 0.0029, + "step": 11590 + }, + { + "epoch": 0.22, + "learning_rate": 1.5518232301658186e-07, + "loss": 0.0119, + "step": 11591 + }, + { + "epoch": 0.22, + "learning_rate": 1.5517843967224573e-07, + "loss": 0.0031, + "step": 11592 + }, + { + "epoch": 0.22, + "learning_rate": 1.5517455632790958e-07, + "loss": 0.0061, + "step": 11593 + }, + { + "epoch": 0.22, + "learning_rate": 1.5517067298357345e-07, + "loss": 0.0018, + "step": 11594 + }, + { + "epoch": 0.22, + "learning_rate": 1.551667896392373e-07, + "loss": 0.9256, + "step": 11595 + }, + { + "epoch": 0.22, + "learning_rate": 1.5516290629490117e-07, + "loss": 0.0021, + "step": 11596 + }, + { + "epoch": 0.22, + "learning_rate": 1.55159022950565e-07, + "loss": 0.1586, + "step": 11597 + }, + { + "epoch": 0.22, + "learning_rate": 1.5515513960622888e-07, + "loss": 0.0316, + "step": 11598 + }, + { + "epoch": 0.22, + "learning_rate": 1.5515125626189273e-07, + "loss": 0.0017, + "step": 11599 + }, + { + "epoch": 0.23, + "learning_rate": 1.551473729175566e-07, + "loss": 0.0077, + "step": 11600 + }, + { + "epoch": 0.23, + "learning_rate": 1.5514348957322044e-07, + "loss": 0.3553, + "step": 11601 + }, + { + "epoch": 0.23, + "learning_rate": 1.5513960622888431e-07, + "loss": 0.0021, + "step": 11602 + }, + { + "epoch": 0.23, + "learning_rate": 1.5513572288454816e-07, + "loss": 0.0028, + "step": 11603 + }, + { + "epoch": 0.23, + "learning_rate": 1.5513183954021203e-07, + "loss": 0.1496, + "step": 11604 + }, + { + "epoch": 0.23, + "learning_rate": 1.5512795619587588e-07, + "loss": 0.0018, + "step": 11605 + }, + { + "epoch": 0.23, + "learning_rate": 1.5512407285153975e-07, + "loss": 0.4088, + "step": 11606 + }, + { + "epoch": 0.23, + "learning_rate": 1.551201895072036e-07, + "loss": 0.3772, + "step": 11607 + }, + { + "epoch": 0.23, + "learning_rate": 1.5511630616286746e-07, + "loss": 0.0022, + "step": 11608 + }, + { + "epoch": 0.23, + "learning_rate": 1.551124228185313e-07, + "loss": 0.002, + "step": 11609 + }, + { + "epoch": 0.23, + "learning_rate": 1.5510853947419518e-07, + "loss": 0.0024, + "step": 11610 + }, + { + "epoch": 0.23, + "learning_rate": 1.5510465612985903e-07, + "loss": 0.0355, + "step": 11611 + }, + { + "epoch": 0.23, + "learning_rate": 1.551007727855229e-07, + "loss": 0.0076, + "step": 11612 + }, + { + "epoch": 0.23, + "learning_rate": 1.5509688944118674e-07, + "loss": 0.0034, + "step": 11613 + }, + { + "epoch": 0.23, + "learning_rate": 1.5509300609685061e-07, + "loss": 0.0029, + "step": 11614 + }, + { + "epoch": 0.23, + "learning_rate": 1.5508912275251446e-07, + "loss": 0.0025, + "step": 11615 + }, + { + "epoch": 0.23, + "learning_rate": 1.5508523940817833e-07, + "loss": 1.2175, + "step": 11616 + }, + { + "epoch": 0.23, + "learning_rate": 1.5508135606384218e-07, + "loss": 0.004, + "step": 11617 + }, + { + "epoch": 0.23, + "learning_rate": 1.5507747271950605e-07, + "loss": 0.0021, + "step": 11618 + }, + { + "epoch": 0.23, + "learning_rate": 1.550735893751699e-07, + "loss": 0.4092, + "step": 11619 + }, + { + "epoch": 0.23, + "learning_rate": 1.5506970603083376e-07, + "loss": 0.0461, + "step": 11620 + }, + { + "epoch": 0.23, + "learning_rate": 1.5506582268649758e-07, + "loss": 0.0041, + "step": 11621 + }, + { + "epoch": 0.23, + "learning_rate": 1.5506193934216145e-07, + "loss": 0.0041, + "step": 11622 + }, + { + "epoch": 0.23, + "learning_rate": 1.550580559978253e-07, + "loss": 0.0067, + "step": 11623 + }, + { + "epoch": 0.23, + "learning_rate": 1.5505417265348917e-07, + "loss": 0.0018, + "step": 11624 + }, + { + "epoch": 0.23, + "learning_rate": 1.5505028930915301e-07, + "loss": 0.0019, + "step": 11625 + }, + { + "epoch": 0.23, + "learning_rate": 1.5504640596481689e-07, + "loss": 0.4389, + "step": 11626 + }, + { + "epoch": 0.23, + "learning_rate": 1.5504252262048073e-07, + "loss": 0.0152, + "step": 11627 + }, + { + "epoch": 0.23, + "learning_rate": 1.550386392761446e-07, + "loss": 0.0022, + "step": 11628 + }, + { + "epoch": 0.23, + "learning_rate": 1.5503475593180845e-07, + "loss": 0.0021, + "step": 11629 + }, + { + "epoch": 0.23, + "learning_rate": 1.5503087258747232e-07, + "loss": 0.0025, + "step": 11630 + }, + { + "epoch": 0.23, + "learning_rate": 1.5502698924313616e-07, + "loss": 0.0024, + "step": 11631 + }, + { + "epoch": 0.23, + "learning_rate": 1.5502310589880004e-07, + "loss": 0.0023, + "step": 11632 + }, + { + "epoch": 0.23, + "learning_rate": 1.5501922255446388e-07, + "loss": 0.0022, + "step": 11633 + }, + { + "epoch": 0.23, + "learning_rate": 1.5501533921012775e-07, + "loss": 0.0456, + "step": 11634 + }, + { + "epoch": 0.23, + "learning_rate": 1.550114558657916e-07, + "loss": 0.0022, + "step": 11635 + }, + { + "epoch": 0.23, + "learning_rate": 1.5500757252145547e-07, + "loss": 0.002, + "step": 11636 + }, + { + "epoch": 0.23, + "learning_rate": 1.5500368917711931e-07, + "loss": 0.0037, + "step": 11637 + }, + { + "epoch": 0.23, + "learning_rate": 1.5499980583278319e-07, + "loss": 0.002, + "step": 11638 + }, + { + "epoch": 0.23, + "learning_rate": 1.5499592248844703e-07, + "loss": 0.3285, + "step": 11639 + }, + { + "epoch": 0.23, + "learning_rate": 1.549920391441109e-07, + "loss": 0.4731, + "step": 11640 + }, + { + "epoch": 0.23, + "learning_rate": 1.5498815579977475e-07, + "loss": 0.0033, + "step": 11641 + }, + { + "epoch": 0.23, + "learning_rate": 1.5498427245543862e-07, + "loss": 0.0024, + "step": 11642 + }, + { + "epoch": 0.23, + "learning_rate": 1.5498038911110246e-07, + "loss": 0.0023, + "step": 11643 + }, + { + "epoch": 0.23, + "learning_rate": 1.5497650576676633e-07, + "loss": 0.0034, + "step": 11644 + }, + { + "epoch": 0.23, + "learning_rate": 1.5497262242243018e-07, + "loss": 0.0019, + "step": 11645 + }, + { + "epoch": 0.23, + "learning_rate": 1.5496873907809405e-07, + "loss": 0.0015, + "step": 11646 + }, + { + "epoch": 0.23, + "learning_rate": 1.549648557337579e-07, + "loss": 0.002, + "step": 11647 + }, + { + "epoch": 0.23, + "learning_rate": 1.5496097238942177e-07, + "loss": 0.2804, + "step": 11648 + }, + { + "epoch": 0.23, + "learning_rate": 1.549570890450856e-07, + "loss": 0.0078, + "step": 11649 + }, + { + "epoch": 0.23, + "learning_rate": 1.5495320570074948e-07, + "loss": 0.0018, + "step": 11650 + }, + { + "epoch": 0.23, + "learning_rate": 1.5494932235641333e-07, + "loss": 0.0023, + "step": 11651 + }, + { + "epoch": 0.23, + "learning_rate": 1.549454390120772e-07, + "loss": 0.0018, + "step": 11652 + }, + { + "epoch": 0.23, + "learning_rate": 1.5494155566774105e-07, + "loss": 0.002, + "step": 11653 + }, + { + "epoch": 0.23, + "learning_rate": 1.5493767232340492e-07, + "loss": 0.0129, + "step": 11654 + }, + { + "epoch": 0.23, + "learning_rate": 1.5493378897906876e-07, + "loss": 0.0022, + "step": 11655 + }, + { + "epoch": 0.23, + "learning_rate": 1.5492990563473263e-07, + "loss": 0.002, + "step": 11656 + }, + { + "epoch": 0.23, + "learning_rate": 1.5492602229039648e-07, + "loss": 0.0033, + "step": 11657 + }, + { + "epoch": 0.23, + "learning_rate": 1.5492213894606035e-07, + "loss": 0.0039, + "step": 11658 + }, + { + "epoch": 0.23, + "learning_rate": 1.549182556017242e-07, + "loss": 0.0024, + "step": 11659 + }, + { + "epoch": 0.23, + "learning_rate": 1.5491437225738807e-07, + "loss": 0.0018, + "step": 11660 + }, + { + "epoch": 0.23, + "learning_rate": 1.549104889130519e-07, + "loss": 0.0016, + "step": 11661 + }, + { + "epoch": 0.23, + "learning_rate": 1.5490660556871578e-07, + "loss": 0.3573, + "step": 11662 + }, + { + "epoch": 0.23, + "learning_rate": 1.5490272222437963e-07, + "loss": 0.5072, + "step": 11663 + }, + { + "epoch": 0.23, + "learning_rate": 1.548988388800435e-07, + "loss": 0.0015, + "step": 11664 + }, + { + "epoch": 0.23, + "learning_rate": 1.5489495553570734e-07, + "loss": 0.4276, + "step": 11665 + }, + { + "epoch": 0.23, + "learning_rate": 1.5489107219137122e-07, + "loss": 0.0202, + "step": 11666 + }, + { + "epoch": 0.23, + "learning_rate": 1.5488718884703506e-07, + "loss": 0.0096, + "step": 11667 + }, + { + "epoch": 0.23, + "learning_rate": 1.5488330550269893e-07, + "loss": 0.0023, + "step": 11668 + }, + { + "epoch": 0.23, + "learning_rate": 1.5487942215836278e-07, + "loss": 1.4773, + "step": 11669 + }, + { + "epoch": 0.23, + "learning_rate": 1.5487553881402665e-07, + "loss": 0.6224, + "step": 11670 + }, + { + "epoch": 0.23, + "learning_rate": 1.548716554696905e-07, + "loss": 0.0021, + "step": 11671 + }, + { + "epoch": 0.23, + "learning_rate": 1.5486777212535437e-07, + "loss": 1.0979, + "step": 11672 + }, + { + "epoch": 0.23, + "learning_rate": 1.548638887810182e-07, + "loss": 0.0024, + "step": 11673 + }, + { + "epoch": 0.23, + "learning_rate": 1.5486000543668208e-07, + "loss": 0.0022, + "step": 11674 + }, + { + "epoch": 0.23, + "learning_rate": 1.5485612209234593e-07, + "loss": 0.0463, + "step": 11675 + }, + { + "epoch": 0.23, + "learning_rate": 1.548522387480098e-07, + "loss": 0.0022, + "step": 11676 + }, + { + "epoch": 0.23, + "learning_rate": 1.5484835540367364e-07, + "loss": 0.0033, + "step": 11677 + }, + { + "epoch": 0.23, + "learning_rate": 1.5484447205933752e-07, + "loss": 0.012, + "step": 11678 + }, + { + "epoch": 0.23, + "learning_rate": 1.5484058871500133e-07, + "loss": 0.0023, + "step": 11679 + }, + { + "epoch": 0.23, + "learning_rate": 1.548367053706652e-07, + "loss": 0.0019, + "step": 11680 + }, + { + "epoch": 0.23, + "learning_rate": 1.5483282202632905e-07, + "loss": 0.7581, + "step": 11681 + }, + { + "epoch": 0.23, + "learning_rate": 1.5482893868199292e-07, + "loss": 0.0143, + "step": 11682 + }, + { + "epoch": 0.23, + "learning_rate": 1.5482505533765677e-07, + "loss": 0.6706, + "step": 11683 + }, + { + "epoch": 0.23, + "learning_rate": 1.5482117199332064e-07, + "loss": 0.002, + "step": 11684 + }, + { + "epoch": 0.23, + "learning_rate": 1.5481728864898448e-07, + "loss": 0.0081, + "step": 11685 + }, + { + "epoch": 0.23, + "learning_rate": 1.5481340530464835e-07, + "loss": 0.0021, + "step": 11686 + }, + { + "epoch": 0.23, + "learning_rate": 1.548095219603122e-07, + "loss": 0.0097, + "step": 11687 + }, + { + "epoch": 0.23, + "learning_rate": 1.5480563861597607e-07, + "loss": 0.0055, + "step": 11688 + }, + { + "epoch": 0.23, + "learning_rate": 1.5480175527163992e-07, + "loss": 0.0021, + "step": 11689 + }, + { + "epoch": 0.23, + "learning_rate": 1.547978719273038e-07, + "loss": 1.1446, + "step": 11690 + }, + { + "epoch": 0.23, + "learning_rate": 1.5479398858296763e-07, + "loss": 0.0024, + "step": 11691 + }, + { + "epoch": 0.23, + "learning_rate": 1.547901052386315e-07, + "loss": 0.0014, + "step": 11692 + }, + { + "epoch": 0.23, + "learning_rate": 1.5478622189429535e-07, + "loss": 0.0057, + "step": 11693 + }, + { + "epoch": 0.23, + "learning_rate": 1.5478233854995922e-07, + "loss": 0.0019, + "step": 11694 + }, + { + "epoch": 0.23, + "learning_rate": 1.5477845520562307e-07, + "loss": 0.0022, + "step": 11695 + }, + { + "epoch": 0.23, + "learning_rate": 1.5477457186128694e-07, + "loss": 0.015, + "step": 11696 + }, + { + "epoch": 0.23, + "learning_rate": 1.5477068851695078e-07, + "loss": 0.005, + "step": 11697 + }, + { + "epoch": 0.23, + "learning_rate": 1.5476680517261465e-07, + "loss": 0.0028, + "step": 11698 + }, + { + "epoch": 0.23, + "learning_rate": 1.547629218282785e-07, + "loss": 0.0026, + "step": 11699 + }, + { + "epoch": 0.23, + "learning_rate": 1.5475903848394237e-07, + "loss": 0.0991, + "step": 11700 + }, + { + "epoch": 0.23, + "learning_rate": 1.5475515513960621e-07, + "loss": 0.0017, + "step": 11701 + }, + { + "epoch": 0.23, + "learning_rate": 1.5475127179527009e-07, + "loss": 0.0018, + "step": 11702 + }, + { + "epoch": 0.23, + "learning_rate": 1.5474738845093393e-07, + "loss": 0.0097, + "step": 11703 + }, + { + "epoch": 0.23, + "learning_rate": 1.547435051065978e-07, + "loss": 0.0024, + "step": 11704 + }, + { + "epoch": 0.23, + "learning_rate": 1.5473962176226165e-07, + "loss": 0.0155, + "step": 11705 + }, + { + "epoch": 0.23, + "learning_rate": 1.5473573841792552e-07, + "loss": 0.0019, + "step": 11706 + }, + { + "epoch": 0.23, + "learning_rate": 1.5473185507358936e-07, + "loss": 0.9569, + "step": 11707 + }, + { + "epoch": 0.23, + "learning_rate": 1.5472797172925324e-07, + "loss": 0.0022, + "step": 11708 + }, + { + "epoch": 0.23, + "learning_rate": 1.5472408838491708e-07, + "loss": 0.002, + "step": 11709 + }, + { + "epoch": 0.23, + "learning_rate": 1.5472020504058095e-07, + "loss": 0.0106, + "step": 11710 + }, + { + "epoch": 0.23, + "learning_rate": 1.547163216962448e-07, + "loss": 0.0032, + "step": 11711 + }, + { + "epoch": 0.23, + "learning_rate": 1.5471243835190867e-07, + "loss": 0.5341, + "step": 11712 + }, + { + "epoch": 0.23, + "learning_rate": 1.5470855500757251e-07, + "loss": 0.0029, + "step": 11713 + }, + { + "epoch": 0.23, + "learning_rate": 1.5470467166323639e-07, + "loss": 0.0189, + "step": 11714 + }, + { + "epoch": 0.23, + "learning_rate": 1.5470078831890023e-07, + "loss": 0.0074, + "step": 11715 + }, + { + "epoch": 0.23, + "learning_rate": 1.546969049745641e-07, + "loss": 0.1965, + "step": 11716 + }, + { + "epoch": 0.23, + "learning_rate": 1.5469302163022795e-07, + "loss": 0.1978, + "step": 11717 + }, + { + "epoch": 0.23, + "learning_rate": 1.5468913828589182e-07, + "loss": 0.7781, + "step": 11718 + }, + { + "epoch": 0.23, + "learning_rate": 1.5468525494155566e-07, + "loss": 0.0066, + "step": 11719 + }, + { + "epoch": 0.23, + "learning_rate": 1.5468137159721953e-07, + "loss": 0.1286, + "step": 11720 + }, + { + "epoch": 0.23, + "learning_rate": 1.5467748825288338e-07, + "loss": 0.0017, + "step": 11721 + }, + { + "epoch": 0.23, + "learning_rate": 1.5467360490854725e-07, + "loss": 0.0027, + "step": 11722 + }, + { + "epoch": 0.23, + "learning_rate": 1.546697215642111e-07, + "loss": 0.0029, + "step": 11723 + }, + { + "epoch": 0.23, + "learning_rate": 1.5466583821987497e-07, + "loss": 0.0039, + "step": 11724 + }, + { + "epoch": 0.23, + "learning_rate": 1.546619548755388e-07, + "loss": 0.0016, + "step": 11725 + }, + { + "epoch": 0.23, + "learning_rate": 1.5465807153120268e-07, + "loss": 0.0021, + "step": 11726 + }, + { + "epoch": 0.23, + "learning_rate": 1.5465418818686653e-07, + "loss": 0.0021, + "step": 11727 + }, + { + "epoch": 0.23, + "learning_rate": 1.546503048425304e-07, + "loss": 0.3806, + "step": 11728 + }, + { + "epoch": 0.23, + "learning_rate": 1.5464642149819425e-07, + "loss": 0.002, + "step": 11729 + }, + { + "epoch": 0.23, + "learning_rate": 1.5464253815385812e-07, + "loss": 0.0018, + "step": 11730 + }, + { + "epoch": 0.23, + "learning_rate": 1.5463865480952196e-07, + "loss": 0.0017, + "step": 11731 + }, + { + "epoch": 0.23, + "learning_rate": 1.546347714651858e-07, + "loss": 0.0024, + "step": 11732 + }, + { + "epoch": 0.23, + "learning_rate": 1.5463088812084968e-07, + "loss": 0.0017, + "step": 11733 + }, + { + "epoch": 0.23, + "learning_rate": 1.5462700477651352e-07, + "loss": 0.0072, + "step": 11734 + }, + { + "epoch": 0.23, + "learning_rate": 1.546231214321774e-07, + "loss": 0.0349, + "step": 11735 + }, + { + "epoch": 0.23, + "learning_rate": 1.5461923808784124e-07, + "loss": 0.0017, + "step": 11736 + }, + { + "epoch": 0.23, + "learning_rate": 1.5461535474350509e-07, + "loss": 0.0019, + "step": 11737 + }, + { + "epoch": 0.23, + "learning_rate": 1.5461147139916896e-07, + "loss": 0.0022, + "step": 11738 + }, + { + "epoch": 0.23, + "learning_rate": 1.546075880548328e-07, + "loss": 0.0029, + "step": 11739 + }, + { + "epoch": 0.23, + "learning_rate": 1.5460370471049667e-07, + "loss": 0.0022, + "step": 11740 + }, + { + "epoch": 0.23, + "learning_rate": 1.5459982136616052e-07, + "loss": 0.003, + "step": 11741 + }, + { + "epoch": 0.23, + "learning_rate": 1.545959380218244e-07, + "loss": 0.0019, + "step": 11742 + }, + { + "epoch": 0.23, + "learning_rate": 1.5459205467748823e-07, + "loss": 0.002, + "step": 11743 + }, + { + "epoch": 0.23, + "learning_rate": 1.545881713331521e-07, + "loss": 0.0022, + "step": 11744 + }, + { + "epoch": 0.23, + "learning_rate": 1.5458428798881595e-07, + "loss": 0.0029, + "step": 11745 + }, + { + "epoch": 0.23, + "learning_rate": 1.5458040464447982e-07, + "loss": 0.0028, + "step": 11746 + }, + { + "epoch": 0.23, + "learning_rate": 1.5457652130014367e-07, + "loss": 0.0023, + "step": 11747 + }, + { + "epoch": 0.23, + "learning_rate": 1.5457263795580754e-07, + "loss": 0.0024, + "step": 11748 + }, + { + "epoch": 0.23, + "learning_rate": 1.5456875461147138e-07, + "loss": 0.0043, + "step": 11749 + }, + { + "epoch": 0.23, + "learning_rate": 1.5456487126713526e-07, + "loss": 0.0021, + "step": 11750 + }, + { + "epoch": 0.23, + "learning_rate": 1.545609879227991e-07, + "loss": 0.1589, + "step": 11751 + }, + { + "epoch": 0.23, + "learning_rate": 1.5455710457846297e-07, + "loss": 0.0574, + "step": 11752 + }, + { + "epoch": 0.23, + "learning_rate": 1.5455322123412682e-07, + "loss": 0.1326, + "step": 11753 + }, + { + "epoch": 0.23, + "learning_rate": 1.545493378897907e-07, + "loss": 0.0053, + "step": 11754 + }, + { + "epoch": 0.23, + "learning_rate": 1.5454545454545453e-07, + "loss": 0.0019, + "step": 11755 + }, + { + "epoch": 0.23, + "learning_rate": 1.545415712011184e-07, + "loss": 0.0016, + "step": 11756 + }, + { + "epoch": 0.23, + "learning_rate": 1.5453768785678225e-07, + "loss": 0.0021, + "step": 11757 + }, + { + "epoch": 0.23, + "learning_rate": 1.5453380451244612e-07, + "loss": 0.0075, + "step": 11758 + }, + { + "epoch": 0.23, + "learning_rate": 1.5452992116810997e-07, + "loss": 0.0021, + "step": 11759 + }, + { + "epoch": 0.23, + "learning_rate": 1.5452603782377384e-07, + "loss": 0.2209, + "step": 11760 + }, + { + "epoch": 0.23, + "learning_rate": 1.5452215447943768e-07, + "loss": 0.0021, + "step": 11761 + }, + { + "epoch": 0.23, + "learning_rate": 1.5451827113510153e-07, + "loss": 0.0022, + "step": 11762 + }, + { + "epoch": 0.23, + "learning_rate": 1.545143877907654e-07, + "loss": 0.0033, + "step": 11763 + }, + { + "epoch": 0.23, + "learning_rate": 1.5451050444642924e-07, + "loss": 0.0018, + "step": 11764 + }, + { + "epoch": 0.23, + "learning_rate": 1.5450662110209312e-07, + "loss": 0.0016, + "step": 11765 + }, + { + "epoch": 0.23, + "learning_rate": 1.5450273775775696e-07, + "loss": 0.0018, + "step": 11766 + }, + { + "epoch": 0.23, + "learning_rate": 1.5449885441342083e-07, + "loss": 0.002, + "step": 11767 + }, + { + "epoch": 0.23, + "learning_rate": 1.5449497106908468e-07, + "loss": 0.0019, + "step": 11768 + }, + { + "epoch": 0.23, + "learning_rate": 1.5449108772474855e-07, + "loss": 0.002, + "step": 11769 + }, + { + "epoch": 0.23, + "learning_rate": 1.544872043804124e-07, + "loss": 0.0021, + "step": 11770 + }, + { + "epoch": 0.23, + "learning_rate": 1.5448332103607627e-07, + "loss": 0.0016, + "step": 11771 + }, + { + "epoch": 0.23, + "learning_rate": 1.544794376917401e-07, + "loss": 0.0016, + "step": 11772 + }, + { + "epoch": 0.23, + "learning_rate": 1.5447555434740398e-07, + "loss": 0.0023, + "step": 11773 + }, + { + "epoch": 0.23, + "learning_rate": 1.5447167100306783e-07, + "loss": 1.0163, + "step": 11774 + }, + { + "epoch": 0.23, + "learning_rate": 1.544677876587317e-07, + "loss": 0.0018, + "step": 11775 + }, + { + "epoch": 0.23, + "learning_rate": 1.5446390431439554e-07, + "loss": 0.0022, + "step": 11776 + }, + { + "epoch": 0.23, + "learning_rate": 1.5446002097005942e-07, + "loss": 0.0037, + "step": 11777 + }, + { + "epoch": 0.23, + "learning_rate": 1.5445613762572326e-07, + "loss": 0.0016, + "step": 11778 + }, + { + "epoch": 0.23, + "learning_rate": 1.5445225428138713e-07, + "loss": 0.0022, + "step": 11779 + }, + { + "epoch": 0.23, + "learning_rate": 1.5444837093705098e-07, + "loss": 0.0019, + "step": 11780 + }, + { + "epoch": 0.23, + "learning_rate": 1.5444448759271485e-07, + "loss": 0.2751, + "step": 11781 + }, + { + "epoch": 0.23, + "learning_rate": 1.544406042483787e-07, + "loss": 0.0015, + "step": 11782 + }, + { + "epoch": 0.23, + "learning_rate": 1.5443672090404256e-07, + "loss": 0.0047, + "step": 11783 + }, + { + "epoch": 0.23, + "learning_rate": 1.544328375597064e-07, + "loss": 0.1127, + "step": 11784 + }, + { + "epoch": 0.23, + "learning_rate": 1.5442895421537028e-07, + "loss": 0.0032, + "step": 11785 + }, + { + "epoch": 0.23, + "learning_rate": 1.5442507087103413e-07, + "loss": 0.0017, + "step": 11786 + }, + { + "epoch": 0.23, + "learning_rate": 1.54421187526698e-07, + "loss": 0.5778, + "step": 11787 + }, + { + "epoch": 0.23, + "learning_rate": 1.5441730418236184e-07, + "loss": 0.0021, + "step": 11788 + }, + { + "epoch": 0.23, + "learning_rate": 1.5441342083802571e-07, + "loss": 0.0019, + "step": 11789 + }, + { + "epoch": 0.23, + "learning_rate": 1.5440953749368956e-07, + "loss": 0.0019, + "step": 11790 + }, + { + "epoch": 0.23, + "learning_rate": 1.5440565414935343e-07, + "loss": 0.0016, + "step": 11791 + }, + { + "epoch": 0.23, + "learning_rate": 1.5440177080501728e-07, + "loss": 0.0018, + "step": 11792 + }, + { + "epoch": 0.23, + "learning_rate": 1.5439788746068115e-07, + "loss": 0.0019, + "step": 11793 + }, + { + "epoch": 0.23, + "learning_rate": 1.54394004116345e-07, + "loss": 0.0027, + "step": 11794 + }, + { + "epoch": 0.23, + "learning_rate": 1.5439012077200884e-07, + "loss": 0.002, + "step": 11795 + }, + { + "epoch": 0.23, + "learning_rate": 1.5438623742767268e-07, + "loss": 0.0037, + "step": 11796 + }, + { + "epoch": 0.23, + "learning_rate": 1.5438235408333655e-07, + "loss": 0.0015, + "step": 11797 + }, + { + "epoch": 0.23, + "learning_rate": 1.543784707390004e-07, + "loss": 0.4695, + "step": 11798 + }, + { + "epoch": 0.23, + "learning_rate": 1.5437458739466427e-07, + "loss": 0.0022, + "step": 11799 + }, + { + "epoch": 0.23, + "learning_rate": 1.5437070405032811e-07, + "loss": 0.0078, + "step": 11800 + }, + { + "epoch": 0.23, + "learning_rate": 1.5436682070599199e-07, + "loss": 0.0021, + "step": 11801 + }, + { + "epoch": 0.23, + "learning_rate": 1.5436293736165583e-07, + "loss": 0.0028, + "step": 11802 + }, + { + "epoch": 0.23, + "learning_rate": 1.543590540173197e-07, + "loss": 0.0021, + "step": 11803 + }, + { + "epoch": 0.23, + "learning_rate": 1.5435517067298355e-07, + "loss": 0.8454, + "step": 11804 + }, + { + "epoch": 0.23, + "learning_rate": 1.5435128732864742e-07, + "loss": 0.002, + "step": 11805 + }, + { + "epoch": 0.23, + "learning_rate": 1.5434740398431126e-07, + "loss": 1.091, + "step": 11806 + }, + { + "epoch": 0.23, + "learning_rate": 1.5434352063997514e-07, + "loss": 0.0018, + "step": 11807 + }, + { + "epoch": 0.23, + "learning_rate": 1.5433963729563898e-07, + "loss": 0.0091, + "step": 11808 + }, + { + "epoch": 0.23, + "learning_rate": 1.5433575395130285e-07, + "loss": 0.0017, + "step": 11809 + }, + { + "epoch": 0.23, + "learning_rate": 1.543318706069667e-07, + "loss": 0.0016, + "step": 11810 + }, + { + "epoch": 0.23, + "learning_rate": 1.5432798726263057e-07, + "loss": 0.9511, + "step": 11811 + }, + { + "epoch": 0.23, + "learning_rate": 1.5432410391829441e-07, + "loss": 0.002, + "step": 11812 + }, + { + "epoch": 0.23, + "learning_rate": 1.5432022057395829e-07, + "loss": 0.0085, + "step": 11813 + }, + { + "epoch": 0.23, + "learning_rate": 1.5431633722962213e-07, + "loss": 0.0024, + "step": 11814 + }, + { + "epoch": 0.23, + "learning_rate": 1.54312453885286e-07, + "loss": 0.7819, + "step": 11815 + }, + { + "epoch": 0.23, + "learning_rate": 1.5430857054094985e-07, + "loss": 0.0019, + "step": 11816 + }, + { + "epoch": 0.23, + "learning_rate": 1.5430468719661372e-07, + "loss": 0.0018, + "step": 11817 + }, + { + "epoch": 0.23, + "learning_rate": 1.5430080385227756e-07, + "loss": 0.0079, + "step": 11818 + }, + { + "epoch": 0.23, + "learning_rate": 1.5429692050794143e-07, + "loss": 0.0427, + "step": 11819 + }, + { + "epoch": 0.23, + "learning_rate": 1.5429303716360528e-07, + "loss": 0.0019, + "step": 11820 + }, + { + "epoch": 0.23, + "learning_rate": 1.5428915381926915e-07, + "loss": 0.0026, + "step": 11821 + }, + { + "epoch": 0.23, + "learning_rate": 1.54285270474933e-07, + "loss": 0.9448, + "step": 11822 + }, + { + "epoch": 0.23, + "learning_rate": 1.5428138713059687e-07, + "loss": 0.0048, + "step": 11823 + }, + { + "epoch": 0.23, + "learning_rate": 1.542775037862607e-07, + "loss": 0.0019, + "step": 11824 + }, + { + "epoch": 0.23, + "learning_rate": 1.5427362044192458e-07, + "loss": 0.002, + "step": 11825 + }, + { + "epoch": 0.23, + "learning_rate": 1.5426973709758843e-07, + "loss": 0.0022, + "step": 11826 + }, + { + "epoch": 0.23, + "learning_rate": 1.542658537532523e-07, + "loss": 0.0858, + "step": 11827 + }, + { + "epoch": 0.23, + "learning_rate": 1.5426197040891615e-07, + "loss": 0.0166, + "step": 11828 + }, + { + "epoch": 0.23, + "learning_rate": 1.5425808706458002e-07, + "loss": 0.002, + "step": 11829 + }, + { + "epoch": 0.23, + "learning_rate": 1.5425420372024386e-07, + "loss": 0.0021, + "step": 11830 + }, + { + "epoch": 0.23, + "learning_rate": 1.5425032037590773e-07, + "loss": 0.0039, + "step": 11831 + }, + { + "epoch": 0.23, + "learning_rate": 1.5424643703157158e-07, + "loss": 0.0111, + "step": 11832 + }, + { + "epoch": 0.23, + "learning_rate": 1.5424255368723545e-07, + "loss": 0.0049, + "step": 11833 + }, + { + "epoch": 0.23, + "learning_rate": 1.542386703428993e-07, + "loss": 0.0026, + "step": 11834 + }, + { + "epoch": 0.23, + "learning_rate": 1.5423478699856317e-07, + "loss": 0.0021, + "step": 11835 + }, + { + "epoch": 0.23, + "learning_rate": 1.54230903654227e-07, + "loss": 0.0023, + "step": 11836 + }, + { + "epoch": 0.23, + "learning_rate": 1.5422702030989088e-07, + "loss": 0.0019, + "step": 11837 + }, + { + "epoch": 0.23, + "learning_rate": 1.5422313696555473e-07, + "loss": 0.0022, + "step": 11838 + }, + { + "epoch": 0.23, + "learning_rate": 1.542192536212186e-07, + "loss": 0.0018, + "step": 11839 + }, + { + "epoch": 0.23, + "learning_rate": 1.5421537027688244e-07, + "loss": 0.0052, + "step": 11840 + }, + { + "epoch": 0.23, + "learning_rate": 1.5421148693254632e-07, + "loss": 0.0027, + "step": 11841 + }, + { + "epoch": 0.23, + "learning_rate": 1.5420760358821016e-07, + "loss": 0.7404, + "step": 11842 + }, + { + "epoch": 0.23, + "learning_rate": 1.5420372024387403e-07, + "loss": 0.0025, + "step": 11843 + }, + { + "epoch": 0.23, + "learning_rate": 1.5419983689953788e-07, + "loss": 0.0057, + "step": 11844 + }, + { + "epoch": 0.23, + "learning_rate": 1.5419595355520175e-07, + "loss": 0.3849, + "step": 11845 + }, + { + "epoch": 0.23, + "learning_rate": 1.541920702108656e-07, + "loss": 0.002, + "step": 11846 + }, + { + "epoch": 0.23, + "learning_rate": 1.5418818686652947e-07, + "loss": 0.003, + "step": 11847 + }, + { + "epoch": 0.23, + "learning_rate": 1.541843035221933e-07, + "loss": 0.1137, + "step": 11848 + }, + { + "epoch": 0.23, + "learning_rate": 1.5418042017785718e-07, + "loss": 0.0018, + "step": 11849 + }, + { + "epoch": 0.23, + "learning_rate": 1.5417653683352103e-07, + "loss": 0.0035, + "step": 11850 + }, + { + "epoch": 0.23, + "learning_rate": 1.541726534891849e-07, + "loss": 0.0193, + "step": 11851 + }, + { + "epoch": 0.23, + "learning_rate": 1.5416877014484874e-07, + "loss": 0.0088, + "step": 11852 + }, + { + "epoch": 0.23, + "learning_rate": 1.541648868005126e-07, + "loss": 0.0017, + "step": 11853 + }, + { + "epoch": 0.23, + "learning_rate": 1.5416100345617643e-07, + "loss": 0.5198, + "step": 11854 + }, + { + "epoch": 0.23, + "learning_rate": 1.541571201118403e-07, + "loss": 0.1562, + "step": 11855 + }, + { + "epoch": 0.23, + "learning_rate": 1.5415323676750415e-07, + "loss": 0.0132, + "step": 11856 + }, + { + "epoch": 0.23, + "learning_rate": 1.5414935342316802e-07, + "loss": 0.0021, + "step": 11857 + }, + { + "epoch": 0.23, + "learning_rate": 1.5414547007883187e-07, + "loss": 0.0016, + "step": 11858 + }, + { + "epoch": 0.23, + "learning_rate": 1.5414158673449574e-07, + "loss": 1.0549, + "step": 11859 + }, + { + "epoch": 0.23, + "learning_rate": 1.5413770339015958e-07, + "loss": 0.0069, + "step": 11860 + }, + { + "epoch": 0.23, + "learning_rate": 1.5413382004582345e-07, + "loss": 0.002, + "step": 11861 + }, + { + "epoch": 0.23, + "learning_rate": 1.541299367014873e-07, + "loss": 0.002, + "step": 11862 + }, + { + "epoch": 0.23, + "learning_rate": 1.5412605335715117e-07, + "loss": 0.4384, + "step": 11863 + }, + { + "epoch": 0.23, + "learning_rate": 1.5412217001281502e-07, + "loss": 0.0031, + "step": 11864 + }, + { + "epoch": 0.23, + "learning_rate": 1.541182866684789e-07, + "loss": 0.0018, + "step": 11865 + }, + { + "epoch": 0.23, + "learning_rate": 1.5411440332414273e-07, + "loss": 0.0019, + "step": 11866 + }, + { + "epoch": 0.23, + "learning_rate": 1.541105199798066e-07, + "loss": 0.01, + "step": 11867 + }, + { + "epoch": 0.23, + "learning_rate": 1.5410663663547045e-07, + "loss": 0.0098, + "step": 11868 + }, + { + "epoch": 0.23, + "learning_rate": 1.5410275329113432e-07, + "loss": 0.0014, + "step": 11869 + }, + { + "epoch": 0.23, + "learning_rate": 1.5409886994679817e-07, + "loss": 0.012, + "step": 11870 + }, + { + "epoch": 0.23, + "learning_rate": 1.5409498660246204e-07, + "loss": 0.0022, + "step": 11871 + }, + { + "epoch": 0.23, + "learning_rate": 1.5409110325812588e-07, + "loss": 0.0036, + "step": 11872 + }, + { + "epoch": 0.23, + "learning_rate": 1.5408721991378975e-07, + "loss": 0.0019, + "step": 11873 + }, + { + "epoch": 0.23, + "learning_rate": 1.540833365694536e-07, + "loss": 0.0019, + "step": 11874 + }, + { + "epoch": 0.23, + "learning_rate": 1.5407945322511747e-07, + "loss": 0.0018, + "step": 11875 + }, + { + "epoch": 0.23, + "learning_rate": 1.5407556988078132e-07, + "loss": 0.0018, + "step": 11876 + }, + { + "epoch": 0.23, + "learning_rate": 1.5407168653644519e-07, + "loss": 0.0045, + "step": 11877 + }, + { + "epoch": 0.23, + "learning_rate": 1.5406780319210903e-07, + "loss": 0.0024, + "step": 11878 + }, + { + "epoch": 0.23, + "learning_rate": 1.540639198477729e-07, + "loss": 0.0014, + "step": 11879 + }, + { + "epoch": 0.23, + "learning_rate": 1.5406003650343675e-07, + "loss": 0.0019, + "step": 11880 + }, + { + "epoch": 0.23, + "learning_rate": 1.5405615315910062e-07, + "loss": 0.0016, + "step": 11881 + }, + { + "epoch": 0.23, + "learning_rate": 1.5405226981476446e-07, + "loss": 0.0588, + "step": 11882 + }, + { + "epoch": 0.23, + "learning_rate": 1.5404838647042834e-07, + "loss": 0.5509, + "step": 11883 + }, + { + "epoch": 0.23, + "learning_rate": 1.5404450312609218e-07, + "loss": 0.0084, + "step": 11884 + }, + { + "epoch": 0.23, + "learning_rate": 1.5404061978175605e-07, + "loss": 0.0015, + "step": 11885 + }, + { + "epoch": 0.23, + "learning_rate": 1.540367364374199e-07, + "loss": 0.0018, + "step": 11886 + }, + { + "epoch": 0.23, + "learning_rate": 1.5403285309308377e-07, + "loss": 0.0023, + "step": 11887 + }, + { + "epoch": 0.23, + "learning_rate": 1.5402896974874761e-07, + "loss": 0.0483, + "step": 11888 + }, + { + "epoch": 0.23, + "learning_rate": 1.5402508640441149e-07, + "loss": 0.0191, + "step": 11889 + }, + { + "epoch": 0.23, + "learning_rate": 1.5402120306007533e-07, + "loss": 0.0014, + "step": 11890 + }, + { + "epoch": 0.23, + "learning_rate": 1.540173197157392e-07, + "loss": 0.002, + "step": 11891 + }, + { + "epoch": 0.23, + "learning_rate": 1.5401343637140305e-07, + "loss": 0.0023, + "step": 11892 + }, + { + "epoch": 0.23, + "learning_rate": 1.5400955302706692e-07, + "loss": 0.0019, + "step": 11893 + }, + { + "epoch": 0.23, + "learning_rate": 1.5400566968273076e-07, + "loss": 0.0022, + "step": 11894 + }, + { + "epoch": 0.23, + "learning_rate": 1.5400178633839463e-07, + "loss": 0.0189, + "step": 11895 + }, + { + "epoch": 0.23, + "learning_rate": 1.5399790299405848e-07, + "loss": 0.0043, + "step": 11896 + }, + { + "epoch": 0.23, + "learning_rate": 1.5399401964972235e-07, + "loss": 0.0067, + "step": 11897 + }, + { + "epoch": 0.23, + "learning_rate": 1.539901363053862e-07, + "loss": 0.0128, + "step": 11898 + }, + { + "epoch": 0.23, + "learning_rate": 1.5398625296105007e-07, + "loss": 0.0092, + "step": 11899 + }, + { + "epoch": 0.23, + "learning_rate": 1.539823696167139e-07, + "loss": 0.0026, + "step": 11900 + }, + { + "epoch": 0.23, + "learning_rate": 1.5397848627237778e-07, + "loss": 0.0035, + "step": 11901 + }, + { + "epoch": 0.23, + "learning_rate": 1.5397460292804163e-07, + "loss": 0.0032, + "step": 11902 + }, + { + "epoch": 0.23, + "learning_rate": 1.539707195837055e-07, + "loss": 0.0019, + "step": 11903 + }, + { + "epoch": 0.23, + "learning_rate": 1.5396683623936935e-07, + "loss": 0.5258, + "step": 11904 + }, + { + "epoch": 0.23, + "learning_rate": 1.5396295289503322e-07, + "loss": 0.0021, + "step": 11905 + }, + { + "epoch": 0.23, + "learning_rate": 1.5395906955069706e-07, + "loss": 0.0021, + "step": 11906 + }, + { + "epoch": 0.23, + "learning_rate": 1.5395518620636093e-07, + "loss": 0.0139, + "step": 11907 + }, + { + "epoch": 0.23, + "learning_rate": 1.5395130286202478e-07, + "loss": 0.0073, + "step": 11908 + }, + { + "epoch": 0.23, + "learning_rate": 1.5394741951768862e-07, + "loss": 0.0025, + "step": 11909 + }, + { + "epoch": 0.23, + "learning_rate": 1.539435361733525e-07, + "loss": 0.0018, + "step": 11910 + }, + { + "epoch": 0.23, + "learning_rate": 1.5393965282901634e-07, + "loss": 0.0018, + "step": 11911 + }, + { + "epoch": 0.23, + "learning_rate": 1.5393576948468019e-07, + "loss": 0.002, + "step": 11912 + }, + { + "epoch": 0.23, + "learning_rate": 1.5393188614034406e-07, + "loss": 0.0015, + "step": 11913 + }, + { + "epoch": 0.23, + "learning_rate": 1.539280027960079e-07, + "loss": 0.0017, + "step": 11914 + }, + { + "epoch": 0.23, + "learning_rate": 1.5392411945167177e-07, + "loss": 0.02, + "step": 11915 + }, + { + "epoch": 0.23, + "learning_rate": 1.5392023610733562e-07, + "loss": 0.0019, + "step": 11916 + }, + { + "epoch": 0.23, + "learning_rate": 1.539163527629995e-07, + "loss": 0.1808, + "step": 11917 + }, + { + "epoch": 0.23, + "learning_rate": 1.5391246941866333e-07, + "loss": 0.7676, + "step": 11918 + }, + { + "epoch": 0.23, + "learning_rate": 1.539085860743272e-07, + "loss": 0.0025, + "step": 11919 + }, + { + "epoch": 0.23, + "learning_rate": 1.5390470272999105e-07, + "loss": 0.0051, + "step": 11920 + }, + { + "epoch": 0.23, + "learning_rate": 1.5390081938565492e-07, + "loss": 0.0024, + "step": 11921 + }, + { + "epoch": 0.23, + "learning_rate": 1.5389693604131877e-07, + "loss": 0.2953, + "step": 11922 + }, + { + "epoch": 0.23, + "learning_rate": 1.5389305269698264e-07, + "loss": 0.0042, + "step": 11923 + }, + { + "epoch": 0.23, + "learning_rate": 1.5388916935264648e-07, + "loss": 0.1515, + "step": 11924 + }, + { + "epoch": 0.23, + "learning_rate": 1.5388528600831036e-07, + "loss": 0.0019, + "step": 11925 + }, + { + "epoch": 0.23, + "learning_rate": 1.538814026639742e-07, + "loss": 0.0022, + "step": 11926 + }, + { + "epoch": 0.23, + "learning_rate": 1.5387751931963807e-07, + "loss": 0.0016, + "step": 11927 + }, + { + "epoch": 0.23, + "learning_rate": 1.5387363597530192e-07, + "loss": 0.0029, + "step": 11928 + }, + { + "epoch": 0.23, + "learning_rate": 1.538697526309658e-07, + "loss": 0.0013, + "step": 11929 + }, + { + "epoch": 0.23, + "learning_rate": 1.5386586928662963e-07, + "loss": 0.0023, + "step": 11930 + }, + { + "epoch": 0.23, + "learning_rate": 1.538619859422935e-07, + "loss": 0.0025, + "step": 11931 + }, + { + "epoch": 0.23, + "learning_rate": 1.5385810259795735e-07, + "loss": 0.0022, + "step": 11932 + }, + { + "epoch": 0.23, + "learning_rate": 1.5385421925362122e-07, + "loss": 0.0021, + "step": 11933 + }, + { + "epoch": 0.23, + "learning_rate": 1.5385033590928507e-07, + "loss": 0.0015, + "step": 11934 + }, + { + "epoch": 0.23, + "learning_rate": 1.5384645256494894e-07, + "loss": 0.0018, + "step": 11935 + }, + { + "epoch": 0.23, + "learning_rate": 1.5384256922061278e-07, + "loss": 0.237, + "step": 11936 + }, + { + "epoch": 0.23, + "learning_rate": 1.5383868587627665e-07, + "loss": 0.0016, + "step": 11937 + }, + { + "epoch": 0.23, + "learning_rate": 1.538348025319405e-07, + "loss": 0.0016, + "step": 11938 + }, + { + "epoch": 0.23, + "learning_rate": 1.5383091918760434e-07, + "loss": 0.0029, + "step": 11939 + }, + { + "epoch": 0.23, + "learning_rate": 1.5382703584326822e-07, + "loss": 0.0015, + "step": 11940 + }, + { + "epoch": 0.23, + "learning_rate": 1.5382315249893206e-07, + "loss": 0.2052, + "step": 11941 + }, + { + "epoch": 0.23, + "learning_rate": 1.5381926915459593e-07, + "loss": 0.0056, + "step": 11942 + }, + { + "epoch": 0.23, + "learning_rate": 1.5381538581025978e-07, + "loss": 0.0019, + "step": 11943 + }, + { + "epoch": 0.23, + "learning_rate": 1.5381150246592365e-07, + "loss": 1.7453, + "step": 11944 + }, + { + "epoch": 0.23, + "learning_rate": 1.538076191215875e-07, + "loss": 0.0023, + "step": 11945 + }, + { + "epoch": 0.23, + "learning_rate": 1.5380373577725137e-07, + "loss": 0.0069, + "step": 11946 + }, + { + "epoch": 0.23, + "learning_rate": 1.537998524329152e-07, + "loss": 0.0018, + "step": 11947 + }, + { + "epoch": 0.23, + "learning_rate": 1.5379596908857908e-07, + "loss": 0.0156, + "step": 11948 + }, + { + "epoch": 0.23, + "learning_rate": 1.5379208574424293e-07, + "loss": 0.0013, + "step": 11949 + }, + { + "epoch": 0.23, + "learning_rate": 1.537882023999068e-07, + "loss": 0.0028, + "step": 11950 + }, + { + "epoch": 0.23, + "learning_rate": 1.5378431905557064e-07, + "loss": 0.0017, + "step": 11951 + }, + { + "epoch": 0.23, + "learning_rate": 1.5378043571123452e-07, + "loss": 0.0025, + "step": 11952 + }, + { + "epoch": 0.23, + "learning_rate": 1.5377655236689836e-07, + "loss": 0.002, + "step": 11953 + }, + { + "epoch": 0.23, + "learning_rate": 1.5377266902256223e-07, + "loss": 0.0026, + "step": 11954 + }, + { + "epoch": 0.23, + "learning_rate": 1.5376878567822608e-07, + "loss": 0.0065, + "step": 11955 + }, + { + "epoch": 0.23, + "learning_rate": 1.5376490233388995e-07, + "loss": 0.002, + "step": 11956 + }, + { + "epoch": 0.23, + "learning_rate": 1.537610189895538e-07, + "loss": 0.0168, + "step": 11957 + }, + { + "epoch": 0.23, + "learning_rate": 1.5375713564521766e-07, + "loss": 0.0016, + "step": 11958 + }, + { + "epoch": 0.23, + "learning_rate": 1.537532523008815e-07, + "loss": 0.0016, + "step": 11959 + }, + { + "epoch": 0.23, + "learning_rate": 1.5374936895654538e-07, + "loss": 0.0019, + "step": 11960 + }, + { + "epoch": 0.23, + "learning_rate": 1.5374548561220923e-07, + "loss": 0.6656, + "step": 11961 + }, + { + "epoch": 0.23, + "learning_rate": 1.537416022678731e-07, + "loss": 0.0031, + "step": 11962 + }, + { + "epoch": 0.23, + "learning_rate": 1.5373771892353694e-07, + "loss": 0.0019, + "step": 11963 + }, + { + "epoch": 0.23, + "learning_rate": 1.5373383557920081e-07, + "loss": 0.0112, + "step": 11964 + }, + { + "epoch": 0.23, + "learning_rate": 1.5372995223486466e-07, + "loss": 0.002, + "step": 11965 + }, + { + "epoch": 0.23, + "learning_rate": 1.5372606889052853e-07, + "loss": 0.1264, + "step": 11966 + }, + { + "epoch": 0.23, + "learning_rate": 1.5372218554619238e-07, + "loss": 0.0036, + "step": 11967 + }, + { + "epoch": 0.23, + "learning_rate": 1.5371830220185625e-07, + "loss": 0.0049, + "step": 11968 + }, + { + "epoch": 0.23, + "learning_rate": 1.5371441885752007e-07, + "loss": 0.0048, + "step": 11969 + }, + { + "epoch": 0.23, + "learning_rate": 1.5371053551318394e-07, + "loss": 0.015, + "step": 11970 + }, + { + "epoch": 0.23, + "learning_rate": 1.5370665216884778e-07, + "loss": 0.0029, + "step": 11971 + }, + { + "epoch": 0.23, + "learning_rate": 1.5370276882451165e-07, + "loss": 0.0091, + "step": 11972 + }, + { + "epoch": 0.23, + "learning_rate": 1.536988854801755e-07, + "loss": 0.0014, + "step": 11973 + }, + { + "epoch": 0.23, + "learning_rate": 1.5369500213583937e-07, + "loss": 0.0022, + "step": 11974 + }, + { + "epoch": 0.23, + "learning_rate": 1.5369111879150322e-07, + "loss": 0.002, + "step": 11975 + }, + { + "epoch": 0.23, + "learning_rate": 1.5368723544716709e-07, + "loss": 0.0015, + "step": 11976 + }, + { + "epoch": 0.23, + "learning_rate": 1.5368335210283093e-07, + "loss": 0.0025, + "step": 11977 + }, + { + "epoch": 0.23, + "learning_rate": 1.536794687584948e-07, + "loss": 0.0018, + "step": 11978 + }, + { + "epoch": 0.23, + "learning_rate": 1.5367558541415865e-07, + "loss": 0.6632, + "step": 11979 + }, + { + "epoch": 0.23, + "learning_rate": 1.5367170206982252e-07, + "loss": 0.0018, + "step": 11980 + }, + { + "epoch": 0.23, + "learning_rate": 1.5366781872548636e-07, + "loss": 0.0023, + "step": 11981 + }, + { + "epoch": 0.23, + "learning_rate": 1.5366393538115024e-07, + "loss": 0.0536, + "step": 11982 + }, + { + "epoch": 0.23, + "learning_rate": 1.5366005203681408e-07, + "loss": 0.0017, + "step": 11983 + }, + { + "epoch": 0.23, + "learning_rate": 1.5365616869247795e-07, + "loss": 0.0051, + "step": 11984 + }, + { + "epoch": 0.23, + "learning_rate": 1.536522853481418e-07, + "loss": 0.5664, + "step": 11985 + }, + { + "epoch": 0.23, + "learning_rate": 1.5364840200380567e-07, + "loss": 0.0018, + "step": 11986 + }, + { + "epoch": 0.23, + "learning_rate": 1.5364451865946951e-07, + "loss": 0.0032, + "step": 11987 + }, + { + "epoch": 0.23, + "learning_rate": 1.5364063531513339e-07, + "loss": 0.6741, + "step": 11988 + }, + { + "epoch": 0.23, + "learning_rate": 1.5363675197079723e-07, + "loss": 0.0054, + "step": 11989 + }, + { + "epoch": 0.23, + "learning_rate": 1.536328686264611e-07, + "loss": 0.0022, + "step": 11990 + }, + { + "epoch": 0.23, + "learning_rate": 1.5362898528212495e-07, + "loss": 0.0015, + "step": 11991 + }, + { + "epoch": 0.23, + "learning_rate": 1.5362510193778882e-07, + "loss": 0.0016, + "step": 11992 + }, + { + "epoch": 0.23, + "learning_rate": 1.5362121859345266e-07, + "loss": 0.1739, + "step": 11993 + }, + { + "epoch": 0.23, + "learning_rate": 1.5361733524911653e-07, + "loss": 0.0032, + "step": 11994 + }, + { + "epoch": 0.23, + "learning_rate": 1.5361345190478038e-07, + "loss": 0.0036, + "step": 11995 + }, + { + "epoch": 0.23, + "learning_rate": 1.5360956856044425e-07, + "loss": 0.0016, + "step": 11996 + }, + { + "epoch": 0.23, + "learning_rate": 1.536056852161081e-07, + "loss": 0.0016, + "step": 11997 + }, + { + "epoch": 0.23, + "learning_rate": 1.5360180187177197e-07, + "loss": 1.0231, + "step": 11998 + }, + { + "epoch": 0.23, + "learning_rate": 1.535979185274358e-07, + "loss": 0.01, + "step": 11999 + }, + { + "epoch": 0.23, + "learning_rate": 1.5359403518309968e-07, + "loss": 0.0058, + "step": 12000 + }, + { + "epoch": 0.23, + "learning_rate": 1.5359015183876353e-07, + "loss": 0.002, + "step": 12001 + }, + { + "epoch": 0.23, + "learning_rate": 1.535862684944274e-07, + "loss": 0.0023, + "step": 12002 + }, + { + "epoch": 0.23, + "learning_rate": 1.5358238515009125e-07, + "loss": 0.0029, + "step": 12003 + }, + { + "epoch": 0.23, + "learning_rate": 1.5357850180575512e-07, + "loss": 0.0017, + "step": 12004 + }, + { + "epoch": 0.23, + "learning_rate": 1.5357461846141896e-07, + "loss": 0.0018, + "step": 12005 + }, + { + "epoch": 0.23, + "learning_rate": 1.5357073511708283e-07, + "loss": 0.0555, + "step": 12006 + }, + { + "epoch": 0.23, + "learning_rate": 1.5356685177274668e-07, + "loss": 0.0017, + "step": 12007 + }, + { + "epoch": 0.23, + "learning_rate": 1.5356296842841055e-07, + "loss": 0.0324, + "step": 12008 + }, + { + "epoch": 0.23, + "learning_rate": 1.535590850840744e-07, + "loss": 0.0017, + "step": 12009 + }, + { + "epoch": 0.23, + "learning_rate": 1.5355520173973827e-07, + "loss": 0.0084, + "step": 12010 + }, + { + "epoch": 0.23, + "learning_rate": 1.535513183954021e-07, + "loss": 0.0018, + "step": 12011 + }, + { + "epoch": 0.23, + "learning_rate": 1.5354743505106598e-07, + "loss": 0.0018, + "step": 12012 + }, + { + "epoch": 0.23, + "learning_rate": 1.5354355170672983e-07, + "loss": 0.0024, + "step": 12013 + }, + { + "epoch": 0.23, + "learning_rate": 1.535396683623937e-07, + "loss": 0.0061, + "step": 12014 + }, + { + "epoch": 0.23, + "learning_rate": 1.5353578501805754e-07, + "loss": 0.0017, + "step": 12015 + }, + { + "epoch": 0.23, + "learning_rate": 1.5353190167372142e-07, + "loss": 0.0016, + "step": 12016 + }, + { + "epoch": 0.23, + "learning_rate": 1.5352801832938526e-07, + "loss": 0.0018, + "step": 12017 + }, + { + "epoch": 0.23, + "learning_rate": 1.5352413498504913e-07, + "loss": 0.005, + "step": 12018 + }, + { + "epoch": 0.23, + "learning_rate": 1.5352025164071298e-07, + "loss": 0.0063, + "step": 12019 + }, + { + "epoch": 0.23, + "learning_rate": 1.5351636829637685e-07, + "loss": 0.0019, + "step": 12020 + }, + { + "epoch": 0.23, + "learning_rate": 1.535124849520407e-07, + "loss": 0.0024, + "step": 12021 + }, + { + "epoch": 0.23, + "learning_rate": 1.5350860160770457e-07, + "loss": 0.0037, + "step": 12022 + }, + { + "epoch": 0.23, + "learning_rate": 1.535047182633684e-07, + "loss": 0.0018, + "step": 12023 + }, + { + "epoch": 0.23, + "learning_rate": 1.5350083491903228e-07, + "loss": 0.6346, + "step": 12024 + }, + { + "epoch": 0.23, + "learning_rate": 1.5349695157469613e-07, + "loss": 0.0038, + "step": 12025 + }, + { + "epoch": 0.23, + "learning_rate": 1.5349306823036e-07, + "loss": 0.0127, + "step": 12026 + }, + { + "epoch": 0.23, + "learning_rate": 1.5348918488602382e-07, + "loss": 0.3674, + "step": 12027 + }, + { + "epoch": 0.23, + "learning_rate": 1.534853015416877e-07, + "loss": 0.0028, + "step": 12028 + }, + { + "epoch": 0.23, + "learning_rate": 1.5348141819735153e-07, + "loss": 0.2787, + "step": 12029 + }, + { + "epoch": 0.23, + "learning_rate": 1.534775348530154e-07, + "loss": 0.0017, + "step": 12030 + }, + { + "epoch": 0.23, + "learning_rate": 1.5347365150867925e-07, + "loss": 0.2196, + "step": 12031 + }, + { + "epoch": 0.23, + "learning_rate": 1.5346976816434312e-07, + "loss": 0.0081, + "step": 12032 + }, + { + "epoch": 0.23, + "learning_rate": 1.5346588482000697e-07, + "loss": 0.0035, + "step": 12033 + }, + { + "epoch": 0.23, + "learning_rate": 1.5346200147567084e-07, + "loss": 0.0066, + "step": 12034 + }, + { + "epoch": 0.23, + "learning_rate": 1.5345811813133468e-07, + "loss": 0.0267, + "step": 12035 + }, + { + "epoch": 0.23, + "learning_rate": 1.5345423478699855e-07, + "loss": 0.0047, + "step": 12036 + }, + { + "epoch": 0.23, + "learning_rate": 1.534503514426624e-07, + "loss": 0.0032, + "step": 12037 + }, + { + "epoch": 0.23, + "learning_rate": 1.5344646809832627e-07, + "loss": 0.0025, + "step": 12038 + }, + { + "epoch": 0.23, + "learning_rate": 1.5344258475399012e-07, + "loss": 0.0016, + "step": 12039 + }, + { + "epoch": 0.23, + "learning_rate": 1.53438701409654e-07, + "loss": 1.171, + "step": 12040 + }, + { + "epoch": 0.23, + "learning_rate": 1.5343481806531783e-07, + "loss": 0.0022, + "step": 12041 + }, + { + "epoch": 0.23, + "learning_rate": 1.534309347209817e-07, + "loss": 0.0014, + "step": 12042 + }, + { + "epoch": 0.23, + "learning_rate": 1.5342705137664555e-07, + "loss": 0.0017, + "step": 12043 + }, + { + "epoch": 0.23, + "learning_rate": 1.5342316803230942e-07, + "loss": 0.0022, + "step": 12044 + }, + { + "epoch": 0.23, + "learning_rate": 1.5341928468797327e-07, + "loss": 0.0051, + "step": 12045 + }, + { + "epoch": 0.23, + "learning_rate": 1.5341540134363714e-07, + "loss": 0.5712, + "step": 12046 + }, + { + "epoch": 0.23, + "learning_rate": 1.5341151799930098e-07, + "loss": 0.0264, + "step": 12047 + }, + { + "epoch": 0.23, + "learning_rate": 1.5340763465496485e-07, + "loss": 0.0043, + "step": 12048 + }, + { + "epoch": 0.23, + "learning_rate": 1.534037513106287e-07, + "loss": 0.0041, + "step": 12049 + }, + { + "epoch": 0.23, + "learning_rate": 1.5339986796629257e-07, + "loss": 0.0017, + "step": 12050 + }, + { + "epoch": 0.23, + "learning_rate": 1.5339598462195642e-07, + "loss": 0.0024, + "step": 12051 + }, + { + "epoch": 0.23, + "learning_rate": 1.5339210127762029e-07, + "loss": 0.0292, + "step": 12052 + }, + { + "epoch": 0.23, + "learning_rate": 1.5338821793328413e-07, + "loss": 0.0202, + "step": 12053 + }, + { + "epoch": 0.23, + "learning_rate": 1.53384334588948e-07, + "loss": 0.4264, + "step": 12054 + }, + { + "epoch": 0.23, + "learning_rate": 1.5338045124461185e-07, + "loss": 0.0022, + "step": 12055 + }, + { + "epoch": 0.23, + "learning_rate": 1.5337656790027572e-07, + "loss": 0.002, + "step": 12056 + }, + { + "epoch": 0.23, + "learning_rate": 1.5337268455593956e-07, + "loss": 0.0021, + "step": 12057 + }, + { + "epoch": 0.23, + "learning_rate": 1.5336880121160344e-07, + "loss": 0.0017, + "step": 12058 + }, + { + "epoch": 0.23, + "learning_rate": 1.5336491786726728e-07, + "loss": 0.002, + "step": 12059 + }, + { + "epoch": 0.23, + "learning_rate": 1.5336103452293115e-07, + "loss": 0.0025, + "step": 12060 + }, + { + "epoch": 0.23, + "learning_rate": 1.53357151178595e-07, + "loss": 0.0026, + "step": 12061 + }, + { + "epoch": 0.23, + "learning_rate": 1.5335326783425887e-07, + "loss": 0.0024, + "step": 12062 + }, + { + "epoch": 0.23, + "learning_rate": 1.5334938448992271e-07, + "loss": 2.1192, + "step": 12063 + }, + { + "epoch": 0.23, + "learning_rate": 1.5334550114558659e-07, + "loss": 0.003, + "step": 12064 + }, + { + "epoch": 0.23, + "learning_rate": 1.5334161780125043e-07, + "loss": 0.0021, + "step": 12065 + }, + { + "epoch": 0.23, + "learning_rate": 1.533377344569143e-07, + "loss": 0.0019, + "step": 12066 + }, + { + "epoch": 0.23, + "learning_rate": 1.5333385111257815e-07, + "loss": 0.0021, + "step": 12067 + }, + { + "epoch": 0.23, + "learning_rate": 1.5332996776824202e-07, + "loss": 0.0018, + "step": 12068 + }, + { + "epoch": 0.23, + "learning_rate": 1.5332608442390586e-07, + "loss": 0.0121, + "step": 12069 + }, + { + "epoch": 0.23, + "learning_rate": 1.5332220107956974e-07, + "loss": 0.0017, + "step": 12070 + }, + { + "epoch": 0.23, + "learning_rate": 1.5331831773523358e-07, + "loss": 0.3339, + "step": 12071 + }, + { + "epoch": 0.23, + "learning_rate": 1.5331443439089745e-07, + "loss": 0.5142, + "step": 12072 + }, + { + "epoch": 0.23, + "learning_rate": 1.533105510465613e-07, + "loss": 0.002, + "step": 12073 + }, + { + "epoch": 0.23, + "learning_rate": 1.5330666770222517e-07, + "loss": 0.0876, + "step": 12074 + }, + { + "epoch": 0.23, + "learning_rate": 1.53302784357889e-07, + "loss": 0.0116, + "step": 12075 + }, + { + "epoch": 0.23, + "learning_rate": 1.5329890101355288e-07, + "loss": 0.0024, + "step": 12076 + }, + { + "epoch": 0.23, + "learning_rate": 1.5329501766921673e-07, + "loss": 0.0021, + "step": 12077 + }, + { + "epoch": 0.23, + "learning_rate": 1.532911343248806e-07, + "loss": 0.0018, + "step": 12078 + }, + { + "epoch": 0.23, + "learning_rate": 1.5328725098054445e-07, + "loss": 0.9751, + "step": 12079 + }, + { + "epoch": 0.23, + "learning_rate": 1.5328336763620832e-07, + "loss": 0.0021, + "step": 12080 + }, + { + "epoch": 0.23, + "learning_rate": 1.5327948429187216e-07, + "loss": 0.0021, + "step": 12081 + }, + { + "epoch": 0.23, + "learning_rate": 1.5327560094753603e-07, + "loss": 0.0014, + "step": 12082 + }, + { + "epoch": 0.23, + "learning_rate": 1.5327171760319988e-07, + "loss": 0.0018, + "step": 12083 + }, + { + "epoch": 0.23, + "learning_rate": 1.5326783425886375e-07, + "loss": 0.0067, + "step": 12084 + }, + { + "epoch": 0.23, + "learning_rate": 1.5326395091452757e-07, + "loss": 0.0275, + "step": 12085 + }, + { + "epoch": 0.23, + "learning_rate": 1.5326006757019144e-07, + "loss": 0.0035, + "step": 12086 + }, + { + "epoch": 0.23, + "learning_rate": 1.5325618422585529e-07, + "loss": 0.0018, + "step": 12087 + }, + { + "epoch": 0.23, + "learning_rate": 1.5325230088151916e-07, + "loss": 0.0037, + "step": 12088 + }, + { + "epoch": 0.23, + "learning_rate": 1.53248417537183e-07, + "loss": 0.0025, + "step": 12089 + }, + { + "epoch": 0.23, + "learning_rate": 1.5324453419284687e-07, + "loss": 0.4024, + "step": 12090 + }, + { + "epoch": 0.23, + "learning_rate": 1.5324065084851072e-07, + "loss": 0.0022, + "step": 12091 + }, + { + "epoch": 0.23, + "learning_rate": 1.532367675041746e-07, + "loss": 0.3118, + "step": 12092 + }, + { + "epoch": 0.23, + "learning_rate": 1.5323288415983843e-07, + "loss": 0.0022, + "step": 12093 + }, + { + "epoch": 0.23, + "learning_rate": 1.532290008155023e-07, + "loss": 0.0022, + "step": 12094 + }, + { + "epoch": 0.23, + "learning_rate": 1.5322511747116615e-07, + "loss": 0.0016, + "step": 12095 + }, + { + "epoch": 0.23, + "learning_rate": 1.5322123412683002e-07, + "loss": 0.0016, + "step": 12096 + }, + { + "epoch": 0.23, + "learning_rate": 1.5321735078249387e-07, + "loss": 0.0022, + "step": 12097 + }, + { + "epoch": 0.23, + "learning_rate": 1.5321346743815774e-07, + "loss": 0.0019, + "step": 12098 + }, + { + "epoch": 0.23, + "learning_rate": 1.5320958409382158e-07, + "loss": 0.5229, + "step": 12099 + }, + { + "epoch": 0.23, + "learning_rate": 1.5320570074948546e-07, + "loss": 0.0022, + "step": 12100 + }, + { + "epoch": 0.23, + "learning_rate": 1.532018174051493e-07, + "loss": 0.0026, + "step": 12101 + }, + { + "epoch": 0.23, + "learning_rate": 1.5319793406081317e-07, + "loss": 0.0134, + "step": 12102 + }, + { + "epoch": 0.23, + "learning_rate": 1.5319405071647702e-07, + "loss": 0.0021, + "step": 12103 + }, + { + "epoch": 0.23, + "learning_rate": 1.531901673721409e-07, + "loss": 0.0019, + "step": 12104 + }, + { + "epoch": 0.23, + "learning_rate": 1.5318628402780473e-07, + "loss": 0.0026, + "step": 12105 + }, + { + "epoch": 0.23, + "learning_rate": 1.531824006834686e-07, + "loss": 0.0018, + "step": 12106 + }, + { + "epoch": 0.23, + "learning_rate": 1.5317851733913245e-07, + "loss": 0.075, + "step": 12107 + }, + { + "epoch": 0.23, + "learning_rate": 1.5317463399479632e-07, + "loss": 0.0015, + "step": 12108 + }, + { + "epoch": 0.23, + "learning_rate": 1.5317075065046017e-07, + "loss": 0.0017, + "step": 12109 + }, + { + "epoch": 0.23, + "learning_rate": 1.5316686730612404e-07, + "loss": 0.0015, + "step": 12110 + }, + { + "epoch": 0.23, + "learning_rate": 1.5316298396178788e-07, + "loss": 0.0017, + "step": 12111 + }, + { + "epoch": 0.23, + "learning_rate": 1.5315910061745175e-07, + "loss": 0.0021, + "step": 12112 + }, + { + "epoch": 0.23, + "learning_rate": 1.531552172731156e-07, + "loss": 0.0073, + "step": 12113 + }, + { + "epoch": 0.23, + "learning_rate": 1.5315133392877947e-07, + "loss": 0.0025, + "step": 12114 + }, + { + "epoch": 0.24, + "learning_rate": 1.5314745058444332e-07, + "loss": 0.0017, + "step": 12115 + }, + { + "epoch": 0.24, + "learning_rate": 1.5314356724010716e-07, + "loss": 0.0018, + "step": 12116 + }, + { + "epoch": 0.24, + "learning_rate": 1.5313968389577103e-07, + "loss": 0.0016, + "step": 12117 + }, + { + "epoch": 0.24, + "learning_rate": 1.5313580055143488e-07, + "loss": 0.0021, + "step": 12118 + }, + { + "epoch": 0.24, + "learning_rate": 1.5313191720709875e-07, + "loss": 0.0026, + "step": 12119 + }, + { + "epoch": 0.24, + "learning_rate": 1.531280338627626e-07, + "loss": 0.0016, + "step": 12120 + }, + { + "epoch": 0.24, + "learning_rate": 1.5312415051842647e-07, + "loss": 0.0018, + "step": 12121 + }, + { + "epoch": 0.24, + "learning_rate": 1.531202671740903e-07, + "loss": 0.018, + "step": 12122 + }, + { + "epoch": 0.24, + "learning_rate": 1.5311638382975418e-07, + "loss": 0.002, + "step": 12123 + }, + { + "epoch": 0.24, + "learning_rate": 1.5311250048541803e-07, + "loss": 0.1462, + "step": 12124 + }, + { + "epoch": 0.24, + "learning_rate": 1.531086171410819e-07, + "loss": 0.0014, + "step": 12125 + }, + { + "epoch": 0.24, + "learning_rate": 1.5310473379674574e-07, + "loss": 0.0018, + "step": 12126 + }, + { + "epoch": 0.24, + "learning_rate": 1.5310085045240962e-07, + "loss": 0.003, + "step": 12127 + }, + { + "epoch": 0.24, + "learning_rate": 1.5309696710807346e-07, + "loss": 0.0053, + "step": 12128 + }, + { + "epoch": 0.24, + "learning_rate": 1.5309308376373733e-07, + "loss": 0.0032, + "step": 12129 + }, + { + "epoch": 0.24, + "learning_rate": 1.5308920041940118e-07, + "loss": 0.0069, + "step": 12130 + }, + { + "epoch": 0.24, + "learning_rate": 1.5308531707506505e-07, + "loss": 0.0022, + "step": 12131 + }, + { + "epoch": 0.24, + "learning_rate": 1.530814337307289e-07, + "loss": 0.0022, + "step": 12132 + }, + { + "epoch": 0.24, + "learning_rate": 1.5307755038639276e-07, + "loss": 0.0016, + "step": 12133 + }, + { + "epoch": 0.24, + "learning_rate": 1.530736670420566e-07, + "loss": 0.0043, + "step": 12134 + }, + { + "epoch": 0.24, + "learning_rate": 1.5306978369772048e-07, + "loss": 0.5441, + "step": 12135 + }, + { + "epoch": 0.24, + "learning_rate": 1.5306590035338433e-07, + "loss": 0.0039, + "step": 12136 + }, + { + "epoch": 0.24, + "learning_rate": 1.530620170090482e-07, + "loss": 0.002, + "step": 12137 + }, + { + "epoch": 0.24, + "learning_rate": 1.5305813366471204e-07, + "loss": 0.5498, + "step": 12138 + }, + { + "epoch": 0.24, + "learning_rate": 1.5305425032037591e-07, + "loss": 0.6588, + "step": 12139 + }, + { + "epoch": 0.24, + "learning_rate": 1.5305036697603976e-07, + "loss": 0.0084, + "step": 12140 + }, + { + "epoch": 0.24, + "learning_rate": 1.5304648363170363e-07, + "loss": 0.0028, + "step": 12141 + }, + { + "epoch": 0.24, + "learning_rate": 1.5304260028736748e-07, + "loss": 0.0021, + "step": 12142 + }, + { + "epoch": 0.24, + "learning_rate": 1.5303871694303132e-07, + "loss": 0.0023, + "step": 12143 + }, + { + "epoch": 0.24, + "learning_rate": 1.5303483359869517e-07, + "loss": 0.0034, + "step": 12144 + }, + { + "epoch": 0.24, + "learning_rate": 1.5303095025435904e-07, + "loss": 0.0026, + "step": 12145 + }, + { + "epoch": 0.24, + "learning_rate": 1.5302706691002288e-07, + "loss": 0.9874, + "step": 12146 + }, + { + "epoch": 0.24, + "learning_rate": 1.5302318356568675e-07, + "loss": 0.3296, + "step": 12147 + }, + { + "epoch": 0.24, + "learning_rate": 1.530193002213506e-07, + "loss": 0.0016, + "step": 12148 + }, + { + "epoch": 0.24, + "learning_rate": 1.5301541687701447e-07, + "loss": 0.0017, + "step": 12149 + }, + { + "epoch": 0.24, + "learning_rate": 1.5301153353267832e-07, + "loss": 0.0644, + "step": 12150 + }, + { + "epoch": 0.24, + "learning_rate": 1.5300765018834219e-07, + "loss": 0.0017, + "step": 12151 + }, + { + "epoch": 0.24, + "learning_rate": 1.5300376684400603e-07, + "loss": 0.0028, + "step": 12152 + }, + { + "epoch": 0.24, + "learning_rate": 1.529998834996699e-07, + "loss": 0.6954, + "step": 12153 + }, + { + "epoch": 0.24, + "learning_rate": 1.5299600015533375e-07, + "loss": 0.0016, + "step": 12154 + }, + { + "epoch": 0.24, + "learning_rate": 1.5299211681099762e-07, + "loss": 0.0077, + "step": 12155 + }, + { + "epoch": 0.24, + "learning_rate": 1.5298823346666146e-07, + "loss": 0.011, + "step": 12156 + }, + { + "epoch": 0.24, + "learning_rate": 1.5298435012232534e-07, + "loss": 0.0023, + "step": 12157 + }, + { + "epoch": 0.24, + "learning_rate": 1.5298046677798918e-07, + "loss": 0.138, + "step": 12158 + }, + { + "epoch": 0.24, + "learning_rate": 1.5297658343365305e-07, + "loss": 0.0034, + "step": 12159 + }, + { + "epoch": 0.24, + "learning_rate": 1.529727000893169e-07, + "loss": 0.0025, + "step": 12160 + }, + { + "epoch": 0.24, + "learning_rate": 1.5296881674498077e-07, + "loss": 1.0676, + "step": 12161 + }, + { + "epoch": 0.24, + "learning_rate": 1.5296493340064461e-07, + "loss": 0.0021, + "step": 12162 + }, + { + "epoch": 0.24, + "learning_rate": 1.5296105005630849e-07, + "loss": 0.1189, + "step": 12163 + }, + { + "epoch": 0.24, + "learning_rate": 1.5295716671197233e-07, + "loss": 0.0038, + "step": 12164 + }, + { + "epoch": 0.24, + "learning_rate": 1.529532833676362e-07, + "loss": 0.0018, + "step": 12165 + }, + { + "epoch": 0.24, + "learning_rate": 1.5294940002330005e-07, + "loss": 0.0012, + "step": 12166 + }, + { + "epoch": 0.24, + "learning_rate": 1.5294551667896392e-07, + "loss": 0.0027, + "step": 12167 + }, + { + "epoch": 0.24, + "learning_rate": 1.5294163333462776e-07, + "loss": 0.0015, + "step": 12168 + }, + { + "epoch": 0.24, + "learning_rate": 1.5293774999029164e-07, + "loss": 0.0021, + "step": 12169 + }, + { + "epoch": 0.24, + "learning_rate": 1.5293386664595548e-07, + "loss": 0.003, + "step": 12170 + }, + { + "epoch": 0.24, + "learning_rate": 1.5292998330161935e-07, + "loss": 0.0017, + "step": 12171 + }, + { + "epoch": 0.24, + "learning_rate": 1.529260999572832e-07, + "loss": 0.0861, + "step": 12172 + }, + { + "epoch": 0.24, + "learning_rate": 1.5292221661294707e-07, + "loss": 0.0142, + "step": 12173 + }, + { + "epoch": 0.24, + "learning_rate": 1.529183332686109e-07, + "loss": 0.0018, + "step": 12174 + }, + { + "epoch": 0.24, + "learning_rate": 1.5291444992427478e-07, + "loss": 0.0051, + "step": 12175 + }, + { + "epoch": 0.24, + "learning_rate": 1.5291056657993863e-07, + "loss": 0.002, + "step": 12176 + }, + { + "epoch": 0.24, + "learning_rate": 1.529066832356025e-07, + "loss": 0.002, + "step": 12177 + }, + { + "epoch": 0.24, + "learning_rate": 1.5290279989126635e-07, + "loss": 0.0019, + "step": 12178 + }, + { + "epoch": 0.24, + "learning_rate": 1.5289891654693022e-07, + "loss": 1.326, + "step": 12179 + }, + { + "epoch": 0.24, + "learning_rate": 1.5289503320259406e-07, + "loss": 0.0017, + "step": 12180 + }, + { + "epoch": 0.24, + "learning_rate": 1.5289114985825793e-07, + "loss": 0.0023, + "step": 12181 + }, + { + "epoch": 0.24, + "learning_rate": 1.5288726651392178e-07, + "loss": 0.0016, + "step": 12182 + }, + { + "epoch": 0.24, + "learning_rate": 1.5288338316958565e-07, + "loss": 0.0026, + "step": 12183 + }, + { + "epoch": 0.24, + "learning_rate": 1.528794998252495e-07, + "loss": 0.0046, + "step": 12184 + }, + { + "epoch": 0.24, + "learning_rate": 1.5287561648091337e-07, + "loss": 0.0037, + "step": 12185 + }, + { + "epoch": 0.24, + "learning_rate": 1.528717331365772e-07, + "loss": 0.5026, + "step": 12186 + }, + { + "epoch": 0.24, + "learning_rate": 1.5286784979224108e-07, + "loss": 0.0027, + "step": 12187 + }, + { + "epoch": 0.24, + "learning_rate": 1.5286396644790493e-07, + "loss": 0.002, + "step": 12188 + }, + { + "epoch": 0.24, + "learning_rate": 1.528600831035688e-07, + "loss": 0.0019, + "step": 12189 + }, + { + "epoch": 0.24, + "learning_rate": 1.5285619975923264e-07, + "loss": 0.0017, + "step": 12190 + }, + { + "epoch": 0.24, + "learning_rate": 1.5285231641489652e-07, + "loss": 0.0035, + "step": 12191 + }, + { + "epoch": 0.24, + "learning_rate": 1.5284843307056036e-07, + "loss": 0.002, + "step": 12192 + }, + { + "epoch": 0.24, + "learning_rate": 1.5284454972622423e-07, + "loss": 0.0124, + "step": 12193 + }, + { + "epoch": 0.24, + "learning_rate": 1.5284066638188808e-07, + "loss": 0.0032, + "step": 12194 + }, + { + "epoch": 0.24, + "learning_rate": 1.5283678303755195e-07, + "loss": 0.1171, + "step": 12195 + }, + { + "epoch": 0.24, + "learning_rate": 1.528328996932158e-07, + "loss": 0.0016, + "step": 12196 + }, + { + "epoch": 0.24, + "learning_rate": 1.5282901634887967e-07, + "loss": 0.0017, + "step": 12197 + }, + { + "epoch": 0.24, + "learning_rate": 1.528251330045435e-07, + "loss": 0.0017, + "step": 12198 + }, + { + "epoch": 0.24, + "learning_rate": 1.5282124966020738e-07, + "loss": 0.7138, + "step": 12199 + }, + { + "epoch": 0.24, + "learning_rate": 1.5281736631587123e-07, + "loss": 0.002, + "step": 12200 + }, + { + "epoch": 0.24, + "learning_rate": 1.5281348297153507e-07, + "loss": 0.0024, + "step": 12201 + }, + { + "epoch": 0.24, + "learning_rate": 1.5280959962719892e-07, + "loss": 0.0051, + "step": 12202 + }, + { + "epoch": 0.24, + "learning_rate": 1.528057162828628e-07, + "loss": 0.0032, + "step": 12203 + }, + { + "epoch": 0.24, + "learning_rate": 1.5280183293852663e-07, + "loss": 0.0034, + "step": 12204 + }, + { + "epoch": 0.24, + "learning_rate": 1.527979495941905e-07, + "loss": 0.2124, + "step": 12205 + }, + { + "epoch": 0.24, + "learning_rate": 1.5279406624985435e-07, + "loss": 0.0029, + "step": 12206 + }, + { + "epoch": 0.24, + "learning_rate": 1.5279018290551822e-07, + "loss": 0.1063, + "step": 12207 + }, + { + "epoch": 0.24, + "learning_rate": 1.5278629956118207e-07, + "loss": 0.0159, + "step": 12208 + }, + { + "epoch": 0.24, + "learning_rate": 1.5278241621684594e-07, + "loss": 0.0029, + "step": 12209 + }, + { + "epoch": 0.24, + "learning_rate": 1.5277853287250978e-07, + "loss": 0.0016, + "step": 12210 + }, + { + "epoch": 0.24, + "learning_rate": 1.5277464952817365e-07, + "loss": 0.0019, + "step": 12211 + }, + { + "epoch": 0.24, + "learning_rate": 1.527707661838375e-07, + "loss": 0.0019, + "step": 12212 + }, + { + "epoch": 0.24, + "learning_rate": 1.5276688283950137e-07, + "loss": 0.0098, + "step": 12213 + }, + { + "epoch": 0.24, + "learning_rate": 1.5276299949516522e-07, + "loss": 0.0057, + "step": 12214 + }, + { + "epoch": 0.24, + "learning_rate": 1.527591161508291e-07, + "loss": 0.0022, + "step": 12215 + }, + { + "epoch": 0.24, + "learning_rate": 1.5275523280649293e-07, + "loss": 0.0018, + "step": 12216 + }, + { + "epoch": 0.24, + "learning_rate": 1.527513494621568e-07, + "loss": 0.002, + "step": 12217 + }, + { + "epoch": 0.24, + "learning_rate": 1.5274746611782065e-07, + "loss": 0.0027, + "step": 12218 + }, + { + "epoch": 0.24, + "learning_rate": 1.5274358277348452e-07, + "loss": 0.0111, + "step": 12219 + }, + { + "epoch": 0.24, + "learning_rate": 1.5273969942914837e-07, + "loss": 0.2035, + "step": 12220 + }, + { + "epoch": 0.24, + "learning_rate": 1.5273581608481224e-07, + "loss": 0.0045, + "step": 12221 + }, + { + "epoch": 0.24, + "learning_rate": 1.5273193274047608e-07, + "loss": 0.002, + "step": 12222 + }, + { + "epoch": 0.24, + "learning_rate": 1.5272804939613995e-07, + "loss": 0.0015, + "step": 12223 + }, + { + "epoch": 0.24, + "learning_rate": 1.527241660518038e-07, + "loss": 0.0022, + "step": 12224 + }, + { + "epoch": 0.24, + "learning_rate": 1.5272028270746767e-07, + "loss": 0.0017, + "step": 12225 + }, + { + "epoch": 0.24, + "learning_rate": 1.5271639936313152e-07, + "loss": 0.0024, + "step": 12226 + }, + { + "epoch": 0.24, + "learning_rate": 1.5271251601879539e-07, + "loss": 0.0018, + "step": 12227 + }, + { + "epoch": 0.24, + "learning_rate": 1.5270863267445923e-07, + "loss": 0.0017, + "step": 12228 + }, + { + "epoch": 0.24, + "learning_rate": 1.527047493301231e-07, + "loss": 0.0032, + "step": 12229 + }, + { + "epoch": 0.24, + "learning_rate": 1.5270086598578695e-07, + "loss": 0.0026, + "step": 12230 + }, + { + "epoch": 0.24, + "learning_rate": 1.5269698264145082e-07, + "loss": 0.003, + "step": 12231 + }, + { + "epoch": 0.24, + "learning_rate": 1.5269309929711466e-07, + "loss": 0.0036, + "step": 12232 + }, + { + "epoch": 0.24, + "learning_rate": 1.5268921595277854e-07, + "loss": 0.015, + "step": 12233 + }, + { + "epoch": 0.24, + "learning_rate": 1.5268533260844238e-07, + "loss": 0.0019, + "step": 12234 + }, + { + "epoch": 0.24, + "learning_rate": 1.5268144926410625e-07, + "loss": 0.5313, + "step": 12235 + }, + { + "epoch": 0.24, + "learning_rate": 1.526775659197701e-07, + "loss": 0.4875, + "step": 12236 + }, + { + "epoch": 0.24, + "learning_rate": 1.5267368257543397e-07, + "loss": 0.0015, + "step": 12237 + }, + { + "epoch": 0.24, + "learning_rate": 1.5266979923109781e-07, + "loss": 0.0014, + "step": 12238 + }, + { + "epoch": 0.24, + "learning_rate": 1.5266591588676169e-07, + "loss": 0.0016, + "step": 12239 + }, + { + "epoch": 0.24, + "learning_rate": 1.5266203254242553e-07, + "loss": 0.2863, + "step": 12240 + }, + { + "epoch": 0.24, + "learning_rate": 1.526581491980894e-07, + "loss": 0.005, + "step": 12241 + }, + { + "epoch": 0.24, + "learning_rate": 1.5265426585375325e-07, + "loss": 0.0018, + "step": 12242 + }, + { + "epoch": 0.24, + "learning_rate": 1.5265038250941712e-07, + "loss": 0.0027, + "step": 12243 + }, + { + "epoch": 0.24, + "learning_rate": 1.5264649916508096e-07, + "loss": 0.0021, + "step": 12244 + }, + { + "epoch": 0.24, + "learning_rate": 1.5264261582074484e-07, + "loss": 0.002, + "step": 12245 + }, + { + "epoch": 0.24, + "learning_rate": 1.5263873247640868e-07, + "loss": 0.0018, + "step": 12246 + }, + { + "epoch": 0.24, + "learning_rate": 1.5263484913207255e-07, + "loss": 0.007, + "step": 12247 + }, + { + "epoch": 0.24, + "learning_rate": 1.526309657877364e-07, + "loss": 0.0021, + "step": 12248 + }, + { + "epoch": 0.24, + "learning_rate": 1.5262708244340027e-07, + "loss": 0.0027, + "step": 12249 + }, + { + "epoch": 0.24, + "learning_rate": 1.526231990990641e-07, + "loss": 0.0017, + "step": 12250 + }, + { + "epoch": 0.24, + "learning_rate": 1.5261931575472798e-07, + "loss": 0.0061, + "step": 12251 + }, + { + "epoch": 0.24, + "learning_rate": 1.5261543241039183e-07, + "loss": 0.0019, + "step": 12252 + }, + { + "epoch": 0.24, + "learning_rate": 1.526115490660557e-07, + "loss": 0.0019, + "step": 12253 + }, + { + "epoch": 0.24, + "learning_rate": 1.5260766572171955e-07, + "loss": 0.0062, + "step": 12254 + }, + { + "epoch": 0.24, + "learning_rate": 1.5260378237738342e-07, + "loss": 0.0037, + "step": 12255 + }, + { + "epoch": 0.24, + "learning_rate": 1.5259989903304726e-07, + "loss": 0.0046, + "step": 12256 + }, + { + "epoch": 0.24, + "learning_rate": 1.5259601568871113e-07, + "loss": 0.0017, + "step": 12257 + }, + { + "epoch": 0.24, + "learning_rate": 1.5259213234437498e-07, + "loss": 0.0017, + "step": 12258 + }, + { + "epoch": 0.24, + "learning_rate": 1.5258824900003882e-07, + "loss": 0.0017, + "step": 12259 + }, + { + "epoch": 0.24, + "learning_rate": 1.5258436565570267e-07, + "loss": 0.0017, + "step": 12260 + }, + { + "epoch": 0.24, + "learning_rate": 1.5258048231136654e-07, + "loss": 0.0042, + "step": 12261 + }, + { + "epoch": 0.24, + "learning_rate": 1.5257659896703039e-07, + "loss": 0.0042, + "step": 12262 + }, + { + "epoch": 0.24, + "learning_rate": 1.5257271562269426e-07, + "loss": 0.008, + "step": 12263 + }, + { + "epoch": 0.24, + "learning_rate": 1.525688322783581e-07, + "loss": 0.0017, + "step": 12264 + }, + { + "epoch": 0.24, + "learning_rate": 1.5256494893402197e-07, + "loss": 0.3114, + "step": 12265 + }, + { + "epoch": 0.24, + "learning_rate": 1.5256106558968582e-07, + "loss": 1.1665, + "step": 12266 + }, + { + "epoch": 0.24, + "learning_rate": 1.525571822453497e-07, + "loss": 0.0028, + "step": 12267 + }, + { + "epoch": 0.24, + "learning_rate": 1.5255329890101354e-07, + "loss": 0.0015, + "step": 12268 + }, + { + "epoch": 0.24, + "learning_rate": 1.525494155566774e-07, + "loss": 0.0067, + "step": 12269 + }, + { + "epoch": 0.24, + "learning_rate": 1.5254553221234125e-07, + "loss": 0.0017, + "step": 12270 + }, + { + "epoch": 0.24, + "learning_rate": 1.5254164886800512e-07, + "loss": 0.004, + "step": 12271 + }, + { + "epoch": 0.24, + "learning_rate": 1.5253776552366897e-07, + "loss": 0.6732, + "step": 12272 + }, + { + "epoch": 0.24, + "learning_rate": 1.5253388217933284e-07, + "loss": 0.0024, + "step": 12273 + }, + { + "epoch": 0.24, + "learning_rate": 1.5252999883499668e-07, + "loss": 0.002, + "step": 12274 + }, + { + "epoch": 0.24, + "learning_rate": 1.5252611549066056e-07, + "loss": 0.0034, + "step": 12275 + }, + { + "epoch": 0.24, + "learning_rate": 1.525222321463244e-07, + "loss": 0.8929, + "step": 12276 + }, + { + "epoch": 0.24, + "learning_rate": 1.5251834880198827e-07, + "loss": 0.0028, + "step": 12277 + }, + { + "epoch": 0.24, + "learning_rate": 1.5251446545765212e-07, + "loss": 0.0022, + "step": 12278 + }, + { + "epoch": 0.24, + "learning_rate": 1.52510582113316e-07, + "loss": 0.5584, + "step": 12279 + }, + { + "epoch": 0.24, + "learning_rate": 1.5250669876897983e-07, + "loss": 0.0147, + "step": 12280 + }, + { + "epoch": 0.24, + "learning_rate": 1.525028154246437e-07, + "loss": 0.002, + "step": 12281 + }, + { + "epoch": 0.24, + "learning_rate": 1.5249893208030755e-07, + "loss": 0.0868, + "step": 12282 + }, + { + "epoch": 0.24, + "learning_rate": 1.5249504873597142e-07, + "loss": 0.0337, + "step": 12283 + }, + { + "epoch": 0.24, + "learning_rate": 1.5249116539163527e-07, + "loss": 0.0023, + "step": 12284 + }, + { + "epoch": 0.24, + "learning_rate": 1.5248728204729914e-07, + "loss": 0.0014, + "step": 12285 + }, + { + "epoch": 0.24, + "learning_rate": 1.5248339870296298e-07, + "loss": 0.0015, + "step": 12286 + }, + { + "epoch": 0.24, + "learning_rate": 1.5247951535862685e-07, + "loss": 0.0018, + "step": 12287 + }, + { + "epoch": 0.24, + "learning_rate": 1.524756320142907e-07, + "loss": 0.0018, + "step": 12288 + }, + { + "epoch": 0.24, + "learning_rate": 1.5247174866995457e-07, + "loss": 0.0256, + "step": 12289 + }, + { + "epoch": 0.24, + "learning_rate": 1.5246786532561842e-07, + "loss": 0.0016, + "step": 12290 + }, + { + "epoch": 0.24, + "learning_rate": 1.524639819812823e-07, + "loss": 0.0015, + "step": 12291 + }, + { + "epoch": 0.24, + "learning_rate": 1.5246009863694613e-07, + "loss": 0.0021, + "step": 12292 + }, + { + "epoch": 0.24, + "learning_rate": 1.5245621529260998e-07, + "loss": 0.0017, + "step": 12293 + }, + { + "epoch": 0.24, + "learning_rate": 1.5245233194827385e-07, + "loss": 0.0013, + "step": 12294 + }, + { + "epoch": 0.24, + "learning_rate": 1.524484486039377e-07, + "loss": 0.0135, + "step": 12295 + }, + { + "epoch": 0.24, + "learning_rate": 1.5244456525960157e-07, + "loss": 0.0021, + "step": 12296 + }, + { + "epoch": 0.24, + "learning_rate": 1.524406819152654e-07, + "loss": 0.0017, + "step": 12297 + }, + { + "epoch": 0.24, + "learning_rate": 1.5243679857092928e-07, + "loss": 0.0371, + "step": 12298 + }, + { + "epoch": 0.24, + "learning_rate": 1.5243291522659313e-07, + "loss": 0.0028, + "step": 12299 + }, + { + "epoch": 0.24, + "learning_rate": 1.52429031882257e-07, + "loss": 0.0024, + "step": 12300 + }, + { + "epoch": 0.24, + "learning_rate": 1.5242514853792084e-07, + "loss": 0.0018, + "step": 12301 + }, + { + "epoch": 0.24, + "learning_rate": 1.5242126519358472e-07, + "loss": 0.005, + "step": 12302 + }, + { + "epoch": 0.24, + "learning_rate": 1.5241738184924856e-07, + "loss": 0.9408, + "step": 12303 + }, + { + "epoch": 0.24, + "learning_rate": 1.5241349850491243e-07, + "loss": 0.0015, + "step": 12304 + }, + { + "epoch": 0.24, + "learning_rate": 1.5240961516057628e-07, + "loss": 0.0666, + "step": 12305 + }, + { + "epoch": 0.24, + "learning_rate": 1.5240573181624015e-07, + "loss": 0.0217, + "step": 12306 + }, + { + "epoch": 0.24, + "learning_rate": 1.52401848471904e-07, + "loss": 0.0164, + "step": 12307 + }, + { + "epoch": 0.24, + "learning_rate": 1.5239796512756786e-07, + "loss": 1.8551, + "step": 12308 + }, + { + "epoch": 0.24, + "learning_rate": 1.523940817832317e-07, + "loss": 0.0033, + "step": 12309 + }, + { + "epoch": 0.24, + "learning_rate": 1.5239019843889558e-07, + "loss": 0.0047, + "step": 12310 + }, + { + "epoch": 0.24, + "learning_rate": 1.5238631509455943e-07, + "loss": 0.0024, + "step": 12311 + }, + { + "epoch": 0.24, + "learning_rate": 1.523824317502233e-07, + "loss": 0.0109, + "step": 12312 + }, + { + "epoch": 0.24, + "learning_rate": 1.5237854840588714e-07, + "loss": 0.0034, + "step": 12313 + }, + { + "epoch": 0.24, + "learning_rate": 1.5237466506155101e-07, + "loss": 0.0027, + "step": 12314 + }, + { + "epoch": 0.24, + "learning_rate": 1.5237078171721486e-07, + "loss": 0.0056, + "step": 12315 + }, + { + "epoch": 0.24, + "learning_rate": 1.5236689837287873e-07, + "loss": 0.0019, + "step": 12316 + }, + { + "epoch": 0.24, + "learning_rate": 1.5236301502854258e-07, + "loss": 0.005, + "step": 12317 + }, + { + "epoch": 0.24, + "learning_rate": 1.5235913168420642e-07, + "loss": 0.0022, + "step": 12318 + }, + { + "epoch": 0.24, + "learning_rate": 1.523552483398703e-07, + "loss": 0.0022, + "step": 12319 + }, + { + "epoch": 0.24, + "learning_rate": 1.5235136499553414e-07, + "loss": 0.0066, + "step": 12320 + }, + { + "epoch": 0.24, + "learning_rate": 1.5234748165119798e-07, + "loss": 0.0036, + "step": 12321 + }, + { + "epoch": 0.24, + "learning_rate": 1.5234359830686185e-07, + "loss": 0.2864, + "step": 12322 + }, + { + "epoch": 0.24, + "learning_rate": 1.523397149625257e-07, + "loss": 0.0032, + "step": 12323 + }, + { + "epoch": 0.24, + "learning_rate": 1.5233583161818957e-07, + "loss": 0.002, + "step": 12324 + }, + { + "epoch": 0.24, + "learning_rate": 1.5233194827385342e-07, + "loss": 0.0021, + "step": 12325 + }, + { + "epoch": 0.24, + "learning_rate": 1.5232806492951729e-07, + "loss": 0.0017, + "step": 12326 + }, + { + "epoch": 0.24, + "learning_rate": 1.5232418158518113e-07, + "loss": 0.0028, + "step": 12327 + }, + { + "epoch": 0.24, + "learning_rate": 1.52320298240845e-07, + "loss": 0.0018, + "step": 12328 + }, + { + "epoch": 0.24, + "learning_rate": 1.5231641489650885e-07, + "loss": 0.0561, + "step": 12329 + }, + { + "epoch": 0.24, + "learning_rate": 1.5231253155217272e-07, + "loss": 0.0019, + "step": 12330 + }, + { + "epoch": 0.24, + "learning_rate": 1.5230864820783656e-07, + "loss": 0.0017, + "step": 12331 + }, + { + "epoch": 0.24, + "learning_rate": 1.5230476486350044e-07, + "loss": 0.0017, + "step": 12332 + }, + { + "epoch": 0.24, + "learning_rate": 1.5230088151916428e-07, + "loss": 0.0027, + "step": 12333 + }, + { + "epoch": 0.24, + "learning_rate": 1.5229699817482815e-07, + "loss": 0.0012, + "step": 12334 + }, + { + "epoch": 0.24, + "learning_rate": 1.52293114830492e-07, + "loss": 0.0094, + "step": 12335 + }, + { + "epoch": 0.24, + "learning_rate": 1.5228923148615587e-07, + "loss": 0.0018, + "step": 12336 + }, + { + "epoch": 0.24, + "learning_rate": 1.5228534814181971e-07, + "loss": 0.0043, + "step": 12337 + }, + { + "epoch": 0.24, + "learning_rate": 1.5228146479748359e-07, + "loss": 0.0055, + "step": 12338 + }, + { + "epoch": 0.24, + "learning_rate": 1.5227758145314743e-07, + "loss": 0.0528, + "step": 12339 + }, + { + "epoch": 0.24, + "learning_rate": 1.522736981088113e-07, + "loss": 0.0088, + "step": 12340 + }, + { + "epoch": 0.24, + "learning_rate": 1.5226981476447515e-07, + "loss": 0.0015, + "step": 12341 + }, + { + "epoch": 0.24, + "learning_rate": 1.5226593142013902e-07, + "loss": 0.0024, + "step": 12342 + }, + { + "epoch": 0.24, + "learning_rate": 1.5226204807580286e-07, + "loss": 0.0136, + "step": 12343 + }, + { + "epoch": 0.24, + "learning_rate": 1.5225816473146674e-07, + "loss": 0.002, + "step": 12344 + }, + { + "epoch": 0.24, + "learning_rate": 1.5225428138713058e-07, + "loss": 0.002, + "step": 12345 + }, + { + "epoch": 0.24, + "learning_rate": 1.5225039804279445e-07, + "loss": 0.0033, + "step": 12346 + }, + { + "epoch": 0.24, + "learning_rate": 1.522465146984583e-07, + "loss": 0.0016, + "step": 12347 + }, + { + "epoch": 0.24, + "learning_rate": 1.5224263135412217e-07, + "loss": 0.89, + "step": 12348 + }, + { + "epoch": 0.24, + "learning_rate": 1.52238748009786e-07, + "loss": 0.0059, + "step": 12349 + }, + { + "epoch": 0.24, + "learning_rate": 1.5223486466544988e-07, + "loss": 0.0019, + "step": 12350 + }, + { + "epoch": 0.24, + "learning_rate": 1.5223098132111373e-07, + "loss": 0.0019, + "step": 12351 + }, + { + "epoch": 0.24, + "learning_rate": 1.522270979767776e-07, + "loss": 0.0018, + "step": 12352 + }, + { + "epoch": 0.24, + "learning_rate": 1.5222321463244145e-07, + "loss": 0.0025, + "step": 12353 + }, + { + "epoch": 0.24, + "learning_rate": 1.5221933128810532e-07, + "loss": 0.519, + "step": 12354 + }, + { + "epoch": 0.24, + "learning_rate": 1.5221544794376916e-07, + "loss": 0.0023, + "step": 12355 + }, + { + "epoch": 0.24, + "learning_rate": 1.5221156459943303e-07, + "loss": 0.0025, + "step": 12356 + }, + { + "epoch": 0.24, + "learning_rate": 1.5220768125509688e-07, + "loss": 0.0026, + "step": 12357 + }, + { + "epoch": 0.24, + "learning_rate": 1.5220379791076075e-07, + "loss": 0.0019, + "step": 12358 + }, + { + "epoch": 0.24, + "learning_rate": 1.521999145664246e-07, + "loss": 0.0123, + "step": 12359 + }, + { + "epoch": 0.24, + "learning_rate": 1.5219603122208847e-07, + "loss": 0.0021, + "step": 12360 + }, + { + "epoch": 0.24, + "learning_rate": 1.521921478777523e-07, + "loss": 0.002, + "step": 12361 + }, + { + "epoch": 0.24, + "learning_rate": 1.5218826453341618e-07, + "loss": 0.8886, + "step": 12362 + }, + { + "epoch": 0.24, + "learning_rate": 1.5218438118908003e-07, + "loss": 0.0025, + "step": 12363 + }, + { + "epoch": 0.24, + "learning_rate": 1.521804978447439e-07, + "loss": 0.0016, + "step": 12364 + }, + { + "epoch": 0.24, + "learning_rate": 1.5217661450040775e-07, + "loss": 0.0018, + "step": 12365 + }, + { + "epoch": 0.24, + "learning_rate": 1.5217273115607162e-07, + "loss": 0.003, + "step": 12366 + }, + { + "epoch": 0.24, + "learning_rate": 1.5216884781173546e-07, + "loss": 0.2499, + "step": 12367 + }, + { + "epoch": 0.24, + "learning_rate": 1.5216496446739933e-07, + "loss": 0.0019, + "step": 12368 + }, + { + "epoch": 0.24, + "learning_rate": 1.5216108112306318e-07, + "loss": 0.0017, + "step": 12369 + }, + { + "epoch": 0.24, + "learning_rate": 1.5215719777872705e-07, + "loss": 0.0015, + "step": 12370 + }, + { + "epoch": 0.24, + "learning_rate": 1.521533144343909e-07, + "loss": 0.0026, + "step": 12371 + }, + { + "epoch": 0.24, + "learning_rate": 1.5214943109005477e-07, + "loss": 0.2427, + "step": 12372 + }, + { + "epoch": 0.24, + "learning_rate": 1.521455477457186e-07, + "loss": 0.0026, + "step": 12373 + }, + { + "epoch": 0.24, + "learning_rate": 1.5214166440138248e-07, + "loss": 0.0017, + "step": 12374 + }, + { + "epoch": 0.24, + "learning_rate": 1.521377810570463e-07, + "loss": 0.0016, + "step": 12375 + }, + { + "epoch": 0.24, + "learning_rate": 1.5213389771271017e-07, + "loss": 0.0015, + "step": 12376 + }, + { + "epoch": 0.24, + "learning_rate": 1.5213001436837402e-07, + "loss": 0.002, + "step": 12377 + }, + { + "epoch": 0.24, + "learning_rate": 1.521261310240379e-07, + "loss": 0.0015, + "step": 12378 + }, + { + "epoch": 0.24, + "learning_rate": 1.5212224767970173e-07, + "loss": 0.0017, + "step": 12379 + }, + { + "epoch": 0.24, + "learning_rate": 1.521183643353656e-07, + "loss": 0.0016, + "step": 12380 + }, + { + "epoch": 0.24, + "learning_rate": 1.5211448099102945e-07, + "loss": 0.0964, + "step": 12381 + }, + { + "epoch": 0.24, + "learning_rate": 1.5211059764669332e-07, + "loss": 0.0731, + "step": 12382 + }, + { + "epoch": 0.24, + "learning_rate": 1.5210671430235717e-07, + "loss": 0.0018, + "step": 12383 + }, + { + "epoch": 0.24, + "learning_rate": 1.5210283095802104e-07, + "loss": 0.7719, + "step": 12384 + }, + { + "epoch": 0.24, + "learning_rate": 1.5209894761368488e-07, + "loss": 0.0023, + "step": 12385 + }, + { + "epoch": 0.24, + "learning_rate": 1.5209506426934875e-07, + "loss": 0.002, + "step": 12386 + }, + { + "epoch": 0.24, + "learning_rate": 1.520911809250126e-07, + "loss": 0.6373, + "step": 12387 + }, + { + "epoch": 0.24, + "learning_rate": 1.5208729758067647e-07, + "loss": 0.0157, + "step": 12388 + }, + { + "epoch": 0.24, + "learning_rate": 1.5208341423634032e-07, + "loss": 0.0147, + "step": 12389 + }, + { + "epoch": 0.24, + "learning_rate": 1.520795308920042e-07, + "loss": 0.0015, + "step": 12390 + }, + { + "epoch": 0.24, + "learning_rate": 1.5207564754766803e-07, + "loss": 0.0015, + "step": 12391 + }, + { + "epoch": 0.24, + "learning_rate": 1.520717642033319e-07, + "loss": 0.0015, + "step": 12392 + }, + { + "epoch": 0.24, + "learning_rate": 1.5206788085899575e-07, + "loss": 0.4829, + "step": 12393 + }, + { + "epoch": 0.24, + "learning_rate": 1.5206399751465962e-07, + "loss": 0.0026, + "step": 12394 + }, + { + "epoch": 0.24, + "learning_rate": 1.5206011417032347e-07, + "loss": 0.0037, + "step": 12395 + }, + { + "epoch": 0.24, + "learning_rate": 1.5205623082598734e-07, + "loss": 0.0104, + "step": 12396 + }, + { + "epoch": 0.24, + "learning_rate": 1.5205234748165118e-07, + "loss": 0.0213, + "step": 12397 + }, + { + "epoch": 0.24, + "learning_rate": 1.5204846413731505e-07, + "loss": 0.0021, + "step": 12398 + }, + { + "epoch": 0.24, + "learning_rate": 1.520445807929789e-07, + "loss": 0.0023, + "step": 12399 + }, + { + "epoch": 0.24, + "learning_rate": 1.5204069744864277e-07, + "loss": 0.7459, + "step": 12400 + }, + { + "epoch": 0.24, + "learning_rate": 1.5203681410430662e-07, + "loss": 0.457, + "step": 12401 + }, + { + "epoch": 0.24, + "learning_rate": 1.520329307599705e-07, + "loss": 0.0019, + "step": 12402 + }, + { + "epoch": 0.24, + "learning_rate": 1.5202904741563433e-07, + "loss": 0.0019, + "step": 12403 + }, + { + "epoch": 0.24, + "learning_rate": 1.520251640712982e-07, + "loss": 0.0019, + "step": 12404 + }, + { + "epoch": 0.24, + "learning_rate": 1.5202128072696205e-07, + "loss": 0.0021, + "step": 12405 + }, + { + "epoch": 0.24, + "learning_rate": 1.5201739738262592e-07, + "loss": 0.0029, + "step": 12406 + }, + { + "epoch": 0.24, + "learning_rate": 1.5201351403828976e-07, + "loss": 0.0015, + "step": 12407 + }, + { + "epoch": 0.24, + "learning_rate": 1.5200963069395364e-07, + "loss": 0.0999, + "step": 12408 + }, + { + "epoch": 0.24, + "learning_rate": 1.5200574734961748e-07, + "loss": 0.0019, + "step": 12409 + }, + { + "epoch": 0.24, + "learning_rate": 1.5200186400528135e-07, + "loss": 0.0016, + "step": 12410 + }, + { + "epoch": 0.24, + "learning_rate": 1.519979806609452e-07, + "loss": 0.0016, + "step": 12411 + }, + { + "epoch": 0.24, + "learning_rate": 1.5199409731660907e-07, + "loss": 0.0048, + "step": 12412 + }, + { + "epoch": 0.24, + "learning_rate": 1.5199021397227291e-07, + "loss": 0.002, + "step": 12413 + }, + { + "epoch": 0.24, + "learning_rate": 1.5198633062793679e-07, + "loss": 0.0022, + "step": 12414 + }, + { + "epoch": 0.24, + "learning_rate": 1.5198244728360063e-07, + "loss": 0.4403, + "step": 12415 + }, + { + "epoch": 0.24, + "learning_rate": 1.519785639392645e-07, + "loss": 0.0017, + "step": 12416 + }, + { + "epoch": 0.24, + "learning_rate": 1.5197468059492835e-07, + "loss": 0.0015, + "step": 12417 + }, + { + "epoch": 0.24, + "learning_rate": 1.5197079725059222e-07, + "loss": 0.0019, + "step": 12418 + }, + { + "epoch": 0.24, + "learning_rate": 1.5196691390625606e-07, + "loss": 0.0043, + "step": 12419 + }, + { + "epoch": 0.24, + "learning_rate": 1.5196303056191994e-07, + "loss": 0.3887, + "step": 12420 + }, + { + "epoch": 0.24, + "learning_rate": 1.5195914721758378e-07, + "loss": 0.0017, + "step": 12421 + }, + { + "epoch": 0.24, + "learning_rate": 1.5195526387324765e-07, + "loss": 0.0017, + "step": 12422 + }, + { + "epoch": 0.24, + "learning_rate": 1.519513805289115e-07, + "loss": 0.0179, + "step": 12423 + }, + { + "epoch": 0.24, + "learning_rate": 1.5194749718457537e-07, + "loss": 0.0276, + "step": 12424 + }, + { + "epoch": 0.24, + "learning_rate": 1.5194361384023921e-07, + "loss": 0.0014, + "step": 12425 + }, + { + "epoch": 0.24, + "learning_rate": 1.5193973049590308e-07, + "loss": 0.0014, + "step": 12426 + }, + { + "epoch": 0.24, + "learning_rate": 1.5193584715156693e-07, + "loss": 0.0017, + "step": 12427 + }, + { + "epoch": 0.24, + "learning_rate": 1.519319638072308e-07, + "loss": 0.0016, + "step": 12428 + }, + { + "epoch": 0.24, + "learning_rate": 1.5192808046289465e-07, + "loss": 0.0021, + "step": 12429 + }, + { + "epoch": 0.24, + "learning_rate": 1.5192419711855852e-07, + "loss": 0.0015, + "step": 12430 + }, + { + "epoch": 0.24, + "learning_rate": 1.5192031377422236e-07, + "loss": 0.0017, + "step": 12431 + }, + { + "epoch": 0.24, + "learning_rate": 1.5191643042988623e-07, + "loss": 0.0294, + "step": 12432 + }, + { + "epoch": 0.24, + "learning_rate": 1.5191254708555005e-07, + "loss": 0.9435, + "step": 12433 + }, + { + "epoch": 0.24, + "learning_rate": 1.5190866374121392e-07, + "loss": 0.0021, + "step": 12434 + }, + { + "epoch": 0.24, + "learning_rate": 1.5190478039687777e-07, + "loss": 0.0015, + "step": 12435 + }, + { + "epoch": 0.24, + "learning_rate": 1.5190089705254164e-07, + "loss": 0.0028, + "step": 12436 + }, + { + "epoch": 0.24, + "learning_rate": 1.5189701370820549e-07, + "loss": 1.0754, + "step": 12437 + }, + { + "epoch": 0.24, + "learning_rate": 1.5189313036386936e-07, + "loss": 0.2223, + "step": 12438 + }, + { + "epoch": 0.24, + "learning_rate": 1.518892470195332e-07, + "loss": 0.0017, + "step": 12439 + }, + { + "epoch": 0.24, + "learning_rate": 1.5188536367519707e-07, + "loss": 0.0037, + "step": 12440 + }, + { + "epoch": 0.24, + "learning_rate": 1.5188148033086092e-07, + "loss": 0.0061, + "step": 12441 + }, + { + "epoch": 0.24, + "learning_rate": 1.518775969865248e-07, + "loss": 0.232, + "step": 12442 + }, + { + "epoch": 0.24, + "learning_rate": 1.5187371364218864e-07, + "loss": 0.0052, + "step": 12443 + }, + { + "epoch": 0.24, + "learning_rate": 1.518698302978525e-07, + "loss": 0.0036, + "step": 12444 + }, + { + "epoch": 0.24, + "learning_rate": 1.5186594695351635e-07, + "loss": 0.0021, + "step": 12445 + }, + { + "epoch": 0.24, + "learning_rate": 1.5186206360918022e-07, + "loss": 0.0056, + "step": 12446 + }, + { + "epoch": 0.24, + "learning_rate": 1.5185818026484407e-07, + "loss": 1.0394, + "step": 12447 + }, + { + "epoch": 0.24, + "learning_rate": 1.5185429692050794e-07, + "loss": 0.003, + "step": 12448 + }, + { + "epoch": 0.24, + "learning_rate": 1.5185041357617178e-07, + "loss": 0.0018, + "step": 12449 + }, + { + "epoch": 0.24, + "learning_rate": 1.5184653023183566e-07, + "loss": 0.0038, + "step": 12450 + }, + { + "epoch": 0.24, + "learning_rate": 1.518426468874995e-07, + "loss": 0.002, + "step": 12451 + }, + { + "epoch": 0.24, + "learning_rate": 1.5183876354316337e-07, + "loss": 0.0016, + "step": 12452 + }, + { + "epoch": 0.24, + "learning_rate": 1.5183488019882722e-07, + "loss": 0.0019, + "step": 12453 + }, + { + "epoch": 0.24, + "learning_rate": 1.518309968544911e-07, + "loss": 0.0044, + "step": 12454 + }, + { + "epoch": 0.24, + "learning_rate": 1.5182711351015493e-07, + "loss": 0.0017, + "step": 12455 + }, + { + "epoch": 0.24, + "learning_rate": 1.518232301658188e-07, + "loss": 0.0378, + "step": 12456 + }, + { + "epoch": 0.24, + "learning_rate": 1.5181934682148265e-07, + "loss": 0.0226, + "step": 12457 + }, + { + "epoch": 0.24, + "learning_rate": 1.5181546347714652e-07, + "loss": 0.0016, + "step": 12458 + }, + { + "epoch": 0.24, + "learning_rate": 1.5181158013281037e-07, + "loss": 0.004, + "step": 12459 + }, + { + "epoch": 0.24, + "learning_rate": 1.5180769678847424e-07, + "loss": 0.0014, + "step": 12460 + }, + { + "epoch": 0.24, + "learning_rate": 1.5180381344413808e-07, + "loss": 0.0017, + "step": 12461 + }, + { + "epoch": 0.24, + "learning_rate": 1.5179993009980196e-07, + "loss": 0.0037, + "step": 12462 + }, + { + "epoch": 0.24, + "learning_rate": 1.517960467554658e-07, + "loss": 0.0014, + "step": 12463 + }, + { + "epoch": 0.24, + "learning_rate": 1.5179216341112967e-07, + "loss": 0.7932, + "step": 12464 + }, + { + "epoch": 0.24, + "learning_rate": 1.5178828006679352e-07, + "loss": 0.0232, + "step": 12465 + }, + { + "epoch": 0.24, + "learning_rate": 1.517843967224574e-07, + "loss": 1.1545, + "step": 12466 + }, + { + "epoch": 0.24, + "learning_rate": 1.5178051337812123e-07, + "loss": 0.0015, + "step": 12467 + }, + { + "epoch": 0.24, + "learning_rate": 1.517766300337851e-07, + "loss": 0.0019, + "step": 12468 + }, + { + "epoch": 0.24, + "learning_rate": 1.5177274668944895e-07, + "loss": 0.0025, + "step": 12469 + }, + { + "epoch": 0.24, + "learning_rate": 1.517688633451128e-07, + "loss": 0.0026, + "step": 12470 + }, + { + "epoch": 0.24, + "learning_rate": 1.5176498000077667e-07, + "loss": 0.0053, + "step": 12471 + }, + { + "epoch": 0.24, + "learning_rate": 1.517610966564405e-07, + "loss": 0.5825, + "step": 12472 + }, + { + "epoch": 0.24, + "learning_rate": 1.5175721331210438e-07, + "loss": 0.0048, + "step": 12473 + }, + { + "epoch": 0.24, + "learning_rate": 1.5175332996776823e-07, + "loss": 0.0015, + "step": 12474 + }, + { + "epoch": 0.24, + "learning_rate": 1.517494466234321e-07, + "loss": 0.0018, + "step": 12475 + }, + { + "epoch": 0.24, + "learning_rate": 1.5174556327909594e-07, + "loss": 0.9735, + "step": 12476 + }, + { + "epoch": 0.24, + "learning_rate": 1.5174167993475982e-07, + "loss": 0.0019, + "step": 12477 + }, + { + "epoch": 0.24, + "learning_rate": 1.5173779659042366e-07, + "loss": 0.4044, + "step": 12478 + }, + { + "epoch": 0.24, + "learning_rate": 1.5173391324608753e-07, + "loss": 0.0022, + "step": 12479 + }, + { + "epoch": 0.24, + "learning_rate": 1.5173002990175138e-07, + "loss": 0.0058, + "step": 12480 + }, + { + "epoch": 0.24, + "learning_rate": 1.5172614655741525e-07, + "loss": 0.0025, + "step": 12481 + }, + { + "epoch": 0.24, + "learning_rate": 1.517222632130791e-07, + "loss": 0.0017, + "step": 12482 + }, + { + "epoch": 0.24, + "learning_rate": 1.5171837986874296e-07, + "loss": 0.002, + "step": 12483 + }, + { + "epoch": 0.24, + "learning_rate": 1.517144965244068e-07, + "loss": 0.0025, + "step": 12484 + }, + { + "epoch": 0.24, + "learning_rate": 1.5171061318007068e-07, + "loss": 0.0637, + "step": 12485 + }, + { + "epoch": 0.24, + "learning_rate": 1.5170672983573453e-07, + "loss": 0.0037, + "step": 12486 + }, + { + "epoch": 0.24, + "learning_rate": 1.517028464913984e-07, + "loss": 0.0043, + "step": 12487 + }, + { + "epoch": 0.24, + "learning_rate": 1.5169896314706224e-07, + "loss": 0.0014, + "step": 12488 + }, + { + "epoch": 0.24, + "learning_rate": 1.5169507980272611e-07, + "loss": 0.0015, + "step": 12489 + }, + { + "epoch": 0.24, + "learning_rate": 1.5169119645838996e-07, + "loss": 0.0016, + "step": 12490 + }, + { + "epoch": 0.24, + "learning_rate": 1.516873131140538e-07, + "loss": 0.0018, + "step": 12491 + }, + { + "epoch": 0.24, + "learning_rate": 1.5168342976971768e-07, + "loss": 0.0015, + "step": 12492 + }, + { + "epoch": 0.24, + "learning_rate": 1.5167954642538152e-07, + "loss": 0.0019, + "step": 12493 + }, + { + "epoch": 0.24, + "learning_rate": 1.516756630810454e-07, + "loss": 0.0047, + "step": 12494 + }, + { + "epoch": 0.24, + "learning_rate": 1.5167177973670924e-07, + "loss": 0.0023, + "step": 12495 + }, + { + "epoch": 0.24, + "learning_rate": 1.516678963923731e-07, + "loss": 0.0018, + "step": 12496 + }, + { + "epoch": 0.24, + "learning_rate": 1.5166401304803695e-07, + "loss": 0.0018, + "step": 12497 + }, + { + "epoch": 0.24, + "learning_rate": 1.516601297037008e-07, + "loss": 0.0018, + "step": 12498 + }, + { + "epoch": 0.24, + "learning_rate": 1.5165624635936467e-07, + "loss": 0.0015, + "step": 12499 + }, + { + "epoch": 0.24, + "learning_rate": 1.5165236301502852e-07, + "loss": 0.0048, + "step": 12500 + }, + { + "epoch": 0.24, + "learning_rate": 1.516484796706924e-07, + "loss": 0.0073, + "step": 12501 + }, + { + "epoch": 0.24, + "learning_rate": 1.5164459632635623e-07, + "loss": 0.0019, + "step": 12502 + }, + { + "epoch": 0.24, + "learning_rate": 1.516407129820201e-07, + "loss": 0.0023, + "step": 12503 + }, + { + "epoch": 0.24, + "learning_rate": 1.5163682963768395e-07, + "loss": 0.012, + "step": 12504 + }, + { + "epoch": 0.24, + "learning_rate": 1.5163294629334782e-07, + "loss": 0.0018, + "step": 12505 + }, + { + "epoch": 0.24, + "learning_rate": 1.5162906294901166e-07, + "loss": 0.0024, + "step": 12506 + }, + { + "epoch": 0.24, + "learning_rate": 1.5162517960467554e-07, + "loss": 1.2087, + "step": 12507 + }, + { + "epoch": 0.24, + "learning_rate": 1.5162129626033938e-07, + "loss": 0.2961, + "step": 12508 + }, + { + "epoch": 0.24, + "learning_rate": 1.5161741291600325e-07, + "loss": 0.0018, + "step": 12509 + }, + { + "epoch": 0.24, + "learning_rate": 1.516135295716671e-07, + "loss": 0.0214, + "step": 12510 + }, + { + "epoch": 0.24, + "learning_rate": 1.5160964622733097e-07, + "loss": 0.0027, + "step": 12511 + }, + { + "epoch": 0.24, + "learning_rate": 1.5160576288299481e-07, + "loss": 0.0022, + "step": 12512 + }, + { + "epoch": 0.24, + "learning_rate": 1.5160187953865869e-07, + "loss": 0.0024, + "step": 12513 + }, + { + "epoch": 0.24, + "learning_rate": 1.5159799619432253e-07, + "loss": 0.3913, + "step": 12514 + }, + { + "epoch": 0.24, + "learning_rate": 1.515941128499864e-07, + "loss": 0.0023, + "step": 12515 + }, + { + "epoch": 0.24, + "learning_rate": 1.5159022950565025e-07, + "loss": 0.0023, + "step": 12516 + }, + { + "epoch": 0.24, + "learning_rate": 1.5158634616131412e-07, + "loss": 0.012, + "step": 12517 + }, + { + "epoch": 0.24, + "learning_rate": 1.5158246281697796e-07, + "loss": 0.0026, + "step": 12518 + }, + { + "epoch": 0.24, + "learning_rate": 1.5157857947264184e-07, + "loss": 0.0043, + "step": 12519 + }, + { + "epoch": 0.24, + "learning_rate": 1.5157469612830568e-07, + "loss": 0.0018, + "step": 12520 + }, + { + "epoch": 0.24, + "learning_rate": 1.5157081278396955e-07, + "loss": 0.0018, + "step": 12521 + }, + { + "epoch": 0.24, + "learning_rate": 1.515669294396334e-07, + "loss": 0.003, + "step": 12522 + }, + { + "epoch": 0.24, + "learning_rate": 1.5156304609529727e-07, + "loss": 0.0021, + "step": 12523 + }, + { + "epoch": 0.24, + "learning_rate": 1.5155916275096111e-07, + "loss": 0.5149, + "step": 12524 + }, + { + "epoch": 0.24, + "learning_rate": 1.5155527940662498e-07, + "loss": 0.0018, + "step": 12525 + }, + { + "epoch": 0.24, + "learning_rate": 1.5155139606228883e-07, + "loss": 0.0018, + "step": 12526 + }, + { + "epoch": 0.24, + "learning_rate": 1.515475127179527e-07, + "loss": 0.0025, + "step": 12527 + }, + { + "epoch": 0.24, + "learning_rate": 1.5154362937361655e-07, + "loss": 0.0024, + "step": 12528 + }, + { + "epoch": 0.24, + "learning_rate": 1.5153974602928042e-07, + "loss": 0.0015, + "step": 12529 + }, + { + "epoch": 0.24, + "learning_rate": 1.5153586268494426e-07, + "loss": 0.1814, + "step": 12530 + }, + { + "epoch": 0.24, + "learning_rate": 1.5153197934060813e-07, + "loss": 0.0329, + "step": 12531 + }, + { + "epoch": 0.24, + "learning_rate": 1.5152809599627198e-07, + "loss": 0.1476, + "step": 12532 + }, + { + "epoch": 0.24, + "learning_rate": 1.5152421265193585e-07, + "loss": 0.004, + "step": 12533 + }, + { + "epoch": 0.24, + "learning_rate": 1.515203293075997e-07, + "loss": 0.0097, + "step": 12534 + }, + { + "epoch": 0.24, + "learning_rate": 1.5151644596326357e-07, + "loss": 0.0032, + "step": 12535 + }, + { + "epoch": 0.24, + "learning_rate": 1.515125626189274e-07, + "loss": 0.0027, + "step": 12536 + }, + { + "epoch": 0.24, + "learning_rate": 1.5150867927459128e-07, + "loss": 0.0016, + "step": 12537 + }, + { + "epoch": 0.24, + "learning_rate": 1.5150479593025513e-07, + "loss": 0.0014, + "step": 12538 + }, + { + "epoch": 0.24, + "learning_rate": 1.51500912585919e-07, + "loss": 0.0016, + "step": 12539 + }, + { + "epoch": 0.24, + "learning_rate": 1.5149702924158285e-07, + "loss": 0.0022, + "step": 12540 + }, + { + "epoch": 0.24, + "learning_rate": 1.5149314589724672e-07, + "loss": 0.0015, + "step": 12541 + }, + { + "epoch": 0.24, + "learning_rate": 1.5148926255291056e-07, + "loss": 0.0017, + "step": 12542 + }, + { + "epoch": 0.24, + "learning_rate": 1.5148537920857443e-07, + "loss": 0.0015, + "step": 12543 + }, + { + "epoch": 0.24, + "learning_rate": 1.5148149586423828e-07, + "loss": 0.36, + "step": 12544 + }, + { + "epoch": 0.24, + "learning_rate": 1.5147761251990215e-07, + "loss": 0.002, + "step": 12545 + }, + { + "epoch": 0.24, + "learning_rate": 1.51473729175566e-07, + "loss": 0.0504, + "step": 12546 + }, + { + "epoch": 0.24, + "learning_rate": 1.5146984583122987e-07, + "loss": 0.0017, + "step": 12547 + }, + { + "epoch": 0.24, + "learning_rate": 1.514659624868937e-07, + "loss": 0.0015, + "step": 12548 + }, + { + "epoch": 0.24, + "learning_rate": 1.5146207914255756e-07, + "loss": 0.0027, + "step": 12549 + }, + { + "epoch": 0.24, + "learning_rate": 1.514581957982214e-07, + "loss": 0.0133, + "step": 12550 + }, + { + "epoch": 0.24, + "learning_rate": 1.5145431245388527e-07, + "loss": 0.0057, + "step": 12551 + }, + { + "epoch": 0.24, + "learning_rate": 1.5145042910954912e-07, + "loss": 0.0025, + "step": 12552 + }, + { + "epoch": 0.24, + "learning_rate": 1.51446545765213e-07, + "loss": 0.0026, + "step": 12553 + }, + { + "epoch": 0.24, + "learning_rate": 1.5144266242087683e-07, + "loss": 0.0028, + "step": 12554 + }, + { + "epoch": 0.24, + "learning_rate": 1.514387790765407e-07, + "loss": 0.6279, + "step": 12555 + }, + { + "epoch": 0.24, + "learning_rate": 1.5143489573220455e-07, + "loss": 0.0018, + "step": 12556 + }, + { + "epoch": 0.24, + "learning_rate": 1.5143101238786842e-07, + "loss": 0.0017, + "step": 12557 + }, + { + "epoch": 0.24, + "learning_rate": 1.5142712904353227e-07, + "loss": 0.0016, + "step": 12558 + }, + { + "epoch": 0.24, + "learning_rate": 1.5142324569919614e-07, + "loss": 0.674, + "step": 12559 + }, + { + "epoch": 0.24, + "learning_rate": 1.5141936235485998e-07, + "loss": 0.0149, + "step": 12560 + }, + { + "epoch": 0.24, + "learning_rate": 1.5141547901052386e-07, + "loss": 0.0033, + "step": 12561 + }, + { + "epoch": 0.24, + "learning_rate": 1.514115956661877e-07, + "loss": 0.0651, + "step": 12562 + }, + { + "epoch": 0.24, + "learning_rate": 1.5140771232185157e-07, + "loss": 0.002, + "step": 12563 + }, + { + "epoch": 0.24, + "learning_rate": 1.5140382897751542e-07, + "loss": 0.0027, + "step": 12564 + }, + { + "epoch": 0.24, + "learning_rate": 1.513999456331793e-07, + "loss": 0.4737, + "step": 12565 + }, + { + "epoch": 0.24, + "learning_rate": 1.5139606228884313e-07, + "loss": 0.0023, + "step": 12566 + }, + { + "epoch": 0.24, + "learning_rate": 1.51392178944507e-07, + "loss": 0.5567, + "step": 12567 + }, + { + "epoch": 0.24, + "learning_rate": 1.5138829560017085e-07, + "loss": 0.0527, + "step": 12568 + }, + { + "epoch": 0.24, + "learning_rate": 1.5138441225583472e-07, + "loss": 0.0069, + "step": 12569 + }, + { + "epoch": 0.24, + "learning_rate": 1.5138052891149857e-07, + "loss": 0.0044, + "step": 12570 + }, + { + "epoch": 0.24, + "learning_rate": 1.5137664556716244e-07, + "loss": 0.8261, + "step": 12571 + }, + { + "epoch": 0.24, + "learning_rate": 1.5137276222282628e-07, + "loss": 0.8274, + "step": 12572 + }, + { + "epoch": 0.24, + "learning_rate": 1.5136887887849015e-07, + "loss": 0.0019, + "step": 12573 + }, + { + "epoch": 0.24, + "learning_rate": 1.51364995534154e-07, + "loss": 0.0026, + "step": 12574 + }, + { + "epoch": 0.24, + "learning_rate": 1.5136111218981787e-07, + "loss": 0.0021, + "step": 12575 + }, + { + "epoch": 0.24, + "learning_rate": 1.5135722884548172e-07, + "loss": 0.0032, + "step": 12576 + }, + { + "epoch": 0.24, + "learning_rate": 1.513533455011456e-07, + "loss": 0.1028, + "step": 12577 + }, + { + "epoch": 0.24, + "learning_rate": 1.5134946215680943e-07, + "loss": 0.0015, + "step": 12578 + }, + { + "epoch": 0.24, + "learning_rate": 1.513455788124733e-07, + "loss": 0.0018, + "step": 12579 + }, + { + "epoch": 0.24, + "learning_rate": 1.5134169546813715e-07, + "loss": 0.0017, + "step": 12580 + }, + { + "epoch": 0.24, + "learning_rate": 1.5133781212380102e-07, + "loss": 0.4183, + "step": 12581 + }, + { + "epoch": 0.24, + "learning_rate": 1.5133392877946486e-07, + "loss": 0.0059, + "step": 12582 + }, + { + "epoch": 0.24, + "learning_rate": 1.5133004543512874e-07, + "loss": 0.6415, + "step": 12583 + }, + { + "epoch": 0.24, + "learning_rate": 1.5132616209079258e-07, + "loss": 0.004, + "step": 12584 + }, + { + "epoch": 0.24, + "learning_rate": 1.5132227874645645e-07, + "loss": 0.0018, + "step": 12585 + }, + { + "epoch": 0.24, + "learning_rate": 1.513183954021203e-07, + "loss": 0.0025, + "step": 12586 + }, + { + "epoch": 0.24, + "learning_rate": 1.5131451205778417e-07, + "loss": 0.0023, + "step": 12587 + }, + { + "epoch": 0.24, + "learning_rate": 1.5131062871344801e-07, + "loss": 0.0046, + "step": 12588 + }, + { + "epoch": 0.24, + "learning_rate": 1.5130674536911189e-07, + "loss": 0.1034, + "step": 12589 + }, + { + "epoch": 0.24, + "learning_rate": 1.5130286202477573e-07, + "loss": 0.0019, + "step": 12590 + }, + { + "epoch": 0.24, + "learning_rate": 1.512989786804396e-07, + "loss": 0.0528, + "step": 12591 + }, + { + "epoch": 0.24, + "learning_rate": 1.5129509533610345e-07, + "loss": 0.0018, + "step": 12592 + }, + { + "epoch": 0.24, + "learning_rate": 1.5129121199176732e-07, + "loss": 0.0019, + "step": 12593 + }, + { + "epoch": 0.24, + "learning_rate": 1.5128732864743116e-07, + "loss": 0.0017, + "step": 12594 + }, + { + "epoch": 0.24, + "learning_rate": 1.5128344530309504e-07, + "loss": 0.9385, + "step": 12595 + }, + { + "epoch": 0.24, + "learning_rate": 1.5127956195875888e-07, + "loss": 0.0016, + "step": 12596 + }, + { + "epoch": 0.24, + "learning_rate": 1.5127567861442275e-07, + "loss": 0.0635, + "step": 12597 + }, + { + "epoch": 0.24, + "learning_rate": 1.512717952700866e-07, + "loss": 0.0057, + "step": 12598 + }, + { + "epoch": 0.24, + "learning_rate": 1.5126791192575047e-07, + "loss": 0.0017, + "step": 12599 + }, + { + "epoch": 0.24, + "learning_rate": 1.5126402858141431e-07, + "loss": 0.0016, + "step": 12600 + }, + { + "epoch": 0.24, + "learning_rate": 1.5126014523707818e-07, + "loss": 0.0015, + "step": 12601 + }, + { + "epoch": 0.24, + "learning_rate": 1.5125626189274203e-07, + "loss": 0.0015, + "step": 12602 + }, + { + "epoch": 0.24, + "learning_rate": 1.512523785484059e-07, + "loss": 0.0026, + "step": 12603 + }, + { + "epoch": 0.24, + "learning_rate": 1.5124849520406975e-07, + "loss": 0.0022, + "step": 12604 + }, + { + "epoch": 0.24, + "learning_rate": 1.5124461185973362e-07, + "loss": 1.1054, + "step": 12605 + }, + { + "epoch": 0.24, + "learning_rate": 1.5124072851539746e-07, + "loss": 0.0044, + "step": 12606 + }, + { + "epoch": 0.24, + "learning_rate": 1.512368451710613e-07, + "loss": 0.002, + "step": 12607 + }, + { + "epoch": 0.24, + "learning_rate": 1.5123296182672515e-07, + "loss": 0.005, + "step": 12608 + }, + { + "epoch": 0.24, + "learning_rate": 1.5122907848238902e-07, + "loss": 0.0016, + "step": 12609 + }, + { + "epoch": 0.24, + "learning_rate": 1.5122519513805287e-07, + "loss": 0.0019, + "step": 12610 + }, + { + "epoch": 0.24, + "learning_rate": 1.5122131179371674e-07, + "loss": 0.0025, + "step": 12611 + }, + { + "epoch": 0.24, + "learning_rate": 1.5121742844938059e-07, + "loss": 0.0752, + "step": 12612 + }, + { + "epoch": 0.24, + "learning_rate": 1.5121354510504446e-07, + "loss": 0.0013, + "step": 12613 + }, + { + "epoch": 0.24, + "learning_rate": 1.512096617607083e-07, + "loss": 0.0016, + "step": 12614 + }, + { + "epoch": 0.24, + "learning_rate": 1.5120577841637217e-07, + "loss": 0.0017, + "step": 12615 + }, + { + "epoch": 0.24, + "learning_rate": 1.5120189507203602e-07, + "loss": 0.0021, + "step": 12616 + }, + { + "epoch": 0.24, + "learning_rate": 1.511980117276999e-07, + "loss": 0.0018, + "step": 12617 + }, + { + "epoch": 0.24, + "learning_rate": 1.5119412838336374e-07, + "loss": 0.0019, + "step": 12618 + }, + { + "epoch": 0.24, + "learning_rate": 1.511902450390276e-07, + "loss": 0.0026, + "step": 12619 + }, + { + "epoch": 0.24, + "learning_rate": 1.5118636169469145e-07, + "loss": 0.0014, + "step": 12620 + }, + { + "epoch": 0.24, + "learning_rate": 1.5118247835035532e-07, + "loss": 0.0014, + "step": 12621 + }, + { + "epoch": 0.24, + "learning_rate": 1.5117859500601917e-07, + "loss": 0.0751, + "step": 12622 + }, + { + "epoch": 0.24, + "learning_rate": 1.5117471166168304e-07, + "loss": 0.0018, + "step": 12623 + }, + { + "epoch": 0.24, + "learning_rate": 1.5117082831734688e-07, + "loss": 0.0048, + "step": 12624 + }, + { + "epoch": 0.24, + "learning_rate": 1.5116694497301076e-07, + "loss": 0.0021, + "step": 12625 + }, + { + "epoch": 0.24, + "learning_rate": 1.511630616286746e-07, + "loss": 0.0015, + "step": 12626 + }, + { + "epoch": 0.24, + "learning_rate": 1.5115917828433847e-07, + "loss": 0.0015, + "step": 12627 + }, + { + "epoch": 0.24, + "learning_rate": 1.5115529494000232e-07, + "loss": 0.0019, + "step": 12628 + }, + { + "epoch": 0.24, + "learning_rate": 1.511514115956662e-07, + "loss": 0.0016, + "step": 12629 + }, + { + "epoch": 0.24, + "learning_rate": 1.5114752825133003e-07, + "loss": 0.0016, + "step": 12630 + }, + { + "epoch": 0.25, + "learning_rate": 1.511436449069939e-07, + "loss": 0.0029, + "step": 12631 + }, + { + "epoch": 0.25, + "learning_rate": 1.5113976156265775e-07, + "loss": 0.0018, + "step": 12632 + }, + { + "epoch": 0.25, + "learning_rate": 1.5113587821832162e-07, + "loss": 0.0023, + "step": 12633 + }, + { + "epoch": 0.25, + "learning_rate": 1.5113199487398547e-07, + "loss": 0.0029, + "step": 12634 + }, + { + "epoch": 0.25, + "learning_rate": 1.5112811152964934e-07, + "loss": 0.0019, + "step": 12635 + }, + { + "epoch": 0.25, + "learning_rate": 1.5112422818531318e-07, + "loss": 0.0042, + "step": 12636 + }, + { + "epoch": 0.25, + "learning_rate": 1.5112034484097706e-07, + "loss": 0.004, + "step": 12637 + }, + { + "epoch": 0.25, + "learning_rate": 1.511164614966409e-07, + "loss": 0.0017, + "step": 12638 + }, + { + "epoch": 0.25, + "learning_rate": 1.5111257815230477e-07, + "loss": 0.0016, + "step": 12639 + }, + { + "epoch": 0.25, + "learning_rate": 1.5110869480796862e-07, + "loss": 0.0017, + "step": 12640 + }, + { + "epoch": 0.25, + "learning_rate": 1.511048114636325e-07, + "loss": 0.0017, + "step": 12641 + }, + { + "epoch": 0.25, + "learning_rate": 1.5110092811929633e-07, + "loss": 0.0022, + "step": 12642 + }, + { + "epoch": 0.25, + "learning_rate": 1.510970447749602e-07, + "loss": 0.2037, + "step": 12643 + }, + { + "epoch": 0.25, + "learning_rate": 1.5109316143062405e-07, + "loss": 0.0166, + "step": 12644 + }, + { + "epoch": 0.25, + "learning_rate": 1.5108927808628792e-07, + "loss": 0.0015, + "step": 12645 + }, + { + "epoch": 0.25, + "learning_rate": 1.5108539474195177e-07, + "loss": 0.0016, + "step": 12646 + }, + { + "epoch": 0.25, + "learning_rate": 1.510815113976156e-07, + "loss": 0.0013, + "step": 12647 + }, + { + "epoch": 0.25, + "learning_rate": 1.5107762805327948e-07, + "loss": 0.0152, + "step": 12648 + }, + { + "epoch": 0.25, + "learning_rate": 1.5107374470894333e-07, + "loss": 0.0044, + "step": 12649 + }, + { + "epoch": 0.25, + "learning_rate": 1.510698613646072e-07, + "loss": 0.0019, + "step": 12650 + }, + { + "epoch": 0.25, + "learning_rate": 1.5106597802027104e-07, + "loss": 0.0014, + "step": 12651 + }, + { + "epoch": 0.25, + "learning_rate": 1.5106209467593492e-07, + "loss": 0.0024, + "step": 12652 + }, + { + "epoch": 0.25, + "learning_rate": 1.5105821133159876e-07, + "loss": 0.0022, + "step": 12653 + }, + { + "epoch": 0.25, + "learning_rate": 1.5105432798726263e-07, + "loss": 0.0018, + "step": 12654 + }, + { + "epoch": 0.25, + "learning_rate": 1.5105044464292648e-07, + "loss": 0.0017, + "step": 12655 + }, + { + "epoch": 0.25, + "learning_rate": 1.5104656129859035e-07, + "loss": 0.0013, + "step": 12656 + }, + { + "epoch": 0.25, + "learning_rate": 1.510426779542542e-07, + "loss": 0.0038, + "step": 12657 + }, + { + "epoch": 0.25, + "learning_rate": 1.5103879460991807e-07, + "loss": 0.0489, + "step": 12658 + }, + { + "epoch": 0.25, + "learning_rate": 1.510349112655819e-07, + "loss": 0.0016, + "step": 12659 + }, + { + "epoch": 0.25, + "learning_rate": 1.5103102792124578e-07, + "loss": 0.0731, + "step": 12660 + }, + { + "epoch": 0.25, + "learning_rate": 1.5102714457690963e-07, + "loss": 0.0017, + "step": 12661 + }, + { + "epoch": 0.25, + "learning_rate": 1.510232612325735e-07, + "loss": 0.0017, + "step": 12662 + }, + { + "epoch": 0.25, + "learning_rate": 1.5101937788823734e-07, + "loss": 0.0016, + "step": 12663 + }, + { + "epoch": 0.25, + "learning_rate": 1.5101549454390121e-07, + "loss": 0.0035, + "step": 12664 + }, + { + "epoch": 0.25, + "learning_rate": 1.5101161119956506e-07, + "loss": 0.0021, + "step": 12665 + }, + { + "epoch": 0.25, + "learning_rate": 1.510077278552289e-07, + "loss": 0.0376, + "step": 12666 + }, + { + "epoch": 0.25, + "learning_rate": 1.5100384451089278e-07, + "loss": 0.0041, + "step": 12667 + }, + { + "epoch": 0.25, + "learning_rate": 1.5099996116655662e-07, + "loss": 0.0018, + "step": 12668 + }, + { + "epoch": 0.25, + "learning_rate": 1.509960778222205e-07, + "loss": 0.0035, + "step": 12669 + }, + { + "epoch": 0.25, + "learning_rate": 1.5099219447788434e-07, + "loss": 0.0019, + "step": 12670 + }, + { + "epoch": 0.25, + "learning_rate": 1.509883111335482e-07, + "loss": 0.0015, + "step": 12671 + }, + { + "epoch": 0.25, + "learning_rate": 1.5098442778921205e-07, + "loss": 0.0017, + "step": 12672 + }, + { + "epoch": 0.25, + "learning_rate": 1.5098054444487593e-07, + "loss": 0.0015, + "step": 12673 + }, + { + "epoch": 0.25, + "learning_rate": 1.5097666110053977e-07, + "loss": 0.0014, + "step": 12674 + }, + { + "epoch": 0.25, + "learning_rate": 1.5097277775620362e-07, + "loss": 0.0026, + "step": 12675 + }, + { + "epoch": 0.25, + "learning_rate": 1.509688944118675e-07, + "loss": 0.0019, + "step": 12676 + }, + { + "epoch": 0.25, + "learning_rate": 1.5096501106753133e-07, + "loss": 0.0022, + "step": 12677 + }, + { + "epoch": 0.25, + "learning_rate": 1.509611277231952e-07, + "loss": 0.0014, + "step": 12678 + }, + { + "epoch": 0.25, + "learning_rate": 1.5095724437885905e-07, + "loss": 0.008, + "step": 12679 + }, + { + "epoch": 0.25, + "learning_rate": 1.5095336103452292e-07, + "loss": 0.0021, + "step": 12680 + }, + { + "epoch": 0.25, + "learning_rate": 1.5094947769018676e-07, + "loss": 0.0265, + "step": 12681 + }, + { + "epoch": 0.25, + "learning_rate": 1.5094559434585064e-07, + "loss": 0.364, + "step": 12682 + }, + { + "epoch": 0.25, + "learning_rate": 1.5094171100151448e-07, + "loss": 0.1945, + "step": 12683 + }, + { + "epoch": 0.25, + "learning_rate": 1.5093782765717835e-07, + "loss": 0.0017, + "step": 12684 + }, + { + "epoch": 0.25, + "learning_rate": 1.509339443128422e-07, + "loss": 0.3344, + "step": 12685 + }, + { + "epoch": 0.25, + "learning_rate": 1.5093006096850607e-07, + "loss": 0.4533, + "step": 12686 + }, + { + "epoch": 0.25, + "learning_rate": 1.5092617762416991e-07, + "loss": 0.0034, + "step": 12687 + }, + { + "epoch": 0.25, + "learning_rate": 1.5092229427983379e-07, + "loss": 0.0016, + "step": 12688 + }, + { + "epoch": 0.25, + "learning_rate": 1.5091841093549763e-07, + "loss": 0.0025, + "step": 12689 + }, + { + "epoch": 0.25, + "learning_rate": 1.509145275911615e-07, + "loss": 0.7246, + "step": 12690 + }, + { + "epoch": 0.25, + "learning_rate": 1.5091064424682535e-07, + "loss": 0.0018, + "step": 12691 + }, + { + "epoch": 0.25, + "learning_rate": 1.5090676090248922e-07, + "loss": 0.0018, + "step": 12692 + }, + { + "epoch": 0.25, + "learning_rate": 1.5090287755815306e-07, + "loss": 0.0324, + "step": 12693 + }, + { + "epoch": 0.25, + "learning_rate": 1.5089899421381694e-07, + "loss": 0.0012, + "step": 12694 + }, + { + "epoch": 0.25, + "learning_rate": 1.5089511086948078e-07, + "loss": 0.0043, + "step": 12695 + }, + { + "epoch": 0.25, + "learning_rate": 1.5089122752514465e-07, + "loss": 0.0016, + "step": 12696 + }, + { + "epoch": 0.25, + "learning_rate": 1.508873441808085e-07, + "loss": 0.0583, + "step": 12697 + }, + { + "epoch": 0.25, + "learning_rate": 1.5088346083647237e-07, + "loss": 0.0492, + "step": 12698 + }, + { + "epoch": 0.25, + "learning_rate": 1.5087957749213621e-07, + "loss": 1.2035, + "step": 12699 + }, + { + "epoch": 0.25, + "learning_rate": 1.5087569414780008e-07, + "loss": 0.0017, + "step": 12700 + }, + { + "epoch": 0.25, + "learning_rate": 1.5087181080346393e-07, + "loss": 0.8137, + "step": 12701 + }, + { + "epoch": 0.25, + "learning_rate": 1.508679274591278e-07, + "loss": 0.0016, + "step": 12702 + }, + { + "epoch": 0.25, + "learning_rate": 1.5086404411479165e-07, + "loss": 0.1924, + "step": 12703 + }, + { + "epoch": 0.25, + "learning_rate": 1.5086016077045552e-07, + "loss": 0.1625, + "step": 12704 + }, + { + "epoch": 0.25, + "learning_rate": 1.5085627742611936e-07, + "loss": 0.0019, + "step": 12705 + }, + { + "epoch": 0.25, + "learning_rate": 1.5085239408178323e-07, + "loss": 0.0053, + "step": 12706 + }, + { + "epoch": 0.25, + "learning_rate": 1.5084851073744708e-07, + "loss": 0.0017, + "step": 12707 + }, + { + "epoch": 0.25, + "learning_rate": 1.5084462739311095e-07, + "loss": 0.0017, + "step": 12708 + }, + { + "epoch": 0.25, + "learning_rate": 1.508407440487748e-07, + "loss": 0.0017, + "step": 12709 + }, + { + "epoch": 0.25, + "learning_rate": 1.5083686070443867e-07, + "loss": 0.0019, + "step": 12710 + }, + { + "epoch": 0.25, + "learning_rate": 1.508329773601025e-07, + "loss": 0.04, + "step": 12711 + }, + { + "epoch": 0.25, + "learning_rate": 1.5082909401576638e-07, + "loss": 0.6173, + "step": 12712 + }, + { + "epoch": 0.25, + "learning_rate": 1.5082521067143023e-07, + "loss": 0.0132, + "step": 12713 + }, + { + "epoch": 0.25, + "learning_rate": 1.508213273270941e-07, + "loss": 0.0015, + "step": 12714 + }, + { + "epoch": 0.25, + "learning_rate": 1.5081744398275795e-07, + "loss": 0.0018, + "step": 12715 + }, + { + "epoch": 0.25, + "learning_rate": 1.5081356063842182e-07, + "loss": 0.002, + "step": 12716 + }, + { + "epoch": 0.25, + "learning_rate": 1.5080967729408566e-07, + "loss": 0.1217, + "step": 12717 + }, + { + "epoch": 0.25, + "learning_rate": 1.5080579394974953e-07, + "loss": 0.006, + "step": 12718 + }, + { + "epoch": 0.25, + "learning_rate": 1.5080191060541338e-07, + "loss": 0.002, + "step": 12719 + }, + { + "epoch": 0.25, + "learning_rate": 1.5079802726107725e-07, + "loss": 0.0035, + "step": 12720 + }, + { + "epoch": 0.25, + "learning_rate": 1.507941439167411e-07, + "loss": 0.002, + "step": 12721 + }, + { + "epoch": 0.25, + "learning_rate": 1.5079026057240497e-07, + "loss": 0.0303, + "step": 12722 + }, + { + "epoch": 0.25, + "learning_rate": 1.5078637722806878e-07, + "loss": 0.5005, + "step": 12723 + }, + { + "epoch": 0.25, + "learning_rate": 1.5078249388373266e-07, + "loss": 0.0058, + "step": 12724 + }, + { + "epoch": 0.25, + "learning_rate": 1.507786105393965e-07, + "loss": 0.0033, + "step": 12725 + }, + { + "epoch": 0.25, + "learning_rate": 1.5077472719506037e-07, + "loss": 0.2574, + "step": 12726 + }, + { + "epoch": 0.25, + "learning_rate": 1.5077084385072422e-07, + "loss": 0.0016, + "step": 12727 + }, + { + "epoch": 0.25, + "learning_rate": 1.507669605063881e-07, + "loss": 0.0112, + "step": 12728 + }, + { + "epoch": 0.25, + "learning_rate": 1.5076307716205193e-07, + "loss": 1.092, + "step": 12729 + }, + { + "epoch": 0.25, + "learning_rate": 1.507591938177158e-07, + "loss": 0.0015, + "step": 12730 + }, + { + "epoch": 0.25, + "learning_rate": 1.5075531047337965e-07, + "loss": 0.0204, + "step": 12731 + }, + { + "epoch": 0.25, + "learning_rate": 1.5075142712904352e-07, + "loss": 0.0016, + "step": 12732 + }, + { + "epoch": 0.25, + "learning_rate": 1.5074754378470737e-07, + "loss": 0.002, + "step": 12733 + }, + { + "epoch": 0.25, + "learning_rate": 1.5074366044037124e-07, + "loss": 0.0131, + "step": 12734 + }, + { + "epoch": 0.25, + "learning_rate": 1.5073977709603508e-07, + "loss": 0.0014, + "step": 12735 + }, + { + "epoch": 0.25, + "learning_rate": 1.5073589375169896e-07, + "loss": 0.0085, + "step": 12736 + }, + { + "epoch": 0.25, + "learning_rate": 1.507320104073628e-07, + "loss": 0.0036, + "step": 12737 + }, + { + "epoch": 0.25, + "learning_rate": 1.5072812706302667e-07, + "loss": 0.002, + "step": 12738 + }, + { + "epoch": 0.25, + "learning_rate": 1.5072424371869052e-07, + "loss": 0.0022, + "step": 12739 + }, + { + "epoch": 0.25, + "learning_rate": 1.507203603743544e-07, + "loss": 0.0017, + "step": 12740 + }, + { + "epoch": 0.25, + "learning_rate": 1.5071647703001823e-07, + "loss": 0.0042, + "step": 12741 + }, + { + "epoch": 0.25, + "learning_rate": 1.507125936856821e-07, + "loss": 0.002, + "step": 12742 + }, + { + "epoch": 0.25, + "learning_rate": 1.5070871034134595e-07, + "loss": 0.0018, + "step": 12743 + }, + { + "epoch": 0.25, + "learning_rate": 1.5070482699700982e-07, + "loss": 0.0022, + "step": 12744 + }, + { + "epoch": 0.25, + "learning_rate": 1.5070094365267367e-07, + "loss": 0.0017, + "step": 12745 + }, + { + "epoch": 0.25, + "learning_rate": 1.5069706030833754e-07, + "loss": 0.0016, + "step": 12746 + }, + { + "epoch": 0.25, + "learning_rate": 1.5069317696400138e-07, + "loss": 0.002, + "step": 12747 + }, + { + "epoch": 0.25, + "learning_rate": 1.5068929361966525e-07, + "loss": 0.0017, + "step": 12748 + }, + { + "epoch": 0.25, + "learning_rate": 1.506854102753291e-07, + "loss": 0.0014, + "step": 12749 + }, + { + "epoch": 0.25, + "learning_rate": 1.5068152693099297e-07, + "loss": 0.0036, + "step": 12750 + }, + { + "epoch": 0.25, + "learning_rate": 1.5067764358665682e-07, + "loss": 0.0024, + "step": 12751 + }, + { + "epoch": 0.25, + "learning_rate": 1.506737602423207e-07, + "loss": 0.424, + "step": 12752 + }, + { + "epoch": 0.25, + "learning_rate": 1.5066987689798453e-07, + "loss": 0.7735, + "step": 12753 + }, + { + "epoch": 0.25, + "learning_rate": 1.506659935536484e-07, + "loss": 0.0214, + "step": 12754 + }, + { + "epoch": 0.25, + "learning_rate": 1.5066211020931225e-07, + "loss": 0.6947, + "step": 12755 + }, + { + "epoch": 0.25, + "learning_rate": 1.5065822686497612e-07, + "loss": 0.0017, + "step": 12756 + }, + { + "epoch": 0.25, + "learning_rate": 1.5065434352063997e-07, + "loss": 0.0013, + "step": 12757 + }, + { + "epoch": 0.25, + "learning_rate": 1.5065046017630384e-07, + "loss": 0.0156, + "step": 12758 + }, + { + "epoch": 0.25, + "learning_rate": 1.5064657683196768e-07, + "loss": 0.0016, + "step": 12759 + }, + { + "epoch": 0.25, + "learning_rate": 1.5064269348763155e-07, + "loss": 0.0282, + "step": 12760 + }, + { + "epoch": 0.25, + "learning_rate": 1.506388101432954e-07, + "loss": 0.0016, + "step": 12761 + }, + { + "epoch": 0.25, + "learning_rate": 1.5063492679895927e-07, + "loss": 0.0018, + "step": 12762 + }, + { + "epoch": 0.25, + "learning_rate": 1.5063104345462311e-07, + "loss": 0.0016, + "step": 12763 + }, + { + "epoch": 0.25, + "learning_rate": 1.5062716011028699e-07, + "loss": 0.0015, + "step": 12764 + }, + { + "epoch": 0.25, + "learning_rate": 1.5062327676595083e-07, + "loss": 0.003, + "step": 12765 + }, + { + "epoch": 0.25, + "learning_rate": 1.506193934216147e-07, + "loss": 0.0014, + "step": 12766 + }, + { + "epoch": 0.25, + "learning_rate": 1.5061551007727855e-07, + "loss": 0.0013, + "step": 12767 + }, + { + "epoch": 0.25, + "learning_rate": 1.5061162673294242e-07, + "loss": 0.2103, + "step": 12768 + }, + { + "epoch": 0.25, + "learning_rate": 1.5060774338860626e-07, + "loss": 0.0024, + "step": 12769 + }, + { + "epoch": 0.25, + "learning_rate": 1.5060386004427014e-07, + "loss": 0.0022, + "step": 12770 + }, + { + "epoch": 0.25, + "learning_rate": 1.5059997669993398e-07, + "loss": 0.3577, + "step": 12771 + }, + { + "epoch": 0.25, + "learning_rate": 1.5059609335559785e-07, + "loss": 0.0017, + "step": 12772 + }, + { + "epoch": 0.25, + "learning_rate": 1.505922100112617e-07, + "loss": 0.0016, + "step": 12773 + }, + { + "epoch": 0.25, + "learning_rate": 1.5058832666692557e-07, + "loss": 0.0018, + "step": 12774 + }, + { + "epoch": 0.25, + "learning_rate": 1.5058444332258941e-07, + "loss": 0.0079, + "step": 12775 + }, + { + "epoch": 0.25, + "learning_rate": 1.5058055997825328e-07, + "loss": 0.0015, + "step": 12776 + }, + { + "epoch": 0.25, + "learning_rate": 1.5057667663391713e-07, + "loss": 0.0016, + "step": 12777 + }, + { + "epoch": 0.25, + "learning_rate": 1.50572793289581e-07, + "loss": 0.5386, + "step": 12778 + }, + { + "epoch": 0.25, + "learning_rate": 1.5056890994524485e-07, + "loss": 0.0015, + "step": 12779 + }, + { + "epoch": 0.25, + "learning_rate": 1.5056502660090872e-07, + "loss": 0.0018, + "step": 12780 + }, + { + "epoch": 0.25, + "learning_rate": 1.5056114325657254e-07, + "loss": 0.0022, + "step": 12781 + }, + { + "epoch": 0.25, + "learning_rate": 1.505572599122364e-07, + "loss": 1.2675, + "step": 12782 + }, + { + "epoch": 0.25, + "learning_rate": 1.5055337656790025e-07, + "loss": 0.1323, + "step": 12783 + }, + { + "epoch": 0.25, + "learning_rate": 1.5054949322356412e-07, + "loss": 0.0017, + "step": 12784 + }, + { + "epoch": 0.25, + "learning_rate": 1.5054560987922797e-07, + "loss": 0.0018, + "step": 12785 + }, + { + "epoch": 0.25, + "learning_rate": 1.5054172653489184e-07, + "loss": 0.4787, + "step": 12786 + }, + { + "epoch": 0.25, + "learning_rate": 1.5053784319055569e-07, + "loss": 0.0317, + "step": 12787 + }, + { + "epoch": 0.25, + "learning_rate": 1.5053395984621956e-07, + "loss": 0.0029, + "step": 12788 + }, + { + "epoch": 0.25, + "learning_rate": 1.505300765018834e-07, + "loss": 0.0017, + "step": 12789 + }, + { + "epoch": 0.25, + "learning_rate": 1.5052619315754727e-07, + "loss": 0.0019, + "step": 12790 + }, + { + "epoch": 0.25, + "learning_rate": 1.5052230981321112e-07, + "loss": 0.0323, + "step": 12791 + }, + { + "epoch": 0.25, + "learning_rate": 1.50518426468875e-07, + "loss": 0.0017, + "step": 12792 + }, + { + "epoch": 0.25, + "learning_rate": 1.5051454312453884e-07, + "loss": 0.943, + "step": 12793 + }, + { + "epoch": 0.25, + "learning_rate": 1.505106597802027e-07, + "loss": 0.7619, + "step": 12794 + }, + { + "epoch": 0.25, + "learning_rate": 1.5050677643586655e-07, + "loss": 0.0061, + "step": 12795 + }, + { + "epoch": 0.25, + "learning_rate": 1.5050289309153042e-07, + "loss": 0.0018, + "step": 12796 + }, + { + "epoch": 0.25, + "learning_rate": 1.5049900974719427e-07, + "loss": 0.0022, + "step": 12797 + }, + { + "epoch": 0.25, + "learning_rate": 1.5049512640285814e-07, + "loss": 0.0014, + "step": 12798 + }, + { + "epoch": 0.25, + "learning_rate": 1.5049124305852198e-07, + "loss": 0.0017, + "step": 12799 + }, + { + "epoch": 0.25, + "learning_rate": 1.5048735971418586e-07, + "loss": 0.0047, + "step": 12800 + }, + { + "epoch": 0.25, + "learning_rate": 1.504834763698497e-07, + "loss": 0.0013, + "step": 12801 + }, + { + "epoch": 0.25, + "learning_rate": 1.5047959302551357e-07, + "loss": 0.0014, + "step": 12802 + }, + { + "epoch": 0.25, + "learning_rate": 1.5047570968117742e-07, + "loss": 0.0018, + "step": 12803 + }, + { + "epoch": 0.25, + "learning_rate": 1.504718263368413e-07, + "loss": 0.0015, + "step": 12804 + }, + { + "epoch": 0.25, + "learning_rate": 1.5046794299250513e-07, + "loss": 0.0015, + "step": 12805 + }, + { + "epoch": 0.25, + "learning_rate": 1.50464059648169e-07, + "loss": 0.0019, + "step": 12806 + }, + { + "epoch": 0.25, + "learning_rate": 1.5046017630383285e-07, + "loss": 0.0027, + "step": 12807 + }, + { + "epoch": 0.25, + "learning_rate": 1.5045629295949672e-07, + "loss": 0.0015, + "step": 12808 + }, + { + "epoch": 0.25, + "learning_rate": 1.5045240961516057e-07, + "loss": 0.6353, + "step": 12809 + }, + { + "epoch": 0.25, + "learning_rate": 1.5044852627082444e-07, + "loss": 0.2751, + "step": 12810 + }, + { + "epoch": 0.25, + "learning_rate": 1.5044464292648828e-07, + "loss": 0.0074, + "step": 12811 + }, + { + "epoch": 0.25, + "learning_rate": 1.5044075958215216e-07, + "loss": 0.0021, + "step": 12812 + }, + { + "epoch": 0.25, + "learning_rate": 1.50436876237816e-07, + "loss": 0.0196, + "step": 12813 + }, + { + "epoch": 0.25, + "learning_rate": 1.5043299289347987e-07, + "loss": 0.4219, + "step": 12814 + }, + { + "epoch": 0.25, + "learning_rate": 1.5042910954914372e-07, + "loss": 0.0014, + "step": 12815 + }, + { + "epoch": 0.25, + "learning_rate": 1.504252262048076e-07, + "loss": 0.6717, + "step": 12816 + }, + { + "epoch": 0.25, + "learning_rate": 1.5042134286047143e-07, + "loss": 0.0059, + "step": 12817 + }, + { + "epoch": 0.25, + "learning_rate": 1.504174595161353e-07, + "loss": 0.0016, + "step": 12818 + }, + { + "epoch": 0.25, + "learning_rate": 1.5041357617179915e-07, + "loss": 0.0479, + "step": 12819 + }, + { + "epoch": 0.25, + "learning_rate": 1.5040969282746302e-07, + "loss": 0.0044, + "step": 12820 + }, + { + "epoch": 0.25, + "learning_rate": 1.5040580948312687e-07, + "loss": 0.1699, + "step": 12821 + }, + { + "epoch": 0.25, + "learning_rate": 1.5040192613879074e-07, + "loss": 0.0218, + "step": 12822 + }, + { + "epoch": 0.25, + "learning_rate": 1.5039804279445458e-07, + "loss": 0.4681, + "step": 12823 + }, + { + "epoch": 0.25, + "learning_rate": 1.5039415945011843e-07, + "loss": 0.0075, + "step": 12824 + }, + { + "epoch": 0.25, + "learning_rate": 1.503902761057823e-07, + "loss": 0.0287, + "step": 12825 + }, + { + "epoch": 0.25, + "learning_rate": 1.5038639276144614e-07, + "loss": 1.0624, + "step": 12826 + }, + { + "epoch": 0.25, + "learning_rate": 1.5038250941711002e-07, + "loss": 0.0014, + "step": 12827 + }, + { + "epoch": 0.25, + "learning_rate": 1.5037862607277386e-07, + "loss": 0.6185, + "step": 12828 + }, + { + "epoch": 0.25, + "learning_rate": 1.5037474272843773e-07, + "loss": 0.0016, + "step": 12829 + }, + { + "epoch": 0.25, + "learning_rate": 1.5037085938410158e-07, + "loss": 0.0327, + "step": 12830 + }, + { + "epoch": 0.25, + "learning_rate": 1.5036697603976545e-07, + "loss": 0.0015, + "step": 12831 + }, + { + "epoch": 0.25, + "learning_rate": 1.503630926954293e-07, + "loss": 0.0022, + "step": 12832 + }, + { + "epoch": 0.25, + "learning_rate": 1.5035920935109317e-07, + "loss": 0.0062, + "step": 12833 + }, + { + "epoch": 0.25, + "learning_rate": 1.50355326006757e-07, + "loss": 0.0025, + "step": 12834 + }, + { + "epoch": 0.25, + "learning_rate": 1.5035144266242088e-07, + "loss": 0.002, + "step": 12835 + }, + { + "epoch": 0.25, + "learning_rate": 1.5034755931808473e-07, + "loss": 0.0021, + "step": 12836 + }, + { + "epoch": 0.25, + "learning_rate": 1.503436759737486e-07, + "loss": 0.2466, + "step": 12837 + }, + { + "epoch": 0.25, + "learning_rate": 1.5033979262941244e-07, + "loss": 0.0015, + "step": 12838 + }, + { + "epoch": 0.25, + "learning_rate": 1.503359092850763e-07, + "loss": 0.0015, + "step": 12839 + }, + { + "epoch": 0.25, + "learning_rate": 1.5033202594074016e-07, + "loss": 0.0016, + "step": 12840 + }, + { + "epoch": 0.25, + "learning_rate": 1.50328142596404e-07, + "loss": 0.0016, + "step": 12841 + }, + { + "epoch": 0.25, + "learning_rate": 1.5032425925206788e-07, + "loss": 0.0051, + "step": 12842 + }, + { + "epoch": 0.25, + "learning_rate": 1.5032037590773172e-07, + "loss": 0.0018, + "step": 12843 + }, + { + "epoch": 0.25, + "learning_rate": 1.503164925633956e-07, + "loss": 0.0017, + "step": 12844 + }, + { + "epoch": 0.25, + "learning_rate": 1.5031260921905944e-07, + "loss": 0.0016, + "step": 12845 + }, + { + "epoch": 0.25, + "learning_rate": 1.503087258747233e-07, + "loss": 0.2422, + "step": 12846 + }, + { + "epoch": 0.25, + "learning_rate": 1.5030484253038715e-07, + "loss": 0.5906, + "step": 12847 + }, + { + "epoch": 0.25, + "learning_rate": 1.5030095918605103e-07, + "loss": 0.0017, + "step": 12848 + }, + { + "epoch": 0.25, + "learning_rate": 1.5029707584171487e-07, + "loss": 0.0017, + "step": 12849 + }, + { + "epoch": 0.25, + "learning_rate": 1.5029319249737874e-07, + "loss": 0.0019, + "step": 12850 + }, + { + "epoch": 0.25, + "learning_rate": 1.502893091530426e-07, + "loss": 0.0024, + "step": 12851 + }, + { + "epoch": 0.25, + "learning_rate": 1.5028542580870643e-07, + "loss": 0.2641, + "step": 12852 + }, + { + "epoch": 0.25, + "learning_rate": 1.502815424643703e-07, + "loss": 0.0283, + "step": 12853 + }, + { + "epoch": 0.25, + "learning_rate": 1.5027765912003415e-07, + "loss": 0.0015, + "step": 12854 + }, + { + "epoch": 0.25, + "learning_rate": 1.5027377577569802e-07, + "loss": 0.002, + "step": 12855 + }, + { + "epoch": 0.25, + "learning_rate": 1.5026989243136187e-07, + "loss": 0.6094, + "step": 12856 + }, + { + "epoch": 0.25, + "learning_rate": 1.5026600908702574e-07, + "loss": 0.0017, + "step": 12857 + }, + { + "epoch": 0.25, + "learning_rate": 1.5026212574268958e-07, + "loss": 0.0034, + "step": 12858 + }, + { + "epoch": 0.25, + "learning_rate": 1.5025824239835345e-07, + "loss": 0.0134, + "step": 12859 + }, + { + "epoch": 0.25, + "learning_rate": 1.502543590540173e-07, + "loss": 0.0018, + "step": 12860 + }, + { + "epoch": 0.25, + "learning_rate": 1.5025047570968117e-07, + "loss": 0.0032, + "step": 12861 + }, + { + "epoch": 0.25, + "learning_rate": 1.5024659236534501e-07, + "loss": 0.0161, + "step": 12862 + }, + { + "epoch": 0.25, + "learning_rate": 1.5024270902100889e-07, + "loss": 0.5821, + "step": 12863 + }, + { + "epoch": 0.25, + "learning_rate": 1.5023882567667273e-07, + "loss": 0.0016, + "step": 12864 + }, + { + "epoch": 0.25, + "learning_rate": 1.502349423323366e-07, + "loss": 0.0017, + "step": 12865 + }, + { + "epoch": 0.25, + "learning_rate": 1.5023105898800045e-07, + "loss": 0.1963, + "step": 12866 + }, + { + "epoch": 0.25, + "learning_rate": 1.5022717564366432e-07, + "loss": 0.0024, + "step": 12867 + }, + { + "epoch": 0.25, + "learning_rate": 1.5022329229932816e-07, + "loss": 0.0022, + "step": 12868 + }, + { + "epoch": 0.25, + "learning_rate": 1.5021940895499204e-07, + "loss": 0.002, + "step": 12869 + }, + { + "epoch": 0.25, + "learning_rate": 1.5021552561065588e-07, + "loss": 0.0025, + "step": 12870 + }, + { + "epoch": 0.25, + "learning_rate": 1.5021164226631975e-07, + "loss": 0.0014, + "step": 12871 + }, + { + "epoch": 0.25, + "learning_rate": 1.502077589219836e-07, + "loss": 0.4879, + "step": 12872 + }, + { + "epoch": 0.25, + "learning_rate": 1.5020387557764747e-07, + "loss": 0.0014, + "step": 12873 + }, + { + "epoch": 0.25, + "learning_rate": 1.5019999223331131e-07, + "loss": 0.0018, + "step": 12874 + }, + { + "epoch": 0.25, + "learning_rate": 1.5019610888897518e-07, + "loss": 0.0046, + "step": 12875 + }, + { + "epoch": 0.25, + "learning_rate": 1.5019222554463903e-07, + "loss": 0.0018, + "step": 12876 + }, + { + "epoch": 0.25, + "learning_rate": 1.501883422003029e-07, + "loss": 0.0014, + "step": 12877 + }, + { + "epoch": 0.25, + "learning_rate": 1.5018445885596675e-07, + "loss": 0.0012, + "step": 12878 + }, + { + "epoch": 0.25, + "learning_rate": 1.5018057551163062e-07, + "loss": 0.0015, + "step": 12879 + }, + { + "epoch": 0.25, + "learning_rate": 1.5017669216729446e-07, + "loss": 0.0019, + "step": 12880 + }, + { + "epoch": 0.25, + "learning_rate": 1.5017280882295833e-07, + "loss": 0.0016, + "step": 12881 + }, + { + "epoch": 0.25, + "learning_rate": 1.5016892547862218e-07, + "loss": 1.1076, + "step": 12882 + }, + { + "epoch": 0.25, + "learning_rate": 1.5016504213428605e-07, + "loss": 0.4434, + "step": 12883 + }, + { + "epoch": 0.25, + "learning_rate": 1.501611587899499e-07, + "loss": 0.0019, + "step": 12884 + }, + { + "epoch": 0.25, + "learning_rate": 1.5015727544561377e-07, + "loss": 0.0016, + "step": 12885 + }, + { + "epoch": 0.25, + "learning_rate": 1.501533921012776e-07, + "loss": 0.3916, + "step": 12886 + }, + { + "epoch": 0.25, + "learning_rate": 1.5014950875694148e-07, + "loss": 0.0057, + "step": 12887 + }, + { + "epoch": 0.25, + "learning_rate": 1.5014562541260533e-07, + "loss": 1.0923, + "step": 12888 + }, + { + "epoch": 0.25, + "learning_rate": 1.501417420682692e-07, + "loss": 0.0014, + "step": 12889 + }, + { + "epoch": 0.25, + "learning_rate": 1.5013785872393305e-07, + "loss": 0.0012, + "step": 12890 + }, + { + "epoch": 0.25, + "learning_rate": 1.5013397537959692e-07, + "loss": 0.0026, + "step": 12891 + }, + { + "epoch": 0.25, + "learning_rate": 1.5013009203526076e-07, + "loss": 0.0025, + "step": 12892 + }, + { + "epoch": 0.25, + "learning_rate": 1.5012620869092463e-07, + "loss": 0.0014, + "step": 12893 + }, + { + "epoch": 0.25, + "learning_rate": 1.5012232534658848e-07, + "loss": 0.0026, + "step": 12894 + }, + { + "epoch": 0.25, + "learning_rate": 1.5011844200225235e-07, + "loss": 0.0024, + "step": 12895 + }, + { + "epoch": 0.25, + "learning_rate": 1.501145586579162e-07, + "loss": 0.0016, + "step": 12896 + }, + { + "epoch": 0.25, + "learning_rate": 1.5011067531358004e-07, + "loss": 0.0056, + "step": 12897 + }, + { + "epoch": 0.25, + "learning_rate": 1.5010679196924388e-07, + "loss": 0.0013, + "step": 12898 + }, + { + "epoch": 0.25, + "learning_rate": 1.5010290862490776e-07, + "loss": 0.0018, + "step": 12899 + }, + { + "epoch": 0.25, + "learning_rate": 1.500990252805716e-07, + "loss": 0.036, + "step": 12900 + }, + { + "epoch": 0.25, + "learning_rate": 1.5009514193623547e-07, + "loss": 0.0015, + "step": 12901 + }, + { + "epoch": 0.25, + "learning_rate": 1.5009125859189932e-07, + "loss": 1.4805, + "step": 12902 + }, + { + "epoch": 0.25, + "learning_rate": 1.500873752475632e-07, + "loss": 0.0016, + "step": 12903 + }, + { + "epoch": 0.25, + "learning_rate": 1.5008349190322703e-07, + "loss": 0.0016, + "step": 12904 + }, + { + "epoch": 0.25, + "learning_rate": 1.500796085588909e-07, + "loss": 0.0039, + "step": 12905 + }, + { + "epoch": 0.25, + "learning_rate": 1.5007572521455475e-07, + "loss": 0.002, + "step": 12906 + }, + { + "epoch": 0.25, + "learning_rate": 1.5007184187021862e-07, + "loss": 1.1865, + "step": 12907 + }, + { + "epoch": 0.25, + "learning_rate": 1.5006795852588247e-07, + "loss": 0.0184, + "step": 12908 + }, + { + "epoch": 0.25, + "learning_rate": 1.5006407518154634e-07, + "loss": 1.0966, + "step": 12909 + }, + { + "epoch": 0.25, + "learning_rate": 1.5006019183721018e-07, + "loss": 0.0015, + "step": 12910 + }, + { + "epoch": 0.25, + "learning_rate": 1.5005630849287406e-07, + "loss": 0.0262, + "step": 12911 + }, + { + "epoch": 0.25, + "learning_rate": 1.500524251485379e-07, + "loss": 0.0164, + "step": 12912 + }, + { + "epoch": 0.25, + "learning_rate": 1.5004854180420177e-07, + "loss": 0.0011, + "step": 12913 + }, + { + "epoch": 0.25, + "learning_rate": 1.5004465845986562e-07, + "loss": 0.0029, + "step": 12914 + }, + { + "epoch": 0.25, + "learning_rate": 1.500407751155295e-07, + "loss": 0.002, + "step": 12915 + }, + { + "epoch": 0.25, + "learning_rate": 1.5003689177119333e-07, + "loss": 0.0017, + "step": 12916 + }, + { + "epoch": 0.25, + "learning_rate": 1.500330084268572e-07, + "loss": 0.0015, + "step": 12917 + }, + { + "epoch": 0.25, + "learning_rate": 1.5002912508252105e-07, + "loss": 0.0013, + "step": 12918 + }, + { + "epoch": 0.25, + "learning_rate": 1.5002524173818492e-07, + "loss": 0.0639, + "step": 12919 + }, + { + "epoch": 0.25, + "learning_rate": 1.5002135839384877e-07, + "loss": 0.0014, + "step": 12920 + }, + { + "epoch": 0.25, + "learning_rate": 1.5001747504951264e-07, + "loss": 0.0014, + "step": 12921 + }, + { + "epoch": 0.25, + "learning_rate": 1.5001359170517648e-07, + "loss": 0.0171, + "step": 12922 + }, + { + "epoch": 0.25, + "learning_rate": 1.5000970836084035e-07, + "loss": 0.0034, + "step": 12923 + }, + { + "epoch": 0.25, + "learning_rate": 1.500058250165042e-07, + "loss": 0.002, + "step": 12924 + }, + { + "epoch": 0.25, + "learning_rate": 1.5000194167216807e-07, + "loss": 0.116, + "step": 12925 + }, + { + "epoch": 0.25, + "learning_rate": 1.4999805832783192e-07, + "loss": 0.0038, + "step": 12926 + }, + { + "epoch": 0.25, + "learning_rate": 1.499941749834958e-07, + "loss": 0.0024, + "step": 12927 + }, + { + "epoch": 0.25, + "learning_rate": 1.4999029163915963e-07, + "loss": 1.0394, + "step": 12928 + }, + { + "epoch": 0.25, + "learning_rate": 1.499864082948235e-07, + "loss": 0.0045, + "step": 12929 + }, + { + "epoch": 0.25, + "learning_rate": 1.4998252495048735e-07, + "loss": 0.0022, + "step": 12930 + }, + { + "epoch": 0.25, + "learning_rate": 1.4997864160615122e-07, + "loss": 0.0072, + "step": 12931 + }, + { + "epoch": 0.25, + "learning_rate": 1.4997475826181507e-07, + "loss": 0.0267, + "step": 12932 + }, + { + "epoch": 0.25, + "learning_rate": 1.4997087491747894e-07, + "loss": 0.0017, + "step": 12933 + }, + { + "epoch": 0.25, + "learning_rate": 1.4996699157314278e-07, + "loss": 0.0016, + "step": 12934 + }, + { + "epoch": 0.25, + "learning_rate": 1.4996310822880665e-07, + "loss": 0.1073, + "step": 12935 + }, + { + "epoch": 0.25, + "learning_rate": 1.499592248844705e-07, + "loss": 0.0018, + "step": 12936 + }, + { + "epoch": 0.25, + "learning_rate": 1.4995534154013437e-07, + "loss": 0.0015, + "step": 12937 + }, + { + "epoch": 0.25, + "learning_rate": 1.4995145819579821e-07, + "loss": 0.0017, + "step": 12938 + }, + { + "epoch": 0.25, + "learning_rate": 1.4994757485146209e-07, + "loss": 0.0016, + "step": 12939 + }, + { + "epoch": 0.25, + "learning_rate": 1.4994369150712593e-07, + "loss": 0.0015, + "step": 12940 + }, + { + "epoch": 0.25, + "learning_rate": 1.499398081627898e-07, + "loss": 0.0015, + "step": 12941 + }, + { + "epoch": 0.25, + "learning_rate": 1.4993592481845365e-07, + "loss": 0.1073, + "step": 12942 + }, + { + "epoch": 0.25, + "learning_rate": 1.4993204147411752e-07, + "loss": 0.0014, + "step": 12943 + }, + { + "epoch": 0.25, + "learning_rate": 1.4992815812978136e-07, + "loss": 0.0024, + "step": 12944 + }, + { + "epoch": 0.25, + "learning_rate": 1.4992427478544524e-07, + "loss": 0.0015, + "step": 12945 + }, + { + "epoch": 0.25, + "learning_rate": 1.4992039144110908e-07, + "loss": 0.0018, + "step": 12946 + }, + { + "epoch": 0.25, + "learning_rate": 1.4991650809677295e-07, + "loss": 0.0151, + "step": 12947 + }, + { + "epoch": 0.25, + "learning_rate": 1.499126247524368e-07, + "loss": 0.0018, + "step": 12948 + }, + { + "epoch": 0.25, + "learning_rate": 1.4990874140810067e-07, + "loss": 0.1778, + "step": 12949 + }, + { + "epoch": 0.25, + "learning_rate": 1.4990485806376451e-07, + "loss": 0.3716, + "step": 12950 + }, + { + "epoch": 0.25, + "learning_rate": 1.4990097471942839e-07, + "loss": 0.0015, + "step": 12951 + }, + { + "epoch": 0.25, + "learning_rate": 1.4989709137509223e-07, + "loss": 0.0023, + "step": 12952 + }, + { + "epoch": 0.25, + "learning_rate": 1.498932080307561e-07, + "loss": 0.0021, + "step": 12953 + }, + { + "epoch": 0.25, + "learning_rate": 1.4988932468641995e-07, + "loss": 0.0016, + "step": 12954 + }, + { + "epoch": 0.25, + "learning_rate": 1.498854413420838e-07, + "loss": 0.0017, + "step": 12955 + }, + { + "epoch": 0.25, + "learning_rate": 1.4988155799774764e-07, + "loss": 0.0016, + "step": 12956 + }, + { + "epoch": 0.25, + "learning_rate": 1.498776746534115e-07, + "loss": 0.0014, + "step": 12957 + }, + { + "epoch": 0.25, + "learning_rate": 1.4987379130907535e-07, + "loss": 0.0018, + "step": 12958 + }, + { + "epoch": 0.25, + "learning_rate": 1.4986990796473922e-07, + "loss": 0.0015, + "step": 12959 + }, + { + "epoch": 0.25, + "learning_rate": 1.4986602462040307e-07, + "loss": 0.0017, + "step": 12960 + }, + { + "epoch": 0.25, + "learning_rate": 1.4986214127606694e-07, + "loss": 0.5304, + "step": 12961 + }, + { + "epoch": 0.25, + "learning_rate": 1.4985825793173079e-07, + "loss": 0.625, + "step": 12962 + }, + { + "epoch": 0.25, + "learning_rate": 1.4985437458739466e-07, + "loss": 0.0012, + "step": 12963 + }, + { + "epoch": 0.25, + "learning_rate": 1.498504912430585e-07, + "loss": 0.0022, + "step": 12964 + }, + { + "epoch": 0.25, + "learning_rate": 1.4984660789872237e-07, + "loss": 0.0014, + "step": 12965 + }, + { + "epoch": 0.25, + "learning_rate": 1.4984272455438622e-07, + "loss": 0.0066, + "step": 12966 + }, + { + "epoch": 0.25, + "learning_rate": 1.498388412100501e-07, + "loss": 0.0014, + "step": 12967 + }, + { + "epoch": 0.25, + "learning_rate": 1.4983495786571394e-07, + "loss": 0.0021, + "step": 12968 + }, + { + "epoch": 0.25, + "learning_rate": 1.498310745213778e-07, + "loss": 0.0551, + "step": 12969 + }, + { + "epoch": 0.25, + "learning_rate": 1.4982719117704165e-07, + "loss": 0.0029, + "step": 12970 + }, + { + "epoch": 0.25, + "learning_rate": 1.4982330783270552e-07, + "loss": 0.2062, + "step": 12971 + }, + { + "epoch": 0.25, + "learning_rate": 1.4981942448836937e-07, + "loss": 0.0018, + "step": 12972 + }, + { + "epoch": 0.25, + "learning_rate": 1.4981554114403324e-07, + "loss": 0.0772, + "step": 12973 + }, + { + "epoch": 0.25, + "learning_rate": 1.4981165779969708e-07, + "loss": 0.0143, + "step": 12974 + }, + { + "epoch": 0.25, + "learning_rate": 1.4980777445536096e-07, + "loss": 0.1528, + "step": 12975 + }, + { + "epoch": 0.25, + "learning_rate": 1.498038911110248e-07, + "loss": 0.6644, + "step": 12976 + }, + { + "epoch": 0.25, + "learning_rate": 1.4980000776668867e-07, + "loss": 0.0015, + "step": 12977 + }, + { + "epoch": 0.25, + "learning_rate": 1.4979612442235252e-07, + "loss": 0.0015, + "step": 12978 + }, + { + "epoch": 0.25, + "learning_rate": 1.497922410780164e-07, + "loss": 0.0012, + "step": 12979 + }, + { + "epoch": 0.25, + "learning_rate": 1.4978835773368023e-07, + "loss": 0.003, + "step": 12980 + }, + { + "epoch": 0.25, + "learning_rate": 1.497844743893441e-07, + "loss": 0.0015, + "step": 12981 + }, + { + "epoch": 0.25, + "learning_rate": 1.4978059104500795e-07, + "loss": 0.0013, + "step": 12982 + }, + { + "epoch": 0.25, + "learning_rate": 1.4977670770067182e-07, + "loss": 0.028, + "step": 12983 + }, + { + "epoch": 0.25, + "learning_rate": 1.4977282435633567e-07, + "loss": 0.0015, + "step": 12984 + }, + { + "epoch": 0.25, + "learning_rate": 1.4976894101199954e-07, + "loss": 0.0021, + "step": 12985 + }, + { + "epoch": 0.25, + "learning_rate": 1.4976505766766338e-07, + "loss": 0.0015, + "step": 12986 + }, + { + "epoch": 0.25, + "learning_rate": 1.4976117432332726e-07, + "loss": 0.0017, + "step": 12987 + }, + { + "epoch": 0.25, + "learning_rate": 1.497572909789911e-07, + "loss": 0.0017, + "step": 12988 + }, + { + "epoch": 0.25, + "learning_rate": 1.4975340763465497e-07, + "loss": 0.0048, + "step": 12989 + }, + { + "epoch": 0.25, + "learning_rate": 1.4974952429031882e-07, + "loss": 0.0173, + "step": 12990 + }, + { + "epoch": 0.25, + "learning_rate": 1.497456409459827e-07, + "loss": 0.13, + "step": 12991 + }, + { + "epoch": 0.25, + "learning_rate": 1.4974175760164653e-07, + "loss": 0.0466, + "step": 12992 + }, + { + "epoch": 0.25, + "learning_rate": 1.497378742573104e-07, + "loss": 0.0035, + "step": 12993 + }, + { + "epoch": 0.25, + "learning_rate": 1.4973399091297425e-07, + "loss": 0.0021, + "step": 12994 + }, + { + "epoch": 0.25, + "learning_rate": 1.4973010756863812e-07, + "loss": 0.0036, + "step": 12995 + }, + { + "epoch": 0.25, + "learning_rate": 1.4972622422430197e-07, + "loss": 0.0962, + "step": 12996 + }, + { + "epoch": 0.25, + "learning_rate": 1.4972234087996584e-07, + "loss": 0.0035, + "step": 12997 + }, + { + "epoch": 0.25, + "learning_rate": 1.4971845753562968e-07, + "loss": 0.2134, + "step": 12998 + }, + { + "epoch": 0.25, + "learning_rate": 1.4971457419129355e-07, + "loss": 0.0209, + "step": 12999 + }, + { + "epoch": 0.25, + "learning_rate": 1.497106908469574e-07, + "loss": 0.0018, + "step": 13000 + }, + { + "epoch": 0.25, + "learning_rate": 1.4970680750262124e-07, + "loss": 0.0014, + "step": 13001 + }, + { + "epoch": 0.25, + "learning_rate": 1.4970292415828512e-07, + "loss": 0.0017, + "step": 13002 + }, + { + "epoch": 0.25, + "learning_rate": 1.4969904081394896e-07, + "loss": 0.0026, + "step": 13003 + }, + { + "epoch": 0.25, + "learning_rate": 1.4969515746961283e-07, + "loss": 0.0027, + "step": 13004 + }, + { + "epoch": 0.25, + "learning_rate": 1.4969127412527668e-07, + "loss": 0.0278, + "step": 13005 + }, + { + "epoch": 0.25, + "learning_rate": 1.4968739078094055e-07, + "loss": 0.0028, + "step": 13006 + }, + { + "epoch": 0.25, + "learning_rate": 1.496835074366044e-07, + "loss": 0.0027, + "step": 13007 + }, + { + "epoch": 0.25, + "learning_rate": 1.4967962409226827e-07, + "loss": 0.0051, + "step": 13008 + }, + { + "epoch": 0.25, + "learning_rate": 1.496757407479321e-07, + "loss": 0.0026, + "step": 13009 + }, + { + "epoch": 0.25, + "learning_rate": 1.4967185740359598e-07, + "loss": 0.0016, + "step": 13010 + }, + { + "epoch": 0.25, + "learning_rate": 1.4966797405925983e-07, + "loss": 0.0013, + "step": 13011 + }, + { + "epoch": 0.25, + "learning_rate": 1.496640907149237e-07, + "loss": 0.2777, + "step": 13012 + }, + { + "epoch": 0.25, + "learning_rate": 1.4966020737058754e-07, + "loss": 0.0039, + "step": 13013 + }, + { + "epoch": 0.25, + "learning_rate": 1.496563240262514e-07, + "loss": 0.2353, + "step": 13014 + }, + { + "epoch": 0.25, + "learning_rate": 1.4965244068191526e-07, + "loss": 0.0017, + "step": 13015 + }, + { + "epoch": 0.25, + "learning_rate": 1.496485573375791e-07, + "loss": 0.0015, + "step": 13016 + }, + { + "epoch": 0.25, + "learning_rate": 1.4964467399324298e-07, + "loss": 0.0041, + "step": 13017 + }, + { + "epoch": 0.25, + "learning_rate": 1.4964079064890682e-07, + "loss": 0.0015, + "step": 13018 + }, + { + "epoch": 0.25, + "learning_rate": 1.496369073045707e-07, + "loss": 0.0026, + "step": 13019 + }, + { + "epoch": 0.25, + "learning_rate": 1.4963302396023454e-07, + "loss": 0.016, + "step": 13020 + }, + { + "epoch": 0.25, + "learning_rate": 1.496291406158984e-07, + "loss": 0.0016, + "step": 13021 + }, + { + "epoch": 0.25, + "learning_rate": 1.4962525727156225e-07, + "loss": 0.0054, + "step": 13022 + }, + { + "epoch": 0.25, + "learning_rate": 1.4962137392722613e-07, + "loss": 0.0117, + "step": 13023 + }, + { + "epoch": 0.25, + "learning_rate": 1.4961749058288997e-07, + "loss": 0.0076, + "step": 13024 + }, + { + "epoch": 0.25, + "learning_rate": 1.4961360723855384e-07, + "loss": 0.0018, + "step": 13025 + }, + { + "epoch": 0.25, + "learning_rate": 1.496097238942177e-07, + "loss": 0.0014, + "step": 13026 + }, + { + "epoch": 0.25, + "learning_rate": 1.4960584054988156e-07, + "loss": 0.009, + "step": 13027 + }, + { + "epoch": 0.25, + "learning_rate": 1.496019572055454e-07, + "loss": 0.0015, + "step": 13028 + }, + { + "epoch": 0.25, + "learning_rate": 1.4959807386120925e-07, + "loss": 0.0028, + "step": 13029 + }, + { + "epoch": 0.25, + "learning_rate": 1.4959419051687312e-07, + "loss": 0.0019, + "step": 13030 + }, + { + "epoch": 0.25, + "learning_rate": 1.4959030717253697e-07, + "loss": 1.1328, + "step": 13031 + }, + { + "epoch": 0.25, + "learning_rate": 1.4958642382820084e-07, + "loss": 0.0015, + "step": 13032 + }, + { + "epoch": 0.25, + "learning_rate": 1.4958254048386468e-07, + "loss": 0.0098, + "step": 13033 + }, + { + "epoch": 0.25, + "learning_rate": 1.4957865713952855e-07, + "loss": 0.5141, + "step": 13034 + }, + { + "epoch": 0.25, + "learning_rate": 1.495747737951924e-07, + "loss": 0.0023, + "step": 13035 + }, + { + "epoch": 0.25, + "learning_rate": 1.4957089045085627e-07, + "loss": 0.0058, + "step": 13036 + }, + { + "epoch": 0.25, + "learning_rate": 1.4956700710652011e-07, + "loss": 0.0017, + "step": 13037 + }, + { + "epoch": 0.25, + "learning_rate": 1.4956312376218399e-07, + "loss": 0.0098, + "step": 13038 + }, + { + "epoch": 0.25, + "learning_rate": 1.4955924041784783e-07, + "loss": 0.0017, + "step": 13039 + }, + { + "epoch": 0.25, + "learning_rate": 1.495553570735117e-07, + "loss": 0.0022, + "step": 13040 + }, + { + "epoch": 0.25, + "learning_rate": 1.4955147372917555e-07, + "loss": 0.0017, + "step": 13041 + }, + { + "epoch": 0.25, + "learning_rate": 1.4954759038483942e-07, + "loss": 0.0068, + "step": 13042 + }, + { + "epoch": 0.25, + "learning_rate": 1.4954370704050326e-07, + "loss": 0.0016, + "step": 13043 + }, + { + "epoch": 0.25, + "learning_rate": 1.4953982369616714e-07, + "loss": 0.4165, + "step": 13044 + }, + { + "epoch": 0.25, + "learning_rate": 1.4953594035183098e-07, + "loss": 0.0014, + "step": 13045 + }, + { + "epoch": 0.25, + "learning_rate": 1.4953205700749485e-07, + "loss": 0.0017, + "step": 13046 + }, + { + "epoch": 0.25, + "learning_rate": 1.495281736631587e-07, + "loss": 1.1185, + "step": 13047 + }, + { + "epoch": 0.25, + "learning_rate": 1.4952429031882257e-07, + "loss": 0.0129, + "step": 13048 + }, + { + "epoch": 0.25, + "learning_rate": 1.4952040697448641e-07, + "loss": 0.0124, + "step": 13049 + }, + { + "epoch": 0.25, + "learning_rate": 1.4951652363015029e-07, + "loss": 0.9236, + "step": 13050 + }, + { + "epoch": 0.25, + "learning_rate": 1.4951264028581413e-07, + "loss": 0.0017, + "step": 13051 + }, + { + "epoch": 0.25, + "learning_rate": 1.49508756941478e-07, + "loss": 0.0018, + "step": 13052 + }, + { + "epoch": 0.25, + "learning_rate": 1.4950487359714185e-07, + "loss": 0.0026, + "step": 13053 + }, + { + "epoch": 0.25, + "learning_rate": 1.4950099025280572e-07, + "loss": 0.002, + "step": 13054 + }, + { + "epoch": 0.25, + "learning_rate": 1.4949710690846956e-07, + "loss": 0.0189, + "step": 13055 + }, + { + "epoch": 0.25, + "learning_rate": 1.4949322356413343e-07, + "loss": 0.0015, + "step": 13056 + }, + { + "epoch": 0.25, + "learning_rate": 1.4948934021979728e-07, + "loss": 0.0018, + "step": 13057 + }, + { + "epoch": 0.25, + "learning_rate": 1.4948545687546115e-07, + "loss": 0.0026, + "step": 13058 + }, + { + "epoch": 0.25, + "learning_rate": 1.49481573531125e-07, + "loss": 0.0018, + "step": 13059 + }, + { + "epoch": 0.25, + "learning_rate": 1.4947769018678887e-07, + "loss": 0.0021, + "step": 13060 + }, + { + "epoch": 0.25, + "learning_rate": 1.494738068424527e-07, + "loss": 0.0028, + "step": 13061 + }, + { + "epoch": 0.25, + "learning_rate": 1.4946992349811658e-07, + "loss": 0.0019, + "step": 13062 + }, + { + "epoch": 0.25, + "learning_rate": 1.4946604015378043e-07, + "loss": 0.3562, + "step": 13063 + }, + { + "epoch": 0.25, + "learning_rate": 1.494621568094443e-07, + "loss": 0.0024, + "step": 13064 + }, + { + "epoch": 0.25, + "learning_rate": 1.4945827346510815e-07, + "loss": 0.0056, + "step": 13065 + }, + { + "epoch": 0.25, + "learning_rate": 1.4945439012077202e-07, + "loss": 0.0013, + "step": 13066 + }, + { + "epoch": 0.25, + "learning_rate": 1.4945050677643586e-07, + "loss": 0.0016, + "step": 13067 + }, + { + "epoch": 0.25, + "learning_rate": 1.4944662343209973e-07, + "loss": 0.0026, + "step": 13068 + }, + { + "epoch": 0.25, + "learning_rate": 1.4944274008776358e-07, + "loss": 0.0018, + "step": 13069 + }, + { + "epoch": 0.25, + "learning_rate": 1.4943885674342745e-07, + "loss": 0.0678, + "step": 13070 + }, + { + "epoch": 0.25, + "learning_rate": 1.4943497339909127e-07, + "loss": 0.006, + "step": 13071 + }, + { + "epoch": 0.25, + "learning_rate": 1.4943109005475514e-07, + "loss": 0.0022, + "step": 13072 + }, + { + "epoch": 0.25, + "learning_rate": 1.4942720671041898e-07, + "loss": 0.0021, + "step": 13073 + }, + { + "epoch": 0.25, + "learning_rate": 1.4942332336608286e-07, + "loss": 0.3693, + "step": 13074 + }, + { + "epoch": 0.25, + "learning_rate": 1.494194400217467e-07, + "loss": 0.0019, + "step": 13075 + }, + { + "epoch": 0.25, + "learning_rate": 1.4941555667741057e-07, + "loss": 0.0019, + "step": 13076 + }, + { + "epoch": 0.25, + "learning_rate": 1.4941167333307442e-07, + "loss": 0.0523, + "step": 13077 + }, + { + "epoch": 0.25, + "learning_rate": 1.494077899887383e-07, + "loss": 0.0019, + "step": 13078 + }, + { + "epoch": 0.25, + "learning_rate": 1.4940390664440213e-07, + "loss": 0.0016, + "step": 13079 + }, + { + "epoch": 0.25, + "learning_rate": 1.49400023300066e-07, + "loss": 0.0054, + "step": 13080 + }, + { + "epoch": 0.25, + "learning_rate": 1.4939613995572985e-07, + "loss": 0.0078, + "step": 13081 + }, + { + "epoch": 0.25, + "learning_rate": 1.4939225661139372e-07, + "loss": 1.1941, + "step": 13082 + }, + { + "epoch": 0.25, + "learning_rate": 1.4938837326705757e-07, + "loss": 0.0011, + "step": 13083 + }, + { + "epoch": 0.25, + "learning_rate": 1.4938448992272144e-07, + "loss": 0.0015, + "step": 13084 + }, + { + "epoch": 0.25, + "learning_rate": 1.4938060657838528e-07, + "loss": 0.002, + "step": 13085 + }, + { + "epoch": 0.25, + "learning_rate": 1.4937672323404916e-07, + "loss": 0.0023, + "step": 13086 + }, + { + "epoch": 0.25, + "learning_rate": 1.49372839889713e-07, + "loss": 0.0344, + "step": 13087 + }, + { + "epoch": 0.25, + "learning_rate": 1.4936895654537687e-07, + "loss": 0.0019, + "step": 13088 + }, + { + "epoch": 0.25, + "learning_rate": 1.4936507320104072e-07, + "loss": 0.098, + "step": 13089 + }, + { + "epoch": 0.25, + "learning_rate": 1.493611898567046e-07, + "loss": 0.0014, + "step": 13090 + }, + { + "epoch": 0.25, + "learning_rate": 1.4935730651236843e-07, + "loss": 0.0017, + "step": 13091 + }, + { + "epoch": 0.25, + "learning_rate": 1.493534231680323e-07, + "loss": 0.0019, + "step": 13092 + }, + { + "epoch": 0.25, + "learning_rate": 1.4934953982369615e-07, + "loss": 0.0013, + "step": 13093 + }, + { + "epoch": 0.25, + "learning_rate": 1.4934565647936002e-07, + "loss": 0.002, + "step": 13094 + }, + { + "epoch": 0.25, + "learning_rate": 1.4934177313502387e-07, + "loss": 0.0022, + "step": 13095 + }, + { + "epoch": 0.25, + "learning_rate": 1.4933788979068774e-07, + "loss": 0.0021, + "step": 13096 + }, + { + "epoch": 0.25, + "learning_rate": 1.4933400644635158e-07, + "loss": 0.002, + "step": 13097 + }, + { + "epoch": 0.25, + "learning_rate": 1.4933012310201545e-07, + "loss": 0.1632, + "step": 13098 + }, + { + "epoch": 0.25, + "learning_rate": 1.493262397576793e-07, + "loss": 0.0299, + "step": 13099 + }, + { + "epoch": 0.25, + "learning_rate": 1.4932235641334317e-07, + "loss": 0.3221, + "step": 13100 + }, + { + "epoch": 0.25, + "learning_rate": 1.4931847306900702e-07, + "loss": 0.0016, + "step": 13101 + }, + { + "epoch": 0.25, + "learning_rate": 1.493145897246709e-07, + "loss": 0.5236, + "step": 13102 + }, + { + "epoch": 0.25, + "learning_rate": 1.4931070638033473e-07, + "loss": 0.0055, + "step": 13103 + }, + { + "epoch": 0.25, + "learning_rate": 1.493068230359986e-07, + "loss": 0.0015, + "step": 13104 + }, + { + "epoch": 0.25, + "learning_rate": 1.4930293969166245e-07, + "loss": 0.0037, + "step": 13105 + }, + { + "epoch": 0.25, + "learning_rate": 1.4929905634732632e-07, + "loss": 1.0324, + "step": 13106 + }, + { + "epoch": 0.25, + "learning_rate": 1.4929517300299017e-07, + "loss": 0.9741, + "step": 13107 + }, + { + "epoch": 0.25, + "learning_rate": 1.4929128965865404e-07, + "loss": 0.6373, + "step": 13108 + }, + { + "epoch": 0.25, + "learning_rate": 1.4928740631431788e-07, + "loss": 0.5919, + "step": 13109 + }, + { + "epoch": 0.25, + "learning_rate": 1.4928352296998175e-07, + "loss": 0.0014, + "step": 13110 + }, + { + "epoch": 0.25, + "learning_rate": 1.492796396256456e-07, + "loss": 0.0015, + "step": 13111 + }, + { + "epoch": 0.25, + "learning_rate": 1.4927575628130947e-07, + "loss": 0.0033, + "step": 13112 + }, + { + "epoch": 0.25, + "learning_rate": 1.4927187293697331e-07, + "loss": 0.0025, + "step": 13113 + }, + { + "epoch": 0.25, + "learning_rate": 1.4926798959263719e-07, + "loss": 0.8962, + "step": 13114 + }, + { + "epoch": 0.25, + "learning_rate": 1.4926410624830103e-07, + "loss": 0.0018, + "step": 13115 + }, + { + "epoch": 0.25, + "learning_rate": 1.492602229039649e-07, + "loss": 0.1122, + "step": 13116 + }, + { + "epoch": 0.25, + "learning_rate": 1.4925633955962875e-07, + "loss": 0.0019, + "step": 13117 + }, + { + "epoch": 0.25, + "learning_rate": 1.4925245621529262e-07, + "loss": 0.0016, + "step": 13118 + }, + { + "epoch": 0.25, + "learning_rate": 1.4924857287095646e-07, + "loss": 0.0017, + "step": 13119 + }, + { + "epoch": 0.25, + "learning_rate": 1.4924468952662034e-07, + "loss": 0.0014, + "step": 13120 + }, + { + "epoch": 0.25, + "learning_rate": 1.4924080618228418e-07, + "loss": 0.0647, + "step": 13121 + }, + { + "epoch": 0.25, + "learning_rate": 1.4923692283794805e-07, + "loss": 0.0012, + "step": 13122 + }, + { + "epoch": 0.25, + "learning_rate": 1.492330394936119e-07, + "loss": 0.0017, + "step": 13123 + }, + { + "epoch": 0.25, + "learning_rate": 1.4922915614927577e-07, + "loss": 0.003, + "step": 13124 + }, + { + "epoch": 0.25, + "learning_rate": 1.4922527280493961e-07, + "loss": 0.0034, + "step": 13125 + }, + { + "epoch": 0.25, + "learning_rate": 1.4922138946060349e-07, + "loss": 0.0108, + "step": 13126 + }, + { + "epoch": 0.25, + "learning_rate": 1.4921750611626733e-07, + "loss": 0.0043, + "step": 13127 + }, + { + "epoch": 0.25, + "learning_rate": 1.492136227719312e-07, + "loss": 0.0302, + "step": 13128 + }, + { + "epoch": 0.25, + "learning_rate": 1.4920973942759502e-07, + "loss": 0.0014, + "step": 13129 + }, + { + "epoch": 0.25, + "learning_rate": 1.492058560832589e-07, + "loss": 0.6959, + "step": 13130 + }, + { + "epoch": 0.25, + "learning_rate": 1.4920197273892274e-07, + "loss": 0.3888, + "step": 13131 + }, + { + "epoch": 0.25, + "learning_rate": 1.491980893945866e-07, + "loss": 0.0047, + "step": 13132 + }, + { + "epoch": 0.25, + "learning_rate": 1.4919420605025045e-07, + "loss": 0.006, + "step": 13133 + }, + { + "epoch": 0.25, + "learning_rate": 1.4919032270591432e-07, + "loss": 0.0099, + "step": 13134 + }, + { + "epoch": 0.25, + "learning_rate": 1.4918643936157817e-07, + "loss": 0.0019, + "step": 13135 + }, + { + "epoch": 0.25, + "learning_rate": 1.4918255601724204e-07, + "loss": 0.0015, + "step": 13136 + }, + { + "epoch": 0.25, + "learning_rate": 1.4917867267290589e-07, + "loss": 0.0014, + "step": 13137 + }, + { + "epoch": 0.25, + "learning_rate": 1.4917478932856976e-07, + "loss": 0.0092, + "step": 13138 + }, + { + "epoch": 0.25, + "learning_rate": 1.491709059842336e-07, + "loss": 0.0017, + "step": 13139 + }, + { + "epoch": 0.25, + "learning_rate": 1.4916702263989747e-07, + "loss": 0.2132, + "step": 13140 + }, + { + "epoch": 0.25, + "learning_rate": 1.4916313929556132e-07, + "loss": 0.0053, + "step": 13141 + }, + { + "epoch": 0.25, + "learning_rate": 1.491592559512252e-07, + "loss": 0.0021, + "step": 13142 + }, + { + "epoch": 0.25, + "learning_rate": 1.4915537260688904e-07, + "loss": 0.0014, + "step": 13143 + }, + { + "epoch": 0.25, + "learning_rate": 1.491514892625529e-07, + "loss": 0.0014, + "step": 13144 + }, + { + "epoch": 0.25, + "learning_rate": 1.4914760591821675e-07, + "loss": 0.0015, + "step": 13145 + }, + { + "epoch": 0.26, + "learning_rate": 1.4914372257388062e-07, + "loss": 0.0013, + "step": 13146 + }, + { + "epoch": 0.26, + "learning_rate": 1.4913983922954447e-07, + "loss": 0.0016, + "step": 13147 + }, + { + "epoch": 0.26, + "learning_rate": 1.4913595588520834e-07, + "loss": 0.0029, + "step": 13148 + }, + { + "epoch": 0.26, + "learning_rate": 1.4913207254087219e-07, + "loss": 0.002, + "step": 13149 + }, + { + "epoch": 0.26, + "learning_rate": 1.4912818919653606e-07, + "loss": 0.0143, + "step": 13150 + }, + { + "epoch": 0.26, + "learning_rate": 1.491243058521999e-07, + "loss": 0.0017, + "step": 13151 + }, + { + "epoch": 0.26, + "learning_rate": 1.4912042250786377e-07, + "loss": 0.0023, + "step": 13152 + }, + { + "epoch": 0.26, + "learning_rate": 1.4911653916352762e-07, + "loss": 0.0017, + "step": 13153 + }, + { + "epoch": 0.26, + "learning_rate": 1.491126558191915e-07, + "loss": 0.0054, + "step": 13154 + }, + { + "epoch": 0.26, + "learning_rate": 1.4910877247485533e-07, + "loss": 0.0055, + "step": 13155 + }, + { + "epoch": 0.26, + "learning_rate": 1.491048891305192e-07, + "loss": 0.0015, + "step": 13156 + }, + { + "epoch": 0.26, + "learning_rate": 1.4910100578618305e-07, + "loss": 0.0012, + "step": 13157 + }, + { + "epoch": 0.26, + "learning_rate": 1.4909712244184692e-07, + "loss": 0.0014, + "step": 13158 + }, + { + "epoch": 0.26, + "learning_rate": 1.4909323909751077e-07, + "loss": 0.0018, + "step": 13159 + }, + { + "epoch": 0.26, + "learning_rate": 1.4908935575317464e-07, + "loss": 0.0078, + "step": 13160 + }, + { + "epoch": 0.26, + "learning_rate": 1.4908547240883848e-07, + "loss": 0.0015, + "step": 13161 + }, + { + "epoch": 0.26, + "learning_rate": 1.4908158906450236e-07, + "loss": 0.002, + "step": 13162 + }, + { + "epoch": 0.26, + "learning_rate": 1.490777057201662e-07, + "loss": 0.0018, + "step": 13163 + }, + { + "epoch": 0.26, + "learning_rate": 1.4907382237583007e-07, + "loss": 0.1405, + "step": 13164 + }, + { + "epoch": 0.26, + "learning_rate": 1.4906993903149392e-07, + "loss": 0.5759, + "step": 13165 + }, + { + "epoch": 0.26, + "learning_rate": 1.490660556871578e-07, + "loss": 0.0019, + "step": 13166 + }, + { + "epoch": 0.26, + "learning_rate": 1.4906217234282163e-07, + "loss": 0.0052, + "step": 13167 + }, + { + "epoch": 0.26, + "learning_rate": 1.490582889984855e-07, + "loss": 0.0039, + "step": 13168 + }, + { + "epoch": 0.26, + "learning_rate": 1.4905440565414935e-07, + "loss": 0.019, + "step": 13169 + }, + { + "epoch": 0.26, + "learning_rate": 1.4905052230981322e-07, + "loss": 0.0015, + "step": 13170 + }, + { + "epoch": 0.26, + "learning_rate": 1.4904663896547707e-07, + "loss": 0.0018, + "step": 13171 + }, + { + "epoch": 0.26, + "learning_rate": 1.4904275562114094e-07, + "loss": 0.0018, + "step": 13172 + }, + { + "epoch": 0.26, + "learning_rate": 1.4903887227680478e-07, + "loss": 0.0014, + "step": 13173 + }, + { + "epoch": 0.26, + "learning_rate": 1.4903498893246865e-07, + "loss": 0.0017, + "step": 13174 + }, + { + "epoch": 0.26, + "learning_rate": 1.490311055881325e-07, + "loss": 0.0018, + "step": 13175 + }, + { + "epoch": 0.26, + "learning_rate": 1.4902722224379637e-07, + "loss": 0.0025, + "step": 13176 + }, + { + "epoch": 0.26, + "learning_rate": 1.4902333889946022e-07, + "loss": 0.0026, + "step": 13177 + }, + { + "epoch": 0.26, + "learning_rate": 1.4901945555512406e-07, + "loss": 0.0019, + "step": 13178 + }, + { + "epoch": 0.26, + "learning_rate": 1.4901557221078793e-07, + "loss": 0.9388, + "step": 13179 + }, + { + "epoch": 0.26, + "learning_rate": 1.4901168886645178e-07, + "loss": 0.0011, + "step": 13180 + }, + { + "epoch": 0.26, + "learning_rate": 1.4900780552211565e-07, + "loss": 0.0041, + "step": 13181 + }, + { + "epoch": 0.26, + "learning_rate": 1.490039221777795e-07, + "loss": 0.5833, + "step": 13182 + }, + { + "epoch": 0.26, + "learning_rate": 1.4900003883344337e-07, + "loss": 0.0025, + "step": 13183 + }, + { + "epoch": 0.26, + "learning_rate": 1.489961554891072e-07, + "loss": 0.0016, + "step": 13184 + }, + { + "epoch": 0.26, + "learning_rate": 1.4899227214477108e-07, + "loss": 0.0021, + "step": 13185 + }, + { + "epoch": 0.26, + "learning_rate": 1.4898838880043493e-07, + "loss": 0.0014, + "step": 13186 + }, + { + "epoch": 0.26, + "learning_rate": 1.4898450545609877e-07, + "loss": 0.0017, + "step": 13187 + }, + { + "epoch": 0.26, + "learning_rate": 1.4898062211176264e-07, + "loss": 0.0211, + "step": 13188 + }, + { + "epoch": 0.26, + "learning_rate": 1.489767387674265e-07, + "loss": 0.0033, + "step": 13189 + }, + { + "epoch": 0.26, + "learning_rate": 1.4897285542309036e-07, + "loss": 0.8772, + "step": 13190 + }, + { + "epoch": 0.26, + "learning_rate": 1.489689720787542e-07, + "loss": 0.0063, + "step": 13191 + }, + { + "epoch": 0.26, + "learning_rate": 1.4896508873441808e-07, + "loss": 0.0017, + "step": 13192 + }, + { + "epoch": 0.26, + "learning_rate": 1.4896120539008192e-07, + "loss": 0.8013, + "step": 13193 + }, + { + "epoch": 0.26, + "learning_rate": 1.489573220457458e-07, + "loss": 0.0022, + "step": 13194 + }, + { + "epoch": 0.26, + "learning_rate": 1.4895343870140964e-07, + "loss": 0.0049, + "step": 13195 + }, + { + "epoch": 0.26, + "learning_rate": 1.489495553570735e-07, + "loss": 0.002, + "step": 13196 + }, + { + "epoch": 0.26, + "learning_rate": 1.4894567201273735e-07, + "loss": 0.0019, + "step": 13197 + }, + { + "epoch": 0.26, + "learning_rate": 1.4894178866840123e-07, + "loss": 0.0024, + "step": 13198 + }, + { + "epoch": 0.26, + "learning_rate": 1.4893790532406507e-07, + "loss": 0.0577, + "step": 13199 + }, + { + "epoch": 0.26, + "learning_rate": 1.4893402197972894e-07, + "loss": 0.0027, + "step": 13200 + }, + { + "epoch": 0.26, + "learning_rate": 1.489301386353928e-07, + "loss": 0.0016, + "step": 13201 + }, + { + "epoch": 0.26, + "learning_rate": 1.4892625529105666e-07, + "loss": 0.0013, + "step": 13202 + }, + { + "epoch": 0.26, + "learning_rate": 1.489223719467205e-07, + "loss": 0.0013, + "step": 13203 + }, + { + "epoch": 0.26, + "learning_rate": 1.4891848860238438e-07, + "loss": 0.0024, + "step": 13204 + }, + { + "epoch": 0.26, + "learning_rate": 1.4891460525804822e-07, + "loss": 0.0018, + "step": 13205 + }, + { + "epoch": 0.26, + "learning_rate": 1.4891072191371207e-07, + "loss": 0.0017, + "step": 13206 + }, + { + "epoch": 0.26, + "learning_rate": 1.4890683856937594e-07, + "loss": 0.0015, + "step": 13207 + }, + { + "epoch": 0.26, + "learning_rate": 1.4890295522503978e-07, + "loss": 0.0024, + "step": 13208 + }, + { + "epoch": 0.26, + "learning_rate": 1.4889907188070365e-07, + "loss": 0.0016, + "step": 13209 + }, + { + "epoch": 0.26, + "learning_rate": 1.488951885363675e-07, + "loss": 0.0013, + "step": 13210 + }, + { + "epoch": 0.26, + "learning_rate": 1.4889130519203137e-07, + "loss": 0.6129, + "step": 13211 + }, + { + "epoch": 0.26, + "learning_rate": 1.4888742184769521e-07, + "loss": 0.0015, + "step": 13212 + }, + { + "epoch": 0.26, + "learning_rate": 1.4888353850335909e-07, + "loss": 0.0211, + "step": 13213 + }, + { + "epoch": 0.26, + "learning_rate": 1.4887965515902293e-07, + "loss": 0.0018, + "step": 13214 + }, + { + "epoch": 0.26, + "learning_rate": 1.488757718146868e-07, + "loss": 0.0015, + "step": 13215 + }, + { + "epoch": 0.26, + "learning_rate": 1.4887188847035065e-07, + "loss": 0.0021, + "step": 13216 + }, + { + "epoch": 0.26, + "learning_rate": 1.4886800512601452e-07, + "loss": 0.0035, + "step": 13217 + }, + { + "epoch": 0.26, + "learning_rate": 1.4886412178167836e-07, + "loss": 0.7494, + "step": 13218 + }, + { + "epoch": 0.26, + "learning_rate": 1.4886023843734224e-07, + "loss": 0.0462, + "step": 13219 + }, + { + "epoch": 0.26, + "learning_rate": 1.4885635509300608e-07, + "loss": 0.0027, + "step": 13220 + }, + { + "epoch": 0.26, + "learning_rate": 1.4885247174866995e-07, + "loss": 0.9472, + "step": 13221 + }, + { + "epoch": 0.26, + "learning_rate": 1.488485884043338e-07, + "loss": 0.001, + "step": 13222 + }, + { + "epoch": 0.26, + "learning_rate": 1.4884470505999767e-07, + "loss": 0.0013, + "step": 13223 + }, + { + "epoch": 0.26, + "learning_rate": 1.4884082171566151e-07, + "loss": 0.0018, + "step": 13224 + }, + { + "epoch": 0.26, + "learning_rate": 1.4883693837132539e-07, + "loss": 0.0018, + "step": 13225 + }, + { + "epoch": 0.26, + "learning_rate": 1.4883305502698923e-07, + "loss": 0.0015, + "step": 13226 + }, + { + "epoch": 0.26, + "learning_rate": 1.488291716826531e-07, + "loss": 0.0016, + "step": 13227 + }, + { + "epoch": 0.26, + "learning_rate": 1.4882528833831695e-07, + "loss": 0.002, + "step": 13228 + }, + { + "epoch": 0.26, + "learning_rate": 1.4882140499398082e-07, + "loss": 0.0014, + "step": 13229 + }, + { + "epoch": 0.26, + "learning_rate": 1.4881752164964466e-07, + "loss": 0.0037, + "step": 13230 + }, + { + "epoch": 0.26, + "learning_rate": 1.4881363830530853e-07, + "loss": 0.0753, + "step": 13231 + }, + { + "epoch": 0.26, + "learning_rate": 1.4880975496097238e-07, + "loss": 0.0022, + "step": 13232 + }, + { + "epoch": 0.26, + "learning_rate": 1.4880587161663625e-07, + "loss": 0.0012, + "step": 13233 + }, + { + "epoch": 0.26, + "learning_rate": 1.488019882723001e-07, + "loss": 0.0016, + "step": 13234 + }, + { + "epoch": 0.26, + "learning_rate": 1.4879810492796397e-07, + "loss": 0.0015, + "step": 13235 + }, + { + "epoch": 0.26, + "learning_rate": 1.487942215836278e-07, + "loss": 0.0081, + "step": 13236 + }, + { + "epoch": 0.26, + "learning_rate": 1.4879033823929168e-07, + "loss": 0.0019, + "step": 13237 + }, + { + "epoch": 0.26, + "learning_rate": 1.4878645489495553e-07, + "loss": 0.0041, + "step": 13238 + }, + { + "epoch": 0.26, + "learning_rate": 1.487825715506194e-07, + "loss": 0.0017, + "step": 13239 + }, + { + "epoch": 0.26, + "learning_rate": 1.4877868820628325e-07, + "loss": 0.2236, + "step": 13240 + }, + { + "epoch": 0.26, + "learning_rate": 1.4877480486194712e-07, + "loss": 0.0014, + "step": 13241 + }, + { + "epoch": 0.26, + "learning_rate": 1.4877092151761096e-07, + "loss": 0.002, + "step": 13242 + }, + { + "epoch": 0.26, + "learning_rate": 1.4876703817327483e-07, + "loss": 0.0053, + "step": 13243 + }, + { + "epoch": 0.26, + "learning_rate": 1.4876315482893868e-07, + "loss": 0.6305, + "step": 13244 + }, + { + "epoch": 0.26, + "learning_rate": 1.4875927148460252e-07, + "loss": 0.0028, + "step": 13245 + }, + { + "epoch": 0.26, + "learning_rate": 1.4875538814026637e-07, + "loss": 0.0014, + "step": 13246 + }, + { + "epoch": 0.26, + "learning_rate": 1.4875150479593024e-07, + "loss": 0.0026, + "step": 13247 + }, + { + "epoch": 0.26, + "learning_rate": 1.4874762145159409e-07, + "loss": 0.0015, + "step": 13248 + }, + { + "epoch": 0.26, + "learning_rate": 1.4874373810725796e-07, + "loss": 0.0011, + "step": 13249 + }, + { + "epoch": 0.26, + "learning_rate": 1.487398547629218e-07, + "loss": 0.0018, + "step": 13250 + }, + { + "epoch": 0.26, + "learning_rate": 1.4873597141858567e-07, + "loss": 0.0391, + "step": 13251 + }, + { + "epoch": 0.26, + "learning_rate": 1.4873208807424952e-07, + "loss": 0.0018, + "step": 13252 + }, + { + "epoch": 0.26, + "learning_rate": 1.487282047299134e-07, + "loss": 0.7592, + "step": 13253 + }, + { + "epoch": 0.26, + "learning_rate": 1.4872432138557723e-07, + "loss": 0.0015, + "step": 13254 + }, + { + "epoch": 0.26, + "learning_rate": 1.487204380412411e-07, + "loss": 0.002, + "step": 13255 + }, + { + "epoch": 0.26, + "learning_rate": 1.4871655469690495e-07, + "loss": 0.0012, + "step": 13256 + }, + { + "epoch": 0.26, + "learning_rate": 1.4871267135256882e-07, + "loss": 0.0012, + "step": 13257 + }, + { + "epoch": 0.26, + "learning_rate": 1.4870878800823267e-07, + "loss": 0.0831, + "step": 13258 + }, + { + "epoch": 0.26, + "learning_rate": 1.4870490466389654e-07, + "loss": 0.1669, + "step": 13259 + }, + { + "epoch": 0.26, + "learning_rate": 1.4870102131956038e-07, + "loss": 0.0025, + "step": 13260 + }, + { + "epoch": 0.26, + "learning_rate": 1.4869713797522426e-07, + "loss": 0.002, + "step": 13261 + }, + { + "epoch": 0.26, + "learning_rate": 1.486932546308881e-07, + "loss": 0.6957, + "step": 13262 + }, + { + "epoch": 0.26, + "learning_rate": 1.4868937128655197e-07, + "loss": 0.0013, + "step": 13263 + }, + { + "epoch": 0.26, + "learning_rate": 1.4868548794221582e-07, + "loss": 0.0013, + "step": 13264 + }, + { + "epoch": 0.26, + "learning_rate": 1.486816045978797e-07, + "loss": 0.0032, + "step": 13265 + }, + { + "epoch": 0.26, + "learning_rate": 1.4867772125354353e-07, + "loss": 0.0024, + "step": 13266 + }, + { + "epoch": 0.26, + "learning_rate": 1.486738379092074e-07, + "loss": 0.0016, + "step": 13267 + }, + { + "epoch": 0.26, + "learning_rate": 1.4866995456487125e-07, + "loss": 0.0015, + "step": 13268 + }, + { + "epoch": 0.26, + "learning_rate": 1.4866607122053512e-07, + "loss": 0.6341, + "step": 13269 + }, + { + "epoch": 0.26, + "learning_rate": 1.4866218787619897e-07, + "loss": 0.0659, + "step": 13270 + }, + { + "epoch": 0.26, + "learning_rate": 1.4865830453186284e-07, + "loss": 0.0116, + "step": 13271 + }, + { + "epoch": 0.26, + "learning_rate": 1.4865442118752668e-07, + "loss": 0.0603, + "step": 13272 + }, + { + "epoch": 0.26, + "learning_rate": 1.4865053784319055e-07, + "loss": 0.0016, + "step": 13273 + }, + { + "epoch": 0.26, + "learning_rate": 1.486466544988544e-07, + "loss": 0.0023, + "step": 13274 + }, + { + "epoch": 0.26, + "learning_rate": 1.4864277115451827e-07, + "loss": 0.0017, + "step": 13275 + }, + { + "epoch": 0.26, + "learning_rate": 1.4863888781018212e-07, + "loss": 0.0013, + "step": 13276 + }, + { + "epoch": 0.26, + "learning_rate": 1.48635004465846e-07, + "loss": 0.0015, + "step": 13277 + }, + { + "epoch": 0.26, + "learning_rate": 1.4863112112150983e-07, + "loss": 0.0029, + "step": 13278 + }, + { + "epoch": 0.26, + "learning_rate": 1.486272377771737e-07, + "loss": 0.0018, + "step": 13279 + }, + { + "epoch": 0.26, + "learning_rate": 1.4862335443283755e-07, + "loss": 0.0013, + "step": 13280 + }, + { + "epoch": 0.26, + "learning_rate": 1.4861947108850142e-07, + "loss": 0.0018, + "step": 13281 + }, + { + "epoch": 0.26, + "learning_rate": 1.4861558774416527e-07, + "loss": 0.2263, + "step": 13282 + }, + { + "epoch": 0.26, + "learning_rate": 1.4861170439982914e-07, + "loss": 0.0025, + "step": 13283 + }, + { + "epoch": 0.26, + "learning_rate": 1.4860782105549298e-07, + "loss": 0.0014, + "step": 13284 + }, + { + "epoch": 0.26, + "learning_rate": 1.4860393771115685e-07, + "loss": 0.0017, + "step": 13285 + }, + { + "epoch": 0.26, + "learning_rate": 1.486000543668207e-07, + "loss": 0.0017, + "step": 13286 + }, + { + "epoch": 0.26, + "learning_rate": 1.4859617102248457e-07, + "loss": 0.0046, + "step": 13287 + }, + { + "epoch": 0.26, + "learning_rate": 1.4859228767814841e-07, + "loss": 0.0014, + "step": 13288 + }, + { + "epoch": 0.26, + "learning_rate": 1.4858840433381229e-07, + "loss": 0.0228, + "step": 13289 + }, + { + "epoch": 0.26, + "learning_rate": 1.4858452098947613e-07, + "loss": 0.0016, + "step": 13290 + }, + { + "epoch": 0.26, + "learning_rate": 1.4858063764514e-07, + "loss": 0.0319, + "step": 13291 + }, + { + "epoch": 0.26, + "learning_rate": 1.4857675430080385e-07, + "loss": 0.0011, + "step": 13292 + }, + { + "epoch": 0.26, + "learning_rate": 1.4857287095646772e-07, + "loss": 0.0018, + "step": 13293 + }, + { + "epoch": 0.26, + "learning_rate": 1.4856898761213156e-07, + "loss": 0.0014, + "step": 13294 + }, + { + "epoch": 0.26, + "learning_rate": 1.4856510426779544e-07, + "loss": 0.0019, + "step": 13295 + }, + { + "epoch": 0.26, + "learning_rate": 1.4856122092345928e-07, + "loss": 0.0024, + "step": 13296 + }, + { + "epoch": 0.26, + "learning_rate": 1.4855733757912315e-07, + "loss": 0.0016, + "step": 13297 + }, + { + "epoch": 0.26, + "learning_rate": 1.48553454234787e-07, + "loss": 0.0072, + "step": 13298 + }, + { + "epoch": 0.26, + "learning_rate": 1.4854957089045087e-07, + "loss": 0.0013, + "step": 13299 + }, + { + "epoch": 0.26, + "learning_rate": 1.4854568754611471e-07, + "loss": 0.0029, + "step": 13300 + }, + { + "epoch": 0.26, + "learning_rate": 1.4854180420177859e-07, + "loss": 0.0027, + "step": 13301 + }, + { + "epoch": 0.26, + "learning_rate": 1.4853792085744243e-07, + "loss": 0.0235, + "step": 13302 + }, + { + "epoch": 0.26, + "learning_rate": 1.4853403751310628e-07, + "loss": 0.0356, + "step": 13303 + }, + { + "epoch": 0.26, + "learning_rate": 1.4853015416877012e-07, + "loss": 0.0012, + "step": 13304 + }, + { + "epoch": 0.26, + "learning_rate": 1.48526270824434e-07, + "loss": 0.0016, + "step": 13305 + }, + { + "epoch": 0.26, + "learning_rate": 1.4852238748009784e-07, + "loss": 0.0015, + "step": 13306 + }, + { + "epoch": 0.26, + "learning_rate": 1.485185041357617e-07, + "loss": 0.0016, + "step": 13307 + }, + { + "epoch": 0.26, + "learning_rate": 1.4851462079142555e-07, + "loss": 0.0023, + "step": 13308 + }, + { + "epoch": 0.26, + "learning_rate": 1.4851073744708942e-07, + "loss": 0.0014, + "step": 13309 + }, + { + "epoch": 0.26, + "learning_rate": 1.4850685410275327e-07, + "loss": 0.0046, + "step": 13310 + }, + { + "epoch": 0.26, + "learning_rate": 1.4850297075841714e-07, + "loss": 0.0018, + "step": 13311 + }, + { + "epoch": 0.26, + "learning_rate": 1.4849908741408099e-07, + "loss": 0.0122, + "step": 13312 + }, + { + "epoch": 0.26, + "learning_rate": 1.4849520406974486e-07, + "loss": 0.0022, + "step": 13313 + }, + { + "epoch": 0.26, + "learning_rate": 1.484913207254087e-07, + "loss": 0.1824, + "step": 13314 + }, + { + "epoch": 0.26, + "learning_rate": 1.4848743738107257e-07, + "loss": 0.0016, + "step": 13315 + }, + { + "epoch": 0.26, + "learning_rate": 1.4848355403673642e-07, + "loss": 0.0013, + "step": 13316 + }, + { + "epoch": 0.26, + "learning_rate": 1.484796706924003e-07, + "loss": 0.0016, + "step": 13317 + }, + { + "epoch": 0.26, + "learning_rate": 1.4847578734806414e-07, + "loss": 0.8013, + "step": 13318 + }, + { + "epoch": 0.26, + "learning_rate": 1.48471904003728e-07, + "loss": 0.0019, + "step": 13319 + }, + { + "epoch": 0.26, + "learning_rate": 1.4846802065939185e-07, + "loss": 0.0016, + "step": 13320 + }, + { + "epoch": 0.26, + "learning_rate": 1.4846413731505572e-07, + "loss": 0.0017, + "step": 13321 + }, + { + "epoch": 0.26, + "learning_rate": 1.4846025397071957e-07, + "loss": 0.2821, + "step": 13322 + }, + { + "epoch": 0.26, + "learning_rate": 1.4845637062638344e-07, + "loss": 0.0051, + "step": 13323 + }, + { + "epoch": 0.26, + "learning_rate": 1.4845248728204729e-07, + "loss": 0.0017, + "step": 13324 + }, + { + "epoch": 0.26, + "learning_rate": 1.4844860393771116e-07, + "loss": 0.0015, + "step": 13325 + }, + { + "epoch": 0.26, + "learning_rate": 1.48444720593375e-07, + "loss": 0.0016, + "step": 13326 + }, + { + "epoch": 0.26, + "learning_rate": 1.4844083724903887e-07, + "loss": 0.045, + "step": 13327 + }, + { + "epoch": 0.26, + "learning_rate": 1.4843695390470272e-07, + "loss": 0.0014, + "step": 13328 + }, + { + "epoch": 0.26, + "learning_rate": 1.484330705603666e-07, + "loss": 0.0575, + "step": 13329 + }, + { + "epoch": 0.26, + "learning_rate": 1.4842918721603043e-07, + "loss": 0.7559, + "step": 13330 + }, + { + "epoch": 0.26, + "learning_rate": 1.484253038716943e-07, + "loss": 0.0016, + "step": 13331 + }, + { + "epoch": 0.26, + "learning_rate": 1.4842142052735815e-07, + "loss": 0.0013, + "step": 13332 + }, + { + "epoch": 0.26, + "learning_rate": 1.4841753718302202e-07, + "loss": 0.0139, + "step": 13333 + }, + { + "epoch": 0.26, + "learning_rate": 1.4841365383868587e-07, + "loss": 0.0018, + "step": 13334 + }, + { + "epoch": 0.26, + "learning_rate": 1.4840977049434974e-07, + "loss": 0.0017, + "step": 13335 + }, + { + "epoch": 0.26, + "learning_rate": 1.4840588715001358e-07, + "loss": 0.0021, + "step": 13336 + }, + { + "epoch": 0.26, + "learning_rate": 1.4840200380567746e-07, + "loss": 0.0075, + "step": 13337 + }, + { + "epoch": 0.26, + "learning_rate": 1.483981204613413e-07, + "loss": 0.0016, + "step": 13338 + }, + { + "epoch": 0.26, + "learning_rate": 1.4839423711700517e-07, + "loss": 0.0021, + "step": 13339 + }, + { + "epoch": 0.26, + "learning_rate": 1.4839035377266902e-07, + "loss": 0.3361, + "step": 13340 + }, + { + "epoch": 0.26, + "learning_rate": 1.483864704283329e-07, + "loss": 0.0015, + "step": 13341 + }, + { + "epoch": 0.26, + "learning_rate": 1.4838258708399673e-07, + "loss": 0.0012, + "step": 13342 + }, + { + "epoch": 0.26, + "learning_rate": 1.483787037396606e-07, + "loss": 0.0027, + "step": 13343 + }, + { + "epoch": 0.26, + "learning_rate": 1.4837482039532445e-07, + "loss": 0.002, + "step": 13344 + }, + { + "epoch": 0.26, + "learning_rate": 1.4837093705098832e-07, + "loss": 0.0032, + "step": 13345 + }, + { + "epoch": 0.26, + "learning_rate": 1.4836705370665217e-07, + "loss": 0.1478, + "step": 13346 + }, + { + "epoch": 0.26, + "learning_rate": 1.4836317036231604e-07, + "loss": 0.0831, + "step": 13347 + }, + { + "epoch": 0.26, + "learning_rate": 1.4835928701797988e-07, + "loss": 0.0011, + "step": 13348 + }, + { + "epoch": 0.26, + "learning_rate": 1.4835540367364375e-07, + "loss": 0.0027, + "step": 13349 + }, + { + "epoch": 0.26, + "learning_rate": 1.483515203293076e-07, + "loss": 0.0018, + "step": 13350 + }, + { + "epoch": 0.26, + "learning_rate": 1.4834763698497147e-07, + "loss": 0.0015, + "step": 13351 + }, + { + "epoch": 0.26, + "learning_rate": 1.4834375364063532e-07, + "loss": 0.0016, + "step": 13352 + }, + { + "epoch": 0.26, + "learning_rate": 1.483398702962992e-07, + "loss": 0.0102, + "step": 13353 + }, + { + "epoch": 0.26, + "learning_rate": 1.4833598695196303e-07, + "loss": 0.0019, + "step": 13354 + }, + { + "epoch": 0.26, + "learning_rate": 1.4833210360762688e-07, + "loss": 0.1339, + "step": 13355 + }, + { + "epoch": 0.26, + "learning_rate": 1.4832822026329075e-07, + "loss": 0.2259, + "step": 13356 + }, + { + "epoch": 0.26, + "learning_rate": 1.483243369189546e-07, + "loss": 0.0024, + "step": 13357 + }, + { + "epoch": 0.26, + "learning_rate": 1.4832045357461847e-07, + "loss": 0.0018, + "step": 13358 + }, + { + "epoch": 0.26, + "learning_rate": 1.483165702302823e-07, + "loss": 0.0017, + "step": 13359 + }, + { + "epoch": 0.26, + "learning_rate": 1.4831268688594618e-07, + "loss": 0.0016, + "step": 13360 + }, + { + "epoch": 0.26, + "learning_rate": 1.4830880354161003e-07, + "loss": 0.4109, + "step": 13361 + }, + { + "epoch": 0.26, + "learning_rate": 1.4830492019727387e-07, + "loss": 0.0016, + "step": 13362 + }, + { + "epoch": 0.26, + "learning_rate": 1.4830103685293774e-07, + "loss": 0.002, + "step": 13363 + }, + { + "epoch": 0.26, + "learning_rate": 1.482971535086016e-07, + "loss": 0.0022, + "step": 13364 + }, + { + "epoch": 0.26, + "learning_rate": 1.4829327016426546e-07, + "loss": 0.0038, + "step": 13365 + }, + { + "epoch": 0.26, + "learning_rate": 1.482893868199293e-07, + "loss": 0.0016, + "step": 13366 + }, + { + "epoch": 0.26, + "learning_rate": 1.4828550347559318e-07, + "loss": 0.5202, + "step": 13367 + }, + { + "epoch": 0.26, + "learning_rate": 1.4828162013125702e-07, + "loss": 0.0019, + "step": 13368 + }, + { + "epoch": 0.26, + "learning_rate": 1.482777367869209e-07, + "loss": 0.0017, + "step": 13369 + }, + { + "epoch": 0.26, + "learning_rate": 1.4827385344258474e-07, + "loss": 0.0032, + "step": 13370 + }, + { + "epoch": 0.26, + "learning_rate": 1.482699700982486e-07, + "loss": 0.0017, + "step": 13371 + }, + { + "epoch": 0.26, + "learning_rate": 1.4826608675391245e-07, + "loss": 0.6988, + "step": 13372 + }, + { + "epoch": 0.26, + "learning_rate": 1.4826220340957633e-07, + "loss": 0.0018, + "step": 13373 + }, + { + "epoch": 0.26, + "learning_rate": 1.4825832006524017e-07, + "loss": 0.0032, + "step": 13374 + }, + { + "epoch": 0.26, + "learning_rate": 1.4825443672090404e-07, + "loss": 0.0019, + "step": 13375 + }, + { + "epoch": 0.26, + "learning_rate": 1.482505533765679e-07, + "loss": 0.0032, + "step": 13376 + }, + { + "epoch": 0.26, + "learning_rate": 1.4824667003223176e-07, + "loss": 0.0012, + "step": 13377 + }, + { + "epoch": 0.26, + "learning_rate": 1.482427866878956e-07, + "loss": 0.002, + "step": 13378 + }, + { + "epoch": 0.26, + "learning_rate": 1.4823890334355948e-07, + "loss": 0.0051, + "step": 13379 + }, + { + "epoch": 0.26, + "learning_rate": 1.4823501999922332e-07, + "loss": 0.0015, + "step": 13380 + }, + { + "epoch": 0.26, + "learning_rate": 1.482311366548872e-07, + "loss": 0.0014, + "step": 13381 + }, + { + "epoch": 0.26, + "learning_rate": 1.4822725331055104e-07, + "loss": 0.0016, + "step": 13382 + }, + { + "epoch": 0.26, + "learning_rate": 1.4822336996621488e-07, + "loss": 0.0038, + "step": 13383 + }, + { + "epoch": 0.26, + "learning_rate": 1.4821948662187875e-07, + "loss": 0.0017, + "step": 13384 + }, + { + "epoch": 0.26, + "learning_rate": 1.482156032775426e-07, + "loss": 0.0016, + "step": 13385 + }, + { + "epoch": 0.26, + "learning_rate": 1.4821171993320647e-07, + "loss": 0.0014, + "step": 13386 + }, + { + "epoch": 0.26, + "learning_rate": 1.4820783658887031e-07, + "loss": 0.0012, + "step": 13387 + }, + { + "epoch": 0.26, + "learning_rate": 1.4820395324453419e-07, + "loss": 0.0049, + "step": 13388 + }, + { + "epoch": 0.26, + "learning_rate": 1.4820006990019803e-07, + "loss": 0.1797, + "step": 13389 + }, + { + "epoch": 0.26, + "learning_rate": 1.481961865558619e-07, + "loss": 0.0161, + "step": 13390 + }, + { + "epoch": 0.26, + "learning_rate": 1.4819230321152575e-07, + "loss": 0.0017, + "step": 13391 + }, + { + "epoch": 0.26, + "learning_rate": 1.4818841986718962e-07, + "loss": 0.0019, + "step": 13392 + }, + { + "epoch": 0.26, + "learning_rate": 1.4818453652285346e-07, + "loss": 0.0018, + "step": 13393 + }, + { + "epoch": 0.26, + "learning_rate": 1.4818065317851734e-07, + "loss": 0.0014, + "step": 13394 + }, + { + "epoch": 0.26, + "learning_rate": 1.4817676983418118e-07, + "loss": 0.0012, + "step": 13395 + }, + { + "epoch": 0.26, + "learning_rate": 1.4817288648984505e-07, + "loss": 0.0258, + "step": 13396 + }, + { + "epoch": 0.26, + "learning_rate": 1.481690031455089e-07, + "loss": 1.1166, + "step": 13397 + }, + { + "epoch": 0.26, + "learning_rate": 1.4816511980117277e-07, + "loss": 0.6182, + "step": 13398 + }, + { + "epoch": 0.26, + "learning_rate": 1.4816123645683661e-07, + "loss": 0.0087, + "step": 13399 + }, + { + "epoch": 0.26, + "learning_rate": 1.4815735311250049e-07, + "loss": 0.0014, + "step": 13400 + }, + { + "epoch": 0.26, + "learning_rate": 1.4815346976816433e-07, + "loss": 0.0028, + "step": 13401 + }, + { + "epoch": 0.26, + "learning_rate": 1.481495864238282e-07, + "loss": 0.0015, + "step": 13402 + }, + { + "epoch": 0.26, + "learning_rate": 1.4814570307949205e-07, + "loss": 0.0013, + "step": 13403 + }, + { + "epoch": 0.26, + "learning_rate": 1.4814181973515592e-07, + "loss": 0.0019, + "step": 13404 + }, + { + "epoch": 0.26, + "learning_rate": 1.4813793639081976e-07, + "loss": 0.0013, + "step": 13405 + }, + { + "epoch": 0.26, + "learning_rate": 1.4813405304648363e-07, + "loss": 0.002, + "step": 13406 + }, + { + "epoch": 0.26, + "learning_rate": 1.4813016970214748e-07, + "loss": 0.0011, + "step": 13407 + }, + { + "epoch": 0.26, + "learning_rate": 1.4812628635781135e-07, + "loss": 0.0021, + "step": 13408 + }, + { + "epoch": 0.26, + "learning_rate": 1.481224030134752e-07, + "loss": 0.002, + "step": 13409 + }, + { + "epoch": 0.26, + "learning_rate": 1.4811851966913907e-07, + "loss": 0.2307, + "step": 13410 + }, + { + "epoch": 0.26, + "learning_rate": 1.481146363248029e-07, + "loss": 0.8967, + "step": 13411 + }, + { + "epoch": 0.26, + "learning_rate": 1.4811075298046678e-07, + "loss": 0.0032, + "step": 13412 + }, + { + "epoch": 0.26, + "learning_rate": 1.4810686963613063e-07, + "loss": 0.0014, + "step": 13413 + }, + { + "epoch": 0.26, + "learning_rate": 1.481029862917945e-07, + "loss": 0.0014, + "step": 13414 + }, + { + "epoch": 0.26, + "learning_rate": 1.4809910294745835e-07, + "loss": 0.0012, + "step": 13415 + }, + { + "epoch": 0.26, + "learning_rate": 1.4809521960312222e-07, + "loss": 0.0015, + "step": 13416 + }, + { + "epoch": 0.26, + "learning_rate": 1.4809133625878606e-07, + "loss": 0.0016, + "step": 13417 + }, + { + "epoch": 0.26, + "learning_rate": 1.4808745291444993e-07, + "loss": 0.0013, + "step": 13418 + }, + { + "epoch": 0.26, + "learning_rate": 1.4808356957011375e-07, + "loss": 0.0035, + "step": 13419 + }, + { + "epoch": 0.26, + "learning_rate": 1.4807968622577762e-07, + "loss": 0.0012, + "step": 13420 + }, + { + "epoch": 0.26, + "learning_rate": 1.4807580288144147e-07, + "loss": 0.0012, + "step": 13421 + }, + { + "epoch": 0.26, + "learning_rate": 1.4807191953710534e-07, + "loss": 0.0028, + "step": 13422 + }, + { + "epoch": 0.26, + "learning_rate": 1.4806803619276919e-07, + "loss": 0.0117, + "step": 13423 + }, + { + "epoch": 0.26, + "learning_rate": 1.4806415284843306e-07, + "loss": 0.0012, + "step": 13424 + }, + { + "epoch": 0.26, + "learning_rate": 1.480602695040969e-07, + "loss": 0.0124, + "step": 13425 + }, + { + "epoch": 0.26, + "learning_rate": 1.4805638615976077e-07, + "loss": 0.2932, + "step": 13426 + }, + { + "epoch": 0.26, + "learning_rate": 1.4805250281542462e-07, + "loss": 0.0361, + "step": 13427 + }, + { + "epoch": 0.26, + "learning_rate": 1.480486194710885e-07, + "loss": 0.1903, + "step": 13428 + }, + { + "epoch": 0.26, + "learning_rate": 1.4804473612675233e-07, + "loss": 0.0014, + "step": 13429 + }, + { + "epoch": 0.26, + "learning_rate": 1.480408527824162e-07, + "loss": 0.0379, + "step": 13430 + }, + { + "epoch": 0.26, + "learning_rate": 1.4803696943808005e-07, + "loss": 0.0024, + "step": 13431 + }, + { + "epoch": 0.26, + "learning_rate": 1.4803308609374392e-07, + "loss": 0.0496, + "step": 13432 + }, + { + "epoch": 0.26, + "learning_rate": 1.4802920274940777e-07, + "loss": 0.0014, + "step": 13433 + }, + { + "epoch": 0.26, + "learning_rate": 1.4802531940507164e-07, + "loss": 0.002, + "step": 13434 + }, + { + "epoch": 0.26, + "learning_rate": 1.4802143606073548e-07, + "loss": 0.0015, + "step": 13435 + }, + { + "epoch": 0.26, + "learning_rate": 1.4801755271639936e-07, + "loss": 0.0016, + "step": 13436 + }, + { + "epoch": 0.26, + "learning_rate": 1.480136693720632e-07, + "loss": 0.0016, + "step": 13437 + }, + { + "epoch": 0.26, + "learning_rate": 1.4800978602772707e-07, + "loss": 0.0025, + "step": 13438 + }, + { + "epoch": 0.26, + "learning_rate": 1.4800590268339092e-07, + "loss": 0.0011, + "step": 13439 + }, + { + "epoch": 0.26, + "learning_rate": 1.480020193390548e-07, + "loss": 0.0025, + "step": 13440 + }, + { + "epoch": 0.26, + "learning_rate": 1.4799813599471863e-07, + "loss": 0.0018, + "step": 13441 + }, + { + "epoch": 0.26, + "learning_rate": 1.479942526503825e-07, + "loss": 0.0011, + "step": 13442 + }, + { + "epoch": 0.26, + "learning_rate": 1.4799036930604635e-07, + "loss": 0.0015, + "step": 13443 + }, + { + "epoch": 0.26, + "learning_rate": 1.4798648596171022e-07, + "loss": 0.0012, + "step": 13444 + }, + { + "epoch": 0.26, + "learning_rate": 1.4798260261737407e-07, + "loss": 0.1599, + "step": 13445 + }, + { + "epoch": 0.26, + "learning_rate": 1.4797871927303794e-07, + "loss": 0.0515, + "step": 13446 + }, + { + "epoch": 0.26, + "learning_rate": 1.4797483592870178e-07, + "loss": 0.0219, + "step": 13447 + }, + { + "epoch": 0.26, + "learning_rate": 1.4797095258436565e-07, + "loss": 0.0013, + "step": 13448 + }, + { + "epoch": 0.26, + "learning_rate": 1.479670692400295e-07, + "loss": 0.5199, + "step": 13449 + }, + { + "epoch": 0.26, + "learning_rate": 1.4796318589569337e-07, + "loss": 0.6453, + "step": 13450 + }, + { + "epoch": 0.26, + "learning_rate": 1.4795930255135722e-07, + "loss": 0.0014, + "step": 13451 + }, + { + "epoch": 0.26, + "learning_rate": 1.479554192070211e-07, + "loss": 0.0027, + "step": 13452 + }, + { + "epoch": 0.26, + "learning_rate": 1.4795153586268493e-07, + "loss": 0.0161, + "step": 13453 + }, + { + "epoch": 0.26, + "learning_rate": 1.479476525183488e-07, + "loss": 0.0013, + "step": 13454 + }, + { + "epoch": 0.26, + "learning_rate": 1.4794376917401265e-07, + "loss": 0.7447, + "step": 13455 + }, + { + "epoch": 0.26, + "learning_rate": 1.4793988582967652e-07, + "loss": 0.0014, + "step": 13456 + }, + { + "epoch": 0.26, + "learning_rate": 1.4793600248534037e-07, + "loss": 0.0013, + "step": 13457 + }, + { + "epoch": 0.26, + "learning_rate": 1.4793211914100424e-07, + "loss": 0.0012, + "step": 13458 + }, + { + "epoch": 0.26, + "learning_rate": 1.4792823579666808e-07, + "loss": 0.002, + "step": 13459 + }, + { + "epoch": 0.26, + "learning_rate": 1.4792435245233195e-07, + "loss": 0.0014, + "step": 13460 + }, + { + "epoch": 0.26, + "learning_rate": 1.479204691079958e-07, + "loss": 0.0017, + "step": 13461 + }, + { + "epoch": 0.26, + "learning_rate": 1.4791658576365967e-07, + "loss": 0.0011, + "step": 13462 + }, + { + "epoch": 0.26, + "learning_rate": 1.4791270241932351e-07, + "loss": 0.0018, + "step": 13463 + }, + { + "epoch": 0.26, + "learning_rate": 1.4790881907498739e-07, + "loss": 0.0015, + "step": 13464 + }, + { + "epoch": 0.26, + "learning_rate": 1.4790493573065123e-07, + "loss": 0.0017, + "step": 13465 + }, + { + "epoch": 0.26, + "learning_rate": 1.479010523863151e-07, + "loss": 0.005, + "step": 13466 + }, + { + "epoch": 0.26, + "learning_rate": 1.4789716904197895e-07, + "loss": 0.0017, + "step": 13467 + }, + { + "epoch": 0.26, + "learning_rate": 1.4789328569764282e-07, + "loss": 0.0015, + "step": 13468 + }, + { + "epoch": 0.26, + "learning_rate": 1.4788940235330666e-07, + "loss": 0.0143, + "step": 13469 + }, + { + "epoch": 0.26, + "learning_rate": 1.4788551900897054e-07, + "loss": 0.0662, + "step": 13470 + }, + { + "epoch": 0.26, + "learning_rate": 1.4788163566463438e-07, + "loss": 0.0018, + "step": 13471 + }, + { + "epoch": 0.26, + "learning_rate": 1.4787775232029825e-07, + "loss": 0.0073, + "step": 13472 + }, + { + "epoch": 0.26, + "learning_rate": 1.478738689759621e-07, + "loss": 0.03, + "step": 13473 + }, + { + "epoch": 0.26, + "learning_rate": 1.4786998563162597e-07, + "loss": 1.2151, + "step": 13474 + }, + { + "epoch": 0.26, + "learning_rate": 1.4786610228728981e-07, + "loss": 0.0019, + "step": 13475 + }, + { + "epoch": 0.26, + "learning_rate": 1.4786221894295369e-07, + "loss": 0.0029, + "step": 13476 + }, + { + "epoch": 0.26, + "learning_rate": 1.478583355986175e-07, + "loss": 0.0023, + "step": 13477 + }, + { + "epoch": 0.26, + "learning_rate": 1.4785445225428138e-07, + "loss": 0.0015, + "step": 13478 + }, + { + "epoch": 0.26, + "learning_rate": 1.4785056890994522e-07, + "loss": 0.0018, + "step": 13479 + }, + { + "epoch": 0.26, + "learning_rate": 1.478466855656091e-07, + "loss": 0.0015, + "step": 13480 + }, + { + "epoch": 0.26, + "learning_rate": 1.4784280222127294e-07, + "loss": 0.0018, + "step": 13481 + }, + { + "epoch": 0.26, + "learning_rate": 1.478389188769368e-07, + "loss": 0.9288, + "step": 13482 + }, + { + "epoch": 0.26, + "learning_rate": 1.4783503553260065e-07, + "loss": 0.0012, + "step": 13483 + }, + { + "epoch": 0.26, + "learning_rate": 1.4783115218826452e-07, + "loss": 0.7814, + "step": 13484 + }, + { + "epoch": 0.26, + "learning_rate": 1.4782726884392837e-07, + "loss": 0.0119, + "step": 13485 + }, + { + "epoch": 0.26, + "learning_rate": 1.4782338549959224e-07, + "loss": 0.2725, + "step": 13486 + }, + { + "epoch": 0.26, + "learning_rate": 1.4781950215525609e-07, + "loss": 0.9788, + "step": 13487 + }, + { + "epoch": 0.26, + "learning_rate": 1.4781561881091996e-07, + "loss": 0.0012, + "step": 13488 + }, + { + "epoch": 0.26, + "learning_rate": 1.478117354665838e-07, + "loss": 0.0012, + "step": 13489 + }, + { + "epoch": 0.26, + "learning_rate": 1.4780785212224767e-07, + "loss": 0.002, + "step": 13490 + }, + { + "epoch": 0.26, + "learning_rate": 1.4780396877791152e-07, + "loss": 0.0704, + "step": 13491 + }, + { + "epoch": 0.26, + "learning_rate": 1.478000854335754e-07, + "loss": 0.0015, + "step": 13492 + }, + { + "epoch": 0.26, + "learning_rate": 1.4779620208923924e-07, + "loss": 1.0612, + "step": 13493 + }, + { + "epoch": 0.26, + "learning_rate": 1.477923187449031e-07, + "loss": 1.1425, + "step": 13494 + }, + { + "epoch": 0.26, + "learning_rate": 1.4778843540056695e-07, + "loss": 0.0016, + "step": 13495 + }, + { + "epoch": 0.26, + "learning_rate": 1.4778455205623082e-07, + "loss": 0.0641, + "step": 13496 + }, + { + "epoch": 0.26, + "learning_rate": 1.4778066871189467e-07, + "loss": 0.0022, + "step": 13497 + }, + { + "epoch": 0.26, + "learning_rate": 1.4777678536755854e-07, + "loss": 0.0028, + "step": 13498 + }, + { + "epoch": 0.26, + "learning_rate": 1.4777290202322239e-07, + "loss": 0.0971, + "step": 13499 + }, + { + "epoch": 0.26, + "learning_rate": 1.4776901867888626e-07, + "loss": 0.0018, + "step": 13500 + }, + { + "epoch": 0.26, + "learning_rate": 1.477651353345501e-07, + "loss": 1.0225, + "step": 13501 + }, + { + "epoch": 0.26, + "learning_rate": 1.4776125199021397e-07, + "loss": 0.8792, + "step": 13502 + }, + { + "epoch": 0.26, + "learning_rate": 1.4775736864587782e-07, + "loss": 0.0021, + "step": 13503 + }, + { + "epoch": 0.26, + "learning_rate": 1.477534853015417e-07, + "loss": 0.0027, + "step": 13504 + }, + { + "epoch": 0.26, + "learning_rate": 1.4774960195720553e-07, + "loss": 0.0014, + "step": 13505 + }, + { + "epoch": 0.26, + "learning_rate": 1.477457186128694e-07, + "loss": 0.0067, + "step": 13506 + }, + { + "epoch": 0.26, + "learning_rate": 1.4774183526853325e-07, + "loss": 0.0012, + "step": 13507 + }, + { + "epoch": 0.26, + "learning_rate": 1.4773795192419712e-07, + "loss": 0.432, + "step": 13508 + }, + { + "epoch": 0.26, + "learning_rate": 1.4773406857986097e-07, + "loss": 0.0148, + "step": 13509 + }, + { + "epoch": 0.26, + "learning_rate": 1.4773018523552484e-07, + "loss": 0.8378, + "step": 13510 + }, + { + "epoch": 0.26, + "learning_rate": 1.4772630189118868e-07, + "loss": 0.0015, + "step": 13511 + }, + { + "epoch": 0.26, + "learning_rate": 1.4772241854685256e-07, + "loss": 0.1302, + "step": 13512 + }, + { + "epoch": 0.26, + "learning_rate": 1.477185352025164e-07, + "loss": 0.0015, + "step": 13513 + }, + { + "epoch": 0.26, + "learning_rate": 1.4771465185818027e-07, + "loss": 0.0014, + "step": 13514 + }, + { + "epoch": 0.26, + "learning_rate": 1.4771076851384412e-07, + "loss": 0.0014, + "step": 13515 + }, + { + "epoch": 0.26, + "learning_rate": 1.47706885169508e-07, + "loss": 0.0014, + "step": 13516 + }, + { + "epoch": 0.26, + "learning_rate": 1.4770300182517183e-07, + "loss": 0.0013, + "step": 13517 + }, + { + "epoch": 0.26, + "learning_rate": 1.476991184808357e-07, + "loss": 0.0013, + "step": 13518 + }, + { + "epoch": 0.26, + "learning_rate": 1.4769523513649955e-07, + "loss": 0.0018, + "step": 13519 + }, + { + "epoch": 0.26, + "learning_rate": 1.4769135179216342e-07, + "loss": 0.0019, + "step": 13520 + }, + { + "epoch": 0.26, + "learning_rate": 1.4768746844782727e-07, + "loss": 0.0015, + "step": 13521 + }, + { + "epoch": 0.26, + "learning_rate": 1.4768358510349114e-07, + "loss": 0.0014, + "step": 13522 + }, + { + "epoch": 0.26, + "learning_rate": 1.4767970175915498e-07, + "loss": 0.0018, + "step": 13523 + }, + { + "epoch": 0.26, + "learning_rate": 1.4767581841481885e-07, + "loss": 0.0013, + "step": 13524 + }, + { + "epoch": 0.26, + "learning_rate": 1.476719350704827e-07, + "loss": 0.0018, + "step": 13525 + }, + { + "epoch": 0.26, + "learning_rate": 1.4766805172614657e-07, + "loss": 0.0058, + "step": 13526 + }, + { + "epoch": 0.26, + "learning_rate": 1.4766416838181042e-07, + "loss": 0.0024, + "step": 13527 + }, + { + "epoch": 0.26, + "learning_rate": 1.476602850374743e-07, + "loss": 0.0025, + "step": 13528 + }, + { + "epoch": 0.26, + "learning_rate": 1.4765640169313813e-07, + "loss": 0.0016, + "step": 13529 + }, + { + "epoch": 0.26, + "learning_rate": 1.47652518348802e-07, + "loss": 0.014, + "step": 13530 + }, + { + "epoch": 0.26, + "learning_rate": 1.4764863500446585e-07, + "loss": 0.0028, + "step": 13531 + }, + { + "epoch": 0.26, + "learning_rate": 1.476447516601297e-07, + "loss": 0.0014, + "step": 13532 + }, + { + "epoch": 0.26, + "learning_rate": 1.4764086831579357e-07, + "loss": 0.0026, + "step": 13533 + }, + { + "epoch": 0.26, + "learning_rate": 1.476369849714574e-07, + "loss": 0.0017, + "step": 13534 + }, + { + "epoch": 0.26, + "learning_rate": 1.4763310162712126e-07, + "loss": 0.0021, + "step": 13535 + }, + { + "epoch": 0.26, + "learning_rate": 1.4762921828278513e-07, + "loss": 0.0015, + "step": 13536 + }, + { + "epoch": 0.26, + "learning_rate": 1.4762533493844897e-07, + "loss": 0.0016, + "step": 13537 + }, + { + "epoch": 0.26, + "learning_rate": 1.4762145159411284e-07, + "loss": 0.7011, + "step": 13538 + }, + { + "epoch": 0.26, + "learning_rate": 1.476175682497767e-07, + "loss": 0.0015, + "step": 13539 + }, + { + "epoch": 0.26, + "learning_rate": 1.4761368490544056e-07, + "loss": 0.0698, + "step": 13540 + }, + { + "epoch": 0.26, + "learning_rate": 1.476098015611044e-07, + "loss": 0.0014, + "step": 13541 + }, + { + "epoch": 0.26, + "learning_rate": 1.4760591821676828e-07, + "loss": 0.0922, + "step": 13542 + }, + { + "epoch": 0.26, + "learning_rate": 1.4760203487243212e-07, + "loss": 0.0013, + "step": 13543 + }, + { + "epoch": 0.26, + "learning_rate": 1.47598151528096e-07, + "loss": 0.0018, + "step": 13544 + }, + { + "epoch": 0.26, + "learning_rate": 1.4759426818375984e-07, + "loss": 0.5987, + "step": 13545 + }, + { + "epoch": 0.26, + "learning_rate": 1.475903848394237e-07, + "loss": 0.0012, + "step": 13546 + }, + { + "epoch": 0.26, + "learning_rate": 1.4758650149508755e-07, + "loss": 0.0015, + "step": 13547 + }, + { + "epoch": 0.26, + "learning_rate": 1.4758261815075143e-07, + "loss": 0.0013, + "step": 13548 + }, + { + "epoch": 0.26, + "learning_rate": 1.4757873480641527e-07, + "loss": 0.0014, + "step": 13549 + }, + { + "epoch": 0.26, + "learning_rate": 1.4757485146207914e-07, + "loss": 0.0048, + "step": 13550 + }, + { + "epoch": 0.26, + "learning_rate": 1.47570968117743e-07, + "loss": 0.0015, + "step": 13551 + }, + { + "epoch": 0.26, + "learning_rate": 1.4756708477340686e-07, + "loss": 0.0015, + "step": 13552 + }, + { + "epoch": 0.26, + "learning_rate": 1.475632014290707e-07, + "loss": 0.0023, + "step": 13553 + }, + { + "epoch": 0.26, + "learning_rate": 1.4755931808473458e-07, + "loss": 0.001, + "step": 13554 + }, + { + "epoch": 0.26, + "learning_rate": 1.4755543474039842e-07, + "loss": 0.1057, + "step": 13555 + }, + { + "epoch": 0.26, + "learning_rate": 1.475515513960623e-07, + "loss": 0.0987, + "step": 13556 + }, + { + "epoch": 0.26, + "learning_rate": 1.4754766805172614e-07, + "loss": 0.0027, + "step": 13557 + }, + { + "epoch": 0.26, + "learning_rate": 1.4754378470739e-07, + "loss": 0.0032, + "step": 13558 + }, + { + "epoch": 0.26, + "learning_rate": 1.4753990136305385e-07, + "loss": 0.0028, + "step": 13559 + }, + { + "epoch": 0.26, + "learning_rate": 1.475360180187177e-07, + "loss": 0.021, + "step": 13560 + }, + { + "epoch": 0.26, + "learning_rate": 1.4753213467438157e-07, + "loss": 0.2773, + "step": 13561 + }, + { + "epoch": 0.26, + "learning_rate": 1.4752825133004542e-07, + "loss": 0.0056, + "step": 13562 + }, + { + "epoch": 0.26, + "learning_rate": 1.4752436798570929e-07, + "loss": 0.0015, + "step": 13563 + }, + { + "epoch": 0.26, + "learning_rate": 1.4752048464137313e-07, + "loss": 0.0019, + "step": 13564 + }, + { + "epoch": 0.26, + "learning_rate": 1.47516601297037e-07, + "loss": 0.0246, + "step": 13565 + }, + { + "epoch": 0.26, + "learning_rate": 1.4751271795270085e-07, + "loss": 0.0016, + "step": 13566 + }, + { + "epoch": 0.26, + "learning_rate": 1.4750883460836472e-07, + "loss": 0.0017, + "step": 13567 + }, + { + "epoch": 0.26, + "learning_rate": 1.4750495126402856e-07, + "loss": 0.0175, + "step": 13568 + }, + { + "epoch": 0.26, + "learning_rate": 1.4750106791969244e-07, + "loss": 0.0012, + "step": 13569 + }, + { + "epoch": 0.26, + "learning_rate": 1.4749718457535628e-07, + "loss": 0.0012, + "step": 13570 + }, + { + "epoch": 0.26, + "learning_rate": 1.4749330123102015e-07, + "loss": 0.0012, + "step": 13571 + }, + { + "epoch": 0.26, + "learning_rate": 1.47489417886684e-07, + "loss": 0.0013, + "step": 13572 + }, + { + "epoch": 0.26, + "learning_rate": 1.4748553454234787e-07, + "loss": 0.0016, + "step": 13573 + }, + { + "epoch": 0.26, + "learning_rate": 1.4748165119801171e-07, + "loss": 0.0029, + "step": 13574 + }, + { + "epoch": 0.26, + "learning_rate": 1.4747776785367559e-07, + "loss": 0.0012, + "step": 13575 + }, + { + "epoch": 0.26, + "learning_rate": 1.4747388450933943e-07, + "loss": 0.0013, + "step": 13576 + }, + { + "epoch": 0.26, + "learning_rate": 1.474700011650033e-07, + "loss": 1.2774, + "step": 13577 + }, + { + "epoch": 0.26, + "learning_rate": 1.4746611782066715e-07, + "loss": 0.8422, + "step": 13578 + }, + { + "epoch": 0.26, + "learning_rate": 1.4746223447633102e-07, + "loss": 0.0015, + "step": 13579 + }, + { + "epoch": 0.26, + "learning_rate": 1.4745835113199486e-07, + "loss": 0.0027, + "step": 13580 + }, + { + "epoch": 0.26, + "learning_rate": 1.4745446778765873e-07, + "loss": 0.0019, + "step": 13581 + }, + { + "epoch": 0.26, + "learning_rate": 1.4745058444332258e-07, + "loss": 1.5769, + "step": 13582 + }, + { + "epoch": 0.26, + "learning_rate": 1.4744670109898645e-07, + "loss": 0.0027, + "step": 13583 + }, + { + "epoch": 0.26, + "learning_rate": 1.474428177546503e-07, + "loss": 0.0017, + "step": 13584 + }, + { + "epoch": 0.26, + "learning_rate": 1.4743893441031417e-07, + "loss": 0.117, + "step": 13585 + }, + { + "epoch": 0.26, + "learning_rate": 1.47435051065978e-07, + "loss": 0.0306, + "step": 13586 + }, + { + "epoch": 0.26, + "learning_rate": 1.4743116772164188e-07, + "loss": 0.0013, + "step": 13587 + }, + { + "epoch": 0.26, + "learning_rate": 1.4742728437730573e-07, + "loss": 0.0015, + "step": 13588 + }, + { + "epoch": 0.26, + "learning_rate": 1.474234010329696e-07, + "loss": 0.0017, + "step": 13589 + }, + { + "epoch": 0.26, + "learning_rate": 1.4741951768863345e-07, + "loss": 0.0015, + "step": 13590 + }, + { + "epoch": 0.26, + "learning_rate": 1.4741563434429732e-07, + "loss": 0.0047, + "step": 13591 + }, + { + "epoch": 0.26, + "learning_rate": 1.4741175099996116e-07, + "loss": 0.0024, + "step": 13592 + }, + { + "epoch": 0.26, + "learning_rate": 1.47407867655625e-07, + "loss": 0.6466, + "step": 13593 + }, + { + "epoch": 0.26, + "learning_rate": 1.4740398431128885e-07, + "loss": 0.0013, + "step": 13594 + }, + { + "epoch": 0.26, + "learning_rate": 1.4740010096695272e-07, + "loss": 0.0013, + "step": 13595 + }, + { + "epoch": 0.26, + "learning_rate": 1.4739621762261657e-07, + "loss": 0.3863, + "step": 13596 + }, + { + "epoch": 0.26, + "learning_rate": 1.4739233427828044e-07, + "loss": 0.0011, + "step": 13597 + }, + { + "epoch": 0.26, + "learning_rate": 1.4738845093394429e-07, + "loss": 0.0016, + "step": 13598 + }, + { + "epoch": 0.26, + "learning_rate": 1.4738456758960816e-07, + "loss": 0.0014, + "step": 13599 + }, + { + "epoch": 0.26, + "learning_rate": 1.47380684245272e-07, + "loss": 0.0018, + "step": 13600 + }, + { + "epoch": 0.26, + "learning_rate": 1.4737680090093587e-07, + "loss": 0.0013, + "step": 13601 + }, + { + "epoch": 0.26, + "learning_rate": 1.4737291755659972e-07, + "loss": 0.0016, + "step": 13602 + }, + { + "epoch": 0.26, + "learning_rate": 1.473690342122636e-07, + "loss": 0.0015, + "step": 13603 + }, + { + "epoch": 0.26, + "learning_rate": 1.4736515086792743e-07, + "loss": 0.0016, + "step": 13604 + }, + { + "epoch": 0.26, + "learning_rate": 1.473612675235913e-07, + "loss": 0.6448, + "step": 13605 + }, + { + "epoch": 0.26, + "learning_rate": 1.4735738417925515e-07, + "loss": 0.0021, + "step": 13606 + }, + { + "epoch": 0.26, + "learning_rate": 1.4735350083491902e-07, + "loss": 0.0017, + "step": 13607 + }, + { + "epoch": 0.26, + "learning_rate": 1.4734961749058287e-07, + "loss": 0.0021, + "step": 13608 + }, + { + "epoch": 0.26, + "learning_rate": 1.4734573414624674e-07, + "loss": 0.5948, + "step": 13609 + }, + { + "epoch": 0.26, + "learning_rate": 1.4734185080191058e-07, + "loss": 0.0866, + "step": 13610 + }, + { + "epoch": 0.26, + "learning_rate": 1.4733796745757446e-07, + "loss": 0.0014, + "step": 13611 + }, + { + "epoch": 0.26, + "learning_rate": 1.473340841132383e-07, + "loss": 0.0016, + "step": 13612 + }, + { + "epoch": 0.26, + "learning_rate": 1.4733020076890217e-07, + "loss": 0.0031, + "step": 13613 + }, + { + "epoch": 0.26, + "learning_rate": 1.4732631742456602e-07, + "loss": 0.0018, + "step": 13614 + }, + { + "epoch": 0.26, + "learning_rate": 1.473224340802299e-07, + "loss": 0.0193, + "step": 13615 + }, + { + "epoch": 0.26, + "learning_rate": 1.4731855073589373e-07, + "loss": 0.0051, + "step": 13616 + }, + { + "epoch": 0.26, + "learning_rate": 1.473146673915576e-07, + "loss": 0.0015, + "step": 13617 + }, + { + "epoch": 0.26, + "learning_rate": 1.4731078404722145e-07, + "loss": 0.0013, + "step": 13618 + }, + { + "epoch": 0.26, + "learning_rate": 1.4730690070288532e-07, + "loss": 0.0013, + "step": 13619 + }, + { + "epoch": 0.26, + "learning_rate": 1.4730301735854917e-07, + "loss": 0.0018, + "step": 13620 + }, + { + "epoch": 0.26, + "learning_rate": 1.4729913401421304e-07, + "loss": 0.0294, + "step": 13621 + }, + { + "epoch": 0.26, + "learning_rate": 1.4729525066987688e-07, + "loss": 0.0045, + "step": 13622 + }, + { + "epoch": 0.26, + "learning_rate": 1.4729136732554075e-07, + "loss": 1.2245, + "step": 13623 + }, + { + "epoch": 0.26, + "learning_rate": 1.472874839812046e-07, + "loss": 0.1124, + "step": 13624 + }, + { + "epoch": 0.26, + "learning_rate": 1.4728360063686847e-07, + "loss": 0.0021, + "step": 13625 + }, + { + "epoch": 0.26, + "learning_rate": 1.4727971729253232e-07, + "loss": 0.0018, + "step": 13626 + }, + { + "epoch": 0.26, + "learning_rate": 1.472758339481962e-07, + "loss": 0.0017, + "step": 13627 + }, + { + "epoch": 0.26, + "learning_rate": 1.4727195060386003e-07, + "loss": 0.0015, + "step": 13628 + }, + { + "epoch": 0.26, + "learning_rate": 1.472680672595239e-07, + "loss": 0.0016, + "step": 13629 + }, + { + "epoch": 0.26, + "learning_rate": 1.4726418391518775e-07, + "loss": 0.0014, + "step": 13630 + }, + { + "epoch": 0.26, + "learning_rate": 1.4726030057085162e-07, + "loss": 0.0015, + "step": 13631 + }, + { + "epoch": 0.26, + "learning_rate": 1.4725641722651547e-07, + "loss": 0.3829, + "step": 13632 + }, + { + "epoch": 0.26, + "learning_rate": 1.4725253388217934e-07, + "loss": 0.0018, + "step": 13633 + }, + { + "epoch": 0.26, + "learning_rate": 1.4724865053784318e-07, + "loss": 0.0014, + "step": 13634 + }, + { + "epoch": 0.26, + "learning_rate": 1.4724476719350705e-07, + "loss": 0.1127, + "step": 13635 + }, + { + "epoch": 0.26, + "learning_rate": 1.472408838491709e-07, + "loss": 0.0023, + "step": 13636 + }, + { + "epoch": 0.26, + "learning_rate": 1.4723700050483477e-07, + "loss": 1.3781, + "step": 13637 + }, + { + "epoch": 0.26, + "learning_rate": 1.4723311716049862e-07, + "loss": 0.0014, + "step": 13638 + }, + { + "epoch": 0.26, + "learning_rate": 1.4722923381616249e-07, + "loss": 0.0016, + "step": 13639 + }, + { + "epoch": 0.26, + "learning_rate": 1.4722535047182633e-07, + "loss": 0.0055, + "step": 13640 + }, + { + "epoch": 0.26, + "learning_rate": 1.472214671274902e-07, + "loss": 0.0035, + "step": 13641 + }, + { + "epoch": 0.26, + "learning_rate": 1.4721758378315405e-07, + "loss": 0.0017, + "step": 13642 + }, + { + "epoch": 0.26, + "learning_rate": 1.4721370043881792e-07, + "loss": 0.0015, + "step": 13643 + }, + { + "epoch": 0.26, + "learning_rate": 1.4720981709448176e-07, + "loss": 0.0021, + "step": 13644 + }, + { + "epoch": 0.26, + "learning_rate": 1.4720593375014564e-07, + "loss": 0.002, + "step": 13645 + }, + { + "epoch": 0.26, + "learning_rate": 1.4720205040580948e-07, + "loss": 0.0072, + "step": 13646 + }, + { + "epoch": 0.26, + "learning_rate": 1.4719816706147335e-07, + "loss": 0.0026, + "step": 13647 + }, + { + "epoch": 0.26, + "learning_rate": 1.471942837171372e-07, + "loss": 0.0012, + "step": 13648 + }, + { + "epoch": 0.26, + "learning_rate": 1.4719040037280107e-07, + "loss": 0.0017, + "step": 13649 + }, + { + "epoch": 0.26, + "learning_rate": 1.4718651702846491e-07, + "loss": 0.0014, + "step": 13650 + }, + { + "epoch": 0.26, + "learning_rate": 1.4718263368412876e-07, + "loss": 0.0042, + "step": 13651 + }, + { + "epoch": 0.26, + "learning_rate": 1.471787503397926e-07, + "loss": 0.002, + "step": 13652 + }, + { + "epoch": 0.26, + "learning_rate": 1.4717486699545648e-07, + "loss": 0.0027, + "step": 13653 + }, + { + "epoch": 0.26, + "learning_rate": 1.4717098365112032e-07, + "loss": 0.0015, + "step": 13654 + }, + { + "epoch": 0.26, + "learning_rate": 1.471671003067842e-07, + "loss": 0.0239, + "step": 13655 + }, + { + "epoch": 0.26, + "learning_rate": 1.4716321696244804e-07, + "loss": 0.6031, + "step": 13656 + }, + { + "epoch": 0.26, + "learning_rate": 1.471593336181119e-07, + "loss": 0.0012, + "step": 13657 + }, + { + "epoch": 0.26, + "learning_rate": 1.4715545027377575e-07, + "loss": 0.0359, + "step": 13658 + }, + { + "epoch": 0.26, + "learning_rate": 1.4715156692943962e-07, + "loss": 0.0018, + "step": 13659 + }, + { + "epoch": 0.26, + "learning_rate": 1.4714768358510347e-07, + "loss": 1.2727, + "step": 13660 + }, + { + "epoch": 0.26, + "learning_rate": 1.4714380024076734e-07, + "loss": 0.0019, + "step": 13661 + }, + { + "epoch": 0.27, + "learning_rate": 1.4713991689643119e-07, + "loss": 0.0012, + "step": 13662 + }, + { + "epoch": 0.27, + "learning_rate": 1.4713603355209506e-07, + "loss": 0.0011, + "step": 13663 + }, + { + "epoch": 0.27, + "learning_rate": 1.471321502077589e-07, + "loss": 0.0014, + "step": 13664 + }, + { + "epoch": 0.27, + "learning_rate": 1.4712826686342277e-07, + "loss": 0.0143, + "step": 13665 + }, + { + "epoch": 0.27, + "learning_rate": 1.4712438351908662e-07, + "loss": 0.0016, + "step": 13666 + }, + { + "epoch": 0.27, + "learning_rate": 1.471205001747505e-07, + "loss": 0.002, + "step": 13667 + }, + { + "epoch": 0.27, + "learning_rate": 1.4711661683041434e-07, + "loss": 0.0013, + "step": 13668 + }, + { + "epoch": 0.27, + "learning_rate": 1.471127334860782e-07, + "loss": 0.0017, + "step": 13669 + }, + { + "epoch": 0.27, + "learning_rate": 1.4710885014174205e-07, + "loss": 0.0422, + "step": 13670 + }, + { + "epoch": 0.27, + "learning_rate": 1.4710496679740592e-07, + "loss": 0.0023, + "step": 13671 + }, + { + "epoch": 0.27, + "learning_rate": 1.4710108345306977e-07, + "loss": 0.0016, + "step": 13672 + }, + { + "epoch": 0.27, + "learning_rate": 1.4709720010873364e-07, + "loss": 0.0013, + "step": 13673 + }, + { + "epoch": 0.27, + "learning_rate": 1.4709331676439749e-07, + "loss": 0.0014, + "step": 13674 + }, + { + "epoch": 0.27, + "learning_rate": 1.4708943342006136e-07, + "loss": 0.0016, + "step": 13675 + }, + { + "epoch": 0.27, + "learning_rate": 1.470855500757252e-07, + "loss": 0.2618, + "step": 13676 + }, + { + "epoch": 0.27, + "learning_rate": 1.4708166673138907e-07, + "loss": 0.0012, + "step": 13677 + }, + { + "epoch": 0.27, + "learning_rate": 1.4707778338705292e-07, + "loss": 0.0014, + "step": 13678 + }, + { + "epoch": 0.27, + "learning_rate": 1.470739000427168e-07, + "loss": 0.7229, + "step": 13679 + }, + { + "epoch": 0.27, + "learning_rate": 1.4707001669838063e-07, + "loss": 0.0013, + "step": 13680 + }, + { + "epoch": 0.27, + "learning_rate": 1.470661333540445e-07, + "loss": 0.0012, + "step": 13681 + }, + { + "epoch": 0.27, + "learning_rate": 1.4706225000970835e-07, + "loss": 0.0025, + "step": 13682 + }, + { + "epoch": 0.27, + "learning_rate": 1.4705836666537222e-07, + "loss": 0.0194, + "step": 13683 + }, + { + "epoch": 0.27, + "learning_rate": 1.4705448332103607e-07, + "loss": 0.0148, + "step": 13684 + }, + { + "epoch": 0.27, + "learning_rate": 1.4705059997669994e-07, + "loss": 0.0015, + "step": 13685 + }, + { + "epoch": 0.27, + "learning_rate": 1.4704671663236378e-07, + "loss": 0.0019, + "step": 13686 + }, + { + "epoch": 0.27, + "learning_rate": 1.4704283328802766e-07, + "loss": 0.002, + "step": 13687 + }, + { + "epoch": 0.27, + "learning_rate": 1.470389499436915e-07, + "loss": 0.015, + "step": 13688 + }, + { + "epoch": 0.27, + "learning_rate": 1.4703506659935537e-07, + "loss": 0.0016, + "step": 13689 + }, + { + "epoch": 0.27, + "learning_rate": 1.4703118325501922e-07, + "loss": 0.0011, + "step": 13690 + }, + { + "epoch": 0.27, + "learning_rate": 1.470272999106831e-07, + "loss": 0.5881, + "step": 13691 + }, + { + "epoch": 0.27, + "learning_rate": 1.4702341656634693e-07, + "loss": 0.0014, + "step": 13692 + }, + { + "epoch": 0.27, + "learning_rate": 1.470195332220108e-07, + "loss": 0.0018, + "step": 13693 + }, + { + "epoch": 0.27, + "learning_rate": 1.4701564987767465e-07, + "loss": 0.6393, + "step": 13694 + }, + { + "epoch": 0.27, + "learning_rate": 1.4701176653333852e-07, + "loss": 1.0734, + "step": 13695 + }, + { + "epoch": 0.27, + "learning_rate": 1.4700788318900237e-07, + "loss": 0.1012, + "step": 13696 + }, + { + "epoch": 0.27, + "learning_rate": 1.4700399984466624e-07, + "loss": 0.0022, + "step": 13697 + }, + { + "epoch": 0.27, + "learning_rate": 1.4700011650033008e-07, + "loss": 0.0434, + "step": 13698 + }, + { + "epoch": 0.27, + "learning_rate": 1.4699623315599395e-07, + "loss": 0.0019, + "step": 13699 + }, + { + "epoch": 0.27, + "learning_rate": 1.469923498116578e-07, + "loss": 0.0015, + "step": 13700 + }, + { + "epoch": 0.27, + "learning_rate": 1.4698846646732167e-07, + "loss": 0.6797, + "step": 13701 + }, + { + "epoch": 0.27, + "learning_rate": 1.4698458312298552e-07, + "loss": 0.0019, + "step": 13702 + }, + { + "epoch": 0.27, + "learning_rate": 1.469806997786494e-07, + "loss": 0.0025, + "step": 13703 + }, + { + "epoch": 0.27, + "learning_rate": 1.4697681643431323e-07, + "loss": 0.0015, + "step": 13704 + }, + { + "epoch": 0.27, + "learning_rate": 1.469729330899771e-07, + "loss": 0.0014, + "step": 13705 + }, + { + "epoch": 0.27, + "learning_rate": 1.4696904974564095e-07, + "loss": 0.0015, + "step": 13706 + }, + { + "epoch": 0.27, + "learning_rate": 1.4696516640130482e-07, + "loss": 0.0049, + "step": 13707 + }, + { + "epoch": 0.27, + "learning_rate": 1.4696128305696867e-07, + "loss": 0.0019, + "step": 13708 + }, + { + "epoch": 0.27, + "learning_rate": 1.469573997126325e-07, + "loss": 0.0014, + "step": 13709 + }, + { + "epoch": 0.27, + "learning_rate": 1.4695351636829636e-07, + "loss": 0.0018, + "step": 13710 + }, + { + "epoch": 0.27, + "learning_rate": 1.4694963302396023e-07, + "loss": 0.0014, + "step": 13711 + }, + { + "epoch": 0.27, + "learning_rate": 1.4694574967962407e-07, + "loss": 0.6926, + "step": 13712 + }, + { + "epoch": 0.27, + "learning_rate": 1.4694186633528794e-07, + "loss": 0.0011, + "step": 13713 + }, + { + "epoch": 0.27, + "learning_rate": 1.469379829909518e-07, + "loss": 0.5726, + "step": 13714 + }, + { + "epoch": 0.27, + "learning_rate": 1.4693409964661566e-07, + "loss": 0.0014, + "step": 13715 + }, + { + "epoch": 0.27, + "learning_rate": 1.469302163022795e-07, + "loss": 0.0087, + "step": 13716 + }, + { + "epoch": 0.27, + "learning_rate": 1.4692633295794338e-07, + "loss": 0.0013, + "step": 13717 + }, + { + "epoch": 0.27, + "learning_rate": 1.4692244961360722e-07, + "loss": 0.0014, + "step": 13718 + }, + { + "epoch": 0.27, + "learning_rate": 1.469185662692711e-07, + "loss": 0.0011, + "step": 13719 + }, + { + "epoch": 0.27, + "learning_rate": 1.4691468292493494e-07, + "loss": 0.1407, + "step": 13720 + }, + { + "epoch": 0.27, + "learning_rate": 1.469107995805988e-07, + "loss": 0.0022, + "step": 13721 + }, + { + "epoch": 0.27, + "learning_rate": 1.4690691623626265e-07, + "loss": 0.0015, + "step": 13722 + }, + { + "epoch": 0.27, + "learning_rate": 1.4690303289192653e-07, + "loss": 0.0016, + "step": 13723 + }, + { + "epoch": 0.27, + "learning_rate": 1.4689914954759037e-07, + "loss": 0.0061, + "step": 13724 + }, + { + "epoch": 0.27, + "learning_rate": 1.4689526620325424e-07, + "loss": 0.3734, + "step": 13725 + }, + { + "epoch": 0.27, + "learning_rate": 1.468913828589181e-07, + "loss": 0.0015, + "step": 13726 + }, + { + "epoch": 0.27, + "learning_rate": 1.4688749951458196e-07, + "loss": 0.0015, + "step": 13727 + }, + { + "epoch": 0.27, + "learning_rate": 1.468836161702458e-07, + "loss": 0.0015, + "step": 13728 + }, + { + "epoch": 0.27, + "learning_rate": 1.4687973282590968e-07, + "loss": 0.0067, + "step": 13729 + }, + { + "epoch": 0.27, + "learning_rate": 1.4687584948157352e-07, + "loss": 0.0107, + "step": 13730 + }, + { + "epoch": 0.27, + "learning_rate": 1.468719661372374e-07, + "loss": 0.0019, + "step": 13731 + }, + { + "epoch": 0.27, + "learning_rate": 1.4686808279290124e-07, + "loss": 0.1897, + "step": 13732 + }, + { + "epoch": 0.27, + "learning_rate": 1.468641994485651e-07, + "loss": 0.0016, + "step": 13733 + }, + { + "epoch": 0.27, + "learning_rate": 1.4686031610422895e-07, + "loss": 0.0014, + "step": 13734 + }, + { + "epoch": 0.27, + "learning_rate": 1.4685643275989283e-07, + "loss": 0.0016, + "step": 13735 + }, + { + "epoch": 0.27, + "learning_rate": 1.4685254941555667e-07, + "loss": 0.0017, + "step": 13736 + }, + { + "epoch": 0.27, + "learning_rate": 1.4684866607122052e-07, + "loss": 0.0016, + "step": 13737 + }, + { + "epoch": 0.27, + "learning_rate": 1.4684478272688439e-07, + "loss": 0.4356, + "step": 13738 + }, + { + "epoch": 0.27, + "learning_rate": 1.4684089938254823e-07, + "loss": 0.0021, + "step": 13739 + }, + { + "epoch": 0.27, + "learning_rate": 1.468370160382121e-07, + "loss": 0.0026, + "step": 13740 + }, + { + "epoch": 0.27, + "learning_rate": 1.4683313269387595e-07, + "loss": 0.0022, + "step": 13741 + }, + { + "epoch": 0.27, + "learning_rate": 1.4682924934953982e-07, + "loss": 0.0056, + "step": 13742 + }, + { + "epoch": 0.27, + "learning_rate": 1.4682536600520366e-07, + "loss": 0.0025, + "step": 13743 + }, + { + "epoch": 0.27, + "learning_rate": 1.4682148266086754e-07, + "loss": 0.0015, + "step": 13744 + }, + { + "epoch": 0.27, + "learning_rate": 1.4681759931653138e-07, + "loss": 0.0486, + "step": 13745 + }, + { + "epoch": 0.27, + "learning_rate": 1.4681371597219525e-07, + "loss": 0.0011, + "step": 13746 + }, + { + "epoch": 0.27, + "learning_rate": 1.468098326278591e-07, + "loss": 0.2765, + "step": 13747 + }, + { + "epoch": 0.27, + "learning_rate": 1.4680594928352297e-07, + "loss": 0.0281, + "step": 13748 + }, + { + "epoch": 0.27, + "learning_rate": 1.4680206593918681e-07, + "loss": 0.0016, + "step": 13749 + }, + { + "epoch": 0.27, + "learning_rate": 1.4679818259485069e-07, + "loss": 0.0013, + "step": 13750 + }, + { + "epoch": 0.27, + "learning_rate": 1.4679429925051453e-07, + "loss": 0.0013, + "step": 13751 + }, + { + "epoch": 0.27, + "learning_rate": 1.467904159061784e-07, + "loss": 0.0013, + "step": 13752 + }, + { + "epoch": 0.27, + "learning_rate": 1.4678653256184225e-07, + "loss": 0.0012, + "step": 13753 + }, + { + "epoch": 0.27, + "learning_rate": 1.4678264921750612e-07, + "loss": 0.0017, + "step": 13754 + }, + { + "epoch": 0.27, + "learning_rate": 1.4677876587316996e-07, + "loss": 0.4058, + "step": 13755 + }, + { + "epoch": 0.27, + "learning_rate": 1.4677488252883383e-07, + "loss": 0.0014, + "step": 13756 + }, + { + "epoch": 0.27, + "learning_rate": 1.4677099918449768e-07, + "loss": 0.0014, + "step": 13757 + }, + { + "epoch": 0.27, + "learning_rate": 1.4676711584016155e-07, + "loss": 0.0029, + "step": 13758 + }, + { + "epoch": 0.27, + "learning_rate": 1.467632324958254e-07, + "loss": 0.5465, + "step": 13759 + }, + { + "epoch": 0.27, + "learning_rate": 1.4675934915148927e-07, + "loss": 0.0045, + "step": 13760 + }, + { + "epoch": 0.27, + "learning_rate": 1.467554658071531e-07, + "loss": 0.9989, + "step": 13761 + }, + { + "epoch": 0.27, + "learning_rate": 1.4675158246281698e-07, + "loss": 0.002, + "step": 13762 + }, + { + "epoch": 0.27, + "learning_rate": 1.4674769911848083e-07, + "loss": 0.0013, + "step": 13763 + }, + { + "epoch": 0.27, + "learning_rate": 1.467438157741447e-07, + "loss": 0.001, + "step": 13764 + }, + { + "epoch": 0.27, + "learning_rate": 1.4673993242980855e-07, + "loss": 0.0095, + "step": 13765 + }, + { + "epoch": 0.27, + "learning_rate": 1.4673604908547242e-07, + "loss": 0.0015, + "step": 13766 + }, + { + "epoch": 0.27, + "learning_rate": 1.4673216574113624e-07, + "loss": 0.0019, + "step": 13767 + }, + { + "epoch": 0.27, + "learning_rate": 1.467282823968001e-07, + "loss": 0.0016, + "step": 13768 + }, + { + "epoch": 0.27, + "learning_rate": 1.4672439905246395e-07, + "loss": 0.8342, + "step": 13769 + }, + { + "epoch": 0.27, + "learning_rate": 1.4672051570812782e-07, + "loss": 0.0014, + "step": 13770 + }, + { + "epoch": 0.27, + "learning_rate": 1.4671663236379167e-07, + "loss": 0.001, + "step": 13771 + }, + { + "epoch": 0.27, + "learning_rate": 1.4671274901945554e-07, + "loss": 0.0054, + "step": 13772 + }, + { + "epoch": 0.27, + "learning_rate": 1.4670886567511939e-07, + "loss": 0.0017, + "step": 13773 + }, + { + "epoch": 0.27, + "learning_rate": 1.4670498233078326e-07, + "loss": 0.0014, + "step": 13774 + }, + { + "epoch": 0.27, + "learning_rate": 1.467010989864471e-07, + "loss": 0.1983, + "step": 13775 + }, + { + "epoch": 0.27, + "learning_rate": 1.4669721564211097e-07, + "loss": 0.0017, + "step": 13776 + }, + { + "epoch": 0.27, + "learning_rate": 1.4669333229777482e-07, + "loss": 0.6065, + "step": 13777 + }, + { + "epoch": 0.27, + "learning_rate": 1.466894489534387e-07, + "loss": 0.002, + "step": 13778 + }, + { + "epoch": 0.27, + "learning_rate": 1.4668556560910253e-07, + "loss": 0.0019, + "step": 13779 + }, + { + "epoch": 0.27, + "learning_rate": 1.466816822647664e-07, + "loss": 0.002, + "step": 13780 + }, + { + "epoch": 0.27, + "learning_rate": 1.4667779892043025e-07, + "loss": 0.0017, + "step": 13781 + }, + { + "epoch": 0.27, + "learning_rate": 1.4667391557609412e-07, + "loss": 0.002, + "step": 13782 + }, + { + "epoch": 0.27, + "learning_rate": 1.4667003223175797e-07, + "loss": 0.5501, + "step": 13783 + }, + { + "epoch": 0.27, + "learning_rate": 1.4666614888742184e-07, + "loss": 0.0025, + "step": 13784 + }, + { + "epoch": 0.27, + "learning_rate": 1.4666226554308568e-07, + "loss": 0.8229, + "step": 13785 + }, + { + "epoch": 0.27, + "learning_rate": 1.4665838219874956e-07, + "loss": 0.0073, + "step": 13786 + }, + { + "epoch": 0.27, + "learning_rate": 1.466544988544134e-07, + "loss": 0.7943, + "step": 13787 + }, + { + "epoch": 0.27, + "learning_rate": 1.4665061551007727e-07, + "loss": 0.0016, + "step": 13788 + }, + { + "epoch": 0.27, + "learning_rate": 1.4664673216574112e-07, + "loss": 0.0016, + "step": 13789 + }, + { + "epoch": 0.27, + "learning_rate": 1.46642848821405e-07, + "loss": 0.0016, + "step": 13790 + }, + { + "epoch": 0.27, + "learning_rate": 1.4663896547706883e-07, + "loss": 0.0018, + "step": 13791 + }, + { + "epoch": 0.27, + "learning_rate": 1.466350821327327e-07, + "loss": 0.0014, + "step": 13792 + }, + { + "epoch": 0.27, + "learning_rate": 1.4663119878839655e-07, + "loss": 1.3311, + "step": 13793 + }, + { + "epoch": 0.27, + "learning_rate": 1.4662731544406042e-07, + "loss": 0.0013, + "step": 13794 + }, + { + "epoch": 0.27, + "learning_rate": 1.4662343209972427e-07, + "loss": 0.0014, + "step": 13795 + }, + { + "epoch": 0.27, + "learning_rate": 1.4661954875538814e-07, + "loss": 0.0082, + "step": 13796 + }, + { + "epoch": 0.27, + "learning_rate": 1.4661566541105198e-07, + "loss": 0.0024, + "step": 13797 + }, + { + "epoch": 0.27, + "learning_rate": 1.4661178206671585e-07, + "loss": 0.0022, + "step": 13798 + }, + { + "epoch": 0.27, + "learning_rate": 1.466078987223797e-07, + "loss": 0.0015, + "step": 13799 + }, + { + "epoch": 0.27, + "learning_rate": 1.4660401537804357e-07, + "loss": 0.0012, + "step": 13800 + }, + { + "epoch": 0.27, + "learning_rate": 1.4660013203370742e-07, + "loss": 0.2072, + "step": 13801 + }, + { + "epoch": 0.27, + "learning_rate": 1.465962486893713e-07, + "loss": 0.4463, + "step": 13802 + }, + { + "epoch": 0.27, + "learning_rate": 1.4659236534503513e-07, + "loss": 0.0015, + "step": 13803 + }, + { + "epoch": 0.27, + "learning_rate": 1.46588482000699e-07, + "loss": 0.0023, + "step": 13804 + }, + { + "epoch": 0.27, + "learning_rate": 1.4658459865636285e-07, + "loss": 0.0085, + "step": 13805 + }, + { + "epoch": 0.27, + "learning_rate": 1.4658071531202672e-07, + "loss": 0.5172, + "step": 13806 + }, + { + "epoch": 0.27, + "learning_rate": 1.4657683196769057e-07, + "loss": 0.1777, + "step": 13807 + }, + { + "epoch": 0.27, + "learning_rate": 1.4657294862335444e-07, + "loss": 0.0016, + "step": 13808 + }, + { + "epoch": 0.27, + "learning_rate": 1.4656906527901828e-07, + "loss": 0.0018, + "step": 13809 + }, + { + "epoch": 0.27, + "learning_rate": 1.4656518193468215e-07, + "loss": 0.0016, + "step": 13810 + }, + { + "epoch": 0.27, + "learning_rate": 1.46561298590346e-07, + "loss": 0.0029, + "step": 13811 + }, + { + "epoch": 0.27, + "learning_rate": 1.4655741524600987e-07, + "loss": 0.0015, + "step": 13812 + }, + { + "epoch": 0.27, + "learning_rate": 1.4655353190167372e-07, + "loss": 0.05, + "step": 13813 + }, + { + "epoch": 0.27, + "learning_rate": 1.4654964855733759e-07, + "loss": 0.1571, + "step": 13814 + }, + { + "epoch": 0.27, + "learning_rate": 1.4654576521300143e-07, + "loss": 0.0014, + "step": 13815 + }, + { + "epoch": 0.27, + "learning_rate": 1.465418818686653e-07, + "loss": 0.0022, + "step": 13816 + }, + { + "epoch": 0.27, + "learning_rate": 1.4653799852432915e-07, + "loss": 0.0014, + "step": 13817 + }, + { + "epoch": 0.27, + "learning_rate": 1.4653411517999302e-07, + "loss": 0.0015, + "step": 13818 + }, + { + "epoch": 0.27, + "learning_rate": 1.4653023183565686e-07, + "loss": 0.0013, + "step": 13819 + }, + { + "epoch": 0.27, + "learning_rate": 1.4652634849132074e-07, + "loss": 0.7514, + "step": 13820 + }, + { + "epoch": 0.27, + "learning_rate": 1.4652246514698458e-07, + "loss": 1.7025, + "step": 13821 + }, + { + "epoch": 0.27, + "learning_rate": 1.4651858180264845e-07, + "loss": 0.0024, + "step": 13822 + }, + { + "epoch": 0.27, + "learning_rate": 1.465146984583123e-07, + "loss": 0.001, + "step": 13823 + }, + { + "epoch": 0.27, + "learning_rate": 1.4651081511397617e-07, + "loss": 0.3201, + "step": 13824 + }, + { + "epoch": 0.27, + "learning_rate": 1.4650693176964e-07, + "loss": 0.2966, + "step": 13825 + }, + { + "epoch": 0.27, + "learning_rate": 1.4650304842530386e-07, + "loss": 0.0014, + "step": 13826 + }, + { + "epoch": 0.27, + "learning_rate": 1.464991650809677e-07, + "loss": 0.4452, + "step": 13827 + }, + { + "epoch": 0.27, + "learning_rate": 1.4649528173663158e-07, + "loss": 0.0016, + "step": 13828 + }, + { + "epoch": 0.27, + "learning_rate": 1.4649139839229542e-07, + "loss": 0.0017, + "step": 13829 + }, + { + "epoch": 0.27, + "learning_rate": 1.464875150479593e-07, + "loss": 0.0019, + "step": 13830 + }, + { + "epoch": 0.27, + "learning_rate": 1.4648363170362314e-07, + "loss": 0.0033, + "step": 13831 + }, + { + "epoch": 0.27, + "learning_rate": 1.46479748359287e-07, + "loss": 0.0013, + "step": 13832 + }, + { + "epoch": 0.27, + "learning_rate": 1.4647586501495085e-07, + "loss": 1.1075, + "step": 13833 + }, + { + "epoch": 0.27, + "learning_rate": 1.4647198167061473e-07, + "loss": 0.0119, + "step": 13834 + }, + { + "epoch": 0.27, + "learning_rate": 1.4646809832627857e-07, + "loss": 0.0013, + "step": 13835 + }, + { + "epoch": 0.27, + "learning_rate": 1.4646421498194244e-07, + "loss": 0.0012, + "step": 13836 + }, + { + "epoch": 0.27, + "learning_rate": 1.4646033163760629e-07, + "loss": 0.0014, + "step": 13837 + }, + { + "epoch": 0.27, + "learning_rate": 1.4645644829327016e-07, + "loss": 0.6935, + "step": 13838 + }, + { + "epoch": 0.27, + "learning_rate": 1.46452564948934e-07, + "loss": 0.0012, + "step": 13839 + }, + { + "epoch": 0.27, + "learning_rate": 1.4644868160459787e-07, + "loss": 0.0014, + "step": 13840 + }, + { + "epoch": 0.27, + "learning_rate": 1.4644479826026172e-07, + "loss": 0.0012, + "step": 13841 + }, + { + "epoch": 0.27, + "learning_rate": 1.464409149159256e-07, + "loss": 0.0014, + "step": 13842 + }, + { + "epoch": 0.27, + "learning_rate": 1.4643703157158944e-07, + "loss": 0.3117, + "step": 13843 + }, + { + "epoch": 0.27, + "learning_rate": 1.464331482272533e-07, + "loss": 0.0016, + "step": 13844 + }, + { + "epoch": 0.27, + "learning_rate": 1.4642926488291715e-07, + "loss": 0.0012, + "step": 13845 + }, + { + "epoch": 0.27, + "learning_rate": 1.4642538153858102e-07, + "loss": 0.0189, + "step": 13846 + }, + { + "epoch": 0.27, + "learning_rate": 1.4642149819424487e-07, + "loss": 0.0016, + "step": 13847 + }, + { + "epoch": 0.27, + "learning_rate": 1.4641761484990874e-07, + "loss": 0.0016, + "step": 13848 + }, + { + "epoch": 0.27, + "learning_rate": 1.4641373150557259e-07, + "loss": 0.0011, + "step": 13849 + }, + { + "epoch": 0.27, + "learning_rate": 1.4640984816123646e-07, + "loss": 0.0013, + "step": 13850 + }, + { + "epoch": 0.27, + "learning_rate": 1.464059648169003e-07, + "loss": 0.0017, + "step": 13851 + }, + { + "epoch": 0.27, + "learning_rate": 1.4640208147256417e-07, + "loss": 0.0009, + "step": 13852 + }, + { + "epoch": 0.27, + "learning_rate": 1.4639819812822802e-07, + "loss": 0.0329, + "step": 13853 + }, + { + "epoch": 0.27, + "learning_rate": 1.463943147838919e-07, + "loss": 0.1008, + "step": 13854 + }, + { + "epoch": 0.27, + "learning_rate": 1.4639043143955574e-07, + "loss": 0.7071, + "step": 13855 + }, + { + "epoch": 0.27, + "learning_rate": 1.463865480952196e-07, + "loss": 0.0026, + "step": 13856 + }, + { + "epoch": 0.27, + "learning_rate": 1.4638266475088345e-07, + "loss": 0.0015, + "step": 13857 + }, + { + "epoch": 0.27, + "learning_rate": 1.4637878140654732e-07, + "loss": 0.0015, + "step": 13858 + }, + { + "epoch": 0.27, + "learning_rate": 1.4637489806221117e-07, + "loss": 0.0026, + "step": 13859 + }, + { + "epoch": 0.27, + "learning_rate": 1.4637101471787504e-07, + "loss": 0.0018, + "step": 13860 + }, + { + "epoch": 0.27, + "learning_rate": 1.4636713137353888e-07, + "loss": 0.0022, + "step": 13861 + }, + { + "epoch": 0.27, + "learning_rate": 1.4636324802920276e-07, + "loss": 0.2504, + "step": 13862 + }, + { + "epoch": 0.27, + "learning_rate": 1.463593646848666e-07, + "loss": 0.0015, + "step": 13863 + }, + { + "epoch": 0.27, + "learning_rate": 1.4635548134053047e-07, + "loss": 0.0039, + "step": 13864 + }, + { + "epoch": 0.27, + "learning_rate": 1.4635159799619432e-07, + "loss": 0.0035, + "step": 13865 + }, + { + "epoch": 0.27, + "learning_rate": 1.463477146518582e-07, + "loss": 0.0019, + "step": 13866 + }, + { + "epoch": 0.27, + "learning_rate": 1.4634383130752203e-07, + "loss": 0.0041, + "step": 13867 + }, + { + "epoch": 0.27, + "learning_rate": 1.463399479631859e-07, + "loss": 0.0031, + "step": 13868 + }, + { + "epoch": 0.27, + "learning_rate": 1.4633606461884975e-07, + "loss": 0.0014, + "step": 13869 + }, + { + "epoch": 0.27, + "learning_rate": 1.4633218127451362e-07, + "loss": 0.0018, + "step": 13870 + }, + { + "epoch": 0.27, + "learning_rate": 1.4632829793017747e-07, + "loss": 0.0021, + "step": 13871 + }, + { + "epoch": 0.27, + "learning_rate": 1.4632441458584134e-07, + "loss": 0.0173, + "step": 13872 + }, + { + "epoch": 0.27, + "learning_rate": 1.4632053124150518e-07, + "loss": 0.0016, + "step": 13873 + }, + { + "epoch": 0.27, + "learning_rate": 1.4631664789716905e-07, + "loss": 0.3192, + "step": 13874 + }, + { + "epoch": 0.27, + "learning_rate": 1.463127645528329e-07, + "loss": 0.0025, + "step": 13875 + }, + { + "epoch": 0.27, + "learning_rate": 1.4630888120849677e-07, + "loss": 0.6255, + "step": 13876 + }, + { + "epoch": 0.27, + "learning_rate": 1.4630499786416062e-07, + "loss": 0.004, + "step": 13877 + }, + { + "epoch": 0.27, + "learning_rate": 1.463011145198245e-07, + "loss": 0.3016, + "step": 13878 + }, + { + "epoch": 0.27, + "learning_rate": 1.4629723117548833e-07, + "loss": 0.0016, + "step": 13879 + }, + { + "epoch": 0.27, + "learning_rate": 1.462933478311522e-07, + "loss": 0.0014, + "step": 13880 + }, + { + "epoch": 0.27, + "learning_rate": 1.4628946448681605e-07, + "loss": 0.0128, + "step": 13881 + }, + { + "epoch": 0.27, + "learning_rate": 1.4628558114247992e-07, + "loss": 0.0013, + "step": 13882 + }, + { + "epoch": 0.27, + "learning_rate": 1.4628169779814374e-07, + "loss": 0.0012, + "step": 13883 + }, + { + "epoch": 0.27, + "learning_rate": 1.462778144538076e-07, + "loss": 1.1058, + "step": 13884 + }, + { + "epoch": 0.27, + "learning_rate": 1.4627393110947146e-07, + "loss": 0.8336, + "step": 13885 + }, + { + "epoch": 0.27, + "learning_rate": 1.4627004776513533e-07, + "loss": 0.0009, + "step": 13886 + }, + { + "epoch": 0.27, + "learning_rate": 1.4626616442079917e-07, + "loss": 1.077, + "step": 13887 + }, + { + "epoch": 0.27, + "learning_rate": 1.4626228107646304e-07, + "loss": 0.0016, + "step": 13888 + }, + { + "epoch": 0.27, + "learning_rate": 1.462583977321269e-07, + "loss": 0.0016, + "step": 13889 + }, + { + "epoch": 0.27, + "learning_rate": 1.4625451438779076e-07, + "loss": 0.0012, + "step": 13890 + }, + { + "epoch": 0.27, + "learning_rate": 1.462506310434546e-07, + "loss": 0.0017, + "step": 13891 + }, + { + "epoch": 0.27, + "learning_rate": 1.4624674769911848e-07, + "loss": 0.0135, + "step": 13892 + }, + { + "epoch": 0.27, + "learning_rate": 1.4624286435478232e-07, + "loss": 0.0012, + "step": 13893 + }, + { + "epoch": 0.27, + "learning_rate": 1.462389810104462e-07, + "loss": 0.0022, + "step": 13894 + }, + { + "epoch": 0.27, + "learning_rate": 1.4623509766611004e-07, + "loss": 0.0012, + "step": 13895 + }, + { + "epoch": 0.27, + "learning_rate": 1.462312143217739e-07, + "loss": 0.0016, + "step": 13896 + }, + { + "epoch": 0.27, + "learning_rate": 1.4622733097743775e-07, + "loss": 0.001, + "step": 13897 + }, + { + "epoch": 0.27, + "learning_rate": 1.4622344763310163e-07, + "loss": 0.4111, + "step": 13898 + }, + { + "epoch": 0.27, + "learning_rate": 1.4621956428876547e-07, + "loss": 0.0177, + "step": 13899 + }, + { + "epoch": 0.27, + "learning_rate": 1.4621568094442934e-07, + "loss": 0.0013, + "step": 13900 + }, + { + "epoch": 0.27, + "learning_rate": 1.462117976000932e-07, + "loss": 0.0024, + "step": 13901 + }, + { + "epoch": 0.27, + "learning_rate": 1.4620791425575706e-07, + "loss": 0.0073, + "step": 13902 + }, + { + "epoch": 0.27, + "learning_rate": 1.462040309114209e-07, + "loss": 0.0031, + "step": 13903 + }, + { + "epoch": 0.27, + "learning_rate": 1.4620014756708478e-07, + "loss": 0.0014, + "step": 13904 + }, + { + "epoch": 0.27, + "learning_rate": 1.4619626422274862e-07, + "loss": 0.0012, + "step": 13905 + }, + { + "epoch": 0.27, + "learning_rate": 1.461923808784125e-07, + "loss": 0.6858, + "step": 13906 + }, + { + "epoch": 0.27, + "learning_rate": 1.4618849753407634e-07, + "loss": 0.0299, + "step": 13907 + }, + { + "epoch": 0.27, + "learning_rate": 1.461846141897402e-07, + "loss": 0.0013, + "step": 13908 + }, + { + "epoch": 0.27, + "learning_rate": 1.4618073084540405e-07, + "loss": 0.0012, + "step": 13909 + }, + { + "epoch": 0.27, + "learning_rate": 1.4617684750106793e-07, + "loss": 0.0014, + "step": 13910 + }, + { + "epoch": 0.27, + "learning_rate": 1.4617296415673177e-07, + "loss": 0.0478, + "step": 13911 + }, + { + "epoch": 0.27, + "learning_rate": 1.4616908081239564e-07, + "loss": 0.4654, + "step": 13912 + }, + { + "epoch": 0.27, + "learning_rate": 1.4616519746805949e-07, + "loss": 0.0357, + "step": 13913 + }, + { + "epoch": 0.27, + "learning_rate": 1.4616131412372333e-07, + "loss": 0.0015, + "step": 13914 + }, + { + "epoch": 0.27, + "learning_rate": 1.461574307793872e-07, + "loss": 0.0018, + "step": 13915 + }, + { + "epoch": 0.27, + "learning_rate": 1.4615354743505105e-07, + "loss": 0.0023, + "step": 13916 + }, + { + "epoch": 0.27, + "learning_rate": 1.4614966409071492e-07, + "loss": 0.001, + "step": 13917 + }, + { + "epoch": 0.27, + "learning_rate": 1.4614578074637876e-07, + "loss": 0.0018, + "step": 13918 + }, + { + "epoch": 0.27, + "learning_rate": 1.4614189740204264e-07, + "loss": 0.0015, + "step": 13919 + }, + { + "epoch": 0.27, + "learning_rate": 1.4613801405770648e-07, + "loss": 0.0041, + "step": 13920 + }, + { + "epoch": 0.27, + "learning_rate": 1.4613413071337035e-07, + "loss": 0.001, + "step": 13921 + }, + { + "epoch": 0.27, + "learning_rate": 1.461302473690342e-07, + "loss": 0.0016, + "step": 13922 + }, + { + "epoch": 0.27, + "learning_rate": 1.4612636402469807e-07, + "loss": 0.0013, + "step": 13923 + }, + { + "epoch": 0.27, + "learning_rate": 1.4612248068036191e-07, + "loss": 0.0014, + "step": 13924 + }, + { + "epoch": 0.27, + "learning_rate": 1.4611859733602579e-07, + "loss": 0.0016, + "step": 13925 + }, + { + "epoch": 0.27, + "learning_rate": 1.4611471399168963e-07, + "loss": 0.0038, + "step": 13926 + }, + { + "epoch": 0.27, + "learning_rate": 1.461108306473535e-07, + "loss": 0.1819, + "step": 13927 + }, + { + "epoch": 0.27, + "learning_rate": 1.4610694730301735e-07, + "loss": 0.0013, + "step": 13928 + }, + { + "epoch": 0.27, + "learning_rate": 1.4610306395868122e-07, + "loss": 0.0016, + "step": 13929 + }, + { + "epoch": 0.27, + "learning_rate": 1.4609918061434506e-07, + "loss": 0.0016, + "step": 13930 + }, + { + "epoch": 0.27, + "learning_rate": 1.4609529727000894e-07, + "loss": 0.0021, + "step": 13931 + }, + { + "epoch": 0.27, + "learning_rate": 1.4609141392567278e-07, + "loss": 0.0012, + "step": 13932 + }, + { + "epoch": 0.27, + "learning_rate": 1.4608753058133665e-07, + "loss": 0.0013, + "step": 13933 + }, + { + "epoch": 0.27, + "learning_rate": 1.460836472370005e-07, + "loss": 0.0013, + "step": 13934 + }, + { + "epoch": 0.27, + "learning_rate": 1.4607976389266437e-07, + "loss": 0.0012, + "step": 13935 + }, + { + "epoch": 0.27, + "learning_rate": 1.460758805483282e-07, + "loss": 0.0021, + "step": 13936 + }, + { + "epoch": 0.27, + "learning_rate": 1.4607199720399208e-07, + "loss": 0.0013, + "step": 13937 + }, + { + "epoch": 0.27, + "learning_rate": 1.4606811385965593e-07, + "loss": 0.0011, + "step": 13938 + }, + { + "epoch": 0.27, + "learning_rate": 1.460642305153198e-07, + "loss": 0.0012, + "step": 13939 + }, + { + "epoch": 0.27, + "learning_rate": 1.4606034717098365e-07, + "loss": 0.0015, + "step": 13940 + }, + { + "epoch": 0.27, + "learning_rate": 1.460564638266475e-07, + "loss": 0.0018, + "step": 13941 + }, + { + "epoch": 0.27, + "learning_rate": 1.4605258048231136e-07, + "loss": 0.1865, + "step": 13942 + }, + { + "epoch": 0.27, + "learning_rate": 1.460486971379752e-07, + "loss": 0.305, + "step": 13943 + }, + { + "epoch": 0.27, + "learning_rate": 1.4604481379363905e-07, + "loss": 0.0047, + "step": 13944 + }, + { + "epoch": 0.27, + "learning_rate": 1.4604093044930292e-07, + "loss": 0.0011, + "step": 13945 + }, + { + "epoch": 0.27, + "learning_rate": 1.4603704710496677e-07, + "loss": 0.0039, + "step": 13946 + }, + { + "epoch": 0.27, + "learning_rate": 1.4603316376063064e-07, + "loss": 0.0016, + "step": 13947 + }, + { + "epoch": 0.27, + "learning_rate": 1.4602928041629449e-07, + "loss": 0.0011, + "step": 13948 + }, + { + "epoch": 0.27, + "learning_rate": 1.4602539707195836e-07, + "loss": 0.0017, + "step": 13949 + }, + { + "epoch": 0.27, + "learning_rate": 1.460215137276222e-07, + "loss": 0.0014, + "step": 13950 + }, + { + "epoch": 0.27, + "learning_rate": 1.4601763038328607e-07, + "loss": 0.0015, + "step": 13951 + }, + { + "epoch": 0.27, + "learning_rate": 1.4601374703894992e-07, + "loss": 0.0017, + "step": 13952 + }, + { + "epoch": 0.27, + "learning_rate": 1.460098636946138e-07, + "loss": 0.0697, + "step": 13953 + }, + { + "epoch": 0.27, + "learning_rate": 1.4600598035027764e-07, + "loss": 0.0013, + "step": 13954 + }, + { + "epoch": 0.27, + "learning_rate": 1.460020970059415e-07, + "loss": 0.4886, + "step": 13955 + }, + { + "epoch": 0.27, + "learning_rate": 1.4599821366160535e-07, + "loss": 0.0083, + "step": 13956 + }, + { + "epoch": 0.27, + "learning_rate": 1.4599433031726922e-07, + "loss": 0.0022, + "step": 13957 + }, + { + "epoch": 0.27, + "learning_rate": 1.4599044697293307e-07, + "loss": 0.0012, + "step": 13958 + }, + { + "epoch": 0.27, + "learning_rate": 1.4598656362859694e-07, + "loss": 0.0458, + "step": 13959 + }, + { + "epoch": 0.27, + "learning_rate": 1.4598268028426078e-07, + "loss": 0.097, + "step": 13960 + }, + { + "epoch": 0.27, + "learning_rate": 1.4597879693992466e-07, + "loss": 0.0789, + "step": 13961 + }, + { + "epoch": 0.27, + "learning_rate": 1.459749135955885e-07, + "loss": 0.0016, + "step": 13962 + }, + { + "epoch": 0.27, + "learning_rate": 1.4597103025125237e-07, + "loss": 0.0026, + "step": 13963 + }, + { + "epoch": 0.27, + "learning_rate": 1.4596714690691622e-07, + "loss": 0.0025, + "step": 13964 + }, + { + "epoch": 0.27, + "learning_rate": 1.459632635625801e-07, + "loss": 0.0015, + "step": 13965 + }, + { + "epoch": 0.27, + "learning_rate": 1.4595938021824393e-07, + "loss": 0.002, + "step": 13966 + }, + { + "epoch": 0.27, + "learning_rate": 1.459554968739078e-07, + "loss": 0.0016, + "step": 13967 + }, + { + "epoch": 0.27, + "learning_rate": 1.4595161352957165e-07, + "loss": 0.0013, + "step": 13968 + }, + { + "epoch": 0.27, + "learning_rate": 1.4594773018523552e-07, + "loss": 0.2065, + "step": 13969 + }, + { + "epoch": 0.27, + "learning_rate": 1.4594384684089937e-07, + "loss": 0.0016, + "step": 13970 + }, + { + "epoch": 0.27, + "learning_rate": 1.4593996349656324e-07, + "loss": 0.0013, + "step": 13971 + }, + { + "epoch": 0.27, + "learning_rate": 1.4593608015222708e-07, + "loss": 0.0256, + "step": 13972 + }, + { + "epoch": 0.27, + "learning_rate": 1.4593219680789095e-07, + "loss": 0.0049, + "step": 13973 + }, + { + "epoch": 0.27, + "learning_rate": 1.459283134635548e-07, + "loss": 0.0012, + "step": 13974 + }, + { + "epoch": 0.27, + "learning_rate": 1.4592443011921867e-07, + "loss": 0.0018, + "step": 13975 + }, + { + "epoch": 0.27, + "learning_rate": 1.4592054677488252e-07, + "loss": 0.0021, + "step": 13976 + }, + { + "epoch": 0.27, + "learning_rate": 1.459166634305464e-07, + "loss": 0.0041, + "step": 13977 + }, + { + "epoch": 0.27, + "learning_rate": 1.4591278008621023e-07, + "loss": 0.9642, + "step": 13978 + }, + { + "epoch": 0.27, + "learning_rate": 1.459088967418741e-07, + "loss": 0.0015, + "step": 13979 + }, + { + "epoch": 0.27, + "learning_rate": 1.4590501339753795e-07, + "loss": 0.0016, + "step": 13980 + }, + { + "epoch": 0.27, + "learning_rate": 1.4590113005320182e-07, + "loss": 0.0022, + "step": 13981 + }, + { + "epoch": 0.27, + "learning_rate": 1.4589724670886567e-07, + "loss": 0.0013, + "step": 13982 + }, + { + "epoch": 0.27, + "learning_rate": 1.4589336336452954e-07, + "loss": 0.0013, + "step": 13983 + }, + { + "epoch": 0.27, + "learning_rate": 1.4588948002019338e-07, + "loss": 0.138, + "step": 13984 + }, + { + "epoch": 0.27, + "learning_rate": 1.4588559667585725e-07, + "loss": 0.0012, + "step": 13985 + }, + { + "epoch": 0.27, + "learning_rate": 1.458817133315211e-07, + "loss": 0.0029, + "step": 13986 + }, + { + "epoch": 0.27, + "learning_rate": 1.4587782998718497e-07, + "loss": 0.0109, + "step": 13987 + }, + { + "epoch": 0.27, + "learning_rate": 1.4587394664284882e-07, + "loss": 0.0154, + "step": 13988 + }, + { + "epoch": 0.27, + "learning_rate": 1.458700632985127e-07, + "loss": 0.0023, + "step": 13989 + }, + { + "epoch": 0.27, + "learning_rate": 1.4586617995417653e-07, + "loss": 0.0097, + "step": 13990 + }, + { + "epoch": 0.27, + "learning_rate": 1.458622966098404e-07, + "loss": 0.0011, + "step": 13991 + }, + { + "epoch": 0.27, + "learning_rate": 1.4585841326550425e-07, + "loss": 0.0012, + "step": 13992 + }, + { + "epoch": 0.27, + "learning_rate": 1.4585452992116812e-07, + "loss": 0.0016, + "step": 13993 + }, + { + "epoch": 0.27, + "learning_rate": 1.4585064657683196e-07, + "loss": 0.0497, + "step": 13994 + }, + { + "epoch": 0.27, + "learning_rate": 1.4584676323249584e-07, + "loss": 0.0137, + "step": 13995 + }, + { + "epoch": 0.27, + "learning_rate": 1.4584287988815968e-07, + "loss": 0.0139, + "step": 13996 + }, + { + "epoch": 0.27, + "learning_rate": 1.4583899654382355e-07, + "loss": 0.0012, + "step": 13997 + }, + { + "epoch": 0.27, + "learning_rate": 1.458351131994874e-07, + "loss": 0.006, + "step": 13998 + }, + { + "epoch": 0.27, + "learning_rate": 1.4583122985515124e-07, + "loss": 0.0012, + "step": 13999 + }, + { + "epoch": 0.27, + "learning_rate": 1.458273465108151e-07, + "loss": 0.002, + "step": 14000 + }, + { + "epoch": 0.27, + "learning_rate": 1.4582346316647896e-07, + "loss": 0.0021, + "step": 14001 + }, + { + "epoch": 0.27, + "learning_rate": 1.458195798221428e-07, + "loss": 0.0012, + "step": 14002 + }, + { + "epoch": 0.27, + "learning_rate": 1.4581569647780668e-07, + "loss": 0.001, + "step": 14003 + }, + { + "epoch": 0.27, + "learning_rate": 1.4581181313347052e-07, + "loss": 0.0023, + "step": 14004 + }, + { + "epoch": 0.27, + "learning_rate": 1.458079297891344e-07, + "loss": 0.0019, + "step": 14005 + }, + { + "epoch": 0.27, + "learning_rate": 1.4580404644479824e-07, + "loss": 0.0017, + "step": 14006 + }, + { + "epoch": 0.27, + "learning_rate": 1.458001631004621e-07, + "loss": 0.0013, + "step": 14007 + }, + { + "epoch": 0.27, + "learning_rate": 1.4579627975612595e-07, + "loss": 0.0148, + "step": 14008 + }, + { + "epoch": 0.27, + "learning_rate": 1.4579239641178983e-07, + "loss": 0.1611, + "step": 14009 + }, + { + "epoch": 0.27, + "learning_rate": 1.4578851306745367e-07, + "loss": 0.9346, + "step": 14010 + }, + { + "epoch": 0.27, + "learning_rate": 1.4578462972311754e-07, + "loss": 0.9202, + "step": 14011 + }, + { + "epoch": 0.27, + "learning_rate": 1.4578074637878139e-07, + "loss": 0.0016, + "step": 14012 + }, + { + "epoch": 0.27, + "learning_rate": 1.4577686303444526e-07, + "loss": 0.0071, + "step": 14013 + }, + { + "epoch": 0.27, + "learning_rate": 1.457729796901091e-07, + "loss": 0.0027, + "step": 14014 + }, + { + "epoch": 0.27, + "learning_rate": 1.4576909634577297e-07, + "loss": 0.0165, + "step": 14015 + }, + { + "epoch": 0.27, + "learning_rate": 1.4576521300143682e-07, + "loss": 0.9502, + "step": 14016 + }, + { + "epoch": 0.27, + "learning_rate": 1.457613296571007e-07, + "loss": 0.0013, + "step": 14017 + }, + { + "epoch": 0.27, + "learning_rate": 1.4575744631276454e-07, + "loss": 0.0022, + "step": 14018 + }, + { + "epoch": 0.27, + "learning_rate": 1.457535629684284e-07, + "loss": 0.0034, + "step": 14019 + }, + { + "epoch": 0.27, + "learning_rate": 1.4574967962409225e-07, + "loss": 0.0197, + "step": 14020 + }, + { + "epoch": 0.27, + "learning_rate": 1.4574579627975612e-07, + "loss": 0.0077, + "step": 14021 + }, + { + "epoch": 0.27, + "learning_rate": 1.4574191293541997e-07, + "loss": 0.0335, + "step": 14022 + }, + { + "epoch": 0.27, + "learning_rate": 1.4573802959108384e-07, + "loss": 0.0018, + "step": 14023 + }, + { + "epoch": 0.27, + "learning_rate": 1.4573414624674769e-07, + "loss": 0.0012, + "step": 14024 + }, + { + "epoch": 0.27, + "learning_rate": 1.4573026290241156e-07, + "loss": 0.0012, + "step": 14025 + }, + { + "epoch": 0.27, + "learning_rate": 1.457263795580754e-07, + "loss": 0.2985, + "step": 14026 + }, + { + "epoch": 0.27, + "learning_rate": 1.4572249621373927e-07, + "loss": 0.0012, + "step": 14027 + }, + { + "epoch": 0.27, + "learning_rate": 1.4571861286940312e-07, + "loss": 0.0017, + "step": 14028 + }, + { + "epoch": 0.27, + "learning_rate": 1.45714729525067e-07, + "loss": 0.008, + "step": 14029 + }, + { + "epoch": 0.27, + "learning_rate": 1.4571084618073084e-07, + "loss": 0.0014, + "step": 14030 + }, + { + "epoch": 0.27, + "learning_rate": 1.457069628363947e-07, + "loss": 0.0014, + "step": 14031 + }, + { + "epoch": 0.27, + "learning_rate": 1.4570307949205855e-07, + "loss": 0.7017, + "step": 14032 + }, + { + "epoch": 0.27, + "learning_rate": 1.4569919614772242e-07, + "loss": 0.0047, + "step": 14033 + }, + { + "epoch": 0.27, + "learning_rate": 1.4569531280338627e-07, + "loss": 0.0122, + "step": 14034 + }, + { + "epoch": 0.27, + "learning_rate": 1.4569142945905014e-07, + "loss": 0.8599, + "step": 14035 + }, + { + "epoch": 0.27, + "learning_rate": 1.4568754611471398e-07, + "loss": 1.2052, + "step": 14036 + }, + { + "epoch": 0.27, + "learning_rate": 1.4568366277037786e-07, + "loss": 0.0016, + "step": 14037 + }, + { + "epoch": 0.27, + "learning_rate": 1.456797794260417e-07, + "loss": 0.482, + "step": 14038 + }, + { + "epoch": 0.27, + "learning_rate": 1.4567589608170557e-07, + "loss": 0.0024, + "step": 14039 + }, + { + "epoch": 0.27, + "learning_rate": 1.4567201273736942e-07, + "loss": 0.0014, + "step": 14040 + }, + { + "epoch": 0.27, + "learning_rate": 1.456681293930333e-07, + "loss": 0.0013, + "step": 14041 + }, + { + "epoch": 0.27, + "learning_rate": 1.4566424604869713e-07, + "loss": 0.123, + "step": 14042 + }, + { + "epoch": 0.27, + "learning_rate": 1.45660362704361e-07, + "loss": 0.0014, + "step": 14043 + }, + { + "epoch": 0.27, + "learning_rate": 1.4565647936002485e-07, + "loss": 0.0017, + "step": 14044 + }, + { + "epoch": 0.27, + "learning_rate": 1.4565259601568872e-07, + "loss": 0.0013, + "step": 14045 + }, + { + "epoch": 0.27, + "learning_rate": 1.4564871267135257e-07, + "loss": 0.0011, + "step": 14046 + }, + { + "epoch": 0.27, + "learning_rate": 1.4564482932701644e-07, + "loss": 0.0596, + "step": 14047 + }, + { + "epoch": 0.27, + "learning_rate": 1.4564094598268028e-07, + "loss": 0.0015, + "step": 14048 + }, + { + "epoch": 0.27, + "learning_rate": 1.4563706263834415e-07, + "loss": 0.0014, + "step": 14049 + }, + { + "epoch": 0.27, + "learning_rate": 1.45633179294008e-07, + "loss": 0.002, + "step": 14050 + }, + { + "epoch": 0.27, + "learning_rate": 1.4562929594967187e-07, + "loss": 0.0014, + "step": 14051 + }, + { + "epoch": 0.27, + "learning_rate": 1.4562541260533572e-07, + "loss": 0.0021, + "step": 14052 + }, + { + "epoch": 0.27, + "learning_rate": 1.456215292609996e-07, + "loss": 0.0015, + "step": 14053 + }, + { + "epoch": 0.27, + "learning_rate": 1.4561764591666343e-07, + "loss": 0.0014, + "step": 14054 + }, + { + "epoch": 0.27, + "learning_rate": 1.456137625723273e-07, + "loss": 0.0485, + "step": 14055 + }, + { + "epoch": 0.27, + "learning_rate": 1.4560987922799115e-07, + "loss": 0.0025, + "step": 14056 + }, + { + "epoch": 0.27, + "learning_rate": 1.45605995883655e-07, + "loss": 0.0012, + "step": 14057 + }, + { + "epoch": 0.27, + "learning_rate": 1.4560211253931884e-07, + "loss": 0.0015, + "step": 14058 + }, + { + "epoch": 0.27, + "learning_rate": 1.455982291949827e-07, + "loss": 0.0019, + "step": 14059 + }, + { + "epoch": 0.27, + "learning_rate": 1.4559434585064656e-07, + "loss": 1.5833, + "step": 14060 + }, + { + "epoch": 0.27, + "learning_rate": 1.4559046250631043e-07, + "loss": 0.0014, + "step": 14061 + }, + { + "epoch": 0.27, + "learning_rate": 1.4558657916197427e-07, + "loss": 0.1121, + "step": 14062 + }, + { + "epoch": 0.27, + "learning_rate": 1.4558269581763814e-07, + "loss": 0.0018, + "step": 14063 + }, + { + "epoch": 0.27, + "learning_rate": 1.45578812473302e-07, + "loss": 0.001, + "step": 14064 + }, + { + "epoch": 0.27, + "learning_rate": 1.4557492912896586e-07, + "loss": 1.4666, + "step": 14065 + }, + { + "epoch": 0.27, + "learning_rate": 1.455710457846297e-07, + "loss": 0.0916, + "step": 14066 + }, + { + "epoch": 0.27, + "learning_rate": 1.4556716244029358e-07, + "loss": 0.0065, + "step": 14067 + }, + { + "epoch": 0.27, + "learning_rate": 1.4556327909595742e-07, + "loss": 0.0016, + "step": 14068 + }, + { + "epoch": 0.27, + "learning_rate": 1.455593957516213e-07, + "loss": 0.0018, + "step": 14069 + }, + { + "epoch": 0.27, + "learning_rate": 1.4555551240728514e-07, + "loss": 0.0582, + "step": 14070 + }, + { + "epoch": 0.27, + "learning_rate": 1.45551629062949e-07, + "loss": 0.0009, + "step": 14071 + }, + { + "epoch": 0.27, + "learning_rate": 1.4554774571861285e-07, + "loss": 0.3827, + "step": 14072 + }, + { + "epoch": 0.27, + "learning_rate": 1.4554386237427673e-07, + "loss": 0.0012, + "step": 14073 + }, + { + "epoch": 0.27, + "learning_rate": 1.4553997902994057e-07, + "loss": 0.3188, + "step": 14074 + }, + { + "epoch": 0.27, + "learning_rate": 1.4553609568560444e-07, + "loss": 0.0023, + "step": 14075 + }, + { + "epoch": 0.27, + "learning_rate": 1.455322123412683e-07, + "loss": 0.1291, + "step": 14076 + }, + { + "epoch": 0.27, + "learning_rate": 1.4552832899693216e-07, + "loss": 0.0015, + "step": 14077 + }, + { + "epoch": 0.27, + "learning_rate": 1.45524445652596e-07, + "loss": 0.0015, + "step": 14078 + }, + { + "epoch": 0.27, + "learning_rate": 1.4552056230825988e-07, + "loss": 0.0015, + "step": 14079 + }, + { + "epoch": 0.27, + "learning_rate": 1.4551667896392372e-07, + "loss": 0.0013, + "step": 14080 + }, + { + "epoch": 0.27, + "learning_rate": 1.455127956195876e-07, + "loss": 0.6095, + "step": 14081 + }, + { + "epoch": 0.27, + "learning_rate": 1.4550891227525144e-07, + "loss": 0.0016, + "step": 14082 + }, + { + "epoch": 0.27, + "learning_rate": 1.455050289309153e-07, + "loss": 0.0015, + "step": 14083 + }, + { + "epoch": 0.27, + "learning_rate": 1.4550114558657915e-07, + "loss": 0.5143, + "step": 14084 + }, + { + "epoch": 0.27, + "learning_rate": 1.4549726224224303e-07, + "loss": 0.0018, + "step": 14085 + }, + { + "epoch": 0.27, + "learning_rate": 1.4549337889790687e-07, + "loss": 0.0014, + "step": 14086 + }, + { + "epoch": 0.27, + "learning_rate": 1.4548949555357074e-07, + "loss": 0.0022, + "step": 14087 + }, + { + "epoch": 0.27, + "learning_rate": 1.454856122092346e-07, + "loss": 1.5892, + "step": 14088 + }, + { + "epoch": 0.27, + "learning_rate": 1.4548172886489846e-07, + "loss": 0.004, + "step": 14089 + }, + { + "epoch": 0.27, + "learning_rate": 1.454778455205623e-07, + "loss": 0.0014, + "step": 14090 + }, + { + "epoch": 0.27, + "learning_rate": 1.4547396217622615e-07, + "loss": 0.0028, + "step": 14091 + }, + { + "epoch": 0.27, + "learning_rate": 1.4547007883189002e-07, + "loss": 0.0016, + "step": 14092 + }, + { + "epoch": 0.27, + "learning_rate": 1.4546619548755386e-07, + "loss": 0.0032, + "step": 14093 + }, + { + "epoch": 0.27, + "learning_rate": 1.4546231214321774e-07, + "loss": 0.0015, + "step": 14094 + }, + { + "epoch": 0.27, + "learning_rate": 1.4545842879888158e-07, + "loss": 0.0942, + "step": 14095 + }, + { + "epoch": 0.27, + "learning_rate": 1.4545454545454545e-07, + "loss": 0.0354, + "step": 14096 + }, + { + "epoch": 0.27, + "learning_rate": 1.454506621102093e-07, + "loss": 0.0103, + "step": 14097 + }, + { + "epoch": 0.27, + "learning_rate": 1.4544677876587317e-07, + "loss": 0.0015, + "step": 14098 + }, + { + "epoch": 0.27, + "learning_rate": 1.4544289542153701e-07, + "loss": 0.0055, + "step": 14099 + }, + { + "epoch": 0.27, + "learning_rate": 1.4543901207720089e-07, + "loss": 0.0011, + "step": 14100 + }, + { + "epoch": 0.27, + "learning_rate": 1.4543512873286473e-07, + "loss": 0.0056, + "step": 14101 + }, + { + "epoch": 0.27, + "learning_rate": 1.454312453885286e-07, + "loss": 0.2762, + "step": 14102 + }, + { + "epoch": 0.27, + "learning_rate": 1.4542736204419245e-07, + "loss": 0.0018, + "step": 14103 + }, + { + "epoch": 0.27, + "learning_rate": 1.4542347869985632e-07, + "loss": 0.0219, + "step": 14104 + }, + { + "epoch": 0.27, + "learning_rate": 1.4541959535552016e-07, + "loss": 0.0213, + "step": 14105 + }, + { + "epoch": 0.27, + "learning_rate": 1.4541571201118404e-07, + "loss": 0.0012, + "step": 14106 + }, + { + "epoch": 0.27, + "learning_rate": 1.4541182866684788e-07, + "loss": 0.0012, + "step": 14107 + }, + { + "epoch": 0.27, + "learning_rate": 1.4540794532251175e-07, + "loss": 0.0038, + "step": 14108 + }, + { + "epoch": 0.27, + "learning_rate": 1.454040619781756e-07, + "loss": 0.0014, + "step": 14109 + }, + { + "epoch": 0.27, + "learning_rate": 1.4540017863383947e-07, + "loss": 0.4558, + "step": 14110 + }, + { + "epoch": 0.27, + "learning_rate": 1.453962952895033e-07, + "loss": 0.001, + "step": 14111 + }, + { + "epoch": 0.27, + "learning_rate": 1.4539241194516718e-07, + "loss": 0.0015, + "step": 14112 + }, + { + "epoch": 0.27, + "learning_rate": 1.4538852860083103e-07, + "loss": 0.0513, + "step": 14113 + }, + { + "epoch": 0.27, + "learning_rate": 1.453846452564949e-07, + "loss": 0.8576, + "step": 14114 + }, + { + "epoch": 0.27, + "learning_rate": 1.4538076191215875e-07, + "loss": 0.0013, + "step": 14115 + }, + { + "epoch": 0.27, + "learning_rate": 1.453768785678226e-07, + "loss": 0.0018, + "step": 14116 + }, + { + "epoch": 0.27, + "learning_rate": 1.4537299522348646e-07, + "loss": 0.0013, + "step": 14117 + }, + { + "epoch": 0.27, + "learning_rate": 1.453691118791503e-07, + "loss": 0.0012, + "step": 14118 + }, + { + "epoch": 0.27, + "learning_rate": 1.4536522853481418e-07, + "loss": 0.0947, + "step": 14119 + }, + { + "epoch": 0.27, + "learning_rate": 1.4536134519047802e-07, + "loss": 0.0012, + "step": 14120 + }, + { + "epoch": 0.27, + "learning_rate": 1.4535746184614187e-07, + "loss": 0.9532, + "step": 14121 + }, + { + "epoch": 0.27, + "learning_rate": 1.4535357850180574e-07, + "loss": 0.0205, + "step": 14122 + }, + { + "epoch": 0.27, + "learning_rate": 1.4534969515746959e-07, + "loss": 0.0014, + "step": 14123 + }, + { + "epoch": 0.27, + "learning_rate": 1.4534581181313346e-07, + "loss": 0.0012, + "step": 14124 + }, + { + "epoch": 0.27, + "learning_rate": 1.453419284687973e-07, + "loss": 0.0015, + "step": 14125 + }, + { + "epoch": 0.27, + "learning_rate": 1.4533804512446117e-07, + "loss": 0.0014, + "step": 14126 + }, + { + "epoch": 0.27, + "learning_rate": 1.4533416178012502e-07, + "loss": 0.003, + "step": 14127 + }, + { + "epoch": 0.27, + "learning_rate": 1.453302784357889e-07, + "loss": 0.7178, + "step": 14128 + }, + { + "epoch": 0.27, + "learning_rate": 1.4532639509145274e-07, + "loss": 0.1138, + "step": 14129 + }, + { + "epoch": 0.27, + "learning_rate": 1.453225117471166e-07, + "loss": 0.0321, + "step": 14130 + }, + { + "epoch": 0.27, + "learning_rate": 1.4531862840278045e-07, + "loss": 0.0014, + "step": 14131 + }, + { + "epoch": 0.27, + "learning_rate": 1.4531474505844432e-07, + "loss": 0.0025, + "step": 14132 + }, + { + "epoch": 0.27, + "learning_rate": 1.4531086171410817e-07, + "loss": 0.0012, + "step": 14133 + }, + { + "epoch": 0.27, + "learning_rate": 1.4530697836977204e-07, + "loss": 0.0013, + "step": 14134 + }, + { + "epoch": 0.27, + "learning_rate": 1.4530309502543588e-07, + "loss": 0.0065, + "step": 14135 + }, + { + "epoch": 0.27, + "learning_rate": 1.4529921168109976e-07, + "loss": 0.0021, + "step": 14136 + }, + { + "epoch": 0.27, + "learning_rate": 1.452953283367636e-07, + "loss": 0.0015, + "step": 14137 + }, + { + "epoch": 0.27, + "learning_rate": 1.4529144499242747e-07, + "loss": 0.0012, + "step": 14138 + }, + { + "epoch": 0.27, + "learning_rate": 1.4528756164809132e-07, + "loss": 0.5913, + "step": 14139 + }, + { + "epoch": 0.27, + "learning_rate": 1.452836783037552e-07, + "loss": 0.1205, + "step": 14140 + }, + { + "epoch": 0.27, + "learning_rate": 1.4527979495941903e-07, + "loss": 1.8675, + "step": 14141 + }, + { + "epoch": 0.27, + "learning_rate": 1.452759116150829e-07, + "loss": 0.4942, + "step": 14142 + }, + { + "epoch": 0.27, + "learning_rate": 1.4527202827074675e-07, + "loss": 0.0012, + "step": 14143 + }, + { + "epoch": 0.27, + "learning_rate": 1.4526814492641062e-07, + "loss": 0.0014, + "step": 14144 + }, + { + "epoch": 0.27, + "learning_rate": 1.4526426158207447e-07, + "loss": 0.0013, + "step": 14145 + }, + { + "epoch": 0.27, + "learning_rate": 1.4526037823773834e-07, + "loss": 0.0012, + "step": 14146 + }, + { + "epoch": 0.27, + "learning_rate": 1.4525649489340218e-07, + "loss": 0.3018, + "step": 14147 + }, + { + "epoch": 0.27, + "learning_rate": 1.4525261154906606e-07, + "loss": 0.0013, + "step": 14148 + }, + { + "epoch": 0.27, + "learning_rate": 1.452487282047299e-07, + "loss": 0.0013, + "step": 14149 + }, + { + "epoch": 0.27, + "learning_rate": 1.4524484486039377e-07, + "loss": 0.0016, + "step": 14150 + }, + { + "epoch": 0.27, + "learning_rate": 1.4524096151605762e-07, + "loss": 0.0028, + "step": 14151 + }, + { + "epoch": 0.27, + "learning_rate": 1.452370781717215e-07, + "loss": 0.0018, + "step": 14152 + }, + { + "epoch": 0.27, + "learning_rate": 1.4523319482738533e-07, + "loss": 0.0061, + "step": 14153 + }, + { + "epoch": 0.27, + "learning_rate": 1.452293114830492e-07, + "loss": 0.0016, + "step": 14154 + }, + { + "epoch": 0.27, + "learning_rate": 1.4522542813871305e-07, + "loss": 0.0028, + "step": 14155 + }, + { + "epoch": 0.27, + "learning_rate": 1.4522154479437692e-07, + "loss": 0.0012, + "step": 14156 + }, + { + "epoch": 0.27, + "learning_rate": 1.4521766145004077e-07, + "loss": 0.0012, + "step": 14157 + }, + { + "epoch": 0.27, + "learning_rate": 1.4521377810570464e-07, + "loss": 0.0016, + "step": 14158 + }, + { + "epoch": 0.27, + "learning_rate": 1.4520989476136848e-07, + "loss": 0.7311, + "step": 14159 + }, + { + "epoch": 0.27, + "learning_rate": 1.4520601141703235e-07, + "loss": 0.0017, + "step": 14160 + }, + { + "epoch": 0.27, + "learning_rate": 1.452021280726962e-07, + "loss": 0.0016, + "step": 14161 + }, + { + "epoch": 0.27, + "learning_rate": 1.4519824472836007e-07, + "loss": 1.5057, + "step": 14162 + }, + { + "epoch": 0.27, + "learning_rate": 1.4519436138402392e-07, + "loss": 0.0029, + "step": 14163 + }, + { + "epoch": 0.27, + "learning_rate": 1.451904780396878e-07, + "loss": 0.0012, + "step": 14164 + }, + { + "epoch": 0.27, + "learning_rate": 1.4518659469535163e-07, + "loss": 0.8757, + "step": 14165 + }, + { + "epoch": 0.27, + "learning_rate": 1.451827113510155e-07, + "loss": 1.1384, + "step": 14166 + }, + { + "epoch": 0.27, + "learning_rate": 1.4517882800667935e-07, + "loss": 0.0023, + "step": 14167 + }, + { + "epoch": 0.27, + "learning_rate": 1.4517494466234322e-07, + "loss": 0.0018, + "step": 14168 + }, + { + "epoch": 0.27, + "learning_rate": 1.4517106131800706e-07, + "loss": 0.0224, + "step": 14169 + }, + { + "epoch": 0.27, + "learning_rate": 1.4516717797367094e-07, + "loss": 0.0015, + "step": 14170 + }, + { + "epoch": 0.27, + "learning_rate": 1.4516329462933478e-07, + "loss": 0.4021, + "step": 14171 + }, + { + "epoch": 0.27, + "learning_rate": 1.4515941128499865e-07, + "loss": 0.5458, + "step": 14172 + }, + { + "epoch": 0.27, + "learning_rate": 1.4515552794066247e-07, + "loss": 0.0014, + "step": 14173 + }, + { + "epoch": 0.27, + "learning_rate": 1.4515164459632634e-07, + "loss": 0.4058, + "step": 14174 + }, + { + "epoch": 0.27, + "learning_rate": 1.451477612519902e-07, + "loss": 0.0014, + "step": 14175 + }, + { + "epoch": 0.27, + "learning_rate": 1.4514387790765406e-07, + "loss": 0.0751, + "step": 14176 + }, + { + "epoch": 0.28, + "learning_rate": 1.451399945633179e-07, + "loss": 0.0014, + "step": 14177 + }, + { + "epoch": 0.28, + "learning_rate": 1.4513611121898178e-07, + "loss": 0.2856, + "step": 14178 + }, + { + "epoch": 0.28, + "learning_rate": 1.4513222787464562e-07, + "loss": 0.0011, + "step": 14179 + }, + { + "epoch": 0.28, + "learning_rate": 1.451283445303095e-07, + "loss": 0.0014, + "step": 14180 + }, + { + "epoch": 0.28, + "learning_rate": 1.4512446118597334e-07, + "loss": 0.0052, + "step": 14181 + }, + { + "epoch": 0.28, + "learning_rate": 1.451205778416372e-07, + "loss": 0.0015, + "step": 14182 + }, + { + "epoch": 0.28, + "learning_rate": 1.4511669449730105e-07, + "loss": 0.0039, + "step": 14183 + }, + { + "epoch": 0.28, + "learning_rate": 1.4511281115296493e-07, + "loss": 0.0016, + "step": 14184 + }, + { + "epoch": 0.28, + "learning_rate": 1.4510892780862877e-07, + "loss": 0.0025, + "step": 14185 + }, + { + "epoch": 0.28, + "learning_rate": 1.4510504446429264e-07, + "loss": 0.001, + "step": 14186 + }, + { + "epoch": 0.28, + "learning_rate": 1.451011611199565e-07, + "loss": 0.1001, + "step": 14187 + }, + { + "epoch": 0.28, + "learning_rate": 1.4509727777562036e-07, + "loss": 0.9527, + "step": 14188 + }, + { + "epoch": 0.28, + "learning_rate": 1.450933944312842e-07, + "loss": 0.0039, + "step": 14189 + }, + { + "epoch": 0.28, + "learning_rate": 1.4508951108694807e-07, + "loss": 0.0033, + "step": 14190 + }, + { + "epoch": 0.28, + "learning_rate": 1.4508562774261192e-07, + "loss": 0.0021, + "step": 14191 + }, + { + "epoch": 0.28, + "learning_rate": 1.450817443982758e-07, + "loss": 0.002, + "step": 14192 + }, + { + "epoch": 0.28, + "learning_rate": 1.4507786105393964e-07, + "loss": 0.003, + "step": 14193 + }, + { + "epoch": 0.28, + "learning_rate": 1.450739777096035e-07, + "loss": 0.1973, + "step": 14194 + }, + { + "epoch": 0.28, + "learning_rate": 1.4507009436526735e-07, + "loss": 0.0013, + "step": 14195 + }, + { + "epoch": 0.28, + "learning_rate": 1.4506621102093122e-07, + "loss": 0.0011, + "step": 14196 + }, + { + "epoch": 0.28, + "learning_rate": 1.4506232767659507e-07, + "loss": 0.0024, + "step": 14197 + }, + { + "epoch": 0.28, + "learning_rate": 1.4505844433225894e-07, + "loss": 0.0014, + "step": 14198 + }, + { + "epoch": 0.28, + "learning_rate": 1.4505456098792279e-07, + "loss": 0.0013, + "step": 14199 + }, + { + "epoch": 0.28, + "learning_rate": 1.4505067764358666e-07, + "loss": 0.0171, + "step": 14200 + }, + { + "epoch": 0.28, + "learning_rate": 1.450467942992505e-07, + "loss": 0.0039, + "step": 14201 + }, + { + "epoch": 0.28, + "learning_rate": 1.4504291095491437e-07, + "loss": 0.6297, + "step": 14202 + }, + { + "epoch": 0.28, + "learning_rate": 1.4503902761057822e-07, + "loss": 0.0012, + "step": 14203 + }, + { + "epoch": 0.28, + "learning_rate": 1.450351442662421e-07, + "loss": 0.0409, + "step": 14204 + }, + { + "epoch": 0.28, + "learning_rate": 1.4503126092190594e-07, + "loss": 0.0015, + "step": 14205 + }, + { + "epoch": 0.28, + "learning_rate": 1.450273775775698e-07, + "loss": 0.0013, + "step": 14206 + }, + { + "epoch": 0.28, + "learning_rate": 1.4502349423323365e-07, + "loss": 0.0014, + "step": 14207 + }, + { + "epoch": 0.28, + "learning_rate": 1.4501961088889752e-07, + "loss": 0.0019, + "step": 14208 + }, + { + "epoch": 0.28, + "learning_rate": 1.4501572754456137e-07, + "loss": 0.0014, + "step": 14209 + }, + { + "epoch": 0.28, + "learning_rate": 1.4501184420022524e-07, + "loss": 0.0019, + "step": 14210 + }, + { + "epoch": 0.28, + "learning_rate": 1.4500796085588908e-07, + "loss": 0.0015, + "step": 14211 + }, + { + "epoch": 0.28, + "learning_rate": 1.4500407751155296e-07, + "loss": 0.0618, + "step": 14212 + }, + { + "epoch": 0.28, + "learning_rate": 1.450001941672168e-07, + "loss": 0.0013, + "step": 14213 + }, + { + "epoch": 0.28, + "learning_rate": 1.4499631082288067e-07, + "loss": 0.003, + "step": 14214 + }, + { + "epoch": 0.28, + "learning_rate": 1.4499242747854452e-07, + "loss": 0.0014, + "step": 14215 + }, + { + "epoch": 0.28, + "learning_rate": 1.449885441342084e-07, + "loss": 0.0017, + "step": 14216 + }, + { + "epoch": 0.28, + "learning_rate": 1.4498466078987223e-07, + "loss": 0.0011, + "step": 14217 + }, + { + "epoch": 0.28, + "learning_rate": 1.449807774455361e-07, + "loss": 0.0014, + "step": 14218 + }, + { + "epoch": 0.28, + "learning_rate": 1.4497689410119995e-07, + "loss": 0.1753, + "step": 14219 + }, + { + "epoch": 0.28, + "learning_rate": 1.4497301075686382e-07, + "loss": 0.0013, + "step": 14220 + }, + { + "epoch": 0.28, + "learning_rate": 1.4496912741252767e-07, + "loss": 0.0015, + "step": 14221 + }, + { + "epoch": 0.28, + "learning_rate": 1.4496524406819154e-07, + "loss": 1.212, + "step": 14222 + }, + { + "epoch": 0.28, + "learning_rate": 1.4496136072385538e-07, + "loss": 0.0766, + "step": 14223 + }, + { + "epoch": 0.28, + "learning_rate": 1.4495747737951926e-07, + "loss": 0.0014, + "step": 14224 + }, + { + "epoch": 0.28, + "learning_rate": 1.449535940351831e-07, + "loss": 0.1548, + "step": 14225 + }, + { + "epoch": 0.28, + "learning_rate": 1.4494971069084697e-07, + "loss": 0.0018, + "step": 14226 + }, + { + "epoch": 0.28, + "learning_rate": 1.4494582734651082e-07, + "loss": 0.0088, + "step": 14227 + }, + { + "epoch": 0.28, + "learning_rate": 1.449419440021747e-07, + "loss": 0.0052, + "step": 14228 + }, + { + "epoch": 0.28, + "learning_rate": 1.4493806065783853e-07, + "loss": 0.0015, + "step": 14229 + }, + { + "epoch": 0.28, + "learning_rate": 1.449341773135024e-07, + "loss": 0.1503, + "step": 14230 + }, + { + "epoch": 0.28, + "learning_rate": 1.4493029396916622e-07, + "loss": 0.3848, + "step": 14231 + }, + { + "epoch": 0.28, + "learning_rate": 1.449264106248301e-07, + "loss": 0.0017, + "step": 14232 + }, + { + "epoch": 0.28, + "learning_rate": 1.4492252728049394e-07, + "loss": 0.0179, + "step": 14233 + }, + { + "epoch": 0.28, + "learning_rate": 1.449186439361578e-07, + "loss": 0.0013, + "step": 14234 + }, + { + "epoch": 0.28, + "learning_rate": 1.4491476059182166e-07, + "loss": 0.004, + "step": 14235 + }, + { + "epoch": 0.28, + "learning_rate": 1.4491087724748553e-07, + "loss": 0.0022, + "step": 14236 + }, + { + "epoch": 0.28, + "learning_rate": 1.4490699390314937e-07, + "loss": 0.0015, + "step": 14237 + }, + { + "epoch": 0.28, + "learning_rate": 1.4490311055881324e-07, + "loss": 0.8723, + "step": 14238 + }, + { + "epoch": 0.28, + "learning_rate": 1.448992272144771e-07, + "loss": 0.0252, + "step": 14239 + }, + { + "epoch": 0.28, + "learning_rate": 1.4489534387014096e-07, + "loss": 0.001, + "step": 14240 + }, + { + "epoch": 0.28, + "learning_rate": 1.448914605258048e-07, + "loss": 0.002, + "step": 14241 + }, + { + "epoch": 0.28, + "learning_rate": 1.4488757718146868e-07, + "loss": 0.0012, + "step": 14242 + }, + { + "epoch": 0.28, + "learning_rate": 1.4488369383713252e-07, + "loss": 0.0015, + "step": 14243 + }, + { + "epoch": 0.28, + "learning_rate": 1.448798104927964e-07, + "loss": 0.8654, + "step": 14244 + }, + { + "epoch": 0.28, + "learning_rate": 1.4487592714846024e-07, + "loss": 0.0015, + "step": 14245 + }, + { + "epoch": 0.28, + "learning_rate": 1.448720438041241e-07, + "loss": 0.0013, + "step": 14246 + }, + { + "epoch": 0.28, + "learning_rate": 1.4486816045978796e-07, + "loss": 0.0012, + "step": 14247 + }, + { + "epoch": 0.28, + "learning_rate": 1.4486427711545183e-07, + "loss": 1.3512, + "step": 14248 + }, + { + "epoch": 0.28, + "learning_rate": 1.4486039377111567e-07, + "loss": 0.0012, + "step": 14249 + }, + { + "epoch": 0.28, + "learning_rate": 1.4485651042677954e-07, + "loss": 0.0015, + "step": 14250 + }, + { + "epoch": 0.28, + "learning_rate": 1.448526270824434e-07, + "loss": 0.0013, + "step": 14251 + }, + { + "epoch": 0.28, + "learning_rate": 1.4484874373810726e-07, + "loss": 0.5025, + "step": 14252 + }, + { + "epoch": 0.28, + "learning_rate": 1.448448603937711e-07, + "loss": 0.003, + "step": 14253 + }, + { + "epoch": 0.28, + "learning_rate": 1.4484097704943498e-07, + "loss": 0.041, + "step": 14254 + }, + { + "epoch": 0.28, + "learning_rate": 1.4483709370509882e-07, + "loss": 0.0015, + "step": 14255 + }, + { + "epoch": 0.28, + "learning_rate": 1.448332103607627e-07, + "loss": 0.0167, + "step": 14256 + }, + { + "epoch": 0.28, + "learning_rate": 1.4482932701642654e-07, + "loss": 1.0059, + "step": 14257 + }, + { + "epoch": 0.28, + "learning_rate": 1.448254436720904e-07, + "loss": 0.0014, + "step": 14258 + }, + { + "epoch": 0.28, + "learning_rate": 1.4482156032775425e-07, + "loss": 0.0261, + "step": 14259 + }, + { + "epoch": 0.28, + "learning_rate": 1.4481767698341813e-07, + "loss": 0.0014, + "step": 14260 + }, + { + "epoch": 0.28, + "learning_rate": 1.4481379363908197e-07, + "loss": 0.0151, + "step": 14261 + }, + { + "epoch": 0.28, + "learning_rate": 1.4480991029474584e-07, + "loss": 0.0014, + "step": 14262 + }, + { + "epoch": 0.28, + "learning_rate": 1.448060269504097e-07, + "loss": 0.2255, + "step": 14263 + }, + { + "epoch": 0.28, + "learning_rate": 1.4480214360607356e-07, + "loss": 0.0034, + "step": 14264 + }, + { + "epoch": 0.28, + "learning_rate": 1.447982602617374e-07, + "loss": 0.0017, + "step": 14265 + }, + { + "epoch": 0.28, + "learning_rate": 1.4479437691740127e-07, + "loss": 0.0031, + "step": 14266 + }, + { + "epoch": 0.28, + "learning_rate": 1.4479049357306512e-07, + "loss": 0.0019, + "step": 14267 + }, + { + "epoch": 0.28, + "learning_rate": 1.4478661022872896e-07, + "loss": 0.0014, + "step": 14268 + }, + { + "epoch": 0.28, + "learning_rate": 1.4478272688439284e-07, + "loss": 0.0111, + "step": 14269 + }, + { + "epoch": 0.28, + "learning_rate": 1.4477884354005668e-07, + "loss": 0.0014, + "step": 14270 + }, + { + "epoch": 0.28, + "learning_rate": 1.4477496019572055e-07, + "loss": 0.0013, + "step": 14271 + }, + { + "epoch": 0.28, + "learning_rate": 1.447710768513844e-07, + "loss": 0.0012, + "step": 14272 + }, + { + "epoch": 0.28, + "learning_rate": 1.4476719350704827e-07, + "loss": 0.0217, + "step": 14273 + }, + { + "epoch": 0.28, + "learning_rate": 1.4476331016271211e-07, + "loss": 0.0017, + "step": 14274 + }, + { + "epoch": 0.28, + "learning_rate": 1.4475942681837599e-07, + "loss": 0.0014, + "step": 14275 + }, + { + "epoch": 0.28, + "learning_rate": 1.4475554347403983e-07, + "loss": 0.0012, + "step": 14276 + }, + { + "epoch": 0.28, + "learning_rate": 1.447516601297037e-07, + "loss": 0.0013, + "step": 14277 + }, + { + "epoch": 0.28, + "learning_rate": 1.4474777678536755e-07, + "loss": 0.0013, + "step": 14278 + }, + { + "epoch": 0.28, + "learning_rate": 1.4474389344103142e-07, + "loss": 0.0036, + "step": 14279 + }, + { + "epoch": 0.28, + "learning_rate": 1.4474001009669526e-07, + "loss": 0.0013, + "step": 14280 + }, + { + "epoch": 0.28, + "learning_rate": 1.4473612675235914e-07, + "loss": 0.0204, + "step": 14281 + }, + { + "epoch": 0.28, + "learning_rate": 1.4473224340802298e-07, + "loss": 0.1028, + "step": 14282 + }, + { + "epoch": 0.28, + "learning_rate": 1.4472836006368685e-07, + "loss": 0.0062, + "step": 14283 + }, + { + "epoch": 0.28, + "learning_rate": 1.447244767193507e-07, + "loss": 0.0045, + "step": 14284 + }, + { + "epoch": 0.28, + "learning_rate": 1.4472059337501457e-07, + "loss": 0.0061, + "step": 14285 + }, + { + "epoch": 0.28, + "learning_rate": 1.4471671003067841e-07, + "loss": 0.005, + "step": 14286 + }, + { + "epoch": 0.28, + "learning_rate": 1.4471282668634228e-07, + "loss": 0.0015, + "step": 14287 + }, + { + "epoch": 0.28, + "learning_rate": 1.4470894334200613e-07, + "loss": 0.7182, + "step": 14288 + }, + { + "epoch": 0.28, + "learning_rate": 1.4470505999766997e-07, + "loss": 0.0021, + "step": 14289 + }, + { + "epoch": 0.28, + "learning_rate": 1.4470117665333385e-07, + "loss": 0.004, + "step": 14290 + }, + { + "epoch": 0.28, + "learning_rate": 1.446972933089977e-07, + "loss": 0.0018, + "step": 14291 + }, + { + "epoch": 0.28, + "learning_rate": 1.4469340996466156e-07, + "loss": 0.0014, + "step": 14292 + }, + { + "epoch": 0.28, + "learning_rate": 1.446895266203254e-07, + "loss": 0.795, + "step": 14293 + }, + { + "epoch": 0.28, + "learning_rate": 1.4468564327598928e-07, + "loss": 0.0016, + "step": 14294 + }, + { + "epoch": 0.28, + "learning_rate": 1.4468175993165312e-07, + "loss": 0.0022, + "step": 14295 + }, + { + "epoch": 0.28, + "learning_rate": 1.44677876587317e-07, + "loss": 0.0011, + "step": 14296 + }, + { + "epoch": 0.28, + "learning_rate": 1.4467399324298084e-07, + "loss": 0.0016, + "step": 14297 + }, + { + "epoch": 0.28, + "learning_rate": 1.4467010989864469e-07, + "loss": 0.0074, + "step": 14298 + }, + { + "epoch": 0.28, + "learning_rate": 1.4466622655430856e-07, + "loss": 0.0014, + "step": 14299 + }, + { + "epoch": 0.28, + "learning_rate": 1.446623432099724e-07, + "loss": 0.0014, + "step": 14300 + }, + { + "epoch": 0.28, + "learning_rate": 1.4465845986563627e-07, + "loss": 0.001, + "step": 14301 + }, + { + "epoch": 0.28, + "learning_rate": 1.4465457652130012e-07, + "loss": 0.0034, + "step": 14302 + }, + { + "epoch": 0.28, + "learning_rate": 1.44650693176964e-07, + "loss": 0.0014, + "step": 14303 + }, + { + "epoch": 0.28, + "learning_rate": 1.4464680983262784e-07, + "loss": 0.0011, + "step": 14304 + }, + { + "epoch": 0.28, + "learning_rate": 1.446429264882917e-07, + "loss": 0.0022, + "step": 14305 + }, + { + "epoch": 0.28, + "learning_rate": 1.4463904314395555e-07, + "loss": 0.0017, + "step": 14306 + }, + { + "epoch": 0.28, + "learning_rate": 1.4463515979961942e-07, + "loss": 0.9334, + "step": 14307 + }, + { + "epoch": 0.28, + "learning_rate": 1.4463127645528327e-07, + "loss": 0.0023, + "step": 14308 + }, + { + "epoch": 0.28, + "learning_rate": 1.4462739311094714e-07, + "loss": 0.0014, + "step": 14309 + }, + { + "epoch": 0.28, + "learning_rate": 1.4462350976661098e-07, + "loss": 0.0011, + "step": 14310 + }, + { + "epoch": 0.28, + "learning_rate": 1.4461962642227486e-07, + "loss": 0.0014, + "step": 14311 + }, + { + "epoch": 0.28, + "learning_rate": 1.446157430779387e-07, + "loss": 0.0016, + "step": 14312 + }, + { + "epoch": 0.28, + "learning_rate": 1.4461185973360257e-07, + "loss": 0.0014, + "step": 14313 + }, + { + "epoch": 0.28, + "learning_rate": 1.4460797638926642e-07, + "loss": 0.0012, + "step": 14314 + }, + { + "epoch": 0.28, + "learning_rate": 1.446040930449303e-07, + "loss": 0.1904, + "step": 14315 + }, + { + "epoch": 0.28, + "learning_rate": 1.4460020970059413e-07, + "loss": 0.002, + "step": 14316 + }, + { + "epoch": 0.28, + "learning_rate": 1.44596326356258e-07, + "loss": 0.0012, + "step": 14317 + }, + { + "epoch": 0.28, + "learning_rate": 1.4459244301192185e-07, + "loss": 0.0011, + "step": 14318 + }, + { + "epoch": 0.28, + "learning_rate": 1.4458855966758572e-07, + "loss": 0.2381, + "step": 14319 + }, + { + "epoch": 0.28, + "learning_rate": 1.4458467632324957e-07, + "loss": 0.3765, + "step": 14320 + }, + { + "epoch": 0.28, + "learning_rate": 1.4458079297891344e-07, + "loss": 0.0013, + "step": 14321 + }, + { + "epoch": 0.28, + "learning_rate": 1.4457690963457728e-07, + "loss": 0.0017, + "step": 14322 + }, + { + "epoch": 0.28, + "learning_rate": 1.4457302629024116e-07, + "loss": 0.0014, + "step": 14323 + }, + { + "epoch": 0.28, + "learning_rate": 1.44569142945905e-07, + "loss": 0.0184, + "step": 14324 + }, + { + "epoch": 0.28, + "learning_rate": 1.4456525960156887e-07, + "loss": 0.0055, + "step": 14325 + }, + { + "epoch": 0.28, + "learning_rate": 1.4456137625723272e-07, + "loss": 0.0014, + "step": 14326 + }, + { + "epoch": 0.28, + "learning_rate": 1.445574929128966e-07, + "loss": 0.0013, + "step": 14327 + }, + { + "epoch": 0.28, + "learning_rate": 1.4455360956856043e-07, + "loss": 0.0021, + "step": 14328 + }, + { + "epoch": 0.28, + "learning_rate": 1.445497262242243e-07, + "loss": 0.0011, + "step": 14329 + }, + { + "epoch": 0.28, + "learning_rate": 1.4454584287988815e-07, + "loss": 0.002, + "step": 14330 + }, + { + "epoch": 0.28, + "learning_rate": 1.4454195953555202e-07, + "loss": 0.0019, + "step": 14331 + }, + { + "epoch": 0.28, + "learning_rate": 1.4453807619121587e-07, + "loss": 0.0012, + "step": 14332 + }, + { + "epoch": 0.28, + "learning_rate": 1.4453419284687974e-07, + "loss": 0.4543, + "step": 14333 + }, + { + "epoch": 0.28, + "learning_rate": 1.4453030950254358e-07, + "loss": 0.0954, + "step": 14334 + }, + { + "epoch": 0.28, + "learning_rate": 1.4452642615820745e-07, + "loss": 0.0047, + "step": 14335 + }, + { + "epoch": 0.28, + "learning_rate": 1.445225428138713e-07, + "loss": 0.0018, + "step": 14336 + }, + { + "epoch": 0.28, + "learning_rate": 1.4451865946953517e-07, + "loss": 0.0013, + "step": 14337 + }, + { + "epoch": 0.28, + "learning_rate": 1.4451477612519902e-07, + "loss": 0.0016, + "step": 14338 + }, + { + "epoch": 0.28, + "learning_rate": 1.445108927808629e-07, + "loss": 0.0058, + "step": 14339 + }, + { + "epoch": 0.28, + "learning_rate": 1.4450700943652673e-07, + "loss": 0.0297, + "step": 14340 + }, + { + "epoch": 0.28, + "learning_rate": 1.445031260921906e-07, + "loss": 0.0012, + "step": 14341 + }, + { + "epoch": 0.28, + "learning_rate": 1.4449924274785445e-07, + "loss": 0.0354, + "step": 14342 + }, + { + "epoch": 0.28, + "learning_rate": 1.4449535940351832e-07, + "loss": 0.0015, + "step": 14343 + }, + { + "epoch": 0.28, + "learning_rate": 1.4449147605918217e-07, + "loss": 0.0015, + "step": 14344 + }, + { + "epoch": 0.28, + "learning_rate": 1.4448759271484604e-07, + "loss": 0.0012, + "step": 14345 + }, + { + "epoch": 0.28, + "learning_rate": 1.4448370937050988e-07, + "loss": 0.0989, + "step": 14346 + }, + { + "epoch": 0.28, + "learning_rate": 1.4447982602617373e-07, + "loss": 0.8739, + "step": 14347 + }, + { + "epoch": 0.28, + "learning_rate": 1.4447594268183757e-07, + "loss": 0.0065, + "step": 14348 + }, + { + "epoch": 0.28, + "learning_rate": 1.4447205933750144e-07, + "loss": 0.0022, + "step": 14349 + }, + { + "epoch": 0.28, + "learning_rate": 1.444681759931653e-07, + "loss": 0.0163, + "step": 14350 + }, + { + "epoch": 0.28, + "learning_rate": 1.4446429264882916e-07, + "loss": 0.3712, + "step": 14351 + }, + { + "epoch": 0.28, + "learning_rate": 1.44460409304493e-07, + "loss": 0.0026, + "step": 14352 + }, + { + "epoch": 0.28, + "learning_rate": 1.4445652596015688e-07, + "loss": 0.0071, + "step": 14353 + }, + { + "epoch": 0.28, + "learning_rate": 1.4445264261582072e-07, + "loss": 0.0016, + "step": 14354 + }, + { + "epoch": 0.28, + "learning_rate": 1.444487592714846e-07, + "loss": 0.0098, + "step": 14355 + }, + { + "epoch": 0.28, + "learning_rate": 1.4444487592714844e-07, + "loss": 0.0052, + "step": 14356 + }, + { + "epoch": 0.28, + "learning_rate": 1.444409925828123e-07, + "loss": 0.1861, + "step": 14357 + }, + { + "epoch": 0.28, + "learning_rate": 1.4443710923847615e-07, + "loss": 0.0013, + "step": 14358 + }, + { + "epoch": 0.28, + "learning_rate": 1.4443322589414003e-07, + "loss": 1.0824, + "step": 14359 + }, + { + "epoch": 0.28, + "learning_rate": 1.4442934254980387e-07, + "loss": 0.016, + "step": 14360 + }, + { + "epoch": 0.28, + "learning_rate": 1.4442545920546774e-07, + "loss": 0.0023, + "step": 14361 + }, + { + "epoch": 0.28, + "learning_rate": 1.444215758611316e-07, + "loss": 0.0012, + "step": 14362 + }, + { + "epoch": 0.28, + "learning_rate": 1.4441769251679546e-07, + "loss": 0.0048, + "step": 14363 + }, + { + "epoch": 0.28, + "learning_rate": 1.444138091724593e-07, + "loss": 0.0014, + "step": 14364 + }, + { + "epoch": 0.28, + "learning_rate": 1.4440992582812317e-07, + "loss": 0.0018, + "step": 14365 + }, + { + "epoch": 0.28, + "learning_rate": 1.4440604248378702e-07, + "loss": 0.0014, + "step": 14366 + }, + { + "epoch": 0.28, + "learning_rate": 1.444021591394509e-07, + "loss": 0.0198, + "step": 14367 + }, + { + "epoch": 0.28, + "learning_rate": 1.4439827579511474e-07, + "loss": 0.0013, + "step": 14368 + }, + { + "epoch": 0.28, + "learning_rate": 1.443943924507786e-07, + "loss": 0.3264, + "step": 14369 + }, + { + "epoch": 0.28, + "learning_rate": 1.4439050910644245e-07, + "loss": 0.0015, + "step": 14370 + }, + { + "epoch": 0.28, + "learning_rate": 1.4438662576210632e-07, + "loss": 0.0015, + "step": 14371 + }, + { + "epoch": 0.28, + "learning_rate": 1.4438274241777017e-07, + "loss": 0.5476, + "step": 14372 + }, + { + "epoch": 0.28, + "learning_rate": 1.4437885907343404e-07, + "loss": 0.0015, + "step": 14373 + }, + { + "epoch": 0.28, + "learning_rate": 1.4437497572909789e-07, + "loss": 0.3054, + "step": 14374 + }, + { + "epoch": 0.28, + "learning_rate": 1.4437109238476176e-07, + "loss": 0.0012, + "step": 14375 + }, + { + "epoch": 0.28, + "learning_rate": 1.443672090404256e-07, + "loss": 0.0014, + "step": 14376 + }, + { + "epoch": 0.28, + "learning_rate": 1.4436332569608947e-07, + "loss": 0.002, + "step": 14377 + }, + { + "epoch": 0.28, + "learning_rate": 1.4435944235175332e-07, + "loss": 0.1831, + "step": 14378 + }, + { + "epoch": 0.28, + "learning_rate": 1.443555590074172e-07, + "loss": 0.0016, + "step": 14379 + }, + { + "epoch": 0.28, + "learning_rate": 1.4435167566308104e-07, + "loss": 0.0014, + "step": 14380 + }, + { + "epoch": 0.28, + "learning_rate": 1.443477923187449e-07, + "loss": 0.0155, + "step": 14381 + }, + { + "epoch": 0.28, + "learning_rate": 1.4434390897440875e-07, + "loss": 0.0063, + "step": 14382 + }, + { + "epoch": 0.28, + "learning_rate": 1.4434002563007262e-07, + "loss": 0.026, + "step": 14383 + }, + { + "epoch": 0.28, + "learning_rate": 1.4433614228573647e-07, + "loss": 0.0011, + "step": 14384 + }, + { + "epoch": 0.28, + "learning_rate": 1.4433225894140034e-07, + "loss": 0.0015, + "step": 14385 + }, + { + "epoch": 0.28, + "learning_rate": 1.4432837559706418e-07, + "loss": 0.0019, + "step": 14386 + }, + { + "epoch": 0.28, + "learning_rate": 1.4432449225272806e-07, + "loss": 0.5398, + "step": 14387 + }, + { + "epoch": 0.28, + "learning_rate": 1.443206089083919e-07, + "loss": 0.0017, + "step": 14388 + }, + { + "epoch": 0.28, + "learning_rate": 1.4431672556405577e-07, + "loss": 0.0016, + "step": 14389 + }, + { + "epoch": 0.28, + "learning_rate": 1.4431284221971962e-07, + "loss": 0.003, + "step": 14390 + }, + { + "epoch": 0.28, + "learning_rate": 1.443089588753835e-07, + "loss": 0.0601, + "step": 14391 + }, + { + "epoch": 0.28, + "learning_rate": 1.4430507553104733e-07, + "loss": 0.0028, + "step": 14392 + }, + { + "epoch": 0.28, + "learning_rate": 1.443011921867112e-07, + "loss": 0.0019, + "step": 14393 + }, + { + "epoch": 0.28, + "learning_rate": 1.4429730884237505e-07, + "loss": 0.0013, + "step": 14394 + }, + { + "epoch": 0.28, + "learning_rate": 1.4429342549803892e-07, + "loss": 0.0014, + "step": 14395 + }, + { + "epoch": 0.28, + "learning_rate": 1.4428954215370277e-07, + "loss": 0.0015, + "step": 14396 + }, + { + "epoch": 0.28, + "learning_rate": 1.4428565880936664e-07, + "loss": 0.4575, + "step": 14397 + }, + { + "epoch": 0.28, + "learning_rate": 1.4428177546503048e-07, + "loss": 0.0011, + "step": 14398 + }, + { + "epoch": 0.28, + "learning_rate": 1.4427789212069436e-07, + "loss": 0.3363, + "step": 14399 + }, + { + "epoch": 0.28, + "learning_rate": 1.442740087763582e-07, + "loss": 0.0015, + "step": 14400 + }, + { + "epoch": 0.28, + "learning_rate": 1.4427012543202207e-07, + "loss": 0.002, + "step": 14401 + }, + { + "epoch": 0.28, + "learning_rate": 1.4426624208768592e-07, + "loss": 0.0027, + "step": 14402 + }, + { + "epoch": 0.28, + "learning_rate": 1.442623587433498e-07, + "loss": 0.0011, + "step": 14403 + }, + { + "epoch": 0.28, + "learning_rate": 1.4425847539901363e-07, + "loss": 0.0012, + "step": 14404 + }, + { + "epoch": 0.28, + "learning_rate": 1.4425459205467748e-07, + "loss": 0.5722, + "step": 14405 + }, + { + "epoch": 0.28, + "learning_rate": 1.4425070871034132e-07, + "loss": 0.0013, + "step": 14406 + }, + { + "epoch": 0.28, + "learning_rate": 1.442468253660052e-07, + "loss": 0.004, + "step": 14407 + }, + { + "epoch": 0.28, + "learning_rate": 1.4424294202166904e-07, + "loss": 1.1782, + "step": 14408 + }, + { + "epoch": 0.28, + "learning_rate": 1.442390586773329e-07, + "loss": 0.0045, + "step": 14409 + }, + { + "epoch": 0.28, + "learning_rate": 1.4423517533299676e-07, + "loss": 0.0013, + "step": 14410 + }, + { + "epoch": 0.28, + "learning_rate": 1.4423129198866063e-07, + "loss": 0.0013, + "step": 14411 + }, + { + "epoch": 0.28, + "learning_rate": 1.4422740864432447e-07, + "loss": 0.0026, + "step": 14412 + }, + { + "epoch": 0.28, + "learning_rate": 1.4422352529998834e-07, + "loss": 0.0804, + "step": 14413 + }, + { + "epoch": 0.28, + "learning_rate": 1.442196419556522e-07, + "loss": 0.0051, + "step": 14414 + }, + { + "epoch": 0.28, + "learning_rate": 1.4421575861131606e-07, + "loss": 0.0014, + "step": 14415 + }, + { + "epoch": 0.28, + "learning_rate": 1.442118752669799e-07, + "loss": 0.0015, + "step": 14416 + }, + { + "epoch": 0.28, + "learning_rate": 1.4420799192264378e-07, + "loss": 0.0017, + "step": 14417 + }, + { + "epoch": 0.28, + "learning_rate": 1.4420410857830762e-07, + "loss": 0.0013, + "step": 14418 + }, + { + "epoch": 0.28, + "learning_rate": 1.442002252339715e-07, + "loss": 0.0013, + "step": 14419 + }, + { + "epoch": 0.28, + "learning_rate": 1.4419634188963534e-07, + "loss": 0.0019, + "step": 14420 + }, + { + "epoch": 0.28, + "learning_rate": 1.441924585452992e-07, + "loss": 0.0013, + "step": 14421 + }, + { + "epoch": 0.28, + "learning_rate": 1.4418857520096306e-07, + "loss": 0.0082, + "step": 14422 + }, + { + "epoch": 0.28, + "learning_rate": 1.4418469185662693e-07, + "loss": 0.0026, + "step": 14423 + }, + { + "epoch": 0.28, + "learning_rate": 1.4418080851229077e-07, + "loss": 0.0025, + "step": 14424 + }, + { + "epoch": 0.28, + "learning_rate": 1.4417692516795464e-07, + "loss": 0.0073, + "step": 14425 + }, + { + "epoch": 0.28, + "learning_rate": 1.441730418236185e-07, + "loss": 0.0016, + "step": 14426 + }, + { + "epoch": 0.28, + "learning_rate": 1.4416915847928236e-07, + "loss": 0.0042, + "step": 14427 + }, + { + "epoch": 0.28, + "learning_rate": 1.441652751349462e-07, + "loss": 0.0123, + "step": 14428 + }, + { + "epoch": 0.28, + "learning_rate": 1.4416139179061008e-07, + "loss": 0.0013, + "step": 14429 + }, + { + "epoch": 0.28, + "learning_rate": 1.4415750844627392e-07, + "loss": 0.0012, + "step": 14430 + }, + { + "epoch": 0.28, + "learning_rate": 1.441536251019378e-07, + "loss": 0.0015, + "step": 14431 + }, + { + "epoch": 0.28, + "learning_rate": 1.4414974175760164e-07, + "loss": 0.0016, + "step": 14432 + }, + { + "epoch": 0.28, + "learning_rate": 1.441458584132655e-07, + "loss": 0.006, + "step": 14433 + }, + { + "epoch": 0.28, + "learning_rate": 1.4414197506892935e-07, + "loss": 0.0017, + "step": 14434 + }, + { + "epoch": 0.28, + "learning_rate": 1.4413809172459323e-07, + "loss": 0.0014, + "step": 14435 + }, + { + "epoch": 0.28, + "learning_rate": 1.4413420838025707e-07, + "loss": 0.0013, + "step": 14436 + }, + { + "epoch": 0.28, + "learning_rate": 1.4413032503592094e-07, + "loss": 0.0017, + "step": 14437 + }, + { + "epoch": 0.28, + "learning_rate": 1.441264416915848e-07, + "loss": 0.0018, + "step": 14438 + }, + { + "epoch": 0.28, + "learning_rate": 1.4412255834724866e-07, + "loss": 0.0013, + "step": 14439 + }, + { + "epoch": 0.28, + "learning_rate": 1.441186750029125e-07, + "loss": 0.0022, + "step": 14440 + }, + { + "epoch": 0.28, + "learning_rate": 1.4411479165857638e-07, + "loss": 0.0027, + "step": 14441 + }, + { + "epoch": 0.28, + "learning_rate": 1.4411090831424022e-07, + "loss": 0.0052, + "step": 14442 + }, + { + "epoch": 0.28, + "learning_rate": 1.441070249699041e-07, + "loss": 0.0014, + "step": 14443 + }, + { + "epoch": 0.28, + "learning_rate": 1.4410314162556794e-07, + "loss": 0.0011, + "step": 14444 + }, + { + "epoch": 0.28, + "learning_rate": 1.4409925828123178e-07, + "loss": 0.73, + "step": 14445 + }, + { + "epoch": 0.28, + "learning_rate": 1.4409537493689565e-07, + "loss": 0.002, + "step": 14446 + }, + { + "epoch": 0.28, + "learning_rate": 1.440914915925595e-07, + "loss": 0.0016, + "step": 14447 + }, + { + "epoch": 0.28, + "learning_rate": 1.4408760824822337e-07, + "loss": 0.0013, + "step": 14448 + }, + { + "epoch": 0.28, + "learning_rate": 1.4408372490388721e-07, + "loss": 0.0012, + "step": 14449 + }, + { + "epoch": 0.28, + "learning_rate": 1.4407984155955109e-07, + "loss": 0.0015, + "step": 14450 + }, + { + "epoch": 0.28, + "learning_rate": 1.4407595821521493e-07, + "loss": 0.0033, + "step": 14451 + }, + { + "epoch": 0.28, + "learning_rate": 1.440720748708788e-07, + "loss": 0.0017, + "step": 14452 + }, + { + "epoch": 0.28, + "learning_rate": 1.4406819152654265e-07, + "loss": 0.45, + "step": 14453 + }, + { + "epoch": 0.28, + "learning_rate": 1.4406430818220652e-07, + "loss": 0.1908, + "step": 14454 + }, + { + "epoch": 0.28, + "learning_rate": 1.4406042483787036e-07, + "loss": 0.0014, + "step": 14455 + }, + { + "epoch": 0.28, + "learning_rate": 1.4405654149353424e-07, + "loss": 0.0013, + "step": 14456 + }, + { + "epoch": 0.28, + "learning_rate": 1.4405265814919808e-07, + "loss": 0.0013, + "step": 14457 + }, + { + "epoch": 0.28, + "learning_rate": 1.4404877480486195e-07, + "loss": 0.0014, + "step": 14458 + }, + { + "epoch": 0.28, + "learning_rate": 1.440448914605258e-07, + "loss": 0.0022, + "step": 14459 + }, + { + "epoch": 0.28, + "learning_rate": 1.4404100811618967e-07, + "loss": 0.0013, + "step": 14460 + }, + { + "epoch": 0.28, + "learning_rate": 1.4403712477185351e-07, + "loss": 0.002, + "step": 14461 + }, + { + "epoch": 0.28, + "learning_rate": 1.4403324142751738e-07, + "loss": 0.0084, + "step": 14462 + }, + { + "epoch": 0.28, + "learning_rate": 1.4402935808318123e-07, + "loss": 0.0331, + "step": 14463 + }, + { + "epoch": 0.28, + "learning_rate": 1.4402547473884507e-07, + "loss": 0.0813, + "step": 14464 + }, + { + "epoch": 0.28, + "learning_rate": 1.4402159139450895e-07, + "loss": 0.0014, + "step": 14465 + }, + { + "epoch": 0.28, + "learning_rate": 1.440177080501728e-07, + "loss": 0.0012, + "step": 14466 + }, + { + "epoch": 0.28, + "learning_rate": 1.4401382470583666e-07, + "loss": 0.0017, + "step": 14467 + }, + { + "epoch": 0.28, + "learning_rate": 1.440099413615005e-07, + "loss": 0.0014, + "step": 14468 + }, + { + "epoch": 0.28, + "learning_rate": 1.4400605801716438e-07, + "loss": 0.0009, + "step": 14469 + }, + { + "epoch": 0.28, + "learning_rate": 1.4400217467282822e-07, + "loss": 0.0019, + "step": 14470 + }, + { + "epoch": 0.28, + "learning_rate": 1.439982913284921e-07, + "loss": 0.0014, + "step": 14471 + }, + { + "epoch": 0.28, + "learning_rate": 1.4399440798415594e-07, + "loss": 0.0014, + "step": 14472 + }, + { + "epoch": 0.28, + "learning_rate": 1.439905246398198e-07, + "loss": 0.0009, + "step": 14473 + }, + { + "epoch": 0.28, + "learning_rate": 1.4398664129548366e-07, + "loss": 0.0014, + "step": 14474 + }, + { + "epoch": 0.28, + "learning_rate": 1.439827579511475e-07, + "loss": 0.0015, + "step": 14475 + }, + { + "epoch": 0.28, + "learning_rate": 1.4397887460681137e-07, + "loss": 0.0827, + "step": 14476 + }, + { + "epoch": 0.28, + "learning_rate": 1.4397499126247522e-07, + "loss": 0.0013, + "step": 14477 + }, + { + "epoch": 0.28, + "learning_rate": 1.439711079181391e-07, + "loss": 0.0012, + "step": 14478 + }, + { + "epoch": 0.28, + "learning_rate": 1.4396722457380294e-07, + "loss": 0.0443, + "step": 14479 + }, + { + "epoch": 0.28, + "learning_rate": 1.439633412294668e-07, + "loss": 0.0012, + "step": 14480 + }, + { + "epoch": 0.28, + "learning_rate": 1.4395945788513065e-07, + "loss": 0.0011, + "step": 14481 + }, + { + "epoch": 0.28, + "learning_rate": 1.4395557454079452e-07, + "loss": 0.5158, + "step": 14482 + }, + { + "epoch": 0.28, + "learning_rate": 1.4395169119645837e-07, + "loss": 0.0022, + "step": 14483 + }, + { + "epoch": 0.28, + "learning_rate": 1.4394780785212224e-07, + "loss": 0.0022, + "step": 14484 + }, + { + "epoch": 0.28, + "learning_rate": 1.4394392450778608e-07, + "loss": 0.0046, + "step": 14485 + }, + { + "epoch": 0.28, + "learning_rate": 1.4394004116344996e-07, + "loss": 0.0016, + "step": 14486 + }, + { + "epoch": 0.28, + "learning_rate": 1.439361578191138e-07, + "loss": 0.001, + "step": 14487 + }, + { + "epoch": 0.28, + "learning_rate": 1.4393227447477767e-07, + "loss": 0.5762, + "step": 14488 + }, + { + "epoch": 0.28, + "learning_rate": 1.4392839113044152e-07, + "loss": 0.4579, + "step": 14489 + }, + { + "epoch": 0.28, + "learning_rate": 1.439245077861054e-07, + "loss": 0.0013, + "step": 14490 + }, + { + "epoch": 0.28, + "learning_rate": 1.4392062444176923e-07, + "loss": 0.0022, + "step": 14491 + }, + { + "epoch": 0.28, + "learning_rate": 1.439167410974331e-07, + "loss": 0.0015, + "step": 14492 + }, + { + "epoch": 0.28, + "learning_rate": 1.4391285775309695e-07, + "loss": 0.0012, + "step": 14493 + }, + { + "epoch": 0.28, + "learning_rate": 1.4390897440876082e-07, + "loss": 0.0013, + "step": 14494 + }, + { + "epoch": 0.28, + "learning_rate": 1.4390509106442467e-07, + "loss": 0.7835, + "step": 14495 + }, + { + "epoch": 0.28, + "learning_rate": 1.4390120772008854e-07, + "loss": 0.0118, + "step": 14496 + }, + { + "epoch": 0.28, + "learning_rate": 1.4389732437575238e-07, + "loss": 0.0012, + "step": 14497 + }, + { + "epoch": 0.28, + "learning_rate": 1.4389344103141626e-07, + "loss": 0.0013, + "step": 14498 + }, + { + "epoch": 0.28, + "learning_rate": 1.438895576870801e-07, + "loss": 0.0013, + "step": 14499 + }, + { + "epoch": 0.28, + "learning_rate": 1.4388567434274397e-07, + "loss": 0.0012, + "step": 14500 + }, + { + "epoch": 0.28, + "learning_rate": 1.4388179099840782e-07, + "loss": 0.0023, + "step": 14501 + }, + { + "epoch": 0.28, + "learning_rate": 1.438779076540717e-07, + "loss": 0.7054, + "step": 14502 + }, + { + "epoch": 0.28, + "learning_rate": 1.4387402430973553e-07, + "loss": 0.0436, + "step": 14503 + }, + { + "epoch": 0.28, + "learning_rate": 1.438701409653994e-07, + "loss": 0.0026, + "step": 14504 + }, + { + "epoch": 0.28, + "learning_rate": 1.4386625762106325e-07, + "loss": 0.0028, + "step": 14505 + }, + { + "epoch": 0.28, + "learning_rate": 1.4386237427672712e-07, + "loss": 0.3567, + "step": 14506 + }, + { + "epoch": 0.28, + "learning_rate": 1.4385849093239097e-07, + "loss": 0.0011, + "step": 14507 + }, + { + "epoch": 0.28, + "learning_rate": 1.4385460758805484e-07, + "loss": 0.0008, + "step": 14508 + }, + { + "epoch": 0.28, + "learning_rate": 1.4385072424371868e-07, + "loss": 0.0021, + "step": 14509 + }, + { + "epoch": 0.28, + "learning_rate": 1.4384684089938255e-07, + "loss": 0.0013, + "step": 14510 + }, + { + "epoch": 0.28, + "learning_rate": 1.438429575550464e-07, + "loss": 0.3845, + "step": 14511 + }, + { + "epoch": 0.28, + "learning_rate": 1.4383907421071027e-07, + "loss": 0.4035, + "step": 14512 + }, + { + "epoch": 0.28, + "learning_rate": 1.4383519086637412e-07, + "loss": 0.0011, + "step": 14513 + }, + { + "epoch": 0.28, + "learning_rate": 1.43831307522038e-07, + "loss": 0.0031, + "step": 14514 + }, + { + "epoch": 0.28, + "learning_rate": 1.4382742417770183e-07, + "loss": 0.0013, + "step": 14515 + }, + { + "epoch": 0.28, + "learning_rate": 1.438235408333657e-07, + "loss": 0.2964, + "step": 14516 + }, + { + "epoch": 0.28, + "learning_rate": 1.4381965748902955e-07, + "loss": 0.0015, + "step": 14517 + }, + { + "epoch": 0.28, + "learning_rate": 1.4381577414469342e-07, + "loss": 0.0012, + "step": 14518 + }, + { + "epoch": 0.28, + "learning_rate": 1.4381189080035727e-07, + "loss": 0.0013, + "step": 14519 + }, + { + "epoch": 0.28, + "learning_rate": 1.4380800745602114e-07, + "loss": 0.0015, + "step": 14520 + }, + { + "epoch": 0.28, + "learning_rate": 1.4380412411168496e-07, + "loss": 0.0014, + "step": 14521 + }, + { + "epoch": 0.28, + "learning_rate": 1.4380024076734883e-07, + "loss": 0.0021, + "step": 14522 + }, + { + "epoch": 0.28, + "learning_rate": 1.4379635742301267e-07, + "loss": 0.0122, + "step": 14523 + }, + { + "epoch": 0.28, + "learning_rate": 1.4379247407867654e-07, + "loss": 0.0011, + "step": 14524 + }, + { + "epoch": 0.28, + "learning_rate": 1.437885907343404e-07, + "loss": 0.5642, + "step": 14525 + }, + { + "epoch": 0.28, + "learning_rate": 1.4378470739000426e-07, + "loss": 0.0265, + "step": 14526 + }, + { + "epoch": 0.28, + "learning_rate": 1.437808240456681e-07, + "loss": 0.0422, + "step": 14527 + }, + { + "epoch": 0.28, + "learning_rate": 1.4377694070133198e-07, + "loss": 0.0012, + "step": 14528 + }, + { + "epoch": 0.28, + "learning_rate": 1.4377305735699582e-07, + "loss": 0.0115, + "step": 14529 + }, + { + "epoch": 0.28, + "learning_rate": 1.437691740126597e-07, + "loss": 0.0017, + "step": 14530 + }, + { + "epoch": 0.28, + "learning_rate": 1.4376529066832354e-07, + "loss": 0.0024, + "step": 14531 + }, + { + "epoch": 0.28, + "learning_rate": 1.437614073239874e-07, + "loss": 0.0015, + "step": 14532 + }, + { + "epoch": 0.28, + "learning_rate": 1.4375752397965125e-07, + "loss": 0.0014, + "step": 14533 + }, + { + "epoch": 0.28, + "learning_rate": 1.4375364063531513e-07, + "loss": 0.008, + "step": 14534 + }, + { + "epoch": 0.28, + "learning_rate": 1.4374975729097897e-07, + "loss": 1.0566, + "step": 14535 + }, + { + "epoch": 0.28, + "learning_rate": 1.4374587394664284e-07, + "loss": 0.0017, + "step": 14536 + }, + { + "epoch": 0.28, + "learning_rate": 1.437419906023067e-07, + "loss": 0.0038, + "step": 14537 + }, + { + "epoch": 0.28, + "learning_rate": 1.4373810725797056e-07, + "loss": 0.0012, + "step": 14538 + }, + { + "epoch": 0.28, + "learning_rate": 1.437342239136344e-07, + "loss": 0.0015, + "step": 14539 + }, + { + "epoch": 0.28, + "learning_rate": 1.4373034056929828e-07, + "loss": 0.0011, + "step": 14540 + }, + { + "epoch": 0.28, + "learning_rate": 1.4372645722496212e-07, + "loss": 0.0014, + "step": 14541 + }, + { + "epoch": 0.28, + "learning_rate": 1.43722573880626e-07, + "loss": 0.0013, + "step": 14542 + }, + { + "epoch": 0.28, + "learning_rate": 1.4371869053628984e-07, + "loss": 0.0013, + "step": 14543 + }, + { + "epoch": 0.28, + "learning_rate": 1.437148071919537e-07, + "loss": 0.0061, + "step": 14544 + }, + { + "epoch": 0.28, + "learning_rate": 1.4371092384761755e-07, + "loss": 0.0013, + "step": 14545 + }, + { + "epoch": 0.28, + "learning_rate": 1.4370704050328142e-07, + "loss": 0.9806, + "step": 14546 + }, + { + "epoch": 0.28, + "learning_rate": 1.4370315715894527e-07, + "loss": 0.0011, + "step": 14547 + }, + { + "epoch": 0.28, + "learning_rate": 1.4369927381460914e-07, + "loss": 0.0211, + "step": 14548 + }, + { + "epoch": 0.28, + "learning_rate": 1.4369539047027299e-07, + "loss": 0.0016, + "step": 14549 + }, + { + "epoch": 0.28, + "learning_rate": 1.4369150712593686e-07, + "loss": 0.001, + "step": 14550 + }, + { + "epoch": 0.28, + "learning_rate": 1.436876237816007e-07, + "loss": 0.0014, + "step": 14551 + }, + { + "epoch": 0.28, + "learning_rate": 1.4368374043726457e-07, + "loss": 0.026, + "step": 14552 + }, + { + "epoch": 0.28, + "learning_rate": 1.4367985709292842e-07, + "loss": 0.0017, + "step": 14553 + }, + { + "epoch": 0.28, + "learning_rate": 1.436759737485923e-07, + "loss": 0.0011, + "step": 14554 + }, + { + "epoch": 0.28, + "learning_rate": 1.4367209040425614e-07, + "loss": 0.1692, + "step": 14555 + }, + { + "epoch": 0.28, + "learning_rate": 1.4366820705992e-07, + "loss": 0.1252, + "step": 14556 + }, + { + "epoch": 0.28, + "learning_rate": 1.4366432371558385e-07, + "loss": 0.0018, + "step": 14557 + }, + { + "epoch": 0.28, + "learning_rate": 1.4366044037124772e-07, + "loss": 0.0031, + "step": 14558 + }, + { + "epoch": 0.28, + "learning_rate": 1.4365655702691157e-07, + "loss": 0.0132, + "step": 14559 + }, + { + "epoch": 0.28, + "learning_rate": 1.4365267368257544e-07, + "loss": 0.0834, + "step": 14560 + }, + { + "epoch": 0.28, + "learning_rate": 1.4364879033823928e-07, + "loss": 0.0014, + "step": 14561 + }, + { + "epoch": 0.28, + "learning_rate": 1.4364490699390316e-07, + "loss": 0.1735, + "step": 14562 + }, + { + "epoch": 0.28, + "learning_rate": 1.43641023649567e-07, + "loss": 0.0014, + "step": 14563 + }, + { + "epoch": 0.28, + "learning_rate": 1.4363714030523087e-07, + "loss": 0.0016, + "step": 14564 + }, + { + "epoch": 0.28, + "learning_rate": 1.4363325696089472e-07, + "loss": 0.0012, + "step": 14565 + }, + { + "epoch": 0.28, + "learning_rate": 1.436293736165586e-07, + "loss": 0.0025, + "step": 14566 + }, + { + "epoch": 0.28, + "learning_rate": 1.4362549027222243e-07, + "loss": 1.1138, + "step": 14567 + }, + { + "epoch": 0.28, + "learning_rate": 1.436216069278863e-07, + "loss": 0.0018, + "step": 14568 + }, + { + "epoch": 0.28, + "learning_rate": 1.4361772358355015e-07, + "loss": 0.0015, + "step": 14569 + }, + { + "epoch": 0.28, + "learning_rate": 1.4361384023921402e-07, + "loss": 0.0014, + "step": 14570 + }, + { + "epoch": 0.28, + "learning_rate": 1.4360995689487787e-07, + "loss": 0.0089, + "step": 14571 + }, + { + "epoch": 0.28, + "learning_rate": 1.4360607355054174e-07, + "loss": 0.0012, + "step": 14572 + }, + { + "epoch": 0.28, + "learning_rate": 1.4360219020620558e-07, + "loss": 0.0019, + "step": 14573 + }, + { + "epoch": 0.28, + "learning_rate": 1.4359830686186946e-07, + "loss": 0.0012, + "step": 14574 + }, + { + "epoch": 0.28, + "learning_rate": 1.435944235175333e-07, + "loss": 0.3726, + "step": 14575 + }, + { + "epoch": 0.28, + "learning_rate": 1.4359054017319717e-07, + "loss": 0.0125, + "step": 14576 + }, + { + "epoch": 0.28, + "learning_rate": 1.4358665682886102e-07, + "loss": 0.0011, + "step": 14577 + }, + { + "epoch": 0.28, + "learning_rate": 1.435827734845249e-07, + "loss": 0.0015, + "step": 14578 + }, + { + "epoch": 0.28, + "learning_rate": 1.435788901401887e-07, + "loss": 0.001, + "step": 14579 + }, + { + "epoch": 0.28, + "learning_rate": 1.4357500679585258e-07, + "loss": 0.0014, + "step": 14580 + }, + { + "epoch": 0.28, + "learning_rate": 1.4357112345151642e-07, + "loss": 0.0013, + "step": 14581 + }, + { + "epoch": 0.28, + "learning_rate": 1.435672401071803e-07, + "loss": 0.0093, + "step": 14582 + }, + { + "epoch": 0.28, + "learning_rate": 1.4356335676284414e-07, + "loss": 0.003, + "step": 14583 + }, + { + "epoch": 0.28, + "learning_rate": 1.43559473418508e-07, + "loss": 0.0013, + "step": 14584 + }, + { + "epoch": 0.28, + "learning_rate": 1.4355559007417186e-07, + "loss": 1.0137, + "step": 14585 + }, + { + "epoch": 0.28, + "learning_rate": 1.4355170672983573e-07, + "loss": 0.3482, + "step": 14586 + }, + { + "epoch": 0.28, + "learning_rate": 1.4354782338549957e-07, + "loss": 0.0012, + "step": 14587 + }, + { + "epoch": 0.28, + "learning_rate": 1.4354394004116344e-07, + "loss": 0.0015, + "step": 14588 + }, + { + "epoch": 0.28, + "learning_rate": 1.435400566968273e-07, + "loss": 0.001, + "step": 14589 + }, + { + "epoch": 0.28, + "learning_rate": 1.4353617335249116e-07, + "loss": 0.0016, + "step": 14590 + }, + { + "epoch": 0.28, + "learning_rate": 1.43532290008155e-07, + "loss": 0.0013, + "step": 14591 + }, + { + "epoch": 0.28, + "learning_rate": 1.4352840666381888e-07, + "loss": 0.0011, + "step": 14592 + }, + { + "epoch": 0.28, + "learning_rate": 1.4352452331948272e-07, + "loss": 0.0013, + "step": 14593 + }, + { + "epoch": 0.28, + "learning_rate": 1.435206399751466e-07, + "loss": 0.0011, + "step": 14594 + }, + { + "epoch": 0.28, + "learning_rate": 1.4351675663081044e-07, + "loss": 0.0013, + "step": 14595 + }, + { + "epoch": 0.28, + "learning_rate": 1.435128732864743e-07, + "loss": 0.0108, + "step": 14596 + }, + { + "epoch": 0.28, + "learning_rate": 1.4350898994213816e-07, + "loss": 0.001, + "step": 14597 + }, + { + "epoch": 0.28, + "learning_rate": 1.4350510659780203e-07, + "loss": 0.0011, + "step": 14598 + }, + { + "epoch": 0.28, + "learning_rate": 1.4350122325346587e-07, + "loss": 0.0752, + "step": 14599 + }, + { + "epoch": 0.28, + "learning_rate": 1.4349733990912974e-07, + "loss": 0.0883, + "step": 14600 + }, + { + "epoch": 0.28, + "learning_rate": 1.434934565647936e-07, + "loss": 0.0334, + "step": 14601 + }, + { + "epoch": 0.28, + "learning_rate": 1.4348957322045746e-07, + "loss": 0.0011, + "step": 14602 + }, + { + "epoch": 0.28, + "learning_rate": 1.434856898761213e-07, + "loss": 0.0013, + "step": 14603 + }, + { + "epoch": 0.28, + "learning_rate": 1.4348180653178518e-07, + "loss": 0.0181, + "step": 14604 + }, + { + "epoch": 0.28, + "learning_rate": 1.4347792318744902e-07, + "loss": 0.0027, + "step": 14605 + }, + { + "epoch": 0.28, + "learning_rate": 1.434740398431129e-07, + "loss": 0.0012, + "step": 14606 + }, + { + "epoch": 0.28, + "learning_rate": 1.4347015649877674e-07, + "loss": 0.0018, + "step": 14607 + }, + { + "epoch": 0.28, + "learning_rate": 1.434662731544406e-07, + "loss": 0.0013, + "step": 14608 + }, + { + "epoch": 0.28, + "learning_rate": 1.4346238981010445e-07, + "loss": 0.013, + "step": 14609 + }, + { + "epoch": 0.28, + "learning_rate": 1.4345850646576833e-07, + "loss": 0.0013, + "step": 14610 + }, + { + "epoch": 0.28, + "learning_rate": 1.4345462312143217e-07, + "loss": 0.2928, + "step": 14611 + }, + { + "epoch": 0.28, + "learning_rate": 1.4345073977709604e-07, + "loss": 0.0014, + "step": 14612 + }, + { + "epoch": 0.28, + "learning_rate": 1.434468564327599e-07, + "loss": 0.0254, + "step": 14613 + }, + { + "epoch": 0.28, + "learning_rate": 1.4344297308842376e-07, + "loss": 0.0033, + "step": 14614 + }, + { + "epoch": 0.28, + "learning_rate": 1.434390897440876e-07, + "loss": 0.385, + "step": 14615 + }, + { + "epoch": 0.28, + "learning_rate": 1.4343520639975148e-07, + "loss": 0.0012, + "step": 14616 + }, + { + "epoch": 0.28, + "learning_rate": 1.4343132305541532e-07, + "loss": 0.001, + "step": 14617 + }, + { + "epoch": 0.28, + "learning_rate": 1.434274397110792e-07, + "loss": 0.0043, + "step": 14618 + }, + { + "epoch": 0.28, + "learning_rate": 1.4342355636674304e-07, + "loss": 0.0575, + "step": 14619 + }, + { + "epoch": 0.28, + "learning_rate": 1.434196730224069e-07, + "loss": 0.3924, + "step": 14620 + }, + { + "epoch": 0.28, + "learning_rate": 1.4341578967807075e-07, + "loss": 0.001, + "step": 14621 + }, + { + "epoch": 0.28, + "learning_rate": 1.434119063337346e-07, + "loss": 0.0013, + "step": 14622 + }, + { + "epoch": 0.28, + "learning_rate": 1.4340802298939847e-07, + "loss": 0.0014, + "step": 14623 + }, + { + "epoch": 0.28, + "learning_rate": 1.4340413964506231e-07, + "loss": 0.0012, + "step": 14624 + }, + { + "epoch": 0.28, + "learning_rate": 1.4340025630072619e-07, + "loss": 0.0012, + "step": 14625 + }, + { + "epoch": 0.28, + "learning_rate": 1.4339637295639003e-07, + "loss": 0.0017, + "step": 14626 + }, + { + "epoch": 0.28, + "learning_rate": 1.433924896120539e-07, + "loss": 0.0012, + "step": 14627 + }, + { + "epoch": 0.28, + "learning_rate": 1.4338860626771775e-07, + "loss": 0.0011, + "step": 14628 + }, + { + "epoch": 0.28, + "learning_rate": 1.4338472292338162e-07, + "loss": 0.0023, + "step": 14629 + }, + { + "epoch": 0.28, + "learning_rate": 1.4338083957904546e-07, + "loss": 0.0988, + "step": 14630 + }, + { + "epoch": 0.28, + "learning_rate": 1.4337695623470934e-07, + "loss": 0.002, + "step": 14631 + }, + { + "epoch": 0.28, + "learning_rate": 1.4337307289037318e-07, + "loss": 0.0014, + "step": 14632 + }, + { + "epoch": 0.28, + "learning_rate": 1.4336918954603705e-07, + "loss": 0.9651, + "step": 14633 + }, + { + "epoch": 0.28, + "learning_rate": 1.433653062017009e-07, + "loss": 0.0015, + "step": 14634 + }, + { + "epoch": 0.28, + "learning_rate": 1.4336142285736477e-07, + "loss": 0.0015, + "step": 14635 + }, + { + "epoch": 0.28, + "learning_rate": 1.4335753951302861e-07, + "loss": 0.0019, + "step": 14636 + }, + { + "epoch": 0.28, + "learning_rate": 1.4335365616869246e-07, + "loss": 0.3877, + "step": 14637 + }, + { + "epoch": 0.28, + "learning_rate": 1.4334977282435633e-07, + "loss": 0.0013, + "step": 14638 + }, + { + "epoch": 0.28, + "learning_rate": 1.4334588948002018e-07, + "loss": 0.0015, + "step": 14639 + }, + { + "epoch": 0.28, + "learning_rate": 1.4334200613568405e-07, + "loss": 0.0021, + "step": 14640 + }, + { + "epoch": 0.28, + "learning_rate": 1.433381227913479e-07, + "loss": 0.3004, + "step": 14641 + }, + { + "epoch": 0.28, + "learning_rate": 1.4333423944701176e-07, + "loss": 0.0013, + "step": 14642 + }, + { + "epoch": 0.28, + "learning_rate": 1.433303561026756e-07, + "loss": 0.0014, + "step": 14643 + }, + { + "epoch": 0.28, + "learning_rate": 1.4332647275833948e-07, + "loss": 0.0009, + "step": 14644 + }, + { + "epoch": 0.28, + "learning_rate": 1.4332258941400332e-07, + "loss": 0.0042, + "step": 14645 + }, + { + "epoch": 0.28, + "learning_rate": 1.433187060696672e-07, + "loss": 0.001, + "step": 14646 + }, + { + "epoch": 0.28, + "learning_rate": 1.4331482272533104e-07, + "loss": 0.6158, + "step": 14647 + }, + { + "epoch": 0.28, + "learning_rate": 1.433109393809949e-07, + "loss": 0.0017, + "step": 14648 + }, + { + "epoch": 0.28, + "learning_rate": 1.4330705603665876e-07, + "loss": 0.3084, + "step": 14649 + }, + { + "epoch": 0.28, + "learning_rate": 1.4330317269232263e-07, + "loss": 0.0033, + "step": 14650 + }, + { + "epoch": 0.28, + "learning_rate": 1.4329928934798647e-07, + "loss": 0.0011, + "step": 14651 + }, + { + "epoch": 0.28, + "learning_rate": 1.4329540600365032e-07, + "loss": 0.0018, + "step": 14652 + }, + { + "epoch": 0.28, + "learning_rate": 1.432915226593142e-07, + "loss": 0.2526, + "step": 14653 + }, + { + "epoch": 0.28, + "learning_rate": 1.4328763931497804e-07, + "loss": 0.0017, + "step": 14654 + }, + { + "epoch": 0.28, + "learning_rate": 1.432837559706419e-07, + "loss": 0.0012, + "step": 14655 + }, + { + "epoch": 0.28, + "learning_rate": 1.4327987262630575e-07, + "loss": 0.471, + "step": 14656 + }, + { + "epoch": 0.28, + "learning_rate": 1.4327598928196962e-07, + "loss": 0.0012, + "step": 14657 + }, + { + "epoch": 0.28, + "learning_rate": 1.4327210593763347e-07, + "loss": 0.0014, + "step": 14658 + }, + { + "epoch": 0.28, + "learning_rate": 1.4326822259329734e-07, + "loss": 0.3336, + "step": 14659 + }, + { + "epoch": 0.28, + "learning_rate": 1.4326433924896118e-07, + "loss": 0.0014, + "step": 14660 + }, + { + "epoch": 0.28, + "learning_rate": 1.4326045590462506e-07, + "loss": 0.0012, + "step": 14661 + }, + { + "epoch": 0.28, + "learning_rate": 1.432565725602889e-07, + "loss": 0.0046, + "step": 14662 + }, + { + "epoch": 0.28, + "learning_rate": 1.4325268921595277e-07, + "loss": 0.0012, + "step": 14663 + }, + { + "epoch": 0.28, + "learning_rate": 1.4324880587161662e-07, + "loss": 0.001, + "step": 14664 + }, + { + "epoch": 0.28, + "learning_rate": 1.432449225272805e-07, + "loss": 0.6287, + "step": 14665 + }, + { + "epoch": 0.28, + "learning_rate": 1.4324103918294433e-07, + "loss": 0.1738, + "step": 14666 + }, + { + "epoch": 0.28, + "learning_rate": 1.432371558386082e-07, + "loss": 0.0009, + "step": 14667 + }, + { + "epoch": 0.28, + "learning_rate": 1.4323327249427205e-07, + "loss": 0.0015, + "step": 14668 + }, + { + "epoch": 0.28, + "learning_rate": 1.4322938914993592e-07, + "loss": 0.0012, + "step": 14669 + }, + { + "epoch": 0.28, + "learning_rate": 1.4322550580559977e-07, + "loss": 0.0016, + "step": 14670 + }, + { + "epoch": 0.28, + "learning_rate": 1.4322162246126364e-07, + "loss": 0.0013, + "step": 14671 + }, + { + "epoch": 0.28, + "learning_rate": 1.4321773911692748e-07, + "loss": 0.0015, + "step": 14672 + }, + { + "epoch": 0.28, + "learning_rate": 1.4321385577259136e-07, + "loss": 0.0014, + "step": 14673 + }, + { + "epoch": 0.28, + "learning_rate": 1.432099724282552e-07, + "loss": 0.0013, + "step": 14674 + }, + { + "epoch": 0.28, + "learning_rate": 1.4320608908391907e-07, + "loss": 0.0012, + "step": 14675 + }, + { + "epoch": 0.28, + "learning_rate": 1.4320220573958292e-07, + "loss": 0.0012, + "step": 14676 + }, + { + "epoch": 0.28, + "learning_rate": 1.431983223952468e-07, + "loss": 0.0011, + "step": 14677 + }, + { + "epoch": 0.28, + "learning_rate": 1.4319443905091063e-07, + "loss": 0.0021, + "step": 14678 + }, + { + "epoch": 0.28, + "learning_rate": 1.431905557065745e-07, + "loss": 0.0012, + "step": 14679 + }, + { + "epoch": 0.28, + "learning_rate": 1.4318667236223835e-07, + "loss": 0.0104, + "step": 14680 + }, + { + "epoch": 0.28, + "learning_rate": 1.4318278901790222e-07, + "loss": 0.62, + "step": 14681 + }, + { + "epoch": 0.28, + "learning_rate": 1.4317890567356607e-07, + "loss": 0.7488, + "step": 14682 + }, + { + "epoch": 0.28, + "learning_rate": 1.4317502232922994e-07, + "loss": 0.0033, + "step": 14683 + }, + { + "epoch": 0.28, + "learning_rate": 1.4317113898489378e-07, + "loss": 0.0018, + "step": 14684 + }, + { + "epoch": 0.28, + "learning_rate": 1.4316725564055765e-07, + "loss": 0.0019, + "step": 14685 + }, + { + "epoch": 0.28, + "learning_rate": 1.431633722962215e-07, + "loss": 0.0019, + "step": 14686 + }, + { + "epoch": 0.28, + "learning_rate": 1.4315948895188537e-07, + "loss": 0.0014, + "step": 14687 + }, + { + "epoch": 0.28, + "learning_rate": 1.4315560560754922e-07, + "loss": 0.0012, + "step": 14688 + }, + { + "epoch": 0.28, + "learning_rate": 1.431517222632131e-07, + "loss": 0.0049, + "step": 14689 + }, + { + "epoch": 0.28, + "learning_rate": 1.4314783891887693e-07, + "loss": 0.0029, + "step": 14690 + }, + { + "epoch": 0.28, + "learning_rate": 1.431439555745408e-07, + "loss": 0.0013, + "step": 14691 + }, + { + "epoch": 0.28, + "learning_rate": 1.4314007223020465e-07, + "loss": 0.0011, + "step": 14692 + }, + { + "epoch": 0.29, + "learning_rate": 1.4313618888586852e-07, + "loss": 0.001, + "step": 14693 + }, + { + "epoch": 0.29, + "learning_rate": 1.4313230554153237e-07, + "loss": 0.0032, + "step": 14694 + }, + { + "epoch": 0.29, + "learning_rate": 1.431284221971962e-07, + "loss": 0.007, + "step": 14695 + }, + { + "epoch": 0.29, + "learning_rate": 1.4312453885286006e-07, + "loss": 0.0011, + "step": 14696 + }, + { + "epoch": 0.29, + "learning_rate": 1.4312065550852393e-07, + "loss": 0.0139, + "step": 14697 + }, + { + "epoch": 0.29, + "learning_rate": 1.4311677216418777e-07, + "loss": 0.0017, + "step": 14698 + }, + { + "epoch": 0.29, + "learning_rate": 1.4311288881985164e-07, + "loss": 0.0014, + "step": 14699 + }, + { + "epoch": 0.29, + "learning_rate": 1.431090054755155e-07, + "loss": 0.9432, + "step": 14700 + }, + { + "epoch": 0.29, + "learning_rate": 1.4310512213117936e-07, + "loss": 0.0017, + "step": 14701 + }, + { + "epoch": 0.29, + "learning_rate": 1.431012387868432e-07, + "loss": 0.0015, + "step": 14702 + }, + { + "epoch": 0.29, + "learning_rate": 1.4309735544250708e-07, + "loss": 0.0016, + "step": 14703 + }, + { + "epoch": 0.29, + "learning_rate": 1.4309347209817092e-07, + "loss": 0.0013, + "step": 14704 + }, + { + "epoch": 0.29, + "learning_rate": 1.430895887538348e-07, + "loss": 0.0014, + "step": 14705 + }, + { + "epoch": 0.29, + "learning_rate": 1.4308570540949864e-07, + "loss": 0.0329, + "step": 14706 + }, + { + "epoch": 0.29, + "learning_rate": 1.430818220651625e-07, + "loss": 0.0082, + "step": 14707 + }, + { + "epoch": 0.29, + "learning_rate": 1.4307793872082635e-07, + "loss": 0.0012, + "step": 14708 + }, + { + "epoch": 0.29, + "learning_rate": 1.4307405537649023e-07, + "loss": 0.0013, + "step": 14709 + }, + { + "epoch": 0.29, + "learning_rate": 1.4307017203215407e-07, + "loss": 0.8286, + "step": 14710 + }, + { + "epoch": 0.29, + "learning_rate": 1.4306628868781794e-07, + "loss": 0.0013, + "step": 14711 + }, + { + "epoch": 0.29, + "learning_rate": 1.430624053434818e-07, + "loss": 0.0014, + "step": 14712 + }, + { + "epoch": 0.29, + "learning_rate": 1.4305852199914566e-07, + "loss": 0.0012, + "step": 14713 + }, + { + "epoch": 0.29, + "learning_rate": 1.430546386548095e-07, + "loss": 0.0032, + "step": 14714 + }, + { + "epoch": 0.29, + "learning_rate": 1.4305075531047338e-07, + "loss": 0.0015, + "step": 14715 + }, + { + "epoch": 0.29, + "learning_rate": 1.4304687196613722e-07, + "loss": 0.0014, + "step": 14716 + }, + { + "epoch": 0.29, + "learning_rate": 1.430429886218011e-07, + "loss": 0.0016, + "step": 14717 + }, + { + "epoch": 0.29, + "learning_rate": 1.4303910527746494e-07, + "loss": 0.001, + "step": 14718 + }, + { + "epoch": 0.29, + "learning_rate": 1.430352219331288e-07, + "loss": 0.003, + "step": 14719 + }, + { + "epoch": 0.29, + "learning_rate": 1.4303133858879265e-07, + "loss": 0.001, + "step": 14720 + }, + { + "epoch": 0.29, + "learning_rate": 1.4302745524445652e-07, + "loss": 0.0223, + "step": 14721 + }, + { + "epoch": 0.29, + "learning_rate": 1.4302357190012037e-07, + "loss": 0.0034, + "step": 14722 + }, + { + "epoch": 0.29, + "learning_rate": 1.4301968855578424e-07, + "loss": 0.0211, + "step": 14723 + }, + { + "epoch": 0.29, + "learning_rate": 1.4301580521144809e-07, + "loss": 0.0037, + "step": 14724 + }, + { + "epoch": 0.29, + "learning_rate": 1.4301192186711196e-07, + "loss": 0.0027, + "step": 14725 + }, + { + "epoch": 0.29, + "learning_rate": 1.430080385227758e-07, + "loss": 0.2412, + "step": 14726 + }, + { + "epoch": 0.29, + "learning_rate": 1.4300415517843967e-07, + "loss": 0.0013, + "step": 14727 + }, + { + "epoch": 0.29, + "learning_rate": 1.4300027183410352e-07, + "loss": 0.0037, + "step": 14728 + }, + { + "epoch": 0.29, + "learning_rate": 1.429963884897674e-07, + "loss": 1.308, + "step": 14729 + }, + { + "epoch": 0.29, + "learning_rate": 1.4299250514543124e-07, + "loss": 0.0011, + "step": 14730 + }, + { + "epoch": 0.29, + "learning_rate": 1.429886218010951e-07, + "loss": 0.0044, + "step": 14731 + }, + { + "epoch": 0.29, + "learning_rate": 1.4298473845675895e-07, + "loss": 0.0031, + "step": 14732 + }, + { + "epoch": 0.29, + "learning_rate": 1.4298085511242282e-07, + "loss": 0.0016, + "step": 14733 + }, + { + "epoch": 0.29, + "learning_rate": 1.4297697176808667e-07, + "loss": 0.0018, + "step": 14734 + }, + { + "epoch": 0.29, + "learning_rate": 1.4297308842375054e-07, + "loss": 0.0011, + "step": 14735 + }, + { + "epoch": 0.29, + "learning_rate": 1.4296920507941439e-07, + "loss": 0.0015, + "step": 14736 + }, + { + "epoch": 0.29, + "learning_rate": 1.4296532173507826e-07, + "loss": 0.0217, + "step": 14737 + }, + { + "epoch": 0.29, + "learning_rate": 1.429614383907421e-07, + "loss": 0.0016, + "step": 14738 + }, + { + "epoch": 0.29, + "learning_rate": 1.4295755504640597e-07, + "loss": 0.0014, + "step": 14739 + }, + { + "epoch": 0.29, + "learning_rate": 1.4295367170206982e-07, + "loss": 0.0013, + "step": 14740 + }, + { + "epoch": 0.29, + "learning_rate": 1.429497883577337e-07, + "loss": 0.0052, + "step": 14741 + }, + { + "epoch": 0.29, + "learning_rate": 1.4294590501339753e-07, + "loss": 0.0026, + "step": 14742 + }, + { + "epoch": 0.29, + "learning_rate": 1.429420216690614e-07, + "loss": 0.4309, + "step": 14743 + }, + { + "epoch": 0.29, + "learning_rate": 1.4293813832472525e-07, + "loss": 0.004, + "step": 14744 + }, + { + "epoch": 0.29, + "learning_rate": 1.4293425498038912e-07, + "loss": 0.002, + "step": 14745 + }, + { + "epoch": 0.29, + "learning_rate": 1.4293037163605297e-07, + "loss": 0.0027, + "step": 14746 + }, + { + "epoch": 0.29, + "learning_rate": 1.4292648829171684e-07, + "loss": 0.0025, + "step": 14747 + }, + { + "epoch": 0.29, + "learning_rate": 1.4292260494738068e-07, + "loss": 0.0184, + "step": 14748 + }, + { + "epoch": 0.29, + "learning_rate": 1.4291872160304456e-07, + "loss": 1.2243, + "step": 14749 + }, + { + "epoch": 0.29, + "learning_rate": 1.429148382587084e-07, + "loss": 0.0014, + "step": 14750 + }, + { + "epoch": 0.29, + "learning_rate": 1.4291095491437227e-07, + "loss": 0.0012, + "step": 14751 + }, + { + "epoch": 0.29, + "learning_rate": 1.4290707157003612e-07, + "loss": 0.0015, + "step": 14752 + }, + { + "epoch": 0.29, + "learning_rate": 1.4290318822569996e-07, + "loss": 0.3238, + "step": 14753 + }, + { + "epoch": 0.29, + "learning_rate": 1.428993048813638e-07, + "loss": 0.0358, + "step": 14754 + }, + { + "epoch": 0.29, + "learning_rate": 1.4289542153702768e-07, + "loss": 0.0018, + "step": 14755 + }, + { + "epoch": 0.29, + "learning_rate": 1.4289153819269152e-07, + "loss": 0.0012, + "step": 14756 + }, + { + "epoch": 0.29, + "learning_rate": 1.428876548483554e-07, + "loss": 0.0014, + "step": 14757 + }, + { + "epoch": 0.29, + "learning_rate": 1.4288377150401924e-07, + "loss": 0.0013, + "step": 14758 + }, + { + "epoch": 0.29, + "learning_rate": 1.428798881596831e-07, + "loss": 0.3638, + "step": 14759 + }, + { + "epoch": 0.29, + "learning_rate": 1.4287600481534696e-07, + "loss": 0.0016, + "step": 14760 + }, + { + "epoch": 0.29, + "learning_rate": 1.4287212147101083e-07, + "loss": 0.0059, + "step": 14761 + }, + { + "epoch": 0.29, + "learning_rate": 1.4286823812667467e-07, + "loss": 0.7538, + "step": 14762 + }, + { + "epoch": 0.29, + "learning_rate": 1.4286435478233854e-07, + "loss": 0.0016, + "step": 14763 + }, + { + "epoch": 0.29, + "learning_rate": 1.428604714380024e-07, + "loss": 0.0012, + "step": 14764 + }, + { + "epoch": 0.29, + "learning_rate": 1.4285658809366626e-07, + "loss": 0.0023, + "step": 14765 + }, + { + "epoch": 0.29, + "learning_rate": 1.428527047493301e-07, + "loss": 0.0011, + "step": 14766 + }, + { + "epoch": 0.29, + "learning_rate": 1.4284882140499398e-07, + "loss": 0.0216, + "step": 14767 + }, + { + "epoch": 0.29, + "learning_rate": 1.4284493806065782e-07, + "loss": 0.0012, + "step": 14768 + }, + { + "epoch": 0.29, + "learning_rate": 1.428410547163217e-07, + "loss": 0.0014, + "step": 14769 + }, + { + "epoch": 0.29, + "learning_rate": 1.4283717137198554e-07, + "loss": 0.0022, + "step": 14770 + }, + { + "epoch": 0.29, + "learning_rate": 1.428332880276494e-07, + "loss": 0.0011, + "step": 14771 + }, + { + "epoch": 0.29, + "learning_rate": 1.4282940468331326e-07, + "loss": 0.0012, + "step": 14772 + }, + { + "epoch": 0.29, + "learning_rate": 1.4282552133897713e-07, + "loss": 0.0011, + "step": 14773 + }, + { + "epoch": 0.29, + "learning_rate": 1.4282163799464097e-07, + "loss": 0.002, + "step": 14774 + }, + { + "epoch": 0.29, + "learning_rate": 1.4281775465030484e-07, + "loss": 0.0015, + "step": 14775 + }, + { + "epoch": 0.29, + "learning_rate": 1.428138713059687e-07, + "loss": 0.0009, + "step": 14776 + }, + { + "epoch": 0.29, + "learning_rate": 1.4280998796163256e-07, + "loss": 0.3604, + "step": 14777 + }, + { + "epoch": 0.29, + "learning_rate": 1.428061046172964e-07, + "loss": 0.0014, + "step": 14778 + }, + { + "epoch": 0.29, + "learning_rate": 1.4280222127296028e-07, + "loss": 0.1125, + "step": 14779 + }, + { + "epoch": 0.29, + "learning_rate": 1.4279833792862412e-07, + "loss": 0.0013, + "step": 14780 + }, + { + "epoch": 0.29, + "learning_rate": 1.42794454584288e-07, + "loss": 0.0012, + "step": 14781 + }, + { + "epoch": 0.29, + "learning_rate": 1.4279057123995184e-07, + "loss": 0.0151, + "step": 14782 + }, + { + "epoch": 0.29, + "learning_rate": 1.427866878956157e-07, + "loss": 0.0011, + "step": 14783 + }, + { + "epoch": 0.29, + "learning_rate": 1.4278280455127955e-07, + "loss": 0.0016, + "step": 14784 + }, + { + "epoch": 0.29, + "learning_rate": 1.4277892120694343e-07, + "loss": 0.0013, + "step": 14785 + }, + { + "epoch": 0.29, + "learning_rate": 1.4277503786260727e-07, + "loss": 0.0011, + "step": 14786 + }, + { + "epoch": 0.29, + "learning_rate": 1.4277115451827114e-07, + "loss": 0.001, + "step": 14787 + }, + { + "epoch": 0.29, + "learning_rate": 1.42767271173935e-07, + "loss": 0.2792, + "step": 14788 + }, + { + "epoch": 0.29, + "learning_rate": 1.4276338782959886e-07, + "loss": 0.0014, + "step": 14789 + }, + { + "epoch": 0.29, + "learning_rate": 1.427595044852627e-07, + "loss": 0.001, + "step": 14790 + }, + { + "epoch": 0.29, + "learning_rate": 1.4275562114092658e-07, + "loss": 0.0014, + "step": 14791 + }, + { + "epoch": 0.29, + "learning_rate": 1.4275173779659042e-07, + "loss": 0.8753, + "step": 14792 + }, + { + "epoch": 0.29, + "learning_rate": 1.427478544522543e-07, + "loss": 0.0014, + "step": 14793 + }, + { + "epoch": 0.29, + "learning_rate": 1.4274397110791814e-07, + "loss": 0.0017, + "step": 14794 + }, + { + "epoch": 0.29, + "learning_rate": 1.42740087763582e-07, + "loss": 0.002, + "step": 14795 + }, + { + "epoch": 0.29, + "learning_rate": 1.4273620441924585e-07, + "loss": 0.0022, + "step": 14796 + }, + { + "epoch": 0.29, + "learning_rate": 1.4273232107490972e-07, + "loss": 0.0012, + "step": 14797 + }, + { + "epoch": 0.29, + "learning_rate": 1.4272843773057357e-07, + "loss": 0.2224, + "step": 14798 + }, + { + "epoch": 0.29, + "learning_rate": 1.4272455438623741e-07, + "loss": 0.0011, + "step": 14799 + }, + { + "epoch": 0.29, + "learning_rate": 1.4272067104190129e-07, + "loss": 0.0012, + "step": 14800 + }, + { + "epoch": 0.29, + "learning_rate": 1.4271678769756513e-07, + "loss": 0.011, + "step": 14801 + }, + { + "epoch": 0.29, + "learning_rate": 1.42712904353229e-07, + "loss": 0.0011, + "step": 14802 + }, + { + "epoch": 0.29, + "learning_rate": 1.4270902100889285e-07, + "loss": 0.001, + "step": 14803 + }, + { + "epoch": 0.29, + "learning_rate": 1.4270513766455672e-07, + "loss": 0.0012, + "step": 14804 + }, + { + "epoch": 0.29, + "learning_rate": 1.4270125432022056e-07, + "loss": 0.0553, + "step": 14805 + }, + { + "epoch": 0.29, + "learning_rate": 1.4269737097588444e-07, + "loss": 0.0023, + "step": 14806 + }, + { + "epoch": 0.29, + "learning_rate": 1.4269348763154828e-07, + "loss": 0.0016, + "step": 14807 + }, + { + "epoch": 0.29, + "learning_rate": 1.4268960428721215e-07, + "loss": 0.0012, + "step": 14808 + }, + { + "epoch": 0.29, + "learning_rate": 1.42685720942876e-07, + "loss": 0.2814, + "step": 14809 + }, + { + "epoch": 0.29, + "learning_rate": 1.4268183759853987e-07, + "loss": 0.0018, + "step": 14810 + }, + { + "epoch": 0.29, + "learning_rate": 1.4267795425420371e-07, + "loss": 0.0013, + "step": 14811 + }, + { + "epoch": 0.29, + "learning_rate": 1.4267407090986756e-07, + "loss": 0.0026, + "step": 14812 + }, + { + "epoch": 0.29, + "learning_rate": 1.4267018756553143e-07, + "loss": 0.0034, + "step": 14813 + }, + { + "epoch": 0.29, + "learning_rate": 1.4266630422119528e-07, + "loss": 0.0014, + "step": 14814 + }, + { + "epoch": 0.29, + "learning_rate": 1.4266242087685915e-07, + "loss": 1.1575, + "step": 14815 + }, + { + "epoch": 0.29, + "learning_rate": 1.42658537532523e-07, + "loss": 0.0012, + "step": 14816 + }, + { + "epoch": 0.29, + "learning_rate": 1.4265465418818686e-07, + "loss": 0.0298, + "step": 14817 + }, + { + "epoch": 0.29, + "learning_rate": 1.426507708438507e-07, + "loss": 0.0125, + "step": 14818 + }, + { + "epoch": 0.29, + "learning_rate": 1.4264688749951458e-07, + "loss": 0.0011, + "step": 14819 + }, + { + "epoch": 0.29, + "learning_rate": 1.4264300415517842e-07, + "loss": 0.0013, + "step": 14820 + }, + { + "epoch": 0.29, + "learning_rate": 1.426391208108423e-07, + "loss": 0.0021, + "step": 14821 + }, + { + "epoch": 0.29, + "learning_rate": 1.4263523746650614e-07, + "loss": 0.0601, + "step": 14822 + }, + { + "epoch": 0.29, + "learning_rate": 1.4263135412217e-07, + "loss": 0.0355, + "step": 14823 + }, + { + "epoch": 0.29, + "learning_rate": 1.4262747077783386e-07, + "loss": 0.0015, + "step": 14824 + }, + { + "epoch": 0.29, + "learning_rate": 1.4262358743349773e-07, + "loss": 0.0012, + "step": 14825 + }, + { + "epoch": 0.29, + "learning_rate": 1.4261970408916157e-07, + "loss": 0.001, + "step": 14826 + }, + { + "epoch": 0.29, + "learning_rate": 1.4261582074482545e-07, + "loss": 0.0065, + "step": 14827 + }, + { + "epoch": 0.29, + "learning_rate": 1.426119374004893e-07, + "loss": 0.0011, + "step": 14828 + }, + { + "epoch": 0.29, + "learning_rate": 1.4260805405615314e-07, + "loss": 0.0013, + "step": 14829 + }, + { + "epoch": 0.29, + "learning_rate": 1.42604170711817e-07, + "loss": 0.0015, + "step": 14830 + }, + { + "epoch": 0.29, + "learning_rate": 1.4260028736748085e-07, + "loss": 0.0017, + "step": 14831 + }, + { + "epoch": 0.29, + "learning_rate": 1.4259640402314472e-07, + "loss": 0.155, + "step": 14832 + }, + { + "epoch": 0.29, + "learning_rate": 1.4259252067880857e-07, + "loss": 0.0011, + "step": 14833 + }, + { + "epoch": 0.29, + "learning_rate": 1.4258863733447244e-07, + "loss": 0.0016, + "step": 14834 + }, + { + "epoch": 0.29, + "learning_rate": 1.4258475399013629e-07, + "loss": 0.0011, + "step": 14835 + }, + { + "epoch": 0.29, + "learning_rate": 1.4258087064580016e-07, + "loss": 0.0014, + "step": 14836 + }, + { + "epoch": 0.29, + "learning_rate": 1.42576987301464e-07, + "loss": 0.001, + "step": 14837 + }, + { + "epoch": 0.29, + "learning_rate": 1.4257310395712787e-07, + "loss": 0.0011, + "step": 14838 + }, + { + "epoch": 0.29, + "learning_rate": 1.4256922061279172e-07, + "loss": 0.0017, + "step": 14839 + }, + { + "epoch": 0.29, + "learning_rate": 1.425653372684556e-07, + "loss": 0.002, + "step": 14840 + }, + { + "epoch": 0.29, + "learning_rate": 1.4256145392411943e-07, + "loss": 0.002, + "step": 14841 + }, + { + "epoch": 0.29, + "learning_rate": 1.425575705797833e-07, + "loss": 0.0013, + "step": 14842 + }, + { + "epoch": 0.29, + "learning_rate": 1.4255368723544715e-07, + "loss": 0.0018, + "step": 14843 + }, + { + "epoch": 0.29, + "learning_rate": 1.4254980389111102e-07, + "loss": 0.0012, + "step": 14844 + }, + { + "epoch": 0.29, + "learning_rate": 1.4254592054677487e-07, + "loss": 0.0032, + "step": 14845 + }, + { + "epoch": 0.29, + "learning_rate": 1.4254203720243874e-07, + "loss": 0.0011, + "step": 14846 + }, + { + "epoch": 0.29, + "learning_rate": 1.4253815385810258e-07, + "loss": 0.0012, + "step": 14847 + }, + { + "epoch": 0.29, + "learning_rate": 1.4253427051376646e-07, + "loss": 0.2249, + "step": 14848 + }, + { + "epoch": 0.29, + "learning_rate": 1.425303871694303e-07, + "loss": 0.0013, + "step": 14849 + }, + { + "epoch": 0.29, + "learning_rate": 1.4252650382509417e-07, + "loss": 0.0014, + "step": 14850 + }, + { + "epoch": 0.29, + "learning_rate": 1.4252262048075802e-07, + "loss": 0.0061, + "step": 14851 + }, + { + "epoch": 0.29, + "learning_rate": 1.425187371364219e-07, + "loss": 0.0299, + "step": 14852 + }, + { + "epoch": 0.29, + "learning_rate": 1.4251485379208573e-07, + "loss": 0.4855, + "step": 14853 + }, + { + "epoch": 0.29, + "learning_rate": 1.425109704477496e-07, + "loss": 0.0015, + "step": 14854 + }, + { + "epoch": 0.29, + "learning_rate": 1.4250708710341345e-07, + "loss": 0.0013, + "step": 14855 + }, + { + "epoch": 0.29, + "learning_rate": 1.4250320375907732e-07, + "loss": 0.0063, + "step": 14856 + }, + { + "epoch": 0.29, + "learning_rate": 1.4249932041474117e-07, + "loss": 0.0011, + "step": 14857 + }, + { + "epoch": 0.29, + "learning_rate": 1.4249543707040504e-07, + "loss": 0.0014, + "step": 14858 + }, + { + "epoch": 0.29, + "learning_rate": 1.4249155372606888e-07, + "loss": 0.0012, + "step": 14859 + }, + { + "epoch": 0.29, + "learning_rate": 1.4248767038173275e-07, + "loss": 0.7166, + "step": 14860 + }, + { + "epoch": 0.29, + "learning_rate": 1.424837870373966e-07, + "loss": 0.1215, + "step": 14861 + }, + { + "epoch": 0.29, + "learning_rate": 1.4247990369306047e-07, + "loss": 0.0018, + "step": 14862 + }, + { + "epoch": 0.29, + "learning_rate": 1.4247602034872432e-07, + "loss": 0.0018, + "step": 14863 + }, + { + "epoch": 0.29, + "learning_rate": 1.424721370043882e-07, + "loss": 0.0019, + "step": 14864 + }, + { + "epoch": 0.29, + "learning_rate": 1.4246825366005203e-07, + "loss": 0.0011, + "step": 14865 + }, + { + "epoch": 0.29, + "learning_rate": 1.424643703157159e-07, + "loss": 0.0026, + "step": 14866 + }, + { + "epoch": 0.29, + "learning_rate": 1.4246048697137975e-07, + "loss": 0.1908, + "step": 14867 + }, + { + "epoch": 0.29, + "learning_rate": 1.4245660362704362e-07, + "loss": 0.0015, + "step": 14868 + }, + { + "epoch": 0.29, + "learning_rate": 1.4245272028270744e-07, + "loss": 0.0013, + "step": 14869 + }, + { + "epoch": 0.29, + "learning_rate": 1.424488369383713e-07, + "loss": 0.0017, + "step": 14870 + }, + { + "epoch": 0.29, + "learning_rate": 1.4244495359403516e-07, + "loss": 0.4204, + "step": 14871 + }, + { + "epoch": 0.29, + "learning_rate": 1.4244107024969903e-07, + "loss": 0.0013, + "step": 14872 + }, + { + "epoch": 0.29, + "learning_rate": 1.4243718690536287e-07, + "loss": 0.0043, + "step": 14873 + }, + { + "epoch": 0.29, + "learning_rate": 1.4243330356102674e-07, + "loss": 0.0018, + "step": 14874 + }, + { + "epoch": 0.29, + "learning_rate": 1.424294202166906e-07, + "loss": 0.4606, + "step": 14875 + }, + { + "epoch": 0.29, + "learning_rate": 1.4242553687235446e-07, + "loss": 0.3001, + "step": 14876 + }, + { + "epoch": 0.29, + "learning_rate": 1.424216535280183e-07, + "loss": 0.0013, + "step": 14877 + }, + { + "epoch": 0.29, + "learning_rate": 1.4241777018368218e-07, + "loss": 0.0014, + "step": 14878 + }, + { + "epoch": 0.29, + "learning_rate": 1.4241388683934602e-07, + "loss": 0.9828, + "step": 14879 + }, + { + "epoch": 0.29, + "learning_rate": 1.424100034950099e-07, + "loss": 0.8084, + "step": 14880 + }, + { + "epoch": 0.29, + "learning_rate": 1.4240612015067374e-07, + "loss": 0.0297, + "step": 14881 + }, + { + "epoch": 0.29, + "learning_rate": 1.424022368063376e-07, + "loss": 0.0044, + "step": 14882 + }, + { + "epoch": 0.29, + "learning_rate": 1.4239835346200145e-07, + "loss": 0.0015, + "step": 14883 + }, + { + "epoch": 0.29, + "learning_rate": 1.4239447011766533e-07, + "loss": 0.0016, + "step": 14884 + }, + { + "epoch": 0.29, + "learning_rate": 1.4239058677332917e-07, + "loss": 0.0024, + "step": 14885 + }, + { + "epoch": 0.29, + "learning_rate": 1.4238670342899304e-07, + "loss": 0.0029, + "step": 14886 + }, + { + "epoch": 0.29, + "learning_rate": 1.423828200846569e-07, + "loss": 0.0034, + "step": 14887 + }, + { + "epoch": 0.29, + "learning_rate": 1.4237893674032076e-07, + "loss": 0.0017, + "step": 14888 + }, + { + "epoch": 0.29, + "learning_rate": 1.423750533959846e-07, + "loss": 0.0297, + "step": 14889 + }, + { + "epoch": 0.29, + "learning_rate": 1.4237117005164848e-07, + "loss": 0.0013, + "step": 14890 + }, + { + "epoch": 0.29, + "learning_rate": 1.4236728670731232e-07, + "loss": 0.0011, + "step": 14891 + }, + { + "epoch": 0.29, + "learning_rate": 1.423634033629762e-07, + "loss": 0.526, + "step": 14892 + }, + { + "epoch": 0.29, + "learning_rate": 1.4235952001864004e-07, + "loss": 0.0024, + "step": 14893 + }, + { + "epoch": 0.29, + "learning_rate": 1.423556366743039e-07, + "loss": 0.0012, + "step": 14894 + }, + { + "epoch": 0.29, + "learning_rate": 1.4235175332996775e-07, + "loss": 0.0012, + "step": 14895 + }, + { + "epoch": 0.29, + "learning_rate": 1.4234786998563162e-07, + "loss": 0.0021, + "step": 14896 + }, + { + "epoch": 0.29, + "learning_rate": 1.4234398664129547e-07, + "loss": 0.0012, + "step": 14897 + }, + { + "epoch": 0.29, + "learning_rate": 1.4234010329695934e-07, + "loss": 0.0015, + "step": 14898 + }, + { + "epoch": 0.29, + "learning_rate": 1.4233621995262319e-07, + "loss": 0.0011, + "step": 14899 + }, + { + "epoch": 0.29, + "learning_rate": 1.4233233660828706e-07, + "loss": 0.001, + "step": 14900 + }, + { + "epoch": 0.29, + "learning_rate": 1.423284532639509e-07, + "loss": 0.1514, + "step": 14901 + }, + { + "epoch": 0.29, + "learning_rate": 1.4232456991961477e-07, + "loss": 0.0013, + "step": 14902 + }, + { + "epoch": 0.29, + "learning_rate": 1.4232068657527862e-07, + "loss": 0.0022, + "step": 14903 + }, + { + "epoch": 0.29, + "learning_rate": 1.423168032309425e-07, + "loss": 0.0017, + "step": 14904 + }, + { + "epoch": 0.29, + "learning_rate": 1.4231291988660634e-07, + "loss": 0.0015, + "step": 14905 + }, + { + "epoch": 0.29, + "learning_rate": 1.423090365422702e-07, + "loss": 0.001, + "step": 14906 + }, + { + "epoch": 0.29, + "learning_rate": 1.4230515319793405e-07, + "loss": 0.0012, + "step": 14907 + }, + { + "epoch": 0.29, + "learning_rate": 1.4230126985359792e-07, + "loss": 0.0013, + "step": 14908 + }, + { + "epoch": 0.29, + "learning_rate": 1.4229738650926177e-07, + "loss": 0.0013, + "step": 14909 + }, + { + "epoch": 0.29, + "learning_rate": 1.4229350316492564e-07, + "loss": 0.0011, + "step": 14910 + }, + { + "epoch": 0.29, + "learning_rate": 1.4228961982058949e-07, + "loss": 0.0009, + "step": 14911 + }, + { + "epoch": 0.29, + "learning_rate": 1.4228573647625336e-07, + "loss": 0.0012, + "step": 14912 + }, + { + "epoch": 0.29, + "learning_rate": 1.422818531319172e-07, + "loss": 0.0017, + "step": 14913 + }, + { + "epoch": 0.29, + "learning_rate": 1.4227796978758107e-07, + "loss": 0.0296, + "step": 14914 + }, + { + "epoch": 0.29, + "learning_rate": 1.4227408644324492e-07, + "loss": 0.0036, + "step": 14915 + }, + { + "epoch": 0.29, + "learning_rate": 1.422702030989088e-07, + "loss": 0.2988, + "step": 14916 + }, + { + "epoch": 0.29, + "learning_rate": 1.4226631975457263e-07, + "loss": 0.0039, + "step": 14917 + }, + { + "epoch": 0.29, + "learning_rate": 1.422624364102365e-07, + "loss": 0.0013, + "step": 14918 + }, + { + "epoch": 0.29, + "learning_rate": 1.4225855306590035e-07, + "loss": 0.0013, + "step": 14919 + }, + { + "epoch": 0.29, + "learning_rate": 1.4225466972156422e-07, + "loss": 0.7201, + "step": 14920 + }, + { + "epoch": 0.29, + "learning_rate": 1.4225078637722807e-07, + "loss": 0.001, + "step": 14921 + }, + { + "epoch": 0.29, + "learning_rate": 1.4224690303289194e-07, + "loss": 0.0055, + "step": 14922 + }, + { + "epoch": 0.29, + "learning_rate": 1.4224301968855578e-07, + "loss": 0.0013, + "step": 14923 + }, + { + "epoch": 0.29, + "learning_rate": 1.4223913634421966e-07, + "loss": 0.0014, + "step": 14924 + }, + { + "epoch": 0.29, + "learning_rate": 1.422352529998835e-07, + "loss": 0.0012, + "step": 14925 + }, + { + "epoch": 0.29, + "learning_rate": 1.4223136965554737e-07, + "loss": 0.0026, + "step": 14926 + }, + { + "epoch": 0.29, + "learning_rate": 1.422274863112112e-07, + "loss": 0.0028, + "step": 14927 + }, + { + "epoch": 0.29, + "learning_rate": 1.4222360296687506e-07, + "loss": 0.0703, + "step": 14928 + }, + { + "epoch": 0.29, + "learning_rate": 1.422197196225389e-07, + "loss": 0.0031, + "step": 14929 + }, + { + "epoch": 0.29, + "learning_rate": 1.4221583627820278e-07, + "loss": 0.0012, + "step": 14930 + }, + { + "epoch": 0.29, + "learning_rate": 1.4221195293386662e-07, + "loss": 0.0011, + "step": 14931 + }, + { + "epoch": 0.29, + "learning_rate": 1.422080695895305e-07, + "loss": 1.509, + "step": 14932 + }, + { + "epoch": 0.29, + "learning_rate": 1.4220418624519434e-07, + "loss": 0.0018, + "step": 14933 + }, + { + "epoch": 0.29, + "learning_rate": 1.422003029008582e-07, + "loss": 0.0015, + "step": 14934 + }, + { + "epoch": 0.29, + "learning_rate": 1.4219641955652206e-07, + "loss": 0.2523, + "step": 14935 + }, + { + "epoch": 0.29, + "learning_rate": 1.4219253621218593e-07, + "loss": 0.0015, + "step": 14936 + }, + { + "epoch": 0.29, + "learning_rate": 1.4218865286784977e-07, + "loss": 0.0025, + "step": 14937 + }, + { + "epoch": 0.29, + "learning_rate": 1.4218476952351364e-07, + "loss": 0.0013, + "step": 14938 + }, + { + "epoch": 0.29, + "learning_rate": 1.421808861791775e-07, + "loss": 0.0012, + "step": 14939 + }, + { + "epoch": 0.29, + "learning_rate": 1.4217700283484136e-07, + "loss": 0.0012, + "step": 14940 + }, + { + "epoch": 0.29, + "learning_rate": 1.421731194905052e-07, + "loss": 0.0015, + "step": 14941 + }, + { + "epoch": 0.29, + "learning_rate": 1.4216923614616908e-07, + "loss": 0.584, + "step": 14942 + }, + { + "epoch": 0.29, + "learning_rate": 1.4216535280183292e-07, + "loss": 0.0017, + "step": 14943 + }, + { + "epoch": 0.29, + "learning_rate": 1.421614694574968e-07, + "loss": 0.0027, + "step": 14944 + }, + { + "epoch": 0.29, + "learning_rate": 1.4215758611316064e-07, + "loss": 0.434, + "step": 14945 + }, + { + "epoch": 0.29, + "learning_rate": 1.421537027688245e-07, + "loss": 0.0018, + "step": 14946 + }, + { + "epoch": 0.29, + "learning_rate": 1.4214981942448836e-07, + "loss": 0.002, + "step": 14947 + }, + { + "epoch": 0.29, + "learning_rate": 1.4214593608015223e-07, + "loss": 0.0011, + "step": 14948 + }, + { + "epoch": 0.29, + "learning_rate": 1.4214205273581607e-07, + "loss": 0.2688, + "step": 14949 + }, + { + "epoch": 0.29, + "learning_rate": 1.4213816939147994e-07, + "loss": 0.0395, + "step": 14950 + }, + { + "epoch": 0.29, + "learning_rate": 1.421342860471438e-07, + "loss": 0.0522, + "step": 14951 + }, + { + "epoch": 0.29, + "learning_rate": 1.4213040270280766e-07, + "loss": 0.0171, + "step": 14952 + }, + { + "epoch": 0.29, + "learning_rate": 1.421265193584715e-07, + "loss": 0.0021, + "step": 14953 + }, + { + "epoch": 0.29, + "learning_rate": 1.4212263601413538e-07, + "loss": 0.0013, + "step": 14954 + }, + { + "epoch": 0.29, + "learning_rate": 1.4211875266979922e-07, + "loss": 0.0702, + "step": 14955 + }, + { + "epoch": 0.29, + "learning_rate": 1.421148693254631e-07, + "loss": 0.0051, + "step": 14956 + }, + { + "epoch": 0.29, + "learning_rate": 1.4211098598112694e-07, + "loss": 0.1264, + "step": 14957 + }, + { + "epoch": 0.29, + "learning_rate": 1.421071026367908e-07, + "loss": 0.0013, + "step": 14958 + }, + { + "epoch": 0.29, + "learning_rate": 1.4210321929245465e-07, + "loss": 0.0023, + "step": 14959 + }, + { + "epoch": 0.29, + "learning_rate": 1.4209933594811853e-07, + "loss": 0.0019, + "step": 14960 + }, + { + "epoch": 0.29, + "learning_rate": 1.4209545260378237e-07, + "loss": 0.0013, + "step": 14961 + }, + { + "epoch": 0.29, + "learning_rate": 1.4209156925944624e-07, + "loss": 0.001, + "step": 14962 + }, + { + "epoch": 0.29, + "learning_rate": 1.420876859151101e-07, + "loss": 0.002, + "step": 14963 + }, + { + "epoch": 0.29, + "learning_rate": 1.4208380257077396e-07, + "loss": 0.0016, + "step": 14964 + }, + { + "epoch": 0.29, + "learning_rate": 1.420799192264378e-07, + "loss": 0.1571, + "step": 14965 + }, + { + "epoch": 0.29, + "learning_rate": 1.4207603588210168e-07, + "loss": 0.0012, + "step": 14966 + }, + { + "epoch": 0.29, + "learning_rate": 1.4207215253776552e-07, + "loss": 0.1722, + "step": 14967 + }, + { + "epoch": 0.29, + "learning_rate": 1.420682691934294e-07, + "loss": 0.0012, + "step": 14968 + }, + { + "epoch": 0.29, + "learning_rate": 1.4206438584909324e-07, + "loss": 0.0021, + "step": 14969 + }, + { + "epoch": 0.29, + "learning_rate": 1.420605025047571e-07, + "loss": 0.0012, + "step": 14970 + }, + { + "epoch": 0.29, + "learning_rate": 1.4205661916042095e-07, + "loss": 0.0014, + "step": 14971 + }, + { + "epoch": 0.29, + "learning_rate": 1.4205273581608482e-07, + "loss": 0.3407, + "step": 14972 + }, + { + "epoch": 0.29, + "learning_rate": 1.4204885247174867e-07, + "loss": 0.0015, + "step": 14973 + }, + { + "epoch": 0.29, + "learning_rate": 1.4204496912741254e-07, + "loss": 0.0012, + "step": 14974 + }, + { + "epoch": 0.29, + "learning_rate": 1.4204108578307639e-07, + "loss": 0.7601, + "step": 14975 + }, + { + "epoch": 0.29, + "learning_rate": 1.4203720243874023e-07, + "loss": 0.0013, + "step": 14976 + }, + { + "epoch": 0.29, + "learning_rate": 1.420333190944041e-07, + "loss": 0.0017, + "step": 14977 + }, + { + "epoch": 0.29, + "learning_rate": 1.4202943575006795e-07, + "loss": 0.0013, + "step": 14978 + }, + { + "epoch": 0.29, + "learning_rate": 1.4202555240573182e-07, + "loss": 0.001, + "step": 14979 + }, + { + "epoch": 0.29, + "learning_rate": 1.4202166906139566e-07, + "loss": 0.0016, + "step": 14980 + }, + { + "epoch": 0.29, + "learning_rate": 1.4201778571705954e-07, + "loss": 0.1362, + "step": 14981 + }, + { + "epoch": 0.29, + "learning_rate": 1.4201390237272338e-07, + "loss": 0.0197, + "step": 14982 + }, + { + "epoch": 0.29, + "learning_rate": 1.4201001902838725e-07, + "loss": 0.4542, + "step": 14983 + }, + { + "epoch": 0.29, + "learning_rate": 1.420061356840511e-07, + "loss": 0.0267, + "step": 14984 + }, + { + "epoch": 0.29, + "learning_rate": 1.4200225233971494e-07, + "loss": 0.0016, + "step": 14985 + }, + { + "epoch": 0.29, + "learning_rate": 1.4199836899537881e-07, + "loss": 0.0011, + "step": 14986 + }, + { + "epoch": 0.29, + "learning_rate": 1.4199448565104266e-07, + "loss": 0.001, + "step": 14987 + }, + { + "epoch": 0.29, + "learning_rate": 1.4199060230670653e-07, + "loss": 0.0032, + "step": 14988 + }, + { + "epoch": 0.29, + "learning_rate": 1.4198671896237038e-07, + "loss": 0.0013, + "step": 14989 + }, + { + "epoch": 0.29, + "learning_rate": 1.4198283561803425e-07, + "loss": 0.0011, + "step": 14990 + }, + { + "epoch": 0.29, + "learning_rate": 1.419789522736981e-07, + "loss": 0.0014, + "step": 14991 + }, + { + "epoch": 0.29, + "learning_rate": 1.4197506892936196e-07, + "loss": 0.0012, + "step": 14992 + }, + { + "epoch": 0.29, + "learning_rate": 1.419711855850258e-07, + "loss": 0.001, + "step": 14993 + }, + { + "epoch": 0.29, + "learning_rate": 1.4196730224068968e-07, + "loss": 0.0022, + "step": 14994 + }, + { + "epoch": 0.29, + "learning_rate": 1.4196341889635352e-07, + "loss": 0.0065, + "step": 14995 + }, + { + "epoch": 0.29, + "learning_rate": 1.419595355520174e-07, + "loss": 0.0023, + "step": 14996 + }, + { + "epoch": 0.29, + "learning_rate": 1.4195565220768124e-07, + "loss": 0.0021, + "step": 14997 + }, + { + "epoch": 0.29, + "learning_rate": 1.419517688633451e-07, + "loss": 0.0012, + "step": 14998 + }, + { + "epoch": 0.29, + "learning_rate": 1.4194788551900896e-07, + "loss": 0.0409, + "step": 14999 + }, + { + "epoch": 0.29, + "learning_rate": 1.4194400217467283e-07, + "loss": 0.0012, + "step": 15000 + }, + { + "epoch": 0.29, + "learning_rate": 1.4194011883033667e-07, + "loss": 0.0017, + "step": 15001 + }, + { + "epoch": 0.29, + "learning_rate": 1.4193623548600055e-07, + "loss": 0.0041, + "step": 15002 + }, + { + "epoch": 0.29, + "learning_rate": 1.419323521416644e-07, + "loss": 0.0011, + "step": 15003 + }, + { + "epoch": 0.29, + "learning_rate": 1.4192846879732826e-07, + "loss": 0.0104, + "step": 15004 + }, + { + "epoch": 0.29, + "learning_rate": 1.419245854529921e-07, + "loss": 0.0018, + "step": 15005 + }, + { + "epoch": 0.29, + "learning_rate": 1.4192070210865595e-07, + "loss": 0.0089, + "step": 15006 + }, + { + "epoch": 0.29, + "learning_rate": 1.4191681876431982e-07, + "loss": 0.0035, + "step": 15007 + }, + { + "epoch": 0.29, + "learning_rate": 1.4191293541998367e-07, + "loss": 0.0011, + "step": 15008 + }, + { + "epoch": 0.29, + "learning_rate": 1.4190905207564754e-07, + "loss": 0.0011, + "step": 15009 + }, + { + "epoch": 0.29, + "learning_rate": 1.4190516873131139e-07, + "loss": 0.0034, + "step": 15010 + }, + { + "epoch": 0.29, + "learning_rate": 1.4190128538697526e-07, + "loss": 0.0015, + "step": 15011 + }, + { + "epoch": 0.29, + "learning_rate": 1.418974020426391e-07, + "loss": 0.0012, + "step": 15012 + }, + { + "epoch": 0.29, + "learning_rate": 1.4189351869830297e-07, + "loss": 0.0012, + "step": 15013 + }, + { + "epoch": 0.29, + "learning_rate": 1.4188963535396682e-07, + "loss": 0.0144, + "step": 15014 + }, + { + "epoch": 0.29, + "learning_rate": 1.418857520096307e-07, + "loss": 0.001, + "step": 15015 + }, + { + "epoch": 0.29, + "learning_rate": 1.4188186866529453e-07, + "loss": 0.1248, + "step": 15016 + }, + { + "epoch": 0.29, + "learning_rate": 1.418779853209584e-07, + "loss": 0.0014, + "step": 15017 + }, + { + "epoch": 0.29, + "learning_rate": 1.4187410197662225e-07, + "loss": 0.0016, + "step": 15018 + }, + { + "epoch": 0.29, + "learning_rate": 1.4187021863228612e-07, + "loss": 0.001, + "step": 15019 + }, + { + "epoch": 0.29, + "learning_rate": 1.4186633528794997e-07, + "loss": 0.0015, + "step": 15020 + }, + { + "epoch": 0.29, + "learning_rate": 1.4186245194361384e-07, + "loss": 0.0011, + "step": 15021 + }, + { + "epoch": 0.29, + "learning_rate": 1.4185856859927768e-07, + "loss": 0.0013, + "step": 15022 + }, + { + "epoch": 0.29, + "learning_rate": 1.4185468525494156e-07, + "loss": 0.0011, + "step": 15023 + }, + { + "epoch": 0.29, + "learning_rate": 1.418508019106054e-07, + "loss": 0.0011, + "step": 15024 + }, + { + "epoch": 0.29, + "learning_rate": 1.4184691856626927e-07, + "loss": 0.7344, + "step": 15025 + }, + { + "epoch": 0.29, + "learning_rate": 1.4184303522193312e-07, + "loss": 0.0725, + "step": 15026 + }, + { + "epoch": 0.29, + "learning_rate": 1.41839151877597e-07, + "loss": 0.0381, + "step": 15027 + }, + { + "epoch": 0.29, + "learning_rate": 1.4183526853326083e-07, + "loss": 0.0011, + "step": 15028 + }, + { + "epoch": 0.29, + "learning_rate": 1.418313851889247e-07, + "loss": 0.0019, + "step": 15029 + }, + { + "epoch": 0.29, + "learning_rate": 1.4182750184458855e-07, + "loss": 0.0015, + "step": 15030 + }, + { + "epoch": 0.29, + "learning_rate": 1.4182361850025242e-07, + "loss": 0.0024, + "step": 15031 + }, + { + "epoch": 0.29, + "learning_rate": 1.4181973515591627e-07, + "loss": 0.6789, + "step": 15032 + }, + { + "epoch": 0.29, + "learning_rate": 1.4181585181158014e-07, + "loss": 0.0019, + "step": 15033 + }, + { + "epoch": 0.29, + "learning_rate": 1.4181196846724398e-07, + "loss": 0.0012, + "step": 15034 + }, + { + "epoch": 0.29, + "learning_rate": 1.4180808512290785e-07, + "loss": 0.6806, + "step": 15035 + }, + { + "epoch": 0.29, + "learning_rate": 1.418042017785717e-07, + "loss": 0.001, + "step": 15036 + }, + { + "epoch": 0.29, + "learning_rate": 1.4180031843423557e-07, + "loss": 0.002, + "step": 15037 + }, + { + "epoch": 0.29, + "learning_rate": 1.4179643508989942e-07, + "loss": 0.4749, + "step": 15038 + }, + { + "epoch": 0.29, + "learning_rate": 1.417925517455633e-07, + "loss": 0.001, + "step": 15039 + }, + { + "epoch": 0.29, + "learning_rate": 1.4178866840122713e-07, + "loss": 0.0014, + "step": 15040 + }, + { + "epoch": 0.29, + "learning_rate": 1.41784785056891e-07, + "loss": 0.0014, + "step": 15041 + }, + { + "epoch": 0.29, + "learning_rate": 1.4178090171255485e-07, + "loss": 1.3307, + "step": 15042 + }, + { + "epoch": 0.29, + "learning_rate": 1.417770183682187e-07, + "loss": 0.0015, + "step": 15043 + }, + { + "epoch": 0.29, + "learning_rate": 1.4177313502388254e-07, + "loss": 0.0015, + "step": 15044 + }, + { + "epoch": 0.29, + "learning_rate": 1.417692516795464e-07, + "loss": 0.0017, + "step": 15045 + }, + { + "epoch": 0.29, + "learning_rate": 1.4176536833521026e-07, + "loss": 0.002, + "step": 15046 + }, + { + "epoch": 0.29, + "learning_rate": 1.4176148499087413e-07, + "loss": 0.0013, + "step": 15047 + }, + { + "epoch": 0.29, + "learning_rate": 1.4175760164653797e-07, + "loss": 0.0017, + "step": 15048 + }, + { + "epoch": 0.29, + "learning_rate": 1.4175371830220184e-07, + "loss": 0.0018, + "step": 15049 + }, + { + "epoch": 0.29, + "learning_rate": 1.417498349578657e-07, + "loss": 0.0137, + "step": 15050 + }, + { + "epoch": 0.29, + "learning_rate": 1.4174595161352956e-07, + "loss": 0.0021, + "step": 15051 + }, + { + "epoch": 0.29, + "learning_rate": 1.417420682691934e-07, + "loss": 0.0011, + "step": 15052 + }, + { + "epoch": 0.29, + "learning_rate": 1.4173818492485728e-07, + "loss": 0.0012, + "step": 15053 + }, + { + "epoch": 0.29, + "learning_rate": 1.4173430158052112e-07, + "loss": 0.0056, + "step": 15054 + }, + { + "epoch": 0.29, + "learning_rate": 1.41730418236185e-07, + "loss": 0.0014, + "step": 15055 + }, + { + "epoch": 0.29, + "learning_rate": 1.4172653489184884e-07, + "loss": 0.0012, + "step": 15056 + }, + { + "epoch": 0.29, + "learning_rate": 1.417226515475127e-07, + "loss": 0.0013, + "step": 15057 + }, + { + "epoch": 0.29, + "learning_rate": 1.4171876820317655e-07, + "loss": 0.0009, + "step": 15058 + }, + { + "epoch": 0.29, + "learning_rate": 1.4171488485884043e-07, + "loss": 0.0009, + "step": 15059 + }, + { + "epoch": 0.29, + "learning_rate": 1.4171100151450427e-07, + "loss": 0.0015, + "step": 15060 + }, + { + "epoch": 0.29, + "learning_rate": 1.4170711817016814e-07, + "loss": 0.0014, + "step": 15061 + }, + { + "epoch": 0.29, + "learning_rate": 1.41703234825832e-07, + "loss": 0.0012, + "step": 15062 + }, + { + "epoch": 0.29, + "learning_rate": 1.4169935148149586e-07, + "loss": 0.0021, + "step": 15063 + }, + { + "epoch": 0.29, + "learning_rate": 1.416954681371597e-07, + "loss": 0.0013, + "step": 15064 + }, + { + "epoch": 0.29, + "learning_rate": 1.4169158479282358e-07, + "loss": 0.0015, + "step": 15065 + }, + { + "epoch": 0.29, + "learning_rate": 1.4168770144848742e-07, + "loss": 0.0568, + "step": 15066 + }, + { + "epoch": 0.29, + "learning_rate": 1.416838181041513e-07, + "loss": 0.7958, + "step": 15067 + }, + { + "epoch": 0.29, + "learning_rate": 1.4167993475981514e-07, + "loss": 0.0011, + "step": 15068 + }, + { + "epoch": 0.29, + "learning_rate": 1.41676051415479e-07, + "loss": 0.0018, + "step": 15069 + }, + { + "epoch": 0.29, + "learning_rate": 1.4167216807114285e-07, + "loss": 0.0013, + "step": 15070 + }, + { + "epoch": 0.29, + "learning_rate": 1.4166828472680672e-07, + "loss": 0.0013, + "step": 15071 + }, + { + "epoch": 0.29, + "learning_rate": 1.4166440138247057e-07, + "loss": 0.0012, + "step": 15072 + }, + { + "epoch": 0.29, + "learning_rate": 1.4166051803813444e-07, + "loss": 0.0151, + "step": 15073 + }, + { + "epoch": 0.29, + "learning_rate": 1.4165663469379829e-07, + "loss": 0.0013, + "step": 15074 + }, + { + "epoch": 0.29, + "learning_rate": 1.4165275134946216e-07, + "loss": 0.001, + "step": 15075 + }, + { + "epoch": 0.29, + "learning_rate": 1.41648868005126e-07, + "loss": 0.0064, + "step": 15076 + }, + { + "epoch": 0.29, + "learning_rate": 1.4164498466078987e-07, + "loss": 0.7304, + "step": 15077 + }, + { + "epoch": 0.29, + "learning_rate": 1.4164110131645372e-07, + "loss": 0.0013, + "step": 15078 + }, + { + "epoch": 0.29, + "learning_rate": 1.416372179721176e-07, + "loss": 0.0016, + "step": 15079 + }, + { + "epoch": 0.29, + "learning_rate": 1.4163333462778144e-07, + "loss": 0.0123, + "step": 15080 + }, + { + "epoch": 0.29, + "learning_rate": 1.416294512834453e-07, + "loss": 0.0009, + "step": 15081 + }, + { + "epoch": 0.29, + "learning_rate": 1.4162556793910915e-07, + "loss": 0.1462, + "step": 15082 + }, + { + "epoch": 0.29, + "learning_rate": 1.4162168459477302e-07, + "loss": 0.0016, + "step": 15083 + }, + { + "epoch": 0.29, + "learning_rate": 1.4161780125043687e-07, + "loss": 0.0011, + "step": 15084 + }, + { + "epoch": 0.29, + "learning_rate": 1.4161391790610074e-07, + "loss": 0.0012, + "step": 15085 + }, + { + "epoch": 0.29, + "learning_rate": 1.4161003456176459e-07, + "loss": 0.0014, + "step": 15086 + }, + { + "epoch": 0.29, + "learning_rate": 1.4160615121742846e-07, + "loss": 0.0026, + "step": 15087 + }, + { + "epoch": 0.29, + "learning_rate": 1.416022678730923e-07, + "loss": 0.0013, + "step": 15088 + }, + { + "epoch": 0.29, + "learning_rate": 1.4159838452875617e-07, + "loss": 0.2796, + "step": 15089 + }, + { + "epoch": 0.29, + "learning_rate": 1.4159450118442002e-07, + "loss": 0.0013, + "step": 15090 + }, + { + "epoch": 0.29, + "learning_rate": 1.415906178400839e-07, + "loss": 0.0041, + "step": 15091 + }, + { + "epoch": 0.29, + "learning_rate": 1.4158673449574773e-07, + "loss": 0.001, + "step": 15092 + }, + { + "epoch": 0.29, + "learning_rate": 1.415828511514116e-07, + "loss": 0.0017, + "step": 15093 + }, + { + "epoch": 0.29, + "learning_rate": 1.4157896780707545e-07, + "loss": 0.0017, + "step": 15094 + }, + { + "epoch": 0.29, + "learning_rate": 1.4157508446273932e-07, + "loss": 0.3643, + "step": 15095 + }, + { + "epoch": 0.29, + "learning_rate": 1.4157120111840317e-07, + "loss": 0.0013, + "step": 15096 + }, + { + "epoch": 0.29, + "learning_rate": 1.4156731777406704e-07, + "loss": 0.0011, + "step": 15097 + }, + { + "epoch": 0.29, + "learning_rate": 1.4156343442973088e-07, + "loss": 0.0171, + "step": 15098 + }, + { + "epoch": 0.29, + "learning_rate": 1.4155955108539476e-07, + "loss": 0.6375, + "step": 15099 + }, + { + "epoch": 0.29, + "learning_rate": 1.415556677410586e-07, + "loss": 0.0015, + "step": 15100 + }, + { + "epoch": 0.29, + "learning_rate": 1.4155178439672245e-07, + "loss": 0.0018, + "step": 15101 + }, + { + "epoch": 0.29, + "learning_rate": 1.415479010523863e-07, + "loss": 0.0014, + "step": 15102 + }, + { + "epoch": 0.29, + "learning_rate": 1.4154401770805016e-07, + "loss": 0.0015, + "step": 15103 + }, + { + "epoch": 0.29, + "learning_rate": 1.41540134363714e-07, + "loss": 0.4917, + "step": 15104 + }, + { + "epoch": 0.29, + "learning_rate": 1.4153625101937788e-07, + "loss": 0.0011, + "step": 15105 + }, + { + "epoch": 0.29, + "learning_rate": 1.4153236767504172e-07, + "loss": 0.0394, + "step": 15106 + }, + { + "epoch": 0.29, + "learning_rate": 1.415284843307056e-07, + "loss": 0.0012, + "step": 15107 + }, + { + "epoch": 0.29, + "learning_rate": 1.4152460098636944e-07, + "loss": 0.0085, + "step": 15108 + }, + { + "epoch": 0.29, + "learning_rate": 1.415207176420333e-07, + "loss": 0.0013, + "step": 15109 + }, + { + "epoch": 0.29, + "learning_rate": 1.4151683429769716e-07, + "loss": 0.0179, + "step": 15110 + }, + { + "epoch": 0.29, + "learning_rate": 1.4151295095336103e-07, + "loss": 0.001, + "step": 15111 + }, + { + "epoch": 0.29, + "learning_rate": 1.4150906760902487e-07, + "loss": 0.1205, + "step": 15112 + }, + { + "epoch": 0.29, + "learning_rate": 1.4150518426468874e-07, + "loss": 0.0013, + "step": 15113 + }, + { + "epoch": 0.29, + "learning_rate": 1.415013009203526e-07, + "loss": 0.001, + "step": 15114 + }, + { + "epoch": 0.29, + "learning_rate": 1.4149741757601646e-07, + "loss": 0.0029, + "step": 15115 + }, + { + "epoch": 0.29, + "learning_rate": 1.414935342316803e-07, + "loss": 0.0015, + "step": 15116 + }, + { + "epoch": 0.29, + "learning_rate": 1.4148965088734418e-07, + "loss": 0.001, + "step": 15117 + }, + { + "epoch": 0.29, + "learning_rate": 1.4148576754300802e-07, + "loss": 0.0016, + "step": 15118 + }, + { + "epoch": 0.29, + "learning_rate": 1.414818841986719e-07, + "loss": 0.0016, + "step": 15119 + }, + { + "epoch": 0.29, + "learning_rate": 1.4147800085433574e-07, + "loss": 0.0158, + "step": 15120 + }, + { + "epoch": 0.29, + "learning_rate": 1.414741175099996e-07, + "loss": 0.0014, + "step": 15121 + }, + { + "epoch": 0.29, + "learning_rate": 1.4147023416566346e-07, + "loss": 0.0014, + "step": 15122 + }, + { + "epoch": 0.29, + "learning_rate": 1.4146635082132733e-07, + "loss": 0.0009, + "step": 15123 + }, + { + "epoch": 0.29, + "learning_rate": 1.4146246747699117e-07, + "loss": 0.0026, + "step": 15124 + }, + { + "epoch": 0.29, + "learning_rate": 1.4145858413265504e-07, + "loss": 0.0008, + "step": 15125 + }, + { + "epoch": 0.29, + "learning_rate": 1.414547007883189e-07, + "loss": 0.0061, + "step": 15126 + }, + { + "epoch": 0.29, + "learning_rate": 1.4145081744398276e-07, + "loss": 0.0013, + "step": 15127 + }, + { + "epoch": 0.29, + "learning_rate": 1.414469340996466e-07, + "loss": 0.002, + "step": 15128 + }, + { + "epoch": 0.29, + "learning_rate": 1.4144305075531048e-07, + "loss": 0.0011, + "step": 15129 + }, + { + "epoch": 0.29, + "learning_rate": 1.4143916741097432e-07, + "loss": 0.0013, + "step": 15130 + }, + { + "epoch": 0.29, + "learning_rate": 1.414352840666382e-07, + "loss": 0.0012, + "step": 15131 + }, + { + "epoch": 0.29, + "learning_rate": 1.4143140072230204e-07, + "loss": 0.0015, + "step": 15132 + }, + { + "epoch": 0.29, + "learning_rate": 1.414275173779659e-07, + "loss": 0.0017, + "step": 15133 + }, + { + "epoch": 0.29, + "learning_rate": 1.4142363403362975e-07, + "loss": 0.0113, + "step": 15134 + }, + { + "epoch": 0.29, + "learning_rate": 1.4141975068929363e-07, + "loss": 0.001, + "step": 15135 + }, + { + "epoch": 0.29, + "learning_rate": 1.4141586734495747e-07, + "loss": 0.0012, + "step": 15136 + }, + { + "epoch": 0.29, + "learning_rate": 1.4141198400062134e-07, + "loss": 0.0012, + "step": 15137 + }, + { + "epoch": 0.29, + "learning_rate": 1.414081006562852e-07, + "loss": 0.0011, + "step": 15138 + }, + { + "epoch": 0.29, + "learning_rate": 1.4140421731194906e-07, + "loss": 0.123, + "step": 15139 + }, + { + "epoch": 0.29, + "learning_rate": 1.414003339676129e-07, + "loss": 0.0014, + "step": 15140 + }, + { + "epoch": 0.29, + "learning_rate": 1.4139645062327678e-07, + "loss": 0.0011, + "step": 15141 + }, + { + "epoch": 0.29, + "learning_rate": 1.4139256727894062e-07, + "loss": 0.4222, + "step": 15142 + }, + { + "epoch": 0.29, + "learning_rate": 1.413886839346045e-07, + "loss": 0.0418, + "step": 15143 + }, + { + "epoch": 0.29, + "learning_rate": 1.4138480059026834e-07, + "loss": 0.0012, + "step": 15144 + }, + { + "epoch": 0.29, + "learning_rate": 1.413809172459322e-07, + "loss": 0.0017, + "step": 15145 + }, + { + "epoch": 0.29, + "learning_rate": 1.4137703390159605e-07, + "loss": 0.0028, + "step": 15146 + }, + { + "epoch": 0.29, + "learning_rate": 1.4137315055725992e-07, + "loss": 0.0723, + "step": 15147 + }, + { + "epoch": 0.29, + "learning_rate": 1.4136926721292377e-07, + "loss": 0.0012, + "step": 15148 + }, + { + "epoch": 0.29, + "learning_rate": 1.4136538386858764e-07, + "loss": 0.0009, + "step": 15149 + }, + { + "epoch": 0.29, + "learning_rate": 1.4136150052425149e-07, + "loss": 0.4209, + "step": 15150 + }, + { + "epoch": 0.29, + "learning_rate": 1.4135761717991536e-07, + "loss": 0.2935, + "step": 15151 + }, + { + "epoch": 0.29, + "learning_rate": 1.413537338355792e-07, + "loss": 0.0018, + "step": 15152 + }, + { + "epoch": 0.29, + "learning_rate": 1.4134985049124305e-07, + "loss": 0.0017, + "step": 15153 + }, + { + "epoch": 0.29, + "learning_rate": 1.4134596714690692e-07, + "loss": 0.0817, + "step": 15154 + }, + { + "epoch": 0.29, + "learning_rate": 1.4134208380257076e-07, + "loss": 0.0012, + "step": 15155 + }, + { + "epoch": 0.29, + "learning_rate": 1.4133820045823464e-07, + "loss": 0.0045, + "step": 15156 + }, + { + "epoch": 0.29, + "learning_rate": 1.4133431711389848e-07, + "loss": 0.0094, + "step": 15157 + }, + { + "epoch": 0.29, + "learning_rate": 1.4133043376956235e-07, + "loss": 0.0012, + "step": 15158 + }, + { + "epoch": 0.29, + "learning_rate": 1.413265504252262e-07, + "loss": 0.0013, + "step": 15159 + }, + { + "epoch": 0.29, + "learning_rate": 1.4132266708089004e-07, + "loss": 0.0016, + "step": 15160 + }, + { + "epoch": 0.29, + "learning_rate": 1.4131878373655391e-07, + "loss": 0.0012, + "step": 15161 + }, + { + "epoch": 0.29, + "learning_rate": 1.4131490039221776e-07, + "loss": 0.0027, + "step": 15162 + }, + { + "epoch": 0.29, + "learning_rate": 1.4131101704788163e-07, + "loss": 0.0011, + "step": 15163 + }, + { + "epoch": 0.29, + "learning_rate": 1.4130713370354548e-07, + "loss": 0.3895, + "step": 15164 + }, + { + "epoch": 0.29, + "learning_rate": 1.4130325035920935e-07, + "loss": 0.0014, + "step": 15165 + }, + { + "epoch": 0.29, + "learning_rate": 1.412993670148732e-07, + "loss": 0.004, + "step": 15166 + }, + { + "epoch": 0.29, + "learning_rate": 1.4129548367053706e-07, + "loss": 0.001, + "step": 15167 + }, + { + "epoch": 0.29, + "learning_rate": 1.412916003262009e-07, + "loss": 0.0012, + "step": 15168 + }, + { + "epoch": 0.29, + "learning_rate": 1.4128771698186478e-07, + "loss": 0.001, + "step": 15169 + }, + { + "epoch": 0.29, + "learning_rate": 1.4128383363752862e-07, + "loss": 0.0014, + "step": 15170 + }, + { + "epoch": 0.29, + "learning_rate": 1.412799502931925e-07, + "loss": 0.0008, + "step": 15171 + }, + { + "epoch": 0.29, + "learning_rate": 1.4127606694885634e-07, + "loss": 0.0012, + "step": 15172 + }, + { + "epoch": 0.29, + "learning_rate": 1.412721836045202e-07, + "loss": 0.6907, + "step": 15173 + }, + { + "epoch": 0.29, + "learning_rate": 1.4126830026018406e-07, + "loss": 0.0011, + "step": 15174 + }, + { + "epoch": 0.29, + "learning_rate": 1.4126441691584793e-07, + "loss": 0.0018, + "step": 15175 + }, + { + "epoch": 0.29, + "learning_rate": 1.4126053357151177e-07, + "loss": 0.0013, + "step": 15176 + }, + { + "epoch": 0.29, + "learning_rate": 1.4125665022717565e-07, + "loss": 0.0011, + "step": 15177 + }, + { + "epoch": 0.29, + "learning_rate": 1.412527668828395e-07, + "loss": 0.001, + "step": 15178 + }, + { + "epoch": 0.29, + "learning_rate": 1.4124888353850336e-07, + "loss": 0.0027, + "step": 15179 + }, + { + "epoch": 0.29, + "learning_rate": 1.412450001941672e-07, + "loss": 0.002, + "step": 15180 + }, + { + "epoch": 0.29, + "learning_rate": 1.4124111684983108e-07, + "loss": 0.1304, + "step": 15181 + }, + { + "epoch": 0.29, + "learning_rate": 1.4123723350549492e-07, + "loss": 0.0324, + "step": 15182 + }, + { + "epoch": 0.29, + "learning_rate": 1.4123335016115877e-07, + "loss": 0.0013, + "step": 15183 + }, + { + "epoch": 0.29, + "learning_rate": 1.4122946681682264e-07, + "loss": 0.0017, + "step": 15184 + }, + { + "epoch": 0.29, + "learning_rate": 1.4122558347248649e-07, + "loss": 0.0015, + "step": 15185 + }, + { + "epoch": 0.29, + "learning_rate": 1.4122170012815036e-07, + "loss": 0.001, + "step": 15186 + }, + { + "epoch": 0.29, + "learning_rate": 1.412178167838142e-07, + "loss": 0.0014, + "step": 15187 + }, + { + "epoch": 0.29, + "learning_rate": 1.4121393343947807e-07, + "loss": 0.0031, + "step": 15188 + }, + { + "epoch": 0.29, + "learning_rate": 1.4121005009514192e-07, + "loss": 0.0716, + "step": 15189 + }, + { + "epoch": 0.29, + "learning_rate": 1.412061667508058e-07, + "loss": 0.0012, + "step": 15190 + }, + { + "epoch": 0.29, + "learning_rate": 1.4120228340646963e-07, + "loss": 0.002, + "step": 15191 + }, + { + "epoch": 0.29, + "learning_rate": 1.411984000621335e-07, + "loss": 0.0016, + "step": 15192 + }, + { + "epoch": 0.29, + "learning_rate": 1.4119451671779735e-07, + "loss": 0.0015, + "step": 15193 + }, + { + "epoch": 0.29, + "learning_rate": 1.4119063337346122e-07, + "loss": 0.0015, + "step": 15194 + }, + { + "epoch": 0.29, + "learning_rate": 1.4118675002912507e-07, + "loss": 0.0015, + "step": 15195 + }, + { + "epoch": 0.29, + "learning_rate": 1.4118286668478894e-07, + "loss": 0.0657, + "step": 15196 + }, + { + "epoch": 0.29, + "learning_rate": 1.4117898334045278e-07, + "loss": 0.017, + "step": 15197 + }, + { + "epoch": 0.29, + "learning_rate": 1.4117509999611666e-07, + "loss": 0.0011, + "step": 15198 + }, + { + "epoch": 0.29, + "learning_rate": 1.411712166517805e-07, + "loss": 0.0014, + "step": 15199 + }, + { + "epoch": 0.29, + "learning_rate": 1.4116733330744437e-07, + "loss": 0.0014, + "step": 15200 + }, + { + "epoch": 0.29, + "learning_rate": 1.4116344996310822e-07, + "loss": 0.001, + "step": 15201 + }, + { + "epoch": 0.29, + "learning_rate": 1.411595666187721e-07, + "loss": 0.0011, + "step": 15202 + }, + { + "epoch": 0.29, + "learning_rate": 1.4115568327443593e-07, + "loss": 0.2096, + "step": 15203 + }, + { + "epoch": 0.29, + "learning_rate": 1.411517999300998e-07, + "loss": 0.0013, + "step": 15204 + }, + { + "epoch": 0.29, + "learning_rate": 1.4114791658576365e-07, + "loss": 0.0025, + "step": 15205 + }, + { + "epoch": 0.29, + "learning_rate": 1.4114403324142752e-07, + "loss": 0.0008, + "step": 15206 + }, + { + "epoch": 0.29, + "learning_rate": 1.4114014989709137e-07, + "loss": 0.0017, + "step": 15207 + }, + { + "epoch": 0.3, + "learning_rate": 1.4113626655275524e-07, + "loss": 0.0031, + "step": 15208 + }, + { + "epoch": 0.3, + "learning_rate": 1.4113238320841908e-07, + "loss": 0.1905, + "step": 15209 + }, + { + "epoch": 0.3, + "learning_rate": 1.4112849986408295e-07, + "loss": 0.0013, + "step": 15210 + }, + { + "epoch": 0.3, + "learning_rate": 1.411246165197468e-07, + "loss": 0.0014, + "step": 15211 + }, + { + "epoch": 0.3, + "learning_rate": 1.4112073317541067e-07, + "loss": 0.001, + "step": 15212 + }, + { + "epoch": 0.3, + "learning_rate": 1.4111684983107452e-07, + "loss": 0.0015, + "step": 15213 + }, + { + "epoch": 0.3, + "learning_rate": 1.411129664867384e-07, + "loss": 0.0016, + "step": 15214 + }, + { + "epoch": 0.3, + "learning_rate": 1.4110908314240223e-07, + "loss": 0.0023, + "step": 15215 + }, + { + "epoch": 0.3, + "learning_rate": 1.411051997980661e-07, + "loss": 0.0011, + "step": 15216 + }, + { + "epoch": 0.3, + "learning_rate": 1.4110131645372992e-07, + "loss": 0.001, + "step": 15217 + }, + { + "epoch": 0.3, + "learning_rate": 1.410974331093938e-07, + "loss": 0.0012, + "step": 15218 + }, + { + "epoch": 0.3, + "learning_rate": 1.4109354976505764e-07, + "loss": 0.8246, + "step": 15219 + }, + { + "epoch": 0.3, + "learning_rate": 1.410896664207215e-07, + "loss": 0.3048, + "step": 15220 + }, + { + "epoch": 0.3, + "learning_rate": 1.4108578307638536e-07, + "loss": 0.0013, + "step": 15221 + }, + { + "epoch": 0.3, + "learning_rate": 1.4108189973204923e-07, + "loss": 0.0044, + "step": 15222 + }, + { + "epoch": 0.3, + "learning_rate": 1.4107801638771307e-07, + "loss": 0.0012, + "step": 15223 + }, + { + "epoch": 0.3, + "learning_rate": 1.4107413304337694e-07, + "loss": 0.0012, + "step": 15224 + }, + { + "epoch": 0.3, + "learning_rate": 1.410702496990408e-07, + "loss": 0.5046, + "step": 15225 + }, + { + "epoch": 0.3, + "learning_rate": 1.4106636635470466e-07, + "loss": 0.001, + "step": 15226 + }, + { + "epoch": 0.3, + "learning_rate": 1.410624830103685e-07, + "loss": 0.001, + "step": 15227 + }, + { + "epoch": 0.3, + "learning_rate": 1.4105859966603238e-07, + "loss": 0.001, + "step": 15228 + }, + { + "epoch": 0.3, + "learning_rate": 1.4105471632169622e-07, + "loss": 0.2654, + "step": 15229 + }, + { + "epoch": 0.3, + "learning_rate": 1.410508329773601e-07, + "loss": 0.3977, + "step": 15230 + }, + { + "epoch": 0.3, + "learning_rate": 1.4104694963302394e-07, + "loss": 0.7928, + "step": 15231 + }, + { + "epoch": 0.3, + "learning_rate": 1.410430662886878e-07, + "loss": 0.0011, + "step": 15232 + }, + { + "epoch": 0.3, + "learning_rate": 1.4103918294435165e-07, + "loss": 0.003, + "step": 15233 + }, + { + "epoch": 0.3, + "learning_rate": 1.4103529960001553e-07, + "loss": 0.001, + "step": 15234 + }, + { + "epoch": 0.3, + "learning_rate": 1.4103141625567937e-07, + "loss": 0.004, + "step": 15235 + }, + { + "epoch": 0.3, + "learning_rate": 1.4102753291134324e-07, + "loss": 0.0014, + "step": 15236 + }, + { + "epoch": 0.3, + "learning_rate": 1.410236495670071e-07, + "loss": 0.0012, + "step": 15237 + }, + { + "epoch": 0.3, + "learning_rate": 1.4101976622267096e-07, + "loss": 0.0015, + "step": 15238 + }, + { + "epoch": 0.3, + "learning_rate": 1.410158828783348e-07, + "loss": 0.1199, + "step": 15239 + }, + { + "epoch": 0.3, + "learning_rate": 1.4101199953399868e-07, + "loss": 0.0051, + "step": 15240 + }, + { + "epoch": 0.3, + "learning_rate": 1.4100811618966252e-07, + "loss": 0.0028, + "step": 15241 + }, + { + "epoch": 0.3, + "learning_rate": 1.410042328453264e-07, + "loss": 0.0012, + "step": 15242 + }, + { + "epoch": 0.3, + "learning_rate": 1.4100034950099024e-07, + "loss": 0.0017, + "step": 15243 + }, + { + "epoch": 0.3, + "learning_rate": 1.409964661566541e-07, + "loss": 0.0027, + "step": 15244 + }, + { + "epoch": 0.3, + "learning_rate": 1.4099258281231795e-07, + "loss": 0.0015, + "step": 15245 + }, + { + "epoch": 0.3, + "learning_rate": 1.4098869946798182e-07, + "loss": 0.0013, + "step": 15246 + }, + { + "epoch": 0.3, + "learning_rate": 1.4098481612364567e-07, + "loss": 0.8749, + "step": 15247 + }, + { + "epoch": 0.3, + "learning_rate": 1.4098093277930954e-07, + "loss": 0.0012, + "step": 15248 + }, + { + "epoch": 0.3, + "learning_rate": 1.4097704943497339e-07, + "loss": 0.0009, + "step": 15249 + }, + { + "epoch": 0.3, + "learning_rate": 1.4097316609063726e-07, + "loss": 1.0812, + "step": 15250 + }, + { + "epoch": 0.3, + "learning_rate": 1.409692827463011e-07, + "loss": 0.0011, + "step": 15251 + }, + { + "epoch": 0.3, + "learning_rate": 1.4096539940196497e-07, + "loss": 0.0009, + "step": 15252 + }, + { + "epoch": 0.3, + "learning_rate": 1.4096151605762882e-07, + "loss": 0.0014, + "step": 15253 + }, + { + "epoch": 0.3, + "learning_rate": 1.409576327132927e-07, + "loss": 0.0011, + "step": 15254 + }, + { + "epoch": 0.3, + "learning_rate": 1.4095374936895654e-07, + "loss": 0.0087, + "step": 15255 + }, + { + "epoch": 0.3, + "learning_rate": 1.409498660246204e-07, + "loss": 0.487, + "step": 15256 + }, + { + "epoch": 0.3, + "learning_rate": 1.4094598268028425e-07, + "loss": 0.0021, + "step": 15257 + }, + { + "epoch": 0.3, + "learning_rate": 1.4094209933594812e-07, + "loss": 0.0195, + "step": 15258 + }, + { + "epoch": 0.3, + "learning_rate": 1.4093821599161197e-07, + "loss": 0.0012, + "step": 15259 + }, + { + "epoch": 0.3, + "learning_rate": 1.4093433264727584e-07, + "loss": 0.3359, + "step": 15260 + }, + { + "epoch": 0.3, + "learning_rate": 1.4093044930293969e-07, + "loss": 0.0112, + "step": 15261 + }, + { + "epoch": 0.3, + "learning_rate": 1.4092656595860356e-07, + "loss": 0.0017, + "step": 15262 + }, + { + "epoch": 0.3, + "learning_rate": 1.409226826142674e-07, + "loss": 1.3325, + "step": 15263 + }, + { + "epoch": 0.3, + "learning_rate": 1.4091879926993127e-07, + "loss": 0.1431, + "step": 15264 + }, + { + "epoch": 0.3, + "learning_rate": 1.4091491592559512e-07, + "loss": 0.0013, + "step": 15265 + }, + { + "epoch": 0.3, + "learning_rate": 1.40911032581259e-07, + "loss": 0.4162, + "step": 15266 + }, + { + "epoch": 0.3, + "learning_rate": 1.4090714923692283e-07, + "loss": 0.0009, + "step": 15267 + }, + { + "epoch": 0.3, + "learning_rate": 1.409032658925867e-07, + "loss": 0.0013, + "step": 15268 + }, + { + "epoch": 0.3, + "learning_rate": 1.4089938254825055e-07, + "loss": 0.0012, + "step": 15269 + }, + { + "epoch": 0.3, + "learning_rate": 1.4089549920391442e-07, + "loss": 0.0332, + "step": 15270 + }, + { + "epoch": 0.3, + "learning_rate": 1.4089161585957827e-07, + "loss": 0.8274, + "step": 15271 + }, + { + "epoch": 0.3, + "learning_rate": 1.4088773251524214e-07, + "loss": 0.0015, + "step": 15272 + }, + { + "epoch": 0.3, + "learning_rate": 1.4088384917090598e-07, + "loss": 0.1491, + "step": 15273 + }, + { + "epoch": 0.3, + "learning_rate": 1.4087996582656986e-07, + "loss": 0.0092, + "step": 15274 + }, + { + "epoch": 0.3, + "learning_rate": 1.4087608248223367e-07, + "loss": 0.0018, + "step": 15275 + }, + { + "epoch": 0.3, + "learning_rate": 1.4087219913789755e-07, + "loss": 0.001, + "step": 15276 + }, + { + "epoch": 0.3, + "learning_rate": 1.408683157935614e-07, + "loss": 0.0031, + "step": 15277 + }, + { + "epoch": 0.3, + "learning_rate": 1.4086443244922526e-07, + "loss": 0.4571, + "step": 15278 + }, + { + "epoch": 0.3, + "learning_rate": 1.408605491048891e-07, + "loss": 0.0009, + "step": 15279 + }, + { + "epoch": 0.3, + "learning_rate": 1.4085666576055298e-07, + "loss": 0.0019, + "step": 15280 + }, + { + "epoch": 0.3, + "learning_rate": 1.4085278241621682e-07, + "loss": 0.001, + "step": 15281 + }, + { + "epoch": 0.3, + "learning_rate": 1.408488990718807e-07, + "loss": 0.0412, + "step": 15282 + }, + { + "epoch": 0.3, + "learning_rate": 1.4084501572754454e-07, + "loss": 0.0029, + "step": 15283 + }, + { + "epoch": 0.3, + "learning_rate": 1.408411323832084e-07, + "loss": 0.0013, + "step": 15284 + }, + { + "epoch": 0.3, + "learning_rate": 1.4083724903887226e-07, + "loss": 0.0013, + "step": 15285 + }, + { + "epoch": 0.3, + "learning_rate": 1.4083336569453613e-07, + "loss": 0.0016, + "step": 15286 + }, + { + "epoch": 0.3, + "learning_rate": 1.4082948235019997e-07, + "loss": 0.0313, + "step": 15287 + }, + { + "epoch": 0.3, + "learning_rate": 1.4082559900586384e-07, + "loss": 0.0012, + "step": 15288 + }, + { + "epoch": 0.3, + "learning_rate": 1.408217156615277e-07, + "loss": 0.2252, + "step": 15289 + }, + { + "epoch": 0.3, + "learning_rate": 1.4081783231719156e-07, + "loss": 0.0012, + "step": 15290 + }, + { + "epoch": 0.3, + "learning_rate": 1.408139489728554e-07, + "loss": 0.0013, + "step": 15291 + }, + { + "epoch": 0.3, + "learning_rate": 1.4081006562851928e-07, + "loss": 0.0012, + "step": 15292 + }, + { + "epoch": 0.3, + "learning_rate": 1.4080618228418312e-07, + "loss": 0.012, + "step": 15293 + }, + { + "epoch": 0.3, + "learning_rate": 1.40802298939847e-07, + "loss": 0.0013, + "step": 15294 + }, + { + "epoch": 0.3, + "learning_rate": 1.4079841559551084e-07, + "loss": 0.0011, + "step": 15295 + }, + { + "epoch": 0.3, + "learning_rate": 1.407945322511747e-07, + "loss": 0.0008, + "step": 15296 + }, + { + "epoch": 0.3, + "learning_rate": 1.4079064890683856e-07, + "loss": 0.0039, + "step": 15297 + }, + { + "epoch": 0.3, + "learning_rate": 1.4078676556250243e-07, + "loss": 0.0012, + "step": 15298 + }, + { + "epoch": 0.3, + "learning_rate": 1.4078288221816627e-07, + "loss": 0.0013, + "step": 15299 + }, + { + "epoch": 0.3, + "learning_rate": 1.4077899887383014e-07, + "loss": 0.1612, + "step": 15300 + }, + { + "epoch": 0.3, + "learning_rate": 1.40775115529494e-07, + "loss": 0.9188, + "step": 15301 + }, + { + "epoch": 0.3, + "learning_rate": 1.4077123218515786e-07, + "loss": 0.0013, + "step": 15302 + }, + { + "epoch": 0.3, + "learning_rate": 1.407673488408217e-07, + "loss": 0.0016, + "step": 15303 + }, + { + "epoch": 0.3, + "learning_rate": 1.4076346549648558e-07, + "loss": 0.0011, + "step": 15304 + }, + { + "epoch": 0.3, + "learning_rate": 1.4075958215214942e-07, + "loss": 0.1218, + "step": 15305 + }, + { + "epoch": 0.3, + "learning_rate": 1.407556988078133e-07, + "loss": 0.0015, + "step": 15306 + }, + { + "epoch": 0.3, + "learning_rate": 1.4075181546347714e-07, + "loss": 0.0012, + "step": 15307 + }, + { + "epoch": 0.3, + "learning_rate": 1.40747932119141e-07, + "loss": 0.0009, + "step": 15308 + }, + { + "epoch": 0.3, + "learning_rate": 1.4074404877480485e-07, + "loss": 0.0011, + "step": 15309 + }, + { + "epoch": 0.3, + "learning_rate": 1.4074016543046873e-07, + "loss": 0.0011, + "step": 15310 + }, + { + "epoch": 0.3, + "learning_rate": 1.4073628208613257e-07, + "loss": 0.0011, + "step": 15311 + }, + { + "epoch": 0.3, + "learning_rate": 1.4073239874179644e-07, + "loss": 0.0014, + "step": 15312 + }, + { + "epoch": 0.3, + "learning_rate": 1.407285153974603e-07, + "loss": 0.0012, + "step": 15313 + }, + { + "epoch": 0.3, + "learning_rate": 1.4072463205312416e-07, + "loss": 0.002, + "step": 15314 + }, + { + "epoch": 0.3, + "learning_rate": 1.40720748708788e-07, + "loss": 0.541, + "step": 15315 + }, + { + "epoch": 0.3, + "learning_rate": 1.4071686536445188e-07, + "loss": 0.6542, + "step": 15316 + }, + { + "epoch": 0.3, + "learning_rate": 1.4071298202011572e-07, + "loss": 1.2299, + "step": 15317 + }, + { + "epoch": 0.3, + "learning_rate": 1.407090986757796e-07, + "loss": 0.1474, + "step": 15318 + }, + { + "epoch": 0.3, + "learning_rate": 1.4070521533144344e-07, + "loss": 0.0014, + "step": 15319 + }, + { + "epoch": 0.3, + "learning_rate": 1.407013319871073e-07, + "loss": 0.001, + "step": 15320 + }, + { + "epoch": 0.3, + "learning_rate": 1.4069744864277115e-07, + "loss": 0.0028, + "step": 15321 + }, + { + "epoch": 0.3, + "learning_rate": 1.4069356529843503e-07, + "loss": 0.0022, + "step": 15322 + }, + { + "epoch": 0.3, + "learning_rate": 1.4068968195409887e-07, + "loss": 0.001, + "step": 15323 + }, + { + "epoch": 0.3, + "learning_rate": 1.4068579860976274e-07, + "loss": 0.0012, + "step": 15324 + }, + { + "epoch": 0.3, + "learning_rate": 1.4068191526542659e-07, + "loss": 0.0011, + "step": 15325 + }, + { + "epoch": 0.3, + "learning_rate": 1.4067803192109046e-07, + "loss": 0.0011, + "step": 15326 + }, + { + "epoch": 0.3, + "learning_rate": 1.406741485767543e-07, + "loss": 0.0012, + "step": 15327 + }, + { + "epoch": 0.3, + "learning_rate": 1.4067026523241817e-07, + "loss": 0.7985, + "step": 15328 + }, + { + "epoch": 0.3, + "learning_rate": 1.4066638188808202e-07, + "loss": 0.0013, + "step": 15329 + }, + { + "epoch": 0.3, + "learning_rate": 1.4066249854374586e-07, + "loss": 0.0009, + "step": 15330 + }, + { + "epoch": 0.3, + "learning_rate": 1.4065861519940974e-07, + "loss": 0.754, + "step": 15331 + }, + { + "epoch": 0.3, + "learning_rate": 1.4065473185507358e-07, + "loss": 0.0028, + "step": 15332 + }, + { + "epoch": 0.3, + "learning_rate": 1.4065084851073743e-07, + "loss": 0.1653, + "step": 15333 + }, + { + "epoch": 0.3, + "learning_rate": 1.406469651664013e-07, + "loss": 0.0012, + "step": 15334 + }, + { + "epoch": 0.3, + "learning_rate": 1.4064308182206514e-07, + "loss": 0.6416, + "step": 15335 + }, + { + "epoch": 0.3, + "learning_rate": 1.4063919847772901e-07, + "loss": 0.0014, + "step": 15336 + }, + { + "epoch": 0.3, + "learning_rate": 1.4063531513339286e-07, + "loss": 0.0011, + "step": 15337 + }, + { + "epoch": 0.3, + "learning_rate": 1.4063143178905673e-07, + "loss": 0.0012, + "step": 15338 + }, + { + "epoch": 0.3, + "learning_rate": 1.4062754844472058e-07, + "loss": 0.0009, + "step": 15339 + }, + { + "epoch": 0.3, + "learning_rate": 1.4062366510038445e-07, + "loss": 0.0017, + "step": 15340 + }, + { + "epoch": 0.3, + "learning_rate": 1.406197817560483e-07, + "loss": 0.0021, + "step": 15341 + }, + { + "epoch": 0.3, + "learning_rate": 1.4061589841171216e-07, + "loss": 0.0011, + "step": 15342 + }, + { + "epoch": 0.3, + "learning_rate": 1.40612015067376e-07, + "loss": 0.081, + "step": 15343 + }, + { + "epoch": 0.3, + "learning_rate": 1.4060813172303988e-07, + "loss": 0.002, + "step": 15344 + }, + { + "epoch": 0.3, + "learning_rate": 1.4060424837870372e-07, + "loss": 0.0013, + "step": 15345 + }, + { + "epoch": 0.3, + "learning_rate": 1.406003650343676e-07, + "loss": 0.0012, + "step": 15346 + }, + { + "epoch": 0.3, + "learning_rate": 1.4059648169003144e-07, + "loss": 0.0012, + "step": 15347 + }, + { + "epoch": 0.3, + "learning_rate": 1.405925983456953e-07, + "loss": 0.001, + "step": 15348 + }, + { + "epoch": 0.3, + "learning_rate": 1.4058871500135916e-07, + "loss": 0.0013, + "step": 15349 + }, + { + "epoch": 0.3, + "learning_rate": 1.4058483165702303e-07, + "loss": 0.0026, + "step": 15350 + }, + { + "epoch": 0.3, + "learning_rate": 1.4058094831268687e-07, + "loss": 0.0016, + "step": 15351 + }, + { + "epoch": 0.3, + "learning_rate": 1.4057706496835075e-07, + "loss": 0.001, + "step": 15352 + }, + { + "epoch": 0.3, + "learning_rate": 1.405731816240146e-07, + "loss": 0.0037, + "step": 15353 + }, + { + "epoch": 0.3, + "learning_rate": 1.4056929827967846e-07, + "loss": 0.001, + "step": 15354 + }, + { + "epoch": 0.3, + "learning_rate": 1.405654149353423e-07, + "loss": 0.0009, + "step": 15355 + }, + { + "epoch": 0.3, + "learning_rate": 1.4056153159100618e-07, + "loss": 0.0014, + "step": 15356 + }, + { + "epoch": 0.3, + "learning_rate": 1.4055764824667002e-07, + "loss": 0.0014, + "step": 15357 + }, + { + "epoch": 0.3, + "learning_rate": 1.405537649023339e-07, + "loss": 0.1639, + "step": 15358 + }, + { + "epoch": 0.3, + "learning_rate": 1.4054988155799774e-07, + "loss": 0.0012, + "step": 15359 + }, + { + "epoch": 0.3, + "learning_rate": 1.4054599821366159e-07, + "loss": 0.0011, + "step": 15360 + }, + { + "epoch": 0.3, + "learning_rate": 1.4054211486932546e-07, + "loss": 0.6101, + "step": 15361 + }, + { + "epoch": 0.3, + "learning_rate": 1.405382315249893e-07, + "loss": 0.5462, + "step": 15362 + }, + { + "epoch": 0.3, + "learning_rate": 1.4053434818065317e-07, + "loss": 0.0032, + "step": 15363 + }, + { + "epoch": 0.3, + "learning_rate": 1.4053046483631702e-07, + "loss": 0.0013, + "step": 15364 + }, + { + "epoch": 0.3, + "learning_rate": 1.405265814919809e-07, + "loss": 0.2856, + "step": 15365 + }, + { + "epoch": 0.3, + "learning_rate": 1.4052269814764473e-07, + "loss": 0.7281, + "step": 15366 + }, + { + "epoch": 0.3, + "learning_rate": 1.405188148033086e-07, + "loss": 1.6897, + "step": 15367 + }, + { + "epoch": 0.3, + "learning_rate": 1.4051493145897245e-07, + "loss": 0.0016, + "step": 15368 + }, + { + "epoch": 0.3, + "learning_rate": 1.4051104811463632e-07, + "loss": 0.0025, + "step": 15369 + }, + { + "epoch": 0.3, + "learning_rate": 1.4050716477030017e-07, + "loss": 0.0012, + "step": 15370 + }, + { + "epoch": 0.3, + "learning_rate": 1.4050328142596404e-07, + "loss": 0.0017, + "step": 15371 + }, + { + "epoch": 0.3, + "learning_rate": 1.4049939808162788e-07, + "loss": 0.873, + "step": 15372 + }, + { + "epoch": 0.3, + "learning_rate": 1.4049551473729176e-07, + "loss": 0.0013, + "step": 15373 + }, + { + "epoch": 0.3, + "learning_rate": 1.404916313929556e-07, + "loss": 0.0017, + "step": 15374 + }, + { + "epoch": 0.3, + "learning_rate": 1.4048774804861947e-07, + "loss": 0.0015, + "step": 15375 + }, + { + "epoch": 0.3, + "learning_rate": 1.4048386470428332e-07, + "loss": 0.0018, + "step": 15376 + }, + { + "epoch": 0.3, + "learning_rate": 1.404799813599472e-07, + "loss": 0.0015, + "step": 15377 + }, + { + "epoch": 0.3, + "learning_rate": 1.4047609801561103e-07, + "loss": 0.0723, + "step": 15378 + }, + { + "epoch": 0.3, + "learning_rate": 1.404722146712749e-07, + "loss": 0.0013, + "step": 15379 + }, + { + "epoch": 0.3, + "learning_rate": 1.4046833132693875e-07, + "loss": 0.0222, + "step": 15380 + }, + { + "epoch": 0.3, + "learning_rate": 1.4046444798260262e-07, + "loss": 1.1023, + "step": 15381 + }, + { + "epoch": 0.3, + "learning_rate": 1.4046056463826647e-07, + "loss": 0.0019, + "step": 15382 + }, + { + "epoch": 0.3, + "learning_rate": 1.4045668129393034e-07, + "loss": 0.0014, + "step": 15383 + }, + { + "epoch": 0.3, + "learning_rate": 1.4045279794959418e-07, + "loss": 0.0009, + "step": 15384 + }, + { + "epoch": 0.3, + "learning_rate": 1.4044891460525805e-07, + "loss": 0.0013, + "step": 15385 + }, + { + "epoch": 0.3, + "learning_rate": 1.404450312609219e-07, + "loss": 0.0012, + "step": 15386 + }, + { + "epoch": 0.3, + "learning_rate": 1.4044114791658577e-07, + "loss": 0.0013, + "step": 15387 + }, + { + "epoch": 0.3, + "learning_rate": 1.4043726457224962e-07, + "loss": 0.0012, + "step": 15388 + }, + { + "epoch": 0.3, + "learning_rate": 1.404333812279135e-07, + "loss": 0.0011, + "step": 15389 + }, + { + "epoch": 0.3, + "learning_rate": 1.4042949788357733e-07, + "loss": 0.001, + "step": 15390 + }, + { + "epoch": 0.3, + "learning_rate": 1.4042561453924118e-07, + "loss": 0.0011, + "step": 15391 + }, + { + "epoch": 0.3, + "learning_rate": 1.4042173119490502e-07, + "loss": 0.001, + "step": 15392 + }, + { + "epoch": 0.3, + "learning_rate": 1.404178478505689e-07, + "loss": 0.0012, + "step": 15393 + }, + { + "epoch": 0.3, + "learning_rate": 1.4041396450623274e-07, + "loss": 0.0011, + "step": 15394 + }, + { + "epoch": 0.3, + "learning_rate": 1.404100811618966e-07, + "loss": 0.0008, + "step": 15395 + }, + { + "epoch": 0.3, + "learning_rate": 1.4040619781756046e-07, + "loss": 0.001, + "step": 15396 + }, + { + "epoch": 0.3, + "learning_rate": 1.4040231447322433e-07, + "loss": 0.0013, + "step": 15397 + }, + { + "epoch": 0.3, + "learning_rate": 1.4039843112888817e-07, + "loss": 0.0014, + "step": 15398 + }, + { + "epoch": 0.3, + "learning_rate": 1.4039454778455204e-07, + "loss": 0.0021, + "step": 15399 + }, + { + "epoch": 0.3, + "learning_rate": 1.403906644402159e-07, + "loss": 0.0682, + "step": 15400 + }, + { + "epoch": 0.3, + "learning_rate": 1.4038678109587976e-07, + "loss": 0.0012, + "step": 15401 + }, + { + "epoch": 0.3, + "learning_rate": 1.403828977515436e-07, + "loss": 0.1437, + "step": 15402 + }, + { + "epoch": 0.3, + "learning_rate": 1.4037901440720748e-07, + "loss": 0.0018, + "step": 15403 + }, + { + "epoch": 0.3, + "learning_rate": 1.4037513106287132e-07, + "loss": 0.001, + "step": 15404 + }, + { + "epoch": 0.3, + "learning_rate": 1.403712477185352e-07, + "loss": 0.0011, + "step": 15405 + }, + { + "epoch": 0.3, + "learning_rate": 1.4036736437419904e-07, + "loss": 0.8443, + "step": 15406 + }, + { + "epoch": 0.3, + "learning_rate": 1.403634810298629e-07, + "loss": 0.1901, + "step": 15407 + }, + { + "epoch": 0.3, + "learning_rate": 1.4035959768552675e-07, + "loss": 0.1424, + "step": 15408 + }, + { + "epoch": 0.3, + "learning_rate": 1.4035571434119063e-07, + "loss": 0.0014, + "step": 15409 + }, + { + "epoch": 0.3, + "learning_rate": 1.4035183099685447e-07, + "loss": 0.0014, + "step": 15410 + }, + { + "epoch": 0.3, + "learning_rate": 1.4034794765251834e-07, + "loss": 0.0011, + "step": 15411 + }, + { + "epoch": 0.3, + "learning_rate": 1.403440643081822e-07, + "loss": 0.0028, + "step": 15412 + }, + { + "epoch": 0.3, + "learning_rate": 1.4034018096384606e-07, + "loss": 0.0673, + "step": 15413 + }, + { + "epoch": 0.3, + "learning_rate": 1.403362976195099e-07, + "loss": 0.0033, + "step": 15414 + }, + { + "epoch": 0.3, + "learning_rate": 1.4033241427517378e-07, + "loss": 0.0011, + "step": 15415 + }, + { + "epoch": 0.3, + "learning_rate": 1.4032853093083762e-07, + "loss": 0.4869, + "step": 15416 + }, + { + "epoch": 0.3, + "learning_rate": 1.403246475865015e-07, + "loss": 0.0018, + "step": 15417 + }, + { + "epoch": 0.3, + "learning_rate": 1.4032076424216534e-07, + "loss": 0.001, + "step": 15418 + }, + { + "epoch": 0.3, + "learning_rate": 1.403168808978292e-07, + "loss": 0.2838, + "step": 15419 + }, + { + "epoch": 0.3, + "learning_rate": 1.4031299755349305e-07, + "loss": 0.001, + "step": 15420 + }, + { + "epoch": 0.3, + "learning_rate": 1.4030911420915693e-07, + "loss": 0.0059, + "step": 15421 + }, + { + "epoch": 0.3, + "learning_rate": 1.4030523086482077e-07, + "loss": 0.0012, + "step": 15422 + }, + { + "epoch": 0.3, + "learning_rate": 1.4030134752048464e-07, + "loss": 0.1574, + "step": 15423 + }, + { + "epoch": 0.3, + "learning_rate": 1.4029746417614849e-07, + "loss": 0.0026, + "step": 15424 + }, + { + "epoch": 0.3, + "learning_rate": 1.4029358083181236e-07, + "loss": 0.0015, + "step": 15425 + }, + { + "epoch": 0.3, + "learning_rate": 1.402896974874762e-07, + "loss": 0.0011, + "step": 15426 + }, + { + "epoch": 0.3, + "learning_rate": 1.4028581414314007e-07, + "loss": 0.0013, + "step": 15427 + }, + { + "epoch": 0.3, + "learning_rate": 1.4028193079880392e-07, + "loss": 0.0011, + "step": 15428 + }, + { + "epoch": 0.3, + "learning_rate": 1.402780474544678e-07, + "loss": 0.0011, + "step": 15429 + }, + { + "epoch": 0.3, + "learning_rate": 1.4027416411013164e-07, + "loss": 0.0011, + "step": 15430 + }, + { + "epoch": 0.3, + "learning_rate": 1.402702807657955e-07, + "loss": 0.0012, + "step": 15431 + }, + { + "epoch": 0.3, + "learning_rate": 1.4026639742145935e-07, + "loss": 0.0072, + "step": 15432 + }, + { + "epoch": 0.3, + "learning_rate": 1.4026251407712322e-07, + "loss": 0.0011, + "step": 15433 + }, + { + "epoch": 0.3, + "learning_rate": 1.4025863073278707e-07, + "loss": 0.9632, + "step": 15434 + }, + { + "epoch": 0.3, + "learning_rate": 1.4025474738845094e-07, + "loss": 0.0012, + "step": 15435 + }, + { + "epoch": 0.3, + "learning_rate": 1.4025086404411479e-07, + "loss": 0.0015, + "step": 15436 + }, + { + "epoch": 0.3, + "learning_rate": 1.4024698069977866e-07, + "loss": 0.0013, + "step": 15437 + }, + { + "epoch": 0.3, + "learning_rate": 1.402430973554425e-07, + "loss": 0.0011, + "step": 15438 + }, + { + "epoch": 0.3, + "learning_rate": 1.4023921401110637e-07, + "loss": 0.0176, + "step": 15439 + }, + { + "epoch": 0.3, + "learning_rate": 1.4023533066677022e-07, + "loss": 0.003, + "step": 15440 + }, + { + "epoch": 0.3, + "learning_rate": 1.402314473224341e-07, + "loss": 0.0499, + "step": 15441 + }, + { + "epoch": 0.3, + "learning_rate": 1.4022756397809793e-07, + "loss": 0.001, + "step": 15442 + }, + { + "epoch": 0.3, + "learning_rate": 1.402236806337618e-07, + "loss": 0.0036, + "step": 15443 + }, + { + "epoch": 0.3, + "learning_rate": 1.4021979728942565e-07, + "loss": 0.0013, + "step": 15444 + }, + { + "epoch": 0.3, + "learning_rate": 1.4021591394508952e-07, + "loss": 0.0013, + "step": 15445 + }, + { + "epoch": 0.3, + "learning_rate": 1.4021203060075337e-07, + "loss": 0.4957, + "step": 15446 + }, + { + "epoch": 0.3, + "learning_rate": 1.4020814725641724e-07, + "loss": 0.0064, + "step": 15447 + }, + { + "epoch": 0.3, + "learning_rate": 1.4020426391208108e-07, + "loss": 0.0018, + "step": 15448 + }, + { + "epoch": 0.3, + "learning_rate": 1.4020038056774493e-07, + "loss": 0.0013, + "step": 15449 + }, + { + "epoch": 0.3, + "learning_rate": 1.4019649722340877e-07, + "loss": 0.0013, + "step": 15450 + }, + { + "epoch": 0.3, + "learning_rate": 1.4019261387907265e-07, + "loss": 0.9465, + "step": 15451 + }, + { + "epoch": 0.3, + "learning_rate": 1.401887305347365e-07, + "loss": 0.0034, + "step": 15452 + }, + { + "epoch": 0.3, + "learning_rate": 1.4018484719040036e-07, + "loss": 0.0015, + "step": 15453 + }, + { + "epoch": 0.3, + "learning_rate": 1.401809638460642e-07, + "loss": 0.0025, + "step": 15454 + }, + { + "epoch": 0.3, + "learning_rate": 1.4017708050172808e-07, + "loss": 0.0011, + "step": 15455 + }, + { + "epoch": 0.3, + "learning_rate": 1.4017319715739192e-07, + "loss": 0.0014, + "step": 15456 + }, + { + "epoch": 0.3, + "learning_rate": 1.401693138130558e-07, + "loss": 0.001, + "step": 15457 + }, + { + "epoch": 0.3, + "learning_rate": 1.4016543046871964e-07, + "loss": 0.0013, + "step": 15458 + }, + { + "epoch": 0.3, + "learning_rate": 1.401615471243835e-07, + "loss": 0.0015, + "step": 15459 + }, + { + "epoch": 0.3, + "learning_rate": 1.4015766378004736e-07, + "loss": 0.1559, + "step": 15460 + }, + { + "epoch": 0.3, + "learning_rate": 1.4015378043571123e-07, + "loss": 0.0011, + "step": 15461 + }, + { + "epoch": 0.3, + "learning_rate": 1.4014989709137507e-07, + "loss": 0.0019, + "step": 15462 + }, + { + "epoch": 0.3, + "learning_rate": 1.4014601374703894e-07, + "loss": 0.0025, + "step": 15463 + }, + { + "epoch": 0.3, + "learning_rate": 1.401421304027028e-07, + "loss": 0.0012, + "step": 15464 + }, + { + "epoch": 0.3, + "learning_rate": 1.4013824705836666e-07, + "loss": 0.0012, + "step": 15465 + }, + { + "epoch": 0.3, + "learning_rate": 1.401343637140305e-07, + "loss": 0.0013, + "step": 15466 + }, + { + "epoch": 0.3, + "learning_rate": 1.4013048036969438e-07, + "loss": 0.0011, + "step": 15467 + }, + { + "epoch": 0.3, + "learning_rate": 1.4012659702535822e-07, + "loss": 0.0019, + "step": 15468 + }, + { + "epoch": 0.3, + "learning_rate": 1.401227136810221e-07, + "loss": 0.8374, + "step": 15469 + }, + { + "epoch": 0.3, + "learning_rate": 1.4011883033668594e-07, + "loss": 0.0015, + "step": 15470 + }, + { + "epoch": 0.3, + "learning_rate": 1.401149469923498e-07, + "loss": 0.0037, + "step": 15471 + }, + { + "epoch": 0.3, + "learning_rate": 1.4011106364801366e-07, + "loss": 0.0008, + "step": 15472 + }, + { + "epoch": 0.3, + "learning_rate": 1.4010718030367753e-07, + "loss": 0.084, + "step": 15473 + }, + { + "epoch": 0.3, + "learning_rate": 1.4010329695934137e-07, + "loss": 0.0305, + "step": 15474 + }, + { + "epoch": 0.3, + "learning_rate": 1.4009941361500524e-07, + "loss": 0.0011, + "step": 15475 + }, + { + "epoch": 0.3, + "learning_rate": 1.400955302706691e-07, + "loss": 0.001, + "step": 15476 + }, + { + "epoch": 0.3, + "learning_rate": 1.4009164692633296e-07, + "loss": 0.0012, + "step": 15477 + }, + { + "epoch": 0.3, + "learning_rate": 1.400877635819968e-07, + "loss": 0.0014, + "step": 15478 + }, + { + "epoch": 0.3, + "learning_rate": 1.4008388023766068e-07, + "loss": 0.5301, + "step": 15479 + }, + { + "epoch": 0.3, + "learning_rate": 1.4007999689332452e-07, + "loss": 0.0036, + "step": 15480 + }, + { + "epoch": 0.3, + "learning_rate": 1.400761135489884e-07, + "loss": 0.0017, + "step": 15481 + }, + { + "epoch": 0.3, + "learning_rate": 1.4007223020465224e-07, + "loss": 0.0014, + "step": 15482 + }, + { + "epoch": 0.3, + "learning_rate": 1.400683468603161e-07, + "loss": 0.001, + "step": 15483 + }, + { + "epoch": 0.3, + "learning_rate": 1.4006446351597995e-07, + "loss": 0.0039, + "step": 15484 + }, + { + "epoch": 0.3, + "learning_rate": 1.4006058017164383e-07, + "loss": 0.0009, + "step": 15485 + }, + { + "epoch": 0.3, + "learning_rate": 1.4005669682730767e-07, + "loss": 0.0948, + "step": 15486 + }, + { + "epoch": 0.3, + "learning_rate": 1.4005281348297154e-07, + "loss": 0.0024, + "step": 15487 + }, + { + "epoch": 0.3, + "learning_rate": 1.400489301386354e-07, + "loss": 0.7757, + "step": 15488 + }, + { + "epoch": 0.3, + "learning_rate": 1.4004504679429926e-07, + "loss": 0.4683, + "step": 15489 + }, + { + "epoch": 0.3, + "learning_rate": 1.400411634499631e-07, + "loss": 0.0012, + "step": 15490 + }, + { + "epoch": 0.3, + "learning_rate": 1.4003728010562698e-07, + "loss": 0.001, + "step": 15491 + }, + { + "epoch": 0.3, + "learning_rate": 1.4003339676129082e-07, + "loss": 0.001, + "step": 15492 + }, + { + "epoch": 0.3, + "learning_rate": 1.400295134169547e-07, + "loss": 0.0011, + "step": 15493 + }, + { + "epoch": 0.3, + "learning_rate": 1.4002563007261854e-07, + "loss": 0.1834, + "step": 15494 + }, + { + "epoch": 0.3, + "learning_rate": 1.400217467282824e-07, + "loss": 0.0013, + "step": 15495 + }, + { + "epoch": 0.3, + "learning_rate": 1.4001786338394625e-07, + "loss": 0.0012, + "step": 15496 + }, + { + "epoch": 0.3, + "learning_rate": 1.4001398003961013e-07, + "loss": 0.0015, + "step": 15497 + }, + { + "epoch": 0.3, + "learning_rate": 1.4001009669527397e-07, + "loss": 0.0015, + "step": 15498 + }, + { + "epoch": 0.3, + "learning_rate": 1.4000621335093784e-07, + "loss": 0.0013, + "step": 15499 + }, + { + "epoch": 0.3, + "learning_rate": 1.4000233000660169e-07, + "loss": 0.0011, + "step": 15500 + }, + { + "epoch": 0.3, + "learning_rate": 1.3999844666226556e-07, + "loss": 0.0014, + "step": 15501 + }, + { + "epoch": 0.3, + "learning_rate": 1.399945633179294e-07, + "loss": 0.0569, + "step": 15502 + }, + { + "epoch": 0.3, + "learning_rate": 1.3999067997359327e-07, + "loss": 0.0011, + "step": 15503 + }, + { + "epoch": 0.3, + "learning_rate": 1.3998679662925712e-07, + "loss": 0.0034, + "step": 15504 + }, + { + "epoch": 0.3, + "learning_rate": 1.39982913284921e-07, + "loss": 0.7388, + "step": 15505 + }, + { + "epoch": 0.3, + "learning_rate": 1.3997902994058484e-07, + "loss": 0.0009, + "step": 15506 + }, + { + "epoch": 0.3, + "learning_rate": 1.3997514659624868e-07, + "loss": 0.3422, + "step": 15507 + }, + { + "epoch": 0.3, + "learning_rate": 1.3997126325191253e-07, + "loss": 0.0012, + "step": 15508 + }, + { + "epoch": 0.3, + "learning_rate": 1.399673799075764e-07, + "loss": 0.0014, + "step": 15509 + }, + { + "epoch": 0.3, + "learning_rate": 1.3996349656324024e-07, + "loss": 0.001, + "step": 15510 + }, + { + "epoch": 0.3, + "learning_rate": 1.3995961321890411e-07, + "loss": 0.0015, + "step": 15511 + }, + { + "epoch": 0.3, + "learning_rate": 1.3995572987456796e-07, + "loss": 0.0022, + "step": 15512 + }, + { + "epoch": 0.3, + "learning_rate": 1.3995184653023183e-07, + "loss": 0.0011, + "step": 15513 + }, + { + "epoch": 0.3, + "learning_rate": 1.3994796318589568e-07, + "loss": 0.0016, + "step": 15514 + }, + { + "epoch": 0.3, + "learning_rate": 1.3994407984155955e-07, + "loss": 0.001, + "step": 15515 + }, + { + "epoch": 0.3, + "learning_rate": 1.399401964972234e-07, + "loss": 0.0014, + "step": 15516 + }, + { + "epoch": 0.3, + "learning_rate": 1.3993631315288726e-07, + "loss": 0.0013, + "step": 15517 + }, + { + "epoch": 0.3, + "learning_rate": 1.399324298085511e-07, + "loss": 0.0185, + "step": 15518 + }, + { + "epoch": 0.3, + "learning_rate": 1.3992854646421498e-07, + "loss": 0.0014, + "step": 15519 + }, + { + "epoch": 0.3, + "learning_rate": 1.3992466311987883e-07, + "loss": 0.0011, + "step": 15520 + }, + { + "epoch": 0.3, + "learning_rate": 1.399207797755427e-07, + "loss": 0.0012, + "step": 15521 + }, + { + "epoch": 0.3, + "learning_rate": 1.3991689643120654e-07, + "loss": 0.0024, + "step": 15522 + }, + { + "epoch": 0.3, + "learning_rate": 1.399130130868704e-07, + "loss": 0.0012, + "step": 15523 + }, + { + "epoch": 0.3, + "learning_rate": 1.3990912974253426e-07, + "loss": 0.0012, + "step": 15524 + }, + { + "epoch": 0.3, + "learning_rate": 1.3990524639819813e-07, + "loss": 0.0017, + "step": 15525 + }, + { + "epoch": 0.3, + "learning_rate": 1.3990136305386197e-07, + "loss": 0.9848, + "step": 15526 + }, + { + "epoch": 0.3, + "learning_rate": 1.3989747970952585e-07, + "loss": 0.0018, + "step": 15527 + }, + { + "epoch": 0.3, + "learning_rate": 1.398935963651897e-07, + "loss": 0.9093, + "step": 15528 + }, + { + "epoch": 0.3, + "learning_rate": 1.3988971302085356e-07, + "loss": 0.0018, + "step": 15529 + }, + { + "epoch": 0.3, + "learning_rate": 1.398858296765174e-07, + "loss": 0.0013, + "step": 15530 + }, + { + "epoch": 0.3, + "learning_rate": 1.3988194633218128e-07, + "loss": 0.0011, + "step": 15531 + }, + { + "epoch": 0.3, + "learning_rate": 1.3987806298784512e-07, + "loss": 0.001, + "step": 15532 + }, + { + "epoch": 0.3, + "learning_rate": 1.39874179643509e-07, + "loss": 0.0021, + "step": 15533 + }, + { + "epoch": 0.3, + "learning_rate": 1.3987029629917284e-07, + "loss": 0.0015, + "step": 15534 + }, + { + "epoch": 0.3, + "learning_rate": 1.398664129548367e-07, + "loss": 0.0018, + "step": 15535 + }, + { + "epoch": 0.3, + "learning_rate": 1.3986252961050056e-07, + "loss": 0.0035, + "step": 15536 + }, + { + "epoch": 0.3, + "learning_rate": 1.398586462661644e-07, + "loss": 0.0011, + "step": 15537 + }, + { + "epoch": 0.3, + "learning_rate": 1.3985476292182827e-07, + "loss": 0.0013, + "step": 15538 + }, + { + "epoch": 0.3, + "learning_rate": 1.3985087957749212e-07, + "loss": 0.3978, + "step": 15539 + }, + { + "epoch": 0.3, + "learning_rate": 1.39846996233156e-07, + "loss": 0.0011, + "step": 15540 + }, + { + "epoch": 0.3, + "learning_rate": 1.3984311288881983e-07, + "loss": 0.0199, + "step": 15541 + }, + { + "epoch": 0.3, + "learning_rate": 1.398392295444837e-07, + "loss": 0.1736, + "step": 15542 + }, + { + "epoch": 0.3, + "learning_rate": 1.3983534620014755e-07, + "loss": 0.001, + "step": 15543 + }, + { + "epoch": 0.3, + "learning_rate": 1.3983146285581142e-07, + "loss": 0.001, + "step": 15544 + }, + { + "epoch": 0.3, + "learning_rate": 1.3982757951147527e-07, + "loss": 0.0015, + "step": 15545 + }, + { + "epoch": 0.3, + "learning_rate": 1.3982369616713914e-07, + "loss": 0.0021, + "step": 15546 + }, + { + "epoch": 0.3, + "learning_rate": 1.3981981282280298e-07, + "loss": 0.0329, + "step": 15547 + }, + { + "epoch": 0.3, + "learning_rate": 1.3981592947846686e-07, + "loss": 0.0013, + "step": 15548 + }, + { + "epoch": 0.3, + "learning_rate": 1.398120461341307e-07, + "loss": 0.0011, + "step": 15549 + }, + { + "epoch": 0.3, + "learning_rate": 1.3980816278979457e-07, + "loss": 0.0168, + "step": 15550 + }, + { + "epoch": 0.3, + "learning_rate": 1.3980427944545842e-07, + "loss": 0.6412, + "step": 15551 + }, + { + "epoch": 0.3, + "learning_rate": 1.398003961011223e-07, + "loss": 0.2528, + "step": 15552 + }, + { + "epoch": 0.3, + "learning_rate": 1.3979651275678613e-07, + "loss": 0.0069, + "step": 15553 + }, + { + "epoch": 0.3, + "learning_rate": 1.3979262941245e-07, + "loss": 0.0011, + "step": 15554 + }, + { + "epoch": 0.3, + "learning_rate": 1.3978874606811385e-07, + "loss": 0.0009, + "step": 15555 + }, + { + "epoch": 0.3, + "learning_rate": 1.3978486272377772e-07, + "loss": 0.0013, + "step": 15556 + }, + { + "epoch": 0.3, + "learning_rate": 1.3978097937944157e-07, + "loss": 0.0012, + "step": 15557 + }, + { + "epoch": 0.3, + "learning_rate": 1.3977709603510544e-07, + "loss": 0.0015, + "step": 15558 + }, + { + "epoch": 0.3, + "learning_rate": 1.3977321269076928e-07, + "loss": 0.0014, + "step": 15559 + }, + { + "epoch": 0.3, + "learning_rate": 1.3976932934643315e-07, + "loss": 0.0009, + "step": 15560 + }, + { + "epoch": 0.3, + "learning_rate": 1.39765446002097e-07, + "loss": 0.0008, + "step": 15561 + }, + { + "epoch": 0.3, + "learning_rate": 1.3976156265776087e-07, + "loss": 0.001, + "step": 15562 + }, + { + "epoch": 0.3, + "learning_rate": 1.3975767931342472e-07, + "loss": 0.4789, + "step": 15563 + }, + { + "epoch": 0.3, + "learning_rate": 1.397537959690886e-07, + "loss": 0.0013, + "step": 15564 + }, + { + "epoch": 0.3, + "learning_rate": 1.3974991262475243e-07, + "loss": 0.0011, + "step": 15565 + }, + { + "epoch": 0.3, + "learning_rate": 1.3974602928041628e-07, + "loss": 0.0546, + "step": 15566 + }, + { + "epoch": 0.3, + "learning_rate": 1.3974214593608012e-07, + "loss": 0.001, + "step": 15567 + }, + { + "epoch": 0.3, + "learning_rate": 1.39738262591744e-07, + "loss": 0.0009, + "step": 15568 + }, + { + "epoch": 0.3, + "learning_rate": 1.3973437924740784e-07, + "loss": 0.0016, + "step": 15569 + }, + { + "epoch": 0.3, + "learning_rate": 1.397304959030717e-07, + "loss": 0.0015, + "step": 15570 + }, + { + "epoch": 0.3, + "learning_rate": 1.3972661255873556e-07, + "loss": 0.5557, + "step": 15571 + }, + { + "epoch": 0.3, + "learning_rate": 1.3972272921439943e-07, + "loss": 0.0092, + "step": 15572 + }, + { + "epoch": 0.3, + "learning_rate": 1.3971884587006327e-07, + "loss": 1.0276, + "step": 15573 + }, + { + "epoch": 0.3, + "learning_rate": 1.3971496252572714e-07, + "loss": 0.0014, + "step": 15574 + }, + { + "epoch": 0.3, + "learning_rate": 1.39711079181391e-07, + "loss": 0.0014, + "step": 15575 + }, + { + "epoch": 0.3, + "learning_rate": 1.3970719583705486e-07, + "loss": 0.0226, + "step": 15576 + }, + { + "epoch": 0.3, + "learning_rate": 1.397033124927187e-07, + "loss": 0.0017, + "step": 15577 + }, + { + "epoch": 0.3, + "learning_rate": 1.3969942914838258e-07, + "loss": 0.001, + "step": 15578 + }, + { + "epoch": 0.3, + "learning_rate": 1.3969554580404642e-07, + "loss": 0.0017, + "step": 15579 + }, + { + "epoch": 0.3, + "learning_rate": 1.396916624597103e-07, + "loss": 0.0011, + "step": 15580 + }, + { + "epoch": 0.3, + "learning_rate": 1.3968777911537414e-07, + "loss": 0.0011, + "step": 15581 + }, + { + "epoch": 0.3, + "learning_rate": 1.39683895771038e-07, + "loss": 0.0017, + "step": 15582 + }, + { + "epoch": 0.3, + "learning_rate": 1.3968001242670185e-07, + "loss": 0.0014, + "step": 15583 + }, + { + "epoch": 0.3, + "learning_rate": 1.3967612908236573e-07, + "loss": 0.4717, + "step": 15584 + }, + { + "epoch": 0.3, + "learning_rate": 1.3967224573802957e-07, + "loss": 0.0152, + "step": 15585 + }, + { + "epoch": 0.3, + "learning_rate": 1.3966836239369344e-07, + "loss": 0.7873, + "step": 15586 + }, + { + "epoch": 0.3, + "learning_rate": 1.396644790493573e-07, + "loss": 0.5635, + "step": 15587 + }, + { + "epoch": 0.3, + "learning_rate": 1.3966059570502116e-07, + "loss": 0.0009, + "step": 15588 + }, + { + "epoch": 0.3, + "learning_rate": 1.39656712360685e-07, + "loss": 0.0018, + "step": 15589 + }, + { + "epoch": 0.3, + "learning_rate": 1.3965282901634888e-07, + "loss": 0.0017, + "step": 15590 + }, + { + "epoch": 0.3, + "learning_rate": 1.3964894567201272e-07, + "loss": 0.0052, + "step": 15591 + }, + { + "epoch": 0.3, + "learning_rate": 1.396450623276766e-07, + "loss": 1.194, + "step": 15592 + }, + { + "epoch": 0.3, + "learning_rate": 1.3964117898334044e-07, + "loss": 0.0011, + "step": 15593 + }, + { + "epoch": 0.3, + "learning_rate": 1.396372956390043e-07, + "loss": 0.0016, + "step": 15594 + }, + { + "epoch": 0.3, + "learning_rate": 1.3963341229466815e-07, + "loss": 0.0015, + "step": 15595 + }, + { + "epoch": 0.3, + "learning_rate": 1.3962952895033203e-07, + "loss": 0.001, + "step": 15596 + }, + { + "epoch": 0.3, + "learning_rate": 1.3962564560599587e-07, + "loss": 0.0328, + "step": 15597 + }, + { + "epoch": 0.3, + "learning_rate": 1.3962176226165974e-07, + "loss": 0.0012, + "step": 15598 + }, + { + "epoch": 0.3, + "learning_rate": 1.3961787891732359e-07, + "loss": 0.0015, + "step": 15599 + }, + { + "epoch": 0.3, + "learning_rate": 1.3961399557298746e-07, + "loss": 0.0239, + "step": 15600 + }, + { + "epoch": 0.3, + "learning_rate": 1.396101122286513e-07, + "loss": 0.001, + "step": 15601 + }, + { + "epoch": 0.3, + "learning_rate": 1.3960622888431517e-07, + "loss": 0.0855, + "step": 15602 + }, + { + "epoch": 0.3, + "learning_rate": 1.3960234553997902e-07, + "loss": 0.0011, + "step": 15603 + }, + { + "epoch": 0.3, + "learning_rate": 1.395984621956429e-07, + "loss": 0.0011, + "step": 15604 + }, + { + "epoch": 0.3, + "learning_rate": 1.3959457885130674e-07, + "loss": 0.0074, + "step": 15605 + }, + { + "epoch": 0.3, + "learning_rate": 1.395906955069706e-07, + "loss": 0.6603, + "step": 15606 + }, + { + "epoch": 0.3, + "learning_rate": 1.3958681216263445e-07, + "loss": 1.1301, + "step": 15607 + }, + { + "epoch": 0.3, + "learning_rate": 1.3958292881829832e-07, + "loss": 0.001, + "step": 15608 + }, + { + "epoch": 0.3, + "learning_rate": 1.3957904547396217e-07, + "loss": 1.0052, + "step": 15609 + }, + { + "epoch": 0.3, + "learning_rate": 1.3957516212962604e-07, + "loss": 0.0035, + "step": 15610 + }, + { + "epoch": 0.3, + "learning_rate": 1.3957127878528989e-07, + "loss": 0.7977, + "step": 15611 + }, + { + "epoch": 0.3, + "learning_rate": 1.3956739544095376e-07, + "loss": 0.0014, + "step": 15612 + }, + { + "epoch": 0.3, + "learning_rate": 1.395635120966176e-07, + "loss": 0.0012, + "step": 15613 + }, + { + "epoch": 0.3, + "learning_rate": 1.3955962875228147e-07, + "loss": 0.5393, + "step": 15614 + }, + { + "epoch": 0.3, + "learning_rate": 1.3955574540794532e-07, + "loss": 0.7873, + "step": 15615 + }, + { + "epoch": 0.3, + "learning_rate": 1.395518620636092e-07, + "loss": 0.5017, + "step": 15616 + }, + { + "epoch": 0.3, + "learning_rate": 1.3954797871927304e-07, + "loss": 0.042, + "step": 15617 + }, + { + "epoch": 0.3, + "learning_rate": 1.395440953749369e-07, + "loss": 0.0031, + "step": 15618 + }, + { + "epoch": 0.3, + "learning_rate": 1.3954021203060075e-07, + "loss": 0.0018, + "step": 15619 + }, + { + "epoch": 0.3, + "learning_rate": 1.3953632868626462e-07, + "loss": 0.0016, + "step": 15620 + }, + { + "epoch": 0.3, + "learning_rate": 1.3953244534192847e-07, + "loss": 0.0014, + "step": 15621 + }, + { + "epoch": 0.3, + "learning_rate": 1.3952856199759234e-07, + "loss": 0.0009, + "step": 15622 + }, + { + "epoch": 0.3, + "learning_rate": 1.3952467865325616e-07, + "loss": 0.0074, + "step": 15623 + }, + { + "epoch": 0.3, + "learning_rate": 1.3952079530892003e-07, + "loss": 0.0057, + "step": 15624 + }, + { + "epoch": 0.3, + "learning_rate": 1.3951691196458387e-07, + "loss": 0.6367, + "step": 15625 + }, + { + "epoch": 0.3, + "learning_rate": 1.3951302862024775e-07, + "loss": 0.003, + "step": 15626 + }, + { + "epoch": 0.3, + "learning_rate": 1.395091452759116e-07, + "loss": 0.0013, + "step": 15627 + }, + { + "epoch": 0.3, + "learning_rate": 1.3950526193157546e-07, + "loss": 0.0009, + "step": 15628 + }, + { + "epoch": 0.3, + "learning_rate": 1.395013785872393e-07, + "loss": 0.0012, + "step": 15629 + }, + { + "epoch": 0.3, + "learning_rate": 1.3949749524290318e-07, + "loss": 0.4711, + "step": 15630 + }, + { + "epoch": 0.3, + "learning_rate": 1.3949361189856702e-07, + "loss": 0.0012, + "step": 15631 + }, + { + "epoch": 0.3, + "learning_rate": 1.394897285542309e-07, + "loss": 0.0025, + "step": 15632 + }, + { + "epoch": 0.3, + "learning_rate": 1.3948584520989474e-07, + "loss": 0.0012, + "step": 15633 + }, + { + "epoch": 0.3, + "learning_rate": 1.394819618655586e-07, + "loss": 0.0007, + "step": 15634 + }, + { + "epoch": 0.3, + "learning_rate": 1.3947807852122246e-07, + "loss": 0.0011, + "step": 15635 + }, + { + "epoch": 0.3, + "learning_rate": 1.3947419517688633e-07, + "loss": 0.0012, + "step": 15636 + }, + { + "epoch": 0.3, + "learning_rate": 1.3947031183255017e-07, + "loss": 0.0071, + "step": 15637 + }, + { + "epoch": 0.3, + "learning_rate": 1.3946642848821404e-07, + "loss": 0.0011, + "step": 15638 + }, + { + "epoch": 0.3, + "learning_rate": 1.394625451438779e-07, + "loss": 0.001, + "step": 15639 + }, + { + "epoch": 0.3, + "learning_rate": 1.3945866179954176e-07, + "loss": 0.0007, + "step": 15640 + }, + { + "epoch": 0.3, + "learning_rate": 1.394547784552056e-07, + "loss": 0.001, + "step": 15641 + }, + { + "epoch": 0.3, + "learning_rate": 1.3945089511086948e-07, + "loss": 0.1986, + "step": 15642 + }, + { + "epoch": 0.3, + "learning_rate": 1.3944701176653332e-07, + "loss": 0.0046, + "step": 15643 + }, + { + "epoch": 0.3, + "learning_rate": 1.394431284221972e-07, + "loss": 0.0012, + "step": 15644 + }, + { + "epoch": 0.3, + "learning_rate": 1.3943924507786104e-07, + "loss": 0.8195, + "step": 15645 + }, + { + "epoch": 0.3, + "learning_rate": 1.394353617335249e-07, + "loss": 0.0011, + "step": 15646 + }, + { + "epoch": 0.3, + "learning_rate": 1.3943147838918876e-07, + "loss": 0.0018, + "step": 15647 + }, + { + "epoch": 0.3, + "learning_rate": 1.3942759504485263e-07, + "loss": 0.0012, + "step": 15648 + }, + { + "epoch": 0.3, + "learning_rate": 1.3942371170051647e-07, + "loss": 0.0014, + "step": 15649 + }, + { + "epoch": 0.3, + "learning_rate": 1.3941982835618034e-07, + "loss": 0.0008, + "step": 15650 + }, + { + "epoch": 0.3, + "learning_rate": 1.394159450118442e-07, + "loss": 0.0024, + "step": 15651 + }, + { + "epoch": 0.3, + "learning_rate": 1.3941206166750806e-07, + "loss": 0.0055, + "step": 15652 + }, + { + "epoch": 0.3, + "learning_rate": 1.394081783231719e-07, + "loss": 0.0065, + "step": 15653 + }, + { + "epoch": 0.3, + "learning_rate": 1.3940429497883578e-07, + "loss": 0.0011, + "step": 15654 + }, + { + "epoch": 0.3, + "learning_rate": 1.3940041163449962e-07, + "loss": 0.002, + "step": 15655 + }, + { + "epoch": 0.3, + "learning_rate": 1.393965282901635e-07, + "loss": 0.0011, + "step": 15656 + }, + { + "epoch": 0.3, + "learning_rate": 1.3939264494582734e-07, + "loss": 0.0011, + "step": 15657 + }, + { + "epoch": 0.3, + "learning_rate": 1.393887616014912e-07, + "loss": 0.0012, + "step": 15658 + }, + { + "epoch": 0.3, + "learning_rate": 1.3938487825715505e-07, + "loss": 0.0008, + "step": 15659 + }, + { + "epoch": 0.3, + "learning_rate": 1.3938099491281893e-07, + "loss": 0.0007, + "step": 15660 + }, + { + "epoch": 0.3, + "learning_rate": 1.3937711156848277e-07, + "loss": 0.0099, + "step": 15661 + }, + { + "epoch": 0.3, + "learning_rate": 1.3937322822414664e-07, + "loss": 0.0011, + "step": 15662 + }, + { + "epoch": 0.3, + "learning_rate": 1.393693448798105e-07, + "loss": 0.0012, + "step": 15663 + }, + { + "epoch": 0.3, + "learning_rate": 1.3936546153547436e-07, + "loss": 0.0012, + "step": 15664 + }, + { + "epoch": 0.3, + "learning_rate": 1.393615781911382e-07, + "loss": 0.0011, + "step": 15665 + }, + { + "epoch": 0.3, + "learning_rate": 1.3935769484680208e-07, + "loss": 0.0008, + "step": 15666 + }, + { + "epoch": 0.3, + "learning_rate": 1.3935381150246592e-07, + "loss": 0.0425, + "step": 15667 + }, + { + "epoch": 0.3, + "learning_rate": 1.393499281581298e-07, + "loss": 0.0022, + "step": 15668 + }, + { + "epoch": 0.3, + "learning_rate": 1.3934604481379364e-07, + "loss": 0.0031, + "step": 15669 + }, + { + "epoch": 0.3, + "learning_rate": 1.393421614694575e-07, + "loss": 0.001, + "step": 15670 + }, + { + "epoch": 0.3, + "learning_rate": 1.3933827812512135e-07, + "loss": 0.001, + "step": 15671 + }, + { + "epoch": 0.3, + "learning_rate": 1.3933439478078523e-07, + "loss": 0.0155, + "step": 15672 + }, + { + "epoch": 0.3, + "learning_rate": 1.3933051143644907e-07, + "loss": 0.0011, + "step": 15673 + }, + { + "epoch": 0.3, + "learning_rate": 1.3932662809211294e-07, + "loss": 0.0014, + "step": 15674 + }, + { + "epoch": 0.3, + "learning_rate": 1.393227447477768e-07, + "loss": 0.0013, + "step": 15675 + }, + { + "epoch": 0.3, + "learning_rate": 1.3931886140344066e-07, + "loss": 0.579, + "step": 15676 + }, + { + "epoch": 0.3, + "learning_rate": 1.393149780591045e-07, + "loss": 0.0202, + "step": 15677 + }, + { + "epoch": 0.3, + "learning_rate": 1.3931109471476837e-07, + "loss": 0.0011, + "step": 15678 + }, + { + "epoch": 0.3, + "learning_rate": 1.3930721137043222e-07, + "loss": 0.0679, + "step": 15679 + }, + { + "epoch": 0.3, + "learning_rate": 1.393033280260961e-07, + "loss": 0.0021, + "step": 15680 + }, + { + "epoch": 0.3, + "learning_rate": 1.392994446817599e-07, + "loss": 0.0026, + "step": 15681 + }, + { + "epoch": 0.3, + "learning_rate": 1.3929556133742378e-07, + "loss": 0.0008, + "step": 15682 + }, + { + "epoch": 0.3, + "learning_rate": 1.3929167799308763e-07, + "loss": 0.2596, + "step": 15683 + }, + { + "epoch": 0.3, + "learning_rate": 1.392877946487515e-07, + "loss": 0.0016, + "step": 15684 + }, + { + "epoch": 0.3, + "learning_rate": 1.3928391130441534e-07, + "loss": 0.0009, + "step": 15685 + }, + { + "epoch": 0.3, + "learning_rate": 1.3928002796007921e-07, + "loss": 0.0022, + "step": 15686 + }, + { + "epoch": 0.3, + "learning_rate": 1.3927614461574306e-07, + "loss": 0.0704, + "step": 15687 + }, + { + "epoch": 0.3, + "learning_rate": 1.3927226127140693e-07, + "loss": 0.0019, + "step": 15688 + }, + { + "epoch": 0.3, + "learning_rate": 1.3926837792707078e-07, + "loss": 0.0011, + "step": 15689 + }, + { + "epoch": 0.3, + "learning_rate": 1.3926449458273465e-07, + "loss": 0.0007, + "step": 15690 + }, + { + "epoch": 0.3, + "learning_rate": 1.392606112383985e-07, + "loss": 0.0046, + "step": 15691 + }, + { + "epoch": 0.3, + "learning_rate": 1.3925672789406236e-07, + "loss": 0.0013, + "step": 15692 + }, + { + "epoch": 0.3, + "learning_rate": 1.392528445497262e-07, + "loss": 0.0016, + "step": 15693 + }, + { + "epoch": 0.3, + "learning_rate": 1.3924896120539008e-07, + "loss": 0.0012, + "step": 15694 + }, + { + "epoch": 0.3, + "learning_rate": 1.3924507786105393e-07, + "loss": 0.3782, + "step": 15695 + }, + { + "epoch": 0.3, + "learning_rate": 1.392411945167178e-07, + "loss": 0.001, + "step": 15696 + }, + { + "epoch": 0.3, + "learning_rate": 1.3923731117238164e-07, + "loss": 0.0014, + "step": 15697 + }, + { + "epoch": 0.3, + "learning_rate": 1.392334278280455e-07, + "loss": 0.0561, + "step": 15698 + }, + { + "epoch": 0.3, + "learning_rate": 1.3922954448370936e-07, + "loss": 0.0012, + "step": 15699 + }, + { + "epoch": 0.3, + "learning_rate": 1.3922566113937323e-07, + "loss": 0.0013, + "step": 15700 + }, + { + "epoch": 0.3, + "learning_rate": 1.3922177779503707e-07, + "loss": 0.0028, + "step": 15701 + }, + { + "epoch": 0.3, + "learning_rate": 1.3921789445070095e-07, + "loss": 0.001, + "step": 15702 + }, + { + "epoch": 0.3, + "learning_rate": 1.392140111063648e-07, + "loss": 0.0013, + "step": 15703 + }, + { + "epoch": 0.3, + "learning_rate": 1.3921012776202866e-07, + "loss": 0.0015, + "step": 15704 + }, + { + "epoch": 0.3, + "learning_rate": 1.392062444176925e-07, + "loss": 0.0268, + "step": 15705 + }, + { + "epoch": 0.3, + "learning_rate": 1.3920236107335638e-07, + "loss": 0.0017, + "step": 15706 + }, + { + "epoch": 0.3, + "learning_rate": 1.3919847772902022e-07, + "loss": 0.997, + "step": 15707 + }, + { + "epoch": 0.3, + "learning_rate": 1.391945943846841e-07, + "loss": 0.0011, + "step": 15708 + }, + { + "epoch": 0.3, + "learning_rate": 1.3919071104034794e-07, + "loss": 0.0016, + "step": 15709 + }, + { + "epoch": 0.3, + "learning_rate": 1.391868276960118e-07, + "loss": 0.0012, + "step": 15710 + }, + { + "epoch": 0.3, + "learning_rate": 1.3918294435167566e-07, + "loss": 0.0062, + "step": 15711 + }, + { + "epoch": 0.3, + "learning_rate": 1.3917906100733953e-07, + "loss": 0.001, + "step": 15712 + }, + { + "epoch": 0.3, + "learning_rate": 1.3917517766300337e-07, + "loss": 0.001, + "step": 15713 + }, + { + "epoch": 0.3, + "learning_rate": 1.3917129431866722e-07, + "loss": 0.0011, + "step": 15714 + }, + { + "epoch": 0.3, + "learning_rate": 1.391674109743311e-07, + "loss": 0.0103, + "step": 15715 + }, + { + "epoch": 0.3, + "learning_rate": 1.3916352762999494e-07, + "loss": 0.0026, + "step": 15716 + }, + { + "epoch": 0.3, + "learning_rate": 1.391596442856588e-07, + "loss": 0.2893, + "step": 15717 + }, + { + "epoch": 0.3, + "learning_rate": 1.3915576094132265e-07, + "loss": 0.001, + "step": 15718 + }, + { + "epoch": 0.3, + "learning_rate": 1.3915187759698652e-07, + "loss": 0.1225, + "step": 15719 + }, + { + "epoch": 0.3, + "learning_rate": 1.3914799425265037e-07, + "loss": 0.713, + "step": 15720 + }, + { + "epoch": 0.3, + "learning_rate": 1.3914411090831424e-07, + "loss": 0.0012, + "step": 15721 + }, + { + "epoch": 0.3, + "learning_rate": 1.3914022756397808e-07, + "loss": 0.9064, + "step": 15722 + }, + { + "epoch": 0.3, + "learning_rate": 1.3913634421964196e-07, + "loss": 0.5457, + "step": 15723 + }, + { + "epoch": 0.31, + "learning_rate": 1.391324608753058e-07, + "loss": 0.012, + "step": 15724 + }, + { + "epoch": 0.31, + "learning_rate": 1.3912857753096967e-07, + "loss": 0.0011, + "step": 15725 + }, + { + "epoch": 0.31, + "learning_rate": 1.3912469418663352e-07, + "loss": 0.6306, + "step": 15726 + }, + { + "epoch": 0.31, + "learning_rate": 1.391208108422974e-07, + "loss": 0.0011, + "step": 15727 + }, + { + "epoch": 0.31, + "learning_rate": 1.3911692749796123e-07, + "loss": 0.0011, + "step": 15728 + }, + { + "epoch": 0.31, + "learning_rate": 1.391130441536251e-07, + "loss": 0.0011, + "step": 15729 + }, + { + "epoch": 0.31, + "learning_rate": 1.3910916080928895e-07, + "loss": 0.0055, + "step": 15730 + }, + { + "epoch": 0.31, + "learning_rate": 1.3910527746495282e-07, + "loss": 0.1032, + "step": 15731 + }, + { + "epoch": 0.31, + "learning_rate": 1.3910139412061667e-07, + "loss": 0.0014, + "step": 15732 + }, + { + "epoch": 0.31, + "learning_rate": 1.3909751077628054e-07, + "loss": 0.0011, + "step": 15733 + }, + { + "epoch": 0.31, + "learning_rate": 1.3909362743194438e-07, + "loss": 0.0012, + "step": 15734 + }, + { + "epoch": 0.31, + "learning_rate": 1.3908974408760825e-07, + "loss": 0.0013, + "step": 15735 + }, + { + "epoch": 0.31, + "learning_rate": 1.390858607432721e-07, + "loss": 0.0016, + "step": 15736 + }, + { + "epoch": 0.31, + "learning_rate": 1.3908197739893597e-07, + "loss": 0.0016, + "step": 15737 + }, + { + "epoch": 0.31, + "learning_rate": 1.3907809405459982e-07, + "loss": 0.0037, + "step": 15738 + }, + { + "epoch": 0.31, + "learning_rate": 1.3907421071026366e-07, + "loss": 0.0011, + "step": 15739 + }, + { + "epoch": 0.31, + "learning_rate": 1.3907032736592753e-07, + "loss": 0.0014, + "step": 15740 + }, + { + "epoch": 0.31, + "learning_rate": 1.3906644402159138e-07, + "loss": 0.0009, + "step": 15741 + }, + { + "epoch": 0.31, + "learning_rate": 1.3906256067725525e-07, + "loss": 0.0012, + "step": 15742 + }, + { + "epoch": 0.31, + "learning_rate": 1.390586773329191e-07, + "loss": 0.0016, + "step": 15743 + }, + { + "epoch": 0.31, + "learning_rate": 1.3905479398858294e-07, + "loss": 0.3965, + "step": 15744 + }, + { + "epoch": 0.31, + "learning_rate": 1.390509106442468e-07, + "loss": 0.0008, + "step": 15745 + }, + { + "epoch": 0.31, + "learning_rate": 1.3904702729991066e-07, + "loss": 0.001, + "step": 15746 + }, + { + "epoch": 0.31, + "learning_rate": 1.3904314395557453e-07, + "loss": 0.0011, + "step": 15747 + }, + { + "epoch": 0.31, + "learning_rate": 1.3903926061123837e-07, + "loss": 0.0011, + "step": 15748 + }, + { + "epoch": 0.31, + "learning_rate": 1.3903537726690224e-07, + "loss": 0.0015, + "step": 15749 + }, + { + "epoch": 0.31, + "learning_rate": 1.390314939225661e-07, + "loss": 0.0009, + "step": 15750 + }, + { + "epoch": 0.31, + "learning_rate": 1.3902761057822996e-07, + "loss": 0.0017, + "step": 15751 + }, + { + "epoch": 0.31, + "learning_rate": 1.390237272338938e-07, + "loss": 0.002, + "step": 15752 + }, + { + "epoch": 0.31, + "learning_rate": 1.3901984388955768e-07, + "loss": 0.0012, + "step": 15753 + }, + { + "epoch": 0.31, + "learning_rate": 1.3901596054522152e-07, + "loss": 0.0014, + "step": 15754 + }, + { + "epoch": 0.31, + "learning_rate": 1.390120772008854e-07, + "loss": 0.2426, + "step": 15755 + }, + { + "epoch": 0.31, + "learning_rate": 1.3900819385654924e-07, + "loss": 0.0021, + "step": 15756 + }, + { + "epoch": 0.31, + "learning_rate": 1.390043105122131e-07, + "loss": 0.4505, + "step": 15757 + }, + { + "epoch": 0.31, + "learning_rate": 1.3900042716787695e-07, + "loss": 0.0016, + "step": 15758 + }, + { + "epoch": 0.31, + "learning_rate": 1.3899654382354083e-07, + "loss": 0.0011, + "step": 15759 + }, + { + "epoch": 0.31, + "learning_rate": 1.3899266047920467e-07, + "loss": 0.5188, + "step": 15760 + }, + { + "epoch": 0.31, + "learning_rate": 1.3898877713486854e-07, + "loss": 0.0712, + "step": 15761 + }, + { + "epoch": 0.31, + "learning_rate": 1.389848937905324e-07, + "loss": 0.0011, + "step": 15762 + }, + { + "epoch": 0.31, + "learning_rate": 1.3898101044619626e-07, + "loss": 0.0014, + "step": 15763 + }, + { + "epoch": 0.31, + "learning_rate": 1.389771271018601e-07, + "loss": 0.0013, + "step": 15764 + }, + { + "epoch": 0.31, + "learning_rate": 1.3897324375752398e-07, + "loss": 0.0021, + "step": 15765 + }, + { + "epoch": 0.31, + "learning_rate": 1.3896936041318782e-07, + "loss": 0.418, + "step": 15766 + }, + { + "epoch": 0.31, + "learning_rate": 1.389654770688517e-07, + "loss": 0.002, + "step": 15767 + }, + { + "epoch": 0.31, + "learning_rate": 1.3896159372451554e-07, + "loss": 0.0013, + "step": 15768 + }, + { + "epoch": 0.31, + "learning_rate": 1.389577103801794e-07, + "loss": 0.0011, + "step": 15769 + }, + { + "epoch": 0.31, + "learning_rate": 1.3895382703584325e-07, + "loss": 0.0088, + "step": 15770 + }, + { + "epoch": 0.31, + "learning_rate": 1.3894994369150713e-07, + "loss": 0.001, + "step": 15771 + }, + { + "epoch": 0.31, + "learning_rate": 1.3894606034717097e-07, + "loss": 0.0011, + "step": 15772 + }, + { + "epoch": 0.31, + "learning_rate": 1.3894217700283484e-07, + "loss": 0.0011, + "step": 15773 + }, + { + "epoch": 0.31, + "learning_rate": 1.389382936584987e-07, + "loss": 0.0011, + "step": 15774 + }, + { + "epoch": 0.31, + "learning_rate": 1.3893441031416256e-07, + "loss": 0.0011, + "step": 15775 + }, + { + "epoch": 0.31, + "learning_rate": 1.389305269698264e-07, + "loss": 0.0175, + "step": 15776 + }, + { + "epoch": 0.31, + "learning_rate": 1.3892664362549027e-07, + "loss": 0.0012, + "step": 15777 + }, + { + "epoch": 0.31, + "learning_rate": 1.3892276028115412e-07, + "loss": 0.0079, + "step": 15778 + }, + { + "epoch": 0.31, + "learning_rate": 1.38918876936818e-07, + "loss": 0.666, + "step": 15779 + }, + { + "epoch": 0.31, + "learning_rate": 1.3891499359248184e-07, + "loss": 0.0009, + "step": 15780 + }, + { + "epoch": 0.31, + "learning_rate": 1.389111102481457e-07, + "loss": 0.0037, + "step": 15781 + }, + { + "epoch": 0.31, + "learning_rate": 1.3890722690380955e-07, + "loss": 0.0011, + "step": 15782 + }, + { + "epoch": 0.31, + "learning_rate": 1.3890334355947342e-07, + "loss": 0.0011, + "step": 15783 + }, + { + "epoch": 0.31, + "learning_rate": 1.3889946021513727e-07, + "loss": 0.001, + "step": 15784 + }, + { + "epoch": 0.31, + "learning_rate": 1.3889557687080114e-07, + "loss": 0.0055, + "step": 15785 + }, + { + "epoch": 0.31, + "learning_rate": 1.3889169352646499e-07, + "loss": 0.0012, + "step": 15786 + }, + { + "epoch": 0.31, + "learning_rate": 1.3888781018212886e-07, + "loss": 0.0011, + "step": 15787 + }, + { + "epoch": 0.31, + "learning_rate": 1.388839268377927e-07, + "loss": 0.0012, + "step": 15788 + }, + { + "epoch": 0.31, + "learning_rate": 1.3888004349345657e-07, + "loss": 0.0019, + "step": 15789 + }, + { + "epoch": 0.31, + "learning_rate": 1.3887616014912042e-07, + "loss": 0.0043, + "step": 15790 + }, + { + "epoch": 0.31, + "learning_rate": 1.388722768047843e-07, + "loss": 0.0261, + "step": 15791 + }, + { + "epoch": 0.31, + "learning_rate": 1.3886839346044814e-07, + "loss": 0.0016, + "step": 15792 + }, + { + "epoch": 0.31, + "learning_rate": 1.38864510116112e-07, + "loss": 0.0011, + "step": 15793 + }, + { + "epoch": 0.31, + "learning_rate": 1.3886062677177585e-07, + "loss": 0.0058, + "step": 15794 + }, + { + "epoch": 0.31, + "learning_rate": 1.3885674342743972e-07, + "loss": 0.0027, + "step": 15795 + }, + { + "epoch": 0.31, + "learning_rate": 1.3885286008310357e-07, + "loss": 0.0009, + "step": 15796 + }, + { + "epoch": 0.31, + "learning_rate": 1.388489767387674e-07, + "loss": 0.001, + "step": 15797 + }, + { + "epoch": 0.31, + "learning_rate": 1.3884509339443126e-07, + "loss": 0.1189, + "step": 15798 + }, + { + "epoch": 0.31, + "learning_rate": 1.3884121005009513e-07, + "loss": 0.9605, + "step": 15799 + }, + { + "epoch": 0.31, + "learning_rate": 1.3883732670575897e-07, + "loss": 0.0013, + "step": 15800 + }, + { + "epoch": 0.31, + "learning_rate": 1.3883344336142285e-07, + "loss": 0.0011, + "step": 15801 + }, + { + "epoch": 0.31, + "learning_rate": 1.388295600170867e-07, + "loss": 0.0011, + "step": 15802 + }, + { + "epoch": 0.31, + "learning_rate": 1.3882567667275056e-07, + "loss": 0.015, + "step": 15803 + }, + { + "epoch": 0.31, + "learning_rate": 1.388217933284144e-07, + "loss": 0.001, + "step": 15804 + }, + { + "epoch": 0.31, + "learning_rate": 1.3881790998407828e-07, + "loss": 0.0035, + "step": 15805 + }, + { + "epoch": 0.31, + "learning_rate": 1.3881402663974212e-07, + "loss": 0.002, + "step": 15806 + }, + { + "epoch": 0.31, + "learning_rate": 1.38810143295406e-07, + "loss": 0.001, + "step": 15807 + }, + { + "epoch": 0.31, + "learning_rate": 1.3880625995106984e-07, + "loss": 0.0111, + "step": 15808 + }, + { + "epoch": 0.31, + "learning_rate": 1.388023766067337e-07, + "loss": 0.3888, + "step": 15809 + }, + { + "epoch": 0.31, + "learning_rate": 1.3879849326239756e-07, + "loss": 0.0118, + "step": 15810 + }, + { + "epoch": 0.31, + "learning_rate": 1.3879460991806143e-07, + "loss": 0.0032, + "step": 15811 + }, + { + "epoch": 0.31, + "learning_rate": 1.3879072657372527e-07, + "loss": 0.0012, + "step": 15812 + }, + { + "epoch": 0.31, + "learning_rate": 1.3878684322938915e-07, + "loss": 0.0011, + "step": 15813 + }, + { + "epoch": 0.31, + "learning_rate": 1.38782959885053e-07, + "loss": 0.0019, + "step": 15814 + }, + { + "epoch": 0.31, + "learning_rate": 1.3877907654071686e-07, + "loss": 0.0009, + "step": 15815 + }, + { + "epoch": 0.31, + "learning_rate": 1.387751931963807e-07, + "loss": 0.0018, + "step": 15816 + }, + { + "epoch": 0.31, + "learning_rate": 1.3877130985204458e-07, + "loss": 0.0011, + "step": 15817 + }, + { + "epoch": 0.31, + "learning_rate": 1.3876742650770842e-07, + "loss": 0.001, + "step": 15818 + }, + { + "epoch": 0.31, + "learning_rate": 1.387635431633723e-07, + "loss": 0.5852, + "step": 15819 + }, + { + "epoch": 0.31, + "learning_rate": 1.3875965981903614e-07, + "loss": 0.0009, + "step": 15820 + }, + { + "epoch": 0.31, + "learning_rate": 1.387557764747e-07, + "loss": 0.0009, + "step": 15821 + }, + { + "epoch": 0.31, + "learning_rate": 1.3875189313036386e-07, + "loss": 0.4411, + "step": 15822 + }, + { + "epoch": 0.31, + "learning_rate": 1.3874800978602773e-07, + "loss": 0.0013, + "step": 15823 + }, + { + "epoch": 0.31, + "learning_rate": 1.3874412644169157e-07, + "loss": 0.0012, + "step": 15824 + }, + { + "epoch": 0.31, + "learning_rate": 1.3874024309735544e-07, + "loss": 0.0009, + "step": 15825 + }, + { + "epoch": 0.31, + "learning_rate": 1.387363597530193e-07, + "loss": 0.0015, + "step": 15826 + }, + { + "epoch": 0.31, + "learning_rate": 1.3873247640868316e-07, + "loss": 0.0014, + "step": 15827 + }, + { + "epoch": 0.31, + "learning_rate": 1.38728593064347e-07, + "loss": 0.0303, + "step": 15828 + }, + { + "epoch": 0.31, + "learning_rate": 1.3872470972001088e-07, + "loss": 0.0018, + "step": 15829 + }, + { + "epoch": 0.31, + "learning_rate": 1.3872082637567472e-07, + "loss": 0.0012, + "step": 15830 + }, + { + "epoch": 0.31, + "learning_rate": 1.387169430313386e-07, + "loss": 0.0425, + "step": 15831 + }, + { + "epoch": 0.31, + "learning_rate": 1.3871305968700244e-07, + "loss": 0.0011, + "step": 15832 + }, + { + "epoch": 0.31, + "learning_rate": 1.387091763426663e-07, + "loss": 0.001, + "step": 15833 + }, + { + "epoch": 0.31, + "learning_rate": 1.3870529299833015e-07, + "loss": 0.258, + "step": 15834 + }, + { + "epoch": 0.31, + "learning_rate": 1.3870140965399403e-07, + "loss": 0.2766, + "step": 15835 + }, + { + "epoch": 0.31, + "learning_rate": 1.3869752630965787e-07, + "loss": 0.0009, + "step": 15836 + }, + { + "epoch": 0.31, + "learning_rate": 1.3869364296532174e-07, + "loss": 0.058, + "step": 15837 + }, + { + "epoch": 0.31, + "learning_rate": 1.386897596209856e-07, + "loss": 0.8768, + "step": 15838 + }, + { + "epoch": 0.31, + "learning_rate": 1.3868587627664946e-07, + "loss": 0.001, + "step": 15839 + }, + { + "epoch": 0.31, + "learning_rate": 1.386819929323133e-07, + "loss": 0.0011, + "step": 15840 + }, + { + "epoch": 0.31, + "learning_rate": 1.3867810958797718e-07, + "loss": 0.4366, + "step": 15841 + }, + { + "epoch": 0.31, + "learning_rate": 1.3867422624364102e-07, + "loss": 0.0012, + "step": 15842 + }, + { + "epoch": 0.31, + "learning_rate": 1.386703428993049e-07, + "loss": 0.0012, + "step": 15843 + }, + { + "epoch": 0.31, + "learning_rate": 1.3866645955496874e-07, + "loss": 0.005, + "step": 15844 + }, + { + "epoch": 0.31, + "learning_rate": 1.386625762106326e-07, + "loss": 0.0011, + "step": 15845 + }, + { + "epoch": 0.31, + "learning_rate": 1.3865869286629645e-07, + "loss": 0.0197, + "step": 15846 + }, + { + "epoch": 0.31, + "learning_rate": 1.3865480952196033e-07, + "loss": 0.0105, + "step": 15847 + }, + { + "epoch": 0.31, + "learning_rate": 1.3865092617762417e-07, + "loss": 0.0015, + "step": 15848 + }, + { + "epoch": 0.31, + "learning_rate": 1.3864704283328804e-07, + "loss": 0.017, + "step": 15849 + }, + { + "epoch": 0.31, + "learning_rate": 1.386431594889519e-07, + "loss": 0.0015, + "step": 15850 + }, + { + "epoch": 0.31, + "learning_rate": 1.3863927614461576e-07, + "loss": 0.0017, + "step": 15851 + }, + { + "epoch": 0.31, + "learning_rate": 1.386353928002796e-07, + "loss": 1.2217, + "step": 15852 + }, + { + "epoch": 0.31, + "learning_rate": 1.3863150945594347e-07, + "loss": 1.0292, + "step": 15853 + }, + { + "epoch": 0.31, + "learning_rate": 1.3862762611160732e-07, + "loss": 0.0037, + "step": 15854 + }, + { + "epoch": 0.31, + "learning_rate": 1.3862374276727116e-07, + "loss": 0.0009, + "step": 15855 + }, + { + "epoch": 0.31, + "learning_rate": 1.38619859422935e-07, + "loss": 0.0009, + "step": 15856 + }, + { + "epoch": 0.31, + "learning_rate": 1.3861597607859888e-07, + "loss": 0.001, + "step": 15857 + }, + { + "epoch": 0.31, + "learning_rate": 1.3861209273426273e-07, + "loss": 0.0011, + "step": 15858 + }, + { + "epoch": 0.31, + "learning_rate": 1.386082093899266e-07, + "loss": 0.0008, + "step": 15859 + }, + { + "epoch": 0.31, + "learning_rate": 1.3860432604559044e-07, + "loss": 0.4995, + "step": 15860 + }, + { + "epoch": 0.31, + "learning_rate": 1.3860044270125431e-07, + "loss": 0.6194, + "step": 15861 + }, + { + "epoch": 0.31, + "learning_rate": 1.3859655935691816e-07, + "loss": 0.0011, + "step": 15862 + }, + { + "epoch": 0.31, + "learning_rate": 1.3859267601258203e-07, + "loss": 0.0031, + "step": 15863 + }, + { + "epoch": 0.31, + "learning_rate": 1.3858879266824588e-07, + "loss": 0.0057, + "step": 15864 + }, + { + "epoch": 0.31, + "learning_rate": 1.3858490932390975e-07, + "loss": 0.0011, + "step": 15865 + }, + { + "epoch": 0.31, + "learning_rate": 1.385810259795736e-07, + "loss": 0.0012, + "step": 15866 + }, + { + "epoch": 0.31, + "learning_rate": 1.3857714263523746e-07, + "loss": 0.0057, + "step": 15867 + }, + { + "epoch": 0.31, + "learning_rate": 1.385732592909013e-07, + "loss": 0.5241, + "step": 15868 + }, + { + "epoch": 0.31, + "learning_rate": 1.3856937594656518e-07, + "loss": 0.0129, + "step": 15869 + }, + { + "epoch": 0.31, + "learning_rate": 1.3856549260222903e-07, + "loss": 0.0011, + "step": 15870 + }, + { + "epoch": 0.31, + "learning_rate": 1.385616092578929e-07, + "loss": 0.0011, + "step": 15871 + }, + { + "epoch": 0.31, + "learning_rate": 1.3855772591355674e-07, + "loss": 0.001, + "step": 15872 + }, + { + "epoch": 0.31, + "learning_rate": 1.3855384256922061e-07, + "loss": 0.0038, + "step": 15873 + }, + { + "epoch": 0.31, + "learning_rate": 1.3854995922488446e-07, + "loss": 0.0011, + "step": 15874 + }, + { + "epoch": 0.31, + "learning_rate": 1.3854607588054833e-07, + "loss": 0.0011, + "step": 15875 + }, + { + "epoch": 0.31, + "learning_rate": 1.3854219253621217e-07, + "loss": 0.0014, + "step": 15876 + }, + { + "epoch": 0.31, + "learning_rate": 1.3853830919187605e-07, + "loss": 0.0014, + "step": 15877 + }, + { + "epoch": 0.31, + "learning_rate": 1.385344258475399e-07, + "loss": 0.001, + "step": 15878 + }, + { + "epoch": 0.31, + "learning_rate": 1.3853054250320376e-07, + "loss": 0.3028, + "step": 15879 + }, + { + "epoch": 0.31, + "learning_rate": 1.385266591588676e-07, + "loss": 0.0011, + "step": 15880 + }, + { + "epoch": 0.31, + "learning_rate": 1.3852277581453148e-07, + "loss": 0.0018, + "step": 15881 + }, + { + "epoch": 0.31, + "learning_rate": 1.3851889247019532e-07, + "loss": 0.0015, + "step": 15882 + }, + { + "epoch": 0.31, + "learning_rate": 1.385150091258592e-07, + "loss": 0.0009, + "step": 15883 + }, + { + "epoch": 0.31, + "learning_rate": 1.3851112578152304e-07, + "loss": 0.0018, + "step": 15884 + }, + { + "epoch": 0.31, + "learning_rate": 1.385072424371869e-07, + "loss": 0.0099, + "step": 15885 + }, + { + "epoch": 0.31, + "learning_rate": 1.3850335909285076e-07, + "loss": 0.0038, + "step": 15886 + }, + { + "epoch": 0.31, + "learning_rate": 1.3849947574851463e-07, + "loss": 0.0018, + "step": 15887 + }, + { + "epoch": 0.31, + "learning_rate": 1.3849559240417847e-07, + "loss": 0.0011, + "step": 15888 + }, + { + "epoch": 0.31, + "learning_rate": 1.3849170905984235e-07, + "loss": 0.0021, + "step": 15889 + }, + { + "epoch": 0.31, + "learning_rate": 1.384878257155062e-07, + "loss": 0.2933, + "step": 15890 + }, + { + "epoch": 0.31, + "learning_rate": 1.3848394237117004e-07, + "loss": 0.0026, + "step": 15891 + }, + { + "epoch": 0.31, + "learning_rate": 1.384800590268339e-07, + "loss": 0.0018, + "step": 15892 + }, + { + "epoch": 0.31, + "learning_rate": 1.3847617568249775e-07, + "loss": 0.1645, + "step": 15893 + }, + { + "epoch": 0.31, + "learning_rate": 1.3847229233816162e-07, + "loss": 0.0016, + "step": 15894 + }, + { + "epoch": 0.31, + "learning_rate": 1.3846840899382547e-07, + "loss": 0.0016, + "step": 15895 + }, + { + "epoch": 0.31, + "learning_rate": 1.3846452564948934e-07, + "loss": 0.0059, + "step": 15896 + }, + { + "epoch": 0.31, + "learning_rate": 1.3846064230515318e-07, + "loss": 0.001, + "step": 15897 + }, + { + "epoch": 0.31, + "learning_rate": 1.3845675896081706e-07, + "loss": 0.0012, + "step": 15898 + }, + { + "epoch": 0.31, + "learning_rate": 1.384528756164809e-07, + "loss": 0.0018, + "step": 15899 + }, + { + "epoch": 0.31, + "learning_rate": 1.3844899227214477e-07, + "loss": 0.4055, + "step": 15900 + }, + { + "epoch": 0.31, + "learning_rate": 1.3844510892780862e-07, + "loss": 0.0012, + "step": 15901 + }, + { + "epoch": 0.31, + "learning_rate": 1.384412255834725e-07, + "loss": 0.0048, + "step": 15902 + }, + { + "epoch": 0.31, + "learning_rate": 1.3843734223913633e-07, + "loss": 0.051, + "step": 15903 + }, + { + "epoch": 0.31, + "learning_rate": 1.384334588948002e-07, + "loss": 0.9414, + "step": 15904 + }, + { + "epoch": 0.31, + "learning_rate": 1.3842957555046405e-07, + "loss": 0.1912, + "step": 15905 + }, + { + "epoch": 0.31, + "learning_rate": 1.3842569220612792e-07, + "loss": 0.0026, + "step": 15906 + }, + { + "epoch": 0.31, + "learning_rate": 1.3842180886179177e-07, + "loss": 0.746, + "step": 15907 + }, + { + "epoch": 0.31, + "learning_rate": 1.3841792551745564e-07, + "loss": 0.0013, + "step": 15908 + }, + { + "epoch": 0.31, + "learning_rate": 1.3841404217311948e-07, + "loss": 0.1566, + "step": 15909 + }, + { + "epoch": 0.31, + "learning_rate": 1.3841015882878336e-07, + "loss": 0.5201, + "step": 15910 + }, + { + "epoch": 0.31, + "learning_rate": 1.384062754844472e-07, + "loss": 0.001, + "step": 15911 + }, + { + "epoch": 0.31, + "learning_rate": 1.3840239214011107e-07, + "loss": 0.001, + "step": 15912 + }, + { + "epoch": 0.31, + "learning_rate": 1.3839850879577492e-07, + "loss": 0.0026, + "step": 15913 + }, + { + "epoch": 0.31, + "learning_rate": 1.3839462545143876e-07, + "loss": 0.0021, + "step": 15914 + }, + { + "epoch": 0.31, + "learning_rate": 1.3839074210710263e-07, + "loss": 0.0009, + "step": 15915 + }, + { + "epoch": 0.31, + "learning_rate": 1.3838685876276648e-07, + "loss": 0.0016, + "step": 15916 + }, + { + "epoch": 0.31, + "learning_rate": 1.3838297541843035e-07, + "loss": 0.0337, + "step": 15917 + }, + { + "epoch": 0.31, + "learning_rate": 1.383790920740942e-07, + "loss": 1.0106, + "step": 15918 + }, + { + "epoch": 0.31, + "learning_rate": 1.3837520872975807e-07, + "loss": 0.0025, + "step": 15919 + }, + { + "epoch": 0.31, + "learning_rate": 1.383713253854219e-07, + "loss": 0.0037, + "step": 15920 + }, + { + "epoch": 0.31, + "learning_rate": 1.3836744204108576e-07, + "loss": 0.001, + "step": 15921 + }, + { + "epoch": 0.31, + "learning_rate": 1.3836355869674963e-07, + "loss": 1.1463, + "step": 15922 + }, + { + "epoch": 0.31, + "learning_rate": 1.3835967535241347e-07, + "loss": 0.0009, + "step": 15923 + }, + { + "epoch": 0.31, + "learning_rate": 1.3835579200807734e-07, + "loss": 0.001, + "step": 15924 + }, + { + "epoch": 0.31, + "learning_rate": 1.383519086637412e-07, + "loss": 0.0011, + "step": 15925 + }, + { + "epoch": 0.31, + "learning_rate": 1.3834802531940506e-07, + "loss": 0.0355, + "step": 15926 + }, + { + "epoch": 0.31, + "learning_rate": 1.383441419750689e-07, + "loss": 0.0754, + "step": 15927 + }, + { + "epoch": 0.31, + "learning_rate": 1.3834025863073278e-07, + "loss": 0.0011, + "step": 15928 + }, + { + "epoch": 0.31, + "learning_rate": 1.3833637528639662e-07, + "loss": 0.0008, + "step": 15929 + }, + { + "epoch": 0.31, + "learning_rate": 1.383324919420605e-07, + "loss": 0.0025, + "step": 15930 + }, + { + "epoch": 0.31, + "learning_rate": 1.3832860859772434e-07, + "loss": 0.0011, + "step": 15931 + }, + { + "epoch": 0.31, + "learning_rate": 1.383247252533882e-07, + "loss": 0.001, + "step": 15932 + }, + { + "epoch": 0.31, + "learning_rate": 1.3832084190905205e-07, + "loss": 0.011, + "step": 15933 + }, + { + "epoch": 0.31, + "learning_rate": 1.3831695856471593e-07, + "loss": 0.001, + "step": 15934 + }, + { + "epoch": 0.31, + "learning_rate": 1.3831307522037977e-07, + "loss": 0.0009, + "step": 15935 + }, + { + "epoch": 0.31, + "learning_rate": 1.3830919187604364e-07, + "loss": 0.5652, + "step": 15936 + }, + { + "epoch": 0.31, + "learning_rate": 1.383053085317075e-07, + "loss": 0.001, + "step": 15937 + }, + { + "epoch": 0.31, + "learning_rate": 1.3830142518737136e-07, + "loss": 0.001, + "step": 15938 + }, + { + "epoch": 0.31, + "learning_rate": 1.382975418430352e-07, + "loss": 0.0011, + "step": 15939 + }, + { + "epoch": 0.31, + "learning_rate": 1.3829365849869908e-07, + "loss": 0.001, + "step": 15940 + }, + { + "epoch": 0.31, + "learning_rate": 1.3828977515436292e-07, + "loss": 0.0017, + "step": 15941 + }, + { + "epoch": 0.31, + "learning_rate": 1.382858918100268e-07, + "loss": 0.8389, + "step": 15942 + }, + { + "epoch": 0.31, + "learning_rate": 1.3828200846569064e-07, + "loss": 0.3038, + "step": 15943 + }, + { + "epoch": 0.31, + "learning_rate": 1.382781251213545e-07, + "loss": 0.0014, + "step": 15944 + }, + { + "epoch": 0.31, + "learning_rate": 1.3827424177701835e-07, + "loss": 0.0009, + "step": 15945 + }, + { + "epoch": 0.31, + "learning_rate": 1.3827035843268223e-07, + "loss": 0.0014, + "step": 15946 + }, + { + "epoch": 0.31, + "learning_rate": 1.3826647508834607e-07, + "loss": 0.001, + "step": 15947 + }, + { + "epoch": 0.31, + "learning_rate": 1.3826259174400994e-07, + "loss": 0.0329, + "step": 15948 + }, + { + "epoch": 0.31, + "learning_rate": 1.382587083996738e-07, + "loss": 0.2745, + "step": 15949 + }, + { + "epoch": 0.31, + "learning_rate": 1.3825482505533766e-07, + "loss": 0.0012, + "step": 15950 + }, + { + "epoch": 0.31, + "learning_rate": 1.382509417110015e-07, + "loss": 0.001, + "step": 15951 + }, + { + "epoch": 0.31, + "learning_rate": 1.3824705836666537e-07, + "loss": 0.0015, + "step": 15952 + }, + { + "epoch": 0.31, + "learning_rate": 1.3824317502232922e-07, + "loss": 0.173, + "step": 15953 + }, + { + "epoch": 0.31, + "learning_rate": 1.382392916779931e-07, + "loss": 0.001, + "step": 15954 + }, + { + "epoch": 0.31, + "learning_rate": 1.3823540833365694e-07, + "loss": 0.001, + "step": 15955 + }, + { + "epoch": 0.31, + "learning_rate": 1.382315249893208e-07, + "loss": 0.0012, + "step": 15956 + }, + { + "epoch": 0.31, + "learning_rate": 1.3822764164498465e-07, + "loss": 0.0362, + "step": 15957 + }, + { + "epoch": 0.31, + "learning_rate": 1.3822375830064852e-07, + "loss": 0.0014, + "step": 15958 + }, + { + "epoch": 0.31, + "learning_rate": 1.3821987495631237e-07, + "loss": 0.0011, + "step": 15959 + }, + { + "epoch": 0.31, + "learning_rate": 1.3821599161197624e-07, + "loss": 0.0018, + "step": 15960 + }, + { + "epoch": 0.31, + "learning_rate": 1.3821210826764009e-07, + "loss": 0.001, + "step": 15961 + }, + { + "epoch": 0.31, + "learning_rate": 1.3820822492330396e-07, + "loss": 0.0009, + "step": 15962 + }, + { + "epoch": 0.31, + "learning_rate": 1.382043415789678e-07, + "loss": 0.0009, + "step": 15963 + }, + { + "epoch": 0.31, + "learning_rate": 1.3820045823463167e-07, + "loss": 0.0014, + "step": 15964 + }, + { + "epoch": 0.31, + "learning_rate": 1.3819657489029552e-07, + "loss": 0.6332, + "step": 15965 + }, + { + "epoch": 0.31, + "learning_rate": 1.381926915459594e-07, + "loss": 0.9372, + "step": 15966 + }, + { + "epoch": 0.31, + "learning_rate": 1.3818880820162324e-07, + "loss": 0.0176, + "step": 15967 + }, + { + "epoch": 0.31, + "learning_rate": 1.381849248572871e-07, + "loss": 0.0009, + "step": 15968 + }, + { + "epoch": 0.31, + "learning_rate": 1.3818104151295095e-07, + "loss": 0.0013, + "step": 15969 + }, + { + "epoch": 0.31, + "learning_rate": 1.3817715816861482e-07, + "loss": 0.4909, + "step": 15970 + }, + { + "epoch": 0.31, + "learning_rate": 1.3817327482427864e-07, + "loss": 0.0013, + "step": 15971 + }, + { + "epoch": 0.31, + "learning_rate": 1.3816939147994251e-07, + "loss": 0.0056, + "step": 15972 + }, + { + "epoch": 0.31, + "learning_rate": 1.3816550813560636e-07, + "loss": 0.0013, + "step": 15973 + }, + { + "epoch": 0.31, + "learning_rate": 1.3816162479127023e-07, + "loss": 0.0011, + "step": 15974 + }, + { + "epoch": 0.31, + "learning_rate": 1.3815774144693407e-07, + "loss": 0.0011, + "step": 15975 + }, + { + "epoch": 0.31, + "learning_rate": 1.3815385810259795e-07, + "loss": 0.0011, + "step": 15976 + }, + { + "epoch": 0.31, + "learning_rate": 1.381499747582618e-07, + "loss": 0.0013, + "step": 15977 + }, + { + "epoch": 0.31, + "learning_rate": 1.3814609141392566e-07, + "loss": 0.0012, + "step": 15978 + }, + { + "epoch": 0.31, + "learning_rate": 1.381422080695895e-07, + "loss": 0.0065, + "step": 15979 + }, + { + "epoch": 0.31, + "learning_rate": 1.3813832472525338e-07, + "loss": 0.0045, + "step": 15980 + }, + { + "epoch": 0.31, + "learning_rate": 1.3813444138091722e-07, + "loss": 0.0016, + "step": 15981 + }, + { + "epoch": 0.31, + "learning_rate": 1.381305580365811e-07, + "loss": 0.7091, + "step": 15982 + }, + { + "epoch": 0.31, + "learning_rate": 1.3812667469224494e-07, + "loss": 0.0469, + "step": 15983 + }, + { + "epoch": 0.31, + "learning_rate": 1.381227913479088e-07, + "loss": 0.0012, + "step": 15984 + }, + { + "epoch": 0.31, + "learning_rate": 1.3811890800357266e-07, + "loss": 0.0138, + "step": 15985 + }, + { + "epoch": 0.31, + "learning_rate": 1.3811502465923653e-07, + "loss": 0.0017, + "step": 15986 + }, + { + "epoch": 0.31, + "learning_rate": 1.3811114131490037e-07, + "loss": 0.001, + "step": 15987 + }, + { + "epoch": 0.31, + "learning_rate": 1.3810725797056425e-07, + "loss": 0.0294, + "step": 15988 + }, + { + "epoch": 0.31, + "learning_rate": 1.381033746262281e-07, + "loss": 0.8687, + "step": 15989 + }, + { + "epoch": 0.31, + "learning_rate": 1.3809949128189196e-07, + "loss": 0.0011, + "step": 15990 + }, + { + "epoch": 0.31, + "learning_rate": 1.380956079375558e-07, + "loss": 0.001, + "step": 15991 + }, + { + "epoch": 0.31, + "learning_rate": 1.3809172459321968e-07, + "loss": 0.0008, + "step": 15992 + }, + { + "epoch": 0.31, + "learning_rate": 1.3808784124888352e-07, + "loss": 0.001, + "step": 15993 + }, + { + "epoch": 0.31, + "learning_rate": 1.380839579045474e-07, + "loss": 0.2407, + "step": 15994 + }, + { + "epoch": 0.31, + "learning_rate": 1.3808007456021124e-07, + "loss": 0.0013, + "step": 15995 + }, + { + "epoch": 0.31, + "learning_rate": 1.380761912158751e-07, + "loss": 0.0314, + "step": 15996 + }, + { + "epoch": 0.31, + "learning_rate": 1.3807230787153896e-07, + "loss": 0.0297, + "step": 15997 + }, + { + "epoch": 0.31, + "learning_rate": 1.3806842452720283e-07, + "loss": 0.0012, + "step": 15998 + }, + { + "epoch": 0.31, + "learning_rate": 1.3806454118286667e-07, + "loss": 0.001, + "step": 15999 + }, + { + "epoch": 0.31, + "learning_rate": 1.3806065783853054e-07, + "loss": 1.1071, + "step": 16000 + }, + { + "epoch": 0.31, + "learning_rate": 1.380567744941944e-07, + "loss": 0.0009, + "step": 16001 + }, + { + "epoch": 0.31, + "learning_rate": 1.3805289114985826e-07, + "loss": 0.001, + "step": 16002 + }, + { + "epoch": 0.31, + "learning_rate": 1.380490078055221e-07, + "loss": 0.0009, + "step": 16003 + }, + { + "epoch": 0.31, + "learning_rate": 1.3804512446118598e-07, + "loss": 0.0023, + "step": 16004 + }, + { + "epoch": 0.31, + "learning_rate": 1.3804124111684982e-07, + "loss": 0.0011, + "step": 16005 + }, + { + "epoch": 0.31, + "learning_rate": 1.380373577725137e-07, + "loss": 0.8125, + "step": 16006 + }, + { + "epoch": 0.31, + "learning_rate": 1.3803347442817754e-07, + "loss": 0.0448, + "step": 16007 + }, + { + "epoch": 0.31, + "learning_rate": 1.380295910838414e-07, + "loss": 0.001, + "step": 16008 + }, + { + "epoch": 0.31, + "learning_rate": 1.3802570773950526e-07, + "loss": 0.0014, + "step": 16009 + }, + { + "epoch": 0.31, + "learning_rate": 1.3802182439516913e-07, + "loss": 0.0009, + "step": 16010 + }, + { + "epoch": 0.31, + "learning_rate": 1.3801794105083297e-07, + "loss": 0.0086, + "step": 16011 + }, + { + "epoch": 0.31, + "learning_rate": 1.3801405770649684e-07, + "loss": 0.001, + "step": 16012 + }, + { + "epoch": 0.31, + "learning_rate": 1.380101743621607e-07, + "loss": 0.002, + "step": 16013 + }, + { + "epoch": 0.31, + "learning_rate": 1.3800629101782456e-07, + "loss": 0.001, + "step": 16014 + }, + { + "epoch": 0.31, + "learning_rate": 1.380024076734884e-07, + "loss": 0.0027, + "step": 16015 + }, + { + "epoch": 0.31, + "learning_rate": 1.3799852432915228e-07, + "loss": 0.002, + "step": 16016 + }, + { + "epoch": 0.31, + "learning_rate": 1.3799464098481612e-07, + "loss": 0.0487, + "step": 16017 + }, + { + "epoch": 0.31, + "learning_rate": 1.3799075764048e-07, + "loss": 0.6022, + "step": 16018 + }, + { + "epoch": 0.31, + "learning_rate": 1.3798687429614384e-07, + "loss": 0.0011, + "step": 16019 + }, + { + "epoch": 0.31, + "learning_rate": 1.379829909518077e-07, + "loss": 0.3768, + "step": 16020 + }, + { + "epoch": 0.31, + "learning_rate": 1.3797910760747155e-07, + "loss": 0.3569, + "step": 16021 + }, + { + "epoch": 0.31, + "learning_rate": 1.3797522426313543e-07, + "loss": 0.0013, + "step": 16022 + }, + { + "epoch": 0.31, + "learning_rate": 1.3797134091879927e-07, + "loss": 0.001, + "step": 16023 + }, + { + "epoch": 0.31, + "learning_rate": 1.3796745757446314e-07, + "loss": 0.0014, + "step": 16024 + }, + { + "epoch": 0.31, + "learning_rate": 1.37963574230127e-07, + "loss": 0.0009, + "step": 16025 + }, + { + "epoch": 0.31, + "learning_rate": 1.3795969088579086e-07, + "loss": 0.0016, + "step": 16026 + }, + { + "epoch": 0.31, + "learning_rate": 1.379558075414547e-07, + "loss": 0.0045, + "step": 16027 + }, + { + "epoch": 0.31, + "learning_rate": 1.3795192419711857e-07, + "loss": 0.003, + "step": 16028 + }, + { + "epoch": 0.31, + "learning_rate": 1.379480408527824e-07, + "loss": 0.0009, + "step": 16029 + }, + { + "epoch": 0.31, + "learning_rate": 1.3794415750844626e-07, + "loss": 0.0015, + "step": 16030 + }, + { + "epoch": 0.31, + "learning_rate": 1.379402741641101e-07, + "loss": 0.9617, + "step": 16031 + }, + { + "epoch": 0.31, + "learning_rate": 1.3793639081977398e-07, + "loss": 0.001, + "step": 16032 + }, + { + "epoch": 0.31, + "learning_rate": 1.3793250747543783e-07, + "loss": 0.0048, + "step": 16033 + }, + { + "epoch": 0.31, + "learning_rate": 1.379286241311017e-07, + "loss": 0.1029, + "step": 16034 + }, + { + "epoch": 0.31, + "learning_rate": 1.3792474078676554e-07, + "loss": 0.2501, + "step": 16035 + }, + { + "epoch": 0.31, + "learning_rate": 1.3792085744242941e-07, + "loss": 0.001, + "step": 16036 + }, + { + "epoch": 0.31, + "learning_rate": 1.3791697409809326e-07, + "loss": 0.0257, + "step": 16037 + }, + { + "epoch": 0.31, + "learning_rate": 1.3791309075375713e-07, + "loss": 0.0011, + "step": 16038 + }, + { + "epoch": 0.31, + "learning_rate": 1.3790920740942098e-07, + "loss": 0.0015, + "step": 16039 + }, + { + "epoch": 0.31, + "learning_rate": 1.3790532406508485e-07, + "loss": 0.0009, + "step": 16040 + }, + { + "epoch": 0.31, + "learning_rate": 1.379014407207487e-07, + "loss": 0.0013, + "step": 16041 + }, + { + "epoch": 0.31, + "learning_rate": 1.3789755737641256e-07, + "loss": 0.0009, + "step": 16042 + }, + { + "epoch": 0.31, + "learning_rate": 1.378936740320764e-07, + "loss": 0.0011, + "step": 16043 + }, + { + "epoch": 0.31, + "learning_rate": 1.3788979068774028e-07, + "loss": 0.0013, + "step": 16044 + }, + { + "epoch": 0.31, + "learning_rate": 1.3788590734340413e-07, + "loss": 0.0015, + "step": 16045 + }, + { + "epoch": 0.31, + "learning_rate": 1.37882023999068e-07, + "loss": 0.0011, + "step": 16046 + }, + { + "epoch": 0.31, + "learning_rate": 1.3787814065473184e-07, + "loss": 0.001, + "step": 16047 + }, + { + "epoch": 0.31, + "learning_rate": 1.3787425731039571e-07, + "loss": 0.0007, + "step": 16048 + }, + { + "epoch": 0.31, + "learning_rate": 1.3787037396605956e-07, + "loss": 0.0009, + "step": 16049 + }, + { + "epoch": 0.31, + "learning_rate": 1.3786649062172343e-07, + "loss": 0.3393, + "step": 16050 + }, + { + "epoch": 0.31, + "learning_rate": 1.3786260727738727e-07, + "loss": 0.0033, + "step": 16051 + }, + { + "epoch": 0.31, + "learning_rate": 1.3785872393305115e-07, + "loss": 0.0021, + "step": 16052 + }, + { + "epoch": 0.31, + "learning_rate": 1.37854840588715e-07, + "loss": 0.0011, + "step": 16053 + }, + { + "epoch": 0.31, + "learning_rate": 1.3785095724437886e-07, + "loss": 0.001, + "step": 16054 + }, + { + "epoch": 0.31, + "learning_rate": 1.378470739000427e-07, + "loss": 0.0009, + "step": 16055 + }, + { + "epoch": 0.31, + "learning_rate": 1.3784319055570658e-07, + "loss": 0.001, + "step": 16056 + }, + { + "epoch": 0.31, + "learning_rate": 1.3783930721137042e-07, + "loss": 0.001, + "step": 16057 + }, + { + "epoch": 0.31, + "learning_rate": 1.378354238670343e-07, + "loss": 0.4426, + "step": 16058 + }, + { + "epoch": 0.31, + "learning_rate": 1.3783154052269814e-07, + "loss": 0.0013, + "step": 16059 + }, + { + "epoch": 0.31, + "learning_rate": 1.37827657178362e-07, + "loss": 0.1495, + "step": 16060 + }, + { + "epoch": 0.31, + "learning_rate": 1.3782377383402586e-07, + "loss": 0.0013, + "step": 16061 + }, + { + "epoch": 0.31, + "learning_rate": 1.3781989048968973e-07, + "loss": 0.0299, + "step": 16062 + }, + { + "epoch": 0.31, + "learning_rate": 1.3781600714535357e-07, + "loss": 0.009, + "step": 16063 + }, + { + "epoch": 0.31, + "learning_rate": 1.3781212380101745e-07, + "loss": 0.0055, + "step": 16064 + }, + { + "epoch": 0.31, + "learning_rate": 1.378082404566813e-07, + "loss": 0.0014, + "step": 16065 + }, + { + "epoch": 0.31, + "learning_rate": 1.3780435711234516e-07, + "loss": 0.0033, + "step": 16066 + }, + { + "epoch": 0.31, + "learning_rate": 1.37800473768009e-07, + "loss": 0.0019, + "step": 16067 + }, + { + "epoch": 0.31, + "learning_rate": 1.3779659042367285e-07, + "loss": 0.0497, + "step": 16068 + }, + { + "epoch": 0.31, + "learning_rate": 1.3779270707933672e-07, + "loss": 0.0113, + "step": 16069 + }, + { + "epoch": 0.31, + "learning_rate": 1.3778882373500057e-07, + "loss": 0.1374, + "step": 16070 + }, + { + "epoch": 0.31, + "learning_rate": 1.3778494039066444e-07, + "loss": 0.0015, + "step": 16071 + }, + { + "epoch": 0.31, + "learning_rate": 1.3778105704632828e-07, + "loss": 0.0014, + "step": 16072 + }, + { + "epoch": 0.31, + "learning_rate": 1.3777717370199216e-07, + "loss": 0.0008, + "step": 16073 + }, + { + "epoch": 0.31, + "learning_rate": 1.37773290357656e-07, + "loss": 0.4092, + "step": 16074 + }, + { + "epoch": 0.31, + "learning_rate": 1.3776940701331987e-07, + "loss": 0.0015, + "step": 16075 + }, + { + "epoch": 0.31, + "learning_rate": 1.3776552366898372e-07, + "loss": 0.7393, + "step": 16076 + }, + { + "epoch": 0.31, + "learning_rate": 1.377616403246476e-07, + "loss": 0.0011, + "step": 16077 + }, + { + "epoch": 0.31, + "learning_rate": 1.3775775698031143e-07, + "loss": 0.0009, + "step": 16078 + }, + { + "epoch": 0.31, + "learning_rate": 1.377538736359753e-07, + "loss": 0.0013, + "step": 16079 + }, + { + "epoch": 0.31, + "learning_rate": 1.3774999029163915e-07, + "loss": 0.0011, + "step": 16080 + }, + { + "epoch": 0.31, + "learning_rate": 1.3774610694730302e-07, + "loss": 0.3623, + "step": 16081 + }, + { + "epoch": 0.31, + "learning_rate": 1.3774222360296687e-07, + "loss": 0.0013, + "step": 16082 + }, + { + "epoch": 0.31, + "learning_rate": 1.3773834025863074e-07, + "loss": 0.0011, + "step": 16083 + }, + { + "epoch": 0.31, + "learning_rate": 1.3773445691429458e-07, + "loss": 0.0009, + "step": 16084 + }, + { + "epoch": 0.31, + "learning_rate": 1.3773057356995846e-07, + "loss": 0.0302, + "step": 16085 + }, + { + "epoch": 0.31, + "learning_rate": 1.377266902256223e-07, + "loss": 0.2991, + "step": 16086 + }, + { + "epoch": 0.31, + "learning_rate": 1.3772280688128615e-07, + "loss": 0.0009, + "step": 16087 + }, + { + "epoch": 0.31, + "learning_rate": 1.3771892353695002e-07, + "loss": 0.0011, + "step": 16088 + }, + { + "epoch": 0.31, + "learning_rate": 1.3771504019261386e-07, + "loss": 0.0803, + "step": 16089 + }, + { + "epoch": 0.31, + "learning_rate": 1.3771115684827773e-07, + "loss": 0.0014, + "step": 16090 + }, + { + "epoch": 0.31, + "learning_rate": 1.3770727350394158e-07, + "loss": 0.0009, + "step": 16091 + }, + { + "epoch": 0.31, + "learning_rate": 1.3770339015960545e-07, + "loss": 0.001, + "step": 16092 + }, + { + "epoch": 0.31, + "learning_rate": 1.376995068152693e-07, + "loss": 0.0017, + "step": 16093 + }, + { + "epoch": 0.31, + "learning_rate": 1.3769562347093317e-07, + "loss": 0.0665, + "step": 16094 + }, + { + "epoch": 0.31, + "learning_rate": 1.37691740126597e-07, + "loss": 0.001, + "step": 16095 + }, + { + "epoch": 0.31, + "learning_rate": 1.3768785678226088e-07, + "loss": 0.0009, + "step": 16096 + }, + { + "epoch": 0.31, + "learning_rate": 1.3768397343792473e-07, + "loss": 0.003, + "step": 16097 + }, + { + "epoch": 0.31, + "learning_rate": 1.3768009009358857e-07, + "loss": 0.0011, + "step": 16098 + }, + { + "epoch": 0.31, + "learning_rate": 1.3767620674925244e-07, + "loss": 0.0011, + "step": 16099 + }, + { + "epoch": 0.31, + "learning_rate": 1.376723234049163e-07, + "loss": 0.001, + "step": 16100 + }, + { + "epoch": 0.31, + "learning_rate": 1.3766844006058016e-07, + "loss": 0.0011, + "step": 16101 + }, + { + "epoch": 0.31, + "learning_rate": 1.37664556716244e-07, + "loss": 0.0124, + "step": 16102 + }, + { + "epoch": 0.31, + "learning_rate": 1.3766067337190788e-07, + "loss": 0.0014, + "step": 16103 + }, + { + "epoch": 0.31, + "learning_rate": 1.3765679002757172e-07, + "loss": 1.0229, + "step": 16104 + }, + { + "epoch": 0.31, + "learning_rate": 1.376529066832356e-07, + "loss": 0.0013, + "step": 16105 + }, + { + "epoch": 0.31, + "learning_rate": 1.3764902333889944e-07, + "loss": 0.001, + "step": 16106 + }, + { + "epoch": 0.31, + "learning_rate": 1.376451399945633e-07, + "loss": 0.0046, + "step": 16107 + }, + { + "epoch": 0.31, + "learning_rate": 1.3764125665022716e-07, + "loss": 0.0009, + "step": 16108 + }, + { + "epoch": 0.31, + "learning_rate": 1.3763737330589103e-07, + "loss": 0.0012, + "step": 16109 + }, + { + "epoch": 0.31, + "learning_rate": 1.3763348996155487e-07, + "loss": 0.9836, + "step": 16110 + }, + { + "epoch": 0.31, + "learning_rate": 1.3762960661721874e-07, + "loss": 0.001, + "step": 16111 + }, + { + "epoch": 0.31, + "learning_rate": 1.376257232728826e-07, + "loss": 0.0009, + "step": 16112 + }, + { + "epoch": 0.31, + "learning_rate": 1.3762183992854646e-07, + "loss": 0.0013, + "step": 16113 + }, + { + "epoch": 0.31, + "learning_rate": 1.376179565842103e-07, + "loss": 0.6754, + "step": 16114 + }, + { + "epoch": 0.31, + "learning_rate": 1.3761407323987418e-07, + "loss": 0.0093, + "step": 16115 + }, + { + "epoch": 0.31, + "learning_rate": 1.3761018989553802e-07, + "loss": 0.0013, + "step": 16116 + }, + { + "epoch": 0.31, + "learning_rate": 1.376063065512019e-07, + "loss": 0.001, + "step": 16117 + }, + { + "epoch": 0.31, + "learning_rate": 1.3760242320686574e-07, + "loss": 0.8476, + "step": 16118 + }, + { + "epoch": 0.31, + "learning_rate": 1.375985398625296e-07, + "loss": 0.0013, + "step": 16119 + }, + { + "epoch": 0.31, + "learning_rate": 1.3759465651819345e-07, + "loss": 0.0895, + "step": 16120 + }, + { + "epoch": 0.31, + "learning_rate": 1.3759077317385733e-07, + "loss": 0.4883, + "step": 16121 + }, + { + "epoch": 0.31, + "learning_rate": 1.3758688982952117e-07, + "loss": 0.0017, + "step": 16122 + }, + { + "epoch": 0.31, + "learning_rate": 1.3758300648518504e-07, + "loss": 0.0011, + "step": 16123 + }, + { + "epoch": 0.31, + "learning_rate": 1.375791231408489e-07, + "loss": 0.0012, + "step": 16124 + }, + { + "epoch": 0.31, + "learning_rate": 1.3757523979651276e-07, + "loss": 0.0011, + "step": 16125 + }, + { + "epoch": 0.31, + "learning_rate": 1.375713564521766e-07, + "loss": 0.1074, + "step": 16126 + }, + { + "epoch": 0.31, + "learning_rate": 1.3756747310784047e-07, + "loss": 0.1419, + "step": 16127 + }, + { + "epoch": 0.31, + "learning_rate": 1.3756358976350432e-07, + "loss": 1.2807, + "step": 16128 + }, + { + "epoch": 0.31, + "learning_rate": 1.375597064191682e-07, + "loss": 0.0011, + "step": 16129 + }, + { + "epoch": 0.31, + "learning_rate": 1.3755582307483204e-07, + "loss": 0.8198, + "step": 16130 + }, + { + "epoch": 0.31, + "learning_rate": 1.375519397304959e-07, + "loss": 0.0032, + "step": 16131 + }, + { + "epoch": 0.31, + "learning_rate": 1.3754805638615975e-07, + "loss": 0.0015, + "step": 16132 + }, + { + "epoch": 0.31, + "learning_rate": 1.3754417304182362e-07, + "loss": 1.1999, + "step": 16133 + }, + { + "epoch": 0.31, + "learning_rate": 1.3754028969748747e-07, + "loss": 0.001, + "step": 16134 + }, + { + "epoch": 0.31, + "learning_rate": 1.3753640635315134e-07, + "loss": 0.0013, + "step": 16135 + }, + { + "epoch": 0.31, + "learning_rate": 1.3753252300881519e-07, + "loss": 0.9078, + "step": 16136 + }, + { + "epoch": 0.31, + "learning_rate": 1.3752863966447906e-07, + "loss": 0.0061, + "step": 16137 + }, + { + "epoch": 0.31, + "learning_rate": 1.375247563201429e-07, + "loss": 0.002, + "step": 16138 + }, + { + "epoch": 0.31, + "learning_rate": 1.3752087297580677e-07, + "loss": 0.001, + "step": 16139 + }, + { + "epoch": 0.31, + "learning_rate": 1.3751698963147062e-07, + "loss": 0.001, + "step": 16140 + }, + { + "epoch": 0.31, + "learning_rate": 1.375131062871345e-07, + "loss": 0.0011, + "step": 16141 + }, + { + "epoch": 0.31, + "learning_rate": 1.3750922294279834e-07, + "loss": 0.0016, + "step": 16142 + }, + { + "epoch": 0.31, + "learning_rate": 1.375053395984622e-07, + "loss": 0.0011, + "step": 16143 + }, + { + "epoch": 0.31, + "learning_rate": 1.3750145625412605e-07, + "loss": 0.001, + "step": 16144 + }, + { + "epoch": 0.31, + "learning_rate": 1.374975729097899e-07, + "loss": 0.0012, + "step": 16145 + }, + { + "epoch": 0.31, + "learning_rate": 1.3749368956545374e-07, + "loss": 0.0021, + "step": 16146 + }, + { + "epoch": 0.31, + "learning_rate": 1.3748980622111761e-07, + "loss": 0.3094, + "step": 16147 + }, + { + "epoch": 0.31, + "learning_rate": 1.3748592287678146e-07, + "loss": 0.0022, + "step": 16148 + }, + { + "epoch": 0.31, + "learning_rate": 1.3748203953244533e-07, + "loss": 0.5576, + "step": 16149 + }, + { + "epoch": 0.31, + "learning_rate": 1.3747815618810917e-07, + "loss": 0.0012, + "step": 16150 + }, + { + "epoch": 0.31, + "learning_rate": 1.3747427284377305e-07, + "loss": 0.3553, + "step": 16151 + }, + { + "epoch": 0.31, + "learning_rate": 1.374703894994369e-07, + "loss": 0.0013, + "step": 16152 + }, + { + "epoch": 0.31, + "learning_rate": 1.3746650615510076e-07, + "loss": 0.0013, + "step": 16153 + }, + { + "epoch": 0.31, + "learning_rate": 1.374626228107646e-07, + "loss": 0.0009, + "step": 16154 + }, + { + "epoch": 0.31, + "learning_rate": 1.3745873946642848e-07, + "loss": 0.1241, + "step": 16155 + }, + { + "epoch": 0.31, + "learning_rate": 1.3745485612209232e-07, + "loss": 0.0011, + "step": 16156 + }, + { + "epoch": 0.31, + "learning_rate": 1.374509727777562e-07, + "loss": 0.0009, + "step": 16157 + }, + { + "epoch": 0.31, + "learning_rate": 1.3744708943342004e-07, + "loss": 0.1163, + "step": 16158 + }, + { + "epoch": 0.31, + "learning_rate": 1.374432060890839e-07, + "loss": 0.0014, + "step": 16159 + }, + { + "epoch": 0.31, + "learning_rate": 1.3743932274474776e-07, + "loss": 0.0009, + "step": 16160 + }, + { + "epoch": 0.31, + "learning_rate": 1.3743543940041163e-07, + "loss": 0.0011, + "step": 16161 + }, + { + "epoch": 0.31, + "learning_rate": 1.3743155605607547e-07, + "loss": 0.0015, + "step": 16162 + }, + { + "epoch": 0.31, + "learning_rate": 1.3742767271173935e-07, + "loss": 0.0008, + "step": 16163 + }, + { + "epoch": 0.31, + "learning_rate": 1.374237893674032e-07, + "loss": 0.0024, + "step": 16164 + }, + { + "epoch": 0.31, + "learning_rate": 1.3741990602306706e-07, + "loss": 0.001, + "step": 16165 + }, + { + "epoch": 0.31, + "learning_rate": 1.374160226787309e-07, + "loss": 0.0011, + "step": 16166 + }, + { + "epoch": 0.31, + "learning_rate": 1.3741213933439478e-07, + "loss": 0.0154, + "step": 16167 + }, + { + "epoch": 0.31, + "learning_rate": 1.3740825599005862e-07, + "loss": 0.0015, + "step": 16168 + }, + { + "epoch": 0.31, + "learning_rate": 1.374043726457225e-07, + "loss": 0.0011, + "step": 16169 + }, + { + "epoch": 0.31, + "learning_rate": 1.3740048930138634e-07, + "loss": 0.0022, + "step": 16170 + }, + { + "epoch": 0.31, + "learning_rate": 1.373966059570502e-07, + "loss": 0.0011, + "step": 16171 + }, + { + "epoch": 0.31, + "learning_rate": 1.3739272261271406e-07, + "loss": 0.0014, + "step": 16172 + }, + { + "epoch": 0.31, + "learning_rate": 1.3738883926837793e-07, + "loss": 0.0083, + "step": 16173 + }, + { + "epoch": 0.31, + "learning_rate": 1.3738495592404177e-07, + "loss": 0.0017, + "step": 16174 + }, + { + "epoch": 0.31, + "learning_rate": 1.3738107257970564e-07, + "loss": 0.001, + "step": 16175 + }, + { + "epoch": 0.31, + "learning_rate": 1.373771892353695e-07, + "loss": 0.1792, + "step": 16176 + }, + { + "epoch": 0.31, + "learning_rate": 1.3737330589103336e-07, + "loss": 0.0012, + "step": 16177 + }, + { + "epoch": 0.31, + "learning_rate": 1.373694225466972e-07, + "loss": 0.001, + "step": 16178 + }, + { + "epoch": 0.31, + "learning_rate": 1.3736553920236108e-07, + "loss": 0.001, + "step": 16179 + }, + { + "epoch": 0.31, + "learning_rate": 1.3736165585802492e-07, + "loss": 0.0043, + "step": 16180 + }, + { + "epoch": 0.31, + "learning_rate": 1.373577725136888e-07, + "loss": 0.292, + "step": 16181 + }, + { + "epoch": 0.31, + "learning_rate": 1.3735388916935264e-07, + "loss": 0.2333, + "step": 16182 + }, + { + "epoch": 0.31, + "learning_rate": 1.373500058250165e-07, + "loss": 0.0011, + "step": 16183 + }, + { + "epoch": 0.31, + "learning_rate": 1.3734612248068036e-07, + "loss": 0.0012, + "step": 16184 + }, + { + "epoch": 0.31, + "learning_rate": 1.3734223913634423e-07, + "loss": 0.089, + "step": 16185 + }, + { + "epoch": 0.31, + "learning_rate": 1.3733835579200807e-07, + "loss": 0.0162, + "step": 16186 + }, + { + "epoch": 0.31, + "learning_rate": 1.3733447244767194e-07, + "loss": 0.0013, + "step": 16187 + }, + { + "epoch": 0.31, + "learning_rate": 1.373305891033358e-07, + "loss": 0.001, + "step": 16188 + }, + { + "epoch": 0.31, + "learning_rate": 1.3732670575899966e-07, + "loss": 0.001, + "step": 16189 + }, + { + "epoch": 0.31, + "learning_rate": 1.373228224146635e-07, + "loss": 0.0013, + "step": 16190 + }, + { + "epoch": 0.31, + "learning_rate": 1.3731893907032738e-07, + "loss": 0.0011, + "step": 16191 + }, + { + "epoch": 0.31, + "learning_rate": 1.3731505572599122e-07, + "loss": 0.0016, + "step": 16192 + }, + { + "epoch": 0.31, + "learning_rate": 1.373111723816551e-07, + "loss": 0.0012, + "step": 16193 + }, + { + "epoch": 0.31, + "learning_rate": 1.3730728903731894e-07, + "loss": 0.0011, + "step": 16194 + }, + { + "epoch": 0.31, + "learning_rate": 1.373034056929828e-07, + "loss": 0.001, + "step": 16195 + }, + { + "epoch": 0.31, + "learning_rate": 1.3729952234864665e-07, + "loss": 0.0008, + "step": 16196 + }, + { + "epoch": 0.31, + "learning_rate": 1.3729563900431053e-07, + "loss": 0.0125, + "step": 16197 + }, + { + "epoch": 0.31, + "learning_rate": 1.3729175565997437e-07, + "loss": 0.0518, + "step": 16198 + }, + { + "epoch": 0.31, + "learning_rate": 1.3728787231563824e-07, + "loss": 0.0009, + "step": 16199 + }, + { + "epoch": 0.31, + "learning_rate": 1.372839889713021e-07, + "loss": 0.0013, + "step": 16200 + }, + { + "epoch": 0.31, + "learning_rate": 1.3728010562696596e-07, + "loss": 0.0014, + "step": 16201 + }, + { + "epoch": 0.31, + "learning_rate": 1.372762222826298e-07, + "loss": 0.0009, + "step": 16202 + }, + { + "epoch": 0.31, + "learning_rate": 1.3727233893829365e-07, + "loss": 0.0933, + "step": 16203 + }, + { + "epoch": 0.31, + "learning_rate": 1.372684555939575e-07, + "loss": 0.0058, + "step": 16204 + }, + { + "epoch": 0.31, + "learning_rate": 1.3726457224962137e-07, + "loss": 0.0014, + "step": 16205 + }, + { + "epoch": 0.31, + "learning_rate": 1.372606889052852e-07, + "loss": 0.0443, + "step": 16206 + }, + { + "epoch": 0.31, + "learning_rate": 1.3725680556094908e-07, + "loss": 0.0012, + "step": 16207 + }, + { + "epoch": 0.31, + "learning_rate": 1.3725292221661293e-07, + "loss": 0.0011, + "step": 16208 + }, + { + "epoch": 0.31, + "learning_rate": 1.372490388722768e-07, + "loss": 0.0012, + "step": 16209 + }, + { + "epoch": 0.31, + "learning_rate": 1.3724515552794064e-07, + "loss": 0.0009, + "step": 16210 + }, + { + "epoch": 0.31, + "learning_rate": 1.3724127218360451e-07, + "loss": 0.001, + "step": 16211 + }, + { + "epoch": 0.31, + "learning_rate": 1.3723738883926836e-07, + "loss": 0.0017, + "step": 16212 + }, + { + "epoch": 0.31, + "learning_rate": 1.3723350549493223e-07, + "loss": 0.0009, + "step": 16213 + }, + { + "epoch": 0.31, + "learning_rate": 1.3722962215059608e-07, + "loss": 0.0013, + "step": 16214 + }, + { + "epoch": 0.31, + "learning_rate": 1.3722573880625995e-07, + "loss": 0.0083, + "step": 16215 + }, + { + "epoch": 0.31, + "learning_rate": 1.372218554619238e-07, + "loss": 0.5673, + "step": 16216 + }, + { + "epoch": 0.31, + "learning_rate": 1.3721797211758766e-07, + "loss": 0.3644, + "step": 16217 + }, + { + "epoch": 0.31, + "learning_rate": 1.372140887732515e-07, + "loss": 0.0031, + "step": 16218 + }, + { + "epoch": 0.31, + "learning_rate": 1.3721020542891538e-07, + "loss": 0.001, + "step": 16219 + }, + { + "epoch": 0.31, + "learning_rate": 1.3720632208457923e-07, + "loss": 0.0015, + "step": 16220 + }, + { + "epoch": 0.31, + "learning_rate": 1.372024387402431e-07, + "loss": 0.0014, + "step": 16221 + }, + { + "epoch": 0.31, + "learning_rate": 1.3719855539590694e-07, + "loss": 0.0008, + "step": 16222 + }, + { + "epoch": 0.31, + "learning_rate": 1.3719467205157081e-07, + "loss": 0.0012, + "step": 16223 + }, + { + "epoch": 0.31, + "learning_rate": 1.3719078870723466e-07, + "loss": 0.0011, + "step": 16224 + }, + { + "epoch": 0.31, + "learning_rate": 1.3718690536289853e-07, + "loss": 0.2232, + "step": 16225 + }, + { + "epoch": 0.31, + "learning_rate": 1.3718302201856237e-07, + "loss": 0.001, + "step": 16226 + }, + { + "epoch": 0.31, + "learning_rate": 1.3717913867422625e-07, + "loss": 0.0011, + "step": 16227 + }, + { + "epoch": 0.31, + "learning_rate": 1.371752553298901e-07, + "loss": 0.0011, + "step": 16228 + }, + { + "epoch": 0.31, + "learning_rate": 1.3717137198555396e-07, + "loss": 0.0333, + "step": 16229 + }, + { + "epoch": 0.31, + "learning_rate": 1.371674886412178e-07, + "loss": 0.0012, + "step": 16230 + }, + { + "epoch": 0.31, + "learning_rate": 1.3716360529688168e-07, + "loss": 0.0021, + "step": 16231 + }, + { + "epoch": 0.31, + "learning_rate": 1.3715972195254552e-07, + "loss": 0.006, + "step": 16232 + }, + { + "epoch": 0.31, + "learning_rate": 1.371558386082094e-07, + "loss": 0.0011, + "step": 16233 + }, + { + "epoch": 0.31, + "learning_rate": 1.3715195526387324e-07, + "loss": 0.4004, + "step": 16234 + }, + { + "epoch": 0.31, + "learning_rate": 1.371480719195371e-07, + "loss": 0.4959, + "step": 16235 + }, + { + "epoch": 0.31, + "learning_rate": 1.3714418857520096e-07, + "loss": 0.0124, + "step": 16236 + }, + { + "epoch": 0.31, + "learning_rate": 1.3714030523086483e-07, + "loss": 0.0015, + "step": 16237 + }, + { + "epoch": 0.31, + "learning_rate": 1.3713642188652867e-07, + "loss": 0.1402, + "step": 16238 + }, + { + "epoch": 0.32, + "learning_rate": 1.3713253854219255e-07, + "loss": 0.001, + "step": 16239 + }, + { + "epoch": 0.32, + "learning_rate": 1.371286551978564e-07, + "loss": 0.0013, + "step": 16240 + }, + { + "epoch": 0.32, + "learning_rate": 1.3712477185352026e-07, + "loss": 0.0014, + "step": 16241 + }, + { + "epoch": 0.32, + "learning_rate": 1.371208885091841e-07, + "loss": 0.5125, + "step": 16242 + }, + { + "epoch": 0.32, + "learning_rate": 1.3711700516484798e-07, + "loss": 0.0012, + "step": 16243 + }, + { + "epoch": 0.32, + "learning_rate": 1.3711312182051182e-07, + "loss": 0.0007, + "step": 16244 + }, + { + "epoch": 0.32, + "learning_rate": 1.3710923847617567e-07, + "loss": 0.0017, + "step": 16245 + }, + { + "epoch": 0.32, + "learning_rate": 1.3710535513183954e-07, + "loss": 0.0443, + "step": 16246 + }, + { + "epoch": 0.32, + "learning_rate": 1.3710147178750338e-07, + "loss": 0.0011, + "step": 16247 + }, + { + "epoch": 0.32, + "learning_rate": 1.3709758844316726e-07, + "loss": 0.0011, + "step": 16248 + }, + { + "epoch": 0.32, + "learning_rate": 1.370937050988311e-07, + "loss": 0.0011, + "step": 16249 + }, + { + "epoch": 0.32, + "learning_rate": 1.3708982175449497e-07, + "loss": 0.0008, + "step": 16250 + }, + { + "epoch": 0.32, + "learning_rate": 1.3708593841015882e-07, + "loss": 0.0019, + "step": 16251 + }, + { + "epoch": 0.32, + "learning_rate": 1.370820550658227e-07, + "loss": 0.0015, + "step": 16252 + }, + { + "epoch": 0.32, + "learning_rate": 1.3707817172148653e-07, + "loss": 0.0013, + "step": 16253 + }, + { + "epoch": 0.32, + "learning_rate": 1.370742883771504e-07, + "loss": 0.0012, + "step": 16254 + }, + { + "epoch": 0.32, + "learning_rate": 1.3707040503281425e-07, + "loss": 0.001, + "step": 16255 + }, + { + "epoch": 0.32, + "learning_rate": 1.3706652168847812e-07, + "loss": 0.0008, + "step": 16256 + }, + { + "epoch": 0.32, + "learning_rate": 1.3706263834414197e-07, + "loss": 0.0013, + "step": 16257 + }, + { + "epoch": 0.32, + "learning_rate": 1.3705875499980584e-07, + "loss": 0.0992, + "step": 16258 + }, + { + "epoch": 0.32, + "learning_rate": 1.3705487165546968e-07, + "loss": 0.3832, + "step": 16259 + }, + { + "epoch": 0.32, + "learning_rate": 1.3705098831113356e-07, + "loss": 0.0011, + "step": 16260 + }, + { + "epoch": 0.32, + "learning_rate": 1.370471049667974e-07, + "loss": 0.0047, + "step": 16261 + }, + { + "epoch": 0.32, + "learning_rate": 1.3704322162246125e-07, + "loss": 1.0278, + "step": 16262 + }, + { + "epoch": 0.32, + "learning_rate": 1.3703933827812512e-07, + "loss": 0.0011, + "step": 16263 + }, + { + "epoch": 0.32, + "learning_rate": 1.3703545493378896e-07, + "loss": 0.0011, + "step": 16264 + }, + { + "epoch": 0.32, + "learning_rate": 1.3703157158945283e-07, + "loss": 0.0017, + "step": 16265 + }, + { + "epoch": 0.32, + "learning_rate": 1.3702768824511668e-07, + "loss": 0.0068, + "step": 16266 + }, + { + "epoch": 0.32, + "learning_rate": 1.3702380490078055e-07, + "loss": 0.0014, + "step": 16267 + }, + { + "epoch": 0.32, + "learning_rate": 1.370199215564444e-07, + "loss": 0.0011, + "step": 16268 + }, + { + "epoch": 0.32, + "learning_rate": 1.3701603821210827e-07, + "loss": 0.0016, + "step": 16269 + }, + { + "epoch": 0.32, + "learning_rate": 1.370121548677721e-07, + "loss": 0.002, + "step": 16270 + }, + { + "epoch": 0.32, + "learning_rate": 1.3700827152343598e-07, + "loss": 0.0438, + "step": 16271 + }, + { + "epoch": 0.32, + "learning_rate": 1.3700438817909983e-07, + "loss": 0.0295, + "step": 16272 + }, + { + "epoch": 0.32, + "learning_rate": 1.370005048347637e-07, + "loss": 0.0037, + "step": 16273 + }, + { + "epoch": 0.32, + "learning_rate": 1.3699662149042754e-07, + "loss": 0.0009, + "step": 16274 + }, + { + "epoch": 0.32, + "learning_rate": 1.369927381460914e-07, + "loss": 0.0016, + "step": 16275 + }, + { + "epoch": 0.32, + "learning_rate": 1.3698885480175526e-07, + "loss": 0.0017, + "step": 16276 + }, + { + "epoch": 0.32, + "learning_rate": 1.369849714574191e-07, + "loss": 0.0009, + "step": 16277 + }, + { + "epoch": 0.32, + "learning_rate": 1.3698108811308298e-07, + "loss": 0.0021, + "step": 16278 + }, + { + "epoch": 0.32, + "learning_rate": 1.3697720476874682e-07, + "loss": 0.002, + "step": 16279 + }, + { + "epoch": 0.32, + "learning_rate": 1.369733214244107e-07, + "loss": 0.0013, + "step": 16280 + }, + { + "epoch": 0.32, + "learning_rate": 1.3696943808007454e-07, + "loss": 0.0316, + "step": 16281 + }, + { + "epoch": 0.32, + "learning_rate": 1.369655547357384e-07, + "loss": 0.3764, + "step": 16282 + }, + { + "epoch": 0.32, + "learning_rate": 1.3696167139140226e-07, + "loss": 0.0021, + "step": 16283 + }, + { + "epoch": 0.32, + "learning_rate": 1.3695778804706613e-07, + "loss": 0.0013, + "step": 16284 + }, + { + "epoch": 0.32, + "learning_rate": 1.3695390470272997e-07, + "loss": 0.0017, + "step": 16285 + }, + { + "epoch": 0.32, + "learning_rate": 1.3695002135839384e-07, + "loss": 0.0011, + "step": 16286 + }, + { + "epoch": 0.32, + "learning_rate": 1.369461380140577e-07, + "loss": 0.001, + "step": 16287 + }, + { + "epoch": 0.32, + "learning_rate": 1.3694225466972156e-07, + "loss": 0.0015, + "step": 16288 + }, + { + "epoch": 0.32, + "learning_rate": 1.369383713253854e-07, + "loss": 0.0011, + "step": 16289 + }, + { + "epoch": 0.32, + "learning_rate": 1.3693448798104928e-07, + "loss": 0.001, + "step": 16290 + }, + { + "epoch": 0.32, + "learning_rate": 1.3693060463671312e-07, + "loss": 0.0195, + "step": 16291 + }, + { + "epoch": 0.32, + "learning_rate": 1.36926721292377e-07, + "loss": 0.0014, + "step": 16292 + }, + { + "epoch": 0.32, + "learning_rate": 1.3692283794804084e-07, + "loss": 0.0012, + "step": 16293 + }, + { + "epoch": 0.32, + "learning_rate": 1.369189546037047e-07, + "loss": 0.0408, + "step": 16294 + }, + { + "epoch": 0.32, + "learning_rate": 1.3691507125936855e-07, + "loss": 0.0013, + "step": 16295 + }, + { + "epoch": 0.32, + "learning_rate": 1.3691118791503243e-07, + "loss": 0.0013, + "step": 16296 + }, + { + "epoch": 0.32, + "learning_rate": 1.3690730457069627e-07, + "loss": 0.0364, + "step": 16297 + }, + { + "epoch": 0.32, + "learning_rate": 1.3690342122636014e-07, + "loss": 0.7157, + "step": 16298 + }, + { + "epoch": 0.32, + "learning_rate": 1.36899537882024e-07, + "loss": 0.001, + "step": 16299 + }, + { + "epoch": 0.32, + "learning_rate": 1.3689565453768786e-07, + "loss": 0.0264, + "step": 16300 + }, + { + "epoch": 0.32, + "learning_rate": 1.368917711933517e-07, + "loss": 0.0022, + "step": 16301 + }, + { + "epoch": 0.32, + "learning_rate": 1.3688788784901558e-07, + "loss": 0.0051, + "step": 16302 + }, + { + "epoch": 0.32, + "learning_rate": 1.3688400450467942e-07, + "loss": 0.0257, + "step": 16303 + }, + { + "epoch": 0.32, + "learning_rate": 1.368801211603433e-07, + "loss": 0.0019, + "step": 16304 + }, + { + "epoch": 0.32, + "learning_rate": 1.3687623781600714e-07, + "loss": 0.0009, + "step": 16305 + }, + { + "epoch": 0.32, + "learning_rate": 1.36872354471671e-07, + "loss": 0.0012, + "step": 16306 + }, + { + "epoch": 0.32, + "learning_rate": 1.3686847112733485e-07, + "loss": 0.0009, + "step": 16307 + }, + { + "epoch": 0.32, + "learning_rate": 1.3686458778299872e-07, + "loss": 0.0015, + "step": 16308 + }, + { + "epoch": 0.32, + "learning_rate": 1.3686070443866257e-07, + "loss": 0.0012, + "step": 16309 + }, + { + "epoch": 0.32, + "learning_rate": 1.3685682109432644e-07, + "loss": 0.0009, + "step": 16310 + }, + { + "epoch": 0.32, + "learning_rate": 1.3685293774999029e-07, + "loss": 0.0011, + "step": 16311 + }, + { + "epoch": 0.32, + "learning_rate": 1.3684905440565416e-07, + "loss": 0.0012, + "step": 16312 + }, + { + "epoch": 0.32, + "learning_rate": 1.36845171061318e-07, + "loss": 0.0148, + "step": 16313 + }, + { + "epoch": 0.32, + "learning_rate": 1.3684128771698187e-07, + "loss": 0.001, + "step": 16314 + }, + { + "epoch": 0.32, + "learning_rate": 1.3683740437264572e-07, + "loss": 0.0009, + "step": 16315 + }, + { + "epoch": 0.32, + "learning_rate": 1.368335210283096e-07, + "loss": 0.0012, + "step": 16316 + }, + { + "epoch": 0.32, + "learning_rate": 1.3682963768397344e-07, + "loss": 0.0013, + "step": 16317 + }, + { + "epoch": 0.32, + "learning_rate": 1.368257543396373e-07, + "loss": 0.0999, + "step": 16318 + }, + { + "epoch": 0.32, + "learning_rate": 1.3682187099530113e-07, + "loss": 0.0015, + "step": 16319 + }, + { + "epoch": 0.32, + "learning_rate": 1.36817987650965e-07, + "loss": 0.0112, + "step": 16320 + }, + { + "epoch": 0.32, + "learning_rate": 1.3681410430662884e-07, + "loss": 0.0013, + "step": 16321 + }, + { + "epoch": 0.32, + "learning_rate": 1.3681022096229271e-07, + "loss": 0.0007, + "step": 16322 + }, + { + "epoch": 0.32, + "learning_rate": 1.3680633761795656e-07, + "loss": 0.0011, + "step": 16323 + }, + { + "epoch": 0.32, + "learning_rate": 1.3680245427362043e-07, + "loss": 0.0009, + "step": 16324 + }, + { + "epoch": 0.32, + "learning_rate": 1.3679857092928428e-07, + "loss": 0.0011, + "step": 16325 + }, + { + "epoch": 0.32, + "learning_rate": 1.3679468758494815e-07, + "loss": 0.0014, + "step": 16326 + }, + { + "epoch": 0.32, + "learning_rate": 1.36790804240612e-07, + "loss": 0.0019, + "step": 16327 + }, + { + "epoch": 0.32, + "learning_rate": 1.3678692089627586e-07, + "loss": 0.0014, + "step": 16328 + }, + { + "epoch": 0.32, + "learning_rate": 1.367830375519397e-07, + "loss": 0.0011, + "step": 16329 + }, + { + "epoch": 0.32, + "learning_rate": 1.3677915420760358e-07, + "loss": 0.0014, + "step": 16330 + }, + { + "epoch": 0.32, + "learning_rate": 1.3677527086326742e-07, + "loss": 0.001, + "step": 16331 + }, + { + "epoch": 0.32, + "learning_rate": 1.367713875189313e-07, + "loss": 0.1719, + "step": 16332 + }, + { + "epoch": 0.32, + "learning_rate": 1.3676750417459514e-07, + "loss": 0.0067, + "step": 16333 + }, + { + "epoch": 0.32, + "learning_rate": 1.36763620830259e-07, + "loss": 0.0012, + "step": 16334 + }, + { + "epoch": 0.32, + "learning_rate": 1.3675973748592286e-07, + "loss": 0.0012, + "step": 16335 + }, + { + "epoch": 0.32, + "learning_rate": 1.3675585414158673e-07, + "loss": 0.4172, + "step": 16336 + }, + { + "epoch": 0.32, + "learning_rate": 1.3675197079725057e-07, + "loss": 0.0013, + "step": 16337 + }, + { + "epoch": 0.32, + "learning_rate": 1.3674808745291445e-07, + "loss": 0.0014, + "step": 16338 + }, + { + "epoch": 0.32, + "learning_rate": 1.367442041085783e-07, + "loss": 0.0015, + "step": 16339 + }, + { + "epoch": 0.32, + "learning_rate": 1.3674032076424216e-07, + "loss": 0.0008, + "step": 16340 + }, + { + "epoch": 0.32, + "learning_rate": 1.36736437419906e-07, + "loss": 0.0013, + "step": 16341 + }, + { + "epoch": 0.32, + "learning_rate": 1.3673255407556988e-07, + "loss": 0.0016, + "step": 16342 + }, + { + "epoch": 0.32, + "learning_rate": 1.3672867073123372e-07, + "loss": 0.0009, + "step": 16343 + }, + { + "epoch": 0.32, + "learning_rate": 1.367247873868976e-07, + "loss": 0.0011, + "step": 16344 + }, + { + "epoch": 0.32, + "learning_rate": 1.3672090404256144e-07, + "loss": 0.0252, + "step": 16345 + }, + { + "epoch": 0.32, + "learning_rate": 1.367170206982253e-07, + "loss": 0.0028, + "step": 16346 + }, + { + "epoch": 0.32, + "learning_rate": 1.3671313735388916e-07, + "loss": 0.0012, + "step": 16347 + }, + { + "epoch": 0.32, + "learning_rate": 1.3670925400955303e-07, + "loss": 0.0012, + "step": 16348 + }, + { + "epoch": 0.32, + "learning_rate": 1.3670537066521687e-07, + "loss": 0.001, + "step": 16349 + }, + { + "epoch": 0.32, + "learning_rate": 1.3670148732088074e-07, + "loss": 0.0011, + "step": 16350 + }, + { + "epoch": 0.32, + "learning_rate": 1.366976039765446e-07, + "loss": 0.0008, + "step": 16351 + }, + { + "epoch": 0.32, + "learning_rate": 1.3669372063220846e-07, + "loss": 0.0015, + "step": 16352 + }, + { + "epoch": 0.32, + "learning_rate": 1.366898372878723e-07, + "loss": 0.0748, + "step": 16353 + }, + { + "epoch": 0.32, + "learning_rate": 1.3668595394353618e-07, + "loss": 0.0017, + "step": 16354 + }, + { + "epoch": 0.32, + "learning_rate": 1.3668207059920002e-07, + "loss": 0.0011, + "step": 16355 + }, + { + "epoch": 0.32, + "learning_rate": 1.366781872548639e-07, + "loss": 0.002, + "step": 16356 + }, + { + "epoch": 0.32, + "learning_rate": 1.3667430391052774e-07, + "loss": 0.0008, + "step": 16357 + }, + { + "epoch": 0.32, + "learning_rate": 1.366704205661916e-07, + "loss": 0.2702, + "step": 16358 + }, + { + "epoch": 0.32, + "learning_rate": 1.3666653722185546e-07, + "loss": 0.0009, + "step": 16359 + }, + { + "epoch": 0.32, + "learning_rate": 1.3666265387751933e-07, + "loss": 0.0596, + "step": 16360 + }, + { + "epoch": 0.32, + "learning_rate": 1.3665877053318317e-07, + "loss": 0.6364, + "step": 16361 + }, + { + "epoch": 0.32, + "learning_rate": 1.3665488718884704e-07, + "loss": 0.0009, + "step": 16362 + }, + { + "epoch": 0.32, + "learning_rate": 1.366510038445109e-07, + "loss": 0.001, + "step": 16363 + }, + { + "epoch": 0.32, + "learning_rate": 1.3664712050017476e-07, + "loss": 0.0009, + "step": 16364 + }, + { + "epoch": 0.32, + "learning_rate": 1.366432371558386e-07, + "loss": 0.0077, + "step": 16365 + }, + { + "epoch": 0.32, + "learning_rate": 1.3663935381150248e-07, + "loss": 0.0009, + "step": 16366 + }, + { + "epoch": 0.32, + "learning_rate": 1.3663547046716632e-07, + "loss": 0.0007, + "step": 16367 + }, + { + "epoch": 0.32, + "learning_rate": 1.366315871228302e-07, + "loss": 0.0009, + "step": 16368 + }, + { + "epoch": 0.32, + "learning_rate": 1.3662770377849404e-07, + "loss": 0.8312, + "step": 16369 + }, + { + "epoch": 0.32, + "learning_rate": 1.366238204341579e-07, + "loss": 0.031, + "step": 16370 + }, + { + "epoch": 0.32, + "learning_rate": 1.3661993708982175e-07, + "loss": 0.0012, + "step": 16371 + }, + { + "epoch": 0.32, + "learning_rate": 1.3661605374548563e-07, + "loss": 0.0009, + "step": 16372 + }, + { + "epoch": 0.32, + "learning_rate": 1.3661217040114947e-07, + "loss": 0.001, + "step": 16373 + }, + { + "epoch": 0.32, + "learning_rate": 1.3660828705681334e-07, + "loss": 0.0008, + "step": 16374 + }, + { + "epoch": 0.32, + "learning_rate": 1.366044037124772e-07, + "loss": 0.0009, + "step": 16375 + }, + { + "epoch": 0.32, + "learning_rate": 1.3660052036814106e-07, + "loss": 0.001, + "step": 16376 + }, + { + "epoch": 0.32, + "learning_rate": 1.3659663702380488e-07, + "loss": 0.001, + "step": 16377 + }, + { + "epoch": 0.32, + "learning_rate": 1.3659275367946875e-07, + "loss": 0.0015, + "step": 16378 + }, + { + "epoch": 0.32, + "learning_rate": 1.365888703351326e-07, + "loss": 0.001, + "step": 16379 + }, + { + "epoch": 0.32, + "learning_rate": 1.3658498699079647e-07, + "loss": 0.0015, + "step": 16380 + }, + { + "epoch": 0.32, + "learning_rate": 1.365811036464603e-07, + "loss": 0.0849, + "step": 16381 + }, + { + "epoch": 0.32, + "learning_rate": 1.3657722030212418e-07, + "loss": 0.0072, + "step": 16382 + }, + { + "epoch": 0.32, + "learning_rate": 1.3657333695778803e-07, + "loss": 0.0011, + "step": 16383 + }, + { + "epoch": 0.32, + "learning_rate": 1.365694536134519e-07, + "loss": 0.0021, + "step": 16384 + }, + { + "epoch": 0.32, + "learning_rate": 1.3656557026911574e-07, + "loss": 0.6656, + "step": 16385 + }, + { + "epoch": 0.32, + "learning_rate": 1.3656168692477961e-07, + "loss": 0.0009, + "step": 16386 + }, + { + "epoch": 0.32, + "learning_rate": 1.3655780358044346e-07, + "loss": 0.0012, + "step": 16387 + }, + { + "epoch": 0.32, + "learning_rate": 1.3655392023610733e-07, + "loss": 0.001, + "step": 16388 + }, + { + "epoch": 0.32, + "learning_rate": 1.3655003689177118e-07, + "loss": 0.0008, + "step": 16389 + }, + { + "epoch": 0.32, + "learning_rate": 1.3654615354743505e-07, + "loss": 0.8884, + "step": 16390 + }, + { + "epoch": 0.32, + "learning_rate": 1.365422702030989e-07, + "loss": 0.0007, + "step": 16391 + }, + { + "epoch": 0.32, + "learning_rate": 1.3653838685876276e-07, + "loss": 0.0025, + "step": 16392 + }, + { + "epoch": 0.32, + "learning_rate": 1.365345035144266e-07, + "loss": 0.0043, + "step": 16393 + }, + { + "epoch": 0.32, + "learning_rate": 1.3653062017009048e-07, + "loss": 0.0012, + "step": 16394 + }, + { + "epoch": 0.32, + "learning_rate": 1.3652673682575433e-07, + "loss": 0.001, + "step": 16395 + }, + { + "epoch": 0.32, + "learning_rate": 1.365228534814182e-07, + "loss": 0.0009, + "step": 16396 + }, + { + "epoch": 0.32, + "learning_rate": 1.3651897013708204e-07, + "loss": 0.0041, + "step": 16397 + }, + { + "epoch": 0.32, + "learning_rate": 1.3651508679274591e-07, + "loss": 0.0012, + "step": 16398 + }, + { + "epoch": 0.32, + "learning_rate": 1.3651120344840976e-07, + "loss": 0.001, + "step": 16399 + }, + { + "epoch": 0.32, + "learning_rate": 1.3650732010407363e-07, + "loss": 0.001, + "step": 16400 + }, + { + "epoch": 0.32, + "learning_rate": 1.3650343675973748e-07, + "loss": 0.0013, + "step": 16401 + }, + { + "epoch": 0.32, + "learning_rate": 1.3649955341540135e-07, + "loss": 0.0012, + "step": 16402 + }, + { + "epoch": 0.32, + "learning_rate": 1.364956700710652e-07, + "loss": 0.0013, + "step": 16403 + }, + { + "epoch": 0.32, + "learning_rate": 1.3649178672672906e-07, + "loss": 0.0009, + "step": 16404 + }, + { + "epoch": 0.32, + "learning_rate": 1.364879033823929e-07, + "loss": 0.001, + "step": 16405 + }, + { + "epoch": 0.32, + "learning_rate": 1.3648402003805678e-07, + "loss": 0.0014, + "step": 16406 + }, + { + "epoch": 0.32, + "learning_rate": 1.3648013669372062e-07, + "loss": 0.0015, + "step": 16407 + }, + { + "epoch": 0.32, + "learning_rate": 1.364762533493845e-07, + "loss": 0.0008, + "step": 16408 + }, + { + "epoch": 0.32, + "learning_rate": 1.3647237000504834e-07, + "loss": 0.0011, + "step": 16409 + }, + { + "epoch": 0.32, + "learning_rate": 1.364684866607122e-07, + "loss": 0.0018, + "step": 16410 + }, + { + "epoch": 0.32, + "learning_rate": 1.3646460331637606e-07, + "loss": 0.0012, + "step": 16411 + }, + { + "epoch": 0.32, + "learning_rate": 1.3646071997203993e-07, + "loss": 0.001, + "step": 16412 + }, + { + "epoch": 0.32, + "learning_rate": 1.3645683662770377e-07, + "loss": 0.3409, + "step": 16413 + }, + { + "epoch": 0.32, + "learning_rate": 1.3645295328336765e-07, + "loss": 0.001, + "step": 16414 + }, + { + "epoch": 0.32, + "learning_rate": 1.364490699390315e-07, + "loss": 0.0014, + "step": 16415 + }, + { + "epoch": 0.32, + "learning_rate": 1.3644518659469536e-07, + "loss": 0.0029, + "step": 16416 + }, + { + "epoch": 0.32, + "learning_rate": 1.364413032503592e-07, + "loss": 0.0014, + "step": 16417 + }, + { + "epoch": 0.32, + "learning_rate": 1.3643741990602308e-07, + "loss": 0.0012, + "step": 16418 + }, + { + "epoch": 0.32, + "learning_rate": 1.3643353656168692e-07, + "loss": 0.0015, + "step": 16419 + }, + { + "epoch": 0.32, + "learning_rate": 1.364296532173508e-07, + "loss": 0.0011, + "step": 16420 + }, + { + "epoch": 0.32, + "learning_rate": 1.3642576987301464e-07, + "loss": 0.2512, + "step": 16421 + }, + { + "epoch": 0.32, + "learning_rate": 1.3642188652867849e-07, + "loss": 0.0012, + "step": 16422 + }, + { + "epoch": 0.32, + "learning_rate": 1.3641800318434236e-07, + "loss": 0.6544, + "step": 16423 + }, + { + "epoch": 0.32, + "learning_rate": 1.364141198400062e-07, + "loss": 0.0016, + "step": 16424 + }, + { + "epoch": 0.32, + "learning_rate": 1.3641023649567007e-07, + "loss": 0.0009, + "step": 16425 + }, + { + "epoch": 0.32, + "learning_rate": 1.3640635315133392e-07, + "loss": 0.0027, + "step": 16426 + }, + { + "epoch": 0.32, + "learning_rate": 1.364024698069978e-07, + "loss": 0.0282, + "step": 16427 + }, + { + "epoch": 0.32, + "learning_rate": 1.3639858646266163e-07, + "loss": 0.6572, + "step": 16428 + }, + { + "epoch": 0.32, + "learning_rate": 1.363947031183255e-07, + "loss": 0.0026, + "step": 16429 + }, + { + "epoch": 0.32, + "learning_rate": 1.3639081977398935e-07, + "loss": 0.0037, + "step": 16430 + }, + { + "epoch": 0.32, + "learning_rate": 1.3638693642965322e-07, + "loss": 0.0013, + "step": 16431 + }, + { + "epoch": 0.32, + "learning_rate": 1.3638305308531707e-07, + "loss": 0.0009, + "step": 16432 + }, + { + "epoch": 0.32, + "learning_rate": 1.3637916974098094e-07, + "loss": 0.0044, + "step": 16433 + }, + { + "epoch": 0.32, + "learning_rate": 1.3637528639664478e-07, + "loss": 0.0011, + "step": 16434 + }, + { + "epoch": 0.32, + "learning_rate": 1.3637140305230863e-07, + "loss": 0.0068, + "step": 16435 + }, + { + "epoch": 0.32, + "learning_rate": 1.363675197079725e-07, + "loss": 0.0013, + "step": 16436 + }, + { + "epoch": 0.32, + "learning_rate": 1.3636363636363635e-07, + "loss": 0.001, + "step": 16437 + }, + { + "epoch": 0.32, + "learning_rate": 1.3635975301930022e-07, + "loss": 0.0011, + "step": 16438 + }, + { + "epoch": 0.32, + "learning_rate": 1.3635586967496406e-07, + "loss": 0.0013, + "step": 16439 + }, + { + "epoch": 0.32, + "learning_rate": 1.3635198633062793e-07, + "loss": 0.0011, + "step": 16440 + }, + { + "epoch": 0.32, + "learning_rate": 1.3634810298629178e-07, + "loss": 0.0008, + "step": 16441 + }, + { + "epoch": 0.32, + "learning_rate": 1.3634421964195565e-07, + "loss": 0.0031, + "step": 16442 + }, + { + "epoch": 0.32, + "learning_rate": 1.363403362976195e-07, + "loss": 0.001, + "step": 16443 + }, + { + "epoch": 0.32, + "learning_rate": 1.3633645295328337e-07, + "loss": 0.0008, + "step": 16444 + }, + { + "epoch": 0.32, + "learning_rate": 1.363325696089472e-07, + "loss": 0.0007, + "step": 16445 + }, + { + "epoch": 0.32, + "learning_rate": 1.3632868626461108e-07, + "loss": 0.639, + "step": 16446 + }, + { + "epoch": 0.32, + "learning_rate": 1.3632480292027493e-07, + "loss": 0.001, + "step": 16447 + }, + { + "epoch": 0.32, + "learning_rate": 1.363209195759388e-07, + "loss": 0.0009, + "step": 16448 + }, + { + "epoch": 0.32, + "learning_rate": 1.3631703623160264e-07, + "loss": 0.0007, + "step": 16449 + }, + { + "epoch": 0.32, + "learning_rate": 1.3631315288726652e-07, + "loss": 0.0011, + "step": 16450 + }, + { + "epoch": 0.32, + "learning_rate": 1.3630926954293036e-07, + "loss": 0.0045, + "step": 16451 + }, + { + "epoch": 0.32, + "learning_rate": 1.363053861985942e-07, + "loss": 0.0017, + "step": 16452 + }, + { + "epoch": 0.32, + "learning_rate": 1.3630150285425808e-07, + "loss": 0.0008, + "step": 16453 + }, + { + "epoch": 0.32, + "learning_rate": 1.3629761950992192e-07, + "loss": 0.0018, + "step": 16454 + }, + { + "epoch": 0.32, + "learning_rate": 1.362937361655858e-07, + "loss": 0.0015, + "step": 16455 + }, + { + "epoch": 0.32, + "learning_rate": 1.3628985282124964e-07, + "loss": 0.0013, + "step": 16456 + }, + { + "epoch": 0.32, + "learning_rate": 1.362859694769135e-07, + "loss": 0.6462, + "step": 16457 + }, + { + "epoch": 0.32, + "learning_rate": 1.3628208613257736e-07, + "loss": 0.001, + "step": 16458 + }, + { + "epoch": 0.32, + "learning_rate": 1.3627820278824123e-07, + "loss": 0.0018, + "step": 16459 + }, + { + "epoch": 0.32, + "learning_rate": 1.3627431944390507e-07, + "loss": 0.0011, + "step": 16460 + }, + { + "epoch": 0.32, + "learning_rate": 1.3627043609956894e-07, + "loss": 0.0008, + "step": 16461 + }, + { + "epoch": 0.32, + "learning_rate": 1.362665527552328e-07, + "loss": 0.001, + "step": 16462 + }, + { + "epoch": 0.32, + "learning_rate": 1.3626266941089666e-07, + "loss": 0.012, + "step": 16463 + }, + { + "epoch": 0.32, + "learning_rate": 1.362587860665605e-07, + "loss": 0.001, + "step": 16464 + }, + { + "epoch": 0.32, + "learning_rate": 1.3625490272222438e-07, + "loss": 0.0012, + "step": 16465 + }, + { + "epoch": 0.32, + "learning_rate": 1.3625101937788822e-07, + "loss": 0.001, + "step": 16466 + }, + { + "epoch": 0.32, + "learning_rate": 1.362471360335521e-07, + "loss": 0.0324, + "step": 16467 + }, + { + "epoch": 0.32, + "learning_rate": 1.3624325268921594e-07, + "loss": 0.001, + "step": 16468 + }, + { + "epoch": 0.32, + "learning_rate": 1.362393693448798e-07, + "loss": 0.0008, + "step": 16469 + }, + { + "epoch": 0.32, + "learning_rate": 1.3623548600054365e-07, + "loss": 0.0011, + "step": 16470 + }, + { + "epoch": 0.32, + "learning_rate": 1.3623160265620753e-07, + "loss": 0.0057, + "step": 16471 + }, + { + "epoch": 0.32, + "learning_rate": 1.3622771931187137e-07, + "loss": 0.0017, + "step": 16472 + }, + { + "epoch": 0.32, + "learning_rate": 1.3622383596753524e-07, + "loss": 0.6607, + "step": 16473 + }, + { + "epoch": 0.32, + "learning_rate": 1.362199526231991e-07, + "loss": 1.8335, + "step": 16474 + }, + { + "epoch": 0.32, + "learning_rate": 1.3621606927886296e-07, + "loss": 0.0008, + "step": 16475 + }, + { + "epoch": 0.32, + "learning_rate": 1.362121859345268e-07, + "loss": 0.0021, + "step": 16476 + }, + { + "epoch": 0.32, + "learning_rate": 1.3620830259019068e-07, + "loss": 0.5339, + "step": 16477 + }, + { + "epoch": 0.32, + "learning_rate": 1.3620441924585452e-07, + "loss": 0.0029, + "step": 16478 + }, + { + "epoch": 0.32, + "learning_rate": 1.362005359015184e-07, + "loss": 0.0009, + "step": 16479 + }, + { + "epoch": 0.32, + "learning_rate": 1.3619665255718224e-07, + "loss": 0.0009, + "step": 16480 + }, + { + "epoch": 0.32, + "learning_rate": 1.361927692128461e-07, + "loss": 0.0008, + "step": 16481 + }, + { + "epoch": 0.32, + "learning_rate": 1.3618888586850995e-07, + "loss": 0.0009, + "step": 16482 + }, + { + "epoch": 0.32, + "learning_rate": 1.3618500252417382e-07, + "loss": 0.012, + "step": 16483 + }, + { + "epoch": 0.32, + "learning_rate": 1.3618111917983767e-07, + "loss": 0.0009, + "step": 16484 + }, + { + "epoch": 0.32, + "learning_rate": 1.3617723583550154e-07, + "loss": 0.0015, + "step": 16485 + }, + { + "epoch": 0.32, + "learning_rate": 1.3617335249116539e-07, + "loss": 0.0012, + "step": 16486 + }, + { + "epoch": 0.32, + "learning_rate": 1.3616946914682926e-07, + "loss": 0.001, + "step": 16487 + }, + { + "epoch": 0.32, + "learning_rate": 1.361655858024931e-07, + "loss": 0.001, + "step": 16488 + }, + { + "epoch": 0.32, + "learning_rate": 1.3616170245815697e-07, + "loss": 0.0048, + "step": 16489 + }, + { + "epoch": 0.32, + "learning_rate": 1.3615781911382082e-07, + "loss": 0.0011, + "step": 16490 + }, + { + "epoch": 0.32, + "learning_rate": 1.361539357694847e-07, + "loss": 0.0008, + "step": 16491 + }, + { + "epoch": 0.32, + "learning_rate": 1.3615005242514854e-07, + "loss": 0.001, + "step": 16492 + }, + { + "epoch": 0.32, + "learning_rate": 1.3614616908081238e-07, + "loss": 0.0013, + "step": 16493 + }, + { + "epoch": 0.32, + "learning_rate": 1.3614228573647623e-07, + "loss": 0.001, + "step": 16494 + }, + { + "epoch": 0.32, + "learning_rate": 1.361384023921401e-07, + "loss": 0.001, + "step": 16495 + }, + { + "epoch": 0.32, + "learning_rate": 1.3613451904780394e-07, + "loss": 0.0015, + "step": 16496 + }, + { + "epoch": 0.32, + "learning_rate": 1.3613063570346781e-07, + "loss": 0.0009, + "step": 16497 + }, + { + "epoch": 0.32, + "learning_rate": 1.3612675235913166e-07, + "loss": 0.3144, + "step": 16498 + }, + { + "epoch": 0.32, + "learning_rate": 1.3612286901479553e-07, + "loss": 0.0009, + "step": 16499 + }, + { + "epoch": 0.32, + "learning_rate": 1.3611898567045938e-07, + "loss": 0.0011, + "step": 16500 + }, + { + "epoch": 0.32, + "learning_rate": 1.3611510232612325e-07, + "loss": 0.0009, + "step": 16501 + }, + { + "epoch": 0.32, + "learning_rate": 1.361112189817871e-07, + "loss": 0.001, + "step": 16502 + }, + { + "epoch": 0.32, + "learning_rate": 1.3610733563745096e-07, + "loss": 0.0007, + "step": 16503 + }, + { + "epoch": 0.32, + "learning_rate": 1.361034522931148e-07, + "loss": 0.0008, + "step": 16504 + }, + { + "epoch": 0.32, + "learning_rate": 1.3609956894877868e-07, + "loss": 0.001, + "step": 16505 + }, + { + "epoch": 0.32, + "learning_rate": 1.3609568560444252e-07, + "loss": 0.0014, + "step": 16506 + }, + { + "epoch": 0.32, + "learning_rate": 1.360918022601064e-07, + "loss": 0.0014, + "step": 16507 + }, + { + "epoch": 0.32, + "learning_rate": 1.3608791891577024e-07, + "loss": 0.7604, + "step": 16508 + }, + { + "epoch": 0.32, + "learning_rate": 1.360840355714341e-07, + "loss": 0.0008, + "step": 16509 + }, + { + "epoch": 0.32, + "learning_rate": 1.3608015222709796e-07, + "loss": 0.0013, + "step": 16510 + }, + { + "epoch": 0.32, + "learning_rate": 1.3607626888276183e-07, + "loss": 0.0012, + "step": 16511 + }, + { + "epoch": 0.32, + "learning_rate": 1.3607238553842567e-07, + "loss": 0.0054, + "step": 16512 + }, + { + "epoch": 0.32, + "learning_rate": 1.3606850219408955e-07, + "loss": 0.0009, + "step": 16513 + }, + { + "epoch": 0.32, + "learning_rate": 1.360646188497534e-07, + "loss": 0.001, + "step": 16514 + }, + { + "epoch": 0.32, + "learning_rate": 1.3606073550541726e-07, + "loss": 0.0012, + "step": 16515 + }, + { + "epoch": 0.32, + "learning_rate": 1.360568521610811e-07, + "loss": 0.0011, + "step": 16516 + }, + { + "epoch": 0.32, + "learning_rate": 1.3605296881674498e-07, + "loss": 0.6674, + "step": 16517 + }, + { + "epoch": 0.32, + "learning_rate": 1.3604908547240882e-07, + "loss": 0.0458, + "step": 16518 + }, + { + "epoch": 0.32, + "learning_rate": 1.360452021280727e-07, + "loss": 0.0008, + "step": 16519 + }, + { + "epoch": 0.32, + "learning_rate": 1.3604131878373654e-07, + "loss": 0.5029, + "step": 16520 + }, + { + "epoch": 0.32, + "learning_rate": 1.360374354394004e-07, + "loss": 0.0014, + "step": 16521 + }, + { + "epoch": 0.32, + "learning_rate": 1.3603355209506426e-07, + "loss": 0.0008, + "step": 16522 + }, + { + "epoch": 0.32, + "learning_rate": 1.3602966875072813e-07, + "loss": 0.0012, + "step": 16523 + }, + { + "epoch": 0.32, + "learning_rate": 1.3602578540639197e-07, + "loss": 1.0892, + "step": 16524 + }, + { + "epoch": 0.32, + "learning_rate": 1.3602190206205584e-07, + "loss": 0.0014, + "step": 16525 + }, + { + "epoch": 0.32, + "learning_rate": 1.360180187177197e-07, + "loss": 0.0279, + "step": 16526 + }, + { + "epoch": 0.32, + "learning_rate": 1.3601413537338356e-07, + "loss": 0.0009, + "step": 16527 + }, + { + "epoch": 0.32, + "learning_rate": 1.360102520290474e-07, + "loss": 0.2134, + "step": 16528 + }, + { + "epoch": 0.32, + "learning_rate": 1.3600636868471128e-07, + "loss": 0.0034, + "step": 16529 + }, + { + "epoch": 0.32, + "learning_rate": 1.3600248534037512e-07, + "loss": 0.001, + "step": 16530 + }, + { + "epoch": 0.32, + "learning_rate": 1.35998601996039e-07, + "loss": 0.0013, + "step": 16531 + }, + { + "epoch": 0.32, + "learning_rate": 1.3599471865170284e-07, + "loss": 0.0009, + "step": 16532 + }, + { + "epoch": 0.32, + "learning_rate": 1.359908353073667e-07, + "loss": 0.0012, + "step": 16533 + }, + { + "epoch": 0.32, + "learning_rate": 1.3598695196303056e-07, + "loss": 0.0013, + "step": 16534 + }, + { + "epoch": 0.32, + "learning_rate": 1.3598306861869443e-07, + "loss": 0.0006, + "step": 16535 + }, + { + "epoch": 0.32, + "learning_rate": 1.3597918527435827e-07, + "loss": 0.0009, + "step": 16536 + }, + { + "epoch": 0.32, + "learning_rate": 1.3597530193002214e-07, + "loss": 0.0064, + "step": 16537 + }, + { + "epoch": 0.32, + "learning_rate": 1.35971418585686e-07, + "loss": 0.4133, + "step": 16538 + }, + { + "epoch": 0.32, + "learning_rate": 1.3596753524134986e-07, + "loss": 0.0188, + "step": 16539 + }, + { + "epoch": 0.32, + "learning_rate": 1.359636518970137e-07, + "loss": 0.001, + "step": 16540 + }, + { + "epoch": 0.32, + "learning_rate": 1.3595976855267758e-07, + "loss": 0.0501, + "step": 16541 + }, + { + "epoch": 0.32, + "learning_rate": 1.3595588520834142e-07, + "loss": 0.001, + "step": 16542 + }, + { + "epoch": 0.32, + "learning_rate": 1.359520018640053e-07, + "loss": 0.0009, + "step": 16543 + }, + { + "epoch": 0.32, + "learning_rate": 1.3594811851966914e-07, + "loss": 0.0009, + "step": 16544 + }, + { + "epoch": 0.32, + "learning_rate": 1.35944235175333e-07, + "loss": 0.0217, + "step": 16545 + }, + { + "epoch": 0.32, + "learning_rate": 1.3594035183099685e-07, + "loss": 0.001, + "step": 16546 + }, + { + "epoch": 0.32, + "learning_rate": 1.3593646848666073e-07, + "loss": 0.0011, + "step": 16547 + }, + { + "epoch": 0.32, + "learning_rate": 1.3593258514232457e-07, + "loss": 0.0011, + "step": 16548 + }, + { + "epoch": 0.32, + "learning_rate": 1.3592870179798844e-07, + "loss": 0.001, + "step": 16549 + }, + { + "epoch": 0.32, + "learning_rate": 1.359248184536523e-07, + "loss": 0.8461, + "step": 16550 + }, + { + "epoch": 0.32, + "learning_rate": 1.3592093510931613e-07, + "loss": 0.0026, + "step": 16551 + }, + { + "epoch": 0.32, + "learning_rate": 1.3591705176497998e-07, + "loss": 0.0008, + "step": 16552 + }, + { + "epoch": 0.32, + "learning_rate": 1.3591316842064385e-07, + "loss": 0.4289, + "step": 16553 + }, + { + "epoch": 0.32, + "learning_rate": 1.359092850763077e-07, + "loss": 0.0011, + "step": 16554 + }, + { + "epoch": 0.32, + "learning_rate": 1.3590540173197157e-07, + "loss": 0.0011, + "step": 16555 + }, + { + "epoch": 0.32, + "learning_rate": 1.359015183876354e-07, + "loss": 0.2205, + "step": 16556 + }, + { + "epoch": 0.32, + "learning_rate": 1.3589763504329928e-07, + "loss": 0.0017, + "step": 16557 + }, + { + "epoch": 0.32, + "learning_rate": 1.3589375169896313e-07, + "loss": 0.001, + "step": 16558 + }, + { + "epoch": 0.32, + "learning_rate": 1.35889868354627e-07, + "loss": 0.0009, + "step": 16559 + }, + { + "epoch": 0.32, + "learning_rate": 1.3588598501029084e-07, + "loss": 0.0226, + "step": 16560 + }, + { + "epoch": 0.32, + "learning_rate": 1.3588210166595471e-07, + "loss": 0.0093, + "step": 16561 + }, + { + "epoch": 0.32, + "learning_rate": 1.3587821832161856e-07, + "loss": 0.0034, + "step": 16562 + }, + { + "epoch": 0.32, + "learning_rate": 1.3587433497728243e-07, + "loss": 0.0012, + "step": 16563 + }, + { + "epoch": 0.32, + "learning_rate": 1.3587045163294628e-07, + "loss": 0.0027, + "step": 16564 + }, + { + "epoch": 0.32, + "learning_rate": 1.3586656828861015e-07, + "loss": 0.0011, + "step": 16565 + }, + { + "epoch": 0.32, + "learning_rate": 1.35862684944274e-07, + "loss": 0.0011, + "step": 16566 + }, + { + "epoch": 0.32, + "learning_rate": 1.3585880159993786e-07, + "loss": 0.0015, + "step": 16567 + }, + { + "epoch": 0.32, + "learning_rate": 1.358549182556017e-07, + "loss": 0.0624, + "step": 16568 + }, + { + "epoch": 0.32, + "learning_rate": 1.3585103491126558e-07, + "loss": 0.0014, + "step": 16569 + }, + { + "epoch": 0.32, + "learning_rate": 1.3584715156692943e-07, + "loss": 0.001, + "step": 16570 + }, + { + "epoch": 0.32, + "learning_rate": 1.358432682225933e-07, + "loss": 0.649, + "step": 16571 + }, + { + "epoch": 0.32, + "learning_rate": 1.3583938487825714e-07, + "loss": 0.3621, + "step": 16572 + }, + { + "epoch": 0.32, + "learning_rate": 1.3583550153392101e-07, + "loss": 0.0008, + "step": 16573 + }, + { + "epoch": 0.32, + "learning_rate": 1.3583161818958486e-07, + "loss": 0.0009, + "step": 16574 + }, + { + "epoch": 0.32, + "learning_rate": 1.3582773484524873e-07, + "loss": 0.001, + "step": 16575 + }, + { + "epoch": 0.32, + "learning_rate": 1.3582385150091258e-07, + "loss": 0.0012, + "step": 16576 + }, + { + "epoch": 0.32, + "learning_rate": 1.3581996815657645e-07, + "loss": 0.0009, + "step": 16577 + }, + { + "epoch": 0.32, + "learning_rate": 1.358160848122403e-07, + "loss": 0.001, + "step": 16578 + }, + { + "epoch": 0.32, + "learning_rate": 1.3581220146790416e-07, + "loss": 0.001, + "step": 16579 + }, + { + "epoch": 0.32, + "learning_rate": 1.35808318123568e-07, + "loss": 0.0035, + "step": 16580 + }, + { + "epoch": 0.32, + "learning_rate": 1.3580443477923188e-07, + "loss": 0.0008, + "step": 16581 + }, + { + "epoch": 0.32, + "learning_rate": 1.3580055143489572e-07, + "loss": 0.001, + "step": 16582 + }, + { + "epoch": 0.32, + "learning_rate": 1.357966680905596e-07, + "loss": 0.7836, + "step": 16583 + }, + { + "epoch": 0.32, + "learning_rate": 1.3579278474622344e-07, + "loss": 0.0013, + "step": 16584 + }, + { + "epoch": 0.32, + "learning_rate": 1.357889014018873e-07, + "loss": 0.6263, + "step": 16585 + }, + { + "epoch": 0.32, + "learning_rate": 1.3578501805755116e-07, + "loss": 0.001, + "step": 16586 + }, + { + "epoch": 0.32, + "learning_rate": 1.3578113471321503e-07, + "loss": 0.001, + "step": 16587 + }, + { + "epoch": 0.32, + "learning_rate": 1.3577725136887887e-07, + "loss": 0.0011, + "step": 16588 + }, + { + "epoch": 0.32, + "learning_rate": 1.3577336802454275e-07, + "loss": 0.1658, + "step": 16589 + }, + { + "epoch": 0.32, + "learning_rate": 1.357694846802066e-07, + "loss": 0.0014, + "step": 16590 + }, + { + "epoch": 0.32, + "learning_rate": 1.3576560133587046e-07, + "loss": 0.001, + "step": 16591 + }, + { + "epoch": 0.32, + "learning_rate": 1.357617179915343e-07, + "loss": 0.0011, + "step": 16592 + }, + { + "epoch": 0.32, + "learning_rate": 1.3575783464719818e-07, + "loss": 0.001, + "step": 16593 + }, + { + "epoch": 0.32, + "learning_rate": 1.3575395130286202e-07, + "loss": 0.0022, + "step": 16594 + }, + { + "epoch": 0.32, + "learning_rate": 1.357500679585259e-07, + "loss": 0.002, + "step": 16595 + }, + { + "epoch": 0.32, + "learning_rate": 1.3574618461418974e-07, + "loss": 0.0014, + "step": 16596 + }, + { + "epoch": 0.32, + "learning_rate": 1.357423012698536e-07, + "loss": 0.0011, + "step": 16597 + }, + { + "epoch": 0.32, + "learning_rate": 1.3573841792551746e-07, + "loss": 0.5598, + "step": 16598 + }, + { + "epoch": 0.32, + "learning_rate": 1.357345345811813e-07, + "loss": 0.0009, + "step": 16599 + }, + { + "epoch": 0.32, + "learning_rate": 1.3573065123684517e-07, + "loss": 0.8245, + "step": 16600 + }, + { + "epoch": 0.32, + "learning_rate": 1.3572676789250902e-07, + "loss": 0.0016, + "step": 16601 + }, + { + "epoch": 0.32, + "learning_rate": 1.357228845481729e-07, + "loss": 0.0051, + "step": 16602 + }, + { + "epoch": 0.32, + "learning_rate": 1.3571900120383673e-07, + "loss": 0.0012, + "step": 16603 + }, + { + "epoch": 0.32, + "learning_rate": 1.357151178595006e-07, + "loss": 0.0011, + "step": 16604 + }, + { + "epoch": 0.32, + "learning_rate": 1.3571123451516445e-07, + "loss": 0.0014, + "step": 16605 + }, + { + "epoch": 0.32, + "learning_rate": 1.3570735117082832e-07, + "loss": 0.001, + "step": 16606 + }, + { + "epoch": 0.32, + "learning_rate": 1.3570346782649217e-07, + "loss": 0.0009, + "step": 16607 + }, + { + "epoch": 0.32, + "learning_rate": 1.3569958448215604e-07, + "loss": 0.0011, + "step": 16608 + }, + { + "epoch": 0.32, + "learning_rate": 1.3569570113781988e-07, + "loss": 0.2278, + "step": 16609 + }, + { + "epoch": 0.32, + "learning_rate": 1.3569181779348373e-07, + "loss": 0.005, + "step": 16610 + }, + { + "epoch": 0.32, + "learning_rate": 1.356879344491476e-07, + "loss": 0.001, + "step": 16611 + }, + { + "epoch": 0.32, + "learning_rate": 1.3568405110481145e-07, + "loss": 0.2621, + "step": 16612 + }, + { + "epoch": 0.32, + "learning_rate": 1.3568016776047532e-07, + "loss": 0.135, + "step": 16613 + }, + { + "epoch": 0.32, + "learning_rate": 1.3567628441613916e-07, + "loss": 0.001, + "step": 16614 + }, + { + "epoch": 0.32, + "learning_rate": 1.3567240107180303e-07, + "loss": 0.0192, + "step": 16615 + }, + { + "epoch": 0.32, + "learning_rate": 1.3566851772746688e-07, + "loss": 0.0021, + "step": 16616 + }, + { + "epoch": 0.32, + "learning_rate": 1.3566463438313075e-07, + "loss": 0.0019, + "step": 16617 + }, + { + "epoch": 0.32, + "learning_rate": 1.356607510387946e-07, + "loss": 0.0009, + "step": 16618 + }, + { + "epoch": 0.32, + "learning_rate": 1.3565686769445847e-07, + "loss": 0.0023, + "step": 16619 + }, + { + "epoch": 0.32, + "learning_rate": 1.356529843501223e-07, + "loss": 0.0007, + "step": 16620 + }, + { + "epoch": 0.32, + "learning_rate": 1.3564910100578618e-07, + "loss": 0.0012, + "step": 16621 + }, + { + "epoch": 0.32, + "learning_rate": 1.3564521766145003e-07, + "loss": 0.0009, + "step": 16622 + }, + { + "epoch": 0.32, + "learning_rate": 1.356413343171139e-07, + "loss": 0.9816, + "step": 16623 + }, + { + "epoch": 0.32, + "learning_rate": 1.3563745097277774e-07, + "loss": 0.0011, + "step": 16624 + }, + { + "epoch": 0.32, + "learning_rate": 1.3563356762844162e-07, + "loss": 0.042, + "step": 16625 + }, + { + "epoch": 0.32, + "learning_rate": 1.3562968428410546e-07, + "loss": 0.001, + "step": 16626 + }, + { + "epoch": 0.32, + "learning_rate": 1.3562580093976933e-07, + "loss": 0.0011, + "step": 16627 + }, + { + "epoch": 0.32, + "learning_rate": 1.3562191759543318e-07, + "loss": 0.0012, + "step": 16628 + }, + { + "epoch": 0.32, + "learning_rate": 1.3561803425109702e-07, + "loss": 0.0015, + "step": 16629 + }, + { + "epoch": 0.32, + "learning_rate": 1.356141509067609e-07, + "loss": 0.001, + "step": 16630 + }, + { + "epoch": 0.32, + "learning_rate": 1.3561026756242474e-07, + "loss": 0.001, + "step": 16631 + }, + { + "epoch": 0.32, + "learning_rate": 1.356063842180886e-07, + "loss": 0.7438, + "step": 16632 + }, + { + "epoch": 0.32, + "learning_rate": 1.3560250087375246e-07, + "loss": 0.001, + "step": 16633 + }, + { + "epoch": 0.32, + "learning_rate": 1.3559861752941633e-07, + "loss": 0.0013, + "step": 16634 + }, + { + "epoch": 0.32, + "learning_rate": 1.3559473418508017e-07, + "loss": 0.884, + "step": 16635 + }, + { + "epoch": 0.32, + "learning_rate": 1.3559085084074404e-07, + "loss": 0.0011, + "step": 16636 + }, + { + "epoch": 0.32, + "learning_rate": 1.355869674964079e-07, + "loss": 0.0011, + "step": 16637 + }, + { + "epoch": 0.32, + "learning_rate": 1.3558308415207176e-07, + "loss": 0.0013, + "step": 16638 + }, + { + "epoch": 0.32, + "learning_rate": 1.355792008077356e-07, + "loss": 0.0007, + "step": 16639 + }, + { + "epoch": 0.32, + "learning_rate": 1.3557531746339948e-07, + "loss": 0.003, + "step": 16640 + }, + { + "epoch": 0.32, + "learning_rate": 1.3557143411906332e-07, + "loss": 0.8555, + "step": 16641 + }, + { + "epoch": 0.32, + "learning_rate": 1.355675507747272e-07, + "loss": 0.001, + "step": 16642 + }, + { + "epoch": 0.32, + "learning_rate": 1.3556366743039104e-07, + "loss": 0.0124, + "step": 16643 + }, + { + "epoch": 0.32, + "learning_rate": 1.355597840860549e-07, + "loss": 0.0013, + "step": 16644 + }, + { + "epoch": 0.32, + "learning_rate": 1.3555590074171875e-07, + "loss": 0.0009, + "step": 16645 + }, + { + "epoch": 0.32, + "learning_rate": 1.3555201739738263e-07, + "loss": 0.001, + "step": 16646 + }, + { + "epoch": 0.32, + "learning_rate": 1.3554813405304647e-07, + "loss": 0.0012, + "step": 16647 + }, + { + "epoch": 0.32, + "learning_rate": 1.3554425070871034e-07, + "loss": 0.0013, + "step": 16648 + }, + { + "epoch": 0.32, + "learning_rate": 1.355403673643742e-07, + "loss": 0.0012, + "step": 16649 + }, + { + "epoch": 0.32, + "learning_rate": 1.3553648402003806e-07, + "loss": 0.0009, + "step": 16650 + }, + { + "epoch": 0.32, + "learning_rate": 1.355326006757019e-07, + "loss": 0.1578, + "step": 16651 + }, + { + "epoch": 0.32, + "learning_rate": 1.3552871733136578e-07, + "loss": 0.0016, + "step": 16652 + }, + { + "epoch": 0.32, + "learning_rate": 1.3552483398702962e-07, + "loss": 0.0015, + "step": 16653 + }, + { + "epoch": 0.32, + "learning_rate": 1.355209506426935e-07, + "loss": 0.4691, + "step": 16654 + }, + { + "epoch": 0.32, + "learning_rate": 1.3551706729835734e-07, + "loss": 0.245, + "step": 16655 + }, + { + "epoch": 0.32, + "learning_rate": 1.355131839540212e-07, + "loss": 0.0011, + "step": 16656 + }, + { + "epoch": 0.32, + "learning_rate": 1.3550930060968505e-07, + "loss": 0.0009, + "step": 16657 + }, + { + "epoch": 0.32, + "learning_rate": 1.3550541726534892e-07, + "loss": 0.0008, + "step": 16658 + }, + { + "epoch": 0.32, + "learning_rate": 1.3550153392101277e-07, + "loss": 0.0009, + "step": 16659 + }, + { + "epoch": 0.32, + "learning_rate": 1.3549765057667664e-07, + "loss": 0.0007, + "step": 16660 + }, + { + "epoch": 0.32, + "learning_rate": 1.3549376723234049e-07, + "loss": 0.0014, + "step": 16661 + }, + { + "epoch": 0.32, + "learning_rate": 1.3548988388800436e-07, + "loss": 0.0011, + "step": 16662 + }, + { + "epoch": 0.32, + "learning_rate": 1.354860005436682e-07, + "loss": 0.0014, + "step": 16663 + }, + { + "epoch": 0.32, + "learning_rate": 1.3548211719933207e-07, + "loss": 0.0008, + "step": 16664 + }, + { + "epoch": 0.32, + "learning_rate": 1.3547823385499592e-07, + "loss": 0.0009, + "step": 16665 + }, + { + "epoch": 0.32, + "learning_rate": 1.354743505106598e-07, + "loss": 0.0009, + "step": 16666 + }, + { + "epoch": 0.32, + "learning_rate": 1.354704671663236e-07, + "loss": 0.0013, + "step": 16667 + }, + { + "epoch": 0.32, + "learning_rate": 1.3546658382198748e-07, + "loss": 0.0009, + "step": 16668 + }, + { + "epoch": 0.32, + "learning_rate": 1.3546270047765133e-07, + "loss": 0.0022, + "step": 16669 + }, + { + "epoch": 0.32, + "learning_rate": 1.354588171333152e-07, + "loss": 0.0009, + "step": 16670 + }, + { + "epoch": 0.32, + "learning_rate": 1.3545493378897904e-07, + "loss": 0.3161, + "step": 16671 + }, + { + "epoch": 0.32, + "learning_rate": 1.3545105044464291e-07, + "loss": 0.0017, + "step": 16672 + }, + { + "epoch": 0.32, + "learning_rate": 1.3544716710030676e-07, + "loss": 0.0012, + "step": 16673 + }, + { + "epoch": 0.32, + "learning_rate": 1.3544328375597063e-07, + "loss": 0.0032, + "step": 16674 + }, + { + "epoch": 0.32, + "learning_rate": 1.3543940041163448e-07, + "loss": 0.001, + "step": 16675 + }, + { + "epoch": 0.32, + "learning_rate": 1.3543551706729835e-07, + "loss": 0.0013, + "step": 16676 + }, + { + "epoch": 0.32, + "learning_rate": 1.354316337229622e-07, + "loss": 0.0009, + "step": 16677 + }, + { + "epoch": 0.32, + "learning_rate": 1.3542775037862606e-07, + "loss": 0.0011, + "step": 16678 + }, + { + "epoch": 0.32, + "learning_rate": 1.354238670342899e-07, + "loss": 0.0011, + "step": 16679 + }, + { + "epoch": 0.32, + "learning_rate": 1.3541998368995378e-07, + "loss": 0.0014, + "step": 16680 + }, + { + "epoch": 0.32, + "learning_rate": 1.3541610034561762e-07, + "loss": 0.0085, + "step": 16681 + }, + { + "epoch": 0.32, + "learning_rate": 1.354122170012815e-07, + "loss": 0.0009, + "step": 16682 + }, + { + "epoch": 0.32, + "learning_rate": 1.3540833365694534e-07, + "loss": 0.001, + "step": 16683 + }, + { + "epoch": 0.32, + "learning_rate": 1.354044503126092e-07, + "loss": 0.0008, + "step": 16684 + }, + { + "epoch": 0.32, + "learning_rate": 1.3540056696827306e-07, + "loss": 0.0017, + "step": 16685 + }, + { + "epoch": 0.32, + "learning_rate": 1.3539668362393693e-07, + "loss": 0.0008, + "step": 16686 + }, + { + "epoch": 0.32, + "learning_rate": 1.3539280027960077e-07, + "loss": 0.0009, + "step": 16687 + }, + { + "epoch": 0.32, + "learning_rate": 1.3538891693526465e-07, + "loss": 0.001, + "step": 16688 + }, + { + "epoch": 0.32, + "learning_rate": 1.353850335909285e-07, + "loss": 0.0008, + "step": 16689 + }, + { + "epoch": 0.32, + "learning_rate": 1.3538115024659236e-07, + "loss": 0.0007, + "step": 16690 + }, + { + "epoch": 0.32, + "learning_rate": 1.353772669022562e-07, + "loss": 0.0011, + "step": 16691 + }, + { + "epoch": 0.32, + "learning_rate": 1.3537338355792008e-07, + "loss": 0.0012, + "step": 16692 + }, + { + "epoch": 0.32, + "learning_rate": 1.3536950021358392e-07, + "loss": 0.9981, + "step": 16693 + }, + { + "epoch": 0.32, + "learning_rate": 1.353656168692478e-07, + "loss": 0.61, + "step": 16694 + }, + { + "epoch": 0.32, + "learning_rate": 1.3536173352491164e-07, + "loss": 0.0007, + "step": 16695 + }, + { + "epoch": 0.32, + "learning_rate": 1.353578501805755e-07, + "loss": 0.0137, + "step": 16696 + }, + { + "epoch": 0.32, + "learning_rate": 1.3535396683623936e-07, + "loss": 0.0008, + "step": 16697 + }, + { + "epoch": 0.32, + "learning_rate": 1.3535008349190323e-07, + "loss": 0.0015, + "step": 16698 + }, + { + "epoch": 0.32, + "learning_rate": 1.3534620014756707e-07, + "loss": 0.0229, + "step": 16699 + }, + { + "epoch": 0.32, + "learning_rate": 1.3534231680323094e-07, + "loss": 0.0011, + "step": 16700 + }, + { + "epoch": 0.32, + "learning_rate": 1.353384334588948e-07, + "loss": 0.0012, + "step": 16701 + }, + { + "epoch": 0.32, + "learning_rate": 1.3533455011455866e-07, + "loss": 0.0011, + "step": 16702 + }, + { + "epoch": 0.32, + "learning_rate": 1.353306667702225e-07, + "loss": 0.0012, + "step": 16703 + }, + { + "epoch": 0.32, + "learning_rate": 1.3532678342588638e-07, + "loss": 0.4946, + "step": 16704 + }, + { + "epoch": 0.32, + "learning_rate": 1.3532290008155022e-07, + "loss": 0.0012, + "step": 16705 + }, + { + "epoch": 0.32, + "learning_rate": 1.353190167372141e-07, + "loss": 0.001, + "step": 16706 + }, + { + "epoch": 0.32, + "learning_rate": 1.3531513339287794e-07, + "loss": 0.0023, + "step": 16707 + }, + { + "epoch": 0.32, + "learning_rate": 1.353112500485418e-07, + "loss": 1.3106, + "step": 16708 + }, + { + "epoch": 0.32, + "learning_rate": 1.3530736670420566e-07, + "loss": 0.0011, + "step": 16709 + }, + { + "epoch": 0.32, + "learning_rate": 1.3530348335986953e-07, + "loss": 0.001, + "step": 16710 + }, + { + "epoch": 0.32, + "learning_rate": 1.3529960001553337e-07, + "loss": 0.0025, + "step": 16711 + }, + { + "epoch": 0.32, + "learning_rate": 1.3529571667119724e-07, + "loss": 0.0009, + "step": 16712 + }, + { + "epoch": 0.32, + "learning_rate": 1.352918333268611e-07, + "loss": 0.0022, + "step": 16713 + }, + { + "epoch": 0.32, + "learning_rate": 1.3528794998252496e-07, + "loss": 0.7908, + "step": 16714 + }, + { + "epoch": 0.32, + "learning_rate": 1.352840666381888e-07, + "loss": 0.3538, + "step": 16715 + }, + { + "epoch": 0.32, + "learning_rate": 1.3528018329385268e-07, + "loss": 0.0009, + "step": 16716 + }, + { + "epoch": 0.32, + "learning_rate": 1.3527629994951652e-07, + "loss": 0.0009, + "step": 16717 + }, + { + "epoch": 0.32, + "learning_rate": 1.352724166051804e-07, + "loss": 0.0479, + "step": 16718 + }, + { + "epoch": 0.32, + "learning_rate": 1.3526853326084424e-07, + "loss": 0.0023, + "step": 16719 + }, + { + "epoch": 0.32, + "learning_rate": 1.352646499165081e-07, + "loss": 0.0294, + "step": 16720 + }, + { + "epoch": 0.32, + "learning_rate": 1.3526076657217195e-07, + "loss": 0.0011, + "step": 16721 + }, + { + "epoch": 0.32, + "learning_rate": 1.3525688322783583e-07, + "loss": 0.9332, + "step": 16722 + }, + { + "epoch": 0.32, + "learning_rate": 1.3525299988349967e-07, + "loss": 0.0012, + "step": 16723 + }, + { + "epoch": 0.32, + "learning_rate": 1.3524911653916354e-07, + "loss": 0.0017, + "step": 16724 + }, + { + "epoch": 0.32, + "learning_rate": 1.3524523319482736e-07, + "loss": 1.1713, + "step": 16725 + }, + { + "epoch": 0.32, + "learning_rate": 1.3524134985049123e-07, + "loss": 0.0009, + "step": 16726 + }, + { + "epoch": 0.32, + "learning_rate": 1.3523746650615508e-07, + "loss": 0.0695, + "step": 16727 + }, + { + "epoch": 0.32, + "learning_rate": 1.3523358316181895e-07, + "loss": 0.0009, + "step": 16728 + }, + { + "epoch": 0.32, + "learning_rate": 1.352296998174828e-07, + "loss": 0.0008, + "step": 16729 + }, + { + "epoch": 0.32, + "learning_rate": 1.3522581647314667e-07, + "loss": 0.0022, + "step": 16730 + }, + { + "epoch": 0.32, + "learning_rate": 1.352219331288105e-07, + "loss": 0.0008, + "step": 16731 + }, + { + "epoch": 0.32, + "learning_rate": 1.3521804978447438e-07, + "loss": 0.0011, + "step": 16732 + }, + { + "epoch": 0.32, + "learning_rate": 1.3521416644013823e-07, + "loss": 0.0011, + "step": 16733 + }, + { + "epoch": 0.32, + "learning_rate": 1.352102830958021e-07, + "loss": 0.001, + "step": 16734 + }, + { + "epoch": 0.32, + "learning_rate": 1.3520639975146594e-07, + "loss": 0.0012, + "step": 16735 + }, + { + "epoch": 0.32, + "learning_rate": 1.3520251640712981e-07, + "loss": 0.0247, + "step": 16736 + }, + { + "epoch": 0.32, + "learning_rate": 1.3519863306279366e-07, + "loss": 0.0012, + "step": 16737 + }, + { + "epoch": 0.32, + "learning_rate": 1.3519474971845753e-07, + "loss": 0.0259, + "step": 16738 + }, + { + "epoch": 0.32, + "learning_rate": 1.3519086637412138e-07, + "loss": 0.134, + "step": 16739 + }, + { + "epoch": 0.32, + "learning_rate": 1.3518698302978525e-07, + "loss": 0.0016, + "step": 16740 + }, + { + "epoch": 0.32, + "learning_rate": 1.351830996854491e-07, + "loss": 0.0151, + "step": 16741 + }, + { + "epoch": 0.32, + "learning_rate": 1.3517921634111296e-07, + "loss": 0.0022, + "step": 16742 + }, + { + "epoch": 0.32, + "learning_rate": 1.351753329967768e-07, + "loss": 0.0014, + "step": 16743 + }, + { + "epoch": 0.32, + "learning_rate": 1.3517144965244068e-07, + "loss": 0.001, + "step": 16744 + }, + { + "epoch": 0.32, + "learning_rate": 1.3516756630810453e-07, + "loss": 0.002, + "step": 16745 + }, + { + "epoch": 0.32, + "learning_rate": 1.351636829637684e-07, + "loss": 0.0007, + "step": 16746 + }, + { + "epoch": 0.32, + "learning_rate": 1.3515979961943224e-07, + "loss": 0.0012, + "step": 16747 + }, + { + "epoch": 0.32, + "learning_rate": 1.3515591627509611e-07, + "loss": 0.5466, + "step": 16748 + }, + { + "epoch": 0.32, + "learning_rate": 1.3515203293075996e-07, + "loss": 0.0024, + "step": 16749 + }, + { + "epoch": 0.32, + "learning_rate": 1.3514814958642383e-07, + "loss": 0.001, + "step": 16750 + }, + { + "epoch": 0.32, + "learning_rate": 1.3514426624208768e-07, + "loss": 0.0008, + "step": 16751 + }, + { + "epoch": 0.32, + "learning_rate": 1.3514038289775155e-07, + "loss": 0.001, + "step": 16752 + }, + { + "epoch": 0.32, + "learning_rate": 1.351364995534154e-07, + "loss": 0.0035, + "step": 16753 + }, + { + "epoch": 0.32, + "learning_rate": 1.3513261620907926e-07, + "loss": 0.0011, + "step": 16754 + }, + { + "epoch": 0.33, + "learning_rate": 1.351287328647431e-07, + "loss": 0.0023, + "step": 16755 + }, + { + "epoch": 0.33, + "learning_rate": 1.3512484952040698e-07, + "loss": 0.0007, + "step": 16756 + }, + { + "epoch": 0.33, + "learning_rate": 1.3512096617607082e-07, + "loss": 0.0021, + "step": 16757 + }, + { + "epoch": 0.33, + "learning_rate": 1.351170828317347e-07, + "loss": 0.0012, + "step": 16758 + }, + { + "epoch": 0.33, + "learning_rate": 1.3511319948739854e-07, + "loss": 0.001, + "step": 16759 + }, + { + "epoch": 0.33, + "learning_rate": 1.351093161430624e-07, + "loss": 0.0014, + "step": 16760 + }, + { + "epoch": 0.33, + "learning_rate": 1.3510543279872626e-07, + "loss": 0.0012, + "step": 16761 + }, + { + "epoch": 0.33, + "learning_rate": 1.3510154945439013e-07, + "loss": 0.2087, + "step": 16762 + }, + { + "epoch": 0.33, + "learning_rate": 1.3509766611005397e-07, + "loss": 0.0009, + "step": 16763 + }, + { + "epoch": 0.33, + "learning_rate": 1.3509378276571785e-07, + "loss": 0.001, + "step": 16764 + }, + { + "epoch": 0.33, + "learning_rate": 1.350898994213817e-07, + "loss": 0.0058, + "step": 16765 + }, + { + "epoch": 0.33, + "learning_rate": 1.3508601607704556e-07, + "loss": 0.0011, + "step": 16766 + }, + { + "epoch": 0.33, + "learning_rate": 1.350821327327094e-07, + "loss": 0.0009, + "step": 16767 + }, + { + "epoch": 0.33, + "learning_rate": 1.3507824938837328e-07, + "loss": 0.0009, + "step": 16768 + }, + { + "epoch": 0.33, + "learning_rate": 1.3507436604403712e-07, + "loss": 0.1986, + "step": 16769 + }, + { + "epoch": 0.33, + "learning_rate": 1.35070482699701e-07, + "loss": 0.0013, + "step": 16770 + }, + { + "epoch": 0.33, + "learning_rate": 1.3506659935536484e-07, + "loss": 0.0008, + "step": 16771 + }, + { + "epoch": 0.33, + "learning_rate": 1.350627160110287e-07, + "loss": 0.0011, + "step": 16772 + }, + { + "epoch": 0.33, + "learning_rate": 1.3505883266669256e-07, + "loss": 0.0029, + "step": 16773 + }, + { + "epoch": 0.33, + "learning_rate": 1.3505494932235643e-07, + "loss": 0.0011, + "step": 16774 + }, + { + "epoch": 0.33, + "learning_rate": 1.3505106597802027e-07, + "loss": 0.0009, + "step": 16775 + }, + { + "epoch": 0.33, + "learning_rate": 1.3504718263368412e-07, + "loss": 0.0009, + "step": 16776 + }, + { + "epoch": 0.33, + "learning_rate": 1.35043299289348e-07, + "loss": 0.005, + "step": 16777 + }, + { + "epoch": 0.33, + "learning_rate": 1.3503941594501183e-07, + "loss": 0.0009, + "step": 16778 + }, + { + "epoch": 0.33, + "learning_rate": 1.350355326006757e-07, + "loss": 0.0009, + "step": 16779 + }, + { + "epoch": 0.33, + "learning_rate": 1.3503164925633955e-07, + "loss": 0.0009, + "step": 16780 + }, + { + "epoch": 0.33, + "learning_rate": 1.3502776591200342e-07, + "loss": 0.0009, + "step": 16781 + }, + { + "epoch": 0.33, + "learning_rate": 1.3502388256766727e-07, + "loss": 0.0168, + "step": 16782 + }, + { + "epoch": 0.33, + "learning_rate": 1.350199992233311e-07, + "loss": 0.0009, + "step": 16783 + }, + { + "epoch": 0.33, + "learning_rate": 1.3501611587899498e-07, + "loss": 0.0008, + "step": 16784 + }, + { + "epoch": 0.33, + "learning_rate": 1.3501223253465883e-07, + "loss": 0.001, + "step": 16785 + }, + { + "epoch": 0.33, + "learning_rate": 1.350083491903227e-07, + "loss": 0.0013, + "step": 16786 + }, + { + "epoch": 0.33, + "learning_rate": 1.3500446584598655e-07, + "loss": 0.5574, + "step": 16787 + }, + { + "epoch": 0.33, + "learning_rate": 1.3500058250165042e-07, + "loss": 0.0013, + "step": 16788 + }, + { + "epoch": 0.33, + "learning_rate": 1.3499669915731426e-07, + "loss": 0.0031, + "step": 16789 + }, + { + "epoch": 0.33, + "learning_rate": 1.3499281581297813e-07, + "loss": 0.0109, + "step": 16790 + }, + { + "epoch": 0.33, + "learning_rate": 1.3498893246864198e-07, + "loss": 0.0258, + "step": 16791 + }, + { + "epoch": 0.33, + "learning_rate": 1.3498504912430585e-07, + "loss": 0.0007, + "step": 16792 + }, + { + "epoch": 0.33, + "learning_rate": 1.349811657799697e-07, + "loss": 0.0008, + "step": 16793 + }, + { + "epoch": 0.33, + "learning_rate": 1.3497728243563357e-07, + "loss": 0.0015, + "step": 16794 + }, + { + "epoch": 0.33, + "learning_rate": 1.349733990912974e-07, + "loss": 0.0013, + "step": 16795 + }, + { + "epoch": 0.33, + "learning_rate": 1.3496951574696128e-07, + "loss": 0.2233, + "step": 16796 + }, + { + "epoch": 0.33, + "learning_rate": 1.3496563240262513e-07, + "loss": 0.0017, + "step": 16797 + }, + { + "epoch": 0.33, + "learning_rate": 1.34961749058289e-07, + "loss": 0.0115, + "step": 16798 + }, + { + "epoch": 0.33, + "learning_rate": 1.3495786571395284e-07, + "loss": 0.0787, + "step": 16799 + }, + { + "epoch": 0.33, + "learning_rate": 1.3495398236961672e-07, + "loss": 0.0013, + "step": 16800 + }, + { + "epoch": 0.33, + "learning_rate": 1.3495009902528056e-07, + "loss": 0.001, + "step": 16801 + }, + { + "epoch": 0.33, + "learning_rate": 1.3494621568094443e-07, + "loss": 0.0013, + "step": 16802 + }, + { + "epoch": 0.33, + "learning_rate": 1.3494233233660828e-07, + "loss": 1.0507, + "step": 16803 + }, + { + "epoch": 0.33, + "learning_rate": 1.3493844899227215e-07, + "loss": 0.6185, + "step": 16804 + }, + { + "epoch": 0.33, + "learning_rate": 1.34934565647936e-07, + "loss": 0.001, + "step": 16805 + }, + { + "epoch": 0.33, + "learning_rate": 1.3493068230359984e-07, + "loss": 0.008, + "step": 16806 + }, + { + "epoch": 0.33, + "learning_rate": 1.349267989592637e-07, + "loss": 0.0008, + "step": 16807 + }, + { + "epoch": 0.33, + "learning_rate": 1.3492291561492756e-07, + "loss": 0.002, + "step": 16808 + }, + { + "epoch": 0.33, + "learning_rate": 1.3491903227059143e-07, + "loss": 0.0011, + "step": 16809 + }, + { + "epoch": 0.33, + "learning_rate": 1.3491514892625527e-07, + "loss": 0.0015, + "step": 16810 + }, + { + "epoch": 0.33, + "learning_rate": 1.3491126558191914e-07, + "loss": 0.0009, + "step": 16811 + }, + { + "epoch": 0.33, + "learning_rate": 1.34907382237583e-07, + "loss": 0.002, + "step": 16812 + }, + { + "epoch": 0.33, + "learning_rate": 1.3490349889324686e-07, + "loss": 0.0013, + "step": 16813 + }, + { + "epoch": 0.33, + "learning_rate": 1.348996155489107e-07, + "loss": 0.001, + "step": 16814 + }, + { + "epoch": 0.33, + "learning_rate": 1.3489573220457458e-07, + "loss": 0.0007, + "step": 16815 + }, + { + "epoch": 0.33, + "learning_rate": 1.3489184886023842e-07, + "loss": 0.0011, + "step": 16816 + }, + { + "epoch": 0.33, + "learning_rate": 1.348879655159023e-07, + "loss": 0.0064, + "step": 16817 + }, + { + "epoch": 0.33, + "learning_rate": 1.3488408217156614e-07, + "loss": 0.0009, + "step": 16818 + }, + { + "epoch": 0.33, + "learning_rate": 1.3488019882723e-07, + "loss": 0.0012, + "step": 16819 + }, + { + "epoch": 0.33, + "learning_rate": 1.3487631548289385e-07, + "loss": 0.0153, + "step": 16820 + }, + { + "epoch": 0.33, + "learning_rate": 1.3487243213855773e-07, + "loss": 0.0023, + "step": 16821 + }, + { + "epoch": 0.33, + "learning_rate": 1.3486854879422157e-07, + "loss": 0.001, + "step": 16822 + }, + { + "epoch": 0.33, + "learning_rate": 1.3486466544988544e-07, + "loss": 0.0008, + "step": 16823 + }, + { + "epoch": 0.33, + "learning_rate": 1.348607821055493e-07, + "loss": 0.1672, + "step": 16824 + }, + { + "epoch": 0.33, + "learning_rate": 1.3485689876121316e-07, + "loss": 0.0007, + "step": 16825 + }, + { + "epoch": 0.33, + "learning_rate": 1.34853015416877e-07, + "loss": 0.0008, + "step": 16826 + }, + { + "epoch": 0.33, + "learning_rate": 1.3484913207254088e-07, + "loss": 0.001, + "step": 16827 + }, + { + "epoch": 0.33, + "learning_rate": 1.3484524872820472e-07, + "loss": 0.0306, + "step": 16828 + }, + { + "epoch": 0.33, + "learning_rate": 1.348413653838686e-07, + "loss": 0.0008, + "step": 16829 + }, + { + "epoch": 0.33, + "learning_rate": 1.3483748203953244e-07, + "loss": 0.0008, + "step": 16830 + }, + { + "epoch": 0.33, + "learning_rate": 1.348335986951963e-07, + "loss": 0.0071, + "step": 16831 + }, + { + "epoch": 0.33, + "learning_rate": 1.3482971535086015e-07, + "loss": 0.0012, + "step": 16832 + }, + { + "epoch": 0.33, + "learning_rate": 1.3482583200652402e-07, + "loss": 0.001, + "step": 16833 + }, + { + "epoch": 0.33, + "learning_rate": 1.3482194866218787e-07, + "loss": 0.0013, + "step": 16834 + }, + { + "epoch": 0.33, + "learning_rate": 1.3481806531785174e-07, + "loss": 0.0011, + "step": 16835 + }, + { + "epoch": 0.33, + "learning_rate": 1.3481418197351559e-07, + "loss": 0.0015, + "step": 16836 + }, + { + "epoch": 0.33, + "learning_rate": 1.3481029862917946e-07, + "loss": 0.0145, + "step": 16837 + }, + { + "epoch": 0.33, + "learning_rate": 1.348064152848433e-07, + "loss": 0.0046, + "step": 16838 + }, + { + "epoch": 0.33, + "learning_rate": 1.3480253194050717e-07, + "loss": 0.0009, + "step": 16839 + }, + { + "epoch": 0.33, + "learning_rate": 1.3479864859617102e-07, + "loss": 0.0223, + "step": 16840 + }, + { + "epoch": 0.33, + "learning_rate": 1.3479476525183486e-07, + "loss": 0.001, + "step": 16841 + }, + { + "epoch": 0.33, + "learning_rate": 1.347908819074987e-07, + "loss": 0.001, + "step": 16842 + }, + { + "epoch": 0.33, + "learning_rate": 1.3478699856316258e-07, + "loss": 0.0009, + "step": 16843 + }, + { + "epoch": 0.33, + "learning_rate": 1.3478311521882643e-07, + "loss": 0.0012, + "step": 16844 + }, + { + "epoch": 0.33, + "learning_rate": 1.347792318744903e-07, + "loss": 0.6105, + "step": 16845 + }, + { + "epoch": 0.33, + "learning_rate": 1.3477534853015414e-07, + "loss": 0.0008, + "step": 16846 + }, + { + "epoch": 0.33, + "learning_rate": 1.3477146518581801e-07, + "loss": 0.9178, + "step": 16847 + }, + { + "epoch": 0.33, + "learning_rate": 1.3476758184148186e-07, + "loss": 0.0006, + "step": 16848 + }, + { + "epoch": 0.33, + "learning_rate": 1.3476369849714573e-07, + "loss": 0.001, + "step": 16849 + }, + { + "epoch": 0.33, + "learning_rate": 1.3475981515280958e-07, + "loss": 0.0093, + "step": 16850 + }, + { + "epoch": 0.33, + "learning_rate": 1.3475593180847345e-07, + "loss": 0.001, + "step": 16851 + }, + { + "epoch": 0.33, + "learning_rate": 1.347520484641373e-07, + "loss": 0.0014, + "step": 16852 + }, + { + "epoch": 0.33, + "learning_rate": 1.3474816511980116e-07, + "loss": 0.0011, + "step": 16853 + }, + { + "epoch": 0.33, + "learning_rate": 1.34744281775465e-07, + "loss": 0.0012, + "step": 16854 + }, + { + "epoch": 0.33, + "learning_rate": 1.3474039843112888e-07, + "loss": 0.0009, + "step": 16855 + }, + { + "epoch": 0.33, + "learning_rate": 1.3473651508679272e-07, + "loss": 0.0008, + "step": 16856 + }, + { + "epoch": 0.33, + "learning_rate": 1.347326317424566e-07, + "loss": 0.0012, + "step": 16857 + }, + { + "epoch": 0.33, + "learning_rate": 1.3472874839812044e-07, + "loss": 0.001, + "step": 16858 + }, + { + "epoch": 0.33, + "learning_rate": 1.347248650537843e-07, + "loss": 0.0011, + "step": 16859 + }, + { + "epoch": 0.33, + "learning_rate": 1.3472098170944816e-07, + "loss": 0.0018, + "step": 16860 + }, + { + "epoch": 0.33, + "learning_rate": 1.3471709836511203e-07, + "loss": 0.1588, + "step": 16861 + }, + { + "epoch": 0.33, + "learning_rate": 1.3471321502077587e-07, + "loss": 0.3826, + "step": 16862 + }, + { + "epoch": 0.33, + "learning_rate": 1.3470933167643975e-07, + "loss": 0.2735, + "step": 16863 + }, + { + "epoch": 0.33, + "learning_rate": 1.347054483321036e-07, + "loss": 0.0012, + "step": 16864 + }, + { + "epoch": 0.33, + "learning_rate": 1.3470156498776746e-07, + "loss": 0.0011, + "step": 16865 + }, + { + "epoch": 0.33, + "learning_rate": 1.346976816434313e-07, + "loss": 1.0079, + "step": 16866 + }, + { + "epoch": 0.33, + "learning_rate": 1.3469379829909518e-07, + "loss": 0.3181, + "step": 16867 + }, + { + "epoch": 0.33, + "learning_rate": 1.3468991495475902e-07, + "loss": 0.0013, + "step": 16868 + }, + { + "epoch": 0.33, + "learning_rate": 1.346860316104229e-07, + "loss": 0.0038, + "step": 16869 + }, + { + "epoch": 0.33, + "learning_rate": 1.3468214826608674e-07, + "loss": 0.001, + "step": 16870 + }, + { + "epoch": 0.33, + "learning_rate": 1.346782649217506e-07, + "loss": 0.0018, + "step": 16871 + }, + { + "epoch": 0.33, + "learning_rate": 1.3467438157741446e-07, + "loss": 0.0012, + "step": 16872 + }, + { + "epoch": 0.33, + "learning_rate": 1.3467049823307833e-07, + "loss": 0.0009, + "step": 16873 + }, + { + "epoch": 0.33, + "learning_rate": 1.3466661488874217e-07, + "loss": 0.0014, + "step": 16874 + }, + { + "epoch": 0.33, + "learning_rate": 1.3466273154440604e-07, + "loss": 0.4115, + "step": 16875 + }, + { + "epoch": 0.33, + "learning_rate": 1.346588482000699e-07, + "loss": 0.001, + "step": 16876 + }, + { + "epoch": 0.33, + "learning_rate": 1.3465496485573376e-07, + "loss": 0.0007, + "step": 16877 + }, + { + "epoch": 0.33, + "learning_rate": 1.346510815113976e-07, + "loss": 0.0013, + "step": 16878 + }, + { + "epoch": 0.33, + "learning_rate": 1.3464719816706148e-07, + "loss": 0.2182, + "step": 16879 + }, + { + "epoch": 0.33, + "learning_rate": 1.3464331482272532e-07, + "loss": 0.0012, + "step": 16880 + }, + { + "epoch": 0.33, + "learning_rate": 1.346394314783892e-07, + "loss": 0.001, + "step": 16881 + }, + { + "epoch": 0.33, + "learning_rate": 1.3463554813405304e-07, + "loss": 0.0009, + "step": 16882 + }, + { + "epoch": 0.33, + "learning_rate": 1.346316647897169e-07, + "loss": 0.0008, + "step": 16883 + }, + { + "epoch": 0.33, + "learning_rate": 1.3462778144538076e-07, + "loss": 0.0009, + "step": 16884 + }, + { + "epoch": 0.33, + "learning_rate": 1.3462389810104463e-07, + "loss": 0.0035, + "step": 16885 + }, + { + "epoch": 0.33, + "learning_rate": 1.3462001475670847e-07, + "loss": 0.0013, + "step": 16886 + }, + { + "epoch": 0.33, + "learning_rate": 1.3461613141237234e-07, + "loss": 0.001, + "step": 16887 + }, + { + "epoch": 0.33, + "learning_rate": 1.346122480680362e-07, + "loss": 0.0009, + "step": 16888 + }, + { + "epoch": 0.33, + "learning_rate": 1.3460836472370006e-07, + "loss": 0.0018, + "step": 16889 + }, + { + "epoch": 0.33, + "learning_rate": 1.346044813793639e-07, + "loss": 0.001, + "step": 16890 + }, + { + "epoch": 0.33, + "learning_rate": 1.3460059803502778e-07, + "loss": 0.0354, + "step": 16891 + }, + { + "epoch": 0.33, + "learning_rate": 1.3459671469069162e-07, + "loss": 0.0011, + "step": 16892 + }, + { + "epoch": 0.33, + "learning_rate": 1.345928313463555e-07, + "loss": 0.001, + "step": 16893 + }, + { + "epoch": 0.33, + "learning_rate": 1.3458894800201934e-07, + "loss": 0.8299, + "step": 16894 + }, + { + "epoch": 0.33, + "learning_rate": 1.345850646576832e-07, + "loss": 0.0058, + "step": 16895 + }, + { + "epoch": 0.33, + "learning_rate": 1.3458118131334705e-07, + "loss": 0.0009, + "step": 16896 + }, + { + "epoch": 0.33, + "learning_rate": 1.3457729796901093e-07, + "loss": 0.2073, + "step": 16897 + }, + { + "epoch": 0.33, + "learning_rate": 1.3457341462467477e-07, + "loss": 1.1285, + "step": 16898 + }, + { + "epoch": 0.33, + "learning_rate": 1.3456953128033862e-07, + "loss": 0.0013, + "step": 16899 + }, + { + "epoch": 0.33, + "learning_rate": 1.3456564793600246e-07, + "loss": 0.226, + "step": 16900 + }, + { + "epoch": 0.33, + "learning_rate": 1.3456176459166633e-07, + "loss": 0.0156, + "step": 16901 + }, + { + "epoch": 0.33, + "learning_rate": 1.3455788124733018e-07, + "loss": 0.0009, + "step": 16902 + }, + { + "epoch": 0.33, + "learning_rate": 1.3455399790299405e-07, + "loss": 0.0011, + "step": 16903 + }, + { + "epoch": 0.33, + "learning_rate": 1.345501145586579e-07, + "loss": 0.0008, + "step": 16904 + }, + { + "epoch": 0.33, + "learning_rate": 1.3454623121432177e-07, + "loss": 0.001, + "step": 16905 + }, + { + "epoch": 0.33, + "learning_rate": 1.345423478699856e-07, + "loss": 0.0027, + "step": 16906 + }, + { + "epoch": 0.33, + "learning_rate": 1.3453846452564948e-07, + "loss": 0.0009, + "step": 16907 + }, + { + "epoch": 0.33, + "learning_rate": 1.3453458118131333e-07, + "loss": 0.0012, + "step": 16908 + }, + { + "epoch": 0.33, + "learning_rate": 1.345306978369772e-07, + "loss": 0.0009, + "step": 16909 + }, + { + "epoch": 0.33, + "learning_rate": 1.3452681449264104e-07, + "loss": 0.0009, + "step": 16910 + }, + { + "epoch": 0.33, + "learning_rate": 1.3452293114830492e-07, + "loss": 0.0008, + "step": 16911 + }, + { + "epoch": 0.33, + "learning_rate": 1.3451904780396876e-07, + "loss": 0.1081, + "step": 16912 + }, + { + "epoch": 0.33, + "learning_rate": 1.3451516445963263e-07, + "loss": 0.0012, + "step": 16913 + }, + { + "epoch": 0.33, + "learning_rate": 1.3451128111529648e-07, + "loss": 0.0013, + "step": 16914 + }, + { + "epoch": 0.33, + "learning_rate": 1.3450739777096035e-07, + "loss": 0.0009, + "step": 16915 + }, + { + "epoch": 0.33, + "learning_rate": 1.345035144266242e-07, + "loss": 1.1202, + "step": 16916 + }, + { + "epoch": 0.33, + "learning_rate": 1.3449963108228806e-07, + "loss": 0.001, + "step": 16917 + }, + { + "epoch": 0.33, + "learning_rate": 1.344957477379519e-07, + "loss": 0.0013, + "step": 16918 + }, + { + "epoch": 0.33, + "learning_rate": 1.3449186439361578e-07, + "loss": 0.4484, + "step": 16919 + }, + { + "epoch": 0.33, + "learning_rate": 1.3448798104927963e-07, + "loss": 0.0013, + "step": 16920 + }, + { + "epoch": 0.33, + "learning_rate": 1.344840977049435e-07, + "loss": 1.1404, + "step": 16921 + }, + { + "epoch": 0.33, + "learning_rate": 1.3448021436060734e-07, + "loss": 0.0012, + "step": 16922 + }, + { + "epoch": 0.33, + "learning_rate": 1.3447633101627121e-07, + "loss": 0.0013, + "step": 16923 + }, + { + "epoch": 0.33, + "learning_rate": 1.3447244767193506e-07, + "loss": 0.0012, + "step": 16924 + }, + { + "epoch": 0.33, + "learning_rate": 1.3446856432759893e-07, + "loss": 0.0016, + "step": 16925 + }, + { + "epoch": 0.33, + "learning_rate": 1.3446468098326278e-07, + "loss": 0.0015, + "step": 16926 + }, + { + "epoch": 0.33, + "learning_rate": 1.3446079763892665e-07, + "loss": 0.0009, + "step": 16927 + }, + { + "epoch": 0.33, + "learning_rate": 1.344569142945905e-07, + "loss": 0.0011, + "step": 16928 + }, + { + "epoch": 0.33, + "learning_rate": 1.3445303095025436e-07, + "loss": 0.0057, + "step": 16929 + }, + { + "epoch": 0.33, + "learning_rate": 1.344491476059182e-07, + "loss": 0.3079, + "step": 16930 + }, + { + "epoch": 0.33, + "learning_rate": 1.3444526426158208e-07, + "loss": 0.0011, + "step": 16931 + }, + { + "epoch": 0.33, + "learning_rate": 1.3444138091724592e-07, + "loss": 0.7472, + "step": 16932 + }, + { + "epoch": 0.33, + "learning_rate": 1.344374975729098e-07, + "loss": 0.0009, + "step": 16933 + }, + { + "epoch": 0.33, + "learning_rate": 1.3443361422857364e-07, + "loss": 0.001, + "step": 16934 + }, + { + "epoch": 0.33, + "learning_rate": 1.344297308842375e-07, + "loss": 0.001, + "step": 16935 + }, + { + "epoch": 0.33, + "learning_rate": 1.3442584753990136e-07, + "loss": 0.1113, + "step": 16936 + }, + { + "epoch": 0.33, + "learning_rate": 1.3442196419556523e-07, + "loss": 0.0008, + "step": 16937 + }, + { + "epoch": 0.33, + "learning_rate": 1.3441808085122907e-07, + "loss": 0.0016, + "step": 16938 + }, + { + "epoch": 0.33, + "learning_rate": 1.3441419750689295e-07, + "loss": 0.0012, + "step": 16939 + }, + { + "epoch": 0.33, + "learning_rate": 1.344103141625568e-07, + "loss": 0.0017, + "step": 16940 + }, + { + "epoch": 0.33, + "learning_rate": 1.3440643081822066e-07, + "loss": 0.0541, + "step": 16941 + }, + { + "epoch": 0.33, + "learning_rate": 1.344025474738845e-07, + "loss": 0.1593, + "step": 16942 + }, + { + "epoch": 0.33, + "learning_rate": 1.3439866412954838e-07, + "loss": 0.0032, + "step": 16943 + }, + { + "epoch": 0.33, + "learning_rate": 1.3439478078521222e-07, + "loss": 0.0014, + "step": 16944 + }, + { + "epoch": 0.33, + "learning_rate": 1.343908974408761e-07, + "loss": 0.0009, + "step": 16945 + }, + { + "epoch": 0.33, + "learning_rate": 1.3438701409653994e-07, + "loss": 0.0013, + "step": 16946 + }, + { + "epoch": 0.33, + "learning_rate": 1.343831307522038e-07, + "loss": 0.0008, + "step": 16947 + }, + { + "epoch": 0.33, + "learning_rate": 1.3437924740786766e-07, + "loss": 1.1919, + "step": 16948 + }, + { + "epoch": 0.33, + "learning_rate": 1.3437536406353153e-07, + "loss": 0.002, + "step": 16949 + }, + { + "epoch": 0.33, + "learning_rate": 1.3437148071919537e-07, + "loss": 0.001, + "step": 16950 + }, + { + "epoch": 0.33, + "learning_rate": 1.3436759737485924e-07, + "loss": 0.001, + "step": 16951 + }, + { + "epoch": 0.33, + "learning_rate": 1.343637140305231e-07, + "loss": 0.0012, + "step": 16952 + }, + { + "epoch": 0.33, + "learning_rate": 1.3435983068618693e-07, + "loss": 0.0013, + "step": 16953 + }, + { + "epoch": 0.33, + "learning_rate": 1.343559473418508e-07, + "loss": 0.0013, + "step": 16954 + }, + { + "epoch": 0.33, + "learning_rate": 1.3435206399751465e-07, + "loss": 0.1694, + "step": 16955 + }, + { + "epoch": 0.33, + "learning_rate": 1.3434818065317852e-07, + "loss": 0.001, + "step": 16956 + }, + { + "epoch": 0.33, + "learning_rate": 1.3434429730884237e-07, + "loss": 0.0013, + "step": 16957 + }, + { + "epoch": 0.33, + "learning_rate": 1.343404139645062e-07, + "loss": 0.1021, + "step": 16958 + }, + { + "epoch": 0.33, + "learning_rate": 1.3433653062017008e-07, + "loss": 0.0007, + "step": 16959 + }, + { + "epoch": 0.33, + "learning_rate": 1.3433264727583393e-07, + "loss": 0.1483, + "step": 16960 + }, + { + "epoch": 0.33, + "learning_rate": 1.343287639314978e-07, + "loss": 0.0025, + "step": 16961 + }, + { + "epoch": 0.33, + "learning_rate": 1.3432488058716165e-07, + "loss": 0.0012, + "step": 16962 + }, + { + "epoch": 0.33, + "learning_rate": 1.3432099724282552e-07, + "loss": 0.0008, + "step": 16963 + }, + { + "epoch": 0.33, + "learning_rate": 1.3431711389848936e-07, + "loss": 0.0009, + "step": 16964 + }, + { + "epoch": 0.33, + "learning_rate": 1.3431323055415323e-07, + "loss": 0.0086, + "step": 16965 + }, + { + "epoch": 0.33, + "learning_rate": 1.3430934720981708e-07, + "loss": 0.0475, + "step": 16966 + }, + { + "epoch": 0.33, + "learning_rate": 1.3430546386548095e-07, + "loss": 0.0009, + "step": 16967 + }, + { + "epoch": 0.33, + "learning_rate": 1.343015805211448e-07, + "loss": 0.0011, + "step": 16968 + }, + { + "epoch": 0.33, + "learning_rate": 1.3429769717680867e-07, + "loss": 0.0016, + "step": 16969 + }, + { + "epoch": 0.33, + "learning_rate": 1.342938138324725e-07, + "loss": 0.0011, + "step": 16970 + }, + { + "epoch": 0.33, + "learning_rate": 1.3428993048813638e-07, + "loss": 0.0008, + "step": 16971 + }, + { + "epoch": 0.33, + "learning_rate": 1.3428604714380023e-07, + "loss": 0.0012, + "step": 16972 + }, + { + "epoch": 0.33, + "learning_rate": 1.342821637994641e-07, + "loss": 0.0009, + "step": 16973 + }, + { + "epoch": 0.33, + "learning_rate": 1.3427828045512794e-07, + "loss": 0.0015, + "step": 16974 + }, + { + "epoch": 0.33, + "learning_rate": 1.3427439711079182e-07, + "loss": 0.001, + "step": 16975 + }, + { + "epoch": 0.33, + "learning_rate": 1.3427051376645566e-07, + "loss": 0.001, + "step": 16976 + }, + { + "epoch": 0.33, + "learning_rate": 1.3426663042211953e-07, + "loss": 0.0011, + "step": 16977 + }, + { + "epoch": 0.33, + "learning_rate": 1.3426274707778338e-07, + "loss": 0.0009, + "step": 16978 + }, + { + "epoch": 0.33, + "learning_rate": 1.3425886373344725e-07, + "loss": 0.0306, + "step": 16979 + }, + { + "epoch": 0.33, + "learning_rate": 1.342549803891111e-07, + "loss": 0.0012, + "step": 16980 + }, + { + "epoch": 0.33, + "learning_rate": 1.3425109704477497e-07, + "loss": 0.0008, + "step": 16981 + }, + { + "epoch": 0.33, + "learning_rate": 1.342472137004388e-07, + "loss": 0.001, + "step": 16982 + }, + { + "epoch": 0.33, + "learning_rate": 1.3424333035610266e-07, + "loss": 0.0008, + "step": 16983 + }, + { + "epoch": 0.33, + "learning_rate": 1.3423944701176653e-07, + "loss": 0.0014, + "step": 16984 + }, + { + "epoch": 0.33, + "learning_rate": 1.3423556366743037e-07, + "loss": 0.0018, + "step": 16985 + }, + { + "epoch": 0.33, + "learning_rate": 1.3423168032309424e-07, + "loss": 0.0304, + "step": 16986 + }, + { + "epoch": 0.33, + "learning_rate": 1.342277969787581e-07, + "loss": 0.0007, + "step": 16987 + }, + { + "epoch": 0.33, + "learning_rate": 1.3422391363442196e-07, + "loss": 0.0009, + "step": 16988 + }, + { + "epoch": 0.33, + "learning_rate": 1.342200302900858e-07, + "loss": 0.0083, + "step": 16989 + }, + { + "epoch": 0.33, + "learning_rate": 1.3421614694574968e-07, + "loss": 0.001, + "step": 16990 + }, + { + "epoch": 0.33, + "learning_rate": 1.3421226360141352e-07, + "loss": 0.0011, + "step": 16991 + }, + { + "epoch": 0.33, + "learning_rate": 1.342083802570774e-07, + "loss": 0.0012, + "step": 16992 + }, + { + "epoch": 0.33, + "learning_rate": 1.3420449691274124e-07, + "loss": 0.0043, + "step": 16993 + }, + { + "epoch": 0.33, + "learning_rate": 1.342006135684051e-07, + "loss": 0.2891, + "step": 16994 + }, + { + "epoch": 0.33, + "learning_rate": 1.3419673022406895e-07, + "loss": 0.4827, + "step": 16995 + }, + { + "epoch": 0.33, + "learning_rate": 1.3419284687973283e-07, + "loss": 0.0021, + "step": 16996 + }, + { + "epoch": 0.33, + "learning_rate": 1.3418896353539667e-07, + "loss": 0.001, + "step": 16997 + }, + { + "epoch": 0.33, + "learning_rate": 1.3418508019106054e-07, + "loss": 0.0009, + "step": 16998 + }, + { + "epoch": 0.33, + "learning_rate": 1.341811968467244e-07, + "loss": 1.0288, + "step": 16999 + }, + { + "epoch": 0.33, + "learning_rate": 1.3417731350238826e-07, + "loss": 0.001, + "step": 17000 + }, + { + "epoch": 0.33, + "learning_rate": 1.341734301580521e-07, + "loss": 0.0008, + "step": 17001 + }, + { + "epoch": 0.33, + "learning_rate": 1.3416954681371598e-07, + "loss": 0.0011, + "step": 17002 + }, + { + "epoch": 0.33, + "learning_rate": 1.3416566346937982e-07, + "loss": 0.0011, + "step": 17003 + }, + { + "epoch": 0.33, + "learning_rate": 1.341617801250437e-07, + "loss": 0.0011, + "step": 17004 + }, + { + "epoch": 0.33, + "learning_rate": 1.3415789678070754e-07, + "loss": 0.0011, + "step": 17005 + }, + { + "epoch": 0.33, + "learning_rate": 1.341540134363714e-07, + "loss": 0.0009, + "step": 17006 + }, + { + "epoch": 0.33, + "learning_rate": 1.3415013009203525e-07, + "loss": 0.0011, + "step": 17007 + }, + { + "epoch": 0.33, + "learning_rate": 1.3414624674769913e-07, + "loss": 0.0007, + "step": 17008 + }, + { + "epoch": 0.33, + "learning_rate": 1.3414236340336297e-07, + "loss": 0.0024, + "step": 17009 + }, + { + "epoch": 0.33, + "learning_rate": 1.3413848005902684e-07, + "loss": 0.0014, + "step": 17010 + }, + { + "epoch": 0.33, + "learning_rate": 1.3413459671469069e-07, + "loss": 0.001, + "step": 17011 + }, + { + "epoch": 0.33, + "learning_rate": 1.3413071337035456e-07, + "loss": 0.001, + "step": 17012 + }, + { + "epoch": 0.33, + "learning_rate": 1.341268300260184e-07, + "loss": 0.0011, + "step": 17013 + }, + { + "epoch": 0.33, + "learning_rate": 1.3412294668168227e-07, + "loss": 0.0012, + "step": 17014 + }, + { + "epoch": 0.33, + "learning_rate": 1.341190633373461e-07, + "loss": 0.2244, + "step": 17015 + }, + { + "epoch": 0.33, + "learning_rate": 1.3411517999300996e-07, + "loss": 0.6737, + "step": 17016 + }, + { + "epoch": 0.33, + "learning_rate": 1.341112966486738e-07, + "loss": 0.0076, + "step": 17017 + }, + { + "epoch": 0.33, + "learning_rate": 1.3410741330433768e-07, + "loss": 0.0011, + "step": 17018 + }, + { + "epoch": 0.33, + "learning_rate": 1.3410352996000153e-07, + "loss": 0.0939, + "step": 17019 + }, + { + "epoch": 0.33, + "learning_rate": 1.340996466156654e-07, + "loss": 0.0011, + "step": 17020 + }, + { + "epoch": 0.33, + "learning_rate": 1.3409576327132924e-07, + "loss": 0.0009, + "step": 17021 + }, + { + "epoch": 0.33, + "learning_rate": 1.3409187992699311e-07, + "loss": 0.0012, + "step": 17022 + }, + { + "epoch": 0.33, + "learning_rate": 1.3408799658265696e-07, + "loss": 0.0009, + "step": 17023 + }, + { + "epoch": 0.33, + "learning_rate": 1.3408411323832083e-07, + "loss": 0.0014, + "step": 17024 + }, + { + "epoch": 0.33, + "learning_rate": 1.3408022989398468e-07, + "loss": 0.0012, + "step": 17025 + }, + { + "epoch": 0.33, + "learning_rate": 1.3407634654964855e-07, + "loss": 0.0007, + "step": 17026 + }, + { + "epoch": 0.33, + "learning_rate": 1.340724632053124e-07, + "loss": 0.0577, + "step": 17027 + }, + { + "epoch": 0.33, + "learning_rate": 1.3406857986097626e-07, + "loss": 0.0024, + "step": 17028 + }, + { + "epoch": 0.33, + "learning_rate": 1.340646965166401e-07, + "loss": 0.0021, + "step": 17029 + }, + { + "epoch": 0.33, + "learning_rate": 1.3406081317230398e-07, + "loss": 0.001, + "step": 17030 + }, + { + "epoch": 0.33, + "learning_rate": 1.3405692982796782e-07, + "loss": 0.0011, + "step": 17031 + }, + { + "epoch": 0.33, + "learning_rate": 1.340530464836317e-07, + "loss": 0.0363, + "step": 17032 + }, + { + "epoch": 0.33, + "learning_rate": 1.3404916313929554e-07, + "loss": 0.0008, + "step": 17033 + }, + { + "epoch": 0.33, + "learning_rate": 1.340452797949594e-07, + "loss": 0.0007, + "step": 17034 + }, + { + "epoch": 0.33, + "learning_rate": 1.3404139645062326e-07, + "loss": 0.0011, + "step": 17035 + }, + { + "epoch": 0.33, + "learning_rate": 1.3403751310628713e-07, + "loss": 0.001, + "step": 17036 + }, + { + "epoch": 0.33, + "learning_rate": 1.3403362976195097e-07, + "loss": 0.0009, + "step": 17037 + }, + { + "epoch": 0.33, + "learning_rate": 1.3402974641761485e-07, + "loss": 0.001, + "step": 17038 + }, + { + "epoch": 0.33, + "learning_rate": 1.340258630732787e-07, + "loss": 0.0023, + "step": 17039 + }, + { + "epoch": 0.33, + "learning_rate": 1.3402197972894256e-07, + "loss": 0.0009, + "step": 17040 + }, + { + "epoch": 0.33, + "learning_rate": 1.340180963846064e-07, + "loss": 0.001, + "step": 17041 + }, + { + "epoch": 0.33, + "learning_rate": 1.3401421304027028e-07, + "loss": 0.0009, + "step": 17042 + }, + { + "epoch": 0.33, + "learning_rate": 1.3401032969593412e-07, + "loss": 1.2813, + "step": 17043 + }, + { + "epoch": 0.33, + "learning_rate": 1.34006446351598e-07, + "loss": 0.3018, + "step": 17044 + }, + { + "epoch": 0.33, + "learning_rate": 1.3400256300726184e-07, + "loss": 0.001, + "step": 17045 + }, + { + "epoch": 0.33, + "learning_rate": 1.339986796629257e-07, + "loss": 0.0015, + "step": 17046 + }, + { + "epoch": 0.33, + "learning_rate": 1.3399479631858956e-07, + "loss": 0.0009, + "step": 17047 + }, + { + "epoch": 0.33, + "learning_rate": 1.3399091297425343e-07, + "loss": 0.0008, + "step": 17048 + }, + { + "epoch": 0.33, + "learning_rate": 1.3398702962991727e-07, + "loss": 0.0009, + "step": 17049 + }, + { + "epoch": 0.33, + "learning_rate": 1.3398314628558114e-07, + "loss": 0.0009, + "step": 17050 + }, + { + "epoch": 0.33, + "learning_rate": 1.33979262941245e-07, + "loss": 0.0007, + "step": 17051 + }, + { + "epoch": 0.33, + "learning_rate": 1.3397537959690886e-07, + "loss": 0.0007, + "step": 17052 + }, + { + "epoch": 0.33, + "learning_rate": 1.339714962525727e-07, + "loss": 0.0009, + "step": 17053 + }, + { + "epoch": 0.33, + "learning_rate": 1.3396761290823658e-07, + "loss": 0.0008, + "step": 17054 + }, + { + "epoch": 0.33, + "learning_rate": 1.3396372956390042e-07, + "loss": 0.0009, + "step": 17055 + }, + { + "epoch": 0.33, + "learning_rate": 1.339598462195643e-07, + "loss": 0.0008, + "step": 17056 + }, + { + "epoch": 0.33, + "learning_rate": 1.3395596287522814e-07, + "loss": 0.0011, + "step": 17057 + }, + { + "epoch": 0.33, + "learning_rate": 1.33952079530892e-07, + "loss": 0.001, + "step": 17058 + }, + { + "epoch": 0.33, + "learning_rate": 1.3394819618655586e-07, + "loss": 0.001, + "step": 17059 + }, + { + "epoch": 0.33, + "learning_rate": 1.3394431284221973e-07, + "loss": 0.4735, + "step": 17060 + }, + { + "epoch": 0.33, + "learning_rate": 1.3394042949788357e-07, + "loss": 0.0018, + "step": 17061 + }, + { + "epoch": 0.33, + "learning_rate": 1.3393654615354744e-07, + "loss": 0.0007, + "step": 17062 + }, + { + "epoch": 0.33, + "learning_rate": 1.339326628092113e-07, + "loss": 0.001, + "step": 17063 + }, + { + "epoch": 0.33, + "learning_rate": 1.3392877946487516e-07, + "loss": 0.0009, + "step": 17064 + }, + { + "epoch": 0.33, + "learning_rate": 1.33924896120539e-07, + "loss": 0.0127, + "step": 17065 + }, + { + "epoch": 0.33, + "learning_rate": 1.3392101277620288e-07, + "loss": 0.0011, + "step": 17066 + }, + { + "epoch": 0.33, + "learning_rate": 1.3391712943186672e-07, + "loss": 0.001, + "step": 17067 + }, + { + "epoch": 0.33, + "learning_rate": 1.339132460875306e-07, + "loss": 0.7053, + "step": 17068 + }, + { + "epoch": 0.33, + "learning_rate": 1.3390936274319444e-07, + "loss": 0.0047, + "step": 17069 + }, + { + "epoch": 0.33, + "learning_rate": 1.339054793988583e-07, + "loss": 0.0038, + "step": 17070 + }, + { + "epoch": 0.33, + "learning_rate": 1.3390159605452215e-07, + "loss": 0.0009, + "step": 17071 + }, + { + "epoch": 0.33, + "learning_rate": 1.3389771271018603e-07, + "loss": 0.001, + "step": 17072 + }, + { + "epoch": 0.33, + "learning_rate": 1.3389382936584984e-07, + "loss": 0.0008, + "step": 17073 + }, + { + "epoch": 0.33, + "learning_rate": 1.3388994602151372e-07, + "loss": 0.4363, + "step": 17074 + }, + { + "epoch": 0.33, + "learning_rate": 1.3388606267717756e-07, + "loss": 0.1954, + "step": 17075 + }, + { + "epoch": 0.33, + "learning_rate": 1.3388217933284143e-07, + "loss": 0.001, + "step": 17076 + }, + { + "epoch": 0.33, + "learning_rate": 1.3387829598850528e-07, + "loss": 0.0008, + "step": 17077 + }, + { + "epoch": 0.33, + "learning_rate": 1.3387441264416915e-07, + "loss": 0.0017, + "step": 17078 + }, + { + "epoch": 0.33, + "learning_rate": 1.33870529299833e-07, + "loss": 0.001, + "step": 17079 + }, + { + "epoch": 0.33, + "learning_rate": 1.3386664595549687e-07, + "loss": 0.0011, + "step": 17080 + }, + { + "epoch": 0.33, + "learning_rate": 1.338627626111607e-07, + "loss": 0.001, + "step": 17081 + }, + { + "epoch": 0.33, + "learning_rate": 1.3385887926682458e-07, + "loss": 0.0007, + "step": 17082 + }, + { + "epoch": 0.33, + "learning_rate": 1.3385499592248843e-07, + "loss": 0.0009, + "step": 17083 + }, + { + "epoch": 0.33, + "learning_rate": 1.338511125781523e-07, + "loss": 0.0011, + "step": 17084 + }, + { + "epoch": 0.33, + "learning_rate": 1.3384722923381614e-07, + "loss": 0.0014, + "step": 17085 + }, + { + "epoch": 0.33, + "learning_rate": 1.3384334588948002e-07, + "loss": 0.0007, + "step": 17086 + }, + { + "epoch": 0.33, + "learning_rate": 1.3383946254514386e-07, + "loss": 0.0011, + "step": 17087 + }, + { + "epoch": 0.33, + "learning_rate": 1.3383557920080773e-07, + "loss": 0.0009, + "step": 17088 + }, + { + "epoch": 0.33, + "learning_rate": 1.3383169585647158e-07, + "loss": 0.0009, + "step": 17089 + }, + { + "epoch": 0.33, + "learning_rate": 1.3382781251213545e-07, + "loss": 0.001, + "step": 17090 + }, + { + "epoch": 0.33, + "learning_rate": 1.338239291677993e-07, + "loss": 0.0018, + "step": 17091 + }, + { + "epoch": 0.33, + "learning_rate": 1.3382004582346316e-07, + "loss": 0.001, + "step": 17092 + }, + { + "epoch": 0.33, + "learning_rate": 1.33816162479127e-07, + "loss": 0.0137, + "step": 17093 + }, + { + "epoch": 0.33, + "learning_rate": 1.3381227913479088e-07, + "loss": 0.0017, + "step": 17094 + }, + { + "epoch": 0.33, + "learning_rate": 1.3380839579045473e-07, + "loss": 0.0132, + "step": 17095 + }, + { + "epoch": 0.33, + "learning_rate": 1.338045124461186e-07, + "loss": 0.0014, + "step": 17096 + }, + { + "epoch": 0.33, + "learning_rate": 1.3380062910178244e-07, + "loss": 0.0027, + "step": 17097 + }, + { + "epoch": 0.33, + "learning_rate": 1.3379674575744631e-07, + "loss": 0.001, + "step": 17098 + }, + { + "epoch": 0.33, + "learning_rate": 1.3379286241311016e-07, + "loss": 0.0011, + "step": 17099 + }, + { + "epoch": 0.33, + "learning_rate": 1.3378897906877403e-07, + "loss": 0.0011, + "step": 17100 + }, + { + "epoch": 0.33, + "learning_rate": 1.3378509572443788e-07, + "loss": 0.0007, + "step": 17101 + }, + { + "epoch": 0.33, + "learning_rate": 1.3378121238010175e-07, + "loss": 0.0007, + "step": 17102 + }, + { + "epoch": 0.33, + "learning_rate": 1.337773290357656e-07, + "loss": 0.0026, + "step": 17103 + }, + { + "epoch": 0.33, + "learning_rate": 1.3377344569142946e-07, + "loss": 0.0008, + "step": 17104 + }, + { + "epoch": 0.33, + "learning_rate": 1.337695623470933e-07, + "loss": 0.0101, + "step": 17105 + }, + { + "epoch": 0.33, + "learning_rate": 1.3376567900275718e-07, + "loss": 0.0009, + "step": 17106 + }, + { + "epoch": 0.33, + "learning_rate": 1.3376179565842103e-07, + "loss": 0.0349, + "step": 17107 + }, + { + "epoch": 0.33, + "learning_rate": 1.337579123140849e-07, + "loss": 0.0009, + "step": 17108 + }, + { + "epoch": 0.33, + "learning_rate": 1.3375402896974874e-07, + "loss": 0.0008, + "step": 17109 + }, + { + "epoch": 0.33, + "learning_rate": 1.337501456254126e-07, + "loss": 0.6188, + "step": 17110 + }, + { + "epoch": 0.33, + "learning_rate": 1.3374626228107646e-07, + "loss": 0.0009, + "step": 17111 + }, + { + "epoch": 0.33, + "learning_rate": 1.3374237893674033e-07, + "loss": 0.0009, + "step": 17112 + }, + { + "epoch": 0.33, + "learning_rate": 1.3373849559240417e-07, + "loss": 0.0013, + "step": 17113 + }, + { + "epoch": 0.33, + "learning_rate": 1.3373461224806805e-07, + "loss": 0.0585, + "step": 17114 + }, + { + "epoch": 0.33, + "learning_rate": 1.337307289037319e-07, + "loss": 0.002, + "step": 17115 + }, + { + "epoch": 0.33, + "learning_rate": 1.3372684555939576e-07, + "loss": 1.0357, + "step": 17116 + }, + { + "epoch": 0.33, + "learning_rate": 1.337229622150596e-07, + "loss": 0.0008, + "step": 17117 + }, + { + "epoch": 0.33, + "learning_rate": 1.3371907887072348e-07, + "loss": 0.0009, + "step": 17118 + }, + { + "epoch": 0.33, + "learning_rate": 1.3371519552638732e-07, + "loss": 0.0011, + "step": 17119 + }, + { + "epoch": 0.33, + "learning_rate": 1.337113121820512e-07, + "loss": 0.0007, + "step": 17120 + }, + { + "epoch": 0.33, + "learning_rate": 1.3370742883771504e-07, + "loss": 0.001, + "step": 17121 + }, + { + "epoch": 0.33, + "learning_rate": 1.337035454933789e-07, + "loss": 0.1345, + "step": 17122 + }, + { + "epoch": 0.33, + "learning_rate": 1.3369966214904276e-07, + "loss": 0.0007, + "step": 17123 + }, + { + "epoch": 0.33, + "learning_rate": 1.3369577880470663e-07, + "loss": 0.0017, + "step": 17124 + }, + { + "epoch": 0.33, + "learning_rate": 1.3369189546037047e-07, + "loss": 0.0014, + "step": 17125 + }, + { + "epoch": 0.33, + "learning_rate": 1.3368801211603434e-07, + "loss": 0.001, + "step": 17126 + }, + { + "epoch": 0.33, + "learning_rate": 1.336841287716982e-07, + "loss": 0.0009, + "step": 17127 + }, + { + "epoch": 0.33, + "learning_rate": 1.3368024542736206e-07, + "loss": 0.0013, + "step": 17128 + }, + { + "epoch": 0.33, + "learning_rate": 1.336763620830259e-07, + "loss": 0.0013, + "step": 17129 + }, + { + "epoch": 0.33, + "learning_rate": 1.3367247873868975e-07, + "loss": 0.1446, + "step": 17130 + }, + { + "epoch": 0.33, + "learning_rate": 1.336685953943536e-07, + "loss": 0.001, + "step": 17131 + }, + { + "epoch": 0.33, + "learning_rate": 1.3366471205001747e-07, + "loss": 0.751, + "step": 17132 + }, + { + "epoch": 0.33, + "learning_rate": 1.336608287056813e-07, + "loss": 0.0011, + "step": 17133 + }, + { + "epoch": 0.33, + "learning_rate": 1.3365694536134518e-07, + "loss": 0.0009, + "step": 17134 + }, + { + "epoch": 0.33, + "learning_rate": 1.3365306201700903e-07, + "loss": 0.0008, + "step": 17135 + }, + { + "epoch": 0.33, + "learning_rate": 1.336491786726729e-07, + "loss": 0.001, + "step": 17136 + }, + { + "epoch": 0.33, + "learning_rate": 1.3364529532833675e-07, + "loss": 0.044, + "step": 17137 + }, + { + "epoch": 0.33, + "learning_rate": 1.3364141198400062e-07, + "loss": 0.6403, + "step": 17138 + }, + { + "epoch": 0.33, + "learning_rate": 1.3363752863966446e-07, + "loss": 0.0012, + "step": 17139 + }, + { + "epoch": 0.33, + "learning_rate": 1.3363364529532833e-07, + "loss": 0.001, + "step": 17140 + }, + { + "epoch": 0.33, + "learning_rate": 1.3362976195099218e-07, + "loss": 0.001, + "step": 17141 + }, + { + "epoch": 0.33, + "learning_rate": 1.3362587860665605e-07, + "loss": 0.0048, + "step": 17142 + }, + { + "epoch": 0.33, + "learning_rate": 1.336219952623199e-07, + "loss": 0.0163, + "step": 17143 + }, + { + "epoch": 0.33, + "learning_rate": 1.3361811191798377e-07, + "loss": 0.8442, + "step": 17144 + }, + { + "epoch": 0.33, + "learning_rate": 1.336142285736476e-07, + "loss": 0.001, + "step": 17145 + }, + { + "epoch": 0.33, + "learning_rate": 1.3361034522931148e-07, + "loss": 0.0009, + "step": 17146 + }, + { + "epoch": 0.33, + "learning_rate": 1.3360646188497533e-07, + "loss": 0.001, + "step": 17147 + }, + { + "epoch": 0.33, + "learning_rate": 1.336025785406392e-07, + "loss": 0.0039, + "step": 17148 + }, + { + "epoch": 0.33, + "learning_rate": 1.3359869519630304e-07, + "loss": 0.0011, + "step": 17149 + }, + { + "epoch": 0.33, + "learning_rate": 1.3359481185196692e-07, + "loss": 0.0013, + "step": 17150 + }, + { + "epoch": 0.33, + "learning_rate": 1.3359092850763076e-07, + "loss": 0.0009, + "step": 17151 + }, + { + "epoch": 0.33, + "learning_rate": 1.3358704516329463e-07, + "loss": 0.203, + "step": 17152 + }, + { + "epoch": 0.33, + "learning_rate": 1.3358316181895848e-07, + "loss": 0.0008, + "step": 17153 + }, + { + "epoch": 0.33, + "learning_rate": 1.3357927847462235e-07, + "loss": 0.0032, + "step": 17154 + }, + { + "epoch": 0.33, + "learning_rate": 1.335753951302862e-07, + "loss": 0.001, + "step": 17155 + }, + { + "epoch": 0.33, + "learning_rate": 1.3357151178595007e-07, + "loss": 0.001, + "step": 17156 + }, + { + "epoch": 0.33, + "learning_rate": 1.335676284416139e-07, + "loss": 0.001, + "step": 17157 + }, + { + "epoch": 0.33, + "learning_rate": 1.3356374509727778e-07, + "loss": 0.0008, + "step": 17158 + }, + { + "epoch": 0.33, + "learning_rate": 1.3355986175294163e-07, + "loss": 0.001, + "step": 17159 + }, + { + "epoch": 0.33, + "learning_rate": 1.3355597840860547e-07, + "loss": 0.2006, + "step": 17160 + }, + { + "epoch": 0.33, + "learning_rate": 1.3355209506426934e-07, + "loss": 0.0012, + "step": 17161 + }, + { + "epoch": 0.33, + "learning_rate": 1.335482117199332e-07, + "loss": 0.0023, + "step": 17162 + }, + { + "epoch": 0.33, + "learning_rate": 1.3354432837559706e-07, + "loss": 0.4363, + "step": 17163 + }, + { + "epoch": 0.33, + "learning_rate": 1.335404450312609e-07, + "loss": 0.0288, + "step": 17164 + }, + { + "epoch": 0.33, + "learning_rate": 1.3353656168692478e-07, + "loss": 0.0011, + "step": 17165 + }, + { + "epoch": 0.33, + "learning_rate": 1.3353267834258862e-07, + "loss": 0.001, + "step": 17166 + }, + { + "epoch": 0.33, + "learning_rate": 1.335287949982525e-07, + "loss": 0.0009, + "step": 17167 + }, + { + "epoch": 0.33, + "learning_rate": 1.3352491165391634e-07, + "loss": 0.322, + "step": 17168 + }, + { + "epoch": 0.33, + "learning_rate": 1.335210283095802e-07, + "loss": 0.0008, + "step": 17169 + }, + { + "epoch": 0.33, + "learning_rate": 1.3351714496524405e-07, + "loss": 0.3291, + "step": 17170 + }, + { + "epoch": 0.33, + "learning_rate": 1.3351326162090793e-07, + "loss": 0.0285, + "step": 17171 + }, + { + "epoch": 0.33, + "learning_rate": 1.3350937827657177e-07, + "loss": 0.3576, + "step": 17172 + }, + { + "epoch": 0.33, + "learning_rate": 1.3350549493223564e-07, + "loss": 0.0006, + "step": 17173 + }, + { + "epoch": 0.33, + "learning_rate": 1.335016115878995e-07, + "loss": 0.001, + "step": 17174 + }, + { + "epoch": 0.33, + "learning_rate": 1.3349772824356336e-07, + "loss": 0.0011, + "step": 17175 + }, + { + "epoch": 0.33, + "learning_rate": 1.334938448992272e-07, + "loss": 0.0011, + "step": 17176 + }, + { + "epoch": 0.33, + "learning_rate": 1.3348996155489108e-07, + "loss": 0.0013, + "step": 17177 + }, + { + "epoch": 0.33, + "learning_rate": 1.3348607821055492e-07, + "loss": 0.5402, + "step": 17178 + }, + { + "epoch": 0.33, + "learning_rate": 1.334821948662188e-07, + "loss": 1.2293, + "step": 17179 + }, + { + "epoch": 0.33, + "learning_rate": 1.3347831152188264e-07, + "loss": 0.0008, + "step": 17180 + }, + { + "epoch": 0.33, + "learning_rate": 1.334744281775465e-07, + "loss": 0.001, + "step": 17181 + }, + { + "epoch": 0.33, + "learning_rate": 1.3347054483321035e-07, + "loss": 0.0133, + "step": 17182 + }, + { + "epoch": 0.33, + "learning_rate": 1.3346666148887423e-07, + "loss": 0.001, + "step": 17183 + }, + { + "epoch": 0.33, + "learning_rate": 1.3346277814453807e-07, + "loss": 0.0017, + "step": 17184 + }, + { + "epoch": 0.33, + "learning_rate": 1.3345889480020194e-07, + "loss": 0.0009, + "step": 17185 + }, + { + "epoch": 0.33, + "learning_rate": 1.3345501145586579e-07, + "loss": 0.0014, + "step": 17186 + }, + { + "epoch": 0.33, + "learning_rate": 1.3345112811152966e-07, + "loss": 0.0009, + "step": 17187 + }, + { + "epoch": 0.33, + "learning_rate": 1.334472447671935e-07, + "loss": 0.0008, + "step": 17188 + }, + { + "epoch": 0.33, + "learning_rate": 1.3344336142285735e-07, + "loss": 0.6983, + "step": 17189 + }, + { + "epoch": 0.33, + "learning_rate": 1.334394780785212e-07, + "loss": 0.0009, + "step": 17190 + }, + { + "epoch": 0.33, + "learning_rate": 1.3343559473418506e-07, + "loss": 1.5269, + "step": 17191 + }, + { + "epoch": 0.33, + "learning_rate": 1.334317113898489e-07, + "loss": 0.001, + "step": 17192 + }, + { + "epoch": 0.33, + "learning_rate": 1.3342782804551278e-07, + "loss": 0.0011, + "step": 17193 + }, + { + "epoch": 0.33, + "learning_rate": 1.3342394470117663e-07, + "loss": 0.0008, + "step": 17194 + }, + { + "epoch": 0.33, + "learning_rate": 1.334200613568405e-07, + "loss": 0.0009, + "step": 17195 + }, + { + "epoch": 0.33, + "learning_rate": 1.3341617801250434e-07, + "loss": 0.0008, + "step": 17196 + }, + { + "epoch": 0.33, + "learning_rate": 1.3341229466816821e-07, + "loss": 0.0055, + "step": 17197 + }, + { + "epoch": 0.33, + "learning_rate": 1.3340841132383206e-07, + "loss": 0.0015, + "step": 17198 + }, + { + "epoch": 0.33, + "learning_rate": 1.3340452797949593e-07, + "loss": 0.0032, + "step": 17199 + }, + { + "epoch": 0.33, + "learning_rate": 1.3340064463515978e-07, + "loss": 0.0008, + "step": 17200 + }, + { + "epoch": 0.33, + "learning_rate": 1.3339676129082365e-07, + "loss": 0.001, + "step": 17201 + }, + { + "epoch": 0.33, + "learning_rate": 1.333928779464875e-07, + "loss": 0.0012, + "step": 17202 + }, + { + "epoch": 0.33, + "learning_rate": 1.3338899460215136e-07, + "loss": 0.0008, + "step": 17203 + }, + { + "epoch": 0.33, + "learning_rate": 1.333851112578152e-07, + "loss": 0.0009, + "step": 17204 + }, + { + "epoch": 0.33, + "learning_rate": 1.3338122791347908e-07, + "loss": 0.9992, + "step": 17205 + }, + { + "epoch": 0.33, + "learning_rate": 1.3337734456914293e-07, + "loss": 0.001, + "step": 17206 + }, + { + "epoch": 0.33, + "learning_rate": 1.333734612248068e-07, + "loss": 0.0008, + "step": 17207 + }, + { + "epoch": 0.33, + "learning_rate": 1.3336957788047064e-07, + "loss": 0.0013, + "step": 17208 + }, + { + "epoch": 0.33, + "learning_rate": 1.333656945361345e-07, + "loss": 0.0061, + "step": 17209 + }, + { + "epoch": 0.33, + "learning_rate": 1.3336181119179836e-07, + "loss": 0.0009, + "step": 17210 + }, + { + "epoch": 0.33, + "learning_rate": 1.3335792784746223e-07, + "loss": 0.0009, + "step": 17211 + }, + { + "epoch": 0.33, + "learning_rate": 1.3335404450312607e-07, + "loss": 0.001, + "step": 17212 + }, + { + "epoch": 0.33, + "learning_rate": 1.3335016115878995e-07, + "loss": 0.0138, + "step": 17213 + }, + { + "epoch": 0.33, + "learning_rate": 1.333462778144538e-07, + "loss": 0.003, + "step": 17214 + }, + { + "epoch": 0.33, + "learning_rate": 1.3334239447011766e-07, + "loss": 0.0454, + "step": 17215 + }, + { + "epoch": 0.33, + "learning_rate": 1.333385111257815e-07, + "loss": 0.0007, + "step": 17216 + }, + { + "epoch": 0.33, + "learning_rate": 1.3333462778144538e-07, + "loss": 0.0007, + "step": 17217 + }, + { + "epoch": 0.33, + "learning_rate": 1.3333074443710922e-07, + "loss": 0.008, + "step": 17218 + }, + { + "epoch": 0.33, + "learning_rate": 1.333268610927731e-07, + "loss": 0.0021, + "step": 17219 + }, + { + "epoch": 0.33, + "learning_rate": 1.3332297774843694e-07, + "loss": 0.0089, + "step": 17220 + }, + { + "epoch": 0.33, + "learning_rate": 1.333190944041008e-07, + "loss": 0.0035, + "step": 17221 + }, + { + "epoch": 0.33, + "learning_rate": 1.3331521105976466e-07, + "loss": 0.0008, + "step": 17222 + }, + { + "epoch": 0.33, + "learning_rate": 1.3331132771542853e-07, + "loss": 0.0009, + "step": 17223 + }, + { + "epoch": 0.33, + "learning_rate": 1.3330744437109237e-07, + "loss": 0.001, + "step": 17224 + }, + { + "epoch": 0.33, + "learning_rate": 1.3330356102675624e-07, + "loss": 0.001, + "step": 17225 + }, + { + "epoch": 0.33, + "learning_rate": 1.332996776824201e-07, + "loss": 0.0013, + "step": 17226 + }, + { + "epoch": 0.33, + "learning_rate": 1.3329579433808396e-07, + "loss": 0.001, + "step": 17227 + }, + { + "epoch": 0.33, + "learning_rate": 1.332919109937478e-07, + "loss": 0.0018, + "step": 17228 + }, + { + "epoch": 0.33, + "learning_rate": 1.3328802764941168e-07, + "loss": 0.0009, + "step": 17229 + }, + { + "epoch": 0.33, + "learning_rate": 1.3328414430507552e-07, + "loss": 0.5784, + "step": 17230 + }, + { + "epoch": 0.33, + "learning_rate": 1.332802609607394e-07, + "loss": 0.0012, + "step": 17231 + }, + { + "epoch": 0.33, + "learning_rate": 1.3327637761640324e-07, + "loss": 0.0007, + "step": 17232 + }, + { + "epoch": 0.33, + "learning_rate": 1.332724942720671e-07, + "loss": 0.0008, + "step": 17233 + }, + { + "epoch": 0.33, + "learning_rate": 1.3326861092773096e-07, + "loss": 0.0035, + "step": 17234 + }, + { + "epoch": 0.33, + "learning_rate": 1.3326472758339483e-07, + "loss": 0.0015, + "step": 17235 + }, + { + "epoch": 0.33, + "learning_rate": 1.3326084423905867e-07, + "loss": 0.0008, + "step": 17236 + }, + { + "epoch": 0.33, + "learning_rate": 1.3325696089472254e-07, + "loss": 0.001, + "step": 17237 + }, + { + "epoch": 0.33, + "learning_rate": 1.332530775503864e-07, + "loss": 0.0011, + "step": 17238 + }, + { + "epoch": 0.33, + "learning_rate": 1.3324919420605026e-07, + "loss": 0.001, + "step": 17239 + }, + { + "epoch": 0.33, + "learning_rate": 1.332453108617141e-07, + "loss": 0.0008, + "step": 17240 + }, + { + "epoch": 0.33, + "learning_rate": 1.3324142751737798e-07, + "loss": 0.0006, + "step": 17241 + }, + { + "epoch": 0.33, + "learning_rate": 1.3323754417304182e-07, + "loss": 0.001, + "step": 17242 + }, + { + "epoch": 0.33, + "learning_rate": 1.332336608287057e-07, + "loss": 0.0007, + "step": 17243 + }, + { + "epoch": 0.33, + "learning_rate": 1.3322977748436954e-07, + "loss": 0.0008, + "step": 17244 + }, + { + "epoch": 0.33, + "learning_rate": 1.332258941400334e-07, + "loss": 0.0011, + "step": 17245 + }, + { + "epoch": 0.33, + "learning_rate": 1.3322201079569725e-07, + "loss": 0.001, + "step": 17246 + }, + { + "epoch": 0.33, + "learning_rate": 1.332181274513611e-07, + "loss": 0.0012, + "step": 17247 + }, + { + "epoch": 0.33, + "learning_rate": 1.3321424410702494e-07, + "loss": 0.0167, + "step": 17248 + }, + { + "epoch": 0.33, + "learning_rate": 1.3321036076268882e-07, + "loss": 0.0007, + "step": 17249 + }, + { + "epoch": 0.33, + "learning_rate": 1.3320647741835266e-07, + "loss": 0.0011, + "step": 17250 + }, + { + "epoch": 0.33, + "learning_rate": 1.3320259407401653e-07, + "loss": 0.0018, + "step": 17251 + }, + { + "epoch": 0.33, + "learning_rate": 1.3319871072968038e-07, + "loss": 0.0009, + "step": 17252 + }, + { + "epoch": 0.33, + "learning_rate": 1.3319482738534425e-07, + "loss": 0.0009, + "step": 17253 + }, + { + "epoch": 0.33, + "learning_rate": 1.331909440410081e-07, + "loss": 0.0009, + "step": 17254 + }, + { + "epoch": 0.33, + "learning_rate": 1.3318706069667197e-07, + "loss": 0.0009, + "step": 17255 + }, + { + "epoch": 0.33, + "learning_rate": 1.331831773523358e-07, + "loss": 0.0009, + "step": 17256 + }, + { + "epoch": 0.33, + "learning_rate": 1.3317929400799968e-07, + "loss": 0.001, + "step": 17257 + }, + { + "epoch": 0.33, + "learning_rate": 1.3317541066366353e-07, + "loss": 0.0008, + "step": 17258 + }, + { + "epoch": 0.33, + "learning_rate": 1.331715273193274e-07, + "loss": 0.0008, + "step": 17259 + }, + { + "epoch": 0.33, + "learning_rate": 1.3316764397499124e-07, + "loss": 0.1128, + "step": 17260 + }, + { + "epoch": 0.33, + "learning_rate": 1.3316376063065512e-07, + "loss": 0.0017, + "step": 17261 + }, + { + "epoch": 0.33, + "learning_rate": 1.3315987728631896e-07, + "loss": 0.001, + "step": 17262 + }, + { + "epoch": 0.33, + "learning_rate": 1.3315599394198283e-07, + "loss": 0.001, + "step": 17263 + }, + { + "epoch": 0.33, + "learning_rate": 1.3315211059764668e-07, + "loss": 0.0908, + "step": 17264 + }, + { + "epoch": 0.33, + "learning_rate": 1.3314822725331055e-07, + "loss": 0.001, + "step": 17265 + }, + { + "epoch": 0.33, + "learning_rate": 1.331443439089744e-07, + "loss": 0.0008, + "step": 17266 + }, + { + "epoch": 0.33, + "learning_rate": 1.3314046056463826e-07, + "loss": 0.0007, + "step": 17267 + }, + { + "epoch": 0.33, + "learning_rate": 1.331365772203021e-07, + "loss": 0.0014, + "step": 17268 + }, + { + "epoch": 0.33, + "learning_rate": 1.3313269387596598e-07, + "loss": 0.369, + "step": 17269 + }, + { + "epoch": 0.34, + "learning_rate": 1.3312881053162983e-07, + "loss": 0.0009, + "step": 17270 + }, + { + "epoch": 0.34, + "learning_rate": 1.331249271872937e-07, + "loss": 0.0014, + "step": 17271 + }, + { + "epoch": 0.34, + "learning_rate": 1.3312104384295754e-07, + "loss": 0.0037, + "step": 17272 + }, + { + "epoch": 0.34, + "learning_rate": 1.3311716049862141e-07, + "loss": 0.0011, + "step": 17273 + }, + { + "epoch": 0.34, + "learning_rate": 1.3311327715428526e-07, + "loss": 0.001, + "step": 17274 + }, + { + "epoch": 0.34, + "learning_rate": 1.3310939380994913e-07, + "loss": 0.0009, + "step": 17275 + }, + { + "epoch": 0.34, + "learning_rate": 1.3310551046561298e-07, + "loss": 0.0024, + "step": 17276 + }, + { + "epoch": 0.34, + "learning_rate": 1.3310162712127685e-07, + "loss": 0.001, + "step": 17277 + }, + { + "epoch": 0.34, + "learning_rate": 1.330977437769407e-07, + "loss": 0.0019, + "step": 17278 + }, + { + "epoch": 0.34, + "learning_rate": 1.3309386043260456e-07, + "loss": 0.0015, + "step": 17279 + }, + { + "epoch": 0.34, + "learning_rate": 1.330899770882684e-07, + "loss": 0.4494, + "step": 17280 + }, + { + "epoch": 0.34, + "learning_rate": 1.3308609374393228e-07, + "loss": 0.0108, + "step": 17281 + }, + { + "epoch": 0.34, + "learning_rate": 1.3308221039959613e-07, + "loss": 0.001, + "step": 17282 + }, + { + "epoch": 0.34, + "learning_rate": 1.3307832705526e-07, + "loss": 0.0012, + "step": 17283 + }, + { + "epoch": 0.34, + "learning_rate": 1.3307444371092384e-07, + "loss": 0.0011, + "step": 17284 + }, + { + "epoch": 0.34, + "learning_rate": 1.330705603665877e-07, + "loss": 0.0135, + "step": 17285 + }, + { + "epoch": 0.34, + "learning_rate": 1.3306667702225156e-07, + "loss": 0.0013, + "step": 17286 + }, + { + "epoch": 0.34, + "learning_rate": 1.3306279367791543e-07, + "loss": 0.001, + "step": 17287 + }, + { + "epoch": 0.34, + "learning_rate": 1.3305891033357927e-07, + "loss": 0.0008, + "step": 17288 + }, + { + "epoch": 0.34, + "learning_rate": 1.3305502698924315e-07, + "loss": 1.0952, + "step": 17289 + }, + { + "epoch": 0.34, + "learning_rate": 1.33051143644907e-07, + "loss": 0.0008, + "step": 17290 + }, + { + "epoch": 0.34, + "learning_rate": 1.3304726030057086e-07, + "loss": 1.0818, + "step": 17291 + }, + { + "epoch": 0.34, + "learning_rate": 1.330433769562347e-07, + "loss": 0.7355, + "step": 17292 + }, + { + "epoch": 0.34, + "learning_rate": 1.3303949361189858e-07, + "loss": 0.1844, + "step": 17293 + }, + { + "epoch": 0.34, + "learning_rate": 1.3303561026756242e-07, + "loss": 0.0014, + "step": 17294 + }, + { + "epoch": 0.34, + "learning_rate": 1.330317269232263e-07, + "loss": 0.0007, + "step": 17295 + }, + { + "epoch": 0.34, + "learning_rate": 1.3302784357889014e-07, + "loss": 0.0007, + "step": 17296 + }, + { + "epoch": 0.34, + "learning_rate": 1.33023960234554e-07, + "loss": 0.0008, + "step": 17297 + }, + { + "epoch": 0.34, + "learning_rate": 1.3302007689021786e-07, + "loss": 0.0011, + "step": 17298 + }, + { + "epoch": 0.34, + "learning_rate": 1.3301619354588173e-07, + "loss": 0.0112, + "step": 17299 + }, + { + "epoch": 0.34, + "learning_rate": 1.3301231020154557e-07, + "loss": 0.0008, + "step": 17300 + }, + { + "epoch": 0.34, + "learning_rate": 1.3300842685720945e-07, + "loss": 0.7699, + "step": 17301 + }, + { + "epoch": 0.34, + "learning_rate": 1.330045435128733e-07, + "loss": 0.0011, + "step": 17302 + }, + { + "epoch": 0.34, + "learning_rate": 1.3300066016853716e-07, + "loss": 0.0008, + "step": 17303 + }, + { + "epoch": 0.34, + "learning_rate": 1.32996776824201e-07, + "loss": 0.001, + "step": 17304 + }, + { + "epoch": 0.34, + "learning_rate": 1.3299289347986485e-07, + "loss": 0.0015, + "step": 17305 + }, + { + "epoch": 0.34, + "learning_rate": 1.329890101355287e-07, + "loss": 0.0016, + "step": 17306 + }, + { + "epoch": 0.34, + "learning_rate": 1.3298512679119257e-07, + "loss": 0.0008, + "step": 17307 + }, + { + "epoch": 0.34, + "learning_rate": 1.329812434468564e-07, + "loss": 0.0008, + "step": 17308 + }, + { + "epoch": 0.34, + "learning_rate": 1.3297736010252028e-07, + "loss": 0.0009, + "step": 17309 + }, + { + "epoch": 0.34, + "learning_rate": 1.3297347675818413e-07, + "loss": 0.0042, + "step": 17310 + }, + { + "epoch": 0.34, + "learning_rate": 1.32969593413848e-07, + "loss": 0.9873, + "step": 17311 + }, + { + "epoch": 0.34, + "learning_rate": 1.3296571006951185e-07, + "loss": 0.0008, + "step": 17312 + }, + { + "epoch": 0.34, + "learning_rate": 1.3296182672517572e-07, + "loss": 0.3179, + "step": 17313 + }, + { + "epoch": 0.34, + "learning_rate": 1.3295794338083956e-07, + "loss": 0.001, + "step": 17314 + }, + { + "epoch": 0.34, + "learning_rate": 1.3295406003650343e-07, + "loss": 0.0007, + "step": 17315 + }, + { + "epoch": 0.34, + "learning_rate": 1.3295017669216728e-07, + "loss": 0.0011, + "step": 17316 + }, + { + "epoch": 0.34, + "learning_rate": 1.3294629334783115e-07, + "loss": 0.6535, + "step": 17317 + }, + { + "epoch": 0.34, + "learning_rate": 1.32942410003495e-07, + "loss": 0.0009, + "step": 17318 + }, + { + "epoch": 0.34, + "learning_rate": 1.3293852665915887e-07, + "loss": 0.0532, + "step": 17319 + }, + { + "epoch": 0.34, + "learning_rate": 1.329346433148227e-07, + "loss": 0.0011, + "step": 17320 + }, + { + "epoch": 0.34, + "learning_rate": 1.3293075997048658e-07, + "loss": 0.0014, + "step": 17321 + }, + { + "epoch": 0.34, + "learning_rate": 1.3292687662615043e-07, + "loss": 0.001, + "step": 17322 + }, + { + "epoch": 0.34, + "learning_rate": 1.329229932818143e-07, + "loss": 0.318, + "step": 17323 + }, + { + "epoch": 0.34, + "learning_rate": 1.3291910993747814e-07, + "loss": 0.0027, + "step": 17324 + }, + { + "epoch": 0.34, + "learning_rate": 1.3291522659314202e-07, + "loss": 0.0029, + "step": 17325 + }, + { + "epoch": 0.34, + "learning_rate": 1.3291134324880586e-07, + "loss": 0.0011, + "step": 17326 + }, + { + "epoch": 0.34, + "learning_rate": 1.3290745990446973e-07, + "loss": 1.0886, + "step": 17327 + }, + { + "epoch": 0.34, + "learning_rate": 1.3290357656013358e-07, + "loss": 0.0424, + "step": 17328 + }, + { + "epoch": 0.34, + "learning_rate": 1.3289969321579745e-07, + "loss": 0.1813, + "step": 17329 + }, + { + "epoch": 0.34, + "learning_rate": 1.328958098714613e-07, + "loss": 0.0013, + "step": 17330 + }, + { + "epoch": 0.34, + "learning_rate": 1.3289192652712517e-07, + "loss": 0.001, + "step": 17331 + }, + { + "epoch": 0.34, + "learning_rate": 1.32888043182789e-07, + "loss": 0.0009, + "step": 17332 + }, + { + "epoch": 0.34, + "learning_rate": 1.3288415983845288e-07, + "loss": 0.0014, + "step": 17333 + }, + { + "epoch": 0.34, + "learning_rate": 1.3288027649411673e-07, + "loss": 0.001, + "step": 17334 + }, + { + "epoch": 0.34, + "learning_rate": 1.328763931497806e-07, + "loss": 0.0012, + "step": 17335 + }, + { + "epoch": 0.34, + "learning_rate": 1.3287250980544444e-07, + "loss": 0.9917, + "step": 17336 + }, + { + "epoch": 0.34, + "learning_rate": 1.328686264611083e-07, + "loss": 0.0012, + "step": 17337 + }, + { + "epoch": 0.34, + "learning_rate": 1.3286474311677216e-07, + "loss": 0.0008, + "step": 17338 + }, + { + "epoch": 0.34, + "learning_rate": 1.32860859772436e-07, + "loss": 0.0019, + "step": 17339 + }, + { + "epoch": 0.34, + "learning_rate": 1.3285697642809988e-07, + "loss": 0.0014, + "step": 17340 + }, + { + "epoch": 0.34, + "learning_rate": 1.3285309308376372e-07, + "loss": 0.0009, + "step": 17341 + }, + { + "epoch": 0.34, + "learning_rate": 1.328492097394276e-07, + "loss": 0.441, + "step": 17342 + }, + { + "epoch": 0.34, + "learning_rate": 1.3284532639509144e-07, + "loss": 0.0012, + "step": 17343 + }, + { + "epoch": 0.34, + "learning_rate": 1.328414430507553e-07, + "loss": 0.0011, + "step": 17344 + }, + { + "epoch": 0.34, + "learning_rate": 1.3283755970641915e-07, + "loss": 0.0025, + "step": 17345 + }, + { + "epoch": 0.34, + "learning_rate": 1.3283367636208303e-07, + "loss": 0.001, + "step": 17346 + }, + { + "epoch": 0.34, + "learning_rate": 1.3282979301774687e-07, + "loss": 0.001, + "step": 17347 + }, + { + "epoch": 0.34, + "learning_rate": 1.3282590967341074e-07, + "loss": 0.0735, + "step": 17348 + }, + { + "epoch": 0.34, + "learning_rate": 1.328220263290746e-07, + "loss": 0.001, + "step": 17349 + }, + { + "epoch": 0.34, + "learning_rate": 1.3281814298473846e-07, + "loss": 0.0012, + "step": 17350 + }, + { + "epoch": 0.34, + "learning_rate": 1.328142596404023e-07, + "loss": 0.0009, + "step": 17351 + }, + { + "epoch": 0.34, + "learning_rate": 1.3281037629606618e-07, + "loss": 0.0007, + "step": 17352 + }, + { + "epoch": 0.34, + "learning_rate": 1.3280649295173002e-07, + "loss": 0.0008, + "step": 17353 + }, + { + "epoch": 0.34, + "learning_rate": 1.328026096073939e-07, + "loss": 0.0646, + "step": 17354 + }, + { + "epoch": 0.34, + "learning_rate": 1.3279872626305774e-07, + "loss": 0.0016, + "step": 17355 + }, + { + "epoch": 0.34, + "learning_rate": 1.327948429187216e-07, + "loss": 0.001, + "step": 17356 + }, + { + "epoch": 0.34, + "learning_rate": 1.3279095957438545e-07, + "loss": 0.0009, + "step": 17357 + }, + { + "epoch": 0.34, + "learning_rate": 1.3278707623004933e-07, + "loss": 0.0009, + "step": 17358 + }, + { + "epoch": 0.34, + "learning_rate": 1.3278319288571317e-07, + "loss": 0.487, + "step": 17359 + }, + { + "epoch": 0.34, + "learning_rate": 1.3277930954137704e-07, + "loss": 0.9291, + "step": 17360 + }, + { + "epoch": 0.34, + "learning_rate": 1.3277542619704089e-07, + "loss": 0.0008, + "step": 17361 + }, + { + "epoch": 0.34, + "learning_rate": 1.3277154285270476e-07, + "loss": 0.0022, + "step": 17362 + }, + { + "epoch": 0.34, + "learning_rate": 1.327676595083686e-07, + "loss": 0.0013, + "step": 17363 + }, + { + "epoch": 0.34, + "learning_rate": 1.3276377616403245e-07, + "loss": 0.0463, + "step": 17364 + }, + { + "epoch": 0.34, + "learning_rate": 1.327598928196963e-07, + "loss": 0.0058, + "step": 17365 + }, + { + "epoch": 0.34, + "learning_rate": 1.3275600947536016e-07, + "loss": 0.0008, + "step": 17366 + }, + { + "epoch": 0.34, + "learning_rate": 1.32752126131024e-07, + "loss": 0.0672, + "step": 17367 + }, + { + "epoch": 0.34, + "learning_rate": 1.3274824278668788e-07, + "loss": 0.001, + "step": 17368 + }, + { + "epoch": 0.34, + "learning_rate": 1.3274435944235173e-07, + "loss": 0.0017, + "step": 17369 + }, + { + "epoch": 0.34, + "learning_rate": 1.327404760980156e-07, + "loss": 0.0012, + "step": 17370 + }, + { + "epoch": 0.34, + "learning_rate": 1.3273659275367944e-07, + "loss": 0.3818, + "step": 17371 + }, + { + "epoch": 0.34, + "learning_rate": 1.3273270940934331e-07, + "loss": 0.0048, + "step": 17372 + }, + { + "epoch": 0.34, + "learning_rate": 1.3272882606500716e-07, + "loss": 0.0009, + "step": 17373 + }, + { + "epoch": 0.34, + "learning_rate": 1.3272494272067103e-07, + "loss": 0.0044, + "step": 17374 + }, + { + "epoch": 0.34, + "learning_rate": 1.3272105937633488e-07, + "loss": 0.0009, + "step": 17375 + }, + { + "epoch": 0.34, + "learning_rate": 1.3271717603199875e-07, + "loss": 0.0013, + "step": 17376 + }, + { + "epoch": 0.34, + "learning_rate": 1.327132926876626e-07, + "loss": 0.0007, + "step": 17377 + }, + { + "epoch": 0.34, + "learning_rate": 1.3270940934332646e-07, + "loss": 0.0011, + "step": 17378 + }, + { + "epoch": 0.34, + "learning_rate": 1.327055259989903e-07, + "loss": 0.001, + "step": 17379 + }, + { + "epoch": 0.34, + "learning_rate": 1.3270164265465418e-07, + "loss": 0.0009, + "step": 17380 + }, + { + "epoch": 0.34, + "learning_rate": 1.3269775931031803e-07, + "loss": 0.0018, + "step": 17381 + }, + { + "epoch": 0.34, + "learning_rate": 1.326938759659819e-07, + "loss": 0.7865, + "step": 17382 + }, + { + "epoch": 0.34, + "learning_rate": 1.3268999262164574e-07, + "loss": 0.0011, + "step": 17383 + }, + { + "epoch": 0.34, + "learning_rate": 1.326861092773096e-07, + "loss": 0.0072, + "step": 17384 + }, + { + "epoch": 0.34, + "learning_rate": 1.3268222593297346e-07, + "loss": 0.4165, + "step": 17385 + }, + { + "epoch": 0.34, + "learning_rate": 1.3267834258863733e-07, + "loss": 0.0012, + "step": 17386 + }, + { + "epoch": 0.34, + "learning_rate": 1.3267445924430117e-07, + "loss": 0.002, + "step": 17387 + }, + { + "epoch": 0.34, + "learning_rate": 1.3267057589996505e-07, + "loss": 0.5286, + "step": 17388 + }, + { + "epoch": 0.34, + "learning_rate": 1.326666925556289e-07, + "loss": 0.0388, + "step": 17389 + }, + { + "epoch": 0.34, + "learning_rate": 1.3266280921129276e-07, + "loss": 0.0014, + "step": 17390 + }, + { + "epoch": 0.34, + "learning_rate": 1.326589258669566e-07, + "loss": 0.0008, + "step": 17391 + }, + { + "epoch": 0.34, + "learning_rate": 1.3265504252262048e-07, + "loss": 0.001, + "step": 17392 + }, + { + "epoch": 0.34, + "learning_rate": 1.3265115917828432e-07, + "loss": 0.0014, + "step": 17393 + }, + { + "epoch": 0.34, + "learning_rate": 1.326472758339482e-07, + "loss": 0.001, + "step": 17394 + }, + { + "epoch": 0.34, + "learning_rate": 1.3264339248961204e-07, + "loss": 0.002, + "step": 17395 + }, + { + "epoch": 0.34, + "learning_rate": 1.326395091452759e-07, + "loss": 0.052, + "step": 17396 + }, + { + "epoch": 0.34, + "learning_rate": 1.3263562580093976e-07, + "loss": 0.0008, + "step": 17397 + }, + { + "epoch": 0.34, + "learning_rate": 1.3263174245660363e-07, + "loss": 1.0093, + "step": 17398 + }, + { + "epoch": 0.34, + "learning_rate": 1.3262785911226747e-07, + "loss": 0.0007, + "step": 17399 + }, + { + "epoch": 0.34, + "learning_rate": 1.3262397576793135e-07, + "loss": 0.001, + "step": 17400 + }, + { + "epoch": 0.34, + "learning_rate": 1.326200924235952e-07, + "loss": 0.0009, + "step": 17401 + }, + { + "epoch": 0.34, + "learning_rate": 1.3261620907925906e-07, + "loss": 0.001, + "step": 17402 + }, + { + "epoch": 0.34, + "learning_rate": 1.326123257349229e-07, + "loss": 0.0015, + "step": 17403 + }, + { + "epoch": 0.34, + "learning_rate": 1.3260844239058678e-07, + "loss": 0.0044, + "step": 17404 + }, + { + "epoch": 0.34, + "learning_rate": 1.3260455904625062e-07, + "loss": 0.031, + "step": 17405 + }, + { + "epoch": 0.34, + "learning_rate": 1.326006757019145e-07, + "loss": 0.006, + "step": 17406 + }, + { + "epoch": 0.34, + "learning_rate": 1.3259679235757834e-07, + "loss": 0.001, + "step": 17407 + }, + { + "epoch": 0.34, + "learning_rate": 1.325929090132422e-07, + "loss": 0.2245, + "step": 17408 + }, + { + "epoch": 0.34, + "learning_rate": 1.3258902566890606e-07, + "loss": 0.2584, + "step": 17409 + }, + { + "epoch": 0.34, + "learning_rate": 1.3258514232456993e-07, + "loss": 0.7439, + "step": 17410 + }, + { + "epoch": 0.34, + "learning_rate": 1.3258125898023377e-07, + "loss": 0.0008, + "step": 17411 + }, + { + "epoch": 0.34, + "learning_rate": 1.3257737563589764e-07, + "loss": 0.0009, + "step": 17412 + }, + { + "epoch": 0.34, + "learning_rate": 1.325734922915615e-07, + "loss": 0.0013, + "step": 17413 + }, + { + "epoch": 0.34, + "learning_rate": 1.3256960894722536e-07, + "loss": 0.0045, + "step": 17414 + }, + { + "epoch": 0.34, + "learning_rate": 1.325657256028892e-07, + "loss": 0.0009, + "step": 17415 + }, + { + "epoch": 0.34, + "learning_rate": 1.3256184225855308e-07, + "loss": 0.001, + "step": 17416 + }, + { + "epoch": 0.34, + "learning_rate": 1.3255795891421692e-07, + "loss": 0.3571, + "step": 17417 + }, + { + "epoch": 0.34, + "learning_rate": 1.325540755698808e-07, + "loss": 0.0022, + "step": 17418 + }, + { + "epoch": 0.34, + "learning_rate": 1.3255019222554464e-07, + "loss": 0.7122, + "step": 17419 + }, + { + "epoch": 0.34, + "learning_rate": 1.325463088812085e-07, + "loss": 0.0009, + "step": 17420 + }, + { + "epoch": 0.34, + "learning_rate": 1.3254242553687233e-07, + "loss": 0.0009, + "step": 17421 + }, + { + "epoch": 0.34, + "learning_rate": 1.325385421925362e-07, + "loss": 0.0011, + "step": 17422 + }, + { + "epoch": 0.34, + "learning_rate": 1.3253465884820004e-07, + "loss": 0.6449, + "step": 17423 + }, + { + "epoch": 0.34, + "learning_rate": 1.3253077550386392e-07, + "loss": 0.0008, + "step": 17424 + }, + { + "epoch": 0.34, + "learning_rate": 1.3252689215952776e-07, + "loss": 0.0009, + "step": 17425 + }, + { + "epoch": 0.34, + "learning_rate": 1.3252300881519163e-07, + "loss": 1.2574, + "step": 17426 + }, + { + "epoch": 0.34, + "learning_rate": 1.3251912547085548e-07, + "loss": 0.0009, + "step": 17427 + }, + { + "epoch": 0.34, + "learning_rate": 1.3251524212651935e-07, + "loss": 0.0015, + "step": 17428 + }, + { + "epoch": 0.34, + "learning_rate": 1.325113587821832e-07, + "loss": 0.001, + "step": 17429 + }, + { + "epoch": 0.34, + "learning_rate": 1.3250747543784707e-07, + "loss": 0.0009, + "step": 17430 + }, + { + "epoch": 0.34, + "learning_rate": 1.325035920935109e-07, + "loss": 0.0012, + "step": 17431 + }, + { + "epoch": 0.34, + "learning_rate": 1.3249970874917478e-07, + "loss": 0.0009, + "step": 17432 + }, + { + "epoch": 0.34, + "learning_rate": 1.3249582540483863e-07, + "loss": 0.0017, + "step": 17433 + }, + { + "epoch": 0.34, + "learning_rate": 1.324919420605025e-07, + "loss": 0.0011, + "step": 17434 + }, + { + "epoch": 0.34, + "learning_rate": 1.3248805871616634e-07, + "loss": 0.0008, + "step": 17435 + }, + { + "epoch": 0.34, + "learning_rate": 1.3248417537183022e-07, + "loss": 0.0622, + "step": 17436 + }, + { + "epoch": 0.34, + "learning_rate": 1.3248029202749406e-07, + "loss": 0.1122, + "step": 17437 + }, + { + "epoch": 0.34, + "learning_rate": 1.3247640868315793e-07, + "loss": 0.0019, + "step": 17438 + }, + { + "epoch": 0.34, + "learning_rate": 1.3247252533882178e-07, + "loss": 0.002, + "step": 17439 + }, + { + "epoch": 0.34, + "learning_rate": 1.3246864199448565e-07, + "loss": 0.0008, + "step": 17440 + }, + { + "epoch": 0.34, + "learning_rate": 1.324647586501495e-07, + "loss": 0.0014, + "step": 17441 + }, + { + "epoch": 0.34, + "learning_rate": 1.3246087530581336e-07, + "loss": 0.5316, + "step": 17442 + }, + { + "epoch": 0.34, + "learning_rate": 1.324569919614772e-07, + "loss": 0.0007, + "step": 17443 + }, + { + "epoch": 0.34, + "learning_rate": 1.3245310861714108e-07, + "loss": 0.0009, + "step": 17444 + }, + { + "epoch": 0.34, + "learning_rate": 1.3244922527280493e-07, + "loss": 0.0039, + "step": 17445 + }, + { + "epoch": 0.34, + "learning_rate": 1.324453419284688e-07, + "loss": 0.0012, + "step": 17446 + }, + { + "epoch": 0.34, + "learning_rate": 1.3244145858413264e-07, + "loss": 0.0009, + "step": 17447 + }, + { + "epoch": 0.34, + "learning_rate": 1.3243757523979651e-07, + "loss": 0.0916, + "step": 17448 + }, + { + "epoch": 0.34, + "learning_rate": 1.3243369189546036e-07, + "loss": 0.0014, + "step": 17449 + }, + { + "epoch": 0.34, + "learning_rate": 1.3242980855112423e-07, + "loss": 0.0012, + "step": 17450 + }, + { + "epoch": 0.34, + "learning_rate": 1.3242592520678808e-07, + "loss": 0.0014, + "step": 17451 + }, + { + "epoch": 0.34, + "learning_rate": 1.3242204186245195e-07, + "loss": 0.046, + "step": 17452 + }, + { + "epoch": 0.34, + "learning_rate": 1.324181585181158e-07, + "loss": 0.4643, + "step": 17453 + }, + { + "epoch": 0.34, + "learning_rate": 1.3241427517377966e-07, + "loss": 0.0566, + "step": 17454 + }, + { + "epoch": 0.34, + "learning_rate": 1.324103918294435e-07, + "loss": 0.0026, + "step": 17455 + }, + { + "epoch": 0.34, + "learning_rate": 1.3240650848510738e-07, + "loss": 0.001, + "step": 17456 + }, + { + "epoch": 0.34, + "learning_rate": 1.3240262514077123e-07, + "loss": 0.002, + "step": 17457 + }, + { + "epoch": 0.34, + "learning_rate": 1.323987417964351e-07, + "loss": 0.0012, + "step": 17458 + }, + { + "epoch": 0.34, + "learning_rate": 1.3239485845209894e-07, + "loss": 0.0454, + "step": 17459 + }, + { + "epoch": 0.34, + "learning_rate": 1.323909751077628e-07, + "loss": 0.001, + "step": 17460 + }, + { + "epoch": 0.34, + "learning_rate": 1.3238709176342666e-07, + "loss": 0.0015, + "step": 17461 + }, + { + "epoch": 0.34, + "learning_rate": 1.3238320841909053e-07, + "loss": 0.0009, + "step": 17462 + }, + { + "epoch": 0.34, + "learning_rate": 1.3237932507475437e-07, + "loss": 0.0799, + "step": 17463 + }, + { + "epoch": 0.34, + "learning_rate": 1.3237544173041825e-07, + "loss": 0.0008, + "step": 17464 + }, + { + "epoch": 0.34, + "learning_rate": 1.323715583860821e-07, + "loss": 0.0008, + "step": 17465 + }, + { + "epoch": 0.34, + "learning_rate": 1.3236767504174596e-07, + "loss": 0.001, + "step": 17466 + }, + { + "epoch": 0.34, + "learning_rate": 1.323637916974098e-07, + "loss": 0.0188, + "step": 17467 + }, + { + "epoch": 0.34, + "learning_rate": 1.3235990835307368e-07, + "loss": 0.0009, + "step": 17468 + }, + { + "epoch": 0.34, + "learning_rate": 1.3235602500873752e-07, + "loss": 0.001, + "step": 17469 + }, + { + "epoch": 0.34, + "learning_rate": 1.323521416644014e-07, + "loss": 0.0127, + "step": 17470 + }, + { + "epoch": 0.34, + "learning_rate": 1.3234825832006524e-07, + "loss": 0.2225, + "step": 17471 + }, + { + "epoch": 0.34, + "learning_rate": 1.323443749757291e-07, + "loss": 0.0007, + "step": 17472 + }, + { + "epoch": 0.34, + "learning_rate": 1.3234049163139296e-07, + "loss": 0.001, + "step": 17473 + }, + { + "epoch": 0.34, + "learning_rate": 1.3233660828705683e-07, + "loss": 0.0141, + "step": 17474 + }, + { + "epoch": 0.34, + "learning_rate": 1.3233272494272067e-07, + "loss": 0.0009, + "step": 17475 + }, + { + "epoch": 0.34, + "learning_rate": 1.3232884159838455e-07, + "loss": 0.3351, + "step": 17476 + }, + { + "epoch": 0.34, + "learning_rate": 1.323249582540484e-07, + "loss": 0.0008, + "step": 17477 + }, + { + "epoch": 0.34, + "learning_rate": 1.3232107490971226e-07, + "loss": 0.0017, + "step": 17478 + }, + { + "epoch": 0.34, + "learning_rate": 1.3231719156537608e-07, + "loss": 0.0008, + "step": 17479 + }, + { + "epoch": 0.34, + "learning_rate": 1.3231330822103995e-07, + "loss": 0.001, + "step": 17480 + }, + { + "epoch": 0.34, + "learning_rate": 1.323094248767038e-07, + "loss": 0.001, + "step": 17481 + }, + { + "epoch": 0.34, + "learning_rate": 1.3230554153236767e-07, + "loss": 0.0021, + "step": 17482 + }, + { + "epoch": 0.34, + "learning_rate": 1.323016581880315e-07, + "loss": 0.0013, + "step": 17483 + }, + { + "epoch": 0.34, + "learning_rate": 1.3229777484369538e-07, + "loss": 0.001, + "step": 17484 + }, + { + "epoch": 0.34, + "learning_rate": 1.3229389149935923e-07, + "loss": 0.0006, + "step": 17485 + }, + { + "epoch": 0.34, + "learning_rate": 1.322900081550231e-07, + "loss": 0.001, + "step": 17486 + }, + { + "epoch": 0.34, + "learning_rate": 1.3228612481068695e-07, + "loss": 0.0017, + "step": 17487 + }, + { + "epoch": 0.34, + "learning_rate": 1.3228224146635082e-07, + "loss": 0.0107, + "step": 17488 + }, + { + "epoch": 0.34, + "learning_rate": 1.3227835812201466e-07, + "loss": 0.0012, + "step": 17489 + }, + { + "epoch": 0.34, + "learning_rate": 1.3227447477767853e-07, + "loss": 0.001, + "step": 17490 + }, + { + "epoch": 0.34, + "learning_rate": 1.3227059143334238e-07, + "loss": 0.0043, + "step": 17491 + }, + { + "epoch": 0.34, + "learning_rate": 1.3226670808900625e-07, + "loss": 0.0009, + "step": 17492 + }, + { + "epoch": 0.34, + "learning_rate": 1.322628247446701e-07, + "loss": 0.0095, + "step": 17493 + }, + { + "epoch": 0.34, + "learning_rate": 1.3225894140033397e-07, + "loss": 0.001, + "step": 17494 + }, + { + "epoch": 0.34, + "learning_rate": 1.322550580559978e-07, + "loss": 0.0017, + "step": 17495 + }, + { + "epoch": 0.34, + "learning_rate": 1.3225117471166168e-07, + "loss": 0.0017, + "step": 17496 + }, + { + "epoch": 0.34, + "learning_rate": 1.3224729136732553e-07, + "loss": 0.0025, + "step": 17497 + }, + { + "epoch": 0.34, + "learning_rate": 1.322434080229894e-07, + "loss": 0.0009, + "step": 17498 + }, + { + "epoch": 0.34, + "learning_rate": 1.3223952467865325e-07, + "loss": 0.0015, + "step": 17499 + }, + { + "epoch": 0.34, + "learning_rate": 1.3223564133431712e-07, + "loss": 0.004, + "step": 17500 + }, + { + "epoch": 0.34, + "learning_rate": 1.3223175798998096e-07, + "loss": 0.0011, + "step": 17501 + }, + { + "epoch": 0.34, + "learning_rate": 1.3222787464564483e-07, + "loss": 0.0008, + "step": 17502 + }, + { + "epoch": 0.34, + "learning_rate": 1.3222399130130868e-07, + "loss": 0.004, + "step": 17503 + }, + { + "epoch": 0.34, + "learning_rate": 1.3222010795697255e-07, + "loss": 0.0914, + "step": 17504 + }, + { + "epoch": 0.34, + "learning_rate": 1.322162246126364e-07, + "loss": 0.001, + "step": 17505 + }, + { + "epoch": 0.34, + "learning_rate": 1.3221234126830027e-07, + "loss": 0.0011, + "step": 17506 + }, + { + "epoch": 0.34, + "learning_rate": 1.322084579239641e-07, + "loss": 0.2398, + "step": 17507 + }, + { + "epoch": 0.34, + "learning_rate": 1.3220457457962798e-07, + "loss": 0.0007, + "step": 17508 + }, + { + "epoch": 0.34, + "learning_rate": 1.3220069123529183e-07, + "loss": 0.0044, + "step": 17509 + }, + { + "epoch": 0.34, + "learning_rate": 1.321968078909557e-07, + "loss": 0.0012, + "step": 17510 + }, + { + "epoch": 0.34, + "learning_rate": 1.3219292454661954e-07, + "loss": 0.002, + "step": 17511 + }, + { + "epoch": 0.34, + "learning_rate": 1.3218904120228342e-07, + "loss": 0.0015, + "step": 17512 + }, + { + "epoch": 0.34, + "learning_rate": 1.3218515785794726e-07, + "loss": 0.0019, + "step": 17513 + }, + { + "epoch": 0.34, + "learning_rate": 1.321812745136111e-07, + "loss": 0.0015, + "step": 17514 + }, + { + "epoch": 0.34, + "learning_rate": 1.3217739116927498e-07, + "loss": 0.0012, + "step": 17515 + }, + { + "epoch": 0.34, + "learning_rate": 1.3217350782493882e-07, + "loss": 0.6715, + "step": 17516 + }, + { + "epoch": 0.34, + "learning_rate": 1.321696244806027e-07, + "loss": 0.0013, + "step": 17517 + }, + { + "epoch": 0.34, + "learning_rate": 1.3216574113626654e-07, + "loss": 0.0007, + "step": 17518 + }, + { + "epoch": 0.34, + "learning_rate": 1.321618577919304e-07, + "loss": 0.5215, + "step": 17519 + }, + { + "epoch": 0.34, + "learning_rate": 1.3215797444759425e-07, + "loss": 0.1963, + "step": 17520 + }, + { + "epoch": 0.34, + "learning_rate": 1.3215409110325813e-07, + "loss": 0.0012, + "step": 17521 + }, + { + "epoch": 0.34, + "learning_rate": 1.3215020775892197e-07, + "loss": 0.0588, + "step": 17522 + }, + { + "epoch": 0.34, + "learning_rate": 1.3214632441458584e-07, + "loss": 0.0013, + "step": 17523 + }, + { + "epoch": 0.34, + "learning_rate": 1.321424410702497e-07, + "loss": 0.0101, + "step": 17524 + }, + { + "epoch": 0.34, + "learning_rate": 1.3213855772591356e-07, + "loss": 0.0011, + "step": 17525 + }, + { + "epoch": 0.34, + "learning_rate": 1.321346743815774e-07, + "loss": 0.0009, + "step": 17526 + }, + { + "epoch": 0.34, + "learning_rate": 1.3213079103724128e-07, + "loss": 0.1033, + "step": 17527 + }, + { + "epoch": 0.34, + "learning_rate": 1.3212690769290512e-07, + "loss": 0.001, + "step": 17528 + }, + { + "epoch": 0.34, + "learning_rate": 1.32123024348569e-07, + "loss": 0.0009, + "step": 17529 + }, + { + "epoch": 0.34, + "learning_rate": 1.3211914100423284e-07, + "loss": 0.001, + "step": 17530 + }, + { + "epoch": 0.34, + "learning_rate": 1.321152576598967e-07, + "loss": 0.0029, + "step": 17531 + }, + { + "epoch": 0.34, + "learning_rate": 1.3211137431556055e-07, + "loss": 0.5285, + "step": 17532 + }, + { + "epoch": 0.34, + "learning_rate": 1.3210749097122443e-07, + "loss": 0.001, + "step": 17533 + }, + { + "epoch": 0.34, + "learning_rate": 1.3210360762688827e-07, + "loss": 0.0931, + "step": 17534 + }, + { + "epoch": 0.34, + "learning_rate": 1.3209972428255214e-07, + "loss": 0.0009, + "step": 17535 + }, + { + "epoch": 0.34, + "learning_rate": 1.32095840938216e-07, + "loss": 0.0009, + "step": 17536 + }, + { + "epoch": 0.34, + "learning_rate": 1.3209195759387983e-07, + "loss": 0.0984, + "step": 17537 + }, + { + "epoch": 0.34, + "learning_rate": 1.320880742495437e-07, + "loss": 0.0007, + "step": 17538 + }, + { + "epoch": 0.34, + "learning_rate": 1.3208419090520755e-07, + "loss": 0.0023, + "step": 17539 + }, + { + "epoch": 0.34, + "learning_rate": 1.3208030756087142e-07, + "loss": 1.0894, + "step": 17540 + }, + { + "epoch": 0.34, + "learning_rate": 1.3207642421653526e-07, + "loss": 0.0012, + "step": 17541 + }, + { + "epoch": 0.34, + "learning_rate": 1.320725408721991e-07, + "loss": 0.0007, + "step": 17542 + }, + { + "epoch": 0.34, + "learning_rate": 1.3206865752786298e-07, + "loss": 0.001, + "step": 17543 + }, + { + "epoch": 0.34, + "learning_rate": 1.3206477418352683e-07, + "loss": 2.0798, + "step": 17544 + }, + { + "epoch": 0.34, + "learning_rate": 1.320608908391907e-07, + "loss": 0.02, + "step": 17545 + }, + { + "epoch": 0.34, + "learning_rate": 1.3205700749485454e-07, + "loss": 0.0009, + "step": 17546 + }, + { + "epoch": 0.34, + "learning_rate": 1.3205312415051841e-07, + "loss": 0.001, + "step": 17547 + }, + { + "epoch": 0.34, + "learning_rate": 1.3204924080618226e-07, + "loss": 0.0009, + "step": 17548 + }, + { + "epoch": 0.34, + "learning_rate": 1.3204535746184613e-07, + "loss": 0.0009, + "step": 17549 + }, + { + "epoch": 0.34, + "learning_rate": 1.3204147411750998e-07, + "loss": 0.001, + "step": 17550 + }, + { + "epoch": 0.34, + "learning_rate": 1.3203759077317385e-07, + "loss": 0.0009, + "step": 17551 + }, + { + "epoch": 0.34, + "learning_rate": 1.320337074288377e-07, + "loss": 0.0008, + "step": 17552 + }, + { + "epoch": 0.34, + "learning_rate": 1.3202982408450156e-07, + "loss": 0.0008, + "step": 17553 + }, + { + "epoch": 0.34, + "learning_rate": 1.320259407401654e-07, + "loss": 0.001, + "step": 17554 + }, + { + "epoch": 0.34, + "learning_rate": 1.3202205739582928e-07, + "loss": 0.0013, + "step": 17555 + }, + { + "epoch": 0.34, + "learning_rate": 1.3201817405149313e-07, + "loss": 0.0011, + "step": 17556 + }, + { + "epoch": 0.34, + "learning_rate": 1.32014290707157e-07, + "loss": 0.0012, + "step": 17557 + }, + { + "epoch": 0.34, + "learning_rate": 1.3201040736282084e-07, + "loss": 0.1517, + "step": 17558 + }, + { + "epoch": 0.34, + "learning_rate": 1.3200652401848471e-07, + "loss": 0.0023, + "step": 17559 + }, + { + "epoch": 0.34, + "learning_rate": 1.3200264067414856e-07, + "loss": 0.0012, + "step": 17560 + }, + { + "epoch": 0.34, + "learning_rate": 1.3199875732981243e-07, + "loss": 0.0017, + "step": 17561 + }, + { + "epoch": 0.34, + "learning_rate": 1.3199487398547627e-07, + "loss": 0.0221, + "step": 17562 + }, + { + "epoch": 0.34, + "learning_rate": 1.3199099064114015e-07, + "loss": 0.0013, + "step": 17563 + }, + { + "epoch": 0.34, + "learning_rate": 1.31987107296804e-07, + "loss": 0.0009, + "step": 17564 + }, + { + "epoch": 0.34, + "learning_rate": 1.3198322395246786e-07, + "loss": 0.0014, + "step": 17565 + }, + { + "epoch": 0.34, + "learning_rate": 1.319793406081317e-07, + "loss": 0.0009, + "step": 17566 + }, + { + "epoch": 0.34, + "learning_rate": 1.3197545726379558e-07, + "loss": 0.0009, + "step": 17567 + }, + { + "epoch": 0.34, + "learning_rate": 1.3197157391945942e-07, + "loss": 0.0008, + "step": 17568 + }, + { + "epoch": 0.34, + "learning_rate": 1.319676905751233e-07, + "loss": 0.001, + "step": 17569 + }, + { + "epoch": 0.34, + "learning_rate": 1.3196380723078714e-07, + "loss": 0.0008, + "step": 17570 + }, + { + "epoch": 0.34, + "learning_rate": 1.31959923886451e-07, + "loss": 0.001, + "step": 17571 + }, + { + "epoch": 0.34, + "learning_rate": 1.3195604054211486e-07, + "loss": 0.4702, + "step": 17572 + }, + { + "epoch": 0.34, + "learning_rate": 1.3195215719777873e-07, + "loss": 0.0011, + "step": 17573 + }, + { + "epoch": 0.34, + "learning_rate": 1.3194827385344257e-07, + "loss": 0.0009, + "step": 17574 + }, + { + "epoch": 0.34, + "learning_rate": 1.3194439050910645e-07, + "loss": 0.0468, + "step": 17575 + }, + { + "epoch": 0.34, + "learning_rate": 1.319405071647703e-07, + "loss": 0.3441, + "step": 17576 + }, + { + "epoch": 0.34, + "learning_rate": 1.3193662382043416e-07, + "loss": 0.0057, + "step": 17577 + }, + { + "epoch": 0.34, + "learning_rate": 1.31932740476098e-07, + "loss": 0.0075, + "step": 17578 + }, + { + "epoch": 0.34, + "learning_rate": 1.3192885713176188e-07, + "loss": 0.0037, + "step": 17579 + }, + { + "epoch": 0.34, + "learning_rate": 1.3192497378742572e-07, + "loss": 0.0011, + "step": 17580 + }, + { + "epoch": 0.34, + "learning_rate": 1.319210904430896e-07, + "loss": 0.0008, + "step": 17581 + }, + { + "epoch": 0.34, + "learning_rate": 1.3191720709875344e-07, + "loss": 0.0008, + "step": 17582 + }, + { + "epoch": 0.34, + "learning_rate": 1.319133237544173e-07, + "loss": 0.0019, + "step": 17583 + }, + { + "epoch": 0.34, + "learning_rate": 1.3190944041008116e-07, + "loss": 0.4477, + "step": 17584 + }, + { + "epoch": 0.34, + "learning_rate": 1.3190555706574503e-07, + "loss": 0.001, + "step": 17585 + }, + { + "epoch": 0.34, + "learning_rate": 1.3190167372140887e-07, + "loss": 0.0011, + "step": 17586 + }, + { + "epoch": 0.34, + "learning_rate": 1.3189779037707274e-07, + "loss": 0.0011, + "step": 17587 + }, + { + "epoch": 0.34, + "learning_rate": 1.318939070327366e-07, + "loss": 0.0026, + "step": 17588 + }, + { + "epoch": 0.34, + "learning_rate": 1.3189002368840046e-07, + "loss": 0.2597, + "step": 17589 + }, + { + "epoch": 0.34, + "learning_rate": 1.318861403440643e-07, + "loss": 0.0026, + "step": 17590 + }, + { + "epoch": 0.34, + "learning_rate": 1.3188225699972818e-07, + "loss": 0.0008, + "step": 17591 + }, + { + "epoch": 0.34, + "learning_rate": 1.3187837365539202e-07, + "loss": 0.0132, + "step": 17592 + }, + { + "epoch": 0.34, + "learning_rate": 1.318744903110559e-07, + "loss": 0.0011, + "step": 17593 + }, + { + "epoch": 0.34, + "learning_rate": 1.3187060696671974e-07, + "loss": 0.0008, + "step": 17594 + }, + { + "epoch": 0.34, + "learning_rate": 1.3186672362238358e-07, + "loss": 0.0009, + "step": 17595 + }, + { + "epoch": 0.34, + "learning_rate": 1.3186284027804743e-07, + "loss": 0.0011, + "step": 17596 + }, + { + "epoch": 0.34, + "learning_rate": 1.318589569337113e-07, + "loss": 0.2632, + "step": 17597 + }, + { + "epoch": 0.34, + "learning_rate": 1.3185507358937515e-07, + "loss": 0.001, + "step": 17598 + }, + { + "epoch": 0.34, + "learning_rate": 1.3185119024503902e-07, + "loss": 0.001, + "step": 17599 + }, + { + "epoch": 0.34, + "learning_rate": 1.3184730690070286e-07, + "loss": 0.0007, + "step": 17600 + }, + { + "epoch": 0.34, + "learning_rate": 1.3184342355636673e-07, + "loss": 0.0007, + "step": 17601 + }, + { + "epoch": 0.34, + "learning_rate": 1.3183954021203058e-07, + "loss": 0.2566, + "step": 17602 + }, + { + "epoch": 0.34, + "learning_rate": 1.3183565686769445e-07, + "loss": 0.0009, + "step": 17603 + }, + { + "epoch": 0.34, + "learning_rate": 1.318317735233583e-07, + "loss": 0.0015, + "step": 17604 + }, + { + "epoch": 0.34, + "learning_rate": 1.3182789017902217e-07, + "loss": 0.0009, + "step": 17605 + }, + { + "epoch": 0.34, + "learning_rate": 1.31824006834686e-07, + "loss": 0.7514, + "step": 17606 + }, + { + "epoch": 0.34, + "learning_rate": 1.3182012349034988e-07, + "loss": 0.0009, + "step": 17607 + }, + { + "epoch": 0.34, + "learning_rate": 1.3181624014601373e-07, + "loss": 0.0007, + "step": 17608 + }, + { + "epoch": 0.34, + "learning_rate": 1.318123568016776e-07, + "loss": 0.0013, + "step": 17609 + }, + { + "epoch": 0.34, + "learning_rate": 1.3180847345734144e-07, + "loss": 0.0006, + "step": 17610 + }, + { + "epoch": 0.34, + "learning_rate": 1.3180459011300532e-07, + "loss": 0.0011, + "step": 17611 + }, + { + "epoch": 0.34, + "learning_rate": 1.3180070676866916e-07, + "loss": 0.001, + "step": 17612 + }, + { + "epoch": 0.34, + "learning_rate": 1.3179682342433303e-07, + "loss": 0.008, + "step": 17613 + }, + { + "epoch": 0.34, + "learning_rate": 1.3179294007999688e-07, + "loss": 0.0008, + "step": 17614 + }, + { + "epoch": 0.34, + "learning_rate": 1.3178905673566075e-07, + "loss": 0.001, + "step": 17615 + }, + { + "epoch": 0.34, + "learning_rate": 1.317851733913246e-07, + "loss": 0.0901, + "step": 17616 + }, + { + "epoch": 0.34, + "learning_rate": 1.3178129004698846e-07, + "loss": 0.001, + "step": 17617 + }, + { + "epoch": 0.34, + "learning_rate": 1.317774067026523e-07, + "loss": 0.6154, + "step": 17618 + }, + { + "epoch": 0.34, + "learning_rate": 1.3177352335831618e-07, + "loss": 0.1105, + "step": 17619 + }, + { + "epoch": 0.34, + "learning_rate": 1.3176964001398003e-07, + "loss": 0.0021, + "step": 17620 + }, + { + "epoch": 0.34, + "learning_rate": 1.317657566696439e-07, + "loss": 0.0009, + "step": 17621 + }, + { + "epoch": 0.34, + "learning_rate": 1.3176187332530774e-07, + "loss": 0.0047, + "step": 17622 + }, + { + "epoch": 0.34, + "learning_rate": 1.3175798998097161e-07, + "loss": 0.0008, + "step": 17623 + }, + { + "epoch": 0.34, + "learning_rate": 1.3175410663663546e-07, + "loss": 0.0824, + "step": 17624 + }, + { + "epoch": 0.34, + "learning_rate": 1.3175022329229933e-07, + "loss": 0.0012, + "step": 17625 + }, + { + "epoch": 0.34, + "learning_rate": 1.3174633994796318e-07, + "loss": 0.0015, + "step": 17626 + }, + { + "epoch": 0.34, + "learning_rate": 1.3174245660362705e-07, + "loss": 0.0012, + "step": 17627 + }, + { + "epoch": 0.34, + "learning_rate": 1.317385732592909e-07, + "loss": 0.0008, + "step": 17628 + }, + { + "epoch": 0.34, + "learning_rate": 1.3173468991495476e-07, + "loss": 0.0032, + "step": 17629 + }, + { + "epoch": 0.34, + "learning_rate": 1.317308065706186e-07, + "loss": 0.0007, + "step": 17630 + }, + { + "epoch": 0.34, + "learning_rate": 1.3172692322628248e-07, + "loss": 0.0021, + "step": 17631 + }, + { + "epoch": 0.34, + "learning_rate": 1.3172303988194633e-07, + "loss": 0.0011, + "step": 17632 + }, + { + "epoch": 0.34, + "learning_rate": 1.317191565376102e-07, + "loss": 0.0007, + "step": 17633 + }, + { + "epoch": 0.34, + "learning_rate": 1.3171527319327404e-07, + "loss": 0.001, + "step": 17634 + }, + { + "epoch": 0.34, + "learning_rate": 1.3171138984893791e-07, + "loss": 0.0029, + "step": 17635 + }, + { + "epoch": 0.34, + "learning_rate": 1.3170750650460176e-07, + "loss": 0.0009, + "step": 17636 + }, + { + "epoch": 0.34, + "learning_rate": 1.3170362316026563e-07, + "loss": 0.0007, + "step": 17637 + }, + { + "epoch": 0.34, + "learning_rate": 1.3169973981592947e-07, + "loss": 0.0068, + "step": 17638 + }, + { + "epoch": 0.34, + "learning_rate": 1.3169585647159335e-07, + "loss": 0.001, + "step": 17639 + }, + { + "epoch": 0.34, + "learning_rate": 1.316919731272572e-07, + "loss": 0.0013, + "step": 17640 + }, + { + "epoch": 0.34, + "learning_rate": 1.3168808978292106e-07, + "loss": 0.0008, + "step": 17641 + }, + { + "epoch": 0.34, + "learning_rate": 1.316842064385849e-07, + "loss": 0.0008, + "step": 17642 + }, + { + "epoch": 0.34, + "learning_rate": 1.3168032309424878e-07, + "loss": 0.0007, + "step": 17643 + }, + { + "epoch": 0.34, + "learning_rate": 1.3167643974991262e-07, + "loss": 0.0011, + "step": 17644 + }, + { + "epoch": 0.34, + "learning_rate": 1.316725564055765e-07, + "loss": 0.001, + "step": 17645 + }, + { + "epoch": 0.34, + "learning_rate": 1.3166867306124034e-07, + "loss": 0.2367, + "step": 17646 + }, + { + "epoch": 0.34, + "learning_rate": 1.316647897169042e-07, + "loss": 0.0055, + "step": 17647 + }, + { + "epoch": 0.34, + "learning_rate": 1.3166090637256806e-07, + "loss": 0.0011, + "step": 17648 + }, + { + "epoch": 0.34, + "learning_rate": 1.3165702302823193e-07, + "loss": 0.0601, + "step": 17649 + }, + { + "epoch": 0.34, + "learning_rate": 1.3165313968389577e-07, + "loss": 0.123, + "step": 17650 + }, + { + "epoch": 0.34, + "learning_rate": 1.3164925633955965e-07, + "loss": 0.005, + "step": 17651 + }, + { + "epoch": 0.34, + "learning_rate": 1.316453729952235e-07, + "loss": 0.0027, + "step": 17652 + }, + { + "epoch": 0.34, + "learning_rate": 1.3164148965088734e-07, + "loss": 0.0046, + "step": 17653 + }, + { + "epoch": 0.34, + "learning_rate": 1.3163760630655118e-07, + "loss": 0.0017, + "step": 17654 + }, + { + "epoch": 0.34, + "learning_rate": 1.3163372296221505e-07, + "loss": 0.0013, + "step": 17655 + }, + { + "epoch": 0.34, + "learning_rate": 1.316298396178789e-07, + "loss": 0.0008, + "step": 17656 + }, + { + "epoch": 0.34, + "learning_rate": 1.3162595627354277e-07, + "loss": 0.0012, + "step": 17657 + }, + { + "epoch": 0.34, + "learning_rate": 1.3162207292920661e-07, + "loss": 0.0011, + "step": 17658 + }, + { + "epoch": 0.34, + "learning_rate": 1.3161818958487048e-07, + "loss": 0.0008, + "step": 17659 + }, + { + "epoch": 0.34, + "learning_rate": 1.3161430624053433e-07, + "loss": 0.0012, + "step": 17660 + }, + { + "epoch": 0.34, + "learning_rate": 1.316104228961982e-07, + "loss": 0.0008, + "step": 17661 + }, + { + "epoch": 0.34, + "learning_rate": 1.3160653955186205e-07, + "loss": 0.0103, + "step": 17662 + }, + { + "epoch": 0.34, + "learning_rate": 1.3160265620752592e-07, + "loss": 0.7892, + "step": 17663 + }, + { + "epoch": 0.34, + "learning_rate": 1.3159877286318976e-07, + "loss": 0.0595, + "step": 17664 + }, + { + "epoch": 0.34, + "learning_rate": 1.3159488951885363e-07, + "loss": 0.0014, + "step": 17665 + }, + { + "epoch": 0.34, + "learning_rate": 1.3159100617451748e-07, + "loss": 0.0352, + "step": 17666 + }, + { + "epoch": 0.34, + "learning_rate": 1.3158712283018135e-07, + "loss": 0.0007, + "step": 17667 + }, + { + "epoch": 0.34, + "learning_rate": 1.315832394858452e-07, + "loss": 0.0012, + "step": 17668 + }, + { + "epoch": 0.34, + "learning_rate": 1.3157935614150907e-07, + "loss": 0.0009, + "step": 17669 + }, + { + "epoch": 0.34, + "learning_rate": 1.315754727971729e-07, + "loss": 0.0017, + "step": 17670 + }, + { + "epoch": 0.34, + "learning_rate": 1.3157158945283678e-07, + "loss": 0.0013, + "step": 17671 + }, + { + "epoch": 0.34, + "learning_rate": 1.3156770610850063e-07, + "loss": 0.0014, + "step": 17672 + }, + { + "epoch": 0.34, + "learning_rate": 1.315638227641645e-07, + "loss": 0.0028, + "step": 17673 + }, + { + "epoch": 0.34, + "learning_rate": 1.3155993941982835e-07, + "loss": 0.0028, + "step": 17674 + }, + { + "epoch": 0.34, + "learning_rate": 1.3155605607549222e-07, + "loss": 0.2758, + "step": 17675 + }, + { + "epoch": 0.34, + "learning_rate": 1.3155217273115606e-07, + "loss": 0.0012, + "step": 17676 + }, + { + "epoch": 0.34, + "learning_rate": 1.3154828938681993e-07, + "loss": 0.0082, + "step": 17677 + }, + { + "epoch": 0.34, + "learning_rate": 1.3154440604248378e-07, + "loss": 0.001, + "step": 17678 + }, + { + "epoch": 0.34, + "learning_rate": 1.3154052269814765e-07, + "loss": 0.4997, + "step": 17679 + }, + { + "epoch": 0.34, + "learning_rate": 1.315366393538115e-07, + "loss": 0.001, + "step": 17680 + }, + { + "epoch": 0.34, + "learning_rate": 1.3153275600947537e-07, + "loss": 0.0009, + "step": 17681 + }, + { + "epoch": 0.34, + "learning_rate": 1.315288726651392e-07, + "loss": 0.0015, + "step": 17682 + }, + { + "epoch": 0.34, + "learning_rate": 1.3152498932080308e-07, + "loss": 0.001, + "step": 17683 + }, + { + "epoch": 0.34, + "learning_rate": 1.3152110597646693e-07, + "loss": 0.7403, + "step": 17684 + }, + { + "epoch": 0.34, + "learning_rate": 1.315172226321308e-07, + "loss": 0.0007, + "step": 17685 + }, + { + "epoch": 0.34, + "learning_rate": 1.3151333928779464e-07, + "loss": 0.0008, + "step": 17686 + }, + { + "epoch": 0.34, + "learning_rate": 1.3150945594345852e-07, + "loss": 0.0009, + "step": 17687 + }, + { + "epoch": 0.34, + "learning_rate": 1.3150557259912236e-07, + "loss": 0.0008, + "step": 17688 + }, + { + "epoch": 0.34, + "learning_rate": 1.3150168925478623e-07, + "loss": 0.0012, + "step": 17689 + }, + { + "epoch": 0.34, + "learning_rate": 1.3149780591045008e-07, + "loss": 0.001, + "step": 17690 + }, + { + "epoch": 0.34, + "learning_rate": 1.3149392256611392e-07, + "loss": 0.0008, + "step": 17691 + }, + { + "epoch": 0.34, + "learning_rate": 1.314900392217778e-07, + "loss": 0.0007, + "step": 17692 + }, + { + "epoch": 0.34, + "learning_rate": 1.3148615587744164e-07, + "loss": 0.0011, + "step": 17693 + }, + { + "epoch": 0.34, + "learning_rate": 1.314822725331055e-07, + "loss": 0.0007, + "step": 17694 + }, + { + "epoch": 0.34, + "learning_rate": 1.3147838918876936e-07, + "loss": 0.2798, + "step": 17695 + }, + { + "epoch": 0.34, + "learning_rate": 1.3147450584443323e-07, + "loss": 0.0009, + "step": 17696 + }, + { + "epoch": 0.34, + "learning_rate": 1.3147062250009707e-07, + "loss": 0.0016, + "step": 17697 + }, + { + "epoch": 0.34, + "learning_rate": 1.3146673915576094e-07, + "loss": 0.0008, + "step": 17698 + }, + { + "epoch": 0.34, + "learning_rate": 1.314628558114248e-07, + "loss": 0.9872, + "step": 17699 + }, + { + "epoch": 0.34, + "learning_rate": 1.3145897246708866e-07, + "loss": 0.0009, + "step": 17700 + }, + { + "epoch": 0.34, + "learning_rate": 1.314550891227525e-07, + "loss": 0.0011, + "step": 17701 + }, + { + "epoch": 0.34, + "learning_rate": 1.3145120577841638e-07, + "loss": 0.0012, + "step": 17702 + }, + { + "epoch": 0.34, + "learning_rate": 1.3144732243408022e-07, + "loss": 0.0011, + "step": 17703 + }, + { + "epoch": 0.34, + "learning_rate": 1.314434390897441e-07, + "loss": 0.0008, + "step": 17704 + }, + { + "epoch": 0.34, + "learning_rate": 1.3143955574540794e-07, + "loss": 0.0011, + "step": 17705 + }, + { + "epoch": 0.34, + "learning_rate": 1.314356724010718e-07, + "loss": 0.0032, + "step": 17706 + }, + { + "epoch": 0.34, + "learning_rate": 1.3143178905673565e-07, + "loss": 0.0011, + "step": 17707 + }, + { + "epoch": 0.34, + "learning_rate": 1.3142790571239953e-07, + "loss": 0.0083, + "step": 17708 + }, + { + "epoch": 0.34, + "learning_rate": 1.3142402236806337e-07, + "loss": 0.0021, + "step": 17709 + }, + { + "epoch": 0.34, + "learning_rate": 1.3142013902372724e-07, + "loss": 0.0011, + "step": 17710 + }, + { + "epoch": 0.34, + "learning_rate": 1.314162556793911e-07, + "loss": 0.0008, + "step": 17711 + }, + { + "epoch": 0.34, + "learning_rate": 1.3141237233505493e-07, + "loss": 0.001, + "step": 17712 + }, + { + "epoch": 0.34, + "learning_rate": 1.314084889907188e-07, + "loss": 0.0012, + "step": 17713 + }, + { + "epoch": 0.34, + "learning_rate": 1.3140460564638265e-07, + "loss": 0.738, + "step": 17714 + }, + { + "epoch": 0.34, + "learning_rate": 1.3140072230204652e-07, + "loss": 0.0162, + "step": 17715 + }, + { + "epoch": 0.34, + "learning_rate": 1.3139683895771036e-07, + "loss": 0.0033, + "step": 17716 + }, + { + "epoch": 0.34, + "learning_rate": 1.3139295561337424e-07, + "loss": 0.0013, + "step": 17717 + }, + { + "epoch": 0.34, + "learning_rate": 1.3138907226903808e-07, + "loss": 0.0009, + "step": 17718 + }, + { + "epoch": 0.34, + "learning_rate": 1.3138518892470193e-07, + "loss": 0.001, + "step": 17719 + }, + { + "epoch": 0.34, + "learning_rate": 1.313813055803658e-07, + "loss": 0.0011, + "step": 17720 + }, + { + "epoch": 0.34, + "learning_rate": 1.3137742223602964e-07, + "loss": 0.001, + "step": 17721 + }, + { + "epoch": 0.34, + "learning_rate": 1.3137353889169351e-07, + "loss": 0.0008, + "step": 17722 + }, + { + "epoch": 0.34, + "learning_rate": 1.3136965554735736e-07, + "loss": 0.0019, + "step": 17723 + }, + { + "epoch": 0.34, + "learning_rate": 1.3136577220302123e-07, + "loss": 0.06, + "step": 17724 + }, + { + "epoch": 0.34, + "learning_rate": 1.3136188885868508e-07, + "loss": 0.0007, + "step": 17725 + }, + { + "epoch": 0.34, + "learning_rate": 1.3135800551434895e-07, + "loss": 0.0006, + "step": 17726 + }, + { + "epoch": 0.34, + "learning_rate": 1.313541221700128e-07, + "loss": 0.0009, + "step": 17727 + }, + { + "epoch": 0.34, + "learning_rate": 1.3135023882567666e-07, + "loss": 0.0006, + "step": 17728 + }, + { + "epoch": 0.34, + "learning_rate": 1.313463554813405e-07, + "loss": 0.0015, + "step": 17729 + }, + { + "epoch": 0.34, + "learning_rate": 1.3134247213700438e-07, + "loss": 0.0009, + "step": 17730 + }, + { + "epoch": 0.34, + "learning_rate": 1.3133858879266823e-07, + "loss": 0.0011, + "step": 17731 + }, + { + "epoch": 0.34, + "learning_rate": 1.313347054483321e-07, + "loss": 0.0007, + "step": 17732 + }, + { + "epoch": 0.34, + "learning_rate": 1.3133082210399594e-07, + "loss": 0.0006, + "step": 17733 + }, + { + "epoch": 0.34, + "learning_rate": 1.3132693875965981e-07, + "loss": 0.0012, + "step": 17734 + }, + { + "epoch": 0.34, + "learning_rate": 1.3132305541532366e-07, + "loss": 0.0009, + "step": 17735 + }, + { + "epoch": 0.34, + "learning_rate": 1.3131917207098753e-07, + "loss": 0.0015, + "step": 17736 + }, + { + "epoch": 0.34, + "learning_rate": 1.3131528872665137e-07, + "loss": 0.0009, + "step": 17737 + }, + { + "epoch": 0.34, + "learning_rate": 1.3131140538231525e-07, + "loss": 0.3955, + "step": 17738 + }, + { + "epoch": 0.34, + "learning_rate": 1.313075220379791e-07, + "loss": 0.096, + "step": 17739 + }, + { + "epoch": 0.34, + "learning_rate": 1.3130363869364296e-07, + "loss": 0.0058, + "step": 17740 + }, + { + "epoch": 0.34, + "learning_rate": 1.312997553493068e-07, + "loss": 0.0011, + "step": 17741 + }, + { + "epoch": 0.34, + "learning_rate": 1.3129587200497068e-07, + "loss": 0.0008, + "step": 17742 + }, + { + "epoch": 0.34, + "learning_rate": 1.3129198866063452e-07, + "loss": 0.7017, + "step": 17743 + }, + { + "epoch": 0.34, + "learning_rate": 1.312881053162984e-07, + "loss": 0.0008, + "step": 17744 + }, + { + "epoch": 0.34, + "learning_rate": 1.3128422197196224e-07, + "loss": 0.0008, + "step": 17745 + }, + { + "epoch": 0.34, + "learning_rate": 1.312803386276261e-07, + "loss": 0.0007, + "step": 17746 + }, + { + "epoch": 0.34, + "learning_rate": 1.3127645528328996e-07, + "loss": 0.0014, + "step": 17747 + }, + { + "epoch": 0.34, + "learning_rate": 1.3127257193895383e-07, + "loss": 0.0009, + "step": 17748 + }, + { + "epoch": 0.34, + "learning_rate": 1.3126868859461767e-07, + "loss": 0.0007, + "step": 17749 + }, + { + "epoch": 0.34, + "learning_rate": 1.3126480525028155e-07, + "loss": 0.0008, + "step": 17750 + }, + { + "epoch": 0.34, + "learning_rate": 1.312609219059454e-07, + "loss": 0.0008, + "step": 17751 + }, + { + "epoch": 0.34, + "learning_rate": 1.3125703856160926e-07, + "loss": 0.001, + "step": 17752 + }, + { + "epoch": 0.34, + "learning_rate": 1.312531552172731e-07, + "loss": 0.0009, + "step": 17753 + }, + { + "epoch": 0.34, + "learning_rate": 1.3124927187293698e-07, + "loss": 0.0013, + "step": 17754 + }, + { + "epoch": 0.34, + "learning_rate": 1.3124538852860082e-07, + "loss": 0.0012, + "step": 17755 + }, + { + "epoch": 0.34, + "learning_rate": 1.312415051842647e-07, + "loss": 0.0008, + "step": 17756 + }, + { + "epoch": 0.34, + "learning_rate": 1.3123762183992854e-07, + "loss": 0.0009, + "step": 17757 + }, + { + "epoch": 0.34, + "learning_rate": 1.312337384955924e-07, + "loss": 0.0123, + "step": 17758 + }, + { + "epoch": 0.34, + "learning_rate": 1.3122985515125626e-07, + "loss": 0.0006, + "step": 17759 + }, + { + "epoch": 0.34, + "learning_rate": 1.3122597180692013e-07, + "loss": 0.9238, + "step": 17760 + }, + { + "epoch": 0.34, + "learning_rate": 1.3122208846258397e-07, + "loss": 0.0009, + "step": 17761 + }, + { + "epoch": 0.34, + "learning_rate": 1.3121820511824784e-07, + "loss": 0.4949, + "step": 17762 + }, + { + "epoch": 0.34, + "learning_rate": 1.312143217739117e-07, + "loss": 0.0026, + "step": 17763 + }, + { + "epoch": 0.34, + "learning_rate": 1.3121043842957556e-07, + "loss": 1.4334, + "step": 17764 + }, + { + "epoch": 0.34, + "learning_rate": 1.312065550852394e-07, + "loss": 0.0008, + "step": 17765 + }, + { + "epoch": 0.34, + "learning_rate": 1.3120267174090328e-07, + "loss": 0.0008, + "step": 17766 + }, + { + "epoch": 0.34, + "learning_rate": 1.3119878839656712e-07, + "loss": 0.0014, + "step": 17767 + }, + { + "epoch": 0.34, + "learning_rate": 1.31194905052231e-07, + "loss": 0.0024, + "step": 17768 + }, + { + "epoch": 0.34, + "learning_rate": 1.311910217078948e-07, + "loss": 0.0007, + "step": 17769 + }, + { + "epoch": 0.34, + "learning_rate": 1.3118713836355868e-07, + "loss": 0.0009, + "step": 17770 + }, + { + "epoch": 0.34, + "learning_rate": 1.3118325501922253e-07, + "loss": 0.0011, + "step": 17771 + }, + { + "epoch": 0.34, + "learning_rate": 1.311793716748864e-07, + "loss": 0.6229, + "step": 17772 + }, + { + "epoch": 0.34, + "learning_rate": 1.3117548833055025e-07, + "loss": 0.3726, + "step": 17773 + }, + { + "epoch": 0.34, + "learning_rate": 1.3117160498621412e-07, + "loss": 0.0474, + "step": 17774 + }, + { + "epoch": 0.34, + "learning_rate": 1.3116772164187796e-07, + "loss": 0.0017, + "step": 17775 + }, + { + "epoch": 0.34, + "learning_rate": 1.3116383829754183e-07, + "loss": 0.001, + "step": 17776 + }, + { + "epoch": 0.34, + "learning_rate": 1.3115995495320568e-07, + "loss": 0.005, + "step": 17777 + }, + { + "epoch": 0.34, + "learning_rate": 1.3115607160886955e-07, + "loss": 0.0013, + "step": 17778 + }, + { + "epoch": 0.34, + "learning_rate": 1.311521882645334e-07, + "loss": 0.5571, + "step": 17779 + }, + { + "epoch": 0.34, + "learning_rate": 1.3114830492019727e-07, + "loss": 0.001, + "step": 17780 + }, + { + "epoch": 0.34, + "learning_rate": 1.311444215758611e-07, + "loss": 0.0023, + "step": 17781 + }, + { + "epoch": 0.34, + "learning_rate": 1.3114053823152498e-07, + "loss": 0.0018, + "step": 17782 + }, + { + "epoch": 0.34, + "learning_rate": 1.3113665488718883e-07, + "loss": 0.6039, + "step": 17783 + }, + { + "epoch": 0.34, + "learning_rate": 1.311327715428527e-07, + "loss": 0.001, + "step": 17784 + }, + { + "epoch": 0.34, + "learning_rate": 1.3112888819851654e-07, + "loss": 0.9657, + "step": 17785 + }, + { + "epoch": 0.35, + "learning_rate": 1.3112500485418042e-07, + "loss": 0.0008, + "step": 17786 + }, + { + "epoch": 0.35, + "learning_rate": 1.3112112150984426e-07, + "loss": 0.0011, + "step": 17787 + }, + { + "epoch": 0.35, + "learning_rate": 1.3111723816550813e-07, + "loss": 0.001, + "step": 17788 + }, + { + "epoch": 0.35, + "learning_rate": 1.3111335482117198e-07, + "loss": 0.0017, + "step": 17789 + }, + { + "epoch": 0.35, + "learning_rate": 1.3110947147683585e-07, + "loss": 0.001, + "step": 17790 + }, + { + "epoch": 0.35, + "learning_rate": 1.311055881324997e-07, + "loss": 0.0024, + "step": 17791 + }, + { + "epoch": 0.35, + "learning_rate": 1.3110170478816357e-07, + "loss": 0.0013, + "step": 17792 + }, + { + "epoch": 0.35, + "learning_rate": 1.310978214438274e-07, + "loss": 0.0009, + "step": 17793 + }, + { + "epoch": 0.35, + "learning_rate": 1.3109393809949128e-07, + "loss": 0.0012, + "step": 17794 + }, + { + "epoch": 0.35, + "learning_rate": 1.3109005475515513e-07, + "loss": 0.1002, + "step": 17795 + }, + { + "epoch": 0.35, + "learning_rate": 1.31086171410819e-07, + "loss": 0.001, + "step": 17796 + }, + { + "epoch": 0.35, + "learning_rate": 1.3108228806648284e-07, + "loss": 0.0008, + "step": 17797 + }, + { + "epoch": 0.35, + "learning_rate": 1.3107840472214671e-07, + "loss": 0.001, + "step": 17798 + }, + { + "epoch": 0.35, + "learning_rate": 1.3107452137781056e-07, + "loss": 0.0018, + "step": 17799 + }, + { + "epoch": 0.35, + "learning_rate": 1.3107063803347443e-07, + "loss": 0.0013, + "step": 17800 + }, + { + "epoch": 0.35, + "learning_rate": 1.3106675468913828e-07, + "loss": 0.0375, + "step": 17801 + }, + { + "epoch": 0.35, + "learning_rate": 1.3106287134480215e-07, + "loss": 0.0009, + "step": 17802 + }, + { + "epoch": 0.35, + "learning_rate": 1.31058988000466e-07, + "loss": 0.0016, + "step": 17803 + }, + { + "epoch": 0.35, + "learning_rate": 1.3105510465612986e-07, + "loss": 0.0009, + "step": 17804 + }, + { + "epoch": 0.35, + "learning_rate": 1.310512213117937e-07, + "loss": 0.0061, + "step": 17805 + }, + { + "epoch": 0.35, + "learning_rate": 1.3104733796745758e-07, + "loss": 0.0009, + "step": 17806 + }, + { + "epoch": 0.35, + "learning_rate": 1.3104345462312143e-07, + "loss": 0.0008, + "step": 17807 + }, + { + "epoch": 0.35, + "learning_rate": 1.310395712787853e-07, + "loss": 0.0012, + "step": 17808 + }, + { + "epoch": 0.35, + "learning_rate": 1.3103568793444914e-07, + "loss": 0.0014, + "step": 17809 + }, + { + "epoch": 0.35, + "learning_rate": 1.3103180459011301e-07, + "loss": 0.0009, + "step": 17810 + }, + { + "epoch": 0.35, + "learning_rate": 1.3102792124577686e-07, + "loss": 0.0014, + "step": 17811 + }, + { + "epoch": 0.35, + "learning_rate": 1.3102403790144073e-07, + "loss": 0.0007, + "step": 17812 + }, + { + "epoch": 0.35, + "learning_rate": 1.3102015455710457e-07, + "loss": 0.0011, + "step": 17813 + }, + { + "epoch": 0.35, + "learning_rate": 1.3101627121276845e-07, + "loss": 0.0013, + "step": 17814 + }, + { + "epoch": 0.35, + "learning_rate": 1.310123878684323e-07, + "loss": 0.0009, + "step": 17815 + }, + { + "epoch": 0.35, + "learning_rate": 1.3100850452409616e-07, + "loss": 0.0016, + "step": 17816 + }, + { + "epoch": 0.35, + "learning_rate": 1.3100462117976e-07, + "loss": 0.0009, + "step": 17817 + }, + { + "epoch": 0.35, + "learning_rate": 1.3100073783542388e-07, + "loss": 0.0007, + "step": 17818 + }, + { + "epoch": 0.35, + "learning_rate": 1.3099685449108772e-07, + "loss": 0.0008, + "step": 17819 + }, + { + "epoch": 0.35, + "learning_rate": 1.309929711467516e-07, + "loss": 1.273, + "step": 17820 + }, + { + "epoch": 0.35, + "learning_rate": 1.3098908780241544e-07, + "loss": 0.4957, + "step": 17821 + }, + { + "epoch": 0.35, + "learning_rate": 1.309852044580793e-07, + "loss": 0.0009, + "step": 17822 + }, + { + "epoch": 0.35, + "learning_rate": 1.3098132111374316e-07, + "loss": 0.0012, + "step": 17823 + }, + { + "epoch": 0.35, + "learning_rate": 1.3097743776940703e-07, + "loss": 0.0011, + "step": 17824 + }, + { + "epoch": 0.35, + "learning_rate": 1.3097355442507087e-07, + "loss": 0.0023, + "step": 17825 + }, + { + "epoch": 0.35, + "learning_rate": 1.3096967108073475e-07, + "loss": 0.0008, + "step": 17826 + }, + { + "epoch": 0.35, + "learning_rate": 1.3096578773639856e-07, + "loss": 0.001, + "step": 17827 + }, + { + "epoch": 0.35, + "learning_rate": 1.3096190439206244e-07, + "loss": 0.0009, + "step": 17828 + }, + { + "epoch": 0.35, + "learning_rate": 1.3095802104772628e-07, + "loss": 0.0009, + "step": 17829 + }, + { + "epoch": 0.35, + "learning_rate": 1.3095413770339015e-07, + "loss": 0.0096, + "step": 17830 + }, + { + "epoch": 0.35, + "learning_rate": 1.30950254359054e-07, + "loss": 0.4841, + "step": 17831 + }, + { + "epoch": 0.35, + "learning_rate": 1.3094637101471787e-07, + "loss": 0.0007, + "step": 17832 + }, + { + "epoch": 0.35, + "learning_rate": 1.3094248767038171e-07, + "loss": 0.0153, + "step": 17833 + }, + { + "epoch": 0.35, + "learning_rate": 1.3093860432604558e-07, + "loss": 0.0007, + "step": 17834 + }, + { + "epoch": 0.35, + "learning_rate": 1.3093472098170943e-07, + "loss": 0.001, + "step": 17835 + }, + { + "epoch": 0.35, + "learning_rate": 1.309308376373733e-07, + "loss": 0.002, + "step": 17836 + }, + { + "epoch": 0.35, + "learning_rate": 1.3092695429303715e-07, + "loss": 0.001, + "step": 17837 + }, + { + "epoch": 0.35, + "learning_rate": 1.3092307094870102e-07, + "loss": 0.0009, + "step": 17838 + }, + { + "epoch": 0.35, + "learning_rate": 1.3091918760436486e-07, + "loss": 0.0038, + "step": 17839 + }, + { + "epoch": 0.35, + "learning_rate": 1.3091530426002873e-07, + "loss": 0.0008, + "step": 17840 + }, + { + "epoch": 0.35, + "learning_rate": 1.3091142091569258e-07, + "loss": 0.0008, + "step": 17841 + }, + { + "epoch": 0.35, + "learning_rate": 1.3090753757135645e-07, + "loss": 0.0013, + "step": 17842 + }, + { + "epoch": 0.35, + "learning_rate": 1.309036542270203e-07, + "loss": 0.0008, + "step": 17843 + }, + { + "epoch": 0.35, + "learning_rate": 1.3089977088268417e-07, + "loss": 0.0007, + "step": 17844 + }, + { + "epoch": 0.35, + "learning_rate": 1.30895887538348e-07, + "loss": 0.0009, + "step": 17845 + }, + { + "epoch": 0.35, + "learning_rate": 1.3089200419401188e-07, + "loss": 0.0111, + "step": 17846 + }, + { + "epoch": 0.35, + "learning_rate": 1.3088812084967573e-07, + "loss": 0.0017, + "step": 17847 + }, + { + "epoch": 0.35, + "learning_rate": 1.308842375053396e-07, + "loss": 0.0013, + "step": 17848 + }, + { + "epoch": 0.35, + "learning_rate": 1.3088035416100345e-07, + "loss": 0.0007, + "step": 17849 + }, + { + "epoch": 0.35, + "learning_rate": 1.3087647081666732e-07, + "loss": 0.001, + "step": 17850 + }, + { + "epoch": 0.35, + "learning_rate": 1.3087258747233116e-07, + "loss": 0.0009, + "step": 17851 + }, + { + "epoch": 0.35, + "learning_rate": 1.3086870412799503e-07, + "loss": 0.002, + "step": 17852 + }, + { + "epoch": 0.35, + "learning_rate": 1.3086482078365888e-07, + "loss": 0.001, + "step": 17853 + }, + { + "epoch": 0.35, + "learning_rate": 1.3086093743932275e-07, + "loss": 0.0574, + "step": 17854 + }, + { + "epoch": 0.35, + "learning_rate": 1.308570540949866e-07, + "loss": 0.0207, + "step": 17855 + }, + { + "epoch": 0.35, + "learning_rate": 1.3085317075065047e-07, + "loss": 0.0021, + "step": 17856 + }, + { + "epoch": 0.35, + "learning_rate": 1.308492874063143e-07, + "loss": 0.001, + "step": 17857 + }, + { + "epoch": 0.35, + "learning_rate": 1.3084540406197818e-07, + "loss": 0.0079, + "step": 17858 + }, + { + "epoch": 0.35, + "learning_rate": 1.3084152071764203e-07, + "loss": 0.0012, + "step": 17859 + }, + { + "epoch": 0.35, + "learning_rate": 1.308376373733059e-07, + "loss": 0.001, + "step": 17860 + }, + { + "epoch": 0.35, + "learning_rate": 1.3083375402896974e-07, + "loss": 0.0062, + "step": 17861 + }, + { + "epoch": 0.35, + "learning_rate": 1.3082987068463362e-07, + "loss": 0.004, + "step": 17862 + }, + { + "epoch": 0.35, + "learning_rate": 1.3082598734029746e-07, + "loss": 0.0008, + "step": 17863 + }, + { + "epoch": 0.35, + "learning_rate": 1.3082210399596133e-07, + "loss": 0.0008, + "step": 17864 + }, + { + "epoch": 0.35, + "learning_rate": 1.3081822065162518e-07, + "loss": 0.0009, + "step": 17865 + }, + { + "epoch": 0.35, + "learning_rate": 1.3081433730728905e-07, + "loss": 0.0098, + "step": 17866 + }, + { + "epoch": 0.35, + "learning_rate": 1.308104539629529e-07, + "loss": 0.001, + "step": 17867 + }, + { + "epoch": 0.35, + "learning_rate": 1.3080657061861674e-07, + "loss": 0.0008, + "step": 17868 + }, + { + "epoch": 0.35, + "learning_rate": 1.308026872742806e-07, + "loss": 0.0007, + "step": 17869 + }, + { + "epoch": 0.35, + "learning_rate": 1.3079880392994446e-07, + "loss": 0.0574, + "step": 17870 + }, + { + "epoch": 0.35, + "learning_rate": 1.3079492058560833e-07, + "loss": 0.0009, + "step": 17871 + }, + { + "epoch": 0.35, + "learning_rate": 1.3079103724127217e-07, + "loss": 0.0008, + "step": 17872 + }, + { + "epoch": 0.35, + "learning_rate": 1.3078715389693604e-07, + "loss": 0.0031, + "step": 17873 + }, + { + "epoch": 0.35, + "learning_rate": 1.307832705525999e-07, + "loss": 0.0017, + "step": 17874 + }, + { + "epoch": 0.35, + "learning_rate": 1.3077938720826376e-07, + "loss": 0.0331, + "step": 17875 + }, + { + "epoch": 0.35, + "learning_rate": 1.307755038639276e-07, + "loss": 1.5048, + "step": 17876 + }, + { + "epoch": 0.35, + "learning_rate": 1.3077162051959148e-07, + "loss": 0.0008, + "step": 17877 + }, + { + "epoch": 0.35, + "learning_rate": 1.3076773717525532e-07, + "loss": 0.7346, + "step": 17878 + }, + { + "epoch": 0.35, + "learning_rate": 1.307638538309192e-07, + "loss": 0.0009, + "step": 17879 + }, + { + "epoch": 0.35, + "learning_rate": 1.3075997048658304e-07, + "loss": 1.2922, + "step": 17880 + }, + { + "epoch": 0.35, + "learning_rate": 1.307560871422469e-07, + "loss": 0.0007, + "step": 17881 + }, + { + "epoch": 0.35, + "learning_rate": 1.3075220379791075e-07, + "loss": 0.003, + "step": 17882 + }, + { + "epoch": 0.35, + "learning_rate": 1.3074832045357463e-07, + "loss": 0.0008, + "step": 17883 + }, + { + "epoch": 0.35, + "learning_rate": 1.3074443710923847e-07, + "loss": 0.0012, + "step": 17884 + }, + { + "epoch": 0.35, + "learning_rate": 1.3074055376490232e-07, + "loss": 0.0007, + "step": 17885 + }, + { + "epoch": 0.35, + "learning_rate": 1.307366704205662e-07, + "loss": 0.0011, + "step": 17886 + }, + { + "epoch": 0.35, + "learning_rate": 1.3073278707623003e-07, + "loss": 0.0008, + "step": 17887 + }, + { + "epoch": 0.35, + "learning_rate": 1.307289037318939e-07, + "loss": 0.0011, + "step": 17888 + }, + { + "epoch": 0.35, + "learning_rate": 1.3072502038755775e-07, + "loss": 0.0006, + "step": 17889 + }, + { + "epoch": 0.35, + "learning_rate": 1.3072113704322162e-07, + "loss": 1.137, + "step": 17890 + }, + { + "epoch": 0.35, + "learning_rate": 1.3071725369888547e-07, + "loss": 0.0009, + "step": 17891 + }, + { + "epoch": 0.35, + "learning_rate": 1.3071337035454934e-07, + "loss": 0.001, + "step": 17892 + }, + { + "epoch": 0.35, + "learning_rate": 1.3070948701021318e-07, + "loss": 0.0008, + "step": 17893 + }, + { + "epoch": 0.35, + "learning_rate": 1.3070560366587705e-07, + "loss": 0.0014, + "step": 17894 + }, + { + "epoch": 0.35, + "learning_rate": 1.307017203215409e-07, + "loss": 0.1048, + "step": 17895 + }, + { + "epoch": 0.35, + "learning_rate": 1.3069783697720474e-07, + "loss": 0.0009, + "step": 17896 + }, + { + "epoch": 0.35, + "learning_rate": 1.3069395363286861e-07, + "loss": 0.001, + "step": 17897 + }, + { + "epoch": 0.35, + "learning_rate": 1.3069007028853246e-07, + "loss": 0.132, + "step": 17898 + }, + { + "epoch": 0.35, + "learning_rate": 1.3068618694419633e-07, + "loss": 0.0009, + "step": 17899 + }, + { + "epoch": 0.35, + "learning_rate": 1.3068230359986018e-07, + "loss": 0.9683, + "step": 17900 + }, + { + "epoch": 0.35, + "learning_rate": 1.3067842025552405e-07, + "loss": 0.0007, + "step": 17901 + }, + { + "epoch": 0.35, + "learning_rate": 1.306745369111879e-07, + "loss": 0.0008, + "step": 17902 + }, + { + "epoch": 0.35, + "learning_rate": 1.3067065356685176e-07, + "loss": 0.0009, + "step": 17903 + }, + { + "epoch": 0.35, + "learning_rate": 1.306667702225156e-07, + "loss": 1.794, + "step": 17904 + }, + { + "epoch": 0.35, + "learning_rate": 1.3066288687817948e-07, + "loss": 0.0193, + "step": 17905 + }, + { + "epoch": 0.35, + "learning_rate": 1.3065900353384333e-07, + "loss": 0.0007, + "step": 17906 + }, + { + "epoch": 0.35, + "learning_rate": 1.306551201895072e-07, + "loss": 0.0008, + "step": 17907 + }, + { + "epoch": 0.35, + "learning_rate": 1.3065123684517104e-07, + "loss": 0.0007, + "step": 17908 + }, + { + "epoch": 0.35, + "learning_rate": 1.3064735350083491e-07, + "loss": 0.0008, + "step": 17909 + }, + { + "epoch": 0.35, + "learning_rate": 1.3064347015649876e-07, + "loss": 0.057, + "step": 17910 + }, + { + "epoch": 0.35, + "learning_rate": 1.3063958681216263e-07, + "loss": 0.0009, + "step": 17911 + }, + { + "epoch": 0.35, + "learning_rate": 1.3063570346782647e-07, + "loss": 0.004, + "step": 17912 + }, + { + "epoch": 0.35, + "learning_rate": 1.3063182012349035e-07, + "loss": 0.0008, + "step": 17913 + }, + { + "epoch": 0.35, + "learning_rate": 1.306279367791542e-07, + "loss": 0.0009, + "step": 17914 + }, + { + "epoch": 0.35, + "learning_rate": 1.3062405343481806e-07, + "loss": 0.001, + "step": 17915 + }, + { + "epoch": 0.35, + "learning_rate": 1.306201700904819e-07, + "loss": 0.0021, + "step": 17916 + }, + { + "epoch": 0.35, + "learning_rate": 1.3061628674614578e-07, + "loss": 0.26, + "step": 17917 + }, + { + "epoch": 0.35, + "learning_rate": 1.3061240340180962e-07, + "loss": 1.0047, + "step": 17918 + }, + { + "epoch": 0.35, + "learning_rate": 1.306085200574735e-07, + "loss": 0.0009, + "step": 17919 + }, + { + "epoch": 0.35, + "learning_rate": 1.3060463671313734e-07, + "loss": 0.0013, + "step": 17920 + }, + { + "epoch": 0.35, + "learning_rate": 1.306007533688012e-07, + "loss": 0.0015, + "step": 17921 + }, + { + "epoch": 0.35, + "learning_rate": 1.3059687002446506e-07, + "loss": 0.0009, + "step": 17922 + }, + { + "epoch": 0.35, + "learning_rate": 1.3059298668012893e-07, + "loss": 0.001, + "step": 17923 + }, + { + "epoch": 0.35, + "learning_rate": 1.3058910333579277e-07, + "loss": 0.4931, + "step": 17924 + }, + { + "epoch": 0.35, + "learning_rate": 1.3058521999145665e-07, + "loss": 0.0203, + "step": 17925 + }, + { + "epoch": 0.35, + "learning_rate": 1.305813366471205e-07, + "loss": 0.0011, + "step": 17926 + }, + { + "epoch": 0.35, + "learning_rate": 1.3057745330278436e-07, + "loss": 1.3864, + "step": 17927 + }, + { + "epoch": 0.35, + "learning_rate": 1.305735699584482e-07, + "loss": 0.0792, + "step": 17928 + }, + { + "epoch": 0.35, + "learning_rate": 1.3056968661411208e-07, + "loss": 0.001, + "step": 17929 + }, + { + "epoch": 0.35, + "learning_rate": 1.3056580326977592e-07, + "loss": 0.0009, + "step": 17930 + }, + { + "epoch": 0.35, + "learning_rate": 1.305619199254398e-07, + "loss": 0.0012, + "step": 17931 + }, + { + "epoch": 0.35, + "learning_rate": 1.3055803658110364e-07, + "loss": 0.001, + "step": 17932 + }, + { + "epoch": 0.35, + "learning_rate": 1.305541532367675e-07, + "loss": 0.0012, + "step": 17933 + }, + { + "epoch": 0.35, + "learning_rate": 1.3055026989243136e-07, + "loss": 0.8864, + "step": 17934 + }, + { + "epoch": 0.35, + "learning_rate": 1.3054638654809523e-07, + "loss": 0.0037, + "step": 17935 + }, + { + "epoch": 0.35, + "learning_rate": 1.3054250320375907e-07, + "loss": 0.0008, + "step": 17936 + }, + { + "epoch": 0.35, + "learning_rate": 1.3053861985942294e-07, + "loss": 0.0012, + "step": 17937 + }, + { + "epoch": 0.35, + "learning_rate": 1.305347365150868e-07, + "loss": 0.5723, + "step": 17938 + }, + { + "epoch": 0.35, + "learning_rate": 1.3053085317075066e-07, + "loss": 0.5987, + "step": 17939 + }, + { + "epoch": 0.35, + "learning_rate": 1.305269698264145e-07, + "loss": 0.0008, + "step": 17940 + }, + { + "epoch": 0.35, + "learning_rate": 1.3052308648207838e-07, + "loss": 0.0012, + "step": 17941 + }, + { + "epoch": 0.35, + "learning_rate": 1.3051920313774222e-07, + "loss": 0.0009, + "step": 17942 + }, + { + "epoch": 0.35, + "learning_rate": 1.3051531979340607e-07, + "loss": 0.0012, + "step": 17943 + }, + { + "epoch": 0.35, + "learning_rate": 1.305114364490699e-07, + "loss": 0.0008, + "step": 17944 + }, + { + "epoch": 0.35, + "learning_rate": 1.3050755310473378e-07, + "loss": 0.0009, + "step": 17945 + }, + { + "epoch": 0.35, + "learning_rate": 1.3050366976039763e-07, + "loss": 0.0008, + "step": 17946 + }, + { + "epoch": 0.35, + "learning_rate": 1.304997864160615e-07, + "loss": 0.001, + "step": 17947 + }, + { + "epoch": 0.35, + "learning_rate": 1.3049590307172535e-07, + "loss": 0.0106, + "step": 17948 + }, + { + "epoch": 0.35, + "learning_rate": 1.3049201972738922e-07, + "loss": 0.0363, + "step": 17949 + }, + { + "epoch": 0.35, + "learning_rate": 1.3048813638305306e-07, + "loss": 0.0026, + "step": 17950 + }, + { + "epoch": 0.35, + "learning_rate": 1.3048425303871693e-07, + "loss": 0.0008, + "step": 17951 + }, + { + "epoch": 0.35, + "learning_rate": 1.3048036969438078e-07, + "loss": 0.001, + "step": 17952 + }, + { + "epoch": 0.35, + "learning_rate": 1.3047648635004465e-07, + "loss": 0.0008, + "step": 17953 + }, + { + "epoch": 0.35, + "learning_rate": 1.304726030057085e-07, + "loss": 0.0009, + "step": 17954 + }, + { + "epoch": 0.35, + "learning_rate": 1.3046871966137237e-07, + "loss": 0.0909, + "step": 17955 + }, + { + "epoch": 0.35, + "learning_rate": 1.304648363170362e-07, + "loss": 0.0013, + "step": 17956 + }, + { + "epoch": 0.35, + "learning_rate": 1.3046095297270008e-07, + "loss": 0.0011, + "step": 17957 + }, + { + "epoch": 0.35, + "learning_rate": 1.3045706962836393e-07, + "loss": 0.0008, + "step": 17958 + }, + { + "epoch": 0.35, + "learning_rate": 1.304531862840278e-07, + "loss": 0.001, + "step": 17959 + }, + { + "epoch": 0.35, + "learning_rate": 1.3044930293969164e-07, + "loss": 0.0009, + "step": 17960 + }, + { + "epoch": 0.35, + "learning_rate": 1.3044541959535552e-07, + "loss": 0.1126, + "step": 17961 + }, + { + "epoch": 0.35, + "learning_rate": 1.3044153625101936e-07, + "loss": 0.0012, + "step": 17962 + }, + { + "epoch": 0.35, + "learning_rate": 1.3043765290668323e-07, + "loss": 0.0551, + "step": 17963 + }, + { + "epoch": 0.35, + "learning_rate": 1.3043376956234708e-07, + "loss": 0.0009, + "step": 17964 + }, + { + "epoch": 0.35, + "learning_rate": 1.3042988621801095e-07, + "loss": 0.0009, + "step": 17965 + }, + { + "epoch": 0.35, + "learning_rate": 1.304260028736748e-07, + "loss": 0.0084, + "step": 17966 + }, + { + "epoch": 0.35, + "learning_rate": 1.3042211952933867e-07, + "loss": 0.001, + "step": 17967 + }, + { + "epoch": 0.35, + "learning_rate": 1.304182361850025e-07, + "loss": 0.3666, + "step": 17968 + }, + { + "epoch": 0.35, + "learning_rate": 1.3041435284066638e-07, + "loss": 0.0009, + "step": 17969 + }, + { + "epoch": 0.35, + "learning_rate": 1.3041046949633023e-07, + "loss": 0.0031, + "step": 17970 + }, + { + "epoch": 0.35, + "learning_rate": 1.304065861519941e-07, + "loss": 0.0007, + "step": 17971 + }, + { + "epoch": 0.35, + "learning_rate": 1.3040270280765794e-07, + "loss": 0.0477, + "step": 17972 + }, + { + "epoch": 0.35, + "learning_rate": 1.3039881946332181e-07, + "loss": 0.0011, + "step": 17973 + }, + { + "epoch": 0.35, + "learning_rate": 1.3039493611898566e-07, + "loss": 0.001, + "step": 17974 + }, + { + "epoch": 0.35, + "learning_rate": 1.3039105277464953e-07, + "loss": 0.0011, + "step": 17975 + }, + { + "epoch": 0.35, + "learning_rate": 1.3038716943031338e-07, + "loss": 0.0007, + "step": 17976 + }, + { + "epoch": 0.35, + "learning_rate": 1.3038328608597725e-07, + "loss": 0.0012, + "step": 17977 + }, + { + "epoch": 0.35, + "learning_rate": 1.303794027416411e-07, + "loss": 0.0008, + "step": 17978 + }, + { + "epoch": 0.35, + "learning_rate": 1.3037551939730496e-07, + "loss": 0.001, + "step": 17979 + }, + { + "epoch": 0.35, + "learning_rate": 1.303716360529688e-07, + "loss": 0.0008, + "step": 17980 + }, + { + "epoch": 0.35, + "learning_rate": 1.3036775270863268e-07, + "loss": 0.001, + "step": 17981 + }, + { + "epoch": 0.35, + "learning_rate": 1.3036386936429653e-07, + "loss": 0.001, + "step": 17982 + }, + { + "epoch": 0.35, + "learning_rate": 1.303599860199604e-07, + "loss": 0.0008, + "step": 17983 + }, + { + "epoch": 0.35, + "learning_rate": 1.3035610267562424e-07, + "loss": 0.001, + "step": 17984 + }, + { + "epoch": 0.35, + "learning_rate": 1.3035221933128811e-07, + "loss": 0.0008, + "step": 17985 + }, + { + "epoch": 0.35, + "learning_rate": 1.3034833598695196e-07, + "loss": 0.0021, + "step": 17986 + }, + { + "epoch": 0.35, + "learning_rate": 1.3034445264261583e-07, + "loss": 0.0011, + "step": 17987 + }, + { + "epoch": 0.35, + "learning_rate": 1.3034056929827968e-07, + "loss": 0.0008, + "step": 17988 + }, + { + "epoch": 0.35, + "learning_rate": 1.3033668595394355e-07, + "loss": 0.001, + "step": 17989 + }, + { + "epoch": 0.35, + "learning_rate": 1.303328026096074e-07, + "loss": 0.6083, + "step": 17990 + }, + { + "epoch": 0.35, + "learning_rate": 1.3032891926527126e-07, + "loss": 0.001, + "step": 17991 + }, + { + "epoch": 0.35, + "learning_rate": 1.303250359209351e-07, + "loss": 0.0008, + "step": 17992 + }, + { + "epoch": 0.35, + "learning_rate": 1.3032115257659898e-07, + "loss": 0.0302, + "step": 17993 + }, + { + "epoch": 0.35, + "learning_rate": 1.3031726923226282e-07, + "loss": 0.0014, + "step": 17994 + }, + { + "epoch": 0.35, + "learning_rate": 1.303133858879267e-07, + "loss": 0.0009, + "step": 17995 + }, + { + "epoch": 0.35, + "learning_rate": 1.3030950254359054e-07, + "loss": 0.0025, + "step": 17996 + }, + { + "epoch": 0.35, + "learning_rate": 1.303056191992544e-07, + "loss": 0.0008, + "step": 17997 + }, + { + "epoch": 0.35, + "learning_rate": 1.3030173585491826e-07, + "loss": 0.0008, + "step": 17998 + }, + { + "epoch": 0.35, + "learning_rate": 1.3029785251058213e-07, + "loss": 0.0013, + "step": 17999 + }, + { + "epoch": 0.35, + "learning_rate": 1.3029396916624597e-07, + "loss": 0.2599, + "step": 18000 + }, + { + "epoch": 0.35, + "learning_rate": 1.3029008582190982e-07, + "loss": 0.0006, + "step": 18001 + }, + { + "epoch": 0.35, + "learning_rate": 1.3028620247757366e-07, + "loss": 0.0008, + "step": 18002 + }, + { + "epoch": 0.35, + "learning_rate": 1.3028231913323754e-07, + "loss": 0.0009, + "step": 18003 + }, + { + "epoch": 0.35, + "learning_rate": 1.3027843578890138e-07, + "loss": 0.001, + "step": 18004 + }, + { + "epoch": 0.35, + "learning_rate": 1.3027455244456525e-07, + "loss": 0.0008, + "step": 18005 + }, + { + "epoch": 0.35, + "learning_rate": 1.302706691002291e-07, + "loss": 0.0085, + "step": 18006 + }, + { + "epoch": 0.35, + "learning_rate": 1.3026678575589297e-07, + "loss": 0.0006, + "step": 18007 + }, + { + "epoch": 0.35, + "learning_rate": 1.3026290241155681e-07, + "loss": 0.0014, + "step": 18008 + }, + { + "epoch": 0.35, + "learning_rate": 1.3025901906722068e-07, + "loss": 0.0009, + "step": 18009 + }, + { + "epoch": 0.35, + "learning_rate": 1.3025513572288453e-07, + "loss": 0.0009, + "step": 18010 + }, + { + "epoch": 0.35, + "learning_rate": 1.302512523785484e-07, + "loss": 0.0008, + "step": 18011 + }, + { + "epoch": 0.35, + "learning_rate": 1.3024736903421225e-07, + "loss": 0.001, + "step": 18012 + }, + { + "epoch": 0.35, + "learning_rate": 1.3024348568987612e-07, + "loss": 0.0007, + "step": 18013 + }, + { + "epoch": 0.35, + "learning_rate": 1.3023960234553996e-07, + "loss": 0.5424, + "step": 18014 + }, + { + "epoch": 0.35, + "learning_rate": 1.3023571900120383e-07, + "loss": 0.0007, + "step": 18015 + }, + { + "epoch": 0.35, + "learning_rate": 1.3023183565686768e-07, + "loss": 0.1494, + "step": 18016 + }, + { + "epoch": 0.35, + "learning_rate": 1.3022795231253155e-07, + "loss": 0.0008, + "step": 18017 + }, + { + "epoch": 0.35, + "learning_rate": 1.302240689681954e-07, + "loss": 0.0007, + "step": 18018 + }, + { + "epoch": 0.35, + "learning_rate": 1.3022018562385927e-07, + "loss": 0.0008, + "step": 18019 + }, + { + "epoch": 0.35, + "learning_rate": 1.302163022795231e-07, + "loss": 0.0009, + "step": 18020 + }, + { + "epoch": 0.35, + "learning_rate": 1.3021241893518698e-07, + "loss": 0.0008, + "step": 18021 + }, + { + "epoch": 0.35, + "learning_rate": 1.3020853559085083e-07, + "loss": 0.0008, + "step": 18022 + }, + { + "epoch": 0.35, + "learning_rate": 1.302046522465147e-07, + "loss": 0.0015, + "step": 18023 + }, + { + "epoch": 0.35, + "learning_rate": 1.3020076890217855e-07, + "loss": 0.3256, + "step": 18024 + }, + { + "epoch": 0.35, + "learning_rate": 1.3019688555784242e-07, + "loss": 0.0008, + "step": 18025 + }, + { + "epoch": 0.35, + "learning_rate": 1.3019300221350626e-07, + "loss": 0.001, + "step": 18026 + }, + { + "epoch": 0.35, + "learning_rate": 1.3018911886917013e-07, + "loss": 0.0011, + "step": 18027 + }, + { + "epoch": 0.35, + "learning_rate": 1.3018523552483398e-07, + "loss": 0.002, + "step": 18028 + }, + { + "epoch": 0.35, + "learning_rate": 1.3018135218049785e-07, + "loss": 0.001, + "step": 18029 + }, + { + "epoch": 0.35, + "learning_rate": 1.301774688361617e-07, + "loss": 0.0009, + "step": 18030 + }, + { + "epoch": 0.35, + "learning_rate": 1.3017358549182557e-07, + "loss": 0.0028, + "step": 18031 + }, + { + "epoch": 0.35, + "learning_rate": 1.301697021474894e-07, + "loss": 0.0007, + "step": 18032 + }, + { + "epoch": 0.35, + "learning_rate": 1.3016581880315328e-07, + "loss": 0.0009, + "step": 18033 + }, + { + "epoch": 0.35, + "learning_rate": 1.3016193545881713e-07, + "loss": 0.0007, + "step": 18034 + }, + { + "epoch": 0.35, + "learning_rate": 1.30158052114481e-07, + "loss": 0.001, + "step": 18035 + }, + { + "epoch": 0.35, + "learning_rate": 1.3015416877014484e-07, + "loss": 0.2527, + "step": 18036 + }, + { + "epoch": 0.35, + "learning_rate": 1.3015028542580872e-07, + "loss": 0.0008, + "step": 18037 + }, + { + "epoch": 0.35, + "learning_rate": 1.3014640208147256e-07, + "loss": 0.0008, + "step": 18038 + }, + { + "epoch": 0.35, + "learning_rate": 1.3014251873713643e-07, + "loss": 0.0099, + "step": 18039 + }, + { + "epoch": 0.35, + "learning_rate": 1.3013863539280028e-07, + "loss": 0.3526, + "step": 18040 + }, + { + "epoch": 0.35, + "learning_rate": 1.3013475204846415e-07, + "loss": 0.6657, + "step": 18041 + }, + { + "epoch": 0.35, + "learning_rate": 1.30130868704128e-07, + "loss": 0.0031, + "step": 18042 + }, + { + "epoch": 0.35, + "learning_rate": 1.3012698535979187e-07, + "loss": 0.0014, + "step": 18043 + }, + { + "epoch": 0.35, + "learning_rate": 1.301231020154557e-07, + "loss": 0.0876, + "step": 18044 + }, + { + "epoch": 0.35, + "learning_rate": 1.3011921867111956e-07, + "loss": 0.001, + "step": 18045 + }, + { + "epoch": 0.35, + "learning_rate": 1.3011533532678343e-07, + "loss": 0.0009, + "step": 18046 + }, + { + "epoch": 0.35, + "learning_rate": 1.3011145198244727e-07, + "loss": 0.0008, + "step": 18047 + }, + { + "epoch": 0.35, + "learning_rate": 1.3010756863811114e-07, + "loss": 0.0013, + "step": 18048 + }, + { + "epoch": 0.35, + "learning_rate": 1.30103685293775e-07, + "loss": 0.002, + "step": 18049 + }, + { + "epoch": 0.35, + "learning_rate": 1.3009980194943886e-07, + "loss": 0.0008, + "step": 18050 + }, + { + "epoch": 0.35, + "learning_rate": 1.300959186051027e-07, + "loss": 0.0603, + "step": 18051 + }, + { + "epoch": 0.35, + "learning_rate": 1.3009203526076658e-07, + "loss": 0.001, + "step": 18052 + }, + { + "epoch": 0.35, + "learning_rate": 1.3008815191643042e-07, + "loss": 0.4542, + "step": 18053 + }, + { + "epoch": 0.35, + "learning_rate": 1.300842685720943e-07, + "loss": 0.0009, + "step": 18054 + }, + { + "epoch": 0.35, + "learning_rate": 1.3008038522775814e-07, + "loss": 0.0009, + "step": 18055 + }, + { + "epoch": 0.35, + "learning_rate": 1.30076501883422e-07, + "loss": 0.0011, + "step": 18056 + }, + { + "epoch": 0.35, + "learning_rate": 1.3007261853908585e-07, + "loss": 0.0009, + "step": 18057 + }, + { + "epoch": 0.35, + "learning_rate": 1.3006873519474973e-07, + "loss": 0.0159, + "step": 18058 + }, + { + "epoch": 0.35, + "learning_rate": 1.3006485185041357e-07, + "loss": 0.0059, + "step": 18059 + }, + { + "epoch": 0.35, + "learning_rate": 1.3006096850607742e-07, + "loss": 0.0022, + "step": 18060 + }, + { + "epoch": 0.35, + "learning_rate": 1.300570851617413e-07, + "loss": 0.0011, + "step": 18061 + }, + { + "epoch": 0.35, + "learning_rate": 1.3005320181740513e-07, + "loss": 0.001, + "step": 18062 + }, + { + "epoch": 0.35, + "learning_rate": 1.30049318473069e-07, + "loss": 0.0009, + "step": 18063 + }, + { + "epoch": 0.35, + "learning_rate": 1.3004543512873285e-07, + "loss": 0.0008, + "step": 18064 + }, + { + "epoch": 0.35, + "learning_rate": 1.3004155178439672e-07, + "loss": 0.6174, + "step": 18065 + }, + { + "epoch": 0.35, + "learning_rate": 1.3003766844006057e-07, + "loss": 0.0009, + "step": 18066 + }, + { + "epoch": 0.35, + "learning_rate": 1.3003378509572444e-07, + "loss": 0.7377, + "step": 18067 + }, + { + "epoch": 0.35, + "learning_rate": 1.3002990175138828e-07, + "loss": 0.0009, + "step": 18068 + }, + { + "epoch": 0.35, + "learning_rate": 1.3002601840705215e-07, + "loss": 0.0007, + "step": 18069 + }, + { + "epoch": 0.35, + "learning_rate": 1.30022135062716e-07, + "loss": 0.0007, + "step": 18070 + }, + { + "epoch": 0.35, + "learning_rate": 1.3001825171837987e-07, + "loss": 0.1021, + "step": 18071 + }, + { + "epoch": 0.35, + "learning_rate": 1.3001436837404371e-07, + "loss": 0.0008, + "step": 18072 + }, + { + "epoch": 0.35, + "learning_rate": 1.3001048502970756e-07, + "loss": 0.001, + "step": 18073 + }, + { + "epoch": 0.35, + "learning_rate": 1.3000660168537143e-07, + "loss": 0.0008, + "step": 18074 + }, + { + "epoch": 0.35, + "learning_rate": 1.3000271834103528e-07, + "loss": 0.0013, + "step": 18075 + }, + { + "epoch": 0.35, + "learning_rate": 1.2999883499669915e-07, + "loss": 0.001, + "step": 18076 + }, + { + "epoch": 0.35, + "learning_rate": 1.29994951652363e-07, + "loss": 0.0024, + "step": 18077 + }, + { + "epoch": 0.35, + "learning_rate": 1.2999106830802686e-07, + "loss": 0.4814, + "step": 18078 + }, + { + "epoch": 0.35, + "learning_rate": 1.299871849636907e-07, + "loss": 0.0009, + "step": 18079 + }, + { + "epoch": 0.35, + "learning_rate": 1.2998330161935458e-07, + "loss": 0.0009, + "step": 18080 + }, + { + "epoch": 0.35, + "learning_rate": 1.2997941827501843e-07, + "loss": 0.0011, + "step": 18081 + }, + { + "epoch": 0.35, + "learning_rate": 1.299755349306823e-07, + "loss": 0.0011, + "step": 18082 + }, + { + "epoch": 0.35, + "learning_rate": 1.2997165158634614e-07, + "loss": 0.001, + "step": 18083 + }, + { + "epoch": 0.35, + "learning_rate": 1.2996776824201001e-07, + "loss": 0.001, + "step": 18084 + }, + { + "epoch": 0.35, + "learning_rate": 1.2996388489767386e-07, + "loss": 0.9108, + "step": 18085 + }, + { + "epoch": 0.35, + "learning_rate": 1.2996000155333773e-07, + "loss": 0.0014, + "step": 18086 + }, + { + "epoch": 0.35, + "learning_rate": 1.2995611820900158e-07, + "loss": 0.0014, + "step": 18087 + }, + { + "epoch": 0.35, + "learning_rate": 1.2995223486466545e-07, + "loss": 0.0016, + "step": 18088 + }, + { + "epoch": 0.35, + "learning_rate": 1.299483515203293e-07, + "loss": 0.0012, + "step": 18089 + }, + { + "epoch": 0.35, + "learning_rate": 1.2994446817599316e-07, + "loss": 0.0011, + "step": 18090 + }, + { + "epoch": 0.35, + "learning_rate": 1.29940584831657e-07, + "loss": 0.0008, + "step": 18091 + }, + { + "epoch": 0.35, + "learning_rate": 1.2993670148732088e-07, + "loss": 0.0009, + "step": 18092 + }, + { + "epoch": 0.35, + "learning_rate": 1.2993281814298472e-07, + "loss": 0.001, + "step": 18093 + }, + { + "epoch": 0.35, + "learning_rate": 1.299289347986486e-07, + "loss": 0.0008, + "step": 18094 + }, + { + "epoch": 0.35, + "learning_rate": 1.2992505145431244e-07, + "loss": 0.0011, + "step": 18095 + }, + { + "epoch": 0.35, + "learning_rate": 1.299211681099763e-07, + "loss": 0.0019, + "step": 18096 + }, + { + "epoch": 0.35, + "learning_rate": 1.2991728476564016e-07, + "loss": 0.0009, + "step": 18097 + }, + { + "epoch": 0.35, + "learning_rate": 1.2991340142130403e-07, + "loss": 0.089, + "step": 18098 + }, + { + "epoch": 0.35, + "learning_rate": 1.2990951807696787e-07, + "loss": 0.0013, + "step": 18099 + }, + { + "epoch": 0.35, + "learning_rate": 1.2990563473263175e-07, + "loss": 0.4917, + "step": 18100 + }, + { + "epoch": 0.35, + "learning_rate": 1.299017513882956e-07, + "loss": 0.0202, + "step": 18101 + }, + { + "epoch": 0.35, + "learning_rate": 1.2989786804395946e-07, + "loss": 0.3479, + "step": 18102 + }, + { + "epoch": 0.35, + "learning_rate": 1.298939846996233e-07, + "loss": 0.0009, + "step": 18103 + }, + { + "epoch": 0.35, + "learning_rate": 1.2989010135528718e-07, + "loss": 0.0009, + "step": 18104 + }, + { + "epoch": 0.35, + "learning_rate": 1.2988621801095102e-07, + "loss": 0.001, + "step": 18105 + }, + { + "epoch": 0.35, + "learning_rate": 1.298823346666149e-07, + "loss": 0.0024, + "step": 18106 + }, + { + "epoch": 0.35, + "learning_rate": 1.2987845132227874e-07, + "loss": 0.0008, + "step": 18107 + }, + { + "epoch": 0.35, + "learning_rate": 1.298745679779426e-07, + "loss": 0.0028, + "step": 18108 + }, + { + "epoch": 0.35, + "learning_rate": 1.2987068463360646e-07, + "loss": 0.0008, + "step": 18109 + }, + { + "epoch": 0.35, + "learning_rate": 1.2986680128927033e-07, + "loss": 0.0009, + "step": 18110 + }, + { + "epoch": 0.35, + "learning_rate": 1.2986291794493417e-07, + "loss": 0.0032, + "step": 18111 + }, + { + "epoch": 0.35, + "learning_rate": 1.2985903460059804e-07, + "loss": 0.0013, + "step": 18112 + }, + { + "epoch": 0.35, + "learning_rate": 1.298551512562619e-07, + "loss": 0.0016, + "step": 18113 + }, + { + "epoch": 0.35, + "learning_rate": 1.2985126791192576e-07, + "loss": 0.0008, + "step": 18114 + }, + { + "epoch": 0.35, + "learning_rate": 1.298473845675896e-07, + "loss": 0.3512, + "step": 18115 + }, + { + "epoch": 0.35, + "learning_rate": 1.2984350122325348e-07, + "loss": 0.0011, + "step": 18116 + }, + { + "epoch": 0.35, + "learning_rate": 1.298396178789173e-07, + "loss": 0.001, + "step": 18117 + }, + { + "epoch": 0.35, + "learning_rate": 1.2983573453458117e-07, + "loss": 0.001, + "step": 18118 + }, + { + "epoch": 0.35, + "learning_rate": 1.29831851190245e-07, + "loss": 0.0011, + "step": 18119 + }, + { + "epoch": 0.35, + "learning_rate": 1.2982796784590888e-07, + "loss": 0.0023, + "step": 18120 + }, + { + "epoch": 0.35, + "learning_rate": 1.2982408450157273e-07, + "loss": 0.0011, + "step": 18121 + }, + { + "epoch": 0.35, + "learning_rate": 1.298202011572366e-07, + "loss": 0.0012, + "step": 18122 + }, + { + "epoch": 0.35, + "learning_rate": 1.2981631781290045e-07, + "loss": 0.0012, + "step": 18123 + }, + { + "epoch": 0.35, + "learning_rate": 1.2981243446856432e-07, + "loss": 0.0022, + "step": 18124 + }, + { + "epoch": 0.35, + "learning_rate": 1.2980855112422816e-07, + "loss": 0.0013, + "step": 18125 + }, + { + "epoch": 0.35, + "learning_rate": 1.2980466777989203e-07, + "loss": 0.0009, + "step": 18126 + }, + { + "epoch": 0.35, + "learning_rate": 1.2980078443555588e-07, + "loss": 0.0009, + "step": 18127 + }, + { + "epoch": 0.35, + "learning_rate": 1.2979690109121975e-07, + "loss": 0.0008, + "step": 18128 + }, + { + "epoch": 0.35, + "learning_rate": 1.297930177468836e-07, + "loss": 0.0027, + "step": 18129 + }, + { + "epoch": 0.35, + "learning_rate": 1.2978913440254747e-07, + "loss": 0.0009, + "step": 18130 + }, + { + "epoch": 0.35, + "learning_rate": 1.297852510582113e-07, + "loss": 0.0009, + "step": 18131 + }, + { + "epoch": 0.35, + "learning_rate": 1.2978136771387518e-07, + "loss": 0.0008, + "step": 18132 + }, + { + "epoch": 0.35, + "learning_rate": 1.2977748436953903e-07, + "loss": 0.0014, + "step": 18133 + }, + { + "epoch": 0.35, + "learning_rate": 1.297736010252029e-07, + "loss": 0.0006, + "step": 18134 + }, + { + "epoch": 0.35, + "learning_rate": 1.2976971768086674e-07, + "loss": 0.0032, + "step": 18135 + }, + { + "epoch": 0.35, + "learning_rate": 1.2976583433653062e-07, + "loss": 0.0007, + "step": 18136 + }, + { + "epoch": 0.35, + "learning_rate": 1.2976195099219446e-07, + "loss": 0.001, + "step": 18137 + }, + { + "epoch": 0.35, + "learning_rate": 1.2975806764785833e-07, + "loss": 0.0008, + "step": 18138 + }, + { + "epoch": 0.35, + "learning_rate": 1.2975418430352218e-07, + "loss": 0.2261, + "step": 18139 + }, + { + "epoch": 0.35, + "learning_rate": 1.2975030095918605e-07, + "loss": 0.0008, + "step": 18140 + }, + { + "epoch": 0.35, + "learning_rate": 1.297464176148499e-07, + "loss": 0.0007, + "step": 18141 + }, + { + "epoch": 0.35, + "learning_rate": 1.2974253427051377e-07, + "loss": 0.0009, + "step": 18142 + }, + { + "epoch": 0.35, + "learning_rate": 1.297386509261776e-07, + "loss": 0.0034, + "step": 18143 + }, + { + "epoch": 0.35, + "learning_rate": 1.2973476758184148e-07, + "loss": 0.0009, + "step": 18144 + }, + { + "epoch": 0.35, + "learning_rate": 1.2973088423750533e-07, + "loss": 0.0007, + "step": 18145 + }, + { + "epoch": 0.35, + "learning_rate": 1.297270008931692e-07, + "loss": 0.0021, + "step": 18146 + }, + { + "epoch": 0.35, + "learning_rate": 1.2972311754883304e-07, + "loss": 0.0008, + "step": 18147 + }, + { + "epoch": 0.35, + "learning_rate": 1.2971923420449691e-07, + "loss": 0.0008, + "step": 18148 + }, + { + "epoch": 0.35, + "learning_rate": 1.2971535086016076e-07, + "loss": 0.0012, + "step": 18149 + }, + { + "epoch": 0.35, + "learning_rate": 1.2971146751582463e-07, + "loss": 0.0008, + "step": 18150 + }, + { + "epoch": 0.35, + "learning_rate": 1.2970758417148848e-07, + "loss": 0.0012, + "step": 18151 + }, + { + "epoch": 0.35, + "learning_rate": 1.2970370082715235e-07, + "loss": 0.0011, + "step": 18152 + }, + { + "epoch": 0.35, + "learning_rate": 1.296998174828162e-07, + "loss": 0.0008, + "step": 18153 + }, + { + "epoch": 0.35, + "learning_rate": 1.2969593413848006e-07, + "loss": 0.0007, + "step": 18154 + }, + { + "epoch": 0.35, + "learning_rate": 1.296920507941439e-07, + "loss": 0.1007, + "step": 18155 + }, + { + "epoch": 0.35, + "learning_rate": 1.2968816744980778e-07, + "loss": 0.0008, + "step": 18156 + }, + { + "epoch": 0.35, + "learning_rate": 1.2968428410547163e-07, + "loss": 0.0573, + "step": 18157 + }, + { + "epoch": 0.35, + "learning_rate": 1.296804007611355e-07, + "loss": 0.0007, + "step": 18158 + }, + { + "epoch": 0.35, + "learning_rate": 1.2967651741679934e-07, + "loss": 0.007, + "step": 18159 + }, + { + "epoch": 0.35, + "learning_rate": 1.2967263407246321e-07, + "loss": 0.0007, + "step": 18160 + }, + { + "epoch": 0.35, + "learning_rate": 1.2966875072812706e-07, + "loss": 0.0012, + "step": 18161 + }, + { + "epoch": 0.35, + "learning_rate": 1.2966486738379093e-07, + "loss": 0.0008, + "step": 18162 + }, + { + "epoch": 0.35, + "learning_rate": 1.2966098403945478e-07, + "loss": 0.0008, + "step": 18163 + }, + { + "epoch": 0.35, + "learning_rate": 1.2965710069511865e-07, + "loss": 0.0008, + "step": 18164 + }, + { + "epoch": 0.35, + "learning_rate": 1.296532173507825e-07, + "loss": 0.0009, + "step": 18165 + }, + { + "epoch": 0.35, + "learning_rate": 1.2964933400644636e-07, + "loss": 0.0009, + "step": 18166 + }, + { + "epoch": 0.35, + "learning_rate": 1.296454506621102e-07, + "loss": 0.0008, + "step": 18167 + }, + { + "epoch": 0.35, + "learning_rate": 1.2964156731777408e-07, + "loss": 0.0014, + "step": 18168 + }, + { + "epoch": 0.35, + "learning_rate": 1.2963768397343792e-07, + "loss": 0.0008, + "step": 18169 + }, + { + "epoch": 0.35, + "learning_rate": 1.296338006291018e-07, + "loss": 0.0014, + "step": 18170 + }, + { + "epoch": 0.35, + "learning_rate": 1.2962991728476564e-07, + "loss": 0.0011, + "step": 18171 + }, + { + "epoch": 0.35, + "learning_rate": 1.296260339404295e-07, + "loss": 0.0009, + "step": 18172 + }, + { + "epoch": 0.35, + "learning_rate": 1.2962215059609336e-07, + "loss": 0.0009, + "step": 18173 + }, + { + "epoch": 0.35, + "learning_rate": 1.2961826725175723e-07, + "loss": 0.0009, + "step": 18174 + }, + { + "epoch": 0.35, + "learning_rate": 1.2961438390742105e-07, + "loss": 0.0009, + "step": 18175 + }, + { + "epoch": 0.35, + "learning_rate": 1.2961050056308492e-07, + "loss": 0.2436, + "step": 18176 + }, + { + "epoch": 0.35, + "learning_rate": 1.2960661721874876e-07, + "loss": 0.0008, + "step": 18177 + }, + { + "epoch": 0.35, + "learning_rate": 1.2960273387441264e-07, + "loss": 0.0009, + "step": 18178 + }, + { + "epoch": 0.35, + "learning_rate": 1.2959885053007648e-07, + "loss": 0.0799, + "step": 18179 + }, + { + "epoch": 0.35, + "learning_rate": 1.2959496718574035e-07, + "loss": 0.2508, + "step": 18180 + }, + { + "epoch": 0.35, + "learning_rate": 1.295910838414042e-07, + "loss": 0.0007, + "step": 18181 + }, + { + "epoch": 0.35, + "learning_rate": 1.2958720049706807e-07, + "loss": 0.0012, + "step": 18182 + }, + { + "epoch": 0.35, + "learning_rate": 1.2958331715273191e-07, + "loss": 0.0008, + "step": 18183 + }, + { + "epoch": 0.35, + "learning_rate": 1.2957943380839579e-07, + "loss": 0.001, + "step": 18184 + }, + { + "epoch": 0.35, + "learning_rate": 1.2957555046405963e-07, + "loss": 0.0008, + "step": 18185 + }, + { + "epoch": 0.35, + "learning_rate": 1.295716671197235e-07, + "loss": 0.0007, + "step": 18186 + }, + { + "epoch": 0.35, + "learning_rate": 1.2956778377538735e-07, + "loss": 0.072, + "step": 18187 + }, + { + "epoch": 0.35, + "learning_rate": 1.2956390043105122e-07, + "loss": 0.0009, + "step": 18188 + }, + { + "epoch": 0.35, + "learning_rate": 1.2956001708671506e-07, + "loss": 0.0264, + "step": 18189 + }, + { + "epoch": 0.35, + "learning_rate": 1.2955613374237893e-07, + "loss": 0.0009, + "step": 18190 + }, + { + "epoch": 0.35, + "learning_rate": 1.2955225039804278e-07, + "loss": 0.0007, + "step": 18191 + }, + { + "epoch": 0.35, + "learning_rate": 1.2954836705370665e-07, + "loss": 0.001, + "step": 18192 + }, + { + "epoch": 0.35, + "learning_rate": 1.295444837093705e-07, + "loss": 0.0009, + "step": 18193 + }, + { + "epoch": 0.35, + "learning_rate": 1.2954060036503437e-07, + "loss": 0.001, + "step": 18194 + }, + { + "epoch": 0.35, + "learning_rate": 1.295367170206982e-07, + "loss": 0.0008, + "step": 18195 + }, + { + "epoch": 0.35, + "learning_rate": 1.2953283367636208e-07, + "loss": 0.0014, + "step": 18196 + }, + { + "epoch": 0.35, + "learning_rate": 1.2952895033202593e-07, + "loss": 0.001, + "step": 18197 + }, + { + "epoch": 0.35, + "learning_rate": 1.295250669876898e-07, + "loss": 0.5161, + "step": 18198 + }, + { + "epoch": 0.35, + "learning_rate": 1.2952118364335365e-07, + "loss": 0.0014, + "step": 18199 + }, + { + "epoch": 0.35, + "learning_rate": 1.2951730029901752e-07, + "loss": 0.0018, + "step": 18200 + }, + { + "epoch": 0.35, + "learning_rate": 1.2951341695468136e-07, + "loss": 0.2703, + "step": 18201 + }, + { + "epoch": 0.35, + "learning_rate": 1.2950953361034523e-07, + "loss": 0.1567, + "step": 18202 + }, + { + "epoch": 0.35, + "learning_rate": 1.2950565026600908e-07, + "loss": 0.0167, + "step": 18203 + }, + { + "epoch": 0.35, + "learning_rate": 1.2950176692167295e-07, + "loss": 0.0613, + "step": 18204 + }, + { + "epoch": 0.35, + "learning_rate": 1.294978835773368e-07, + "loss": 0.0472, + "step": 18205 + }, + { + "epoch": 0.35, + "learning_rate": 1.2949400023300067e-07, + "loss": 0.0012, + "step": 18206 + }, + { + "epoch": 0.35, + "learning_rate": 1.294901168886645e-07, + "loss": 0.0215, + "step": 18207 + }, + { + "epoch": 0.35, + "learning_rate": 1.2948623354432838e-07, + "loss": 0.0007, + "step": 18208 + }, + { + "epoch": 0.35, + "learning_rate": 1.2948235019999223e-07, + "loss": 0.0011, + "step": 18209 + }, + { + "epoch": 0.35, + "learning_rate": 1.294784668556561e-07, + "loss": 0.1566, + "step": 18210 + }, + { + "epoch": 0.35, + "learning_rate": 1.2947458351131994e-07, + "loss": 0.001, + "step": 18211 + }, + { + "epoch": 0.35, + "learning_rate": 1.2947070016698382e-07, + "loss": 0.0877, + "step": 18212 + }, + { + "epoch": 0.35, + "learning_rate": 1.2946681682264766e-07, + "loss": 0.0009, + "step": 18213 + }, + { + "epoch": 0.35, + "learning_rate": 1.2946293347831153e-07, + "loss": 0.0018, + "step": 18214 + }, + { + "epoch": 0.35, + "learning_rate": 1.2945905013397538e-07, + "loss": 0.0014, + "step": 18215 + }, + { + "epoch": 0.35, + "learning_rate": 1.2945516678963925e-07, + "loss": 0.002, + "step": 18216 + }, + { + "epoch": 0.35, + "learning_rate": 1.294512834453031e-07, + "loss": 0.0008, + "step": 18217 + }, + { + "epoch": 0.35, + "learning_rate": 1.2944740010096697e-07, + "loss": 0.661, + "step": 18218 + }, + { + "epoch": 0.35, + "learning_rate": 1.294435167566308e-07, + "loss": 0.0013, + "step": 18219 + }, + { + "epoch": 0.35, + "learning_rate": 1.2943963341229468e-07, + "loss": 0.5609, + "step": 18220 + }, + { + "epoch": 0.35, + "learning_rate": 1.2943575006795853e-07, + "loss": 0.0015, + "step": 18221 + }, + { + "epoch": 0.35, + "learning_rate": 1.2943186672362237e-07, + "loss": 0.1947, + "step": 18222 + }, + { + "epoch": 0.35, + "learning_rate": 1.2942798337928624e-07, + "loss": 0.0008, + "step": 18223 + }, + { + "epoch": 0.35, + "learning_rate": 1.294241000349501e-07, + "loss": 0.0008, + "step": 18224 + }, + { + "epoch": 0.35, + "learning_rate": 1.2942021669061396e-07, + "loss": 0.9219, + "step": 18225 + }, + { + "epoch": 0.35, + "learning_rate": 1.294163333462778e-07, + "loss": 0.0158, + "step": 18226 + }, + { + "epoch": 0.35, + "learning_rate": 1.2941245000194168e-07, + "loss": 0.0009, + "step": 18227 + }, + { + "epoch": 0.35, + "learning_rate": 1.2940856665760552e-07, + "loss": 0.0024, + "step": 18228 + }, + { + "epoch": 0.35, + "learning_rate": 1.294046833132694e-07, + "loss": 0.0011, + "step": 18229 + }, + { + "epoch": 0.35, + "learning_rate": 1.2940079996893324e-07, + "loss": 0.0008, + "step": 18230 + }, + { + "epoch": 0.35, + "learning_rate": 1.293969166245971e-07, + "loss": 0.7667, + "step": 18231 + }, + { + "epoch": 0.35, + "learning_rate": 1.2939303328026095e-07, + "loss": 0.0008, + "step": 18232 + }, + { + "epoch": 0.35, + "learning_rate": 1.293891499359248e-07, + "loss": 0.0037, + "step": 18233 + }, + { + "epoch": 0.35, + "learning_rate": 1.2938526659158867e-07, + "loss": 1.2434, + "step": 18234 + }, + { + "epoch": 0.35, + "learning_rate": 1.2938138324725252e-07, + "loss": 0.0006, + "step": 18235 + }, + { + "epoch": 0.35, + "learning_rate": 1.293774999029164e-07, + "loss": 0.0009, + "step": 18236 + }, + { + "epoch": 0.35, + "learning_rate": 1.2937361655858023e-07, + "loss": 0.0008, + "step": 18237 + }, + { + "epoch": 0.35, + "learning_rate": 1.293697332142441e-07, + "loss": 0.018, + "step": 18238 + }, + { + "epoch": 0.35, + "learning_rate": 1.2936584986990795e-07, + "loss": 0.0007, + "step": 18239 + }, + { + "epoch": 0.35, + "learning_rate": 1.2936196652557182e-07, + "loss": 0.0015, + "step": 18240 + }, + { + "epoch": 0.35, + "learning_rate": 1.2935808318123567e-07, + "loss": 0.0009, + "step": 18241 + }, + { + "epoch": 0.35, + "learning_rate": 1.2935419983689954e-07, + "loss": 0.0008, + "step": 18242 + }, + { + "epoch": 0.35, + "learning_rate": 1.2935031649256338e-07, + "loss": 0.0009, + "step": 18243 + }, + { + "epoch": 0.35, + "learning_rate": 1.2934643314822725e-07, + "loss": 0.7038, + "step": 18244 + }, + { + "epoch": 0.35, + "learning_rate": 1.293425498038911e-07, + "loss": 0.0015, + "step": 18245 + }, + { + "epoch": 0.35, + "learning_rate": 1.2933866645955497e-07, + "loss": 0.0008, + "step": 18246 + }, + { + "epoch": 0.35, + "learning_rate": 1.2933478311521881e-07, + "loss": 0.0009, + "step": 18247 + }, + { + "epoch": 0.35, + "learning_rate": 1.2933089977088269e-07, + "loss": 0.001, + "step": 18248 + }, + { + "epoch": 0.35, + "learning_rate": 1.2932701642654653e-07, + "loss": 0.0008, + "step": 18249 + }, + { + "epoch": 0.35, + "learning_rate": 1.2932313308221038e-07, + "loss": 0.0007, + "step": 18250 + }, + { + "epoch": 0.35, + "learning_rate": 1.2931924973787425e-07, + "loss": 0.001, + "step": 18251 + }, + { + "epoch": 0.35, + "learning_rate": 1.293153663935381e-07, + "loss": 0.0008, + "step": 18252 + }, + { + "epoch": 0.35, + "learning_rate": 1.2931148304920196e-07, + "loss": 0.0014, + "step": 18253 + }, + { + "epoch": 0.35, + "learning_rate": 1.293075997048658e-07, + "loss": 1.1246, + "step": 18254 + }, + { + "epoch": 0.35, + "learning_rate": 1.2930371636052968e-07, + "loss": 0.0008, + "step": 18255 + }, + { + "epoch": 0.35, + "learning_rate": 1.2929983301619353e-07, + "loss": 0.0011, + "step": 18256 + }, + { + "epoch": 0.35, + "learning_rate": 1.292959496718574e-07, + "loss": 0.0008, + "step": 18257 + }, + { + "epoch": 0.35, + "learning_rate": 1.2929206632752124e-07, + "loss": 0.001, + "step": 18258 + }, + { + "epoch": 0.35, + "learning_rate": 1.2928818298318511e-07, + "loss": 0.0006, + "step": 18259 + }, + { + "epoch": 0.35, + "learning_rate": 1.2928429963884896e-07, + "loss": 0.0012, + "step": 18260 + }, + { + "epoch": 0.35, + "learning_rate": 1.2928041629451283e-07, + "loss": 0.0009, + "step": 18261 + }, + { + "epoch": 0.35, + "learning_rate": 1.2927653295017668e-07, + "loss": 0.0023, + "step": 18262 + }, + { + "epoch": 0.35, + "learning_rate": 1.2927264960584055e-07, + "loss": 0.0008, + "step": 18263 + }, + { + "epoch": 0.35, + "learning_rate": 1.292687662615044e-07, + "loss": 0.0009, + "step": 18264 + }, + { + "epoch": 0.35, + "learning_rate": 1.2926488291716826e-07, + "loss": 0.0008, + "step": 18265 + }, + { + "epoch": 0.35, + "learning_rate": 1.292609995728321e-07, + "loss": 0.2137, + "step": 18266 + }, + { + "epoch": 0.35, + "learning_rate": 1.2925711622849598e-07, + "loss": 0.0008, + "step": 18267 + }, + { + "epoch": 0.35, + "learning_rate": 1.2925323288415982e-07, + "loss": 0.0009, + "step": 18268 + }, + { + "epoch": 0.35, + "learning_rate": 1.292493495398237e-07, + "loss": 0.0014, + "step": 18269 + }, + { + "epoch": 0.35, + "learning_rate": 1.2924546619548754e-07, + "loss": 0.0006, + "step": 18270 + }, + { + "epoch": 0.35, + "learning_rate": 1.292415828511514e-07, + "loss": 0.0007, + "step": 18271 + }, + { + "epoch": 0.35, + "learning_rate": 1.2923769950681526e-07, + "loss": 0.0009, + "step": 18272 + }, + { + "epoch": 0.35, + "learning_rate": 1.2923381616247913e-07, + "loss": 0.0955, + "step": 18273 + }, + { + "epoch": 0.35, + "learning_rate": 1.2922993281814297e-07, + "loss": 0.0011, + "step": 18274 + }, + { + "epoch": 0.35, + "learning_rate": 1.2922604947380685e-07, + "loss": 0.0007, + "step": 18275 + }, + { + "epoch": 0.35, + "learning_rate": 1.292221661294707e-07, + "loss": 0.0007, + "step": 18276 + }, + { + "epoch": 0.35, + "learning_rate": 1.2921828278513456e-07, + "loss": 0.0009, + "step": 18277 + }, + { + "epoch": 0.35, + "learning_rate": 1.292143994407984e-07, + "loss": 0.0009, + "step": 18278 + }, + { + "epoch": 0.35, + "learning_rate": 1.2921051609646228e-07, + "loss": 0.7752, + "step": 18279 + }, + { + "epoch": 0.35, + "learning_rate": 1.2920663275212612e-07, + "loss": 0.0021, + "step": 18280 + }, + { + "epoch": 0.35, + "learning_rate": 1.2920274940779e-07, + "loss": 0.0008, + "step": 18281 + }, + { + "epoch": 0.35, + "learning_rate": 1.2919886606345384e-07, + "loss": 0.0007, + "step": 18282 + }, + { + "epoch": 0.35, + "learning_rate": 1.291949827191177e-07, + "loss": 0.0014, + "step": 18283 + }, + { + "epoch": 0.35, + "learning_rate": 1.2919109937478156e-07, + "loss": 0.001, + "step": 18284 + }, + { + "epoch": 0.35, + "learning_rate": 1.2918721603044543e-07, + "loss": 1.2989, + "step": 18285 + }, + { + "epoch": 0.35, + "learning_rate": 1.2918333268610927e-07, + "loss": 0.445, + "step": 18286 + }, + { + "epoch": 0.35, + "learning_rate": 1.2917944934177314e-07, + "loss": 0.0014, + "step": 18287 + }, + { + "epoch": 0.35, + "learning_rate": 1.29175565997437e-07, + "loss": 0.0033, + "step": 18288 + }, + { + "epoch": 0.35, + "learning_rate": 1.2917168265310086e-07, + "loss": 0.0008, + "step": 18289 + }, + { + "epoch": 0.35, + "learning_rate": 1.291677993087647e-07, + "loss": 0.0009, + "step": 18290 + }, + { + "epoch": 0.35, + "learning_rate": 1.2916391596442855e-07, + "loss": 0.0008, + "step": 18291 + }, + { + "epoch": 0.35, + "learning_rate": 1.291600326200924e-07, + "loss": 0.0015, + "step": 18292 + }, + { + "epoch": 0.35, + "learning_rate": 1.2915614927575627e-07, + "loss": 0.0158, + "step": 18293 + }, + { + "epoch": 0.35, + "learning_rate": 1.291522659314201e-07, + "loss": 0.0018, + "step": 18294 + }, + { + "epoch": 0.35, + "learning_rate": 1.2914838258708398e-07, + "loss": 0.04, + "step": 18295 + }, + { + "epoch": 0.35, + "learning_rate": 1.2914449924274783e-07, + "loss": 0.0011, + "step": 18296 + }, + { + "epoch": 0.35, + "learning_rate": 1.291406158984117e-07, + "loss": 0.0189, + "step": 18297 + }, + { + "epoch": 0.35, + "learning_rate": 1.2913673255407555e-07, + "loss": 0.0019, + "step": 18298 + }, + { + "epoch": 0.35, + "learning_rate": 1.2913284920973942e-07, + "loss": 0.1283, + "step": 18299 + }, + { + "epoch": 0.35, + "learning_rate": 1.2912896586540326e-07, + "loss": 0.755, + "step": 18300 + }, + { + "epoch": 0.36, + "learning_rate": 1.2912508252106713e-07, + "loss": 0.0014, + "step": 18301 + }, + { + "epoch": 0.36, + "learning_rate": 1.2912119917673098e-07, + "loss": 0.0009, + "step": 18302 + }, + { + "epoch": 0.36, + "learning_rate": 1.2911731583239485e-07, + "loss": 1.2641, + "step": 18303 + }, + { + "epoch": 0.36, + "learning_rate": 1.291134324880587e-07, + "loss": 0.0012, + "step": 18304 + }, + { + "epoch": 0.36, + "learning_rate": 1.2910954914372257e-07, + "loss": 0.0011, + "step": 18305 + }, + { + "epoch": 0.36, + "learning_rate": 1.291056657993864e-07, + "loss": 0.0008, + "step": 18306 + }, + { + "epoch": 0.36, + "learning_rate": 1.2910178245505028e-07, + "loss": 0.0204, + "step": 18307 + }, + { + "epoch": 0.36, + "learning_rate": 1.2909789911071413e-07, + "loss": 0.0009, + "step": 18308 + }, + { + "epoch": 0.36, + "learning_rate": 1.29094015766378e-07, + "loss": 0.0009, + "step": 18309 + }, + { + "epoch": 0.36, + "learning_rate": 1.2909013242204184e-07, + "loss": 0.0015, + "step": 18310 + }, + { + "epoch": 0.36, + "learning_rate": 1.2908624907770572e-07, + "loss": 0.8151, + "step": 18311 + }, + { + "epoch": 0.36, + "learning_rate": 1.2908236573336956e-07, + "loss": 0.0007, + "step": 18312 + }, + { + "epoch": 0.36, + "learning_rate": 1.2907848238903343e-07, + "loss": 0.0067, + "step": 18313 + }, + { + "epoch": 0.36, + "learning_rate": 1.2907459904469728e-07, + "loss": 0.0008, + "step": 18314 + }, + { + "epoch": 0.36, + "learning_rate": 1.2907071570036115e-07, + "loss": 0.0011, + "step": 18315 + }, + { + "epoch": 0.36, + "learning_rate": 1.29066832356025e-07, + "loss": 0.0218, + "step": 18316 + }, + { + "epoch": 0.36, + "learning_rate": 1.2906294901168887e-07, + "loss": 0.0034, + "step": 18317 + }, + { + "epoch": 0.36, + "learning_rate": 1.290590656673527e-07, + "loss": 0.0009, + "step": 18318 + }, + { + "epoch": 0.36, + "learning_rate": 1.2905518232301658e-07, + "loss": 0.0009, + "step": 18319 + }, + { + "epoch": 0.36, + "learning_rate": 1.2905129897868043e-07, + "loss": 0.0008, + "step": 18320 + }, + { + "epoch": 0.36, + "learning_rate": 1.290474156343443e-07, + "loss": 0.1703, + "step": 18321 + }, + { + "epoch": 0.36, + "learning_rate": 1.2904353229000814e-07, + "loss": 0.0008, + "step": 18322 + }, + { + "epoch": 0.36, + "learning_rate": 1.2903964894567201e-07, + "loss": 0.2827, + "step": 18323 + }, + { + "epoch": 0.36, + "learning_rate": 1.2903576560133586e-07, + "loss": 0.0017, + "step": 18324 + }, + { + "epoch": 0.36, + "learning_rate": 1.2903188225699973e-07, + "loss": 0.0008, + "step": 18325 + }, + { + "epoch": 0.36, + "learning_rate": 1.2902799891266358e-07, + "loss": 0.0008, + "step": 18326 + }, + { + "epoch": 0.36, + "learning_rate": 1.2902411556832745e-07, + "loss": 0.0009, + "step": 18327 + }, + { + "epoch": 0.36, + "learning_rate": 1.290202322239913e-07, + "loss": 0.7188, + "step": 18328 + }, + { + "epoch": 0.36, + "learning_rate": 1.2901634887965516e-07, + "loss": 0.0011, + "step": 18329 + }, + { + "epoch": 0.36, + "learning_rate": 1.29012465535319e-07, + "loss": 0.0078, + "step": 18330 + }, + { + "epoch": 0.36, + "learning_rate": 1.2900858219098288e-07, + "loss": 0.0006, + "step": 18331 + }, + { + "epoch": 0.36, + "learning_rate": 1.2900469884664673e-07, + "loss": 0.5284, + "step": 18332 + }, + { + "epoch": 0.36, + "learning_rate": 1.290008155023106e-07, + "loss": 0.0015, + "step": 18333 + }, + { + "epoch": 0.36, + "learning_rate": 1.2899693215797444e-07, + "loss": 0.001, + "step": 18334 + }, + { + "epoch": 0.36, + "learning_rate": 1.2899304881363831e-07, + "loss": 0.3929, + "step": 18335 + }, + { + "epoch": 0.36, + "learning_rate": 1.2898916546930216e-07, + "loss": 0.6686, + "step": 18336 + }, + { + "epoch": 0.36, + "learning_rate": 1.2898528212496603e-07, + "loss": 0.001, + "step": 18337 + }, + { + "epoch": 0.36, + "learning_rate": 1.2898139878062988e-07, + "loss": 0.0014, + "step": 18338 + }, + { + "epoch": 0.36, + "learning_rate": 1.2897751543629375e-07, + "loss": 0.0012, + "step": 18339 + }, + { + "epoch": 0.36, + "learning_rate": 1.289736320919576e-07, + "loss": 0.0008, + "step": 18340 + }, + { + "epoch": 0.36, + "learning_rate": 1.2896974874762146e-07, + "loss": 1.4141, + "step": 18341 + }, + { + "epoch": 0.36, + "learning_rate": 1.289658654032853e-07, + "loss": 0.5503, + "step": 18342 + }, + { + "epoch": 0.36, + "learning_rate": 1.2896198205894918e-07, + "loss": 0.0189, + "step": 18343 + }, + { + "epoch": 0.36, + "learning_rate": 1.2895809871461302e-07, + "loss": 0.0009, + "step": 18344 + }, + { + "epoch": 0.36, + "learning_rate": 1.289542153702769e-07, + "loss": 0.003, + "step": 18345 + }, + { + "epoch": 0.36, + "learning_rate": 1.2895033202594074e-07, + "loss": 0.0008, + "step": 18346 + }, + { + "epoch": 0.36, + "learning_rate": 1.289464486816046e-07, + "loss": 0.6529, + "step": 18347 + }, + { + "epoch": 0.36, + "learning_rate": 1.2894256533726846e-07, + "loss": 0.0204, + "step": 18348 + }, + { + "epoch": 0.36, + "learning_rate": 1.289386819929323e-07, + "loss": 0.0007, + "step": 18349 + }, + { + "epoch": 0.36, + "learning_rate": 1.2893479864859615e-07, + "loss": 0.0011, + "step": 18350 + }, + { + "epoch": 0.36, + "learning_rate": 1.2893091530426002e-07, + "loss": 0.3794, + "step": 18351 + }, + { + "epoch": 0.36, + "learning_rate": 1.2892703195992386e-07, + "loss": 0.0014, + "step": 18352 + }, + { + "epoch": 0.36, + "learning_rate": 1.2892314861558774e-07, + "loss": 0.0014, + "step": 18353 + }, + { + "epoch": 0.36, + "learning_rate": 1.2891926527125158e-07, + "loss": 0.003, + "step": 18354 + }, + { + "epoch": 0.36, + "learning_rate": 1.2891538192691545e-07, + "loss": 0.0008, + "step": 18355 + }, + { + "epoch": 0.36, + "learning_rate": 1.289114985825793e-07, + "loss": 0.0014, + "step": 18356 + }, + { + "epoch": 0.36, + "learning_rate": 1.2890761523824317e-07, + "loss": 0.1525, + "step": 18357 + }, + { + "epoch": 0.36, + "learning_rate": 1.2890373189390701e-07, + "loss": 0.9123, + "step": 18358 + }, + { + "epoch": 0.36, + "learning_rate": 1.2889984854957089e-07, + "loss": 0.0011, + "step": 18359 + }, + { + "epoch": 0.36, + "learning_rate": 1.2889596520523473e-07, + "loss": 1.0266, + "step": 18360 + }, + { + "epoch": 0.36, + "learning_rate": 1.288920818608986e-07, + "loss": 0.003, + "step": 18361 + }, + { + "epoch": 0.36, + "learning_rate": 1.2888819851656245e-07, + "loss": 0.004, + "step": 18362 + }, + { + "epoch": 0.36, + "learning_rate": 1.2888431517222632e-07, + "loss": 0.0009, + "step": 18363 + }, + { + "epoch": 0.36, + "learning_rate": 1.2888043182789016e-07, + "loss": 0.0012, + "step": 18364 + }, + { + "epoch": 0.36, + "learning_rate": 1.2887654848355403e-07, + "loss": 0.0009, + "step": 18365 + }, + { + "epoch": 0.36, + "learning_rate": 1.2887266513921788e-07, + "loss": 0.0008, + "step": 18366 + }, + { + "epoch": 0.36, + "learning_rate": 1.2886878179488175e-07, + "loss": 0.0009, + "step": 18367 + }, + { + "epoch": 0.36, + "learning_rate": 1.288648984505456e-07, + "loss": 0.001, + "step": 18368 + }, + { + "epoch": 0.36, + "learning_rate": 1.2886101510620947e-07, + "loss": 0.0011, + "step": 18369 + }, + { + "epoch": 0.36, + "learning_rate": 1.288571317618733e-07, + "loss": 0.0012, + "step": 18370 + }, + { + "epoch": 0.36, + "learning_rate": 1.2885324841753718e-07, + "loss": 0.0008, + "step": 18371 + }, + { + "epoch": 0.36, + "learning_rate": 1.2884936507320103e-07, + "loss": 0.0008, + "step": 18372 + }, + { + "epoch": 0.36, + "learning_rate": 1.288454817288649e-07, + "loss": 0.002, + "step": 18373 + }, + { + "epoch": 0.36, + "learning_rate": 1.2884159838452875e-07, + "loss": 0.0006, + "step": 18374 + }, + { + "epoch": 0.36, + "learning_rate": 1.2883771504019262e-07, + "loss": 0.0008, + "step": 18375 + }, + { + "epoch": 0.36, + "learning_rate": 1.2883383169585646e-07, + "loss": 0.0143, + "step": 18376 + }, + { + "epoch": 0.36, + "learning_rate": 1.2882994835152033e-07, + "loss": 0.0007, + "step": 18377 + }, + { + "epoch": 0.36, + "learning_rate": 1.2882606500718418e-07, + "loss": 0.0129, + "step": 18378 + }, + { + "epoch": 0.36, + "learning_rate": 1.2882218166284805e-07, + "loss": 0.0009, + "step": 18379 + }, + { + "epoch": 0.36, + "learning_rate": 1.288182983185119e-07, + "loss": 0.0062, + "step": 18380 + }, + { + "epoch": 0.36, + "learning_rate": 1.2881441497417577e-07, + "loss": 0.0246, + "step": 18381 + }, + { + "epoch": 0.36, + "learning_rate": 1.288105316298396e-07, + "loss": 0.0009, + "step": 18382 + }, + { + "epoch": 0.36, + "learning_rate": 1.2880664828550348e-07, + "loss": 0.0008, + "step": 18383 + }, + { + "epoch": 0.36, + "learning_rate": 1.2880276494116733e-07, + "loss": 0.0023, + "step": 18384 + }, + { + "epoch": 0.36, + "learning_rate": 1.287988815968312e-07, + "loss": 1.1169, + "step": 18385 + }, + { + "epoch": 0.36, + "learning_rate": 1.2879499825249504e-07, + "loss": 0.9441, + "step": 18386 + }, + { + "epoch": 0.36, + "learning_rate": 1.2879111490815892e-07, + "loss": 0.0008, + "step": 18387 + }, + { + "epoch": 0.36, + "learning_rate": 1.2878723156382276e-07, + "loss": 0.0008, + "step": 18388 + }, + { + "epoch": 0.36, + "learning_rate": 1.2878334821948663e-07, + "loss": 0.0016, + "step": 18389 + }, + { + "epoch": 0.36, + "learning_rate": 1.2877946487515048e-07, + "loss": 0.0069, + "step": 18390 + }, + { + "epoch": 0.36, + "learning_rate": 1.2877558153081435e-07, + "loss": 0.0007, + "step": 18391 + }, + { + "epoch": 0.36, + "learning_rate": 1.287716981864782e-07, + "loss": 0.2121, + "step": 18392 + }, + { + "epoch": 0.36, + "learning_rate": 1.2876781484214207e-07, + "loss": 0.0028, + "step": 18393 + }, + { + "epoch": 0.36, + "learning_rate": 1.287639314978059e-07, + "loss": 0.0009, + "step": 18394 + }, + { + "epoch": 0.36, + "learning_rate": 1.2876004815346978e-07, + "loss": 0.0008, + "step": 18395 + }, + { + "epoch": 0.36, + "learning_rate": 1.2875616480913363e-07, + "loss": 0.0029, + "step": 18396 + }, + { + "epoch": 0.36, + "learning_rate": 1.287522814647975e-07, + "loss": 0.0008, + "step": 18397 + }, + { + "epoch": 0.36, + "learning_rate": 1.2874839812046134e-07, + "loss": 0.7254, + "step": 18398 + }, + { + "epoch": 0.36, + "learning_rate": 1.287445147761252e-07, + "loss": 0.0031, + "step": 18399 + }, + { + "epoch": 0.36, + "learning_rate": 1.2874063143178906e-07, + "loss": 0.7784, + "step": 18400 + }, + { + "epoch": 0.36, + "learning_rate": 1.287367480874529e-07, + "loss": 0.0007, + "step": 18401 + }, + { + "epoch": 0.36, + "learning_rate": 1.2873286474311678e-07, + "loss": 0.4977, + "step": 18402 + }, + { + "epoch": 0.36, + "learning_rate": 1.2872898139878062e-07, + "loss": 0.0119, + "step": 18403 + }, + { + "epoch": 0.36, + "learning_rate": 1.287250980544445e-07, + "loss": 0.2654, + "step": 18404 + }, + { + "epoch": 0.36, + "learning_rate": 1.2872121471010834e-07, + "loss": 0.0008, + "step": 18405 + }, + { + "epoch": 0.36, + "learning_rate": 1.287173313657722e-07, + "loss": 0.0008, + "step": 18406 + }, + { + "epoch": 0.36, + "learning_rate": 1.2871344802143605e-07, + "loss": 1.1854, + "step": 18407 + }, + { + "epoch": 0.36, + "learning_rate": 1.287095646770999e-07, + "loss": 0.0009, + "step": 18408 + }, + { + "epoch": 0.36, + "learning_rate": 1.2870568133276377e-07, + "loss": 0.0009, + "step": 18409 + }, + { + "epoch": 0.36, + "learning_rate": 1.2870179798842762e-07, + "loss": 0.0595, + "step": 18410 + }, + { + "epoch": 0.36, + "learning_rate": 1.286979146440915e-07, + "loss": 0.0026, + "step": 18411 + }, + { + "epoch": 0.36, + "learning_rate": 1.2869403129975533e-07, + "loss": 0.0023, + "step": 18412 + }, + { + "epoch": 0.36, + "learning_rate": 1.286901479554192e-07, + "loss": 0.0009, + "step": 18413 + }, + { + "epoch": 0.36, + "learning_rate": 1.2868626461108305e-07, + "loss": 0.3077, + "step": 18414 + }, + { + "epoch": 0.36, + "learning_rate": 1.2868238126674692e-07, + "loss": 0.0065, + "step": 18415 + }, + { + "epoch": 0.36, + "learning_rate": 1.2867849792241077e-07, + "loss": 0.001, + "step": 18416 + }, + { + "epoch": 0.36, + "learning_rate": 1.2867461457807464e-07, + "loss": 0.0007, + "step": 18417 + }, + { + "epoch": 0.36, + "learning_rate": 1.2867073123373848e-07, + "loss": 0.0012, + "step": 18418 + }, + { + "epoch": 0.36, + "learning_rate": 1.2866684788940235e-07, + "loss": 0.0017, + "step": 18419 + }, + { + "epoch": 0.36, + "learning_rate": 1.286629645450662e-07, + "loss": 0.0007, + "step": 18420 + }, + { + "epoch": 0.36, + "learning_rate": 1.2865908120073007e-07, + "loss": 0.001, + "step": 18421 + }, + { + "epoch": 0.36, + "learning_rate": 1.2865519785639391e-07, + "loss": 0.4938, + "step": 18422 + }, + { + "epoch": 0.36, + "learning_rate": 1.2865131451205779e-07, + "loss": 0.001, + "step": 18423 + }, + { + "epoch": 0.36, + "learning_rate": 1.2864743116772163e-07, + "loss": 0.0011, + "step": 18424 + }, + { + "epoch": 0.36, + "learning_rate": 1.286435478233855e-07, + "loss": 0.0012, + "step": 18425 + }, + { + "epoch": 0.36, + "learning_rate": 1.2863966447904935e-07, + "loss": 0.0009, + "step": 18426 + }, + { + "epoch": 0.36, + "learning_rate": 1.286357811347132e-07, + "loss": 0.001, + "step": 18427 + }, + { + "epoch": 0.36, + "learning_rate": 1.2863189779037706e-07, + "loss": 1.148, + "step": 18428 + }, + { + "epoch": 0.36, + "learning_rate": 1.286280144460409e-07, + "loss": 0.0008, + "step": 18429 + }, + { + "epoch": 0.36, + "learning_rate": 1.2862413110170478e-07, + "loss": 0.0029, + "step": 18430 + }, + { + "epoch": 0.36, + "learning_rate": 1.2862024775736863e-07, + "loss": 0.0009, + "step": 18431 + }, + { + "epoch": 0.36, + "learning_rate": 1.286163644130325e-07, + "loss": 0.0019, + "step": 18432 + }, + { + "epoch": 0.36, + "learning_rate": 1.2861248106869634e-07, + "loss": 0.0016, + "step": 18433 + }, + { + "epoch": 0.36, + "learning_rate": 1.2860859772436021e-07, + "loss": 0.0014, + "step": 18434 + }, + { + "epoch": 0.36, + "learning_rate": 1.2860471438002406e-07, + "loss": 0.0007, + "step": 18435 + }, + { + "epoch": 0.36, + "learning_rate": 1.2860083103568793e-07, + "loss": 0.0014, + "step": 18436 + }, + { + "epoch": 0.36, + "learning_rate": 1.2859694769135178e-07, + "loss": 1.2223, + "step": 18437 + }, + { + "epoch": 0.36, + "learning_rate": 1.2859306434701565e-07, + "loss": 0.0016, + "step": 18438 + }, + { + "epoch": 0.36, + "learning_rate": 1.285891810026795e-07, + "loss": 0.0009, + "step": 18439 + }, + { + "epoch": 0.36, + "learning_rate": 1.2858529765834336e-07, + "loss": 0.0009, + "step": 18440 + }, + { + "epoch": 0.36, + "learning_rate": 1.285814143140072e-07, + "loss": 0.0008, + "step": 18441 + }, + { + "epoch": 0.36, + "learning_rate": 1.2857753096967108e-07, + "loss": 0.116, + "step": 18442 + }, + { + "epoch": 0.36, + "learning_rate": 1.2857364762533492e-07, + "loss": 0.0008, + "step": 18443 + }, + { + "epoch": 0.36, + "learning_rate": 1.285697642809988e-07, + "loss": 0.001, + "step": 18444 + }, + { + "epoch": 0.36, + "learning_rate": 1.2856588093666264e-07, + "loss": 0.0009, + "step": 18445 + }, + { + "epoch": 0.36, + "learning_rate": 1.285619975923265e-07, + "loss": 0.0015, + "step": 18446 + }, + { + "epoch": 0.36, + "learning_rate": 1.2855811424799036e-07, + "loss": 0.0009, + "step": 18447 + }, + { + "epoch": 0.36, + "learning_rate": 1.2855423090365423e-07, + "loss": 0.0006, + "step": 18448 + }, + { + "epoch": 0.36, + "learning_rate": 1.2855034755931807e-07, + "loss": 0.0009, + "step": 18449 + }, + { + "epoch": 0.36, + "learning_rate": 1.2854646421498195e-07, + "loss": 0.0015, + "step": 18450 + }, + { + "epoch": 0.36, + "learning_rate": 1.285425808706458e-07, + "loss": 0.0008, + "step": 18451 + }, + { + "epoch": 0.36, + "learning_rate": 1.2853869752630966e-07, + "loss": 0.0009, + "step": 18452 + }, + { + "epoch": 0.36, + "learning_rate": 1.285348141819735e-07, + "loss": 0.0008, + "step": 18453 + }, + { + "epoch": 0.36, + "learning_rate": 1.2853093083763738e-07, + "loss": 1.0846, + "step": 18454 + }, + { + "epoch": 0.36, + "learning_rate": 1.2852704749330122e-07, + "loss": 0.0014, + "step": 18455 + }, + { + "epoch": 0.36, + "learning_rate": 1.285231641489651e-07, + "loss": 0.0008, + "step": 18456 + }, + { + "epoch": 0.36, + "learning_rate": 1.2851928080462894e-07, + "loss": 0.0008, + "step": 18457 + }, + { + "epoch": 0.36, + "learning_rate": 1.285153974602928e-07, + "loss": 1.207, + "step": 18458 + }, + { + "epoch": 0.36, + "learning_rate": 1.2851151411595666e-07, + "loss": 0.7628, + "step": 18459 + }, + { + "epoch": 0.36, + "learning_rate": 1.2850763077162053e-07, + "loss": 0.0008, + "step": 18460 + }, + { + "epoch": 0.36, + "learning_rate": 1.2850374742728437e-07, + "loss": 0.0076, + "step": 18461 + }, + { + "epoch": 0.36, + "learning_rate": 1.2849986408294824e-07, + "loss": 0.014, + "step": 18462 + }, + { + "epoch": 0.36, + "learning_rate": 1.284959807386121e-07, + "loss": 0.0008, + "step": 18463 + }, + { + "epoch": 0.36, + "learning_rate": 1.2849209739427596e-07, + "loss": 0.0008, + "step": 18464 + }, + { + "epoch": 0.36, + "learning_rate": 1.2848821404993978e-07, + "loss": 0.0008, + "step": 18465 + }, + { + "epoch": 0.36, + "learning_rate": 1.2848433070560365e-07, + "loss": 0.0008, + "step": 18466 + }, + { + "epoch": 0.36, + "learning_rate": 1.284804473612675e-07, + "loss": 0.0251, + "step": 18467 + }, + { + "epoch": 0.36, + "learning_rate": 1.2847656401693137e-07, + "loss": 0.0012, + "step": 18468 + }, + { + "epoch": 0.36, + "learning_rate": 1.284726806725952e-07, + "loss": 0.9421, + "step": 18469 + }, + { + "epoch": 0.36, + "learning_rate": 1.2846879732825908e-07, + "loss": 0.0009, + "step": 18470 + }, + { + "epoch": 0.36, + "learning_rate": 1.2846491398392293e-07, + "loss": 0.0016, + "step": 18471 + }, + { + "epoch": 0.36, + "learning_rate": 1.284610306395868e-07, + "loss": 0.0016, + "step": 18472 + }, + { + "epoch": 0.36, + "learning_rate": 1.2845714729525065e-07, + "loss": 0.9424, + "step": 18473 + }, + { + "epoch": 0.36, + "learning_rate": 1.2845326395091452e-07, + "loss": 0.0009, + "step": 18474 + }, + { + "epoch": 0.36, + "learning_rate": 1.2844938060657836e-07, + "loss": 0.0009, + "step": 18475 + }, + { + "epoch": 0.36, + "learning_rate": 1.2844549726224223e-07, + "loss": 0.0009, + "step": 18476 + }, + { + "epoch": 0.36, + "learning_rate": 1.2844161391790608e-07, + "loss": 0.8912, + "step": 18477 + }, + { + "epoch": 0.36, + "learning_rate": 1.2843773057356995e-07, + "loss": 0.0026, + "step": 18478 + }, + { + "epoch": 0.36, + "learning_rate": 1.284338472292338e-07, + "loss": 0.0007, + "step": 18479 + }, + { + "epoch": 0.36, + "learning_rate": 1.2842996388489767e-07, + "loss": 0.0008, + "step": 18480 + }, + { + "epoch": 0.36, + "learning_rate": 1.284260805405615e-07, + "loss": 0.0009, + "step": 18481 + }, + { + "epoch": 0.36, + "learning_rate": 1.2842219719622538e-07, + "loss": 0.0007, + "step": 18482 + }, + { + "epoch": 0.36, + "learning_rate": 1.2841831385188923e-07, + "loss": 0.0008, + "step": 18483 + }, + { + "epoch": 0.36, + "learning_rate": 1.284144305075531e-07, + "loss": 0.0009, + "step": 18484 + }, + { + "epoch": 0.36, + "learning_rate": 1.2841054716321694e-07, + "loss": 0.1836, + "step": 18485 + }, + { + "epoch": 0.36, + "learning_rate": 1.2840666381888082e-07, + "loss": 0.0015, + "step": 18486 + }, + { + "epoch": 0.36, + "learning_rate": 1.2840278047454466e-07, + "loss": 0.0008, + "step": 18487 + }, + { + "epoch": 0.36, + "learning_rate": 1.2839889713020853e-07, + "loss": 0.0009, + "step": 18488 + }, + { + "epoch": 0.36, + "learning_rate": 1.2839501378587238e-07, + "loss": 0.001, + "step": 18489 + }, + { + "epoch": 0.36, + "learning_rate": 1.2839113044153625e-07, + "loss": 0.0011, + "step": 18490 + }, + { + "epoch": 0.36, + "learning_rate": 1.283872470972001e-07, + "loss": 0.0009, + "step": 18491 + }, + { + "epoch": 0.36, + "learning_rate": 1.2838336375286397e-07, + "loss": 0.0013, + "step": 18492 + }, + { + "epoch": 0.36, + "learning_rate": 1.283794804085278e-07, + "loss": 0.0016, + "step": 18493 + }, + { + "epoch": 0.36, + "learning_rate": 1.2837559706419168e-07, + "loss": 0.2949, + "step": 18494 + }, + { + "epoch": 0.36, + "learning_rate": 1.2837171371985553e-07, + "loss": 0.001, + "step": 18495 + }, + { + "epoch": 0.36, + "learning_rate": 1.283678303755194e-07, + "loss": 0.001, + "step": 18496 + }, + { + "epoch": 0.36, + "learning_rate": 1.2836394703118324e-07, + "loss": 0.0008, + "step": 18497 + }, + { + "epoch": 0.36, + "learning_rate": 1.2836006368684711e-07, + "loss": 0.0977, + "step": 18498 + }, + { + "epoch": 0.36, + "learning_rate": 1.2835618034251096e-07, + "loss": 0.0008, + "step": 18499 + }, + { + "epoch": 0.36, + "learning_rate": 1.2835229699817483e-07, + "loss": 0.0017, + "step": 18500 + }, + { + "epoch": 0.36, + "learning_rate": 1.2834841365383868e-07, + "loss": 0.0022, + "step": 18501 + }, + { + "epoch": 0.36, + "learning_rate": 1.2834453030950255e-07, + "loss": 0.0009, + "step": 18502 + }, + { + "epoch": 0.36, + "learning_rate": 1.283406469651664e-07, + "loss": 0.0099, + "step": 18503 + }, + { + "epoch": 0.36, + "learning_rate": 1.2833676362083026e-07, + "loss": 0.0013, + "step": 18504 + }, + { + "epoch": 0.36, + "learning_rate": 1.283328802764941e-07, + "loss": 0.0173, + "step": 18505 + }, + { + "epoch": 0.36, + "learning_rate": 1.2832899693215798e-07, + "loss": 0.0013, + "step": 18506 + }, + { + "epoch": 0.36, + "learning_rate": 1.2832511358782183e-07, + "loss": 0.0009, + "step": 18507 + }, + { + "epoch": 0.36, + "learning_rate": 1.283212302434857e-07, + "loss": 1.1923, + "step": 18508 + }, + { + "epoch": 0.36, + "learning_rate": 1.2831734689914954e-07, + "loss": 0.0011, + "step": 18509 + }, + { + "epoch": 0.36, + "learning_rate": 1.2831346355481341e-07, + "loss": 0.0007, + "step": 18510 + }, + { + "epoch": 0.36, + "learning_rate": 1.2830958021047726e-07, + "loss": 0.0009, + "step": 18511 + }, + { + "epoch": 0.36, + "learning_rate": 1.2830569686614113e-07, + "loss": 0.0008, + "step": 18512 + }, + { + "epoch": 0.36, + "learning_rate": 1.2830181352180498e-07, + "loss": 0.0013, + "step": 18513 + }, + { + "epoch": 0.36, + "learning_rate": 1.2829793017746885e-07, + "loss": 0.0008, + "step": 18514 + }, + { + "epoch": 0.36, + "learning_rate": 1.282940468331327e-07, + "loss": 1.0959, + "step": 18515 + }, + { + "epoch": 0.36, + "learning_rate": 1.2829016348879656e-07, + "loss": 0.0008, + "step": 18516 + }, + { + "epoch": 0.36, + "learning_rate": 1.282862801444604e-07, + "loss": 0.0008, + "step": 18517 + }, + { + "epoch": 0.36, + "learning_rate": 1.2828239680012428e-07, + "loss": 0.0009, + "step": 18518 + }, + { + "epoch": 0.36, + "learning_rate": 1.2827851345578812e-07, + "loss": 0.0013, + "step": 18519 + }, + { + "epoch": 0.36, + "learning_rate": 1.28274630111452e-07, + "loss": 0.422, + "step": 18520 + }, + { + "epoch": 0.36, + "learning_rate": 1.2827074676711584e-07, + "loss": 0.0007, + "step": 18521 + }, + { + "epoch": 0.36, + "learning_rate": 1.282668634227797e-07, + "loss": 0.5036, + "step": 18522 + }, + { + "epoch": 0.36, + "learning_rate": 1.2826298007844353e-07, + "loss": 0.0008, + "step": 18523 + }, + { + "epoch": 0.36, + "learning_rate": 1.282590967341074e-07, + "loss": 0.002, + "step": 18524 + }, + { + "epoch": 0.36, + "learning_rate": 1.2825521338977125e-07, + "loss": 0.0007, + "step": 18525 + }, + { + "epoch": 0.36, + "learning_rate": 1.2825133004543512e-07, + "loss": 0.001, + "step": 18526 + }, + { + "epoch": 0.36, + "learning_rate": 1.2824744670109896e-07, + "loss": 0.0009, + "step": 18527 + }, + { + "epoch": 0.36, + "learning_rate": 1.2824356335676284e-07, + "loss": 0.002, + "step": 18528 + }, + { + "epoch": 0.36, + "learning_rate": 1.2823968001242668e-07, + "loss": 0.0012, + "step": 18529 + }, + { + "epoch": 0.36, + "learning_rate": 1.2823579666809055e-07, + "loss": 0.0007, + "step": 18530 + }, + { + "epoch": 0.36, + "learning_rate": 1.282319133237544e-07, + "loss": 0.0009, + "step": 18531 + }, + { + "epoch": 0.36, + "learning_rate": 1.2822802997941827e-07, + "loss": 0.0011, + "step": 18532 + }, + { + "epoch": 0.36, + "learning_rate": 1.2822414663508211e-07, + "loss": 0.0014, + "step": 18533 + }, + { + "epoch": 0.36, + "learning_rate": 1.2822026329074599e-07, + "loss": 0.0009, + "step": 18534 + }, + { + "epoch": 0.36, + "learning_rate": 1.2821637994640983e-07, + "loss": 0.0012, + "step": 18535 + }, + { + "epoch": 0.36, + "learning_rate": 1.282124966020737e-07, + "loss": 0.0016, + "step": 18536 + }, + { + "epoch": 0.36, + "learning_rate": 1.2820861325773755e-07, + "loss": 0.0023, + "step": 18537 + }, + { + "epoch": 0.36, + "learning_rate": 1.2820472991340142e-07, + "loss": 0.0011, + "step": 18538 + }, + { + "epoch": 0.36, + "learning_rate": 1.2820084656906526e-07, + "loss": 0.0008, + "step": 18539 + }, + { + "epoch": 0.36, + "learning_rate": 1.2819696322472913e-07, + "loss": 0.0008, + "step": 18540 + }, + { + "epoch": 0.36, + "learning_rate": 1.2819307988039298e-07, + "loss": 0.0046, + "step": 18541 + }, + { + "epoch": 0.36, + "learning_rate": 1.2818919653605685e-07, + "loss": 0.0008, + "step": 18542 + }, + { + "epoch": 0.36, + "learning_rate": 1.281853131917207e-07, + "loss": 0.0358, + "step": 18543 + }, + { + "epoch": 0.36, + "learning_rate": 1.2818142984738457e-07, + "loss": 0.0006, + "step": 18544 + }, + { + "epoch": 0.36, + "learning_rate": 1.281775465030484e-07, + "loss": 0.0008, + "step": 18545 + }, + { + "epoch": 0.36, + "learning_rate": 1.2817366315871228e-07, + "loss": 0.0025, + "step": 18546 + }, + { + "epoch": 0.36, + "learning_rate": 1.2816977981437613e-07, + "loss": 0.0007, + "step": 18547 + }, + { + "epoch": 0.36, + "learning_rate": 1.2816589647004e-07, + "loss": 1.207, + "step": 18548 + }, + { + "epoch": 0.36, + "learning_rate": 1.2816201312570385e-07, + "loss": 0.0009, + "step": 18549 + }, + { + "epoch": 0.36, + "learning_rate": 1.2815812978136772e-07, + "loss": 0.813, + "step": 18550 + }, + { + "epoch": 0.36, + "learning_rate": 1.2815424643703156e-07, + "loss": 0.0013, + "step": 18551 + }, + { + "epoch": 0.36, + "learning_rate": 1.2815036309269543e-07, + "loss": 0.0048, + "step": 18552 + }, + { + "epoch": 0.36, + "learning_rate": 1.2814647974835928e-07, + "loss": 0.0008, + "step": 18553 + }, + { + "epoch": 0.36, + "learning_rate": 1.2814259640402315e-07, + "loss": 0.0011, + "step": 18554 + }, + { + "epoch": 0.36, + "learning_rate": 1.28138713059687e-07, + "loss": 0.0009, + "step": 18555 + }, + { + "epoch": 0.36, + "learning_rate": 1.2813482971535087e-07, + "loss": 0.0012, + "step": 18556 + }, + { + "epoch": 0.36, + "learning_rate": 1.281309463710147e-07, + "loss": 0.0009, + "step": 18557 + }, + { + "epoch": 0.36, + "learning_rate": 1.2812706302667858e-07, + "loss": 0.007, + "step": 18558 + }, + { + "epoch": 0.36, + "learning_rate": 1.2812317968234243e-07, + "loss": 0.001, + "step": 18559 + }, + { + "epoch": 0.36, + "learning_rate": 1.281192963380063e-07, + "loss": 0.0021, + "step": 18560 + }, + { + "epoch": 0.36, + "learning_rate": 1.2811541299367014e-07, + "loss": 0.0011, + "step": 18561 + }, + { + "epoch": 0.36, + "learning_rate": 1.2811152964933402e-07, + "loss": 0.0013, + "step": 18562 + }, + { + "epoch": 0.36, + "learning_rate": 1.2810764630499786e-07, + "loss": 0.0007, + "step": 18563 + }, + { + "epoch": 0.36, + "learning_rate": 1.2810376296066173e-07, + "loss": 0.7119, + "step": 18564 + }, + { + "epoch": 0.36, + "learning_rate": 1.2809987961632558e-07, + "loss": 0.0009, + "step": 18565 + }, + { + "epoch": 0.36, + "learning_rate": 1.2809599627198945e-07, + "loss": 0.0024, + "step": 18566 + }, + { + "epoch": 0.36, + "learning_rate": 1.280921129276533e-07, + "loss": 0.001, + "step": 18567 + }, + { + "epoch": 0.36, + "learning_rate": 1.2808822958331717e-07, + "loss": 0.163, + "step": 18568 + }, + { + "epoch": 0.36, + "learning_rate": 1.28084346238981e-07, + "loss": 0.0039, + "step": 18569 + }, + { + "epoch": 0.36, + "learning_rate": 1.2808046289464488e-07, + "loss": 0.0009, + "step": 18570 + }, + { + "epoch": 0.36, + "learning_rate": 1.2807657955030873e-07, + "loss": 0.0007, + "step": 18571 + }, + { + "epoch": 0.36, + "learning_rate": 1.280726962059726e-07, + "loss": 0.0008, + "step": 18572 + }, + { + "epoch": 0.36, + "learning_rate": 1.2806881286163644e-07, + "loss": 0.0032, + "step": 18573 + }, + { + "epoch": 0.36, + "learning_rate": 1.2806492951730032e-07, + "loss": 0.0013, + "step": 18574 + }, + { + "epoch": 0.36, + "learning_rate": 1.2806104617296416e-07, + "loss": 0.0008, + "step": 18575 + }, + { + "epoch": 0.36, + "learning_rate": 1.28057162828628e-07, + "loss": 0.9525, + "step": 18576 + }, + { + "epoch": 0.36, + "learning_rate": 1.2805327948429188e-07, + "loss": 0.0008, + "step": 18577 + }, + { + "epoch": 0.36, + "learning_rate": 1.2804939613995572e-07, + "loss": 0.0008, + "step": 18578 + }, + { + "epoch": 0.36, + "learning_rate": 1.280455127956196e-07, + "loss": 0.0007, + "step": 18579 + }, + { + "epoch": 0.36, + "learning_rate": 1.2804162945128344e-07, + "loss": 0.0008, + "step": 18580 + }, + { + "epoch": 0.36, + "learning_rate": 1.2803774610694728e-07, + "loss": 0.0007, + "step": 18581 + }, + { + "epoch": 0.36, + "learning_rate": 1.2803386276261115e-07, + "loss": 0.0012, + "step": 18582 + }, + { + "epoch": 0.36, + "learning_rate": 1.28029979418275e-07, + "loss": 0.0008, + "step": 18583 + }, + { + "epoch": 0.36, + "learning_rate": 1.2802609607393887e-07, + "loss": 0.1909, + "step": 18584 + }, + { + "epoch": 0.36, + "learning_rate": 1.2802221272960272e-07, + "loss": 0.0009, + "step": 18585 + }, + { + "epoch": 0.36, + "learning_rate": 1.280183293852666e-07, + "loss": 1.3822, + "step": 18586 + }, + { + "epoch": 0.36, + "learning_rate": 1.2801444604093043e-07, + "loss": 0.0013, + "step": 18587 + }, + { + "epoch": 0.36, + "learning_rate": 1.280105626965943e-07, + "loss": 0.0008, + "step": 18588 + }, + { + "epoch": 0.36, + "learning_rate": 1.2800667935225815e-07, + "loss": 0.002, + "step": 18589 + }, + { + "epoch": 0.36, + "learning_rate": 1.2800279600792202e-07, + "loss": 0.0009, + "step": 18590 + }, + { + "epoch": 0.36, + "learning_rate": 1.2799891266358587e-07, + "loss": 0.0011, + "step": 18591 + }, + { + "epoch": 0.36, + "learning_rate": 1.2799502931924974e-07, + "loss": 0.0007, + "step": 18592 + }, + { + "epoch": 0.36, + "learning_rate": 1.2799114597491358e-07, + "loss": 0.0025, + "step": 18593 + }, + { + "epoch": 0.36, + "learning_rate": 1.2798726263057745e-07, + "loss": 0.0011, + "step": 18594 + }, + { + "epoch": 0.36, + "learning_rate": 1.279833792862413e-07, + "loss": 0.1373, + "step": 18595 + }, + { + "epoch": 0.36, + "learning_rate": 1.2797949594190517e-07, + "loss": 1.245, + "step": 18596 + }, + { + "epoch": 0.36, + "learning_rate": 1.2797561259756901e-07, + "loss": 0.003, + "step": 18597 + }, + { + "epoch": 0.36, + "learning_rate": 1.2797172925323289e-07, + "loss": 0.0008, + "step": 18598 + }, + { + "epoch": 0.36, + "learning_rate": 1.2796784590889673e-07, + "loss": 0.4043, + "step": 18599 + }, + { + "epoch": 0.36, + "learning_rate": 1.279639625645606e-07, + "loss": 0.0008, + "step": 18600 + }, + { + "epoch": 0.36, + "learning_rate": 1.2796007922022445e-07, + "loss": 0.0009, + "step": 18601 + }, + { + "epoch": 0.36, + "learning_rate": 1.2795619587588832e-07, + "loss": 0.0007, + "step": 18602 + }, + { + "epoch": 0.36, + "learning_rate": 1.2795231253155216e-07, + "loss": 0.0006, + "step": 18603 + }, + { + "epoch": 0.36, + "learning_rate": 1.27948429187216e-07, + "loss": 0.029, + "step": 18604 + }, + { + "epoch": 0.36, + "learning_rate": 1.2794454584287988e-07, + "loss": 0.4006, + "step": 18605 + }, + { + "epoch": 0.36, + "learning_rate": 1.2794066249854373e-07, + "loss": 0.0009, + "step": 18606 + }, + { + "epoch": 0.36, + "learning_rate": 1.279367791542076e-07, + "loss": 0.0008, + "step": 18607 + }, + { + "epoch": 0.36, + "learning_rate": 1.2793289580987144e-07, + "loss": 0.001, + "step": 18608 + }, + { + "epoch": 0.36, + "learning_rate": 1.2792901246553531e-07, + "loss": 0.0023, + "step": 18609 + }, + { + "epoch": 0.36, + "learning_rate": 1.2792512912119916e-07, + "loss": 0.0007, + "step": 18610 + }, + { + "epoch": 0.36, + "learning_rate": 1.2792124577686303e-07, + "loss": 0.0006, + "step": 18611 + }, + { + "epoch": 0.36, + "learning_rate": 1.2791736243252688e-07, + "loss": 0.0012, + "step": 18612 + }, + { + "epoch": 0.36, + "learning_rate": 1.2791347908819075e-07, + "loss": 0.0007, + "step": 18613 + }, + { + "epoch": 0.36, + "learning_rate": 1.279095957438546e-07, + "loss": 0.6472, + "step": 18614 + }, + { + "epoch": 0.36, + "learning_rate": 1.2790571239951846e-07, + "loss": 0.0012, + "step": 18615 + }, + { + "epoch": 0.36, + "learning_rate": 1.279018290551823e-07, + "loss": 0.0011, + "step": 18616 + }, + { + "epoch": 0.36, + "learning_rate": 1.2789794571084618e-07, + "loss": 0.0009, + "step": 18617 + }, + { + "epoch": 0.36, + "learning_rate": 1.2789406236651002e-07, + "loss": 0.0009, + "step": 18618 + }, + { + "epoch": 0.36, + "learning_rate": 1.278901790221739e-07, + "loss": 0.0009, + "step": 18619 + }, + { + "epoch": 0.36, + "learning_rate": 1.2788629567783774e-07, + "loss": 0.0011, + "step": 18620 + }, + { + "epoch": 0.36, + "learning_rate": 1.278824123335016e-07, + "loss": 0.0007, + "step": 18621 + }, + { + "epoch": 0.36, + "learning_rate": 1.2787852898916546e-07, + "loss": 0.0007, + "step": 18622 + }, + { + "epoch": 0.36, + "learning_rate": 1.2787464564482933e-07, + "loss": 0.0006, + "step": 18623 + }, + { + "epoch": 0.36, + "learning_rate": 1.2787076230049317e-07, + "loss": 0.0008, + "step": 18624 + }, + { + "epoch": 0.36, + "learning_rate": 1.2786687895615705e-07, + "loss": 0.0011, + "step": 18625 + }, + { + "epoch": 0.36, + "learning_rate": 1.278629956118209e-07, + "loss": 0.0011, + "step": 18626 + }, + { + "epoch": 0.36, + "learning_rate": 1.2785911226748476e-07, + "loss": 0.0014, + "step": 18627 + }, + { + "epoch": 0.36, + "learning_rate": 1.278552289231486e-07, + "loss": 0.0012, + "step": 18628 + }, + { + "epoch": 0.36, + "learning_rate": 1.2785134557881248e-07, + "loss": 0.0008, + "step": 18629 + }, + { + "epoch": 0.36, + "learning_rate": 1.2784746223447632e-07, + "loss": 0.0011, + "step": 18630 + }, + { + "epoch": 0.36, + "learning_rate": 1.278435788901402e-07, + "loss": 0.0008, + "step": 18631 + }, + { + "epoch": 0.36, + "learning_rate": 1.2783969554580404e-07, + "loss": 0.0018, + "step": 18632 + }, + { + "epoch": 0.36, + "learning_rate": 1.278358122014679e-07, + "loss": 0.0022, + "step": 18633 + }, + { + "epoch": 0.36, + "learning_rate": 1.2783192885713176e-07, + "loss": 0.1854, + "step": 18634 + }, + { + "epoch": 0.36, + "learning_rate": 1.2782804551279563e-07, + "loss": 0.0008, + "step": 18635 + }, + { + "epoch": 0.36, + "learning_rate": 1.2782416216845947e-07, + "loss": 0.0009, + "step": 18636 + }, + { + "epoch": 0.36, + "learning_rate": 1.2782027882412334e-07, + "loss": 0.0008, + "step": 18637 + }, + { + "epoch": 0.36, + "learning_rate": 1.278163954797872e-07, + "loss": 0.0023, + "step": 18638 + }, + { + "epoch": 0.36, + "learning_rate": 1.2781251213545103e-07, + "loss": 0.0009, + "step": 18639 + }, + { + "epoch": 0.36, + "learning_rate": 1.2780862879111488e-07, + "loss": 0.0008, + "step": 18640 + }, + { + "epoch": 0.36, + "learning_rate": 1.2780474544677875e-07, + "loss": 1.2031, + "step": 18641 + }, + { + "epoch": 0.36, + "learning_rate": 1.278008621024426e-07, + "loss": 0.0005, + "step": 18642 + }, + { + "epoch": 0.36, + "learning_rate": 1.2779697875810647e-07, + "loss": 0.0008, + "step": 18643 + }, + { + "epoch": 0.36, + "learning_rate": 1.277930954137703e-07, + "loss": 0.0011, + "step": 18644 + }, + { + "epoch": 0.36, + "learning_rate": 1.2778921206943418e-07, + "loss": 0.0012, + "step": 18645 + }, + { + "epoch": 0.36, + "learning_rate": 1.2778532872509803e-07, + "loss": 0.0007, + "step": 18646 + }, + { + "epoch": 0.36, + "learning_rate": 1.277814453807619e-07, + "loss": 0.0072, + "step": 18647 + }, + { + "epoch": 0.36, + "learning_rate": 1.2777756203642575e-07, + "loss": 0.0011, + "step": 18648 + }, + { + "epoch": 0.36, + "learning_rate": 1.2777367869208962e-07, + "loss": 0.0009, + "step": 18649 + }, + { + "epoch": 0.36, + "learning_rate": 1.2776979534775346e-07, + "loss": 0.0011, + "step": 18650 + }, + { + "epoch": 0.36, + "learning_rate": 1.2776591200341733e-07, + "loss": 0.0007, + "step": 18651 + }, + { + "epoch": 0.36, + "learning_rate": 1.2776202865908118e-07, + "loss": 0.0017, + "step": 18652 + }, + { + "epoch": 0.36, + "learning_rate": 1.2775814531474505e-07, + "loss": 0.0083, + "step": 18653 + }, + { + "epoch": 0.36, + "learning_rate": 1.277542619704089e-07, + "loss": 0.0014, + "step": 18654 + }, + { + "epoch": 0.36, + "learning_rate": 1.2775037862607277e-07, + "loss": 0.0008, + "step": 18655 + }, + { + "epoch": 0.36, + "learning_rate": 1.277464952817366e-07, + "loss": 0.0008, + "step": 18656 + }, + { + "epoch": 0.36, + "learning_rate": 1.2774261193740048e-07, + "loss": 0.0008, + "step": 18657 + }, + { + "epoch": 0.36, + "learning_rate": 1.2773872859306433e-07, + "loss": 0.0012, + "step": 18658 + }, + { + "epoch": 0.36, + "learning_rate": 1.277348452487282e-07, + "loss": 0.0009, + "step": 18659 + }, + { + "epoch": 0.36, + "learning_rate": 1.2773096190439204e-07, + "loss": 0.0009, + "step": 18660 + }, + { + "epoch": 0.36, + "learning_rate": 1.2772707856005592e-07, + "loss": 0.001, + "step": 18661 + }, + { + "epoch": 0.36, + "learning_rate": 1.2772319521571976e-07, + "loss": 0.0006, + "step": 18662 + }, + { + "epoch": 0.36, + "learning_rate": 1.2771931187138363e-07, + "loss": 0.0008, + "step": 18663 + }, + { + "epoch": 0.36, + "learning_rate": 1.2771542852704748e-07, + "loss": 0.0021, + "step": 18664 + }, + { + "epoch": 0.36, + "learning_rate": 1.2771154518271135e-07, + "loss": 0.0008, + "step": 18665 + }, + { + "epoch": 0.36, + "learning_rate": 1.277076618383752e-07, + "loss": 0.0008, + "step": 18666 + }, + { + "epoch": 0.36, + "learning_rate": 1.2770377849403907e-07, + "loss": 1.0391, + "step": 18667 + }, + { + "epoch": 0.36, + "learning_rate": 1.276998951497029e-07, + "loss": 0.138, + "step": 18668 + }, + { + "epoch": 0.36, + "learning_rate": 1.2769601180536678e-07, + "loss": 0.0008, + "step": 18669 + }, + { + "epoch": 0.36, + "learning_rate": 1.2769212846103063e-07, + "loss": 0.001, + "step": 18670 + }, + { + "epoch": 0.36, + "learning_rate": 1.276882451166945e-07, + "loss": 0.0015, + "step": 18671 + }, + { + "epoch": 0.36, + "learning_rate": 1.2768436177235834e-07, + "loss": 0.9008, + "step": 18672 + }, + { + "epoch": 0.36, + "learning_rate": 1.2768047842802222e-07, + "loss": 0.001, + "step": 18673 + }, + { + "epoch": 0.36, + "learning_rate": 1.2767659508368606e-07, + "loss": 0.0007, + "step": 18674 + }, + { + "epoch": 0.36, + "learning_rate": 1.2767271173934993e-07, + "loss": 0.0013, + "step": 18675 + }, + { + "epoch": 0.36, + "learning_rate": 1.2766882839501378e-07, + "loss": 0.0009, + "step": 18676 + }, + { + "epoch": 0.36, + "learning_rate": 1.2766494505067765e-07, + "loss": 0.5672, + "step": 18677 + }, + { + "epoch": 0.36, + "learning_rate": 1.276610617063415e-07, + "loss": 0.0012, + "step": 18678 + }, + { + "epoch": 0.36, + "learning_rate": 1.2765717836200536e-07, + "loss": 0.0008, + "step": 18679 + }, + { + "epoch": 0.36, + "learning_rate": 1.276532950176692e-07, + "loss": 0.668, + "step": 18680 + }, + { + "epoch": 0.36, + "learning_rate": 1.2764941167333308e-07, + "loss": 0.0007, + "step": 18681 + }, + { + "epoch": 0.36, + "learning_rate": 1.2764552832899693e-07, + "loss": 0.0009, + "step": 18682 + }, + { + "epoch": 0.36, + "learning_rate": 1.276416449846608e-07, + "loss": 0.0006, + "step": 18683 + }, + { + "epoch": 0.36, + "learning_rate": 1.2763776164032464e-07, + "loss": 0.004, + "step": 18684 + }, + { + "epoch": 0.36, + "learning_rate": 1.2763387829598851e-07, + "loss": 0.0007, + "step": 18685 + }, + { + "epoch": 0.36, + "learning_rate": 1.2762999495165236e-07, + "loss": 0.0006, + "step": 18686 + }, + { + "epoch": 0.36, + "learning_rate": 1.2762611160731623e-07, + "loss": 1.0319, + "step": 18687 + }, + { + "epoch": 0.36, + "learning_rate": 1.2762222826298008e-07, + "loss": 0.0006, + "step": 18688 + }, + { + "epoch": 0.36, + "learning_rate": 1.2761834491864395e-07, + "loss": 0.0009, + "step": 18689 + }, + { + "epoch": 0.36, + "learning_rate": 1.276144615743078e-07, + "loss": 0.0008, + "step": 18690 + }, + { + "epoch": 0.36, + "learning_rate": 1.2761057822997166e-07, + "loss": 0.0006, + "step": 18691 + }, + { + "epoch": 0.36, + "learning_rate": 1.276066948856355e-07, + "loss": 0.0457, + "step": 18692 + }, + { + "epoch": 0.36, + "learning_rate": 1.2760281154129938e-07, + "loss": 0.6323, + "step": 18693 + }, + { + "epoch": 0.36, + "learning_rate": 1.2759892819696322e-07, + "loss": 0.0011, + "step": 18694 + }, + { + "epoch": 0.36, + "learning_rate": 1.275950448526271e-07, + "loss": 0.0008, + "step": 18695 + }, + { + "epoch": 0.36, + "learning_rate": 1.2759116150829094e-07, + "loss": 0.0009, + "step": 18696 + }, + { + "epoch": 0.36, + "learning_rate": 1.2758727816395479e-07, + "loss": 0.0012, + "step": 18697 + }, + { + "epoch": 0.36, + "learning_rate": 1.2758339481961863e-07, + "loss": 0.0006, + "step": 18698 + }, + { + "epoch": 0.36, + "learning_rate": 1.275795114752825e-07, + "loss": 0.0012, + "step": 18699 + }, + { + "epoch": 0.36, + "learning_rate": 1.2757562813094635e-07, + "loss": 0.0008, + "step": 18700 + }, + { + "epoch": 0.36, + "learning_rate": 1.2757174478661022e-07, + "loss": 0.0009, + "step": 18701 + }, + { + "epoch": 0.36, + "learning_rate": 1.2756786144227406e-07, + "loss": 0.0007, + "step": 18702 + }, + { + "epoch": 0.36, + "learning_rate": 1.2756397809793794e-07, + "loss": 0.0014, + "step": 18703 + }, + { + "epoch": 0.36, + "learning_rate": 1.2756009475360178e-07, + "loss": 0.0015, + "step": 18704 + }, + { + "epoch": 0.36, + "learning_rate": 1.2755621140926565e-07, + "loss": 0.0008, + "step": 18705 + }, + { + "epoch": 0.36, + "learning_rate": 1.275523280649295e-07, + "loss": 0.0008, + "step": 18706 + }, + { + "epoch": 0.36, + "learning_rate": 1.2754844472059337e-07, + "loss": 0.0012, + "step": 18707 + }, + { + "epoch": 0.36, + "learning_rate": 1.2754456137625721e-07, + "loss": 0.001, + "step": 18708 + }, + { + "epoch": 0.36, + "learning_rate": 1.2754067803192109e-07, + "loss": 0.0008, + "step": 18709 + }, + { + "epoch": 0.36, + "learning_rate": 1.2753679468758493e-07, + "loss": 0.0679, + "step": 18710 + }, + { + "epoch": 0.36, + "learning_rate": 1.275329113432488e-07, + "loss": 0.0325, + "step": 18711 + }, + { + "epoch": 0.36, + "learning_rate": 1.2752902799891265e-07, + "loss": 0.0008, + "step": 18712 + }, + { + "epoch": 0.36, + "learning_rate": 1.2752514465457652e-07, + "loss": 0.0006, + "step": 18713 + }, + { + "epoch": 0.36, + "learning_rate": 1.2752126131024036e-07, + "loss": 0.0007, + "step": 18714 + }, + { + "epoch": 0.36, + "learning_rate": 1.2751737796590423e-07, + "loss": 0.0007, + "step": 18715 + }, + { + "epoch": 0.36, + "learning_rate": 1.2751349462156808e-07, + "loss": 0.001, + "step": 18716 + }, + { + "epoch": 0.36, + "learning_rate": 1.2750961127723195e-07, + "loss": 0.0294, + "step": 18717 + }, + { + "epoch": 0.36, + "learning_rate": 1.275057279328958e-07, + "loss": 0.0008, + "step": 18718 + }, + { + "epoch": 0.36, + "learning_rate": 1.2750184458855967e-07, + "loss": 0.0008, + "step": 18719 + }, + { + "epoch": 0.36, + "learning_rate": 1.274979612442235e-07, + "loss": 0.0011, + "step": 18720 + }, + { + "epoch": 0.36, + "learning_rate": 1.2749407789988738e-07, + "loss": 0.002, + "step": 18721 + }, + { + "epoch": 0.36, + "learning_rate": 1.2749019455555123e-07, + "loss": 0.0007, + "step": 18722 + }, + { + "epoch": 0.36, + "learning_rate": 1.274863112112151e-07, + "loss": 0.0077, + "step": 18723 + }, + { + "epoch": 0.36, + "learning_rate": 1.2748242786687895e-07, + "loss": 0.2004, + "step": 18724 + }, + { + "epoch": 0.36, + "learning_rate": 1.2747854452254282e-07, + "loss": 0.001, + "step": 18725 + }, + { + "epoch": 0.36, + "learning_rate": 1.2747466117820666e-07, + "loss": 0.0057, + "step": 18726 + }, + { + "epoch": 0.36, + "learning_rate": 1.2747077783387053e-07, + "loss": 0.0008, + "step": 18727 + }, + { + "epoch": 0.36, + "learning_rate": 1.2746689448953438e-07, + "loss": 0.001, + "step": 18728 + }, + { + "epoch": 0.36, + "learning_rate": 1.2746301114519825e-07, + "loss": 0.0068, + "step": 18729 + }, + { + "epoch": 0.36, + "learning_rate": 1.274591278008621e-07, + "loss": 0.0012, + "step": 18730 + }, + { + "epoch": 0.36, + "learning_rate": 1.2745524445652597e-07, + "loss": 0.0268, + "step": 18731 + }, + { + "epoch": 0.36, + "learning_rate": 1.274513611121898e-07, + "loss": 0.0009, + "step": 18732 + }, + { + "epoch": 0.36, + "learning_rate": 1.2744747776785368e-07, + "loss": 0.0011, + "step": 18733 + }, + { + "epoch": 0.36, + "learning_rate": 1.2744359442351753e-07, + "loss": 0.0015, + "step": 18734 + }, + { + "epoch": 0.36, + "learning_rate": 1.274397110791814e-07, + "loss": 0.7714, + "step": 18735 + }, + { + "epoch": 0.36, + "learning_rate": 1.2743582773484524e-07, + "loss": 0.0008, + "step": 18736 + }, + { + "epoch": 0.36, + "learning_rate": 1.2743194439050912e-07, + "loss": 0.0008, + "step": 18737 + }, + { + "epoch": 0.36, + "learning_rate": 1.2742806104617296e-07, + "loss": 0.001, + "step": 18738 + }, + { + "epoch": 0.36, + "learning_rate": 1.2742417770183683e-07, + "loss": 0.001, + "step": 18739 + }, + { + "epoch": 0.36, + "learning_rate": 1.2742029435750068e-07, + "loss": 0.001, + "step": 18740 + }, + { + "epoch": 0.36, + "learning_rate": 1.2741641101316455e-07, + "loss": 0.0012, + "step": 18741 + }, + { + "epoch": 0.36, + "learning_rate": 1.274125276688284e-07, + "loss": 0.0009, + "step": 18742 + }, + { + "epoch": 0.36, + "learning_rate": 1.2740864432449227e-07, + "loss": 0.6967, + "step": 18743 + }, + { + "epoch": 0.36, + "learning_rate": 1.274047609801561e-07, + "loss": 0.0013, + "step": 18744 + }, + { + "epoch": 0.36, + "learning_rate": 1.2740087763581998e-07, + "loss": 0.0014, + "step": 18745 + }, + { + "epoch": 0.36, + "learning_rate": 1.2739699429148383e-07, + "loss": 1.1751, + "step": 18746 + }, + { + "epoch": 0.36, + "learning_rate": 1.273931109471477e-07, + "loss": 0.1109, + "step": 18747 + }, + { + "epoch": 0.36, + "learning_rate": 1.2738922760281154e-07, + "loss": 0.0012, + "step": 18748 + }, + { + "epoch": 0.36, + "learning_rate": 1.2738534425847542e-07, + "loss": 0.0011, + "step": 18749 + }, + { + "epoch": 0.36, + "learning_rate": 1.2738146091413926e-07, + "loss": 0.0101, + "step": 18750 + }, + { + "epoch": 0.36, + "learning_rate": 1.2737757756980313e-07, + "loss": 0.0008, + "step": 18751 + }, + { + "epoch": 0.36, + "learning_rate": 1.2737369422546698e-07, + "loss": 0.0009, + "step": 18752 + }, + { + "epoch": 0.36, + "learning_rate": 1.2736981088113082e-07, + "loss": 0.0015, + "step": 18753 + }, + { + "epoch": 0.36, + "learning_rate": 1.273659275367947e-07, + "loss": 0.0007, + "step": 18754 + }, + { + "epoch": 0.36, + "learning_rate": 1.2736204419245854e-07, + "loss": 0.0024, + "step": 18755 + }, + { + "epoch": 0.36, + "learning_rate": 1.2735816084812238e-07, + "loss": 0.0636, + "step": 18756 + }, + { + "epoch": 0.36, + "learning_rate": 1.2735427750378625e-07, + "loss": 0.0007, + "step": 18757 + }, + { + "epoch": 0.36, + "learning_rate": 1.273503941594501e-07, + "loss": 0.0007, + "step": 18758 + }, + { + "epoch": 0.36, + "learning_rate": 1.2734651081511397e-07, + "loss": 0.0021, + "step": 18759 + }, + { + "epoch": 0.36, + "learning_rate": 1.2734262747077782e-07, + "loss": 0.0058, + "step": 18760 + }, + { + "epoch": 0.36, + "learning_rate": 1.273387441264417e-07, + "loss": 0.0014, + "step": 18761 + }, + { + "epoch": 0.36, + "learning_rate": 1.2733486078210553e-07, + "loss": 0.5629, + "step": 18762 + }, + { + "epoch": 0.36, + "learning_rate": 1.273309774377694e-07, + "loss": 0.0015, + "step": 18763 + }, + { + "epoch": 0.36, + "learning_rate": 1.2732709409343325e-07, + "loss": 0.0012, + "step": 18764 + }, + { + "epoch": 0.36, + "learning_rate": 1.2732321074909712e-07, + "loss": 0.0012, + "step": 18765 + }, + { + "epoch": 0.36, + "learning_rate": 1.2731932740476097e-07, + "loss": 0.001, + "step": 18766 + }, + { + "epoch": 0.36, + "learning_rate": 1.2731544406042484e-07, + "loss": 0.0006, + "step": 18767 + }, + { + "epoch": 0.36, + "learning_rate": 1.2731156071608868e-07, + "loss": 0.0142, + "step": 18768 + }, + { + "epoch": 0.36, + "learning_rate": 1.2730767737175255e-07, + "loss": 0.001, + "step": 18769 + }, + { + "epoch": 0.36, + "learning_rate": 1.273037940274164e-07, + "loss": 0.0008, + "step": 18770 + }, + { + "epoch": 0.36, + "learning_rate": 1.2729991068308027e-07, + "loss": 0.001, + "step": 18771 + }, + { + "epoch": 0.36, + "learning_rate": 1.2729602733874412e-07, + "loss": 0.0014, + "step": 18772 + }, + { + "epoch": 0.36, + "learning_rate": 1.2729214399440799e-07, + "loss": 0.0008, + "step": 18773 + }, + { + "epoch": 0.36, + "learning_rate": 1.2728826065007183e-07, + "loss": 0.0012, + "step": 18774 + }, + { + "epoch": 0.36, + "learning_rate": 1.272843773057357e-07, + "loss": 0.0012, + "step": 18775 + }, + { + "epoch": 0.36, + "learning_rate": 1.2728049396139955e-07, + "loss": 0.0008, + "step": 18776 + }, + { + "epoch": 0.36, + "learning_rate": 1.2727661061706342e-07, + "loss": 0.0008, + "step": 18777 + }, + { + "epoch": 0.36, + "learning_rate": 1.2727272727272726e-07, + "loss": 0.0012, + "step": 18778 + }, + { + "epoch": 0.36, + "learning_rate": 1.2726884392839114e-07, + "loss": 0.001, + "step": 18779 + }, + { + "epoch": 0.36, + "learning_rate": 1.2726496058405498e-07, + "loss": 0.0006, + "step": 18780 + }, + { + "epoch": 0.36, + "learning_rate": 1.2726107723971883e-07, + "loss": 0.0009, + "step": 18781 + }, + { + "epoch": 0.36, + "learning_rate": 1.272571938953827e-07, + "loss": 0.7073, + "step": 18782 + }, + { + "epoch": 0.36, + "learning_rate": 1.2725331055104654e-07, + "loss": 0.0054, + "step": 18783 + }, + { + "epoch": 0.36, + "learning_rate": 1.2724942720671041e-07, + "loss": 0.001, + "step": 18784 + }, + { + "epoch": 0.36, + "learning_rate": 1.2724554386237426e-07, + "loss": 0.2981, + "step": 18785 + }, + { + "epoch": 0.36, + "learning_rate": 1.2724166051803813e-07, + "loss": 0.0008, + "step": 18786 + }, + { + "epoch": 0.36, + "learning_rate": 1.2723777717370198e-07, + "loss": 0.0008, + "step": 18787 + }, + { + "epoch": 0.36, + "learning_rate": 1.2723389382936585e-07, + "loss": 0.0007, + "step": 18788 + }, + { + "epoch": 0.36, + "learning_rate": 1.272300104850297e-07, + "loss": 0.4458, + "step": 18789 + }, + { + "epoch": 0.36, + "learning_rate": 1.2722612714069356e-07, + "loss": 0.0008, + "step": 18790 + }, + { + "epoch": 0.36, + "learning_rate": 1.272222437963574e-07, + "loss": 0.0105, + "step": 18791 + }, + { + "epoch": 0.36, + "learning_rate": 1.2721836045202128e-07, + "loss": 0.0008, + "step": 18792 + }, + { + "epoch": 0.36, + "learning_rate": 1.2721447710768512e-07, + "loss": 0.002, + "step": 18793 + }, + { + "epoch": 0.36, + "learning_rate": 1.27210593763349e-07, + "loss": 0.0007, + "step": 18794 + }, + { + "epoch": 0.36, + "learning_rate": 1.2720671041901284e-07, + "loss": 0.0011, + "step": 18795 + }, + { + "epoch": 0.36, + "learning_rate": 1.272028270746767e-07, + "loss": 0.0008, + "step": 18796 + }, + { + "epoch": 0.36, + "learning_rate": 1.2719894373034056e-07, + "loss": 0.0469, + "step": 18797 + }, + { + "epoch": 0.36, + "learning_rate": 1.2719506038600443e-07, + "loss": 0.2365, + "step": 18798 + }, + { + "epoch": 0.36, + "learning_rate": 1.2719117704166827e-07, + "loss": 0.0009, + "step": 18799 + }, + { + "epoch": 0.36, + "learning_rate": 1.2718729369733215e-07, + "loss": 0.0007, + "step": 18800 + }, + { + "epoch": 0.36, + "learning_rate": 1.27183410352996e-07, + "loss": 0.0012, + "step": 18801 + }, + { + "epoch": 0.36, + "learning_rate": 1.2717952700865986e-07, + "loss": 0.0009, + "step": 18802 + }, + { + "epoch": 0.36, + "learning_rate": 1.271756436643237e-07, + "loss": 0.5468, + "step": 18803 + }, + { + "epoch": 0.36, + "learning_rate": 1.2717176031998758e-07, + "loss": 0.0786, + "step": 18804 + }, + { + "epoch": 0.36, + "learning_rate": 1.2716787697565142e-07, + "loss": 0.0023, + "step": 18805 + }, + { + "epoch": 0.36, + "learning_rate": 1.271639936313153e-07, + "loss": 0.0013, + "step": 18806 + }, + { + "epoch": 0.36, + "learning_rate": 1.2716011028697914e-07, + "loss": 0.0025, + "step": 18807 + }, + { + "epoch": 0.36, + "learning_rate": 1.27156226942643e-07, + "loss": 0.0006, + "step": 18808 + }, + { + "epoch": 0.36, + "learning_rate": 1.2715234359830686e-07, + "loss": 0.0043, + "step": 18809 + }, + { + "epoch": 0.36, + "learning_rate": 1.2714846025397073e-07, + "loss": 0.0008, + "step": 18810 + }, + { + "epoch": 0.36, + "learning_rate": 1.2714457690963457e-07, + "loss": 0.0009, + "step": 18811 + }, + { + "epoch": 0.36, + "learning_rate": 1.2714069356529844e-07, + "loss": 0.0009, + "step": 18812 + }, + { + "epoch": 0.36, + "learning_rate": 1.2713681022096226e-07, + "loss": 0.0122, + "step": 18813 + }, + { + "epoch": 0.36, + "learning_rate": 1.2713292687662613e-07, + "loss": 0.1423, + "step": 18814 + }, + { + "epoch": 0.36, + "learning_rate": 1.2712904353228998e-07, + "loss": 0.0009, + "step": 18815 + }, + { + "epoch": 0.36, + "learning_rate": 1.2712516018795385e-07, + "loss": 0.3514, + "step": 18816 + }, + { + "epoch": 0.37, + "learning_rate": 1.271212768436177e-07, + "loss": 0.0007, + "step": 18817 + }, + { + "epoch": 0.37, + "learning_rate": 1.2711739349928157e-07, + "loss": 0.0008, + "step": 18818 + }, + { + "epoch": 0.37, + "learning_rate": 1.271135101549454e-07, + "loss": 0.0007, + "step": 18819 + }, + { + "epoch": 0.37, + "learning_rate": 1.2710962681060928e-07, + "loss": 0.0448, + "step": 18820 + }, + { + "epoch": 0.37, + "learning_rate": 1.2710574346627313e-07, + "loss": 0.0006, + "step": 18821 + }, + { + "epoch": 0.37, + "learning_rate": 1.27101860121937e-07, + "loss": 0.001, + "step": 18822 + }, + { + "epoch": 0.37, + "learning_rate": 1.2709797677760085e-07, + "loss": 0.2048, + "step": 18823 + }, + { + "epoch": 0.37, + "learning_rate": 1.2709409343326472e-07, + "loss": 0.0011, + "step": 18824 + }, + { + "epoch": 0.37, + "learning_rate": 1.2709021008892856e-07, + "loss": 0.0012, + "step": 18825 + }, + { + "epoch": 0.37, + "learning_rate": 1.2708632674459243e-07, + "loss": 0.001, + "step": 18826 + }, + { + "epoch": 0.37, + "learning_rate": 1.2708244340025628e-07, + "loss": 0.0012, + "step": 18827 + }, + { + "epoch": 0.37, + "learning_rate": 1.2707856005592015e-07, + "loss": 0.0008, + "step": 18828 + }, + { + "epoch": 0.37, + "learning_rate": 1.27074676711584e-07, + "loss": 0.0007, + "step": 18829 + }, + { + "epoch": 0.37, + "learning_rate": 1.2707079336724787e-07, + "loss": 0.001, + "step": 18830 + }, + { + "epoch": 0.37, + "learning_rate": 1.270669100229117e-07, + "loss": 0.2828, + "step": 18831 + }, + { + "epoch": 0.37, + "learning_rate": 1.2706302667857558e-07, + "loss": 0.0008, + "step": 18832 + }, + { + "epoch": 0.37, + "learning_rate": 1.2705914333423943e-07, + "loss": 0.0028, + "step": 18833 + }, + { + "epoch": 0.37, + "learning_rate": 1.270552599899033e-07, + "loss": 0.0014, + "step": 18834 + }, + { + "epoch": 0.37, + "learning_rate": 1.2705137664556714e-07, + "loss": 0.0015, + "step": 18835 + }, + { + "epoch": 0.37, + "learning_rate": 1.2704749330123102e-07, + "loss": 0.0022, + "step": 18836 + }, + { + "epoch": 0.37, + "learning_rate": 1.2704360995689486e-07, + "loss": 0.001, + "step": 18837 + }, + { + "epoch": 0.37, + "learning_rate": 1.2703972661255873e-07, + "loss": 0.001, + "step": 18838 + }, + { + "epoch": 0.37, + "learning_rate": 1.2703584326822258e-07, + "loss": 0.3537, + "step": 18839 + }, + { + "epoch": 0.37, + "learning_rate": 1.2703195992388645e-07, + "loss": 0.0019, + "step": 18840 + }, + { + "epoch": 0.37, + "learning_rate": 1.270280765795503e-07, + "loss": 0.0009, + "step": 18841 + }, + { + "epoch": 0.37, + "learning_rate": 1.2702419323521417e-07, + "loss": 0.0009, + "step": 18842 + }, + { + "epoch": 0.37, + "learning_rate": 1.27020309890878e-07, + "loss": 0.0009, + "step": 18843 + }, + { + "epoch": 0.37, + "learning_rate": 1.2701642654654188e-07, + "loss": 0.0017, + "step": 18844 + }, + { + "epoch": 0.37, + "learning_rate": 1.2701254320220573e-07, + "loss": 0.0017, + "step": 18845 + }, + { + "epoch": 0.37, + "learning_rate": 1.270086598578696e-07, + "loss": 0.0008, + "step": 18846 + }, + { + "epoch": 0.37, + "learning_rate": 1.2700477651353344e-07, + "loss": 0.0008, + "step": 18847 + }, + { + "epoch": 0.37, + "learning_rate": 1.2700089316919732e-07, + "loss": 0.5021, + "step": 18848 + }, + { + "epoch": 0.37, + "learning_rate": 1.2699700982486116e-07, + "loss": 0.001, + "step": 18849 + }, + { + "epoch": 0.37, + "learning_rate": 1.2699312648052503e-07, + "loss": 0.004, + "step": 18850 + }, + { + "epoch": 0.37, + "learning_rate": 1.2698924313618888e-07, + "loss": 0.0009, + "step": 18851 + }, + { + "epoch": 0.37, + "learning_rate": 1.2698535979185275e-07, + "loss": 0.0009, + "step": 18852 + }, + { + "epoch": 0.37, + "learning_rate": 1.269814764475166e-07, + "loss": 0.0009, + "step": 18853 + }, + { + "epoch": 0.37, + "learning_rate": 1.2697759310318046e-07, + "loss": 0.6412, + "step": 18854 + }, + { + "epoch": 0.37, + "learning_rate": 1.269737097588443e-07, + "loss": 0.0008, + "step": 18855 + }, + { + "epoch": 0.37, + "learning_rate": 1.2696982641450818e-07, + "loss": 0.0009, + "step": 18856 + }, + { + "epoch": 0.37, + "learning_rate": 1.2696594307017203e-07, + "loss": 0.0011, + "step": 18857 + }, + { + "epoch": 0.37, + "learning_rate": 1.269620597258359e-07, + "loss": 0.0124, + "step": 18858 + }, + { + "epoch": 0.37, + "learning_rate": 1.2695817638149974e-07, + "loss": 0.0961, + "step": 18859 + }, + { + "epoch": 0.37, + "learning_rate": 1.2695429303716361e-07, + "loss": 0.0015, + "step": 18860 + }, + { + "epoch": 0.37, + "learning_rate": 1.2695040969282746e-07, + "loss": 0.0011, + "step": 18861 + }, + { + "epoch": 0.37, + "learning_rate": 1.2694652634849133e-07, + "loss": 0.0011, + "step": 18862 + }, + { + "epoch": 0.37, + "learning_rate": 1.2694264300415518e-07, + "loss": 0.0008, + "step": 18863 + }, + { + "epoch": 0.37, + "learning_rate": 1.2693875965981905e-07, + "loss": 1.1687, + "step": 18864 + }, + { + "epoch": 0.37, + "learning_rate": 1.269348763154829e-07, + "loss": 0.0077, + "step": 18865 + }, + { + "epoch": 0.37, + "learning_rate": 1.2693099297114676e-07, + "loss": 0.001, + "step": 18866 + }, + { + "epoch": 0.37, + "learning_rate": 1.269271096268106e-07, + "loss": 0.0012, + "step": 18867 + }, + { + "epoch": 0.37, + "learning_rate": 1.2692322628247448e-07, + "loss": 0.0025, + "step": 18868 + }, + { + "epoch": 0.37, + "learning_rate": 1.2691934293813833e-07, + "loss": 0.0045, + "step": 18869 + }, + { + "epoch": 0.37, + "learning_rate": 1.269154595938022e-07, + "loss": 0.0009, + "step": 18870 + }, + { + "epoch": 0.37, + "learning_rate": 1.2691157624946602e-07, + "loss": 0.0008, + "step": 18871 + }, + { + "epoch": 0.37, + "learning_rate": 1.2690769290512989e-07, + "loss": 0.0006, + "step": 18872 + }, + { + "epoch": 0.37, + "learning_rate": 1.2690380956079373e-07, + "loss": 0.0009, + "step": 18873 + }, + { + "epoch": 0.37, + "learning_rate": 1.268999262164576e-07, + "loss": 0.0009, + "step": 18874 + }, + { + "epoch": 0.37, + "learning_rate": 1.2689604287212145e-07, + "loss": 0.0919, + "step": 18875 + }, + { + "epoch": 0.37, + "learning_rate": 1.2689215952778532e-07, + "loss": 0.0009, + "step": 18876 + }, + { + "epoch": 0.37, + "learning_rate": 1.2688827618344916e-07, + "loss": 0.0007, + "step": 18877 + }, + { + "epoch": 0.37, + "learning_rate": 1.2688439283911304e-07, + "loss": 0.0023, + "step": 18878 + }, + { + "epoch": 0.37, + "learning_rate": 1.2688050949477688e-07, + "loss": 0.0084, + "step": 18879 + }, + { + "epoch": 0.37, + "learning_rate": 1.2687662615044075e-07, + "loss": 0.001, + "step": 18880 + }, + { + "epoch": 0.37, + "learning_rate": 1.268727428061046e-07, + "loss": 0.0016, + "step": 18881 + }, + { + "epoch": 0.37, + "learning_rate": 1.2686885946176847e-07, + "loss": 0.001, + "step": 18882 + }, + { + "epoch": 0.37, + "learning_rate": 1.2686497611743231e-07, + "loss": 0.001, + "step": 18883 + }, + { + "epoch": 0.37, + "learning_rate": 1.2686109277309619e-07, + "loss": 0.0007, + "step": 18884 + }, + { + "epoch": 0.37, + "learning_rate": 1.2685720942876003e-07, + "loss": 0.0308, + "step": 18885 + }, + { + "epoch": 0.37, + "learning_rate": 1.268533260844239e-07, + "loss": 0.0047, + "step": 18886 + }, + { + "epoch": 0.37, + "learning_rate": 1.2684944274008775e-07, + "loss": 0.001, + "step": 18887 + }, + { + "epoch": 0.37, + "learning_rate": 1.2684555939575162e-07, + "loss": 0.0009, + "step": 18888 + }, + { + "epoch": 0.37, + "learning_rate": 1.2684167605141546e-07, + "loss": 0.0101, + "step": 18889 + }, + { + "epoch": 0.37, + "learning_rate": 1.2683779270707933e-07, + "loss": 0.0538, + "step": 18890 + }, + { + "epoch": 0.37, + "learning_rate": 1.2683390936274318e-07, + "loss": 0.0009, + "step": 18891 + }, + { + "epoch": 0.37, + "learning_rate": 1.2683002601840705e-07, + "loss": 0.0323, + "step": 18892 + }, + { + "epoch": 0.37, + "learning_rate": 1.268261426740709e-07, + "loss": 0.001, + "step": 18893 + }, + { + "epoch": 0.37, + "learning_rate": 1.2682225932973477e-07, + "loss": 0.001, + "step": 18894 + }, + { + "epoch": 0.37, + "learning_rate": 1.268183759853986e-07, + "loss": 0.0014, + "step": 18895 + }, + { + "epoch": 0.37, + "learning_rate": 1.2681449264106248e-07, + "loss": 0.0019, + "step": 18896 + }, + { + "epoch": 0.37, + "learning_rate": 1.2681060929672633e-07, + "loss": 0.0009, + "step": 18897 + }, + { + "epoch": 0.37, + "learning_rate": 1.268067259523902e-07, + "loss": 0.0012, + "step": 18898 + }, + { + "epoch": 0.37, + "learning_rate": 1.2680284260805405e-07, + "loss": 0.001, + "step": 18899 + }, + { + "epoch": 0.37, + "learning_rate": 1.2679895926371792e-07, + "loss": 0.0017, + "step": 18900 + }, + { + "epoch": 0.37, + "learning_rate": 1.2679507591938176e-07, + "loss": 0.001, + "step": 18901 + }, + { + "epoch": 0.37, + "learning_rate": 1.2679119257504563e-07, + "loss": 0.0007, + "step": 18902 + }, + { + "epoch": 0.37, + "learning_rate": 1.2678730923070948e-07, + "loss": 0.0009, + "step": 18903 + }, + { + "epoch": 0.37, + "learning_rate": 1.2678342588637335e-07, + "loss": 0.0123, + "step": 18904 + }, + { + "epoch": 0.37, + "learning_rate": 1.267795425420372e-07, + "loss": 0.0007, + "step": 18905 + }, + { + "epoch": 0.37, + "learning_rate": 1.2677565919770107e-07, + "loss": 0.0011, + "step": 18906 + }, + { + "epoch": 0.37, + "learning_rate": 1.267717758533649e-07, + "loss": 0.0007, + "step": 18907 + }, + { + "epoch": 0.37, + "learning_rate": 1.2676789250902878e-07, + "loss": 0.0008, + "step": 18908 + }, + { + "epoch": 0.37, + "learning_rate": 1.2676400916469263e-07, + "loss": 0.0009, + "step": 18909 + }, + { + "epoch": 0.37, + "learning_rate": 1.267601258203565e-07, + "loss": 0.001, + "step": 18910 + }, + { + "epoch": 0.37, + "learning_rate": 1.2675624247602034e-07, + "loss": 0.0035, + "step": 18911 + }, + { + "epoch": 0.37, + "learning_rate": 1.2675235913168422e-07, + "loss": 0.0008, + "step": 18912 + }, + { + "epoch": 0.37, + "learning_rate": 1.2674847578734806e-07, + "loss": 0.001, + "step": 18913 + }, + { + "epoch": 0.37, + "learning_rate": 1.2674459244301193e-07, + "loss": 0.0014, + "step": 18914 + }, + { + "epoch": 0.37, + "learning_rate": 1.2674070909867578e-07, + "loss": 0.0008, + "step": 18915 + }, + { + "epoch": 0.37, + "learning_rate": 1.2673682575433965e-07, + "loss": 0.0008, + "step": 18916 + }, + { + "epoch": 0.37, + "learning_rate": 1.267329424100035e-07, + "loss": 0.0008, + "step": 18917 + }, + { + "epoch": 0.37, + "learning_rate": 1.2672905906566737e-07, + "loss": 0.0007, + "step": 18918 + }, + { + "epoch": 0.37, + "learning_rate": 1.267251757213312e-07, + "loss": 0.0036, + "step": 18919 + }, + { + "epoch": 0.37, + "learning_rate": 1.2672129237699508e-07, + "loss": 0.0008, + "step": 18920 + }, + { + "epoch": 0.37, + "learning_rate": 1.2671740903265893e-07, + "loss": 0.0007, + "step": 18921 + }, + { + "epoch": 0.37, + "learning_rate": 1.267135256883228e-07, + "loss": 0.0008, + "step": 18922 + }, + { + "epoch": 0.37, + "learning_rate": 1.2670964234398664e-07, + "loss": 0.001, + "step": 18923 + }, + { + "epoch": 0.37, + "learning_rate": 1.2670575899965052e-07, + "loss": 0.0049, + "step": 18924 + }, + { + "epoch": 0.37, + "learning_rate": 1.2670187565531436e-07, + "loss": 0.0012, + "step": 18925 + }, + { + "epoch": 0.37, + "learning_rate": 1.2669799231097823e-07, + "loss": 0.6038, + "step": 18926 + }, + { + "epoch": 0.37, + "learning_rate": 1.2669410896664208e-07, + "loss": 0.0009, + "step": 18927 + }, + { + "epoch": 0.37, + "learning_rate": 1.2669022562230595e-07, + "loss": 0.0012, + "step": 18928 + }, + { + "epoch": 0.37, + "learning_rate": 1.2668634227796977e-07, + "loss": 0.0111, + "step": 18929 + }, + { + "epoch": 0.37, + "learning_rate": 1.2668245893363364e-07, + "loss": 0.0146, + "step": 18930 + }, + { + "epoch": 0.37, + "learning_rate": 1.2667857558929748e-07, + "loss": 0.0007, + "step": 18931 + }, + { + "epoch": 0.37, + "learning_rate": 1.2667469224496135e-07, + "loss": 0.0015, + "step": 18932 + }, + { + "epoch": 0.37, + "learning_rate": 1.266708089006252e-07, + "loss": 0.0013, + "step": 18933 + }, + { + "epoch": 0.37, + "learning_rate": 1.2666692555628907e-07, + "loss": 0.0011, + "step": 18934 + }, + { + "epoch": 0.37, + "learning_rate": 1.2666304221195292e-07, + "loss": 0.0014, + "step": 18935 + }, + { + "epoch": 0.37, + "learning_rate": 1.266591588676168e-07, + "loss": 0.0007, + "step": 18936 + }, + { + "epoch": 0.37, + "learning_rate": 1.2665527552328063e-07, + "loss": 0.0008, + "step": 18937 + }, + { + "epoch": 0.37, + "learning_rate": 1.266513921789445e-07, + "loss": 0.0008, + "step": 18938 + }, + { + "epoch": 0.37, + "learning_rate": 1.2664750883460835e-07, + "loss": 0.001, + "step": 18939 + }, + { + "epoch": 0.37, + "learning_rate": 1.2664362549027222e-07, + "loss": 0.0273, + "step": 18940 + }, + { + "epoch": 0.37, + "learning_rate": 1.2663974214593607e-07, + "loss": 0.0009, + "step": 18941 + }, + { + "epoch": 0.37, + "learning_rate": 1.2663585880159994e-07, + "loss": 0.0007, + "step": 18942 + }, + { + "epoch": 0.37, + "learning_rate": 1.2663197545726378e-07, + "loss": 0.0007, + "step": 18943 + }, + { + "epoch": 0.37, + "learning_rate": 1.2662809211292765e-07, + "loss": 0.0008, + "step": 18944 + }, + { + "epoch": 0.37, + "learning_rate": 1.266242087685915e-07, + "loss": 0.6347, + "step": 18945 + }, + { + "epoch": 0.37, + "learning_rate": 1.2662032542425537e-07, + "loss": 0.0031, + "step": 18946 + }, + { + "epoch": 0.37, + "learning_rate": 1.2661644207991922e-07, + "loss": 0.5337, + "step": 18947 + }, + { + "epoch": 0.37, + "learning_rate": 1.2661255873558309e-07, + "loss": 0.001, + "step": 18948 + }, + { + "epoch": 0.37, + "learning_rate": 1.2660867539124693e-07, + "loss": 0.0009, + "step": 18949 + }, + { + "epoch": 0.37, + "learning_rate": 1.266047920469108e-07, + "loss": 0.0018, + "step": 18950 + }, + { + "epoch": 0.37, + "learning_rate": 1.2660090870257465e-07, + "loss": 0.001, + "step": 18951 + }, + { + "epoch": 0.37, + "learning_rate": 1.2659702535823852e-07, + "loss": 0.001, + "step": 18952 + }, + { + "epoch": 0.37, + "learning_rate": 1.2659314201390236e-07, + "loss": 0.001, + "step": 18953 + }, + { + "epoch": 0.37, + "learning_rate": 1.2658925866956624e-07, + "loss": 0.0012, + "step": 18954 + }, + { + "epoch": 0.37, + "learning_rate": 1.2658537532523008e-07, + "loss": 0.0007, + "step": 18955 + }, + { + "epoch": 0.37, + "learning_rate": 1.2658149198089395e-07, + "loss": 0.0045, + "step": 18956 + }, + { + "epoch": 0.37, + "learning_rate": 1.265776086365578e-07, + "loss": 0.0007, + "step": 18957 + }, + { + "epoch": 0.37, + "learning_rate": 1.2657372529222164e-07, + "loss": 0.0006, + "step": 18958 + }, + { + "epoch": 0.37, + "learning_rate": 1.2656984194788551e-07, + "loss": 0.0007, + "step": 18959 + }, + { + "epoch": 0.37, + "learning_rate": 1.2656595860354936e-07, + "loss": 0.0031, + "step": 18960 + }, + { + "epoch": 0.37, + "learning_rate": 1.2656207525921323e-07, + "loss": 0.0009, + "step": 18961 + }, + { + "epoch": 0.37, + "learning_rate": 1.2655819191487708e-07, + "loss": 0.001, + "step": 18962 + }, + { + "epoch": 0.37, + "learning_rate": 1.2655430857054095e-07, + "loss": 0.0009, + "step": 18963 + }, + { + "epoch": 0.37, + "learning_rate": 1.265504252262048e-07, + "loss": 0.0009, + "step": 18964 + }, + { + "epoch": 0.37, + "learning_rate": 1.2654654188186866e-07, + "loss": 0.0008, + "step": 18965 + }, + { + "epoch": 0.37, + "learning_rate": 1.265426585375325e-07, + "loss": 0.001, + "step": 18966 + }, + { + "epoch": 0.37, + "learning_rate": 1.2653877519319638e-07, + "loss": 0.2265, + "step": 18967 + }, + { + "epoch": 0.37, + "learning_rate": 1.2653489184886023e-07, + "loss": 0.0008, + "step": 18968 + }, + { + "epoch": 0.37, + "learning_rate": 1.265310085045241e-07, + "loss": 0.0014, + "step": 18969 + }, + { + "epoch": 0.37, + "learning_rate": 1.2652712516018794e-07, + "loss": 0.0006, + "step": 18970 + }, + { + "epoch": 0.37, + "learning_rate": 1.265232418158518e-07, + "loss": 0.001, + "step": 18971 + }, + { + "epoch": 0.37, + "learning_rate": 1.2651935847151566e-07, + "loss": 0.0014, + "step": 18972 + }, + { + "epoch": 0.37, + "learning_rate": 1.2651547512717953e-07, + "loss": 0.0009, + "step": 18973 + }, + { + "epoch": 0.37, + "learning_rate": 1.2651159178284337e-07, + "loss": 0.0101, + "step": 18974 + }, + { + "epoch": 0.37, + "learning_rate": 1.2650770843850725e-07, + "loss": 0.0006, + "step": 18975 + }, + { + "epoch": 0.37, + "learning_rate": 1.265038250941711e-07, + "loss": 0.0008, + "step": 18976 + }, + { + "epoch": 0.37, + "learning_rate": 1.2649994174983496e-07, + "loss": 0.0031, + "step": 18977 + }, + { + "epoch": 0.37, + "learning_rate": 1.264960584054988e-07, + "loss": 1.072, + "step": 18978 + }, + { + "epoch": 0.37, + "learning_rate": 1.2649217506116268e-07, + "loss": 0.0008, + "step": 18979 + }, + { + "epoch": 0.37, + "learning_rate": 1.2648829171682652e-07, + "loss": 0.0006, + "step": 18980 + }, + { + "epoch": 0.37, + "learning_rate": 1.264844083724904e-07, + "loss": 0.7705, + "step": 18981 + }, + { + "epoch": 0.37, + "learning_rate": 1.2648052502815424e-07, + "loss": 0.0006, + "step": 18982 + }, + { + "epoch": 0.37, + "learning_rate": 1.264766416838181e-07, + "loss": 0.0007, + "step": 18983 + }, + { + "epoch": 0.37, + "learning_rate": 1.2647275833948196e-07, + "loss": 0.0011, + "step": 18984 + }, + { + "epoch": 0.37, + "learning_rate": 1.2646887499514583e-07, + "loss": 0.0007, + "step": 18985 + }, + { + "epoch": 0.37, + "learning_rate": 1.2646499165080967e-07, + "loss": 0.487, + "step": 18986 + }, + { + "epoch": 0.37, + "learning_rate": 1.2646110830647352e-07, + "loss": 0.0012, + "step": 18987 + }, + { + "epoch": 0.37, + "learning_rate": 1.2645722496213736e-07, + "loss": 0.0007, + "step": 18988 + }, + { + "epoch": 0.37, + "learning_rate": 1.2645334161780124e-07, + "loss": 0.0017, + "step": 18989 + }, + { + "epoch": 0.37, + "learning_rate": 1.2644945827346508e-07, + "loss": 0.0342, + "step": 18990 + }, + { + "epoch": 0.37, + "learning_rate": 1.2644557492912895e-07, + "loss": 0.0007, + "step": 18991 + }, + { + "epoch": 0.37, + "learning_rate": 1.264416915847928e-07, + "loss": 0.0008, + "step": 18992 + }, + { + "epoch": 0.37, + "learning_rate": 1.2643780824045667e-07, + "loss": 0.0009, + "step": 18993 + }, + { + "epoch": 0.37, + "learning_rate": 1.264339248961205e-07, + "loss": 0.0009, + "step": 18994 + }, + { + "epoch": 0.37, + "learning_rate": 1.2643004155178438e-07, + "loss": 0.0009, + "step": 18995 + }, + { + "epoch": 0.37, + "learning_rate": 1.2642615820744823e-07, + "loss": 0.3962, + "step": 18996 + }, + { + "epoch": 0.37, + "learning_rate": 1.264222748631121e-07, + "loss": 0.0009, + "step": 18997 + }, + { + "epoch": 0.37, + "learning_rate": 1.2641839151877595e-07, + "loss": 0.0009, + "step": 18998 + }, + { + "epoch": 0.37, + "learning_rate": 1.2641450817443982e-07, + "loss": 0.001, + "step": 18999 + }, + { + "epoch": 0.37, + "learning_rate": 1.2641062483010366e-07, + "loss": 0.0008, + "step": 19000 + }, + { + "epoch": 0.37, + "learning_rate": 1.2640674148576753e-07, + "loss": 0.1435, + "step": 19001 + }, + { + "epoch": 0.37, + "learning_rate": 1.2640285814143138e-07, + "loss": 0.0008, + "step": 19002 + }, + { + "epoch": 0.37, + "learning_rate": 1.2639897479709525e-07, + "loss": 0.0007, + "step": 19003 + }, + { + "epoch": 0.37, + "learning_rate": 1.263950914527591e-07, + "loss": 0.6378, + "step": 19004 + }, + { + "epoch": 0.37, + "learning_rate": 1.2639120810842297e-07, + "loss": 0.0006, + "step": 19005 + }, + { + "epoch": 0.37, + "learning_rate": 1.263873247640868e-07, + "loss": 0.0009, + "step": 19006 + }, + { + "epoch": 0.37, + "learning_rate": 1.2638344141975068e-07, + "loss": 0.0008, + "step": 19007 + }, + { + "epoch": 0.37, + "learning_rate": 1.2637955807541453e-07, + "loss": 0.001, + "step": 19008 + }, + { + "epoch": 0.37, + "learning_rate": 1.263756747310784e-07, + "loss": 0.0009, + "step": 19009 + }, + { + "epoch": 0.37, + "learning_rate": 1.2637179138674224e-07, + "loss": 0.4221, + "step": 19010 + }, + { + "epoch": 0.37, + "learning_rate": 1.2636790804240612e-07, + "loss": 0.0016, + "step": 19011 + }, + { + "epoch": 0.37, + "learning_rate": 1.2636402469806996e-07, + "loss": 0.0007, + "step": 19012 + }, + { + "epoch": 0.37, + "learning_rate": 1.2636014135373383e-07, + "loss": 0.6908, + "step": 19013 + }, + { + "epoch": 0.37, + "learning_rate": 1.2635625800939768e-07, + "loss": 0.0007, + "step": 19014 + }, + { + "epoch": 0.37, + "learning_rate": 1.2635237466506155e-07, + "loss": 0.0011, + "step": 19015 + }, + { + "epoch": 0.37, + "learning_rate": 1.263484913207254e-07, + "loss": 0.001, + "step": 19016 + }, + { + "epoch": 0.37, + "learning_rate": 1.2634460797638927e-07, + "loss": 0.0009, + "step": 19017 + }, + { + "epoch": 0.37, + "learning_rate": 1.263407246320531e-07, + "loss": 0.0026, + "step": 19018 + }, + { + "epoch": 0.37, + "learning_rate": 1.2633684128771698e-07, + "loss": 0.0009, + "step": 19019 + }, + { + "epoch": 0.37, + "learning_rate": 1.2633295794338083e-07, + "loss": 0.0006, + "step": 19020 + }, + { + "epoch": 0.37, + "learning_rate": 1.263290745990447e-07, + "loss": 0.0013, + "step": 19021 + }, + { + "epoch": 0.37, + "learning_rate": 1.2632519125470854e-07, + "loss": 0.0008, + "step": 19022 + }, + { + "epoch": 0.37, + "learning_rate": 1.2632130791037242e-07, + "loss": 0.0139, + "step": 19023 + }, + { + "epoch": 0.37, + "learning_rate": 1.2631742456603626e-07, + "loss": 0.0008, + "step": 19024 + }, + { + "epoch": 0.37, + "learning_rate": 1.2631354122170013e-07, + "loss": 0.0007, + "step": 19025 + }, + { + "epoch": 0.37, + "learning_rate": 1.2630965787736398e-07, + "loss": 0.0022, + "step": 19026 + }, + { + "epoch": 0.37, + "learning_rate": 1.2630577453302785e-07, + "loss": 0.0009, + "step": 19027 + }, + { + "epoch": 0.37, + "learning_rate": 1.263018911886917e-07, + "loss": 0.0006, + "step": 19028 + }, + { + "epoch": 0.37, + "learning_rate": 1.2629800784435556e-07, + "loss": 0.0007, + "step": 19029 + }, + { + "epoch": 0.37, + "learning_rate": 1.262941245000194e-07, + "loss": 0.001, + "step": 19030 + }, + { + "epoch": 0.37, + "learning_rate": 1.2629024115568328e-07, + "loss": 0.0006, + "step": 19031 + }, + { + "epoch": 0.37, + "learning_rate": 1.2628635781134713e-07, + "loss": 0.0008, + "step": 19032 + }, + { + "epoch": 0.37, + "learning_rate": 1.26282474467011e-07, + "loss": 0.0008, + "step": 19033 + }, + { + "epoch": 0.37, + "learning_rate": 1.2627859112267484e-07, + "loss": 0.0008, + "step": 19034 + }, + { + "epoch": 0.37, + "learning_rate": 1.2627470777833871e-07, + "loss": 0.0009, + "step": 19035 + }, + { + "epoch": 0.37, + "learning_rate": 1.2627082443400256e-07, + "loss": 0.0017, + "step": 19036 + }, + { + "epoch": 0.37, + "learning_rate": 1.2626694108966643e-07, + "loss": 0.0008, + "step": 19037 + }, + { + "epoch": 0.37, + "learning_rate": 1.2626305774533028e-07, + "loss": 0.0015, + "step": 19038 + }, + { + "epoch": 0.37, + "learning_rate": 1.2625917440099415e-07, + "loss": 0.0008, + "step": 19039 + }, + { + "epoch": 0.37, + "learning_rate": 1.26255291056658e-07, + "loss": 0.0016, + "step": 19040 + }, + { + "epoch": 0.37, + "learning_rate": 1.2625140771232186e-07, + "loss": 0.0009, + "step": 19041 + }, + { + "epoch": 0.37, + "learning_rate": 1.262475243679857e-07, + "loss": 1.2375, + "step": 19042 + }, + { + "epoch": 0.37, + "learning_rate": 1.2624364102364958e-07, + "loss": 0.0008, + "step": 19043 + }, + { + "epoch": 0.37, + "learning_rate": 1.2623975767931343e-07, + "loss": 0.0011, + "step": 19044 + }, + { + "epoch": 0.37, + "learning_rate": 1.2623587433497727e-07, + "loss": 0.001, + "step": 19045 + }, + { + "epoch": 0.37, + "learning_rate": 1.2623199099064112e-07, + "loss": 0.0008, + "step": 19046 + }, + { + "epoch": 0.37, + "learning_rate": 1.2622810764630499e-07, + "loss": 0.0014, + "step": 19047 + }, + { + "epoch": 0.37, + "learning_rate": 1.2622422430196883e-07, + "loss": 0.0007, + "step": 19048 + }, + { + "epoch": 0.37, + "learning_rate": 1.262203409576327e-07, + "loss": 0.0008, + "step": 19049 + }, + { + "epoch": 0.37, + "learning_rate": 1.2621645761329655e-07, + "loss": 0.7243, + "step": 19050 + }, + { + "epoch": 0.37, + "learning_rate": 1.2621257426896042e-07, + "loss": 0.0015, + "step": 19051 + }, + { + "epoch": 0.37, + "learning_rate": 1.2620869092462426e-07, + "loss": 0.0016, + "step": 19052 + }, + { + "epoch": 0.37, + "learning_rate": 1.2620480758028814e-07, + "loss": 0.1773, + "step": 19053 + }, + { + "epoch": 0.37, + "learning_rate": 1.2620092423595198e-07, + "loss": 0.0006, + "step": 19054 + }, + { + "epoch": 0.37, + "learning_rate": 1.2619704089161585e-07, + "loss": 0.0009, + "step": 19055 + }, + { + "epoch": 0.37, + "learning_rate": 1.261931575472797e-07, + "loss": 0.0007, + "step": 19056 + }, + { + "epoch": 0.37, + "learning_rate": 1.2618927420294357e-07, + "loss": 0.0006, + "step": 19057 + }, + { + "epoch": 0.37, + "learning_rate": 1.2618539085860741e-07, + "loss": 0.0012, + "step": 19058 + }, + { + "epoch": 0.37, + "learning_rate": 1.2618150751427129e-07, + "loss": 0.6168, + "step": 19059 + }, + { + "epoch": 0.37, + "learning_rate": 1.2617762416993513e-07, + "loss": 0.0009, + "step": 19060 + }, + { + "epoch": 0.37, + "learning_rate": 1.26173740825599e-07, + "loss": 0.0012, + "step": 19061 + }, + { + "epoch": 0.37, + "learning_rate": 1.2616985748126285e-07, + "loss": 0.2245, + "step": 19062 + }, + { + "epoch": 0.37, + "learning_rate": 1.2616597413692672e-07, + "loss": 0.001, + "step": 19063 + }, + { + "epoch": 0.37, + "learning_rate": 1.2616209079259056e-07, + "loss": 0.0007, + "step": 19064 + }, + { + "epoch": 0.37, + "learning_rate": 1.2615820744825444e-07, + "loss": 0.0009, + "step": 19065 + }, + { + "epoch": 0.37, + "learning_rate": 1.2615432410391828e-07, + "loss": 0.0006, + "step": 19066 + }, + { + "epoch": 0.37, + "learning_rate": 1.2615044075958215e-07, + "loss": 0.0008, + "step": 19067 + }, + { + "epoch": 0.37, + "learning_rate": 1.26146557415246e-07, + "loss": 0.0097, + "step": 19068 + }, + { + "epoch": 0.37, + "learning_rate": 1.2614267407090987e-07, + "loss": 0.0007, + "step": 19069 + }, + { + "epoch": 0.37, + "learning_rate": 1.261387907265737e-07, + "loss": 0.0009, + "step": 19070 + }, + { + "epoch": 0.37, + "learning_rate": 1.2613490738223758e-07, + "loss": 0.0007, + "step": 19071 + }, + { + "epoch": 0.37, + "learning_rate": 1.2613102403790143e-07, + "loss": 0.0041, + "step": 19072 + }, + { + "epoch": 0.37, + "learning_rate": 1.261271406935653e-07, + "loss": 0.034, + "step": 19073 + }, + { + "epoch": 0.37, + "learning_rate": 1.2612325734922915e-07, + "loss": 0.0008, + "step": 19074 + }, + { + "epoch": 0.37, + "learning_rate": 1.2611937400489302e-07, + "loss": 0.0011, + "step": 19075 + }, + { + "epoch": 0.37, + "learning_rate": 1.2611549066055686e-07, + "loss": 0.0019, + "step": 19076 + }, + { + "epoch": 0.37, + "learning_rate": 1.2611160731622073e-07, + "loss": 0.001, + "step": 19077 + }, + { + "epoch": 0.37, + "learning_rate": 1.2610772397188458e-07, + "loss": 0.0008, + "step": 19078 + }, + { + "epoch": 0.37, + "learning_rate": 1.2610384062754845e-07, + "loss": 0.0132, + "step": 19079 + }, + { + "epoch": 0.37, + "learning_rate": 1.260999572832123e-07, + "loss": 0.0071, + "step": 19080 + }, + { + "epoch": 0.37, + "learning_rate": 1.2609607393887617e-07, + "loss": 0.0008, + "step": 19081 + }, + { + "epoch": 0.37, + "learning_rate": 1.2609219059454e-07, + "loss": 0.0006, + "step": 19082 + }, + { + "epoch": 0.37, + "learning_rate": 1.2608830725020388e-07, + "loss": 0.0008, + "step": 19083 + }, + { + "epoch": 0.37, + "learning_rate": 1.2608442390586773e-07, + "loss": 0.0011, + "step": 19084 + }, + { + "epoch": 0.37, + "learning_rate": 1.260805405615316e-07, + "loss": 0.001, + "step": 19085 + }, + { + "epoch": 0.37, + "learning_rate": 1.2607665721719544e-07, + "loss": 0.001, + "step": 19086 + }, + { + "epoch": 0.37, + "learning_rate": 1.2607277387285932e-07, + "loss": 1.0853, + "step": 19087 + }, + { + "epoch": 0.37, + "learning_rate": 1.2606889052852316e-07, + "loss": 0.0009, + "step": 19088 + }, + { + "epoch": 0.37, + "learning_rate": 1.2606500718418703e-07, + "loss": 0.0007, + "step": 19089 + }, + { + "epoch": 0.37, + "learning_rate": 1.2606112383985088e-07, + "loss": 0.0011, + "step": 19090 + }, + { + "epoch": 0.37, + "learning_rate": 1.2605724049551475e-07, + "loss": 0.0007, + "step": 19091 + }, + { + "epoch": 0.37, + "learning_rate": 1.260533571511786e-07, + "loss": 0.0007, + "step": 19092 + }, + { + "epoch": 0.37, + "learning_rate": 1.2604947380684247e-07, + "loss": 0.7322, + "step": 19093 + }, + { + "epoch": 0.37, + "learning_rate": 1.260455904625063e-07, + "loss": 0.0894, + "step": 19094 + }, + { + "epoch": 0.37, + "learning_rate": 1.2604170711817018e-07, + "loss": 0.0602, + "step": 19095 + }, + { + "epoch": 0.37, + "learning_rate": 1.2603782377383403e-07, + "loss": 0.0006, + "step": 19096 + }, + { + "epoch": 0.37, + "learning_rate": 1.260339404294979e-07, + "loss": 0.0008, + "step": 19097 + }, + { + "epoch": 0.37, + "learning_rate": 1.2603005708516174e-07, + "loss": 0.0008, + "step": 19098 + }, + { + "epoch": 0.37, + "learning_rate": 1.2602617374082562e-07, + "loss": 0.0012, + "step": 19099 + }, + { + "epoch": 0.37, + "learning_rate": 1.2602229039648946e-07, + "loss": 0.0008, + "step": 19100 + }, + { + "epoch": 0.37, + "learning_rate": 1.2601840705215333e-07, + "loss": 0.0005, + "step": 19101 + }, + { + "epoch": 0.37, + "learning_rate": 1.2601452370781718e-07, + "loss": 0.0008, + "step": 19102 + }, + { + "epoch": 0.37, + "learning_rate": 1.2601064036348102e-07, + "loss": 0.0028, + "step": 19103 + }, + { + "epoch": 0.37, + "learning_rate": 1.2600675701914487e-07, + "loss": 0.001, + "step": 19104 + }, + { + "epoch": 0.37, + "learning_rate": 1.2600287367480874e-07, + "loss": 0.0011, + "step": 19105 + }, + { + "epoch": 0.37, + "learning_rate": 1.2599899033047258e-07, + "loss": 0.0011, + "step": 19106 + }, + { + "epoch": 0.37, + "learning_rate": 1.2599510698613645e-07, + "loss": 0.001, + "step": 19107 + }, + { + "epoch": 0.37, + "learning_rate": 1.259912236418003e-07, + "loss": 0.0016, + "step": 19108 + }, + { + "epoch": 0.37, + "learning_rate": 1.2598734029746417e-07, + "loss": 0.0007, + "step": 19109 + }, + { + "epoch": 0.37, + "learning_rate": 1.2598345695312802e-07, + "loss": 0.0007, + "step": 19110 + }, + { + "epoch": 0.37, + "learning_rate": 1.259795736087919e-07, + "loss": 0.0042, + "step": 19111 + }, + { + "epoch": 0.37, + "learning_rate": 1.2597569026445573e-07, + "loss": 0.7422, + "step": 19112 + }, + { + "epoch": 0.37, + "learning_rate": 1.259718069201196e-07, + "loss": 0.0011, + "step": 19113 + }, + { + "epoch": 0.37, + "learning_rate": 1.2596792357578345e-07, + "loss": 0.0009, + "step": 19114 + }, + { + "epoch": 0.37, + "learning_rate": 1.2596404023144732e-07, + "loss": 0.0011, + "step": 19115 + }, + { + "epoch": 0.37, + "learning_rate": 1.2596015688711117e-07, + "loss": 0.6087, + "step": 19116 + }, + { + "epoch": 0.37, + "learning_rate": 1.2595627354277504e-07, + "loss": 0.0007, + "step": 19117 + }, + { + "epoch": 0.37, + "learning_rate": 1.2595239019843888e-07, + "loss": 0.0012, + "step": 19118 + }, + { + "epoch": 0.37, + "learning_rate": 1.2594850685410275e-07, + "loss": 0.0037, + "step": 19119 + }, + { + "epoch": 0.37, + "learning_rate": 1.259446235097666e-07, + "loss": 0.0042, + "step": 19120 + }, + { + "epoch": 0.37, + "learning_rate": 1.2594074016543047e-07, + "loss": 0.0073, + "step": 19121 + }, + { + "epoch": 0.37, + "learning_rate": 1.2593685682109432e-07, + "loss": 0.0008, + "step": 19122 + }, + { + "epoch": 0.37, + "learning_rate": 1.259329734767582e-07, + "loss": 0.0007, + "step": 19123 + }, + { + "epoch": 0.37, + "learning_rate": 1.2592909013242203e-07, + "loss": 0.0009, + "step": 19124 + }, + { + "epoch": 0.37, + "learning_rate": 1.259252067880859e-07, + "loss": 0.0008, + "step": 19125 + }, + { + "epoch": 0.37, + "learning_rate": 1.2592132344374975e-07, + "loss": 0.0027, + "step": 19126 + }, + { + "epoch": 0.37, + "learning_rate": 1.2591744009941362e-07, + "loss": 0.0011, + "step": 19127 + }, + { + "epoch": 0.37, + "learning_rate": 1.2591355675507746e-07, + "loss": 0.0183, + "step": 19128 + }, + { + "epoch": 0.37, + "learning_rate": 1.2590967341074134e-07, + "loss": 0.0008, + "step": 19129 + }, + { + "epoch": 0.37, + "learning_rate": 1.2590579006640518e-07, + "loss": 0.0031, + "step": 19130 + }, + { + "epoch": 0.37, + "learning_rate": 1.2590190672206905e-07, + "loss": 0.0009, + "step": 19131 + }, + { + "epoch": 0.37, + "learning_rate": 1.258980233777329e-07, + "loss": 0.0008, + "step": 19132 + }, + { + "epoch": 0.37, + "learning_rate": 1.2589414003339677e-07, + "loss": 0.0012, + "step": 19133 + }, + { + "epoch": 0.37, + "learning_rate": 1.2589025668906061e-07, + "loss": 0.8867, + "step": 19134 + }, + { + "epoch": 0.37, + "learning_rate": 1.2588637334472446e-07, + "loss": 1.0446, + "step": 19135 + }, + { + "epoch": 0.37, + "learning_rate": 1.2588249000038833e-07, + "loss": 0.001, + "step": 19136 + }, + { + "epoch": 0.37, + "learning_rate": 1.2587860665605218e-07, + "loss": 0.0009, + "step": 19137 + }, + { + "epoch": 0.37, + "learning_rate": 1.2587472331171605e-07, + "loss": 0.0012, + "step": 19138 + }, + { + "epoch": 0.37, + "learning_rate": 1.258708399673799e-07, + "loss": 0.8644, + "step": 19139 + }, + { + "epoch": 0.37, + "learning_rate": 1.2586695662304376e-07, + "loss": 0.001, + "step": 19140 + }, + { + "epoch": 0.37, + "learning_rate": 1.258630732787076e-07, + "loss": 0.0007, + "step": 19141 + }, + { + "epoch": 0.37, + "learning_rate": 1.2585918993437148e-07, + "loss": 0.0013, + "step": 19142 + }, + { + "epoch": 0.37, + "learning_rate": 1.2585530659003533e-07, + "loss": 0.0419, + "step": 19143 + }, + { + "epoch": 0.37, + "learning_rate": 1.258514232456992e-07, + "loss": 0.5089, + "step": 19144 + }, + { + "epoch": 0.37, + "learning_rate": 1.2584753990136304e-07, + "loss": 0.0009, + "step": 19145 + }, + { + "epoch": 0.37, + "learning_rate": 1.258436565570269e-07, + "loss": 0.0006, + "step": 19146 + }, + { + "epoch": 0.37, + "learning_rate": 1.2583977321269076e-07, + "loss": 0.0008, + "step": 19147 + }, + { + "epoch": 0.37, + "learning_rate": 1.2583588986835463e-07, + "loss": 0.0009, + "step": 19148 + }, + { + "epoch": 0.37, + "learning_rate": 1.2583200652401847e-07, + "loss": 0.428, + "step": 19149 + }, + { + "epoch": 0.37, + "learning_rate": 1.2582812317968235e-07, + "loss": 0.001, + "step": 19150 + }, + { + "epoch": 0.37, + "learning_rate": 1.258242398353462e-07, + "loss": 0.0011, + "step": 19151 + }, + { + "epoch": 0.37, + "learning_rate": 1.2582035649101006e-07, + "loss": 0.0007, + "step": 19152 + }, + { + "epoch": 0.37, + "learning_rate": 1.258164731466739e-07, + "loss": 0.0011, + "step": 19153 + }, + { + "epoch": 0.37, + "learning_rate": 1.2581258980233778e-07, + "loss": 0.0015, + "step": 19154 + }, + { + "epoch": 0.37, + "learning_rate": 1.2580870645800162e-07, + "loss": 0.001, + "step": 19155 + }, + { + "epoch": 0.37, + "learning_rate": 1.258048231136655e-07, + "loss": 0.0011, + "step": 19156 + }, + { + "epoch": 0.37, + "learning_rate": 1.2580093976932934e-07, + "loss": 0.0013, + "step": 19157 + }, + { + "epoch": 0.37, + "learning_rate": 1.257970564249932e-07, + "loss": 0.0007, + "step": 19158 + }, + { + "epoch": 0.37, + "learning_rate": 1.2579317308065706e-07, + "loss": 0.1048, + "step": 19159 + }, + { + "epoch": 0.37, + "learning_rate": 1.2578928973632093e-07, + "loss": 0.0009, + "step": 19160 + }, + { + "epoch": 0.37, + "learning_rate": 1.2578540639198477e-07, + "loss": 0.001, + "step": 19161 + }, + { + "epoch": 0.37, + "learning_rate": 1.2578152304764862e-07, + "loss": 0.0008, + "step": 19162 + }, + { + "epoch": 0.37, + "learning_rate": 1.257776397033125e-07, + "loss": 0.0009, + "step": 19163 + }, + { + "epoch": 0.37, + "learning_rate": 1.2577375635897634e-07, + "loss": 0.0008, + "step": 19164 + }, + { + "epoch": 0.37, + "learning_rate": 1.2576987301464018e-07, + "loss": 0.0007, + "step": 19165 + }, + { + "epoch": 0.37, + "learning_rate": 1.2576598967030405e-07, + "loss": 0.0189, + "step": 19166 + }, + { + "epoch": 0.37, + "learning_rate": 1.257621063259679e-07, + "loss": 0.0012, + "step": 19167 + }, + { + "epoch": 0.37, + "learning_rate": 1.2575822298163177e-07, + "loss": 0.0008, + "step": 19168 + }, + { + "epoch": 0.37, + "learning_rate": 1.257543396372956e-07, + "loss": 0.0013, + "step": 19169 + }, + { + "epoch": 0.37, + "learning_rate": 1.2575045629295948e-07, + "loss": 0.005, + "step": 19170 + }, + { + "epoch": 0.37, + "learning_rate": 1.2574657294862333e-07, + "loss": 0.0011, + "step": 19171 + }, + { + "epoch": 0.37, + "learning_rate": 1.257426896042872e-07, + "loss": 0.0008, + "step": 19172 + }, + { + "epoch": 0.37, + "learning_rate": 1.2573880625995105e-07, + "loss": 0.0011, + "step": 19173 + }, + { + "epoch": 0.37, + "learning_rate": 1.2573492291561492e-07, + "loss": 0.0007, + "step": 19174 + }, + { + "epoch": 0.37, + "learning_rate": 1.2573103957127876e-07, + "loss": 0.001, + "step": 19175 + }, + { + "epoch": 0.37, + "learning_rate": 1.2572715622694263e-07, + "loss": 0.0008, + "step": 19176 + }, + { + "epoch": 0.37, + "learning_rate": 1.2572327288260648e-07, + "loss": 0.0008, + "step": 19177 + }, + { + "epoch": 0.37, + "learning_rate": 1.2571938953827035e-07, + "loss": 0.1039, + "step": 19178 + }, + { + "epoch": 0.37, + "learning_rate": 1.257155061939342e-07, + "loss": 0.0017, + "step": 19179 + }, + { + "epoch": 0.37, + "learning_rate": 1.2571162284959807e-07, + "loss": 0.0008, + "step": 19180 + }, + { + "epoch": 0.37, + "learning_rate": 1.257077395052619e-07, + "loss": 0.0008, + "step": 19181 + }, + { + "epoch": 0.37, + "learning_rate": 1.2570385616092578e-07, + "loss": 0.0017, + "step": 19182 + }, + { + "epoch": 0.37, + "learning_rate": 1.2569997281658963e-07, + "loss": 0.0009, + "step": 19183 + }, + { + "epoch": 0.37, + "learning_rate": 1.256960894722535e-07, + "loss": 0.3668, + "step": 19184 + }, + { + "epoch": 0.37, + "learning_rate": 1.2569220612791735e-07, + "loss": 0.0014, + "step": 19185 + }, + { + "epoch": 0.37, + "learning_rate": 1.2568832278358122e-07, + "loss": 0.0008, + "step": 19186 + }, + { + "epoch": 0.37, + "learning_rate": 1.2568443943924506e-07, + "loss": 0.0005, + "step": 19187 + }, + { + "epoch": 0.37, + "learning_rate": 1.2568055609490893e-07, + "loss": 0.0015, + "step": 19188 + }, + { + "epoch": 0.37, + "learning_rate": 1.2567667275057278e-07, + "loss": 0.0011, + "step": 19189 + }, + { + "epoch": 0.37, + "learning_rate": 1.2567278940623665e-07, + "loss": 0.0011, + "step": 19190 + }, + { + "epoch": 0.37, + "learning_rate": 1.256689060619005e-07, + "loss": 0.0009, + "step": 19191 + }, + { + "epoch": 0.37, + "learning_rate": 1.2566502271756437e-07, + "loss": 0.0009, + "step": 19192 + }, + { + "epoch": 0.37, + "learning_rate": 1.256611393732282e-07, + "loss": 0.008, + "step": 19193 + }, + { + "epoch": 0.37, + "learning_rate": 1.2565725602889208e-07, + "loss": 0.0025, + "step": 19194 + }, + { + "epoch": 0.37, + "learning_rate": 1.2565337268455593e-07, + "loss": 0.0008, + "step": 19195 + }, + { + "epoch": 0.37, + "learning_rate": 1.256494893402198e-07, + "loss": 0.0008, + "step": 19196 + }, + { + "epoch": 0.37, + "learning_rate": 1.2564560599588364e-07, + "loss": 0.0006, + "step": 19197 + }, + { + "epoch": 0.37, + "learning_rate": 1.2564172265154752e-07, + "loss": 0.0007, + "step": 19198 + }, + { + "epoch": 0.37, + "learning_rate": 1.2563783930721136e-07, + "loss": 0.001, + "step": 19199 + }, + { + "epoch": 0.37, + "learning_rate": 1.2563395596287523e-07, + "loss": 0.0007, + "step": 19200 + }, + { + "epoch": 0.37, + "learning_rate": 1.2563007261853908e-07, + "loss": 0.0425, + "step": 19201 + }, + { + "epoch": 0.37, + "learning_rate": 1.2562618927420295e-07, + "loss": 0.0006, + "step": 19202 + }, + { + "epoch": 0.37, + "learning_rate": 1.256223059298668e-07, + "loss": 0.6019, + "step": 19203 + }, + { + "epoch": 0.37, + "learning_rate": 1.2561842258553066e-07, + "loss": 0.0008, + "step": 19204 + }, + { + "epoch": 0.37, + "learning_rate": 1.256145392411945e-07, + "loss": 0.0063, + "step": 19205 + }, + { + "epoch": 0.37, + "learning_rate": 1.2561065589685838e-07, + "loss": 0.0011, + "step": 19206 + }, + { + "epoch": 0.37, + "learning_rate": 1.2560677255252223e-07, + "loss": 0.0009, + "step": 19207 + }, + { + "epoch": 0.37, + "learning_rate": 1.256028892081861e-07, + "loss": 0.2427, + "step": 19208 + }, + { + "epoch": 0.37, + "learning_rate": 1.2559900586384994e-07, + "loss": 0.4259, + "step": 19209 + }, + { + "epoch": 0.37, + "learning_rate": 1.2559512251951381e-07, + "loss": 0.2511, + "step": 19210 + }, + { + "epoch": 0.37, + "learning_rate": 1.2559123917517766e-07, + "loss": 0.0006, + "step": 19211 + }, + { + "epoch": 0.37, + "learning_rate": 1.2558735583084153e-07, + "loss": 0.0011, + "step": 19212 + }, + { + "epoch": 0.37, + "learning_rate": 1.2558347248650538e-07, + "loss": 0.0008, + "step": 19213 + }, + { + "epoch": 0.37, + "learning_rate": 1.2557958914216925e-07, + "loss": 0.634, + "step": 19214 + }, + { + "epoch": 0.37, + "learning_rate": 1.255757057978331e-07, + "loss": 0.0007, + "step": 19215 + }, + { + "epoch": 0.37, + "learning_rate": 1.2557182245349696e-07, + "loss": 0.0007, + "step": 19216 + }, + { + "epoch": 0.37, + "learning_rate": 1.255679391091608e-07, + "loss": 0.0009, + "step": 19217 + }, + { + "epoch": 0.37, + "learning_rate": 1.2556405576482468e-07, + "loss": 0.0488, + "step": 19218 + }, + { + "epoch": 0.37, + "learning_rate": 1.255601724204885e-07, + "loss": 0.0021, + "step": 19219 + }, + { + "epoch": 0.37, + "learning_rate": 1.2555628907615237e-07, + "loss": 0.216, + "step": 19220 + }, + { + "epoch": 0.37, + "learning_rate": 1.2555240573181622e-07, + "loss": 0.0006, + "step": 19221 + }, + { + "epoch": 0.37, + "learning_rate": 1.255485223874801e-07, + "loss": 0.0016, + "step": 19222 + }, + { + "epoch": 0.37, + "learning_rate": 1.2554463904314393e-07, + "loss": 0.0009, + "step": 19223 + }, + { + "epoch": 0.37, + "learning_rate": 1.255407556988078e-07, + "loss": 0.0009, + "step": 19224 + }, + { + "epoch": 0.37, + "learning_rate": 1.2553687235447165e-07, + "loss": 0.0006, + "step": 19225 + }, + { + "epoch": 0.37, + "learning_rate": 1.2553298901013552e-07, + "loss": 0.0005, + "step": 19226 + }, + { + "epoch": 0.37, + "learning_rate": 1.2552910566579936e-07, + "loss": 0.0009, + "step": 19227 + }, + { + "epoch": 0.37, + "learning_rate": 1.2552522232146324e-07, + "loss": 0.0009, + "step": 19228 + }, + { + "epoch": 0.37, + "learning_rate": 1.2552133897712708e-07, + "loss": 0.0009, + "step": 19229 + }, + { + "epoch": 0.37, + "learning_rate": 1.2551745563279095e-07, + "loss": 0.0847, + "step": 19230 + }, + { + "epoch": 0.37, + "learning_rate": 1.255135722884548e-07, + "loss": 0.0017, + "step": 19231 + }, + { + "epoch": 0.37, + "learning_rate": 1.2550968894411867e-07, + "loss": 0.0017, + "step": 19232 + }, + { + "epoch": 0.37, + "learning_rate": 1.2550580559978251e-07, + "loss": 0.0024, + "step": 19233 + }, + { + "epoch": 0.37, + "learning_rate": 1.2550192225544639e-07, + "loss": 0.0008, + "step": 19234 + }, + { + "epoch": 0.37, + "learning_rate": 1.2549803891111023e-07, + "loss": 0.0008, + "step": 19235 + }, + { + "epoch": 0.37, + "learning_rate": 1.254941555667741e-07, + "loss": 0.0289, + "step": 19236 + }, + { + "epoch": 0.37, + "learning_rate": 1.2549027222243795e-07, + "loss": 0.0007, + "step": 19237 + }, + { + "epoch": 0.37, + "learning_rate": 1.2548638887810182e-07, + "loss": 0.0012, + "step": 19238 + }, + { + "epoch": 0.37, + "learning_rate": 1.2548250553376566e-07, + "loss": 0.0006, + "step": 19239 + }, + { + "epoch": 0.37, + "learning_rate": 1.2547862218942954e-07, + "loss": 0.0011, + "step": 19240 + }, + { + "epoch": 0.37, + "learning_rate": 1.2547473884509338e-07, + "loss": 0.0008, + "step": 19241 + }, + { + "epoch": 0.37, + "learning_rate": 1.2547085550075725e-07, + "loss": 0.0008, + "step": 19242 + }, + { + "epoch": 0.37, + "learning_rate": 1.254669721564211e-07, + "loss": 0.001, + "step": 19243 + }, + { + "epoch": 0.37, + "learning_rate": 1.2546308881208497e-07, + "loss": 0.1273, + "step": 19244 + }, + { + "epoch": 0.37, + "learning_rate": 1.254592054677488e-07, + "loss": 0.0009, + "step": 19245 + }, + { + "epoch": 0.37, + "learning_rate": 1.2545532212341268e-07, + "loss": 0.0008, + "step": 19246 + }, + { + "epoch": 0.37, + "learning_rate": 1.2545143877907653e-07, + "loss": 0.0077, + "step": 19247 + }, + { + "epoch": 0.37, + "learning_rate": 1.254475554347404e-07, + "loss": 0.0007, + "step": 19248 + }, + { + "epoch": 0.37, + "learning_rate": 1.2544367209040425e-07, + "loss": 0.0013, + "step": 19249 + }, + { + "epoch": 0.37, + "learning_rate": 1.2543978874606812e-07, + "loss": 0.001, + "step": 19250 + }, + { + "epoch": 0.37, + "learning_rate": 1.2543590540173196e-07, + "loss": 0.0009, + "step": 19251 + }, + { + "epoch": 0.37, + "learning_rate": 1.2543202205739583e-07, + "loss": 0.0008, + "step": 19252 + }, + { + "epoch": 0.37, + "learning_rate": 1.2542813871305968e-07, + "loss": 0.6739, + "step": 19253 + }, + { + "epoch": 0.37, + "learning_rate": 1.2542425536872355e-07, + "loss": 0.0062, + "step": 19254 + }, + { + "epoch": 0.37, + "learning_rate": 1.254203720243874e-07, + "loss": 0.0008, + "step": 19255 + }, + { + "epoch": 0.37, + "learning_rate": 1.2541648868005127e-07, + "loss": 0.001, + "step": 19256 + }, + { + "epoch": 0.37, + "learning_rate": 1.254126053357151e-07, + "loss": 0.0006, + "step": 19257 + }, + { + "epoch": 0.37, + "learning_rate": 1.2540872199137898e-07, + "loss": 0.0014, + "step": 19258 + }, + { + "epoch": 0.37, + "learning_rate": 1.2540483864704283e-07, + "loss": 0.3423, + "step": 19259 + }, + { + "epoch": 0.37, + "learning_rate": 1.254009553027067e-07, + "loss": 0.0014, + "step": 19260 + }, + { + "epoch": 0.37, + "learning_rate": 1.2539707195837055e-07, + "loss": 0.2293, + "step": 19261 + }, + { + "epoch": 0.37, + "learning_rate": 1.2539318861403442e-07, + "loss": 0.1884, + "step": 19262 + }, + { + "epoch": 0.37, + "learning_rate": 1.2538930526969826e-07, + "loss": 0.0022, + "step": 19263 + }, + { + "epoch": 0.37, + "learning_rate": 1.2538542192536213e-07, + "loss": 0.0021, + "step": 19264 + }, + { + "epoch": 0.37, + "learning_rate": 1.2538153858102598e-07, + "loss": 0.0009, + "step": 19265 + }, + { + "epoch": 0.37, + "learning_rate": 1.2537765523668985e-07, + "loss": 0.0008, + "step": 19266 + }, + { + "epoch": 0.37, + "learning_rate": 1.253737718923537e-07, + "loss": 0.6825, + "step": 19267 + }, + { + "epoch": 0.37, + "learning_rate": 1.2536988854801757e-07, + "loss": 0.001, + "step": 19268 + }, + { + "epoch": 0.37, + "learning_rate": 1.253660052036814e-07, + "loss": 0.0008, + "step": 19269 + }, + { + "epoch": 0.37, + "learning_rate": 1.2536212185934528e-07, + "loss": 0.0028, + "step": 19270 + }, + { + "epoch": 0.37, + "learning_rate": 1.2535823851500913e-07, + "loss": 0.0007, + "step": 19271 + }, + { + "epoch": 0.37, + "learning_rate": 1.25354355170673e-07, + "loss": 0.0009, + "step": 19272 + }, + { + "epoch": 0.37, + "learning_rate": 1.2535047182633684e-07, + "loss": 0.0011, + "step": 19273 + }, + { + "epoch": 0.37, + "learning_rate": 1.2534658848200072e-07, + "loss": 0.7137, + "step": 19274 + }, + { + "epoch": 0.37, + "learning_rate": 1.2534270513766456e-07, + "loss": 0.0007, + "step": 19275 + }, + { + "epoch": 0.37, + "learning_rate": 1.2533882179332843e-07, + "loss": 0.0021, + "step": 19276 + }, + { + "epoch": 0.37, + "learning_rate": 1.2533493844899225e-07, + "loss": 0.0006, + "step": 19277 + }, + { + "epoch": 0.37, + "learning_rate": 1.2533105510465612e-07, + "loss": 0.0007, + "step": 19278 + }, + { + "epoch": 0.37, + "learning_rate": 1.2532717176031997e-07, + "loss": 0.0011, + "step": 19279 + }, + { + "epoch": 0.37, + "learning_rate": 1.2532328841598384e-07, + "loss": 0.0008, + "step": 19280 + }, + { + "epoch": 0.37, + "learning_rate": 1.2531940507164768e-07, + "loss": 0.0006, + "step": 19281 + }, + { + "epoch": 0.37, + "learning_rate": 1.2531552172731156e-07, + "loss": 0.0006, + "step": 19282 + }, + { + "epoch": 0.37, + "learning_rate": 1.253116383829754e-07, + "loss": 0.0007, + "step": 19283 + }, + { + "epoch": 0.37, + "learning_rate": 1.2530775503863927e-07, + "loss": 0.0008, + "step": 19284 + }, + { + "epoch": 0.37, + "learning_rate": 1.2530387169430312e-07, + "loss": 0.0008, + "step": 19285 + }, + { + "epoch": 0.37, + "learning_rate": 1.25299988349967e-07, + "loss": 0.0008, + "step": 19286 + }, + { + "epoch": 0.37, + "learning_rate": 1.2529610500563083e-07, + "loss": 0.001, + "step": 19287 + }, + { + "epoch": 0.37, + "learning_rate": 1.252922216612947e-07, + "loss": 0.0006, + "step": 19288 + }, + { + "epoch": 0.37, + "learning_rate": 1.2528833831695855e-07, + "loss": 0.0074, + "step": 19289 + }, + { + "epoch": 0.37, + "learning_rate": 1.2528445497262242e-07, + "loss": 0.0009, + "step": 19290 + }, + { + "epoch": 0.37, + "learning_rate": 1.2528057162828627e-07, + "loss": 0.0017, + "step": 19291 + }, + { + "epoch": 0.37, + "learning_rate": 1.2527668828395014e-07, + "loss": 0.0009, + "step": 19292 + }, + { + "epoch": 0.37, + "learning_rate": 1.2527280493961398e-07, + "loss": 0.0009, + "step": 19293 + }, + { + "epoch": 0.37, + "learning_rate": 1.2526892159527785e-07, + "loss": 0.0052, + "step": 19294 + }, + { + "epoch": 0.37, + "learning_rate": 1.252650382509417e-07, + "loss": 0.0011, + "step": 19295 + }, + { + "epoch": 0.37, + "learning_rate": 1.2526115490660557e-07, + "loss": 0.0008, + "step": 19296 + }, + { + "epoch": 0.37, + "learning_rate": 1.2525727156226942e-07, + "loss": 0.0027, + "step": 19297 + }, + { + "epoch": 0.37, + "learning_rate": 1.252533882179333e-07, + "loss": 0.0007, + "step": 19298 + }, + { + "epoch": 0.37, + "learning_rate": 1.2524950487359713e-07, + "loss": 0.0008, + "step": 19299 + }, + { + "epoch": 0.37, + "learning_rate": 1.25245621529261e-07, + "loss": 0.0014, + "step": 19300 + }, + { + "epoch": 0.37, + "learning_rate": 1.2524173818492485e-07, + "loss": 0.0008, + "step": 19301 + }, + { + "epoch": 0.37, + "learning_rate": 1.2523785484058872e-07, + "loss": 0.2193, + "step": 19302 + }, + { + "epoch": 0.37, + "learning_rate": 1.2523397149625256e-07, + "loss": 0.0018, + "step": 19303 + }, + { + "epoch": 0.37, + "learning_rate": 1.2523008815191644e-07, + "loss": 0.0009, + "step": 19304 + }, + { + "epoch": 0.37, + "learning_rate": 1.2522620480758028e-07, + "loss": 0.0008, + "step": 19305 + }, + { + "epoch": 0.37, + "learning_rate": 1.2522232146324415e-07, + "loss": 0.0018, + "step": 19306 + }, + { + "epoch": 0.37, + "learning_rate": 1.25218438118908e-07, + "loss": 0.0007, + "step": 19307 + }, + { + "epoch": 0.37, + "learning_rate": 1.2521455477457187e-07, + "loss": 0.1257, + "step": 19308 + }, + { + "epoch": 0.37, + "learning_rate": 1.2521067143023571e-07, + "loss": 0.0071, + "step": 19309 + }, + { + "epoch": 0.37, + "learning_rate": 1.2520678808589959e-07, + "loss": 0.0011, + "step": 19310 + }, + { + "epoch": 0.37, + "learning_rate": 1.2520290474156343e-07, + "loss": 0.0008, + "step": 19311 + }, + { + "epoch": 0.37, + "learning_rate": 1.2519902139722728e-07, + "loss": 0.001, + "step": 19312 + }, + { + "epoch": 0.37, + "learning_rate": 1.2519513805289115e-07, + "loss": 0.0009, + "step": 19313 + }, + { + "epoch": 0.37, + "learning_rate": 1.25191254708555e-07, + "loss": 0.0007, + "step": 19314 + }, + { + "epoch": 0.37, + "learning_rate": 1.2518737136421886e-07, + "loss": 0.0024, + "step": 19315 + }, + { + "epoch": 0.37, + "learning_rate": 1.251834880198827e-07, + "loss": 0.0009, + "step": 19316 + }, + { + "epoch": 0.37, + "learning_rate": 1.2517960467554658e-07, + "loss": 0.0007, + "step": 19317 + }, + { + "epoch": 0.37, + "learning_rate": 1.2517572133121043e-07, + "loss": 0.4329, + "step": 19318 + }, + { + "epoch": 0.37, + "learning_rate": 1.251718379868743e-07, + "loss": 0.0013, + "step": 19319 + }, + { + "epoch": 0.37, + "learning_rate": 1.2516795464253814e-07, + "loss": 0.0008, + "step": 19320 + }, + { + "epoch": 0.37, + "learning_rate": 1.2516407129820201e-07, + "loss": 0.0045, + "step": 19321 + }, + { + "epoch": 0.37, + "learning_rate": 1.2516018795386586e-07, + "loss": 0.001, + "step": 19322 + }, + { + "epoch": 0.37, + "learning_rate": 1.2515630460952973e-07, + "loss": 1.1857, + "step": 19323 + }, + { + "epoch": 0.37, + "learning_rate": 1.2515242126519357e-07, + "loss": 0.0643, + "step": 19324 + }, + { + "epoch": 0.37, + "learning_rate": 1.2514853792085745e-07, + "loss": 0.0012, + "step": 19325 + }, + { + "epoch": 0.37, + "learning_rate": 1.251446545765213e-07, + "loss": 1.2413, + "step": 19326 + }, + { + "epoch": 0.37, + "learning_rate": 1.2514077123218516e-07, + "loss": 0.0017, + "step": 19327 + }, + { + "epoch": 0.37, + "learning_rate": 1.25136887887849e-07, + "loss": 0.0008, + "step": 19328 + }, + { + "epoch": 0.37, + "learning_rate": 1.2513300454351288e-07, + "loss": 0.0017, + "step": 19329 + }, + { + "epoch": 0.37, + "learning_rate": 1.2512912119917672e-07, + "loss": 0.001, + "step": 19330 + }, + { + "epoch": 0.37, + "learning_rate": 1.251252378548406e-07, + "loss": 0.1261, + "step": 19331 + }, + { + "epoch": 0.38, + "learning_rate": 1.2512135451050444e-07, + "loss": 0.0095, + "step": 19332 + }, + { + "epoch": 0.38, + "learning_rate": 1.251174711661683e-07, + "loss": 0.0009, + "step": 19333 + }, + { + "epoch": 0.38, + "learning_rate": 1.2511358782183216e-07, + "loss": 0.0007, + "step": 19334 + }, + { + "epoch": 0.38, + "learning_rate": 1.25109704477496e-07, + "loss": 0.0011, + "step": 19335 + }, + { + "epoch": 0.38, + "learning_rate": 1.2510582113315987e-07, + "loss": 0.0007, + "step": 19336 + }, + { + "epoch": 0.38, + "learning_rate": 1.2510193778882372e-07, + "loss": 0.0007, + "step": 19337 + }, + { + "epoch": 0.38, + "learning_rate": 1.250980544444876e-07, + "loss": 0.0026, + "step": 19338 + }, + { + "epoch": 0.38, + "learning_rate": 1.2509417110015144e-07, + "loss": 1.0763, + "step": 19339 + }, + { + "epoch": 0.38, + "learning_rate": 1.250902877558153e-07, + "loss": 0.0008, + "step": 19340 + }, + { + "epoch": 0.38, + "learning_rate": 1.2508640441147915e-07, + "loss": 0.001, + "step": 19341 + }, + { + "epoch": 0.38, + "learning_rate": 1.25082521067143e-07, + "loss": 0.0007, + "step": 19342 + }, + { + "epoch": 0.38, + "learning_rate": 1.2507863772280687e-07, + "loss": 0.0019, + "step": 19343 + }, + { + "epoch": 0.38, + "learning_rate": 1.250747543784707e-07, + "loss": 0.0724, + "step": 19344 + }, + { + "epoch": 0.38, + "learning_rate": 1.2507087103413458e-07, + "loss": 0.0007, + "step": 19345 + }, + { + "epoch": 0.38, + "learning_rate": 1.2506698768979843e-07, + "loss": 0.0009, + "step": 19346 + }, + { + "epoch": 0.38, + "learning_rate": 1.250631043454623e-07, + "loss": 0.0111, + "step": 19347 + }, + { + "epoch": 0.38, + "learning_rate": 1.2505922100112615e-07, + "loss": 0.1963, + "step": 19348 + }, + { + "epoch": 0.38, + "learning_rate": 1.2505533765679002e-07, + "loss": 0.0007, + "step": 19349 + }, + { + "epoch": 0.38, + "learning_rate": 1.2505145431245386e-07, + "loss": 0.0007, + "step": 19350 + }, + { + "epoch": 0.38, + "learning_rate": 1.2504757096811773e-07, + "loss": 0.0009, + "step": 19351 + }, + { + "epoch": 0.38, + "learning_rate": 1.2504368762378158e-07, + "loss": 0.001, + "step": 19352 + }, + { + "epoch": 0.38, + "learning_rate": 1.2503980427944545e-07, + "loss": 0.0011, + "step": 19353 + }, + { + "epoch": 0.38, + "learning_rate": 1.250359209351093e-07, + "loss": 0.0285, + "step": 19354 + }, + { + "epoch": 0.38, + "learning_rate": 1.2503203759077317e-07, + "loss": 0.0009, + "step": 19355 + }, + { + "epoch": 0.38, + "learning_rate": 1.25028154246437e-07, + "loss": 0.0009, + "step": 19356 + }, + { + "epoch": 0.38, + "learning_rate": 1.2502427090210088e-07, + "loss": 0.0065, + "step": 19357 + }, + { + "epoch": 0.38, + "learning_rate": 1.2502038755776473e-07, + "loss": 0.0008, + "step": 19358 + }, + { + "epoch": 0.38, + "learning_rate": 1.250165042134286e-07, + "loss": 0.35, + "step": 19359 + }, + { + "epoch": 0.38, + "learning_rate": 1.2501262086909245e-07, + "loss": 0.4388, + "step": 19360 + }, + { + "epoch": 0.38, + "learning_rate": 1.2500873752475632e-07, + "loss": 0.0009, + "step": 19361 + }, + { + "epoch": 0.38, + "learning_rate": 1.2500485418042016e-07, + "loss": 0.0008, + "step": 19362 + }, + { + "epoch": 0.38, + "learning_rate": 1.2500097083608403e-07, + "loss": 0.0012, + "step": 19363 + }, + { + "epoch": 0.38, + "learning_rate": 1.2499708749174788e-07, + "loss": 0.0011, + "step": 19364 + }, + { + "epoch": 0.38, + "learning_rate": 1.2499320414741175e-07, + "loss": 0.0015, + "step": 19365 + }, + { + "epoch": 0.38, + "learning_rate": 1.249893208030756e-07, + "loss": 0.0008, + "step": 19366 + }, + { + "epoch": 0.38, + "learning_rate": 1.2498543745873947e-07, + "loss": 0.0095, + "step": 19367 + }, + { + "epoch": 0.38, + "learning_rate": 1.249815541144033e-07, + "loss": 0.0008, + "step": 19368 + }, + { + "epoch": 0.38, + "learning_rate": 1.2497767077006718e-07, + "loss": 0.0038, + "step": 19369 + }, + { + "epoch": 0.38, + "learning_rate": 1.2497378742573103e-07, + "loss": 0.0013, + "step": 19370 + }, + { + "epoch": 0.38, + "learning_rate": 1.249699040813949e-07, + "loss": 0.0007, + "step": 19371 + }, + { + "epoch": 0.38, + "learning_rate": 1.2496602073705874e-07, + "loss": 0.0007, + "step": 19372 + }, + { + "epoch": 0.38, + "learning_rate": 1.2496213739272262e-07, + "loss": 0.0008, + "step": 19373 + }, + { + "epoch": 0.38, + "learning_rate": 1.2495825404838646e-07, + "loss": 0.0014, + "step": 19374 + }, + { + "epoch": 0.38, + "learning_rate": 1.2495437070405033e-07, + "loss": 0.0079, + "step": 19375 + }, + { + "epoch": 0.38, + "learning_rate": 1.2495048735971418e-07, + "loss": 0.6195, + "step": 19376 + }, + { + "epoch": 0.38, + "learning_rate": 1.2494660401537805e-07, + "loss": 0.0008, + "step": 19377 + }, + { + "epoch": 0.38, + "learning_rate": 1.249427206710419e-07, + "loss": 0.0026, + "step": 19378 + }, + { + "epoch": 0.38, + "learning_rate": 1.2493883732670577e-07, + "loss": 0.0031, + "step": 19379 + }, + { + "epoch": 0.38, + "learning_rate": 1.249349539823696e-07, + "loss": 0.0009, + "step": 19380 + }, + { + "epoch": 0.38, + "learning_rate": 1.2493107063803348e-07, + "loss": 0.0009, + "step": 19381 + }, + { + "epoch": 0.38, + "learning_rate": 1.2492718729369733e-07, + "loss": 0.0008, + "step": 19382 + }, + { + "epoch": 0.38, + "learning_rate": 1.249233039493612e-07, + "loss": 0.001, + "step": 19383 + }, + { + "epoch": 0.38, + "learning_rate": 1.2491942060502504e-07, + "loss": 0.0008, + "step": 19384 + }, + { + "epoch": 0.38, + "learning_rate": 1.2491553726068891e-07, + "loss": 0.0014, + "step": 19385 + }, + { + "epoch": 0.38, + "learning_rate": 1.2491165391635276e-07, + "loss": 0.001, + "step": 19386 + }, + { + "epoch": 0.38, + "learning_rate": 1.2490777057201663e-07, + "loss": 0.001, + "step": 19387 + }, + { + "epoch": 0.38, + "learning_rate": 1.2490388722768048e-07, + "loss": 0.0009, + "step": 19388 + }, + { + "epoch": 0.38, + "learning_rate": 1.2490000388334435e-07, + "loss": 0.0082, + "step": 19389 + }, + { + "epoch": 0.38, + "learning_rate": 1.248961205390082e-07, + "loss": 0.0025, + "step": 19390 + }, + { + "epoch": 0.38, + "learning_rate": 1.2489223719467206e-07, + "loss": 0.0017, + "step": 19391 + }, + { + "epoch": 0.38, + "learning_rate": 1.248883538503359e-07, + "loss": 0.0007, + "step": 19392 + }, + { + "epoch": 0.38, + "learning_rate": 1.2488447050599975e-07, + "loss": 0.0009, + "step": 19393 + }, + { + "epoch": 0.38, + "learning_rate": 1.248805871616636e-07, + "loss": 0.0009, + "step": 19394 + }, + { + "epoch": 0.38, + "learning_rate": 1.2487670381732747e-07, + "loss": 0.0006, + "step": 19395 + }, + { + "epoch": 0.38, + "learning_rate": 1.2487282047299132e-07, + "loss": 0.0019, + "step": 19396 + }, + { + "epoch": 0.38, + "learning_rate": 1.248689371286552e-07, + "loss": 0.0009, + "step": 19397 + }, + { + "epoch": 0.38, + "learning_rate": 1.2486505378431903e-07, + "loss": 0.0009, + "step": 19398 + }, + { + "epoch": 0.38, + "learning_rate": 1.248611704399829e-07, + "loss": 0.0044, + "step": 19399 + }, + { + "epoch": 0.38, + "learning_rate": 1.2485728709564675e-07, + "loss": 0.0008, + "step": 19400 + }, + { + "epoch": 0.38, + "learning_rate": 1.2485340375131062e-07, + "loss": 0.0009, + "step": 19401 + }, + { + "epoch": 0.38, + "learning_rate": 1.2484952040697446e-07, + "loss": 0.2355, + "step": 19402 + }, + { + "epoch": 0.38, + "learning_rate": 1.2484563706263834e-07, + "loss": 0.0007, + "step": 19403 + }, + { + "epoch": 0.38, + "learning_rate": 1.2484175371830218e-07, + "loss": 0.0011, + "step": 19404 + }, + { + "epoch": 0.38, + "learning_rate": 1.2483787037396605e-07, + "loss": 0.0008, + "step": 19405 + }, + { + "epoch": 0.38, + "learning_rate": 1.248339870296299e-07, + "loss": 0.0011, + "step": 19406 + }, + { + "epoch": 0.38, + "learning_rate": 1.2483010368529377e-07, + "loss": 0.0007, + "step": 19407 + }, + { + "epoch": 0.38, + "learning_rate": 1.2482622034095761e-07, + "loss": 0.0015, + "step": 19408 + }, + { + "epoch": 0.38, + "learning_rate": 1.2482233699662149e-07, + "loss": 0.0008, + "step": 19409 + }, + { + "epoch": 0.38, + "learning_rate": 1.2481845365228533e-07, + "loss": 0.0011, + "step": 19410 + }, + { + "epoch": 0.38, + "learning_rate": 1.248145703079492e-07, + "loss": 0.0006, + "step": 19411 + }, + { + "epoch": 0.38, + "learning_rate": 1.2481068696361305e-07, + "loss": 0.0022, + "step": 19412 + }, + { + "epoch": 0.38, + "learning_rate": 1.2480680361927692e-07, + "loss": 0.0017, + "step": 19413 + }, + { + "epoch": 0.38, + "learning_rate": 1.2480292027494076e-07, + "loss": 0.001, + "step": 19414 + }, + { + "epoch": 0.38, + "learning_rate": 1.2479903693060464e-07, + "loss": 0.0014, + "step": 19415 + }, + { + "epoch": 0.38, + "learning_rate": 1.2479515358626848e-07, + "loss": 0.0006, + "step": 19416 + }, + { + "epoch": 0.38, + "learning_rate": 1.2479127024193235e-07, + "loss": 0.001, + "step": 19417 + }, + { + "epoch": 0.38, + "learning_rate": 1.247873868975962e-07, + "loss": 0.0021, + "step": 19418 + }, + { + "epoch": 0.38, + "learning_rate": 1.2478350355326007e-07, + "loss": 0.001, + "step": 19419 + }, + { + "epoch": 0.38, + "learning_rate": 1.2477962020892391e-07, + "loss": 0.0018, + "step": 19420 + }, + { + "epoch": 0.38, + "learning_rate": 1.2477573686458778e-07, + "loss": 0.002, + "step": 19421 + }, + { + "epoch": 0.38, + "learning_rate": 1.2477185352025163e-07, + "loss": 0.0008, + "step": 19422 + }, + { + "epoch": 0.38, + "learning_rate": 1.247679701759155e-07, + "loss": 0.0018, + "step": 19423 + }, + { + "epoch": 0.38, + "learning_rate": 1.2476408683157935e-07, + "loss": 0.1654, + "step": 19424 + }, + { + "epoch": 0.38, + "learning_rate": 1.2476020348724322e-07, + "loss": 0.882, + "step": 19425 + }, + { + "epoch": 0.38, + "learning_rate": 1.2475632014290706e-07, + "loss": 0.0007, + "step": 19426 + }, + { + "epoch": 0.38, + "learning_rate": 1.2475243679857093e-07, + "loss": 0.2703, + "step": 19427 + }, + { + "epoch": 0.38, + "learning_rate": 1.2474855345423478e-07, + "loss": 0.0007, + "step": 19428 + }, + { + "epoch": 0.38, + "learning_rate": 1.2474467010989865e-07, + "loss": 0.001, + "step": 19429 + }, + { + "epoch": 0.38, + "learning_rate": 1.247407867655625e-07, + "loss": 0.0009, + "step": 19430 + }, + { + "epoch": 0.38, + "learning_rate": 1.2473690342122637e-07, + "loss": 0.0011, + "step": 19431 + }, + { + "epoch": 0.38, + "learning_rate": 1.247330200768902e-07, + "loss": 0.0382, + "step": 19432 + }, + { + "epoch": 0.38, + "learning_rate": 1.2472913673255408e-07, + "loss": 0.001, + "step": 19433 + }, + { + "epoch": 0.38, + "learning_rate": 1.2472525338821793e-07, + "loss": 0.0007, + "step": 19434 + }, + { + "epoch": 0.38, + "learning_rate": 1.247213700438818e-07, + "loss": 0.0025, + "step": 19435 + }, + { + "epoch": 0.38, + "learning_rate": 1.2471748669954565e-07, + "loss": 0.0007, + "step": 19436 + }, + { + "epoch": 0.38, + "learning_rate": 1.2471360335520952e-07, + "loss": 0.1893, + "step": 19437 + }, + { + "epoch": 0.38, + "learning_rate": 1.2470972001087336e-07, + "loss": 0.0007, + "step": 19438 + }, + { + "epoch": 0.38, + "learning_rate": 1.2470583666653723e-07, + "loss": 0.0009, + "step": 19439 + }, + { + "epoch": 0.38, + "learning_rate": 1.2470195332220108e-07, + "loss": 0.001, + "step": 19440 + }, + { + "epoch": 0.38, + "learning_rate": 1.2469806997786495e-07, + "loss": 0.0007, + "step": 19441 + }, + { + "epoch": 0.38, + "learning_rate": 1.246941866335288e-07, + "loss": 0.0007, + "step": 19442 + }, + { + "epoch": 0.38, + "learning_rate": 1.2469030328919267e-07, + "loss": 0.0006, + "step": 19443 + }, + { + "epoch": 0.38, + "learning_rate": 1.246864199448565e-07, + "loss": 0.0008, + "step": 19444 + }, + { + "epoch": 0.38, + "learning_rate": 1.2468253660052038e-07, + "loss": 0.0008, + "step": 19445 + }, + { + "epoch": 0.38, + "learning_rate": 1.2467865325618423e-07, + "loss": 0.0008, + "step": 19446 + }, + { + "epoch": 0.38, + "learning_rate": 1.246747699118481e-07, + "loss": 0.4856, + "step": 19447 + }, + { + "epoch": 0.38, + "learning_rate": 1.2467088656751194e-07, + "loss": 0.0006, + "step": 19448 + }, + { + "epoch": 0.38, + "learning_rate": 1.2466700322317582e-07, + "loss": 0.001, + "step": 19449 + }, + { + "epoch": 0.38, + "learning_rate": 1.2466311987883966e-07, + "loss": 0.0007, + "step": 19450 + }, + { + "epoch": 0.38, + "learning_rate": 1.246592365345035e-07, + "loss": 0.0007, + "step": 19451 + }, + { + "epoch": 0.38, + "learning_rate": 1.2465535319016735e-07, + "loss": 0.0008, + "step": 19452 + }, + { + "epoch": 0.38, + "learning_rate": 1.2465146984583122e-07, + "loss": 0.0008, + "step": 19453 + }, + { + "epoch": 0.38, + "learning_rate": 1.2464758650149507e-07, + "loss": 0.0007, + "step": 19454 + }, + { + "epoch": 0.38, + "learning_rate": 1.2464370315715894e-07, + "loss": 0.001, + "step": 19455 + }, + { + "epoch": 0.38, + "learning_rate": 1.2463981981282278e-07, + "loss": 0.0006, + "step": 19456 + }, + { + "epoch": 0.38, + "learning_rate": 1.2463593646848666e-07, + "loss": 0.001, + "step": 19457 + }, + { + "epoch": 0.38, + "learning_rate": 1.246320531241505e-07, + "loss": 0.0007, + "step": 19458 + }, + { + "epoch": 0.38, + "learning_rate": 1.2462816977981437e-07, + "loss": 0.0008, + "step": 19459 + }, + { + "epoch": 0.38, + "learning_rate": 1.2462428643547822e-07, + "loss": 0.0008, + "step": 19460 + }, + { + "epoch": 0.38, + "learning_rate": 1.246204030911421e-07, + "loss": 0.3887, + "step": 19461 + }, + { + "epoch": 0.38, + "learning_rate": 1.2461651974680593e-07, + "loss": 0.001, + "step": 19462 + }, + { + "epoch": 0.38, + "learning_rate": 1.246126364024698e-07, + "loss": 0.0738, + "step": 19463 + }, + { + "epoch": 0.38, + "learning_rate": 1.2460875305813365e-07, + "loss": 0.0007, + "step": 19464 + }, + { + "epoch": 0.38, + "learning_rate": 1.2460486971379752e-07, + "loss": 0.0005, + "step": 19465 + }, + { + "epoch": 0.38, + "learning_rate": 1.2460098636946137e-07, + "loss": 0.0023, + "step": 19466 + }, + { + "epoch": 0.38, + "learning_rate": 1.2459710302512524e-07, + "loss": 0.0008, + "step": 19467 + }, + { + "epoch": 0.38, + "learning_rate": 1.2459321968078908e-07, + "loss": 0.0041, + "step": 19468 + }, + { + "epoch": 0.38, + "learning_rate": 1.2458933633645295e-07, + "loss": 0.5442, + "step": 19469 + }, + { + "epoch": 0.38, + "learning_rate": 1.245854529921168e-07, + "loss": 0.0008, + "step": 19470 + }, + { + "epoch": 0.38, + "learning_rate": 1.2458156964778067e-07, + "loss": 0.0006, + "step": 19471 + }, + { + "epoch": 0.38, + "learning_rate": 1.2457768630344452e-07, + "loss": 1.1192, + "step": 19472 + }, + { + "epoch": 0.38, + "learning_rate": 1.245738029591084e-07, + "loss": 0.0006, + "step": 19473 + }, + { + "epoch": 0.38, + "learning_rate": 1.2456991961477223e-07, + "loss": 0.0007, + "step": 19474 + }, + { + "epoch": 0.38, + "learning_rate": 1.245660362704361e-07, + "loss": 0.0017, + "step": 19475 + }, + { + "epoch": 0.38, + "learning_rate": 1.2456215292609995e-07, + "loss": 0.0008, + "step": 19476 + }, + { + "epoch": 0.38, + "learning_rate": 1.2455826958176382e-07, + "loss": 0.0012, + "step": 19477 + }, + { + "epoch": 0.38, + "learning_rate": 1.2455438623742767e-07, + "loss": 0.0007, + "step": 19478 + }, + { + "epoch": 0.38, + "learning_rate": 1.2455050289309154e-07, + "loss": 0.0779, + "step": 19479 + }, + { + "epoch": 0.38, + "learning_rate": 1.2454661954875538e-07, + "loss": 0.0008, + "step": 19480 + }, + { + "epoch": 0.38, + "learning_rate": 1.2454273620441925e-07, + "loss": 0.0007, + "step": 19481 + }, + { + "epoch": 0.38, + "learning_rate": 1.245388528600831e-07, + "loss": 0.0007, + "step": 19482 + }, + { + "epoch": 0.38, + "learning_rate": 1.2453496951574697e-07, + "loss": 0.0007, + "step": 19483 + }, + { + "epoch": 0.38, + "learning_rate": 1.2453108617141081e-07, + "loss": 0.0139, + "step": 19484 + }, + { + "epoch": 0.38, + "learning_rate": 1.2452720282707469e-07, + "loss": 0.001, + "step": 19485 + }, + { + "epoch": 0.38, + "learning_rate": 1.2452331948273853e-07, + "loss": 0.0007, + "step": 19486 + }, + { + "epoch": 0.38, + "learning_rate": 1.245194361384024e-07, + "loss": 0.0008, + "step": 19487 + }, + { + "epoch": 0.38, + "learning_rate": 1.2451555279406625e-07, + "loss": 0.0008, + "step": 19488 + }, + { + "epoch": 0.38, + "learning_rate": 1.245116694497301e-07, + "loss": 0.0009, + "step": 19489 + }, + { + "epoch": 0.38, + "learning_rate": 1.2450778610539396e-07, + "loss": 0.0007, + "step": 19490 + }, + { + "epoch": 0.38, + "learning_rate": 1.245039027610578e-07, + "loss": 1.0918, + "step": 19491 + }, + { + "epoch": 0.38, + "learning_rate": 1.2450001941672168e-07, + "loss": 0.0009, + "step": 19492 + }, + { + "epoch": 0.38, + "learning_rate": 1.2449613607238553e-07, + "loss": 0.001, + "step": 19493 + }, + { + "epoch": 0.38, + "learning_rate": 1.244922527280494e-07, + "loss": 0.0007, + "step": 19494 + }, + { + "epoch": 0.38, + "learning_rate": 1.2448836938371324e-07, + "loss": 0.001, + "step": 19495 + }, + { + "epoch": 0.38, + "learning_rate": 1.2448448603937711e-07, + "loss": 0.0008, + "step": 19496 + }, + { + "epoch": 0.38, + "learning_rate": 1.2448060269504096e-07, + "loss": 0.0006, + "step": 19497 + }, + { + "epoch": 0.38, + "learning_rate": 1.2447671935070483e-07, + "loss": 0.0077, + "step": 19498 + }, + { + "epoch": 0.38, + "learning_rate": 1.2447283600636867e-07, + "loss": 0.001, + "step": 19499 + }, + { + "epoch": 0.38, + "learning_rate": 1.2446895266203255e-07, + "loss": 0.0016, + "step": 19500 + }, + { + "epoch": 0.38, + "learning_rate": 1.244650693176964e-07, + "loss": 0.0283, + "step": 19501 + }, + { + "epoch": 0.38, + "learning_rate": 1.2446118597336026e-07, + "loss": 0.0011, + "step": 19502 + }, + { + "epoch": 0.38, + "learning_rate": 1.244573026290241e-07, + "loss": 0.0021, + "step": 19503 + }, + { + "epoch": 0.38, + "learning_rate": 1.2445341928468798e-07, + "loss": 0.0008, + "step": 19504 + }, + { + "epoch": 0.38, + "learning_rate": 1.2444953594035182e-07, + "loss": 1.5228, + "step": 19505 + }, + { + "epoch": 0.38, + "learning_rate": 1.244456525960157e-07, + "loss": 0.0013, + "step": 19506 + }, + { + "epoch": 0.38, + "learning_rate": 1.2444176925167954e-07, + "loss": 0.0006, + "step": 19507 + }, + { + "epoch": 0.38, + "learning_rate": 1.244378859073434e-07, + "loss": 0.0009, + "step": 19508 + }, + { + "epoch": 0.38, + "learning_rate": 1.2443400256300726e-07, + "loss": 0.001, + "step": 19509 + }, + { + "epoch": 0.38, + "learning_rate": 1.244301192186711e-07, + "loss": 0.2859, + "step": 19510 + }, + { + "epoch": 0.38, + "learning_rate": 1.2442623587433497e-07, + "loss": 0.0006, + "step": 19511 + }, + { + "epoch": 0.38, + "learning_rate": 1.2442235252999882e-07, + "loss": 0.0007, + "step": 19512 + }, + { + "epoch": 0.38, + "learning_rate": 1.244184691856627e-07, + "loss": 0.001, + "step": 19513 + }, + { + "epoch": 0.38, + "learning_rate": 1.2441458584132654e-07, + "loss": 0.0009, + "step": 19514 + }, + { + "epoch": 0.38, + "learning_rate": 1.244107024969904e-07, + "loss": 0.001, + "step": 19515 + }, + { + "epoch": 0.38, + "learning_rate": 1.2440681915265425e-07, + "loss": 0.0007, + "step": 19516 + }, + { + "epoch": 0.38, + "learning_rate": 1.2440293580831812e-07, + "loss": 0.0009, + "step": 19517 + }, + { + "epoch": 0.38, + "learning_rate": 1.2439905246398197e-07, + "loss": 0.0006, + "step": 19518 + }, + { + "epoch": 0.38, + "learning_rate": 1.2439516911964581e-07, + "loss": 0.0006, + "step": 19519 + }, + { + "epoch": 0.38, + "learning_rate": 1.2439128577530968e-07, + "loss": 0.0007, + "step": 19520 + }, + { + "epoch": 0.38, + "learning_rate": 1.2438740243097353e-07, + "loss": 0.0147, + "step": 19521 + }, + { + "epoch": 0.38, + "learning_rate": 1.243835190866374e-07, + "loss": 0.0007, + "step": 19522 + }, + { + "epoch": 0.38, + "learning_rate": 1.2437963574230125e-07, + "loss": 0.0008, + "step": 19523 + }, + { + "epoch": 0.38, + "learning_rate": 1.2437575239796512e-07, + "loss": 0.0008, + "step": 19524 + }, + { + "epoch": 0.38, + "learning_rate": 1.2437186905362896e-07, + "loss": 0.0009, + "step": 19525 + }, + { + "epoch": 0.38, + "learning_rate": 1.2436798570929283e-07, + "loss": 0.001, + "step": 19526 + }, + { + "epoch": 0.38, + "learning_rate": 1.2436410236495668e-07, + "loss": 0.0015, + "step": 19527 + }, + { + "epoch": 0.38, + "learning_rate": 1.2436021902062055e-07, + "loss": 0.0268, + "step": 19528 + }, + { + "epoch": 0.38, + "learning_rate": 1.243563356762844e-07, + "loss": 1.8104, + "step": 19529 + }, + { + "epoch": 0.38, + "learning_rate": 1.2435245233194827e-07, + "loss": 0.0009, + "step": 19530 + }, + { + "epoch": 0.38, + "learning_rate": 1.243485689876121e-07, + "loss": 0.0014, + "step": 19531 + }, + { + "epoch": 0.38, + "learning_rate": 1.2434468564327598e-07, + "loss": 0.7283, + "step": 19532 + }, + { + "epoch": 0.38, + "learning_rate": 1.2434080229893983e-07, + "loss": 0.0007, + "step": 19533 + }, + { + "epoch": 0.38, + "learning_rate": 1.243369189546037e-07, + "loss": 0.0006, + "step": 19534 + }, + { + "epoch": 0.38, + "learning_rate": 1.2433303561026755e-07, + "loss": 0.0014, + "step": 19535 + }, + { + "epoch": 0.38, + "learning_rate": 1.2432915226593142e-07, + "loss": 0.0009, + "step": 19536 + }, + { + "epoch": 0.38, + "learning_rate": 1.2432526892159526e-07, + "loss": 0.0006, + "step": 19537 + }, + { + "epoch": 0.38, + "learning_rate": 1.2432138557725913e-07, + "loss": 0.0007, + "step": 19538 + }, + { + "epoch": 0.38, + "learning_rate": 1.2431750223292298e-07, + "loss": 0.0012, + "step": 19539 + }, + { + "epoch": 0.38, + "learning_rate": 1.2431361888858685e-07, + "loss": 0.0006, + "step": 19540 + }, + { + "epoch": 0.38, + "learning_rate": 1.243097355442507e-07, + "loss": 0.0007, + "step": 19541 + }, + { + "epoch": 0.38, + "learning_rate": 1.2430585219991457e-07, + "loss": 0.0008, + "step": 19542 + }, + { + "epoch": 0.38, + "learning_rate": 1.243019688555784e-07, + "loss": 0.0007, + "step": 19543 + }, + { + "epoch": 0.38, + "learning_rate": 1.2429808551124228e-07, + "loss": 0.0011, + "step": 19544 + }, + { + "epoch": 0.38, + "learning_rate": 1.2429420216690613e-07, + "loss": 0.0007, + "step": 19545 + }, + { + "epoch": 0.38, + "learning_rate": 1.2429031882257e-07, + "loss": 0.002, + "step": 19546 + }, + { + "epoch": 0.38, + "learning_rate": 1.2428643547823384e-07, + "loss": 0.0008, + "step": 19547 + }, + { + "epoch": 0.38, + "learning_rate": 1.2428255213389772e-07, + "loss": 0.0009, + "step": 19548 + }, + { + "epoch": 0.38, + "learning_rate": 1.2427866878956156e-07, + "loss": 0.0009, + "step": 19549 + }, + { + "epoch": 0.38, + "learning_rate": 1.2427478544522543e-07, + "loss": 0.0023, + "step": 19550 + }, + { + "epoch": 0.38, + "learning_rate": 1.2427090210088928e-07, + "loss": 0.0009, + "step": 19551 + }, + { + "epoch": 0.38, + "learning_rate": 1.2426701875655315e-07, + "loss": 0.0007, + "step": 19552 + }, + { + "epoch": 0.38, + "learning_rate": 1.24263135412217e-07, + "loss": 0.0008, + "step": 19553 + }, + { + "epoch": 0.38, + "learning_rate": 1.2425925206788087e-07, + "loss": 0.0059, + "step": 19554 + }, + { + "epoch": 0.38, + "learning_rate": 1.242553687235447e-07, + "loss": 0.8235, + "step": 19555 + }, + { + "epoch": 0.38, + "learning_rate": 1.2425148537920858e-07, + "loss": 0.0012, + "step": 19556 + }, + { + "epoch": 0.38, + "learning_rate": 1.2424760203487243e-07, + "loss": 0.0008, + "step": 19557 + }, + { + "epoch": 0.38, + "learning_rate": 1.242437186905363e-07, + "loss": 0.0191, + "step": 19558 + }, + { + "epoch": 0.38, + "learning_rate": 1.2423983534620014e-07, + "loss": 0.0008, + "step": 19559 + }, + { + "epoch": 0.38, + "learning_rate": 1.2423595200186401e-07, + "loss": 0.0009, + "step": 19560 + }, + { + "epoch": 0.38, + "learning_rate": 1.2423206865752786e-07, + "loss": 0.0008, + "step": 19561 + }, + { + "epoch": 0.38, + "learning_rate": 1.2422818531319173e-07, + "loss": 0.0009, + "step": 19562 + }, + { + "epoch": 0.38, + "learning_rate": 1.2422430196885558e-07, + "loss": 0.0012, + "step": 19563 + }, + { + "epoch": 0.38, + "learning_rate": 1.2422041862451945e-07, + "loss": 0.0008, + "step": 19564 + }, + { + "epoch": 0.38, + "learning_rate": 1.242165352801833e-07, + "loss": 0.0008, + "step": 19565 + }, + { + "epoch": 0.38, + "learning_rate": 1.2421265193584716e-07, + "loss": 0.0008, + "step": 19566 + }, + { + "epoch": 0.38, + "learning_rate": 1.2420876859151098e-07, + "loss": 0.0007, + "step": 19567 + }, + { + "epoch": 0.38, + "learning_rate": 1.2420488524717485e-07, + "loss": 0.278, + "step": 19568 + }, + { + "epoch": 0.38, + "learning_rate": 1.242010019028387e-07, + "loss": 0.0007, + "step": 19569 + }, + { + "epoch": 0.38, + "learning_rate": 1.2419711855850257e-07, + "loss": 0.0009, + "step": 19570 + }, + { + "epoch": 0.38, + "learning_rate": 1.2419323521416642e-07, + "loss": 0.0008, + "step": 19571 + }, + { + "epoch": 0.38, + "learning_rate": 1.241893518698303e-07, + "loss": 0.0007, + "step": 19572 + }, + { + "epoch": 0.38, + "learning_rate": 1.2418546852549413e-07, + "loss": 0.0008, + "step": 19573 + }, + { + "epoch": 0.38, + "learning_rate": 1.24181585181158e-07, + "loss": 0.0007, + "step": 19574 + }, + { + "epoch": 0.38, + "learning_rate": 1.2417770183682185e-07, + "loss": 0.003, + "step": 19575 + }, + { + "epoch": 0.38, + "learning_rate": 1.2417381849248572e-07, + "loss": 0.0011, + "step": 19576 + }, + { + "epoch": 0.38, + "learning_rate": 1.2416993514814957e-07, + "loss": 0.1484, + "step": 19577 + }, + { + "epoch": 0.38, + "learning_rate": 1.2416605180381344e-07, + "loss": 0.0007, + "step": 19578 + }, + { + "epoch": 0.38, + "learning_rate": 1.2416216845947728e-07, + "loss": 0.0021, + "step": 19579 + }, + { + "epoch": 0.38, + "learning_rate": 1.2415828511514115e-07, + "loss": 0.6676, + "step": 19580 + }, + { + "epoch": 0.38, + "learning_rate": 1.24154401770805e-07, + "loss": 0.0007, + "step": 19581 + }, + { + "epoch": 0.38, + "learning_rate": 1.2415051842646887e-07, + "loss": 0.0021, + "step": 19582 + }, + { + "epoch": 0.38, + "learning_rate": 1.2414663508213271e-07, + "loss": 0.0008, + "step": 19583 + }, + { + "epoch": 0.38, + "learning_rate": 1.2414275173779659e-07, + "loss": 0.6798, + "step": 19584 + }, + { + "epoch": 0.38, + "learning_rate": 1.2413886839346043e-07, + "loss": 0.0008, + "step": 19585 + }, + { + "epoch": 0.38, + "learning_rate": 1.241349850491243e-07, + "loss": 0.0017, + "step": 19586 + }, + { + "epoch": 0.38, + "learning_rate": 1.2413110170478815e-07, + "loss": 0.001, + "step": 19587 + }, + { + "epoch": 0.38, + "learning_rate": 1.2412721836045202e-07, + "loss": 0.191, + "step": 19588 + }, + { + "epoch": 0.38, + "learning_rate": 1.2412333501611586e-07, + "loss": 0.0009, + "step": 19589 + }, + { + "epoch": 0.38, + "learning_rate": 1.2411945167177974e-07, + "loss": 0.0703, + "step": 19590 + }, + { + "epoch": 0.38, + "learning_rate": 1.2411556832744358e-07, + "loss": 0.0024, + "step": 19591 + }, + { + "epoch": 0.38, + "learning_rate": 1.2411168498310745e-07, + "loss": 0.0008, + "step": 19592 + }, + { + "epoch": 0.38, + "learning_rate": 1.241078016387713e-07, + "loss": 0.0007, + "step": 19593 + }, + { + "epoch": 0.38, + "learning_rate": 1.2410391829443517e-07, + "loss": 0.0545, + "step": 19594 + }, + { + "epoch": 0.38, + "learning_rate": 1.2410003495009901e-07, + "loss": 0.0008, + "step": 19595 + }, + { + "epoch": 0.38, + "learning_rate": 1.2409615160576288e-07, + "loss": 0.0016, + "step": 19596 + }, + { + "epoch": 0.38, + "learning_rate": 1.2409226826142673e-07, + "loss": 0.7464, + "step": 19597 + }, + { + "epoch": 0.38, + "learning_rate": 1.240883849170906e-07, + "loss": 0.0008, + "step": 19598 + }, + { + "epoch": 0.38, + "learning_rate": 1.2408450157275445e-07, + "loss": 0.0008, + "step": 19599 + }, + { + "epoch": 0.38, + "learning_rate": 1.2408061822841832e-07, + "loss": 0.0013, + "step": 19600 + }, + { + "epoch": 0.38, + "learning_rate": 1.2407673488408216e-07, + "loss": 0.001, + "step": 19601 + }, + { + "epoch": 0.38, + "learning_rate": 1.2407285153974603e-07, + "loss": 0.0007, + "step": 19602 + }, + { + "epoch": 0.38, + "learning_rate": 1.2406896819540988e-07, + "loss": 0.0006, + "step": 19603 + }, + { + "epoch": 0.38, + "learning_rate": 1.2406508485107375e-07, + "loss": 0.0007, + "step": 19604 + }, + { + "epoch": 0.38, + "learning_rate": 1.240612015067376e-07, + "loss": 0.001, + "step": 19605 + }, + { + "epoch": 0.38, + "learning_rate": 1.2405731816240147e-07, + "loss": 0.0007, + "step": 19606 + }, + { + "epoch": 0.38, + "learning_rate": 1.240534348180653e-07, + "loss": 0.0009, + "step": 19607 + }, + { + "epoch": 0.38, + "learning_rate": 1.2404955147372918e-07, + "loss": 0.0012, + "step": 19608 + }, + { + "epoch": 0.38, + "learning_rate": 1.2404566812939303e-07, + "loss": 0.0029, + "step": 19609 + }, + { + "epoch": 0.38, + "learning_rate": 1.240417847850569e-07, + "loss": 0.0007, + "step": 19610 + }, + { + "epoch": 0.38, + "learning_rate": 1.2403790144072075e-07, + "loss": 0.0009, + "step": 19611 + }, + { + "epoch": 0.38, + "learning_rate": 1.2403401809638462e-07, + "loss": 1.274, + "step": 19612 + }, + { + "epoch": 0.38, + "learning_rate": 1.2403013475204846e-07, + "loss": 0.0014, + "step": 19613 + }, + { + "epoch": 0.38, + "learning_rate": 1.2402625140771233e-07, + "loss": 0.0014, + "step": 19614 + }, + { + "epoch": 0.38, + "learning_rate": 1.2402236806337618e-07, + "loss": 0.0006, + "step": 19615 + }, + { + "epoch": 0.38, + "learning_rate": 1.2401848471904005e-07, + "loss": 0.3922, + "step": 19616 + }, + { + "epoch": 0.38, + "learning_rate": 1.240146013747039e-07, + "loss": 0.0123, + "step": 19617 + }, + { + "epoch": 0.38, + "learning_rate": 1.2401071803036777e-07, + "loss": 0.001, + "step": 19618 + }, + { + "epoch": 0.38, + "learning_rate": 1.240068346860316e-07, + "loss": 0.0007, + "step": 19619 + }, + { + "epoch": 0.38, + "learning_rate": 1.2400295134169548e-07, + "loss": 0.0018, + "step": 19620 + }, + { + "epoch": 0.38, + "learning_rate": 1.2399906799735933e-07, + "loss": 0.0009, + "step": 19621 + }, + { + "epoch": 0.38, + "learning_rate": 1.239951846530232e-07, + "loss": 0.0006, + "step": 19622 + }, + { + "epoch": 0.38, + "learning_rate": 1.2399130130868704e-07, + "loss": 0.0008, + "step": 19623 + }, + { + "epoch": 0.38, + "learning_rate": 1.2398741796435092e-07, + "loss": 0.0007, + "step": 19624 + }, + { + "epoch": 0.38, + "learning_rate": 1.2398353462001473e-07, + "loss": 0.0011, + "step": 19625 + }, + { + "epoch": 0.38, + "learning_rate": 1.239796512756786e-07, + "loss": 0.0007, + "step": 19626 + }, + { + "epoch": 0.38, + "learning_rate": 1.2397576793134245e-07, + "loss": 0.8161, + "step": 19627 + }, + { + "epoch": 0.38, + "learning_rate": 1.2397188458700632e-07, + "loss": 1.0192, + "step": 19628 + }, + { + "epoch": 0.38, + "learning_rate": 1.2396800124267017e-07, + "loss": 0.7443, + "step": 19629 + }, + { + "epoch": 0.38, + "learning_rate": 1.2396411789833404e-07, + "loss": 0.0015, + "step": 19630 + }, + { + "epoch": 0.38, + "learning_rate": 1.2396023455399788e-07, + "loss": 0.0007, + "step": 19631 + }, + { + "epoch": 0.38, + "learning_rate": 1.2395635120966176e-07, + "loss": 0.0007, + "step": 19632 + }, + { + "epoch": 0.38, + "learning_rate": 1.239524678653256e-07, + "loss": 0.0009, + "step": 19633 + }, + { + "epoch": 0.38, + "learning_rate": 1.2394858452098947e-07, + "loss": 0.0006, + "step": 19634 + }, + { + "epoch": 0.38, + "learning_rate": 1.2394470117665332e-07, + "loss": 0.0034, + "step": 19635 + }, + { + "epoch": 0.38, + "learning_rate": 1.239408178323172e-07, + "loss": 0.0008, + "step": 19636 + }, + { + "epoch": 0.38, + "learning_rate": 1.2393693448798103e-07, + "loss": 0.0008, + "step": 19637 + }, + { + "epoch": 0.38, + "learning_rate": 1.239330511436449e-07, + "loss": 0.0008, + "step": 19638 + }, + { + "epoch": 0.38, + "learning_rate": 1.2392916779930875e-07, + "loss": 0.0008, + "step": 19639 + }, + { + "epoch": 0.38, + "learning_rate": 1.2392528445497262e-07, + "loss": 0.1623, + "step": 19640 + }, + { + "epoch": 0.38, + "learning_rate": 1.2392140111063647e-07, + "loss": 0.0007, + "step": 19641 + }, + { + "epoch": 0.38, + "learning_rate": 1.2391751776630034e-07, + "loss": 0.0009, + "step": 19642 + }, + { + "epoch": 0.38, + "learning_rate": 1.2391363442196418e-07, + "loss": 0.0007, + "step": 19643 + }, + { + "epoch": 0.38, + "learning_rate": 1.2390975107762805e-07, + "loss": 0.001, + "step": 19644 + }, + { + "epoch": 0.38, + "learning_rate": 1.239058677332919e-07, + "loss": 0.0012, + "step": 19645 + }, + { + "epoch": 0.38, + "learning_rate": 1.2390198438895577e-07, + "loss": 0.0008, + "step": 19646 + }, + { + "epoch": 0.38, + "learning_rate": 1.2389810104461962e-07, + "loss": 0.0009, + "step": 19647 + }, + { + "epoch": 0.38, + "learning_rate": 1.238942177002835e-07, + "loss": 0.0007, + "step": 19648 + }, + { + "epoch": 0.38, + "learning_rate": 1.2389033435594733e-07, + "loss": 0.0011, + "step": 19649 + }, + { + "epoch": 0.38, + "learning_rate": 1.238864510116112e-07, + "loss": 0.0029, + "step": 19650 + }, + { + "epoch": 0.38, + "learning_rate": 1.2388256766727505e-07, + "loss": 0.0007, + "step": 19651 + }, + { + "epoch": 0.38, + "learning_rate": 1.2387868432293892e-07, + "loss": 0.0009, + "step": 19652 + }, + { + "epoch": 0.38, + "learning_rate": 1.2387480097860277e-07, + "loss": 0.0035, + "step": 19653 + }, + { + "epoch": 0.38, + "learning_rate": 1.2387091763426664e-07, + "loss": 0.0009, + "step": 19654 + }, + { + "epoch": 0.38, + "learning_rate": 1.2386703428993048e-07, + "loss": 0.0008, + "step": 19655 + }, + { + "epoch": 0.38, + "learning_rate": 1.2386315094559435e-07, + "loss": 0.0005, + "step": 19656 + }, + { + "epoch": 0.38, + "learning_rate": 1.238592676012582e-07, + "loss": 0.0018, + "step": 19657 + }, + { + "epoch": 0.38, + "learning_rate": 1.2385538425692207e-07, + "loss": 0.0008, + "step": 19658 + }, + { + "epoch": 0.38, + "learning_rate": 1.2385150091258591e-07, + "loss": 0.0012, + "step": 19659 + }, + { + "epoch": 0.38, + "learning_rate": 1.2384761756824979e-07, + "loss": 0.0009, + "step": 19660 + }, + { + "epoch": 0.38, + "learning_rate": 1.2384373422391363e-07, + "loss": 0.0009, + "step": 19661 + }, + { + "epoch": 0.38, + "learning_rate": 1.238398508795775e-07, + "loss": 0.0011, + "step": 19662 + }, + { + "epoch": 0.38, + "learning_rate": 1.2383596753524135e-07, + "loss": 0.0011, + "step": 19663 + }, + { + "epoch": 0.38, + "learning_rate": 1.2383208419090522e-07, + "loss": 0.0018, + "step": 19664 + }, + { + "epoch": 0.38, + "learning_rate": 1.2382820084656906e-07, + "loss": 0.0083, + "step": 19665 + }, + { + "epoch": 0.38, + "learning_rate": 1.238243175022329e-07, + "loss": 0.0006, + "step": 19666 + }, + { + "epoch": 0.38, + "learning_rate": 1.2382043415789678e-07, + "loss": 0.0011, + "step": 19667 + }, + { + "epoch": 0.38, + "learning_rate": 1.2381655081356063e-07, + "loss": 0.0013, + "step": 19668 + }, + { + "epoch": 0.38, + "learning_rate": 1.238126674692245e-07, + "loss": 0.0146, + "step": 19669 + }, + { + "epoch": 0.38, + "learning_rate": 1.2380878412488834e-07, + "loss": 0.004, + "step": 19670 + }, + { + "epoch": 0.38, + "learning_rate": 1.2380490078055221e-07, + "loss": 0.0009, + "step": 19671 + }, + { + "epoch": 0.38, + "learning_rate": 1.2380101743621606e-07, + "loss": 0.0009, + "step": 19672 + }, + { + "epoch": 0.38, + "learning_rate": 1.2379713409187993e-07, + "loss": 0.0105, + "step": 19673 + }, + { + "epoch": 0.38, + "learning_rate": 1.2379325074754378e-07, + "loss": 0.0016, + "step": 19674 + }, + { + "epoch": 0.38, + "learning_rate": 1.2378936740320765e-07, + "loss": 0.0011, + "step": 19675 + }, + { + "epoch": 0.38, + "learning_rate": 1.237854840588715e-07, + "loss": 0.0011, + "step": 19676 + }, + { + "epoch": 0.38, + "learning_rate": 1.2378160071453536e-07, + "loss": 0.0008, + "step": 19677 + }, + { + "epoch": 0.38, + "learning_rate": 1.237777173701992e-07, + "loss": 0.0007, + "step": 19678 + }, + { + "epoch": 0.38, + "learning_rate": 1.2377383402586308e-07, + "loss": 0.0008, + "step": 19679 + }, + { + "epoch": 0.38, + "learning_rate": 1.2376995068152692e-07, + "loss": 0.0008, + "step": 19680 + }, + { + "epoch": 0.38, + "learning_rate": 1.237660673371908e-07, + "loss": 0.0007, + "step": 19681 + }, + { + "epoch": 0.38, + "learning_rate": 1.2376218399285464e-07, + "loss": 0.0008, + "step": 19682 + }, + { + "epoch": 0.38, + "learning_rate": 1.2375830064851849e-07, + "loss": 0.001, + "step": 19683 + }, + { + "epoch": 0.38, + "learning_rate": 1.2375441730418236e-07, + "loss": 0.0008, + "step": 19684 + }, + { + "epoch": 0.38, + "learning_rate": 1.237505339598462e-07, + "loss": 0.0008, + "step": 19685 + }, + { + "epoch": 0.38, + "learning_rate": 1.2374665061551007e-07, + "loss": 0.0009, + "step": 19686 + }, + { + "epoch": 0.38, + "learning_rate": 1.2374276727117392e-07, + "loss": 0.0007, + "step": 19687 + }, + { + "epoch": 0.38, + "learning_rate": 1.237388839268378e-07, + "loss": 0.0011, + "step": 19688 + }, + { + "epoch": 0.38, + "learning_rate": 1.2373500058250164e-07, + "loss": 0.0007, + "step": 19689 + }, + { + "epoch": 0.38, + "learning_rate": 1.237311172381655e-07, + "loss": 0.0007, + "step": 19690 + }, + { + "epoch": 0.38, + "learning_rate": 1.2372723389382935e-07, + "loss": 0.0007, + "step": 19691 + }, + { + "epoch": 0.38, + "learning_rate": 1.2372335054949322e-07, + "loss": 0.0008, + "step": 19692 + }, + { + "epoch": 0.38, + "learning_rate": 1.2371946720515707e-07, + "loss": 0.0013, + "step": 19693 + }, + { + "epoch": 0.38, + "learning_rate": 1.2371558386082094e-07, + "loss": 0.0009, + "step": 19694 + }, + { + "epoch": 0.38, + "learning_rate": 1.2371170051648478e-07, + "loss": 0.0049, + "step": 19695 + }, + { + "epoch": 0.38, + "learning_rate": 1.2370781717214863e-07, + "loss": 0.0015, + "step": 19696 + }, + { + "epoch": 0.38, + "learning_rate": 1.237039338278125e-07, + "loss": 0.5924, + "step": 19697 + }, + { + "epoch": 0.38, + "learning_rate": 1.2370005048347635e-07, + "loss": 0.0158, + "step": 19698 + }, + { + "epoch": 0.38, + "learning_rate": 1.2369616713914022e-07, + "loss": 0.0009, + "step": 19699 + }, + { + "epoch": 0.38, + "learning_rate": 1.2369228379480406e-07, + "loss": 0.797, + "step": 19700 + }, + { + "epoch": 0.38, + "learning_rate": 1.2368840045046793e-07, + "loss": 0.0007, + "step": 19701 + }, + { + "epoch": 0.38, + "learning_rate": 1.2368451710613178e-07, + "loss": 0.0009, + "step": 19702 + }, + { + "epoch": 0.38, + "learning_rate": 1.2368063376179565e-07, + "loss": 0.0009, + "step": 19703 + }, + { + "epoch": 0.38, + "learning_rate": 1.236767504174595e-07, + "loss": 0.0008, + "step": 19704 + }, + { + "epoch": 0.38, + "learning_rate": 1.2367286707312337e-07, + "loss": 0.0007, + "step": 19705 + }, + { + "epoch": 0.38, + "learning_rate": 1.236689837287872e-07, + "loss": 0.0007, + "step": 19706 + }, + { + "epoch": 0.38, + "learning_rate": 1.2366510038445108e-07, + "loss": 0.0008, + "step": 19707 + }, + { + "epoch": 0.38, + "learning_rate": 1.2366121704011493e-07, + "loss": 0.001, + "step": 19708 + }, + { + "epoch": 0.38, + "learning_rate": 1.236573336957788e-07, + "loss": 0.6474, + "step": 19709 + }, + { + "epoch": 0.38, + "learning_rate": 1.2365345035144265e-07, + "loss": 0.0009, + "step": 19710 + }, + { + "epoch": 0.38, + "learning_rate": 1.2364956700710652e-07, + "loss": 0.0102, + "step": 19711 + }, + { + "epoch": 0.38, + "learning_rate": 1.2364568366277036e-07, + "loss": 0.1005, + "step": 19712 + }, + { + "epoch": 0.38, + "learning_rate": 1.2364180031843423e-07, + "loss": 0.0007, + "step": 19713 + }, + { + "epoch": 0.38, + "learning_rate": 1.2363791697409808e-07, + "loss": 0.0007, + "step": 19714 + }, + { + "epoch": 0.38, + "learning_rate": 1.2363403362976195e-07, + "loss": 0.0034, + "step": 19715 + }, + { + "epoch": 0.38, + "learning_rate": 1.236301502854258e-07, + "loss": 0.0008, + "step": 19716 + }, + { + "epoch": 0.38, + "learning_rate": 1.2362626694108967e-07, + "loss": 0.0009, + "step": 19717 + }, + { + "epoch": 0.38, + "learning_rate": 1.236223835967535e-07, + "loss": 0.0011, + "step": 19718 + }, + { + "epoch": 0.38, + "learning_rate": 1.2361850025241738e-07, + "loss": 0.0006, + "step": 19719 + }, + { + "epoch": 0.38, + "learning_rate": 1.2361461690808123e-07, + "loss": 0.0007, + "step": 19720 + }, + { + "epoch": 0.38, + "learning_rate": 1.236107335637451e-07, + "loss": 0.0005, + "step": 19721 + }, + { + "epoch": 0.38, + "learning_rate": 1.2360685021940894e-07, + "loss": 0.0009, + "step": 19722 + }, + { + "epoch": 0.38, + "learning_rate": 1.2360296687507282e-07, + "loss": 0.0007, + "step": 19723 + }, + { + "epoch": 0.38, + "learning_rate": 1.2359908353073666e-07, + "loss": 0.001, + "step": 19724 + }, + { + "epoch": 0.38, + "learning_rate": 1.2359520018640053e-07, + "loss": 0.0011, + "step": 19725 + }, + { + "epoch": 0.38, + "learning_rate": 1.2359131684206438e-07, + "loss": 0.0006, + "step": 19726 + }, + { + "epoch": 0.38, + "learning_rate": 1.2358743349772825e-07, + "loss": 0.0008, + "step": 19727 + }, + { + "epoch": 0.38, + "learning_rate": 1.235835501533921e-07, + "loss": 0.0017, + "step": 19728 + }, + { + "epoch": 0.38, + "learning_rate": 1.2357966680905597e-07, + "loss": 0.0155, + "step": 19729 + }, + { + "epoch": 0.38, + "learning_rate": 1.235757834647198e-07, + "loss": 0.0009, + "step": 19730 + }, + { + "epoch": 0.38, + "learning_rate": 1.2357190012038368e-07, + "loss": 0.0012, + "step": 19731 + }, + { + "epoch": 0.38, + "learning_rate": 1.2356801677604753e-07, + "loss": 0.0009, + "step": 19732 + }, + { + "epoch": 0.38, + "learning_rate": 1.235641334317114e-07, + "loss": 0.0007, + "step": 19733 + }, + { + "epoch": 0.38, + "learning_rate": 1.2356025008737524e-07, + "loss": 0.0011, + "step": 19734 + }, + { + "epoch": 0.38, + "learning_rate": 1.2355636674303911e-07, + "loss": 0.001, + "step": 19735 + }, + { + "epoch": 0.38, + "learning_rate": 1.2355248339870296e-07, + "loss": 0.0008, + "step": 19736 + }, + { + "epoch": 0.38, + "learning_rate": 1.2354860005436683e-07, + "loss": 0.0009, + "step": 19737 + }, + { + "epoch": 0.38, + "learning_rate": 1.2354471671003068e-07, + "loss": 0.0018, + "step": 19738 + }, + { + "epoch": 0.38, + "learning_rate": 1.2354083336569455e-07, + "loss": 0.001, + "step": 19739 + }, + { + "epoch": 0.38, + "learning_rate": 1.235369500213584e-07, + "loss": 0.001, + "step": 19740 + }, + { + "epoch": 0.38, + "learning_rate": 1.2353306667702224e-07, + "loss": 0.0011, + "step": 19741 + }, + { + "epoch": 0.38, + "learning_rate": 1.2352918333268608e-07, + "loss": 0.0008, + "step": 19742 + }, + { + "epoch": 0.38, + "learning_rate": 1.2352529998834995e-07, + "loss": 0.0008, + "step": 19743 + }, + { + "epoch": 0.38, + "learning_rate": 1.235214166440138e-07, + "loss": 0.6901, + "step": 19744 + }, + { + "epoch": 0.38, + "learning_rate": 1.2351753329967767e-07, + "loss": 0.4371, + "step": 19745 + }, + { + "epoch": 0.38, + "learning_rate": 1.2351364995534152e-07, + "loss": 0.0008, + "step": 19746 + }, + { + "epoch": 0.38, + "learning_rate": 1.235097666110054e-07, + "loss": 0.0009, + "step": 19747 + }, + { + "epoch": 0.38, + "learning_rate": 1.2350588326666923e-07, + "loss": 0.0007, + "step": 19748 + }, + { + "epoch": 0.38, + "learning_rate": 1.235019999223331e-07, + "loss": 0.9395, + "step": 19749 + }, + { + "epoch": 0.38, + "learning_rate": 1.2349811657799695e-07, + "loss": 0.0009, + "step": 19750 + }, + { + "epoch": 0.38, + "learning_rate": 1.2349423323366082e-07, + "loss": 0.0005, + "step": 19751 + }, + { + "epoch": 0.38, + "learning_rate": 1.2349034988932467e-07, + "loss": 0.0016, + "step": 19752 + }, + { + "epoch": 0.38, + "learning_rate": 1.2348646654498854e-07, + "loss": 0.001, + "step": 19753 + }, + { + "epoch": 0.38, + "learning_rate": 1.2348258320065238e-07, + "loss": 0.9189, + "step": 19754 + }, + { + "epoch": 0.38, + "learning_rate": 1.2347869985631625e-07, + "loss": 0.0008, + "step": 19755 + }, + { + "epoch": 0.38, + "learning_rate": 1.234748165119801e-07, + "loss": 0.0022, + "step": 19756 + }, + { + "epoch": 0.38, + "learning_rate": 1.2347093316764397e-07, + "loss": 0.0007, + "step": 19757 + }, + { + "epoch": 0.38, + "learning_rate": 1.2346704982330781e-07, + "loss": 0.0006, + "step": 19758 + }, + { + "epoch": 0.38, + "learning_rate": 1.2346316647897169e-07, + "loss": 0.0011, + "step": 19759 + }, + { + "epoch": 0.38, + "learning_rate": 1.2345928313463553e-07, + "loss": 0.7634, + "step": 19760 + }, + { + "epoch": 0.38, + "learning_rate": 1.234553997902994e-07, + "loss": 0.0005, + "step": 19761 + }, + { + "epoch": 0.38, + "learning_rate": 1.2345151644596325e-07, + "loss": 0.0006, + "step": 19762 + }, + { + "epoch": 0.38, + "learning_rate": 1.2344763310162712e-07, + "loss": 0.0008, + "step": 19763 + }, + { + "epoch": 0.38, + "learning_rate": 1.2344374975729096e-07, + "loss": 0.0042, + "step": 19764 + }, + { + "epoch": 0.38, + "learning_rate": 1.2343986641295484e-07, + "loss": 0.001, + "step": 19765 + }, + { + "epoch": 0.38, + "learning_rate": 1.2343598306861868e-07, + "loss": 0.001, + "step": 19766 + }, + { + "epoch": 0.38, + "learning_rate": 1.2343209972428255e-07, + "loss": 0.0012, + "step": 19767 + }, + { + "epoch": 0.38, + "learning_rate": 1.234282163799464e-07, + "loss": 0.0808, + "step": 19768 + }, + { + "epoch": 0.38, + "learning_rate": 1.2342433303561027e-07, + "loss": 0.0015, + "step": 19769 + }, + { + "epoch": 0.38, + "learning_rate": 1.2342044969127411e-07, + "loss": 0.0007, + "step": 19770 + }, + { + "epoch": 0.38, + "learning_rate": 1.2341656634693799e-07, + "loss": 0.2987, + "step": 19771 + }, + { + "epoch": 0.38, + "learning_rate": 1.2341268300260183e-07, + "loss": 0.0007, + "step": 19772 + }, + { + "epoch": 0.38, + "learning_rate": 1.234087996582657e-07, + "loss": 0.0048, + "step": 19773 + }, + { + "epoch": 0.38, + "learning_rate": 1.2340491631392955e-07, + "loss": 0.0006, + "step": 19774 + }, + { + "epoch": 0.38, + "learning_rate": 1.2340103296959342e-07, + "loss": 0.001, + "step": 19775 + }, + { + "epoch": 0.38, + "learning_rate": 1.2339714962525726e-07, + "loss": 0.001, + "step": 19776 + }, + { + "epoch": 0.38, + "learning_rate": 1.2339326628092113e-07, + "loss": 0.0232, + "step": 19777 + }, + { + "epoch": 0.38, + "learning_rate": 1.2338938293658498e-07, + "loss": 0.0012, + "step": 19778 + }, + { + "epoch": 0.38, + "learning_rate": 1.2338549959224885e-07, + "loss": 0.0009, + "step": 19779 + }, + { + "epoch": 0.38, + "learning_rate": 1.233816162479127e-07, + "loss": 0.0009, + "step": 19780 + }, + { + "epoch": 0.38, + "learning_rate": 1.2337773290357657e-07, + "loss": 0.0008, + "step": 19781 + }, + { + "epoch": 0.38, + "learning_rate": 1.233738495592404e-07, + "loss": 0.001, + "step": 19782 + }, + { + "epoch": 0.38, + "learning_rate": 1.2336996621490428e-07, + "loss": 0.001, + "step": 19783 + }, + { + "epoch": 0.38, + "learning_rate": 1.2336608287056813e-07, + "loss": 0.0007, + "step": 19784 + }, + { + "epoch": 0.38, + "learning_rate": 1.23362199526232e-07, + "loss": 0.4825, + "step": 19785 + }, + { + "epoch": 0.38, + "learning_rate": 1.2335831618189585e-07, + "loss": 1.1886, + "step": 19786 + }, + { + "epoch": 0.38, + "learning_rate": 1.2335443283755972e-07, + "loss": 0.0011, + "step": 19787 + }, + { + "epoch": 0.38, + "learning_rate": 1.2335054949322356e-07, + "loss": 0.0024, + "step": 19788 + }, + { + "epoch": 0.38, + "learning_rate": 1.2334666614888743e-07, + "loss": 0.0007, + "step": 19789 + }, + { + "epoch": 0.38, + "learning_rate": 1.2334278280455128e-07, + "loss": 0.0007, + "step": 19790 + }, + { + "epoch": 0.38, + "learning_rate": 1.2333889946021515e-07, + "loss": 0.0006, + "step": 19791 + }, + { + "epoch": 0.38, + "learning_rate": 1.23335016115879e-07, + "loss": 0.0008, + "step": 19792 + }, + { + "epoch": 0.38, + "learning_rate": 1.2333113277154287e-07, + "loss": 0.0025, + "step": 19793 + }, + { + "epoch": 0.38, + "learning_rate": 1.233272494272067e-07, + "loss": 0.0012, + "step": 19794 + }, + { + "epoch": 0.38, + "learning_rate": 1.2332336608287058e-07, + "loss": 0.0011, + "step": 19795 + }, + { + "epoch": 0.38, + "learning_rate": 1.2331948273853443e-07, + "loss": 0.0008, + "step": 19796 + }, + { + "epoch": 0.38, + "learning_rate": 1.233155993941983e-07, + "loss": 0.0009, + "step": 19797 + }, + { + "epoch": 0.38, + "learning_rate": 1.2331171604986214e-07, + "loss": 0.0013, + "step": 19798 + }, + { + "epoch": 0.38, + "learning_rate": 1.23307832705526e-07, + "loss": 0.0411, + "step": 19799 + }, + { + "epoch": 0.38, + "learning_rate": 1.2330394936118983e-07, + "loss": 0.0007, + "step": 19800 + }, + { + "epoch": 0.38, + "learning_rate": 1.233000660168537e-07, + "loss": 0.0006, + "step": 19801 + }, + { + "epoch": 0.38, + "learning_rate": 1.2329618267251755e-07, + "loss": 0.0008, + "step": 19802 + }, + { + "epoch": 0.38, + "learning_rate": 1.2329229932818142e-07, + "loss": 0.0008, + "step": 19803 + }, + { + "epoch": 0.38, + "learning_rate": 1.2328841598384527e-07, + "loss": 0.2831, + "step": 19804 + }, + { + "epoch": 0.38, + "learning_rate": 1.2328453263950914e-07, + "loss": 0.0007, + "step": 19805 + }, + { + "epoch": 0.38, + "learning_rate": 1.2328064929517298e-07, + "loss": 0.0008, + "step": 19806 + }, + { + "epoch": 0.38, + "learning_rate": 1.2327676595083686e-07, + "loss": 0.0013, + "step": 19807 + }, + { + "epoch": 0.38, + "learning_rate": 1.232728826065007e-07, + "loss": 0.0013, + "step": 19808 + }, + { + "epoch": 0.38, + "learning_rate": 1.2326899926216457e-07, + "loss": 0.0058, + "step": 19809 + }, + { + "epoch": 0.38, + "learning_rate": 1.2326511591782842e-07, + "loss": 0.0008, + "step": 19810 + }, + { + "epoch": 0.38, + "learning_rate": 1.232612325734923e-07, + "loss": 0.0008, + "step": 19811 + }, + { + "epoch": 0.38, + "learning_rate": 1.2325734922915613e-07, + "loss": 0.0008, + "step": 19812 + }, + { + "epoch": 0.38, + "learning_rate": 1.2325346588482e-07, + "loss": 0.002, + "step": 19813 + }, + { + "epoch": 0.38, + "learning_rate": 1.2324958254048385e-07, + "loss": 0.001, + "step": 19814 + }, + { + "epoch": 0.38, + "learning_rate": 1.2324569919614772e-07, + "loss": 0.0027, + "step": 19815 + }, + { + "epoch": 0.38, + "learning_rate": 1.2324181585181157e-07, + "loss": 0.0008, + "step": 19816 + }, + { + "epoch": 0.38, + "learning_rate": 1.2323793250747544e-07, + "loss": 0.0106, + "step": 19817 + }, + { + "epoch": 0.38, + "learning_rate": 1.2323404916313928e-07, + "loss": 0.188, + "step": 19818 + }, + { + "epoch": 0.38, + "learning_rate": 1.2323016581880315e-07, + "loss": 0.0009, + "step": 19819 + }, + { + "epoch": 0.38, + "learning_rate": 1.23226282474467e-07, + "loss": 0.017, + "step": 19820 + }, + { + "epoch": 0.38, + "learning_rate": 1.2322239913013087e-07, + "loss": 0.0008, + "step": 19821 + }, + { + "epoch": 0.38, + "learning_rate": 1.2321851578579472e-07, + "loss": 0.0841, + "step": 19822 + }, + { + "epoch": 0.38, + "learning_rate": 1.232146324414586e-07, + "loss": 0.0006, + "step": 19823 + }, + { + "epoch": 0.38, + "learning_rate": 1.2321074909712243e-07, + "loss": 0.0007, + "step": 19824 + }, + { + "epoch": 0.38, + "learning_rate": 1.232068657527863e-07, + "loss": 0.0325, + "step": 19825 + }, + { + "epoch": 0.38, + "learning_rate": 1.2320298240845015e-07, + "loss": 0.0007, + "step": 19826 + }, + { + "epoch": 0.38, + "learning_rate": 1.2319909906411402e-07, + "loss": 0.0011, + "step": 19827 + }, + { + "epoch": 0.38, + "learning_rate": 1.2319521571977787e-07, + "loss": 0.0165, + "step": 19828 + }, + { + "epoch": 0.38, + "learning_rate": 1.2319133237544174e-07, + "loss": 0.0009, + "step": 19829 + }, + { + "epoch": 0.38, + "learning_rate": 1.2318744903110558e-07, + "loss": 0.6452, + "step": 19830 + }, + { + "epoch": 0.38, + "learning_rate": 1.2318356568676945e-07, + "loss": 0.8654, + "step": 19831 + }, + { + "epoch": 0.38, + "learning_rate": 1.231796823424333e-07, + "loss": 0.0007, + "step": 19832 + }, + { + "epoch": 0.38, + "learning_rate": 1.2317579899809717e-07, + "loss": 0.0007, + "step": 19833 + }, + { + "epoch": 0.38, + "learning_rate": 1.2317191565376101e-07, + "loss": 0.0007, + "step": 19834 + }, + { + "epoch": 0.38, + "learning_rate": 1.2316803230942489e-07, + "loss": 0.0007, + "step": 19835 + }, + { + "epoch": 0.38, + "learning_rate": 1.2316414896508873e-07, + "loss": 0.8658, + "step": 19836 + }, + { + "epoch": 0.38, + "learning_rate": 1.231602656207526e-07, + "loss": 0.8827, + "step": 19837 + }, + { + "epoch": 0.38, + "learning_rate": 1.2315638227641645e-07, + "loss": 0.0994, + "step": 19838 + }, + { + "epoch": 0.38, + "learning_rate": 1.2315249893208032e-07, + "loss": 0.4, + "step": 19839 + }, + { + "epoch": 0.38, + "learning_rate": 1.2314861558774416e-07, + "loss": 0.001, + "step": 19840 + }, + { + "epoch": 0.38, + "learning_rate": 1.2314473224340804e-07, + "loss": 0.0007, + "step": 19841 + }, + { + "epoch": 0.38, + "learning_rate": 1.2314084889907188e-07, + "loss": 0.001, + "step": 19842 + }, + { + "epoch": 0.38, + "learning_rate": 1.2313696555473573e-07, + "loss": 0.0008, + "step": 19843 + }, + { + "epoch": 0.38, + "learning_rate": 1.231330822103996e-07, + "loss": 0.0008, + "step": 19844 + }, + { + "epoch": 0.38, + "learning_rate": 1.2312919886606344e-07, + "loss": 0.0878, + "step": 19845 + }, + { + "epoch": 0.38, + "learning_rate": 1.2312531552172731e-07, + "loss": 0.5206, + "step": 19846 + }, + { + "epoch": 0.38, + "learning_rate": 1.2312143217739116e-07, + "loss": 0.0005, + "step": 19847 + }, + { + "epoch": 0.39, + "learning_rate": 1.2311754883305503e-07, + "loss": 0.5803, + "step": 19848 + }, + { + "epoch": 0.39, + "learning_rate": 1.2311366548871888e-07, + "loss": 0.0008, + "step": 19849 + }, + { + "epoch": 0.39, + "learning_rate": 1.2310978214438275e-07, + "loss": 0.0013, + "step": 19850 + }, + { + "epoch": 0.39, + "learning_rate": 1.231058988000466e-07, + "loss": 0.002, + "step": 19851 + }, + { + "epoch": 0.39, + "learning_rate": 1.2310201545571046e-07, + "loss": 0.0031, + "step": 19852 + }, + { + "epoch": 0.39, + "learning_rate": 1.230981321113743e-07, + "loss": 0.0007, + "step": 19853 + }, + { + "epoch": 0.39, + "learning_rate": 1.2309424876703818e-07, + "loss": 0.0011, + "step": 19854 + }, + { + "epoch": 0.39, + "learning_rate": 1.2309036542270202e-07, + "loss": 0.0014, + "step": 19855 + }, + { + "epoch": 0.39, + "learning_rate": 1.230864820783659e-07, + "loss": 0.0575, + "step": 19856 + }, + { + "epoch": 0.39, + "learning_rate": 1.2308259873402974e-07, + "loss": 0.0009, + "step": 19857 + }, + { + "epoch": 0.39, + "learning_rate": 1.2307871538969359e-07, + "loss": 0.0007, + "step": 19858 + }, + { + "epoch": 0.39, + "learning_rate": 1.2307483204535746e-07, + "loss": 0.005, + "step": 19859 + }, + { + "epoch": 0.39, + "learning_rate": 1.230709487010213e-07, + "loss": 0.0006, + "step": 19860 + }, + { + "epoch": 0.39, + "learning_rate": 1.2306706535668517e-07, + "loss": 0.0012, + "step": 19861 + }, + { + "epoch": 0.39, + "learning_rate": 1.2306318201234902e-07, + "loss": 0.0008, + "step": 19862 + }, + { + "epoch": 0.39, + "learning_rate": 1.230592986680129e-07, + "loss": 0.0008, + "step": 19863 + }, + { + "epoch": 0.39, + "learning_rate": 1.2305541532367674e-07, + "loss": 0.0007, + "step": 19864 + }, + { + "epoch": 0.39, + "learning_rate": 1.230515319793406e-07, + "loss": 0.0008, + "step": 19865 + }, + { + "epoch": 0.39, + "learning_rate": 1.2304764863500445e-07, + "loss": 0.0007, + "step": 19866 + }, + { + "epoch": 0.39, + "learning_rate": 1.2304376529066832e-07, + "loss": 0.001, + "step": 19867 + }, + { + "epoch": 0.39, + "learning_rate": 1.2303988194633217e-07, + "loss": 0.0122, + "step": 19868 + }, + { + "epoch": 0.39, + "learning_rate": 1.2303599860199604e-07, + "loss": 0.0007, + "step": 19869 + }, + { + "epoch": 0.39, + "learning_rate": 1.2303211525765989e-07, + "loss": 0.0007, + "step": 19870 + }, + { + "epoch": 0.39, + "learning_rate": 1.2302823191332376e-07, + "loss": 0.0008, + "step": 19871 + }, + { + "epoch": 0.39, + "learning_rate": 1.230243485689876e-07, + "loss": 0.0008, + "step": 19872 + }, + { + "epoch": 0.39, + "learning_rate": 1.2302046522465145e-07, + "loss": 0.428, + "step": 19873 + }, + { + "epoch": 0.39, + "learning_rate": 1.2301658188031532e-07, + "loss": 0.0007, + "step": 19874 + }, + { + "epoch": 0.39, + "learning_rate": 1.2301269853597916e-07, + "loss": 1.3365, + "step": 19875 + }, + { + "epoch": 0.39, + "learning_rate": 1.2300881519164303e-07, + "loss": 0.0009, + "step": 19876 + }, + { + "epoch": 0.39, + "learning_rate": 1.2300493184730688e-07, + "loss": 0.0008, + "step": 19877 + }, + { + "epoch": 0.39, + "learning_rate": 1.2300104850297075e-07, + "loss": 0.0657, + "step": 19878 + }, + { + "epoch": 0.39, + "learning_rate": 1.229971651586346e-07, + "loss": 0.0008, + "step": 19879 + }, + { + "epoch": 0.39, + "learning_rate": 1.2299328181429847e-07, + "loss": 0.0008, + "step": 19880 + }, + { + "epoch": 0.39, + "learning_rate": 1.229893984699623e-07, + "loss": 0.0007, + "step": 19881 + }, + { + "epoch": 0.39, + "learning_rate": 1.2298551512562618e-07, + "loss": 0.4324, + "step": 19882 + }, + { + "epoch": 0.39, + "learning_rate": 1.2298163178129003e-07, + "loss": 0.0007, + "step": 19883 + }, + { + "epoch": 0.39, + "learning_rate": 1.229777484369539e-07, + "loss": 0.001, + "step": 19884 + }, + { + "epoch": 0.39, + "learning_rate": 1.2297386509261775e-07, + "loss": 0.0007, + "step": 19885 + }, + { + "epoch": 0.39, + "learning_rate": 1.2296998174828162e-07, + "loss": 0.0006, + "step": 19886 + }, + { + "epoch": 0.39, + "learning_rate": 1.2296609840394546e-07, + "loss": 0.0009, + "step": 19887 + }, + { + "epoch": 0.39, + "learning_rate": 1.2296221505960933e-07, + "loss": 1.0827, + "step": 19888 + }, + { + "epoch": 0.39, + "learning_rate": 1.2295833171527318e-07, + "loss": 0.0013, + "step": 19889 + }, + { + "epoch": 0.39, + "learning_rate": 1.2295444837093705e-07, + "loss": 0.0007, + "step": 19890 + }, + { + "epoch": 0.39, + "learning_rate": 1.229505650266009e-07, + "loss": 0.0006, + "step": 19891 + }, + { + "epoch": 0.39, + "learning_rate": 1.2294668168226477e-07, + "loss": 0.0007, + "step": 19892 + }, + { + "epoch": 0.39, + "learning_rate": 1.229427983379286e-07, + "loss": 0.0353, + "step": 19893 + }, + { + "epoch": 0.39, + "learning_rate": 1.2293891499359248e-07, + "loss": 0.0009, + "step": 19894 + }, + { + "epoch": 0.39, + "learning_rate": 1.2293503164925633e-07, + "loss": 0.0006, + "step": 19895 + }, + { + "epoch": 0.39, + "learning_rate": 1.229311483049202e-07, + "loss": 0.0011, + "step": 19896 + }, + { + "epoch": 0.39, + "learning_rate": 1.2292726496058404e-07, + "loss": 0.8418, + "step": 19897 + }, + { + "epoch": 0.39, + "learning_rate": 1.2292338161624792e-07, + "loss": 0.0008, + "step": 19898 + }, + { + "epoch": 0.39, + "learning_rate": 1.2291949827191176e-07, + "loss": 0.1282, + "step": 19899 + }, + { + "epoch": 0.39, + "learning_rate": 1.2291561492757563e-07, + "loss": 0.0025, + "step": 19900 + }, + { + "epoch": 0.39, + "learning_rate": 1.2291173158323948e-07, + "loss": 0.0012, + "step": 19901 + }, + { + "epoch": 0.39, + "learning_rate": 1.2290784823890335e-07, + "loss": 0.0007, + "step": 19902 + }, + { + "epoch": 0.39, + "learning_rate": 1.229039648945672e-07, + "loss": 0.0008, + "step": 19903 + }, + { + "epoch": 0.39, + "learning_rate": 1.2290008155023107e-07, + "loss": 0.0008, + "step": 19904 + }, + { + "epoch": 0.39, + "learning_rate": 1.228961982058949e-07, + "loss": 0.0008, + "step": 19905 + }, + { + "epoch": 0.39, + "learning_rate": 1.2289231486155878e-07, + "loss": 0.0008, + "step": 19906 + }, + { + "epoch": 0.39, + "learning_rate": 1.2288843151722263e-07, + "loss": 0.0008, + "step": 19907 + }, + { + "epoch": 0.39, + "learning_rate": 1.228845481728865e-07, + "loss": 0.0021, + "step": 19908 + }, + { + "epoch": 0.39, + "learning_rate": 1.2288066482855034e-07, + "loss": 0.0032, + "step": 19909 + }, + { + "epoch": 0.39, + "learning_rate": 1.2287678148421421e-07, + "loss": 0.3325, + "step": 19910 + }, + { + "epoch": 0.39, + "learning_rate": 1.2287289813987806e-07, + "loss": 0.0008, + "step": 19911 + }, + { + "epoch": 0.39, + "learning_rate": 1.2286901479554193e-07, + "loss": 0.1279, + "step": 19912 + }, + { + "epoch": 0.39, + "learning_rate": 1.2286513145120578e-07, + "loss": 0.001, + "step": 19913 + }, + { + "epoch": 0.39, + "learning_rate": 1.2286124810686965e-07, + "loss": 0.0007, + "step": 19914 + }, + { + "epoch": 0.39, + "learning_rate": 1.2285736476253347e-07, + "loss": 0.0007, + "step": 19915 + }, + { + "epoch": 0.39, + "learning_rate": 1.2285348141819734e-07, + "loss": 0.0079, + "step": 19916 + }, + { + "epoch": 0.39, + "learning_rate": 1.2284959807386118e-07, + "loss": 0.0007, + "step": 19917 + }, + { + "epoch": 0.39, + "learning_rate": 1.2284571472952505e-07, + "loss": 0.0079, + "step": 19918 + }, + { + "epoch": 0.39, + "learning_rate": 1.228418313851889e-07, + "loss": 0.0023, + "step": 19919 + }, + { + "epoch": 0.39, + "learning_rate": 1.2283794804085277e-07, + "loss": 0.0009, + "step": 19920 + }, + { + "epoch": 0.39, + "learning_rate": 1.2283406469651662e-07, + "loss": 0.0009, + "step": 19921 + }, + { + "epoch": 0.39, + "learning_rate": 1.228301813521805e-07, + "loss": 0.0007, + "step": 19922 + }, + { + "epoch": 0.39, + "learning_rate": 1.2282629800784433e-07, + "loss": 0.0007, + "step": 19923 + }, + { + "epoch": 0.39, + "learning_rate": 1.228224146635082e-07, + "loss": 0.001, + "step": 19924 + }, + { + "epoch": 0.39, + "learning_rate": 1.2281853131917205e-07, + "loss": 0.0009, + "step": 19925 + }, + { + "epoch": 0.39, + "learning_rate": 1.2281464797483592e-07, + "loss": 0.0007, + "step": 19926 + }, + { + "epoch": 0.39, + "learning_rate": 1.2281076463049977e-07, + "loss": 0.0007, + "step": 19927 + }, + { + "epoch": 0.39, + "learning_rate": 1.2280688128616364e-07, + "loss": 0.0009, + "step": 19928 + }, + { + "epoch": 0.39, + "learning_rate": 1.2280299794182748e-07, + "loss": 0.0007, + "step": 19929 + }, + { + "epoch": 0.39, + "learning_rate": 1.2279911459749135e-07, + "loss": 0.001, + "step": 19930 + }, + { + "epoch": 0.39, + "learning_rate": 1.227952312531552e-07, + "loss": 0.0034, + "step": 19931 + }, + { + "epoch": 0.39, + "learning_rate": 1.2279134790881907e-07, + "loss": 0.023, + "step": 19932 + }, + { + "epoch": 0.39, + "learning_rate": 1.2278746456448291e-07, + "loss": 0.0008, + "step": 19933 + }, + { + "epoch": 0.39, + "learning_rate": 1.2278358122014679e-07, + "loss": 0.0007, + "step": 19934 + }, + { + "epoch": 0.39, + "learning_rate": 1.2277969787581063e-07, + "loss": 0.0008, + "step": 19935 + }, + { + "epoch": 0.39, + "learning_rate": 1.227758145314745e-07, + "loss": 0.0009, + "step": 19936 + }, + { + "epoch": 0.39, + "learning_rate": 1.2277193118713835e-07, + "loss": 0.0019, + "step": 19937 + }, + { + "epoch": 0.39, + "learning_rate": 1.2276804784280222e-07, + "loss": 0.0008, + "step": 19938 + }, + { + "epoch": 0.39, + "learning_rate": 1.2276416449846606e-07, + "loss": 1.073, + "step": 19939 + }, + { + "epoch": 0.39, + "learning_rate": 1.2276028115412994e-07, + "loss": 0.8801, + "step": 19940 + }, + { + "epoch": 0.39, + "learning_rate": 1.2275639780979378e-07, + "loss": 0.3932, + "step": 19941 + }, + { + "epoch": 0.39, + "learning_rate": 1.2275251446545765e-07, + "loss": 0.0007, + "step": 19942 + }, + { + "epoch": 0.39, + "learning_rate": 1.227486311211215e-07, + "loss": 0.0024, + "step": 19943 + }, + { + "epoch": 0.39, + "learning_rate": 1.2274474777678537e-07, + "loss": 0.003, + "step": 19944 + }, + { + "epoch": 0.39, + "learning_rate": 1.2274086443244921e-07, + "loss": 0.0006, + "step": 19945 + }, + { + "epoch": 0.39, + "learning_rate": 1.2273698108811309e-07, + "loss": 0.0024, + "step": 19946 + }, + { + "epoch": 0.39, + "learning_rate": 1.2273309774377693e-07, + "loss": 1.072, + "step": 19947 + }, + { + "epoch": 0.39, + "learning_rate": 1.227292143994408e-07, + "loss": 0.0006, + "step": 19948 + }, + { + "epoch": 0.39, + "learning_rate": 1.2272533105510465e-07, + "loss": 0.0007, + "step": 19949 + }, + { + "epoch": 0.39, + "learning_rate": 1.2272144771076852e-07, + "loss": 0.0014, + "step": 19950 + }, + { + "epoch": 0.39, + "learning_rate": 1.2271756436643236e-07, + "loss": 0.0012, + "step": 19951 + }, + { + "epoch": 0.39, + "learning_rate": 1.2271368102209623e-07, + "loss": 0.5605, + "step": 19952 + }, + { + "epoch": 0.39, + "learning_rate": 1.2270979767776008e-07, + "loss": 0.0886, + "step": 19953 + }, + { + "epoch": 0.39, + "learning_rate": 1.2270591433342395e-07, + "loss": 0.0052, + "step": 19954 + }, + { + "epoch": 0.39, + "learning_rate": 1.227020309890878e-07, + "loss": 0.0008, + "step": 19955 + }, + { + "epoch": 0.39, + "learning_rate": 1.2269814764475167e-07, + "loss": 0.0008, + "step": 19956 + }, + { + "epoch": 0.39, + "learning_rate": 1.226942643004155e-07, + "loss": 0.0007, + "step": 19957 + }, + { + "epoch": 0.39, + "learning_rate": 1.2269038095607938e-07, + "loss": 0.0005, + "step": 19958 + }, + { + "epoch": 0.39, + "learning_rate": 1.2268649761174323e-07, + "loss": 0.0007, + "step": 19959 + }, + { + "epoch": 0.39, + "learning_rate": 1.226826142674071e-07, + "loss": 0.3467, + "step": 19960 + }, + { + "epoch": 0.39, + "learning_rate": 1.2267873092307095e-07, + "loss": 0.001, + "step": 19961 + }, + { + "epoch": 0.39, + "learning_rate": 1.2267484757873482e-07, + "loss": 0.0008, + "step": 19962 + }, + { + "epoch": 0.39, + "learning_rate": 1.2267096423439866e-07, + "loss": 0.0008, + "step": 19963 + }, + { + "epoch": 0.39, + "learning_rate": 1.2266708089006253e-07, + "loss": 0.0006, + "step": 19964 + }, + { + "epoch": 0.39, + "learning_rate": 1.2266319754572638e-07, + "loss": 0.0008, + "step": 19965 + }, + { + "epoch": 0.39, + "learning_rate": 1.2265931420139025e-07, + "loss": 0.0014, + "step": 19966 + }, + { + "epoch": 0.39, + "learning_rate": 1.226554308570541e-07, + "loss": 0.0039, + "step": 19967 + }, + { + "epoch": 0.39, + "learning_rate": 1.2265154751271797e-07, + "loss": 0.0007, + "step": 19968 + }, + { + "epoch": 0.39, + "learning_rate": 1.226476641683818e-07, + "loss": 0.0006, + "step": 19969 + }, + { + "epoch": 0.39, + "learning_rate": 1.2264378082404568e-07, + "loss": 0.0008, + "step": 19970 + }, + { + "epoch": 0.39, + "learning_rate": 1.2263989747970953e-07, + "loss": 0.0008, + "step": 19971 + }, + { + "epoch": 0.39, + "learning_rate": 1.226360141353734e-07, + "loss": 0.0006, + "step": 19972 + }, + { + "epoch": 0.39, + "learning_rate": 1.2263213079103722e-07, + "loss": 0.001, + "step": 19973 + }, + { + "epoch": 0.39, + "learning_rate": 1.226282474467011e-07, + "loss": 0.0074, + "step": 19974 + }, + { + "epoch": 0.39, + "learning_rate": 1.2262436410236493e-07, + "loss": 0.0007, + "step": 19975 + }, + { + "epoch": 0.39, + "learning_rate": 1.226204807580288e-07, + "loss": 0.0503, + "step": 19976 + }, + { + "epoch": 0.39, + "learning_rate": 1.2261659741369265e-07, + "loss": 0.0009, + "step": 19977 + }, + { + "epoch": 0.39, + "learning_rate": 1.2261271406935652e-07, + "loss": 0.0008, + "step": 19978 + }, + { + "epoch": 0.39, + "learning_rate": 1.2260883072502037e-07, + "loss": 0.0015, + "step": 19979 + }, + { + "epoch": 0.39, + "learning_rate": 1.2260494738068424e-07, + "loss": 0.7932, + "step": 19980 + }, + { + "epoch": 0.39, + "learning_rate": 1.2260106403634808e-07, + "loss": 0.0008, + "step": 19981 + }, + { + "epoch": 0.39, + "learning_rate": 1.2259718069201196e-07, + "loss": 0.0007, + "step": 19982 + }, + { + "epoch": 0.39, + "learning_rate": 1.225932973476758e-07, + "loss": 0.0006, + "step": 19983 + }, + { + "epoch": 0.39, + "learning_rate": 1.2258941400333967e-07, + "loss": 0.0017, + "step": 19984 + }, + { + "epoch": 0.39, + "learning_rate": 1.2258553065900352e-07, + "loss": 0.0047, + "step": 19985 + }, + { + "epoch": 0.39, + "learning_rate": 1.225816473146674e-07, + "loss": 0.0009, + "step": 19986 + }, + { + "epoch": 0.39, + "learning_rate": 1.2257776397033123e-07, + "loss": 0.0012, + "step": 19987 + }, + { + "epoch": 0.39, + "learning_rate": 1.225738806259951e-07, + "loss": 0.0007, + "step": 19988 + }, + { + "epoch": 0.39, + "learning_rate": 1.2256999728165895e-07, + "loss": 0.0101, + "step": 19989 + }, + { + "epoch": 0.39, + "learning_rate": 1.2256611393732282e-07, + "loss": 0.7172, + "step": 19990 + }, + { + "epoch": 0.39, + "learning_rate": 1.2256223059298667e-07, + "loss": 0.0008, + "step": 19991 + }, + { + "epoch": 0.39, + "learning_rate": 1.2255834724865054e-07, + "loss": 0.001, + "step": 19992 + }, + { + "epoch": 0.39, + "learning_rate": 1.2255446390431438e-07, + "loss": 0.0031, + "step": 19993 + }, + { + "epoch": 0.39, + "learning_rate": 1.2255058055997825e-07, + "loss": 0.0007, + "step": 19994 + }, + { + "epoch": 0.39, + "learning_rate": 1.225466972156421e-07, + "loss": 0.0008, + "step": 19995 + }, + { + "epoch": 0.39, + "learning_rate": 1.2254281387130597e-07, + "loss": 0.0071, + "step": 19996 + }, + { + "epoch": 0.39, + "learning_rate": 1.2253893052696982e-07, + "loss": 0.0007, + "step": 19997 + }, + { + "epoch": 0.39, + "learning_rate": 1.225350471826337e-07, + "loss": 0.0017, + "step": 19998 + }, + { + "epoch": 0.39, + "learning_rate": 1.2253116383829753e-07, + "loss": 0.001, + "step": 19999 + }, + { + "epoch": 0.39, + "learning_rate": 1.225272804939614e-07, + "loss": 0.0027, + "step": 20000 + }, + { + "epoch": 0.39, + "learning_rate": 1.2252339714962525e-07, + "loss": 0.2837, + "step": 20001 + }, + { + "epoch": 0.39, + "learning_rate": 1.2251951380528912e-07, + "loss": 0.0009, + "step": 20002 + }, + { + "epoch": 0.39, + "learning_rate": 1.2251563046095297e-07, + "loss": 0.001, + "step": 20003 + }, + { + "epoch": 0.39, + "learning_rate": 1.2251174711661684e-07, + "loss": 0.0007, + "step": 20004 + }, + { + "epoch": 0.39, + "learning_rate": 1.2250786377228068e-07, + "loss": 0.0008, + "step": 20005 + }, + { + "epoch": 0.39, + "learning_rate": 1.2250398042794455e-07, + "loss": 0.0006, + "step": 20006 + }, + { + "epoch": 0.39, + "learning_rate": 1.225000970836084e-07, + "loss": 0.0006, + "step": 20007 + }, + { + "epoch": 0.39, + "learning_rate": 1.2249621373927227e-07, + "loss": 0.2082, + "step": 20008 + }, + { + "epoch": 0.39, + "learning_rate": 1.2249233039493611e-07, + "loss": 0.0009, + "step": 20009 + }, + { + "epoch": 0.39, + "learning_rate": 1.2248844705059999e-07, + "loss": 0.0012, + "step": 20010 + }, + { + "epoch": 0.39, + "learning_rate": 1.2248456370626383e-07, + "loss": 0.0022, + "step": 20011 + }, + { + "epoch": 0.39, + "learning_rate": 1.224806803619277e-07, + "loss": 0.0007, + "step": 20012 + }, + { + "epoch": 0.39, + "learning_rate": 1.2247679701759155e-07, + "loss": 0.0007, + "step": 20013 + }, + { + "epoch": 0.39, + "learning_rate": 1.2247291367325542e-07, + "loss": 0.0011, + "step": 20014 + }, + { + "epoch": 0.39, + "learning_rate": 1.2246903032891926e-07, + "loss": 0.0007, + "step": 20015 + }, + { + "epoch": 0.39, + "learning_rate": 1.2246514698458314e-07, + "loss": 0.3883, + "step": 20016 + }, + { + "epoch": 0.39, + "learning_rate": 1.2246126364024698e-07, + "loss": 0.0013, + "step": 20017 + }, + { + "epoch": 0.39, + "learning_rate": 1.2245738029591085e-07, + "loss": 0.0007, + "step": 20018 + }, + { + "epoch": 0.39, + "learning_rate": 1.224534969515747e-07, + "loss": 0.0014, + "step": 20019 + }, + { + "epoch": 0.39, + "learning_rate": 1.2244961360723854e-07, + "loss": 0.2272, + "step": 20020 + }, + { + "epoch": 0.39, + "learning_rate": 1.2244573026290241e-07, + "loss": 0.0066, + "step": 20021 + }, + { + "epoch": 0.39, + "learning_rate": 1.2244184691856626e-07, + "loss": 0.0008, + "step": 20022 + }, + { + "epoch": 0.39, + "learning_rate": 1.2243796357423013e-07, + "loss": 0.0014, + "step": 20023 + }, + { + "epoch": 0.39, + "learning_rate": 1.2243408022989398e-07, + "loss": 0.0373, + "step": 20024 + }, + { + "epoch": 0.39, + "learning_rate": 1.2243019688555785e-07, + "loss": 0.0006, + "step": 20025 + }, + { + "epoch": 0.39, + "learning_rate": 1.224263135412217e-07, + "loss": 0.0024, + "step": 20026 + }, + { + "epoch": 0.39, + "learning_rate": 1.2242243019688556e-07, + "loss": 0.0007, + "step": 20027 + }, + { + "epoch": 0.39, + "learning_rate": 1.224185468525494e-07, + "loss": 0.0007, + "step": 20028 + }, + { + "epoch": 0.39, + "learning_rate": 1.2241466350821328e-07, + "loss": 0.0008, + "step": 20029 + }, + { + "epoch": 0.39, + "learning_rate": 1.2241078016387712e-07, + "loss": 0.0009, + "step": 20030 + }, + { + "epoch": 0.39, + "learning_rate": 1.2240689681954097e-07, + "loss": 0.0043, + "step": 20031 + }, + { + "epoch": 0.39, + "learning_rate": 1.2240301347520484e-07, + "loss": 0.0011, + "step": 20032 + }, + { + "epoch": 0.39, + "learning_rate": 1.2239913013086869e-07, + "loss": 0.0007, + "step": 20033 + }, + { + "epoch": 0.39, + "learning_rate": 1.2239524678653256e-07, + "loss": 0.0014, + "step": 20034 + }, + { + "epoch": 0.39, + "learning_rate": 1.223913634421964e-07, + "loss": 0.0007, + "step": 20035 + }, + { + "epoch": 0.39, + "learning_rate": 1.2238748009786027e-07, + "loss": 0.0013, + "step": 20036 + }, + { + "epoch": 0.39, + "learning_rate": 1.2238359675352412e-07, + "loss": 0.6481, + "step": 20037 + }, + { + "epoch": 0.39, + "learning_rate": 1.22379713409188e-07, + "loss": 0.001, + "step": 20038 + }, + { + "epoch": 0.39, + "learning_rate": 1.2237583006485184e-07, + "loss": 0.0008, + "step": 20039 + }, + { + "epoch": 0.39, + "learning_rate": 1.223719467205157e-07, + "loss": 0.0011, + "step": 20040 + }, + { + "epoch": 0.39, + "learning_rate": 1.2236806337617955e-07, + "loss": 0.0008, + "step": 20041 + }, + { + "epoch": 0.39, + "learning_rate": 1.2236418003184342e-07, + "loss": 0.0009, + "step": 20042 + }, + { + "epoch": 0.39, + "learning_rate": 1.2236029668750727e-07, + "loss": 0.0127, + "step": 20043 + }, + { + "epoch": 0.39, + "learning_rate": 1.2235641334317114e-07, + "loss": 0.001, + "step": 20044 + }, + { + "epoch": 0.39, + "learning_rate": 1.2235252999883499e-07, + "loss": 0.8492, + "step": 20045 + }, + { + "epoch": 0.39, + "learning_rate": 1.2234864665449886e-07, + "loss": 0.0007, + "step": 20046 + }, + { + "epoch": 0.39, + "learning_rate": 1.223447633101627e-07, + "loss": 0.0009, + "step": 20047 + }, + { + "epoch": 0.39, + "learning_rate": 1.2234087996582657e-07, + "loss": 0.0008, + "step": 20048 + }, + { + "epoch": 0.39, + "learning_rate": 1.2233699662149042e-07, + "loss": 0.0006, + "step": 20049 + }, + { + "epoch": 0.39, + "learning_rate": 1.2233311327715426e-07, + "loss": 0.0009, + "step": 20050 + }, + { + "epoch": 0.39, + "learning_rate": 1.2232922993281813e-07, + "loss": 0.0007, + "step": 20051 + }, + { + "epoch": 0.39, + "learning_rate": 1.2232534658848198e-07, + "loss": 0.0814, + "step": 20052 + }, + { + "epoch": 0.39, + "learning_rate": 1.2232146324414585e-07, + "loss": 0.0015, + "step": 20053 + }, + { + "epoch": 0.39, + "learning_rate": 1.223175798998097e-07, + "loss": 0.0008, + "step": 20054 + }, + { + "epoch": 0.39, + "learning_rate": 1.2231369655547357e-07, + "loss": 0.0007, + "step": 20055 + }, + { + "epoch": 0.39, + "learning_rate": 1.223098132111374e-07, + "loss": 0.0009, + "step": 20056 + }, + { + "epoch": 0.39, + "learning_rate": 1.2230592986680128e-07, + "loss": 0.0009, + "step": 20057 + }, + { + "epoch": 0.39, + "learning_rate": 1.2230204652246513e-07, + "loss": 0.0008, + "step": 20058 + }, + { + "epoch": 0.39, + "learning_rate": 1.22298163178129e-07, + "loss": 0.008, + "step": 20059 + }, + { + "epoch": 0.39, + "learning_rate": 1.2229427983379285e-07, + "loss": 0.0007, + "step": 20060 + }, + { + "epoch": 0.39, + "learning_rate": 1.2229039648945672e-07, + "loss": 0.0083, + "step": 20061 + }, + { + "epoch": 0.39, + "learning_rate": 1.2228651314512056e-07, + "loss": 0.0006, + "step": 20062 + }, + { + "epoch": 0.39, + "learning_rate": 1.2228262980078443e-07, + "loss": 0.0006, + "step": 20063 + }, + { + "epoch": 0.39, + "learning_rate": 1.2227874645644828e-07, + "loss": 0.0008, + "step": 20064 + }, + { + "epoch": 0.39, + "learning_rate": 1.2227486311211215e-07, + "loss": 0.2908, + "step": 20065 + }, + { + "epoch": 0.39, + "learning_rate": 1.22270979767776e-07, + "loss": 0.0006, + "step": 20066 + }, + { + "epoch": 0.39, + "learning_rate": 1.2226709642343987e-07, + "loss": 0.0008, + "step": 20067 + }, + { + "epoch": 0.39, + "learning_rate": 1.222632130791037e-07, + "loss": 0.0007, + "step": 20068 + }, + { + "epoch": 0.39, + "learning_rate": 1.2225932973476758e-07, + "loss": 0.0007, + "step": 20069 + }, + { + "epoch": 0.39, + "learning_rate": 1.2225544639043143e-07, + "loss": 0.001, + "step": 20070 + }, + { + "epoch": 0.39, + "learning_rate": 1.222515630460953e-07, + "loss": 0.0009, + "step": 20071 + }, + { + "epoch": 0.39, + "learning_rate": 1.2224767970175914e-07, + "loss": 1.1668, + "step": 20072 + }, + { + "epoch": 0.39, + "learning_rate": 1.2224379635742302e-07, + "loss": 0.0007, + "step": 20073 + }, + { + "epoch": 0.39, + "learning_rate": 1.2223991301308686e-07, + "loss": 0.0028, + "step": 20074 + }, + { + "epoch": 0.39, + "learning_rate": 1.2223602966875073e-07, + "loss": 0.0011, + "step": 20075 + }, + { + "epoch": 0.39, + "learning_rate": 1.2223214632441458e-07, + "loss": 0.0007, + "step": 20076 + }, + { + "epoch": 0.39, + "learning_rate": 1.2222826298007845e-07, + "loss": 0.0008, + "step": 20077 + }, + { + "epoch": 0.39, + "learning_rate": 1.222243796357423e-07, + "loss": 0.002, + "step": 20078 + }, + { + "epoch": 0.39, + "learning_rate": 1.2222049629140617e-07, + "loss": 0.0009, + "step": 20079 + }, + { + "epoch": 0.39, + "learning_rate": 1.2221661294707e-07, + "loss": 1.0074, + "step": 20080 + }, + { + "epoch": 0.39, + "learning_rate": 1.2221272960273388e-07, + "loss": 0.0008, + "step": 20081 + }, + { + "epoch": 0.39, + "learning_rate": 1.2220884625839773e-07, + "loss": 0.0011, + "step": 20082 + }, + { + "epoch": 0.39, + "learning_rate": 1.222049629140616e-07, + "loss": 0.0011, + "step": 20083 + }, + { + "epoch": 0.39, + "learning_rate": 1.2220107956972544e-07, + "loss": 0.0007, + "step": 20084 + }, + { + "epoch": 0.39, + "learning_rate": 1.2219719622538931e-07, + "loss": 0.001, + "step": 20085 + }, + { + "epoch": 0.39, + "learning_rate": 1.2219331288105316e-07, + "loss": 0.0006, + "step": 20086 + }, + { + "epoch": 0.39, + "learning_rate": 1.2218942953671703e-07, + "loss": 0.0006, + "step": 20087 + }, + { + "epoch": 0.39, + "learning_rate": 1.2218554619238088e-07, + "loss": 0.0126, + "step": 20088 + }, + { + "epoch": 0.39, + "learning_rate": 1.2218166284804472e-07, + "loss": 0.0012, + "step": 20089 + }, + { + "epoch": 0.39, + "learning_rate": 1.2217777950370857e-07, + "loss": 0.3175, + "step": 20090 + }, + { + "epoch": 0.39, + "learning_rate": 1.2217389615937244e-07, + "loss": 0.0008, + "step": 20091 + }, + { + "epoch": 0.39, + "learning_rate": 1.2217001281503628e-07, + "loss": 0.0007, + "step": 20092 + }, + { + "epoch": 0.39, + "learning_rate": 1.2216612947070015e-07, + "loss": 0.0008, + "step": 20093 + }, + { + "epoch": 0.39, + "learning_rate": 1.22162246126364e-07, + "loss": 0.0094, + "step": 20094 + }, + { + "epoch": 0.39, + "learning_rate": 1.2215836278202787e-07, + "loss": 0.0007, + "step": 20095 + }, + { + "epoch": 0.39, + "learning_rate": 1.2215447943769172e-07, + "loss": 0.0013, + "step": 20096 + }, + { + "epoch": 0.39, + "learning_rate": 1.221505960933556e-07, + "loss": 0.5203, + "step": 20097 + }, + { + "epoch": 0.39, + "learning_rate": 1.2214671274901943e-07, + "loss": 0.4836, + "step": 20098 + }, + { + "epoch": 0.39, + "learning_rate": 1.221428294046833e-07, + "loss": 0.0008, + "step": 20099 + }, + { + "epoch": 0.39, + "learning_rate": 1.2213894606034715e-07, + "loss": 0.0006, + "step": 20100 + }, + { + "epoch": 0.39, + "learning_rate": 1.2213506271601102e-07, + "loss": 0.0008, + "step": 20101 + }, + { + "epoch": 0.39, + "learning_rate": 1.2213117937167487e-07, + "loss": 0.0008, + "step": 20102 + }, + { + "epoch": 0.39, + "learning_rate": 1.2212729602733874e-07, + "loss": 0.0087, + "step": 20103 + }, + { + "epoch": 0.39, + "learning_rate": 1.2212341268300258e-07, + "loss": 0.0009, + "step": 20104 + }, + { + "epoch": 0.39, + "learning_rate": 1.2211952933866645e-07, + "loss": 0.0007, + "step": 20105 + }, + { + "epoch": 0.39, + "learning_rate": 1.221156459943303e-07, + "loss": 0.0008, + "step": 20106 + }, + { + "epoch": 0.39, + "learning_rate": 1.2211176264999417e-07, + "loss": 0.0011, + "step": 20107 + }, + { + "epoch": 0.39, + "learning_rate": 1.2210787930565801e-07, + "loss": 0.0009, + "step": 20108 + }, + { + "epoch": 0.39, + "learning_rate": 1.2210399596132189e-07, + "loss": 0.0022, + "step": 20109 + }, + { + "epoch": 0.39, + "learning_rate": 1.2210011261698573e-07, + "loss": 0.0009, + "step": 20110 + }, + { + "epoch": 0.39, + "learning_rate": 1.220962292726496e-07, + "loss": 0.8503, + "step": 20111 + }, + { + "epoch": 0.39, + "learning_rate": 1.2209234592831345e-07, + "loss": 0.0007, + "step": 20112 + }, + { + "epoch": 0.39, + "learning_rate": 1.2208846258397732e-07, + "loss": 0.0006, + "step": 20113 + }, + { + "epoch": 0.39, + "learning_rate": 1.2208457923964116e-07, + "loss": 0.0025, + "step": 20114 + }, + { + "epoch": 0.39, + "learning_rate": 1.2208069589530504e-07, + "loss": 0.0008, + "step": 20115 + }, + { + "epoch": 0.39, + "learning_rate": 1.2207681255096888e-07, + "loss": 0.0006, + "step": 20116 + }, + { + "epoch": 0.39, + "learning_rate": 1.2207292920663275e-07, + "loss": 0.1924, + "step": 20117 + }, + { + "epoch": 0.39, + "learning_rate": 1.220690458622966e-07, + "loss": 0.0009, + "step": 20118 + }, + { + "epoch": 0.39, + "learning_rate": 1.2206516251796047e-07, + "loss": 0.0006, + "step": 20119 + }, + { + "epoch": 0.39, + "learning_rate": 1.2206127917362431e-07, + "loss": 0.1433, + "step": 20120 + }, + { + "epoch": 0.39, + "learning_rate": 1.2205739582928819e-07, + "loss": 0.0008, + "step": 20121 + }, + { + "epoch": 0.39, + "learning_rate": 1.2205351248495203e-07, + "loss": 0.0007, + "step": 20122 + }, + { + "epoch": 0.39, + "learning_rate": 1.220496291406159e-07, + "loss": 0.0007, + "step": 20123 + }, + { + "epoch": 0.39, + "learning_rate": 1.2204574579627975e-07, + "loss": 0.1831, + "step": 20124 + }, + { + "epoch": 0.39, + "learning_rate": 1.2204186245194362e-07, + "loss": 0.0104, + "step": 20125 + }, + { + "epoch": 0.39, + "learning_rate": 1.2203797910760746e-07, + "loss": 0.0114, + "step": 20126 + }, + { + "epoch": 0.39, + "learning_rate": 1.2203409576327133e-07, + "loss": 0.0075, + "step": 20127 + }, + { + "epoch": 0.39, + "learning_rate": 1.2203021241893518e-07, + "loss": 0.0178, + "step": 20128 + }, + { + "epoch": 0.39, + "learning_rate": 1.2202632907459905e-07, + "loss": 0.0006, + "step": 20129 + }, + { + "epoch": 0.39, + "learning_rate": 1.220224457302629e-07, + "loss": 0.0011, + "step": 20130 + }, + { + "epoch": 0.39, + "learning_rate": 1.2201856238592677e-07, + "loss": 0.0008, + "step": 20131 + }, + { + "epoch": 0.39, + "learning_rate": 1.220146790415906e-07, + "loss": 0.0008, + "step": 20132 + }, + { + "epoch": 0.39, + "learning_rate": 1.2201079569725448e-07, + "loss": 0.085, + "step": 20133 + }, + { + "epoch": 0.39, + "learning_rate": 1.2200691235291833e-07, + "loss": 0.0007, + "step": 20134 + }, + { + "epoch": 0.39, + "learning_rate": 1.220030290085822e-07, + "loss": 0.0013, + "step": 20135 + }, + { + "epoch": 0.39, + "learning_rate": 1.2199914566424605e-07, + "loss": 0.0009, + "step": 20136 + }, + { + "epoch": 0.39, + "learning_rate": 1.2199526231990992e-07, + "loss": 0.0015, + "step": 20137 + }, + { + "epoch": 0.39, + "learning_rate": 1.2199137897557376e-07, + "loss": 0.0007, + "step": 20138 + }, + { + "epoch": 0.39, + "learning_rate": 1.2198749563123763e-07, + "loss": 0.0006, + "step": 20139 + }, + { + "epoch": 0.39, + "learning_rate": 1.2198361228690148e-07, + "loss": 0.3589, + "step": 20140 + }, + { + "epoch": 0.39, + "learning_rate": 1.2197972894256535e-07, + "loss": 0.0012, + "step": 20141 + }, + { + "epoch": 0.39, + "learning_rate": 1.219758455982292e-07, + "loss": 0.0018, + "step": 20142 + }, + { + "epoch": 0.39, + "learning_rate": 1.2197196225389307e-07, + "loss": 0.0008, + "step": 20143 + }, + { + "epoch": 0.39, + "learning_rate": 1.219680789095569e-07, + "loss": 0.0008, + "step": 20144 + }, + { + "epoch": 0.39, + "learning_rate": 1.2196419556522078e-07, + "loss": 0.001, + "step": 20145 + }, + { + "epoch": 0.39, + "learning_rate": 1.2196031222088463e-07, + "loss": 0.0009, + "step": 20146 + }, + { + "epoch": 0.39, + "learning_rate": 1.2195642887654847e-07, + "loss": 0.0013, + "step": 20147 + }, + { + "epoch": 0.39, + "learning_rate": 1.2195254553221232e-07, + "loss": 0.0006, + "step": 20148 + }, + { + "epoch": 0.39, + "learning_rate": 1.219486621878762e-07, + "loss": 0.001, + "step": 20149 + }, + { + "epoch": 0.39, + "learning_rate": 1.2194477884354003e-07, + "loss": 0.0025, + "step": 20150 + }, + { + "epoch": 0.39, + "learning_rate": 1.219408954992039e-07, + "loss": 0.0006, + "step": 20151 + }, + { + "epoch": 0.39, + "learning_rate": 1.2193701215486775e-07, + "loss": 0.0008, + "step": 20152 + }, + { + "epoch": 0.39, + "learning_rate": 1.2193312881053162e-07, + "loss": 0.001, + "step": 20153 + }, + { + "epoch": 0.39, + "learning_rate": 1.2192924546619547e-07, + "loss": 0.0006, + "step": 20154 + }, + { + "epoch": 0.39, + "learning_rate": 1.2192536212185934e-07, + "loss": 0.1789, + "step": 20155 + }, + { + "epoch": 0.39, + "learning_rate": 1.2192147877752318e-07, + "loss": 0.0008, + "step": 20156 + }, + { + "epoch": 0.39, + "learning_rate": 1.2191759543318706e-07, + "loss": 0.8191, + "step": 20157 + }, + { + "epoch": 0.39, + "learning_rate": 1.219137120888509e-07, + "loss": 0.3689, + "step": 20158 + }, + { + "epoch": 0.39, + "learning_rate": 1.2190982874451477e-07, + "loss": 0.0016, + "step": 20159 + }, + { + "epoch": 0.39, + "learning_rate": 1.2190594540017862e-07, + "loss": 0.0014, + "step": 20160 + }, + { + "epoch": 0.39, + "learning_rate": 1.219020620558425e-07, + "loss": 0.0032, + "step": 20161 + }, + { + "epoch": 0.39, + "learning_rate": 1.2189817871150633e-07, + "loss": 0.2025, + "step": 20162 + }, + { + "epoch": 0.39, + "learning_rate": 1.218942953671702e-07, + "loss": 0.0006, + "step": 20163 + }, + { + "epoch": 0.39, + "learning_rate": 1.2189041202283405e-07, + "loss": 0.0008, + "step": 20164 + }, + { + "epoch": 0.39, + "learning_rate": 1.2188652867849792e-07, + "loss": 0.0008, + "step": 20165 + }, + { + "epoch": 0.39, + "learning_rate": 1.2188264533416177e-07, + "loss": 0.0008, + "step": 20166 + }, + { + "epoch": 0.39, + "learning_rate": 1.2187876198982564e-07, + "loss": 0.0016, + "step": 20167 + }, + { + "epoch": 0.39, + "learning_rate": 1.2187487864548948e-07, + "loss": 0.0007, + "step": 20168 + }, + { + "epoch": 0.39, + "learning_rate": 1.2187099530115335e-07, + "loss": 0.0007, + "step": 20169 + }, + { + "epoch": 0.39, + "learning_rate": 1.218671119568172e-07, + "loss": 0.0008, + "step": 20170 + }, + { + "epoch": 0.39, + "learning_rate": 1.2186322861248107e-07, + "loss": 0.0006, + "step": 20171 + }, + { + "epoch": 0.39, + "learning_rate": 1.2185934526814492e-07, + "loss": 0.0006, + "step": 20172 + }, + { + "epoch": 0.39, + "learning_rate": 1.218554619238088e-07, + "loss": 0.0015, + "step": 20173 + }, + { + "epoch": 0.39, + "learning_rate": 1.2185157857947263e-07, + "loss": 0.0011, + "step": 20174 + }, + { + "epoch": 0.39, + "learning_rate": 1.218476952351365e-07, + "loss": 0.0008, + "step": 20175 + }, + { + "epoch": 0.39, + "learning_rate": 1.2184381189080035e-07, + "loss": 0.0005, + "step": 20176 + }, + { + "epoch": 0.39, + "learning_rate": 1.2183992854646422e-07, + "loss": 0.0008, + "step": 20177 + }, + { + "epoch": 0.39, + "learning_rate": 1.2183604520212807e-07, + "loss": 0.0605, + "step": 20178 + }, + { + "epoch": 0.39, + "learning_rate": 1.2183216185779194e-07, + "loss": 1.3205, + "step": 20179 + }, + { + "epoch": 0.39, + "learning_rate": 1.2182827851345578e-07, + "loss": 0.0007, + "step": 20180 + }, + { + "epoch": 0.39, + "learning_rate": 1.2182439516911965e-07, + "loss": 0.0005, + "step": 20181 + }, + { + "epoch": 0.39, + "learning_rate": 1.218205118247835e-07, + "loss": 0.001, + "step": 20182 + }, + { + "epoch": 0.39, + "learning_rate": 1.2181662848044737e-07, + "loss": 0.0013, + "step": 20183 + }, + { + "epoch": 0.39, + "learning_rate": 1.2181274513611121e-07, + "loss": 0.0007, + "step": 20184 + }, + { + "epoch": 0.39, + "learning_rate": 1.2180886179177509e-07, + "loss": 0.0084, + "step": 20185 + }, + { + "epoch": 0.39, + "learning_rate": 1.2180497844743893e-07, + "loss": 0.0014, + "step": 20186 + }, + { + "epoch": 0.39, + "learning_rate": 1.218010951031028e-07, + "loss": 0.0007, + "step": 20187 + }, + { + "epoch": 0.39, + "learning_rate": 1.2179721175876665e-07, + "loss": 0.0007, + "step": 20188 + }, + { + "epoch": 0.39, + "learning_rate": 1.2179332841443052e-07, + "loss": 0.0006, + "step": 20189 + }, + { + "epoch": 0.39, + "learning_rate": 1.2178944507009436e-07, + "loss": 0.0009, + "step": 20190 + }, + { + "epoch": 0.39, + "learning_rate": 1.2178556172575824e-07, + "loss": 0.0007, + "step": 20191 + }, + { + "epoch": 0.39, + "learning_rate": 1.2178167838142208e-07, + "loss": 0.0009, + "step": 20192 + }, + { + "epoch": 0.39, + "learning_rate": 1.2177779503708595e-07, + "loss": 0.0023, + "step": 20193 + }, + { + "epoch": 0.39, + "learning_rate": 1.217739116927498e-07, + "loss": 0.0009, + "step": 20194 + }, + { + "epoch": 0.39, + "learning_rate": 1.2177002834841367e-07, + "loss": 0.001, + "step": 20195 + }, + { + "epoch": 0.39, + "learning_rate": 1.2176614500407751e-07, + "loss": 0.2335, + "step": 20196 + }, + { + "epoch": 0.39, + "learning_rate": 1.2176226165974136e-07, + "loss": 0.0007, + "step": 20197 + }, + { + "epoch": 0.39, + "learning_rate": 1.2175837831540523e-07, + "loss": 0.0012, + "step": 20198 + }, + { + "epoch": 0.39, + "learning_rate": 1.2175449497106908e-07, + "loss": 0.0011, + "step": 20199 + }, + { + "epoch": 0.39, + "learning_rate": 1.2175061162673295e-07, + "loss": 0.0006, + "step": 20200 + }, + { + "epoch": 0.39, + "learning_rate": 1.217467282823968e-07, + "loss": 0.0007, + "step": 20201 + }, + { + "epoch": 0.39, + "learning_rate": 1.2174284493806066e-07, + "loss": 0.0013, + "step": 20202 + }, + { + "epoch": 0.39, + "learning_rate": 1.217389615937245e-07, + "loss": 0.0006, + "step": 20203 + }, + { + "epoch": 0.39, + "learning_rate": 1.2173507824938838e-07, + "loss": 0.0142, + "step": 20204 + }, + { + "epoch": 0.39, + "learning_rate": 1.2173119490505222e-07, + "loss": 0.0007, + "step": 20205 + }, + { + "epoch": 0.39, + "learning_rate": 1.2172731156071607e-07, + "loss": 0.0008, + "step": 20206 + }, + { + "epoch": 0.39, + "learning_rate": 1.2172342821637994e-07, + "loss": 0.0056, + "step": 20207 + }, + { + "epoch": 0.39, + "learning_rate": 1.2171954487204379e-07, + "loss": 0.0007, + "step": 20208 + }, + { + "epoch": 0.39, + "learning_rate": 1.2171566152770766e-07, + "loss": 0.0014, + "step": 20209 + }, + { + "epoch": 0.39, + "learning_rate": 1.217117781833715e-07, + "loss": 0.001, + "step": 20210 + }, + { + "epoch": 0.39, + "learning_rate": 1.2170789483903537e-07, + "loss": 0.001, + "step": 20211 + }, + { + "epoch": 0.39, + "learning_rate": 1.2170401149469922e-07, + "loss": 0.7938, + "step": 20212 + }, + { + "epoch": 0.39, + "learning_rate": 1.217001281503631e-07, + "loss": 0.0013, + "step": 20213 + }, + { + "epoch": 0.39, + "learning_rate": 1.2169624480602694e-07, + "loss": 0.0011, + "step": 20214 + }, + { + "epoch": 0.39, + "learning_rate": 1.216923614616908e-07, + "loss": 0.0008, + "step": 20215 + }, + { + "epoch": 0.39, + "learning_rate": 1.2168847811735465e-07, + "loss": 0.0006, + "step": 20216 + }, + { + "epoch": 0.39, + "learning_rate": 1.2168459477301852e-07, + "loss": 0.0007, + "step": 20217 + }, + { + "epoch": 0.39, + "learning_rate": 1.2168071142868237e-07, + "loss": 0.0038, + "step": 20218 + }, + { + "epoch": 0.39, + "learning_rate": 1.2167682808434624e-07, + "loss": 0.0007, + "step": 20219 + }, + { + "epoch": 0.39, + "learning_rate": 1.2167294474001009e-07, + "loss": 1.0518, + "step": 20220 + }, + { + "epoch": 0.39, + "learning_rate": 1.2166906139567396e-07, + "loss": 0.0935, + "step": 20221 + }, + { + "epoch": 0.39, + "learning_rate": 1.216651780513378e-07, + "loss": 0.0011, + "step": 20222 + }, + { + "epoch": 0.39, + "learning_rate": 1.2166129470700167e-07, + "loss": 0.3182, + "step": 20223 + }, + { + "epoch": 0.39, + "learning_rate": 1.2165741136266552e-07, + "loss": 0.0018, + "step": 20224 + }, + { + "epoch": 0.39, + "learning_rate": 1.216535280183294e-07, + "loss": 0.0012, + "step": 20225 + }, + { + "epoch": 0.39, + "learning_rate": 1.2164964467399323e-07, + "loss": 0.0012, + "step": 20226 + }, + { + "epoch": 0.39, + "learning_rate": 1.2164576132965708e-07, + "loss": 0.0007, + "step": 20227 + }, + { + "epoch": 0.39, + "learning_rate": 1.2164187798532095e-07, + "loss": 0.0023, + "step": 20228 + }, + { + "epoch": 0.39, + "learning_rate": 1.216379946409848e-07, + "loss": 0.0007, + "step": 20229 + }, + { + "epoch": 0.39, + "learning_rate": 1.2163411129664867e-07, + "loss": 0.0008, + "step": 20230 + }, + { + "epoch": 0.39, + "learning_rate": 1.216302279523125e-07, + "loss": 0.0114, + "step": 20231 + }, + { + "epoch": 0.39, + "learning_rate": 1.2162634460797638e-07, + "loss": 0.0006, + "step": 20232 + }, + { + "epoch": 0.39, + "learning_rate": 1.2162246126364023e-07, + "loss": 0.0539, + "step": 20233 + }, + { + "epoch": 0.39, + "learning_rate": 1.216185779193041e-07, + "loss": 0.0011, + "step": 20234 + }, + { + "epoch": 0.39, + "learning_rate": 1.2161469457496795e-07, + "loss": 0.0007, + "step": 20235 + }, + { + "epoch": 0.39, + "learning_rate": 1.2161081123063182e-07, + "loss": 0.0009, + "step": 20236 + }, + { + "epoch": 0.39, + "learning_rate": 1.2160692788629566e-07, + "loss": 0.0015, + "step": 20237 + }, + { + "epoch": 0.39, + "learning_rate": 1.2160304454195953e-07, + "loss": 0.0009, + "step": 20238 + }, + { + "epoch": 0.39, + "learning_rate": 1.2159916119762338e-07, + "loss": 0.0586, + "step": 20239 + }, + { + "epoch": 0.39, + "learning_rate": 1.2159527785328725e-07, + "loss": 0.0007, + "step": 20240 + }, + { + "epoch": 0.39, + "learning_rate": 1.215913945089511e-07, + "loss": 0.0009, + "step": 20241 + }, + { + "epoch": 0.39, + "learning_rate": 1.2158751116461497e-07, + "loss": 0.0007, + "step": 20242 + }, + { + "epoch": 0.39, + "learning_rate": 1.215836278202788e-07, + "loss": 0.001, + "step": 20243 + }, + { + "epoch": 0.39, + "learning_rate": 1.2157974447594268e-07, + "loss": 0.0007, + "step": 20244 + }, + { + "epoch": 0.39, + "learning_rate": 1.2157586113160653e-07, + "loss": 0.0005, + "step": 20245 + }, + { + "epoch": 0.39, + "learning_rate": 1.215719777872704e-07, + "loss": 0.0007, + "step": 20246 + }, + { + "epoch": 0.39, + "learning_rate": 1.2156809444293424e-07, + "loss": 0.0066, + "step": 20247 + }, + { + "epoch": 0.39, + "learning_rate": 1.2156421109859812e-07, + "loss": 0.0007, + "step": 20248 + }, + { + "epoch": 0.39, + "learning_rate": 1.2156032775426196e-07, + "loss": 0.0007, + "step": 20249 + }, + { + "epoch": 0.39, + "learning_rate": 1.2155644440992583e-07, + "loss": 1.1864, + "step": 20250 + }, + { + "epoch": 0.39, + "learning_rate": 1.2155256106558968e-07, + "loss": 0.0006, + "step": 20251 + }, + { + "epoch": 0.39, + "learning_rate": 1.2154867772125355e-07, + "loss": 0.0007, + "step": 20252 + }, + { + "epoch": 0.39, + "learning_rate": 1.215447943769174e-07, + "loss": 0.0031, + "step": 20253 + }, + { + "epoch": 0.39, + "learning_rate": 1.2154091103258127e-07, + "loss": 0.0008, + "step": 20254 + }, + { + "epoch": 0.39, + "learning_rate": 1.215370276882451e-07, + "loss": 0.0007, + "step": 20255 + }, + { + "epoch": 0.39, + "learning_rate": 1.2153314434390898e-07, + "loss": 0.0056, + "step": 20256 + }, + { + "epoch": 0.39, + "learning_rate": 1.2152926099957283e-07, + "loss": 0.0007, + "step": 20257 + }, + { + "epoch": 0.39, + "learning_rate": 1.215253776552367e-07, + "loss": 0.0009, + "step": 20258 + }, + { + "epoch": 0.39, + "learning_rate": 1.2152149431090054e-07, + "loss": 0.0008, + "step": 20259 + }, + { + "epoch": 0.39, + "learning_rate": 1.2151761096656442e-07, + "loss": 0.0008, + "step": 20260 + }, + { + "epoch": 0.39, + "learning_rate": 1.2151372762222826e-07, + "loss": 0.0006, + "step": 20261 + }, + { + "epoch": 0.39, + "learning_rate": 1.2150984427789213e-07, + "loss": 0.8874, + "step": 20262 + }, + { + "epoch": 0.39, + "learning_rate": 1.2150596093355595e-07, + "loss": 0.0007, + "step": 20263 + }, + { + "epoch": 0.39, + "learning_rate": 1.2150207758921982e-07, + "loss": 0.0011, + "step": 20264 + }, + { + "epoch": 0.39, + "learning_rate": 1.2149819424488367e-07, + "loss": 0.0019, + "step": 20265 + }, + { + "epoch": 0.39, + "learning_rate": 1.2149431090054754e-07, + "loss": 0.0008, + "step": 20266 + }, + { + "epoch": 0.39, + "learning_rate": 1.2149042755621138e-07, + "loss": 0.0613, + "step": 20267 + }, + { + "epoch": 0.39, + "learning_rate": 1.2148654421187525e-07, + "loss": 0.91, + "step": 20268 + }, + { + "epoch": 0.39, + "learning_rate": 1.214826608675391e-07, + "loss": 0.0007, + "step": 20269 + }, + { + "epoch": 0.39, + "learning_rate": 1.2147877752320297e-07, + "loss": 0.0008, + "step": 20270 + }, + { + "epoch": 0.39, + "learning_rate": 1.2147489417886682e-07, + "loss": 0.0011, + "step": 20271 + }, + { + "epoch": 0.39, + "learning_rate": 1.214710108345307e-07, + "loss": 0.0006, + "step": 20272 + }, + { + "epoch": 0.39, + "learning_rate": 1.2146712749019453e-07, + "loss": 0.0188, + "step": 20273 + }, + { + "epoch": 0.39, + "learning_rate": 1.214632441458584e-07, + "loss": 0.0009, + "step": 20274 + }, + { + "epoch": 0.39, + "learning_rate": 1.2145936080152225e-07, + "loss": 0.0007, + "step": 20275 + }, + { + "epoch": 0.39, + "learning_rate": 1.2145547745718612e-07, + "loss": 0.0563, + "step": 20276 + }, + { + "epoch": 0.39, + "learning_rate": 1.2145159411284997e-07, + "loss": 0.0349, + "step": 20277 + }, + { + "epoch": 0.39, + "learning_rate": 1.2144771076851384e-07, + "loss": 0.0008, + "step": 20278 + }, + { + "epoch": 0.39, + "learning_rate": 1.2144382742417768e-07, + "loss": 0.0008, + "step": 20279 + }, + { + "epoch": 0.39, + "learning_rate": 1.2143994407984155e-07, + "loss": 0.0009, + "step": 20280 + }, + { + "epoch": 0.39, + "learning_rate": 1.214360607355054e-07, + "loss": 0.0007, + "step": 20281 + }, + { + "epoch": 0.39, + "learning_rate": 1.2143217739116927e-07, + "loss": 0.0006, + "step": 20282 + }, + { + "epoch": 0.39, + "learning_rate": 1.2142829404683311e-07, + "loss": 0.002, + "step": 20283 + }, + { + "epoch": 0.39, + "learning_rate": 1.2142441070249699e-07, + "loss": 0.0185, + "step": 20284 + }, + { + "epoch": 0.39, + "learning_rate": 1.2142052735816083e-07, + "loss": 0.0009, + "step": 20285 + }, + { + "epoch": 0.39, + "learning_rate": 1.214166440138247e-07, + "loss": 0.0006, + "step": 20286 + }, + { + "epoch": 0.39, + "learning_rate": 1.2141276066948855e-07, + "loss": 0.0008, + "step": 20287 + }, + { + "epoch": 0.39, + "learning_rate": 1.2140887732515242e-07, + "loss": 0.0009, + "step": 20288 + }, + { + "epoch": 0.39, + "learning_rate": 1.2140499398081626e-07, + "loss": 0.0014, + "step": 20289 + }, + { + "epoch": 0.39, + "learning_rate": 1.2140111063648014e-07, + "loss": 0.0007, + "step": 20290 + }, + { + "epoch": 0.39, + "learning_rate": 1.2139722729214398e-07, + "loss": 0.0007, + "step": 20291 + }, + { + "epoch": 0.39, + "learning_rate": 1.2139334394780785e-07, + "loss": 0.0357, + "step": 20292 + }, + { + "epoch": 0.39, + "learning_rate": 1.213894606034717e-07, + "loss": 0.0008, + "step": 20293 + }, + { + "epoch": 0.39, + "learning_rate": 1.2138557725913557e-07, + "loss": 0.0009, + "step": 20294 + }, + { + "epoch": 0.39, + "learning_rate": 1.2138169391479941e-07, + "loss": 0.026, + "step": 20295 + }, + { + "epoch": 0.39, + "learning_rate": 1.2137781057046329e-07, + "loss": 0.0008, + "step": 20296 + }, + { + "epoch": 0.39, + "learning_rate": 1.2137392722612713e-07, + "loss": 0.0678, + "step": 20297 + }, + { + "epoch": 0.39, + "learning_rate": 1.21370043881791e-07, + "loss": 0.0024, + "step": 20298 + }, + { + "epoch": 0.39, + "learning_rate": 1.2136616053745485e-07, + "loss": 0.0005, + "step": 20299 + }, + { + "epoch": 0.39, + "learning_rate": 1.2136227719311872e-07, + "loss": 0.0007, + "step": 20300 + }, + { + "epoch": 0.39, + "learning_rate": 1.2135839384878256e-07, + "loss": 0.0007, + "step": 20301 + }, + { + "epoch": 0.39, + "learning_rate": 1.2135451050444643e-07, + "loss": 0.0008, + "step": 20302 + }, + { + "epoch": 0.39, + "learning_rate": 1.2135062716011028e-07, + "loss": 0.7415, + "step": 20303 + }, + { + "epoch": 0.39, + "learning_rate": 1.2134674381577415e-07, + "loss": 0.0006, + "step": 20304 + }, + { + "epoch": 0.39, + "learning_rate": 1.21342860471438e-07, + "loss": 0.001, + "step": 20305 + }, + { + "epoch": 0.39, + "learning_rate": 1.2133897712710187e-07, + "loss": 0.0007, + "step": 20306 + }, + { + "epoch": 0.39, + "learning_rate": 1.213350937827657e-07, + "loss": 0.0029, + "step": 20307 + }, + { + "epoch": 0.39, + "learning_rate": 1.2133121043842958e-07, + "loss": 0.0009, + "step": 20308 + }, + { + "epoch": 0.39, + "learning_rate": 1.2132732709409343e-07, + "loss": 0.0007, + "step": 20309 + }, + { + "epoch": 0.39, + "learning_rate": 1.213234437497573e-07, + "loss": 0.0008, + "step": 20310 + }, + { + "epoch": 0.39, + "learning_rate": 1.2131956040542115e-07, + "loss": 0.0008, + "step": 20311 + }, + { + "epoch": 0.39, + "learning_rate": 1.2131567706108502e-07, + "loss": 0.0007, + "step": 20312 + }, + { + "epoch": 0.39, + "learning_rate": 1.2131179371674886e-07, + "loss": 0.0007, + "step": 20313 + }, + { + "epoch": 0.39, + "learning_rate": 1.2130791037241273e-07, + "loss": 0.0512, + "step": 20314 + }, + { + "epoch": 0.39, + "learning_rate": 1.2130402702807658e-07, + "loss": 0.0007, + "step": 20315 + }, + { + "epoch": 0.39, + "learning_rate": 1.2130014368374045e-07, + "loss": 0.0008, + "step": 20316 + }, + { + "epoch": 0.39, + "learning_rate": 1.212962603394043e-07, + "loss": 0.0179, + "step": 20317 + }, + { + "epoch": 0.39, + "learning_rate": 1.2129237699506817e-07, + "loss": 0.0007, + "step": 20318 + }, + { + "epoch": 0.39, + "learning_rate": 1.21288493650732e-07, + "loss": 0.0007, + "step": 20319 + }, + { + "epoch": 0.39, + "learning_rate": 1.2128461030639588e-07, + "loss": 0.3423, + "step": 20320 + }, + { + "epoch": 0.39, + "learning_rate": 1.212807269620597e-07, + "loss": 0.0008, + "step": 20321 + }, + { + "epoch": 0.39, + "learning_rate": 1.2127684361772357e-07, + "loss": 0.0008, + "step": 20322 + }, + { + "epoch": 0.39, + "learning_rate": 1.2127296027338742e-07, + "loss": 0.0006, + "step": 20323 + }, + { + "epoch": 0.39, + "learning_rate": 1.212690769290513e-07, + "loss": 0.6119, + "step": 20324 + }, + { + "epoch": 0.39, + "learning_rate": 1.2126519358471513e-07, + "loss": 0.0006, + "step": 20325 + }, + { + "epoch": 0.39, + "learning_rate": 1.21261310240379e-07, + "loss": 0.0549, + "step": 20326 + }, + { + "epoch": 0.39, + "learning_rate": 1.2125742689604285e-07, + "loss": 0.0006, + "step": 20327 + }, + { + "epoch": 0.39, + "learning_rate": 1.2125354355170672e-07, + "loss": 0.0008, + "step": 20328 + }, + { + "epoch": 0.39, + "learning_rate": 1.2124966020737057e-07, + "loss": 0.0006, + "step": 20329 + }, + { + "epoch": 0.39, + "learning_rate": 1.2124577686303444e-07, + "loss": 0.0007, + "step": 20330 + }, + { + "epoch": 0.39, + "learning_rate": 1.2124189351869828e-07, + "loss": 0.0007, + "step": 20331 + }, + { + "epoch": 0.39, + "learning_rate": 1.2123801017436216e-07, + "loss": 0.0007, + "step": 20332 + }, + { + "epoch": 0.39, + "learning_rate": 1.21234126830026e-07, + "loss": 0.0007, + "step": 20333 + }, + { + "epoch": 0.39, + "learning_rate": 1.2123024348568987e-07, + "loss": 0.0007, + "step": 20334 + }, + { + "epoch": 0.39, + "learning_rate": 1.2122636014135372e-07, + "loss": 0.0009, + "step": 20335 + }, + { + "epoch": 0.39, + "learning_rate": 1.212224767970176e-07, + "loss": 0.0007, + "step": 20336 + }, + { + "epoch": 0.39, + "learning_rate": 1.2121859345268143e-07, + "loss": 0.0082, + "step": 20337 + }, + { + "epoch": 0.39, + "learning_rate": 1.212147101083453e-07, + "loss": 0.0037, + "step": 20338 + }, + { + "epoch": 0.39, + "learning_rate": 1.2121082676400915e-07, + "loss": 0.0007, + "step": 20339 + }, + { + "epoch": 0.39, + "learning_rate": 1.2120694341967302e-07, + "loss": 0.2219, + "step": 20340 + }, + { + "epoch": 0.39, + "learning_rate": 1.2120306007533687e-07, + "loss": 0.0007, + "step": 20341 + }, + { + "epoch": 0.39, + "learning_rate": 1.2119917673100074e-07, + "loss": 0.0018, + "step": 20342 + }, + { + "epoch": 0.39, + "learning_rate": 1.2119529338666458e-07, + "loss": 0.0006, + "step": 20343 + }, + { + "epoch": 0.39, + "learning_rate": 1.2119141004232845e-07, + "loss": 0.0005, + "step": 20344 + }, + { + "epoch": 0.39, + "learning_rate": 1.211875266979923e-07, + "loss": 0.0017, + "step": 20345 + }, + { + "epoch": 0.39, + "learning_rate": 1.2118364335365617e-07, + "loss": 0.0007, + "step": 20346 + }, + { + "epoch": 0.39, + "learning_rate": 1.2117976000932002e-07, + "loss": 0.0007, + "step": 20347 + }, + { + "epoch": 0.39, + "learning_rate": 1.211758766649839e-07, + "loss": 0.0116, + "step": 20348 + }, + { + "epoch": 0.39, + "learning_rate": 1.2117199332064773e-07, + "loss": 0.1574, + "step": 20349 + }, + { + "epoch": 0.39, + "learning_rate": 1.211681099763116e-07, + "loss": 0.0009, + "step": 20350 + }, + { + "epoch": 0.39, + "learning_rate": 1.2116422663197545e-07, + "loss": 0.0007, + "step": 20351 + }, + { + "epoch": 0.39, + "learning_rate": 1.2116034328763932e-07, + "loss": 0.0007, + "step": 20352 + }, + { + "epoch": 0.39, + "learning_rate": 1.2115645994330317e-07, + "loss": 0.0008, + "step": 20353 + }, + { + "epoch": 0.39, + "learning_rate": 1.2115257659896704e-07, + "loss": 0.0006, + "step": 20354 + }, + { + "epoch": 0.39, + "learning_rate": 1.2114869325463088e-07, + "loss": 0.0013, + "step": 20355 + }, + { + "epoch": 0.39, + "learning_rate": 1.2114480991029475e-07, + "loss": 0.4158, + "step": 20356 + }, + { + "epoch": 0.39, + "learning_rate": 1.211409265659586e-07, + "loss": 0.0007, + "step": 20357 + }, + { + "epoch": 0.39, + "learning_rate": 1.2113704322162247e-07, + "loss": 0.0037, + "step": 20358 + }, + { + "epoch": 0.39, + "learning_rate": 1.2113315987728632e-07, + "loss": 0.0007, + "step": 20359 + }, + { + "epoch": 0.39, + "learning_rate": 1.2112927653295019e-07, + "loss": 0.0007, + "step": 20360 + }, + { + "epoch": 0.39, + "learning_rate": 1.2112539318861403e-07, + "loss": 0.0007, + "step": 20361 + }, + { + "epoch": 0.39, + "learning_rate": 1.211215098442779e-07, + "loss": 0.0009, + "step": 20362 + }, + { + "epoch": 0.39, + "learning_rate": 1.2111762649994175e-07, + "loss": 0.2159, + "step": 20363 + }, + { + "epoch": 0.4, + "learning_rate": 1.2111374315560562e-07, + "loss": 0.7498, + "step": 20364 + }, + { + "epoch": 0.4, + "learning_rate": 1.2110985981126946e-07, + "loss": 0.0008, + "step": 20365 + }, + { + "epoch": 0.4, + "learning_rate": 1.2110597646693334e-07, + "loss": 0.0038, + "step": 20366 + }, + { + "epoch": 0.4, + "learning_rate": 1.2110209312259718e-07, + "loss": 0.0475, + "step": 20367 + }, + { + "epoch": 0.4, + "learning_rate": 1.2109820977826105e-07, + "loss": 0.0069, + "step": 20368 + }, + { + "epoch": 0.4, + "learning_rate": 1.210943264339249e-07, + "loss": 0.0007, + "step": 20369 + }, + { + "epoch": 0.4, + "learning_rate": 1.2109044308958877e-07, + "loss": 0.0008, + "step": 20370 + }, + { + "epoch": 0.4, + "learning_rate": 1.2108655974525261e-07, + "loss": 0.0013, + "step": 20371 + }, + { + "epoch": 0.4, + "learning_rate": 1.2108267640091649e-07, + "loss": 0.0022, + "step": 20372 + }, + { + "epoch": 0.4, + "learning_rate": 1.2107879305658033e-07, + "loss": 0.0023, + "step": 20373 + }, + { + "epoch": 0.4, + "learning_rate": 1.2107490971224418e-07, + "loss": 0.0009, + "step": 20374 + }, + { + "epoch": 0.4, + "learning_rate": 1.2107102636790805e-07, + "loss": 1.2732, + "step": 20375 + }, + { + "epoch": 0.4, + "learning_rate": 1.210671430235719e-07, + "loss": 0.0008, + "step": 20376 + }, + { + "epoch": 0.4, + "learning_rate": 1.2106325967923576e-07, + "loss": 0.0022, + "step": 20377 + }, + { + "epoch": 0.4, + "learning_rate": 1.210593763348996e-07, + "loss": 0.3648, + "step": 20378 + }, + { + "epoch": 0.4, + "learning_rate": 1.2105549299056345e-07, + "loss": 0.0009, + "step": 20379 + }, + { + "epoch": 0.4, + "learning_rate": 1.2105160964622732e-07, + "loss": 0.0012, + "step": 20380 + }, + { + "epoch": 0.4, + "learning_rate": 1.2104772630189117e-07, + "loss": 0.0008, + "step": 20381 + }, + { + "epoch": 0.4, + "learning_rate": 1.2104384295755504e-07, + "loss": 0.0029, + "step": 20382 + }, + { + "epoch": 0.4, + "learning_rate": 1.2103995961321889e-07, + "loss": 0.0012, + "step": 20383 + }, + { + "epoch": 0.4, + "learning_rate": 1.2103607626888276e-07, + "loss": 0.0115, + "step": 20384 + }, + { + "epoch": 0.4, + "learning_rate": 1.210321929245466e-07, + "loss": 0.0012, + "step": 20385 + }, + { + "epoch": 0.4, + "learning_rate": 1.2102830958021047e-07, + "loss": 0.7208, + "step": 20386 + }, + { + "epoch": 0.4, + "learning_rate": 1.2102442623587432e-07, + "loss": 0.0141, + "step": 20387 + }, + { + "epoch": 0.4, + "learning_rate": 1.210205428915382e-07, + "loss": 0.0008, + "step": 20388 + }, + { + "epoch": 0.4, + "learning_rate": 1.2101665954720204e-07, + "loss": 0.0009, + "step": 20389 + }, + { + "epoch": 0.4, + "learning_rate": 1.210127762028659e-07, + "loss": 0.0014, + "step": 20390 + }, + { + "epoch": 0.4, + "learning_rate": 1.2100889285852975e-07, + "loss": 0.0006, + "step": 20391 + }, + { + "epoch": 0.4, + "learning_rate": 1.2100500951419362e-07, + "loss": 0.0007, + "step": 20392 + }, + { + "epoch": 0.4, + "learning_rate": 1.2100112616985747e-07, + "loss": 0.0366, + "step": 20393 + }, + { + "epoch": 0.4, + "learning_rate": 1.2099724282552134e-07, + "loss": 0.0009, + "step": 20394 + }, + { + "epoch": 0.4, + "learning_rate": 1.2099335948118519e-07, + "loss": 0.0009, + "step": 20395 + }, + { + "epoch": 0.4, + "learning_rate": 1.2098947613684906e-07, + "loss": 0.001, + "step": 20396 + }, + { + "epoch": 0.4, + "learning_rate": 1.209855927925129e-07, + "loss": 0.001, + "step": 20397 + }, + { + "epoch": 0.4, + "learning_rate": 1.2098170944817677e-07, + "loss": 0.0007, + "step": 20398 + }, + { + "epoch": 0.4, + "learning_rate": 1.2097782610384062e-07, + "loss": 0.0013, + "step": 20399 + }, + { + "epoch": 0.4, + "learning_rate": 1.209739427595045e-07, + "loss": 0.0047, + "step": 20400 + }, + { + "epoch": 0.4, + "learning_rate": 1.2097005941516833e-07, + "loss": 0.0008, + "step": 20401 + }, + { + "epoch": 0.4, + "learning_rate": 1.209661760708322e-07, + "loss": 0.0008, + "step": 20402 + }, + { + "epoch": 0.4, + "learning_rate": 1.2096229272649605e-07, + "loss": 0.4731, + "step": 20403 + }, + { + "epoch": 0.4, + "learning_rate": 1.209584093821599e-07, + "loss": 0.0006, + "step": 20404 + }, + { + "epoch": 0.4, + "learning_rate": 1.2095452603782377e-07, + "loss": 0.0008, + "step": 20405 + }, + { + "epoch": 0.4, + "learning_rate": 1.209506426934876e-07, + "loss": 0.0129, + "step": 20406 + }, + { + "epoch": 0.4, + "learning_rate": 1.2094675934915148e-07, + "loss": 0.001, + "step": 20407 + }, + { + "epoch": 0.4, + "learning_rate": 1.2094287600481533e-07, + "loss": 0.0007, + "step": 20408 + }, + { + "epoch": 0.4, + "learning_rate": 1.209389926604792e-07, + "loss": 0.0008, + "step": 20409 + }, + { + "epoch": 0.4, + "learning_rate": 1.2093510931614305e-07, + "loss": 0.001, + "step": 20410 + }, + { + "epoch": 0.4, + "learning_rate": 1.2093122597180692e-07, + "loss": 0.0009, + "step": 20411 + }, + { + "epoch": 0.4, + "learning_rate": 1.2092734262747076e-07, + "loss": 0.0008, + "step": 20412 + }, + { + "epoch": 0.4, + "learning_rate": 1.2092345928313463e-07, + "loss": 0.001, + "step": 20413 + }, + { + "epoch": 0.4, + "learning_rate": 1.2091957593879848e-07, + "loss": 0.001, + "step": 20414 + }, + { + "epoch": 0.4, + "learning_rate": 1.2091569259446235e-07, + "loss": 0.0007, + "step": 20415 + }, + { + "epoch": 0.4, + "learning_rate": 1.209118092501262e-07, + "loss": 0.0006, + "step": 20416 + }, + { + "epoch": 0.4, + "learning_rate": 1.2090792590579007e-07, + "loss": 0.0008, + "step": 20417 + }, + { + "epoch": 0.4, + "learning_rate": 1.209040425614539e-07, + "loss": 0.0346, + "step": 20418 + }, + { + "epoch": 0.4, + "learning_rate": 1.2090015921711778e-07, + "loss": 0.0008, + "step": 20419 + }, + { + "epoch": 0.4, + "learning_rate": 1.2089627587278163e-07, + "loss": 0.0039, + "step": 20420 + }, + { + "epoch": 0.4, + "learning_rate": 1.208923925284455e-07, + "loss": 0.0008, + "step": 20421 + }, + { + "epoch": 0.4, + "learning_rate": 1.2088850918410934e-07, + "loss": 0.0007, + "step": 20422 + }, + { + "epoch": 0.4, + "learning_rate": 1.2088462583977322e-07, + "loss": 0.0009, + "step": 20423 + }, + { + "epoch": 0.4, + "learning_rate": 1.2088074249543706e-07, + "loss": 0.0009, + "step": 20424 + }, + { + "epoch": 0.4, + "learning_rate": 1.2087685915110093e-07, + "loss": 0.0006, + "step": 20425 + }, + { + "epoch": 0.4, + "learning_rate": 1.2087297580676478e-07, + "loss": 0.0015, + "step": 20426 + }, + { + "epoch": 0.4, + "learning_rate": 1.2086909246242865e-07, + "loss": 0.0016, + "step": 20427 + }, + { + "epoch": 0.4, + "learning_rate": 1.208652091180925e-07, + "loss": 0.0008, + "step": 20428 + }, + { + "epoch": 0.4, + "learning_rate": 1.2086132577375637e-07, + "loss": 0.0083, + "step": 20429 + }, + { + "epoch": 0.4, + "learning_rate": 1.208574424294202e-07, + "loss": 0.0008, + "step": 20430 + }, + { + "epoch": 0.4, + "learning_rate": 1.2085355908508408e-07, + "loss": 0.0045, + "step": 20431 + }, + { + "epoch": 0.4, + "learning_rate": 1.2084967574074793e-07, + "loss": 0.0011, + "step": 20432 + }, + { + "epoch": 0.4, + "learning_rate": 1.208457923964118e-07, + "loss": 0.001, + "step": 20433 + }, + { + "epoch": 0.4, + "learning_rate": 1.2084190905207564e-07, + "loss": 0.0007, + "step": 20434 + }, + { + "epoch": 0.4, + "learning_rate": 1.2083802570773952e-07, + "loss": 0.0011, + "step": 20435 + }, + { + "epoch": 0.4, + "learning_rate": 1.2083414236340336e-07, + "loss": 0.1231, + "step": 20436 + }, + { + "epoch": 0.4, + "learning_rate": 1.208302590190672e-07, + "loss": 0.0009, + "step": 20437 + }, + { + "epoch": 0.4, + "learning_rate": 1.2082637567473105e-07, + "loss": 0.0021, + "step": 20438 + }, + { + "epoch": 0.4, + "learning_rate": 1.2082249233039492e-07, + "loss": 0.0007, + "step": 20439 + }, + { + "epoch": 0.4, + "learning_rate": 1.2081860898605877e-07, + "loss": 0.0094, + "step": 20440 + }, + { + "epoch": 0.4, + "learning_rate": 1.2081472564172264e-07, + "loss": 0.0008, + "step": 20441 + }, + { + "epoch": 0.4, + "learning_rate": 1.2081084229738648e-07, + "loss": 0.0008, + "step": 20442 + }, + { + "epoch": 0.4, + "learning_rate": 1.2080695895305035e-07, + "loss": 1.281, + "step": 20443 + }, + { + "epoch": 0.4, + "learning_rate": 1.208030756087142e-07, + "loss": 0.0007, + "step": 20444 + }, + { + "epoch": 0.4, + "learning_rate": 1.2079919226437807e-07, + "loss": 0.0008, + "step": 20445 + }, + { + "epoch": 0.4, + "learning_rate": 1.2079530892004192e-07, + "loss": 0.1441, + "step": 20446 + }, + { + "epoch": 0.4, + "learning_rate": 1.207914255757058e-07, + "loss": 0.0303, + "step": 20447 + }, + { + "epoch": 0.4, + "learning_rate": 1.2078754223136963e-07, + "loss": 0.0007, + "step": 20448 + }, + { + "epoch": 0.4, + "learning_rate": 1.207836588870335e-07, + "loss": 0.001, + "step": 20449 + }, + { + "epoch": 0.4, + "learning_rate": 1.2077977554269735e-07, + "loss": 0.0007, + "step": 20450 + }, + { + "epoch": 0.4, + "learning_rate": 1.2077589219836122e-07, + "loss": 0.0008, + "step": 20451 + }, + { + "epoch": 0.4, + "learning_rate": 1.2077200885402507e-07, + "loss": 0.0006, + "step": 20452 + }, + { + "epoch": 0.4, + "learning_rate": 1.2076812550968894e-07, + "loss": 0.0007, + "step": 20453 + }, + { + "epoch": 0.4, + "learning_rate": 1.2076424216535278e-07, + "loss": 0.0006, + "step": 20454 + }, + { + "epoch": 0.4, + "learning_rate": 1.2076035882101665e-07, + "loss": 0.0007, + "step": 20455 + }, + { + "epoch": 0.4, + "learning_rate": 1.207564754766805e-07, + "loss": 0.0008, + "step": 20456 + }, + { + "epoch": 0.4, + "learning_rate": 1.2075259213234437e-07, + "loss": 0.0007, + "step": 20457 + }, + { + "epoch": 0.4, + "learning_rate": 1.2074870878800822e-07, + "loss": 0.0007, + "step": 20458 + }, + { + "epoch": 0.4, + "learning_rate": 1.2074482544367209e-07, + "loss": 0.001, + "step": 20459 + }, + { + "epoch": 0.4, + "learning_rate": 1.2074094209933593e-07, + "loss": 0.0008, + "step": 20460 + }, + { + "epoch": 0.4, + "learning_rate": 1.207370587549998e-07, + "loss": 0.0007, + "step": 20461 + }, + { + "epoch": 0.4, + "learning_rate": 1.2073317541066365e-07, + "loss": 0.3281, + "step": 20462 + }, + { + "epoch": 0.4, + "learning_rate": 1.2072929206632752e-07, + "loss": 0.001, + "step": 20463 + }, + { + "epoch": 0.4, + "learning_rate": 1.2072540872199136e-07, + "loss": 0.0012, + "step": 20464 + }, + { + "epoch": 0.4, + "learning_rate": 1.2072152537765524e-07, + "loss": 0.0009, + "step": 20465 + }, + { + "epoch": 0.4, + "learning_rate": 1.2071764203331908e-07, + "loss": 0.0028, + "step": 20466 + }, + { + "epoch": 0.4, + "learning_rate": 1.2071375868898295e-07, + "loss": 0.0008, + "step": 20467 + }, + { + "epoch": 0.4, + "learning_rate": 1.207098753446468e-07, + "loss": 0.0154, + "step": 20468 + }, + { + "epoch": 0.4, + "learning_rate": 1.2070599200031067e-07, + "loss": 0.005, + "step": 20469 + }, + { + "epoch": 0.4, + "learning_rate": 1.2070210865597451e-07, + "loss": 0.0012, + "step": 20470 + }, + { + "epoch": 0.4, + "learning_rate": 1.2069822531163839e-07, + "loss": 0.0032, + "step": 20471 + }, + { + "epoch": 0.4, + "learning_rate": 1.2069434196730223e-07, + "loss": 0.0007, + "step": 20472 + }, + { + "epoch": 0.4, + "learning_rate": 1.206904586229661e-07, + "loss": 0.0005, + "step": 20473 + }, + { + "epoch": 0.4, + "learning_rate": 1.2068657527862995e-07, + "loss": 0.0013, + "step": 20474 + }, + { + "epoch": 0.4, + "learning_rate": 1.2068269193429382e-07, + "loss": 0.0008, + "step": 20475 + }, + { + "epoch": 0.4, + "learning_rate": 1.2067880858995766e-07, + "loss": 0.0008, + "step": 20476 + }, + { + "epoch": 0.4, + "learning_rate": 1.2067492524562153e-07, + "loss": 0.0593, + "step": 20477 + }, + { + "epoch": 0.4, + "learning_rate": 1.2067104190128538e-07, + "loss": 0.0008, + "step": 20478 + }, + { + "epoch": 0.4, + "learning_rate": 1.2066715855694925e-07, + "loss": 0.2835, + "step": 20479 + }, + { + "epoch": 0.4, + "learning_rate": 1.206632752126131e-07, + "loss": 0.0015, + "step": 20480 + }, + { + "epoch": 0.4, + "learning_rate": 1.2065939186827697e-07, + "loss": 0.0008, + "step": 20481 + }, + { + "epoch": 0.4, + "learning_rate": 1.206555085239408e-07, + "loss": 0.0008, + "step": 20482 + }, + { + "epoch": 0.4, + "learning_rate": 1.2065162517960468e-07, + "loss": 0.0008, + "step": 20483 + }, + { + "epoch": 0.4, + "learning_rate": 1.2064774183526853e-07, + "loss": 0.0007, + "step": 20484 + }, + { + "epoch": 0.4, + "learning_rate": 1.206438584909324e-07, + "loss": 0.0008, + "step": 20485 + }, + { + "epoch": 0.4, + "learning_rate": 1.2063997514659625e-07, + "loss": 0.0006, + "step": 20486 + }, + { + "epoch": 0.4, + "learning_rate": 1.2063609180226012e-07, + "loss": 0.0092, + "step": 20487 + }, + { + "epoch": 0.4, + "learning_rate": 1.2063220845792396e-07, + "loss": 0.0087, + "step": 20488 + }, + { + "epoch": 0.4, + "learning_rate": 1.2062832511358783e-07, + "loss": 0.0034, + "step": 20489 + }, + { + "epoch": 0.4, + "learning_rate": 1.2062444176925168e-07, + "loss": 0.0006, + "step": 20490 + }, + { + "epoch": 0.4, + "learning_rate": 1.2062055842491555e-07, + "loss": 0.6163, + "step": 20491 + }, + { + "epoch": 0.4, + "learning_rate": 1.206166750805794e-07, + "loss": 0.0025, + "step": 20492 + }, + { + "epoch": 0.4, + "learning_rate": 1.2061279173624327e-07, + "loss": 0.0008, + "step": 20493 + }, + { + "epoch": 0.4, + "learning_rate": 1.206089083919071e-07, + "loss": 0.0008, + "step": 20494 + }, + { + "epoch": 0.4, + "learning_rate": 1.2060502504757096e-07, + "loss": 0.0011, + "step": 20495 + }, + { + "epoch": 0.4, + "learning_rate": 1.206011417032348e-07, + "loss": 0.0009, + "step": 20496 + }, + { + "epoch": 0.4, + "learning_rate": 1.2059725835889867e-07, + "loss": 0.0007, + "step": 20497 + }, + { + "epoch": 0.4, + "learning_rate": 1.2059337501456252e-07, + "loss": 0.001, + "step": 20498 + }, + { + "epoch": 0.4, + "learning_rate": 1.205894916702264e-07, + "loss": 0.0007, + "step": 20499 + }, + { + "epoch": 0.4, + "learning_rate": 1.2058560832589023e-07, + "loss": 1.9359, + "step": 20500 + }, + { + "epoch": 0.4, + "learning_rate": 1.205817249815541e-07, + "loss": 0.0005, + "step": 20501 + }, + { + "epoch": 0.4, + "learning_rate": 1.2057784163721795e-07, + "loss": 0.0037, + "step": 20502 + }, + { + "epoch": 0.4, + "learning_rate": 1.2057395829288182e-07, + "loss": 0.0006, + "step": 20503 + }, + { + "epoch": 0.4, + "learning_rate": 1.2057007494854567e-07, + "loss": 0.0006, + "step": 20504 + }, + { + "epoch": 0.4, + "learning_rate": 1.2056619160420954e-07, + "loss": 0.0007, + "step": 20505 + }, + { + "epoch": 0.4, + "learning_rate": 1.2056230825987338e-07, + "loss": 0.0006, + "step": 20506 + }, + { + "epoch": 0.4, + "learning_rate": 1.2055842491553726e-07, + "loss": 0.0011, + "step": 20507 + }, + { + "epoch": 0.4, + "learning_rate": 1.205545415712011e-07, + "loss": 0.2259, + "step": 20508 + }, + { + "epoch": 0.4, + "learning_rate": 1.2055065822686497e-07, + "loss": 0.0009, + "step": 20509 + }, + { + "epoch": 0.4, + "learning_rate": 1.2054677488252882e-07, + "loss": 0.0006, + "step": 20510 + }, + { + "epoch": 0.4, + "learning_rate": 1.205428915381927e-07, + "loss": 0.0017, + "step": 20511 + }, + { + "epoch": 0.4, + "learning_rate": 1.2053900819385653e-07, + "loss": 0.5516, + "step": 20512 + }, + { + "epoch": 0.4, + "learning_rate": 1.205351248495204e-07, + "loss": 0.2163, + "step": 20513 + }, + { + "epoch": 0.4, + "learning_rate": 1.2053124150518425e-07, + "loss": 0.0007, + "step": 20514 + }, + { + "epoch": 0.4, + "learning_rate": 1.2052735816084812e-07, + "loss": 0.0033, + "step": 20515 + }, + { + "epoch": 0.4, + "learning_rate": 1.2052347481651197e-07, + "loss": 0.0007, + "step": 20516 + }, + { + "epoch": 0.4, + "learning_rate": 1.2051959147217584e-07, + "loss": 0.0006, + "step": 20517 + }, + { + "epoch": 0.4, + "learning_rate": 1.2051570812783968e-07, + "loss": 0.0034, + "step": 20518 + }, + { + "epoch": 0.4, + "learning_rate": 1.2051182478350355e-07, + "loss": 0.0007, + "step": 20519 + }, + { + "epoch": 0.4, + "learning_rate": 1.205079414391674e-07, + "loss": 0.0008, + "step": 20520 + }, + { + "epoch": 0.4, + "learning_rate": 1.2050405809483127e-07, + "loss": 0.001, + "step": 20521 + }, + { + "epoch": 0.4, + "learning_rate": 1.2050017475049512e-07, + "loss": 0.0007, + "step": 20522 + }, + { + "epoch": 0.4, + "learning_rate": 1.20496291406159e-07, + "loss": 0.0008, + "step": 20523 + }, + { + "epoch": 0.4, + "learning_rate": 1.2049240806182283e-07, + "loss": 0.005, + "step": 20524 + }, + { + "epoch": 0.4, + "learning_rate": 1.204885247174867e-07, + "loss": 0.0008, + "step": 20525 + }, + { + "epoch": 0.4, + "learning_rate": 1.2048464137315055e-07, + "loss": 0.5327, + "step": 20526 + }, + { + "epoch": 0.4, + "learning_rate": 1.2048075802881442e-07, + "loss": 0.0007, + "step": 20527 + }, + { + "epoch": 0.4, + "learning_rate": 1.2047687468447827e-07, + "loss": 0.0008, + "step": 20528 + }, + { + "epoch": 0.4, + "learning_rate": 1.2047299134014214e-07, + "loss": 0.1302, + "step": 20529 + }, + { + "epoch": 0.4, + "learning_rate": 1.2046910799580598e-07, + "loss": 0.0007, + "step": 20530 + }, + { + "epoch": 0.4, + "learning_rate": 1.2046522465146985e-07, + "loss": 0.0005, + "step": 20531 + }, + { + "epoch": 0.4, + "learning_rate": 1.204613413071337e-07, + "loss": 0.0007, + "step": 20532 + }, + { + "epoch": 0.4, + "learning_rate": 1.2045745796279757e-07, + "loss": 0.0007, + "step": 20533 + }, + { + "epoch": 0.4, + "learning_rate": 1.2045357461846142e-07, + "loss": 0.001, + "step": 20534 + }, + { + "epoch": 0.4, + "learning_rate": 1.2044969127412529e-07, + "loss": 0.0115, + "step": 20535 + }, + { + "epoch": 0.4, + "learning_rate": 1.2044580792978913e-07, + "loss": 0.0008, + "step": 20536 + }, + { + "epoch": 0.4, + "learning_rate": 1.20441924585453e-07, + "loss": 0.0008, + "step": 20537 + }, + { + "epoch": 0.4, + "learning_rate": 1.2043804124111685e-07, + "loss": 0.0008, + "step": 20538 + }, + { + "epoch": 0.4, + "learning_rate": 1.2043415789678072e-07, + "loss": 0.0008, + "step": 20539 + }, + { + "epoch": 0.4, + "learning_rate": 1.2043027455244456e-07, + "loss": 0.0052, + "step": 20540 + }, + { + "epoch": 0.4, + "learning_rate": 1.2042639120810844e-07, + "loss": 0.0007, + "step": 20541 + }, + { + "epoch": 0.4, + "learning_rate": 1.2042250786377228e-07, + "loss": 0.0006, + "step": 20542 + }, + { + "epoch": 0.4, + "learning_rate": 1.2041862451943615e-07, + "loss": 0.602, + "step": 20543 + }, + { + "epoch": 0.4, + "learning_rate": 1.204147411751e-07, + "loss": 0.001, + "step": 20544 + }, + { + "epoch": 0.4, + "learning_rate": 1.2041085783076387e-07, + "loss": 0.5966, + "step": 20545 + }, + { + "epoch": 0.4, + "learning_rate": 1.2040697448642771e-07, + "loss": 0.0015, + "step": 20546 + }, + { + "epoch": 0.4, + "learning_rate": 1.2040309114209159e-07, + "loss": 0.0018, + "step": 20547 + }, + { + "epoch": 0.4, + "learning_rate": 1.2039920779775543e-07, + "loss": 0.0008, + "step": 20548 + }, + { + "epoch": 0.4, + "learning_rate": 1.203953244534193e-07, + "loss": 0.0016, + "step": 20549 + }, + { + "epoch": 0.4, + "learning_rate": 1.2039144110908315e-07, + "loss": 0.0006, + "step": 20550 + }, + { + "epoch": 0.4, + "learning_rate": 1.20387557764747e-07, + "loss": 0.0013, + "step": 20551 + }, + { + "epoch": 0.4, + "learning_rate": 1.2038367442041086e-07, + "loss": 0.0008, + "step": 20552 + }, + { + "epoch": 0.4, + "learning_rate": 1.203797910760747e-07, + "loss": 0.0006, + "step": 20553 + }, + { + "epoch": 0.4, + "learning_rate": 1.2037590773173855e-07, + "loss": 0.0006, + "step": 20554 + }, + { + "epoch": 0.4, + "learning_rate": 1.2037202438740243e-07, + "loss": 0.0007, + "step": 20555 + }, + { + "epoch": 0.4, + "learning_rate": 1.2036814104306627e-07, + "loss": 0.1534, + "step": 20556 + }, + { + "epoch": 0.4, + "learning_rate": 1.2036425769873014e-07, + "loss": 0.0008, + "step": 20557 + }, + { + "epoch": 0.4, + "learning_rate": 1.2036037435439399e-07, + "loss": 0.0034, + "step": 20558 + }, + { + "epoch": 0.4, + "learning_rate": 1.2035649101005786e-07, + "loss": 0.0014, + "step": 20559 + }, + { + "epoch": 0.4, + "learning_rate": 1.203526076657217e-07, + "loss": 0.0007, + "step": 20560 + }, + { + "epoch": 0.4, + "learning_rate": 1.2034872432138557e-07, + "loss": 0.6148, + "step": 20561 + }, + { + "epoch": 0.4, + "learning_rate": 1.2034484097704942e-07, + "loss": 0.0006, + "step": 20562 + }, + { + "epoch": 0.4, + "learning_rate": 1.203409576327133e-07, + "loss": 0.0022, + "step": 20563 + }, + { + "epoch": 0.4, + "learning_rate": 1.2033707428837714e-07, + "loss": 0.0008, + "step": 20564 + }, + { + "epoch": 0.4, + "learning_rate": 1.20333190944041e-07, + "loss": 0.001, + "step": 20565 + }, + { + "epoch": 0.4, + "learning_rate": 1.2032930759970485e-07, + "loss": 0.0006, + "step": 20566 + }, + { + "epoch": 0.4, + "learning_rate": 1.2032542425536872e-07, + "loss": 0.0079, + "step": 20567 + }, + { + "epoch": 0.4, + "learning_rate": 1.2032154091103257e-07, + "loss": 0.0059, + "step": 20568 + }, + { + "epoch": 0.4, + "learning_rate": 1.2031765756669644e-07, + "loss": 0.0007, + "step": 20569 + }, + { + "epoch": 0.4, + "learning_rate": 1.2031377422236029e-07, + "loss": 0.0006, + "step": 20570 + }, + { + "epoch": 0.4, + "learning_rate": 1.2030989087802416e-07, + "loss": 0.0007, + "step": 20571 + }, + { + "epoch": 0.4, + "learning_rate": 1.20306007533688e-07, + "loss": 0.0111, + "step": 20572 + }, + { + "epoch": 0.4, + "learning_rate": 1.2030212418935187e-07, + "loss": 0.0468, + "step": 20573 + }, + { + "epoch": 0.4, + "learning_rate": 1.2029824084501572e-07, + "loss": 0.0096, + "step": 20574 + }, + { + "epoch": 0.4, + "learning_rate": 1.202943575006796e-07, + "loss": 0.0008, + "step": 20575 + }, + { + "epoch": 0.4, + "learning_rate": 1.2029047415634343e-07, + "loss": 0.0006, + "step": 20576 + }, + { + "epoch": 0.4, + "learning_rate": 1.202865908120073e-07, + "loss": 0.0006, + "step": 20577 + }, + { + "epoch": 0.4, + "learning_rate": 1.2028270746767115e-07, + "loss": 0.0007, + "step": 20578 + }, + { + "epoch": 0.4, + "learning_rate": 1.2027882412333502e-07, + "loss": 0.0008, + "step": 20579 + }, + { + "epoch": 0.4, + "learning_rate": 1.2027494077899887e-07, + "loss": 0.0011, + "step": 20580 + }, + { + "epoch": 0.4, + "learning_rate": 1.202710574346627e-07, + "loss": 0.0007, + "step": 20581 + }, + { + "epoch": 0.4, + "learning_rate": 1.2026717409032658e-07, + "loss": 0.0007, + "step": 20582 + }, + { + "epoch": 0.4, + "learning_rate": 1.2026329074599043e-07, + "loss": 0.0008, + "step": 20583 + }, + { + "epoch": 0.4, + "learning_rate": 1.202594074016543e-07, + "loss": 0.0006, + "step": 20584 + }, + { + "epoch": 0.4, + "learning_rate": 1.2025552405731815e-07, + "loss": 0.0885, + "step": 20585 + }, + { + "epoch": 0.4, + "learning_rate": 1.2025164071298202e-07, + "loss": 0.0021, + "step": 20586 + }, + { + "epoch": 0.4, + "learning_rate": 1.2024775736864586e-07, + "loss": 0.0008, + "step": 20587 + }, + { + "epoch": 0.4, + "learning_rate": 1.2024387402430973e-07, + "loss": 0.001, + "step": 20588 + }, + { + "epoch": 0.4, + "learning_rate": 1.2023999067997358e-07, + "loss": 0.0015, + "step": 20589 + }, + { + "epoch": 0.4, + "learning_rate": 1.2023610733563745e-07, + "loss": 0.0007, + "step": 20590 + }, + { + "epoch": 0.4, + "learning_rate": 1.202322239913013e-07, + "loss": 0.0009, + "step": 20591 + }, + { + "epoch": 0.4, + "learning_rate": 1.2022834064696517e-07, + "loss": 0.0006, + "step": 20592 + }, + { + "epoch": 0.4, + "learning_rate": 1.20224457302629e-07, + "loss": 0.0007, + "step": 20593 + }, + { + "epoch": 0.4, + "learning_rate": 1.2022057395829288e-07, + "loss": 0.0009, + "step": 20594 + }, + { + "epoch": 0.4, + "learning_rate": 1.2021669061395673e-07, + "loss": 0.0007, + "step": 20595 + }, + { + "epoch": 0.4, + "learning_rate": 1.202128072696206e-07, + "loss": 0.0008, + "step": 20596 + }, + { + "epoch": 0.4, + "learning_rate": 1.2020892392528444e-07, + "loss": 0.0036, + "step": 20597 + }, + { + "epoch": 0.4, + "learning_rate": 1.2020504058094832e-07, + "loss": 0.0008, + "step": 20598 + }, + { + "epoch": 0.4, + "learning_rate": 1.2020115723661216e-07, + "loss": 0.0008, + "step": 20599 + }, + { + "epoch": 0.4, + "learning_rate": 1.2019727389227603e-07, + "loss": 0.0007, + "step": 20600 + }, + { + "epoch": 0.4, + "learning_rate": 1.2019339054793988e-07, + "loss": 0.0008, + "step": 20601 + }, + { + "epoch": 0.4, + "learning_rate": 1.2018950720360375e-07, + "loss": 0.0006, + "step": 20602 + }, + { + "epoch": 0.4, + "learning_rate": 1.201856238592676e-07, + "loss": 0.0009, + "step": 20603 + }, + { + "epoch": 0.4, + "learning_rate": 1.2018174051493147e-07, + "loss": 0.2659, + "step": 20604 + }, + { + "epoch": 0.4, + "learning_rate": 1.201778571705953e-07, + "loss": 0.0008, + "step": 20605 + }, + { + "epoch": 0.4, + "learning_rate": 1.2017397382625918e-07, + "loss": 0.0607, + "step": 20606 + }, + { + "epoch": 0.4, + "learning_rate": 1.2017009048192303e-07, + "loss": 0.0009, + "step": 20607 + }, + { + "epoch": 0.4, + "learning_rate": 1.201662071375869e-07, + "loss": 0.0008, + "step": 20608 + }, + { + "epoch": 0.4, + "learning_rate": 1.2016232379325074e-07, + "loss": 0.0006, + "step": 20609 + }, + { + "epoch": 0.4, + "learning_rate": 1.2015844044891462e-07, + "loss": 0.0009, + "step": 20610 + }, + { + "epoch": 0.4, + "learning_rate": 1.2015455710457843e-07, + "loss": 0.0007, + "step": 20611 + }, + { + "epoch": 0.4, + "learning_rate": 1.201506737602423e-07, + "loss": 0.0009, + "step": 20612 + }, + { + "epoch": 0.4, + "learning_rate": 1.2014679041590615e-07, + "loss": 0.2359, + "step": 20613 + }, + { + "epoch": 0.4, + "learning_rate": 1.2014290707157002e-07, + "loss": 1.3662, + "step": 20614 + }, + { + "epoch": 0.4, + "learning_rate": 1.2013902372723387e-07, + "loss": 0.0009, + "step": 20615 + }, + { + "epoch": 0.4, + "learning_rate": 1.2013514038289774e-07, + "loss": 0.0005, + "step": 20616 + }, + { + "epoch": 0.4, + "learning_rate": 1.2013125703856158e-07, + "loss": 0.3951, + "step": 20617 + }, + { + "epoch": 0.4, + "learning_rate": 1.2012737369422545e-07, + "loss": 0.0012, + "step": 20618 + }, + { + "epoch": 0.4, + "learning_rate": 1.201234903498893e-07, + "loss": 0.0009, + "step": 20619 + }, + { + "epoch": 0.4, + "learning_rate": 1.2011960700555317e-07, + "loss": 0.0013, + "step": 20620 + }, + { + "epoch": 0.4, + "learning_rate": 1.2011572366121702e-07, + "loss": 0.0011, + "step": 20621 + }, + { + "epoch": 0.4, + "learning_rate": 1.201118403168809e-07, + "loss": 0.0006, + "step": 20622 + }, + { + "epoch": 0.4, + "learning_rate": 1.2010795697254473e-07, + "loss": 0.0007, + "step": 20623 + }, + { + "epoch": 0.4, + "learning_rate": 1.201040736282086e-07, + "loss": 0.0005, + "step": 20624 + }, + { + "epoch": 0.4, + "learning_rate": 1.2010019028387245e-07, + "loss": 0.2159, + "step": 20625 + }, + { + "epoch": 0.4, + "learning_rate": 1.2009630693953632e-07, + "loss": 0.0007, + "step": 20626 + }, + { + "epoch": 0.4, + "learning_rate": 1.2009242359520017e-07, + "loss": 0.0009, + "step": 20627 + }, + { + "epoch": 0.4, + "learning_rate": 1.2008854025086404e-07, + "loss": 0.0563, + "step": 20628 + }, + { + "epoch": 0.4, + "learning_rate": 1.2008465690652788e-07, + "loss": 0.0009, + "step": 20629 + }, + { + "epoch": 0.4, + "learning_rate": 1.2008077356219175e-07, + "loss": 0.1757, + "step": 20630 + }, + { + "epoch": 0.4, + "learning_rate": 1.200768902178556e-07, + "loss": 0.0007, + "step": 20631 + }, + { + "epoch": 0.4, + "learning_rate": 1.2007300687351947e-07, + "loss": 0.0007, + "step": 20632 + }, + { + "epoch": 0.4, + "learning_rate": 1.2006912352918332e-07, + "loss": 0.0009, + "step": 20633 + }, + { + "epoch": 0.4, + "learning_rate": 1.2006524018484719e-07, + "loss": 0.001, + "step": 20634 + }, + { + "epoch": 0.4, + "learning_rate": 1.2006135684051103e-07, + "loss": 0.0009, + "step": 20635 + }, + { + "epoch": 0.4, + "learning_rate": 1.200574734961749e-07, + "loss": 0.0007, + "step": 20636 + }, + { + "epoch": 0.4, + "learning_rate": 1.2005359015183875e-07, + "loss": 0.0193, + "step": 20637 + }, + { + "epoch": 0.4, + "learning_rate": 1.2004970680750262e-07, + "loss": 0.0059, + "step": 20638 + }, + { + "epoch": 0.4, + "learning_rate": 1.2004582346316646e-07, + "loss": 0.0213, + "step": 20639 + }, + { + "epoch": 0.4, + "learning_rate": 1.2004194011883034e-07, + "loss": 0.0007, + "step": 20640 + }, + { + "epoch": 0.4, + "learning_rate": 1.2003805677449418e-07, + "loss": 0.0007, + "step": 20641 + }, + { + "epoch": 0.4, + "learning_rate": 1.2003417343015805e-07, + "loss": 0.0007, + "step": 20642 + }, + { + "epoch": 0.4, + "learning_rate": 1.200302900858219e-07, + "loss": 0.4538, + "step": 20643 + }, + { + "epoch": 0.4, + "learning_rate": 1.2002640674148577e-07, + "loss": 0.0012, + "step": 20644 + }, + { + "epoch": 0.4, + "learning_rate": 1.2002252339714961e-07, + "loss": 0.0007, + "step": 20645 + }, + { + "epoch": 0.4, + "learning_rate": 1.2001864005281349e-07, + "loss": 0.0013, + "step": 20646 + }, + { + "epoch": 0.4, + "learning_rate": 1.2001475670847733e-07, + "loss": 0.0009, + "step": 20647 + }, + { + "epoch": 0.4, + "learning_rate": 1.200108733641412e-07, + "loss": 0.0007, + "step": 20648 + }, + { + "epoch": 0.4, + "learning_rate": 1.2000699001980505e-07, + "loss": 0.0007, + "step": 20649 + }, + { + "epoch": 0.4, + "learning_rate": 1.2000310667546892e-07, + "loss": 0.0013, + "step": 20650 + }, + { + "epoch": 0.4, + "learning_rate": 1.1999922333113276e-07, + "loss": 0.0007, + "step": 20651 + }, + { + "epoch": 0.4, + "learning_rate": 1.1999533998679664e-07, + "loss": 0.0007, + "step": 20652 + }, + { + "epoch": 0.4, + "learning_rate": 1.1999145664246048e-07, + "loss": 0.1295, + "step": 20653 + }, + { + "epoch": 0.4, + "learning_rate": 1.1998757329812435e-07, + "loss": 0.0062, + "step": 20654 + }, + { + "epoch": 0.4, + "learning_rate": 1.199836899537882e-07, + "loss": 0.0006, + "step": 20655 + }, + { + "epoch": 0.4, + "learning_rate": 1.1997980660945207e-07, + "loss": 0.0008, + "step": 20656 + }, + { + "epoch": 0.4, + "learning_rate": 1.199759232651159e-07, + "loss": 0.0008, + "step": 20657 + }, + { + "epoch": 0.4, + "learning_rate": 1.1997203992077978e-07, + "loss": 0.0006, + "step": 20658 + }, + { + "epoch": 0.4, + "learning_rate": 1.1996815657644363e-07, + "loss": 0.0008, + "step": 20659 + }, + { + "epoch": 0.4, + "learning_rate": 1.199642732321075e-07, + "loss": 0.0198, + "step": 20660 + }, + { + "epoch": 0.4, + "learning_rate": 1.1996038988777135e-07, + "loss": 0.9979, + "step": 20661 + }, + { + "epoch": 0.4, + "learning_rate": 1.1995650654343522e-07, + "loss": 0.0015, + "step": 20662 + }, + { + "epoch": 0.4, + "learning_rate": 1.1995262319909906e-07, + "loss": 0.0006, + "step": 20663 + }, + { + "epoch": 0.4, + "learning_rate": 1.1994873985476293e-07, + "loss": 0.0007, + "step": 20664 + }, + { + "epoch": 0.4, + "learning_rate": 1.1994485651042678e-07, + "loss": 0.0009, + "step": 20665 + }, + { + "epoch": 0.4, + "learning_rate": 1.1994097316609065e-07, + "loss": 0.0006, + "step": 20666 + }, + { + "epoch": 0.4, + "learning_rate": 1.199370898217545e-07, + "loss": 0.0005, + "step": 20667 + }, + { + "epoch": 0.4, + "learning_rate": 1.1993320647741837e-07, + "loss": 0.0007, + "step": 20668 + }, + { + "epoch": 0.4, + "learning_rate": 1.1992932313308219e-07, + "loss": 0.0031, + "step": 20669 + }, + { + "epoch": 0.4, + "learning_rate": 1.1992543978874606e-07, + "loss": 0.0037, + "step": 20670 + }, + { + "epoch": 0.4, + "learning_rate": 1.199215564444099e-07, + "loss": 0.0013, + "step": 20671 + }, + { + "epoch": 0.4, + "learning_rate": 1.1991767310007377e-07, + "loss": 0.0007, + "step": 20672 + }, + { + "epoch": 0.4, + "learning_rate": 1.1991378975573762e-07, + "loss": 0.0007, + "step": 20673 + }, + { + "epoch": 0.4, + "learning_rate": 1.199099064114015e-07, + "loss": 0.0143, + "step": 20674 + }, + { + "epoch": 0.4, + "learning_rate": 1.1990602306706533e-07, + "loss": 0.0007, + "step": 20675 + }, + { + "epoch": 0.4, + "learning_rate": 1.199021397227292e-07, + "loss": 0.0007, + "step": 20676 + }, + { + "epoch": 0.4, + "learning_rate": 1.1989825637839305e-07, + "loss": 0.0009, + "step": 20677 + }, + { + "epoch": 0.4, + "learning_rate": 1.1989437303405692e-07, + "loss": 0.0007, + "step": 20678 + }, + { + "epoch": 0.4, + "learning_rate": 1.1989048968972077e-07, + "loss": 0.0006, + "step": 20679 + }, + { + "epoch": 0.4, + "learning_rate": 1.1988660634538464e-07, + "loss": 0.5937, + "step": 20680 + }, + { + "epoch": 0.4, + "learning_rate": 1.1988272300104848e-07, + "loss": 0.0006, + "step": 20681 + }, + { + "epoch": 0.4, + "learning_rate": 1.1987883965671236e-07, + "loss": 0.0006, + "step": 20682 + }, + { + "epoch": 0.4, + "learning_rate": 1.198749563123762e-07, + "loss": 0.001, + "step": 20683 + }, + { + "epoch": 0.4, + "learning_rate": 1.1987107296804007e-07, + "loss": 0.0006, + "step": 20684 + }, + { + "epoch": 0.4, + "learning_rate": 1.1986718962370392e-07, + "loss": 0.2931, + "step": 20685 + }, + { + "epoch": 0.4, + "learning_rate": 1.198633062793678e-07, + "loss": 0.0243, + "step": 20686 + }, + { + "epoch": 0.4, + "learning_rate": 1.1985942293503163e-07, + "loss": 0.0009, + "step": 20687 + }, + { + "epoch": 0.4, + "learning_rate": 1.198555395906955e-07, + "loss": 0.0006, + "step": 20688 + }, + { + "epoch": 0.4, + "learning_rate": 1.1985165624635935e-07, + "loss": 0.0012, + "step": 20689 + }, + { + "epoch": 0.4, + "learning_rate": 1.1984777290202322e-07, + "loss": 0.0347, + "step": 20690 + }, + { + "epoch": 0.4, + "learning_rate": 1.1984388955768707e-07, + "loss": 0.0006, + "step": 20691 + }, + { + "epoch": 0.4, + "learning_rate": 1.1984000621335094e-07, + "loss": 0.0007, + "step": 20692 + }, + { + "epoch": 0.4, + "learning_rate": 1.1983612286901478e-07, + "loss": 0.0007, + "step": 20693 + }, + { + "epoch": 0.4, + "learning_rate": 1.1983223952467865e-07, + "loss": 0.5416, + "step": 20694 + }, + { + "epoch": 0.4, + "learning_rate": 1.198283561803425e-07, + "loss": 0.0009, + "step": 20695 + }, + { + "epoch": 0.4, + "learning_rate": 1.1982447283600637e-07, + "loss": 0.0014, + "step": 20696 + }, + { + "epoch": 0.4, + "learning_rate": 1.1982058949167022e-07, + "loss": 0.0008, + "step": 20697 + }, + { + "epoch": 0.4, + "learning_rate": 1.198167061473341e-07, + "loss": 0.0049, + "step": 20698 + }, + { + "epoch": 0.4, + "learning_rate": 1.1981282280299793e-07, + "loss": 0.0007, + "step": 20699 + }, + { + "epoch": 0.4, + "learning_rate": 1.198089394586618e-07, + "loss": 0.0008, + "step": 20700 + }, + { + "epoch": 0.4, + "learning_rate": 1.1980505611432565e-07, + "loss": 0.0583, + "step": 20701 + }, + { + "epoch": 0.4, + "learning_rate": 1.1980117276998952e-07, + "loss": 0.0006, + "step": 20702 + }, + { + "epoch": 0.4, + "learning_rate": 1.1979728942565337e-07, + "loss": 0.006, + "step": 20703 + }, + { + "epoch": 0.4, + "learning_rate": 1.1979340608131724e-07, + "loss": 0.0025, + "step": 20704 + }, + { + "epoch": 0.4, + "learning_rate": 1.1978952273698108e-07, + "loss": 0.4468, + "step": 20705 + }, + { + "epoch": 0.4, + "learning_rate": 1.1978563939264495e-07, + "loss": 0.0007, + "step": 20706 + }, + { + "epoch": 0.4, + "learning_rate": 1.197817560483088e-07, + "loss": 0.0009, + "step": 20707 + }, + { + "epoch": 0.4, + "learning_rate": 1.1977787270397267e-07, + "loss": 0.0007, + "step": 20708 + }, + { + "epoch": 0.4, + "learning_rate": 1.1977398935963652e-07, + "loss": 0.0006, + "step": 20709 + }, + { + "epoch": 0.4, + "learning_rate": 1.1977010601530039e-07, + "loss": 0.0007, + "step": 20710 + }, + { + "epoch": 0.4, + "learning_rate": 1.1976622267096423e-07, + "loss": 0.7342, + "step": 20711 + }, + { + "epoch": 0.4, + "learning_rate": 1.197623393266281e-07, + "loss": 0.0007, + "step": 20712 + }, + { + "epoch": 0.4, + "learning_rate": 1.1975845598229195e-07, + "loss": 0.0007, + "step": 20713 + }, + { + "epoch": 0.4, + "learning_rate": 1.1975457263795582e-07, + "loss": 0.0008, + "step": 20714 + }, + { + "epoch": 0.4, + "learning_rate": 1.1975068929361966e-07, + "loss": 0.0018, + "step": 20715 + }, + { + "epoch": 0.4, + "learning_rate": 1.1974680594928354e-07, + "loss": 0.0007, + "step": 20716 + }, + { + "epoch": 0.4, + "learning_rate": 1.1974292260494738e-07, + "loss": 0.0017, + "step": 20717 + }, + { + "epoch": 0.4, + "learning_rate": 1.1973903926061125e-07, + "loss": 0.0007, + "step": 20718 + }, + { + "epoch": 0.4, + "learning_rate": 1.197351559162751e-07, + "loss": 0.0006, + "step": 20719 + }, + { + "epoch": 0.4, + "learning_rate": 1.1973127257193897e-07, + "loss": 0.9085, + "step": 20720 + }, + { + "epoch": 0.4, + "learning_rate": 1.1972738922760281e-07, + "loss": 0.6814, + "step": 20721 + }, + { + "epoch": 0.4, + "learning_rate": 1.1972350588326669e-07, + "loss": 0.051, + "step": 20722 + }, + { + "epoch": 0.4, + "learning_rate": 1.1971962253893053e-07, + "loss": 0.0008, + "step": 20723 + }, + { + "epoch": 0.4, + "learning_rate": 1.197157391945944e-07, + "loss": 0.0018, + "step": 20724 + }, + { + "epoch": 0.4, + "learning_rate": 1.1971185585025825e-07, + "loss": 0.0008, + "step": 20725 + }, + { + "epoch": 0.4, + "learning_rate": 1.1970797250592212e-07, + "loss": 0.0007, + "step": 20726 + }, + { + "epoch": 0.4, + "learning_rate": 1.1970408916158594e-07, + "loss": 0.0007, + "step": 20727 + }, + { + "epoch": 0.4, + "learning_rate": 1.197002058172498e-07, + "loss": 0.0008, + "step": 20728 + }, + { + "epoch": 0.4, + "learning_rate": 1.1969632247291365e-07, + "loss": 0.0012, + "step": 20729 + }, + { + "epoch": 0.4, + "learning_rate": 1.1969243912857753e-07, + "loss": 0.2499, + "step": 20730 + }, + { + "epoch": 0.4, + "learning_rate": 1.1968855578424137e-07, + "loss": 0.0005, + "step": 20731 + }, + { + "epoch": 0.4, + "learning_rate": 1.1968467243990524e-07, + "loss": 0.0007, + "step": 20732 + }, + { + "epoch": 0.4, + "learning_rate": 1.1968078909556909e-07, + "loss": 0.0005, + "step": 20733 + }, + { + "epoch": 0.4, + "learning_rate": 1.1967690575123296e-07, + "loss": 0.6871, + "step": 20734 + }, + { + "epoch": 0.4, + "learning_rate": 1.196730224068968e-07, + "loss": 0.018, + "step": 20735 + }, + { + "epoch": 0.4, + "learning_rate": 1.1966913906256067e-07, + "loss": 0.0006, + "step": 20736 + }, + { + "epoch": 0.4, + "learning_rate": 1.1966525571822452e-07, + "loss": 0.0006, + "step": 20737 + }, + { + "epoch": 0.4, + "learning_rate": 1.196613723738884e-07, + "loss": 0.0011, + "step": 20738 + }, + { + "epoch": 0.4, + "learning_rate": 1.1965748902955224e-07, + "loss": 0.0015, + "step": 20739 + }, + { + "epoch": 0.4, + "learning_rate": 1.196536056852161e-07, + "loss": 0.0009, + "step": 20740 + }, + { + "epoch": 0.4, + "learning_rate": 1.1964972234087995e-07, + "loss": 0.0008, + "step": 20741 + }, + { + "epoch": 0.4, + "learning_rate": 1.1964583899654382e-07, + "loss": 0.0014, + "step": 20742 + }, + { + "epoch": 0.4, + "learning_rate": 1.1964195565220767e-07, + "loss": 0.0008, + "step": 20743 + }, + { + "epoch": 0.4, + "learning_rate": 1.1963807230787154e-07, + "loss": 0.0008, + "step": 20744 + }, + { + "epoch": 0.4, + "learning_rate": 1.1963418896353539e-07, + "loss": 0.0007, + "step": 20745 + }, + { + "epoch": 0.4, + "learning_rate": 1.1963030561919926e-07, + "loss": 0.3208, + "step": 20746 + }, + { + "epoch": 0.4, + "learning_rate": 1.196264222748631e-07, + "loss": 0.0008, + "step": 20747 + }, + { + "epoch": 0.4, + "learning_rate": 1.1962253893052697e-07, + "loss": 0.0015, + "step": 20748 + }, + { + "epoch": 0.4, + "learning_rate": 1.1961865558619082e-07, + "loss": 0.0007, + "step": 20749 + }, + { + "epoch": 0.4, + "learning_rate": 1.196147722418547e-07, + "loss": 0.0006, + "step": 20750 + }, + { + "epoch": 0.4, + "learning_rate": 1.1961088889751854e-07, + "loss": 0.0007, + "step": 20751 + }, + { + "epoch": 0.4, + "learning_rate": 1.196070055531824e-07, + "loss": 0.0184, + "step": 20752 + }, + { + "epoch": 0.4, + "learning_rate": 1.1960312220884625e-07, + "loss": 0.0006, + "step": 20753 + }, + { + "epoch": 0.4, + "learning_rate": 1.1959923886451012e-07, + "loss": 0.0007, + "step": 20754 + }, + { + "epoch": 0.4, + "learning_rate": 1.1959535552017397e-07, + "loss": 0.0008, + "step": 20755 + }, + { + "epoch": 0.4, + "learning_rate": 1.1959147217583784e-07, + "loss": 0.0011, + "step": 20756 + }, + { + "epoch": 0.4, + "learning_rate": 1.1958758883150168e-07, + "loss": 0.0111, + "step": 20757 + }, + { + "epoch": 0.4, + "learning_rate": 1.1958370548716553e-07, + "loss": 0.0006, + "step": 20758 + }, + { + "epoch": 0.4, + "learning_rate": 1.195798221428294e-07, + "loss": 0.0008, + "step": 20759 + }, + { + "epoch": 0.4, + "learning_rate": 1.1957593879849325e-07, + "loss": 0.0011, + "step": 20760 + }, + { + "epoch": 0.4, + "learning_rate": 1.1957205545415712e-07, + "loss": 0.7091, + "step": 20761 + }, + { + "epoch": 0.4, + "learning_rate": 1.1956817210982096e-07, + "loss": 0.0007, + "step": 20762 + }, + { + "epoch": 0.4, + "learning_rate": 1.1956428876548483e-07, + "loss": 0.0009, + "step": 20763 + }, + { + "epoch": 0.4, + "learning_rate": 1.1956040542114868e-07, + "loss": 0.0008, + "step": 20764 + }, + { + "epoch": 0.4, + "learning_rate": 1.1955652207681255e-07, + "loss": 0.0009, + "step": 20765 + }, + { + "epoch": 0.4, + "learning_rate": 1.195526387324764e-07, + "loss": 0.0017, + "step": 20766 + }, + { + "epoch": 0.4, + "learning_rate": 1.1954875538814027e-07, + "loss": 0.7374, + "step": 20767 + }, + { + "epoch": 0.4, + "learning_rate": 1.195448720438041e-07, + "loss": 0.0006, + "step": 20768 + }, + { + "epoch": 0.4, + "learning_rate": 1.1954098869946798e-07, + "loss": 0.0005, + "step": 20769 + }, + { + "epoch": 0.4, + "learning_rate": 1.1953710535513183e-07, + "loss": 0.0009, + "step": 20770 + }, + { + "epoch": 0.4, + "learning_rate": 1.195332220107957e-07, + "loss": 1.0815, + "step": 20771 + }, + { + "epoch": 0.4, + "learning_rate": 1.1952933866645954e-07, + "loss": 0.0007, + "step": 20772 + }, + { + "epoch": 0.4, + "learning_rate": 1.1952545532212342e-07, + "loss": 0.9822, + "step": 20773 + }, + { + "epoch": 0.4, + "learning_rate": 1.1952157197778726e-07, + "loss": 0.011, + "step": 20774 + }, + { + "epoch": 0.4, + "learning_rate": 1.1951768863345113e-07, + "loss": 0.0007, + "step": 20775 + }, + { + "epoch": 0.4, + "learning_rate": 1.1951380528911498e-07, + "loss": 0.0006, + "step": 20776 + }, + { + "epoch": 0.4, + "learning_rate": 1.1950992194477885e-07, + "loss": 0.0007, + "step": 20777 + }, + { + "epoch": 0.4, + "learning_rate": 1.195060386004427e-07, + "loss": 0.0006, + "step": 20778 + }, + { + "epoch": 0.4, + "learning_rate": 1.1950215525610657e-07, + "loss": 0.0009, + "step": 20779 + }, + { + "epoch": 0.4, + "learning_rate": 1.194982719117704e-07, + "loss": 0.0027, + "step": 20780 + }, + { + "epoch": 0.4, + "learning_rate": 1.1949438856743428e-07, + "loss": 0.0006, + "step": 20781 + }, + { + "epoch": 0.4, + "learning_rate": 1.1949050522309813e-07, + "loss": 0.0007, + "step": 20782 + }, + { + "epoch": 0.4, + "learning_rate": 1.19486621878762e-07, + "loss": 0.0007, + "step": 20783 + }, + { + "epoch": 0.4, + "learning_rate": 1.1948273853442584e-07, + "loss": 0.0009, + "step": 20784 + }, + { + "epoch": 0.4, + "learning_rate": 1.194788551900897e-07, + "loss": 0.0008, + "step": 20785 + }, + { + "epoch": 0.4, + "learning_rate": 1.1947497184575356e-07, + "loss": 0.0006, + "step": 20786 + }, + { + "epoch": 0.4, + "learning_rate": 1.194710885014174e-07, + "loss": 0.0011, + "step": 20787 + }, + { + "epoch": 0.4, + "learning_rate": 1.1946720515708125e-07, + "loss": 0.0008, + "step": 20788 + }, + { + "epoch": 0.4, + "learning_rate": 1.1946332181274512e-07, + "loss": 0.0006, + "step": 20789 + }, + { + "epoch": 0.4, + "learning_rate": 1.1945943846840897e-07, + "loss": 1.5675, + "step": 20790 + }, + { + "epoch": 0.4, + "learning_rate": 1.1945555512407284e-07, + "loss": 0.011, + "step": 20791 + }, + { + "epoch": 0.4, + "learning_rate": 1.1945167177973668e-07, + "loss": 0.0013, + "step": 20792 + }, + { + "epoch": 0.4, + "learning_rate": 1.1944778843540055e-07, + "loss": 0.0007, + "step": 20793 + }, + { + "epoch": 0.4, + "learning_rate": 1.194439050910644e-07, + "loss": 0.0011, + "step": 20794 + }, + { + "epoch": 0.4, + "learning_rate": 1.1944002174672827e-07, + "loss": 0.0006, + "step": 20795 + }, + { + "epoch": 0.4, + "learning_rate": 1.1943613840239212e-07, + "loss": 0.0007, + "step": 20796 + }, + { + "epoch": 0.4, + "learning_rate": 1.19432255058056e-07, + "loss": 0.0062, + "step": 20797 + }, + { + "epoch": 0.4, + "learning_rate": 1.1942837171371983e-07, + "loss": 0.2372, + "step": 20798 + }, + { + "epoch": 0.4, + "learning_rate": 1.194244883693837e-07, + "loss": 0.0015, + "step": 20799 + }, + { + "epoch": 0.4, + "learning_rate": 1.1942060502504755e-07, + "loss": 0.0007, + "step": 20800 + }, + { + "epoch": 0.4, + "learning_rate": 1.1941672168071142e-07, + "loss": 0.0007, + "step": 20801 + }, + { + "epoch": 0.4, + "learning_rate": 1.1941283833637527e-07, + "loss": 0.002, + "step": 20802 + }, + { + "epoch": 0.4, + "learning_rate": 1.1940895499203914e-07, + "loss": 0.0009, + "step": 20803 + }, + { + "epoch": 0.4, + "learning_rate": 1.1940507164770298e-07, + "loss": 0.0071, + "step": 20804 + }, + { + "epoch": 0.4, + "learning_rate": 1.1940118830336685e-07, + "loss": 0.0009, + "step": 20805 + }, + { + "epoch": 0.4, + "learning_rate": 1.193973049590307e-07, + "loss": 0.0007, + "step": 20806 + }, + { + "epoch": 0.4, + "learning_rate": 1.1939342161469457e-07, + "loss": 0.0276, + "step": 20807 + }, + { + "epoch": 0.4, + "learning_rate": 1.1938953827035842e-07, + "loss": 0.0006, + "step": 20808 + }, + { + "epoch": 0.4, + "learning_rate": 1.193856549260223e-07, + "loss": 0.0008, + "step": 20809 + }, + { + "epoch": 0.4, + "learning_rate": 1.1938177158168613e-07, + "loss": 0.0026, + "step": 20810 + }, + { + "epoch": 0.4, + "learning_rate": 1.1937788823735e-07, + "loss": 0.0055, + "step": 20811 + }, + { + "epoch": 0.4, + "learning_rate": 1.1937400489301385e-07, + "loss": 0.0008, + "step": 20812 + }, + { + "epoch": 0.4, + "learning_rate": 1.1937012154867772e-07, + "loss": 0.0006, + "step": 20813 + }, + { + "epoch": 0.4, + "learning_rate": 1.1936623820434156e-07, + "loss": 0.0068, + "step": 20814 + }, + { + "epoch": 0.4, + "learning_rate": 1.1936235486000544e-07, + "loss": 0.0007, + "step": 20815 + }, + { + "epoch": 0.4, + "learning_rate": 1.1935847151566928e-07, + "loss": 0.0008, + "step": 20816 + }, + { + "epoch": 0.4, + "learning_rate": 1.1935458817133315e-07, + "loss": 0.0011, + "step": 20817 + }, + { + "epoch": 0.4, + "learning_rate": 1.19350704826997e-07, + "loss": 0.0008, + "step": 20818 + }, + { + "epoch": 0.4, + "learning_rate": 1.1934682148266087e-07, + "loss": 0.428, + "step": 20819 + }, + { + "epoch": 0.4, + "learning_rate": 1.1934293813832471e-07, + "loss": 0.0007, + "step": 20820 + }, + { + "epoch": 0.4, + "learning_rate": 1.1933905479398859e-07, + "loss": 0.0035, + "step": 20821 + }, + { + "epoch": 0.4, + "learning_rate": 1.1933517144965243e-07, + "loss": 0.5117, + "step": 20822 + }, + { + "epoch": 0.4, + "learning_rate": 1.193312881053163e-07, + "loss": 0.0006, + "step": 20823 + }, + { + "epoch": 0.4, + "learning_rate": 1.1932740476098015e-07, + "loss": 0.0008, + "step": 20824 + }, + { + "epoch": 0.4, + "learning_rate": 1.1932352141664402e-07, + "loss": 0.0014, + "step": 20825 + }, + { + "epoch": 0.4, + "learning_rate": 1.1931963807230786e-07, + "loss": 0.0006, + "step": 20826 + }, + { + "epoch": 0.4, + "learning_rate": 1.1931575472797174e-07, + "loss": 0.0007, + "step": 20827 + }, + { + "epoch": 0.4, + "learning_rate": 1.1931187138363558e-07, + "loss": 0.0192, + "step": 20828 + }, + { + "epoch": 0.4, + "learning_rate": 1.1930798803929945e-07, + "loss": 0.0013, + "step": 20829 + }, + { + "epoch": 0.4, + "learning_rate": 1.193041046949633e-07, + "loss": 0.0008, + "step": 20830 + }, + { + "epoch": 0.4, + "learning_rate": 1.1930022135062717e-07, + "loss": 0.2627, + "step": 20831 + }, + { + "epoch": 0.4, + "learning_rate": 1.19296338006291e-07, + "loss": 0.0007, + "step": 20832 + }, + { + "epoch": 0.4, + "learning_rate": 1.1929245466195488e-07, + "loss": 0.0014, + "step": 20833 + }, + { + "epoch": 0.4, + "learning_rate": 1.1928857131761873e-07, + "loss": 0.0012, + "step": 20834 + }, + { + "epoch": 0.4, + "learning_rate": 1.192846879732826e-07, + "loss": 0.0007, + "step": 20835 + }, + { + "epoch": 0.4, + "learning_rate": 1.1928080462894645e-07, + "loss": 0.0212, + "step": 20836 + }, + { + "epoch": 0.4, + "learning_rate": 1.1927692128461032e-07, + "loss": 0.0006, + "step": 20837 + }, + { + "epoch": 0.4, + "learning_rate": 1.1927303794027416e-07, + "loss": 0.0012, + "step": 20838 + }, + { + "epoch": 0.4, + "learning_rate": 1.1926915459593803e-07, + "loss": 0.0006, + "step": 20839 + }, + { + "epoch": 0.4, + "learning_rate": 1.1926527125160188e-07, + "loss": 0.0008, + "step": 20840 + }, + { + "epoch": 0.4, + "learning_rate": 1.1926138790726575e-07, + "loss": 0.0087, + "step": 20841 + }, + { + "epoch": 0.4, + "learning_rate": 1.192575045629296e-07, + "loss": 0.0304, + "step": 20842 + }, + { + "epoch": 0.4, + "learning_rate": 1.1925362121859344e-07, + "loss": 0.0007, + "step": 20843 + }, + { + "epoch": 0.4, + "learning_rate": 1.1924973787425729e-07, + "loss": 0.0008, + "step": 20844 + }, + { + "epoch": 0.4, + "learning_rate": 1.1924585452992116e-07, + "loss": 0.3491, + "step": 20845 + }, + { + "epoch": 0.4, + "learning_rate": 1.19241971185585e-07, + "loss": 0.0011, + "step": 20846 + }, + { + "epoch": 0.4, + "learning_rate": 1.1923808784124887e-07, + "loss": 0.0008, + "step": 20847 + }, + { + "epoch": 0.4, + "learning_rate": 1.1923420449691272e-07, + "loss": 0.0007, + "step": 20848 + }, + { + "epoch": 0.4, + "learning_rate": 1.192303211525766e-07, + "loss": 0.0007, + "step": 20849 + }, + { + "epoch": 0.4, + "learning_rate": 1.1922643780824044e-07, + "loss": 0.0007, + "step": 20850 + }, + { + "epoch": 0.4, + "learning_rate": 1.192225544639043e-07, + "loss": 0.0006, + "step": 20851 + }, + { + "epoch": 0.4, + "learning_rate": 1.1921867111956815e-07, + "loss": 0.0028, + "step": 20852 + }, + { + "epoch": 0.4, + "learning_rate": 1.1921478777523202e-07, + "loss": 0.7629, + "step": 20853 + }, + { + "epoch": 0.4, + "learning_rate": 1.1921090443089587e-07, + "loss": 0.0008, + "step": 20854 + }, + { + "epoch": 0.4, + "learning_rate": 1.1920702108655974e-07, + "loss": 0.2172, + "step": 20855 + }, + { + "epoch": 0.4, + "learning_rate": 1.192031377422236e-07, + "loss": 0.0006, + "step": 20856 + }, + { + "epoch": 0.4, + "learning_rate": 1.1919925439788746e-07, + "loss": 0.0525, + "step": 20857 + }, + { + "epoch": 0.4, + "learning_rate": 1.1919537105355131e-07, + "loss": 0.0011, + "step": 20858 + }, + { + "epoch": 0.4, + "learning_rate": 1.1919148770921517e-07, + "loss": 0.047, + "step": 20859 + }, + { + "epoch": 0.4, + "learning_rate": 1.1918760436487903e-07, + "loss": 0.1857, + "step": 20860 + }, + { + "epoch": 0.4, + "learning_rate": 1.1918372102054288e-07, + "loss": 0.0015, + "step": 20861 + }, + { + "epoch": 0.4, + "learning_rate": 1.1917983767620673e-07, + "loss": 0.0008, + "step": 20862 + }, + { + "epoch": 0.4, + "learning_rate": 1.1917595433187059e-07, + "loss": 0.0006, + "step": 20863 + }, + { + "epoch": 0.4, + "learning_rate": 1.1917207098753445e-07, + "loss": 0.0071, + "step": 20864 + }, + { + "epoch": 0.4, + "learning_rate": 1.1916818764319831e-07, + "loss": 0.0008, + "step": 20865 + }, + { + "epoch": 0.4, + "learning_rate": 1.1916430429886217e-07, + "loss": 0.2079, + "step": 20866 + }, + { + "epoch": 0.4, + "learning_rate": 1.1916042095452603e-07, + "loss": 0.0009, + "step": 20867 + }, + { + "epoch": 0.4, + "learning_rate": 1.1915653761018988e-07, + "loss": 0.1582, + "step": 20868 + }, + { + "epoch": 0.4, + "learning_rate": 1.1915265426585374e-07, + "loss": 0.0006, + "step": 20869 + }, + { + "epoch": 0.4, + "learning_rate": 1.191487709215176e-07, + "loss": 0.0006, + "step": 20870 + }, + { + "epoch": 0.4, + "learning_rate": 1.1914488757718146e-07, + "loss": 0.0006, + "step": 20871 + }, + { + "epoch": 0.4, + "learning_rate": 1.1914100423284532e-07, + "loss": 0.0008, + "step": 20872 + }, + { + "epoch": 0.4, + "learning_rate": 1.1913712088850917e-07, + "loss": 0.0006, + "step": 20873 + }, + { + "epoch": 0.4, + "learning_rate": 1.1913323754417303e-07, + "loss": 0.0015, + "step": 20874 + }, + { + "epoch": 0.4, + "learning_rate": 1.1912935419983689e-07, + "loss": 0.0008, + "step": 20875 + }, + { + "epoch": 0.4, + "learning_rate": 1.1912547085550075e-07, + "loss": 0.0009, + "step": 20876 + }, + { + "epoch": 0.4, + "learning_rate": 1.1912158751116461e-07, + "loss": 0.0006, + "step": 20877 + }, + { + "epoch": 0.4, + "learning_rate": 1.1911770416682847e-07, + "loss": 0.0007, + "step": 20878 + }, + { + "epoch": 0.41, + "learning_rate": 1.1911382082249232e-07, + "loss": 0.0091, + "step": 20879 + }, + { + "epoch": 0.41, + "learning_rate": 1.1910993747815618e-07, + "loss": 0.0008, + "step": 20880 + }, + { + "epoch": 0.41, + "learning_rate": 1.1910605413382004e-07, + "loss": 0.0007, + "step": 20881 + }, + { + "epoch": 0.41, + "learning_rate": 1.191021707894839e-07, + "loss": 0.002, + "step": 20882 + }, + { + "epoch": 0.41, + "learning_rate": 1.1909828744514776e-07, + "loss": 0.0016, + "step": 20883 + }, + { + "epoch": 0.41, + "learning_rate": 1.1909440410081162e-07, + "loss": 0.0014, + "step": 20884 + }, + { + "epoch": 0.41, + "learning_rate": 1.1909052075647547e-07, + "loss": 0.001, + "step": 20885 + }, + { + "epoch": 0.41, + "learning_rate": 1.1908663741213933e-07, + "loss": 0.0006, + "step": 20886 + }, + { + "epoch": 0.41, + "learning_rate": 1.1908275406780319e-07, + "loss": 0.5208, + "step": 20887 + }, + { + "epoch": 0.41, + "learning_rate": 1.1907887072346705e-07, + "loss": 0.001, + "step": 20888 + }, + { + "epoch": 0.41, + "learning_rate": 1.190749873791309e-07, + "loss": 0.0047, + "step": 20889 + }, + { + "epoch": 0.41, + "learning_rate": 1.1907110403479476e-07, + "loss": 0.0059, + "step": 20890 + }, + { + "epoch": 0.41, + "learning_rate": 1.1906722069045862e-07, + "loss": 0.9644, + "step": 20891 + }, + { + "epoch": 0.41, + "learning_rate": 1.1906333734612248e-07, + "loss": 0.0027, + "step": 20892 + }, + { + "epoch": 0.41, + "learning_rate": 1.1905945400178634e-07, + "loss": 0.0006, + "step": 20893 + }, + { + "epoch": 0.41, + "learning_rate": 1.190555706574502e-07, + "loss": 0.0006, + "step": 20894 + }, + { + "epoch": 0.41, + "learning_rate": 1.1905168731311406e-07, + "loss": 0.0006, + "step": 20895 + }, + { + "epoch": 0.41, + "learning_rate": 1.1904780396877791e-07, + "loss": 0.0055, + "step": 20896 + }, + { + "epoch": 0.41, + "learning_rate": 1.1904392062444177e-07, + "loss": 0.0178, + "step": 20897 + }, + { + "epoch": 0.41, + "learning_rate": 1.1904003728010563e-07, + "loss": 0.0007, + "step": 20898 + }, + { + "epoch": 0.41, + "learning_rate": 1.1903615393576949e-07, + "loss": 0.0009, + "step": 20899 + }, + { + "epoch": 0.41, + "learning_rate": 1.1903227059143335e-07, + "loss": 0.0007, + "step": 20900 + }, + { + "epoch": 0.41, + "learning_rate": 1.1902838724709718e-07, + "loss": 0.0007, + "step": 20901 + }, + { + "epoch": 0.41, + "learning_rate": 1.1902450390276104e-07, + "loss": 0.0017, + "step": 20902 + }, + { + "epoch": 0.41, + "learning_rate": 1.190206205584249e-07, + "loss": 0.0007, + "step": 20903 + }, + { + "epoch": 0.41, + "learning_rate": 1.1901673721408875e-07, + "loss": 0.0005, + "step": 20904 + }, + { + "epoch": 0.41, + "learning_rate": 1.1901285386975261e-07, + "loss": 0.0668, + "step": 20905 + }, + { + "epoch": 0.41, + "learning_rate": 1.1900897052541647e-07, + "loss": 0.0031, + "step": 20906 + }, + { + "epoch": 0.41, + "learning_rate": 1.1900508718108033e-07, + "loss": 0.0006, + "step": 20907 + }, + { + "epoch": 0.41, + "learning_rate": 1.1900120383674419e-07, + "loss": 0.0007, + "step": 20908 + }, + { + "epoch": 0.41, + "learning_rate": 1.1899732049240805e-07, + "loss": 0.0013, + "step": 20909 + }, + { + "epoch": 0.41, + "learning_rate": 1.189934371480719e-07, + "loss": 0.0009, + "step": 20910 + }, + { + "epoch": 0.41, + "learning_rate": 1.1898955380373576e-07, + "loss": 0.002, + "step": 20911 + }, + { + "epoch": 0.41, + "learning_rate": 1.1898567045939962e-07, + "loss": 0.0008, + "step": 20912 + }, + { + "epoch": 0.41, + "learning_rate": 1.1898178711506348e-07, + "loss": 0.0684, + "step": 20913 + }, + { + "epoch": 0.41, + "learning_rate": 1.1897790377072734e-07, + "loss": 0.0009, + "step": 20914 + }, + { + "epoch": 0.41, + "learning_rate": 1.189740204263912e-07, + "loss": 0.0008, + "step": 20915 + }, + { + "epoch": 0.41, + "learning_rate": 1.1897013708205505e-07, + "loss": 0.0006, + "step": 20916 + }, + { + "epoch": 0.41, + "learning_rate": 1.1896625373771891e-07, + "loss": 0.0006, + "step": 20917 + }, + { + "epoch": 0.41, + "learning_rate": 1.1896237039338277e-07, + "loss": 0.0006, + "step": 20918 + }, + { + "epoch": 0.41, + "learning_rate": 1.1895848704904663e-07, + "loss": 0.0013, + "step": 20919 + }, + { + "epoch": 0.41, + "learning_rate": 1.1895460370471049e-07, + "loss": 0.0031, + "step": 20920 + }, + { + "epoch": 0.41, + "learning_rate": 1.1895072036037434e-07, + "loss": 0.0008, + "step": 20921 + }, + { + "epoch": 0.41, + "learning_rate": 1.189468370160382e-07, + "loss": 0.0011, + "step": 20922 + }, + { + "epoch": 0.41, + "learning_rate": 1.1894295367170206e-07, + "loss": 0.0007, + "step": 20923 + }, + { + "epoch": 0.41, + "learning_rate": 1.1893907032736592e-07, + "loss": 0.0009, + "step": 20924 + }, + { + "epoch": 0.41, + "learning_rate": 1.1893518698302978e-07, + "loss": 0.0753, + "step": 20925 + }, + { + "epoch": 0.41, + "learning_rate": 1.1893130363869364e-07, + "loss": 0.0007, + "step": 20926 + }, + { + "epoch": 0.41, + "learning_rate": 1.189274202943575e-07, + "loss": 0.0006, + "step": 20927 + }, + { + "epoch": 0.41, + "learning_rate": 1.1892353695002135e-07, + "loss": 0.0005, + "step": 20928 + }, + { + "epoch": 0.41, + "learning_rate": 1.1891965360568521e-07, + "loss": 0.4021, + "step": 20929 + }, + { + "epoch": 0.41, + "learning_rate": 1.1891577026134907e-07, + "loss": 1.2252, + "step": 20930 + }, + { + "epoch": 0.41, + "learning_rate": 1.1891188691701293e-07, + "loss": 0.0006, + "step": 20931 + }, + { + "epoch": 0.41, + "learning_rate": 1.1890800357267678e-07, + "loss": 0.0007, + "step": 20932 + }, + { + "epoch": 0.41, + "learning_rate": 1.1890412022834064e-07, + "loss": 0.0023, + "step": 20933 + }, + { + "epoch": 0.41, + "learning_rate": 1.189002368840045e-07, + "loss": 0.9266, + "step": 20934 + }, + { + "epoch": 0.41, + "learning_rate": 1.1889635353966836e-07, + "loss": 0.0005, + "step": 20935 + }, + { + "epoch": 0.41, + "learning_rate": 1.1889247019533222e-07, + "loss": 0.0009, + "step": 20936 + }, + { + "epoch": 0.41, + "learning_rate": 1.1888858685099608e-07, + "loss": 0.0013, + "step": 20937 + }, + { + "epoch": 0.41, + "learning_rate": 1.1888470350665993e-07, + "loss": 0.0008, + "step": 20938 + }, + { + "epoch": 0.41, + "learning_rate": 1.1888082016232379e-07, + "loss": 0.0013, + "step": 20939 + }, + { + "epoch": 0.41, + "learning_rate": 1.1887693681798765e-07, + "loss": 0.0008, + "step": 20940 + }, + { + "epoch": 0.41, + "learning_rate": 1.1887305347365151e-07, + "loss": 0.0039, + "step": 20941 + }, + { + "epoch": 0.41, + "learning_rate": 1.1886917012931537e-07, + "loss": 0.0007, + "step": 20942 + }, + { + "epoch": 0.41, + "learning_rate": 1.1886528678497923e-07, + "loss": 0.0007, + "step": 20943 + }, + { + "epoch": 0.41, + "learning_rate": 1.1886140344064308e-07, + "loss": 0.0047, + "step": 20944 + }, + { + "epoch": 0.41, + "learning_rate": 1.1885752009630694e-07, + "loss": 0.0008, + "step": 20945 + }, + { + "epoch": 0.41, + "learning_rate": 1.188536367519708e-07, + "loss": 0.0008, + "step": 20946 + }, + { + "epoch": 0.41, + "learning_rate": 1.1884975340763466e-07, + "loss": 0.0007, + "step": 20947 + }, + { + "epoch": 0.41, + "learning_rate": 1.1884587006329852e-07, + "loss": 0.0006, + "step": 20948 + }, + { + "epoch": 0.41, + "learning_rate": 1.1884198671896237e-07, + "loss": 0.0008, + "step": 20949 + }, + { + "epoch": 0.41, + "learning_rate": 1.1883810337462623e-07, + "loss": 0.0009, + "step": 20950 + }, + { + "epoch": 0.41, + "learning_rate": 1.1883422003029009e-07, + "loss": 0.0006, + "step": 20951 + }, + { + "epoch": 0.41, + "learning_rate": 1.1883033668595395e-07, + "loss": 0.0018, + "step": 20952 + }, + { + "epoch": 0.41, + "learning_rate": 1.1882645334161781e-07, + "loss": 0.0008, + "step": 20953 + }, + { + "epoch": 0.41, + "learning_rate": 1.1882256999728167e-07, + "loss": 0.0008, + "step": 20954 + }, + { + "epoch": 0.41, + "learning_rate": 1.1881868665294552e-07, + "loss": 0.0007, + "step": 20955 + }, + { + "epoch": 0.41, + "learning_rate": 1.1881480330860938e-07, + "loss": 0.0007, + "step": 20956 + }, + { + "epoch": 0.41, + "learning_rate": 1.1881091996427324e-07, + "loss": 0.0008, + "step": 20957 + }, + { + "epoch": 0.41, + "learning_rate": 1.188070366199371e-07, + "loss": 0.0007, + "step": 20958 + }, + { + "epoch": 0.41, + "learning_rate": 1.1880315327560093e-07, + "loss": 0.0007, + "step": 20959 + }, + { + "epoch": 0.41, + "learning_rate": 1.1879926993126479e-07, + "loss": 0.0007, + "step": 20960 + }, + { + "epoch": 0.41, + "learning_rate": 1.1879538658692865e-07, + "loss": 0.0007, + "step": 20961 + }, + { + "epoch": 0.41, + "learning_rate": 1.187915032425925e-07, + "loss": 0.0005, + "step": 20962 + }, + { + "epoch": 0.41, + "learning_rate": 1.1878761989825636e-07, + "loss": 0.0005, + "step": 20963 + }, + { + "epoch": 0.41, + "learning_rate": 1.1878373655392022e-07, + "loss": 0.0008, + "step": 20964 + }, + { + "epoch": 0.41, + "learning_rate": 1.1877985320958408e-07, + "loss": 0.0007, + "step": 20965 + }, + { + "epoch": 0.41, + "learning_rate": 1.1877596986524794e-07, + "loss": 0.0008, + "step": 20966 + }, + { + "epoch": 0.41, + "learning_rate": 1.187720865209118e-07, + "loss": 0.1434, + "step": 20967 + }, + { + "epoch": 0.41, + "learning_rate": 1.1876820317657565e-07, + "loss": 0.0011, + "step": 20968 + }, + { + "epoch": 0.41, + "learning_rate": 1.1876431983223951e-07, + "loss": 0.0007, + "step": 20969 + }, + { + "epoch": 0.41, + "learning_rate": 1.1876043648790337e-07, + "loss": 0.0007, + "step": 20970 + }, + { + "epoch": 0.41, + "learning_rate": 1.1875655314356723e-07, + "loss": 0.0012, + "step": 20971 + }, + { + "epoch": 0.41, + "learning_rate": 1.1875266979923109e-07, + "loss": 0.0007, + "step": 20972 + }, + { + "epoch": 0.41, + "learning_rate": 1.1874878645489495e-07, + "loss": 0.0009, + "step": 20973 + }, + { + "epoch": 0.41, + "learning_rate": 1.187449031105588e-07, + "loss": 0.0012, + "step": 20974 + }, + { + "epoch": 0.41, + "learning_rate": 1.1874101976622266e-07, + "loss": 0.9995, + "step": 20975 + }, + { + "epoch": 0.41, + "learning_rate": 1.1873713642188652e-07, + "loss": 0.0008, + "step": 20976 + }, + { + "epoch": 0.41, + "learning_rate": 1.1873325307755038e-07, + "loss": 0.0009, + "step": 20977 + }, + { + "epoch": 0.41, + "learning_rate": 1.1872936973321424e-07, + "loss": 0.0007, + "step": 20978 + }, + { + "epoch": 0.41, + "learning_rate": 1.187254863888781e-07, + "loss": 0.001, + "step": 20979 + }, + { + "epoch": 0.41, + "learning_rate": 1.1872160304454195e-07, + "loss": 0.001, + "step": 20980 + }, + { + "epoch": 0.41, + "learning_rate": 1.1871771970020581e-07, + "loss": 0.0006, + "step": 20981 + }, + { + "epoch": 0.41, + "learning_rate": 1.1871383635586967e-07, + "loss": 0.0007, + "step": 20982 + }, + { + "epoch": 0.41, + "learning_rate": 1.1870995301153353e-07, + "loss": 0.0008, + "step": 20983 + }, + { + "epoch": 0.41, + "learning_rate": 1.1870606966719739e-07, + "loss": 0.0016, + "step": 20984 + }, + { + "epoch": 0.41, + "learning_rate": 1.1870218632286125e-07, + "loss": 0.0007, + "step": 20985 + }, + { + "epoch": 0.41, + "learning_rate": 1.186983029785251e-07, + "loss": 0.0021, + "step": 20986 + }, + { + "epoch": 0.41, + "learning_rate": 1.1869441963418896e-07, + "loss": 0.0008, + "step": 20987 + }, + { + "epoch": 0.41, + "learning_rate": 1.1869053628985282e-07, + "loss": 0.0008, + "step": 20988 + }, + { + "epoch": 0.41, + "learning_rate": 1.1868665294551668e-07, + "loss": 0.0034, + "step": 20989 + }, + { + "epoch": 0.41, + "learning_rate": 1.1868276960118054e-07, + "loss": 0.0105, + "step": 20990 + }, + { + "epoch": 0.41, + "learning_rate": 1.186788862568444e-07, + "loss": 0.5702, + "step": 20991 + }, + { + "epoch": 0.41, + "learning_rate": 1.1867500291250825e-07, + "loss": 0.0015, + "step": 20992 + }, + { + "epoch": 0.41, + "learning_rate": 1.1867111956817211e-07, + "loss": 0.9726, + "step": 20993 + }, + { + "epoch": 0.41, + "learning_rate": 1.1866723622383597e-07, + "loss": 0.7575, + "step": 20994 + }, + { + "epoch": 0.41, + "learning_rate": 1.1866335287949983e-07, + "loss": 1.0733, + "step": 20995 + }, + { + "epoch": 0.41, + "learning_rate": 1.1865946953516369e-07, + "loss": 0.6673, + "step": 20996 + }, + { + "epoch": 0.41, + "learning_rate": 1.1865558619082754e-07, + "loss": 0.0006, + "step": 20997 + }, + { + "epoch": 0.41, + "learning_rate": 1.186517028464914e-07, + "loss": 0.0006, + "step": 20998 + }, + { + "epoch": 0.41, + "learning_rate": 1.1864781950215526e-07, + "loss": 0.0007, + "step": 20999 + }, + { + "epoch": 0.41, + "learning_rate": 1.1864393615781912e-07, + "loss": 0.0035, + "step": 21000 + }, + { + "epoch": 0.41, + "learning_rate": 1.1864005281348298e-07, + "loss": 0.0007, + "step": 21001 + }, + { + "epoch": 0.41, + "learning_rate": 1.1863616946914684e-07, + "loss": 0.0009, + "step": 21002 + }, + { + "epoch": 0.41, + "learning_rate": 1.186322861248107e-07, + "loss": 0.0006, + "step": 21003 + }, + { + "epoch": 0.41, + "learning_rate": 1.1862840278047455e-07, + "loss": 0.0015, + "step": 21004 + }, + { + "epoch": 0.41, + "learning_rate": 1.1862451943613841e-07, + "loss": 0.001, + "step": 21005 + }, + { + "epoch": 0.41, + "learning_rate": 1.1862063609180227e-07, + "loss": 0.0007, + "step": 21006 + }, + { + "epoch": 0.41, + "learning_rate": 1.1861675274746613e-07, + "loss": 0.0011, + "step": 21007 + }, + { + "epoch": 0.41, + "learning_rate": 1.1861286940312998e-07, + "loss": 0.0065, + "step": 21008 + }, + { + "epoch": 0.41, + "learning_rate": 1.1860898605879383e-07, + "loss": 0.0007, + "step": 21009 + }, + { + "epoch": 0.41, + "learning_rate": 1.1860510271445769e-07, + "loss": 0.0016, + "step": 21010 + }, + { + "epoch": 0.41, + "learning_rate": 1.1860121937012155e-07, + "loss": 0.0009, + "step": 21011 + }, + { + "epoch": 0.41, + "learning_rate": 1.185973360257854e-07, + "loss": 0.0008, + "step": 21012 + }, + { + "epoch": 0.41, + "learning_rate": 1.1859345268144926e-07, + "loss": 0.0006, + "step": 21013 + }, + { + "epoch": 0.41, + "learning_rate": 1.1858956933711312e-07, + "loss": 0.0037, + "step": 21014 + }, + { + "epoch": 0.41, + "learning_rate": 1.1858568599277698e-07, + "loss": 0.0007, + "step": 21015 + }, + { + "epoch": 0.41, + "learning_rate": 1.1858180264844084e-07, + "loss": 0.6253, + "step": 21016 + }, + { + "epoch": 0.41, + "learning_rate": 1.1857791930410468e-07, + "loss": 0.0007, + "step": 21017 + }, + { + "epoch": 0.41, + "learning_rate": 1.1857403595976854e-07, + "loss": 0.0006, + "step": 21018 + }, + { + "epoch": 0.41, + "learning_rate": 1.185701526154324e-07, + "loss": 0.0006, + "step": 21019 + }, + { + "epoch": 0.41, + "learning_rate": 1.1856626927109626e-07, + "loss": 0.0027, + "step": 21020 + }, + { + "epoch": 0.41, + "learning_rate": 1.1856238592676012e-07, + "loss": 0.0031, + "step": 21021 + }, + { + "epoch": 0.41, + "learning_rate": 1.1855850258242397e-07, + "loss": 0.0812, + "step": 21022 + }, + { + "epoch": 0.41, + "learning_rate": 1.1855461923808783e-07, + "loss": 0.0007, + "step": 21023 + }, + { + "epoch": 0.41, + "learning_rate": 1.1855073589375169e-07, + "loss": 0.0005, + "step": 21024 + }, + { + "epoch": 0.41, + "learning_rate": 1.1854685254941555e-07, + "loss": 0.0006, + "step": 21025 + }, + { + "epoch": 0.41, + "learning_rate": 1.1854296920507941e-07, + "loss": 0.6375, + "step": 21026 + }, + { + "epoch": 0.41, + "learning_rate": 1.1853908586074326e-07, + "loss": 0.855, + "step": 21027 + }, + { + "epoch": 0.41, + "learning_rate": 1.1853520251640712e-07, + "loss": 0.0008, + "step": 21028 + }, + { + "epoch": 0.41, + "learning_rate": 1.1853131917207098e-07, + "loss": 0.0008, + "step": 21029 + }, + { + "epoch": 0.41, + "learning_rate": 1.1852743582773484e-07, + "loss": 0.0007, + "step": 21030 + }, + { + "epoch": 0.41, + "learning_rate": 1.185235524833987e-07, + "loss": 0.0007, + "step": 21031 + }, + { + "epoch": 0.41, + "learning_rate": 1.1851966913906256e-07, + "loss": 0.0005, + "step": 21032 + }, + { + "epoch": 0.41, + "learning_rate": 1.1851578579472641e-07, + "loss": 0.0465, + "step": 21033 + }, + { + "epoch": 0.41, + "learning_rate": 1.1851190245039027e-07, + "loss": 0.1726, + "step": 21034 + }, + { + "epoch": 0.41, + "learning_rate": 1.1850801910605413e-07, + "loss": 0.0012, + "step": 21035 + }, + { + "epoch": 0.41, + "learning_rate": 1.1850413576171799e-07, + "loss": 0.0013, + "step": 21036 + }, + { + "epoch": 0.41, + "learning_rate": 1.1850025241738185e-07, + "loss": 0.001, + "step": 21037 + }, + { + "epoch": 0.41, + "learning_rate": 1.1849636907304569e-07, + "loss": 0.0005, + "step": 21038 + }, + { + "epoch": 0.41, + "learning_rate": 1.1849248572870955e-07, + "loss": 0.0025, + "step": 21039 + }, + { + "epoch": 0.41, + "learning_rate": 1.1848860238437341e-07, + "loss": 0.0008, + "step": 21040 + }, + { + "epoch": 0.41, + "learning_rate": 1.1848471904003727e-07, + "loss": 0.3219, + "step": 21041 + }, + { + "epoch": 0.41, + "learning_rate": 1.1848083569570113e-07, + "loss": 0.0006, + "step": 21042 + }, + { + "epoch": 0.41, + "learning_rate": 1.1847695235136498e-07, + "loss": 0.003, + "step": 21043 + }, + { + "epoch": 0.41, + "learning_rate": 1.1847306900702884e-07, + "loss": 0.0011, + "step": 21044 + }, + { + "epoch": 0.41, + "learning_rate": 1.184691856626927e-07, + "loss": 0.2249, + "step": 21045 + }, + { + "epoch": 0.41, + "learning_rate": 1.1846530231835656e-07, + "loss": 0.7929, + "step": 21046 + }, + { + "epoch": 0.41, + "learning_rate": 1.1846141897402042e-07, + "loss": 0.0009, + "step": 21047 + }, + { + "epoch": 0.41, + "learning_rate": 1.1845753562968427e-07, + "loss": 0.0012, + "step": 21048 + }, + { + "epoch": 0.41, + "learning_rate": 1.1845365228534813e-07, + "loss": 0.8359, + "step": 21049 + }, + { + "epoch": 0.41, + "learning_rate": 1.1844976894101199e-07, + "loss": 0.0009, + "step": 21050 + }, + { + "epoch": 0.41, + "learning_rate": 1.1844588559667585e-07, + "loss": 1.1122, + "step": 21051 + }, + { + "epoch": 0.41, + "learning_rate": 1.1844200225233971e-07, + "loss": 0.0007, + "step": 21052 + }, + { + "epoch": 0.41, + "learning_rate": 1.1843811890800357e-07, + "loss": 0.0006, + "step": 21053 + }, + { + "epoch": 0.41, + "learning_rate": 1.1843423556366742e-07, + "loss": 0.0008, + "step": 21054 + }, + { + "epoch": 0.41, + "learning_rate": 1.1843035221933128e-07, + "loss": 0.2973, + "step": 21055 + }, + { + "epoch": 0.41, + "learning_rate": 1.1842646887499514e-07, + "loss": 0.0007, + "step": 21056 + }, + { + "epoch": 0.41, + "learning_rate": 1.18422585530659e-07, + "loss": 0.0008, + "step": 21057 + }, + { + "epoch": 0.41, + "learning_rate": 1.1841870218632286e-07, + "loss": 0.0006, + "step": 21058 + }, + { + "epoch": 0.41, + "learning_rate": 1.1841481884198672e-07, + "loss": 0.0271, + "step": 21059 + }, + { + "epoch": 0.41, + "learning_rate": 1.1841093549765057e-07, + "loss": 0.0008, + "step": 21060 + }, + { + "epoch": 0.41, + "learning_rate": 1.1840705215331443e-07, + "loss": 0.0007, + "step": 21061 + }, + { + "epoch": 0.41, + "learning_rate": 1.1840316880897829e-07, + "loss": 0.0007, + "step": 21062 + }, + { + "epoch": 0.41, + "learning_rate": 1.1839928546464215e-07, + "loss": 0.0009, + "step": 21063 + }, + { + "epoch": 0.41, + "learning_rate": 1.1839540212030601e-07, + "loss": 0.0006, + "step": 21064 + }, + { + "epoch": 0.41, + "learning_rate": 1.1839151877596986e-07, + "loss": 0.0006, + "step": 21065 + }, + { + "epoch": 0.41, + "learning_rate": 1.1838763543163372e-07, + "loss": 0.0008, + "step": 21066 + }, + { + "epoch": 0.41, + "learning_rate": 1.1838375208729758e-07, + "loss": 0.0009, + "step": 21067 + }, + { + "epoch": 0.41, + "learning_rate": 1.1837986874296144e-07, + "loss": 0.0007, + "step": 21068 + }, + { + "epoch": 0.41, + "learning_rate": 1.183759853986253e-07, + "loss": 0.0007, + "step": 21069 + }, + { + "epoch": 0.41, + "learning_rate": 1.1837210205428916e-07, + "loss": 0.0012, + "step": 21070 + }, + { + "epoch": 0.41, + "learning_rate": 1.1836821870995301e-07, + "loss": 0.0007, + "step": 21071 + }, + { + "epoch": 0.41, + "learning_rate": 1.1836433536561687e-07, + "loss": 0.0009, + "step": 21072 + }, + { + "epoch": 0.41, + "learning_rate": 1.1836045202128073e-07, + "loss": 0.0005, + "step": 21073 + }, + { + "epoch": 0.41, + "learning_rate": 1.1835656867694459e-07, + "loss": 0.0006, + "step": 21074 + }, + { + "epoch": 0.41, + "learning_rate": 1.1835268533260842e-07, + "loss": 0.0005, + "step": 21075 + }, + { + "epoch": 0.41, + "learning_rate": 1.1834880198827228e-07, + "loss": 0.0007, + "step": 21076 + }, + { + "epoch": 0.41, + "learning_rate": 1.1834491864393614e-07, + "loss": 0.0008, + "step": 21077 + }, + { + "epoch": 0.41, + "learning_rate": 1.183410352996e-07, + "loss": 0.0029, + "step": 21078 + }, + { + "epoch": 0.41, + "learning_rate": 1.1833715195526385e-07, + "loss": 0.0007, + "step": 21079 + }, + { + "epoch": 0.41, + "learning_rate": 1.1833326861092771e-07, + "loss": 0.0009, + "step": 21080 + }, + { + "epoch": 0.41, + "learning_rate": 1.1832938526659157e-07, + "loss": 0.0006, + "step": 21081 + }, + { + "epoch": 0.41, + "learning_rate": 1.1832550192225543e-07, + "loss": 0.0005, + "step": 21082 + }, + { + "epoch": 0.41, + "learning_rate": 1.1832161857791929e-07, + "loss": 0.001, + "step": 21083 + }, + { + "epoch": 0.41, + "learning_rate": 1.1831773523358315e-07, + "loss": 0.0006, + "step": 21084 + }, + { + "epoch": 0.41, + "learning_rate": 1.18313851889247e-07, + "loss": 0.0007, + "step": 21085 + }, + { + "epoch": 0.41, + "learning_rate": 1.1830996854491086e-07, + "loss": 0.0008, + "step": 21086 + }, + { + "epoch": 0.41, + "learning_rate": 1.1830608520057472e-07, + "loss": 0.001, + "step": 21087 + }, + { + "epoch": 0.41, + "learning_rate": 1.1830220185623858e-07, + "loss": 0.0005, + "step": 21088 + }, + { + "epoch": 0.41, + "learning_rate": 1.1829831851190244e-07, + "loss": 0.0007, + "step": 21089 + }, + { + "epoch": 0.41, + "learning_rate": 1.182944351675663e-07, + "loss": 0.0072, + "step": 21090 + }, + { + "epoch": 0.41, + "learning_rate": 1.1829055182323015e-07, + "loss": 0.0007, + "step": 21091 + }, + { + "epoch": 0.41, + "learning_rate": 1.1828666847889401e-07, + "loss": 0.0008, + "step": 21092 + }, + { + "epoch": 0.41, + "learning_rate": 1.1828278513455787e-07, + "loss": 0.0008, + "step": 21093 + }, + { + "epoch": 0.41, + "learning_rate": 1.1827890179022173e-07, + "loss": 0.0008, + "step": 21094 + }, + { + "epoch": 0.41, + "learning_rate": 1.1827501844588559e-07, + "loss": 0.0049, + "step": 21095 + }, + { + "epoch": 0.41, + "learning_rate": 1.1827113510154944e-07, + "loss": 0.0025, + "step": 21096 + }, + { + "epoch": 0.41, + "learning_rate": 1.182672517572133e-07, + "loss": 0.0011, + "step": 21097 + }, + { + "epoch": 0.41, + "learning_rate": 1.1826336841287716e-07, + "loss": 0.0136, + "step": 21098 + }, + { + "epoch": 0.41, + "learning_rate": 1.1825948506854102e-07, + "loss": 0.0008, + "step": 21099 + }, + { + "epoch": 0.41, + "learning_rate": 1.1825560172420488e-07, + "loss": 0.0011, + "step": 21100 + }, + { + "epoch": 0.41, + "learning_rate": 1.1825171837986874e-07, + "loss": 0.0008, + "step": 21101 + }, + { + "epoch": 0.41, + "learning_rate": 1.182478350355326e-07, + "loss": 0.0016, + "step": 21102 + }, + { + "epoch": 0.41, + "learning_rate": 1.1824395169119645e-07, + "loss": 0.0007, + "step": 21103 + }, + { + "epoch": 0.41, + "learning_rate": 1.1824006834686031e-07, + "loss": 0.0006, + "step": 21104 + }, + { + "epoch": 0.41, + "learning_rate": 1.1823618500252417e-07, + "loss": 0.0011, + "step": 21105 + }, + { + "epoch": 0.41, + "learning_rate": 1.1823230165818803e-07, + "loss": 0.0011, + "step": 21106 + }, + { + "epoch": 0.41, + "learning_rate": 1.1822841831385188e-07, + "loss": 0.0014, + "step": 21107 + }, + { + "epoch": 0.41, + "learning_rate": 1.1822453496951574e-07, + "loss": 0.0007, + "step": 21108 + }, + { + "epoch": 0.41, + "learning_rate": 1.182206516251796e-07, + "loss": 0.0007, + "step": 21109 + }, + { + "epoch": 0.41, + "learning_rate": 1.1821676828084346e-07, + "loss": 0.0007, + "step": 21110 + }, + { + "epoch": 0.41, + "learning_rate": 1.1821288493650732e-07, + "loss": 0.0007, + "step": 21111 + }, + { + "epoch": 0.41, + "learning_rate": 1.1820900159217118e-07, + "loss": 0.0008, + "step": 21112 + }, + { + "epoch": 0.41, + "learning_rate": 1.1820511824783503e-07, + "loss": 0.0015, + "step": 21113 + }, + { + "epoch": 0.41, + "learning_rate": 1.1820123490349889e-07, + "loss": 0.0007, + "step": 21114 + }, + { + "epoch": 0.41, + "learning_rate": 1.1819735155916275e-07, + "loss": 0.0006, + "step": 21115 + }, + { + "epoch": 0.41, + "learning_rate": 1.1819346821482661e-07, + "loss": 0.0297, + "step": 21116 + }, + { + "epoch": 0.41, + "learning_rate": 1.1818958487049047e-07, + "loss": 0.0006, + "step": 21117 + }, + { + "epoch": 0.41, + "learning_rate": 1.1818570152615433e-07, + "loss": 0.0006, + "step": 21118 + }, + { + "epoch": 0.41, + "learning_rate": 1.1818181818181818e-07, + "loss": 0.0005, + "step": 21119 + }, + { + "epoch": 0.41, + "learning_rate": 1.1817793483748204e-07, + "loss": 0.0008, + "step": 21120 + }, + { + "epoch": 0.41, + "learning_rate": 1.181740514931459e-07, + "loss": 0.0009, + "step": 21121 + }, + { + "epoch": 0.41, + "learning_rate": 1.1817016814880976e-07, + "loss": 0.0009, + "step": 21122 + }, + { + "epoch": 0.41, + "learning_rate": 1.1816628480447362e-07, + "loss": 0.0006, + "step": 21123 + }, + { + "epoch": 0.41, + "learning_rate": 1.1816240146013747e-07, + "loss": 0.0007, + "step": 21124 + }, + { + "epoch": 0.41, + "learning_rate": 1.1815851811580133e-07, + "loss": 0.0008, + "step": 21125 + }, + { + "epoch": 0.41, + "learning_rate": 1.1815463477146519e-07, + "loss": 0.0006, + "step": 21126 + }, + { + "epoch": 0.41, + "learning_rate": 1.1815075142712905e-07, + "loss": 0.0005, + "step": 21127 + }, + { + "epoch": 0.41, + "learning_rate": 1.1814686808279291e-07, + "loss": 1.2825, + "step": 21128 + }, + { + "epoch": 0.41, + "learning_rate": 1.1814298473845677e-07, + "loss": 0.0011, + "step": 21129 + }, + { + "epoch": 0.41, + "learning_rate": 1.1813910139412062e-07, + "loss": 0.0012, + "step": 21130 + }, + { + "epoch": 0.41, + "learning_rate": 1.1813521804978448e-07, + "loss": 0.0066, + "step": 21131 + }, + { + "epoch": 0.41, + "learning_rate": 1.1813133470544834e-07, + "loss": 0.0008, + "step": 21132 + }, + { + "epoch": 0.41, + "learning_rate": 1.1812745136111217e-07, + "loss": 0.0014, + "step": 21133 + }, + { + "epoch": 0.41, + "learning_rate": 1.1812356801677603e-07, + "loss": 0.0008, + "step": 21134 + }, + { + "epoch": 0.41, + "learning_rate": 1.1811968467243989e-07, + "loss": 0.0006, + "step": 21135 + }, + { + "epoch": 0.41, + "learning_rate": 1.1811580132810375e-07, + "loss": 0.0007, + "step": 21136 + }, + { + "epoch": 0.41, + "learning_rate": 1.181119179837676e-07, + "loss": 0.0013, + "step": 21137 + }, + { + "epoch": 0.41, + "learning_rate": 1.1810803463943146e-07, + "loss": 0.0007, + "step": 21138 + }, + { + "epoch": 0.41, + "learning_rate": 1.1810415129509532e-07, + "loss": 0.0007, + "step": 21139 + }, + { + "epoch": 0.41, + "learning_rate": 1.1810026795075918e-07, + "loss": 0.0015, + "step": 21140 + }, + { + "epoch": 0.41, + "learning_rate": 1.1809638460642304e-07, + "loss": 0.2402, + "step": 21141 + }, + { + "epoch": 0.41, + "learning_rate": 1.180925012620869e-07, + "loss": 0.0007, + "step": 21142 + }, + { + "epoch": 0.41, + "learning_rate": 1.1808861791775076e-07, + "loss": 0.0207, + "step": 21143 + }, + { + "epoch": 0.41, + "learning_rate": 1.1808473457341461e-07, + "loss": 0.0005, + "step": 21144 + }, + { + "epoch": 0.41, + "learning_rate": 1.1808085122907847e-07, + "loss": 0.0007, + "step": 21145 + }, + { + "epoch": 0.41, + "learning_rate": 1.1807696788474233e-07, + "loss": 0.0006, + "step": 21146 + }, + { + "epoch": 0.41, + "learning_rate": 1.1807308454040619e-07, + "loss": 0.0023, + "step": 21147 + }, + { + "epoch": 0.41, + "learning_rate": 1.1806920119607005e-07, + "loss": 0.0007, + "step": 21148 + }, + { + "epoch": 0.41, + "learning_rate": 1.180653178517339e-07, + "loss": 0.0006, + "step": 21149 + }, + { + "epoch": 0.41, + "learning_rate": 1.1806143450739776e-07, + "loss": 0.0008, + "step": 21150 + }, + { + "epoch": 0.41, + "learning_rate": 1.1805755116306162e-07, + "loss": 0.4698, + "step": 21151 + }, + { + "epoch": 0.41, + "learning_rate": 1.1805366781872548e-07, + "loss": 0.001, + "step": 21152 + }, + { + "epoch": 0.41, + "learning_rate": 1.1804978447438934e-07, + "loss": 0.0007, + "step": 21153 + }, + { + "epoch": 0.41, + "learning_rate": 1.180459011300532e-07, + "loss": 0.0007, + "step": 21154 + }, + { + "epoch": 0.41, + "learning_rate": 1.1804201778571705e-07, + "loss": 0.0008, + "step": 21155 + }, + { + "epoch": 0.41, + "learning_rate": 1.1803813444138091e-07, + "loss": 0.0007, + "step": 21156 + }, + { + "epoch": 0.41, + "learning_rate": 1.1803425109704477e-07, + "loss": 0.0007, + "step": 21157 + }, + { + "epoch": 0.41, + "learning_rate": 1.1803036775270863e-07, + "loss": 0.0007, + "step": 21158 + }, + { + "epoch": 0.41, + "learning_rate": 1.1802648440837249e-07, + "loss": 0.0009, + "step": 21159 + }, + { + "epoch": 0.41, + "learning_rate": 1.1802260106403635e-07, + "loss": 0.0007, + "step": 21160 + }, + { + "epoch": 0.41, + "learning_rate": 1.180187177197002e-07, + "loss": 0.0461, + "step": 21161 + }, + { + "epoch": 0.41, + "learning_rate": 1.1801483437536406e-07, + "loss": 0.0008, + "step": 21162 + }, + { + "epoch": 0.41, + "learning_rate": 1.1801095103102792e-07, + "loss": 0.0006, + "step": 21163 + }, + { + "epoch": 0.41, + "learning_rate": 1.1800706768669178e-07, + "loss": 0.0007, + "step": 21164 + }, + { + "epoch": 0.41, + "learning_rate": 1.1800318434235564e-07, + "loss": 0.0013, + "step": 21165 + }, + { + "epoch": 0.41, + "learning_rate": 1.179993009980195e-07, + "loss": 0.001, + "step": 21166 + }, + { + "epoch": 0.41, + "learning_rate": 1.1799541765368335e-07, + "loss": 0.0006, + "step": 21167 + }, + { + "epoch": 0.41, + "learning_rate": 1.1799153430934721e-07, + "loss": 0.0005, + "step": 21168 + }, + { + "epoch": 0.41, + "learning_rate": 1.1798765096501107e-07, + "loss": 0.0008, + "step": 21169 + }, + { + "epoch": 0.41, + "learning_rate": 1.1798376762067493e-07, + "loss": 0.0007, + "step": 21170 + }, + { + "epoch": 0.41, + "learning_rate": 1.1797988427633879e-07, + "loss": 0.0008, + "step": 21171 + }, + { + "epoch": 0.41, + "learning_rate": 1.1797600093200264e-07, + "loss": 0.0008, + "step": 21172 + }, + { + "epoch": 0.41, + "learning_rate": 1.179721175876665e-07, + "loss": 0.0006, + "step": 21173 + }, + { + "epoch": 0.41, + "learning_rate": 1.1796823424333036e-07, + "loss": 0.0005, + "step": 21174 + }, + { + "epoch": 0.41, + "learning_rate": 1.1796435089899422e-07, + "loss": 0.0006, + "step": 21175 + }, + { + "epoch": 0.41, + "learning_rate": 1.1796046755465808e-07, + "loss": 0.0006, + "step": 21176 + }, + { + "epoch": 0.41, + "learning_rate": 1.1795658421032194e-07, + "loss": 0.0006, + "step": 21177 + }, + { + "epoch": 0.41, + "learning_rate": 1.179527008659858e-07, + "loss": 0.4891, + "step": 21178 + }, + { + "epoch": 0.41, + "learning_rate": 1.1794881752164965e-07, + "loss": 0.0007, + "step": 21179 + }, + { + "epoch": 0.41, + "learning_rate": 1.1794493417731351e-07, + "loss": 0.0006, + "step": 21180 + }, + { + "epoch": 0.41, + "learning_rate": 1.1794105083297737e-07, + "loss": 0.1393, + "step": 21181 + }, + { + "epoch": 0.41, + "learning_rate": 1.1793716748864123e-07, + "loss": 0.0063, + "step": 21182 + }, + { + "epoch": 0.41, + "learning_rate": 1.1793328414430508e-07, + "loss": 0.0005, + "step": 21183 + }, + { + "epoch": 0.41, + "learning_rate": 1.1792940079996894e-07, + "loss": 0.0007, + "step": 21184 + }, + { + "epoch": 0.41, + "learning_rate": 1.179255174556328e-07, + "loss": 0.0005, + "step": 21185 + }, + { + "epoch": 0.41, + "learning_rate": 1.1792163411129665e-07, + "loss": 0.0008, + "step": 21186 + }, + { + "epoch": 0.41, + "learning_rate": 1.179177507669605e-07, + "loss": 0.0008, + "step": 21187 + }, + { + "epoch": 0.41, + "learning_rate": 1.1791386742262436e-07, + "loss": 0.0009, + "step": 21188 + }, + { + "epoch": 0.41, + "learning_rate": 1.1790998407828822e-07, + "loss": 0.9991, + "step": 21189 + }, + { + "epoch": 0.41, + "learning_rate": 1.1790610073395208e-07, + "loss": 0.0006, + "step": 21190 + }, + { + "epoch": 0.41, + "learning_rate": 1.1790221738961592e-07, + "loss": 0.0007, + "step": 21191 + }, + { + "epoch": 0.41, + "learning_rate": 1.1789833404527978e-07, + "loss": 0.0008, + "step": 21192 + }, + { + "epoch": 0.41, + "learning_rate": 1.1789445070094364e-07, + "loss": 0.0008, + "step": 21193 + }, + { + "epoch": 0.41, + "learning_rate": 1.178905673566075e-07, + "loss": 0.0008, + "step": 21194 + }, + { + "epoch": 0.41, + "learning_rate": 1.1788668401227136e-07, + "loss": 0.0005, + "step": 21195 + }, + { + "epoch": 0.41, + "learning_rate": 1.1788280066793522e-07, + "loss": 0.0008, + "step": 21196 + }, + { + "epoch": 0.41, + "learning_rate": 1.1787891732359907e-07, + "loss": 0.0032, + "step": 21197 + }, + { + "epoch": 0.41, + "learning_rate": 1.1787503397926293e-07, + "loss": 0.0006, + "step": 21198 + }, + { + "epoch": 0.41, + "learning_rate": 1.1787115063492679e-07, + "loss": 0.0006, + "step": 21199 + }, + { + "epoch": 0.41, + "learning_rate": 1.1786726729059065e-07, + "loss": 0.0013, + "step": 21200 + }, + { + "epoch": 0.41, + "learning_rate": 1.1786338394625451e-07, + "loss": 0.0007, + "step": 21201 + }, + { + "epoch": 0.41, + "learning_rate": 1.1785950060191837e-07, + "loss": 0.0007, + "step": 21202 + }, + { + "epoch": 0.41, + "learning_rate": 1.1785561725758222e-07, + "loss": 0.0005, + "step": 21203 + }, + { + "epoch": 0.41, + "learning_rate": 1.1785173391324608e-07, + "loss": 0.499, + "step": 21204 + }, + { + "epoch": 0.41, + "learning_rate": 1.1784785056890994e-07, + "loss": 1.0604, + "step": 21205 + }, + { + "epoch": 0.41, + "learning_rate": 1.178439672245738e-07, + "loss": 0.0007, + "step": 21206 + }, + { + "epoch": 0.41, + "learning_rate": 1.1784008388023766e-07, + "loss": 0.0007, + "step": 21207 + }, + { + "epoch": 0.41, + "learning_rate": 1.1783620053590151e-07, + "loss": 0.0019, + "step": 21208 + }, + { + "epoch": 0.41, + "learning_rate": 1.1783231719156537e-07, + "loss": 0.0009, + "step": 21209 + }, + { + "epoch": 0.41, + "learning_rate": 1.1782843384722923e-07, + "loss": 0.0008, + "step": 21210 + }, + { + "epoch": 0.41, + "learning_rate": 1.1782455050289309e-07, + "loss": 0.0008, + "step": 21211 + }, + { + "epoch": 0.41, + "learning_rate": 1.1782066715855695e-07, + "loss": 0.0017, + "step": 21212 + }, + { + "epoch": 0.41, + "learning_rate": 1.178167838142208e-07, + "loss": 0.0133, + "step": 21213 + }, + { + "epoch": 0.41, + "learning_rate": 1.1781290046988466e-07, + "loss": 0.0007, + "step": 21214 + }, + { + "epoch": 0.41, + "learning_rate": 1.1780901712554851e-07, + "loss": 0.0659, + "step": 21215 + }, + { + "epoch": 0.41, + "learning_rate": 1.1780513378121237e-07, + "loss": 0.0009, + "step": 21216 + }, + { + "epoch": 0.41, + "learning_rate": 1.1780125043687623e-07, + "loss": 0.9955, + "step": 21217 + }, + { + "epoch": 0.41, + "learning_rate": 1.1779736709254008e-07, + "loss": 0.0006, + "step": 21218 + }, + { + "epoch": 0.41, + "learning_rate": 1.1779348374820394e-07, + "loss": 0.0008, + "step": 21219 + }, + { + "epoch": 0.41, + "learning_rate": 1.177896004038678e-07, + "loss": 0.0007, + "step": 21220 + }, + { + "epoch": 0.41, + "learning_rate": 1.1778571705953166e-07, + "loss": 0.0007, + "step": 21221 + }, + { + "epoch": 0.41, + "learning_rate": 1.1778183371519552e-07, + "loss": 0.0013, + "step": 21222 + }, + { + "epoch": 0.41, + "learning_rate": 1.1777795037085937e-07, + "loss": 0.0009, + "step": 21223 + }, + { + "epoch": 0.41, + "learning_rate": 1.1777406702652323e-07, + "loss": 0.0007, + "step": 21224 + }, + { + "epoch": 0.41, + "learning_rate": 1.1777018368218709e-07, + "loss": 0.0008, + "step": 21225 + }, + { + "epoch": 0.41, + "learning_rate": 1.1776630033785095e-07, + "loss": 0.001, + "step": 21226 + }, + { + "epoch": 0.41, + "learning_rate": 1.1776241699351481e-07, + "loss": 0.0009, + "step": 21227 + }, + { + "epoch": 0.41, + "learning_rate": 1.1775853364917867e-07, + "loss": 0.0005, + "step": 21228 + }, + { + "epoch": 0.41, + "learning_rate": 1.1775465030484252e-07, + "loss": 0.0009, + "step": 21229 + }, + { + "epoch": 0.41, + "learning_rate": 1.1775076696050638e-07, + "loss": 0.8626, + "step": 21230 + }, + { + "epoch": 0.41, + "learning_rate": 1.1774688361617024e-07, + "loss": 0.0007, + "step": 21231 + }, + { + "epoch": 0.41, + "learning_rate": 1.177430002718341e-07, + "loss": 0.0023, + "step": 21232 + }, + { + "epoch": 0.41, + "learning_rate": 1.1773911692749796e-07, + "loss": 0.001, + "step": 21233 + }, + { + "epoch": 0.41, + "learning_rate": 1.1773523358316182e-07, + "loss": 0.0008, + "step": 21234 + }, + { + "epoch": 0.41, + "learning_rate": 1.1773135023882567e-07, + "loss": 0.0006, + "step": 21235 + }, + { + "epoch": 0.41, + "learning_rate": 1.1772746689448953e-07, + "loss": 0.0011, + "step": 21236 + }, + { + "epoch": 0.41, + "learning_rate": 1.1772358355015339e-07, + "loss": 0.0028, + "step": 21237 + }, + { + "epoch": 0.41, + "learning_rate": 1.1771970020581725e-07, + "loss": 0.001, + "step": 21238 + }, + { + "epoch": 0.41, + "learning_rate": 1.1771581686148111e-07, + "loss": 0.0006, + "step": 21239 + }, + { + "epoch": 0.41, + "learning_rate": 1.1771193351714497e-07, + "loss": 0.1803, + "step": 21240 + }, + { + "epoch": 0.41, + "learning_rate": 1.1770805017280882e-07, + "loss": 0.0006, + "step": 21241 + }, + { + "epoch": 0.41, + "learning_rate": 1.1770416682847268e-07, + "loss": 0.0008, + "step": 21242 + }, + { + "epoch": 0.41, + "learning_rate": 1.1770028348413654e-07, + "loss": 0.0011, + "step": 21243 + }, + { + "epoch": 0.41, + "learning_rate": 1.176964001398004e-07, + "loss": 0.6066, + "step": 21244 + }, + { + "epoch": 0.41, + "learning_rate": 1.1769251679546426e-07, + "loss": 0.0008, + "step": 21245 + }, + { + "epoch": 0.41, + "learning_rate": 1.1768863345112811e-07, + "loss": 0.0008, + "step": 21246 + }, + { + "epoch": 0.41, + "learning_rate": 1.1768475010679197e-07, + "loss": 0.0008, + "step": 21247 + }, + { + "epoch": 0.41, + "learning_rate": 1.1768086676245583e-07, + "loss": 0.0006, + "step": 21248 + }, + { + "epoch": 0.41, + "learning_rate": 1.1767698341811966e-07, + "loss": 0.0005, + "step": 21249 + }, + { + "epoch": 0.41, + "learning_rate": 1.1767310007378352e-07, + "loss": 0.0005, + "step": 21250 + }, + { + "epoch": 0.41, + "learning_rate": 1.1766921672944738e-07, + "loss": 0.0009, + "step": 21251 + }, + { + "epoch": 0.41, + "learning_rate": 1.1766533338511124e-07, + "loss": 0.0011, + "step": 21252 + }, + { + "epoch": 0.41, + "learning_rate": 1.176614500407751e-07, + "loss": 0.0015, + "step": 21253 + }, + { + "epoch": 0.41, + "learning_rate": 1.1765756669643895e-07, + "loss": 0.3881, + "step": 21254 + }, + { + "epoch": 0.41, + "learning_rate": 1.1765368335210281e-07, + "loss": 0.0011, + "step": 21255 + }, + { + "epoch": 0.41, + "learning_rate": 1.1764980000776667e-07, + "loss": 0.0009, + "step": 21256 + }, + { + "epoch": 0.41, + "learning_rate": 1.1764591666343053e-07, + "loss": 0.0005, + "step": 21257 + }, + { + "epoch": 0.41, + "learning_rate": 1.1764203331909439e-07, + "loss": 0.0013, + "step": 21258 + }, + { + "epoch": 0.41, + "learning_rate": 1.1763814997475825e-07, + "loss": 0.0007, + "step": 21259 + }, + { + "epoch": 0.41, + "learning_rate": 1.176342666304221e-07, + "loss": 0.1077, + "step": 21260 + }, + { + "epoch": 0.41, + "learning_rate": 1.1763038328608596e-07, + "loss": 0.0006, + "step": 21261 + }, + { + "epoch": 0.41, + "learning_rate": 1.1762649994174982e-07, + "loss": 0.0008, + "step": 21262 + }, + { + "epoch": 0.41, + "learning_rate": 1.1762261659741368e-07, + "loss": 0.0007, + "step": 21263 + }, + { + "epoch": 0.41, + "learning_rate": 1.1761873325307754e-07, + "loss": 0.0006, + "step": 21264 + }, + { + "epoch": 0.41, + "learning_rate": 1.176148499087414e-07, + "loss": 0.0013, + "step": 21265 + }, + { + "epoch": 0.41, + "learning_rate": 1.1761096656440525e-07, + "loss": 0.0019, + "step": 21266 + }, + { + "epoch": 0.41, + "learning_rate": 1.1760708322006911e-07, + "loss": 0.0018, + "step": 21267 + }, + { + "epoch": 0.41, + "learning_rate": 1.1760319987573297e-07, + "loss": 0.0009, + "step": 21268 + }, + { + "epoch": 0.41, + "learning_rate": 1.1759931653139683e-07, + "loss": 0.0007, + "step": 21269 + }, + { + "epoch": 0.41, + "learning_rate": 1.1759543318706069e-07, + "loss": 0.0017, + "step": 21270 + }, + { + "epoch": 0.41, + "learning_rate": 1.1759154984272454e-07, + "loss": 1.1669, + "step": 21271 + }, + { + "epoch": 0.41, + "learning_rate": 1.175876664983884e-07, + "loss": 0.0014, + "step": 21272 + }, + { + "epoch": 0.41, + "learning_rate": 1.1758378315405226e-07, + "loss": 0.0006, + "step": 21273 + }, + { + "epoch": 0.41, + "learning_rate": 1.1757989980971612e-07, + "loss": 0.0007, + "step": 21274 + }, + { + "epoch": 0.41, + "learning_rate": 1.1757601646537998e-07, + "loss": 0.0005, + "step": 21275 + }, + { + "epoch": 0.41, + "learning_rate": 1.1757213312104384e-07, + "loss": 0.0007, + "step": 21276 + }, + { + "epoch": 0.41, + "learning_rate": 1.175682497767077e-07, + "loss": 0.0008, + "step": 21277 + }, + { + "epoch": 0.41, + "learning_rate": 1.1756436643237155e-07, + "loss": 0.0007, + "step": 21278 + }, + { + "epoch": 0.41, + "learning_rate": 1.1756048308803541e-07, + "loss": 0.0007, + "step": 21279 + }, + { + "epoch": 0.41, + "learning_rate": 1.1755659974369927e-07, + "loss": 0.0007, + "step": 21280 + }, + { + "epoch": 0.41, + "learning_rate": 1.1755271639936313e-07, + "loss": 0.0007, + "step": 21281 + }, + { + "epoch": 0.41, + "learning_rate": 1.1754883305502698e-07, + "loss": 0.0023, + "step": 21282 + }, + { + "epoch": 0.41, + "learning_rate": 1.1754494971069084e-07, + "loss": 0.0009, + "step": 21283 + }, + { + "epoch": 0.41, + "learning_rate": 1.175410663663547e-07, + "loss": 0.0008, + "step": 21284 + }, + { + "epoch": 0.41, + "learning_rate": 1.1753718302201856e-07, + "loss": 0.3744, + "step": 21285 + }, + { + "epoch": 0.41, + "learning_rate": 1.1753329967768242e-07, + "loss": 0.0005, + "step": 21286 + }, + { + "epoch": 0.41, + "learning_rate": 1.1752941633334628e-07, + "loss": 0.001, + "step": 21287 + }, + { + "epoch": 0.41, + "learning_rate": 1.1752553298901013e-07, + "loss": 0.0007, + "step": 21288 + }, + { + "epoch": 0.41, + "learning_rate": 1.1752164964467399e-07, + "loss": 0.0008, + "step": 21289 + }, + { + "epoch": 0.41, + "learning_rate": 1.1751776630033785e-07, + "loss": 0.0006, + "step": 21290 + }, + { + "epoch": 0.41, + "learning_rate": 1.1751388295600171e-07, + "loss": 0.0007, + "step": 21291 + }, + { + "epoch": 0.41, + "learning_rate": 1.1750999961166557e-07, + "loss": 0.0006, + "step": 21292 + }, + { + "epoch": 0.41, + "learning_rate": 1.1750611626732943e-07, + "loss": 0.0007, + "step": 21293 + }, + { + "epoch": 0.41, + "learning_rate": 1.1750223292299328e-07, + "loss": 0.0006, + "step": 21294 + }, + { + "epoch": 0.41, + "learning_rate": 1.1749834957865714e-07, + "loss": 0.0025, + "step": 21295 + }, + { + "epoch": 0.41, + "learning_rate": 1.17494466234321e-07, + "loss": 0.0008, + "step": 21296 + }, + { + "epoch": 0.41, + "learning_rate": 1.1749058288998486e-07, + "loss": 0.0095, + "step": 21297 + }, + { + "epoch": 0.41, + "learning_rate": 1.1748669954564872e-07, + "loss": 0.0007, + "step": 21298 + }, + { + "epoch": 0.41, + "learning_rate": 1.1748281620131258e-07, + "loss": 0.0013, + "step": 21299 + }, + { + "epoch": 0.41, + "learning_rate": 1.1747893285697643e-07, + "loss": 0.0012, + "step": 21300 + }, + { + "epoch": 0.41, + "learning_rate": 1.1747504951264029e-07, + "loss": 0.0007, + "step": 21301 + }, + { + "epoch": 0.41, + "learning_rate": 1.1747116616830415e-07, + "loss": 0.0006, + "step": 21302 + }, + { + "epoch": 0.41, + "learning_rate": 1.1746728282396801e-07, + "loss": 0.0006, + "step": 21303 + }, + { + "epoch": 0.41, + "learning_rate": 1.1746339947963187e-07, + "loss": 0.0005, + "step": 21304 + }, + { + "epoch": 0.41, + "learning_rate": 1.1745951613529572e-07, + "loss": 0.0026, + "step": 21305 + }, + { + "epoch": 0.41, + "learning_rate": 1.1745563279095958e-07, + "loss": 0.0006, + "step": 21306 + }, + { + "epoch": 0.41, + "learning_rate": 1.1745174944662341e-07, + "loss": 0.618, + "step": 21307 + }, + { + "epoch": 0.41, + "learning_rate": 1.1744786610228727e-07, + "loss": 0.3196, + "step": 21308 + }, + { + "epoch": 0.41, + "learning_rate": 1.1744398275795113e-07, + "loss": 0.0007, + "step": 21309 + }, + { + "epoch": 0.41, + "learning_rate": 1.1744009941361499e-07, + "loss": 0.0007, + "step": 21310 + }, + { + "epoch": 0.41, + "learning_rate": 1.1743621606927885e-07, + "loss": 1.0033, + "step": 21311 + }, + { + "epoch": 0.41, + "learning_rate": 1.174323327249427e-07, + "loss": 0.0007, + "step": 21312 + }, + { + "epoch": 0.41, + "learning_rate": 1.1742844938060656e-07, + "loss": 0.0006, + "step": 21313 + }, + { + "epoch": 0.41, + "learning_rate": 1.1742456603627042e-07, + "loss": 0.0005, + "step": 21314 + }, + { + "epoch": 0.41, + "learning_rate": 1.1742068269193428e-07, + "loss": 0.0367, + "step": 21315 + }, + { + "epoch": 0.41, + "learning_rate": 1.1741679934759814e-07, + "loss": 0.0005, + "step": 21316 + }, + { + "epoch": 0.41, + "learning_rate": 1.17412916003262e-07, + "loss": 0.0005, + "step": 21317 + }, + { + "epoch": 0.41, + "learning_rate": 1.1740903265892586e-07, + "loss": 0.0006, + "step": 21318 + }, + { + "epoch": 0.41, + "learning_rate": 1.1740514931458971e-07, + "loss": 0.0009, + "step": 21319 + }, + { + "epoch": 0.41, + "learning_rate": 1.1740126597025357e-07, + "loss": 1.272, + "step": 21320 + }, + { + "epoch": 0.41, + "learning_rate": 1.1739738262591743e-07, + "loss": 0.0049, + "step": 21321 + }, + { + "epoch": 0.41, + "learning_rate": 1.1739349928158129e-07, + "loss": 0.0008, + "step": 21322 + }, + { + "epoch": 0.41, + "learning_rate": 1.1738961593724515e-07, + "loss": 0.0032, + "step": 21323 + }, + { + "epoch": 0.41, + "learning_rate": 1.17385732592909e-07, + "loss": 0.0011, + "step": 21324 + }, + { + "epoch": 0.41, + "learning_rate": 1.1738184924857286e-07, + "loss": 0.1339, + "step": 21325 + }, + { + "epoch": 0.41, + "learning_rate": 1.1737796590423672e-07, + "loss": 0.0006, + "step": 21326 + }, + { + "epoch": 0.41, + "learning_rate": 1.1737408255990058e-07, + "loss": 0.0006, + "step": 21327 + }, + { + "epoch": 0.41, + "learning_rate": 1.1737019921556444e-07, + "loss": 0.0054, + "step": 21328 + }, + { + "epoch": 0.41, + "learning_rate": 1.173663158712283e-07, + "loss": 0.0005, + "step": 21329 + }, + { + "epoch": 0.41, + "learning_rate": 1.1736243252689215e-07, + "loss": 0.0005, + "step": 21330 + }, + { + "epoch": 0.41, + "learning_rate": 1.1735854918255601e-07, + "loss": 0.0007, + "step": 21331 + }, + { + "epoch": 0.41, + "learning_rate": 1.1735466583821987e-07, + "loss": 0.0006, + "step": 21332 + }, + { + "epoch": 0.41, + "learning_rate": 1.1735078249388373e-07, + "loss": 0.0007, + "step": 21333 + }, + { + "epoch": 0.41, + "learning_rate": 1.1734689914954759e-07, + "loss": 0.0006, + "step": 21334 + }, + { + "epoch": 0.41, + "learning_rate": 1.1734301580521145e-07, + "loss": 0.0006, + "step": 21335 + }, + { + "epoch": 0.41, + "learning_rate": 1.173391324608753e-07, + "loss": 0.1625, + "step": 21336 + }, + { + "epoch": 0.41, + "learning_rate": 1.1733524911653916e-07, + "loss": 0.0008, + "step": 21337 + }, + { + "epoch": 0.41, + "learning_rate": 1.1733136577220302e-07, + "loss": 0.0006, + "step": 21338 + }, + { + "epoch": 0.41, + "learning_rate": 1.1732748242786688e-07, + "loss": 0.0008, + "step": 21339 + }, + { + "epoch": 0.41, + "learning_rate": 1.1732359908353074e-07, + "loss": 0.0011, + "step": 21340 + }, + { + "epoch": 0.41, + "learning_rate": 1.173197157391946e-07, + "loss": 0.0008, + "step": 21341 + }, + { + "epoch": 0.41, + "learning_rate": 1.1731583239485845e-07, + "loss": 0.0007, + "step": 21342 + }, + { + "epoch": 0.41, + "learning_rate": 1.1731194905052231e-07, + "loss": 0.0006, + "step": 21343 + }, + { + "epoch": 0.41, + "learning_rate": 1.1730806570618617e-07, + "loss": 0.811, + "step": 21344 + }, + { + "epoch": 0.41, + "learning_rate": 1.1730418236185003e-07, + "loss": 0.0005, + "step": 21345 + }, + { + "epoch": 0.41, + "learning_rate": 1.1730029901751389e-07, + "loss": 0.0007, + "step": 21346 + }, + { + "epoch": 0.41, + "learning_rate": 1.1729641567317774e-07, + "loss": 0.0009, + "step": 21347 + }, + { + "epoch": 0.41, + "learning_rate": 1.172925323288416e-07, + "loss": 0.0011, + "step": 21348 + }, + { + "epoch": 0.41, + "learning_rate": 1.1728864898450546e-07, + "loss": 0.0277, + "step": 21349 + }, + { + "epoch": 0.41, + "learning_rate": 1.1728476564016932e-07, + "loss": 0.0322, + "step": 21350 + }, + { + "epoch": 0.41, + "learning_rate": 1.1728088229583318e-07, + "loss": 0.0008, + "step": 21351 + }, + { + "epoch": 0.41, + "learning_rate": 1.1727699895149704e-07, + "loss": 0.0657, + "step": 21352 + }, + { + "epoch": 0.41, + "learning_rate": 1.172731156071609e-07, + "loss": 0.0007, + "step": 21353 + }, + { + "epoch": 0.41, + "learning_rate": 1.1726923226282475e-07, + "loss": 0.0007, + "step": 21354 + }, + { + "epoch": 0.41, + "learning_rate": 1.1726534891848861e-07, + "loss": 0.0008, + "step": 21355 + }, + { + "epoch": 0.41, + "learning_rate": 1.1726146557415247e-07, + "loss": 0.0008, + "step": 21356 + }, + { + "epoch": 0.41, + "learning_rate": 1.1725758222981633e-07, + "loss": 1.5926, + "step": 21357 + }, + { + "epoch": 0.41, + "learning_rate": 1.1725369888548018e-07, + "loss": 0.0014, + "step": 21358 + }, + { + "epoch": 0.41, + "learning_rate": 1.1724981554114404e-07, + "loss": 0.0007, + "step": 21359 + }, + { + "epoch": 0.41, + "learning_rate": 1.172459321968079e-07, + "loss": 0.002, + "step": 21360 + }, + { + "epoch": 0.41, + "learning_rate": 1.1724204885247176e-07, + "loss": 0.0007, + "step": 21361 + }, + { + "epoch": 0.41, + "learning_rate": 1.1723816550813562e-07, + "loss": 0.0005, + "step": 21362 + }, + { + "epoch": 0.41, + "learning_rate": 1.1723428216379946e-07, + "loss": 0.0015, + "step": 21363 + }, + { + "epoch": 0.41, + "learning_rate": 1.1723039881946332e-07, + "loss": 0.0018, + "step": 21364 + }, + { + "epoch": 0.41, + "learning_rate": 1.1722651547512717e-07, + "loss": 0.0006, + "step": 21365 + }, + { + "epoch": 0.41, + "learning_rate": 1.1722263213079102e-07, + "loss": 0.0007, + "step": 21366 + }, + { + "epoch": 0.41, + "learning_rate": 1.1721874878645488e-07, + "loss": 0.0031, + "step": 21367 + }, + { + "epoch": 0.41, + "learning_rate": 1.1721486544211874e-07, + "loss": 0.0006, + "step": 21368 + }, + { + "epoch": 0.41, + "learning_rate": 1.172109820977826e-07, + "loss": 0.0018, + "step": 21369 + }, + { + "epoch": 0.41, + "learning_rate": 1.1720709875344646e-07, + "loss": 0.0409, + "step": 21370 + }, + { + "epoch": 0.41, + "learning_rate": 1.1720321540911032e-07, + "loss": 0.0008, + "step": 21371 + }, + { + "epoch": 0.41, + "learning_rate": 1.1719933206477417e-07, + "loss": 0.0047, + "step": 21372 + }, + { + "epoch": 0.41, + "learning_rate": 1.1719544872043803e-07, + "loss": 0.0008, + "step": 21373 + }, + { + "epoch": 0.41, + "learning_rate": 1.1719156537610189e-07, + "loss": 0.0007, + "step": 21374 + }, + { + "epoch": 0.41, + "learning_rate": 1.1718768203176575e-07, + "loss": 0.0008, + "step": 21375 + }, + { + "epoch": 0.41, + "learning_rate": 1.1718379868742961e-07, + "loss": 0.0008, + "step": 21376 + }, + { + "epoch": 0.41, + "learning_rate": 1.1717991534309347e-07, + "loss": 0.0005, + "step": 21377 + }, + { + "epoch": 0.41, + "learning_rate": 1.1717603199875732e-07, + "loss": 0.0005, + "step": 21378 + }, + { + "epoch": 0.41, + "learning_rate": 1.1717214865442118e-07, + "loss": 0.0005, + "step": 21379 + }, + { + "epoch": 0.41, + "learning_rate": 1.1716826531008504e-07, + "loss": 0.0005, + "step": 21380 + }, + { + "epoch": 0.41, + "learning_rate": 1.171643819657489e-07, + "loss": 0.0009, + "step": 21381 + }, + { + "epoch": 0.41, + "learning_rate": 1.1716049862141276e-07, + "loss": 0.0049, + "step": 21382 + }, + { + "epoch": 0.41, + "learning_rate": 1.1715661527707661e-07, + "loss": 0.0027, + "step": 21383 + }, + { + "epoch": 0.41, + "learning_rate": 1.1715273193274047e-07, + "loss": 0.0006, + "step": 21384 + }, + { + "epoch": 0.41, + "learning_rate": 1.1714884858840433e-07, + "loss": 0.0004, + "step": 21385 + }, + { + "epoch": 0.41, + "learning_rate": 1.1714496524406819e-07, + "loss": 0.0006, + "step": 21386 + }, + { + "epoch": 0.41, + "learning_rate": 1.1714108189973205e-07, + "loss": 0.0011, + "step": 21387 + }, + { + "epoch": 0.41, + "learning_rate": 1.171371985553959e-07, + "loss": 0.6426, + "step": 21388 + }, + { + "epoch": 0.41, + "learning_rate": 1.1713331521105976e-07, + "loss": 0.001, + "step": 21389 + }, + { + "epoch": 0.41, + "learning_rate": 1.1712943186672362e-07, + "loss": 0.0005, + "step": 21390 + }, + { + "epoch": 0.41, + "learning_rate": 1.1712554852238748e-07, + "loss": 0.0007, + "step": 21391 + }, + { + "epoch": 0.41, + "learning_rate": 1.1712166517805133e-07, + "loss": 0.2623, + "step": 21392 + }, + { + "epoch": 0.41, + "learning_rate": 1.1711778183371518e-07, + "loss": 0.6952, + "step": 21393 + }, + { + "epoch": 0.41, + "learning_rate": 1.1711389848937904e-07, + "loss": 0.0014, + "step": 21394 + }, + { + "epoch": 0.42, + "learning_rate": 1.171100151450429e-07, + "loss": 0.1436, + "step": 21395 + }, + { + "epoch": 0.42, + "learning_rate": 1.1710613180070676e-07, + "loss": 0.0009, + "step": 21396 + }, + { + "epoch": 0.42, + "learning_rate": 1.1710224845637062e-07, + "loss": 0.0008, + "step": 21397 + }, + { + "epoch": 0.42, + "learning_rate": 1.1709836511203448e-07, + "loss": 0.0007, + "step": 21398 + }, + { + "epoch": 0.42, + "learning_rate": 1.1709448176769833e-07, + "loss": 0.3279, + "step": 21399 + }, + { + "epoch": 0.42, + "learning_rate": 1.1709059842336219e-07, + "loss": 0.0006, + "step": 21400 + }, + { + "epoch": 0.42, + "learning_rate": 1.1708671507902605e-07, + "loss": 0.0006, + "step": 21401 + }, + { + "epoch": 0.42, + "learning_rate": 1.1708283173468991e-07, + "loss": 0.0009, + "step": 21402 + }, + { + "epoch": 0.42, + "learning_rate": 1.1707894839035377e-07, + "loss": 0.0019, + "step": 21403 + }, + { + "epoch": 0.42, + "learning_rate": 1.1707506504601762e-07, + "loss": 0.0018, + "step": 21404 + }, + { + "epoch": 0.42, + "learning_rate": 1.1707118170168148e-07, + "loss": 0.0012, + "step": 21405 + }, + { + "epoch": 0.42, + "learning_rate": 1.1706729835734534e-07, + "loss": 0.0008, + "step": 21406 + }, + { + "epoch": 0.42, + "learning_rate": 1.170634150130092e-07, + "loss": 0.0006, + "step": 21407 + }, + { + "epoch": 0.42, + "learning_rate": 1.1705953166867306e-07, + "loss": 0.0006, + "step": 21408 + }, + { + "epoch": 0.42, + "learning_rate": 1.1705564832433692e-07, + "loss": 0.0007, + "step": 21409 + }, + { + "epoch": 0.42, + "learning_rate": 1.1705176498000077e-07, + "loss": 0.0053, + "step": 21410 + }, + { + "epoch": 0.42, + "learning_rate": 1.1704788163566463e-07, + "loss": 0.0006, + "step": 21411 + }, + { + "epoch": 0.42, + "learning_rate": 1.1704399829132849e-07, + "loss": 0.0006, + "step": 21412 + }, + { + "epoch": 0.42, + "learning_rate": 1.1704011494699235e-07, + "loss": 0.0021, + "step": 21413 + }, + { + "epoch": 0.42, + "learning_rate": 1.1703623160265621e-07, + "loss": 0.0008, + "step": 21414 + }, + { + "epoch": 0.42, + "learning_rate": 1.1703234825832007e-07, + "loss": 0.0008, + "step": 21415 + }, + { + "epoch": 0.42, + "learning_rate": 1.1702846491398392e-07, + "loss": 0.0006, + "step": 21416 + }, + { + "epoch": 0.42, + "learning_rate": 1.1702458156964778e-07, + "loss": 0.0009, + "step": 21417 + }, + { + "epoch": 0.42, + "learning_rate": 1.1702069822531164e-07, + "loss": 0.2599, + "step": 21418 + }, + { + "epoch": 0.42, + "learning_rate": 1.170168148809755e-07, + "loss": 0.001, + "step": 21419 + }, + { + "epoch": 0.42, + "learning_rate": 1.1701293153663936e-07, + "loss": 0.0006, + "step": 21420 + }, + { + "epoch": 0.42, + "learning_rate": 1.1700904819230321e-07, + "loss": 0.0007, + "step": 21421 + }, + { + "epoch": 0.42, + "learning_rate": 1.1700516484796707e-07, + "loss": 0.0007, + "step": 21422 + }, + { + "epoch": 0.42, + "learning_rate": 1.170012815036309e-07, + "loss": 1.2468, + "step": 21423 + }, + { + "epoch": 0.42, + "learning_rate": 1.1699739815929476e-07, + "loss": 0.0006, + "step": 21424 + }, + { + "epoch": 0.42, + "learning_rate": 1.1699351481495862e-07, + "loss": 0.0007, + "step": 21425 + }, + { + "epoch": 0.42, + "learning_rate": 1.1698963147062248e-07, + "loss": 0.0014, + "step": 21426 + }, + { + "epoch": 0.42, + "learning_rate": 1.1698574812628634e-07, + "loss": 0.0007, + "step": 21427 + }, + { + "epoch": 0.42, + "learning_rate": 1.169818647819502e-07, + "loss": 0.0007, + "step": 21428 + }, + { + "epoch": 0.42, + "learning_rate": 1.1697798143761405e-07, + "loss": 0.0252, + "step": 21429 + }, + { + "epoch": 0.42, + "learning_rate": 1.1697409809327791e-07, + "loss": 0.2018, + "step": 21430 + }, + { + "epoch": 0.42, + "learning_rate": 1.1697021474894177e-07, + "loss": 0.7295, + "step": 21431 + }, + { + "epoch": 0.42, + "learning_rate": 1.1696633140460563e-07, + "loss": 0.0007, + "step": 21432 + }, + { + "epoch": 0.42, + "learning_rate": 1.1696244806026949e-07, + "loss": 0.0009, + "step": 21433 + }, + { + "epoch": 0.42, + "learning_rate": 1.1695856471593335e-07, + "loss": 0.0007, + "step": 21434 + }, + { + "epoch": 0.42, + "learning_rate": 1.169546813715972e-07, + "loss": 0.0008, + "step": 21435 + }, + { + "epoch": 0.42, + "learning_rate": 1.1695079802726106e-07, + "loss": 0.0008, + "step": 21436 + }, + { + "epoch": 0.42, + "learning_rate": 1.1694691468292492e-07, + "loss": 0.0018, + "step": 21437 + }, + { + "epoch": 0.42, + "learning_rate": 1.1694303133858878e-07, + "loss": 1.0201, + "step": 21438 + }, + { + "epoch": 0.42, + "learning_rate": 1.1693914799425264e-07, + "loss": 0.0006, + "step": 21439 + }, + { + "epoch": 0.42, + "learning_rate": 1.169352646499165e-07, + "loss": 0.1891, + "step": 21440 + }, + { + "epoch": 0.42, + "learning_rate": 1.1693138130558035e-07, + "loss": 1.4903, + "step": 21441 + }, + { + "epoch": 0.42, + "learning_rate": 1.1692749796124421e-07, + "loss": 0.001, + "step": 21442 + }, + { + "epoch": 0.42, + "learning_rate": 1.1692361461690807e-07, + "loss": 0.4554, + "step": 21443 + }, + { + "epoch": 0.42, + "learning_rate": 1.1691973127257193e-07, + "loss": 0.0006, + "step": 21444 + }, + { + "epoch": 0.42, + "learning_rate": 1.1691584792823579e-07, + "loss": 0.0006, + "step": 21445 + }, + { + "epoch": 0.42, + "learning_rate": 1.1691196458389964e-07, + "loss": 0.0006, + "step": 21446 + }, + { + "epoch": 0.42, + "learning_rate": 1.169080812395635e-07, + "loss": 0.4544, + "step": 21447 + }, + { + "epoch": 0.42, + "learning_rate": 1.1690419789522736e-07, + "loss": 0.0196, + "step": 21448 + }, + { + "epoch": 0.42, + "learning_rate": 1.1690031455089122e-07, + "loss": 0.0006, + "step": 21449 + }, + { + "epoch": 0.42, + "learning_rate": 1.1689643120655508e-07, + "loss": 0.0006, + "step": 21450 + }, + { + "epoch": 0.42, + "learning_rate": 1.1689254786221894e-07, + "loss": 0.0312, + "step": 21451 + }, + { + "epoch": 0.42, + "learning_rate": 1.168886645178828e-07, + "loss": 0.0005, + "step": 21452 + }, + { + "epoch": 0.42, + "learning_rate": 1.1688478117354665e-07, + "loss": 0.003, + "step": 21453 + }, + { + "epoch": 0.42, + "learning_rate": 1.1688089782921051e-07, + "loss": 0.0015, + "step": 21454 + }, + { + "epoch": 0.42, + "learning_rate": 1.1687701448487437e-07, + "loss": 0.0006, + "step": 21455 + }, + { + "epoch": 0.42, + "learning_rate": 1.1687313114053823e-07, + "loss": 0.0011, + "step": 21456 + }, + { + "epoch": 0.42, + "learning_rate": 1.1686924779620208e-07, + "loss": 0.0007, + "step": 21457 + }, + { + "epoch": 0.42, + "learning_rate": 1.1686536445186594e-07, + "loss": 0.002, + "step": 21458 + }, + { + "epoch": 0.42, + "learning_rate": 1.168614811075298e-07, + "loss": 0.0006, + "step": 21459 + }, + { + "epoch": 0.42, + "learning_rate": 1.1685759776319366e-07, + "loss": 0.0007, + "step": 21460 + }, + { + "epoch": 0.42, + "learning_rate": 1.1685371441885752e-07, + "loss": 0.5276, + "step": 21461 + }, + { + "epoch": 0.42, + "learning_rate": 1.1684983107452138e-07, + "loss": 0.001, + "step": 21462 + }, + { + "epoch": 0.42, + "learning_rate": 1.1684594773018523e-07, + "loss": 0.0049, + "step": 21463 + }, + { + "epoch": 0.42, + "learning_rate": 1.1684206438584909e-07, + "loss": 0.0005, + "step": 21464 + }, + { + "epoch": 0.42, + "learning_rate": 1.1683818104151295e-07, + "loss": 0.0009, + "step": 21465 + }, + { + "epoch": 0.42, + "learning_rate": 1.1683429769717681e-07, + "loss": 0.0008, + "step": 21466 + }, + { + "epoch": 0.42, + "learning_rate": 1.1683041435284067e-07, + "loss": 0.0012, + "step": 21467 + }, + { + "epoch": 0.42, + "learning_rate": 1.1682653100850453e-07, + "loss": 0.0008, + "step": 21468 + }, + { + "epoch": 0.42, + "learning_rate": 1.1682264766416838e-07, + "loss": 0.0013, + "step": 21469 + }, + { + "epoch": 0.42, + "learning_rate": 1.1681876431983224e-07, + "loss": 0.0006, + "step": 21470 + }, + { + "epoch": 0.42, + "learning_rate": 1.168148809754961e-07, + "loss": 0.0008, + "step": 21471 + }, + { + "epoch": 0.42, + "learning_rate": 1.1681099763115996e-07, + "loss": 0.0007, + "step": 21472 + }, + { + "epoch": 0.42, + "learning_rate": 1.1680711428682382e-07, + "loss": 0.001, + "step": 21473 + }, + { + "epoch": 0.42, + "learning_rate": 1.1680323094248768e-07, + "loss": 0.0009, + "step": 21474 + }, + { + "epoch": 0.42, + "learning_rate": 1.1679934759815153e-07, + "loss": 0.0009, + "step": 21475 + }, + { + "epoch": 0.42, + "learning_rate": 1.1679546425381539e-07, + "loss": 0.0012, + "step": 21476 + }, + { + "epoch": 0.42, + "learning_rate": 1.1679158090947925e-07, + "loss": 0.0039, + "step": 21477 + }, + { + "epoch": 0.42, + "learning_rate": 1.1678769756514311e-07, + "loss": 0.0007, + "step": 21478 + }, + { + "epoch": 0.42, + "learning_rate": 1.1678381422080697e-07, + "loss": 0.0006, + "step": 21479 + }, + { + "epoch": 0.42, + "learning_rate": 1.1677993087647082e-07, + "loss": 0.0006, + "step": 21480 + }, + { + "epoch": 0.42, + "learning_rate": 1.1677604753213466e-07, + "loss": 0.0007, + "step": 21481 + }, + { + "epoch": 0.42, + "learning_rate": 1.1677216418779851e-07, + "loss": 0.0006, + "step": 21482 + }, + { + "epoch": 0.42, + "learning_rate": 1.1676828084346237e-07, + "loss": 0.0006, + "step": 21483 + }, + { + "epoch": 0.42, + "learning_rate": 1.1676439749912623e-07, + "loss": 0.0009, + "step": 21484 + }, + { + "epoch": 0.42, + "learning_rate": 1.1676051415479009e-07, + "loss": 0.0043, + "step": 21485 + }, + { + "epoch": 0.42, + "learning_rate": 1.1675663081045395e-07, + "loss": 0.0007, + "step": 21486 + }, + { + "epoch": 0.42, + "learning_rate": 1.167527474661178e-07, + "loss": 0.0012, + "step": 21487 + }, + { + "epoch": 0.42, + "learning_rate": 1.1674886412178166e-07, + "loss": 0.0009, + "step": 21488 + }, + { + "epoch": 0.42, + "learning_rate": 1.1674498077744552e-07, + "loss": 0.0006, + "step": 21489 + }, + { + "epoch": 0.42, + "learning_rate": 1.1674109743310938e-07, + "loss": 0.0007, + "step": 21490 + }, + { + "epoch": 0.42, + "learning_rate": 1.1673721408877324e-07, + "loss": 0.0019, + "step": 21491 + }, + { + "epoch": 0.42, + "learning_rate": 1.167333307444371e-07, + "loss": 0.0007, + "step": 21492 + }, + { + "epoch": 0.42, + "learning_rate": 1.1672944740010096e-07, + "loss": 0.0006, + "step": 21493 + }, + { + "epoch": 0.42, + "learning_rate": 1.1672556405576481e-07, + "loss": 0.0009, + "step": 21494 + }, + { + "epoch": 0.42, + "learning_rate": 1.1672168071142867e-07, + "loss": 0.001, + "step": 21495 + }, + { + "epoch": 0.42, + "learning_rate": 1.1671779736709253e-07, + "loss": 0.0007, + "step": 21496 + }, + { + "epoch": 0.42, + "learning_rate": 1.1671391402275639e-07, + "loss": 0.0017, + "step": 21497 + }, + { + "epoch": 0.42, + "learning_rate": 1.1671003067842025e-07, + "loss": 0.0126, + "step": 21498 + }, + { + "epoch": 0.42, + "learning_rate": 1.167061473340841e-07, + "loss": 0.0084, + "step": 21499 + }, + { + "epoch": 0.42, + "learning_rate": 1.1670226398974796e-07, + "loss": 0.0006, + "step": 21500 + }, + { + "epoch": 0.42, + "learning_rate": 1.1669838064541182e-07, + "loss": 0.0005, + "step": 21501 + }, + { + "epoch": 0.42, + "learning_rate": 1.1669449730107568e-07, + "loss": 0.0009, + "step": 21502 + }, + { + "epoch": 0.42, + "learning_rate": 1.1669061395673954e-07, + "loss": 0.0007, + "step": 21503 + }, + { + "epoch": 0.42, + "learning_rate": 1.166867306124034e-07, + "loss": 0.0005, + "step": 21504 + }, + { + "epoch": 0.42, + "learning_rate": 1.1668284726806725e-07, + "loss": 0.0009, + "step": 21505 + }, + { + "epoch": 0.42, + "learning_rate": 1.1667896392373111e-07, + "loss": 0.0057, + "step": 21506 + }, + { + "epoch": 0.42, + "learning_rate": 1.1667508057939497e-07, + "loss": 0.0006, + "step": 21507 + }, + { + "epoch": 0.42, + "learning_rate": 1.1667119723505883e-07, + "loss": 0.0007, + "step": 21508 + }, + { + "epoch": 0.42, + "learning_rate": 1.1666731389072269e-07, + "loss": 0.0007, + "step": 21509 + }, + { + "epoch": 0.42, + "learning_rate": 1.1666343054638655e-07, + "loss": 0.0009, + "step": 21510 + }, + { + "epoch": 0.42, + "learning_rate": 1.166595472020504e-07, + "loss": 0.0005, + "step": 21511 + }, + { + "epoch": 0.42, + "learning_rate": 1.1665566385771426e-07, + "loss": 0.0008, + "step": 21512 + }, + { + "epoch": 0.42, + "learning_rate": 1.1665178051337812e-07, + "loss": 0.0046, + "step": 21513 + }, + { + "epoch": 0.42, + "learning_rate": 1.1664789716904198e-07, + "loss": 0.0006, + "step": 21514 + }, + { + "epoch": 0.42, + "learning_rate": 1.1664401382470584e-07, + "loss": 0.0008, + "step": 21515 + }, + { + "epoch": 0.42, + "learning_rate": 1.166401304803697e-07, + "loss": 0.0007, + "step": 21516 + }, + { + "epoch": 0.42, + "learning_rate": 1.1663624713603355e-07, + "loss": 0.0005, + "step": 21517 + }, + { + "epoch": 0.42, + "learning_rate": 1.1663236379169741e-07, + "loss": 0.0009, + "step": 21518 + }, + { + "epoch": 0.42, + "learning_rate": 1.1662848044736127e-07, + "loss": 0.0006, + "step": 21519 + }, + { + "epoch": 0.42, + "learning_rate": 1.1662459710302513e-07, + "loss": 0.001, + "step": 21520 + }, + { + "epoch": 0.42, + "learning_rate": 1.1662071375868899e-07, + "loss": 0.0601, + "step": 21521 + }, + { + "epoch": 0.42, + "learning_rate": 1.1661683041435284e-07, + "loss": 0.0012, + "step": 21522 + }, + { + "epoch": 0.42, + "learning_rate": 1.166129470700167e-07, + "loss": 0.0007, + "step": 21523 + }, + { + "epoch": 0.42, + "learning_rate": 1.1660906372568056e-07, + "loss": 1.0178, + "step": 21524 + }, + { + "epoch": 0.42, + "learning_rate": 1.1660518038134442e-07, + "loss": 0.0008, + "step": 21525 + }, + { + "epoch": 0.42, + "learning_rate": 1.1660129703700828e-07, + "loss": 0.0007, + "step": 21526 + }, + { + "epoch": 0.42, + "learning_rate": 1.1659741369267214e-07, + "loss": 0.0109, + "step": 21527 + }, + { + "epoch": 0.42, + "learning_rate": 1.16593530348336e-07, + "loss": 0.0005, + "step": 21528 + }, + { + "epoch": 0.42, + "learning_rate": 1.1658964700399985e-07, + "loss": 0.0006, + "step": 21529 + }, + { + "epoch": 0.42, + "learning_rate": 1.1658576365966371e-07, + "loss": 0.302, + "step": 21530 + }, + { + "epoch": 0.42, + "learning_rate": 1.1658188031532757e-07, + "loss": 0.0008, + "step": 21531 + }, + { + "epoch": 0.42, + "learning_rate": 1.1657799697099143e-07, + "loss": 0.0012, + "step": 21532 + }, + { + "epoch": 0.42, + "learning_rate": 1.1657411362665529e-07, + "loss": 0.0006, + "step": 21533 + }, + { + "epoch": 0.42, + "learning_rate": 1.1657023028231914e-07, + "loss": 0.0007, + "step": 21534 + }, + { + "epoch": 0.42, + "learning_rate": 1.16566346937983e-07, + "loss": 0.002, + "step": 21535 + }, + { + "epoch": 0.42, + "learning_rate": 1.1656246359364686e-07, + "loss": 0.5693, + "step": 21536 + }, + { + "epoch": 0.42, + "learning_rate": 1.1655858024931072e-07, + "loss": 0.0008, + "step": 21537 + }, + { + "epoch": 0.42, + "learning_rate": 1.1655469690497458e-07, + "loss": 0.0007, + "step": 21538 + }, + { + "epoch": 0.42, + "learning_rate": 1.1655081356063841e-07, + "loss": 1.0569, + "step": 21539 + }, + { + "epoch": 0.42, + "learning_rate": 1.1654693021630227e-07, + "loss": 0.0006, + "step": 21540 + }, + { + "epoch": 0.42, + "learning_rate": 1.1654304687196612e-07, + "loss": 0.035, + "step": 21541 + }, + { + "epoch": 0.42, + "learning_rate": 1.1653916352762998e-07, + "loss": 0.0007, + "step": 21542 + }, + { + "epoch": 0.42, + "learning_rate": 1.1653528018329384e-07, + "loss": 0.0008, + "step": 21543 + }, + { + "epoch": 0.42, + "learning_rate": 1.165313968389577e-07, + "loss": 0.0008, + "step": 21544 + }, + { + "epoch": 0.42, + "learning_rate": 1.1652751349462156e-07, + "loss": 0.0008, + "step": 21545 + }, + { + "epoch": 0.42, + "learning_rate": 1.1652363015028542e-07, + "loss": 0.0008, + "step": 21546 + }, + { + "epoch": 0.42, + "learning_rate": 1.1651974680594927e-07, + "loss": 0.0006, + "step": 21547 + }, + { + "epoch": 0.42, + "learning_rate": 1.1651586346161313e-07, + "loss": 0.0006, + "step": 21548 + }, + { + "epoch": 0.42, + "learning_rate": 1.1651198011727699e-07, + "loss": 0.0006, + "step": 21549 + }, + { + "epoch": 0.42, + "learning_rate": 1.1650809677294085e-07, + "loss": 0.0007, + "step": 21550 + }, + { + "epoch": 0.42, + "learning_rate": 1.1650421342860471e-07, + "loss": 0.0007, + "step": 21551 + }, + { + "epoch": 0.42, + "learning_rate": 1.1650033008426857e-07, + "loss": 0.0007, + "step": 21552 + }, + { + "epoch": 0.42, + "learning_rate": 1.1649644673993242e-07, + "loss": 0.0011, + "step": 21553 + }, + { + "epoch": 0.42, + "learning_rate": 1.1649256339559628e-07, + "loss": 0.0424, + "step": 21554 + }, + { + "epoch": 0.42, + "learning_rate": 1.1648868005126014e-07, + "loss": 0.0023, + "step": 21555 + }, + { + "epoch": 0.42, + "learning_rate": 1.16484796706924e-07, + "loss": 0.001, + "step": 21556 + }, + { + "epoch": 0.42, + "learning_rate": 1.1648091336258786e-07, + "loss": 0.001, + "step": 21557 + }, + { + "epoch": 0.42, + "learning_rate": 1.1647703001825171e-07, + "loss": 0.0007, + "step": 21558 + }, + { + "epoch": 0.42, + "learning_rate": 1.1647314667391557e-07, + "loss": 0.9697, + "step": 21559 + }, + { + "epoch": 0.42, + "learning_rate": 1.1646926332957943e-07, + "loss": 0.0015, + "step": 21560 + }, + { + "epoch": 0.42, + "learning_rate": 1.1646537998524329e-07, + "loss": 0.0007, + "step": 21561 + }, + { + "epoch": 0.42, + "learning_rate": 1.1646149664090715e-07, + "loss": 0.0006, + "step": 21562 + }, + { + "epoch": 0.42, + "learning_rate": 1.16457613296571e-07, + "loss": 0.0006, + "step": 21563 + }, + { + "epoch": 0.42, + "learning_rate": 1.1645372995223486e-07, + "loss": 0.0031, + "step": 21564 + }, + { + "epoch": 0.42, + "learning_rate": 1.1644984660789872e-07, + "loss": 0.0008, + "step": 21565 + }, + { + "epoch": 0.42, + "learning_rate": 1.1644596326356258e-07, + "loss": 0.0006, + "step": 21566 + }, + { + "epoch": 0.42, + "learning_rate": 1.1644207991922644e-07, + "loss": 0.0005, + "step": 21567 + }, + { + "epoch": 0.42, + "learning_rate": 1.164381965748903e-07, + "loss": 0.0006, + "step": 21568 + }, + { + "epoch": 0.42, + "learning_rate": 1.1643431323055414e-07, + "loss": 0.0008, + "step": 21569 + }, + { + "epoch": 0.42, + "learning_rate": 1.16430429886218e-07, + "loss": 1.8542, + "step": 21570 + }, + { + "epoch": 0.42, + "learning_rate": 1.1642654654188186e-07, + "loss": 0.0018, + "step": 21571 + }, + { + "epoch": 0.42, + "learning_rate": 1.1642266319754572e-07, + "loss": 0.0006, + "step": 21572 + }, + { + "epoch": 0.42, + "learning_rate": 1.1641877985320958e-07, + "loss": 0.0058, + "step": 21573 + }, + { + "epoch": 0.42, + "learning_rate": 1.1641489650887343e-07, + "loss": 0.0011, + "step": 21574 + }, + { + "epoch": 0.42, + "learning_rate": 1.1641101316453729e-07, + "loss": 0.0008, + "step": 21575 + }, + { + "epoch": 0.42, + "learning_rate": 1.1640712982020115e-07, + "loss": 0.0071, + "step": 21576 + }, + { + "epoch": 0.42, + "learning_rate": 1.1640324647586501e-07, + "loss": 0.0007, + "step": 21577 + }, + { + "epoch": 0.42, + "learning_rate": 1.1639936313152887e-07, + "loss": 0.0012, + "step": 21578 + }, + { + "epoch": 0.42, + "learning_rate": 1.1639547978719272e-07, + "loss": 0.0263, + "step": 21579 + }, + { + "epoch": 0.42, + "learning_rate": 1.1639159644285658e-07, + "loss": 0.0007, + "step": 21580 + }, + { + "epoch": 0.42, + "learning_rate": 1.1638771309852044e-07, + "loss": 0.0007, + "step": 21581 + }, + { + "epoch": 0.42, + "learning_rate": 1.163838297541843e-07, + "loss": 0.0012, + "step": 21582 + }, + { + "epoch": 0.42, + "learning_rate": 1.1637994640984816e-07, + "loss": 0.0011, + "step": 21583 + }, + { + "epoch": 0.42, + "learning_rate": 1.1637606306551202e-07, + "loss": 0.0006, + "step": 21584 + }, + { + "epoch": 0.42, + "learning_rate": 1.1637217972117587e-07, + "loss": 0.0006, + "step": 21585 + }, + { + "epoch": 0.42, + "learning_rate": 1.1636829637683973e-07, + "loss": 0.0009, + "step": 21586 + }, + { + "epoch": 0.42, + "learning_rate": 1.1636441303250359e-07, + "loss": 0.0008, + "step": 21587 + }, + { + "epoch": 0.42, + "learning_rate": 1.1636052968816745e-07, + "loss": 0.0008, + "step": 21588 + }, + { + "epoch": 0.42, + "learning_rate": 1.1635664634383131e-07, + "loss": 0.0007, + "step": 21589 + }, + { + "epoch": 0.42, + "learning_rate": 1.1635276299949517e-07, + "loss": 0.0006, + "step": 21590 + }, + { + "epoch": 0.42, + "learning_rate": 1.1634887965515902e-07, + "loss": 0.0005, + "step": 21591 + }, + { + "epoch": 0.42, + "learning_rate": 1.1634499631082288e-07, + "loss": 0.0007, + "step": 21592 + }, + { + "epoch": 0.42, + "learning_rate": 1.1634111296648674e-07, + "loss": 0.001, + "step": 21593 + }, + { + "epoch": 0.42, + "learning_rate": 1.163372296221506e-07, + "loss": 0.001, + "step": 21594 + }, + { + "epoch": 0.42, + "learning_rate": 1.1633334627781446e-07, + "loss": 0.0007, + "step": 21595 + }, + { + "epoch": 0.42, + "learning_rate": 1.1632946293347831e-07, + "loss": 0.0029, + "step": 21596 + }, + { + "epoch": 0.42, + "learning_rate": 1.1632557958914216e-07, + "loss": 0.0012, + "step": 21597 + }, + { + "epoch": 0.42, + "learning_rate": 1.16321696244806e-07, + "loss": 0.0005, + "step": 21598 + }, + { + "epoch": 0.42, + "learning_rate": 1.1631781290046986e-07, + "loss": 0.0009, + "step": 21599 + }, + { + "epoch": 0.42, + "learning_rate": 1.1631392955613372e-07, + "loss": 0.0006, + "step": 21600 + }, + { + "epoch": 0.42, + "learning_rate": 1.1631004621179758e-07, + "loss": 0.0007, + "step": 21601 + }, + { + "epoch": 0.42, + "learning_rate": 1.1630616286746144e-07, + "loss": 0.0006, + "step": 21602 + }, + { + "epoch": 0.42, + "learning_rate": 1.163022795231253e-07, + "loss": 0.0266, + "step": 21603 + }, + { + "epoch": 0.42, + "learning_rate": 1.1629839617878915e-07, + "loss": 0.0005, + "step": 21604 + }, + { + "epoch": 0.42, + "learning_rate": 1.1629451283445301e-07, + "loss": 0.0007, + "step": 21605 + }, + { + "epoch": 0.42, + "learning_rate": 1.1629062949011687e-07, + "loss": 0.0007, + "step": 21606 + }, + { + "epoch": 0.42, + "learning_rate": 1.1628674614578073e-07, + "loss": 0.0009, + "step": 21607 + }, + { + "epoch": 0.42, + "learning_rate": 1.1628286280144459e-07, + "loss": 0.6442, + "step": 21608 + }, + { + "epoch": 0.42, + "learning_rate": 1.1627897945710845e-07, + "loss": 0.0006, + "step": 21609 + }, + { + "epoch": 0.42, + "learning_rate": 1.162750961127723e-07, + "loss": 0.1539, + "step": 21610 + }, + { + "epoch": 0.42, + "learning_rate": 1.1627121276843616e-07, + "loss": 0.0023, + "step": 21611 + }, + { + "epoch": 0.42, + "learning_rate": 1.1626732942410002e-07, + "loss": 0.0006, + "step": 21612 + }, + { + "epoch": 0.42, + "learning_rate": 1.1626344607976388e-07, + "loss": 0.0007, + "step": 21613 + }, + { + "epoch": 0.42, + "learning_rate": 1.1625956273542774e-07, + "loss": 0.0005, + "step": 21614 + }, + { + "epoch": 0.42, + "learning_rate": 1.162556793910916e-07, + "loss": 1.0382, + "step": 21615 + }, + { + "epoch": 0.42, + "learning_rate": 1.1625179604675545e-07, + "loss": 0.0006, + "step": 21616 + }, + { + "epoch": 0.42, + "learning_rate": 1.1624791270241931e-07, + "loss": 0.1711, + "step": 21617 + }, + { + "epoch": 0.42, + "learning_rate": 1.1624402935808317e-07, + "loss": 0.0007, + "step": 21618 + }, + { + "epoch": 0.42, + "learning_rate": 1.1624014601374703e-07, + "loss": 0.0008, + "step": 21619 + }, + { + "epoch": 0.42, + "learning_rate": 1.1623626266941089e-07, + "loss": 0.0008, + "step": 21620 + }, + { + "epoch": 0.42, + "learning_rate": 1.1623237932507474e-07, + "loss": 0.0104, + "step": 21621 + }, + { + "epoch": 0.42, + "learning_rate": 1.162284959807386e-07, + "loss": 0.0037, + "step": 21622 + }, + { + "epoch": 0.42, + "learning_rate": 1.1622461263640246e-07, + "loss": 0.0006, + "step": 21623 + }, + { + "epoch": 0.42, + "learning_rate": 1.1622072929206632e-07, + "loss": 0.0005, + "step": 21624 + }, + { + "epoch": 0.42, + "learning_rate": 1.1621684594773018e-07, + "loss": 0.0011, + "step": 21625 + }, + { + "epoch": 0.42, + "learning_rate": 1.1621296260339404e-07, + "loss": 0.0008, + "step": 21626 + }, + { + "epoch": 0.42, + "learning_rate": 1.162090792590579e-07, + "loss": 0.0007, + "step": 21627 + }, + { + "epoch": 0.42, + "learning_rate": 1.1620519591472175e-07, + "loss": 0.0049, + "step": 21628 + }, + { + "epoch": 0.42, + "learning_rate": 1.1620131257038561e-07, + "loss": 0.0009, + "step": 21629 + }, + { + "epoch": 0.42, + "learning_rate": 1.1619742922604947e-07, + "loss": 0.0006, + "step": 21630 + }, + { + "epoch": 0.42, + "learning_rate": 1.1619354588171333e-07, + "loss": 0.001, + "step": 21631 + }, + { + "epoch": 0.42, + "learning_rate": 1.1618966253737719e-07, + "loss": 0.001, + "step": 21632 + }, + { + "epoch": 0.42, + "learning_rate": 1.1618577919304104e-07, + "loss": 0.0007, + "step": 21633 + }, + { + "epoch": 0.42, + "learning_rate": 1.161818958487049e-07, + "loss": 0.0009, + "step": 21634 + }, + { + "epoch": 0.42, + "learning_rate": 1.1617801250436876e-07, + "loss": 0.0022, + "step": 21635 + }, + { + "epoch": 0.42, + "learning_rate": 1.1617412916003262e-07, + "loss": 1.0624, + "step": 21636 + }, + { + "epoch": 0.42, + "learning_rate": 1.1617024581569648e-07, + "loss": 0.0008, + "step": 21637 + }, + { + "epoch": 0.42, + "learning_rate": 1.1616636247136033e-07, + "loss": 0.0006, + "step": 21638 + }, + { + "epoch": 0.42, + "learning_rate": 1.1616247912702419e-07, + "loss": 0.0006, + "step": 21639 + }, + { + "epoch": 0.42, + "learning_rate": 1.1615859578268805e-07, + "loss": 0.0016, + "step": 21640 + }, + { + "epoch": 0.42, + "learning_rate": 1.1615471243835191e-07, + "loss": 0.5013, + "step": 21641 + }, + { + "epoch": 0.42, + "learning_rate": 1.1615082909401577e-07, + "loss": 0.0006, + "step": 21642 + }, + { + "epoch": 0.42, + "learning_rate": 1.1614694574967963e-07, + "loss": 0.0005, + "step": 21643 + }, + { + "epoch": 0.42, + "learning_rate": 1.1614306240534348e-07, + "loss": 0.0014, + "step": 21644 + }, + { + "epoch": 0.42, + "learning_rate": 1.1613917906100734e-07, + "loss": 0.0007, + "step": 21645 + }, + { + "epoch": 0.42, + "learning_rate": 1.161352957166712e-07, + "loss": 0.0009, + "step": 21646 + }, + { + "epoch": 0.42, + "learning_rate": 1.1613141237233506e-07, + "loss": 0.001, + "step": 21647 + }, + { + "epoch": 0.42, + "learning_rate": 1.1612752902799892e-07, + "loss": 0.0029, + "step": 21648 + }, + { + "epoch": 0.42, + "learning_rate": 1.1612364568366278e-07, + "loss": 0.0023, + "step": 21649 + }, + { + "epoch": 0.42, + "learning_rate": 1.1611976233932663e-07, + "loss": 0.0013, + "step": 21650 + }, + { + "epoch": 0.42, + "learning_rate": 1.1611587899499049e-07, + "loss": 0.0007, + "step": 21651 + }, + { + "epoch": 0.42, + "learning_rate": 1.1611199565065435e-07, + "loss": 0.0008, + "step": 21652 + }, + { + "epoch": 0.42, + "learning_rate": 1.1610811230631821e-07, + "loss": 0.0006, + "step": 21653 + }, + { + "epoch": 0.42, + "learning_rate": 1.1610422896198207e-07, + "loss": 0.0006, + "step": 21654 + }, + { + "epoch": 0.42, + "learning_rate": 1.161003456176459e-07, + "loss": 0.0006, + "step": 21655 + }, + { + "epoch": 0.42, + "learning_rate": 1.1609646227330976e-07, + "loss": 0.0005, + "step": 21656 + }, + { + "epoch": 0.42, + "learning_rate": 1.1609257892897361e-07, + "loss": 0.0008, + "step": 21657 + }, + { + "epoch": 0.42, + "learning_rate": 1.1608869558463747e-07, + "loss": 0.0007, + "step": 21658 + }, + { + "epoch": 0.42, + "learning_rate": 1.1608481224030133e-07, + "loss": 0.0179, + "step": 21659 + }, + { + "epoch": 0.42, + "learning_rate": 1.1608092889596519e-07, + "loss": 0.0006, + "step": 21660 + }, + { + "epoch": 0.42, + "learning_rate": 1.1607704555162905e-07, + "loss": 0.0006, + "step": 21661 + }, + { + "epoch": 0.42, + "learning_rate": 1.160731622072929e-07, + "loss": 0.5114, + "step": 21662 + }, + { + "epoch": 0.42, + "learning_rate": 1.1606927886295676e-07, + "loss": 0.0007, + "step": 21663 + }, + { + "epoch": 0.42, + "learning_rate": 1.1606539551862062e-07, + "loss": 0.0007, + "step": 21664 + }, + { + "epoch": 0.42, + "learning_rate": 1.1606151217428448e-07, + "loss": 0.0009, + "step": 21665 + }, + { + "epoch": 0.42, + "learning_rate": 1.1605762882994834e-07, + "loss": 0.001, + "step": 21666 + }, + { + "epoch": 0.42, + "learning_rate": 1.160537454856122e-07, + "loss": 0.0005, + "step": 21667 + }, + { + "epoch": 0.42, + "learning_rate": 1.1604986214127606e-07, + "loss": 0.9609, + "step": 21668 + }, + { + "epoch": 0.42, + "learning_rate": 1.1604597879693991e-07, + "loss": 0.0005, + "step": 21669 + }, + { + "epoch": 0.42, + "learning_rate": 1.1604209545260377e-07, + "loss": 0.0014, + "step": 21670 + }, + { + "epoch": 0.42, + "learning_rate": 1.1603821210826763e-07, + "loss": 0.0007, + "step": 21671 + }, + { + "epoch": 0.42, + "learning_rate": 1.1603432876393149e-07, + "loss": 0.005, + "step": 21672 + }, + { + "epoch": 0.42, + "learning_rate": 1.1603044541959535e-07, + "loss": 0.001, + "step": 21673 + }, + { + "epoch": 0.42, + "learning_rate": 1.160265620752592e-07, + "loss": 0.0008, + "step": 21674 + }, + { + "epoch": 0.42, + "learning_rate": 1.1602267873092306e-07, + "loss": 0.0008, + "step": 21675 + }, + { + "epoch": 0.42, + "learning_rate": 1.1601879538658692e-07, + "loss": 0.0006, + "step": 21676 + }, + { + "epoch": 0.42, + "learning_rate": 1.1601491204225078e-07, + "loss": 0.0006, + "step": 21677 + }, + { + "epoch": 0.42, + "learning_rate": 1.1601102869791464e-07, + "loss": 0.0018, + "step": 21678 + }, + { + "epoch": 0.42, + "learning_rate": 1.160071453535785e-07, + "loss": 0.0006, + "step": 21679 + }, + { + "epoch": 0.42, + "learning_rate": 1.1600326200924235e-07, + "loss": 0.0009, + "step": 21680 + }, + { + "epoch": 0.42, + "learning_rate": 1.1599937866490621e-07, + "loss": 0.0028, + "step": 21681 + }, + { + "epoch": 0.42, + "learning_rate": 1.1599549532057007e-07, + "loss": 0.0006, + "step": 21682 + }, + { + "epoch": 0.42, + "learning_rate": 1.1599161197623393e-07, + "loss": 0.0008, + "step": 21683 + }, + { + "epoch": 0.42, + "learning_rate": 1.1598772863189779e-07, + "loss": 0.0448, + "step": 21684 + }, + { + "epoch": 0.42, + "learning_rate": 1.1598384528756165e-07, + "loss": 0.6236, + "step": 21685 + }, + { + "epoch": 0.42, + "learning_rate": 1.159799619432255e-07, + "loss": 0.0008, + "step": 21686 + }, + { + "epoch": 0.42, + "learning_rate": 1.1597607859888936e-07, + "loss": 0.001, + "step": 21687 + }, + { + "epoch": 0.42, + "learning_rate": 1.1597219525455322e-07, + "loss": 0.0006, + "step": 21688 + }, + { + "epoch": 0.42, + "learning_rate": 1.1596831191021708e-07, + "loss": 0.0012, + "step": 21689 + }, + { + "epoch": 0.42, + "learning_rate": 1.1596442856588094e-07, + "loss": 0.0006, + "step": 21690 + }, + { + "epoch": 0.42, + "learning_rate": 1.159605452215448e-07, + "loss": 0.0006, + "step": 21691 + }, + { + "epoch": 0.42, + "learning_rate": 1.1595666187720865e-07, + "loss": 0.0007, + "step": 21692 + }, + { + "epoch": 0.42, + "learning_rate": 1.1595277853287251e-07, + "loss": 0.0007, + "step": 21693 + }, + { + "epoch": 0.42, + "learning_rate": 1.1594889518853637e-07, + "loss": 0.0162, + "step": 21694 + }, + { + "epoch": 0.42, + "learning_rate": 1.1594501184420023e-07, + "loss": 0.0006, + "step": 21695 + }, + { + "epoch": 0.42, + "learning_rate": 1.1594112849986409e-07, + "loss": 0.0007, + "step": 21696 + }, + { + "epoch": 0.42, + "learning_rate": 1.1593724515552794e-07, + "loss": 0.171, + "step": 21697 + }, + { + "epoch": 0.42, + "learning_rate": 1.159333618111918e-07, + "loss": 0.0008, + "step": 21698 + }, + { + "epoch": 0.42, + "learning_rate": 1.1592947846685566e-07, + "loss": 0.0008, + "step": 21699 + }, + { + "epoch": 0.42, + "learning_rate": 1.1592559512251952e-07, + "loss": 0.0005, + "step": 21700 + }, + { + "epoch": 0.42, + "learning_rate": 1.1592171177818338e-07, + "loss": 0.0009, + "step": 21701 + }, + { + "epoch": 0.42, + "learning_rate": 1.1591782843384724e-07, + "loss": 0.0008, + "step": 21702 + }, + { + "epoch": 0.42, + "learning_rate": 1.159139450895111e-07, + "loss": 0.0007, + "step": 21703 + }, + { + "epoch": 0.42, + "learning_rate": 1.1591006174517495e-07, + "loss": 0.001, + "step": 21704 + }, + { + "epoch": 0.42, + "learning_rate": 1.1590617840083881e-07, + "loss": 0.0006, + "step": 21705 + }, + { + "epoch": 0.42, + "learning_rate": 1.1590229505650267e-07, + "loss": 0.0007, + "step": 21706 + }, + { + "epoch": 0.42, + "learning_rate": 1.1589841171216653e-07, + "loss": 0.0006, + "step": 21707 + }, + { + "epoch": 0.42, + "learning_rate": 1.1589452836783039e-07, + "loss": 0.9166, + "step": 21708 + }, + { + "epoch": 0.42, + "learning_rate": 1.1589064502349424e-07, + "loss": 0.0007, + "step": 21709 + }, + { + "epoch": 0.42, + "learning_rate": 1.158867616791581e-07, + "loss": 0.0008, + "step": 21710 + }, + { + "epoch": 0.42, + "learning_rate": 1.1588287833482196e-07, + "loss": 0.0009, + "step": 21711 + }, + { + "epoch": 0.42, + "learning_rate": 1.1587899499048582e-07, + "loss": 0.001, + "step": 21712 + }, + { + "epoch": 0.42, + "learning_rate": 1.1587511164614965e-07, + "loss": 0.0027, + "step": 21713 + }, + { + "epoch": 0.42, + "learning_rate": 1.1587122830181351e-07, + "loss": 0.0109, + "step": 21714 + }, + { + "epoch": 0.42, + "learning_rate": 1.1586734495747737e-07, + "loss": 0.8239, + "step": 21715 + }, + { + "epoch": 0.42, + "learning_rate": 1.1586346161314122e-07, + "loss": 0.0009, + "step": 21716 + }, + { + "epoch": 0.42, + "learning_rate": 1.1585957826880508e-07, + "loss": 0.0007, + "step": 21717 + }, + { + "epoch": 0.42, + "learning_rate": 1.1585569492446894e-07, + "loss": 0.0005, + "step": 21718 + }, + { + "epoch": 0.42, + "learning_rate": 1.158518115801328e-07, + "loss": 0.0007, + "step": 21719 + }, + { + "epoch": 0.42, + "learning_rate": 1.1584792823579666e-07, + "loss": 0.0008, + "step": 21720 + }, + { + "epoch": 0.42, + "learning_rate": 1.1584404489146052e-07, + "loss": 0.0006, + "step": 21721 + }, + { + "epoch": 0.42, + "learning_rate": 1.1584016154712437e-07, + "loss": 0.2466, + "step": 21722 + }, + { + "epoch": 0.42, + "learning_rate": 1.1583627820278823e-07, + "loss": 0.0006, + "step": 21723 + }, + { + "epoch": 0.42, + "learning_rate": 1.1583239485845209e-07, + "loss": 0.3753, + "step": 21724 + }, + { + "epoch": 0.42, + "learning_rate": 1.1582851151411595e-07, + "loss": 0.0008, + "step": 21725 + }, + { + "epoch": 0.42, + "learning_rate": 1.1582462816977981e-07, + "loss": 1.31, + "step": 21726 + }, + { + "epoch": 0.42, + "learning_rate": 1.1582074482544367e-07, + "loss": 0.0005, + "step": 21727 + }, + { + "epoch": 0.42, + "learning_rate": 1.1581686148110752e-07, + "loss": 0.0012, + "step": 21728 + }, + { + "epoch": 0.42, + "learning_rate": 1.1581297813677138e-07, + "loss": 0.0009, + "step": 21729 + }, + { + "epoch": 0.42, + "learning_rate": 1.1580909479243524e-07, + "loss": 0.0007, + "step": 21730 + }, + { + "epoch": 0.42, + "learning_rate": 1.158052114480991e-07, + "loss": 0.0023, + "step": 21731 + }, + { + "epoch": 0.42, + "learning_rate": 1.1580132810376296e-07, + "loss": 0.7678, + "step": 21732 + }, + { + "epoch": 0.42, + "learning_rate": 1.1579744475942681e-07, + "loss": 0.0006, + "step": 21733 + }, + { + "epoch": 0.42, + "learning_rate": 1.1579356141509067e-07, + "loss": 0.0007, + "step": 21734 + }, + { + "epoch": 0.42, + "learning_rate": 1.1578967807075453e-07, + "loss": 0.001, + "step": 21735 + }, + { + "epoch": 0.42, + "learning_rate": 1.1578579472641839e-07, + "loss": 0.5237, + "step": 21736 + }, + { + "epoch": 0.42, + "learning_rate": 1.1578191138208225e-07, + "loss": 0.0007, + "step": 21737 + }, + { + "epoch": 0.42, + "learning_rate": 1.157780280377461e-07, + "loss": 0.0006, + "step": 21738 + }, + { + "epoch": 0.42, + "learning_rate": 1.1577414469340996e-07, + "loss": 0.0009, + "step": 21739 + }, + { + "epoch": 0.42, + "learning_rate": 1.1577026134907382e-07, + "loss": 0.0006, + "step": 21740 + }, + { + "epoch": 0.42, + "learning_rate": 1.1576637800473768e-07, + "loss": 0.0008, + "step": 21741 + }, + { + "epoch": 0.42, + "learning_rate": 1.1576249466040154e-07, + "loss": 0.0007, + "step": 21742 + }, + { + "epoch": 0.42, + "learning_rate": 1.157586113160654e-07, + "loss": 0.2493, + "step": 21743 + }, + { + "epoch": 0.42, + "learning_rate": 1.1575472797172926e-07, + "loss": 0.0006, + "step": 21744 + }, + { + "epoch": 0.42, + "learning_rate": 1.1575084462739311e-07, + "loss": 0.0005, + "step": 21745 + }, + { + "epoch": 0.42, + "learning_rate": 1.1574696128305696e-07, + "loss": 0.0005, + "step": 21746 + }, + { + "epoch": 0.42, + "learning_rate": 1.1574307793872082e-07, + "loss": 0.8943, + "step": 21747 + }, + { + "epoch": 0.42, + "learning_rate": 1.1573919459438468e-07, + "loss": 0.0015, + "step": 21748 + }, + { + "epoch": 0.42, + "learning_rate": 1.1573531125004853e-07, + "loss": 0.0006, + "step": 21749 + }, + { + "epoch": 0.42, + "learning_rate": 1.1573142790571239e-07, + "loss": 0.0014, + "step": 21750 + }, + { + "epoch": 0.42, + "learning_rate": 1.1572754456137625e-07, + "loss": 0.0464, + "step": 21751 + }, + { + "epoch": 0.42, + "learning_rate": 1.1572366121704011e-07, + "loss": 0.003, + "step": 21752 + }, + { + "epoch": 0.42, + "learning_rate": 1.1571977787270397e-07, + "loss": 0.0008, + "step": 21753 + }, + { + "epoch": 0.42, + "learning_rate": 1.1571589452836782e-07, + "loss": 0.0128, + "step": 21754 + }, + { + "epoch": 0.42, + "learning_rate": 1.1571201118403168e-07, + "loss": 0.0008, + "step": 21755 + }, + { + "epoch": 0.42, + "learning_rate": 1.1570812783969554e-07, + "loss": 0.0012, + "step": 21756 + }, + { + "epoch": 0.42, + "learning_rate": 1.157042444953594e-07, + "loss": 0.0008, + "step": 21757 + }, + { + "epoch": 0.42, + "learning_rate": 1.1570036115102326e-07, + "loss": 0.0025, + "step": 21758 + }, + { + "epoch": 0.42, + "learning_rate": 1.1569647780668712e-07, + "loss": 0.0006, + "step": 21759 + }, + { + "epoch": 0.42, + "learning_rate": 1.1569259446235097e-07, + "loss": 0.0005, + "step": 21760 + }, + { + "epoch": 0.42, + "learning_rate": 1.1568871111801483e-07, + "loss": 0.0033, + "step": 21761 + }, + { + "epoch": 0.42, + "learning_rate": 1.1568482777367869e-07, + "loss": 0.0006, + "step": 21762 + }, + { + "epoch": 0.42, + "learning_rate": 1.1568094442934255e-07, + "loss": 0.0005, + "step": 21763 + }, + { + "epoch": 0.42, + "learning_rate": 1.1567706108500641e-07, + "loss": 0.001, + "step": 21764 + }, + { + "epoch": 0.42, + "learning_rate": 1.1567317774067027e-07, + "loss": 0.0005, + "step": 21765 + }, + { + "epoch": 0.42, + "learning_rate": 1.1566929439633412e-07, + "loss": 0.0007, + "step": 21766 + }, + { + "epoch": 0.42, + "learning_rate": 1.1566541105199798e-07, + "loss": 0.0007, + "step": 21767 + }, + { + "epoch": 0.42, + "learning_rate": 1.1566152770766184e-07, + "loss": 0.0007, + "step": 21768 + }, + { + "epoch": 0.42, + "learning_rate": 1.156576443633257e-07, + "loss": 0.3691, + "step": 21769 + }, + { + "epoch": 0.42, + "learning_rate": 1.1565376101898956e-07, + "loss": 0.0014, + "step": 21770 + }, + { + "epoch": 0.42, + "learning_rate": 1.156498776746534e-07, + "loss": 0.0004, + "step": 21771 + }, + { + "epoch": 0.42, + "learning_rate": 1.1564599433031726e-07, + "loss": 0.487, + "step": 21772 + }, + { + "epoch": 0.42, + "learning_rate": 1.1564211098598112e-07, + "loss": 0.0055, + "step": 21773 + }, + { + "epoch": 0.42, + "learning_rate": 1.1563822764164498e-07, + "loss": 0.9848, + "step": 21774 + }, + { + "epoch": 0.42, + "learning_rate": 1.1563434429730882e-07, + "loss": 0.0007, + "step": 21775 + }, + { + "epoch": 0.42, + "learning_rate": 1.1563046095297268e-07, + "loss": 0.0009, + "step": 21776 + }, + { + "epoch": 0.42, + "learning_rate": 1.1562657760863654e-07, + "loss": 0.0008, + "step": 21777 + }, + { + "epoch": 0.42, + "learning_rate": 1.156226942643004e-07, + "loss": 0.0005, + "step": 21778 + }, + { + "epoch": 0.42, + "learning_rate": 1.1561881091996425e-07, + "loss": 0.0007, + "step": 21779 + }, + { + "epoch": 0.42, + "learning_rate": 1.1561492757562811e-07, + "loss": 0.0007, + "step": 21780 + }, + { + "epoch": 0.42, + "learning_rate": 1.1561104423129197e-07, + "loss": 0.0006, + "step": 21781 + }, + { + "epoch": 0.42, + "learning_rate": 1.1560716088695583e-07, + "loss": 0.0008, + "step": 21782 + }, + { + "epoch": 0.42, + "learning_rate": 1.1560327754261969e-07, + "loss": 0.001, + "step": 21783 + }, + { + "epoch": 0.42, + "learning_rate": 1.1559939419828355e-07, + "loss": 0.0052, + "step": 21784 + }, + { + "epoch": 0.42, + "learning_rate": 1.155955108539474e-07, + "loss": 0.0006, + "step": 21785 + }, + { + "epoch": 0.42, + "learning_rate": 1.1559162750961126e-07, + "loss": 0.0008, + "step": 21786 + }, + { + "epoch": 0.42, + "learning_rate": 1.1558774416527512e-07, + "loss": 0.0005, + "step": 21787 + }, + { + "epoch": 0.42, + "learning_rate": 1.1558386082093898e-07, + "loss": 0.071, + "step": 21788 + }, + { + "epoch": 0.42, + "learning_rate": 1.1557997747660284e-07, + "loss": 0.0011, + "step": 21789 + }, + { + "epoch": 0.42, + "learning_rate": 1.155760941322667e-07, + "loss": 0.0005, + "step": 21790 + }, + { + "epoch": 0.42, + "learning_rate": 1.1557221078793055e-07, + "loss": 0.0018, + "step": 21791 + }, + { + "epoch": 0.42, + "learning_rate": 1.1556832744359441e-07, + "loss": 0.0005, + "step": 21792 + }, + { + "epoch": 0.42, + "learning_rate": 1.1556444409925827e-07, + "loss": 0.0007, + "step": 21793 + }, + { + "epoch": 0.42, + "learning_rate": 1.1556056075492213e-07, + "loss": 0.0007, + "step": 21794 + }, + { + "epoch": 0.42, + "learning_rate": 1.1555667741058599e-07, + "loss": 0.0006, + "step": 21795 + }, + { + "epoch": 0.42, + "learning_rate": 1.1555279406624984e-07, + "loss": 0.0019, + "step": 21796 + }, + { + "epoch": 0.42, + "learning_rate": 1.155489107219137e-07, + "loss": 1.1461, + "step": 21797 + }, + { + "epoch": 0.42, + "learning_rate": 1.1554502737757756e-07, + "loss": 0.0006, + "step": 21798 + }, + { + "epoch": 0.42, + "learning_rate": 1.1554114403324142e-07, + "loss": 0.0023, + "step": 21799 + }, + { + "epoch": 0.42, + "learning_rate": 1.1553726068890528e-07, + "loss": 0.3073, + "step": 21800 + }, + { + "epoch": 0.42, + "learning_rate": 1.1553337734456914e-07, + "loss": 0.0008, + "step": 21801 + }, + { + "epoch": 0.42, + "learning_rate": 1.15529494000233e-07, + "loss": 0.0006, + "step": 21802 + }, + { + "epoch": 0.42, + "learning_rate": 1.1552561065589685e-07, + "loss": 0.0025, + "step": 21803 + }, + { + "epoch": 0.42, + "learning_rate": 1.1552172731156071e-07, + "loss": 0.0007, + "step": 21804 + }, + { + "epoch": 0.42, + "learning_rate": 1.1551784396722457e-07, + "loss": 0.0015, + "step": 21805 + }, + { + "epoch": 0.42, + "learning_rate": 1.1551396062288843e-07, + "loss": 0.0572, + "step": 21806 + }, + { + "epoch": 0.42, + "learning_rate": 1.1551007727855229e-07, + "loss": 0.0007, + "step": 21807 + }, + { + "epoch": 0.42, + "learning_rate": 1.1550619393421614e-07, + "loss": 0.0008, + "step": 21808 + }, + { + "epoch": 0.42, + "learning_rate": 1.1550231058988e-07, + "loss": 0.0008, + "step": 21809 + }, + { + "epoch": 0.42, + "learning_rate": 1.1549842724554386e-07, + "loss": 0.0008, + "step": 21810 + }, + { + "epoch": 0.42, + "learning_rate": 1.1549454390120772e-07, + "loss": 0.1202, + "step": 21811 + }, + { + "epoch": 0.42, + "learning_rate": 1.1549066055687158e-07, + "loss": 0.0008, + "step": 21812 + }, + { + "epoch": 0.42, + "learning_rate": 1.1548677721253543e-07, + "loss": 0.0009, + "step": 21813 + }, + { + "epoch": 0.42, + "learning_rate": 1.1548289386819929e-07, + "loss": 0.0006, + "step": 21814 + }, + { + "epoch": 0.42, + "learning_rate": 1.1547901052386315e-07, + "loss": 0.0009, + "step": 21815 + }, + { + "epoch": 0.42, + "learning_rate": 1.1547512717952701e-07, + "loss": 0.0347, + "step": 21816 + }, + { + "epoch": 0.42, + "learning_rate": 1.1547124383519087e-07, + "loss": 0.0019, + "step": 21817 + }, + { + "epoch": 0.42, + "learning_rate": 1.1546736049085473e-07, + "loss": 0.0131, + "step": 21818 + }, + { + "epoch": 0.42, + "learning_rate": 1.1546347714651858e-07, + "loss": 0.0008, + "step": 21819 + }, + { + "epoch": 0.42, + "learning_rate": 1.1545959380218244e-07, + "loss": 0.0034, + "step": 21820 + }, + { + "epoch": 0.42, + "learning_rate": 1.154557104578463e-07, + "loss": 0.0056, + "step": 21821 + }, + { + "epoch": 0.42, + "learning_rate": 1.1545182711351016e-07, + "loss": 0.4255, + "step": 21822 + }, + { + "epoch": 0.42, + "learning_rate": 1.1544794376917402e-07, + "loss": 0.0982, + "step": 21823 + }, + { + "epoch": 0.42, + "learning_rate": 1.1544406042483788e-07, + "loss": 0.0008, + "step": 21824 + }, + { + "epoch": 0.42, + "learning_rate": 1.1544017708050173e-07, + "loss": 0.0015, + "step": 21825 + }, + { + "epoch": 0.42, + "learning_rate": 1.1543629373616559e-07, + "loss": 0.0006, + "step": 21826 + }, + { + "epoch": 0.42, + "learning_rate": 1.1543241039182945e-07, + "loss": 0.5519, + "step": 21827 + }, + { + "epoch": 0.42, + "learning_rate": 1.1542852704749331e-07, + "loss": 0.0007, + "step": 21828 + }, + { + "epoch": 0.42, + "learning_rate": 1.1542464370315714e-07, + "loss": 0.0007, + "step": 21829 + }, + { + "epoch": 0.42, + "learning_rate": 1.15420760358821e-07, + "loss": 0.0006, + "step": 21830 + }, + { + "epoch": 0.42, + "learning_rate": 1.1541687701448486e-07, + "loss": 0.0011, + "step": 21831 + }, + { + "epoch": 0.42, + "learning_rate": 1.1541299367014871e-07, + "loss": 0.0005, + "step": 21832 + }, + { + "epoch": 0.42, + "learning_rate": 1.1540911032581257e-07, + "loss": 0.0009, + "step": 21833 + }, + { + "epoch": 0.42, + "learning_rate": 1.1540522698147643e-07, + "loss": 0.0005, + "step": 21834 + }, + { + "epoch": 0.42, + "learning_rate": 1.1540134363714029e-07, + "loss": 0.0006, + "step": 21835 + }, + { + "epoch": 0.42, + "learning_rate": 1.1539746029280415e-07, + "loss": 0.0012, + "step": 21836 + }, + { + "epoch": 0.42, + "learning_rate": 1.15393576948468e-07, + "loss": 0.0007, + "step": 21837 + }, + { + "epoch": 0.42, + "learning_rate": 1.1538969360413186e-07, + "loss": 0.0012, + "step": 21838 + }, + { + "epoch": 0.42, + "learning_rate": 1.1538581025979572e-07, + "loss": 0.0007, + "step": 21839 + }, + { + "epoch": 0.42, + "learning_rate": 1.1538192691545958e-07, + "loss": 1.2111, + "step": 21840 + }, + { + "epoch": 0.42, + "learning_rate": 1.1537804357112344e-07, + "loss": 0.0006, + "step": 21841 + }, + { + "epoch": 0.42, + "learning_rate": 1.153741602267873e-07, + "loss": 0.2579, + "step": 21842 + }, + { + "epoch": 0.42, + "learning_rate": 1.1537027688245116e-07, + "loss": 0.001, + "step": 21843 + }, + { + "epoch": 0.42, + "learning_rate": 1.1536639353811501e-07, + "loss": 0.0007, + "step": 21844 + }, + { + "epoch": 0.42, + "learning_rate": 1.1536251019377887e-07, + "loss": 0.0008, + "step": 21845 + }, + { + "epoch": 0.42, + "learning_rate": 1.1535862684944273e-07, + "loss": 0.0006, + "step": 21846 + }, + { + "epoch": 0.42, + "learning_rate": 1.1535474350510659e-07, + "loss": 0.0006, + "step": 21847 + }, + { + "epoch": 0.42, + "learning_rate": 1.1535086016077045e-07, + "loss": 0.0017, + "step": 21848 + }, + { + "epoch": 0.42, + "learning_rate": 1.153469768164343e-07, + "loss": 0.0006, + "step": 21849 + }, + { + "epoch": 0.42, + "learning_rate": 1.1534309347209816e-07, + "loss": 0.001, + "step": 21850 + }, + { + "epoch": 0.42, + "learning_rate": 1.1533921012776202e-07, + "loss": 0.0007, + "step": 21851 + }, + { + "epoch": 0.42, + "learning_rate": 1.1533532678342588e-07, + "loss": 0.0507, + "step": 21852 + }, + { + "epoch": 0.42, + "learning_rate": 1.1533144343908974e-07, + "loss": 0.0008, + "step": 21853 + }, + { + "epoch": 0.42, + "learning_rate": 1.153275600947536e-07, + "loss": 0.0007, + "step": 21854 + }, + { + "epoch": 0.42, + "learning_rate": 1.1532367675041745e-07, + "loss": 0.0007, + "step": 21855 + }, + { + "epoch": 0.42, + "learning_rate": 1.1531979340608131e-07, + "loss": 0.0006, + "step": 21856 + }, + { + "epoch": 0.42, + "learning_rate": 1.1531591006174517e-07, + "loss": 0.0009, + "step": 21857 + }, + { + "epoch": 0.42, + "learning_rate": 1.1531202671740903e-07, + "loss": 0.0012, + "step": 21858 + }, + { + "epoch": 0.42, + "learning_rate": 1.1530814337307289e-07, + "loss": 0.0012, + "step": 21859 + }, + { + "epoch": 0.42, + "learning_rate": 1.1530426002873675e-07, + "loss": 0.0009, + "step": 21860 + }, + { + "epoch": 0.42, + "learning_rate": 1.153003766844006e-07, + "loss": 0.0006, + "step": 21861 + }, + { + "epoch": 0.42, + "learning_rate": 1.1529649334006446e-07, + "loss": 0.0006, + "step": 21862 + }, + { + "epoch": 0.42, + "learning_rate": 1.1529260999572832e-07, + "loss": 0.0007, + "step": 21863 + }, + { + "epoch": 0.42, + "learning_rate": 1.1528872665139218e-07, + "loss": 0.0011, + "step": 21864 + }, + { + "epoch": 0.42, + "learning_rate": 1.1528484330705604e-07, + "loss": 0.001, + "step": 21865 + }, + { + "epoch": 0.42, + "learning_rate": 1.152809599627199e-07, + "loss": 0.0005, + "step": 21866 + }, + { + "epoch": 0.42, + "learning_rate": 1.1527707661838375e-07, + "loss": 0.0007, + "step": 21867 + }, + { + "epoch": 0.42, + "learning_rate": 1.1527319327404761e-07, + "loss": 0.0008, + "step": 21868 + }, + { + "epoch": 0.42, + "learning_rate": 1.1526930992971147e-07, + "loss": 0.0008, + "step": 21869 + }, + { + "epoch": 0.42, + "learning_rate": 1.1526542658537533e-07, + "loss": 0.2057, + "step": 21870 + }, + { + "epoch": 0.42, + "learning_rate": 1.1526154324103919e-07, + "loss": 0.0009, + "step": 21871 + }, + { + "epoch": 0.42, + "learning_rate": 1.1525765989670304e-07, + "loss": 0.0005, + "step": 21872 + }, + { + "epoch": 0.42, + "learning_rate": 1.152537765523669e-07, + "loss": 0.0006, + "step": 21873 + }, + { + "epoch": 0.42, + "learning_rate": 1.1524989320803076e-07, + "loss": 0.0009, + "step": 21874 + }, + { + "epoch": 0.42, + "learning_rate": 1.1524600986369462e-07, + "loss": 0.0119, + "step": 21875 + }, + { + "epoch": 0.42, + "learning_rate": 1.1524212651935848e-07, + "loss": 0.0008, + "step": 21876 + }, + { + "epoch": 0.42, + "learning_rate": 1.1523824317502234e-07, + "loss": 0.0005, + "step": 21877 + }, + { + "epoch": 0.42, + "learning_rate": 1.152343598306862e-07, + "loss": 0.0008, + "step": 21878 + }, + { + "epoch": 0.42, + "learning_rate": 1.1523047648635005e-07, + "loss": 0.7321, + "step": 21879 + }, + { + "epoch": 0.42, + "learning_rate": 1.1522659314201391e-07, + "loss": 0.0026, + "step": 21880 + }, + { + "epoch": 0.42, + "learning_rate": 1.1522270979767777e-07, + "loss": 0.001, + "step": 21881 + }, + { + "epoch": 0.42, + "learning_rate": 1.1521882645334163e-07, + "loss": 0.0652, + "step": 21882 + }, + { + "epoch": 0.42, + "learning_rate": 1.1521494310900549e-07, + "loss": 0.0009, + "step": 21883 + }, + { + "epoch": 0.42, + "learning_rate": 1.1521105976466934e-07, + "loss": 0.0008, + "step": 21884 + }, + { + "epoch": 0.42, + "learning_rate": 1.152071764203332e-07, + "loss": 0.064, + "step": 21885 + }, + { + "epoch": 0.42, + "learning_rate": 1.1520329307599706e-07, + "loss": 0.0019, + "step": 21886 + }, + { + "epoch": 0.42, + "learning_rate": 1.1519940973166089e-07, + "loss": 0.0008, + "step": 21887 + }, + { + "epoch": 0.42, + "learning_rate": 1.1519552638732475e-07, + "loss": 0.0005, + "step": 21888 + }, + { + "epoch": 0.42, + "learning_rate": 1.1519164304298861e-07, + "loss": 0.0009, + "step": 21889 + }, + { + "epoch": 0.42, + "learning_rate": 1.1518775969865247e-07, + "loss": 0.0006, + "step": 21890 + }, + { + "epoch": 0.42, + "learning_rate": 1.1518387635431632e-07, + "loss": 0.001, + "step": 21891 + }, + { + "epoch": 0.42, + "learning_rate": 1.1517999300998018e-07, + "loss": 0.0006, + "step": 21892 + }, + { + "epoch": 0.42, + "learning_rate": 1.1517610966564404e-07, + "loss": 0.0006, + "step": 21893 + }, + { + "epoch": 0.42, + "learning_rate": 1.151722263213079e-07, + "loss": 0.5201, + "step": 21894 + }, + { + "epoch": 0.42, + "learning_rate": 1.1516834297697176e-07, + "loss": 0.0008, + "step": 21895 + }, + { + "epoch": 0.42, + "learning_rate": 1.1516445963263562e-07, + "loss": 0.1952, + "step": 21896 + }, + { + "epoch": 0.42, + "learning_rate": 1.1516057628829947e-07, + "loss": 0.0012, + "step": 21897 + }, + { + "epoch": 0.42, + "learning_rate": 1.1515669294396333e-07, + "loss": 0.0008, + "step": 21898 + }, + { + "epoch": 0.42, + "learning_rate": 1.1515280959962719e-07, + "loss": 0.0007, + "step": 21899 + }, + { + "epoch": 0.42, + "learning_rate": 1.1514892625529105e-07, + "loss": 0.0005, + "step": 21900 + }, + { + "epoch": 0.42, + "learning_rate": 1.1514504291095491e-07, + "loss": 0.029, + "step": 21901 + }, + { + "epoch": 0.42, + "learning_rate": 1.1514115956661877e-07, + "loss": 0.0016, + "step": 21902 + }, + { + "epoch": 0.42, + "learning_rate": 1.1513727622228262e-07, + "loss": 0.9508, + "step": 21903 + }, + { + "epoch": 0.42, + "learning_rate": 1.1513339287794648e-07, + "loss": 0.0006, + "step": 21904 + }, + { + "epoch": 0.42, + "learning_rate": 1.1512950953361034e-07, + "loss": 0.001, + "step": 21905 + }, + { + "epoch": 0.42, + "learning_rate": 1.151256261892742e-07, + "loss": 0.0007, + "step": 21906 + }, + { + "epoch": 0.42, + "learning_rate": 1.1512174284493806e-07, + "loss": 0.0005, + "step": 21907 + }, + { + "epoch": 0.42, + "learning_rate": 1.1511785950060191e-07, + "loss": 0.9654, + "step": 21908 + }, + { + "epoch": 0.42, + "learning_rate": 1.1511397615626577e-07, + "loss": 0.0006, + "step": 21909 + }, + { + "epoch": 0.43, + "learning_rate": 1.1511009281192963e-07, + "loss": 0.0009, + "step": 21910 + }, + { + "epoch": 0.43, + "learning_rate": 1.1510620946759349e-07, + "loss": 0.0009, + "step": 21911 + }, + { + "epoch": 0.43, + "learning_rate": 1.1510232612325735e-07, + "loss": 0.5477, + "step": 21912 + }, + { + "epoch": 0.43, + "learning_rate": 1.150984427789212e-07, + "loss": 0.0014, + "step": 21913 + }, + { + "epoch": 0.43, + "learning_rate": 1.1509455943458506e-07, + "loss": 0.0005, + "step": 21914 + }, + { + "epoch": 0.43, + "learning_rate": 1.1509067609024892e-07, + "loss": 0.0013, + "step": 21915 + }, + { + "epoch": 0.43, + "learning_rate": 1.1508679274591278e-07, + "loss": 0.0008, + "step": 21916 + }, + { + "epoch": 0.43, + "learning_rate": 1.1508290940157664e-07, + "loss": 0.0006, + "step": 21917 + }, + { + "epoch": 0.43, + "learning_rate": 1.150790260572405e-07, + "loss": 0.0008, + "step": 21918 + }, + { + "epoch": 0.43, + "learning_rate": 1.1507514271290436e-07, + "loss": 0.0011, + "step": 21919 + }, + { + "epoch": 0.43, + "learning_rate": 1.1507125936856821e-07, + "loss": 0.0006, + "step": 21920 + }, + { + "epoch": 0.43, + "learning_rate": 1.1506737602423207e-07, + "loss": 0.001, + "step": 21921 + }, + { + "epoch": 0.43, + "learning_rate": 1.1506349267989593e-07, + "loss": 0.0005, + "step": 21922 + }, + { + "epoch": 0.43, + "learning_rate": 1.1505960933555978e-07, + "loss": 0.0005, + "step": 21923 + }, + { + "epoch": 0.43, + "learning_rate": 1.1505572599122363e-07, + "loss": 0.0011, + "step": 21924 + }, + { + "epoch": 0.43, + "learning_rate": 1.1505184264688749e-07, + "loss": 0.0008, + "step": 21925 + }, + { + "epoch": 0.43, + "learning_rate": 1.1504795930255135e-07, + "loss": 0.0006, + "step": 21926 + }, + { + "epoch": 0.43, + "learning_rate": 1.1504407595821521e-07, + "loss": 0.0008, + "step": 21927 + }, + { + "epoch": 0.43, + "learning_rate": 1.1504019261387907e-07, + "loss": 0.0006, + "step": 21928 + }, + { + "epoch": 0.43, + "learning_rate": 1.1503630926954292e-07, + "loss": 0.0009, + "step": 21929 + }, + { + "epoch": 0.43, + "learning_rate": 1.1503242592520678e-07, + "loss": 0.0035, + "step": 21930 + }, + { + "epoch": 0.43, + "learning_rate": 1.1502854258087064e-07, + "loss": 0.0007, + "step": 21931 + }, + { + "epoch": 0.43, + "learning_rate": 1.150246592365345e-07, + "loss": 0.7342, + "step": 21932 + }, + { + "epoch": 0.43, + "learning_rate": 1.1502077589219836e-07, + "loss": 0.0007, + "step": 21933 + }, + { + "epoch": 0.43, + "learning_rate": 1.1501689254786222e-07, + "loss": 0.0006, + "step": 21934 + }, + { + "epoch": 0.43, + "learning_rate": 1.1501300920352607e-07, + "loss": 0.0009, + "step": 21935 + }, + { + "epoch": 0.43, + "learning_rate": 1.1500912585918993e-07, + "loss": 1.0332, + "step": 21936 + }, + { + "epoch": 0.43, + "learning_rate": 1.1500524251485379e-07, + "loss": 0.0006, + "step": 21937 + }, + { + "epoch": 0.43, + "learning_rate": 1.1500135917051765e-07, + "loss": 0.0008, + "step": 21938 + }, + { + "epoch": 0.43, + "learning_rate": 1.1499747582618151e-07, + "loss": 0.0007, + "step": 21939 + }, + { + "epoch": 0.43, + "learning_rate": 1.1499359248184537e-07, + "loss": 0.0006, + "step": 21940 + }, + { + "epoch": 0.43, + "learning_rate": 1.1498970913750922e-07, + "loss": 0.0005, + "step": 21941 + }, + { + "epoch": 0.43, + "learning_rate": 1.1498582579317308e-07, + "loss": 0.0008, + "step": 21942 + }, + { + "epoch": 0.43, + "learning_rate": 1.1498194244883694e-07, + "loss": 0.0006, + "step": 21943 + }, + { + "epoch": 0.43, + "learning_rate": 1.149780591045008e-07, + "loss": 0.0006, + "step": 21944 + }, + { + "epoch": 0.43, + "learning_rate": 1.1497417576016464e-07, + "loss": 0.0005, + "step": 21945 + }, + { + "epoch": 0.43, + "learning_rate": 1.149702924158285e-07, + "loss": 0.0009, + "step": 21946 + }, + { + "epoch": 0.43, + "learning_rate": 1.1496640907149236e-07, + "loss": 0.0008, + "step": 21947 + }, + { + "epoch": 0.43, + "learning_rate": 1.1496252572715622e-07, + "loss": 1.0143, + "step": 21948 + }, + { + "epoch": 0.43, + "learning_rate": 1.1495864238282008e-07, + "loss": 0.0006, + "step": 21949 + }, + { + "epoch": 0.43, + "learning_rate": 1.1495475903848393e-07, + "loss": 0.0007, + "step": 21950 + }, + { + "epoch": 0.43, + "learning_rate": 1.1495087569414779e-07, + "loss": 0.0006, + "step": 21951 + }, + { + "epoch": 0.43, + "learning_rate": 1.1494699234981164e-07, + "loss": 0.0007, + "step": 21952 + }, + { + "epoch": 0.43, + "learning_rate": 1.149431090054755e-07, + "loss": 1.0571, + "step": 21953 + }, + { + "epoch": 0.43, + "learning_rate": 1.1493922566113935e-07, + "loss": 0.0006, + "step": 21954 + }, + { + "epoch": 0.43, + "learning_rate": 1.1493534231680321e-07, + "loss": 0.0007, + "step": 21955 + }, + { + "epoch": 0.43, + "learning_rate": 1.1493145897246707e-07, + "loss": 0.0005, + "step": 21956 + }, + { + "epoch": 0.43, + "learning_rate": 1.1492757562813093e-07, + "loss": 0.0006, + "step": 21957 + }, + { + "epoch": 0.43, + "learning_rate": 1.1492369228379479e-07, + "loss": 0.0008, + "step": 21958 + }, + { + "epoch": 0.43, + "learning_rate": 1.1491980893945865e-07, + "loss": 0.0007, + "step": 21959 + }, + { + "epoch": 0.43, + "learning_rate": 1.149159255951225e-07, + "loss": 0.0006, + "step": 21960 + }, + { + "epoch": 0.43, + "learning_rate": 1.1491204225078636e-07, + "loss": 0.0012, + "step": 21961 + }, + { + "epoch": 0.43, + "learning_rate": 1.1490815890645022e-07, + "loss": 0.0011, + "step": 21962 + }, + { + "epoch": 0.43, + "learning_rate": 1.1490427556211408e-07, + "loss": 1.0357, + "step": 21963 + }, + { + "epoch": 0.43, + "learning_rate": 1.1490039221777794e-07, + "loss": 0.0006, + "step": 21964 + }, + { + "epoch": 0.43, + "learning_rate": 1.148965088734418e-07, + "loss": 0.0006, + "step": 21965 + }, + { + "epoch": 0.43, + "learning_rate": 1.1489262552910565e-07, + "loss": 0.0005, + "step": 21966 + }, + { + "epoch": 0.43, + "learning_rate": 1.1488874218476951e-07, + "loss": 0.0042, + "step": 21967 + }, + { + "epoch": 0.43, + "learning_rate": 1.1488485884043337e-07, + "loss": 0.0005, + "step": 21968 + }, + { + "epoch": 0.43, + "learning_rate": 1.1488097549609723e-07, + "loss": 0.0008, + "step": 21969 + }, + { + "epoch": 0.43, + "learning_rate": 1.1487709215176109e-07, + "loss": 0.004, + "step": 21970 + }, + { + "epoch": 0.43, + "learning_rate": 1.1487320880742494e-07, + "loss": 0.0019, + "step": 21971 + }, + { + "epoch": 0.43, + "learning_rate": 1.148693254630888e-07, + "loss": 0.0011, + "step": 21972 + }, + { + "epoch": 0.43, + "learning_rate": 1.1486544211875266e-07, + "loss": 0.0005, + "step": 21973 + }, + { + "epoch": 0.43, + "learning_rate": 1.1486155877441652e-07, + "loss": 0.1053, + "step": 21974 + }, + { + "epoch": 0.43, + "learning_rate": 1.1485767543008038e-07, + "loss": 0.0007, + "step": 21975 + }, + { + "epoch": 0.43, + "learning_rate": 1.1485379208574424e-07, + "loss": 0.0007, + "step": 21976 + }, + { + "epoch": 0.43, + "learning_rate": 1.148499087414081e-07, + "loss": 0.0006, + "step": 21977 + }, + { + "epoch": 0.43, + "learning_rate": 1.1484602539707195e-07, + "loss": 0.9677, + "step": 21978 + }, + { + "epoch": 0.43, + "learning_rate": 1.1484214205273581e-07, + "loss": 0.0007, + "step": 21979 + }, + { + "epoch": 0.43, + "learning_rate": 1.1483825870839967e-07, + "loss": 0.0004, + "step": 21980 + }, + { + "epoch": 0.43, + "learning_rate": 1.1483437536406353e-07, + "loss": 0.0007, + "step": 21981 + }, + { + "epoch": 0.43, + "learning_rate": 1.1483049201972739e-07, + "loss": 0.0009, + "step": 21982 + }, + { + "epoch": 0.43, + "learning_rate": 1.1482660867539124e-07, + "loss": 0.0008, + "step": 21983 + }, + { + "epoch": 0.43, + "learning_rate": 1.148227253310551e-07, + "loss": 0.0005, + "step": 21984 + }, + { + "epoch": 0.43, + "learning_rate": 1.1481884198671896e-07, + "loss": 0.0008, + "step": 21985 + }, + { + "epoch": 0.43, + "learning_rate": 1.1481495864238282e-07, + "loss": 0.0005, + "step": 21986 + }, + { + "epoch": 0.43, + "learning_rate": 1.1481107529804668e-07, + "loss": 0.0007, + "step": 21987 + }, + { + "epoch": 0.43, + "learning_rate": 1.1480719195371053e-07, + "loss": 0.0006, + "step": 21988 + }, + { + "epoch": 0.43, + "learning_rate": 1.1480330860937439e-07, + "loss": 0.0009, + "step": 21989 + }, + { + "epoch": 0.43, + "learning_rate": 1.1479942526503825e-07, + "loss": 0.2495, + "step": 21990 + }, + { + "epoch": 0.43, + "learning_rate": 1.1479554192070211e-07, + "loss": 0.0006, + "step": 21991 + }, + { + "epoch": 0.43, + "learning_rate": 1.1479165857636597e-07, + "loss": 0.0006, + "step": 21992 + }, + { + "epoch": 0.43, + "learning_rate": 1.1478777523202983e-07, + "loss": 1.2114, + "step": 21993 + }, + { + "epoch": 0.43, + "learning_rate": 1.1478389188769368e-07, + "loss": 0.0006, + "step": 21994 + }, + { + "epoch": 0.43, + "learning_rate": 1.1478000854335754e-07, + "loss": 0.0006, + "step": 21995 + }, + { + "epoch": 0.43, + "learning_rate": 1.147761251990214e-07, + "loss": 0.1527, + "step": 21996 + }, + { + "epoch": 0.43, + "learning_rate": 1.1477224185468526e-07, + "loss": 0.001, + "step": 21997 + }, + { + "epoch": 0.43, + "learning_rate": 1.1476835851034912e-07, + "loss": 0.0006, + "step": 21998 + }, + { + "epoch": 0.43, + "learning_rate": 1.1476447516601298e-07, + "loss": 0.7668, + "step": 21999 + }, + { + "epoch": 0.43, + "learning_rate": 1.1476059182167683e-07, + "loss": 0.0011, + "step": 22000 + }, + { + "epoch": 0.43, + "learning_rate": 1.1475670847734069e-07, + "loss": 0.0006, + "step": 22001 + }, + { + "epoch": 0.43, + "learning_rate": 1.1475282513300455e-07, + "loss": 0.0009, + "step": 22002 + }, + { + "epoch": 0.43, + "learning_rate": 1.1474894178866838e-07, + "loss": 1.5324, + "step": 22003 + }, + { + "epoch": 0.43, + "learning_rate": 1.1474505844433224e-07, + "loss": 0.0008, + "step": 22004 + }, + { + "epoch": 0.43, + "learning_rate": 1.147411750999961e-07, + "loss": 0.0031, + "step": 22005 + }, + { + "epoch": 0.43, + "learning_rate": 1.1473729175565996e-07, + "loss": 0.0009, + "step": 22006 + }, + { + "epoch": 0.43, + "learning_rate": 1.1473340841132381e-07, + "loss": 0.0006, + "step": 22007 + }, + { + "epoch": 0.43, + "learning_rate": 1.1472952506698767e-07, + "loss": 0.0008, + "step": 22008 + }, + { + "epoch": 0.43, + "learning_rate": 1.1472564172265153e-07, + "loss": 0.0005, + "step": 22009 + }, + { + "epoch": 0.43, + "learning_rate": 1.1472175837831539e-07, + "loss": 0.0006, + "step": 22010 + }, + { + "epoch": 0.43, + "learning_rate": 1.1471787503397925e-07, + "loss": 0.0008, + "step": 22011 + }, + { + "epoch": 0.43, + "learning_rate": 1.147139916896431e-07, + "loss": 0.0006, + "step": 22012 + }, + { + "epoch": 0.43, + "learning_rate": 1.1471010834530696e-07, + "loss": 0.2086, + "step": 22013 + }, + { + "epoch": 0.43, + "learning_rate": 1.1470622500097082e-07, + "loss": 0.108, + "step": 22014 + }, + { + "epoch": 0.43, + "learning_rate": 1.1470234165663468e-07, + "loss": 0.0005, + "step": 22015 + }, + { + "epoch": 0.43, + "learning_rate": 1.1469845831229854e-07, + "loss": 0.0097, + "step": 22016 + }, + { + "epoch": 0.43, + "learning_rate": 1.146945749679624e-07, + "loss": 0.0008, + "step": 22017 + }, + { + "epoch": 0.43, + "learning_rate": 1.1469069162362626e-07, + "loss": 0.0005, + "step": 22018 + }, + { + "epoch": 0.43, + "learning_rate": 1.1468680827929011e-07, + "loss": 0.0007, + "step": 22019 + }, + { + "epoch": 0.43, + "learning_rate": 1.1468292493495397e-07, + "loss": 0.0007, + "step": 22020 + }, + { + "epoch": 0.43, + "learning_rate": 1.1467904159061783e-07, + "loss": 0.6285, + "step": 22021 + }, + { + "epoch": 0.43, + "learning_rate": 1.1467515824628169e-07, + "loss": 0.001, + "step": 22022 + }, + { + "epoch": 0.43, + "learning_rate": 1.1467127490194555e-07, + "loss": 0.0008, + "step": 22023 + }, + { + "epoch": 0.43, + "learning_rate": 1.146673915576094e-07, + "loss": 0.0027, + "step": 22024 + }, + { + "epoch": 0.43, + "learning_rate": 1.1466350821327326e-07, + "loss": 0.0011, + "step": 22025 + }, + { + "epoch": 0.43, + "learning_rate": 1.1465962486893712e-07, + "loss": 0.0008, + "step": 22026 + }, + { + "epoch": 0.43, + "learning_rate": 1.1465574152460098e-07, + "loss": 0.0006, + "step": 22027 + }, + { + "epoch": 0.43, + "learning_rate": 1.1465185818026484e-07, + "loss": 0.0005, + "step": 22028 + }, + { + "epoch": 0.43, + "learning_rate": 1.146479748359287e-07, + "loss": 0.0006, + "step": 22029 + }, + { + "epoch": 0.43, + "learning_rate": 1.1464409149159255e-07, + "loss": 0.0008, + "step": 22030 + }, + { + "epoch": 0.43, + "learning_rate": 1.1464020814725641e-07, + "loss": 0.0012, + "step": 22031 + }, + { + "epoch": 0.43, + "learning_rate": 1.1463632480292027e-07, + "loss": 0.0006, + "step": 22032 + }, + { + "epoch": 0.43, + "learning_rate": 1.1463244145858413e-07, + "loss": 0.0007, + "step": 22033 + }, + { + "epoch": 0.43, + "learning_rate": 1.1462855811424799e-07, + "loss": 0.0007, + "step": 22034 + }, + { + "epoch": 0.43, + "learning_rate": 1.1462467476991185e-07, + "loss": 0.0036, + "step": 22035 + }, + { + "epoch": 0.43, + "learning_rate": 1.146207914255757e-07, + "loss": 0.0022, + "step": 22036 + }, + { + "epoch": 0.43, + "learning_rate": 1.1461690808123956e-07, + "loss": 0.0006, + "step": 22037 + }, + { + "epoch": 0.43, + "learning_rate": 1.1461302473690342e-07, + "loss": 0.0005, + "step": 22038 + }, + { + "epoch": 0.43, + "learning_rate": 1.1460914139256728e-07, + "loss": 0.0006, + "step": 22039 + }, + { + "epoch": 0.43, + "learning_rate": 1.1460525804823114e-07, + "loss": 0.0007, + "step": 22040 + }, + { + "epoch": 0.43, + "learning_rate": 1.14601374703895e-07, + "loss": 0.0021, + "step": 22041 + }, + { + "epoch": 0.43, + "learning_rate": 1.1459749135955885e-07, + "loss": 0.4049, + "step": 22042 + }, + { + "epoch": 0.43, + "learning_rate": 1.1459360801522271e-07, + "loss": 0.0006, + "step": 22043 + }, + { + "epoch": 0.43, + "learning_rate": 1.1458972467088657e-07, + "loss": 0.0031, + "step": 22044 + }, + { + "epoch": 0.43, + "learning_rate": 1.1458584132655043e-07, + "loss": 0.0005, + "step": 22045 + }, + { + "epoch": 0.43, + "learning_rate": 1.1458195798221429e-07, + "loss": 0.0007, + "step": 22046 + }, + { + "epoch": 0.43, + "learning_rate": 1.1457807463787814e-07, + "loss": 0.0006, + "step": 22047 + }, + { + "epoch": 0.43, + "learning_rate": 1.14574191293542e-07, + "loss": 0.0006, + "step": 22048 + }, + { + "epoch": 0.43, + "learning_rate": 1.1457030794920586e-07, + "loss": 0.0009, + "step": 22049 + }, + { + "epoch": 0.43, + "learning_rate": 1.1456642460486972e-07, + "loss": 0.0009, + "step": 22050 + }, + { + "epoch": 0.43, + "learning_rate": 1.1456254126053358e-07, + "loss": 0.0011, + "step": 22051 + }, + { + "epoch": 0.43, + "learning_rate": 1.1455865791619744e-07, + "loss": 0.0016, + "step": 22052 + }, + { + "epoch": 0.43, + "learning_rate": 1.145547745718613e-07, + "loss": 0.0009, + "step": 22053 + }, + { + "epoch": 0.43, + "learning_rate": 1.1455089122752515e-07, + "loss": 0.0006, + "step": 22054 + }, + { + "epoch": 0.43, + "learning_rate": 1.1454700788318901e-07, + "loss": 0.0006, + "step": 22055 + }, + { + "epoch": 0.43, + "learning_rate": 1.1454312453885287e-07, + "loss": 0.0006, + "step": 22056 + }, + { + "epoch": 0.43, + "learning_rate": 1.1453924119451673e-07, + "loss": 1.1281, + "step": 22057 + }, + { + "epoch": 0.43, + "learning_rate": 1.1453535785018059e-07, + "loss": 0.0007, + "step": 22058 + }, + { + "epoch": 0.43, + "learning_rate": 1.1453147450584444e-07, + "loss": 0.0008, + "step": 22059 + }, + { + "epoch": 0.43, + "learning_rate": 1.145275911615083e-07, + "loss": 0.6904, + "step": 22060 + }, + { + "epoch": 0.43, + "learning_rate": 1.1452370781717213e-07, + "loss": 0.0008, + "step": 22061 + }, + { + "epoch": 0.43, + "learning_rate": 1.1451982447283599e-07, + "loss": 0.6582, + "step": 22062 + }, + { + "epoch": 0.43, + "learning_rate": 1.1451594112849985e-07, + "loss": 0.0006, + "step": 22063 + }, + { + "epoch": 0.43, + "learning_rate": 1.1451205778416371e-07, + "loss": 0.0043, + "step": 22064 + }, + { + "epoch": 0.43, + "learning_rate": 1.1450817443982757e-07, + "loss": 0.0008, + "step": 22065 + }, + { + "epoch": 0.43, + "learning_rate": 1.1450429109549142e-07, + "loss": 0.0006, + "step": 22066 + }, + { + "epoch": 0.43, + "learning_rate": 1.1450040775115528e-07, + "loss": 0.0006, + "step": 22067 + }, + { + "epoch": 0.43, + "learning_rate": 1.1449652440681914e-07, + "loss": 0.0007, + "step": 22068 + }, + { + "epoch": 0.43, + "learning_rate": 1.14492641062483e-07, + "loss": 0.0006, + "step": 22069 + }, + { + "epoch": 0.43, + "learning_rate": 1.1448875771814686e-07, + "loss": 0.001, + "step": 22070 + }, + { + "epoch": 0.43, + "learning_rate": 1.1448487437381072e-07, + "loss": 0.0008, + "step": 22071 + }, + { + "epoch": 0.43, + "learning_rate": 1.1448099102947457e-07, + "loss": 1.1548, + "step": 22072 + }, + { + "epoch": 0.43, + "learning_rate": 1.1447710768513843e-07, + "loss": 0.0014, + "step": 22073 + }, + { + "epoch": 0.43, + "learning_rate": 1.1447322434080229e-07, + "loss": 0.0139, + "step": 22074 + }, + { + "epoch": 0.43, + "learning_rate": 1.1446934099646615e-07, + "loss": 0.0008, + "step": 22075 + }, + { + "epoch": 0.43, + "learning_rate": 1.1446545765213001e-07, + "loss": 0.0008, + "step": 22076 + }, + { + "epoch": 0.43, + "learning_rate": 1.1446157430779387e-07, + "loss": 0.0011, + "step": 22077 + }, + { + "epoch": 0.43, + "learning_rate": 1.1445769096345772e-07, + "loss": 0.0007, + "step": 22078 + }, + { + "epoch": 0.43, + "learning_rate": 1.1445380761912158e-07, + "loss": 0.0006, + "step": 22079 + }, + { + "epoch": 0.43, + "learning_rate": 1.1444992427478544e-07, + "loss": 0.0007, + "step": 22080 + }, + { + "epoch": 0.43, + "learning_rate": 1.144460409304493e-07, + "loss": 0.0007, + "step": 22081 + }, + { + "epoch": 0.43, + "learning_rate": 1.1444215758611316e-07, + "loss": 0.0006, + "step": 22082 + }, + { + "epoch": 0.43, + "learning_rate": 1.1443827424177702e-07, + "loss": 0.0006, + "step": 22083 + }, + { + "epoch": 0.43, + "learning_rate": 1.1443439089744087e-07, + "loss": 0.0006, + "step": 22084 + }, + { + "epoch": 0.43, + "learning_rate": 1.1443050755310473e-07, + "loss": 0.001, + "step": 22085 + }, + { + "epoch": 0.43, + "learning_rate": 1.1442662420876859e-07, + "loss": 0.552, + "step": 22086 + }, + { + "epoch": 0.43, + "learning_rate": 1.1442274086443245e-07, + "loss": 0.0006, + "step": 22087 + }, + { + "epoch": 0.43, + "learning_rate": 1.144188575200963e-07, + "loss": 0.0006, + "step": 22088 + }, + { + "epoch": 0.43, + "learning_rate": 1.1441497417576016e-07, + "loss": 0.0007, + "step": 22089 + }, + { + "epoch": 0.43, + "learning_rate": 1.1441109083142402e-07, + "loss": 0.0007, + "step": 22090 + }, + { + "epoch": 0.43, + "learning_rate": 1.1440720748708788e-07, + "loss": 0.0007, + "step": 22091 + }, + { + "epoch": 0.43, + "learning_rate": 1.1440332414275174e-07, + "loss": 0.0006, + "step": 22092 + }, + { + "epoch": 0.43, + "learning_rate": 1.143994407984156e-07, + "loss": 0.0008, + "step": 22093 + }, + { + "epoch": 0.43, + "learning_rate": 1.1439555745407946e-07, + "loss": 0.0148, + "step": 22094 + }, + { + "epoch": 0.43, + "learning_rate": 1.1439167410974331e-07, + "loss": 0.0047, + "step": 22095 + }, + { + "epoch": 0.43, + "learning_rate": 1.1438779076540717e-07, + "loss": 0.0007, + "step": 22096 + }, + { + "epoch": 0.43, + "learning_rate": 1.1438390742107103e-07, + "loss": 0.0025, + "step": 22097 + }, + { + "epoch": 0.43, + "learning_rate": 1.1438002407673489e-07, + "loss": 0.0016, + "step": 22098 + }, + { + "epoch": 0.43, + "learning_rate": 1.1437614073239875e-07, + "loss": 0.0013, + "step": 22099 + }, + { + "epoch": 0.43, + "learning_rate": 1.1437225738806259e-07, + "loss": 0.0008, + "step": 22100 + }, + { + "epoch": 0.43, + "learning_rate": 1.1436837404372645e-07, + "loss": 0.0005, + "step": 22101 + }, + { + "epoch": 0.43, + "learning_rate": 1.1436449069939031e-07, + "loss": 0.0008, + "step": 22102 + }, + { + "epoch": 0.43, + "learning_rate": 1.1436060735505417e-07, + "loss": 0.0014, + "step": 22103 + }, + { + "epoch": 0.43, + "learning_rate": 1.1435672401071802e-07, + "loss": 0.0005, + "step": 22104 + }, + { + "epoch": 0.43, + "learning_rate": 1.1435284066638188e-07, + "loss": 0.0008, + "step": 22105 + }, + { + "epoch": 0.43, + "learning_rate": 1.1434895732204574e-07, + "loss": 0.0006, + "step": 22106 + }, + { + "epoch": 0.43, + "learning_rate": 1.143450739777096e-07, + "loss": 0.9377, + "step": 22107 + }, + { + "epoch": 0.43, + "learning_rate": 1.1434119063337346e-07, + "loss": 0.0006, + "step": 22108 + }, + { + "epoch": 0.43, + "learning_rate": 1.1433730728903732e-07, + "loss": 0.0007, + "step": 22109 + }, + { + "epoch": 0.43, + "learning_rate": 1.1433342394470117e-07, + "loss": 0.0015, + "step": 22110 + }, + { + "epoch": 0.43, + "learning_rate": 1.1432954060036503e-07, + "loss": 0.2067, + "step": 22111 + }, + { + "epoch": 0.43, + "learning_rate": 1.1432565725602889e-07, + "loss": 0.0014, + "step": 22112 + }, + { + "epoch": 0.43, + "learning_rate": 1.1432177391169275e-07, + "loss": 0.0007, + "step": 22113 + }, + { + "epoch": 0.43, + "learning_rate": 1.1431789056735661e-07, + "loss": 0.0006, + "step": 22114 + }, + { + "epoch": 0.43, + "learning_rate": 1.1431400722302047e-07, + "loss": 0.0009, + "step": 22115 + }, + { + "epoch": 0.43, + "learning_rate": 1.1431012387868432e-07, + "loss": 0.0013, + "step": 22116 + }, + { + "epoch": 0.43, + "learning_rate": 1.1430624053434818e-07, + "loss": 0.0006, + "step": 22117 + }, + { + "epoch": 0.43, + "learning_rate": 1.1430235719001204e-07, + "loss": 0.3064, + "step": 22118 + }, + { + "epoch": 0.43, + "learning_rate": 1.1429847384567589e-07, + "loss": 0.0007, + "step": 22119 + }, + { + "epoch": 0.43, + "learning_rate": 1.1429459050133974e-07, + "loss": 0.0021, + "step": 22120 + }, + { + "epoch": 0.43, + "learning_rate": 1.142907071570036e-07, + "loss": 0.0258, + "step": 22121 + }, + { + "epoch": 0.43, + "learning_rate": 1.1428682381266746e-07, + "loss": 0.0006, + "step": 22122 + }, + { + "epoch": 0.43, + "learning_rate": 1.1428294046833132e-07, + "loss": 0.0006, + "step": 22123 + }, + { + "epoch": 0.43, + "learning_rate": 1.1427905712399518e-07, + "loss": 0.0005, + "step": 22124 + }, + { + "epoch": 0.43, + "learning_rate": 1.1427517377965903e-07, + "loss": 0.0006, + "step": 22125 + }, + { + "epoch": 0.43, + "learning_rate": 1.1427129043532289e-07, + "loss": 0.0006, + "step": 22126 + }, + { + "epoch": 0.43, + "learning_rate": 1.1426740709098675e-07, + "loss": 0.0012, + "step": 22127 + }, + { + "epoch": 0.43, + "learning_rate": 1.1426352374665061e-07, + "loss": 0.0008, + "step": 22128 + }, + { + "epoch": 0.43, + "learning_rate": 1.1425964040231445e-07, + "loss": 0.001, + "step": 22129 + }, + { + "epoch": 0.43, + "learning_rate": 1.1425575705797831e-07, + "loss": 0.0059, + "step": 22130 + }, + { + "epoch": 0.43, + "learning_rate": 1.1425187371364217e-07, + "loss": 0.0005, + "step": 22131 + }, + { + "epoch": 0.43, + "learning_rate": 1.1424799036930603e-07, + "loss": 0.0158, + "step": 22132 + }, + { + "epoch": 0.43, + "learning_rate": 1.1424410702496989e-07, + "loss": 0.003, + "step": 22133 + }, + { + "epoch": 0.43, + "learning_rate": 1.1424022368063375e-07, + "loss": 0.0007, + "step": 22134 + }, + { + "epoch": 0.43, + "learning_rate": 1.142363403362976e-07, + "loss": 0.0009, + "step": 22135 + }, + { + "epoch": 0.43, + "learning_rate": 1.1423245699196146e-07, + "loss": 0.0005, + "step": 22136 + }, + { + "epoch": 0.43, + "learning_rate": 1.1422857364762532e-07, + "loss": 0.0027, + "step": 22137 + }, + { + "epoch": 0.43, + "learning_rate": 1.1422469030328918e-07, + "loss": 0.0042, + "step": 22138 + }, + { + "epoch": 0.43, + "learning_rate": 1.1422080695895304e-07, + "loss": 0.0008, + "step": 22139 + }, + { + "epoch": 0.43, + "learning_rate": 1.142169236146169e-07, + "loss": 0.0007, + "step": 22140 + }, + { + "epoch": 0.43, + "learning_rate": 1.1421304027028075e-07, + "loss": 0.0008, + "step": 22141 + }, + { + "epoch": 0.43, + "learning_rate": 1.1420915692594461e-07, + "loss": 0.0016, + "step": 22142 + }, + { + "epoch": 0.43, + "learning_rate": 1.1420527358160847e-07, + "loss": 0.0006, + "step": 22143 + }, + { + "epoch": 0.43, + "learning_rate": 1.1420139023727233e-07, + "loss": 0.0008, + "step": 22144 + }, + { + "epoch": 0.43, + "learning_rate": 1.1419750689293619e-07, + "loss": 0.0006, + "step": 22145 + }, + { + "epoch": 0.43, + "learning_rate": 1.1419362354860004e-07, + "loss": 0.0021, + "step": 22146 + }, + { + "epoch": 0.43, + "learning_rate": 1.141897402042639e-07, + "loss": 0.0008, + "step": 22147 + }, + { + "epoch": 0.43, + "learning_rate": 1.1418585685992776e-07, + "loss": 0.0006, + "step": 22148 + }, + { + "epoch": 0.43, + "learning_rate": 1.1418197351559162e-07, + "loss": 0.0006, + "step": 22149 + }, + { + "epoch": 0.43, + "learning_rate": 1.1417809017125548e-07, + "loss": 0.0007, + "step": 22150 + }, + { + "epoch": 0.43, + "learning_rate": 1.1417420682691934e-07, + "loss": 0.0005, + "step": 22151 + }, + { + "epoch": 0.43, + "learning_rate": 1.141703234825832e-07, + "loss": 0.0007, + "step": 22152 + }, + { + "epoch": 0.43, + "learning_rate": 1.1416644013824705e-07, + "loss": 0.003, + "step": 22153 + }, + { + "epoch": 0.43, + "learning_rate": 1.1416255679391091e-07, + "loss": 0.0013, + "step": 22154 + }, + { + "epoch": 0.43, + "learning_rate": 1.1415867344957477e-07, + "loss": 0.0007, + "step": 22155 + }, + { + "epoch": 0.43, + "learning_rate": 1.1415479010523863e-07, + "loss": 0.0005, + "step": 22156 + }, + { + "epoch": 0.43, + "learning_rate": 1.1415090676090249e-07, + "loss": 0.0006, + "step": 22157 + }, + { + "epoch": 0.43, + "learning_rate": 1.1414702341656634e-07, + "loss": 0.6987, + "step": 22158 + }, + { + "epoch": 0.43, + "learning_rate": 1.141431400722302e-07, + "loss": 0.0196, + "step": 22159 + }, + { + "epoch": 0.43, + "learning_rate": 1.1413925672789406e-07, + "loss": 0.0065, + "step": 22160 + }, + { + "epoch": 0.43, + "learning_rate": 1.1413537338355792e-07, + "loss": 0.0007, + "step": 22161 + }, + { + "epoch": 0.43, + "learning_rate": 1.1413149003922178e-07, + "loss": 0.001, + "step": 22162 + }, + { + "epoch": 0.43, + "learning_rate": 1.1412760669488563e-07, + "loss": 0.0007, + "step": 22163 + }, + { + "epoch": 0.43, + "learning_rate": 1.1412372335054949e-07, + "loss": 0.0009, + "step": 22164 + }, + { + "epoch": 0.43, + "learning_rate": 1.1411984000621335e-07, + "loss": 0.0009, + "step": 22165 + }, + { + "epoch": 0.43, + "learning_rate": 1.1411595666187721e-07, + "loss": 0.0007, + "step": 22166 + }, + { + "epoch": 0.43, + "learning_rate": 1.1411207331754107e-07, + "loss": 0.0009, + "step": 22167 + }, + { + "epoch": 0.43, + "learning_rate": 1.1410818997320493e-07, + "loss": 0.0009, + "step": 22168 + }, + { + "epoch": 0.43, + "learning_rate": 1.1410430662886878e-07, + "loss": 1.1025, + "step": 22169 + }, + { + "epoch": 0.43, + "learning_rate": 1.1410042328453264e-07, + "loss": 0.318, + "step": 22170 + }, + { + "epoch": 0.43, + "learning_rate": 1.140965399401965e-07, + "loss": 0.0007, + "step": 22171 + }, + { + "epoch": 0.43, + "learning_rate": 1.1409265659586036e-07, + "loss": 0.0008, + "step": 22172 + }, + { + "epoch": 0.43, + "learning_rate": 1.1408877325152422e-07, + "loss": 0.3322, + "step": 22173 + }, + { + "epoch": 0.43, + "learning_rate": 1.1408488990718808e-07, + "loss": 0.8128, + "step": 22174 + }, + { + "epoch": 0.43, + "learning_rate": 1.1408100656285193e-07, + "loss": 0.6339, + "step": 22175 + }, + { + "epoch": 0.43, + "learning_rate": 1.1407712321851579e-07, + "loss": 0.0012, + "step": 22176 + }, + { + "epoch": 0.43, + "learning_rate": 1.1407323987417962e-07, + "loss": 0.1416, + "step": 22177 + }, + { + "epoch": 0.43, + "learning_rate": 1.1406935652984348e-07, + "loss": 0.5418, + "step": 22178 + }, + { + "epoch": 0.43, + "learning_rate": 1.1406547318550734e-07, + "loss": 0.0053, + "step": 22179 + }, + { + "epoch": 0.43, + "learning_rate": 1.140615898411712e-07, + "loss": 0.0012, + "step": 22180 + }, + { + "epoch": 0.43, + "learning_rate": 1.1405770649683506e-07, + "loss": 0.0007, + "step": 22181 + }, + { + "epoch": 0.43, + "learning_rate": 1.1405382315249892e-07, + "loss": 0.0006, + "step": 22182 + }, + { + "epoch": 0.43, + "learning_rate": 1.1404993980816277e-07, + "loss": 0.0007, + "step": 22183 + }, + { + "epoch": 0.43, + "learning_rate": 1.1404605646382663e-07, + "loss": 0.6397, + "step": 22184 + }, + { + "epoch": 0.43, + "learning_rate": 1.1404217311949049e-07, + "loss": 0.0005, + "step": 22185 + }, + { + "epoch": 0.43, + "learning_rate": 1.1403828977515435e-07, + "loss": 0.0009, + "step": 22186 + }, + { + "epoch": 0.43, + "learning_rate": 1.140344064308182e-07, + "loss": 0.0006, + "step": 22187 + }, + { + "epoch": 0.43, + "learning_rate": 1.1403052308648206e-07, + "loss": 0.001, + "step": 22188 + }, + { + "epoch": 0.43, + "learning_rate": 1.1402663974214592e-07, + "loss": 0.0007, + "step": 22189 + }, + { + "epoch": 0.43, + "learning_rate": 1.1402275639780978e-07, + "loss": 0.0007, + "step": 22190 + }, + { + "epoch": 0.43, + "learning_rate": 1.1401887305347364e-07, + "loss": 0.0007, + "step": 22191 + }, + { + "epoch": 0.43, + "learning_rate": 1.140149897091375e-07, + "loss": 0.1843, + "step": 22192 + }, + { + "epoch": 0.43, + "learning_rate": 1.1401110636480136e-07, + "loss": 0.0007, + "step": 22193 + }, + { + "epoch": 0.43, + "learning_rate": 1.1400722302046521e-07, + "loss": 0.2618, + "step": 22194 + }, + { + "epoch": 0.43, + "learning_rate": 1.1400333967612907e-07, + "loss": 0.0009, + "step": 22195 + }, + { + "epoch": 0.43, + "learning_rate": 1.1399945633179293e-07, + "loss": 0.0006, + "step": 22196 + }, + { + "epoch": 0.43, + "learning_rate": 1.1399557298745679e-07, + "loss": 0.0011, + "step": 22197 + }, + { + "epoch": 0.43, + "learning_rate": 1.1399168964312065e-07, + "loss": 0.001, + "step": 22198 + }, + { + "epoch": 0.43, + "learning_rate": 1.139878062987845e-07, + "loss": 0.0007, + "step": 22199 + }, + { + "epoch": 0.43, + "learning_rate": 1.1398392295444836e-07, + "loss": 0.0241, + "step": 22200 + }, + { + "epoch": 0.43, + "learning_rate": 1.1398003961011222e-07, + "loss": 0.4921, + "step": 22201 + }, + { + "epoch": 0.43, + "learning_rate": 1.1397615626577608e-07, + "loss": 0.0047, + "step": 22202 + }, + { + "epoch": 0.43, + "learning_rate": 1.1397227292143994e-07, + "loss": 0.0005, + "step": 22203 + }, + { + "epoch": 0.43, + "learning_rate": 1.139683895771038e-07, + "loss": 0.1446, + "step": 22204 + }, + { + "epoch": 0.43, + "learning_rate": 1.1396450623276765e-07, + "loss": 0.4109, + "step": 22205 + }, + { + "epoch": 0.43, + "learning_rate": 1.1396062288843151e-07, + "loss": 0.0007, + "step": 22206 + }, + { + "epoch": 0.43, + "learning_rate": 1.1395673954409537e-07, + "loss": 0.0005, + "step": 22207 + }, + { + "epoch": 0.43, + "learning_rate": 1.1395285619975923e-07, + "loss": 0.1073, + "step": 22208 + }, + { + "epoch": 0.43, + "learning_rate": 1.1394897285542309e-07, + "loss": 0.0005, + "step": 22209 + }, + { + "epoch": 0.43, + "learning_rate": 1.1394508951108695e-07, + "loss": 0.0007, + "step": 22210 + }, + { + "epoch": 0.43, + "learning_rate": 1.139412061667508e-07, + "loss": 0.0005, + "step": 22211 + }, + { + "epoch": 0.43, + "learning_rate": 1.1393732282241466e-07, + "loss": 0.0027, + "step": 22212 + }, + { + "epoch": 0.43, + "learning_rate": 1.1393343947807852e-07, + "loss": 0.0007, + "step": 22213 + }, + { + "epoch": 0.43, + "learning_rate": 1.1392955613374238e-07, + "loss": 0.0007, + "step": 22214 + }, + { + "epoch": 0.43, + "learning_rate": 1.1392567278940624e-07, + "loss": 0.0006, + "step": 22215 + }, + { + "epoch": 0.43, + "learning_rate": 1.139217894450701e-07, + "loss": 0.2226, + "step": 22216 + }, + { + "epoch": 0.43, + "learning_rate": 1.1391790610073395e-07, + "loss": 0.0008, + "step": 22217 + }, + { + "epoch": 0.43, + "learning_rate": 1.1391402275639781e-07, + "loss": 0.0007, + "step": 22218 + }, + { + "epoch": 0.43, + "learning_rate": 1.1391013941206167e-07, + "loss": 0.0015, + "step": 22219 + }, + { + "epoch": 0.43, + "learning_rate": 1.1390625606772553e-07, + "loss": 0.0009, + "step": 22220 + }, + { + "epoch": 0.43, + "learning_rate": 1.1390237272338939e-07, + "loss": 0.0013, + "step": 22221 + }, + { + "epoch": 0.43, + "learning_rate": 1.1389848937905324e-07, + "loss": 0.0012, + "step": 22222 + }, + { + "epoch": 0.43, + "learning_rate": 1.138946060347171e-07, + "loss": 0.009, + "step": 22223 + }, + { + "epoch": 0.43, + "learning_rate": 1.1389072269038096e-07, + "loss": 0.0013, + "step": 22224 + }, + { + "epoch": 0.43, + "learning_rate": 1.1388683934604482e-07, + "loss": 0.0006, + "step": 22225 + }, + { + "epoch": 0.43, + "learning_rate": 1.1388295600170868e-07, + "loss": 0.398, + "step": 22226 + }, + { + "epoch": 0.43, + "learning_rate": 1.1387907265737254e-07, + "loss": 0.0006, + "step": 22227 + }, + { + "epoch": 0.43, + "learning_rate": 1.138751893130364e-07, + "loss": 0.0005, + "step": 22228 + }, + { + "epoch": 0.43, + "learning_rate": 1.1387130596870025e-07, + "loss": 0.0008, + "step": 22229 + }, + { + "epoch": 0.43, + "learning_rate": 1.1386742262436411e-07, + "loss": 0.0008, + "step": 22230 + }, + { + "epoch": 0.43, + "learning_rate": 1.1386353928002797e-07, + "loss": 0.1503, + "step": 22231 + }, + { + "epoch": 0.43, + "learning_rate": 1.1385965593569183e-07, + "loss": 0.0203, + "step": 22232 + }, + { + "epoch": 0.43, + "learning_rate": 1.1385577259135569e-07, + "loss": 1.149, + "step": 22233 + }, + { + "epoch": 0.43, + "learning_rate": 1.1385188924701954e-07, + "loss": 0.0006, + "step": 22234 + }, + { + "epoch": 0.43, + "learning_rate": 1.1384800590268338e-07, + "loss": 0.0008, + "step": 22235 + }, + { + "epoch": 0.43, + "learning_rate": 1.1384412255834723e-07, + "loss": 0.0006, + "step": 22236 + }, + { + "epoch": 0.43, + "learning_rate": 1.1384023921401109e-07, + "loss": 0.0005, + "step": 22237 + }, + { + "epoch": 0.43, + "learning_rate": 1.1383635586967495e-07, + "loss": 0.0008, + "step": 22238 + }, + { + "epoch": 0.43, + "learning_rate": 1.1383247252533881e-07, + "loss": 0.2327, + "step": 22239 + }, + { + "epoch": 0.43, + "learning_rate": 1.1382858918100267e-07, + "loss": 0.0006, + "step": 22240 + }, + { + "epoch": 0.43, + "learning_rate": 1.1382470583666653e-07, + "loss": 1.1232, + "step": 22241 + }, + { + "epoch": 0.43, + "learning_rate": 1.1382082249233038e-07, + "loss": 0.0026, + "step": 22242 + }, + { + "epoch": 0.43, + "learning_rate": 1.1381693914799424e-07, + "loss": 0.0009, + "step": 22243 + }, + { + "epoch": 0.43, + "learning_rate": 1.138130558036581e-07, + "loss": 0.0006, + "step": 22244 + }, + { + "epoch": 0.43, + "learning_rate": 1.1380917245932196e-07, + "loss": 0.0006, + "step": 22245 + }, + { + "epoch": 0.43, + "learning_rate": 1.1380528911498582e-07, + "loss": 0.0005, + "step": 22246 + }, + { + "epoch": 0.43, + "learning_rate": 1.1380140577064967e-07, + "loss": 0.0006, + "step": 22247 + }, + { + "epoch": 0.43, + "learning_rate": 1.1379752242631353e-07, + "loss": 0.0006, + "step": 22248 + }, + { + "epoch": 0.43, + "learning_rate": 1.1379363908197739e-07, + "loss": 0.0006, + "step": 22249 + }, + { + "epoch": 0.43, + "learning_rate": 1.1378975573764125e-07, + "loss": 0.5507, + "step": 22250 + }, + { + "epoch": 0.43, + "learning_rate": 1.1378587239330511e-07, + "loss": 0.0009, + "step": 22251 + }, + { + "epoch": 0.43, + "learning_rate": 1.1378198904896897e-07, + "loss": 0.0006, + "step": 22252 + }, + { + "epoch": 0.43, + "learning_rate": 1.1377810570463282e-07, + "loss": 0.0008, + "step": 22253 + }, + { + "epoch": 0.43, + "learning_rate": 1.1377422236029668e-07, + "loss": 0.0005, + "step": 22254 + }, + { + "epoch": 0.43, + "learning_rate": 1.1377033901596054e-07, + "loss": 0.0008, + "step": 22255 + }, + { + "epoch": 0.43, + "learning_rate": 1.137664556716244e-07, + "loss": 0.0006, + "step": 22256 + }, + { + "epoch": 0.43, + "learning_rate": 1.1376257232728826e-07, + "loss": 0.0004, + "step": 22257 + }, + { + "epoch": 0.43, + "learning_rate": 1.1375868898295212e-07, + "loss": 0.0126, + "step": 22258 + }, + { + "epoch": 0.43, + "learning_rate": 1.1375480563861597e-07, + "loss": 0.0008, + "step": 22259 + }, + { + "epoch": 0.43, + "learning_rate": 1.1375092229427983e-07, + "loss": 0.0006, + "step": 22260 + }, + { + "epoch": 0.43, + "learning_rate": 1.1374703894994369e-07, + "loss": 0.0008, + "step": 22261 + }, + { + "epoch": 0.43, + "learning_rate": 1.1374315560560755e-07, + "loss": 0.0017, + "step": 22262 + }, + { + "epoch": 0.43, + "learning_rate": 1.137392722612714e-07, + "loss": 0.0007, + "step": 22263 + }, + { + "epoch": 0.43, + "learning_rate": 1.1373538891693526e-07, + "loss": 0.7095, + "step": 22264 + }, + { + "epoch": 0.43, + "learning_rate": 1.1373150557259912e-07, + "loss": 0.0022, + "step": 22265 + }, + { + "epoch": 0.43, + "learning_rate": 1.1372762222826298e-07, + "loss": 0.0005, + "step": 22266 + }, + { + "epoch": 0.43, + "learning_rate": 1.1372373888392684e-07, + "loss": 0.0007, + "step": 22267 + }, + { + "epoch": 0.43, + "learning_rate": 1.137198555395907e-07, + "loss": 0.0009, + "step": 22268 + }, + { + "epoch": 0.43, + "learning_rate": 1.1371597219525456e-07, + "loss": 0.0007, + "step": 22269 + }, + { + "epoch": 0.43, + "learning_rate": 1.1371208885091841e-07, + "loss": 0.0018, + "step": 22270 + }, + { + "epoch": 0.43, + "learning_rate": 1.1370820550658227e-07, + "loss": 0.0009, + "step": 22271 + }, + { + "epoch": 0.43, + "learning_rate": 1.1370432216224613e-07, + "loss": 0.2039, + "step": 22272 + }, + { + "epoch": 0.43, + "learning_rate": 1.1370043881790999e-07, + "loss": 0.0007, + "step": 22273 + }, + { + "epoch": 0.43, + "learning_rate": 1.1369655547357385e-07, + "loss": 0.0006, + "step": 22274 + }, + { + "epoch": 0.43, + "learning_rate": 1.136926721292377e-07, + "loss": 0.0006, + "step": 22275 + }, + { + "epoch": 0.43, + "learning_rate": 1.1368878878490156e-07, + "loss": 0.0375, + "step": 22276 + }, + { + "epoch": 0.43, + "learning_rate": 1.1368490544056541e-07, + "loss": 0.0008, + "step": 22277 + }, + { + "epoch": 0.43, + "learning_rate": 1.1368102209622927e-07, + "loss": 0.6941, + "step": 22278 + }, + { + "epoch": 0.43, + "learning_rate": 1.1367713875189313e-07, + "loss": 0.0006, + "step": 22279 + }, + { + "epoch": 0.43, + "learning_rate": 1.1367325540755698e-07, + "loss": 0.0007, + "step": 22280 + }, + { + "epoch": 0.43, + "learning_rate": 1.1366937206322084e-07, + "loss": 0.0006, + "step": 22281 + }, + { + "epoch": 0.43, + "learning_rate": 1.136654887188847e-07, + "loss": 0.0011, + "step": 22282 + }, + { + "epoch": 0.43, + "learning_rate": 1.1366160537454856e-07, + "loss": 0.0006, + "step": 22283 + }, + { + "epoch": 0.43, + "learning_rate": 1.1365772203021242e-07, + "loss": 0.0006, + "step": 22284 + }, + { + "epoch": 0.43, + "learning_rate": 1.1365383868587627e-07, + "loss": 0.0007, + "step": 22285 + }, + { + "epoch": 0.43, + "learning_rate": 1.1364995534154013e-07, + "loss": 0.0748, + "step": 22286 + }, + { + "epoch": 0.43, + "learning_rate": 1.1364607199720399e-07, + "loss": 0.0006, + "step": 22287 + }, + { + "epoch": 0.43, + "learning_rate": 1.1364218865286785e-07, + "loss": 0.0793, + "step": 22288 + }, + { + "epoch": 0.43, + "learning_rate": 1.1363830530853171e-07, + "loss": 0.0006, + "step": 22289 + }, + { + "epoch": 0.43, + "learning_rate": 1.1363442196419557e-07, + "loss": 0.0005, + "step": 22290 + }, + { + "epoch": 0.43, + "learning_rate": 1.1363053861985942e-07, + "loss": 0.0006, + "step": 22291 + }, + { + "epoch": 0.43, + "learning_rate": 1.1362665527552328e-07, + "loss": 0.0009, + "step": 22292 + }, + { + "epoch": 0.43, + "learning_rate": 1.1362277193118713e-07, + "loss": 1.5931, + "step": 22293 + }, + { + "epoch": 0.43, + "learning_rate": 1.1361888858685099e-07, + "loss": 0.0005, + "step": 22294 + }, + { + "epoch": 0.43, + "learning_rate": 1.1361500524251484e-07, + "loss": 0.0012, + "step": 22295 + }, + { + "epoch": 0.43, + "learning_rate": 1.136111218981787e-07, + "loss": 0.0009, + "step": 22296 + }, + { + "epoch": 0.43, + "learning_rate": 1.1360723855384256e-07, + "loss": 0.0006, + "step": 22297 + }, + { + "epoch": 0.43, + "learning_rate": 1.1360335520950642e-07, + "loss": 0.0761, + "step": 22298 + }, + { + "epoch": 0.43, + "learning_rate": 1.1359947186517028e-07, + "loss": 0.0007, + "step": 22299 + }, + { + "epoch": 0.43, + "learning_rate": 1.1359558852083413e-07, + "loss": 0.0008, + "step": 22300 + }, + { + "epoch": 0.43, + "learning_rate": 1.1359170517649799e-07, + "loss": 0.001, + "step": 22301 + }, + { + "epoch": 0.43, + "learning_rate": 1.1358782183216185e-07, + "loss": 0.0009, + "step": 22302 + }, + { + "epoch": 0.43, + "learning_rate": 1.1358393848782571e-07, + "loss": 0.0007, + "step": 22303 + }, + { + "epoch": 0.43, + "learning_rate": 1.1358005514348957e-07, + "loss": 0.0006, + "step": 22304 + }, + { + "epoch": 0.43, + "learning_rate": 1.1357617179915343e-07, + "loss": 1.346, + "step": 22305 + }, + { + "epoch": 0.43, + "learning_rate": 1.1357228845481727e-07, + "loss": 0.0008, + "step": 22306 + }, + { + "epoch": 0.43, + "learning_rate": 1.1356840511048113e-07, + "loss": 0.0006, + "step": 22307 + }, + { + "epoch": 0.43, + "learning_rate": 1.1356452176614499e-07, + "loss": 0.0076, + "step": 22308 + }, + { + "epoch": 0.43, + "learning_rate": 1.1356063842180885e-07, + "loss": 0.0288, + "step": 22309 + }, + { + "epoch": 0.43, + "learning_rate": 1.135567550774727e-07, + "loss": 0.0009, + "step": 22310 + }, + { + "epoch": 0.43, + "learning_rate": 1.1355287173313656e-07, + "loss": 0.0008, + "step": 22311 + }, + { + "epoch": 0.43, + "learning_rate": 1.1354898838880042e-07, + "loss": 0.0006, + "step": 22312 + }, + { + "epoch": 0.43, + "learning_rate": 1.1354510504446428e-07, + "loss": 0.6512, + "step": 22313 + }, + { + "epoch": 0.43, + "learning_rate": 1.1354122170012814e-07, + "loss": 0.0007, + "step": 22314 + }, + { + "epoch": 0.43, + "learning_rate": 1.13537338355792e-07, + "loss": 0.0008, + "step": 22315 + }, + { + "epoch": 0.43, + "learning_rate": 1.1353345501145585e-07, + "loss": 0.0006, + "step": 22316 + }, + { + "epoch": 0.43, + "learning_rate": 1.1352957166711971e-07, + "loss": 0.0008, + "step": 22317 + }, + { + "epoch": 0.43, + "learning_rate": 1.1352568832278357e-07, + "loss": 0.0069, + "step": 22318 + }, + { + "epoch": 0.43, + "learning_rate": 1.1352180497844743e-07, + "loss": 0.0096, + "step": 22319 + }, + { + "epoch": 0.43, + "learning_rate": 1.1351792163411129e-07, + "loss": 0.0008, + "step": 22320 + }, + { + "epoch": 0.43, + "learning_rate": 1.1351403828977514e-07, + "loss": 0.4076, + "step": 22321 + }, + { + "epoch": 0.43, + "learning_rate": 1.13510154945439e-07, + "loss": 0.0007, + "step": 22322 + }, + { + "epoch": 0.43, + "learning_rate": 1.1350627160110286e-07, + "loss": 0.0009, + "step": 22323 + }, + { + "epoch": 0.43, + "learning_rate": 1.1350238825676672e-07, + "loss": 0.0008, + "step": 22324 + }, + { + "epoch": 0.43, + "learning_rate": 1.1349850491243058e-07, + "loss": 0.0021, + "step": 22325 + }, + { + "epoch": 0.43, + "learning_rate": 1.1349462156809444e-07, + "loss": 0.0007, + "step": 22326 + }, + { + "epoch": 0.43, + "learning_rate": 1.134907382237583e-07, + "loss": 0.0017, + "step": 22327 + }, + { + "epoch": 0.43, + "learning_rate": 1.1348685487942215e-07, + "loss": 0.1894, + "step": 22328 + }, + { + "epoch": 0.43, + "learning_rate": 1.1348297153508601e-07, + "loss": 0.0008, + "step": 22329 + }, + { + "epoch": 0.43, + "learning_rate": 1.1347908819074987e-07, + "loss": 0.0046, + "step": 22330 + }, + { + "epoch": 0.43, + "learning_rate": 1.1347520484641373e-07, + "loss": 0.0008, + "step": 22331 + }, + { + "epoch": 0.43, + "learning_rate": 1.1347132150207759e-07, + "loss": 0.0009, + "step": 22332 + }, + { + "epoch": 0.43, + "learning_rate": 1.1346743815774144e-07, + "loss": 0.0006, + "step": 22333 + }, + { + "epoch": 0.43, + "learning_rate": 1.134635548134053e-07, + "loss": 0.0007, + "step": 22334 + }, + { + "epoch": 0.43, + "learning_rate": 1.1345967146906916e-07, + "loss": 0.0007, + "step": 22335 + }, + { + "epoch": 0.43, + "learning_rate": 1.1345578812473302e-07, + "loss": 0.0006, + "step": 22336 + }, + { + "epoch": 0.43, + "learning_rate": 1.1345190478039688e-07, + "loss": 0.0006, + "step": 22337 + }, + { + "epoch": 0.43, + "learning_rate": 1.1344802143606074e-07, + "loss": 0.0007, + "step": 22338 + }, + { + "epoch": 0.43, + "learning_rate": 1.1344413809172459e-07, + "loss": 0.0008, + "step": 22339 + }, + { + "epoch": 0.43, + "learning_rate": 1.1344025474738845e-07, + "loss": 0.0006, + "step": 22340 + }, + { + "epoch": 0.43, + "learning_rate": 1.1343637140305231e-07, + "loss": 0.0285, + "step": 22341 + }, + { + "epoch": 0.43, + "learning_rate": 1.1343248805871617e-07, + "loss": 0.0007, + "step": 22342 + }, + { + "epoch": 0.43, + "learning_rate": 1.1342860471438003e-07, + "loss": 0.0006, + "step": 22343 + }, + { + "epoch": 0.43, + "learning_rate": 1.1342472137004388e-07, + "loss": 0.0006, + "step": 22344 + }, + { + "epoch": 0.43, + "learning_rate": 1.1342083802570774e-07, + "loss": 0.0009, + "step": 22345 + }, + { + "epoch": 0.43, + "learning_rate": 1.134169546813716e-07, + "loss": 0.0611, + "step": 22346 + }, + { + "epoch": 0.43, + "learning_rate": 1.1341307133703546e-07, + "loss": 0.0006, + "step": 22347 + }, + { + "epoch": 0.43, + "learning_rate": 1.1340918799269932e-07, + "loss": 0.0193, + "step": 22348 + }, + { + "epoch": 0.43, + "learning_rate": 1.1340530464836318e-07, + "loss": 0.4209, + "step": 22349 + }, + { + "epoch": 0.43, + "learning_rate": 1.1340142130402703e-07, + "loss": 0.0007, + "step": 22350 + }, + { + "epoch": 0.43, + "learning_rate": 1.1339753795969087e-07, + "loss": 0.0007, + "step": 22351 + }, + { + "epoch": 0.43, + "learning_rate": 1.1339365461535472e-07, + "loss": 0.0006, + "step": 22352 + }, + { + "epoch": 0.43, + "learning_rate": 1.1338977127101858e-07, + "loss": 0.0007, + "step": 22353 + }, + { + "epoch": 0.43, + "learning_rate": 1.1338588792668244e-07, + "loss": 0.0006, + "step": 22354 + }, + { + "epoch": 0.43, + "learning_rate": 1.133820045823463e-07, + "loss": 0.0006, + "step": 22355 + }, + { + "epoch": 0.43, + "learning_rate": 1.1337812123801016e-07, + "loss": 0.0006, + "step": 22356 + }, + { + "epoch": 0.43, + "learning_rate": 1.1337423789367402e-07, + "loss": 0.0013, + "step": 22357 + }, + { + "epoch": 0.43, + "learning_rate": 1.1337035454933787e-07, + "loss": 0.0029, + "step": 22358 + }, + { + "epoch": 0.43, + "learning_rate": 1.1336647120500173e-07, + "loss": 0.0476, + "step": 22359 + }, + { + "epoch": 0.43, + "learning_rate": 1.1336258786066559e-07, + "loss": 0.5691, + "step": 22360 + }, + { + "epoch": 0.43, + "learning_rate": 1.1335870451632945e-07, + "loss": 0.0008, + "step": 22361 + }, + { + "epoch": 0.43, + "learning_rate": 1.133548211719933e-07, + "loss": 0.0006, + "step": 22362 + }, + { + "epoch": 0.43, + "learning_rate": 1.1335093782765716e-07, + "loss": 0.0012, + "step": 22363 + }, + { + "epoch": 0.43, + "learning_rate": 1.1334705448332102e-07, + "loss": 0.0008, + "step": 22364 + }, + { + "epoch": 0.43, + "learning_rate": 1.1334317113898488e-07, + "loss": 0.0006, + "step": 22365 + }, + { + "epoch": 0.43, + "learning_rate": 1.1333928779464874e-07, + "loss": 0.0054, + "step": 22366 + }, + { + "epoch": 0.43, + "learning_rate": 1.133354044503126e-07, + "loss": 0.6172, + "step": 22367 + }, + { + "epoch": 0.43, + "learning_rate": 1.1333152110597646e-07, + "loss": 0.0005, + "step": 22368 + }, + { + "epoch": 0.43, + "learning_rate": 1.1332763776164031e-07, + "loss": 0.0005, + "step": 22369 + }, + { + "epoch": 0.43, + "learning_rate": 1.1332375441730417e-07, + "loss": 0.847, + "step": 22370 + }, + { + "epoch": 0.43, + "learning_rate": 1.1331987107296803e-07, + "loss": 0.0006, + "step": 22371 + }, + { + "epoch": 0.43, + "learning_rate": 1.1331598772863189e-07, + "loss": 0.0015, + "step": 22372 + }, + { + "epoch": 0.43, + "learning_rate": 1.1331210438429575e-07, + "loss": 0.0008, + "step": 22373 + }, + { + "epoch": 0.43, + "learning_rate": 1.133082210399596e-07, + "loss": 0.2327, + "step": 22374 + }, + { + "epoch": 0.43, + "learning_rate": 1.1330433769562346e-07, + "loss": 1.0097, + "step": 22375 + }, + { + "epoch": 0.43, + "learning_rate": 1.1330045435128732e-07, + "loss": 0.0005, + "step": 22376 + }, + { + "epoch": 0.43, + "learning_rate": 1.1329657100695118e-07, + "loss": 0.0006, + "step": 22377 + }, + { + "epoch": 0.43, + "learning_rate": 1.1329268766261504e-07, + "loss": 0.0006, + "step": 22378 + }, + { + "epoch": 0.43, + "learning_rate": 1.132888043182789e-07, + "loss": 0.0007, + "step": 22379 + }, + { + "epoch": 0.43, + "learning_rate": 1.1328492097394275e-07, + "loss": 0.0007, + "step": 22380 + }, + { + "epoch": 0.43, + "learning_rate": 1.1328103762960661e-07, + "loss": 0.0007, + "step": 22381 + }, + { + "epoch": 0.43, + "learning_rate": 1.1327715428527047e-07, + "loss": 0.0007, + "step": 22382 + }, + { + "epoch": 0.43, + "learning_rate": 1.1327327094093433e-07, + "loss": 0.0007, + "step": 22383 + }, + { + "epoch": 0.43, + "learning_rate": 1.1326938759659819e-07, + "loss": 0.0006, + "step": 22384 + }, + { + "epoch": 0.43, + "learning_rate": 1.1326550425226205e-07, + "loss": 0.0009, + "step": 22385 + }, + { + "epoch": 0.43, + "learning_rate": 1.132616209079259e-07, + "loss": 0.0006, + "step": 22386 + }, + { + "epoch": 0.43, + "learning_rate": 1.1325773756358976e-07, + "loss": 0.0004, + "step": 22387 + }, + { + "epoch": 0.43, + "learning_rate": 1.1325385421925362e-07, + "loss": 0.0006, + "step": 22388 + }, + { + "epoch": 0.43, + "learning_rate": 1.1324997087491748e-07, + "loss": 0.0009, + "step": 22389 + }, + { + "epoch": 0.43, + "learning_rate": 1.1324608753058134e-07, + "loss": 0.0007, + "step": 22390 + }, + { + "epoch": 0.43, + "learning_rate": 1.132422041862452e-07, + "loss": 0.5364, + "step": 22391 + }, + { + "epoch": 0.43, + "learning_rate": 1.1323832084190905e-07, + "loss": 0.0007, + "step": 22392 + }, + { + "epoch": 0.43, + "learning_rate": 1.1323443749757291e-07, + "loss": 0.0007, + "step": 22393 + }, + { + "epoch": 0.43, + "learning_rate": 1.1323055415323677e-07, + "loss": 0.0006, + "step": 22394 + }, + { + "epoch": 0.43, + "learning_rate": 1.1322667080890063e-07, + "loss": 0.1143, + "step": 22395 + }, + { + "epoch": 0.43, + "learning_rate": 1.1322278746456449e-07, + "loss": 0.0011, + "step": 22396 + }, + { + "epoch": 0.43, + "learning_rate": 1.1321890412022834e-07, + "loss": 0.0005, + "step": 22397 + }, + { + "epoch": 0.43, + "learning_rate": 1.132150207758922e-07, + "loss": 0.0358, + "step": 22398 + }, + { + "epoch": 0.43, + "learning_rate": 1.1321113743155606e-07, + "loss": 0.0007, + "step": 22399 + }, + { + "epoch": 0.43, + "learning_rate": 1.1320725408721992e-07, + "loss": 0.0668, + "step": 22400 + }, + { + "epoch": 0.43, + "learning_rate": 1.1320337074288378e-07, + "loss": 0.0042, + "step": 22401 + }, + { + "epoch": 0.43, + "learning_rate": 1.1319948739854764e-07, + "loss": 0.001, + "step": 22402 + }, + { + "epoch": 0.43, + "learning_rate": 1.131956040542115e-07, + "loss": 0.0007, + "step": 22403 + }, + { + "epoch": 0.43, + "learning_rate": 1.1319172070987535e-07, + "loss": 0.0008, + "step": 22404 + }, + { + "epoch": 0.43, + "learning_rate": 1.1318783736553921e-07, + "loss": 0.0025, + "step": 22405 + }, + { + "epoch": 0.43, + "learning_rate": 1.1318395402120307e-07, + "loss": 0.0006, + "step": 22406 + }, + { + "epoch": 0.43, + "learning_rate": 1.1318007067686693e-07, + "loss": 0.0005, + "step": 22407 + }, + { + "epoch": 0.43, + "learning_rate": 1.1317618733253079e-07, + "loss": 0.0008, + "step": 22408 + }, + { + "epoch": 0.43, + "learning_rate": 1.1317230398819462e-07, + "loss": 0.0029, + "step": 22409 + }, + { + "epoch": 0.43, + "learning_rate": 1.1316842064385848e-07, + "loss": 0.0005, + "step": 22410 + }, + { + "epoch": 0.43, + "learning_rate": 1.1316453729952233e-07, + "loss": 0.0009, + "step": 22411 + }, + { + "epoch": 0.43, + "learning_rate": 1.1316065395518619e-07, + "loss": 0.0006, + "step": 22412 + }, + { + "epoch": 0.43, + "learning_rate": 1.1315677061085005e-07, + "loss": 0.3767, + "step": 22413 + }, + { + "epoch": 0.43, + "learning_rate": 1.1315288726651391e-07, + "loss": 0.6059, + "step": 22414 + }, + { + "epoch": 0.43, + "learning_rate": 1.1314900392217777e-07, + "loss": 0.0006, + "step": 22415 + }, + { + "epoch": 0.43, + "learning_rate": 1.1314512057784163e-07, + "loss": 0.0007, + "step": 22416 + }, + { + "epoch": 0.43, + "learning_rate": 1.1314123723350548e-07, + "loss": 0.0007, + "step": 22417 + }, + { + "epoch": 0.43, + "learning_rate": 1.1313735388916934e-07, + "loss": 0.0007, + "step": 22418 + }, + { + "epoch": 0.43, + "learning_rate": 1.131334705448332e-07, + "loss": 0.0007, + "step": 22419 + }, + { + "epoch": 0.43, + "learning_rate": 1.1312958720049706e-07, + "loss": 0.0006, + "step": 22420 + }, + { + "epoch": 0.43, + "learning_rate": 1.1312570385616092e-07, + "loss": 0.0008, + "step": 22421 + }, + { + "epoch": 0.43, + "learning_rate": 1.1312182051182477e-07, + "loss": 0.0046, + "step": 22422 + }, + { + "epoch": 0.43, + "learning_rate": 1.1311793716748863e-07, + "loss": 0.0008, + "step": 22423 + }, + { + "epoch": 0.43, + "learning_rate": 1.1311405382315249e-07, + "loss": 0.0007, + "step": 22424 + }, + { + "epoch": 0.43, + "learning_rate": 1.1311017047881635e-07, + "loss": 0.0008, + "step": 22425 + }, + { + "epoch": 0.44, + "learning_rate": 1.1310628713448021e-07, + "loss": 0.0008, + "step": 22426 + }, + { + "epoch": 0.44, + "learning_rate": 1.1310240379014407e-07, + "loss": 0.0004, + "step": 22427 + }, + { + "epoch": 0.44, + "learning_rate": 1.1309852044580792e-07, + "loss": 0.0007, + "step": 22428 + }, + { + "epoch": 0.44, + "learning_rate": 1.1309463710147178e-07, + "loss": 0.0008, + "step": 22429 + }, + { + "epoch": 0.44, + "learning_rate": 1.1309075375713564e-07, + "loss": 0.0028, + "step": 22430 + }, + { + "epoch": 0.44, + "learning_rate": 1.130868704127995e-07, + "loss": 0.1492, + "step": 22431 + }, + { + "epoch": 0.44, + "learning_rate": 1.1308298706846336e-07, + "loss": 0.0008, + "step": 22432 + }, + { + "epoch": 0.44, + "learning_rate": 1.1307910372412722e-07, + "loss": 0.0007, + "step": 22433 + }, + { + "epoch": 0.44, + "learning_rate": 1.1307522037979107e-07, + "loss": 0.0006, + "step": 22434 + }, + { + "epoch": 0.44, + "learning_rate": 1.1307133703545493e-07, + "loss": 0.0005, + "step": 22435 + }, + { + "epoch": 0.44, + "learning_rate": 1.1306745369111879e-07, + "loss": 0.4901, + "step": 22436 + }, + { + "epoch": 0.44, + "learning_rate": 1.1306357034678265e-07, + "loss": 0.0015, + "step": 22437 + }, + { + "epoch": 0.44, + "learning_rate": 1.130596870024465e-07, + "loss": 0.0019, + "step": 22438 + }, + { + "epoch": 0.44, + "learning_rate": 1.1305580365811036e-07, + "loss": 0.0007, + "step": 22439 + }, + { + "epoch": 0.44, + "learning_rate": 1.1305192031377422e-07, + "loss": 0.0005, + "step": 22440 + }, + { + "epoch": 0.44, + "learning_rate": 1.1304803696943808e-07, + "loss": 1.1617, + "step": 22441 + }, + { + "epoch": 0.44, + "learning_rate": 1.1304415362510194e-07, + "loss": 0.0005, + "step": 22442 + }, + { + "epoch": 0.44, + "learning_rate": 1.130402702807658e-07, + "loss": 0.793, + "step": 22443 + }, + { + "epoch": 0.44, + "learning_rate": 1.1303638693642966e-07, + "loss": 0.0007, + "step": 22444 + }, + { + "epoch": 0.44, + "learning_rate": 1.1303250359209351e-07, + "loss": 1.4809, + "step": 22445 + }, + { + "epoch": 0.44, + "learning_rate": 1.1302862024775737e-07, + "loss": 0.0007, + "step": 22446 + }, + { + "epoch": 0.44, + "learning_rate": 1.1302473690342123e-07, + "loss": 0.0005, + "step": 22447 + }, + { + "epoch": 0.44, + "learning_rate": 1.1302085355908509e-07, + "loss": 0.0004, + "step": 22448 + }, + { + "epoch": 0.44, + "learning_rate": 1.1301697021474895e-07, + "loss": 0.0005, + "step": 22449 + }, + { + "epoch": 0.44, + "learning_rate": 1.130130868704128e-07, + "loss": 0.0007, + "step": 22450 + }, + { + "epoch": 0.44, + "learning_rate": 1.1300920352607666e-07, + "loss": 0.1945, + "step": 22451 + }, + { + "epoch": 0.44, + "learning_rate": 1.1300532018174052e-07, + "loss": 0.0028, + "step": 22452 + }, + { + "epoch": 0.44, + "learning_rate": 1.1300143683740438e-07, + "loss": 0.0009, + "step": 22453 + }, + { + "epoch": 0.44, + "learning_rate": 1.1299755349306823e-07, + "loss": 0.0007, + "step": 22454 + }, + { + "epoch": 0.44, + "learning_rate": 1.1299367014873208e-07, + "loss": 0.0007, + "step": 22455 + }, + { + "epoch": 0.44, + "learning_rate": 1.1298978680439594e-07, + "loss": 0.001, + "step": 22456 + }, + { + "epoch": 0.44, + "learning_rate": 1.129859034600598e-07, + "loss": 0.0008, + "step": 22457 + }, + { + "epoch": 0.44, + "learning_rate": 1.1298202011572366e-07, + "loss": 0.0008, + "step": 22458 + }, + { + "epoch": 0.44, + "learning_rate": 1.1297813677138752e-07, + "loss": 0.0007, + "step": 22459 + }, + { + "epoch": 0.44, + "learning_rate": 1.1297425342705137e-07, + "loss": 0.0008, + "step": 22460 + }, + { + "epoch": 0.44, + "learning_rate": 1.1297037008271523e-07, + "loss": 0.0018, + "step": 22461 + }, + { + "epoch": 0.44, + "learning_rate": 1.1296648673837909e-07, + "loss": 0.0006, + "step": 22462 + }, + { + "epoch": 0.44, + "learning_rate": 1.1296260339404295e-07, + "loss": 0.0007, + "step": 22463 + }, + { + "epoch": 0.44, + "learning_rate": 1.1295872004970681e-07, + "loss": 0.0007, + "step": 22464 + }, + { + "epoch": 0.44, + "learning_rate": 1.1295483670537067e-07, + "loss": 0.0007, + "step": 22465 + }, + { + "epoch": 0.44, + "learning_rate": 1.1295095336103452e-07, + "loss": 0.0007, + "step": 22466 + }, + { + "epoch": 0.44, + "learning_rate": 1.1294707001669837e-07, + "loss": 0.0007, + "step": 22467 + }, + { + "epoch": 0.44, + "learning_rate": 1.1294318667236223e-07, + "loss": 0.0007, + "step": 22468 + }, + { + "epoch": 0.44, + "learning_rate": 1.1293930332802609e-07, + "loss": 0.0006, + "step": 22469 + }, + { + "epoch": 0.44, + "learning_rate": 1.1293541998368994e-07, + "loss": 0.0007, + "step": 22470 + }, + { + "epoch": 0.44, + "learning_rate": 1.129315366393538e-07, + "loss": 0.0005, + "step": 22471 + }, + { + "epoch": 0.44, + "learning_rate": 1.1292765329501766e-07, + "loss": 1.0797, + "step": 22472 + }, + { + "epoch": 0.44, + "learning_rate": 1.1292376995068152e-07, + "loss": 0.0006, + "step": 22473 + }, + { + "epoch": 0.44, + "learning_rate": 1.1291988660634538e-07, + "loss": 0.0007, + "step": 22474 + }, + { + "epoch": 0.44, + "learning_rate": 1.1291600326200924e-07, + "loss": 0.0011, + "step": 22475 + }, + { + "epoch": 0.44, + "learning_rate": 1.1291211991767309e-07, + "loss": 0.0009, + "step": 22476 + }, + { + "epoch": 0.44, + "learning_rate": 1.1290823657333695e-07, + "loss": 0.5965, + "step": 22477 + }, + { + "epoch": 0.44, + "learning_rate": 1.1290435322900081e-07, + "loss": 0.0006, + "step": 22478 + }, + { + "epoch": 0.44, + "learning_rate": 1.1290046988466467e-07, + "loss": 0.0005, + "step": 22479 + }, + { + "epoch": 0.44, + "learning_rate": 1.1289658654032853e-07, + "loss": 0.0006, + "step": 22480 + }, + { + "epoch": 0.44, + "learning_rate": 1.1289270319599238e-07, + "loss": 0.5594, + "step": 22481 + }, + { + "epoch": 0.44, + "learning_rate": 1.1288881985165624e-07, + "loss": 0.0005, + "step": 22482 + }, + { + "epoch": 0.44, + "learning_rate": 1.1288493650732009e-07, + "loss": 0.0007, + "step": 22483 + }, + { + "epoch": 0.44, + "learning_rate": 1.1288105316298395e-07, + "loss": 0.1435, + "step": 22484 + }, + { + "epoch": 0.44, + "learning_rate": 1.128771698186478e-07, + "loss": 0.0006, + "step": 22485 + }, + { + "epoch": 0.44, + "learning_rate": 1.1287328647431166e-07, + "loss": 0.0052, + "step": 22486 + }, + { + "epoch": 0.44, + "learning_rate": 1.1286940312997552e-07, + "loss": 0.6014, + "step": 22487 + }, + { + "epoch": 0.44, + "learning_rate": 1.1286551978563938e-07, + "loss": 0.0007, + "step": 22488 + }, + { + "epoch": 0.44, + "learning_rate": 1.1286163644130324e-07, + "loss": 0.0006, + "step": 22489 + }, + { + "epoch": 0.44, + "learning_rate": 1.128577530969671e-07, + "loss": 0.9796, + "step": 22490 + }, + { + "epoch": 0.44, + "learning_rate": 1.1285386975263095e-07, + "loss": 0.0008, + "step": 22491 + }, + { + "epoch": 0.44, + "learning_rate": 1.1284998640829481e-07, + "loss": 0.0007, + "step": 22492 + }, + { + "epoch": 0.44, + "learning_rate": 1.1284610306395867e-07, + "loss": 0.0007, + "step": 22493 + }, + { + "epoch": 0.44, + "learning_rate": 1.1284221971962253e-07, + "loss": 0.0005, + "step": 22494 + }, + { + "epoch": 0.44, + "learning_rate": 1.1283833637528639e-07, + "loss": 0.782, + "step": 22495 + }, + { + "epoch": 0.44, + "learning_rate": 1.1283445303095024e-07, + "loss": 0.0607, + "step": 22496 + }, + { + "epoch": 0.44, + "learning_rate": 1.128305696866141e-07, + "loss": 0.0005, + "step": 22497 + }, + { + "epoch": 0.44, + "learning_rate": 1.1282668634227796e-07, + "loss": 0.0009, + "step": 22498 + }, + { + "epoch": 0.44, + "learning_rate": 1.1282280299794182e-07, + "loss": 0.0007, + "step": 22499 + }, + { + "epoch": 0.44, + "learning_rate": 1.1281891965360568e-07, + "loss": 0.0007, + "step": 22500 + }, + { + "epoch": 0.44, + "learning_rate": 1.1281503630926954e-07, + "loss": 0.0008, + "step": 22501 + }, + { + "epoch": 0.44, + "learning_rate": 1.128111529649334e-07, + "loss": 0.0005, + "step": 22502 + }, + { + "epoch": 0.44, + "learning_rate": 1.1280726962059725e-07, + "loss": 0.0012, + "step": 22503 + }, + { + "epoch": 0.44, + "learning_rate": 1.1280338627626111e-07, + "loss": 0.0027, + "step": 22504 + }, + { + "epoch": 0.44, + "learning_rate": 1.1279950293192497e-07, + "loss": 0.0007, + "step": 22505 + }, + { + "epoch": 0.44, + "learning_rate": 1.1279561958758883e-07, + "loss": 0.0034, + "step": 22506 + }, + { + "epoch": 0.44, + "learning_rate": 1.1279173624325269e-07, + "loss": 0.0005, + "step": 22507 + }, + { + "epoch": 0.44, + "learning_rate": 1.1278785289891654e-07, + "loss": 0.0008, + "step": 22508 + }, + { + "epoch": 0.44, + "learning_rate": 1.127839695545804e-07, + "loss": 0.0029, + "step": 22509 + }, + { + "epoch": 0.44, + "learning_rate": 1.1278008621024426e-07, + "loss": 0.0005, + "step": 22510 + }, + { + "epoch": 0.44, + "learning_rate": 1.1277620286590812e-07, + "loss": 0.0007, + "step": 22511 + }, + { + "epoch": 0.44, + "learning_rate": 1.1277231952157198e-07, + "loss": 0.0013, + "step": 22512 + }, + { + "epoch": 0.44, + "learning_rate": 1.1276843617723584e-07, + "loss": 0.0007, + "step": 22513 + }, + { + "epoch": 0.44, + "learning_rate": 1.1276455283289969e-07, + "loss": 0.0082, + "step": 22514 + }, + { + "epoch": 0.44, + "learning_rate": 1.1276066948856355e-07, + "loss": 0.0012, + "step": 22515 + }, + { + "epoch": 0.44, + "learning_rate": 1.1275678614422741e-07, + "loss": 0.0005, + "step": 22516 + }, + { + "epoch": 0.44, + "learning_rate": 1.1275290279989127e-07, + "loss": 0.1058, + "step": 22517 + }, + { + "epoch": 0.44, + "learning_rate": 1.1274901945555513e-07, + "loss": 0.0007, + "step": 22518 + }, + { + "epoch": 0.44, + "learning_rate": 1.1274513611121898e-07, + "loss": 0.0007, + "step": 22519 + }, + { + "epoch": 0.44, + "learning_rate": 1.1274125276688284e-07, + "loss": 0.0647, + "step": 22520 + }, + { + "epoch": 0.44, + "learning_rate": 1.127373694225467e-07, + "loss": 1.2629, + "step": 22521 + }, + { + "epoch": 0.44, + "learning_rate": 1.1273348607821056e-07, + "loss": 0.0017, + "step": 22522 + }, + { + "epoch": 0.44, + "learning_rate": 1.1272960273387442e-07, + "loss": 0.5559, + "step": 22523 + }, + { + "epoch": 0.44, + "learning_rate": 1.1272571938953828e-07, + "loss": 0.9906, + "step": 22524 + }, + { + "epoch": 0.44, + "learning_rate": 1.1272183604520211e-07, + "loss": 0.0013, + "step": 22525 + }, + { + "epoch": 0.44, + "learning_rate": 1.1271795270086597e-07, + "loss": 0.0007, + "step": 22526 + }, + { + "epoch": 0.44, + "learning_rate": 1.1271406935652982e-07, + "loss": 0.003, + "step": 22527 + }, + { + "epoch": 0.44, + "learning_rate": 1.1271018601219368e-07, + "loss": 0.2066, + "step": 22528 + }, + { + "epoch": 0.44, + "learning_rate": 1.1270630266785754e-07, + "loss": 0.0007, + "step": 22529 + }, + { + "epoch": 0.44, + "learning_rate": 1.127024193235214e-07, + "loss": 0.0006, + "step": 22530 + }, + { + "epoch": 0.44, + "learning_rate": 1.1269853597918526e-07, + "loss": 0.0006, + "step": 22531 + }, + { + "epoch": 0.44, + "learning_rate": 1.1269465263484912e-07, + "loss": 0.0007, + "step": 22532 + }, + { + "epoch": 0.44, + "learning_rate": 1.1269076929051297e-07, + "loss": 0.0006, + "step": 22533 + }, + { + "epoch": 0.44, + "learning_rate": 1.1268688594617683e-07, + "loss": 0.0007, + "step": 22534 + }, + { + "epoch": 0.44, + "learning_rate": 1.1268300260184069e-07, + "loss": 0.0011, + "step": 22535 + }, + { + "epoch": 0.44, + "learning_rate": 1.1267911925750455e-07, + "loss": 0.0009, + "step": 22536 + }, + { + "epoch": 0.44, + "learning_rate": 1.126752359131684e-07, + "loss": 0.0027, + "step": 22537 + }, + { + "epoch": 0.44, + "learning_rate": 1.1267135256883226e-07, + "loss": 0.0006, + "step": 22538 + }, + { + "epoch": 0.44, + "learning_rate": 1.1266746922449612e-07, + "loss": 0.0005, + "step": 22539 + }, + { + "epoch": 0.44, + "learning_rate": 1.1266358588015998e-07, + "loss": 0.0023, + "step": 22540 + }, + { + "epoch": 0.44, + "learning_rate": 1.1265970253582384e-07, + "loss": 0.0025, + "step": 22541 + }, + { + "epoch": 0.44, + "learning_rate": 1.126558191914877e-07, + "loss": 0.1731, + "step": 22542 + }, + { + "epoch": 0.44, + "learning_rate": 1.1265193584715156e-07, + "loss": 0.0007, + "step": 22543 + }, + { + "epoch": 0.44, + "learning_rate": 1.1264805250281541e-07, + "loss": 0.0006, + "step": 22544 + }, + { + "epoch": 0.44, + "learning_rate": 1.1264416915847927e-07, + "loss": 0.0005, + "step": 22545 + }, + { + "epoch": 0.44, + "learning_rate": 1.1264028581414313e-07, + "loss": 0.0007, + "step": 22546 + }, + { + "epoch": 0.44, + "learning_rate": 1.1263640246980699e-07, + "loss": 0.3063, + "step": 22547 + }, + { + "epoch": 0.44, + "learning_rate": 1.1263251912547085e-07, + "loss": 0.0015, + "step": 22548 + }, + { + "epoch": 0.44, + "learning_rate": 1.126286357811347e-07, + "loss": 0.0006, + "step": 22549 + }, + { + "epoch": 0.44, + "learning_rate": 1.1262475243679856e-07, + "loss": 0.0006, + "step": 22550 + }, + { + "epoch": 0.44, + "learning_rate": 1.1262086909246242e-07, + "loss": 0.0018, + "step": 22551 + }, + { + "epoch": 0.44, + "learning_rate": 1.1261698574812628e-07, + "loss": 0.0007, + "step": 22552 + }, + { + "epoch": 0.44, + "learning_rate": 1.1261310240379014e-07, + "loss": 0.001, + "step": 22553 + }, + { + "epoch": 0.44, + "learning_rate": 1.12609219059454e-07, + "loss": 0.839, + "step": 22554 + }, + { + "epoch": 0.44, + "learning_rate": 1.1260533571511785e-07, + "loss": 0.0006, + "step": 22555 + }, + { + "epoch": 0.44, + "learning_rate": 1.1260145237078171e-07, + "loss": 0.0006, + "step": 22556 + }, + { + "epoch": 0.44, + "learning_rate": 1.1259756902644557e-07, + "loss": 0.0005, + "step": 22557 + }, + { + "epoch": 0.44, + "learning_rate": 1.1259368568210943e-07, + "loss": 0.0006, + "step": 22558 + }, + { + "epoch": 0.44, + "learning_rate": 1.1258980233777329e-07, + "loss": 0.0008, + "step": 22559 + }, + { + "epoch": 0.44, + "learning_rate": 1.1258591899343715e-07, + "loss": 0.0009, + "step": 22560 + }, + { + "epoch": 0.44, + "learning_rate": 1.12582035649101e-07, + "loss": 0.0008, + "step": 22561 + }, + { + "epoch": 0.44, + "learning_rate": 1.1257815230476486e-07, + "loss": 0.0005, + "step": 22562 + }, + { + "epoch": 0.44, + "learning_rate": 1.1257426896042872e-07, + "loss": 1.0556, + "step": 22563 + }, + { + "epoch": 0.44, + "learning_rate": 1.1257038561609258e-07, + "loss": 0.0008, + "step": 22564 + }, + { + "epoch": 0.44, + "learning_rate": 1.1256650227175644e-07, + "loss": 0.0005, + "step": 22565 + }, + { + "epoch": 0.44, + "learning_rate": 1.125626189274203e-07, + "loss": 0.0007, + "step": 22566 + }, + { + "epoch": 0.44, + "learning_rate": 1.1255873558308415e-07, + "loss": 0.0007, + "step": 22567 + }, + { + "epoch": 0.44, + "learning_rate": 1.1255485223874801e-07, + "loss": 0.0007, + "step": 22568 + }, + { + "epoch": 0.44, + "learning_rate": 1.1255096889441187e-07, + "loss": 0.0007, + "step": 22569 + }, + { + "epoch": 0.44, + "learning_rate": 1.1254708555007573e-07, + "loss": 0.0006, + "step": 22570 + }, + { + "epoch": 0.44, + "learning_rate": 1.1254320220573959e-07, + "loss": 0.0025, + "step": 22571 + }, + { + "epoch": 0.44, + "learning_rate": 1.1253931886140345e-07, + "loss": 0.0006, + "step": 22572 + }, + { + "epoch": 0.44, + "learning_rate": 1.125354355170673e-07, + "loss": 0.0007, + "step": 22573 + }, + { + "epoch": 0.44, + "learning_rate": 1.1253155217273116e-07, + "loss": 0.0088, + "step": 22574 + }, + { + "epoch": 0.44, + "learning_rate": 1.1252766882839502e-07, + "loss": 0.0069, + "step": 22575 + }, + { + "epoch": 0.44, + "learning_rate": 1.1252378548405888e-07, + "loss": 0.0007, + "step": 22576 + }, + { + "epoch": 0.44, + "learning_rate": 1.1251990213972274e-07, + "loss": 1.1636, + "step": 22577 + }, + { + "epoch": 0.44, + "learning_rate": 1.125160187953866e-07, + "loss": 0.0006, + "step": 22578 + }, + { + "epoch": 0.44, + "learning_rate": 1.1251213545105045e-07, + "loss": 0.0004, + "step": 22579 + }, + { + "epoch": 0.44, + "learning_rate": 1.1250825210671431e-07, + "loss": 0.0005, + "step": 22580 + }, + { + "epoch": 0.44, + "learning_rate": 1.1250436876237817e-07, + "loss": 0.0007, + "step": 22581 + }, + { + "epoch": 0.44, + "learning_rate": 1.1250048541804203e-07, + "loss": 0.0012, + "step": 22582 + }, + { + "epoch": 0.44, + "learning_rate": 1.1249660207370586e-07, + "loss": 1.0155, + "step": 22583 + }, + { + "epoch": 0.44, + "learning_rate": 1.1249271872936972e-07, + "loss": 0.2043, + "step": 22584 + }, + { + "epoch": 0.44, + "learning_rate": 1.1248883538503358e-07, + "loss": 0.0006, + "step": 22585 + }, + { + "epoch": 0.44, + "learning_rate": 1.1248495204069743e-07, + "loss": 0.0006, + "step": 22586 + }, + { + "epoch": 0.44, + "learning_rate": 1.1248106869636129e-07, + "loss": 0.0008, + "step": 22587 + }, + { + "epoch": 0.44, + "learning_rate": 1.1247718535202515e-07, + "loss": 0.0007, + "step": 22588 + }, + { + "epoch": 0.44, + "learning_rate": 1.1247330200768901e-07, + "loss": 0.0161, + "step": 22589 + }, + { + "epoch": 0.44, + "learning_rate": 1.1246941866335287e-07, + "loss": 0.1114, + "step": 22590 + }, + { + "epoch": 0.44, + "learning_rate": 1.1246553531901673e-07, + "loss": 0.0006, + "step": 22591 + }, + { + "epoch": 0.44, + "learning_rate": 1.1246165197468058e-07, + "loss": 0.0067, + "step": 22592 + }, + { + "epoch": 0.44, + "learning_rate": 1.1245776863034444e-07, + "loss": 0.0008, + "step": 22593 + }, + { + "epoch": 0.44, + "learning_rate": 1.124538852860083e-07, + "loss": 0.0009, + "step": 22594 + }, + { + "epoch": 0.44, + "learning_rate": 1.1245000194167216e-07, + "loss": 0.0005, + "step": 22595 + }, + { + "epoch": 0.44, + "learning_rate": 1.1244611859733602e-07, + "loss": 0.0007, + "step": 22596 + }, + { + "epoch": 0.44, + "learning_rate": 1.1244223525299987e-07, + "loss": 0.0005, + "step": 22597 + }, + { + "epoch": 0.44, + "learning_rate": 1.1243835190866373e-07, + "loss": 0.0007, + "step": 22598 + }, + { + "epoch": 0.44, + "learning_rate": 1.1243446856432759e-07, + "loss": 0.0021, + "step": 22599 + }, + { + "epoch": 0.44, + "learning_rate": 1.1243058521999145e-07, + "loss": 0.0086, + "step": 22600 + }, + { + "epoch": 0.44, + "learning_rate": 1.1242670187565531e-07, + "loss": 0.0008, + "step": 22601 + }, + { + "epoch": 0.44, + "learning_rate": 1.1242281853131917e-07, + "loss": 0.0351, + "step": 22602 + }, + { + "epoch": 0.44, + "learning_rate": 1.1241893518698302e-07, + "loss": 0.0006, + "step": 22603 + }, + { + "epoch": 0.44, + "learning_rate": 1.1241505184264688e-07, + "loss": 0.0007, + "step": 22604 + }, + { + "epoch": 0.44, + "learning_rate": 1.1241116849831074e-07, + "loss": 0.0196, + "step": 22605 + }, + { + "epoch": 0.44, + "learning_rate": 1.124072851539746e-07, + "loss": 0.0008, + "step": 22606 + }, + { + "epoch": 0.44, + "learning_rate": 1.1240340180963846e-07, + "loss": 0.0006, + "step": 22607 + }, + { + "epoch": 0.44, + "learning_rate": 1.1239951846530232e-07, + "loss": 0.0006, + "step": 22608 + }, + { + "epoch": 0.44, + "learning_rate": 1.1239563512096617e-07, + "loss": 0.0714, + "step": 22609 + }, + { + "epoch": 0.44, + "learning_rate": 1.1239175177663003e-07, + "loss": 0.0016, + "step": 22610 + }, + { + "epoch": 0.44, + "learning_rate": 1.1238786843229389e-07, + "loss": 0.0005, + "step": 22611 + }, + { + "epoch": 0.44, + "learning_rate": 1.1238398508795775e-07, + "loss": 0.0006, + "step": 22612 + }, + { + "epoch": 0.44, + "learning_rate": 1.1238010174362161e-07, + "loss": 0.0762, + "step": 22613 + }, + { + "epoch": 0.44, + "learning_rate": 1.1237621839928546e-07, + "loss": 0.0008, + "step": 22614 + }, + { + "epoch": 0.44, + "learning_rate": 1.1237233505494932e-07, + "loss": 0.0007, + "step": 22615 + }, + { + "epoch": 0.44, + "learning_rate": 1.1236845171061318e-07, + "loss": 0.0006, + "step": 22616 + }, + { + "epoch": 0.44, + "learning_rate": 1.1236456836627704e-07, + "loss": 0.0007, + "step": 22617 + }, + { + "epoch": 0.44, + "learning_rate": 1.123606850219409e-07, + "loss": 0.0006, + "step": 22618 + }, + { + "epoch": 0.44, + "learning_rate": 1.1235680167760476e-07, + "loss": 0.0038, + "step": 22619 + }, + { + "epoch": 0.44, + "learning_rate": 1.1235291833326861e-07, + "loss": 0.0078, + "step": 22620 + }, + { + "epoch": 0.44, + "learning_rate": 1.1234903498893247e-07, + "loss": 0.0007, + "step": 22621 + }, + { + "epoch": 0.44, + "learning_rate": 1.1234515164459633e-07, + "loss": 0.002, + "step": 22622 + }, + { + "epoch": 0.44, + "learning_rate": 1.1234126830026019e-07, + "loss": 0.6947, + "step": 22623 + }, + { + "epoch": 0.44, + "learning_rate": 1.1233738495592405e-07, + "loss": 0.0008, + "step": 22624 + }, + { + "epoch": 0.44, + "learning_rate": 1.123335016115879e-07, + "loss": 0.0285, + "step": 22625 + }, + { + "epoch": 0.44, + "learning_rate": 1.1232961826725176e-07, + "loss": 0.0107, + "step": 22626 + }, + { + "epoch": 0.44, + "learning_rate": 1.1232573492291562e-07, + "loss": 0.0006, + "step": 22627 + }, + { + "epoch": 0.44, + "learning_rate": 1.1232185157857948e-07, + "loss": 0.0007, + "step": 22628 + }, + { + "epoch": 0.44, + "learning_rate": 1.1231796823424334e-07, + "loss": 0.0008, + "step": 22629 + }, + { + "epoch": 0.44, + "learning_rate": 1.123140848899072e-07, + "loss": 0.001, + "step": 22630 + }, + { + "epoch": 0.44, + "learning_rate": 1.1231020154557104e-07, + "loss": 0.0452, + "step": 22631 + }, + { + "epoch": 0.44, + "learning_rate": 1.123063182012349e-07, + "loss": 0.0005, + "step": 22632 + }, + { + "epoch": 0.44, + "learning_rate": 1.1230243485689876e-07, + "loss": 0.4466, + "step": 22633 + }, + { + "epoch": 0.44, + "learning_rate": 1.1229855151256262e-07, + "loss": 0.0006, + "step": 22634 + }, + { + "epoch": 0.44, + "learning_rate": 1.1229466816822647e-07, + "loss": 0.2643, + "step": 22635 + }, + { + "epoch": 0.44, + "learning_rate": 1.1229078482389033e-07, + "loss": 0.0006, + "step": 22636 + }, + { + "epoch": 0.44, + "learning_rate": 1.1228690147955419e-07, + "loss": 0.0019, + "step": 22637 + }, + { + "epoch": 0.44, + "learning_rate": 1.1228301813521805e-07, + "loss": 0.0007, + "step": 22638 + }, + { + "epoch": 0.44, + "learning_rate": 1.1227913479088191e-07, + "loss": 0.0016, + "step": 22639 + }, + { + "epoch": 0.44, + "learning_rate": 1.1227525144654577e-07, + "loss": 0.9716, + "step": 22640 + }, + { + "epoch": 0.44, + "learning_rate": 1.1227136810220961e-07, + "loss": 0.0108, + "step": 22641 + }, + { + "epoch": 0.44, + "learning_rate": 1.1226748475787347e-07, + "loss": 0.0007, + "step": 22642 + }, + { + "epoch": 0.44, + "learning_rate": 1.1226360141353733e-07, + "loss": 0.0006, + "step": 22643 + }, + { + "epoch": 0.44, + "learning_rate": 1.1225971806920119e-07, + "loss": 0.0006, + "step": 22644 + }, + { + "epoch": 0.44, + "learning_rate": 1.1225583472486504e-07, + "loss": 0.0006, + "step": 22645 + }, + { + "epoch": 0.44, + "learning_rate": 1.122519513805289e-07, + "loss": 0.0013, + "step": 22646 + }, + { + "epoch": 0.44, + "learning_rate": 1.1224806803619276e-07, + "loss": 0.6305, + "step": 22647 + }, + { + "epoch": 0.44, + "learning_rate": 1.1224418469185662e-07, + "loss": 0.0007, + "step": 22648 + }, + { + "epoch": 0.44, + "learning_rate": 1.1224030134752048e-07, + "loss": 0.0007, + "step": 22649 + }, + { + "epoch": 0.44, + "learning_rate": 1.1223641800318434e-07, + "loss": 0.0007, + "step": 22650 + }, + { + "epoch": 0.44, + "learning_rate": 1.122325346588482e-07, + "loss": 0.6814, + "step": 22651 + }, + { + "epoch": 0.44, + "learning_rate": 1.1222865131451205e-07, + "loss": 0.0011, + "step": 22652 + }, + { + "epoch": 0.44, + "learning_rate": 1.1222476797017591e-07, + "loss": 0.3065, + "step": 22653 + }, + { + "epoch": 0.44, + "learning_rate": 1.1222088462583977e-07, + "loss": 0.0005, + "step": 22654 + }, + { + "epoch": 0.44, + "learning_rate": 1.1221700128150363e-07, + "loss": 0.0005, + "step": 22655 + }, + { + "epoch": 0.44, + "learning_rate": 1.1221311793716748e-07, + "loss": 0.0007, + "step": 22656 + }, + { + "epoch": 0.44, + "learning_rate": 1.1220923459283134e-07, + "loss": 0.0005, + "step": 22657 + }, + { + "epoch": 0.44, + "learning_rate": 1.122053512484952e-07, + "loss": 0.0008, + "step": 22658 + }, + { + "epoch": 0.44, + "learning_rate": 1.1220146790415906e-07, + "loss": 0.0012, + "step": 22659 + }, + { + "epoch": 0.44, + "learning_rate": 1.121975845598229e-07, + "loss": 0.0007, + "step": 22660 + }, + { + "epoch": 0.44, + "learning_rate": 1.1219370121548676e-07, + "loss": 0.0008, + "step": 22661 + }, + { + "epoch": 0.44, + "learning_rate": 1.1218981787115062e-07, + "loss": 0.0006, + "step": 22662 + }, + { + "epoch": 0.44, + "learning_rate": 1.1218593452681448e-07, + "loss": 0.0008, + "step": 22663 + }, + { + "epoch": 0.44, + "learning_rate": 1.1218205118247834e-07, + "loss": 0.0016, + "step": 22664 + }, + { + "epoch": 0.44, + "learning_rate": 1.121781678381422e-07, + "loss": 0.0006, + "step": 22665 + }, + { + "epoch": 0.44, + "learning_rate": 1.1217428449380605e-07, + "loss": 0.0011, + "step": 22666 + }, + { + "epoch": 0.44, + "learning_rate": 1.1217040114946991e-07, + "loss": 0.2546, + "step": 22667 + }, + { + "epoch": 0.44, + "learning_rate": 1.1216651780513377e-07, + "loss": 0.912, + "step": 22668 + }, + { + "epoch": 0.44, + "learning_rate": 1.1216263446079763e-07, + "loss": 0.0007, + "step": 22669 + }, + { + "epoch": 0.44, + "learning_rate": 1.1215875111646149e-07, + "loss": 0.0006, + "step": 22670 + }, + { + "epoch": 0.44, + "learning_rate": 1.1215486777212535e-07, + "loss": 0.0007, + "step": 22671 + }, + { + "epoch": 0.44, + "learning_rate": 1.121509844277892e-07, + "loss": 0.0005, + "step": 22672 + }, + { + "epoch": 0.44, + "learning_rate": 1.1214710108345306e-07, + "loss": 0.0008, + "step": 22673 + }, + { + "epoch": 0.44, + "learning_rate": 1.1214321773911692e-07, + "loss": 0.0006, + "step": 22674 + }, + { + "epoch": 0.44, + "learning_rate": 1.1213933439478078e-07, + "loss": 0.0007, + "step": 22675 + }, + { + "epoch": 0.44, + "learning_rate": 1.1213545105044464e-07, + "loss": 0.0006, + "step": 22676 + }, + { + "epoch": 0.44, + "learning_rate": 1.121315677061085e-07, + "loss": 0.6265, + "step": 22677 + }, + { + "epoch": 0.44, + "learning_rate": 1.1212768436177235e-07, + "loss": 0.0007, + "step": 22678 + }, + { + "epoch": 0.44, + "learning_rate": 1.1212380101743621e-07, + "loss": 0.0017, + "step": 22679 + }, + { + "epoch": 0.44, + "learning_rate": 1.1211991767310007e-07, + "loss": 0.0276, + "step": 22680 + }, + { + "epoch": 0.44, + "learning_rate": 1.1211603432876393e-07, + "loss": 0.0006, + "step": 22681 + }, + { + "epoch": 0.44, + "learning_rate": 1.1211215098442779e-07, + "loss": 0.001, + "step": 22682 + }, + { + "epoch": 0.44, + "learning_rate": 1.1210826764009164e-07, + "loss": 0.0007, + "step": 22683 + }, + { + "epoch": 0.44, + "learning_rate": 1.121043842957555e-07, + "loss": 0.0007, + "step": 22684 + }, + { + "epoch": 0.44, + "learning_rate": 1.1210050095141936e-07, + "loss": 0.0007, + "step": 22685 + }, + { + "epoch": 0.44, + "learning_rate": 1.1209661760708322e-07, + "loss": 0.001, + "step": 22686 + }, + { + "epoch": 0.44, + "learning_rate": 1.1209273426274708e-07, + "loss": 0.0007, + "step": 22687 + }, + { + "epoch": 0.44, + "learning_rate": 1.1208885091841094e-07, + "loss": 0.0007, + "step": 22688 + }, + { + "epoch": 0.44, + "learning_rate": 1.120849675740748e-07, + "loss": 0.0008, + "step": 22689 + }, + { + "epoch": 0.44, + "learning_rate": 1.1208108422973865e-07, + "loss": 0.0006, + "step": 22690 + }, + { + "epoch": 0.44, + "learning_rate": 1.1207720088540251e-07, + "loss": 0.0006, + "step": 22691 + }, + { + "epoch": 0.44, + "learning_rate": 1.1207331754106637e-07, + "loss": 0.0011, + "step": 22692 + }, + { + "epoch": 0.44, + "learning_rate": 1.1206943419673023e-07, + "loss": 0.0008, + "step": 22693 + }, + { + "epoch": 0.44, + "learning_rate": 1.1206555085239408e-07, + "loss": 0.0009, + "step": 22694 + }, + { + "epoch": 0.44, + "learning_rate": 1.1206166750805794e-07, + "loss": 0.0008, + "step": 22695 + }, + { + "epoch": 0.44, + "learning_rate": 1.120577841637218e-07, + "loss": 0.0005, + "step": 22696 + }, + { + "epoch": 0.44, + "learning_rate": 1.1205390081938566e-07, + "loss": 0.0031, + "step": 22697 + }, + { + "epoch": 0.44, + "learning_rate": 1.1205001747504952e-07, + "loss": 0.0005, + "step": 22698 + }, + { + "epoch": 0.44, + "learning_rate": 1.1204613413071335e-07, + "loss": 0.0008, + "step": 22699 + }, + { + "epoch": 0.44, + "learning_rate": 1.1204225078637721e-07, + "loss": 0.0007, + "step": 22700 + }, + { + "epoch": 0.44, + "learning_rate": 1.1203836744204107e-07, + "loss": 0.0007, + "step": 22701 + }, + { + "epoch": 0.44, + "learning_rate": 1.1203448409770492e-07, + "loss": 0.0013, + "step": 22702 + }, + { + "epoch": 0.44, + "learning_rate": 1.1203060075336878e-07, + "loss": 0.0006, + "step": 22703 + }, + { + "epoch": 0.44, + "learning_rate": 1.1202671740903264e-07, + "loss": 0.0006, + "step": 22704 + }, + { + "epoch": 0.44, + "learning_rate": 1.120228340646965e-07, + "loss": 0.0006, + "step": 22705 + }, + { + "epoch": 0.44, + "learning_rate": 1.1201895072036036e-07, + "loss": 0.0004, + "step": 22706 + }, + { + "epoch": 0.44, + "learning_rate": 1.1201506737602422e-07, + "loss": 0.0012, + "step": 22707 + }, + { + "epoch": 0.44, + "learning_rate": 1.1201118403168807e-07, + "loss": 0.0007, + "step": 22708 + }, + { + "epoch": 0.44, + "learning_rate": 1.1200730068735193e-07, + "loss": 0.0029, + "step": 22709 + }, + { + "epoch": 0.44, + "learning_rate": 1.1200341734301579e-07, + "loss": 0.0082, + "step": 22710 + }, + { + "epoch": 0.44, + "learning_rate": 1.1199953399867965e-07, + "loss": 0.8109, + "step": 22711 + }, + { + "epoch": 0.44, + "learning_rate": 1.1199565065434351e-07, + "loss": 0.1051, + "step": 22712 + }, + { + "epoch": 0.44, + "learning_rate": 1.1199176731000736e-07, + "loss": 0.0007, + "step": 22713 + }, + { + "epoch": 0.44, + "learning_rate": 1.1198788396567122e-07, + "loss": 0.0005, + "step": 22714 + }, + { + "epoch": 0.44, + "learning_rate": 1.1198400062133508e-07, + "loss": 0.0009, + "step": 22715 + }, + { + "epoch": 0.44, + "learning_rate": 1.1198011727699894e-07, + "loss": 0.5249, + "step": 22716 + }, + { + "epoch": 0.44, + "learning_rate": 1.119762339326628e-07, + "loss": 0.001, + "step": 22717 + }, + { + "epoch": 0.44, + "learning_rate": 1.1197235058832666e-07, + "loss": 0.0012, + "step": 22718 + }, + { + "epoch": 0.44, + "learning_rate": 1.1196846724399051e-07, + "loss": 0.0006, + "step": 22719 + }, + { + "epoch": 0.44, + "learning_rate": 1.1196458389965437e-07, + "loss": 0.0034, + "step": 22720 + }, + { + "epoch": 0.44, + "learning_rate": 1.1196070055531823e-07, + "loss": 0.2504, + "step": 22721 + }, + { + "epoch": 0.44, + "learning_rate": 1.1195681721098209e-07, + "loss": 0.0007, + "step": 22722 + }, + { + "epoch": 0.44, + "learning_rate": 1.1195293386664595e-07, + "loss": 0.0006, + "step": 22723 + }, + { + "epoch": 0.44, + "learning_rate": 1.119490505223098e-07, + "loss": 0.0005, + "step": 22724 + }, + { + "epoch": 0.44, + "learning_rate": 1.1194516717797366e-07, + "loss": 0.011, + "step": 22725 + }, + { + "epoch": 0.44, + "learning_rate": 1.1194128383363752e-07, + "loss": 0.0007, + "step": 22726 + }, + { + "epoch": 0.44, + "learning_rate": 1.1193740048930138e-07, + "loss": 0.0007, + "step": 22727 + }, + { + "epoch": 0.44, + "learning_rate": 1.1193351714496524e-07, + "loss": 0.001, + "step": 22728 + }, + { + "epoch": 0.44, + "learning_rate": 1.119296338006291e-07, + "loss": 0.0033, + "step": 22729 + }, + { + "epoch": 0.44, + "learning_rate": 1.1192575045629296e-07, + "loss": 0.0066, + "step": 22730 + }, + { + "epoch": 0.44, + "learning_rate": 1.1192186711195681e-07, + "loss": 0.0005, + "step": 22731 + }, + { + "epoch": 0.44, + "learning_rate": 1.1191798376762067e-07, + "loss": 0.0008, + "step": 22732 + }, + { + "epoch": 0.44, + "learning_rate": 1.1191410042328453e-07, + "loss": 0.0005, + "step": 22733 + }, + { + "epoch": 0.44, + "learning_rate": 1.1191021707894839e-07, + "loss": 0.0007, + "step": 22734 + }, + { + "epoch": 0.44, + "learning_rate": 1.1190633373461225e-07, + "loss": 0.0058, + "step": 22735 + }, + { + "epoch": 0.44, + "learning_rate": 1.119024503902761e-07, + "loss": 0.0005, + "step": 22736 + }, + { + "epoch": 0.44, + "learning_rate": 1.1189856704593996e-07, + "loss": 0.0007, + "step": 22737 + }, + { + "epoch": 0.44, + "learning_rate": 1.1189468370160382e-07, + "loss": 0.6865, + "step": 22738 + }, + { + "epoch": 0.44, + "learning_rate": 1.1189080035726768e-07, + "loss": 0.0149, + "step": 22739 + }, + { + "epoch": 0.44, + "learning_rate": 1.1188691701293154e-07, + "loss": 0.0006, + "step": 22740 + }, + { + "epoch": 0.44, + "learning_rate": 1.118830336685954e-07, + "loss": 0.0006, + "step": 22741 + }, + { + "epoch": 0.44, + "learning_rate": 1.1187915032425925e-07, + "loss": 0.9794, + "step": 22742 + }, + { + "epoch": 0.44, + "learning_rate": 1.1187526697992311e-07, + "loss": 0.0007, + "step": 22743 + }, + { + "epoch": 0.44, + "learning_rate": 1.1187138363558697e-07, + "loss": 0.0011, + "step": 22744 + }, + { + "epoch": 0.44, + "learning_rate": 1.1186750029125083e-07, + "loss": 0.0008, + "step": 22745 + }, + { + "epoch": 0.44, + "learning_rate": 1.1186361694691469e-07, + "loss": 0.0008, + "step": 22746 + }, + { + "epoch": 0.44, + "learning_rate": 1.1185973360257855e-07, + "loss": 0.0008, + "step": 22747 + }, + { + "epoch": 0.44, + "learning_rate": 1.118558502582424e-07, + "loss": 0.0081, + "step": 22748 + }, + { + "epoch": 0.44, + "learning_rate": 1.1185196691390626e-07, + "loss": 0.0011, + "step": 22749 + }, + { + "epoch": 0.44, + "learning_rate": 1.1184808356957012e-07, + "loss": 0.0009, + "step": 22750 + }, + { + "epoch": 0.44, + "learning_rate": 1.1184420022523398e-07, + "loss": 0.0006, + "step": 22751 + }, + { + "epoch": 0.44, + "learning_rate": 1.1184031688089784e-07, + "loss": 0.0004, + "step": 22752 + }, + { + "epoch": 0.44, + "learning_rate": 1.118364335365617e-07, + "loss": 0.0005, + "step": 22753 + }, + { + "epoch": 0.44, + "learning_rate": 1.1183255019222555e-07, + "loss": 0.0017, + "step": 22754 + }, + { + "epoch": 0.44, + "learning_rate": 1.1182866684788941e-07, + "loss": 0.0008, + "step": 22755 + }, + { + "epoch": 0.44, + "learning_rate": 1.1182478350355327e-07, + "loss": 0.0005, + "step": 22756 + }, + { + "epoch": 0.44, + "learning_rate": 1.118209001592171e-07, + "loss": 0.003, + "step": 22757 + }, + { + "epoch": 0.44, + "learning_rate": 1.1181701681488096e-07, + "loss": 0.0006, + "step": 22758 + }, + { + "epoch": 0.44, + "learning_rate": 1.1181313347054482e-07, + "loss": 0.0011, + "step": 22759 + }, + { + "epoch": 0.44, + "learning_rate": 1.1180925012620868e-07, + "loss": 0.0005, + "step": 22760 + }, + { + "epoch": 0.44, + "learning_rate": 1.1180536678187253e-07, + "loss": 0.0006, + "step": 22761 + }, + { + "epoch": 0.44, + "learning_rate": 1.1180148343753639e-07, + "loss": 0.0006, + "step": 22762 + }, + { + "epoch": 0.44, + "learning_rate": 1.1179760009320025e-07, + "loss": 0.0006, + "step": 22763 + }, + { + "epoch": 0.44, + "learning_rate": 1.1179371674886411e-07, + "loss": 0.0008, + "step": 22764 + }, + { + "epoch": 0.44, + "learning_rate": 1.1178983340452797e-07, + "loss": 0.0007, + "step": 22765 + }, + { + "epoch": 0.44, + "learning_rate": 1.1178595006019183e-07, + "loss": 0.6741, + "step": 22766 + }, + { + "epoch": 0.44, + "learning_rate": 1.1178206671585568e-07, + "loss": 0.0498, + "step": 22767 + }, + { + "epoch": 0.44, + "learning_rate": 1.1177818337151954e-07, + "loss": 0.0005, + "step": 22768 + }, + { + "epoch": 0.44, + "learning_rate": 1.117743000271834e-07, + "loss": 0.0006, + "step": 22769 + }, + { + "epoch": 0.44, + "learning_rate": 1.1177041668284726e-07, + "loss": 0.001, + "step": 22770 + }, + { + "epoch": 0.44, + "learning_rate": 1.1176653333851112e-07, + "loss": 0.1345, + "step": 22771 + }, + { + "epoch": 0.44, + "learning_rate": 1.1176264999417497e-07, + "loss": 0.0006, + "step": 22772 + }, + { + "epoch": 0.44, + "learning_rate": 1.1175876664983883e-07, + "loss": 0.0006, + "step": 22773 + }, + { + "epoch": 0.44, + "learning_rate": 1.1175488330550269e-07, + "loss": 0.0005, + "step": 22774 + }, + { + "epoch": 0.44, + "learning_rate": 1.1175099996116655e-07, + "loss": 0.0007, + "step": 22775 + }, + { + "epoch": 0.44, + "learning_rate": 1.1174711661683041e-07, + "loss": 0.4192, + "step": 22776 + }, + { + "epoch": 0.44, + "learning_rate": 1.1174323327249427e-07, + "loss": 0.0077, + "step": 22777 + }, + { + "epoch": 0.44, + "learning_rate": 1.1173934992815812e-07, + "loss": 0.0007, + "step": 22778 + }, + { + "epoch": 0.44, + "learning_rate": 1.1173546658382198e-07, + "loss": 0.0008, + "step": 22779 + }, + { + "epoch": 0.44, + "learning_rate": 1.1173158323948584e-07, + "loss": 0.0007, + "step": 22780 + }, + { + "epoch": 0.44, + "learning_rate": 1.117276998951497e-07, + "loss": 0.0009, + "step": 22781 + }, + { + "epoch": 0.44, + "learning_rate": 1.1172381655081356e-07, + "loss": 0.1742, + "step": 22782 + }, + { + "epoch": 0.44, + "learning_rate": 1.1171993320647742e-07, + "loss": 0.0035, + "step": 22783 + }, + { + "epoch": 0.44, + "learning_rate": 1.1171604986214127e-07, + "loss": 0.0006, + "step": 22784 + }, + { + "epoch": 0.44, + "learning_rate": 1.1171216651780513e-07, + "loss": 0.0007, + "step": 22785 + }, + { + "epoch": 0.44, + "learning_rate": 1.1170828317346899e-07, + "loss": 0.0005, + "step": 22786 + }, + { + "epoch": 0.44, + "learning_rate": 1.1170439982913285e-07, + "loss": 0.0011, + "step": 22787 + }, + { + "epoch": 0.44, + "learning_rate": 1.1170051648479671e-07, + "loss": 0.0008, + "step": 22788 + }, + { + "epoch": 0.44, + "learning_rate": 1.1169663314046056e-07, + "loss": 0.0007, + "step": 22789 + }, + { + "epoch": 0.44, + "learning_rate": 1.1169274979612442e-07, + "loss": 0.0012, + "step": 22790 + }, + { + "epoch": 0.44, + "learning_rate": 1.1168886645178828e-07, + "loss": 0.0008, + "step": 22791 + }, + { + "epoch": 0.44, + "learning_rate": 1.1168498310745214e-07, + "loss": 0.0011, + "step": 22792 + }, + { + "epoch": 0.44, + "learning_rate": 1.11681099763116e-07, + "loss": 0.0006, + "step": 22793 + }, + { + "epoch": 0.44, + "learning_rate": 1.1167721641877986e-07, + "loss": 0.0014, + "step": 22794 + }, + { + "epoch": 0.44, + "learning_rate": 1.1167333307444371e-07, + "loss": 0.7597, + "step": 22795 + }, + { + "epoch": 0.44, + "learning_rate": 1.1166944973010757e-07, + "loss": 0.0005, + "step": 22796 + }, + { + "epoch": 0.44, + "learning_rate": 1.1166556638577143e-07, + "loss": 0.0006, + "step": 22797 + }, + { + "epoch": 0.44, + "learning_rate": 1.1166168304143529e-07, + "loss": 0.0008, + "step": 22798 + }, + { + "epoch": 0.44, + "learning_rate": 1.1165779969709915e-07, + "loss": 0.0008, + "step": 22799 + }, + { + "epoch": 0.44, + "learning_rate": 1.11653916352763e-07, + "loss": 0.0008, + "step": 22800 + }, + { + "epoch": 0.44, + "learning_rate": 1.1165003300842686e-07, + "loss": 0.0007, + "step": 22801 + }, + { + "epoch": 0.44, + "learning_rate": 1.1164614966409072e-07, + "loss": 0.2127, + "step": 22802 + }, + { + "epoch": 0.44, + "learning_rate": 1.1164226631975458e-07, + "loss": 0.0007, + "step": 22803 + }, + { + "epoch": 0.44, + "learning_rate": 1.1163838297541844e-07, + "loss": 0.0004, + "step": 22804 + }, + { + "epoch": 0.44, + "learning_rate": 1.116344996310823e-07, + "loss": 0.0005, + "step": 22805 + }, + { + "epoch": 0.44, + "learning_rate": 1.1163061628674616e-07, + "loss": 0.0019, + "step": 22806 + }, + { + "epoch": 0.44, + "learning_rate": 1.1162673294241001e-07, + "loss": 0.0007, + "step": 22807 + }, + { + "epoch": 0.44, + "learning_rate": 1.1162284959807386e-07, + "loss": 0.0009, + "step": 22808 + }, + { + "epoch": 0.44, + "learning_rate": 1.1161896625373772e-07, + "loss": 0.0007, + "step": 22809 + }, + { + "epoch": 0.44, + "learning_rate": 1.1161508290940157e-07, + "loss": 0.0228, + "step": 22810 + }, + { + "epoch": 0.44, + "learning_rate": 1.1161119956506543e-07, + "loss": 0.0005, + "step": 22811 + }, + { + "epoch": 0.44, + "learning_rate": 1.1160731622072929e-07, + "loss": 0.0006, + "step": 22812 + }, + { + "epoch": 0.44, + "learning_rate": 1.1160343287639315e-07, + "loss": 0.0006, + "step": 22813 + }, + { + "epoch": 0.44, + "learning_rate": 1.1159954953205701e-07, + "loss": 0.0005, + "step": 22814 + }, + { + "epoch": 0.44, + "learning_rate": 1.1159566618772085e-07, + "loss": 0.0007, + "step": 22815 + }, + { + "epoch": 0.44, + "learning_rate": 1.1159178284338471e-07, + "loss": 0.0007, + "step": 22816 + }, + { + "epoch": 0.44, + "learning_rate": 1.1158789949904857e-07, + "loss": 0.6114, + "step": 22817 + }, + { + "epoch": 0.44, + "learning_rate": 1.1158401615471243e-07, + "loss": 0.0005, + "step": 22818 + }, + { + "epoch": 0.44, + "learning_rate": 1.1158013281037629e-07, + "loss": 0.0007, + "step": 22819 + }, + { + "epoch": 0.44, + "learning_rate": 1.1157624946604014e-07, + "loss": 0.0009, + "step": 22820 + }, + { + "epoch": 0.44, + "learning_rate": 1.11572366121704e-07, + "loss": 0.0004, + "step": 22821 + }, + { + "epoch": 0.44, + "learning_rate": 1.1156848277736786e-07, + "loss": 0.0008, + "step": 22822 + }, + { + "epoch": 0.44, + "learning_rate": 1.1156459943303172e-07, + "loss": 0.0021, + "step": 22823 + }, + { + "epoch": 0.44, + "learning_rate": 1.1156071608869558e-07, + "loss": 0.0006, + "step": 22824 + }, + { + "epoch": 0.44, + "learning_rate": 1.1155683274435944e-07, + "loss": 0.0008, + "step": 22825 + }, + { + "epoch": 0.44, + "learning_rate": 1.115529494000233e-07, + "loss": 0.0025, + "step": 22826 + }, + { + "epoch": 0.44, + "learning_rate": 1.1154906605568715e-07, + "loss": 0.0005, + "step": 22827 + }, + { + "epoch": 0.44, + "learning_rate": 1.1154518271135101e-07, + "loss": 0.0018, + "step": 22828 + }, + { + "epoch": 0.44, + "learning_rate": 1.1154129936701487e-07, + "loss": 0.0009, + "step": 22829 + }, + { + "epoch": 0.44, + "learning_rate": 1.1153741602267873e-07, + "loss": 0.0006, + "step": 22830 + }, + { + "epoch": 0.44, + "learning_rate": 1.1153353267834258e-07, + "loss": 0.0006, + "step": 22831 + }, + { + "epoch": 0.44, + "learning_rate": 1.1152964933400644e-07, + "loss": 0.0007, + "step": 22832 + }, + { + "epoch": 0.44, + "learning_rate": 1.115257659896703e-07, + "loss": 0.0008, + "step": 22833 + }, + { + "epoch": 0.44, + "learning_rate": 1.1152188264533416e-07, + "loss": 0.0006, + "step": 22834 + }, + { + "epoch": 0.44, + "learning_rate": 1.1151799930099802e-07, + "loss": 0.6988, + "step": 22835 + }, + { + "epoch": 0.44, + "learning_rate": 1.1151411595666188e-07, + "loss": 0.0007, + "step": 22836 + }, + { + "epoch": 0.44, + "learning_rate": 1.1151023261232572e-07, + "loss": 0.0004, + "step": 22837 + }, + { + "epoch": 0.44, + "learning_rate": 1.1150634926798958e-07, + "loss": 0.0005, + "step": 22838 + }, + { + "epoch": 0.44, + "learning_rate": 1.1150246592365344e-07, + "loss": 0.0006, + "step": 22839 + }, + { + "epoch": 0.44, + "learning_rate": 1.114985825793173e-07, + "loss": 0.0009, + "step": 22840 + }, + { + "epoch": 0.44, + "learning_rate": 1.1149469923498115e-07, + "loss": 0.0016, + "step": 22841 + }, + { + "epoch": 0.44, + "learning_rate": 1.1149081589064501e-07, + "loss": 0.0011, + "step": 22842 + }, + { + "epoch": 0.44, + "learning_rate": 1.1148693254630887e-07, + "loss": 0.0044, + "step": 22843 + }, + { + "epoch": 0.44, + "learning_rate": 1.1148304920197273e-07, + "loss": 0.0007, + "step": 22844 + }, + { + "epoch": 0.44, + "learning_rate": 1.1147916585763659e-07, + "loss": 0.0005, + "step": 22845 + }, + { + "epoch": 0.44, + "learning_rate": 1.1147528251330045e-07, + "loss": 0.001, + "step": 22846 + }, + { + "epoch": 0.44, + "learning_rate": 1.114713991689643e-07, + "loss": 0.0006, + "step": 22847 + }, + { + "epoch": 0.44, + "learning_rate": 1.1146751582462816e-07, + "loss": 0.0008, + "step": 22848 + }, + { + "epoch": 0.44, + "learning_rate": 1.1146363248029202e-07, + "loss": 0.0006, + "step": 22849 + }, + { + "epoch": 0.44, + "learning_rate": 1.1145974913595588e-07, + "loss": 0.0935, + "step": 22850 + }, + { + "epoch": 0.44, + "learning_rate": 1.1145586579161974e-07, + "loss": 0.001, + "step": 22851 + }, + { + "epoch": 0.44, + "learning_rate": 1.114519824472836e-07, + "loss": 0.0006, + "step": 22852 + }, + { + "epoch": 0.44, + "learning_rate": 1.1144809910294745e-07, + "loss": 0.001, + "step": 22853 + }, + { + "epoch": 0.44, + "learning_rate": 1.1144421575861131e-07, + "loss": 0.0008, + "step": 22854 + }, + { + "epoch": 0.44, + "learning_rate": 1.1144033241427517e-07, + "loss": 0.3898, + "step": 22855 + }, + { + "epoch": 0.44, + "learning_rate": 1.1143644906993903e-07, + "loss": 0.0143, + "step": 22856 + }, + { + "epoch": 0.44, + "learning_rate": 1.1143256572560289e-07, + "loss": 0.0012, + "step": 22857 + }, + { + "epoch": 0.44, + "learning_rate": 1.1142868238126674e-07, + "loss": 0.0006, + "step": 22858 + }, + { + "epoch": 0.44, + "learning_rate": 1.114247990369306e-07, + "loss": 0.0006, + "step": 22859 + }, + { + "epoch": 0.44, + "learning_rate": 1.1142091569259446e-07, + "loss": 0.0819, + "step": 22860 + }, + { + "epoch": 0.44, + "learning_rate": 1.1141703234825832e-07, + "loss": 0.0006, + "step": 22861 + }, + { + "epoch": 0.44, + "learning_rate": 1.1141314900392218e-07, + "loss": 0.2729, + "step": 22862 + }, + { + "epoch": 0.44, + "learning_rate": 1.1140926565958604e-07, + "loss": 0.0006, + "step": 22863 + }, + { + "epoch": 0.44, + "learning_rate": 1.114053823152499e-07, + "loss": 0.0006, + "step": 22864 + }, + { + "epoch": 0.44, + "learning_rate": 1.1140149897091375e-07, + "loss": 0.0006, + "step": 22865 + }, + { + "epoch": 0.44, + "learning_rate": 1.1139761562657761e-07, + "loss": 0.0005, + "step": 22866 + }, + { + "epoch": 0.44, + "learning_rate": 1.1139373228224147e-07, + "loss": 0.0008, + "step": 22867 + }, + { + "epoch": 0.44, + "learning_rate": 1.1138984893790533e-07, + "loss": 0.6193, + "step": 22868 + }, + { + "epoch": 0.44, + "learning_rate": 1.1138596559356918e-07, + "loss": 0.0022, + "step": 22869 + }, + { + "epoch": 0.44, + "learning_rate": 1.1138208224923304e-07, + "loss": 0.0024, + "step": 22870 + }, + { + "epoch": 0.44, + "learning_rate": 1.113781989048969e-07, + "loss": 0.0008, + "step": 22871 + }, + { + "epoch": 0.44, + "learning_rate": 1.1137431556056076e-07, + "loss": 0.0005, + "step": 22872 + }, + { + "epoch": 0.44, + "learning_rate": 1.1137043221622459e-07, + "loss": 0.0179, + "step": 22873 + }, + { + "epoch": 0.44, + "learning_rate": 1.1136654887188845e-07, + "loss": 0.0009, + "step": 22874 + }, + { + "epoch": 0.44, + "learning_rate": 1.1136266552755231e-07, + "loss": 0.0007, + "step": 22875 + }, + { + "epoch": 0.44, + "learning_rate": 1.1135878218321617e-07, + "loss": 0.0086, + "step": 22876 + }, + { + "epoch": 0.44, + "learning_rate": 1.1135489883888002e-07, + "loss": 0.0007, + "step": 22877 + }, + { + "epoch": 0.44, + "learning_rate": 1.1135101549454388e-07, + "loss": 0.0008, + "step": 22878 + }, + { + "epoch": 0.44, + "learning_rate": 1.1134713215020774e-07, + "loss": 0.0005, + "step": 22879 + }, + { + "epoch": 0.44, + "learning_rate": 1.113432488058716e-07, + "loss": 1.3063, + "step": 22880 + }, + { + "epoch": 0.44, + "learning_rate": 1.1133936546153546e-07, + "loss": 0.0006, + "step": 22881 + }, + { + "epoch": 0.44, + "learning_rate": 1.1133548211719932e-07, + "loss": 0.0005, + "step": 22882 + }, + { + "epoch": 0.44, + "learning_rate": 1.1133159877286317e-07, + "loss": 0.0009, + "step": 22883 + }, + { + "epoch": 0.44, + "learning_rate": 1.1132771542852703e-07, + "loss": 0.0034, + "step": 22884 + }, + { + "epoch": 0.44, + "learning_rate": 1.1132383208419089e-07, + "loss": 0.6972, + "step": 22885 + }, + { + "epoch": 0.44, + "learning_rate": 1.1131994873985475e-07, + "loss": 0.0007, + "step": 22886 + }, + { + "epoch": 0.44, + "learning_rate": 1.1131606539551861e-07, + "loss": 0.0005, + "step": 22887 + }, + { + "epoch": 0.44, + "learning_rate": 1.1131218205118246e-07, + "loss": 0.0043, + "step": 22888 + }, + { + "epoch": 0.44, + "learning_rate": 1.1130829870684632e-07, + "loss": 0.0048, + "step": 22889 + }, + { + "epoch": 0.44, + "learning_rate": 1.1130441536251018e-07, + "loss": 0.0006, + "step": 22890 + }, + { + "epoch": 0.44, + "learning_rate": 1.1130053201817404e-07, + "loss": 0.0004, + "step": 22891 + }, + { + "epoch": 0.44, + "learning_rate": 1.112966486738379e-07, + "loss": 0.0008, + "step": 22892 + }, + { + "epoch": 0.44, + "learning_rate": 1.1129276532950176e-07, + "loss": 0.0006, + "step": 22893 + }, + { + "epoch": 0.44, + "learning_rate": 1.1128888198516561e-07, + "loss": 0.0013, + "step": 22894 + }, + { + "epoch": 0.44, + "learning_rate": 1.1128499864082947e-07, + "loss": 0.0006, + "step": 22895 + }, + { + "epoch": 0.44, + "learning_rate": 1.1128111529649333e-07, + "loss": 0.0084, + "step": 22896 + }, + { + "epoch": 0.44, + "learning_rate": 1.1127723195215719e-07, + "loss": 0.0006, + "step": 22897 + }, + { + "epoch": 0.44, + "learning_rate": 1.1127334860782105e-07, + "loss": 0.1078, + "step": 22898 + }, + { + "epoch": 0.44, + "learning_rate": 1.112694652634849e-07, + "loss": 0.0006, + "step": 22899 + }, + { + "epoch": 0.44, + "learning_rate": 1.1126558191914876e-07, + "loss": 0.0007, + "step": 22900 + }, + { + "epoch": 0.44, + "learning_rate": 1.1126169857481262e-07, + "loss": 0.0019, + "step": 22901 + }, + { + "epoch": 0.44, + "learning_rate": 1.1125781523047648e-07, + "loss": 0.0017, + "step": 22902 + }, + { + "epoch": 0.44, + "learning_rate": 1.1125393188614034e-07, + "loss": 0.0006, + "step": 22903 + }, + { + "epoch": 0.44, + "learning_rate": 1.112500485418042e-07, + "loss": 0.0015, + "step": 22904 + }, + { + "epoch": 0.44, + "learning_rate": 1.1124616519746806e-07, + "loss": 0.0008, + "step": 22905 + }, + { + "epoch": 0.44, + "learning_rate": 1.1124228185313191e-07, + "loss": 0.0004, + "step": 22906 + }, + { + "epoch": 0.44, + "learning_rate": 1.1123839850879577e-07, + "loss": 0.0233, + "step": 22907 + }, + { + "epoch": 0.44, + "learning_rate": 1.1123451516445963e-07, + "loss": 0.7135, + "step": 22908 + }, + { + "epoch": 0.44, + "learning_rate": 1.1123063182012349e-07, + "loss": 0.0005, + "step": 22909 + }, + { + "epoch": 0.44, + "learning_rate": 1.1122674847578735e-07, + "loss": 0.0007, + "step": 22910 + }, + { + "epoch": 0.44, + "learning_rate": 1.112228651314512e-07, + "loss": 0.9704, + "step": 22911 + }, + { + "epoch": 0.44, + "learning_rate": 1.1121898178711506e-07, + "loss": 0.0005, + "step": 22912 + }, + { + "epoch": 0.44, + "learning_rate": 1.1121509844277892e-07, + "loss": 0.0005, + "step": 22913 + }, + { + "epoch": 0.44, + "learning_rate": 1.1121121509844278e-07, + "loss": 0.0013, + "step": 22914 + }, + { + "epoch": 0.44, + "learning_rate": 1.1120733175410664e-07, + "loss": 0.1807, + "step": 22915 + }, + { + "epoch": 0.44, + "learning_rate": 1.112034484097705e-07, + "loss": 0.0009, + "step": 22916 + }, + { + "epoch": 0.44, + "learning_rate": 1.1119956506543435e-07, + "loss": 0.0006, + "step": 22917 + }, + { + "epoch": 0.44, + "learning_rate": 1.1119568172109821e-07, + "loss": 0.0006, + "step": 22918 + }, + { + "epoch": 0.44, + "learning_rate": 1.1119179837676207e-07, + "loss": 0.0011, + "step": 22919 + }, + { + "epoch": 0.44, + "learning_rate": 1.1118791503242593e-07, + "loss": 0.0004, + "step": 22920 + }, + { + "epoch": 0.44, + "learning_rate": 1.1118403168808979e-07, + "loss": 0.0009, + "step": 22921 + }, + { + "epoch": 0.44, + "learning_rate": 1.1118014834375365e-07, + "loss": 0.0009, + "step": 22922 + }, + { + "epoch": 0.44, + "learning_rate": 1.111762649994175e-07, + "loss": 0.0008, + "step": 22923 + }, + { + "epoch": 0.44, + "learning_rate": 1.1117238165508136e-07, + "loss": 0.1821, + "step": 22924 + }, + { + "epoch": 0.44, + "learning_rate": 1.1116849831074522e-07, + "loss": 0.0055, + "step": 22925 + }, + { + "epoch": 0.44, + "learning_rate": 1.1116461496640908e-07, + "loss": 0.6221, + "step": 22926 + }, + { + "epoch": 0.44, + "learning_rate": 1.1116073162207294e-07, + "loss": 0.0006, + "step": 22927 + }, + { + "epoch": 0.44, + "learning_rate": 1.111568482777368e-07, + "loss": 0.5946, + "step": 22928 + }, + { + "epoch": 0.44, + "learning_rate": 1.1115296493340065e-07, + "loss": 0.0008, + "step": 22929 + }, + { + "epoch": 0.44, + "learning_rate": 1.1114908158906451e-07, + "loss": 0.0146, + "step": 22930 + }, + { + "epoch": 0.44, + "learning_rate": 1.1114519824472834e-07, + "loss": 0.0008, + "step": 22931 + }, + { + "epoch": 0.44, + "learning_rate": 1.111413149003922e-07, + "loss": 0.0006, + "step": 22932 + }, + { + "epoch": 0.44, + "learning_rate": 1.1113743155605606e-07, + "loss": 0.0011, + "step": 22933 + }, + { + "epoch": 0.44, + "learning_rate": 1.1113354821171992e-07, + "loss": 0.0006, + "step": 22934 + }, + { + "epoch": 0.44, + "learning_rate": 1.1112966486738378e-07, + "loss": 0.0005, + "step": 22935 + }, + { + "epoch": 0.44, + "learning_rate": 1.1112578152304763e-07, + "loss": 0.0008, + "step": 22936 + }, + { + "epoch": 0.44, + "learning_rate": 1.1112189817871149e-07, + "loss": 0.0006, + "step": 22937 + }, + { + "epoch": 0.44, + "learning_rate": 1.1111801483437535e-07, + "loss": 0.0007, + "step": 22938 + }, + { + "epoch": 0.44, + "learning_rate": 1.1111413149003921e-07, + "loss": 0.0006, + "step": 22939 + }, + { + "epoch": 0.44, + "learning_rate": 1.1111024814570307e-07, + "loss": 0.0007, + "step": 22940 + }, + { + "epoch": 0.45, + "learning_rate": 1.1110636480136693e-07, + "loss": 0.0006, + "step": 22941 + }, + { + "epoch": 0.45, + "learning_rate": 1.1110248145703078e-07, + "loss": 0.0004, + "step": 22942 + }, + { + "epoch": 0.45, + "learning_rate": 1.1109859811269464e-07, + "loss": 0.0007, + "step": 22943 + }, + { + "epoch": 0.45, + "learning_rate": 1.110947147683585e-07, + "loss": 0.0005, + "step": 22944 + }, + { + "epoch": 0.45, + "learning_rate": 1.1109083142402236e-07, + "loss": 0.001, + "step": 22945 + }, + { + "epoch": 0.45, + "learning_rate": 1.1108694807968622e-07, + "loss": 0.2089, + "step": 22946 + }, + { + "epoch": 0.45, + "learning_rate": 1.1108306473535007e-07, + "loss": 0.0007, + "step": 22947 + }, + { + "epoch": 0.45, + "learning_rate": 1.1107918139101393e-07, + "loss": 0.0008, + "step": 22948 + }, + { + "epoch": 0.45, + "learning_rate": 1.1107529804667779e-07, + "loss": 0.0012, + "step": 22949 + }, + { + "epoch": 0.45, + "learning_rate": 1.1107141470234165e-07, + "loss": 0.0006, + "step": 22950 + }, + { + "epoch": 0.45, + "learning_rate": 1.1106753135800551e-07, + "loss": 0.0014, + "step": 22951 + }, + { + "epoch": 0.45, + "learning_rate": 1.1106364801366937e-07, + "loss": 0.0007, + "step": 22952 + }, + { + "epoch": 0.45, + "learning_rate": 1.1105976466933322e-07, + "loss": 0.0008, + "step": 22953 + }, + { + "epoch": 0.45, + "learning_rate": 1.1105588132499708e-07, + "loss": 0.0005, + "step": 22954 + }, + { + "epoch": 0.45, + "learning_rate": 1.1105199798066094e-07, + "loss": 0.0008, + "step": 22955 + }, + { + "epoch": 0.45, + "learning_rate": 1.110481146363248e-07, + "loss": 0.0006, + "step": 22956 + }, + { + "epoch": 0.45, + "learning_rate": 1.1104423129198866e-07, + "loss": 0.0009, + "step": 22957 + }, + { + "epoch": 0.45, + "learning_rate": 1.1104034794765252e-07, + "loss": 0.0007, + "step": 22958 + }, + { + "epoch": 0.45, + "learning_rate": 1.1103646460331637e-07, + "loss": 0.6839, + "step": 22959 + }, + { + "epoch": 0.45, + "learning_rate": 1.1103258125898023e-07, + "loss": 0.0004, + "step": 22960 + }, + { + "epoch": 0.45, + "learning_rate": 1.1102869791464409e-07, + "loss": 0.0007, + "step": 22961 + }, + { + "epoch": 0.45, + "learning_rate": 1.1102481457030795e-07, + "loss": 0.0005, + "step": 22962 + }, + { + "epoch": 0.45, + "learning_rate": 1.1102093122597181e-07, + "loss": 0.0006, + "step": 22963 + }, + { + "epoch": 0.45, + "learning_rate": 1.1101704788163567e-07, + "loss": 0.0006, + "step": 22964 + }, + { + "epoch": 0.45, + "learning_rate": 1.1101316453729952e-07, + "loss": 0.0005, + "step": 22965 + }, + { + "epoch": 0.45, + "learning_rate": 1.1100928119296338e-07, + "loss": 0.0007, + "step": 22966 + }, + { + "epoch": 0.45, + "learning_rate": 1.1100539784862724e-07, + "loss": 0.0559, + "step": 22967 + }, + { + "epoch": 0.45, + "learning_rate": 1.110015145042911e-07, + "loss": 0.5746, + "step": 22968 + }, + { + "epoch": 0.45, + "learning_rate": 1.1099763115995496e-07, + "loss": 0.0008, + "step": 22969 + }, + { + "epoch": 0.45, + "learning_rate": 1.1099374781561881e-07, + "loss": 0.0009, + "step": 22970 + }, + { + "epoch": 0.45, + "learning_rate": 1.1098986447128267e-07, + "loss": 0.0008, + "step": 22971 + }, + { + "epoch": 0.45, + "learning_rate": 1.1098598112694653e-07, + "loss": 0.0007, + "step": 22972 + }, + { + "epoch": 0.45, + "learning_rate": 1.1098209778261039e-07, + "loss": 0.0006, + "step": 22973 + }, + { + "epoch": 0.45, + "learning_rate": 1.1097821443827425e-07, + "loss": 0.0006, + "step": 22974 + }, + { + "epoch": 0.45, + "learning_rate": 1.109743310939381e-07, + "loss": 0.0006, + "step": 22975 + }, + { + "epoch": 0.45, + "learning_rate": 1.1097044774960196e-07, + "loss": 0.0006, + "step": 22976 + }, + { + "epoch": 0.45, + "learning_rate": 1.1096656440526582e-07, + "loss": 0.0006, + "step": 22977 + }, + { + "epoch": 0.45, + "learning_rate": 1.1096268106092968e-07, + "loss": 0.001, + "step": 22978 + }, + { + "epoch": 0.45, + "learning_rate": 1.1095879771659354e-07, + "loss": 0.4485, + "step": 22979 + }, + { + "epoch": 0.45, + "learning_rate": 1.109549143722574e-07, + "loss": 0.1626, + "step": 22980 + }, + { + "epoch": 0.45, + "learning_rate": 1.1095103102792126e-07, + "loss": 0.0008, + "step": 22981 + }, + { + "epoch": 0.45, + "learning_rate": 1.1094714768358511e-07, + "loss": 0.0011, + "step": 22982 + }, + { + "epoch": 0.45, + "learning_rate": 1.1094326433924897e-07, + "loss": 0.0007, + "step": 22983 + }, + { + "epoch": 0.45, + "learning_rate": 1.1093938099491283e-07, + "loss": 0.0006, + "step": 22984 + }, + { + "epoch": 0.45, + "learning_rate": 1.1093549765057667e-07, + "loss": 0.0008, + "step": 22985 + }, + { + "epoch": 0.45, + "learning_rate": 1.1093161430624053e-07, + "loss": 0.0473, + "step": 22986 + }, + { + "epoch": 0.45, + "learning_rate": 1.1092773096190439e-07, + "loss": 0.0007, + "step": 22987 + }, + { + "epoch": 0.45, + "learning_rate": 1.1092384761756825e-07, + "loss": 0.0005, + "step": 22988 + }, + { + "epoch": 0.45, + "learning_rate": 1.109199642732321e-07, + "loss": 0.0005, + "step": 22989 + }, + { + "epoch": 0.45, + "learning_rate": 1.1091608092889595e-07, + "loss": 0.1587, + "step": 22990 + }, + { + "epoch": 0.45, + "learning_rate": 1.1091219758455981e-07, + "loss": 0.0007, + "step": 22991 + }, + { + "epoch": 0.45, + "learning_rate": 1.1090831424022367e-07, + "loss": 0.0009, + "step": 22992 + }, + { + "epoch": 0.45, + "learning_rate": 1.1090443089588753e-07, + "loss": 0.0006, + "step": 22993 + }, + { + "epoch": 0.45, + "learning_rate": 1.1090054755155139e-07, + "loss": 0.1156, + "step": 22994 + }, + { + "epoch": 0.45, + "learning_rate": 1.1089666420721524e-07, + "loss": 0.0007, + "step": 22995 + }, + { + "epoch": 0.45, + "learning_rate": 1.108927808628791e-07, + "loss": 0.0009, + "step": 22996 + }, + { + "epoch": 0.45, + "learning_rate": 1.1088889751854296e-07, + "loss": 0.0007, + "step": 22997 + }, + { + "epoch": 0.45, + "learning_rate": 1.1088501417420682e-07, + "loss": 0.0005, + "step": 22998 + }, + { + "epoch": 0.45, + "learning_rate": 1.1088113082987068e-07, + "loss": 0.0008, + "step": 22999 + }, + { + "epoch": 0.45, + "learning_rate": 1.1087724748553454e-07, + "loss": 0.0007, + "step": 23000 + }, + { + "epoch": 0.45, + "learning_rate": 1.108733641411984e-07, + "loss": 0.0041, + "step": 23001 + }, + { + "epoch": 0.45, + "learning_rate": 1.1086948079686225e-07, + "loss": 0.0031, + "step": 23002 + }, + { + "epoch": 0.45, + "learning_rate": 1.1086559745252611e-07, + "loss": 0.0006, + "step": 23003 + }, + { + "epoch": 0.45, + "learning_rate": 1.1086171410818997e-07, + "loss": 1.2056, + "step": 23004 + }, + { + "epoch": 0.45, + "learning_rate": 1.1085783076385383e-07, + "loss": 0.0007, + "step": 23005 + }, + { + "epoch": 0.45, + "learning_rate": 1.1085394741951768e-07, + "loss": 0.0006, + "step": 23006 + }, + { + "epoch": 0.45, + "learning_rate": 1.1085006407518154e-07, + "loss": 0.0006, + "step": 23007 + }, + { + "epoch": 0.45, + "learning_rate": 1.108461807308454e-07, + "loss": 0.0007, + "step": 23008 + }, + { + "epoch": 0.45, + "learning_rate": 1.1084229738650926e-07, + "loss": 0.0011, + "step": 23009 + }, + { + "epoch": 0.45, + "learning_rate": 1.1083841404217312e-07, + "loss": 0.0676, + "step": 23010 + }, + { + "epoch": 0.45, + "learning_rate": 1.1083453069783698e-07, + "loss": 0.5612, + "step": 23011 + }, + { + "epoch": 0.45, + "learning_rate": 1.1083064735350083e-07, + "loss": 0.0007, + "step": 23012 + }, + { + "epoch": 0.45, + "learning_rate": 1.1082676400916469e-07, + "loss": 0.7419, + "step": 23013 + }, + { + "epoch": 0.45, + "learning_rate": 1.1082288066482854e-07, + "loss": 0.0068, + "step": 23014 + }, + { + "epoch": 0.45, + "learning_rate": 1.108189973204924e-07, + "loss": 0.0008, + "step": 23015 + }, + { + "epoch": 0.45, + "learning_rate": 1.1081511397615625e-07, + "loss": 0.0007, + "step": 23016 + }, + { + "epoch": 0.45, + "learning_rate": 1.1081123063182011e-07, + "loss": 0.0006, + "step": 23017 + }, + { + "epoch": 0.45, + "learning_rate": 1.1080734728748397e-07, + "loss": 0.405, + "step": 23018 + }, + { + "epoch": 0.45, + "learning_rate": 1.1080346394314783e-07, + "loss": 0.0007, + "step": 23019 + }, + { + "epoch": 0.45, + "learning_rate": 1.1079958059881169e-07, + "loss": 0.001, + "step": 23020 + }, + { + "epoch": 0.45, + "learning_rate": 1.1079569725447555e-07, + "loss": 0.0006, + "step": 23021 + }, + { + "epoch": 0.45, + "learning_rate": 1.107918139101394e-07, + "loss": 0.0006, + "step": 23022 + }, + { + "epoch": 0.45, + "learning_rate": 1.1078793056580326e-07, + "loss": 0.0007, + "step": 23023 + }, + { + "epoch": 0.45, + "learning_rate": 1.1078404722146712e-07, + "loss": 0.0006, + "step": 23024 + }, + { + "epoch": 0.45, + "learning_rate": 1.1078016387713098e-07, + "loss": 0.0005, + "step": 23025 + }, + { + "epoch": 0.45, + "learning_rate": 1.1077628053279484e-07, + "loss": 0.0009, + "step": 23026 + }, + { + "epoch": 0.45, + "learning_rate": 1.107723971884587e-07, + "loss": 0.0005, + "step": 23027 + }, + { + "epoch": 0.45, + "learning_rate": 1.1076851384412255e-07, + "loss": 0.0009, + "step": 23028 + }, + { + "epoch": 0.45, + "learning_rate": 1.1076463049978641e-07, + "loss": 0.5151, + "step": 23029 + }, + { + "epoch": 0.45, + "learning_rate": 1.1076074715545027e-07, + "loss": 0.0005, + "step": 23030 + }, + { + "epoch": 0.45, + "learning_rate": 1.1075686381111413e-07, + "loss": 0.071, + "step": 23031 + }, + { + "epoch": 0.45, + "learning_rate": 1.1075298046677799e-07, + "loss": 0.3008, + "step": 23032 + }, + { + "epoch": 0.45, + "learning_rate": 1.1074909712244184e-07, + "loss": 0.0007, + "step": 23033 + }, + { + "epoch": 0.45, + "learning_rate": 1.107452137781057e-07, + "loss": 0.0006, + "step": 23034 + }, + { + "epoch": 0.45, + "learning_rate": 1.1074133043376956e-07, + "loss": 0.0006, + "step": 23035 + }, + { + "epoch": 0.45, + "learning_rate": 1.1073744708943342e-07, + "loss": 0.0005, + "step": 23036 + }, + { + "epoch": 0.45, + "learning_rate": 1.1073356374509728e-07, + "loss": 0.0011, + "step": 23037 + }, + { + "epoch": 0.45, + "learning_rate": 1.1072968040076114e-07, + "loss": 0.0008, + "step": 23038 + }, + { + "epoch": 0.45, + "learning_rate": 1.10725797056425e-07, + "loss": 0.0011, + "step": 23039 + }, + { + "epoch": 0.45, + "learning_rate": 1.1072191371208885e-07, + "loss": 0.1873, + "step": 23040 + }, + { + "epoch": 0.45, + "learning_rate": 1.1071803036775271e-07, + "loss": 0.007, + "step": 23041 + }, + { + "epoch": 0.45, + "learning_rate": 1.1071414702341657e-07, + "loss": 0.0007, + "step": 23042 + }, + { + "epoch": 0.45, + "learning_rate": 1.1071026367908043e-07, + "loss": 0.016, + "step": 23043 + }, + { + "epoch": 0.45, + "learning_rate": 1.1070638033474428e-07, + "loss": 0.0008, + "step": 23044 + }, + { + "epoch": 0.45, + "learning_rate": 1.1070249699040814e-07, + "loss": 0.0053, + "step": 23045 + }, + { + "epoch": 0.45, + "learning_rate": 1.10698613646072e-07, + "loss": 0.0017, + "step": 23046 + }, + { + "epoch": 0.45, + "learning_rate": 1.1069473030173583e-07, + "loss": 0.0005, + "step": 23047 + }, + { + "epoch": 0.45, + "learning_rate": 1.1069084695739969e-07, + "loss": 0.0006, + "step": 23048 + }, + { + "epoch": 0.45, + "learning_rate": 1.1068696361306355e-07, + "loss": 0.0014, + "step": 23049 + }, + { + "epoch": 0.45, + "learning_rate": 1.1068308026872741e-07, + "loss": 0.0174, + "step": 23050 + }, + { + "epoch": 0.45, + "learning_rate": 1.1067919692439127e-07, + "loss": 1.0049, + "step": 23051 + }, + { + "epoch": 0.45, + "learning_rate": 1.1067531358005512e-07, + "loss": 0.0006, + "step": 23052 + }, + { + "epoch": 0.45, + "learning_rate": 1.1067143023571898e-07, + "loss": 0.0006, + "step": 23053 + }, + { + "epoch": 0.45, + "learning_rate": 1.1066754689138284e-07, + "loss": 0.3278, + "step": 23054 + }, + { + "epoch": 0.45, + "learning_rate": 1.106636635470467e-07, + "loss": 0.001, + "step": 23055 + }, + { + "epoch": 0.45, + "learning_rate": 1.1065978020271056e-07, + "loss": 0.0006, + "step": 23056 + }, + { + "epoch": 0.45, + "learning_rate": 1.1065589685837442e-07, + "loss": 0.0072, + "step": 23057 + }, + { + "epoch": 0.45, + "learning_rate": 1.1065201351403827e-07, + "loss": 0.1557, + "step": 23058 + }, + { + "epoch": 0.45, + "learning_rate": 1.1064813016970213e-07, + "loss": 0.0005, + "step": 23059 + }, + { + "epoch": 0.45, + "learning_rate": 1.1064424682536599e-07, + "loss": 0.0012, + "step": 23060 + }, + { + "epoch": 0.45, + "learning_rate": 1.1064036348102985e-07, + "loss": 0.0006, + "step": 23061 + }, + { + "epoch": 0.45, + "learning_rate": 1.1063648013669371e-07, + "loss": 0.0006, + "step": 23062 + }, + { + "epoch": 0.45, + "learning_rate": 1.1063259679235757e-07, + "loss": 0.0005, + "step": 23063 + }, + { + "epoch": 0.45, + "learning_rate": 1.1062871344802142e-07, + "loss": 0.0342, + "step": 23064 + }, + { + "epoch": 0.45, + "learning_rate": 1.1062483010368528e-07, + "loss": 0.0005, + "step": 23065 + }, + { + "epoch": 0.45, + "learning_rate": 1.1062094675934914e-07, + "loss": 0.0005, + "step": 23066 + }, + { + "epoch": 0.45, + "learning_rate": 1.10617063415013e-07, + "loss": 0.0005, + "step": 23067 + }, + { + "epoch": 0.45, + "learning_rate": 1.1061318007067686e-07, + "loss": 0.0012, + "step": 23068 + }, + { + "epoch": 0.45, + "learning_rate": 1.1060929672634071e-07, + "loss": 0.0007, + "step": 23069 + }, + { + "epoch": 0.45, + "learning_rate": 1.1060541338200457e-07, + "loss": 0.0006, + "step": 23070 + }, + { + "epoch": 0.45, + "learning_rate": 1.1060153003766843e-07, + "loss": 0.0007, + "step": 23071 + }, + { + "epoch": 0.45, + "learning_rate": 1.1059764669333229e-07, + "loss": 0.0005, + "step": 23072 + }, + { + "epoch": 0.45, + "learning_rate": 1.1059376334899615e-07, + "loss": 0.0008, + "step": 23073 + }, + { + "epoch": 0.45, + "learning_rate": 1.1058988000466e-07, + "loss": 0.0005, + "step": 23074 + }, + { + "epoch": 0.45, + "learning_rate": 1.1058599666032386e-07, + "loss": 0.0005, + "step": 23075 + }, + { + "epoch": 0.45, + "learning_rate": 1.1058211331598772e-07, + "loss": 0.0011, + "step": 23076 + }, + { + "epoch": 0.45, + "learning_rate": 1.1057822997165158e-07, + "loss": 0.0008, + "step": 23077 + }, + { + "epoch": 0.45, + "learning_rate": 1.1057434662731544e-07, + "loss": 0.0042, + "step": 23078 + }, + { + "epoch": 0.45, + "learning_rate": 1.105704632829793e-07, + "loss": 0.0284, + "step": 23079 + }, + { + "epoch": 0.45, + "learning_rate": 1.1056657993864316e-07, + "loss": 0.0008, + "step": 23080 + }, + { + "epoch": 0.45, + "learning_rate": 1.1056269659430701e-07, + "loss": 0.001, + "step": 23081 + }, + { + "epoch": 0.45, + "learning_rate": 1.1055881324997087e-07, + "loss": 0.0009, + "step": 23082 + }, + { + "epoch": 0.45, + "learning_rate": 1.1055492990563473e-07, + "loss": 0.0006, + "step": 23083 + }, + { + "epoch": 0.45, + "learning_rate": 1.1055104656129859e-07, + "loss": 0.6941, + "step": 23084 + }, + { + "epoch": 0.45, + "learning_rate": 1.1054716321696245e-07, + "loss": 0.0018, + "step": 23085 + }, + { + "epoch": 0.45, + "learning_rate": 1.105432798726263e-07, + "loss": 0.0005, + "step": 23086 + }, + { + "epoch": 0.45, + "learning_rate": 1.1053939652829016e-07, + "loss": 0.0007, + "step": 23087 + }, + { + "epoch": 0.45, + "learning_rate": 1.1053551318395402e-07, + "loss": 0.0007, + "step": 23088 + }, + { + "epoch": 0.45, + "learning_rate": 1.1053162983961788e-07, + "loss": 0.0008, + "step": 23089 + }, + { + "epoch": 0.45, + "learning_rate": 1.1052774649528174e-07, + "loss": 0.0008, + "step": 23090 + }, + { + "epoch": 0.45, + "learning_rate": 1.105238631509456e-07, + "loss": 0.7379, + "step": 23091 + }, + { + "epoch": 0.45, + "learning_rate": 1.1051997980660945e-07, + "loss": 0.0024, + "step": 23092 + }, + { + "epoch": 0.45, + "learning_rate": 1.1051609646227331e-07, + "loss": 0.0155, + "step": 23093 + }, + { + "epoch": 0.45, + "learning_rate": 1.1051221311793717e-07, + "loss": 0.0005, + "step": 23094 + }, + { + "epoch": 0.45, + "learning_rate": 1.1050832977360103e-07, + "loss": 0.0006, + "step": 23095 + }, + { + "epoch": 0.45, + "learning_rate": 1.1050444642926489e-07, + "loss": 0.0007, + "step": 23096 + }, + { + "epoch": 0.45, + "learning_rate": 1.1050056308492875e-07, + "loss": 0.0006, + "step": 23097 + }, + { + "epoch": 0.45, + "learning_rate": 1.104966797405926e-07, + "loss": 0.0008, + "step": 23098 + }, + { + "epoch": 0.45, + "learning_rate": 1.1049279639625646e-07, + "loss": 0.0007, + "step": 23099 + }, + { + "epoch": 0.45, + "learning_rate": 1.1048891305192032e-07, + "loss": 0.4171, + "step": 23100 + }, + { + "epoch": 0.45, + "learning_rate": 1.1048502970758418e-07, + "loss": 0.0013, + "step": 23101 + }, + { + "epoch": 0.45, + "learning_rate": 1.1048114636324804e-07, + "loss": 0.0006, + "step": 23102 + }, + { + "epoch": 0.45, + "learning_rate": 1.104772630189119e-07, + "loss": 0.0006, + "step": 23103 + }, + { + "epoch": 0.45, + "learning_rate": 1.1047337967457575e-07, + "loss": 0.0006, + "step": 23104 + }, + { + "epoch": 0.45, + "learning_rate": 1.1046949633023958e-07, + "loss": 0.0006, + "step": 23105 + }, + { + "epoch": 0.45, + "learning_rate": 1.1046561298590344e-07, + "loss": 0.0146, + "step": 23106 + }, + { + "epoch": 0.45, + "learning_rate": 1.104617296415673e-07, + "loss": 0.0006, + "step": 23107 + }, + { + "epoch": 0.45, + "learning_rate": 1.1045784629723116e-07, + "loss": 0.0006, + "step": 23108 + }, + { + "epoch": 0.45, + "learning_rate": 1.1045396295289502e-07, + "loss": 0.0007, + "step": 23109 + }, + { + "epoch": 0.45, + "learning_rate": 1.1045007960855888e-07, + "loss": 0.0016, + "step": 23110 + }, + { + "epoch": 0.45, + "learning_rate": 1.1044619626422273e-07, + "loss": 0.0004, + "step": 23111 + }, + { + "epoch": 0.45, + "learning_rate": 1.1044231291988659e-07, + "loss": 0.0006, + "step": 23112 + }, + { + "epoch": 0.45, + "learning_rate": 1.1043842957555045e-07, + "loss": 0.0248, + "step": 23113 + }, + { + "epoch": 0.45, + "learning_rate": 1.1043454623121431e-07, + "loss": 0.0039, + "step": 23114 + }, + { + "epoch": 0.45, + "learning_rate": 1.1043066288687817e-07, + "loss": 0.2109, + "step": 23115 + }, + { + "epoch": 0.45, + "learning_rate": 1.1042677954254203e-07, + "loss": 0.0006, + "step": 23116 + }, + { + "epoch": 0.45, + "learning_rate": 1.1042289619820588e-07, + "loss": 0.0005, + "step": 23117 + }, + { + "epoch": 0.45, + "learning_rate": 1.1041901285386974e-07, + "loss": 0.4842, + "step": 23118 + }, + { + "epoch": 0.45, + "learning_rate": 1.104151295095336e-07, + "loss": 0.0007, + "step": 23119 + }, + { + "epoch": 0.45, + "learning_rate": 1.1041124616519746e-07, + "loss": 0.0006, + "step": 23120 + }, + { + "epoch": 0.45, + "learning_rate": 1.1040736282086132e-07, + "loss": 0.0006, + "step": 23121 + }, + { + "epoch": 0.45, + "learning_rate": 1.1040347947652518e-07, + "loss": 0.0006, + "step": 23122 + }, + { + "epoch": 0.45, + "learning_rate": 1.1039959613218903e-07, + "loss": 0.0007, + "step": 23123 + }, + { + "epoch": 0.45, + "learning_rate": 1.1039571278785289e-07, + "loss": 0.0006, + "step": 23124 + }, + { + "epoch": 0.45, + "learning_rate": 1.1039182944351675e-07, + "loss": 0.0005, + "step": 23125 + }, + { + "epoch": 0.45, + "learning_rate": 1.1038794609918061e-07, + "loss": 0.0013, + "step": 23126 + }, + { + "epoch": 0.45, + "learning_rate": 1.1038406275484447e-07, + "loss": 0.0005, + "step": 23127 + }, + { + "epoch": 0.45, + "learning_rate": 1.1038017941050832e-07, + "loss": 0.0004, + "step": 23128 + }, + { + "epoch": 0.45, + "learning_rate": 1.1037629606617218e-07, + "loss": 0.0008, + "step": 23129 + }, + { + "epoch": 0.45, + "learning_rate": 1.1037241272183604e-07, + "loss": 0.0103, + "step": 23130 + }, + { + "epoch": 0.45, + "learning_rate": 1.103685293774999e-07, + "loss": 0.0006, + "step": 23131 + }, + { + "epoch": 0.45, + "learning_rate": 1.1036464603316376e-07, + "loss": 0.0008, + "step": 23132 + }, + { + "epoch": 0.45, + "learning_rate": 1.1036076268882762e-07, + "loss": 0.0006, + "step": 23133 + }, + { + "epoch": 0.45, + "learning_rate": 1.1035687934449147e-07, + "loss": 0.0008, + "step": 23134 + }, + { + "epoch": 0.45, + "learning_rate": 1.1035299600015533e-07, + "loss": 0.0007, + "step": 23135 + }, + { + "epoch": 0.45, + "learning_rate": 1.1034911265581919e-07, + "loss": 0.0006, + "step": 23136 + }, + { + "epoch": 0.45, + "learning_rate": 1.1034522931148305e-07, + "loss": 0.001, + "step": 23137 + }, + { + "epoch": 0.45, + "learning_rate": 1.1034134596714691e-07, + "loss": 0.0007, + "step": 23138 + }, + { + "epoch": 0.45, + "learning_rate": 1.1033746262281077e-07, + "loss": 0.0006, + "step": 23139 + }, + { + "epoch": 0.45, + "learning_rate": 1.1033357927847462e-07, + "loss": 0.0014, + "step": 23140 + }, + { + "epoch": 0.45, + "learning_rate": 1.1032969593413848e-07, + "loss": 0.0008, + "step": 23141 + }, + { + "epoch": 0.45, + "learning_rate": 1.1032581258980234e-07, + "loss": 0.0008, + "step": 23142 + }, + { + "epoch": 0.45, + "learning_rate": 1.103219292454662e-07, + "loss": 0.0006, + "step": 23143 + }, + { + "epoch": 0.45, + "learning_rate": 1.1031804590113006e-07, + "loss": 0.0006, + "step": 23144 + }, + { + "epoch": 0.45, + "learning_rate": 1.1031416255679391e-07, + "loss": 0.0006, + "step": 23145 + }, + { + "epoch": 0.45, + "learning_rate": 1.1031027921245777e-07, + "loss": 0.0008, + "step": 23146 + }, + { + "epoch": 0.45, + "learning_rate": 1.1030639586812163e-07, + "loss": 0.0008, + "step": 23147 + }, + { + "epoch": 0.45, + "learning_rate": 1.1030251252378549e-07, + "loss": 0.0008, + "step": 23148 + }, + { + "epoch": 0.45, + "learning_rate": 1.1029862917944935e-07, + "loss": 0.0007, + "step": 23149 + }, + { + "epoch": 0.45, + "learning_rate": 1.102947458351132e-07, + "loss": 0.0007, + "step": 23150 + }, + { + "epoch": 0.45, + "learning_rate": 1.1029086249077706e-07, + "loss": 0.0006, + "step": 23151 + }, + { + "epoch": 0.45, + "learning_rate": 1.1028697914644092e-07, + "loss": 0.0006, + "step": 23152 + }, + { + "epoch": 0.45, + "learning_rate": 1.1028309580210478e-07, + "loss": 0.0008, + "step": 23153 + }, + { + "epoch": 0.45, + "learning_rate": 1.1027921245776864e-07, + "loss": 0.0006, + "step": 23154 + }, + { + "epoch": 0.45, + "learning_rate": 1.102753291134325e-07, + "loss": 0.3823, + "step": 23155 + }, + { + "epoch": 0.45, + "learning_rate": 1.1027144576909636e-07, + "loss": 0.0008, + "step": 23156 + }, + { + "epoch": 0.45, + "learning_rate": 1.1026756242476021e-07, + "loss": 1.0729, + "step": 23157 + }, + { + "epoch": 0.45, + "learning_rate": 1.1026367908042407e-07, + "loss": 0.0021, + "step": 23158 + }, + { + "epoch": 0.45, + "learning_rate": 1.1025979573608793e-07, + "loss": 0.0008, + "step": 23159 + }, + { + "epoch": 0.45, + "learning_rate": 1.1025591239175179e-07, + "loss": 0.0006, + "step": 23160 + }, + { + "epoch": 0.45, + "learning_rate": 1.1025202904741565e-07, + "loss": 0.0212, + "step": 23161 + }, + { + "epoch": 0.45, + "learning_rate": 1.1024814570307949e-07, + "loss": 0.0026, + "step": 23162 + }, + { + "epoch": 0.45, + "learning_rate": 1.1024426235874334e-07, + "loss": 0.0006, + "step": 23163 + }, + { + "epoch": 0.45, + "learning_rate": 1.102403790144072e-07, + "loss": 1.3407, + "step": 23164 + }, + { + "epoch": 0.45, + "learning_rate": 1.1023649567007105e-07, + "loss": 0.0006, + "step": 23165 + }, + { + "epoch": 0.45, + "learning_rate": 1.1023261232573491e-07, + "loss": 0.0007, + "step": 23166 + }, + { + "epoch": 0.45, + "learning_rate": 1.1022872898139877e-07, + "loss": 0.01, + "step": 23167 + }, + { + "epoch": 0.45, + "learning_rate": 1.1022484563706263e-07, + "loss": 0.0005, + "step": 23168 + }, + { + "epoch": 0.45, + "learning_rate": 1.1022096229272649e-07, + "loss": 0.0021, + "step": 23169 + }, + { + "epoch": 0.45, + "learning_rate": 1.1021707894839034e-07, + "loss": 0.0006, + "step": 23170 + }, + { + "epoch": 0.45, + "learning_rate": 1.102131956040542e-07, + "loss": 0.0013, + "step": 23171 + }, + { + "epoch": 0.45, + "learning_rate": 1.1020931225971806e-07, + "loss": 0.0006, + "step": 23172 + }, + { + "epoch": 0.45, + "learning_rate": 1.1020542891538192e-07, + "loss": 0.0008, + "step": 23173 + }, + { + "epoch": 0.45, + "learning_rate": 1.1020154557104578e-07, + "loss": 0.001, + "step": 23174 + }, + { + "epoch": 0.45, + "learning_rate": 1.1019766222670964e-07, + "loss": 0.0006, + "step": 23175 + }, + { + "epoch": 0.45, + "learning_rate": 1.101937788823735e-07, + "loss": 0.3367, + "step": 23176 + }, + { + "epoch": 0.45, + "learning_rate": 1.1018989553803735e-07, + "loss": 0.0595, + "step": 23177 + }, + { + "epoch": 0.45, + "learning_rate": 1.1018601219370121e-07, + "loss": 0.001, + "step": 23178 + }, + { + "epoch": 0.45, + "learning_rate": 1.1018212884936507e-07, + "loss": 0.0007, + "step": 23179 + }, + { + "epoch": 0.45, + "learning_rate": 1.1017824550502893e-07, + "loss": 0.2111, + "step": 23180 + }, + { + "epoch": 0.45, + "learning_rate": 1.1017436216069278e-07, + "loss": 0.0006, + "step": 23181 + }, + { + "epoch": 0.45, + "learning_rate": 1.1017047881635664e-07, + "loss": 0.002, + "step": 23182 + }, + { + "epoch": 0.45, + "learning_rate": 1.101665954720205e-07, + "loss": 0.0006, + "step": 23183 + }, + { + "epoch": 0.45, + "learning_rate": 1.1016271212768436e-07, + "loss": 0.0005, + "step": 23184 + }, + { + "epoch": 0.45, + "learning_rate": 1.1015882878334822e-07, + "loss": 0.0008, + "step": 23185 + }, + { + "epoch": 0.45, + "learning_rate": 1.1015494543901208e-07, + "loss": 0.5946, + "step": 23186 + }, + { + "epoch": 0.45, + "learning_rate": 1.1015106209467593e-07, + "loss": 0.0005, + "step": 23187 + }, + { + "epoch": 0.45, + "learning_rate": 1.1014717875033979e-07, + "loss": 0.0005, + "step": 23188 + }, + { + "epoch": 0.45, + "learning_rate": 1.1014329540600365e-07, + "loss": 0.0004, + "step": 23189 + }, + { + "epoch": 0.45, + "learning_rate": 1.1013941206166751e-07, + "loss": 0.0514, + "step": 23190 + }, + { + "epoch": 0.45, + "learning_rate": 1.1013552871733135e-07, + "loss": 0.4428, + "step": 23191 + }, + { + "epoch": 0.45, + "learning_rate": 1.1013164537299521e-07, + "loss": 0.0005, + "step": 23192 + }, + { + "epoch": 0.45, + "learning_rate": 1.1012776202865907e-07, + "loss": 0.0016, + "step": 23193 + }, + { + "epoch": 0.45, + "learning_rate": 1.1012387868432293e-07, + "loss": 0.0027, + "step": 23194 + }, + { + "epoch": 0.45, + "learning_rate": 1.1011999533998679e-07, + "loss": 0.0006, + "step": 23195 + }, + { + "epoch": 0.45, + "learning_rate": 1.1011611199565065e-07, + "loss": 0.0007, + "step": 23196 + }, + { + "epoch": 0.45, + "learning_rate": 1.101122286513145e-07, + "loss": 0.0013, + "step": 23197 + }, + { + "epoch": 0.45, + "learning_rate": 1.1010834530697836e-07, + "loss": 0.0005, + "step": 23198 + }, + { + "epoch": 0.45, + "learning_rate": 1.1010446196264222e-07, + "loss": 0.0008, + "step": 23199 + }, + { + "epoch": 0.45, + "learning_rate": 1.1010057861830608e-07, + "loss": 0.0006, + "step": 23200 + }, + { + "epoch": 0.45, + "learning_rate": 1.1009669527396994e-07, + "loss": 0.0007, + "step": 23201 + }, + { + "epoch": 0.45, + "learning_rate": 1.100928119296338e-07, + "loss": 0.0006, + "step": 23202 + }, + { + "epoch": 0.45, + "learning_rate": 1.1008892858529765e-07, + "loss": 0.0007, + "step": 23203 + }, + { + "epoch": 0.45, + "learning_rate": 1.1008504524096151e-07, + "loss": 0.0018, + "step": 23204 + }, + { + "epoch": 0.45, + "learning_rate": 1.1008116189662537e-07, + "loss": 0.0006, + "step": 23205 + }, + { + "epoch": 0.45, + "learning_rate": 1.1007727855228923e-07, + "loss": 0.0009, + "step": 23206 + }, + { + "epoch": 0.45, + "learning_rate": 1.1007339520795309e-07, + "loss": 0.3853, + "step": 23207 + }, + { + "epoch": 0.45, + "learning_rate": 1.1006951186361694e-07, + "loss": 0.0006, + "step": 23208 + }, + { + "epoch": 0.45, + "learning_rate": 1.100656285192808e-07, + "loss": 0.3826, + "step": 23209 + }, + { + "epoch": 0.45, + "learning_rate": 1.1006174517494466e-07, + "loss": 0.0006, + "step": 23210 + }, + { + "epoch": 0.45, + "learning_rate": 1.1005786183060852e-07, + "loss": 0.0051, + "step": 23211 + }, + { + "epoch": 0.45, + "learning_rate": 1.1005397848627238e-07, + "loss": 0.0006, + "step": 23212 + }, + { + "epoch": 0.45, + "learning_rate": 1.1005009514193624e-07, + "loss": 0.5192, + "step": 23213 + }, + { + "epoch": 0.45, + "learning_rate": 1.100462117976001e-07, + "loss": 0.0006, + "step": 23214 + }, + { + "epoch": 0.45, + "learning_rate": 1.1004232845326395e-07, + "loss": 0.0012, + "step": 23215 + }, + { + "epoch": 0.45, + "learning_rate": 1.1003844510892781e-07, + "loss": 0.0006, + "step": 23216 + }, + { + "epoch": 0.45, + "learning_rate": 1.1003456176459167e-07, + "loss": 0.0006, + "step": 23217 + }, + { + "epoch": 0.45, + "learning_rate": 1.1003067842025553e-07, + "loss": 0.0005, + "step": 23218 + }, + { + "epoch": 0.45, + "learning_rate": 1.1002679507591939e-07, + "loss": 0.0005, + "step": 23219 + }, + { + "epoch": 0.45, + "learning_rate": 1.1002291173158324e-07, + "loss": 0.0007, + "step": 23220 + }, + { + "epoch": 0.45, + "learning_rate": 1.1001902838724708e-07, + "loss": 0.0005, + "step": 23221 + }, + { + "epoch": 0.45, + "learning_rate": 1.1001514504291093e-07, + "loss": 0.0004, + "step": 23222 + }, + { + "epoch": 0.45, + "learning_rate": 1.1001126169857479e-07, + "loss": 0.0011, + "step": 23223 + }, + { + "epoch": 0.45, + "learning_rate": 1.1000737835423865e-07, + "loss": 0.0006, + "step": 23224 + }, + { + "epoch": 0.45, + "learning_rate": 1.1000349500990251e-07, + "loss": 0.0008, + "step": 23225 + }, + { + "epoch": 0.45, + "learning_rate": 1.0999961166556637e-07, + "loss": 0.0006, + "step": 23226 + }, + { + "epoch": 0.45, + "learning_rate": 1.0999572832123022e-07, + "loss": 0.0007, + "step": 23227 + }, + { + "epoch": 0.45, + "learning_rate": 1.0999184497689408e-07, + "loss": 0.0006, + "step": 23228 + }, + { + "epoch": 0.45, + "learning_rate": 1.0998796163255794e-07, + "loss": 0.001, + "step": 23229 + }, + { + "epoch": 0.45, + "learning_rate": 1.099840782882218e-07, + "loss": 0.0007, + "step": 23230 + }, + { + "epoch": 0.45, + "learning_rate": 1.0998019494388566e-07, + "loss": 0.0005, + "step": 23231 + }, + { + "epoch": 0.45, + "learning_rate": 1.0997631159954952e-07, + "loss": 0.0007, + "step": 23232 + }, + { + "epoch": 0.45, + "learning_rate": 1.0997242825521337e-07, + "loss": 0.0015, + "step": 23233 + }, + { + "epoch": 0.45, + "learning_rate": 1.0996854491087723e-07, + "loss": 0.0008, + "step": 23234 + }, + { + "epoch": 0.45, + "learning_rate": 1.0996466156654109e-07, + "loss": 0.0006, + "step": 23235 + }, + { + "epoch": 0.45, + "learning_rate": 1.0996077822220495e-07, + "loss": 0.0006, + "step": 23236 + }, + { + "epoch": 0.45, + "learning_rate": 1.0995689487786881e-07, + "loss": 0.0006, + "step": 23237 + }, + { + "epoch": 0.45, + "learning_rate": 1.0995301153353267e-07, + "loss": 0.0008, + "step": 23238 + }, + { + "epoch": 0.45, + "learning_rate": 1.0994912818919652e-07, + "loss": 0.0006, + "step": 23239 + }, + { + "epoch": 0.45, + "learning_rate": 1.0994524484486038e-07, + "loss": 0.0005, + "step": 23240 + }, + { + "epoch": 0.45, + "learning_rate": 1.0994136150052424e-07, + "loss": 0.0006, + "step": 23241 + }, + { + "epoch": 0.45, + "learning_rate": 1.099374781561881e-07, + "loss": 0.9583, + "step": 23242 + }, + { + "epoch": 0.45, + "learning_rate": 1.0993359481185196e-07, + "loss": 0.001, + "step": 23243 + }, + { + "epoch": 0.45, + "learning_rate": 1.0992971146751581e-07, + "loss": 0.0021, + "step": 23244 + }, + { + "epoch": 0.45, + "learning_rate": 1.0992582812317967e-07, + "loss": 0.0016, + "step": 23245 + }, + { + "epoch": 0.45, + "learning_rate": 1.0992194477884353e-07, + "loss": 0.0007, + "step": 23246 + }, + { + "epoch": 0.45, + "learning_rate": 1.0991806143450739e-07, + "loss": 0.0007, + "step": 23247 + }, + { + "epoch": 0.45, + "learning_rate": 1.0991417809017125e-07, + "loss": 0.0011, + "step": 23248 + }, + { + "epoch": 0.45, + "learning_rate": 1.099102947458351e-07, + "loss": 0.0005, + "step": 23249 + }, + { + "epoch": 0.45, + "learning_rate": 1.0990641140149896e-07, + "loss": 0.0006, + "step": 23250 + }, + { + "epoch": 0.45, + "learning_rate": 1.0990252805716282e-07, + "loss": 0.0036, + "step": 23251 + }, + { + "epoch": 0.45, + "learning_rate": 1.0989864471282668e-07, + "loss": 0.0006, + "step": 23252 + }, + { + "epoch": 0.45, + "learning_rate": 1.0989476136849054e-07, + "loss": 0.0006, + "step": 23253 + }, + { + "epoch": 0.45, + "learning_rate": 1.098908780241544e-07, + "loss": 0.0025, + "step": 23254 + }, + { + "epoch": 0.45, + "learning_rate": 1.0988699467981826e-07, + "loss": 0.0006, + "step": 23255 + }, + { + "epoch": 0.45, + "learning_rate": 1.0988311133548211e-07, + "loss": 0.0007, + "step": 23256 + }, + { + "epoch": 0.45, + "learning_rate": 1.0987922799114597e-07, + "loss": 0.0008, + "step": 23257 + }, + { + "epoch": 0.45, + "learning_rate": 1.0987534464680983e-07, + "loss": 0.0006, + "step": 23258 + }, + { + "epoch": 0.45, + "learning_rate": 1.0987146130247369e-07, + "loss": 0.0006, + "step": 23259 + }, + { + "epoch": 0.45, + "learning_rate": 1.0986757795813755e-07, + "loss": 0.0007, + "step": 23260 + }, + { + "epoch": 0.45, + "learning_rate": 1.098636946138014e-07, + "loss": 0.0006, + "step": 23261 + }, + { + "epoch": 0.45, + "learning_rate": 1.0985981126946526e-07, + "loss": 0.0004, + "step": 23262 + }, + { + "epoch": 0.45, + "learning_rate": 1.0985592792512912e-07, + "loss": 0.0026, + "step": 23263 + }, + { + "epoch": 0.45, + "learning_rate": 1.0985204458079298e-07, + "loss": 0.0013, + "step": 23264 + }, + { + "epoch": 0.45, + "learning_rate": 1.0984816123645684e-07, + "loss": 0.0007, + "step": 23265 + }, + { + "epoch": 0.45, + "learning_rate": 1.098442778921207e-07, + "loss": 0.2192, + "step": 23266 + }, + { + "epoch": 0.45, + "learning_rate": 1.0984039454778455e-07, + "loss": 1.1082, + "step": 23267 + }, + { + "epoch": 0.45, + "learning_rate": 1.0983651120344841e-07, + "loss": 0.0009, + "step": 23268 + }, + { + "epoch": 0.45, + "learning_rate": 1.0983262785911227e-07, + "loss": 0.0006, + "step": 23269 + }, + { + "epoch": 0.45, + "learning_rate": 1.0982874451477613e-07, + "loss": 0.0006, + "step": 23270 + }, + { + "epoch": 0.45, + "learning_rate": 1.0982486117043999e-07, + "loss": 0.0005, + "step": 23271 + }, + { + "epoch": 0.45, + "learning_rate": 1.0982097782610385e-07, + "loss": 0.0004, + "step": 23272 + }, + { + "epoch": 0.45, + "learning_rate": 1.098170944817677e-07, + "loss": 0.001, + "step": 23273 + }, + { + "epoch": 0.45, + "learning_rate": 1.0981321113743156e-07, + "loss": 0.3733, + "step": 23274 + }, + { + "epoch": 0.45, + "learning_rate": 1.0980932779309542e-07, + "loss": 1.0437, + "step": 23275 + }, + { + "epoch": 0.45, + "learning_rate": 1.0980544444875928e-07, + "loss": 0.0005, + "step": 23276 + }, + { + "epoch": 0.45, + "learning_rate": 1.0980156110442314e-07, + "loss": 0.0005, + "step": 23277 + }, + { + "epoch": 0.45, + "learning_rate": 1.09797677760087e-07, + "loss": 0.0006, + "step": 23278 + }, + { + "epoch": 0.45, + "learning_rate": 1.0979379441575083e-07, + "loss": 0.9971, + "step": 23279 + }, + { + "epoch": 0.45, + "learning_rate": 1.0978991107141469e-07, + "loss": 0.8314, + "step": 23280 + }, + { + "epoch": 0.45, + "learning_rate": 1.0978602772707854e-07, + "loss": 0.0009, + "step": 23281 + }, + { + "epoch": 0.45, + "learning_rate": 1.097821443827424e-07, + "loss": 0.163, + "step": 23282 + }, + { + "epoch": 0.45, + "learning_rate": 1.0977826103840626e-07, + "loss": 0.0005, + "step": 23283 + }, + { + "epoch": 0.45, + "learning_rate": 1.0977437769407012e-07, + "loss": 0.002, + "step": 23284 + }, + { + "epoch": 0.45, + "learning_rate": 1.0977049434973398e-07, + "loss": 0.0145, + "step": 23285 + }, + { + "epoch": 0.45, + "learning_rate": 1.0976661100539783e-07, + "loss": 0.0012, + "step": 23286 + }, + { + "epoch": 0.45, + "learning_rate": 1.0976272766106169e-07, + "loss": 0.0026, + "step": 23287 + }, + { + "epoch": 0.45, + "learning_rate": 1.0975884431672555e-07, + "loss": 0.0006, + "step": 23288 + }, + { + "epoch": 0.45, + "learning_rate": 1.0975496097238941e-07, + "loss": 0.0046, + "step": 23289 + }, + { + "epoch": 0.45, + "learning_rate": 1.0975107762805327e-07, + "loss": 0.0007, + "step": 23290 + }, + { + "epoch": 0.45, + "learning_rate": 1.0974719428371713e-07, + "loss": 0.001, + "step": 23291 + }, + { + "epoch": 0.45, + "learning_rate": 1.0974331093938098e-07, + "loss": 0.0007, + "step": 23292 + }, + { + "epoch": 0.45, + "learning_rate": 1.0973942759504484e-07, + "loss": 0.0006, + "step": 23293 + }, + { + "epoch": 0.45, + "learning_rate": 1.097355442507087e-07, + "loss": 0.5659, + "step": 23294 + }, + { + "epoch": 0.45, + "learning_rate": 1.0973166090637256e-07, + "loss": 0.0006, + "step": 23295 + }, + { + "epoch": 0.45, + "learning_rate": 1.0972777756203642e-07, + "loss": 0.0007, + "step": 23296 + }, + { + "epoch": 0.45, + "learning_rate": 1.0972389421770028e-07, + "loss": 0.0005, + "step": 23297 + }, + { + "epoch": 0.45, + "learning_rate": 1.0972001087336413e-07, + "loss": 0.4752, + "step": 23298 + }, + { + "epoch": 0.45, + "learning_rate": 1.0971612752902799e-07, + "loss": 0.0006, + "step": 23299 + }, + { + "epoch": 0.45, + "learning_rate": 1.0971224418469185e-07, + "loss": 0.2208, + "step": 23300 + }, + { + "epoch": 0.45, + "learning_rate": 1.0970836084035571e-07, + "loss": 0.0178, + "step": 23301 + }, + { + "epoch": 0.45, + "learning_rate": 1.0970447749601957e-07, + "loss": 0.0011, + "step": 23302 + }, + { + "epoch": 0.45, + "learning_rate": 1.0970059415168342e-07, + "loss": 0.0006, + "step": 23303 + }, + { + "epoch": 0.45, + "learning_rate": 1.0969671080734728e-07, + "loss": 0.0005, + "step": 23304 + }, + { + "epoch": 0.45, + "learning_rate": 1.0969282746301114e-07, + "loss": 0.0008, + "step": 23305 + }, + { + "epoch": 0.45, + "learning_rate": 1.09688944118675e-07, + "loss": 0.0005, + "step": 23306 + }, + { + "epoch": 0.45, + "learning_rate": 1.0968506077433886e-07, + "loss": 0.0008, + "step": 23307 + }, + { + "epoch": 0.45, + "learning_rate": 1.0968117743000272e-07, + "loss": 0.0007, + "step": 23308 + }, + { + "epoch": 0.45, + "learning_rate": 1.0967729408566657e-07, + "loss": 0.0009, + "step": 23309 + }, + { + "epoch": 0.45, + "learning_rate": 1.0967341074133043e-07, + "loss": 0.0008, + "step": 23310 + }, + { + "epoch": 0.45, + "learning_rate": 1.0966952739699429e-07, + "loss": 0.0004, + "step": 23311 + }, + { + "epoch": 0.45, + "learning_rate": 1.0966564405265815e-07, + "loss": 0.0446, + "step": 23312 + }, + { + "epoch": 0.45, + "learning_rate": 1.0966176070832201e-07, + "loss": 0.0008, + "step": 23313 + }, + { + "epoch": 0.45, + "learning_rate": 1.0965787736398587e-07, + "loss": 0.007, + "step": 23314 + }, + { + "epoch": 0.45, + "learning_rate": 1.0965399401964972e-07, + "loss": 0.0009, + "step": 23315 + }, + { + "epoch": 0.45, + "learning_rate": 1.0965011067531358e-07, + "loss": 0.0007, + "step": 23316 + }, + { + "epoch": 0.45, + "learning_rate": 1.0964622733097744e-07, + "loss": 0.0009, + "step": 23317 + }, + { + "epoch": 0.45, + "learning_rate": 1.096423439866413e-07, + "loss": 0.0006, + "step": 23318 + }, + { + "epoch": 0.45, + "learning_rate": 1.0963846064230516e-07, + "loss": 0.0007, + "step": 23319 + }, + { + "epoch": 0.45, + "learning_rate": 1.0963457729796901e-07, + "loss": 0.0005, + "step": 23320 + }, + { + "epoch": 0.45, + "learning_rate": 1.0963069395363287e-07, + "loss": 0.0006, + "step": 23321 + }, + { + "epoch": 0.45, + "learning_rate": 1.0962681060929673e-07, + "loss": 0.0008, + "step": 23322 + }, + { + "epoch": 0.45, + "learning_rate": 1.0962292726496059e-07, + "loss": 0.0007, + "step": 23323 + }, + { + "epoch": 0.45, + "learning_rate": 1.0961904392062445e-07, + "loss": 0.0007, + "step": 23324 + }, + { + "epoch": 0.45, + "learning_rate": 1.096151605762883e-07, + "loss": 0.0006, + "step": 23325 + }, + { + "epoch": 0.45, + "learning_rate": 1.0961127723195216e-07, + "loss": 0.0008, + "step": 23326 + }, + { + "epoch": 0.45, + "learning_rate": 1.0960739388761602e-07, + "loss": 0.0006, + "step": 23327 + }, + { + "epoch": 0.45, + "learning_rate": 1.0960351054327988e-07, + "loss": 0.3502, + "step": 23328 + }, + { + "epoch": 0.45, + "learning_rate": 1.0959962719894374e-07, + "loss": 0.0007, + "step": 23329 + }, + { + "epoch": 0.45, + "learning_rate": 1.095957438546076e-07, + "loss": 0.0006, + "step": 23330 + }, + { + "epoch": 0.45, + "learning_rate": 1.0959186051027146e-07, + "loss": 0.0007, + "step": 23331 + }, + { + "epoch": 0.45, + "learning_rate": 1.0958797716593531e-07, + "loss": 0.0011, + "step": 23332 + }, + { + "epoch": 0.45, + "learning_rate": 1.0958409382159917e-07, + "loss": 0.0006, + "step": 23333 + }, + { + "epoch": 0.45, + "learning_rate": 1.0958021047726303e-07, + "loss": 0.0007, + "step": 23334 + }, + { + "epoch": 0.45, + "learning_rate": 1.0957632713292689e-07, + "loss": 0.424, + "step": 23335 + }, + { + "epoch": 0.45, + "learning_rate": 1.0957244378859075e-07, + "loss": 0.0009, + "step": 23336 + }, + { + "epoch": 0.45, + "learning_rate": 1.0956856044425458e-07, + "loss": 0.0007, + "step": 23337 + }, + { + "epoch": 0.45, + "learning_rate": 1.0956467709991844e-07, + "loss": 0.0009, + "step": 23338 + }, + { + "epoch": 0.45, + "learning_rate": 1.095607937555823e-07, + "loss": 1.2161, + "step": 23339 + }, + { + "epoch": 0.45, + "learning_rate": 1.0955691041124615e-07, + "loss": 0.0006, + "step": 23340 + }, + { + "epoch": 0.45, + "learning_rate": 1.0955302706691001e-07, + "loss": 0.0006, + "step": 23341 + }, + { + "epoch": 0.45, + "learning_rate": 1.0954914372257387e-07, + "loss": 0.0006, + "step": 23342 + }, + { + "epoch": 0.45, + "learning_rate": 1.0954526037823773e-07, + "loss": 0.0006, + "step": 23343 + }, + { + "epoch": 0.45, + "learning_rate": 1.0954137703390159e-07, + "loss": 0.0015, + "step": 23344 + }, + { + "epoch": 0.45, + "learning_rate": 1.0953749368956544e-07, + "loss": 0.0007, + "step": 23345 + }, + { + "epoch": 0.45, + "learning_rate": 1.095336103452293e-07, + "loss": 0.0005, + "step": 23346 + }, + { + "epoch": 0.45, + "learning_rate": 1.0952972700089316e-07, + "loss": 0.0011, + "step": 23347 + }, + { + "epoch": 0.45, + "learning_rate": 1.0952584365655702e-07, + "loss": 0.031, + "step": 23348 + }, + { + "epoch": 0.45, + "learning_rate": 1.0952196031222088e-07, + "loss": 0.0008, + "step": 23349 + }, + { + "epoch": 0.45, + "learning_rate": 1.0951807696788474e-07, + "loss": 1.2129, + "step": 23350 + }, + { + "epoch": 0.45, + "learning_rate": 1.095141936235486e-07, + "loss": 0.0008, + "step": 23351 + }, + { + "epoch": 0.45, + "learning_rate": 1.0951031027921245e-07, + "loss": 0.0005, + "step": 23352 + }, + { + "epoch": 0.45, + "learning_rate": 1.0950642693487631e-07, + "loss": 0.0023, + "step": 23353 + }, + { + "epoch": 0.45, + "learning_rate": 1.0950254359054017e-07, + "loss": 0.0007, + "step": 23354 + }, + { + "epoch": 0.45, + "learning_rate": 1.0949866024620403e-07, + "loss": 0.0005, + "step": 23355 + }, + { + "epoch": 0.45, + "learning_rate": 1.0949477690186789e-07, + "loss": 0.0007, + "step": 23356 + }, + { + "epoch": 0.45, + "learning_rate": 1.0949089355753174e-07, + "loss": 0.0073, + "step": 23357 + }, + { + "epoch": 0.45, + "learning_rate": 1.094870102131956e-07, + "loss": 1.0875, + "step": 23358 + }, + { + "epoch": 0.45, + "learning_rate": 1.0948312686885946e-07, + "loss": 0.0005, + "step": 23359 + }, + { + "epoch": 0.45, + "learning_rate": 1.0947924352452332e-07, + "loss": 0.0005, + "step": 23360 + }, + { + "epoch": 0.45, + "learning_rate": 1.0947536018018718e-07, + "loss": 0.0006, + "step": 23361 + }, + { + "epoch": 0.45, + "learning_rate": 1.0947147683585103e-07, + "loss": 0.0006, + "step": 23362 + }, + { + "epoch": 0.45, + "learning_rate": 1.0946759349151489e-07, + "loss": 0.0006, + "step": 23363 + }, + { + "epoch": 0.45, + "learning_rate": 1.0946371014717875e-07, + "loss": 0.6999, + "step": 23364 + }, + { + "epoch": 0.45, + "learning_rate": 1.0945982680284261e-07, + "loss": 0.0015, + "step": 23365 + }, + { + "epoch": 0.45, + "learning_rate": 1.0945594345850647e-07, + "loss": 0.0005, + "step": 23366 + }, + { + "epoch": 0.45, + "learning_rate": 1.0945206011417033e-07, + "loss": 0.0009, + "step": 23367 + }, + { + "epoch": 0.45, + "learning_rate": 1.0944817676983417e-07, + "loss": 0.0065, + "step": 23368 + }, + { + "epoch": 0.45, + "learning_rate": 1.0944429342549803e-07, + "loss": 0.001, + "step": 23369 + }, + { + "epoch": 0.45, + "learning_rate": 1.0944041008116189e-07, + "loss": 0.0085, + "step": 23370 + }, + { + "epoch": 0.45, + "learning_rate": 1.0943652673682575e-07, + "loss": 0.3649, + "step": 23371 + }, + { + "epoch": 0.45, + "learning_rate": 1.094326433924896e-07, + "loss": 0.0007, + "step": 23372 + }, + { + "epoch": 0.45, + "learning_rate": 1.0942876004815346e-07, + "loss": 0.0005, + "step": 23373 + }, + { + "epoch": 0.45, + "learning_rate": 1.0942487670381732e-07, + "loss": 0.0012, + "step": 23374 + }, + { + "epoch": 0.45, + "learning_rate": 1.0942099335948118e-07, + "loss": 0.0006, + "step": 23375 + }, + { + "epoch": 0.45, + "learning_rate": 1.0941711001514504e-07, + "loss": 0.0006, + "step": 23376 + }, + { + "epoch": 0.45, + "learning_rate": 1.094132266708089e-07, + "loss": 0.0009, + "step": 23377 + }, + { + "epoch": 0.45, + "learning_rate": 1.0940934332647275e-07, + "loss": 0.0005, + "step": 23378 + }, + { + "epoch": 0.45, + "learning_rate": 1.0940545998213661e-07, + "loss": 0.0008, + "step": 23379 + }, + { + "epoch": 0.45, + "learning_rate": 1.0940157663780047e-07, + "loss": 0.0029, + "step": 23380 + }, + { + "epoch": 0.45, + "learning_rate": 1.0939769329346433e-07, + "loss": 0.0005, + "step": 23381 + }, + { + "epoch": 0.45, + "learning_rate": 1.0939380994912819e-07, + "loss": 0.0032, + "step": 23382 + }, + { + "epoch": 0.45, + "learning_rate": 1.0938992660479204e-07, + "loss": 0.0005, + "step": 23383 + }, + { + "epoch": 0.45, + "learning_rate": 1.093860432604559e-07, + "loss": 0.0012, + "step": 23384 + }, + { + "epoch": 0.45, + "learning_rate": 1.0938215991611976e-07, + "loss": 0.0007, + "step": 23385 + }, + { + "epoch": 0.45, + "learning_rate": 1.0937827657178362e-07, + "loss": 0.0006, + "step": 23386 + }, + { + "epoch": 0.45, + "learning_rate": 1.0937439322744748e-07, + "loss": 0.0005, + "step": 23387 + }, + { + "epoch": 0.45, + "learning_rate": 1.0937050988311134e-07, + "loss": 0.305, + "step": 23388 + }, + { + "epoch": 0.45, + "learning_rate": 1.093666265387752e-07, + "loss": 0.0006, + "step": 23389 + }, + { + "epoch": 0.45, + "learning_rate": 1.0936274319443905e-07, + "loss": 0.0006, + "step": 23390 + }, + { + "epoch": 0.45, + "learning_rate": 1.0935885985010291e-07, + "loss": 0.0007, + "step": 23391 + }, + { + "epoch": 0.45, + "learning_rate": 1.0935497650576677e-07, + "loss": 0.0009, + "step": 23392 + }, + { + "epoch": 0.45, + "learning_rate": 1.0935109316143063e-07, + "loss": 0.0006, + "step": 23393 + }, + { + "epoch": 0.45, + "learning_rate": 1.0934720981709449e-07, + "loss": 0.0005, + "step": 23394 + }, + { + "epoch": 0.45, + "learning_rate": 1.0934332647275833e-07, + "loss": 0.0005, + "step": 23395 + }, + { + "epoch": 0.45, + "learning_rate": 1.0933944312842219e-07, + "loss": 0.0126, + "step": 23396 + }, + { + "epoch": 0.45, + "learning_rate": 1.0933555978408603e-07, + "loss": 0.0006, + "step": 23397 + }, + { + "epoch": 0.45, + "learning_rate": 1.0933167643974989e-07, + "loss": 0.0021, + "step": 23398 + }, + { + "epoch": 0.45, + "learning_rate": 1.0932779309541375e-07, + "loss": 0.0004, + "step": 23399 + }, + { + "epoch": 0.45, + "learning_rate": 1.0932390975107761e-07, + "loss": 0.0007, + "step": 23400 + }, + { + "epoch": 0.45, + "learning_rate": 1.0932002640674147e-07, + "loss": 0.0005, + "step": 23401 + }, + { + "epoch": 0.45, + "learning_rate": 1.0931614306240532e-07, + "loss": 0.0005, + "step": 23402 + }, + { + "epoch": 0.45, + "learning_rate": 1.0931225971806918e-07, + "loss": 0.001, + "step": 23403 + }, + { + "epoch": 0.45, + "learning_rate": 1.0930837637373304e-07, + "loss": 0.0013, + "step": 23404 + }, + { + "epoch": 0.45, + "learning_rate": 1.093044930293969e-07, + "loss": 0.0011, + "step": 23405 + }, + { + "epoch": 0.45, + "learning_rate": 1.0930060968506076e-07, + "loss": 0.0009, + "step": 23406 + }, + { + "epoch": 0.45, + "learning_rate": 1.0929672634072462e-07, + "loss": 0.0006, + "step": 23407 + }, + { + "epoch": 0.45, + "learning_rate": 1.0929284299638847e-07, + "loss": 0.229, + "step": 23408 + }, + { + "epoch": 0.45, + "learning_rate": 1.0928895965205233e-07, + "loss": 0.0006, + "step": 23409 + }, + { + "epoch": 0.45, + "learning_rate": 1.0928507630771619e-07, + "loss": 0.0006, + "step": 23410 + }, + { + "epoch": 0.45, + "learning_rate": 1.0928119296338005e-07, + "loss": 0.0006, + "step": 23411 + }, + { + "epoch": 0.45, + "learning_rate": 1.0927730961904391e-07, + "loss": 0.0006, + "step": 23412 + }, + { + "epoch": 0.45, + "learning_rate": 1.0927342627470777e-07, + "loss": 0.0006, + "step": 23413 + }, + { + "epoch": 0.45, + "learning_rate": 1.0926954293037162e-07, + "loss": 0.488, + "step": 23414 + }, + { + "epoch": 0.45, + "learning_rate": 1.0926565958603548e-07, + "loss": 0.0005, + "step": 23415 + }, + { + "epoch": 0.45, + "learning_rate": 1.0926177624169934e-07, + "loss": 0.0006, + "step": 23416 + }, + { + "epoch": 0.45, + "learning_rate": 1.092578928973632e-07, + "loss": 0.0007, + "step": 23417 + }, + { + "epoch": 0.45, + "learning_rate": 1.0925400955302706e-07, + "loss": 0.0007, + "step": 23418 + }, + { + "epoch": 0.45, + "learning_rate": 1.0925012620869091e-07, + "loss": 0.0006, + "step": 23419 + }, + { + "epoch": 0.45, + "learning_rate": 1.0924624286435477e-07, + "loss": 0.0008, + "step": 23420 + }, + { + "epoch": 0.45, + "learning_rate": 1.0924235952001863e-07, + "loss": 0.0012, + "step": 23421 + }, + { + "epoch": 0.45, + "learning_rate": 1.0923847617568249e-07, + "loss": 1.2667, + "step": 23422 + }, + { + "epoch": 0.45, + "learning_rate": 1.0923459283134635e-07, + "loss": 0.0014, + "step": 23423 + }, + { + "epoch": 0.45, + "learning_rate": 1.092307094870102e-07, + "loss": 0.0008, + "step": 23424 + }, + { + "epoch": 0.45, + "learning_rate": 1.0922682614267406e-07, + "loss": 0.0007, + "step": 23425 + }, + { + "epoch": 0.45, + "learning_rate": 1.0922294279833792e-07, + "loss": 0.0007, + "step": 23426 + }, + { + "epoch": 0.45, + "learning_rate": 1.0921905945400178e-07, + "loss": 0.0005, + "step": 23427 + }, + { + "epoch": 0.45, + "learning_rate": 1.0921517610966564e-07, + "loss": 0.0012, + "step": 23428 + }, + { + "epoch": 0.45, + "learning_rate": 1.092112927653295e-07, + "loss": 0.0005, + "step": 23429 + }, + { + "epoch": 0.45, + "learning_rate": 1.0920740942099336e-07, + "loss": 0.017, + "step": 23430 + }, + { + "epoch": 0.45, + "learning_rate": 1.0920352607665721e-07, + "loss": 0.0007, + "step": 23431 + }, + { + "epoch": 0.45, + "learning_rate": 1.0919964273232107e-07, + "loss": 0.0005, + "step": 23432 + }, + { + "epoch": 0.45, + "learning_rate": 1.0919575938798493e-07, + "loss": 0.5606, + "step": 23433 + }, + { + "epoch": 0.45, + "learning_rate": 1.0919187604364879e-07, + "loss": 0.0082, + "step": 23434 + }, + { + "epoch": 0.45, + "learning_rate": 1.0918799269931265e-07, + "loss": 0.0006, + "step": 23435 + }, + { + "epoch": 0.45, + "learning_rate": 1.091841093549765e-07, + "loss": 0.0009, + "step": 23436 + }, + { + "epoch": 0.45, + "learning_rate": 1.0918022601064036e-07, + "loss": 0.002, + "step": 23437 + }, + { + "epoch": 0.45, + "learning_rate": 1.0917634266630422e-07, + "loss": 0.0004, + "step": 23438 + }, + { + "epoch": 0.45, + "learning_rate": 1.0917245932196808e-07, + "loss": 0.0005, + "step": 23439 + }, + { + "epoch": 0.45, + "learning_rate": 1.0916857597763194e-07, + "loss": 0.0005, + "step": 23440 + }, + { + "epoch": 0.45, + "learning_rate": 1.091646926332958e-07, + "loss": 0.031, + "step": 23441 + }, + { + "epoch": 0.45, + "learning_rate": 1.0916080928895965e-07, + "loss": 0.0134, + "step": 23442 + }, + { + "epoch": 0.45, + "learning_rate": 1.0915692594462351e-07, + "loss": 0.0096, + "step": 23443 + }, + { + "epoch": 0.45, + "learning_rate": 1.0915304260028737e-07, + "loss": 0.0006, + "step": 23444 + }, + { + "epoch": 0.45, + "learning_rate": 1.0914915925595123e-07, + "loss": 0.0007, + "step": 23445 + }, + { + "epoch": 0.45, + "learning_rate": 1.0914527591161509e-07, + "loss": 0.0125, + "step": 23446 + }, + { + "epoch": 0.45, + "learning_rate": 1.0914139256727895e-07, + "loss": 0.0022, + "step": 23447 + }, + { + "epoch": 0.45, + "learning_rate": 1.091375092229428e-07, + "loss": 0.0007, + "step": 23448 + }, + { + "epoch": 0.45, + "learning_rate": 1.0913362587860666e-07, + "loss": 0.0006, + "step": 23449 + }, + { + "epoch": 0.45, + "learning_rate": 1.0912974253427052e-07, + "loss": 0.0007, + "step": 23450 + }, + { + "epoch": 0.45, + "learning_rate": 1.0912585918993438e-07, + "loss": 0.0005, + "step": 23451 + }, + { + "epoch": 0.45, + "learning_rate": 1.0912197584559824e-07, + "loss": 0.0011, + "step": 23452 + }, + { + "epoch": 0.45, + "learning_rate": 1.0911809250126207e-07, + "loss": 0.0008, + "step": 23453 + }, + { + "epoch": 0.45, + "learning_rate": 1.0911420915692593e-07, + "loss": 0.0005, + "step": 23454 + }, + { + "epoch": 0.45, + "learning_rate": 1.0911032581258979e-07, + "loss": 0.0007, + "step": 23455 + }, + { + "epoch": 0.45, + "learning_rate": 1.0910644246825364e-07, + "loss": 0.0006, + "step": 23456 + }, + { + "epoch": 0.46, + "learning_rate": 1.091025591239175e-07, + "loss": 0.0005, + "step": 23457 + }, + { + "epoch": 0.46, + "learning_rate": 1.0909867577958136e-07, + "loss": 0.0008, + "step": 23458 + }, + { + "epoch": 0.46, + "learning_rate": 1.0909479243524522e-07, + "loss": 0.0005, + "step": 23459 + }, + { + "epoch": 0.46, + "learning_rate": 1.0909090909090908e-07, + "loss": 0.0006, + "step": 23460 + }, + { + "epoch": 0.46, + "learning_rate": 1.0908702574657293e-07, + "loss": 0.11, + "step": 23461 + }, + { + "epoch": 0.46, + "learning_rate": 1.0908314240223679e-07, + "loss": 0.0006, + "step": 23462 + }, + { + "epoch": 0.46, + "learning_rate": 1.0907925905790065e-07, + "loss": 0.0006, + "step": 23463 + }, + { + "epoch": 0.46, + "learning_rate": 1.0907537571356451e-07, + "loss": 0.0005, + "step": 23464 + }, + { + "epoch": 0.46, + "learning_rate": 1.0907149236922837e-07, + "loss": 0.0006, + "step": 23465 + }, + { + "epoch": 0.46, + "learning_rate": 1.0906760902489223e-07, + "loss": 0.0005, + "step": 23466 + }, + { + "epoch": 0.46, + "learning_rate": 1.0906372568055608e-07, + "loss": 0.0007, + "step": 23467 + }, + { + "epoch": 0.46, + "learning_rate": 1.0905984233621994e-07, + "loss": 0.0007, + "step": 23468 + }, + { + "epoch": 0.46, + "learning_rate": 1.090559589918838e-07, + "loss": 0.001, + "step": 23469 + }, + { + "epoch": 0.46, + "learning_rate": 1.0905207564754766e-07, + "loss": 0.0005, + "step": 23470 + }, + { + "epoch": 0.46, + "learning_rate": 1.0904819230321152e-07, + "loss": 0.0006, + "step": 23471 + }, + { + "epoch": 0.46, + "learning_rate": 1.0904430895887538e-07, + "loss": 0.0006, + "step": 23472 + }, + { + "epoch": 0.46, + "learning_rate": 1.0904042561453923e-07, + "loss": 0.0005, + "step": 23473 + }, + { + "epoch": 0.46, + "learning_rate": 1.0903654227020309e-07, + "loss": 0.0007, + "step": 23474 + }, + { + "epoch": 0.46, + "learning_rate": 1.0903265892586695e-07, + "loss": 0.0005, + "step": 23475 + }, + { + "epoch": 0.46, + "learning_rate": 1.0902877558153081e-07, + "loss": 0.0007, + "step": 23476 + }, + { + "epoch": 0.46, + "learning_rate": 1.0902489223719467e-07, + "loss": 0.0005, + "step": 23477 + }, + { + "epoch": 0.46, + "learning_rate": 1.0902100889285852e-07, + "loss": 0.0006, + "step": 23478 + }, + { + "epoch": 0.46, + "learning_rate": 1.0901712554852238e-07, + "loss": 0.0005, + "step": 23479 + }, + { + "epoch": 0.46, + "learning_rate": 1.0901324220418624e-07, + "loss": 0.0006, + "step": 23480 + }, + { + "epoch": 0.46, + "learning_rate": 1.090093588598501e-07, + "loss": 0.0008, + "step": 23481 + }, + { + "epoch": 0.46, + "learning_rate": 1.0900547551551396e-07, + "loss": 0.0031, + "step": 23482 + }, + { + "epoch": 0.46, + "learning_rate": 1.0900159217117782e-07, + "loss": 0.0006, + "step": 23483 + }, + { + "epoch": 0.46, + "learning_rate": 1.0899770882684167e-07, + "loss": 0.0011, + "step": 23484 + }, + { + "epoch": 0.46, + "learning_rate": 1.0899382548250553e-07, + "loss": 0.0006, + "step": 23485 + }, + { + "epoch": 0.46, + "learning_rate": 1.0898994213816939e-07, + "loss": 0.0005, + "step": 23486 + }, + { + "epoch": 0.46, + "learning_rate": 1.0898605879383325e-07, + "loss": 0.0009, + "step": 23487 + }, + { + "epoch": 0.46, + "learning_rate": 1.0898217544949711e-07, + "loss": 0.0006, + "step": 23488 + }, + { + "epoch": 0.46, + "learning_rate": 1.0897829210516097e-07, + "loss": 0.2043, + "step": 23489 + }, + { + "epoch": 0.46, + "learning_rate": 1.0897440876082482e-07, + "loss": 0.0008, + "step": 23490 + }, + { + "epoch": 0.46, + "learning_rate": 1.0897052541648868e-07, + "loss": 0.504, + "step": 23491 + }, + { + "epoch": 0.46, + "learning_rate": 1.0896664207215254e-07, + "loss": 0.0056, + "step": 23492 + }, + { + "epoch": 0.46, + "learning_rate": 1.089627587278164e-07, + "loss": 0.0071, + "step": 23493 + }, + { + "epoch": 0.46, + "learning_rate": 1.0895887538348026e-07, + "loss": 0.0008, + "step": 23494 + }, + { + "epoch": 0.46, + "learning_rate": 1.0895499203914411e-07, + "loss": 0.0009, + "step": 23495 + }, + { + "epoch": 0.46, + "learning_rate": 1.0895110869480797e-07, + "loss": 0.0004, + "step": 23496 + }, + { + "epoch": 0.46, + "learning_rate": 1.0894722535047183e-07, + "loss": 0.0007, + "step": 23497 + }, + { + "epoch": 0.46, + "learning_rate": 1.0894334200613569e-07, + "loss": 0.2846, + "step": 23498 + }, + { + "epoch": 0.46, + "learning_rate": 1.0893945866179955e-07, + "loss": 0.0005, + "step": 23499 + }, + { + "epoch": 0.46, + "learning_rate": 1.089355753174634e-07, + "loss": 0.0006, + "step": 23500 + }, + { + "epoch": 0.46, + "learning_rate": 1.0893169197312726e-07, + "loss": 0.001, + "step": 23501 + }, + { + "epoch": 0.46, + "learning_rate": 1.0892780862879112e-07, + "loss": 0.0007, + "step": 23502 + }, + { + "epoch": 0.46, + "learning_rate": 1.0892392528445498e-07, + "loss": 0.0742, + "step": 23503 + }, + { + "epoch": 0.46, + "learning_rate": 1.0892004194011884e-07, + "loss": 1.1859, + "step": 23504 + }, + { + "epoch": 0.46, + "learning_rate": 1.089161585957827e-07, + "loss": 0.0007, + "step": 23505 + }, + { + "epoch": 0.46, + "learning_rate": 1.0891227525144656e-07, + "loss": 0.0004, + "step": 23506 + }, + { + "epoch": 0.46, + "learning_rate": 1.0890839190711041e-07, + "loss": 0.0158, + "step": 23507 + }, + { + "epoch": 0.46, + "learning_rate": 1.0890450856277427e-07, + "loss": 0.0041, + "step": 23508 + }, + { + "epoch": 0.46, + "learning_rate": 1.0890062521843813e-07, + "loss": 0.0008, + "step": 23509 + }, + { + "epoch": 0.46, + "learning_rate": 1.0889674187410199e-07, + "loss": 1.0128, + "step": 23510 + }, + { + "epoch": 0.46, + "learning_rate": 1.0889285852976582e-07, + "loss": 0.0006, + "step": 23511 + }, + { + "epoch": 0.46, + "learning_rate": 1.0888897518542968e-07, + "loss": 0.0005, + "step": 23512 + }, + { + "epoch": 0.46, + "learning_rate": 1.0888509184109354e-07, + "loss": 0.0008, + "step": 23513 + }, + { + "epoch": 0.46, + "learning_rate": 1.088812084967574e-07, + "loss": 0.0007, + "step": 23514 + }, + { + "epoch": 0.46, + "learning_rate": 1.0887732515242125e-07, + "loss": 0.0006, + "step": 23515 + }, + { + "epoch": 0.46, + "learning_rate": 1.0887344180808511e-07, + "loss": 0.0008, + "step": 23516 + }, + { + "epoch": 0.46, + "learning_rate": 1.0886955846374897e-07, + "loss": 0.0007, + "step": 23517 + }, + { + "epoch": 0.46, + "learning_rate": 1.0886567511941283e-07, + "loss": 0.0005, + "step": 23518 + }, + { + "epoch": 0.46, + "learning_rate": 1.0886179177507669e-07, + "loss": 0.2482, + "step": 23519 + }, + { + "epoch": 0.46, + "learning_rate": 1.0885790843074054e-07, + "loss": 0.0009, + "step": 23520 + }, + { + "epoch": 0.46, + "learning_rate": 1.088540250864044e-07, + "loss": 0.0005, + "step": 23521 + }, + { + "epoch": 0.46, + "learning_rate": 1.0885014174206826e-07, + "loss": 0.0006, + "step": 23522 + }, + { + "epoch": 0.46, + "learning_rate": 1.0884625839773212e-07, + "loss": 0.0007, + "step": 23523 + }, + { + "epoch": 0.46, + "learning_rate": 1.0884237505339598e-07, + "loss": 0.001, + "step": 23524 + }, + { + "epoch": 0.46, + "learning_rate": 1.0883849170905984e-07, + "loss": 0.0008, + "step": 23525 + }, + { + "epoch": 0.46, + "learning_rate": 1.088346083647237e-07, + "loss": 0.122, + "step": 23526 + }, + { + "epoch": 0.46, + "learning_rate": 1.0883072502038755e-07, + "loss": 0.0006, + "step": 23527 + }, + { + "epoch": 0.46, + "learning_rate": 1.0882684167605141e-07, + "loss": 1.0222, + "step": 23528 + }, + { + "epoch": 0.46, + "learning_rate": 1.0882295833171527e-07, + "loss": 0.4678, + "step": 23529 + }, + { + "epoch": 0.46, + "learning_rate": 1.0881907498737913e-07, + "loss": 0.0006, + "step": 23530 + }, + { + "epoch": 0.46, + "learning_rate": 1.0881519164304299e-07, + "loss": 0.0025, + "step": 23531 + }, + { + "epoch": 0.46, + "learning_rate": 1.0881130829870684e-07, + "loss": 0.0006, + "step": 23532 + }, + { + "epoch": 0.46, + "learning_rate": 1.088074249543707e-07, + "loss": 0.0005, + "step": 23533 + }, + { + "epoch": 0.46, + "learning_rate": 1.0880354161003456e-07, + "loss": 0.0005, + "step": 23534 + }, + { + "epoch": 0.46, + "learning_rate": 1.0879965826569842e-07, + "loss": 0.2551, + "step": 23535 + }, + { + "epoch": 0.46, + "learning_rate": 1.0879577492136228e-07, + "loss": 0.0007, + "step": 23536 + }, + { + "epoch": 0.46, + "learning_rate": 1.0879189157702613e-07, + "loss": 0.0005, + "step": 23537 + }, + { + "epoch": 0.46, + "learning_rate": 1.0878800823268999e-07, + "loss": 0.0007, + "step": 23538 + }, + { + "epoch": 0.46, + "learning_rate": 1.0878412488835385e-07, + "loss": 0.0008, + "step": 23539 + }, + { + "epoch": 0.46, + "learning_rate": 1.0878024154401771e-07, + "loss": 0.0011, + "step": 23540 + }, + { + "epoch": 0.46, + "learning_rate": 1.0877635819968157e-07, + "loss": 0.0006, + "step": 23541 + }, + { + "epoch": 0.46, + "learning_rate": 1.0877247485534543e-07, + "loss": 0.0007, + "step": 23542 + }, + { + "epoch": 0.46, + "learning_rate": 1.0876859151100928e-07, + "loss": 0.0012, + "step": 23543 + }, + { + "epoch": 0.46, + "learning_rate": 1.0876470816667314e-07, + "loss": 0.5835, + "step": 23544 + }, + { + "epoch": 0.46, + "learning_rate": 1.0876082482233699e-07, + "loss": 1.2084, + "step": 23545 + }, + { + "epoch": 0.46, + "learning_rate": 1.0875694147800085e-07, + "loss": 0.0013, + "step": 23546 + }, + { + "epoch": 0.46, + "learning_rate": 1.087530581336647e-07, + "loss": 0.0007, + "step": 23547 + }, + { + "epoch": 0.46, + "learning_rate": 1.0874917478932856e-07, + "loss": 0.001, + "step": 23548 + }, + { + "epoch": 0.46, + "learning_rate": 1.0874529144499242e-07, + "loss": 0.0007, + "step": 23549 + }, + { + "epoch": 0.46, + "learning_rate": 1.0874140810065628e-07, + "loss": 0.0007, + "step": 23550 + }, + { + "epoch": 0.46, + "learning_rate": 1.0873752475632014e-07, + "loss": 0.0006, + "step": 23551 + }, + { + "epoch": 0.46, + "learning_rate": 1.08733641411984e-07, + "loss": 0.0012, + "step": 23552 + }, + { + "epoch": 0.46, + "learning_rate": 1.0872975806764785e-07, + "loss": 0.001, + "step": 23553 + }, + { + "epoch": 0.46, + "learning_rate": 1.0872587472331171e-07, + "loss": 0.0006, + "step": 23554 + }, + { + "epoch": 0.46, + "learning_rate": 1.0872199137897557e-07, + "loss": 0.0007, + "step": 23555 + }, + { + "epoch": 0.46, + "learning_rate": 1.0871810803463943e-07, + "loss": 0.9345, + "step": 23556 + }, + { + "epoch": 0.46, + "learning_rate": 1.0871422469030329e-07, + "loss": 0.0331, + "step": 23557 + }, + { + "epoch": 0.46, + "learning_rate": 1.0871034134596714e-07, + "loss": 0.0089, + "step": 23558 + }, + { + "epoch": 0.46, + "learning_rate": 1.08706458001631e-07, + "loss": 0.0006, + "step": 23559 + }, + { + "epoch": 0.46, + "learning_rate": 1.0870257465729486e-07, + "loss": 0.0016, + "step": 23560 + }, + { + "epoch": 0.46, + "learning_rate": 1.0869869131295872e-07, + "loss": 0.0007, + "step": 23561 + }, + { + "epoch": 0.46, + "learning_rate": 1.0869480796862258e-07, + "loss": 0.0008, + "step": 23562 + }, + { + "epoch": 0.46, + "learning_rate": 1.0869092462428644e-07, + "loss": 0.0008, + "step": 23563 + }, + { + "epoch": 0.46, + "learning_rate": 1.086870412799503e-07, + "loss": 0.4995, + "step": 23564 + }, + { + "epoch": 0.46, + "learning_rate": 1.0868315793561415e-07, + "loss": 0.0016, + "step": 23565 + }, + { + "epoch": 0.46, + "learning_rate": 1.0867927459127801e-07, + "loss": 0.0007, + "step": 23566 + }, + { + "epoch": 0.46, + "learning_rate": 1.0867539124694187e-07, + "loss": 0.0019, + "step": 23567 + }, + { + "epoch": 0.46, + "learning_rate": 1.0867150790260573e-07, + "loss": 0.0005, + "step": 23568 + }, + { + "epoch": 0.46, + "learning_rate": 1.0866762455826957e-07, + "loss": 1.2158, + "step": 23569 + }, + { + "epoch": 0.46, + "learning_rate": 1.0866374121393343e-07, + "loss": 0.0007, + "step": 23570 + }, + { + "epoch": 0.46, + "learning_rate": 1.0865985786959729e-07, + "loss": 0.0005, + "step": 23571 + }, + { + "epoch": 0.46, + "learning_rate": 1.0865597452526115e-07, + "loss": 0.0007, + "step": 23572 + }, + { + "epoch": 0.46, + "learning_rate": 1.08652091180925e-07, + "loss": 0.0006, + "step": 23573 + }, + { + "epoch": 0.46, + "learning_rate": 1.0864820783658885e-07, + "loss": 0.0006, + "step": 23574 + }, + { + "epoch": 0.46, + "learning_rate": 1.0864432449225271e-07, + "loss": 1.1625, + "step": 23575 + }, + { + "epoch": 0.46, + "learning_rate": 1.0864044114791657e-07, + "loss": 0.1914, + "step": 23576 + }, + { + "epoch": 0.46, + "learning_rate": 1.0863655780358042e-07, + "loss": 0.0011, + "step": 23577 + }, + { + "epoch": 0.46, + "learning_rate": 1.0863267445924428e-07, + "loss": 0.0006, + "step": 23578 + }, + { + "epoch": 0.46, + "learning_rate": 1.0862879111490814e-07, + "loss": 0.0005, + "step": 23579 + }, + { + "epoch": 0.46, + "learning_rate": 1.08624907770572e-07, + "loss": 0.0008, + "step": 23580 + }, + { + "epoch": 0.46, + "learning_rate": 1.0862102442623586e-07, + "loss": 0.0005, + "step": 23581 + }, + { + "epoch": 0.46, + "learning_rate": 1.0861714108189972e-07, + "loss": 0.0006, + "step": 23582 + }, + { + "epoch": 0.46, + "learning_rate": 1.0861325773756357e-07, + "loss": 0.0013, + "step": 23583 + }, + { + "epoch": 0.46, + "learning_rate": 1.0860937439322743e-07, + "loss": 0.2285, + "step": 23584 + }, + { + "epoch": 0.46, + "learning_rate": 1.0860549104889129e-07, + "loss": 0.0005, + "step": 23585 + }, + { + "epoch": 0.46, + "learning_rate": 1.0860160770455515e-07, + "loss": 0.0008, + "step": 23586 + }, + { + "epoch": 0.46, + "learning_rate": 1.0859772436021901e-07, + "loss": 1.0006, + "step": 23587 + }, + { + "epoch": 0.46, + "learning_rate": 1.0859384101588287e-07, + "loss": 0.0011, + "step": 23588 + }, + { + "epoch": 0.46, + "learning_rate": 1.0858995767154672e-07, + "loss": 0.0006, + "step": 23589 + }, + { + "epoch": 0.46, + "learning_rate": 1.0858607432721058e-07, + "loss": 0.0005, + "step": 23590 + }, + { + "epoch": 0.46, + "learning_rate": 1.0858219098287444e-07, + "loss": 0.0008, + "step": 23591 + }, + { + "epoch": 0.46, + "learning_rate": 1.085783076385383e-07, + "loss": 0.0007, + "step": 23592 + }, + { + "epoch": 0.46, + "learning_rate": 1.0857442429420216e-07, + "loss": 0.0008, + "step": 23593 + }, + { + "epoch": 0.46, + "learning_rate": 1.0857054094986601e-07, + "loss": 0.0006, + "step": 23594 + }, + { + "epoch": 0.46, + "learning_rate": 1.0856665760552987e-07, + "loss": 0.001, + "step": 23595 + }, + { + "epoch": 0.46, + "learning_rate": 1.0856277426119373e-07, + "loss": 0.0014, + "step": 23596 + }, + { + "epoch": 0.46, + "learning_rate": 1.0855889091685759e-07, + "loss": 0.0008, + "step": 23597 + }, + { + "epoch": 0.46, + "learning_rate": 1.0855500757252145e-07, + "loss": 0.0006, + "step": 23598 + }, + { + "epoch": 0.46, + "learning_rate": 1.085511242281853e-07, + "loss": 0.0027, + "step": 23599 + }, + { + "epoch": 0.46, + "learning_rate": 1.0854724088384916e-07, + "loss": 0.0006, + "step": 23600 + }, + { + "epoch": 0.46, + "learning_rate": 1.0854335753951302e-07, + "loss": 0.0008, + "step": 23601 + }, + { + "epoch": 0.46, + "learning_rate": 1.0853947419517688e-07, + "loss": 1.1345, + "step": 23602 + }, + { + "epoch": 0.46, + "learning_rate": 1.0853559085084074e-07, + "loss": 0.0006, + "step": 23603 + }, + { + "epoch": 0.46, + "learning_rate": 1.085317075065046e-07, + "loss": 0.0005, + "step": 23604 + }, + { + "epoch": 0.46, + "learning_rate": 1.0852782416216846e-07, + "loss": 0.004, + "step": 23605 + }, + { + "epoch": 0.46, + "learning_rate": 1.0852394081783231e-07, + "loss": 0.0005, + "step": 23606 + }, + { + "epoch": 0.46, + "learning_rate": 1.0852005747349617e-07, + "loss": 0.6305, + "step": 23607 + }, + { + "epoch": 0.46, + "learning_rate": 1.0851617412916003e-07, + "loss": 0.0006, + "step": 23608 + }, + { + "epoch": 0.46, + "learning_rate": 1.0851229078482389e-07, + "loss": 0.0005, + "step": 23609 + }, + { + "epoch": 0.46, + "learning_rate": 1.0850840744048775e-07, + "loss": 0.0006, + "step": 23610 + }, + { + "epoch": 0.46, + "learning_rate": 1.085045240961516e-07, + "loss": 0.106, + "step": 23611 + }, + { + "epoch": 0.46, + "learning_rate": 1.0850064075181546e-07, + "loss": 0.0007, + "step": 23612 + }, + { + "epoch": 0.46, + "learning_rate": 1.0849675740747932e-07, + "loss": 0.0005, + "step": 23613 + }, + { + "epoch": 0.46, + "learning_rate": 1.0849287406314318e-07, + "loss": 0.0007, + "step": 23614 + }, + { + "epoch": 0.46, + "learning_rate": 1.0848899071880704e-07, + "loss": 0.0006, + "step": 23615 + }, + { + "epoch": 0.46, + "learning_rate": 1.084851073744709e-07, + "loss": 0.0004, + "step": 23616 + }, + { + "epoch": 0.46, + "learning_rate": 1.0848122403013475e-07, + "loss": 0.0007, + "step": 23617 + }, + { + "epoch": 0.46, + "learning_rate": 1.0847734068579861e-07, + "loss": 0.0006, + "step": 23618 + }, + { + "epoch": 0.46, + "learning_rate": 1.0847345734146247e-07, + "loss": 0.0007, + "step": 23619 + }, + { + "epoch": 0.46, + "learning_rate": 1.0846957399712633e-07, + "loss": 0.0007, + "step": 23620 + }, + { + "epoch": 0.46, + "learning_rate": 1.0846569065279019e-07, + "loss": 0.0006, + "step": 23621 + }, + { + "epoch": 0.46, + "learning_rate": 1.0846180730845405e-07, + "loss": 0.0007, + "step": 23622 + }, + { + "epoch": 0.46, + "learning_rate": 1.084579239641179e-07, + "loss": 0.0009, + "step": 23623 + }, + { + "epoch": 0.46, + "learning_rate": 1.0845404061978176e-07, + "loss": 0.0038, + "step": 23624 + }, + { + "epoch": 0.46, + "learning_rate": 1.0845015727544562e-07, + "loss": 0.0006, + "step": 23625 + }, + { + "epoch": 0.46, + "learning_rate": 1.0844627393110948e-07, + "loss": 0.4579, + "step": 23626 + }, + { + "epoch": 0.46, + "learning_rate": 1.0844239058677331e-07, + "loss": 0.0006, + "step": 23627 + }, + { + "epoch": 0.46, + "learning_rate": 1.0843850724243717e-07, + "loss": 0.0008, + "step": 23628 + }, + { + "epoch": 0.46, + "learning_rate": 1.0843462389810103e-07, + "loss": 0.0027, + "step": 23629 + }, + { + "epoch": 0.46, + "learning_rate": 1.0843074055376489e-07, + "loss": 0.0546, + "step": 23630 + }, + { + "epoch": 0.46, + "learning_rate": 1.0842685720942874e-07, + "loss": 0.0007, + "step": 23631 + }, + { + "epoch": 0.46, + "learning_rate": 1.084229738650926e-07, + "loss": 0.0008, + "step": 23632 + }, + { + "epoch": 0.46, + "learning_rate": 1.0841909052075646e-07, + "loss": 0.001, + "step": 23633 + }, + { + "epoch": 0.46, + "learning_rate": 1.0841520717642032e-07, + "loss": 0.0006, + "step": 23634 + }, + { + "epoch": 0.46, + "learning_rate": 1.0841132383208418e-07, + "loss": 0.0006, + "step": 23635 + }, + { + "epoch": 0.46, + "learning_rate": 1.0840744048774803e-07, + "loss": 0.0017, + "step": 23636 + }, + { + "epoch": 0.46, + "learning_rate": 1.0840355714341189e-07, + "loss": 0.0206, + "step": 23637 + }, + { + "epoch": 0.46, + "learning_rate": 1.0839967379907575e-07, + "loss": 0.0015, + "step": 23638 + }, + { + "epoch": 0.46, + "learning_rate": 1.0839579045473961e-07, + "loss": 0.0011, + "step": 23639 + }, + { + "epoch": 0.46, + "learning_rate": 1.0839190711040347e-07, + "loss": 1.1866, + "step": 23640 + }, + { + "epoch": 0.46, + "learning_rate": 1.0838802376606733e-07, + "loss": 0.0005, + "step": 23641 + }, + { + "epoch": 0.46, + "learning_rate": 1.0838414042173118e-07, + "loss": 0.0017, + "step": 23642 + }, + { + "epoch": 0.46, + "learning_rate": 1.0838025707739504e-07, + "loss": 0.0007, + "step": 23643 + }, + { + "epoch": 0.46, + "learning_rate": 1.083763737330589e-07, + "loss": 0.2909, + "step": 23644 + }, + { + "epoch": 0.46, + "learning_rate": 1.0837249038872276e-07, + "loss": 0.0008, + "step": 23645 + }, + { + "epoch": 0.46, + "learning_rate": 1.0836860704438662e-07, + "loss": 0.4798, + "step": 23646 + }, + { + "epoch": 0.46, + "learning_rate": 1.0836472370005048e-07, + "loss": 0.001, + "step": 23647 + }, + { + "epoch": 0.46, + "learning_rate": 1.0836084035571433e-07, + "loss": 0.0006, + "step": 23648 + }, + { + "epoch": 0.46, + "learning_rate": 1.0835695701137819e-07, + "loss": 0.0007, + "step": 23649 + }, + { + "epoch": 0.46, + "learning_rate": 1.0835307366704205e-07, + "loss": 0.0005, + "step": 23650 + }, + { + "epoch": 0.46, + "learning_rate": 1.0834919032270591e-07, + "loss": 0.0006, + "step": 23651 + }, + { + "epoch": 0.46, + "learning_rate": 1.0834530697836977e-07, + "loss": 0.0005, + "step": 23652 + }, + { + "epoch": 0.46, + "learning_rate": 1.0834142363403362e-07, + "loss": 0.0009, + "step": 23653 + }, + { + "epoch": 0.46, + "learning_rate": 1.0833754028969748e-07, + "loss": 0.0006, + "step": 23654 + }, + { + "epoch": 0.46, + "learning_rate": 1.0833365694536134e-07, + "loss": 0.0006, + "step": 23655 + }, + { + "epoch": 0.46, + "learning_rate": 1.083297736010252e-07, + "loss": 0.0006, + "step": 23656 + }, + { + "epoch": 0.46, + "learning_rate": 1.0832589025668906e-07, + "loss": 0.0011, + "step": 23657 + }, + { + "epoch": 0.46, + "learning_rate": 1.0832200691235292e-07, + "loss": 0.0005, + "step": 23658 + }, + { + "epoch": 0.46, + "learning_rate": 1.0831812356801677e-07, + "loss": 0.7739, + "step": 23659 + }, + { + "epoch": 0.46, + "learning_rate": 1.0831424022368063e-07, + "loss": 0.0006, + "step": 23660 + }, + { + "epoch": 0.46, + "learning_rate": 1.0831035687934449e-07, + "loss": 0.001, + "step": 23661 + }, + { + "epoch": 0.46, + "learning_rate": 1.0830647353500835e-07, + "loss": 0.1104, + "step": 23662 + }, + { + "epoch": 0.46, + "learning_rate": 1.0830259019067221e-07, + "loss": 0.0007, + "step": 23663 + }, + { + "epoch": 0.46, + "learning_rate": 1.0829870684633607e-07, + "loss": 0.0008, + "step": 23664 + }, + { + "epoch": 0.46, + "learning_rate": 1.0829482350199992e-07, + "loss": 0.0007, + "step": 23665 + }, + { + "epoch": 0.46, + "learning_rate": 1.0829094015766378e-07, + "loss": 0.0008, + "step": 23666 + }, + { + "epoch": 0.46, + "learning_rate": 1.0828705681332764e-07, + "loss": 0.9237, + "step": 23667 + }, + { + "epoch": 0.46, + "learning_rate": 1.082831734689915e-07, + "loss": 0.0035, + "step": 23668 + }, + { + "epoch": 0.46, + "learning_rate": 1.0827929012465536e-07, + "loss": 0.0006, + "step": 23669 + }, + { + "epoch": 0.46, + "learning_rate": 1.0827540678031922e-07, + "loss": 0.0009, + "step": 23670 + }, + { + "epoch": 0.46, + "learning_rate": 1.0827152343598307e-07, + "loss": 0.1105, + "step": 23671 + }, + { + "epoch": 0.46, + "learning_rate": 1.0826764009164693e-07, + "loss": 0.0007, + "step": 23672 + }, + { + "epoch": 0.46, + "learning_rate": 1.0826375674731079e-07, + "loss": 0.0644, + "step": 23673 + }, + { + "epoch": 0.46, + "learning_rate": 1.0825987340297465e-07, + "loss": 0.0006, + "step": 23674 + }, + { + "epoch": 0.46, + "learning_rate": 1.082559900586385e-07, + "loss": 0.0005, + "step": 23675 + }, + { + "epoch": 0.46, + "learning_rate": 1.0825210671430236e-07, + "loss": 0.0007, + "step": 23676 + }, + { + "epoch": 0.46, + "learning_rate": 1.0824822336996622e-07, + "loss": 1.277, + "step": 23677 + }, + { + "epoch": 0.46, + "learning_rate": 1.0824434002563008e-07, + "loss": 0.0006, + "step": 23678 + }, + { + "epoch": 0.46, + "learning_rate": 1.0824045668129394e-07, + "loss": 1.7934, + "step": 23679 + }, + { + "epoch": 0.46, + "learning_rate": 1.082365733369578e-07, + "loss": 0.0587, + "step": 23680 + }, + { + "epoch": 0.46, + "learning_rate": 1.0823268999262166e-07, + "loss": 0.0005, + "step": 23681 + }, + { + "epoch": 0.46, + "learning_rate": 1.0822880664828551e-07, + "loss": 0.0006, + "step": 23682 + }, + { + "epoch": 0.46, + "learning_rate": 1.0822492330394937e-07, + "loss": 0.0006, + "step": 23683 + }, + { + "epoch": 0.46, + "learning_rate": 1.0822103995961323e-07, + "loss": 0.0007, + "step": 23684 + }, + { + "epoch": 0.46, + "learning_rate": 1.0821715661527706e-07, + "loss": 0.0023, + "step": 23685 + }, + { + "epoch": 0.46, + "learning_rate": 1.0821327327094092e-07, + "loss": 1.2427, + "step": 23686 + }, + { + "epoch": 0.46, + "learning_rate": 1.0820938992660478e-07, + "loss": 0.0011, + "step": 23687 + }, + { + "epoch": 0.46, + "learning_rate": 1.0820550658226864e-07, + "loss": 0.0588, + "step": 23688 + }, + { + "epoch": 0.46, + "learning_rate": 1.082016232379325e-07, + "loss": 0.0009, + "step": 23689 + }, + { + "epoch": 0.46, + "learning_rate": 1.0819773989359635e-07, + "loss": 0.0009, + "step": 23690 + }, + { + "epoch": 0.46, + "learning_rate": 1.0819385654926021e-07, + "loss": 0.0035, + "step": 23691 + }, + { + "epoch": 0.46, + "learning_rate": 1.0818997320492407e-07, + "loss": 0.0005, + "step": 23692 + }, + { + "epoch": 0.46, + "learning_rate": 1.0818608986058793e-07, + "loss": 0.0005, + "step": 23693 + }, + { + "epoch": 0.46, + "learning_rate": 1.0818220651625179e-07, + "loss": 0.1101, + "step": 23694 + }, + { + "epoch": 0.46, + "learning_rate": 1.0817832317191564e-07, + "loss": 0.0015, + "step": 23695 + }, + { + "epoch": 0.46, + "learning_rate": 1.081744398275795e-07, + "loss": 0.0006, + "step": 23696 + }, + { + "epoch": 0.46, + "learning_rate": 1.0817055648324336e-07, + "loss": 0.0007, + "step": 23697 + }, + { + "epoch": 0.46, + "learning_rate": 1.0816667313890722e-07, + "loss": 0.0032, + "step": 23698 + }, + { + "epoch": 0.46, + "learning_rate": 1.0816278979457108e-07, + "loss": 0.001, + "step": 23699 + }, + { + "epoch": 0.46, + "learning_rate": 1.0815890645023494e-07, + "loss": 0.0174, + "step": 23700 + }, + { + "epoch": 0.46, + "learning_rate": 1.081550231058988e-07, + "loss": 0.0007, + "step": 23701 + }, + { + "epoch": 0.46, + "learning_rate": 1.0815113976156265e-07, + "loss": 0.0009, + "step": 23702 + }, + { + "epoch": 0.46, + "learning_rate": 1.0814725641722651e-07, + "loss": 1.0756, + "step": 23703 + }, + { + "epoch": 0.46, + "learning_rate": 1.0814337307289037e-07, + "loss": 0.6508, + "step": 23704 + }, + { + "epoch": 0.46, + "learning_rate": 1.0813948972855423e-07, + "loss": 0.0006, + "step": 23705 + }, + { + "epoch": 0.46, + "learning_rate": 1.0813560638421809e-07, + "loss": 0.0005, + "step": 23706 + }, + { + "epoch": 0.46, + "learning_rate": 1.0813172303988194e-07, + "loss": 1.1675, + "step": 23707 + }, + { + "epoch": 0.46, + "learning_rate": 1.081278396955458e-07, + "loss": 0.0022, + "step": 23708 + }, + { + "epoch": 0.46, + "learning_rate": 1.0812395635120966e-07, + "loss": 0.002, + "step": 23709 + }, + { + "epoch": 0.46, + "learning_rate": 1.0812007300687352e-07, + "loss": 0.001, + "step": 23710 + }, + { + "epoch": 0.46, + "learning_rate": 1.0811618966253738e-07, + "loss": 0.0204, + "step": 23711 + }, + { + "epoch": 0.46, + "learning_rate": 1.0811230631820123e-07, + "loss": 0.0005, + "step": 23712 + }, + { + "epoch": 0.46, + "learning_rate": 1.0810842297386509e-07, + "loss": 0.0007, + "step": 23713 + }, + { + "epoch": 0.46, + "learning_rate": 1.0810453962952895e-07, + "loss": 0.7443, + "step": 23714 + }, + { + "epoch": 0.46, + "learning_rate": 1.0810065628519281e-07, + "loss": 0.0014, + "step": 23715 + }, + { + "epoch": 0.46, + "learning_rate": 1.0809677294085667e-07, + "loss": 0.002, + "step": 23716 + }, + { + "epoch": 0.46, + "learning_rate": 1.0809288959652053e-07, + "loss": 0.0004, + "step": 23717 + }, + { + "epoch": 0.46, + "learning_rate": 1.0808900625218438e-07, + "loss": 0.0005, + "step": 23718 + }, + { + "epoch": 0.46, + "learning_rate": 1.0808512290784824e-07, + "loss": 0.1315, + "step": 23719 + }, + { + "epoch": 0.46, + "learning_rate": 1.080812395635121e-07, + "loss": 0.0006, + "step": 23720 + }, + { + "epoch": 0.46, + "learning_rate": 1.0807735621917596e-07, + "loss": 0.0004, + "step": 23721 + }, + { + "epoch": 0.46, + "learning_rate": 1.080734728748398e-07, + "loss": 0.0005, + "step": 23722 + }, + { + "epoch": 0.46, + "learning_rate": 1.0806958953050366e-07, + "loss": 0.0006, + "step": 23723 + }, + { + "epoch": 0.46, + "learning_rate": 1.0806570618616752e-07, + "loss": 0.0028, + "step": 23724 + }, + { + "epoch": 0.46, + "learning_rate": 1.0806182284183138e-07, + "loss": 0.0005, + "step": 23725 + }, + { + "epoch": 0.46, + "learning_rate": 1.0805793949749524e-07, + "loss": 0.0006, + "step": 23726 + }, + { + "epoch": 0.46, + "learning_rate": 1.080540561531591e-07, + "loss": 0.0008, + "step": 23727 + }, + { + "epoch": 0.46, + "learning_rate": 1.0805017280882295e-07, + "loss": 0.0007, + "step": 23728 + }, + { + "epoch": 0.46, + "learning_rate": 1.0804628946448681e-07, + "loss": 0.0006, + "step": 23729 + }, + { + "epoch": 0.46, + "learning_rate": 1.0804240612015067e-07, + "loss": 0.0007, + "step": 23730 + }, + { + "epoch": 0.46, + "learning_rate": 1.0803852277581453e-07, + "loss": 0.0075, + "step": 23731 + }, + { + "epoch": 0.46, + "learning_rate": 1.0803463943147839e-07, + "loss": 0.0266, + "step": 23732 + }, + { + "epoch": 0.46, + "learning_rate": 1.0803075608714224e-07, + "loss": 0.0006, + "step": 23733 + }, + { + "epoch": 0.46, + "learning_rate": 1.080268727428061e-07, + "loss": 0.0006, + "step": 23734 + }, + { + "epoch": 0.46, + "learning_rate": 1.0802298939846996e-07, + "loss": 0.001, + "step": 23735 + }, + { + "epoch": 0.46, + "learning_rate": 1.0801910605413382e-07, + "loss": 0.0075, + "step": 23736 + }, + { + "epoch": 0.46, + "learning_rate": 1.0801522270979768e-07, + "loss": 0.1113, + "step": 23737 + }, + { + "epoch": 0.46, + "learning_rate": 1.0801133936546154e-07, + "loss": 0.0037, + "step": 23738 + }, + { + "epoch": 0.46, + "learning_rate": 1.080074560211254e-07, + "loss": 0.3056, + "step": 23739 + }, + { + "epoch": 0.46, + "learning_rate": 1.0800357267678925e-07, + "loss": 0.0352, + "step": 23740 + }, + { + "epoch": 0.46, + "learning_rate": 1.0799968933245311e-07, + "loss": 0.0025, + "step": 23741 + }, + { + "epoch": 0.46, + "learning_rate": 1.0799580598811697e-07, + "loss": 0.4198, + "step": 23742 + }, + { + "epoch": 0.46, + "learning_rate": 1.0799192264378081e-07, + "loss": 0.0007, + "step": 23743 + }, + { + "epoch": 0.46, + "learning_rate": 1.0798803929944467e-07, + "loss": 0.001, + "step": 23744 + }, + { + "epoch": 0.46, + "learning_rate": 1.0798415595510853e-07, + "loss": 0.0007, + "step": 23745 + }, + { + "epoch": 0.46, + "learning_rate": 1.0798027261077239e-07, + "loss": 0.0006, + "step": 23746 + }, + { + "epoch": 0.46, + "learning_rate": 1.0797638926643625e-07, + "loss": 0.0008, + "step": 23747 + }, + { + "epoch": 0.46, + "learning_rate": 1.079725059221001e-07, + "loss": 0.0006, + "step": 23748 + }, + { + "epoch": 0.46, + "learning_rate": 1.0796862257776396e-07, + "loss": 0.0234, + "step": 23749 + }, + { + "epoch": 0.46, + "learning_rate": 1.0796473923342782e-07, + "loss": 0.0006, + "step": 23750 + }, + { + "epoch": 0.46, + "learning_rate": 1.0796085588909167e-07, + "loss": 0.1614, + "step": 23751 + }, + { + "epoch": 0.46, + "learning_rate": 1.0795697254475552e-07, + "loss": 0.0096, + "step": 23752 + }, + { + "epoch": 0.46, + "learning_rate": 1.0795308920041938e-07, + "loss": 0.0006, + "step": 23753 + }, + { + "epoch": 0.46, + "learning_rate": 1.0794920585608324e-07, + "loss": 0.0005, + "step": 23754 + }, + { + "epoch": 0.46, + "learning_rate": 1.079453225117471e-07, + "loss": 0.0311, + "step": 23755 + }, + { + "epoch": 0.46, + "learning_rate": 1.0794143916741096e-07, + "loss": 0.0006, + "step": 23756 + }, + { + "epoch": 0.46, + "learning_rate": 1.0793755582307482e-07, + "loss": 0.0007, + "step": 23757 + }, + { + "epoch": 0.46, + "learning_rate": 1.0793367247873867e-07, + "loss": 0.1548, + "step": 23758 + }, + { + "epoch": 0.46, + "learning_rate": 1.0792978913440253e-07, + "loss": 0.0006, + "step": 23759 + }, + { + "epoch": 0.46, + "learning_rate": 1.0792590579006639e-07, + "loss": 0.0078, + "step": 23760 + }, + { + "epoch": 0.46, + "learning_rate": 1.0792202244573025e-07, + "loss": 0.9641, + "step": 23761 + }, + { + "epoch": 0.46, + "learning_rate": 1.0791813910139411e-07, + "loss": 0.0062, + "step": 23762 + }, + { + "epoch": 0.46, + "learning_rate": 1.0791425575705797e-07, + "loss": 0.0007, + "step": 23763 + }, + { + "epoch": 0.46, + "learning_rate": 1.0791037241272182e-07, + "loss": 0.0014, + "step": 23764 + }, + { + "epoch": 0.46, + "learning_rate": 1.0790648906838568e-07, + "loss": 0.0005, + "step": 23765 + }, + { + "epoch": 0.46, + "learning_rate": 1.0790260572404954e-07, + "loss": 0.0056, + "step": 23766 + }, + { + "epoch": 0.46, + "learning_rate": 1.078987223797134e-07, + "loss": 0.0006, + "step": 23767 + }, + { + "epoch": 0.46, + "learning_rate": 1.0789483903537726e-07, + "loss": 0.0005, + "step": 23768 + }, + { + "epoch": 0.46, + "learning_rate": 1.0789095569104112e-07, + "loss": 0.4159, + "step": 23769 + }, + { + "epoch": 0.46, + "learning_rate": 1.0788707234670497e-07, + "loss": 0.0006, + "step": 23770 + }, + { + "epoch": 0.46, + "learning_rate": 1.0788318900236883e-07, + "loss": 0.0005, + "step": 23771 + }, + { + "epoch": 0.46, + "learning_rate": 1.0787930565803269e-07, + "loss": 0.0011, + "step": 23772 + }, + { + "epoch": 0.46, + "learning_rate": 1.0787542231369655e-07, + "loss": 0.0005, + "step": 23773 + }, + { + "epoch": 0.46, + "learning_rate": 1.078715389693604e-07, + "loss": 0.0007, + "step": 23774 + }, + { + "epoch": 0.46, + "learning_rate": 1.0786765562502426e-07, + "loss": 0.0005, + "step": 23775 + }, + { + "epoch": 0.46, + "learning_rate": 1.0786377228068812e-07, + "loss": 0.0006, + "step": 23776 + }, + { + "epoch": 0.46, + "learning_rate": 1.0785988893635198e-07, + "loss": 0.0009, + "step": 23777 + }, + { + "epoch": 0.46, + "learning_rate": 1.0785600559201584e-07, + "loss": 0.0009, + "step": 23778 + }, + { + "epoch": 0.46, + "learning_rate": 1.078521222476797e-07, + "loss": 0.5543, + "step": 23779 + }, + { + "epoch": 0.46, + "learning_rate": 1.0784823890334356e-07, + "loss": 0.0005, + "step": 23780 + }, + { + "epoch": 0.46, + "learning_rate": 1.0784435555900741e-07, + "loss": 0.0006, + "step": 23781 + }, + { + "epoch": 0.46, + "learning_rate": 1.0784047221467127e-07, + "loss": 0.0056, + "step": 23782 + }, + { + "epoch": 0.46, + "learning_rate": 1.0783658887033513e-07, + "loss": 0.0077, + "step": 23783 + }, + { + "epoch": 0.46, + "learning_rate": 1.0783270552599899e-07, + "loss": 0.0007, + "step": 23784 + }, + { + "epoch": 0.46, + "learning_rate": 1.0782882218166285e-07, + "loss": 0.0006, + "step": 23785 + }, + { + "epoch": 0.46, + "learning_rate": 1.078249388373267e-07, + "loss": 0.0069, + "step": 23786 + }, + { + "epoch": 0.46, + "learning_rate": 1.0782105549299056e-07, + "loss": 0.0008, + "step": 23787 + }, + { + "epoch": 0.46, + "learning_rate": 1.0781717214865442e-07, + "loss": 0.0005, + "step": 23788 + }, + { + "epoch": 0.46, + "learning_rate": 1.0781328880431828e-07, + "loss": 0.0008, + "step": 23789 + }, + { + "epoch": 0.46, + "learning_rate": 1.0780940545998214e-07, + "loss": 0.0007, + "step": 23790 + }, + { + "epoch": 0.46, + "learning_rate": 1.07805522115646e-07, + "loss": 0.0007, + "step": 23791 + }, + { + "epoch": 0.46, + "learning_rate": 1.0780163877130985e-07, + "loss": 0.0124, + "step": 23792 + }, + { + "epoch": 0.46, + "learning_rate": 1.0779775542697371e-07, + "loss": 0.0007, + "step": 23793 + }, + { + "epoch": 0.46, + "learning_rate": 1.0779387208263757e-07, + "loss": 0.0035, + "step": 23794 + }, + { + "epoch": 0.46, + "learning_rate": 1.0778998873830143e-07, + "loss": 0.0649, + "step": 23795 + }, + { + "epoch": 0.46, + "learning_rate": 1.0778610539396529e-07, + "loss": 0.0007, + "step": 23796 + }, + { + "epoch": 0.46, + "learning_rate": 1.0778222204962915e-07, + "loss": 0.0015, + "step": 23797 + }, + { + "epoch": 0.46, + "learning_rate": 1.07778338705293e-07, + "loss": 0.0006, + "step": 23798 + }, + { + "epoch": 0.46, + "learning_rate": 1.0777445536095686e-07, + "loss": 0.0006, + "step": 23799 + }, + { + "epoch": 0.46, + "learning_rate": 1.0777057201662072e-07, + "loss": 0.0035, + "step": 23800 + }, + { + "epoch": 0.46, + "learning_rate": 1.0776668867228455e-07, + "loss": 0.0006, + "step": 23801 + }, + { + "epoch": 0.46, + "learning_rate": 1.0776280532794841e-07, + "loss": 0.5996, + "step": 23802 + }, + { + "epoch": 0.46, + "learning_rate": 1.0775892198361227e-07, + "loss": 0.0007, + "step": 23803 + }, + { + "epoch": 0.46, + "learning_rate": 1.0775503863927613e-07, + "loss": 0.0007, + "step": 23804 + }, + { + "epoch": 0.46, + "learning_rate": 1.0775115529493999e-07, + "loss": 0.0005, + "step": 23805 + }, + { + "epoch": 0.46, + "learning_rate": 1.0774727195060384e-07, + "loss": 0.001, + "step": 23806 + }, + { + "epoch": 0.46, + "learning_rate": 1.077433886062677e-07, + "loss": 0.0008, + "step": 23807 + }, + { + "epoch": 0.46, + "learning_rate": 1.0773950526193156e-07, + "loss": 0.0041, + "step": 23808 + }, + { + "epoch": 0.46, + "learning_rate": 1.0773562191759542e-07, + "loss": 0.387, + "step": 23809 + }, + { + "epoch": 0.46, + "learning_rate": 1.0773173857325928e-07, + "loss": 0.0009, + "step": 23810 + }, + { + "epoch": 0.46, + "learning_rate": 1.0772785522892313e-07, + "loss": 1.4429, + "step": 23811 + }, + { + "epoch": 0.46, + "learning_rate": 1.0772397188458699e-07, + "loss": 0.0012, + "step": 23812 + }, + { + "epoch": 0.46, + "learning_rate": 1.0772008854025085e-07, + "loss": 0.001, + "step": 23813 + }, + { + "epoch": 0.46, + "learning_rate": 1.0771620519591471e-07, + "loss": 0.0006, + "step": 23814 + }, + { + "epoch": 0.46, + "learning_rate": 1.0771232185157857e-07, + "loss": 0.0005, + "step": 23815 + }, + { + "epoch": 0.46, + "learning_rate": 1.0770843850724243e-07, + "loss": 0.0007, + "step": 23816 + }, + { + "epoch": 0.46, + "learning_rate": 1.0770455516290628e-07, + "loss": 0.001, + "step": 23817 + }, + { + "epoch": 0.46, + "learning_rate": 1.0770067181857014e-07, + "loss": 0.0006, + "step": 23818 + }, + { + "epoch": 0.46, + "learning_rate": 1.07696788474234e-07, + "loss": 0.0006, + "step": 23819 + }, + { + "epoch": 0.46, + "learning_rate": 1.0769290512989786e-07, + "loss": 0.5078, + "step": 23820 + }, + { + "epoch": 0.46, + "learning_rate": 1.0768902178556172e-07, + "loss": 0.3088, + "step": 23821 + }, + { + "epoch": 0.46, + "learning_rate": 1.0768513844122558e-07, + "loss": 0.0007, + "step": 23822 + }, + { + "epoch": 0.46, + "learning_rate": 1.0768125509688943e-07, + "loss": 0.3508, + "step": 23823 + }, + { + "epoch": 0.46, + "learning_rate": 1.0767737175255329e-07, + "loss": 0.7867, + "step": 23824 + }, + { + "epoch": 0.46, + "learning_rate": 1.0767348840821715e-07, + "loss": 0.0249, + "step": 23825 + }, + { + "epoch": 0.46, + "learning_rate": 1.0766960506388101e-07, + "loss": 0.666, + "step": 23826 + }, + { + "epoch": 0.46, + "learning_rate": 1.0766572171954487e-07, + "loss": 0.0004, + "step": 23827 + }, + { + "epoch": 0.46, + "learning_rate": 1.0766183837520872e-07, + "loss": 0.0008, + "step": 23828 + }, + { + "epoch": 0.46, + "learning_rate": 1.0765795503087258e-07, + "loss": 0.0017, + "step": 23829 + }, + { + "epoch": 0.46, + "learning_rate": 1.0765407168653644e-07, + "loss": 0.0006, + "step": 23830 + }, + { + "epoch": 0.46, + "learning_rate": 1.076501883422003e-07, + "loss": 0.0008, + "step": 23831 + }, + { + "epoch": 0.46, + "learning_rate": 1.0764630499786416e-07, + "loss": 0.5744, + "step": 23832 + }, + { + "epoch": 0.46, + "learning_rate": 1.0764242165352802e-07, + "loss": 0.1411, + "step": 23833 + }, + { + "epoch": 0.46, + "learning_rate": 1.0763853830919187e-07, + "loss": 0.0007, + "step": 23834 + }, + { + "epoch": 0.46, + "learning_rate": 1.0763465496485573e-07, + "loss": 0.0006, + "step": 23835 + }, + { + "epoch": 0.46, + "learning_rate": 1.0763077162051959e-07, + "loss": 0.0004, + "step": 23836 + }, + { + "epoch": 0.46, + "learning_rate": 1.0762688827618345e-07, + "loss": 0.0016, + "step": 23837 + }, + { + "epoch": 0.46, + "learning_rate": 1.0762300493184731e-07, + "loss": 0.0007, + "step": 23838 + }, + { + "epoch": 0.46, + "learning_rate": 1.0761912158751117e-07, + "loss": 0.0005, + "step": 23839 + }, + { + "epoch": 0.46, + "learning_rate": 1.0761523824317502e-07, + "loss": 0.0007, + "step": 23840 + }, + { + "epoch": 0.46, + "learning_rate": 1.0761135489883888e-07, + "loss": 0.0007, + "step": 23841 + }, + { + "epoch": 0.46, + "learning_rate": 1.0760747155450274e-07, + "loss": 0.0006, + "step": 23842 + }, + { + "epoch": 0.46, + "learning_rate": 1.076035882101666e-07, + "loss": 0.0006, + "step": 23843 + }, + { + "epoch": 0.46, + "learning_rate": 1.0759970486583046e-07, + "loss": 0.0007, + "step": 23844 + }, + { + "epoch": 0.46, + "learning_rate": 1.0759582152149432e-07, + "loss": 1.0834, + "step": 23845 + }, + { + "epoch": 0.46, + "learning_rate": 1.0759193817715817e-07, + "loss": 0.0008, + "step": 23846 + }, + { + "epoch": 0.46, + "learning_rate": 1.0758805483282203e-07, + "loss": 0.0006, + "step": 23847 + }, + { + "epoch": 0.46, + "learning_rate": 1.0758417148848589e-07, + "loss": 0.0009, + "step": 23848 + }, + { + "epoch": 0.46, + "learning_rate": 1.0758028814414975e-07, + "loss": 0.01, + "step": 23849 + }, + { + "epoch": 0.46, + "learning_rate": 1.075764047998136e-07, + "loss": 0.0006, + "step": 23850 + }, + { + "epoch": 0.46, + "learning_rate": 1.0757252145547746e-07, + "loss": 0.0006, + "step": 23851 + }, + { + "epoch": 0.46, + "learning_rate": 1.0756863811114132e-07, + "loss": 0.0011, + "step": 23852 + }, + { + "epoch": 0.46, + "learning_rate": 1.0756475476680518e-07, + "loss": 0.0015, + "step": 23853 + }, + { + "epoch": 0.46, + "learning_rate": 1.0756087142246904e-07, + "loss": 0.0019, + "step": 23854 + }, + { + "epoch": 0.46, + "learning_rate": 1.075569880781329e-07, + "loss": 0.0007, + "step": 23855 + }, + { + "epoch": 0.46, + "learning_rate": 1.0755310473379676e-07, + "loss": 0.0005, + "step": 23856 + }, + { + "epoch": 0.46, + "learning_rate": 1.0754922138946061e-07, + "loss": 0.0007, + "step": 23857 + }, + { + "epoch": 0.46, + "learning_rate": 1.0754533804512447e-07, + "loss": 0.0007, + "step": 23858 + }, + { + "epoch": 0.46, + "learning_rate": 1.075414547007883e-07, + "loss": 0.0007, + "step": 23859 + }, + { + "epoch": 0.46, + "learning_rate": 1.0753757135645216e-07, + "loss": 0.0005, + "step": 23860 + }, + { + "epoch": 0.46, + "learning_rate": 1.0753368801211602e-07, + "loss": 0.6094, + "step": 23861 + }, + { + "epoch": 0.46, + "learning_rate": 1.0752980466777988e-07, + "loss": 0.0006, + "step": 23862 + }, + { + "epoch": 0.46, + "learning_rate": 1.0752592132344374e-07, + "loss": 0.0004, + "step": 23863 + }, + { + "epoch": 0.46, + "learning_rate": 1.075220379791076e-07, + "loss": 0.0007, + "step": 23864 + }, + { + "epoch": 0.46, + "learning_rate": 1.0751815463477145e-07, + "loss": 0.0932, + "step": 23865 + }, + { + "epoch": 0.46, + "learning_rate": 1.0751427129043531e-07, + "loss": 0.0004, + "step": 23866 + }, + { + "epoch": 0.46, + "learning_rate": 1.0751038794609917e-07, + "loss": 0.0008, + "step": 23867 + }, + { + "epoch": 0.46, + "learning_rate": 1.0750650460176303e-07, + "loss": 0.0008, + "step": 23868 + }, + { + "epoch": 0.46, + "learning_rate": 1.0750262125742689e-07, + "loss": 0.0007, + "step": 23869 + }, + { + "epoch": 0.46, + "learning_rate": 1.0749873791309074e-07, + "loss": 0.2849, + "step": 23870 + }, + { + "epoch": 0.46, + "learning_rate": 1.074948545687546e-07, + "loss": 0.0005, + "step": 23871 + }, + { + "epoch": 0.46, + "learning_rate": 1.0749097122441846e-07, + "loss": 0.0006, + "step": 23872 + }, + { + "epoch": 0.46, + "learning_rate": 1.0748708788008232e-07, + "loss": 0.0006, + "step": 23873 + }, + { + "epoch": 0.46, + "learning_rate": 1.0748320453574618e-07, + "loss": 0.0007, + "step": 23874 + }, + { + "epoch": 0.46, + "learning_rate": 1.0747932119141004e-07, + "loss": 0.2926, + "step": 23875 + }, + { + "epoch": 0.46, + "learning_rate": 1.074754378470739e-07, + "loss": 0.5217, + "step": 23876 + }, + { + "epoch": 0.46, + "learning_rate": 1.0747155450273775e-07, + "loss": 0.0006, + "step": 23877 + }, + { + "epoch": 0.46, + "learning_rate": 1.0746767115840161e-07, + "loss": 0.0005, + "step": 23878 + }, + { + "epoch": 0.46, + "learning_rate": 1.0746378781406547e-07, + "loss": 0.0006, + "step": 23879 + }, + { + "epoch": 0.46, + "learning_rate": 1.0745990446972933e-07, + "loss": 0.0008, + "step": 23880 + }, + { + "epoch": 0.46, + "learning_rate": 1.0745602112539319e-07, + "loss": 0.0007, + "step": 23881 + }, + { + "epoch": 0.46, + "learning_rate": 1.0745213778105704e-07, + "loss": 0.0013, + "step": 23882 + }, + { + "epoch": 0.46, + "learning_rate": 1.074482544367209e-07, + "loss": 0.0006, + "step": 23883 + }, + { + "epoch": 0.46, + "learning_rate": 1.0744437109238476e-07, + "loss": 0.0007, + "step": 23884 + }, + { + "epoch": 0.46, + "learning_rate": 1.0744048774804862e-07, + "loss": 0.0015, + "step": 23885 + }, + { + "epoch": 0.46, + "learning_rate": 1.0743660440371248e-07, + "loss": 0.0016, + "step": 23886 + }, + { + "epoch": 0.46, + "learning_rate": 1.0743272105937633e-07, + "loss": 0.2133, + "step": 23887 + }, + { + "epoch": 0.46, + "learning_rate": 1.0742883771504019e-07, + "loss": 0.0005, + "step": 23888 + }, + { + "epoch": 0.46, + "learning_rate": 1.0742495437070405e-07, + "loss": 0.0044, + "step": 23889 + }, + { + "epoch": 0.46, + "learning_rate": 1.0742107102636791e-07, + "loss": 0.9208, + "step": 23890 + }, + { + "epoch": 0.46, + "learning_rate": 1.0741718768203177e-07, + "loss": 0.0006, + "step": 23891 + }, + { + "epoch": 0.46, + "learning_rate": 1.0741330433769563e-07, + "loss": 0.0008, + "step": 23892 + }, + { + "epoch": 0.46, + "learning_rate": 1.0740942099335948e-07, + "loss": 0.0048, + "step": 23893 + }, + { + "epoch": 0.46, + "learning_rate": 1.0740553764902334e-07, + "loss": 0.0006, + "step": 23894 + }, + { + "epoch": 0.46, + "learning_rate": 1.074016543046872e-07, + "loss": 0.0006, + "step": 23895 + }, + { + "epoch": 0.46, + "learning_rate": 1.0739777096035106e-07, + "loss": 0.0006, + "step": 23896 + }, + { + "epoch": 0.46, + "learning_rate": 1.0739388761601492e-07, + "loss": 0.0007, + "step": 23897 + }, + { + "epoch": 0.46, + "learning_rate": 1.0739000427167878e-07, + "loss": 0.0006, + "step": 23898 + }, + { + "epoch": 0.46, + "learning_rate": 1.0738612092734262e-07, + "loss": 0.1335, + "step": 23899 + }, + { + "epoch": 0.46, + "learning_rate": 1.0738223758300648e-07, + "loss": 0.0005, + "step": 23900 + }, + { + "epoch": 0.46, + "learning_rate": 1.0737835423867034e-07, + "loss": 0.0005, + "step": 23901 + }, + { + "epoch": 0.46, + "learning_rate": 1.073744708943342e-07, + "loss": 1.1525, + "step": 23902 + }, + { + "epoch": 0.46, + "learning_rate": 1.0737058754999805e-07, + "loss": 0.0011, + "step": 23903 + }, + { + "epoch": 0.46, + "learning_rate": 1.0736670420566191e-07, + "loss": 0.0005, + "step": 23904 + }, + { + "epoch": 0.46, + "learning_rate": 1.0736282086132577e-07, + "loss": 0.0007, + "step": 23905 + }, + { + "epoch": 0.46, + "learning_rate": 1.0735893751698963e-07, + "loss": 0.0006, + "step": 23906 + }, + { + "epoch": 0.46, + "learning_rate": 1.0735505417265349e-07, + "loss": 0.0005, + "step": 23907 + }, + { + "epoch": 0.46, + "learning_rate": 1.0735117082831734e-07, + "loss": 0.8983, + "step": 23908 + }, + { + "epoch": 0.46, + "learning_rate": 1.073472874839812e-07, + "loss": 0.0004, + "step": 23909 + }, + { + "epoch": 0.46, + "learning_rate": 1.0734340413964506e-07, + "loss": 0.0012, + "step": 23910 + }, + { + "epoch": 0.46, + "learning_rate": 1.0733952079530892e-07, + "loss": 0.0007, + "step": 23911 + }, + { + "epoch": 0.46, + "learning_rate": 1.0733563745097278e-07, + "loss": 0.0007, + "step": 23912 + }, + { + "epoch": 0.46, + "learning_rate": 1.0733175410663664e-07, + "loss": 0.852, + "step": 23913 + }, + { + "epoch": 0.46, + "learning_rate": 1.073278707623005e-07, + "loss": 0.0005, + "step": 23914 + }, + { + "epoch": 0.46, + "learning_rate": 1.0732398741796435e-07, + "loss": 0.0012, + "step": 23915 + }, + { + "epoch": 0.46, + "learning_rate": 1.0732010407362821e-07, + "loss": 0.001, + "step": 23916 + }, + { + "epoch": 0.46, + "learning_rate": 1.0731622072929206e-07, + "loss": 0.0006, + "step": 23917 + }, + { + "epoch": 0.46, + "learning_rate": 1.0731233738495591e-07, + "loss": 0.0007, + "step": 23918 + }, + { + "epoch": 0.46, + "learning_rate": 1.0730845404061977e-07, + "loss": 0.0008, + "step": 23919 + }, + { + "epoch": 0.46, + "learning_rate": 1.0730457069628363e-07, + "loss": 0.0008, + "step": 23920 + }, + { + "epoch": 0.46, + "learning_rate": 1.0730068735194749e-07, + "loss": 0.0008, + "step": 23921 + }, + { + "epoch": 0.46, + "learning_rate": 1.0729680400761135e-07, + "loss": 0.0232, + "step": 23922 + }, + { + "epoch": 0.46, + "learning_rate": 1.072929206632752e-07, + "loss": 0.4252, + "step": 23923 + }, + { + "epoch": 0.46, + "learning_rate": 1.0728903731893906e-07, + "loss": 0.0007, + "step": 23924 + }, + { + "epoch": 0.46, + "learning_rate": 1.0728515397460292e-07, + "loss": 0.014, + "step": 23925 + }, + { + "epoch": 0.46, + "learning_rate": 1.0728127063026678e-07, + "loss": 0.0007, + "step": 23926 + }, + { + "epoch": 0.46, + "learning_rate": 1.0727738728593064e-07, + "loss": 0.0005, + "step": 23927 + }, + { + "epoch": 0.46, + "learning_rate": 1.0727350394159448e-07, + "loss": 0.0005, + "step": 23928 + }, + { + "epoch": 0.46, + "learning_rate": 1.0726962059725834e-07, + "loss": 0.0014, + "step": 23929 + }, + { + "epoch": 0.46, + "learning_rate": 1.072657372529222e-07, + "loss": 0.0013, + "step": 23930 + }, + { + "epoch": 0.46, + "learning_rate": 1.0726185390858606e-07, + "loss": 0.0006, + "step": 23931 + }, + { + "epoch": 0.46, + "learning_rate": 1.0725797056424992e-07, + "loss": 0.0371, + "step": 23932 + }, + { + "epoch": 0.46, + "learning_rate": 1.0725408721991377e-07, + "loss": 0.0081, + "step": 23933 + }, + { + "epoch": 0.46, + "learning_rate": 1.0725020387557763e-07, + "loss": 0.0007, + "step": 23934 + }, + { + "epoch": 0.46, + "learning_rate": 1.0724632053124149e-07, + "loss": 0.001, + "step": 23935 + }, + { + "epoch": 0.46, + "learning_rate": 1.0724243718690535e-07, + "loss": 0.001, + "step": 23936 + }, + { + "epoch": 0.46, + "learning_rate": 1.0723855384256921e-07, + "loss": 0.0022, + "step": 23937 + }, + { + "epoch": 0.46, + "learning_rate": 1.0723467049823307e-07, + "loss": 0.174, + "step": 23938 + }, + { + "epoch": 0.46, + "learning_rate": 1.0723078715389692e-07, + "loss": 0.5425, + "step": 23939 + }, + { + "epoch": 0.46, + "learning_rate": 1.0722690380956078e-07, + "loss": 0.0006, + "step": 23940 + }, + { + "epoch": 0.46, + "learning_rate": 1.0722302046522464e-07, + "loss": 0.0007, + "step": 23941 + }, + { + "epoch": 0.46, + "learning_rate": 1.072191371208885e-07, + "loss": 0.0008, + "step": 23942 + }, + { + "epoch": 0.46, + "learning_rate": 1.0721525377655236e-07, + "loss": 0.1302, + "step": 23943 + }, + { + "epoch": 0.46, + "learning_rate": 1.0721137043221622e-07, + "loss": 0.0006, + "step": 23944 + }, + { + "epoch": 0.46, + "learning_rate": 1.0720748708788007e-07, + "loss": 0.0006, + "step": 23945 + }, + { + "epoch": 0.46, + "learning_rate": 1.0720360374354393e-07, + "loss": 0.0007, + "step": 23946 + }, + { + "epoch": 0.46, + "learning_rate": 1.0719972039920779e-07, + "loss": 0.0005, + "step": 23947 + }, + { + "epoch": 0.46, + "learning_rate": 1.0719583705487165e-07, + "loss": 0.0011, + "step": 23948 + }, + { + "epoch": 0.46, + "learning_rate": 1.071919537105355e-07, + "loss": 0.3646, + "step": 23949 + }, + { + "epoch": 0.46, + "learning_rate": 1.0718807036619936e-07, + "loss": 0.002, + "step": 23950 + }, + { + "epoch": 0.46, + "learning_rate": 1.0718418702186322e-07, + "loss": 0.0006, + "step": 23951 + }, + { + "epoch": 0.46, + "learning_rate": 1.0718030367752708e-07, + "loss": 0.531, + "step": 23952 + }, + { + "epoch": 0.46, + "learning_rate": 1.0717642033319094e-07, + "loss": 0.0006, + "step": 23953 + }, + { + "epoch": 0.46, + "learning_rate": 1.071725369888548e-07, + "loss": 0.0084, + "step": 23954 + }, + { + "epoch": 0.46, + "learning_rate": 1.0716865364451866e-07, + "loss": 0.0006, + "step": 23955 + }, + { + "epoch": 0.46, + "learning_rate": 1.0716477030018251e-07, + "loss": 0.0299, + "step": 23956 + }, + { + "epoch": 0.46, + "learning_rate": 1.0716088695584637e-07, + "loss": 0.0006, + "step": 23957 + }, + { + "epoch": 0.46, + "learning_rate": 1.0715700361151023e-07, + "loss": 0.0006, + "step": 23958 + }, + { + "epoch": 0.46, + "learning_rate": 1.0715312026717409e-07, + "loss": 0.0006, + "step": 23959 + }, + { + "epoch": 0.46, + "learning_rate": 1.0714923692283795e-07, + "loss": 0.7841, + "step": 23960 + }, + { + "epoch": 0.46, + "learning_rate": 1.071453535785018e-07, + "loss": 0.0011, + "step": 23961 + }, + { + "epoch": 0.46, + "learning_rate": 1.0714147023416566e-07, + "loss": 0.0005, + "step": 23962 + }, + { + "epoch": 0.46, + "learning_rate": 1.0713758688982952e-07, + "loss": 0.0005, + "step": 23963 + }, + { + "epoch": 0.46, + "learning_rate": 1.0713370354549338e-07, + "loss": 1.2067, + "step": 23964 + }, + { + "epoch": 0.46, + "learning_rate": 1.0712982020115724e-07, + "loss": 0.4805, + "step": 23965 + }, + { + "epoch": 0.46, + "learning_rate": 1.071259368568211e-07, + "loss": 0.0553, + "step": 23966 + }, + { + "epoch": 0.46, + "learning_rate": 1.0712205351248495e-07, + "loss": 0.0008, + "step": 23967 + }, + { + "epoch": 0.46, + "learning_rate": 1.0711817016814881e-07, + "loss": 0.0121, + "step": 23968 + }, + { + "epoch": 0.46, + "learning_rate": 1.0711428682381267e-07, + "loss": 0.0008, + "step": 23969 + }, + { + "epoch": 0.46, + "learning_rate": 1.0711040347947653e-07, + "loss": 0.0037, + "step": 23970 + }, + { + "epoch": 0.46, + "learning_rate": 1.0710652013514039e-07, + "loss": 0.0008, + "step": 23971 + }, + { + "epoch": 0.47, + "learning_rate": 1.0710263679080425e-07, + "loss": 0.0007, + "step": 23972 + }, + { + "epoch": 0.47, + "learning_rate": 1.070987534464681e-07, + "loss": 0.0004, + "step": 23973 + }, + { + "epoch": 0.47, + "learning_rate": 1.0709487010213196e-07, + "loss": 0.0013, + "step": 23974 + }, + { + "epoch": 0.47, + "learning_rate": 1.070909867577958e-07, + "loss": 0.0005, + "step": 23975 + }, + { + "epoch": 0.47, + "learning_rate": 1.0708710341345965e-07, + "loss": 0.0007, + "step": 23976 + }, + { + "epoch": 0.47, + "learning_rate": 1.0708322006912351e-07, + "loss": 0.0007, + "step": 23977 + }, + { + "epoch": 0.47, + "learning_rate": 1.0707933672478737e-07, + "loss": 0.0006, + "step": 23978 + }, + { + "epoch": 0.47, + "learning_rate": 1.0707545338045123e-07, + "loss": 0.0006, + "step": 23979 + }, + { + "epoch": 0.47, + "learning_rate": 1.0707157003611509e-07, + "loss": 0.0009, + "step": 23980 + }, + { + "epoch": 0.47, + "learning_rate": 1.0706768669177894e-07, + "loss": 0.0007, + "step": 23981 + }, + { + "epoch": 0.47, + "learning_rate": 1.070638033474428e-07, + "loss": 0.0006, + "step": 23982 + }, + { + "epoch": 0.47, + "learning_rate": 1.0705992000310666e-07, + "loss": 0.0007, + "step": 23983 + }, + { + "epoch": 0.47, + "learning_rate": 1.0705603665877052e-07, + "loss": 0.001, + "step": 23984 + }, + { + "epoch": 0.47, + "learning_rate": 1.0705215331443438e-07, + "loss": 0.0041, + "step": 23985 + }, + { + "epoch": 0.47, + "learning_rate": 1.0704826997009823e-07, + "loss": 0.0007, + "step": 23986 + }, + { + "epoch": 0.47, + "learning_rate": 1.0704438662576209e-07, + "loss": 0.0005, + "step": 23987 + }, + { + "epoch": 0.47, + "learning_rate": 1.0704050328142595e-07, + "loss": 0.0006, + "step": 23988 + }, + { + "epoch": 0.47, + "learning_rate": 1.0703661993708981e-07, + "loss": 0.0007, + "step": 23989 + }, + { + "epoch": 0.47, + "learning_rate": 1.0703273659275367e-07, + "loss": 0.0806, + "step": 23990 + }, + { + "epoch": 0.47, + "learning_rate": 1.0702885324841753e-07, + "loss": 0.0006, + "step": 23991 + }, + { + "epoch": 0.47, + "learning_rate": 1.0702496990408138e-07, + "loss": 0.2828, + "step": 23992 + }, + { + "epoch": 0.47, + "learning_rate": 1.0702108655974524e-07, + "loss": 0.0007, + "step": 23993 + }, + { + "epoch": 0.47, + "learning_rate": 1.070172032154091e-07, + "loss": 0.0013, + "step": 23994 + }, + { + "epoch": 0.47, + "learning_rate": 1.0701331987107296e-07, + "loss": 0.0005, + "step": 23995 + }, + { + "epoch": 0.47, + "learning_rate": 1.0700943652673682e-07, + "loss": 0.0009, + "step": 23996 + }, + { + "epoch": 0.47, + "learning_rate": 1.0700555318240068e-07, + "loss": 0.0016, + "step": 23997 + }, + { + "epoch": 0.47, + "learning_rate": 1.0700166983806453e-07, + "loss": 0.0012, + "step": 23998 + }, + { + "epoch": 0.47, + "learning_rate": 1.0699778649372839e-07, + "loss": 0.0071, + "step": 23999 + }, + { + "epoch": 0.47, + "learning_rate": 1.0699390314939225e-07, + "loss": 0.0005, + "step": 24000 + }, + { + "epoch": 0.47, + "learning_rate": 1.0699001980505611e-07, + "loss": 0.0009, + "step": 24001 + }, + { + "epoch": 0.47, + "learning_rate": 1.0698613646071997e-07, + "loss": 0.0006, + "step": 24002 + }, + { + "epoch": 0.47, + "learning_rate": 1.0698225311638383e-07, + "loss": 0.0006, + "step": 24003 + }, + { + "epoch": 0.47, + "learning_rate": 1.0697836977204768e-07, + "loss": 0.5507, + "step": 24004 + }, + { + "epoch": 0.47, + "learning_rate": 1.0697448642771154e-07, + "loss": 0.0005, + "step": 24005 + }, + { + "epoch": 0.47, + "learning_rate": 1.069706030833754e-07, + "loss": 0.0007, + "step": 24006 + }, + { + "epoch": 0.47, + "learning_rate": 1.0696671973903926e-07, + "loss": 0.0005, + "step": 24007 + }, + { + "epoch": 0.47, + "learning_rate": 1.0696283639470312e-07, + "loss": 0.0007, + "step": 24008 + }, + { + "epoch": 0.47, + "learning_rate": 1.0695895305036697e-07, + "loss": 0.0007, + "step": 24009 + }, + { + "epoch": 0.47, + "learning_rate": 1.0695506970603083e-07, + "loss": 0.0007, + "step": 24010 + }, + { + "epoch": 0.47, + "learning_rate": 1.0695118636169469e-07, + "loss": 0.0006, + "step": 24011 + }, + { + "epoch": 0.47, + "learning_rate": 1.0694730301735855e-07, + "loss": 0.0006, + "step": 24012 + }, + { + "epoch": 0.47, + "learning_rate": 1.0694341967302241e-07, + "loss": 0.0008, + "step": 24013 + }, + { + "epoch": 0.47, + "learning_rate": 1.0693953632868627e-07, + "loss": 0.0005, + "step": 24014 + }, + { + "epoch": 0.47, + "learning_rate": 1.0693565298435012e-07, + "loss": 0.0005, + "step": 24015 + }, + { + "epoch": 0.47, + "learning_rate": 1.0693176964001398e-07, + "loss": 0.0006, + "step": 24016 + }, + { + "epoch": 0.47, + "learning_rate": 1.0692788629567784e-07, + "loss": 0.0008, + "step": 24017 + }, + { + "epoch": 0.47, + "learning_rate": 1.069240029513417e-07, + "loss": 0.0016, + "step": 24018 + }, + { + "epoch": 0.47, + "learning_rate": 1.0692011960700556e-07, + "loss": 0.0006, + "step": 24019 + }, + { + "epoch": 0.47, + "learning_rate": 1.0691623626266942e-07, + "loss": 0.0007, + "step": 24020 + }, + { + "epoch": 0.47, + "learning_rate": 1.0691235291833327e-07, + "loss": 0.0013, + "step": 24021 + }, + { + "epoch": 0.47, + "learning_rate": 1.0690846957399713e-07, + "loss": 0.0006, + "step": 24022 + }, + { + "epoch": 0.47, + "learning_rate": 1.0690458622966099e-07, + "loss": 0.0006, + "step": 24023 + }, + { + "epoch": 0.47, + "learning_rate": 1.0690070288532485e-07, + "loss": 0.0878, + "step": 24024 + }, + { + "epoch": 0.47, + "learning_rate": 1.068968195409887e-07, + "loss": 0.0005, + "step": 24025 + }, + { + "epoch": 0.47, + "learning_rate": 1.0689293619665256e-07, + "loss": 0.0007, + "step": 24026 + }, + { + "epoch": 0.47, + "learning_rate": 1.0688905285231642e-07, + "loss": 0.0005, + "step": 24027 + }, + { + "epoch": 0.47, + "learning_rate": 1.0688516950798028e-07, + "loss": 0.0006, + "step": 24028 + }, + { + "epoch": 0.47, + "learning_rate": 1.0688128616364414e-07, + "loss": 0.0008, + "step": 24029 + }, + { + "epoch": 0.47, + "learning_rate": 1.06877402819308e-07, + "loss": 0.0008, + "step": 24030 + }, + { + "epoch": 0.47, + "learning_rate": 1.0687351947497186e-07, + "loss": 0.0046, + "step": 24031 + }, + { + "epoch": 0.47, + "learning_rate": 1.0686963613063571e-07, + "loss": 0.0006, + "step": 24032 + }, + { + "epoch": 0.47, + "learning_rate": 1.0686575278629955e-07, + "loss": 0.0007, + "step": 24033 + }, + { + "epoch": 0.47, + "learning_rate": 1.068618694419634e-07, + "loss": 0.0009, + "step": 24034 + }, + { + "epoch": 0.47, + "learning_rate": 1.0685798609762726e-07, + "loss": 0.0006, + "step": 24035 + }, + { + "epoch": 0.47, + "learning_rate": 1.0685410275329112e-07, + "loss": 0.0006, + "step": 24036 + }, + { + "epoch": 0.47, + "learning_rate": 1.0685021940895498e-07, + "loss": 0.0048, + "step": 24037 + }, + { + "epoch": 0.47, + "learning_rate": 1.0684633606461884e-07, + "loss": 0.0006, + "step": 24038 + }, + { + "epoch": 0.47, + "learning_rate": 1.068424527202827e-07, + "loss": 0.0006, + "step": 24039 + }, + { + "epoch": 0.47, + "learning_rate": 1.0683856937594655e-07, + "loss": 0.0008, + "step": 24040 + }, + { + "epoch": 0.47, + "learning_rate": 1.0683468603161041e-07, + "loss": 0.0027, + "step": 24041 + }, + { + "epoch": 0.47, + "learning_rate": 1.0683080268727427e-07, + "loss": 0.0009, + "step": 24042 + }, + { + "epoch": 0.47, + "learning_rate": 1.0682691934293813e-07, + "loss": 0.0007, + "step": 24043 + }, + { + "epoch": 0.47, + "learning_rate": 1.0682303599860199e-07, + "loss": 0.0006, + "step": 24044 + }, + { + "epoch": 0.47, + "learning_rate": 1.0681915265426584e-07, + "loss": 0.0005, + "step": 24045 + }, + { + "epoch": 0.47, + "learning_rate": 1.068152693099297e-07, + "loss": 0.0006, + "step": 24046 + }, + { + "epoch": 0.47, + "learning_rate": 1.0681138596559356e-07, + "loss": 0.0005, + "step": 24047 + }, + { + "epoch": 0.47, + "learning_rate": 1.0680750262125742e-07, + "loss": 0.0007, + "step": 24048 + }, + { + "epoch": 0.47, + "learning_rate": 1.0680361927692128e-07, + "loss": 0.0008, + "step": 24049 + }, + { + "epoch": 0.47, + "learning_rate": 1.0679973593258514e-07, + "loss": 0.0154, + "step": 24050 + }, + { + "epoch": 0.47, + "learning_rate": 1.06795852588249e-07, + "loss": 0.0007, + "step": 24051 + }, + { + "epoch": 0.47, + "learning_rate": 1.0679196924391285e-07, + "loss": 0.0006, + "step": 24052 + }, + { + "epoch": 0.47, + "learning_rate": 1.0678808589957671e-07, + "loss": 0.0009, + "step": 24053 + }, + { + "epoch": 0.47, + "learning_rate": 1.0678420255524057e-07, + "loss": 0.0007, + "step": 24054 + }, + { + "epoch": 0.47, + "learning_rate": 1.0678031921090443e-07, + "loss": 0.0005, + "step": 24055 + }, + { + "epoch": 0.47, + "learning_rate": 1.0677643586656829e-07, + "loss": 0.5067, + "step": 24056 + }, + { + "epoch": 0.47, + "learning_rate": 1.0677255252223214e-07, + "loss": 0.0007, + "step": 24057 + }, + { + "epoch": 0.47, + "learning_rate": 1.06768669177896e-07, + "loss": 0.0006, + "step": 24058 + }, + { + "epoch": 0.47, + "learning_rate": 1.0676478583355986e-07, + "loss": 0.001, + "step": 24059 + }, + { + "epoch": 0.47, + "learning_rate": 1.0676090248922372e-07, + "loss": 0.0006, + "step": 24060 + }, + { + "epoch": 0.47, + "learning_rate": 1.0675701914488758e-07, + "loss": 0.0011, + "step": 24061 + }, + { + "epoch": 0.47, + "learning_rate": 1.0675313580055144e-07, + "loss": 0.0009, + "step": 24062 + }, + { + "epoch": 0.47, + "learning_rate": 1.0674925245621529e-07, + "loss": 0.0007, + "step": 24063 + }, + { + "epoch": 0.47, + "learning_rate": 1.0674536911187915e-07, + "loss": 0.0016, + "step": 24064 + }, + { + "epoch": 0.47, + "learning_rate": 1.0674148576754301e-07, + "loss": 0.0013, + "step": 24065 + }, + { + "epoch": 0.47, + "learning_rate": 1.0673760242320687e-07, + "loss": 0.0082, + "step": 24066 + }, + { + "epoch": 0.47, + "learning_rate": 1.0673371907887073e-07, + "loss": 1.3083, + "step": 24067 + }, + { + "epoch": 0.47, + "learning_rate": 1.0672983573453458e-07, + "loss": 1.0321, + "step": 24068 + }, + { + "epoch": 0.47, + "learning_rate": 1.0672595239019844e-07, + "loss": 0.0006, + "step": 24069 + }, + { + "epoch": 0.47, + "learning_rate": 1.067220690458623e-07, + "loss": 0.0005, + "step": 24070 + }, + { + "epoch": 0.47, + "learning_rate": 1.0671818570152616e-07, + "loss": 0.0009, + "step": 24071 + }, + { + "epoch": 0.47, + "learning_rate": 1.0671430235719002e-07, + "loss": 0.0006, + "step": 24072 + }, + { + "epoch": 0.47, + "learning_rate": 1.0671041901285388e-07, + "loss": 0.0006, + "step": 24073 + }, + { + "epoch": 0.47, + "learning_rate": 1.0670653566851773e-07, + "loss": 0.6444, + "step": 24074 + }, + { + "epoch": 0.47, + "learning_rate": 1.0670265232418159e-07, + "loss": 0.7685, + "step": 24075 + }, + { + "epoch": 0.47, + "learning_rate": 1.0669876897984544e-07, + "loss": 0.0007, + "step": 24076 + }, + { + "epoch": 0.47, + "learning_rate": 1.066948856355093e-07, + "loss": 0.0005, + "step": 24077 + }, + { + "epoch": 0.47, + "learning_rate": 1.0669100229117315e-07, + "loss": 0.0091, + "step": 24078 + }, + { + "epoch": 0.47, + "learning_rate": 1.0668711894683701e-07, + "loss": 0.0007, + "step": 24079 + }, + { + "epoch": 0.47, + "learning_rate": 1.0668323560250087e-07, + "loss": 0.0005, + "step": 24080 + }, + { + "epoch": 0.47, + "learning_rate": 1.0667935225816473e-07, + "loss": 0.0009, + "step": 24081 + }, + { + "epoch": 0.47, + "learning_rate": 1.0667546891382859e-07, + "loss": 0.0006, + "step": 24082 + }, + { + "epoch": 0.47, + "learning_rate": 1.0667158556949244e-07, + "loss": 0.0005, + "step": 24083 + }, + { + "epoch": 0.47, + "learning_rate": 1.066677022251563e-07, + "loss": 0.0005, + "step": 24084 + }, + { + "epoch": 0.47, + "learning_rate": 1.0666381888082016e-07, + "loss": 0.0006, + "step": 24085 + }, + { + "epoch": 0.47, + "learning_rate": 1.0665993553648402e-07, + "loss": 0.0011, + "step": 24086 + }, + { + "epoch": 0.47, + "learning_rate": 1.0665605219214788e-07, + "loss": 0.0007, + "step": 24087 + }, + { + "epoch": 0.47, + "learning_rate": 1.0665216884781174e-07, + "loss": 0.0007, + "step": 24088 + }, + { + "epoch": 0.47, + "learning_rate": 1.066482855034756e-07, + "loss": 0.0005, + "step": 24089 + }, + { + "epoch": 0.47, + "learning_rate": 1.0664440215913945e-07, + "loss": 0.0006, + "step": 24090 + }, + { + "epoch": 0.47, + "learning_rate": 1.066405188148033e-07, + "loss": 0.3814, + "step": 24091 + }, + { + "epoch": 0.47, + "learning_rate": 1.0663663547046716e-07, + "loss": 0.0014, + "step": 24092 + }, + { + "epoch": 0.47, + "learning_rate": 1.0663275212613101e-07, + "loss": 0.0008, + "step": 24093 + }, + { + "epoch": 0.47, + "learning_rate": 1.0662886878179487e-07, + "loss": 0.0011, + "step": 24094 + }, + { + "epoch": 0.47, + "learning_rate": 1.0662498543745873e-07, + "loss": 0.0016, + "step": 24095 + }, + { + "epoch": 0.47, + "learning_rate": 1.0662110209312259e-07, + "loss": 0.0255, + "step": 24096 + }, + { + "epoch": 0.47, + "learning_rate": 1.0661721874878645e-07, + "loss": 0.0026, + "step": 24097 + }, + { + "epoch": 0.47, + "learning_rate": 1.066133354044503e-07, + "loss": 0.5637, + "step": 24098 + }, + { + "epoch": 0.47, + "learning_rate": 1.0660945206011416e-07, + "loss": 0.0006, + "step": 24099 + }, + { + "epoch": 0.47, + "learning_rate": 1.0660556871577802e-07, + "loss": 0.0008, + "step": 24100 + }, + { + "epoch": 0.47, + "learning_rate": 1.0660168537144188e-07, + "loss": 0.0007, + "step": 24101 + }, + { + "epoch": 0.47, + "learning_rate": 1.0659780202710574e-07, + "loss": 0.0007, + "step": 24102 + }, + { + "epoch": 0.47, + "learning_rate": 1.065939186827696e-07, + "loss": 0.0008, + "step": 24103 + }, + { + "epoch": 0.47, + "learning_rate": 1.0659003533843345e-07, + "loss": 0.0005, + "step": 24104 + }, + { + "epoch": 0.47, + "learning_rate": 1.065861519940973e-07, + "loss": 0.0009, + "step": 24105 + }, + { + "epoch": 0.47, + "learning_rate": 1.0658226864976116e-07, + "loss": 0.075, + "step": 24106 + }, + { + "epoch": 0.47, + "learning_rate": 1.0657838530542502e-07, + "loss": 0.0004, + "step": 24107 + }, + { + "epoch": 0.47, + "learning_rate": 1.0657450196108887e-07, + "loss": 0.0005, + "step": 24108 + }, + { + "epoch": 0.47, + "learning_rate": 1.0657061861675273e-07, + "loss": 0.1881, + "step": 24109 + }, + { + "epoch": 0.47, + "learning_rate": 1.0656673527241659e-07, + "loss": 0.0008, + "step": 24110 + }, + { + "epoch": 0.47, + "learning_rate": 1.0656285192808045e-07, + "loss": 0.0007, + "step": 24111 + }, + { + "epoch": 0.47, + "learning_rate": 1.0655896858374431e-07, + "loss": 0.0555, + "step": 24112 + }, + { + "epoch": 0.47, + "learning_rate": 1.0655508523940817e-07, + "loss": 0.0025, + "step": 24113 + }, + { + "epoch": 0.47, + "learning_rate": 1.0655120189507202e-07, + "loss": 0.0095, + "step": 24114 + }, + { + "epoch": 0.47, + "learning_rate": 1.0654731855073588e-07, + "loss": 0.0682, + "step": 24115 + }, + { + "epoch": 0.47, + "learning_rate": 1.0654343520639974e-07, + "loss": 0.0005, + "step": 24116 + }, + { + "epoch": 0.47, + "learning_rate": 1.065395518620636e-07, + "loss": 0.0009, + "step": 24117 + }, + { + "epoch": 0.47, + "learning_rate": 1.0653566851772746e-07, + "loss": 0.0006, + "step": 24118 + }, + { + "epoch": 0.47, + "learning_rate": 1.0653178517339132e-07, + "loss": 0.0005, + "step": 24119 + }, + { + "epoch": 0.47, + "learning_rate": 1.0652790182905517e-07, + "loss": 0.0006, + "step": 24120 + }, + { + "epoch": 0.47, + "learning_rate": 1.0652401848471903e-07, + "loss": 0.0015, + "step": 24121 + }, + { + "epoch": 0.47, + "learning_rate": 1.0652013514038289e-07, + "loss": 0.0006, + "step": 24122 + }, + { + "epoch": 0.47, + "learning_rate": 1.0651625179604675e-07, + "loss": 0.0006, + "step": 24123 + }, + { + "epoch": 0.47, + "learning_rate": 1.065123684517106e-07, + "loss": 0.0005, + "step": 24124 + }, + { + "epoch": 0.47, + "learning_rate": 1.0650848510737446e-07, + "loss": 0.0006, + "step": 24125 + }, + { + "epoch": 0.47, + "learning_rate": 1.0650460176303832e-07, + "loss": 0.0006, + "step": 24126 + }, + { + "epoch": 0.47, + "learning_rate": 1.0650071841870218e-07, + "loss": 0.0006, + "step": 24127 + }, + { + "epoch": 0.47, + "learning_rate": 1.0649683507436604e-07, + "loss": 0.0007, + "step": 24128 + }, + { + "epoch": 0.47, + "learning_rate": 1.064929517300299e-07, + "loss": 0.0006, + "step": 24129 + }, + { + "epoch": 0.47, + "learning_rate": 1.0648906838569376e-07, + "loss": 0.0006, + "step": 24130 + }, + { + "epoch": 0.47, + "learning_rate": 1.0648518504135761e-07, + "loss": 0.0008, + "step": 24131 + }, + { + "epoch": 0.47, + "learning_rate": 1.0648130169702147e-07, + "loss": 0.0005, + "step": 24132 + }, + { + "epoch": 0.47, + "learning_rate": 1.0647741835268533e-07, + "loss": 0.0005, + "step": 24133 + }, + { + "epoch": 0.47, + "learning_rate": 1.0647353500834919e-07, + "loss": 0.0005, + "step": 24134 + }, + { + "epoch": 0.47, + "learning_rate": 1.0646965166401305e-07, + "loss": 0.0011, + "step": 24135 + }, + { + "epoch": 0.47, + "learning_rate": 1.064657683196769e-07, + "loss": 0.0005, + "step": 24136 + }, + { + "epoch": 0.47, + "learning_rate": 1.0646188497534076e-07, + "loss": 0.0011, + "step": 24137 + }, + { + "epoch": 0.47, + "learning_rate": 1.0645800163100462e-07, + "loss": 0.0006, + "step": 24138 + }, + { + "epoch": 0.47, + "learning_rate": 1.0645411828666848e-07, + "loss": 0.0005, + "step": 24139 + }, + { + "epoch": 0.47, + "learning_rate": 1.0645023494233234e-07, + "loss": 0.0005, + "step": 24140 + }, + { + "epoch": 0.47, + "learning_rate": 1.064463515979962e-07, + "loss": 0.0005, + "step": 24141 + }, + { + "epoch": 0.47, + "learning_rate": 1.0644246825366005e-07, + "loss": 0.0005, + "step": 24142 + }, + { + "epoch": 0.47, + "learning_rate": 1.0643858490932391e-07, + "loss": 0.0005, + "step": 24143 + }, + { + "epoch": 0.47, + "learning_rate": 1.0643470156498777e-07, + "loss": 0.0006, + "step": 24144 + }, + { + "epoch": 0.47, + "learning_rate": 1.0643081822065163e-07, + "loss": 0.0006, + "step": 24145 + }, + { + "epoch": 0.47, + "learning_rate": 1.0642693487631549e-07, + "loss": 0.0059, + "step": 24146 + }, + { + "epoch": 0.47, + "learning_rate": 1.0642305153197935e-07, + "loss": 0.0005, + "step": 24147 + }, + { + "epoch": 0.47, + "learning_rate": 1.064191681876432e-07, + "loss": 0.9646, + "step": 24148 + }, + { + "epoch": 0.47, + "learning_rate": 1.0641528484330704e-07, + "loss": 0.0006, + "step": 24149 + }, + { + "epoch": 0.47, + "learning_rate": 1.064114014989709e-07, + "loss": 0.001, + "step": 24150 + }, + { + "epoch": 0.47, + "learning_rate": 1.0640751815463475e-07, + "loss": 0.0006, + "step": 24151 + }, + { + "epoch": 0.47, + "learning_rate": 1.0640363481029861e-07, + "loss": 0.0005, + "step": 24152 + }, + { + "epoch": 0.47, + "learning_rate": 1.0639975146596247e-07, + "loss": 0.0006, + "step": 24153 + }, + { + "epoch": 0.47, + "learning_rate": 1.0639586812162633e-07, + "loss": 0.0007, + "step": 24154 + }, + { + "epoch": 0.47, + "learning_rate": 1.0639198477729019e-07, + "loss": 0.0006, + "step": 24155 + }, + { + "epoch": 0.47, + "learning_rate": 1.0638810143295404e-07, + "loss": 0.0007, + "step": 24156 + }, + { + "epoch": 0.47, + "learning_rate": 1.063842180886179e-07, + "loss": 0.0009, + "step": 24157 + }, + { + "epoch": 0.47, + "learning_rate": 1.0638033474428176e-07, + "loss": 0.0005, + "step": 24158 + }, + { + "epoch": 0.47, + "learning_rate": 1.0637645139994562e-07, + "loss": 0.001, + "step": 24159 + }, + { + "epoch": 0.47, + "learning_rate": 1.0637256805560948e-07, + "loss": 0.0009, + "step": 24160 + }, + { + "epoch": 0.47, + "learning_rate": 1.0636868471127334e-07, + "loss": 0.0006, + "step": 24161 + }, + { + "epoch": 0.47, + "learning_rate": 1.0636480136693719e-07, + "loss": 0.0008, + "step": 24162 + }, + { + "epoch": 0.47, + "learning_rate": 1.0636091802260105e-07, + "loss": 0.004, + "step": 24163 + }, + { + "epoch": 0.47, + "learning_rate": 1.0635703467826491e-07, + "loss": 0.0005, + "step": 24164 + }, + { + "epoch": 0.47, + "learning_rate": 1.0635315133392877e-07, + "loss": 0.0018, + "step": 24165 + }, + { + "epoch": 0.47, + "learning_rate": 1.0634926798959263e-07, + "loss": 0.0007, + "step": 24166 + }, + { + "epoch": 0.47, + "learning_rate": 1.0634538464525648e-07, + "loss": 0.0007, + "step": 24167 + }, + { + "epoch": 0.47, + "learning_rate": 1.0634150130092034e-07, + "loss": 0.0008, + "step": 24168 + }, + { + "epoch": 0.47, + "learning_rate": 1.063376179565842e-07, + "loss": 0.2483, + "step": 24169 + }, + { + "epoch": 0.47, + "learning_rate": 1.0633373461224806e-07, + "loss": 0.001, + "step": 24170 + }, + { + "epoch": 0.47, + "learning_rate": 1.0632985126791192e-07, + "loss": 0.0007, + "step": 24171 + }, + { + "epoch": 0.47, + "learning_rate": 1.0632596792357578e-07, + "loss": 0.9399, + "step": 24172 + }, + { + "epoch": 0.47, + "learning_rate": 1.0632208457923963e-07, + "loss": 0.0008, + "step": 24173 + }, + { + "epoch": 0.47, + "learning_rate": 1.0631820123490349e-07, + "loss": 0.0029, + "step": 24174 + }, + { + "epoch": 0.47, + "learning_rate": 1.0631431789056735e-07, + "loss": 0.0008, + "step": 24175 + }, + { + "epoch": 0.47, + "learning_rate": 1.0631043454623121e-07, + "loss": 0.3196, + "step": 24176 + }, + { + "epoch": 0.47, + "learning_rate": 1.0630655120189507e-07, + "loss": 0.0005, + "step": 24177 + }, + { + "epoch": 0.47, + "learning_rate": 1.0630266785755893e-07, + "loss": 0.0005, + "step": 24178 + }, + { + "epoch": 0.47, + "learning_rate": 1.0629878451322278e-07, + "loss": 0.0005, + "step": 24179 + }, + { + "epoch": 0.47, + "learning_rate": 1.0629490116888664e-07, + "loss": 0.0008, + "step": 24180 + }, + { + "epoch": 0.47, + "learning_rate": 1.062910178245505e-07, + "loss": 0.0006, + "step": 24181 + }, + { + "epoch": 0.47, + "learning_rate": 1.0628713448021436e-07, + "loss": 0.0006, + "step": 24182 + }, + { + "epoch": 0.47, + "learning_rate": 1.0628325113587822e-07, + "loss": 0.0006, + "step": 24183 + }, + { + "epoch": 0.47, + "learning_rate": 1.0627936779154207e-07, + "loss": 0.0236, + "step": 24184 + }, + { + "epoch": 0.47, + "learning_rate": 1.0627548444720593e-07, + "loss": 0.0006, + "step": 24185 + }, + { + "epoch": 0.47, + "learning_rate": 1.0627160110286979e-07, + "loss": 0.0005, + "step": 24186 + }, + { + "epoch": 0.47, + "learning_rate": 1.0626771775853365e-07, + "loss": 0.0005, + "step": 24187 + }, + { + "epoch": 0.47, + "learning_rate": 1.0626383441419751e-07, + "loss": 0.0006, + "step": 24188 + }, + { + "epoch": 0.47, + "learning_rate": 1.0625995106986137e-07, + "loss": 0.0007, + "step": 24189 + }, + { + "epoch": 0.47, + "learning_rate": 1.0625606772552522e-07, + "loss": 0.0007, + "step": 24190 + }, + { + "epoch": 0.47, + "learning_rate": 1.0625218438118908e-07, + "loss": 0.0024, + "step": 24191 + }, + { + "epoch": 0.47, + "learning_rate": 1.0624830103685294e-07, + "loss": 0.0221, + "step": 24192 + }, + { + "epoch": 0.47, + "learning_rate": 1.062444176925168e-07, + "loss": 0.0005, + "step": 24193 + }, + { + "epoch": 0.47, + "learning_rate": 1.0624053434818066e-07, + "loss": 0.0017, + "step": 24194 + }, + { + "epoch": 0.47, + "learning_rate": 1.0623665100384452e-07, + "loss": 0.0006, + "step": 24195 + }, + { + "epoch": 0.47, + "learning_rate": 1.0623276765950837e-07, + "loss": 0.0005, + "step": 24196 + }, + { + "epoch": 0.47, + "learning_rate": 1.0622888431517223e-07, + "loss": 0.0084, + "step": 24197 + }, + { + "epoch": 0.47, + "learning_rate": 1.0622500097083609e-07, + "loss": 0.0009, + "step": 24198 + }, + { + "epoch": 0.47, + "learning_rate": 1.0622111762649995e-07, + "loss": 0.5262, + "step": 24199 + }, + { + "epoch": 0.47, + "learning_rate": 1.062172342821638e-07, + "loss": 0.0007, + "step": 24200 + }, + { + "epoch": 0.47, + "learning_rate": 1.0621335093782766e-07, + "loss": 0.0028, + "step": 24201 + }, + { + "epoch": 0.47, + "learning_rate": 1.0620946759349152e-07, + "loss": 0.0005, + "step": 24202 + }, + { + "epoch": 0.47, + "learning_rate": 1.0620558424915538e-07, + "loss": 0.0006, + "step": 24203 + }, + { + "epoch": 0.47, + "learning_rate": 1.0620170090481924e-07, + "loss": 0.0005, + "step": 24204 + }, + { + "epoch": 0.47, + "learning_rate": 1.061978175604831e-07, + "loss": 1.2236, + "step": 24205 + }, + { + "epoch": 0.47, + "learning_rate": 1.0619393421614696e-07, + "loss": 0.0032, + "step": 24206 + }, + { + "epoch": 0.47, + "learning_rate": 1.0619005087181079e-07, + "loss": 0.0006, + "step": 24207 + }, + { + "epoch": 0.47, + "learning_rate": 1.0618616752747465e-07, + "loss": 0.8186, + "step": 24208 + }, + { + "epoch": 0.47, + "learning_rate": 1.061822841831385e-07, + "loss": 0.0007, + "step": 24209 + }, + { + "epoch": 0.47, + "learning_rate": 1.0617840083880236e-07, + "loss": 0.0005, + "step": 24210 + }, + { + "epoch": 0.47, + "learning_rate": 1.0617451749446622e-07, + "loss": 0.0006, + "step": 24211 + }, + { + "epoch": 0.47, + "learning_rate": 1.0617063415013008e-07, + "loss": 0.0006, + "step": 24212 + }, + { + "epoch": 0.47, + "learning_rate": 1.0616675080579394e-07, + "loss": 0.0005, + "step": 24213 + }, + { + "epoch": 0.47, + "learning_rate": 1.061628674614578e-07, + "loss": 0.0006, + "step": 24214 + }, + { + "epoch": 0.47, + "learning_rate": 1.0615898411712165e-07, + "loss": 0.0007, + "step": 24215 + }, + { + "epoch": 0.47, + "learning_rate": 1.0615510077278551e-07, + "loss": 0.0175, + "step": 24216 + }, + { + "epoch": 0.47, + "learning_rate": 1.0615121742844937e-07, + "loss": 0.0007, + "step": 24217 + }, + { + "epoch": 0.47, + "learning_rate": 1.0614733408411323e-07, + "loss": 0.0006, + "step": 24218 + }, + { + "epoch": 0.47, + "learning_rate": 1.0614345073977709e-07, + "loss": 0.0005, + "step": 24219 + }, + { + "epoch": 0.47, + "learning_rate": 1.0613956739544094e-07, + "loss": 0.0008, + "step": 24220 + }, + { + "epoch": 0.47, + "learning_rate": 1.061356840511048e-07, + "loss": 0.0005, + "step": 24221 + }, + { + "epoch": 0.47, + "learning_rate": 1.0613180070676866e-07, + "loss": 0.0108, + "step": 24222 + }, + { + "epoch": 0.47, + "learning_rate": 1.0612791736243252e-07, + "loss": 0.8989, + "step": 24223 + }, + { + "epoch": 0.47, + "learning_rate": 1.0612403401809638e-07, + "loss": 1.3932, + "step": 24224 + }, + { + "epoch": 0.47, + "learning_rate": 1.0612015067376024e-07, + "loss": 0.0013, + "step": 24225 + }, + { + "epoch": 0.47, + "learning_rate": 1.061162673294241e-07, + "loss": 0.0006, + "step": 24226 + }, + { + "epoch": 0.47, + "learning_rate": 1.0611238398508795e-07, + "loss": 0.0006, + "step": 24227 + }, + { + "epoch": 0.47, + "learning_rate": 1.0610850064075181e-07, + "loss": 0.0005, + "step": 24228 + }, + { + "epoch": 0.47, + "learning_rate": 1.0610461729641567e-07, + "loss": 0.0008, + "step": 24229 + }, + { + "epoch": 0.47, + "learning_rate": 1.0610073395207953e-07, + "loss": 0.5433, + "step": 24230 + }, + { + "epoch": 0.47, + "learning_rate": 1.0609685060774339e-07, + "loss": 0.6204, + "step": 24231 + }, + { + "epoch": 0.47, + "learning_rate": 1.0609296726340724e-07, + "loss": 0.0009, + "step": 24232 + }, + { + "epoch": 0.47, + "learning_rate": 1.060890839190711e-07, + "loss": 0.0006, + "step": 24233 + }, + { + "epoch": 0.47, + "learning_rate": 1.0608520057473496e-07, + "loss": 0.0005, + "step": 24234 + }, + { + "epoch": 0.47, + "learning_rate": 1.0608131723039882e-07, + "loss": 0.0008, + "step": 24235 + }, + { + "epoch": 0.47, + "learning_rate": 1.0607743388606268e-07, + "loss": 0.012, + "step": 24236 + }, + { + "epoch": 0.47, + "learning_rate": 1.0607355054172654e-07, + "loss": 0.0006, + "step": 24237 + }, + { + "epoch": 0.47, + "learning_rate": 1.060696671973904e-07, + "loss": 0.0007, + "step": 24238 + }, + { + "epoch": 0.47, + "learning_rate": 1.0606578385305425e-07, + "loss": 0.0006, + "step": 24239 + }, + { + "epoch": 0.47, + "learning_rate": 1.0606190050871811e-07, + "loss": 0.0005, + "step": 24240 + }, + { + "epoch": 0.47, + "learning_rate": 1.0605801716438197e-07, + "loss": 0.0005, + "step": 24241 + }, + { + "epoch": 0.47, + "learning_rate": 1.0605413382004583e-07, + "loss": 0.0006, + "step": 24242 + }, + { + "epoch": 0.47, + "learning_rate": 1.0605025047570968e-07, + "loss": 0.0007, + "step": 24243 + }, + { + "epoch": 0.47, + "learning_rate": 1.0604636713137354e-07, + "loss": 0.0007, + "step": 24244 + }, + { + "epoch": 0.47, + "learning_rate": 1.060424837870374e-07, + "loss": 0.5908, + "step": 24245 + }, + { + "epoch": 0.47, + "learning_rate": 1.0603860044270126e-07, + "loss": 0.0014, + "step": 24246 + }, + { + "epoch": 0.47, + "learning_rate": 1.0603471709836512e-07, + "loss": 0.0012, + "step": 24247 + }, + { + "epoch": 0.47, + "learning_rate": 1.0603083375402898e-07, + "loss": 0.0007, + "step": 24248 + }, + { + "epoch": 0.47, + "learning_rate": 1.0602695040969283e-07, + "loss": 0.0006, + "step": 24249 + }, + { + "epoch": 0.47, + "learning_rate": 1.0602306706535669e-07, + "loss": 0.0006, + "step": 24250 + }, + { + "epoch": 0.47, + "learning_rate": 1.0601918372102055e-07, + "loss": 0.0005, + "step": 24251 + }, + { + "epoch": 0.47, + "learning_rate": 1.0601530037668441e-07, + "loss": 0.0057, + "step": 24252 + }, + { + "epoch": 0.47, + "learning_rate": 1.0601141703234825e-07, + "loss": 0.0007, + "step": 24253 + }, + { + "epoch": 0.47, + "learning_rate": 1.0600753368801211e-07, + "loss": 0.0067, + "step": 24254 + }, + { + "epoch": 0.47, + "learning_rate": 1.0600365034367597e-07, + "loss": 0.0005, + "step": 24255 + }, + { + "epoch": 0.47, + "learning_rate": 1.0599976699933983e-07, + "loss": 0.0481, + "step": 24256 + }, + { + "epoch": 0.47, + "learning_rate": 1.0599588365500369e-07, + "loss": 0.0034, + "step": 24257 + }, + { + "epoch": 0.47, + "learning_rate": 1.0599200031066755e-07, + "loss": 0.0008, + "step": 24258 + }, + { + "epoch": 0.47, + "learning_rate": 1.059881169663314e-07, + "loss": 0.0026, + "step": 24259 + }, + { + "epoch": 0.47, + "learning_rate": 1.0598423362199526e-07, + "loss": 0.0005, + "step": 24260 + }, + { + "epoch": 0.47, + "learning_rate": 1.0598035027765912e-07, + "loss": 0.0006, + "step": 24261 + }, + { + "epoch": 0.47, + "learning_rate": 1.0597646693332298e-07, + "loss": 0.0007, + "step": 24262 + }, + { + "epoch": 0.47, + "learning_rate": 1.0597258358898684e-07, + "loss": 0.19, + "step": 24263 + }, + { + "epoch": 0.47, + "learning_rate": 1.059687002446507e-07, + "loss": 1.2457, + "step": 24264 + }, + { + "epoch": 0.47, + "learning_rate": 1.0596481690031454e-07, + "loss": 0.0109, + "step": 24265 + }, + { + "epoch": 0.47, + "learning_rate": 1.059609335559784e-07, + "loss": 0.0006, + "step": 24266 + }, + { + "epoch": 0.47, + "learning_rate": 1.0595705021164226e-07, + "loss": 0.0006, + "step": 24267 + }, + { + "epoch": 0.47, + "learning_rate": 1.0595316686730611e-07, + "loss": 0.0005, + "step": 24268 + }, + { + "epoch": 0.47, + "learning_rate": 1.0594928352296997e-07, + "loss": 0.0007, + "step": 24269 + }, + { + "epoch": 0.47, + "learning_rate": 1.0594540017863383e-07, + "loss": 0.0005, + "step": 24270 + }, + { + "epoch": 0.47, + "learning_rate": 1.0594151683429769e-07, + "loss": 0.0051, + "step": 24271 + }, + { + "epoch": 0.47, + "learning_rate": 1.0593763348996155e-07, + "loss": 0.0007, + "step": 24272 + }, + { + "epoch": 0.47, + "learning_rate": 1.059337501456254e-07, + "loss": 0.0007, + "step": 24273 + }, + { + "epoch": 0.47, + "learning_rate": 1.0592986680128926e-07, + "loss": 0.0005, + "step": 24274 + }, + { + "epoch": 0.47, + "learning_rate": 1.0592598345695312e-07, + "loss": 0.0005, + "step": 24275 + }, + { + "epoch": 0.47, + "learning_rate": 1.0592210011261698e-07, + "loss": 0.0134, + "step": 24276 + }, + { + "epoch": 0.47, + "learning_rate": 1.0591821676828084e-07, + "loss": 0.3345, + "step": 24277 + }, + { + "epoch": 0.47, + "learning_rate": 1.059143334239447e-07, + "loss": 0.0141, + "step": 24278 + }, + { + "epoch": 0.47, + "learning_rate": 1.0591045007960855e-07, + "loss": 0.0006, + "step": 24279 + }, + { + "epoch": 0.47, + "learning_rate": 1.0590656673527241e-07, + "loss": 0.0026, + "step": 24280 + }, + { + "epoch": 0.47, + "learning_rate": 1.0590268339093627e-07, + "loss": 0.0692, + "step": 24281 + }, + { + "epoch": 0.47, + "learning_rate": 1.0589880004660012e-07, + "loss": 0.6123, + "step": 24282 + }, + { + "epoch": 0.47, + "learning_rate": 1.0589491670226397e-07, + "loss": 0.0022, + "step": 24283 + }, + { + "epoch": 0.47, + "learning_rate": 1.0589103335792783e-07, + "loss": 0.0006, + "step": 24284 + }, + { + "epoch": 0.47, + "learning_rate": 1.0588715001359169e-07, + "loss": 0.0004, + "step": 24285 + }, + { + "epoch": 0.47, + "learning_rate": 1.0588326666925555e-07, + "loss": 0.5095, + "step": 24286 + }, + { + "epoch": 0.47, + "learning_rate": 1.0587938332491941e-07, + "loss": 0.0005, + "step": 24287 + }, + { + "epoch": 0.47, + "learning_rate": 1.0587549998058327e-07, + "loss": 0.0005, + "step": 24288 + }, + { + "epoch": 0.47, + "learning_rate": 1.0587161663624712e-07, + "loss": 0.0007, + "step": 24289 + }, + { + "epoch": 0.47, + "learning_rate": 1.0586773329191098e-07, + "loss": 0.0008, + "step": 24290 + }, + { + "epoch": 0.47, + "learning_rate": 1.0586384994757484e-07, + "loss": 0.0007, + "step": 24291 + }, + { + "epoch": 0.47, + "learning_rate": 1.058599666032387e-07, + "loss": 0.0032, + "step": 24292 + }, + { + "epoch": 0.47, + "learning_rate": 1.0585608325890256e-07, + "loss": 0.0051, + "step": 24293 + }, + { + "epoch": 0.47, + "learning_rate": 1.0585219991456642e-07, + "loss": 0.0014, + "step": 24294 + }, + { + "epoch": 0.47, + "learning_rate": 1.0584831657023027e-07, + "loss": 0.0006, + "step": 24295 + }, + { + "epoch": 0.47, + "learning_rate": 1.0584443322589413e-07, + "loss": 0.0006, + "step": 24296 + }, + { + "epoch": 0.47, + "learning_rate": 1.0584054988155799e-07, + "loss": 0.0007, + "step": 24297 + }, + { + "epoch": 0.47, + "learning_rate": 1.0583666653722185e-07, + "loss": 0.0007, + "step": 24298 + }, + { + "epoch": 0.47, + "learning_rate": 1.058327831928857e-07, + "loss": 0.0007, + "step": 24299 + }, + { + "epoch": 0.47, + "learning_rate": 1.0582889984854956e-07, + "loss": 0.0006, + "step": 24300 + }, + { + "epoch": 0.47, + "learning_rate": 1.0582501650421342e-07, + "loss": 0.0005, + "step": 24301 + }, + { + "epoch": 0.47, + "learning_rate": 1.0582113315987728e-07, + "loss": 0.3498, + "step": 24302 + }, + { + "epoch": 0.47, + "learning_rate": 1.0581724981554114e-07, + "loss": 0.0004, + "step": 24303 + }, + { + "epoch": 0.47, + "learning_rate": 1.05813366471205e-07, + "loss": 0.0005, + "step": 24304 + }, + { + "epoch": 0.47, + "learning_rate": 1.0580948312686886e-07, + "loss": 0.0006, + "step": 24305 + }, + { + "epoch": 0.47, + "learning_rate": 1.0580559978253271e-07, + "loss": 0.0006, + "step": 24306 + }, + { + "epoch": 0.47, + "learning_rate": 1.0580171643819657e-07, + "loss": 0.0005, + "step": 24307 + }, + { + "epoch": 0.47, + "learning_rate": 1.0579783309386043e-07, + "loss": 0.0007, + "step": 24308 + }, + { + "epoch": 0.47, + "learning_rate": 1.0579394974952429e-07, + "loss": 0.0015, + "step": 24309 + }, + { + "epoch": 0.47, + "learning_rate": 1.0579006640518815e-07, + "loss": 0.0006, + "step": 24310 + }, + { + "epoch": 0.47, + "learning_rate": 1.05786183060852e-07, + "loss": 0.0011, + "step": 24311 + }, + { + "epoch": 0.47, + "learning_rate": 1.0578229971651586e-07, + "loss": 0.0007, + "step": 24312 + }, + { + "epoch": 0.47, + "learning_rate": 1.0577841637217972e-07, + "loss": 0.0009, + "step": 24313 + }, + { + "epoch": 0.47, + "learning_rate": 1.0577453302784358e-07, + "loss": 0.0005, + "step": 24314 + }, + { + "epoch": 0.47, + "learning_rate": 1.0577064968350744e-07, + "loss": 0.0006, + "step": 24315 + }, + { + "epoch": 0.47, + "learning_rate": 1.057667663391713e-07, + "loss": 0.0005, + "step": 24316 + }, + { + "epoch": 0.47, + "learning_rate": 1.0576288299483515e-07, + "loss": 1.0977, + "step": 24317 + }, + { + "epoch": 0.47, + "learning_rate": 1.0575899965049901e-07, + "loss": 0.0007, + "step": 24318 + }, + { + "epoch": 0.47, + "learning_rate": 1.0575511630616287e-07, + "loss": 0.0006, + "step": 24319 + }, + { + "epoch": 0.47, + "learning_rate": 1.0575123296182673e-07, + "loss": 0.0006, + "step": 24320 + }, + { + "epoch": 0.47, + "learning_rate": 1.0574734961749059e-07, + "loss": 0.0013, + "step": 24321 + }, + { + "epoch": 0.47, + "learning_rate": 1.0574346627315445e-07, + "loss": 0.0008, + "step": 24322 + }, + { + "epoch": 0.47, + "learning_rate": 1.0573958292881828e-07, + "loss": 0.0007, + "step": 24323 + }, + { + "epoch": 0.47, + "learning_rate": 1.0573569958448214e-07, + "loss": 0.0016, + "step": 24324 + }, + { + "epoch": 0.47, + "learning_rate": 1.05731816240146e-07, + "loss": 0.0005, + "step": 24325 + }, + { + "epoch": 0.47, + "learning_rate": 1.0572793289580985e-07, + "loss": 0.0005, + "step": 24326 + }, + { + "epoch": 0.47, + "learning_rate": 1.0572404955147371e-07, + "loss": 0.5042, + "step": 24327 + }, + { + "epoch": 0.47, + "learning_rate": 1.0572016620713757e-07, + "loss": 0.0005, + "step": 24328 + }, + { + "epoch": 0.47, + "learning_rate": 1.0571628286280143e-07, + "loss": 0.0011, + "step": 24329 + }, + { + "epoch": 0.47, + "learning_rate": 1.0571239951846529e-07, + "loss": 0.0008, + "step": 24330 + }, + { + "epoch": 0.47, + "learning_rate": 1.0570851617412914e-07, + "loss": 0.0014, + "step": 24331 + }, + { + "epoch": 0.47, + "learning_rate": 1.05704632829793e-07, + "loss": 0.0004, + "step": 24332 + }, + { + "epoch": 0.47, + "learning_rate": 1.0570074948545686e-07, + "loss": 0.0008, + "step": 24333 + }, + { + "epoch": 0.47, + "learning_rate": 1.0569686614112072e-07, + "loss": 0.0007, + "step": 24334 + }, + { + "epoch": 0.47, + "learning_rate": 1.0569298279678458e-07, + "loss": 0.0006, + "step": 24335 + }, + { + "epoch": 0.47, + "learning_rate": 1.0568909945244844e-07, + "loss": 0.0282, + "step": 24336 + }, + { + "epoch": 0.47, + "learning_rate": 1.056852161081123e-07, + "loss": 1.1922, + "step": 24337 + }, + { + "epoch": 0.47, + "learning_rate": 1.0568133276377615e-07, + "loss": 0.0017, + "step": 24338 + }, + { + "epoch": 0.47, + "learning_rate": 1.0567744941944001e-07, + "loss": 0.0007, + "step": 24339 + }, + { + "epoch": 0.47, + "learning_rate": 1.0567356607510387e-07, + "loss": 0.0005, + "step": 24340 + }, + { + "epoch": 0.47, + "learning_rate": 1.0566968273076773e-07, + "loss": 0.0006, + "step": 24341 + }, + { + "epoch": 0.47, + "learning_rate": 1.0566579938643158e-07, + "loss": 0.0005, + "step": 24342 + }, + { + "epoch": 0.47, + "learning_rate": 1.0566191604209544e-07, + "loss": 0.0014, + "step": 24343 + }, + { + "epoch": 0.47, + "learning_rate": 1.056580326977593e-07, + "loss": 0.0008, + "step": 24344 + }, + { + "epoch": 0.47, + "learning_rate": 1.0565414935342316e-07, + "loss": 0.0006, + "step": 24345 + }, + { + "epoch": 0.47, + "learning_rate": 1.0565026600908702e-07, + "loss": 0.0006, + "step": 24346 + }, + { + "epoch": 0.47, + "learning_rate": 1.0564638266475088e-07, + "loss": 0.0006, + "step": 24347 + }, + { + "epoch": 0.47, + "learning_rate": 1.0564249932041473e-07, + "loss": 0.0008, + "step": 24348 + }, + { + "epoch": 0.47, + "learning_rate": 1.0563861597607859e-07, + "loss": 0.0004, + "step": 24349 + }, + { + "epoch": 0.47, + "learning_rate": 1.0563473263174245e-07, + "loss": 0.0006, + "step": 24350 + }, + { + "epoch": 0.47, + "learning_rate": 1.0563084928740631e-07, + "loss": 0.0012, + "step": 24351 + }, + { + "epoch": 0.47, + "learning_rate": 1.0562696594307017e-07, + "loss": 0.0009, + "step": 24352 + }, + { + "epoch": 0.47, + "learning_rate": 1.0562308259873403e-07, + "loss": 0.0005, + "step": 24353 + }, + { + "epoch": 0.47, + "learning_rate": 1.0561919925439788e-07, + "loss": 0.0034, + "step": 24354 + }, + { + "epoch": 0.47, + "learning_rate": 1.0561531591006174e-07, + "loss": 0.0006, + "step": 24355 + }, + { + "epoch": 0.47, + "learning_rate": 1.056114325657256e-07, + "loss": 0.0007, + "step": 24356 + }, + { + "epoch": 0.47, + "learning_rate": 1.0560754922138946e-07, + "loss": 0.0008, + "step": 24357 + }, + { + "epoch": 0.47, + "learning_rate": 1.0560366587705332e-07, + "loss": 0.0008, + "step": 24358 + }, + { + "epoch": 0.47, + "learning_rate": 1.0559978253271717e-07, + "loss": 0.0178, + "step": 24359 + }, + { + "epoch": 0.47, + "learning_rate": 1.0559589918838103e-07, + "loss": 0.0007, + "step": 24360 + }, + { + "epoch": 0.47, + "learning_rate": 1.0559201584404489e-07, + "loss": 0.0005, + "step": 24361 + }, + { + "epoch": 0.47, + "learning_rate": 1.0558813249970875e-07, + "loss": 0.0061, + "step": 24362 + }, + { + "epoch": 0.47, + "learning_rate": 1.0558424915537261e-07, + "loss": 0.0008, + "step": 24363 + }, + { + "epoch": 0.47, + "learning_rate": 1.0558036581103647e-07, + "loss": 0.0005, + "step": 24364 + }, + { + "epoch": 0.47, + "learning_rate": 1.0557648246670032e-07, + "loss": 0.0154, + "step": 24365 + }, + { + "epoch": 0.47, + "learning_rate": 1.0557259912236418e-07, + "loss": 0.0006, + "step": 24366 + }, + { + "epoch": 0.47, + "learning_rate": 1.0556871577802804e-07, + "loss": 0.0005, + "step": 24367 + }, + { + "epoch": 0.47, + "learning_rate": 1.055648324336919e-07, + "loss": 0.0007, + "step": 24368 + }, + { + "epoch": 0.47, + "learning_rate": 1.0556094908935576e-07, + "loss": 0.0168, + "step": 24369 + }, + { + "epoch": 0.47, + "learning_rate": 1.0555706574501962e-07, + "loss": 0.0009, + "step": 24370 + }, + { + "epoch": 0.47, + "learning_rate": 1.0555318240068347e-07, + "loss": 0.0006, + "step": 24371 + }, + { + "epoch": 0.47, + "learning_rate": 1.0554929905634733e-07, + "loss": 0.538, + "step": 24372 + }, + { + "epoch": 0.47, + "learning_rate": 1.0554541571201119e-07, + "loss": 0.0005, + "step": 24373 + }, + { + "epoch": 0.47, + "learning_rate": 1.0554153236767505e-07, + "loss": 0.0766, + "step": 24374 + }, + { + "epoch": 0.47, + "learning_rate": 1.0553764902333891e-07, + "loss": 0.0006, + "step": 24375 + }, + { + "epoch": 0.47, + "learning_rate": 1.0553376567900276e-07, + "loss": 0.106, + "step": 24376 + }, + { + "epoch": 0.47, + "learning_rate": 1.0552988233466662e-07, + "loss": 0.0006, + "step": 24377 + }, + { + "epoch": 0.47, + "learning_rate": 1.0552599899033048e-07, + "loss": 1.0586, + "step": 24378 + }, + { + "epoch": 0.47, + "learning_rate": 1.0552211564599434e-07, + "loss": 0.0005, + "step": 24379 + }, + { + "epoch": 0.47, + "learning_rate": 1.055182323016582e-07, + "loss": 0.0006, + "step": 24380 + }, + { + "epoch": 0.47, + "learning_rate": 1.0551434895732203e-07, + "loss": 0.0006, + "step": 24381 + }, + { + "epoch": 0.47, + "learning_rate": 1.0551046561298589e-07, + "loss": 0.0004, + "step": 24382 + }, + { + "epoch": 0.47, + "learning_rate": 1.0550658226864975e-07, + "loss": 0.0007, + "step": 24383 + }, + { + "epoch": 0.47, + "learning_rate": 1.055026989243136e-07, + "loss": 0.0005, + "step": 24384 + }, + { + "epoch": 0.47, + "learning_rate": 1.0549881557997746e-07, + "loss": 0.0006, + "step": 24385 + }, + { + "epoch": 0.47, + "learning_rate": 1.0549493223564132e-07, + "loss": 0.0054, + "step": 24386 + }, + { + "epoch": 0.47, + "learning_rate": 1.0549104889130518e-07, + "loss": 0.0052, + "step": 24387 + }, + { + "epoch": 0.47, + "learning_rate": 1.0548716554696904e-07, + "loss": 0.0006, + "step": 24388 + }, + { + "epoch": 0.47, + "learning_rate": 1.054832822026329e-07, + "loss": 0.1741, + "step": 24389 + }, + { + "epoch": 0.47, + "learning_rate": 1.0547939885829675e-07, + "loss": 0.0073, + "step": 24390 + }, + { + "epoch": 0.47, + "learning_rate": 1.0547551551396061e-07, + "loss": 0.001, + "step": 24391 + }, + { + "epoch": 0.47, + "learning_rate": 1.0547163216962447e-07, + "loss": 0.0005, + "step": 24392 + }, + { + "epoch": 0.47, + "learning_rate": 1.0546774882528833e-07, + "loss": 0.0005, + "step": 24393 + }, + { + "epoch": 0.47, + "learning_rate": 1.0546386548095219e-07, + "loss": 0.0007, + "step": 24394 + }, + { + "epoch": 0.47, + "learning_rate": 1.0545998213661605e-07, + "loss": 0.0006, + "step": 24395 + }, + { + "epoch": 0.47, + "learning_rate": 1.054560987922799e-07, + "loss": 0.0005, + "step": 24396 + }, + { + "epoch": 0.47, + "learning_rate": 1.0545221544794376e-07, + "loss": 0.0005, + "step": 24397 + }, + { + "epoch": 0.47, + "learning_rate": 1.0544833210360762e-07, + "loss": 0.0154, + "step": 24398 + }, + { + "epoch": 0.47, + "learning_rate": 1.0544444875927148e-07, + "loss": 0.0006, + "step": 24399 + }, + { + "epoch": 0.47, + "learning_rate": 1.0544056541493534e-07, + "loss": 0.0008, + "step": 24400 + }, + { + "epoch": 0.47, + "learning_rate": 1.054366820705992e-07, + "loss": 0.0006, + "step": 24401 + }, + { + "epoch": 0.47, + "learning_rate": 1.0543279872626305e-07, + "loss": 0.0005, + "step": 24402 + }, + { + "epoch": 0.47, + "learning_rate": 1.0542891538192691e-07, + "loss": 0.0005, + "step": 24403 + }, + { + "epoch": 0.47, + "learning_rate": 1.0542503203759077e-07, + "loss": 0.4741, + "step": 24404 + }, + { + "epoch": 0.47, + "learning_rate": 1.0542114869325463e-07, + "loss": 0.0009, + "step": 24405 + }, + { + "epoch": 0.47, + "learning_rate": 1.0541726534891849e-07, + "loss": 1.0946, + "step": 24406 + }, + { + "epoch": 0.47, + "learning_rate": 1.0541338200458234e-07, + "loss": 0.0005, + "step": 24407 + }, + { + "epoch": 0.47, + "learning_rate": 1.054094986602462e-07, + "loss": 0.0005, + "step": 24408 + }, + { + "epoch": 0.47, + "learning_rate": 1.0540561531591006e-07, + "loss": 0.0008, + "step": 24409 + }, + { + "epoch": 0.47, + "learning_rate": 1.0540173197157392e-07, + "loss": 0.0005, + "step": 24410 + }, + { + "epoch": 0.47, + "learning_rate": 1.0539784862723778e-07, + "loss": 0.0578, + "step": 24411 + }, + { + "epoch": 0.47, + "learning_rate": 1.0539396528290164e-07, + "loss": 0.0005, + "step": 24412 + }, + { + "epoch": 0.47, + "learning_rate": 1.053900819385655e-07, + "loss": 0.0009, + "step": 24413 + }, + { + "epoch": 0.47, + "learning_rate": 1.0538619859422935e-07, + "loss": 0.0005, + "step": 24414 + }, + { + "epoch": 0.47, + "learning_rate": 1.0538231524989321e-07, + "loss": 0.0005, + "step": 24415 + }, + { + "epoch": 0.47, + "learning_rate": 1.0537843190555707e-07, + "loss": 0.0005, + "step": 24416 + }, + { + "epoch": 0.47, + "learning_rate": 1.0537454856122093e-07, + "loss": 0.001, + "step": 24417 + }, + { + "epoch": 0.47, + "learning_rate": 1.0537066521688478e-07, + "loss": 0.0006, + "step": 24418 + }, + { + "epoch": 0.47, + "learning_rate": 1.0536678187254864e-07, + "loss": 0.0124, + "step": 24419 + }, + { + "epoch": 0.47, + "learning_rate": 1.053628985282125e-07, + "loss": 0.0008, + "step": 24420 + }, + { + "epoch": 0.47, + "learning_rate": 1.0535901518387636e-07, + "loss": 1.2126, + "step": 24421 + }, + { + "epoch": 0.47, + "learning_rate": 1.0535513183954022e-07, + "loss": 0.0007, + "step": 24422 + }, + { + "epoch": 0.47, + "learning_rate": 1.0535124849520408e-07, + "loss": 0.0005, + "step": 24423 + }, + { + "epoch": 0.47, + "learning_rate": 1.0534736515086793e-07, + "loss": 0.0006, + "step": 24424 + }, + { + "epoch": 0.47, + "learning_rate": 1.0534348180653179e-07, + "loss": 0.0008, + "step": 24425 + }, + { + "epoch": 0.47, + "learning_rate": 1.0533959846219565e-07, + "loss": 0.0008, + "step": 24426 + }, + { + "epoch": 0.47, + "learning_rate": 1.0533571511785951e-07, + "loss": 0.1554, + "step": 24427 + }, + { + "epoch": 0.47, + "learning_rate": 1.0533183177352337e-07, + "loss": 0.0006, + "step": 24428 + }, + { + "epoch": 0.47, + "learning_rate": 1.0532794842918723e-07, + "loss": 0.0005, + "step": 24429 + }, + { + "epoch": 0.47, + "learning_rate": 1.0532406508485107e-07, + "loss": 0.0005, + "step": 24430 + }, + { + "epoch": 0.47, + "learning_rate": 1.0532018174051493e-07, + "loss": 0.0006, + "step": 24431 + }, + { + "epoch": 0.47, + "learning_rate": 1.0531629839617879e-07, + "loss": 0.0007, + "step": 24432 + }, + { + "epoch": 0.47, + "learning_rate": 1.0531241505184265e-07, + "loss": 0.0005, + "step": 24433 + }, + { + "epoch": 0.47, + "learning_rate": 1.053085317075065e-07, + "loss": 0.0005, + "step": 24434 + }, + { + "epoch": 0.47, + "learning_rate": 1.0530464836317036e-07, + "loss": 0.0005, + "step": 24435 + }, + { + "epoch": 0.47, + "learning_rate": 1.0530076501883422e-07, + "loss": 0.0009, + "step": 24436 + }, + { + "epoch": 0.47, + "learning_rate": 1.0529688167449808e-07, + "loss": 0.1398, + "step": 24437 + }, + { + "epoch": 0.47, + "learning_rate": 1.0529299833016194e-07, + "loss": 0.0011, + "step": 24438 + }, + { + "epoch": 0.47, + "learning_rate": 1.0528911498582578e-07, + "loss": 0.0017, + "step": 24439 + }, + { + "epoch": 0.47, + "learning_rate": 1.0528523164148964e-07, + "loss": 0.0006, + "step": 24440 + }, + { + "epoch": 0.47, + "learning_rate": 1.052813482971535e-07, + "loss": 0.0004, + "step": 24441 + }, + { + "epoch": 0.47, + "learning_rate": 1.0527746495281736e-07, + "loss": 0.0006, + "step": 24442 + }, + { + "epoch": 0.47, + "learning_rate": 1.0527358160848121e-07, + "loss": 0.0006, + "step": 24443 + }, + { + "epoch": 0.47, + "learning_rate": 1.0526969826414507e-07, + "loss": 0.5696, + "step": 24444 + }, + { + "epoch": 0.47, + "learning_rate": 1.0526581491980893e-07, + "loss": 0.0007, + "step": 24445 + }, + { + "epoch": 0.47, + "learning_rate": 1.0526193157547279e-07, + "loss": 0.0004, + "step": 24446 + }, + { + "epoch": 0.47, + "learning_rate": 1.0525804823113665e-07, + "loss": 0.0006, + "step": 24447 + }, + { + "epoch": 0.47, + "learning_rate": 1.052541648868005e-07, + "loss": 0.0009, + "step": 24448 + }, + { + "epoch": 0.47, + "learning_rate": 1.0525028154246436e-07, + "loss": 0.6453, + "step": 24449 + }, + { + "epoch": 0.47, + "learning_rate": 1.0524639819812822e-07, + "loss": 0.064, + "step": 24450 + }, + { + "epoch": 0.47, + "learning_rate": 1.0524251485379208e-07, + "loss": 0.0007, + "step": 24451 + }, + { + "epoch": 0.47, + "learning_rate": 1.0523863150945594e-07, + "loss": 0.001, + "step": 24452 + }, + { + "epoch": 0.47, + "learning_rate": 1.052347481651198e-07, + "loss": 0.0006, + "step": 24453 + }, + { + "epoch": 0.47, + "learning_rate": 1.0523086482078366e-07, + "loss": 0.0009, + "step": 24454 + }, + { + "epoch": 0.47, + "learning_rate": 1.0522698147644751e-07, + "loss": 0.0007, + "step": 24455 + }, + { + "epoch": 0.47, + "learning_rate": 1.0522309813211137e-07, + "loss": 0.0005, + "step": 24456 + }, + { + "epoch": 0.47, + "learning_rate": 1.0521921478777523e-07, + "loss": 0.0006, + "step": 24457 + }, + { + "epoch": 0.47, + "learning_rate": 1.0521533144343909e-07, + "loss": 0.0006, + "step": 24458 + }, + { + "epoch": 0.47, + "learning_rate": 1.0521144809910293e-07, + "loss": 0.0004, + "step": 24459 + }, + { + "epoch": 0.47, + "learning_rate": 1.0520756475476679e-07, + "loss": 0.0023, + "step": 24460 + }, + { + "epoch": 0.47, + "learning_rate": 1.0520368141043065e-07, + "loss": 0.0418, + "step": 24461 + }, + { + "epoch": 0.47, + "learning_rate": 1.0519979806609451e-07, + "loss": 0.0006, + "step": 24462 + }, + { + "epoch": 0.47, + "learning_rate": 1.0519591472175837e-07, + "loss": 0.0004, + "step": 24463 + }, + { + "epoch": 0.47, + "learning_rate": 1.0519203137742222e-07, + "loss": 0.0005, + "step": 24464 + }, + { + "epoch": 0.47, + "learning_rate": 1.0518814803308608e-07, + "loss": 0.0007, + "step": 24465 + }, + { + "epoch": 0.47, + "learning_rate": 1.0518426468874994e-07, + "loss": 0.0009, + "step": 24466 + }, + { + "epoch": 0.47, + "learning_rate": 1.051803813444138e-07, + "loss": 0.0009, + "step": 24467 + }, + { + "epoch": 0.47, + "learning_rate": 1.0517649800007766e-07, + "loss": 0.0006, + "step": 24468 + }, + { + "epoch": 0.47, + "learning_rate": 1.0517261465574152e-07, + "loss": 0.0006, + "step": 24469 + }, + { + "epoch": 0.47, + "learning_rate": 1.0516873131140537e-07, + "loss": 0.0613, + "step": 24470 + }, + { + "epoch": 0.47, + "learning_rate": 1.0516484796706923e-07, + "loss": 0.0005, + "step": 24471 + }, + { + "epoch": 0.47, + "learning_rate": 1.0516096462273309e-07, + "loss": 0.0005, + "step": 24472 + }, + { + "epoch": 0.47, + "learning_rate": 1.0515708127839695e-07, + "loss": 0.0068, + "step": 24473 + }, + { + "epoch": 0.47, + "learning_rate": 1.0515319793406081e-07, + "loss": 0.0005, + "step": 24474 + }, + { + "epoch": 0.47, + "learning_rate": 1.0514931458972466e-07, + "loss": 0.0006, + "step": 24475 + }, + { + "epoch": 0.47, + "learning_rate": 1.0514543124538852e-07, + "loss": 0.0005, + "step": 24476 + }, + { + "epoch": 0.47, + "learning_rate": 1.0514154790105238e-07, + "loss": 0.0005, + "step": 24477 + }, + { + "epoch": 0.47, + "learning_rate": 1.0513766455671624e-07, + "loss": 0.0007, + "step": 24478 + }, + { + "epoch": 0.47, + "learning_rate": 1.051337812123801e-07, + "loss": 0.0032, + "step": 24479 + }, + { + "epoch": 0.47, + "learning_rate": 1.0512989786804396e-07, + "loss": 0.0008, + "step": 24480 + }, + { + "epoch": 0.47, + "learning_rate": 1.0512601452370781e-07, + "loss": 0.0007, + "step": 24481 + }, + { + "epoch": 0.47, + "learning_rate": 1.0512213117937167e-07, + "loss": 0.0007, + "step": 24482 + }, + { + "epoch": 0.47, + "learning_rate": 1.0511824783503553e-07, + "loss": 1.1308, + "step": 24483 + }, + { + "epoch": 0.47, + "learning_rate": 1.0511436449069939e-07, + "loss": 0.0012, + "step": 24484 + }, + { + "epoch": 0.47, + "learning_rate": 1.0511048114636325e-07, + "loss": 0.0007, + "step": 24485 + }, + { + "epoch": 0.47, + "learning_rate": 1.051065978020271e-07, + "loss": 0.0006, + "step": 24486 + }, + { + "epoch": 0.47, + "learning_rate": 1.0510271445769096e-07, + "loss": 0.0735, + "step": 24487 + }, + { + "epoch": 0.48, + "learning_rate": 1.0509883111335482e-07, + "loss": 0.1008, + "step": 24488 + }, + { + "epoch": 0.48, + "learning_rate": 1.0509494776901868e-07, + "loss": 0.0007, + "step": 24489 + }, + { + "epoch": 0.48, + "learning_rate": 1.0509106442468254e-07, + "loss": 0.185, + "step": 24490 + }, + { + "epoch": 0.48, + "learning_rate": 1.050871810803464e-07, + "loss": 0.0006, + "step": 24491 + }, + { + "epoch": 0.48, + "learning_rate": 1.0508329773601026e-07, + "loss": 0.0006, + "step": 24492 + }, + { + "epoch": 0.48, + "learning_rate": 1.0507941439167411e-07, + "loss": 0.0006, + "step": 24493 + }, + { + "epoch": 0.48, + "learning_rate": 1.0507553104733797e-07, + "loss": 1.1907, + "step": 24494 + }, + { + "epoch": 0.48, + "learning_rate": 1.0507164770300183e-07, + "loss": 0.0005, + "step": 24495 + }, + { + "epoch": 0.48, + "learning_rate": 1.0506776435866569e-07, + "loss": 1.0879, + "step": 24496 + }, + { + "epoch": 0.48, + "learning_rate": 1.0506388101432952e-07, + "loss": 0.0007, + "step": 24497 + }, + { + "epoch": 0.48, + "learning_rate": 1.0505999766999338e-07, + "loss": 0.0005, + "step": 24498 + }, + { + "epoch": 0.48, + "learning_rate": 1.0505611432565724e-07, + "loss": 0.0005, + "step": 24499 + }, + { + "epoch": 0.48, + "learning_rate": 1.050522309813211e-07, + "loss": 0.0006, + "step": 24500 + }, + { + "epoch": 0.48, + "learning_rate": 1.0504834763698495e-07, + "loss": 0.0008, + "step": 24501 + }, + { + "epoch": 0.48, + "learning_rate": 1.0504446429264881e-07, + "loss": 0.0007, + "step": 24502 + }, + { + "epoch": 0.48, + "learning_rate": 1.0504058094831267e-07, + "loss": 0.0006, + "step": 24503 + }, + { + "epoch": 0.48, + "learning_rate": 1.0503669760397653e-07, + "loss": 0.0005, + "step": 24504 + }, + { + "epoch": 0.48, + "learning_rate": 1.0503281425964039e-07, + "loss": 0.0006, + "step": 24505 + }, + { + "epoch": 0.48, + "learning_rate": 1.0502893091530424e-07, + "loss": 0.0005, + "step": 24506 + }, + { + "epoch": 0.48, + "learning_rate": 1.050250475709681e-07, + "loss": 0.0006, + "step": 24507 + }, + { + "epoch": 0.48, + "learning_rate": 1.0502116422663196e-07, + "loss": 0.0007, + "step": 24508 + }, + { + "epoch": 0.48, + "learning_rate": 1.0501728088229582e-07, + "loss": 0.0005, + "step": 24509 + }, + { + "epoch": 0.48, + "learning_rate": 1.0501339753795968e-07, + "loss": 0.0007, + "step": 24510 + }, + { + "epoch": 0.48, + "learning_rate": 1.0500951419362354e-07, + "loss": 0.0005, + "step": 24511 + }, + { + "epoch": 0.48, + "learning_rate": 1.050056308492874e-07, + "loss": 0.6324, + "step": 24512 + }, + { + "epoch": 0.48, + "learning_rate": 1.0500174750495125e-07, + "loss": 0.0008, + "step": 24513 + }, + { + "epoch": 0.48, + "learning_rate": 1.0499786416061511e-07, + "loss": 0.0005, + "step": 24514 + }, + { + "epoch": 0.48, + "learning_rate": 1.0499398081627897e-07, + "loss": 0.5027, + "step": 24515 + }, + { + "epoch": 0.48, + "learning_rate": 1.0499009747194283e-07, + "loss": 0.0009, + "step": 24516 + }, + { + "epoch": 0.48, + "learning_rate": 1.0498621412760668e-07, + "loss": 0.0006, + "step": 24517 + }, + { + "epoch": 0.48, + "learning_rate": 1.0498233078327054e-07, + "loss": 0.0006, + "step": 24518 + }, + { + "epoch": 0.48, + "learning_rate": 1.049784474389344e-07, + "loss": 0.0005, + "step": 24519 + }, + { + "epoch": 0.48, + "learning_rate": 1.0497456409459826e-07, + "loss": 0.001, + "step": 24520 + }, + { + "epoch": 0.48, + "learning_rate": 1.0497068075026212e-07, + "loss": 0.0006, + "step": 24521 + }, + { + "epoch": 0.48, + "learning_rate": 1.0496679740592598e-07, + "loss": 1.1413, + "step": 24522 + }, + { + "epoch": 0.48, + "learning_rate": 1.0496291406158983e-07, + "loss": 0.0083, + "step": 24523 + }, + { + "epoch": 0.48, + "learning_rate": 1.0495903071725369e-07, + "loss": 0.0005, + "step": 24524 + }, + { + "epoch": 0.48, + "learning_rate": 1.0495514737291755e-07, + "loss": 0.0242, + "step": 24525 + }, + { + "epoch": 0.48, + "learning_rate": 1.0495126402858141e-07, + "loss": 0.7611, + "step": 24526 + }, + { + "epoch": 0.48, + "learning_rate": 1.0494738068424527e-07, + "loss": 0.0006, + "step": 24527 + }, + { + "epoch": 0.48, + "learning_rate": 1.0494349733990913e-07, + "loss": 0.0021, + "step": 24528 + }, + { + "epoch": 0.48, + "learning_rate": 1.0493961399557298e-07, + "loss": 0.1563, + "step": 24529 + }, + { + "epoch": 0.48, + "learning_rate": 1.0493573065123684e-07, + "loss": 0.2127, + "step": 24530 + }, + { + "epoch": 0.48, + "learning_rate": 1.049318473069007e-07, + "loss": 0.0005, + "step": 24531 + }, + { + "epoch": 0.48, + "learning_rate": 1.0492796396256456e-07, + "loss": 0.0008, + "step": 24532 + }, + { + "epoch": 0.48, + "learning_rate": 1.0492408061822842e-07, + "loss": 0.0006, + "step": 24533 + }, + { + "epoch": 0.48, + "learning_rate": 1.0492019727389227e-07, + "loss": 0.0007, + "step": 24534 + }, + { + "epoch": 0.48, + "learning_rate": 1.0491631392955613e-07, + "loss": 0.0006, + "step": 24535 + }, + { + "epoch": 0.48, + "learning_rate": 1.0491243058521999e-07, + "loss": 0.0248, + "step": 24536 + }, + { + "epoch": 0.48, + "learning_rate": 1.0490854724088385e-07, + "loss": 0.0007, + "step": 24537 + }, + { + "epoch": 0.48, + "learning_rate": 1.0490466389654771e-07, + "loss": 0.0007, + "step": 24538 + }, + { + "epoch": 0.48, + "learning_rate": 1.0490078055221157e-07, + "loss": 0.0004, + "step": 24539 + }, + { + "epoch": 0.48, + "learning_rate": 1.0489689720787542e-07, + "loss": 0.0005, + "step": 24540 + }, + { + "epoch": 0.48, + "learning_rate": 1.0489301386353928e-07, + "loss": 0.0006, + "step": 24541 + }, + { + "epoch": 0.48, + "learning_rate": 1.0488913051920314e-07, + "loss": 0.0007, + "step": 24542 + }, + { + "epoch": 0.48, + "learning_rate": 1.04885247174867e-07, + "loss": 0.0158, + "step": 24543 + }, + { + "epoch": 0.48, + "learning_rate": 1.0488136383053086e-07, + "loss": 0.0006, + "step": 24544 + }, + { + "epoch": 0.48, + "learning_rate": 1.0487748048619472e-07, + "loss": 0.0007, + "step": 24545 + }, + { + "epoch": 0.48, + "learning_rate": 1.0487359714185857e-07, + "loss": 0.0006, + "step": 24546 + }, + { + "epoch": 0.48, + "learning_rate": 1.0486971379752243e-07, + "loss": 0.0009, + "step": 24547 + }, + { + "epoch": 0.48, + "learning_rate": 1.0486583045318629e-07, + "loss": 0.0006, + "step": 24548 + }, + { + "epoch": 0.48, + "learning_rate": 1.0486194710885015e-07, + "loss": 0.0006, + "step": 24549 + }, + { + "epoch": 0.48, + "learning_rate": 1.0485806376451401e-07, + "loss": 0.0005, + "step": 24550 + }, + { + "epoch": 0.48, + "learning_rate": 1.0485418042017787e-07, + "loss": 0.002, + "step": 24551 + }, + { + "epoch": 0.48, + "learning_rate": 1.0485029707584172e-07, + "loss": 0.0008, + "step": 24552 + }, + { + "epoch": 0.48, + "learning_rate": 1.0484641373150558e-07, + "loss": 0.0007, + "step": 24553 + }, + { + "epoch": 0.48, + "learning_rate": 1.0484253038716944e-07, + "loss": 0.0006, + "step": 24554 + }, + { + "epoch": 0.48, + "learning_rate": 1.0483864704283327e-07, + "loss": 0.0007, + "step": 24555 + }, + { + "epoch": 0.48, + "learning_rate": 1.0483476369849713e-07, + "loss": 0.0008, + "step": 24556 + }, + { + "epoch": 0.48, + "learning_rate": 1.0483088035416099e-07, + "loss": 0.001, + "step": 24557 + }, + { + "epoch": 0.48, + "learning_rate": 1.0482699700982485e-07, + "loss": 0.0006, + "step": 24558 + }, + { + "epoch": 0.48, + "learning_rate": 1.048231136654887e-07, + "loss": 0.202, + "step": 24559 + }, + { + "epoch": 0.48, + "learning_rate": 1.0481923032115256e-07, + "loss": 0.0004, + "step": 24560 + }, + { + "epoch": 0.48, + "learning_rate": 1.0481534697681642e-07, + "loss": 0.0005, + "step": 24561 + }, + { + "epoch": 0.48, + "learning_rate": 1.0481146363248028e-07, + "loss": 0.0006, + "step": 24562 + }, + { + "epoch": 0.48, + "learning_rate": 1.0480758028814414e-07, + "loss": 0.0009, + "step": 24563 + }, + { + "epoch": 0.48, + "learning_rate": 1.04803696943808e-07, + "loss": 0.0006, + "step": 24564 + }, + { + "epoch": 0.48, + "learning_rate": 1.0479981359947185e-07, + "loss": 0.0006, + "step": 24565 + }, + { + "epoch": 0.48, + "learning_rate": 1.0479593025513571e-07, + "loss": 0.0013, + "step": 24566 + }, + { + "epoch": 0.48, + "learning_rate": 1.0479204691079957e-07, + "loss": 0.0006, + "step": 24567 + }, + { + "epoch": 0.48, + "learning_rate": 1.0478816356646343e-07, + "loss": 0.0192, + "step": 24568 + }, + { + "epoch": 0.48, + "learning_rate": 1.0478428022212729e-07, + "loss": 0.0004, + "step": 24569 + }, + { + "epoch": 0.48, + "learning_rate": 1.0478039687779115e-07, + "loss": 0.0004, + "step": 24570 + }, + { + "epoch": 0.48, + "learning_rate": 1.04776513533455e-07, + "loss": 0.0276, + "step": 24571 + }, + { + "epoch": 0.48, + "learning_rate": 1.0477263018911886e-07, + "loss": 0.0007, + "step": 24572 + }, + { + "epoch": 0.48, + "learning_rate": 1.0476874684478272e-07, + "loss": 0.0005, + "step": 24573 + }, + { + "epoch": 0.48, + "learning_rate": 1.0476486350044658e-07, + "loss": 0.0009, + "step": 24574 + }, + { + "epoch": 0.48, + "learning_rate": 1.0476098015611044e-07, + "loss": 0.0005, + "step": 24575 + }, + { + "epoch": 0.48, + "learning_rate": 1.047570968117743e-07, + "loss": 0.0005, + "step": 24576 + }, + { + "epoch": 0.48, + "learning_rate": 1.0475321346743815e-07, + "loss": 0.0005, + "step": 24577 + }, + { + "epoch": 0.48, + "learning_rate": 1.0474933012310201e-07, + "loss": 0.0006, + "step": 24578 + }, + { + "epoch": 0.48, + "learning_rate": 1.0474544677876587e-07, + "loss": 0.0006, + "step": 24579 + }, + { + "epoch": 0.48, + "learning_rate": 1.0474156343442973e-07, + "loss": 0.0006, + "step": 24580 + }, + { + "epoch": 0.48, + "learning_rate": 1.0473768009009359e-07, + "loss": 1.2254, + "step": 24581 + }, + { + "epoch": 0.48, + "learning_rate": 1.0473379674575744e-07, + "loss": 0.0006, + "step": 24582 + }, + { + "epoch": 0.48, + "learning_rate": 1.047299134014213e-07, + "loss": 0.0008, + "step": 24583 + }, + { + "epoch": 0.48, + "learning_rate": 1.0472603005708516e-07, + "loss": 0.0006, + "step": 24584 + }, + { + "epoch": 0.48, + "learning_rate": 1.0472214671274902e-07, + "loss": 0.0005, + "step": 24585 + }, + { + "epoch": 0.48, + "learning_rate": 1.0471826336841288e-07, + "loss": 0.0004, + "step": 24586 + }, + { + "epoch": 0.48, + "learning_rate": 1.0471438002407674e-07, + "loss": 0.5894, + "step": 24587 + }, + { + "epoch": 0.48, + "learning_rate": 1.047104966797406e-07, + "loss": 0.0007, + "step": 24588 + }, + { + "epoch": 0.48, + "learning_rate": 1.0470661333540445e-07, + "loss": 1.1398, + "step": 24589 + }, + { + "epoch": 0.48, + "learning_rate": 1.0470272999106831e-07, + "loss": 1.1071, + "step": 24590 + }, + { + "epoch": 0.48, + "learning_rate": 1.0469884664673217e-07, + "loss": 0.0004, + "step": 24591 + }, + { + "epoch": 0.48, + "learning_rate": 1.0469496330239603e-07, + "loss": 0.0005, + "step": 24592 + }, + { + "epoch": 0.48, + "learning_rate": 1.0469107995805988e-07, + "loss": 0.0005, + "step": 24593 + }, + { + "epoch": 0.48, + "learning_rate": 1.0468719661372374e-07, + "loss": 0.0006, + "step": 24594 + }, + { + "epoch": 0.48, + "learning_rate": 1.046833132693876e-07, + "loss": 0.0005, + "step": 24595 + }, + { + "epoch": 0.48, + "learning_rate": 1.0467942992505146e-07, + "loss": 0.0005, + "step": 24596 + }, + { + "epoch": 0.48, + "learning_rate": 1.0467554658071532e-07, + "loss": 0.0008, + "step": 24597 + }, + { + "epoch": 0.48, + "learning_rate": 1.0467166323637918e-07, + "loss": 0.0006, + "step": 24598 + }, + { + "epoch": 0.48, + "learning_rate": 1.0466777989204303e-07, + "loss": 0.0005, + "step": 24599 + }, + { + "epoch": 0.48, + "learning_rate": 1.0466389654770689e-07, + "loss": 0.0006, + "step": 24600 + }, + { + "epoch": 0.48, + "learning_rate": 1.0466001320337075e-07, + "loss": 1.2289, + "step": 24601 + }, + { + "epoch": 0.48, + "learning_rate": 1.0465612985903461e-07, + "loss": 0.0005, + "step": 24602 + }, + { + "epoch": 0.48, + "learning_rate": 1.0465224651469847e-07, + "loss": 0.0006, + "step": 24603 + }, + { + "epoch": 0.48, + "learning_rate": 1.0464836317036233e-07, + "loss": 0.0004, + "step": 24604 + }, + { + "epoch": 0.48, + "learning_rate": 1.0464447982602618e-07, + "loss": 0.0006, + "step": 24605 + }, + { + "epoch": 0.48, + "learning_rate": 1.0464059648169004e-07, + "loss": 0.0006, + "step": 24606 + }, + { + "epoch": 0.48, + "learning_rate": 1.0463671313735389e-07, + "loss": 0.0007, + "step": 24607 + }, + { + "epoch": 0.48, + "learning_rate": 1.0463282979301775e-07, + "loss": 0.0032, + "step": 24608 + }, + { + "epoch": 0.48, + "learning_rate": 1.046289464486816e-07, + "loss": 0.0009, + "step": 24609 + }, + { + "epoch": 0.48, + "learning_rate": 1.0462506310434546e-07, + "loss": 0.001, + "step": 24610 + }, + { + "epoch": 0.48, + "learning_rate": 1.0462117976000932e-07, + "loss": 0.0006, + "step": 24611 + }, + { + "epoch": 0.48, + "learning_rate": 1.0461729641567318e-07, + "loss": 0.0006, + "step": 24612 + }, + { + "epoch": 0.48, + "learning_rate": 1.0461341307133702e-07, + "loss": 0.0008, + "step": 24613 + }, + { + "epoch": 0.48, + "learning_rate": 1.0460952972700088e-07, + "loss": 0.001, + "step": 24614 + }, + { + "epoch": 0.48, + "learning_rate": 1.0460564638266474e-07, + "loss": 1.0075, + "step": 24615 + }, + { + "epoch": 0.48, + "learning_rate": 1.046017630383286e-07, + "loss": 0.0247, + "step": 24616 + }, + { + "epoch": 0.48, + "learning_rate": 1.0459787969399246e-07, + "loss": 0.0012, + "step": 24617 + }, + { + "epoch": 0.48, + "learning_rate": 1.0459399634965631e-07, + "loss": 0.0008, + "step": 24618 + }, + { + "epoch": 0.48, + "learning_rate": 1.0459011300532017e-07, + "loss": 0.9814, + "step": 24619 + }, + { + "epoch": 0.48, + "learning_rate": 1.0458622966098403e-07, + "loss": 0.0007, + "step": 24620 + }, + { + "epoch": 0.48, + "learning_rate": 1.0458234631664789e-07, + "loss": 0.0006, + "step": 24621 + }, + { + "epoch": 0.48, + "learning_rate": 1.0457846297231175e-07, + "loss": 0.0006, + "step": 24622 + }, + { + "epoch": 0.48, + "learning_rate": 1.045745796279756e-07, + "loss": 0.0007, + "step": 24623 + }, + { + "epoch": 0.48, + "learning_rate": 1.0457069628363946e-07, + "loss": 0.3735, + "step": 24624 + }, + { + "epoch": 0.48, + "learning_rate": 1.0456681293930332e-07, + "loss": 0.0005, + "step": 24625 + }, + { + "epoch": 0.48, + "learning_rate": 1.0456292959496718e-07, + "loss": 0.0007, + "step": 24626 + }, + { + "epoch": 0.48, + "learning_rate": 1.0455904625063104e-07, + "loss": 0.0026, + "step": 24627 + }, + { + "epoch": 0.48, + "learning_rate": 1.045551629062949e-07, + "loss": 0.002, + "step": 24628 + }, + { + "epoch": 0.48, + "learning_rate": 1.0455127956195876e-07, + "loss": 0.8516, + "step": 24629 + }, + { + "epoch": 0.48, + "learning_rate": 1.0454739621762261e-07, + "loss": 0.0006, + "step": 24630 + }, + { + "epoch": 0.48, + "learning_rate": 1.0454351287328647e-07, + "loss": 0.0007, + "step": 24631 + }, + { + "epoch": 0.48, + "learning_rate": 1.0453962952895033e-07, + "loss": 0.0009, + "step": 24632 + }, + { + "epoch": 0.48, + "learning_rate": 1.0453574618461419e-07, + "loss": 0.0007, + "step": 24633 + }, + { + "epoch": 0.48, + "learning_rate": 1.0453186284027805e-07, + "loss": 0.0008, + "step": 24634 + }, + { + "epoch": 0.48, + "learning_rate": 1.045279794959419e-07, + "loss": 0.0006, + "step": 24635 + }, + { + "epoch": 0.48, + "learning_rate": 1.0452409615160575e-07, + "loss": 0.0009, + "step": 24636 + }, + { + "epoch": 0.48, + "learning_rate": 1.0452021280726961e-07, + "loss": 0.0005, + "step": 24637 + }, + { + "epoch": 0.48, + "learning_rate": 1.0451632946293347e-07, + "loss": 0.0083, + "step": 24638 + }, + { + "epoch": 0.48, + "learning_rate": 1.0451244611859732e-07, + "loss": 0.0007, + "step": 24639 + }, + { + "epoch": 0.48, + "learning_rate": 1.0450856277426118e-07, + "loss": 0.0007, + "step": 24640 + }, + { + "epoch": 0.48, + "learning_rate": 1.0450467942992504e-07, + "loss": 0.353, + "step": 24641 + }, + { + "epoch": 0.48, + "learning_rate": 1.045007960855889e-07, + "loss": 1.0284, + "step": 24642 + }, + { + "epoch": 0.48, + "learning_rate": 1.0449691274125276e-07, + "loss": 0.0372, + "step": 24643 + }, + { + "epoch": 0.48, + "learning_rate": 1.0449302939691662e-07, + "loss": 0.0006, + "step": 24644 + }, + { + "epoch": 0.48, + "learning_rate": 1.0448914605258047e-07, + "loss": 0.0005, + "step": 24645 + }, + { + "epoch": 0.48, + "learning_rate": 1.0448526270824433e-07, + "loss": 0.0006, + "step": 24646 + }, + { + "epoch": 0.48, + "learning_rate": 1.0448137936390819e-07, + "loss": 0.0006, + "step": 24647 + }, + { + "epoch": 0.48, + "learning_rate": 1.0447749601957205e-07, + "loss": 0.0009, + "step": 24648 + }, + { + "epoch": 0.48, + "learning_rate": 1.0447361267523591e-07, + "loss": 0.0005, + "step": 24649 + }, + { + "epoch": 0.48, + "learning_rate": 1.0446972933089977e-07, + "loss": 0.0053, + "step": 24650 + }, + { + "epoch": 0.48, + "learning_rate": 1.0446584598656362e-07, + "loss": 0.0005, + "step": 24651 + }, + { + "epoch": 0.48, + "learning_rate": 1.0446196264222748e-07, + "loss": 0.0006, + "step": 24652 + }, + { + "epoch": 0.48, + "learning_rate": 1.0445807929789134e-07, + "loss": 0.5947, + "step": 24653 + }, + { + "epoch": 0.48, + "learning_rate": 1.044541959535552e-07, + "loss": 0.1324, + "step": 24654 + }, + { + "epoch": 0.48, + "learning_rate": 1.0445031260921906e-07, + "loss": 0.0105, + "step": 24655 + }, + { + "epoch": 0.48, + "learning_rate": 1.0444642926488291e-07, + "loss": 0.0005, + "step": 24656 + }, + { + "epoch": 0.48, + "learning_rate": 1.0444254592054677e-07, + "loss": 0.0005, + "step": 24657 + }, + { + "epoch": 0.48, + "learning_rate": 1.0443866257621063e-07, + "loss": 0.0005, + "step": 24658 + }, + { + "epoch": 0.48, + "learning_rate": 1.0443477923187449e-07, + "loss": 0.0015, + "step": 24659 + }, + { + "epoch": 0.48, + "learning_rate": 1.0443089588753835e-07, + "loss": 0.0005, + "step": 24660 + }, + { + "epoch": 0.48, + "learning_rate": 1.044270125432022e-07, + "loss": 0.0007, + "step": 24661 + }, + { + "epoch": 0.48, + "learning_rate": 1.0442312919886606e-07, + "loss": 0.0006, + "step": 24662 + }, + { + "epoch": 0.48, + "learning_rate": 1.0441924585452992e-07, + "loss": 0.0005, + "step": 24663 + }, + { + "epoch": 0.48, + "learning_rate": 1.0441536251019378e-07, + "loss": 0.0006, + "step": 24664 + }, + { + "epoch": 0.48, + "learning_rate": 1.0441147916585764e-07, + "loss": 0.0006, + "step": 24665 + }, + { + "epoch": 0.48, + "learning_rate": 1.044075958215215e-07, + "loss": 0.0006, + "step": 24666 + }, + { + "epoch": 0.48, + "learning_rate": 1.0440371247718536e-07, + "loss": 0.0013, + "step": 24667 + }, + { + "epoch": 0.48, + "learning_rate": 1.0439982913284921e-07, + "loss": 0.0008, + "step": 24668 + }, + { + "epoch": 0.48, + "learning_rate": 1.0439594578851307e-07, + "loss": 0.0008, + "step": 24669 + }, + { + "epoch": 0.48, + "learning_rate": 1.0439206244417693e-07, + "loss": 0.0007, + "step": 24670 + }, + { + "epoch": 0.48, + "learning_rate": 1.0438817909984076e-07, + "loss": 0.7461, + "step": 24671 + }, + { + "epoch": 0.48, + "learning_rate": 1.0438429575550462e-07, + "loss": 0.0008, + "step": 24672 + }, + { + "epoch": 0.48, + "learning_rate": 1.0438041241116848e-07, + "loss": 0.6278, + "step": 24673 + }, + { + "epoch": 0.48, + "learning_rate": 1.0437652906683234e-07, + "loss": 0.0007, + "step": 24674 + }, + { + "epoch": 0.48, + "learning_rate": 1.043726457224962e-07, + "loss": 0.0006, + "step": 24675 + }, + { + "epoch": 0.48, + "learning_rate": 1.0436876237816005e-07, + "loss": 0.0005, + "step": 24676 + }, + { + "epoch": 0.48, + "learning_rate": 1.0436487903382391e-07, + "loss": 0.0006, + "step": 24677 + }, + { + "epoch": 0.48, + "learning_rate": 1.0436099568948777e-07, + "loss": 0.0735, + "step": 24678 + }, + { + "epoch": 0.48, + "learning_rate": 1.0435711234515163e-07, + "loss": 0.0005, + "step": 24679 + }, + { + "epoch": 0.48, + "learning_rate": 1.0435322900081549e-07, + "loss": 0.0004, + "step": 24680 + }, + { + "epoch": 0.48, + "learning_rate": 1.0434934565647934e-07, + "loss": 0.0013, + "step": 24681 + }, + { + "epoch": 0.48, + "learning_rate": 1.043454623121432e-07, + "loss": 0.0009, + "step": 24682 + }, + { + "epoch": 0.48, + "learning_rate": 1.0434157896780706e-07, + "loss": 0.0007, + "step": 24683 + }, + { + "epoch": 0.48, + "learning_rate": 1.0433769562347092e-07, + "loss": 0.552, + "step": 24684 + }, + { + "epoch": 0.48, + "learning_rate": 1.0433381227913478e-07, + "loss": 0.0007, + "step": 24685 + }, + { + "epoch": 0.48, + "learning_rate": 1.0432992893479864e-07, + "loss": 0.0005, + "step": 24686 + }, + { + "epoch": 0.48, + "learning_rate": 1.043260455904625e-07, + "loss": 0.0007, + "step": 24687 + }, + { + "epoch": 0.48, + "learning_rate": 1.0432216224612635e-07, + "loss": 0.2396, + "step": 24688 + }, + { + "epoch": 0.48, + "learning_rate": 1.0431827890179021e-07, + "loss": 0.0004, + "step": 24689 + }, + { + "epoch": 0.48, + "learning_rate": 1.0431439555745407e-07, + "loss": 0.0014, + "step": 24690 + }, + { + "epoch": 0.48, + "learning_rate": 1.0431051221311793e-07, + "loss": 0.0011, + "step": 24691 + }, + { + "epoch": 0.48, + "learning_rate": 1.0430662886878178e-07, + "loss": 0.0009, + "step": 24692 + }, + { + "epoch": 0.48, + "learning_rate": 1.0430274552444564e-07, + "loss": 0.0005, + "step": 24693 + }, + { + "epoch": 0.48, + "learning_rate": 1.042988621801095e-07, + "loss": 0.0006, + "step": 24694 + }, + { + "epoch": 0.48, + "learning_rate": 1.0429497883577336e-07, + "loss": 0.0008, + "step": 24695 + }, + { + "epoch": 0.48, + "learning_rate": 1.0429109549143722e-07, + "loss": 0.0132, + "step": 24696 + }, + { + "epoch": 0.48, + "learning_rate": 1.0428721214710108e-07, + "loss": 0.0004, + "step": 24697 + }, + { + "epoch": 0.48, + "learning_rate": 1.0428332880276493e-07, + "loss": 0.0012, + "step": 24698 + }, + { + "epoch": 0.48, + "learning_rate": 1.0427944545842879e-07, + "loss": 0.0006, + "step": 24699 + }, + { + "epoch": 0.48, + "learning_rate": 1.0427556211409265e-07, + "loss": 0.0004, + "step": 24700 + }, + { + "epoch": 0.48, + "learning_rate": 1.0427167876975651e-07, + "loss": 0.0006, + "step": 24701 + }, + { + "epoch": 0.48, + "learning_rate": 1.0426779542542037e-07, + "loss": 0.7407, + "step": 24702 + }, + { + "epoch": 0.48, + "learning_rate": 1.0426391208108423e-07, + "loss": 0.0008, + "step": 24703 + }, + { + "epoch": 0.48, + "learning_rate": 1.0426002873674808e-07, + "loss": 0.0052, + "step": 24704 + }, + { + "epoch": 0.48, + "learning_rate": 1.0425614539241194e-07, + "loss": 0.0005, + "step": 24705 + }, + { + "epoch": 0.48, + "learning_rate": 1.042522620480758e-07, + "loss": 0.0007, + "step": 24706 + }, + { + "epoch": 0.48, + "learning_rate": 1.0424837870373966e-07, + "loss": 0.0006, + "step": 24707 + }, + { + "epoch": 0.48, + "learning_rate": 1.0424449535940352e-07, + "loss": 0.0009, + "step": 24708 + }, + { + "epoch": 0.48, + "learning_rate": 1.0424061201506738e-07, + "loss": 0.0005, + "step": 24709 + }, + { + "epoch": 0.48, + "learning_rate": 1.0423672867073123e-07, + "loss": 0.0004, + "step": 24710 + }, + { + "epoch": 0.48, + "learning_rate": 1.0423284532639509e-07, + "loss": 0.3214, + "step": 24711 + }, + { + "epoch": 0.48, + "learning_rate": 1.0422896198205895e-07, + "loss": 0.0057, + "step": 24712 + }, + { + "epoch": 0.48, + "learning_rate": 1.0422507863772281e-07, + "loss": 0.0005, + "step": 24713 + }, + { + "epoch": 0.48, + "learning_rate": 1.0422119529338667e-07, + "loss": 0.0006, + "step": 24714 + }, + { + "epoch": 0.48, + "learning_rate": 1.0421731194905052e-07, + "loss": 0.0006, + "step": 24715 + }, + { + "epoch": 0.48, + "learning_rate": 1.0421342860471438e-07, + "loss": 0.0023, + "step": 24716 + }, + { + "epoch": 0.48, + "learning_rate": 1.0420954526037824e-07, + "loss": 0.0005, + "step": 24717 + }, + { + "epoch": 0.48, + "learning_rate": 1.042056619160421e-07, + "loss": 0.0006, + "step": 24718 + }, + { + "epoch": 0.48, + "learning_rate": 1.0420177857170596e-07, + "loss": 0.0005, + "step": 24719 + }, + { + "epoch": 0.48, + "learning_rate": 1.0419789522736982e-07, + "loss": 0.0006, + "step": 24720 + }, + { + "epoch": 0.48, + "learning_rate": 1.0419401188303367e-07, + "loss": 0.0011, + "step": 24721 + }, + { + "epoch": 0.48, + "learning_rate": 1.0419012853869753e-07, + "loss": 0.003, + "step": 24722 + }, + { + "epoch": 0.48, + "learning_rate": 1.0418624519436139e-07, + "loss": 0.0006, + "step": 24723 + }, + { + "epoch": 0.48, + "learning_rate": 1.0418236185002525e-07, + "loss": 0.0006, + "step": 24724 + }, + { + "epoch": 0.48, + "learning_rate": 1.0417847850568911e-07, + "loss": 1.0682, + "step": 24725 + }, + { + "epoch": 0.48, + "learning_rate": 1.0417459516135297e-07, + "loss": 0.0007, + "step": 24726 + }, + { + "epoch": 0.48, + "learning_rate": 1.0417071181701682e-07, + "loss": 0.0008, + "step": 24727 + }, + { + "epoch": 0.48, + "learning_rate": 1.0416682847268068e-07, + "loss": 0.0009, + "step": 24728 + }, + { + "epoch": 0.48, + "learning_rate": 1.0416294512834451e-07, + "loss": 0.0031, + "step": 24729 + }, + { + "epoch": 0.48, + "learning_rate": 1.0415906178400837e-07, + "loss": 0.0004, + "step": 24730 + }, + { + "epoch": 0.48, + "learning_rate": 1.0415517843967223e-07, + "loss": 0.0011, + "step": 24731 + }, + { + "epoch": 0.48, + "learning_rate": 1.0415129509533609e-07, + "loss": 0.0753, + "step": 24732 + }, + { + "epoch": 0.48, + "learning_rate": 1.0414741175099995e-07, + "loss": 0.0016, + "step": 24733 + }, + { + "epoch": 0.48, + "learning_rate": 1.041435284066638e-07, + "loss": 0.0006, + "step": 24734 + }, + { + "epoch": 0.48, + "learning_rate": 1.0413964506232766e-07, + "loss": 0.0008, + "step": 24735 + }, + { + "epoch": 0.48, + "learning_rate": 1.0413576171799152e-07, + "loss": 0.0008, + "step": 24736 + }, + { + "epoch": 0.48, + "learning_rate": 1.0413187837365538e-07, + "loss": 0.0026, + "step": 24737 + }, + { + "epoch": 0.48, + "learning_rate": 1.0412799502931924e-07, + "loss": 0.0006, + "step": 24738 + }, + { + "epoch": 0.48, + "learning_rate": 1.041241116849831e-07, + "loss": 0.0007, + "step": 24739 + }, + { + "epoch": 0.48, + "learning_rate": 1.0412022834064695e-07, + "loss": 0.0071, + "step": 24740 + }, + { + "epoch": 0.48, + "learning_rate": 1.0411634499631081e-07, + "loss": 0.2438, + "step": 24741 + }, + { + "epoch": 0.48, + "learning_rate": 1.0411246165197467e-07, + "loss": 0.0005, + "step": 24742 + }, + { + "epoch": 0.48, + "learning_rate": 1.0410857830763853e-07, + "loss": 0.8901, + "step": 24743 + }, + { + "epoch": 0.48, + "learning_rate": 1.0410469496330239e-07, + "loss": 0.0007, + "step": 24744 + }, + { + "epoch": 0.48, + "learning_rate": 1.0410081161896625e-07, + "loss": 0.0008, + "step": 24745 + }, + { + "epoch": 0.48, + "learning_rate": 1.040969282746301e-07, + "loss": 0.7875, + "step": 24746 + }, + { + "epoch": 0.48, + "learning_rate": 1.0409304493029396e-07, + "loss": 0.0005, + "step": 24747 + }, + { + "epoch": 0.48, + "learning_rate": 1.0408916158595782e-07, + "loss": 0.0017, + "step": 24748 + }, + { + "epoch": 0.48, + "learning_rate": 1.0408527824162168e-07, + "loss": 0.0007, + "step": 24749 + }, + { + "epoch": 0.48, + "learning_rate": 1.0408139489728554e-07, + "loss": 0.0005, + "step": 24750 + }, + { + "epoch": 0.48, + "learning_rate": 1.040775115529494e-07, + "loss": 0.0005, + "step": 24751 + }, + { + "epoch": 0.48, + "learning_rate": 1.0407362820861325e-07, + "loss": 0.0006, + "step": 24752 + }, + { + "epoch": 0.48, + "learning_rate": 1.0406974486427711e-07, + "loss": 0.0057, + "step": 24753 + }, + { + "epoch": 0.48, + "learning_rate": 1.0406586151994097e-07, + "loss": 0.0009, + "step": 24754 + }, + { + "epoch": 0.48, + "learning_rate": 1.0406197817560483e-07, + "loss": 0.0007, + "step": 24755 + }, + { + "epoch": 0.48, + "learning_rate": 1.0405809483126869e-07, + "loss": 0.0007, + "step": 24756 + }, + { + "epoch": 0.48, + "learning_rate": 1.0405421148693254e-07, + "loss": 0.0006, + "step": 24757 + }, + { + "epoch": 0.48, + "learning_rate": 1.040503281425964e-07, + "loss": 0.0008, + "step": 24758 + }, + { + "epoch": 0.48, + "learning_rate": 1.0404644479826026e-07, + "loss": 0.0005, + "step": 24759 + }, + { + "epoch": 0.48, + "learning_rate": 1.0404256145392412e-07, + "loss": 0.0008, + "step": 24760 + }, + { + "epoch": 0.48, + "learning_rate": 1.0403867810958798e-07, + "loss": 0.0009, + "step": 24761 + }, + { + "epoch": 0.48, + "learning_rate": 1.0403479476525184e-07, + "loss": 1.1354, + "step": 24762 + }, + { + "epoch": 0.48, + "learning_rate": 1.040309114209157e-07, + "loss": 0.0006, + "step": 24763 + }, + { + "epoch": 0.48, + "learning_rate": 1.0402702807657955e-07, + "loss": 0.7606, + "step": 24764 + }, + { + "epoch": 0.48, + "learning_rate": 1.0402314473224341e-07, + "loss": 0.0006, + "step": 24765 + }, + { + "epoch": 0.48, + "learning_rate": 1.0401926138790727e-07, + "loss": 0.4144, + "step": 24766 + }, + { + "epoch": 0.48, + "learning_rate": 1.0401537804357113e-07, + "loss": 0.0011, + "step": 24767 + }, + { + "epoch": 0.48, + "learning_rate": 1.0401149469923498e-07, + "loss": 0.0008, + "step": 24768 + }, + { + "epoch": 0.48, + "learning_rate": 1.0400761135489884e-07, + "loss": 0.2709, + "step": 24769 + }, + { + "epoch": 0.48, + "learning_rate": 1.040037280105627e-07, + "loss": 0.0009, + "step": 24770 + }, + { + "epoch": 0.48, + "learning_rate": 1.0399984466622656e-07, + "loss": 0.2155, + "step": 24771 + }, + { + "epoch": 0.48, + "learning_rate": 1.0399596132189042e-07, + "loss": 0.3566, + "step": 24772 + }, + { + "epoch": 0.48, + "learning_rate": 1.0399207797755428e-07, + "loss": 0.0005, + "step": 24773 + }, + { + "epoch": 0.48, + "learning_rate": 1.0398819463321813e-07, + "loss": 0.0007, + "step": 24774 + }, + { + "epoch": 0.48, + "learning_rate": 1.0398431128888199e-07, + "loss": 0.0005, + "step": 24775 + }, + { + "epoch": 0.48, + "learning_rate": 1.0398042794454585e-07, + "loss": 0.0006, + "step": 24776 + }, + { + "epoch": 0.48, + "learning_rate": 1.0397654460020971e-07, + "loss": 0.0004, + "step": 24777 + }, + { + "epoch": 0.48, + "learning_rate": 1.0397266125587357e-07, + "loss": 0.0007, + "step": 24778 + }, + { + "epoch": 0.48, + "learning_rate": 1.0396877791153743e-07, + "loss": 0.2086, + "step": 24779 + }, + { + "epoch": 0.48, + "learning_rate": 1.0396489456720128e-07, + "loss": 0.0007, + "step": 24780 + }, + { + "epoch": 0.48, + "learning_rate": 1.0396101122286514e-07, + "loss": 0.0005, + "step": 24781 + }, + { + "epoch": 0.48, + "learning_rate": 1.03957127878529e-07, + "loss": 0.0017, + "step": 24782 + }, + { + "epoch": 0.48, + "learning_rate": 1.0395324453419286e-07, + "loss": 0.0004, + "step": 24783 + }, + { + "epoch": 0.48, + "learning_rate": 1.039493611898567e-07, + "loss": 0.0007, + "step": 24784 + }, + { + "epoch": 0.48, + "learning_rate": 1.0394547784552056e-07, + "loss": 0.0413, + "step": 24785 + }, + { + "epoch": 0.48, + "learning_rate": 1.0394159450118442e-07, + "loss": 0.0671, + "step": 24786 + }, + { + "epoch": 0.48, + "learning_rate": 1.0393771115684827e-07, + "loss": 1.3131, + "step": 24787 + }, + { + "epoch": 0.48, + "learning_rate": 1.0393382781251212e-07, + "loss": 0.0011, + "step": 24788 + }, + { + "epoch": 0.48, + "learning_rate": 1.0392994446817598e-07, + "loss": 0.013, + "step": 24789 + }, + { + "epoch": 0.48, + "learning_rate": 1.0392606112383984e-07, + "loss": 0.0005, + "step": 24790 + }, + { + "epoch": 0.48, + "learning_rate": 1.039221777795037e-07, + "loss": 0.3989, + "step": 24791 + }, + { + "epoch": 0.48, + "learning_rate": 1.0391829443516756e-07, + "loss": 0.0005, + "step": 24792 + }, + { + "epoch": 0.48, + "learning_rate": 1.0391441109083141e-07, + "loss": 0.0008, + "step": 24793 + }, + { + "epoch": 0.48, + "learning_rate": 1.0391052774649527e-07, + "loss": 0.0005, + "step": 24794 + }, + { + "epoch": 0.48, + "learning_rate": 1.0390664440215913e-07, + "loss": 0.0021, + "step": 24795 + }, + { + "epoch": 0.48, + "learning_rate": 1.0390276105782299e-07, + "loss": 0.0005, + "step": 24796 + }, + { + "epoch": 0.48, + "learning_rate": 1.0389887771348685e-07, + "loss": 0.0006, + "step": 24797 + }, + { + "epoch": 0.48, + "learning_rate": 1.038949943691507e-07, + "loss": 0.0007, + "step": 24798 + }, + { + "epoch": 0.48, + "learning_rate": 1.0389111102481456e-07, + "loss": 0.0006, + "step": 24799 + }, + { + "epoch": 0.48, + "learning_rate": 1.0388722768047842e-07, + "loss": 0.0507, + "step": 24800 + }, + { + "epoch": 0.48, + "learning_rate": 1.0388334433614228e-07, + "loss": 0.0006, + "step": 24801 + }, + { + "epoch": 0.48, + "learning_rate": 1.0387946099180614e-07, + "loss": 0.0393, + "step": 24802 + }, + { + "epoch": 0.48, + "learning_rate": 1.0387557764747e-07, + "loss": 0.0005, + "step": 24803 + }, + { + "epoch": 0.48, + "learning_rate": 1.0387169430313386e-07, + "loss": 0.0005, + "step": 24804 + }, + { + "epoch": 0.48, + "learning_rate": 1.0386781095879771e-07, + "loss": 0.0007, + "step": 24805 + }, + { + "epoch": 0.48, + "learning_rate": 1.0386392761446157e-07, + "loss": 0.0011, + "step": 24806 + }, + { + "epoch": 0.48, + "learning_rate": 1.0386004427012543e-07, + "loss": 0.1221, + "step": 24807 + }, + { + "epoch": 0.48, + "learning_rate": 1.0385616092578929e-07, + "loss": 0.4176, + "step": 24808 + }, + { + "epoch": 0.48, + "learning_rate": 1.0385227758145315e-07, + "loss": 0.0007, + "step": 24809 + }, + { + "epoch": 0.48, + "learning_rate": 1.03848394237117e-07, + "loss": 0.0008, + "step": 24810 + }, + { + "epoch": 0.48, + "learning_rate": 1.0384451089278086e-07, + "loss": 0.0035, + "step": 24811 + }, + { + "epoch": 0.48, + "learning_rate": 1.0384062754844472e-07, + "loss": 0.0007, + "step": 24812 + }, + { + "epoch": 0.48, + "learning_rate": 1.0383674420410857e-07, + "loss": 0.0007, + "step": 24813 + }, + { + "epoch": 0.48, + "learning_rate": 1.0383286085977242e-07, + "loss": 0.0009, + "step": 24814 + }, + { + "epoch": 0.48, + "learning_rate": 1.0382897751543628e-07, + "loss": 0.0006, + "step": 24815 + }, + { + "epoch": 0.48, + "learning_rate": 1.0382509417110014e-07, + "loss": 0.0006, + "step": 24816 + }, + { + "epoch": 0.48, + "learning_rate": 1.03821210826764e-07, + "loss": 0.0006, + "step": 24817 + }, + { + "epoch": 0.48, + "learning_rate": 1.0381732748242786e-07, + "loss": 0.0005, + "step": 24818 + }, + { + "epoch": 0.48, + "learning_rate": 1.0381344413809172e-07, + "loss": 0.0006, + "step": 24819 + }, + { + "epoch": 0.48, + "learning_rate": 1.0380956079375557e-07, + "loss": 0.0006, + "step": 24820 + }, + { + "epoch": 0.48, + "learning_rate": 1.0380567744941943e-07, + "loss": 0.2069, + "step": 24821 + }, + { + "epoch": 0.48, + "learning_rate": 1.0380179410508329e-07, + "loss": 0.0006, + "step": 24822 + }, + { + "epoch": 0.48, + "learning_rate": 1.0379791076074715e-07, + "loss": 0.0005, + "step": 24823 + }, + { + "epoch": 0.48, + "learning_rate": 1.0379402741641101e-07, + "loss": 0.0568, + "step": 24824 + }, + { + "epoch": 0.48, + "learning_rate": 1.0379014407207487e-07, + "loss": 0.0006, + "step": 24825 + }, + { + "epoch": 0.48, + "learning_rate": 1.0378626072773872e-07, + "loss": 0.0015, + "step": 24826 + }, + { + "epoch": 0.48, + "learning_rate": 1.0378237738340258e-07, + "loss": 0.0006, + "step": 24827 + }, + { + "epoch": 0.48, + "learning_rate": 1.0377849403906644e-07, + "loss": 0.0006, + "step": 24828 + }, + { + "epoch": 0.48, + "learning_rate": 1.037746106947303e-07, + "loss": 1.2838, + "step": 24829 + }, + { + "epoch": 0.48, + "learning_rate": 1.0377072735039416e-07, + "loss": 0.0005, + "step": 24830 + }, + { + "epoch": 0.48, + "learning_rate": 1.0376684400605801e-07, + "loss": 0.0048, + "step": 24831 + }, + { + "epoch": 0.48, + "learning_rate": 1.0376296066172187e-07, + "loss": 0.0005, + "step": 24832 + }, + { + "epoch": 0.48, + "learning_rate": 1.0375907731738573e-07, + "loss": 0.0005, + "step": 24833 + }, + { + "epoch": 0.48, + "learning_rate": 1.0375519397304959e-07, + "loss": 0.0007, + "step": 24834 + }, + { + "epoch": 0.48, + "learning_rate": 1.0375131062871345e-07, + "loss": 0.0046, + "step": 24835 + }, + { + "epoch": 0.48, + "learning_rate": 1.037474272843773e-07, + "loss": 0.0094, + "step": 24836 + }, + { + "epoch": 0.48, + "learning_rate": 1.0374354394004116e-07, + "loss": 0.0009, + "step": 24837 + }, + { + "epoch": 0.48, + "learning_rate": 1.0373966059570502e-07, + "loss": 0.0005, + "step": 24838 + }, + { + "epoch": 0.48, + "learning_rate": 1.0373577725136888e-07, + "loss": 0.0007, + "step": 24839 + }, + { + "epoch": 0.48, + "learning_rate": 1.0373189390703274e-07, + "loss": 0.0132, + "step": 24840 + }, + { + "epoch": 0.48, + "learning_rate": 1.037280105626966e-07, + "loss": 0.0006, + "step": 24841 + }, + { + "epoch": 0.48, + "learning_rate": 1.0372412721836046e-07, + "loss": 0.0006, + "step": 24842 + }, + { + "epoch": 0.48, + "learning_rate": 1.0372024387402431e-07, + "loss": 0.2198, + "step": 24843 + }, + { + "epoch": 0.48, + "learning_rate": 1.0371636052968817e-07, + "loss": 0.0006, + "step": 24844 + }, + { + "epoch": 0.48, + "learning_rate": 1.03712477185352e-07, + "loss": 0.2591, + "step": 24845 + }, + { + "epoch": 0.48, + "learning_rate": 1.0370859384101586e-07, + "loss": 0.0009, + "step": 24846 + }, + { + "epoch": 0.48, + "learning_rate": 1.0370471049667972e-07, + "loss": 0.0006, + "step": 24847 + }, + { + "epoch": 0.48, + "learning_rate": 1.0370082715234358e-07, + "loss": 0.0005, + "step": 24848 + }, + { + "epoch": 0.48, + "learning_rate": 1.0369694380800744e-07, + "loss": 0.0034, + "step": 24849 + }, + { + "epoch": 0.48, + "learning_rate": 1.036930604636713e-07, + "loss": 0.0024, + "step": 24850 + }, + { + "epoch": 0.48, + "learning_rate": 1.0368917711933515e-07, + "loss": 0.0008, + "step": 24851 + }, + { + "epoch": 0.48, + "learning_rate": 1.0368529377499901e-07, + "loss": 0.0006, + "step": 24852 + }, + { + "epoch": 0.48, + "learning_rate": 1.0368141043066287e-07, + "loss": 0.4526, + "step": 24853 + }, + { + "epoch": 0.48, + "learning_rate": 1.0367752708632673e-07, + "loss": 0.0007, + "step": 24854 + }, + { + "epoch": 0.48, + "learning_rate": 1.0367364374199059e-07, + "loss": 0.0006, + "step": 24855 + }, + { + "epoch": 0.48, + "learning_rate": 1.0366976039765444e-07, + "loss": 0.2864, + "step": 24856 + }, + { + "epoch": 0.48, + "learning_rate": 1.036658770533183e-07, + "loss": 0.0026, + "step": 24857 + }, + { + "epoch": 0.48, + "learning_rate": 1.0366199370898216e-07, + "loss": 0.0007, + "step": 24858 + }, + { + "epoch": 0.48, + "learning_rate": 1.0365811036464602e-07, + "loss": 0.0006, + "step": 24859 + }, + { + "epoch": 0.48, + "learning_rate": 1.0365422702030988e-07, + "loss": 0.0008, + "step": 24860 + }, + { + "epoch": 0.48, + "learning_rate": 1.0365034367597374e-07, + "loss": 0.0007, + "step": 24861 + }, + { + "epoch": 0.48, + "learning_rate": 1.036464603316376e-07, + "loss": 0.0012, + "step": 24862 + }, + { + "epoch": 0.48, + "learning_rate": 1.0364257698730145e-07, + "loss": 0.0005, + "step": 24863 + }, + { + "epoch": 0.48, + "learning_rate": 1.0363869364296531e-07, + "loss": 0.0007, + "step": 24864 + }, + { + "epoch": 0.48, + "learning_rate": 1.0363481029862917e-07, + "loss": 0.0007, + "step": 24865 + }, + { + "epoch": 0.48, + "learning_rate": 1.0363092695429303e-07, + "loss": 0.0007, + "step": 24866 + }, + { + "epoch": 0.48, + "learning_rate": 1.0362704360995688e-07, + "loss": 0.2866, + "step": 24867 + }, + { + "epoch": 0.48, + "learning_rate": 1.0362316026562074e-07, + "loss": 0.0005, + "step": 24868 + }, + { + "epoch": 0.48, + "learning_rate": 1.036192769212846e-07, + "loss": 0.0006, + "step": 24869 + }, + { + "epoch": 0.48, + "learning_rate": 1.0361539357694846e-07, + "loss": 0.0007, + "step": 24870 + }, + { + "epoch": 0.48, + "learning_rate": 1.0361151023261232e-07, + "loss": 0.0111, + "step": 24871 + }, + { + "epoch": 0.48, + "learning_rate": 1.0360762688827618e-07, + "loss": 0.0087, + "step": 24872 + }, + { + "epoch": 0.48, + "learning_rate": 1.0360374354394003e-07, + "loss": 0.0979, + "step": 24873 + }, + { + "epoch": 0.48, + "learning_rate": 1.0359986019960389e-07, + "loss": 0.0005, + "step": 24874 + }, + { + "epoch": 0.48, + "learning_rate": 1.0359597685526775e-07, + "loss": 0.2121, + "step": 24875 + }, + { + "epoch": 0.48, + "learning_rate": 1.0359209351093161e-07, + "loss": 1.2703, + "step": 24876 + }, + { + "epoch": 0.48, + "learning_rate": 1.0358821016659547e-07, + "loss": 0.0005, + "step": 24877 + }, + { + "epoch": 0.48, + "learning_rate": 1.0358432682225933e-07, + "loss": 0.0005, + "step": 24878 + }, + { + "epoch": 0.48, + "learning_rate": 1.0358044347792318e-07, + "loss": 0.0005, + "step": 24879 + }, + { + "epoch": 0.48, + "learning_rate": 1.0357656013358704e-07, + "loss": 0.0118, + "step": 24880 + }, + { + "epoch": 0.48, + "learning_rate": 1.035726767892509e-07, + "loss": 0.0008, + "step": 24881 + }, + { + "epoch": 0.48, + "learning_rate": 1.0356879344491476e-07, + "loss": 0.0005, + "step": 24882 + }, + { + "epoch": 0.48, + "learning_rate": 1.0356491010057862e-07, + "loss": 0.0146, + "step": 24883 + }, + { + "epoch": 0.48, + "learning_rate": 1.0356102675624248e-07, + "loss": 0.0006, + "step": 24884 + }, + { + "epoch": 0.48, + "learning_rate": 1.0355714341190633e-07, + "loss": 0.0006, + "step": 24885 + }, + { + "epoch": 0.48, + "learning_rate": 1.0355326006757019e-07, + "loss": 0.001, + "step": 24886 + }, + { + "epoch": 0.48, + "learning_rate": 1.0354937672323405e-07, + "loss": 0.0011, + "step": 24887 + }, + { + "epoch": 0.48, + "learning_rate": 1.0354549337889791e-07, + "loss": 0.0022, + "step": 24888 + }, + { + "epoch": 0.48, + "learning_rate": 1.0354161003456177e-07, + "loss": 0.0051, + "step": 24889 + }, + { + "epoch": 0.48, + "learning_rate": 1.0353772669022562e-07, + "loss": 0.0007, + "step": 24890 + }, + { + "epoch": 0.48, + "learning_rate": 1.0353384334588948e-07, + "loss": 0.0007, + "step": 24891 + }, + { + "epoch": 0.48, + "learning_rate": 1.0352996000155334e-07, + "loss": 0.0011, + "step": 24892 + }, + { + "epoch": 0.48, + "learning_rate": 1.035260766572172e-07, + "loss": 0.0006, + "step": 24893 + }, + { + "epoch": 0.48, + "learning_rate": 1.0352219331288106e-07, + "loss": 0.0032, + "step": 24894 + }, + { + "epoch": 0.48, + "learning_rate": 1.0351830996854492e-07, + "loss": 0.0005, + "step": 24895 + }, + { + "epoch": 0.48, + "learning_rate": 1.0351442662420877e-07, + "loss": 0.0004, + "step": 24896 + }, + { + "epoch": 0.48, + "learning_rate": 1.0351054327987263e-07, + "loss": 0.0116, + "step": 24897 + }, + { + "epoch": 0.48, + "learning_rate": 1.0350665993553649e-07, + "loss": 0.0009, + "step": 24898 + }, + { + "epoch": 0.48, + "learning_rate": 1.0350277659120035e-07, + "loss": 0.0006, + "step": 24899 + }, + { + "epoch": 0.48, + "learning_rate": 1.0349889324686421e-07, + "loss": 0.0006, + "step": 24900 + }, + { + "epoch": 0.48, + "learning_rate": 1.0349500990252807e-07, + "loss": 0.0005, + "step": 24901 + }, + { + "epoch": 0.48, + "learning_rate": 1.0349112655819192e-07, + "loss": 0.0006, + "step": 24902 + }, + { + "epoch": 0.48, + "learning_rate": 1.0348724321385576e-07, + "loss": 0.0007, + "step": 24903 + }, + { + "epoch": 0.48, + "learning_rate": 1.0348335986951961e-07, + "loss": 0.0007, + "step": 24904 + }, + { + "epoch": 0.48, + "learning_rate": 1.0347947652518347e-07, + "loss": 0.0005, + "step": 24905 + }, + { + "epoch": 0.48, + "learning_rate": 1.0347559318084733e-07, + "loss": 0.0005, + "step": 24906 + }, + { + "epoch": 0.48, + "learning_rate": 1.0347170983651119e-07, + "loss": 1.012, + "step": 24907 + }, + { + "epoch": 0.48, + "learning_rate": 1.0346782649217505e-07, + "loss": 0.0007, + "step": 24908 + }, + { + "epoch": 0.48, + "learning_rate": 1.034639431478389e-07, + "loss": 0.0005, + "step": 24909 + }, + { + "epoch": 0.48, + "learning_rate": 1.0346005980350276e-07, + "loss": 0.0007, + "step": 24910 + }, + { + "epoch": 0.48, + "learning_rate": 1.0345617645916662e-07, + "loss": 0.0006, + "step": 24911 + }, + { + "epoch": 0.48, + "learning_rate": 1.0345229311483048e-07, + "loss": 0.0037, + "step": 24912 + }, + { + "epoch": 0.48, + "learning_rate": 1.0344840977049434e-07, + "loss": 0.0006, + "step": 24913 + }, + { + "epoch": 0.48, + "learning_rate": 1.034445264261582e-07, + "loss": 0.0007, + "step": 24914 + }, + { + "epoch": 0.48, + "learning_rate": 1.0344064308182205e-07, + "loss": 0.0004, + "step": 24915 + }, + { + "epoch": 0.48, + "learning_rate": 1.0343675973748591e-07, + "loss": 0.0007, + "step": 24916 + }, + { + "epoch": 0.48, + "learning_rate": 1.0343287639314977e-07, + "loss": 0.0008, + "step": 24917 + }, + { + "epoch": 0.48, + "learning_rate": 1.0342899304881363e-07, + "loss": 0.0006, + "step": 24918 + }, + { + "epoch": 0.48, + "learning_rate": 1.0342510970447749e-07, + "loss": 0.0305, + "step": 24919 + }, + { + "epoch": 0.48, + "learning_rate": 1.0342122636014135e-07, + "loss": 0.0007, + "step": 24920 + }, + { + "epoch": 0.48, + "learning_rate": 1.034173430158052e-07, + "loss": 0.0006, + "step": 24921 + }, + { + "epoch": 0.48, + "learning_rate": 1.0341345967146906e-07, + "loss": 0.0016, + "step": 24922 + }, + { + "epoch": 0.48, + "learning_rate": 1.0340957632713292e-07, + "loss": 0.0007, + "step": 24923 + }, + { + "epoch": 0.48, + "learning_rate": 1.0340569298279678e-07, + "loss": 0.0099, + "step": 24924 + }, + { + "epoch": 0.48, + "learning_rate": 1.0340180963846064e-07, + "loss": 0.0008, + "step": 24925 + }, + { + "epoch": 0.48, + "learning_rate": 1.033979262941245e-07, + "loss": 0.0006, + "step": 24926 + }, + { + "epoch": 0.48, + "learning_rate": 1.0339404294978835e-07, + "loss": 0.0006, + "step": 24927 + }, + { + "epoch": 0.48, + "learning_rate": 1.0339015960545221e-07, + "loss": 0.0006, + "step": 24928 + }, + { + "epoch": 0.48, + "learning_rate": 1.0338627626111607e-07, + "loss": 0.0007, + "step": 24929 + }, + { + "epoch": 0.48, + "learning_rate": 1.0338239291677993e-07, + "loss": 0.0007, + "step": 24930 + }, + { + "epoch": 0.48, + "learning_rate": 1.0337850957244379e-07, + "loss": 0.0005, + "step": 24931 + }, + { + "epoch": 0.48, + "learning_rate": 1.0337462622810764e-07, + "loss": 0.001, + "step": 24932 + }, + { + "epoch": 0.48, + "learning_rate": 1.033707428837715e-07, + "loss": 0.0006, + "step": 24933 + }, + { + "epoch": 0.48, + "learning_rate": 1.0336685953943536e-07, + "loss": 0.9203, + "step": 24934 + }, + { + "epoch": 0.48, + "learning_rate": 1.0336297619509922e-07, + "loss": 0.0006, + "step": 24935 + }, + { + "epoch": 0.48, + "learning_rate": 1.0335909285076308e-07, + "loss": 0.0007, + "step": 24936 + }, + { + "epoch": 0.48, + "learning_rate": 1.0335520950642694e-07, + "loss": 0.7171, + "step": 24937 + }, + { + "epoch": 0.48, + "learning_rate": 1.033513261620908e-07, + "loss": 0.001, + "step": 24938 + }, + { + "epoch": 0.48, + "learning_rate": 1.0334744281775465e-07, + "loss": 0.0004, + "step": 24939 + }, + { + "epoch": 0.48, + "learning_rate": 1.0334355947341851e-07, + "loss": 0.0005, + "step": 24940 + }, + { + "epoch": 0.48, + "learning_rate": 1.0333967612908237e-07, + "loss": 0.0824, + "step": 24941 + }, + { + "epoch": 0.48, + "learning_rate": 1.0333579278474623e-07, + "loss": 0.0006, + "step": 24942 + }, + { + "epoch": 0.48, + "learning_rate": 1.0333190944041009e-07, + "loss": 0.2503, + "step": 24943 + }, + { + "epoch": 0.48, + "learning_rate": 1.0332802609607394e-07, + "loss": 0.0007, + "step": 24944 + }, + { + "epoch": 0.48, + "learning_rate": 1.033241427517378e-07, + "loss": 0.0006, + "step": 24945 + }, + { + "epoch": 0.48, + "learning_rate": 1.0332025940740166e-07, + "loss": 0.0006, + "step": 24946 + }, + { + "epoch": 0.48, + "learning_rate": 1.0331637606306552e-07, + "loss": 0.0006, + "step": 24947 + }, + { + "epoch": 0.48, + "learning_rate": 1.0331249271872938e-07, + "loss": 0.0009, + "step": 24948 + }, + { + "epoch": 0.48, + "learning_rate": 1.0330860937439323e-07, + "loss": 0.0006, + "step": 24949 + }, + { + "epoch": 0.48, + "learning_rate": 1.0330472603005709e-07, + "loss": 0.0007, + "step": 24950 + }, + { + "epoch": 0.48, + "learning_rate": 1.0330084268572095e-07, + "loss": 0.0011, + "step": 24951 + }, + { + "epoch": 0.48, + "learning_rate": 1.0329695934138481e-07, + "loss": 0.0006, + "step": 24952 + }, + { + "epoch": 0.48, + "learning_rate": 1.0329307599704867e-07, + "loss": 0.0006, + "step": 24953 + }, + { + "epoch": 0.48, + "learning_rate": 1.0328919265271253e-07, + "loss": 0.0005, + "step": 24954 + }, + { + "epoch": 0.48, + "learning_rate": 1.0328530930837638e-07, + "loss": 0.0005, + "step": 24955 + }, + { + "epoch": 0.48, + "learning_rate": 1.0328142596404024e-07, + "loss": 0.0005, + "step": 24956 + }, + { + "epoch": 0.48, + "learning_rate": 1.032775426197041e-07, + "loss": 0.0004, + "step": 24957 + }, + { + "epoch": 0.48, + "learning_rate": 1.0327365927536796e-07, + "loss": 0.0014, + "step": 24958 + }, + { + "epoch": 0.48, + "learning_rate": 1.0326977593103182e-07, + "loss": 0.0347, + "step": 24959 + }, + { + "epoch": 0.48, + "learning_rate": 1.0326589258669568e-07, + "loss": 0.0007, + "step": 24960 + }, + { + "epoch": 0.48, + "learning_rate": 1.0326200924235951e-07, + "loss": 0.0005, + "step": 24961 + }, + { + "epoch": 0.48, + "learning_rate": 1.0325812589802337e-07, + "loss": 0.0007, + "step": 24962 + }, + { + "epoch": 0.48, + "learning_rate": 1.0325424255368722e-07, + "loss": 0.0009, + "step": 24963 + }, + { + "epoch": 0.48, + "learning_rate": 1.0325035920935108e-07, + "loss": 0.0007, + "step": 24964 + }, + { + "epoch": 0.48, + "learning_rate": 1.0324647586501494e-07, + "loss": 0.0019, + "step": 24965 + }, + { + "epoch": 0.48, + "learning_rate": 1.032425925206788e-07, + "loss": 0.0006, + "step": 24966 + }, + { + "epoch": 0.48, + "learning_rate": 1.0323870917634266e-07, + "loss": 0.0009, + "step": 24967 + }, + { + "epoch": 0.48, + "learning_rate": 1.0323482583200651e-07, + "loss": 0.0131, + "step": 24968 + }, + { + "epoch": 0.48, + "learning_rate": 1.0323094248767037e-07, + "loss": 0.0004, + "step": 24969 + }, + { + "epoch": 0.48, + "learning_rate": 1.0322705914333423e-07, + "loss": 0.0009, + "step": 24970 + }, + { + "epoch": 0.48, + "learning_rate": 1.0322317579899809e-07, + "loss": 0.0006, + "step": 24971 + }, + { + "epoch": 0.48, + "learning_rate": 1.0321929245466195e-07, + "loss": 0.001, + "step": 24972 + }, + { + "epoch": 0.48, + "learning_rate": 1.032154091103258e-07, + "loss": 0.0005, + "step": 24973 + }, + { + "epoch": 0.48, + "learning_rate": 1.0321152576598966e-07, + "loss": 0.0009, + "step": 24974 + }, + { + "epoch": 0.48, + "learning_rate": 1.0320764242165352e-07, + "loss": 0.0009, + "step": 24975 + }, + { + "epoch": 0.48, + "learning_rate": 1.0320375907731738e-07, + "loss": 0.0005, + "step": 24976 + }, + { + "epoch": 0.48, + "learning_rate": 1.0319987573298124e-07, + "loss": 0.0022, + "step": 24977 + }, + { + "epoch": 0.48, + "learning_rate": 1.031959923886451e-07, + "loss": 0.0005, + "step": 24978 + }, + { + "epoch": 0.48, + "learning_rate": 1.0319210904430896e-07, + "loss": 0.0007, + "step": 24979 + }, + { + "epoch": 0.48, + "learning_rate": 1.0318822569997281e-07, + "loss": 0.0006, + "step": 24980 + }, + { + "epoch": 0.48, + "learning_rate": 1.0318434235563667e-07, + "loss": 0.9703, + "step": 24981 + }, + { + "epoch": 0.48, + "learning_rate": 1.0318045901130053e-07, + "loss": 0.0006, + "step": 24982 + }, + { + "epoch": 0.48, + "learning_rate": 1.0317657566696439e-07, + "loss": 0.0004, + "step": 24983 + }, + { + "epoch": 0.48, + "learning_rate": 1.0317269232262825e-07, + "loss": 0.0004, + "step": 24984 + }, + { + "epoch": 0.48, + "learning_rate": 1.031688089782921e-07, + "loss": 0.5284, + "step": 24985 + }, + { + "epoch": 0.48, + "learning_rate": 1.0316492563395596e-07, + "loss": 0.0005, + "step": 24986 + }, + { + "epoch": 0.48, + "learning_rate": 1.0316104228961982e-07, + "loss": 0.0016, + "step": 24987 + }, + { + "epoch": 0.48, + "learning_rate": 1.0315715894528368e-07, + "loss": 0.0007, + "step": 24988 + }, + { + "epoch": 0.48, + "learning_rate": 1.0315327560094754e-07, + "loss": 1.0403, + "step": 24989 + }, + { + "epoch": 0.48, + "learning_rate": 1.0314939225661138e-07, + "loss": 0.0005, + "step": 24990 + }, + { + "epoch": 0.48, + "learning_rate": 1.0314550891227524e-07, + "loss": 0.0005, + "step": 24991 + }, + { + "epoch": 0.48, + "learning_rate": 1.031416255679391e-07, + "loss": 0.0007, + "step": 24992 + }, + { + "epoch": 0.48, + "learning_rate": 1.0313774222360296e-07, + "loss": 0.0029, + "step": 24993 + }, + { + "epoch": 0.48, + "learning_rate": 1.0313385887926682e-07, + "loss": 0.2377, + "step": 24994 + }, + { + "epoch": 0.48, + "learning_rate": 1.0312997553493067e-07, + "loss": 0.0011, + "step": 24995 + }, + { + "epoch": 0.48, + "learning_rate": 1.0312609219059453e-07, + "loss": 0.0008, + "step": 24996 + }, + { + "epoch": 0.48, + "learning_rate": 1.0312220884625839e-07, + "loss": 0.0007, + "step": 24997 + }, + { + "epoch": 0.48, + "learning_rate": 1.0311832550192225e-07, + "loss": 0.0008, + "step": 24998 + }, + { + "epoch": 0.48, + "learning_rate": 1.0311444215758611e-07, + "loss": 0.0006, + "step": 24999 + }, + { + "epoch": 0.48, + "learning_rate": 1.0311055881324997e-07, + "loss": 0.0008, + "step": 25000 + }, + { + "epoch": 0.48, + "learning_rate": 1.0310667546891382e-07, + "loss": 0.0011, + "step": 25001 + }, + { + "epoch": 0.48, + "learning_rate": 1.0310279212457768e-07, + "loss": 0.0004, + "step": 25002 + }, + { + "epoch": 0.49, + "learning_rate": 1.0309890878024154e-07, + "loss": 0.0005, + "step": 25003 + }, + { + "epoch": 0.49, + "learning_rate": 1.030950254359054e-07, + "loss": 0.3275, + "step": 25004 + }, + { + "epoch": 0.49, + "learning_rate": 1.0309114209156926e-07, + "loss": 0.0006, + "step": 25005 + }, + { + "epoch": 0.49, + "learning_rate": 1.0308725874723311e-07, + "loss": 0.0005, + "step": 25006 + }, + { + "epoch": 0.49, + "learning_rate": 1.0308337540289697e-07, + "loss": 0.0005, + "step": 25007 + }, + { + "epoch": 0.49, + "learning_rate": 1.0307949205856083e-07, + "loss": 0.5314, + "step": 25008 + }, + { + "epoch": 0.49, + "learning_rate": 1.0307560871422469e-07, + "loss": 0.0005, + "step": 25009 + }, + { + "epoch": 0.49, + "learning_rate": 1.0307172536988855e-07, + "loss": 0.0005, + "step": 25010 + }, + { + "epoch": 0.49, + "learning_rate": 1.030678420255524e-07, + "loss": 0.1749, + "step": 25011 + }, + { + "epoch": 0.49, + "learning_rate": 1.0306395868121626e-07, + "loss": 0.0005, + "step": 25012 + }, + { + "epoch": 0.49, + "learning_rate": 1.0306007533688012e-07, + "loss": 0.9235, + "step": 25013 + }, + { + "epoch": 0.49, + "learning_rate": 1.0305619199254398e-07, + "loss": 0.0007, + "step": 25014 + }, + { + "epoch": 0.49, + "learning_rate": 1.0305230864820784e-07, + "loss": 0.0006, + "step": 25015 + }, + { + "epoch": 0.49, + "learning_rate": 1.030484253038717e-07, + "loss": 0.0008, + "step": 25016 + }, + { + "epoch": 0.49, + "learning_rate": 1.0304454195953556e-07, + "loss": 0.0006, + "step": 25017 + }, + { + "epoch": 0.49, + "learning_rate": 1.0304065861519941e-07, + "loss": 0.0005, + "step": 25018 + }, + { + "epoch": 0.49, + "learning_rate": 1.0303677527086325e-07, + "loss": 0.0009, + "step": 25019 + }, + { + "epoch": 0.49, + "learning_rate": 1.030328919265271e-07, + "loss": 0.0007, + "step": 25020 + }, + { + "epoch": 0.49, + "learning_rate": 1.0302900858219096e-07, + "loss": 1.3342, + "step": 25021 + }, + { + "epoch": 0.49, + "learning_rate": 1.0302512523785482e-07, + "loss": 0.0006, + "step": 25022 + }, + { + "epoch": 0.49, + "learning_rate": 1.0302124189351868e-07, + "loss": 0.0006, + "step": 25023 + }, + { + "epoch": 0.49, + "learning_rate": 1.0301735854918254e-07, + "loss": 0.0007, + "step": 25024 + }, + { + "epoch": 0.49, + "learning_rate": 1.030134752048464e-07, + "loss": 0.0025, + "step": 25025 + }, + { + "epoch": 0.49, + "learning_rate": 1.0300959186051025e-07, + "loss": 0.0006, + "step": 25026 + }, + { + "epoch": 0.49, + "learning_rate": 1.0300570851617411e-07, + "loss": 0.0035, + "step": 25027 + }, + { + "epoch": 0.49, + "learning_rate": 1.0300182517183797e-07, + "loss": 0.0007, + "step": 25028 + }, + { + "epoch": 0.49, + "learning_rate": 1.0299794182750183e-07, + "loss": 0.0006, + "step": 25029 + }, + { + "epoch": 0.49, + "learning_rate": 1.0299405848316569e-07, + "loss": 0.0455, + "step": 25030 + }, + { + "epoch": 0.49, + "learning_rate": 1.0299017513882954e-07, + "loss": 0.0111, + "step": 25031 + }, + { + "epoch": 0.49, + "learning_rate": 1.029862917944934e-07, + "loss": 0.0005, + "step": 25032 + }, + { + "epoch": 0.49, + "learning_rate": 1.0298240845015726e-07, + "loss": 0.0007, + "step": 25033 + }, + { + "epoch": 0.49, + "learning_rate": 1.0297852510582112e-07, + "loss": 0.0007, + "step": 25034 + }, + { + "epoch": 0.49, + "learning_rate": 1.0297464176148498e-07, + "loss": 0.0007, + "step": 25035 + }, + { + "epoch": 0.49, + "learning_rate": 1.0297075841714884e-07, + "loss": 0.0008, + "step": 25036 + }, + { + "epoch": 0.49, + "learning_rate": 1.029668750728127e-07, + "loss": 0.0005, + "step": 25037 + }, + { + "epoch": 0.49, + "learning_rate": 1.0296299172847655e-07, + "loss": 0.0011, + "step": 25038 + }, + { + "epoch": 0.49, + "learning_rate": 1.0295910838414041e-07, + "loss": 0.0008, + "step": 25039 + }, + { + "epoch": 0.49, + "learning_rate": 1.0295522503980427e-07, + "loss": 0.0007, + "step": 25040 + }, + { + "epoch": 0.49, + "learning_rate": 1.0295134169546813e-07, + "loss": 0.024, + "step": 25041 + }, + { + "epoch": 0.49, + "learning_rate": 1.0294745835113199e-07, + "loss": 0.0007, + "step": 25042 + }, + { + "epoch": 0.49, + "learning_rate": 1.0294357500679584e-07, + "loss": 0.0005, + "step": 25043 + }, + { + "epoch": 0.49, + "learning_rate": 1.029396916624597e-07, + "loss": 0.0008, + "step": 25044 + }, + { + "epoch": 0.49, + "learning_rate": 1.0293580831812356e-07, + "loss": 0.0006, + "step": 25045 + }, + { + "epoch": 0.49, + "learning_rate": 1.0293192497378742e-07, + "loss": 0.0005, + "step": 25046 + }, + { + "epoch": 0.49, + "learning_rate": 1.0292804162945128e-07, + "loss": 0.0005, + "step": 25047 + }, + { + "epoch": 0.49, + "learning_rate": 1.0292415828511513e-07, + "loss": 0.0006, + "step": 25048 + }, + { + "epoch": 0.49, + "learning_rate": 1.0292027494077899e-07, + "loss": 0.0058, + "step": 25049 + }, + { + "epoch": 0.49, + "learning_rate": 1.0291639159644285e-07, + "loss": 0.0006, + "step": 25050 + }, + { + "epoch": 0.49, + "learning_rate": 1.0291250825210671e-07, + "loss": 0.0007, + "step": 25051 + }, + { + "epoch": 0.49, + "learning_rate": 1.0290862490777057e-07, + "loss": 0.0009, + "step": 25052 + }, + { + "epoch": 0.49, + "learning_rate": 1.0290474156343443e-07, + "loss": 0.2359, + "step": 25053 + }, + { + "epoch": 0.49, + "learning_rate": 1.0290085821909828e-07, + "loss": 0.0007, + "step": 25054 + }, + { + "epoch": 0.49, + "learning_rate": 1.0289697487476214e-07, + "loss": 0.0005, + "step": 25055 + }, + { + "epoch": 0.49, + "learning_rate": 1.02893091530426e-07, + "loss": 0.0006, + "step": 25056 + }, + { + "epoch": 0.49, + "learning_rate": 1.0288920818608986e-07, + "loss": 0.0008, + "step": 25057 + }, + { + "epoch": 0.49, + "learning_rate": 1.0288532484175372e-07, + "loss": 0.4509, + "step": 25058 + }, + { + "epoch": 0.49, + "learning_rate": 1.0288144149741758e-07, + "loss": 0.0007, + "step": 25059 + }, + { + "epoch": 0.49, + "learning_rate": 1.0287755815308143e-07, + "loss": 0.0011, + "step": 25060 + }, + { + "epoch": 0.49, + "learning_rate": 1.0287367480874529e-07, + "loss": 0.0006, + "step": 25061 + }, + { + "epoch": 0.49, + "learning_rate": 1.0286979146440915e-07, + "loss": 0.0006, + "step": 25062 + }, + { + "epoch": 0.49, + "learning_rate": 1.0286590812007301e-07, + "loss": 0.0005, + "step": 25063 + }, + { + "epoch": 0.49, + "learning_rate": 1.0286202477573687e-07, + "loss": 0.0008, + "step": 25064 + }, + { + "epoch": 0.49, + "learning_rate": 1.0285814143140072e-07, + "loss": 0.0969, + "step": 25065 + }, + { + "epoch": 0.49, + "learning_rate": 1.0285425808706458e-07, + "loss": 0.0024, + "step": 25066 + }, + { + "epoch": 0.49, + "learning_rate": 1.0285037474272844e-07, + "loss": 0.0006, + "step": 25067 + }, + { + "epoch": 0.49, + "learning_rate": 1.028464913983923e-07, + "loss": 0.0008, + "step": 25068 + }, + { + "epoch": 0.49, + "learning_rate": 1.0284260805405616e-07, + "loss": 0.0004, + "step": 25069 + }, + { + "epoch": 0.49, + "learning_rate": 1.0283872470972002e-07, + "loss": 0.0006, + "step": 25070 + }, + { + "epoch": 0.49, + "learning_rate": 1.0283484136538387e-07, + "loss": 0.0013, + "step": 25071 + }, + { + "epoch": 0.49, + "learning_rate": 1.0283095802104773e-07, + "loss": 0.0108, + "step": 25072 + }, + { + "epoch": 0.49, + "learning_rate": 1.0282707467671159e-07, + "loss": 0.0006, + "step": 25073 + }, + { + "epoch": 0.49, + "learning_rate": 1.0282319133237545e-07, + "loss": 0.0005, + "step": 25074 + }, + { + "epoch": 0.49, + "learning_rate": 1.0281930798803931e-07, + "loss": 0.0008, + "step": 25075 + }, + { + "epoch": 0.49, + "learning_rate": 1.0281542464370317e-07, + "loss": 0.0006, + "step": 25076 + }, + { + "epoch": 0.49, + "learning_rate": 1.02811541299367e-07, + "loss": 0.0014, + "step": 25077 + }, + { + "epoch": 0.49, + "learning_rate": 1.0280765795503086e-07, + "loss": 0.0006, + "step": 25078 + }, + { + "epoch": 0.49, + "learning_rate": 1.0280377461069471e-07, + "loss": 0.0053, + "step": 25079 + }, + { + "epoch": 0.49, + "learning_rate": 1.0279989126635857e-07, + "loss": 0.0042, + "step": 25080 + }, + { + "epoch": 0.49, + "learning_rate": 1.0279600792202243e-07, + "loss": 0.0007, + "step": 25081 + }, + { + "epoch": 0.49, + "learning_rate": 1.0279212457768629e-07, + "loss": 0.0008, + "step": 25082 + }, + { + "epoch": 0.49, + "learning_rate": 1.0278824123335015e-07, + "loss": 0.0007, + "step": 25083 + }, + { + "epoch": 0.49, + "learning_rate": 1.02784357889014e-07, + "loss": 0.0007, + "step": 25084 + }, + { + "epoch": 0.49, + "learning_rate": 1.0278047454467786e-07, + "loss": 0.0005, + "step": 25085 + }, + { + "epoch": 0.49, + "learning_rate": 1.0277659120034172e-07, + "loss": 0.0005, + "step": 25086 + }, + { + "epoch": 0.49, + "learning_rate": 1.0277270785600558e-07, + "loss": 0.0014, + "step": 25087 + }, + { + "epoch": 0.49, + "learning_rate": 1.0276882451166944e-07, + "loss": 0.0005, + "step": 25088 + }, + { + "epoch": 0.49, + "learning_rate": 1.027649411673333e-07, + "loss": 0.0006, + "step": 25089 + }, + { + "epoch": 0.49, + "learning_rate": 1.0276105782299715e-07, + "loss": 0.0006, + "step": 25090 + }, + { + "epoch": 0.49, + "learning_rate": 1.0275717447866101e-07, + "loss": 0.0005, + "step": 25091 + }, + { + "epoch": 0.49, + "learning_rate": 1.0275329113432487e-07, + "loss": 1.0826, + "step": 25092 + }, + { + "epoch": 0.49, + "learning_rate": 1.0274940778998873e-07, + "loss": 0.0005, + "step": 25093 + }, + { + "epoch": 0.49, + "learning_rate": 1.0274552444565259e-07, + "loss": 0.3984, + "step": 25094 + }, + { + "epoch": 0.49, + "learning_rate": 1.0274164110131645e-07, + "loss": 0.0005, + "step": 25095 + }, + { + "epoch": 0.49, + "learning_rate": 1.027377577569803e-07, + "loss": 0.0005, + "step": 25096 + }, + { + "epoch": 0.49, + "learning_rate": 1.0273387441264416e-07, + "loss": 0.005, + "step": 25097 + }, + { + "epoch": 0.49, + "learning_rate": 1.0272999106830802e-07, + "loss": 0.0005, + "step": 25098 + }, + { + "epoch": 0.49, + "learning_rate": 1.0272610772397188e-07, + "loss": 0.0006, + "step": 25099 + }, + { + "epoch": 0.49, + "learning_rate": 1.0272222437963574e-07, + "loss": 0.9756, + "step": 25100 + }, + { + "epoch": 0.49, + "learning_rate": 1.027183410352996e-07, + "loss": 0.0004, + "step": 25101 + }, + { + "epoch": 0.49, + "learning_rate": 1.0271445769096345e-07, + "loss": 0.0005, + "step": 25102 + }, + { + "epoch": 0.49, + "learning_rate": 1.0271057434662731e-07, + "loss": 0.001, + "step": 25103 + }, + { + "epoch": 0.49, + "learning_rate": 1.0270669100229117e-07, + "loss": 0.0006, + "step": 25104 + }, + { + "epoch": 0.49, + "learning_rate": 1.0270280765795503e-07, + "loss": 0.0004, + "step": 25105 + }, + { + "epoch": 0.49, + "learning_rate": 1.0269892431361889e-07, + "loss": 0.1838, + "step": 25106 + }, + { + "epoch": 0.49, + "learning_rate": 1.0269504096928274e-07, + "loss": 0.0006, + "step": 25107 + }, + { + "epoch": 0.49, + "learning_rate": 1.026911576249466e-07, + "loss": 0.0007, + "step": 25108 + }, + { + "epoch": 0.49, + "learning_rate": 1.0268727428061046e-07, + "loss": 0.0005, + "step": 25109 + }, + { + "epoch": 0.49, + "learning_rate": 1.0268339093627432e-07, + "loss": 0.0005, + "step": 25110 + }, + { + "epoch": 0.49, + "learning_rate": 1.0267950759193818e-07, + "loss": 0.0006, + "step": 25111 + }, + { + "epoch": 0.49, + "learning_rate": 1.0267562424760204e-07, + "loss": 0.9164, + "step": 25112 + }, + { + "epoch": 0.49, + "learning_rate": 1.026717409032659e-07, + "loss": 0.0004, + "step": 25113 + }, + { + "epoch": 0.49, + "learning_rate": 1.0266785755892975e-07, + "loss": 0.0006, + "step": 25114 + }, + { + "epoch": 0.49, + "learning_rate": 1.0266397421459361e-07, + "loss": 0.0005, + "step": 25115 + }, + { + "epoch": 0.49, + "learning_rate": 1.0266009087025747e-07, + "loss": 0.0013, + "step": 25116 + }, + { + "epoch": 0.49, + "learning_rate": 1.0265620752592133e-07, + "loss": 0.0006, + "step": 25117 + }, + { + "epoch": 0.49, + "learning_rate": 1.0265232418158519e-07, + "loss": 0.0005, + "step": 25118 + }, + { + "epoch": 0.49, + "learning_rate": 1.0264844083724904e-07, + "loss": 0.0007, + "step": 25119 + }, + { + "epoch": 0.49, + "learning_rate": 1.026445574929129e-07, + "loss": 1.1981, + "step": 25120 + }, + { + "epoch": 0.49, + "learning_rate": 1.0264067414857676e-07, + "loss": 0.0005, + "step": 25121 + }, + { + "epoch": 0.49, + "learning_rate": 1.0263679080424062e-07, + "loss": 0.0006, + "step": 25122 + }, + { + "epoch": 0.49, + "learning_rate": 1.0263290745990448e-07, + "loss": 0.0008, + "step": 25123 + }, + { + "epoch": 0.49, + "learning_rate": 1.0262902411556833e-07, + "loss": 0.0006, + "step": 25124 + }, + { + "epoch": 0.49, + "learning_rate": 1.0262514077123219e-07, + "loss": 0.0005, + "step": 25125 + }, + { + "epoch": 0.49, + "learning_rate": 1.0262125742689605e-07, + "loss": 0.0007, + "step": 25126 + }, + { + "epoch": 0.49, + "learning_rate": 1.0261737408255991e-07, + "loss": 0.0021, + "step": 25127 + }, + { + "epoch": 0.49, + "learning_rate": 1.0261349073822377e-07, + "loss": 0.0007, + "step": 25128 + }, + { + "epoch": 0.49, + "learning_rate": 1.0260960739388763e-07, + "loss": 0.5224, + "step": 25129 + }, + { + "epoch": 0.49, + "learning_rate": 1.0260572404955148e-07, + "loss": 0.0037, + "step": 25130 + }, + { + "epoch": 0.49, + "learning_rate": 1.0260184070521534e-07, + "loss": 0.0015, + "step": 25131 + }, + { + "epoch": 0.49, + "learning_rate": 1.025979573608792e-07, + "loss": 0.0006, + "step": 25132 + }, + { + "epoch": 0.49, + "learning_rate": 1.0259407401654306e-07, + "loss": 0.0006, + "step": 25133 + }, + { + "epoch": 0.49, + "learning_rate": 1.0259019067220692e-07, + "loss": 0.4503, + "step": 25134 + }, + { + "epoch": 0.49, + "learning_rate": 1.0258630732787075e-07, + "loss": 0.0006, + "step": 25135 + }, + { + "epoch": 0.49, + "learning_rate": 1.0258242398353461e-07, + "loss": 0.0014, + "step": 25136 + }, + { + "epoch": 0.49, + "learning_rate": 1.0257854063919847e-07, + "loss": 0.0006, + "step": 25137 + }, + { + "epoch": 0.49, + "learning_rate": 1.0257465729486232e-07, + "loss": 0.0005, + "step": 25138 + }, + { + "epoch": 0.49, + "learning_rate": 1.0257077395052618e-07, + "loss": 0.0007, + "step": 25139 + }, + { + "epoch": 0.49, + "learning_rate": 1.0256689060619004e-07, + "loss": 0.0059, + "step": 25140 + }, + { + "epoch": 0.49, + "learning_rate": 1.025630072618539e-07, + "loss": 0.0006, + "step": 25141 + }, + { + "epoch": 0.49, + "learning_rate": 1.0255912391751776e-07, + "loss": 0.0005, + "step": 25142 + }, + { + "epoch": 0.49, + "learning_rate": 1.0255524057318161e-07, + "loss": 0.0007, + "step": 25143 + }, + { + "epoch": 0.49, + "learning_rate": 1.0255135722884547e-07, + "loss": 0.0004, + "step": 25144 + }, + { + "epoch": 0.49, + "learning_rate": 1.0254747388450933e-07, + "loss": 0.0009, + "step": 25145 + }, + { + "epoch": 0.49, + "learning_rate": 1.0254359054017319e-07, + "loss": 0.0006, + "step": 25146 + }, + { + "epoch": 0.49, + "learning_rate": 1.0253970719583705e-07, + "loss": 0.0006, + "step": 25147 + }, + { + "epoch": 0.49, + "learning_rate": 1.025358238515009e-07, + "loss": 0.0006, + "step": 25148 + }, + { + "epoch": 0.49, + "learning_rate": 1.0253194050716476e-07, + "loss": 0.0008, + "step": 25149 + }, + { + "epoch": 0.49, + "learning_rate": 1.0252805716282862e-07, + "loss": 0.0006, + "step": 25150 + }, + { + "epoch": 0.49, + "learning_rate": 1.0252417381849248e-07, + "loss": 0.0009, + "step": 25151 + }, + { + "epoch": 0.49, + "learning_rate": 1.0252029047415634e-07, + "loss": 0.0008, + "step": 25152 + }, + { + "epoch": 0.49, + "learning_rate": 1.025164071298202e-07, + "loss": 0.0006, + "step": 25153 + }, + { + "epoch": 0.49, + "learning_rate": 1.0251252378548406e-07, + "loss": 0.0168, + "step": 25154 + }, + { + "epoch": 0.49, + "learning_rate": 1.0250864044114791e-07, + "loss": 0.0006, + "step": 25155 + }, + { + "epoch": 0.49, + "learning_rate": 1.0250475709681177e-07, + "loss": 0.0006, + "step": 25156 + }, + { + "epoch": 0.49, + "learning_rate": 1.0250087375247563e-07, + "loss": 0.0012, + "step": 25157 + }, + { + "epoch": 0.49, + "learning_rate": 1.0249699040813949e-07, + "loss": 0.0031, + "step": 25158 + }, + { + "epoch": 0.49, + "learning_rate": 1.0249310706380335e-07, + "loss": 0.0007, + "step": 25159 + }, + { + "epoch": 0.49, + "learning_rate": 1.024892237194672e-07, + "loss": 0.0005, + "step": 25160 + }, + { + "epoch": 0.49, + "learning_rate": 1.0248534037513106e-07, + "loss": 0.0008, + "step": 25161 + }, + { + "epoch": 0.49, + "learning_rate": 1.0248145703079492e-07, + "loss": 0.2227, + "step": 25162 + }, + { + "epoch": 0.49, + "learning_rate": 1.0247757368645878e-07, + "loss": 0.0006, + "step": 25163 + }, + { + "epoch": 0.49, + "learning_rate": 1.0247369034212264e-07, + "loss": 0.0005, + "step": 25164 + }, + { + "epoch": 0.49, + "learning_rate": 1.024698069977865e-07, + "loss": 0.0007, + "step": 25165 + }, + { + "epoch": 0.49, + "learning_rate": 1.0246592365345035e-07, + "loss": 0.0009, + "step": 25166 + }, + { + "epoch": 0.49, + "learning_rate": 1.024620403091142e-07, + "loss": 0.0008, + "step": 25167 + }, + { + "epoch": 0.49, + "learning_rate": 1.0245815696477806e-07, + "loss": 0.0097, + "step": 25168 + }, + { + "epoch": 0.49, + "learning_rate": 1.0245427362044192e-07, + "loss": 0.0028, + "step": 25169 + }, + { + "epoch": 0.49, + "learning_rate": 1.0245039027610577e-07, + "loss": 0.0005, + "step": 25170 + }, + { + "epoch": 0.49, + "learning_rate": 1.0244650693176963e-07, + "loss": 0.0007, + "step": 25171 + }, + { + "epoch": 0.49, + "learning_rate": 1.0244262358743349e-07, + "loss": 0.0845, + "step": 25172 + }, + { + "epoch": 0.49, + "learning_rate": 1.0243874024309735e-07, + "loss": 0.0006, + "step": 25173 + }, + { + "epoch": 0.49, + "learning_rate": 1.0243485689876121e-07, + "loss": 0.0314, + "step": 25174 + }, + { + "epoch": 0.49, + "learning_rate": 1.0243097355442507e-07, + "loss": 0.0006, + "step": 25175 + }, + { + "epoch": 0.49, + "learning_rate": 1.0242709021008892e-07, + "loss": 0.0007, + "step": 25176 + }, + { + "epoch": 0.49, + "learning_rate": 1.0242320686575278e-07, + "loss": 0.0014, + "step": 25177 + }, + { + "epoch": 0.49, + "learning_rate": 1.0241932352141664e-07, + "loss": 0.0075, + "step": 25178 + }, + { + "epoch": 0.49, + "learning_rate": 1.024154401770805e-07, + "loss": 0.0033, + "step": 25179 + }, + { + "epoch": 0.49, + "learning_rate": 1.0241155683274436e-07, + "loss": 0.3505, + "step": 25180 + }, + { + "epoch": 0.49, + "learning_rate": 1.0240767348840821e-07, + "loss": 0.0013, + "step": 25181 + }, + { + "epoch": 0.49, + "learning_rate": 1.0240379014407207e-07, + "loss": 0.0007, + "step": 25182 + }, + { + "epoch": 0.49, + "learning_rate": 1.0239990679973593e-07, + "loss": 0.0006, + "step": 25183 + }, + { + "epoch": 0.49, + "learning_rate": 1.0239602345539979e-07, + "loss": 0.0758, + "step": 25184 + }, + { + "epoch": 0.49, + "learning_rate": 1.0239214011106365e-07, + "loss": 0.0009, + "step": 25185 + }, + { + "epoch": 0.49, + "learning_rate": 1.023882567667275e-07, + "loss": 0.001, + "step": 25186 + }, + { + "epoch": 0.49, + "learning_rate": 1.0238437342239136e-07, + "loss": 0.0007, + "step": 25187 + }, + { + "epoch": 0.49, + "learning_rate": 1.0238049007805522e-07, + "loss": 0.0005, + "step": 25188 + }, + { + "epoch": 0.49, + "learning_rate": 1.0237660673371908e-07, + "loss": 0.0006, + "step": 25189 + }, + { + "epoch": 0.49, + "learning_rate": 1.0237272338938294e-07, + "loss": 0.0005, + "step": 25190 + }, + { + "epoch": 0.49, + "learning_rate": 1.023688400450468e-07, + "loss": 0.0155, + "step": 25191 + }, + { + "epoch": 0.49, + "learning_rate": 1.0236495670071066e-07, + "loss": 0.0005, + "step": 25192 + }, + { + "epoch": 0.49, + "learning_rate": 1.023610733563745e-07, + "loss": 0.0009, + "step": 25193 + }, + { + "epoch": 0.49, + "learning_rate": 1.0235719001203836e-07, + "loss": 0.0006, + "step": 25194 + }, + { + "epoch": 0.49, + "learning_rate": 1.0235330666770222e-07, + "loss": 0.0007, + "step": 25195 + }, + { + "epoch": 0.49, + "learning_rate": 1.0234942332336606e-07, + "loss": 0.0005, + "step": 25196 + }, + { + "epoch": 0.49, + "learning_rate": 1.0234553997902992e-07, + "loss": 0.0007, + "step": 25197 + }, + { + "epoch": 0.49, + "learning_rate": 1.0234165663469378e-07, + "loss": 0.0006, + "step": 25198 + }, + { + "epoch": 0.49, + "learning_rate": 1.0233777329035764e-07, + "loss": 0.0007, + "step": 25199 + }, + { + "epoch": 0.49, + "learning_rate": 1.023338899460215e-07, + "loss": 0.0007, + "step": 25200 + }, + { + "epoch": 0.49, + "learning_rate": 1.0233000660168535e-07, + "loss": 0.0027, + "step": 25201 + }, + { + "epoch": 0.49, + "learning_rate": 1.0232612325734921e-07, + "loss": 0.3778, + "step": 25202 + }, + { + "epoch": 0.49, + "learning_rate": 1.0232223991301307e-07, + "loss": 0.0018, + "step": 25203 + }, + { + "epoch": 0.49, + "learning_rate": 1.0231835656867693e-07, + "loss": 0.0004, + "step": 25204 + }, + { + "epoch": 0.49, + "learning_rate": 1.0231447322434079e-07, + "loss": 0.0008, + "step": 25205 + }, + { + "epoch": 0.49, + "learning_rate": 1.0231058988000464e-07, + "loss": 0.0005, + "step": 25206 + }, + { + "epoch": 0.49, + "learning_rate": 1.023067065356685e-07, + "loss": 1.0435, + "step": 25207 + }, + { + "epoch": 0.49, + "learning_rate": 1.0230282319133236e-07, + "loss": 0.8692, + "step": 25208 + }, + { + "epoch": 0.49, + "learning_rate": 1.0229893984699622e-07, + "loss": 0.0067, + "step": 25209 + }, + { + "epoch": 0.49, + "learning_rate": 1.0229505650266008e-07, + "loss": 0.1229, + "step": 25210 + }, + { + "epoch": 0.49, + "learning_rate": 1.0229117315832394e-07, + "loss": 0.3884, + "step": 25211 + }, + { + "epoch": 0.49, + "learning_rate": 1.022872898139878e-07, + "loss": 0.0007, + "step": 25212 + }, + { + "epoch": 0.49, + "learning_rate": 1.0228340646965165e-07, + "loss": 0.0011, + "step": 25213 + }, + { + "epoch": 0.49, + "learning_rate": 1.0227952312531551e-07, + "loss": 0.0059, + "step": 25214 + }, + { + "epoch": 0.49, + "learning_rate": 1.0227563978097937e-07, + "loss": 0.0004, + "step": 25215 + }, + { + "epoch": 0.49, + "learning_rate": 1.0227175643664323e-07, + "loss": 0.0004, + "step": 25216 + }, + { + "epoch": 0.49, + "learning_rate": 1.0226787309230709e-07, + "loss": 0.0006, + "step": 25217 + }, + { + "epoch": 0.49, + "learning_rate": 1.0226398974797094e-07, + "loss": 0.0007, + "step": 25218 + }, + { + "epoch": 0.49, + "learning_rate": 1.022601064036348e-07, + "loss": 0.0008, + "step": 25219 + }, + { + "epoch": 0.49, + "learning_rate": 1.0225622305929866e-07, + "loss": 0.0009, + "step": 25220 + }, + { + "epoch": 0.49, + "learning_rate": 1.0225233971496252e-07, + "loss": 0.0005, + "step": 25221 + }, + { + "epoch": 0.49, + "learning_rate": 1.0224845637062638e-07, + "loss": 0.0005, + "step": 25222 + }, + { + "epoch": 0.49, + "learning_rate": 1.0224457302629023e-07, + "loss": 0.0008, + "step": 25223 + }, + { + "epoch": 0.49, + "learning_rate": 1.0224068968195409e-07, + "loss": 0.0006, + "step": 25224 + }, + { + "epoch": 0.49, + "learning_rate": 1.0223680633761795e-07, + "loss": 0.0011, + "step": 25225 + }, + { + "epoch": 0.49, + "learning_rate": 1.0223292299328181e-07, + "loss": 0.0004, + "step": 25226 + }, + { + "epoch": 0.49, + "learning_rate": 1.0222903964894567e-07, + "loss": 0.0022, + "step": 25227 + }, + { + "epoch": 0.49, + "learning_rate": 1.0222515630460953e-07, + "loss": 0.0006, + "step": 25228 + }, + { + "epoch": 0.49, + "learning_rate": 1.0222127296027338e-07, + "loss": 0.0008, + "step": 25229 + }, + { + "epoch": 0.49, + "learning_rate": 1.0221738961593724e-07, + "loss": 0.0007, + "step": 25230 + }, + { + "epoch": 0.49, + "learning_rate": 1.022135062716011e-07, + "loss": 0.0005, + "step": 25231 + }, + { + "epoch": 0.49, + "learning_rate": 1.0220962292726496e-07, + "loss": 0.0005, + "step": 25232 + }, + { + "epoch": 0.49, + "learning_rate": 1.0220573958292882e-07, + "loss": 0.0005, + "step": 25233 + }, + { + "epoch": 0.49, + "learning_rate": 1.0220185623859268e-07, + "loss": 0.0011, + "step": 25234 + }, + { + "epoch": 0.49, + "learning_rate": 1.0219797289425653e-07, + "loss": 0.0011, + "step": 25235 + }, + { + "epoch": 0.49, + "learning_rate": 1.0219408954992039e-07, + "loss": 0.0007, + "step": 25236 + }, + { + "epoch": 0.49, + "learning_rate": 1.0219020620558425e-07, + "loss": 0.0007, + "step": 25237 + }, + { + "epoch": 0.49, + "learning_rate": 1.0218632286124811e-07, + "loss": 0.0438, + "step": 25238 + }, + { + "epoch": 0.49, + "learning_rate": 1.0218243951691197e-07, + "loss": 0.0005, + "step": 25239 + }, + { + "epoch": 0.49, + "learning_rate": 1.0217855617257582e-07, + "loss": 0.3213, + "step": 25240 + }, + { + "epoch": 0.49, + "learning_rate": 1.0217467282823968e-07, + "loss": 0.0007, + "step": 25241 + }, + { + "epoch": 0.49, + "learning_rate": 1.0217078948390354e-07, + "loss": 0.4062, + "step": 25242 + }, + { + "epoch": 0.49, + "learning_rate": 1.021669061395674e-07, + "loss": 0.0007, + "step": 25243 + }, + { + "epoch": 0.49, + "learning_rate": 1.0216302279523126e-07, + "loss": 0.0005, + "step": 25244 + }, + { + "epoch": 0.49, + "learning_rate": 1.0215913945089512e-07, + "loss": 0.0006, + "step": 25245 + }, + { + "epoch": 0.49, + "learning_rate": 1.0215525610655897e-07, + "loss": 0.0005, + "step": 25246 + }, + { + "epoch": 0.49, + "learning_rate": 1.0215137276222283e-07, + "loss": 0.7687, + "step": 25247 + }, + { + "epoch": 0.49, + "learning_rate": 1.0214748941788669e-07, + "loss": 0.0183, + "step": 25248 + }, + { + "epoch": 0.49, + "learning_rate": 1.0214360607355055e-07, + "loss": 0.0007, + "step": 25249 + }, + { + "epoch": 0.49, + "learning_rate": 1.0213972272921441e-07, + "loss": 0.0004, + "step": 25250 + }, + { + "epoch": 0.49, + "learning_rate": 1.0213583938487824e-07, + "loss": 0.0009, + "step": 25251 + }, + { + "epoch": 0.49, + "learning_rate": 1.021319560405421e-07, + "loss": 0.0006, + "step": 25252 + }, + { + "epoch": 0.49, + "learning_rate": 1.0212807269620596e-07, + "loss": 0.0006, + "step": 25253 + }, + { + "epoch": 0.49, + "learning_rate": 1.0212418935186981e-07, + "loss": 0.0008, + "step": 25254 + }, + { + "epoch": 0.49, + "learning_rate": 1.0212030600753367e-07, + "loss": 0.0006, + "step": 25255 + }, + { + "epoch": 0.49, + "learning_rate": 1.0211642266319753e-07, + "loss": 0.0303, + "step": 25256 + }, + { + "epoch": 0.49, + "learning_rate": 1.0211253931886139e-07, + "loss": 0.1472, + "step": 25257 + }, + { + "epoch": 0.49, + "learning_rate": 1.0210865597452525e-07, + "loss": 0.0005, + "step": 25258 + }, + { + "epoch": 0.49, + "learning_rate": 1.021047726301891e-07, + "loss": 0.001, + "step": 25259 + }, + { + "epoch": 0.49, + "learning_rate": 1.0210088928585296e-07, + "loss": 0.0006, + "step": 25260 + }, + { + "epoch": 0.49, + "learning_rate": 1.0209700594151682e-07, + "loss": 0.0005, + "step": 25261 + }, + { + "epoch": 0.49, + "learning_rate": 1.0209312259718068e-07, + "loss": 0.0007, + "step": 25262 + }, + { + "epoch": 0.49, + "learning_rate": 1.0208923925284454e-07, + "loss": 0.0005, + "step": 25263 + }, + { + "epoch": 0.49, + "learning_rate": 1.020853559085084e-07, + "loss": 0.0004, + "step": 25264 + }, + { + "epoch": 0.49, + "learning_rate": 1.0208147256417225e-07, + "loss": 0.4925, + "step": 25265 + }, + { + "epoch": 0.49, + "learning_rate": 1.0207758921983611e-07, + "loss": 0.0006, + "step": 25266 + }, + { + "epoch": 0.49, + "learning_rate": 1.0207370587549997e-07, + "loss": 0.0016, + "step": 25267 + }, + { + "epoch": 0.49, + "learning_rate": 1.0206982253116383e-07, + "loss": 0.0006, + "step": 25268 + }, + { + "epoch": 0.49, + "learning_rate": 1.0206593918682769e-07, + "loss": 0.0008, + "step": 25269 + }, + { + "epoch": 0.49, + "learning_rate": 1.0206205584249155e-07, + "loss": 0.001, + "step": 25270 + }, + { + "epoch": 0.49, + "learning_rate": 1.020581724981554e-07, + "loss": 0.0013, + "step": 25271 + }, + { + "epoch": 0.49, + "learning_rate": 1.0205428915381926e-07, + "loss": 0.0007, + "step": 25272 + }, + { + "epoch": 0.49, + "learning_rate": 1.0205040580948312e-07, + "loss": 0.5055, + "step": 25273 + }, + { + "epoch": 0.49, + "learning_rate": 1.0204652246514698e-07, + "loss": 0.0006, + "step": 25274 + }, + { + "epoch": 0.49, + "learning_rate": 1.0204263912081084e-07, + "loss": 0.0006, + "step": 25275 + }, + { + "epoch": 0.49, + "learning_rate": 1.020387557764747e-07, + "loss": 0.0007, + "step": 25276 + }, + { + "epoch": 0.49, + "learning_rate": 1.0203487243213855e-07, + "loss": 0.0008, + "step": 25277 + }, + { + "epoch": 0.49, + "learning_rate": 1.0203098908780241e-07, + "loss": 0.0005, + "step": 25278 + }, + { + "epoch": 0.49, + "learning_rate": 1.0202710574346627e-07, + "loss": 0.0006, + "step": 25279 + }, + { + "epoch": 0.49, + "learning_rate": 1.0202322239913013e-07, + "loss": 0.0012, + "step": 25280 + }, + { + "epoch": 0.49, + "learning_rate": 1.0201933905479399e-07, + "loss": 0.0005, + "step": 25281 + }, + { + "epoch": 0.49, + "learning_rate": 1.0201545571045784e-07, + "loss": 0.0005, + "step": 25282 + }, + { + "epoch": 0.49, + "learning_rate": 1.020115723661217e-07, + "loss": 0.0005, + "step": 25283 + }, + { + "epoch": 0.49, + "learning_rate": 1.0200768902178556e-07, + "loss": 0.0007, + "step": 25284 + }, + { + "epoch": 0.49, + "learning_rate": 1.0200380567744942e-07, + "loss": 0.0036, + "step": 25285 + }, + { + "epoch": 0.49, + "learning_rate": 1.0199992233311328e-07, + "loss": 0.0007, + "step": 25286 + }, + { + "epoch": 0.49, + "learning_rate": 1.0199603898877714e-07, + "loss": 0.0005, + "step": 25287 + }, + { + "epoch": 0.49, + "learning_rate": 1.01992155644441e-07, + "loss": 0.0028, + "step": 25288 + }, + { + "epoch": 0.49, + "learning_rate": 1.0198827230010485e-07, + "loss": 0.0248, + "step": 25289 + }, + { + "epoch": 0.49, + "learning_rate": 1.0198438895576871e-07, + "loss": 0.0006, + "step": 25290 + }, + { + "epoch": 0.49, + "learning_rate": 1.0198050561143257e-07, + "loss": 0.0007, + "step": 25291 + }, + { + "epoch": 0.49, + "learning_rate": 1.0197662226709643e-07, + "loss": 0.0006, + "step": 25292 + }, + { + "epoch": 0.49, + "learning_rate": 1.0197273892276029e-07, + "loss": 0.0007, + "step": 25293 + }, + { + "epoch": 0.49, + "learning_rate": 1.0196885557842414e-07, + "loss": 0.3018, + "step": 25294 + }, + { + "epoch": 0.49, + "learning_rate": 1.01964972234088e-07, + "loss": 0.0006, + "step": 25295 + }, + { + "epoch": 0.49, + "learning_rate": 1.0196108888975186e-07, + "loss": 0.0005, + "step": 25296 + }, + { + "epoch": 0.49, + "learning_rate": 1.0195720554541572e-07, + "loss": 0.0007, + "step": 25297 + }, + { + "epoch": 0.49, + "learning_rate": 1.0195332220107958e-07, + "loss": 0.0006, + "step": 25298 + }, + { + "epoch": 0.49, + "learning_rate": 1.0194943885674343e-07, + "loss": 0.003, + "step": 25299 + }, + { + "epoch": 0.49, + "learning_rate": 1.0194555551240729e-07, + "loss": 0.0006, + "step": 25300 + }, + { + "epoch": 0.49, + "learning_rate": 1.0194167216807115e-07, + "loss": 0.0005, + "step": 25301 + }, + { + "epoch": 0.49, + "learning_rate": 1.0193778882373501e-07, + "loss": 0.0006, + "step": 25302 + }, + { + "epoch": 0.49, + "learning_rate": 1.0193390547939887e-07, + "loss": 0.0007, + "step": 25303 + }, + { + "epoch": 0.49, + "learning_rate": 1.0193002213506273e-07, + "loss": 0.0007, + "step": 25304 + }, + { + "epoch": 0.49, + "learning_rate": 1.0192613879072658e-07, + "loss": 0.0007, + "step": 25305 + }, + { + "epoch": 0.49, + "learning_rate": 1.0192225544639044e-07, + "loss": 0.0006, + "step": 25306 + }, + { + "epoch": 0.49, + "learning_rate": 1.019183721020543e-07, + "loss": 0.0005, + "step": 25307 + }, + { + "epoch": 0.49, + "learning_rate": 1.0191448875771816e-07, + "loss": 0.0008, + "step": 25308 + }, + { + "epoch": 0.49, + "learning_rate": 1.0191060541338199e-07, + "loss": 0.0004, + "step": 25309 + }, + { + "epoch": 0.49, + "learning_rate": 1.0190672206904585e-07, + "loss": 0.0006, + "step": 25310 + }, + { + "epoch": 0.49, + "learning_rate": 1.0190283872470971e-07, + "loss": 0.0005, + "step": 25311 + }, + { + "epoch": 0.49, + "learning_rate": 1.0189895538037357e-07, + "loss": 0.0004, + "step": 25312 + }, + { + "epoch": 0.49, + "learning_rate": 1.0189507203603742e-07, + "loss": 0.0008, + "step": 25313 + }, + { + "epoch": 0.49, + "learning_rate": 1.0189118869170128e-07, + "loss": 0.0021, + "step": 25314 + }, + { + "epoch": 0.49, + "learning_rate": 1.0188730534736514e-07, + "loss": 0.0005, + "step": 25315 + }, + { + "epoch": 0.49, + "learning_rate": 1.01883422003029e-07, + "loss": 0.0006, + "step": 25316 + }, + { + "epoch": 0.49, + "learning_rate": 1.0187953865869286e-07, + "loss": 0.0007, + "step": 25317 + }, + { + "epoch": 0.49, + "learning_rate": 1.0187565531435671e-07, + "loss": 0.001, + "step": 25318 + }, + { + "epoch": 0.49, + "learning_rate": 1.0187177197002057e-07, + "loss": 0.0005, + "step": 25319 + }, + { + "epoch": 0.49, + "learning_rate": 1.0186788862568443e-07, + "loss": 0.0005, + "step": 25320 + }, + { + "epoch": 0.49, + "learning_rate": 1.0186400528134829e-07, + "loss": 0.0005, + "step": 25321 + }, + { + "epoch": 0.49, + "learning_rate": 1.0186012193701215e-07, + "loss": 0.0006, + "step": 25322 + }, + { + "epoch": 0.49, + "learning_rate": 1.01856238592676e-07, + "loss": 0.6264, + "step": 25323 + }, + { + "epoch": 0.49, + "learning_rate": 1.0185235524833986e-07, + "loss": 0.0008, + "step": 25324 + }, + { + "epoch": 0.49, + "learning_rate": 1.0184847190400372e-07, + "loss": 0.0006, + "step": 25325 + }, + { + "epoch": 0.49, + "learning_rate": 1.0184458855966758e-07, + "loss": 0.0004, + "step": 25326 + }, + { + "epoch": 0.49, + "learning_rate": 1.0184070521533144e-07, + "loss": 0.0004, + "step": 25327 + }, + { + "epoch": 0.49, + "learning_rate": 1.018368218709953e-07, + "loss": 0.0005, + "step": 25328 + }, + { + "epoch": 0.49, + "learning_rate": 1.0183293852665916e-07, + "loss": 0.0007, + "step": 25329 + }, + { + "epoch": 0.49, + "learning_rate": 1.0182905518232301e-07, + "loss": 0.0005, + "step": 25330 + }, + { + "epoch": 0.49, + "learning_rate": 1.0182517183798687e-07, + "loss": 0.0012, + "step": 25331 + }, + { + "epoch": 0.49, + "learning_rate": 1.0182128849365073e-07, + "loss": 0.0005, + "step": 25332 + }, + { + "epoch": 0.49, + "learning_rate": 1.0181740514931459e-07, + "loss": 0.0006, + "step": 25333 + }, + { + "epoch": 0.49, + "learning_rate": 1.0181352180497845e-07, + "loss": 0.0006, + "step": 25334 + }, + { + "epoch": 0.49, + "learning_rate": 1.018096384606423e-07, + "loss": 0.8458, + "step": 25335 + }, + { + "epoch": 0.49, + "learning_rate": 1.0180575511630616e-07, + "loss": 0.0005, + "step": 25336 + }, + { + "epoch": 0.49, + "learning_rate": 1.0180187177197002e-07, + "loss": 0.0015, + "step": 25337 + }, + { + "epoch": 0.49, + "learning_rate": 1.0179798842763388e-07, + "loss": 0.0006, + "step": 25338 + }, + { + "epoch": 0.49, + "learning_rate": 1.0179410508329774e-07, + "loss": 0.0005, + "step": 25339 + }, + { + "epoch": 0.49, + "learning_rate": 1.017902217389616e-07, + "loss": 0.0006, + "step": 25340 + }, + { + "epoch": 0.49, + "learning_rate": 1.0178633839462545e-07, + "loss": 0.0008, + "step": 25341 + }, + { + "epoch": 0.49, + "learning_rate": 1.0178245505028931e-07, + "loss": 0.0007, + "step": 25342 + }, + { + "epoch": 0.49, + "learning_rate": 1.0177857170595317e-07, + "loss": 0.0006, + "step": 25343 + }, + { + "epoch": 0.49, + "learning_rate": 1.0177468836161702e-07, + "loss": 0.0006, + "step": 25344 + }, + { + "epoch": 0.49, + "learning_rate": 1.0177080501728087e-07, + "loss": 0.0006, + "step": 25345 + }, + { + "epoch": 0.49, + "learning_rate": 1.0176692167294473e-07, + "loss": 0.0007, + "step": 25346 + }, + { + "epoch": 0.49, + "learning_rate": 1.0176303832860859e-07, + "loss": 0.0006, + "step": 25347 + }, + { + "epoch": 0.49, + "learning_rate": 1.0175915498427245e-07, + "loss": 0.0006, + "step": 25348 + }, + { + "epoch": 0.49, + "learning_rate": 1.0175527163993631e-07, + "loss": 0.0009, + "step": 25349 + }, + { + "epoch": 0.49, + "learning_rate": 1.0175138829560017e-07, + "loss": 0.0005, + "step": 25350 + }, + { + "epoch": 0.49, + "learning_rate": 1.0174750495126402e-07, + "loss": 0.0008, + "step": 25351 + }, + { + "epoch": 0.49, + "learning_rate": 1.0174362160692788e-07, + "loss": 0.0009, + "step": 25352 + }, + { + "epoch": 0.49, + "learning_rate": 1.0173973826259174e-07, + "loss": 0.0617, + "step": 25353 + }, + { + "epoch": 0.49, + "learning_rate": 1.017358549182556e-07, + "loss": 0.0006, + "step": 25354 + }, + { + "epoch": 0.49, + "learning_rate": 1.0173197157391946e-07, + "loss": 0.0004, + "step": 25355 + }, + { + "epoch": 0.49, + "learning_rate": 1.0172808822958331e-07, + "loss": 0.0006, + "step": 25356 + }, + { + "epoch": 0.49, + "learning_rate": 1.0172420488524717e-07, + "loss": 0.0006, + "step": 25357 + }, + { + "epoch": 0.49, + "learning_rate": 1.0172032154091103e-07, + "loss": 0.0005, + "step": 25358 + }, + { + "epoch": 0.49, + "learning_rate": 1.0171643819657489e-07, + "loss": 0.5141, + "step": 25359 + }, + { + "epoch": 0.49, + "learning_rate": 1.0171255485223875e-07, + "loss": 0.0454, + "step": 25360 + }, + { + "epoch": 0.49, + "learning_rate": 1.017086715079026e-07, + "loss": 0.0006, + "step": 25361 + }, + { + "epoch": 0.49, + "learning_rate": 1.0170478816356646e-07, + "loss": 0.0006, + "step": 25362 + }, + { + "epoch": 0.49, + "learning_rate": 1.0170090481923032e-07, + "loss": 0.2659, + "step": 25363 + }, + { + "epoch": 0.49, + "learning_rate": 1.0169702147489418e-07, + "loss": 0.0007, + "step": 25364 + }, + { + "epoch": 0.49, + "learning_rate": 1.0169313813055804e-07, + "loss": 0.0006, + "step": 25365 + }, + { + "epoch": 0.49, + "learning_rate": 1.016892547862219e-07, + "loss": 0.0006, + "step": 25366 + }, + { + "epoch": 0.49, + "learning_rate": 1.0168537144188574e-07, + "loss": 0.0004, + "step": 25367 + }, + { + "epoch": 0.49, + "learning_rate": 1.016814880975496e-07, + "loss": 0.0006, + "step": 25368 + }, + { + "epoch": 0.49, + "learning_rate": 1.0167760475321346e-07, + "loss": 0.0008, + "step": 25369 + }, + { + "epoch": 0.49, + "learning_rate": 1.0167372140887732e-07, + "loss": 0.9964, + "step": 25370 + }, + { + "epoch": 0.49, + "learning_rate": 1.0166983806454118e-07, + "loss": 0.0005, + "step": 25371 + }, + { + "epoch": 0.49, + "learning_rate": 1.0166595472020503e-07, + "loss": 0.001, + "step": 25372 + }, + { + "epoch": 0.49, + "learning_rate": 1.0166207137586888e-07, + "loss": 0.0006, + "step": 25373 + }, + { + "epoch": 0.49, + "learning_rate": 1.0165818803153274e-07, + "loss": 0.0118, + "step": 25374 + }, + { + "epoch": 0.49, + "learning_rate": 1.016543046871966e-07, + "loss": 0.0008, + "step": 25375 + }, + { + "epoch": 0.49, + "learning_rate": 1.0165042134286045e-07, + "loss": 0.0024, + "step": 25376 + }, + { + "epoch": 0.49, + "learning_rate": 1.0164653799852431e-07, + "loss": 0.0005, + "step": 25377 + }, + { + "epoch": 0.49, + "learning_rate": 1.0164265465418817e-07, + "loss": 0.0007, + "step": 25378 + }, + { + "epoch": 0.49, + "learning_rate": 1.0163877130985203e-07, + "loss": 0.0006, + "step": 25379 + }, + { + "epoch": 0.49, + "learning_rate": 1.0163488796551589e-07, + "loss": 0.0006, + "step": 25380 + }, + { + "epoch": 0.49, + "learning_rate": 1.0163100462117974e-07, + "loss": 0.0007, + "step": 25381 + }, + { + "epoch": 0.49, + "learning_rate": 1.016271212768436e-07, + "loss": 0.0007, + "step": 25382 + }, + { + "epoch": 0.49, + "learning_rate": 1.0162323793250746e-07, + "loss": 0.0006, + "step": 25383 + }, + { + "epoch": 0.49, + "learning_rate": 1.0161935458817132e-07, + "loss": 0.0005, + "step": 25384 + }, + { + "epoch": 0.49, + "learning_rate": 1.0161547124383518e-07, + "loss": 0.0005, + "step": 25385 + }, + { + "epoch": 0.49, + "learning_rate": 1.0161158789949904e-07, + "loss": 1.2022, + "step": 25386 + }, + { + "epoch": 0.49, + "learning_rate": 1.016077045551629e-07, + "loss": 0.0008, + "step": 25387 + }, + { + "epoch": 0.49, + "learning_rate": 1.0160382121082675e-07, + "loss": 0.0008, + "step": 25388 + }, + { + "epoch": 0.49, + "learning_rate": 1.0159993786649061e-07, + "loss": 0.0005, + "step": 25389 + }, + { + "epoch": 0.49, + "learning_rate": 1.0159605452215447e-07, + "loss": 0.0005, + "step": 25390 + }, + { + "epoch": 0.49, + "learning_rate": 1.0159217117781833e-07, + "loss": 0.0007, + "step": 25391 + }, + { + "epoch": 0.49, + "learning_rate": 1.0158828783348219e-07, + "loss": 0.0007, + "step": 25392 + }, + { + "epoch": 0.49, + "learning_rate": 1.0158440448914604e-07, + "loss": 0.6298, + "step": 25393 + }, + { + "epoch": 0.49, + "learning_rate": 1.015805211448099e-07, + "loss": 0.0005, + "step": 25394 + }, + { + "epoch": 0.49, + "learning_rate": 1.0157663780047376e-07, + "loss": 0.0006, + "step": 25395 + }, + { + "epoch": 0.49, + "learning_rate": 1.0157275445613762e-07, + "loss": 0.0008, + "step": 25396 + }, + { + "epoch": 0.49, + "learning_rate": 1.0156887111180148e-07, + "loss": 0.0006, + "step": 25397 + }, + { + "epoch": 0.49, + "learning_rate": 1.0156498776746533e-07, + "loss": 0.0802, + "step": 25398 + }, + { + "epoch": 0.49, + "learning_rate": 1.0156110442312919e-07, + "loss": 0.0006, + "step": 25399 + }, + { + "epoch": 0.49, + "learning_rate": 1.0155722107879305e-07, + "loss": 0.0092, + "step": 25400 + }, + { + "epoch": 0.49, + "learning_rate": 1.0155333773445691e-07, + "loss": 0.0005, + "step": 25401 + }, + { + "epoch": 0.49, + "learning_rate": 1.0154945439012077e-07, + "loss": 0.0005, + "step": 25402 + }, + { + "epoch": 0.49, + "learning_rate": 1.0154557104578463e-07, + "loss": 0.177, + "step": 25403 + }, + { + "epoch": 0.49, + "learning_rate": 1.0154168770144848e-07, + "loss": 0.0008, + "step": 25404 + }, + { + "epoch": 0.49, + "learning_rate": 1.0153780435711234e-07, + "loss": 0.0008, + "step": 25405 + }, + { + "epoch": 0.49, + "learning_rate": 1.015339210127762e-07, + "loss": 0.0016, + "step": 25406 + }, + { + "epoch": 0.49, + "learning_rate": 1.0153003766844006e-07, + "loss": 0.0004, + "step": 25407 + }, + { + "epoch": 0.49, + "learning_rate": 1.0152615432410392e-07, + "loss": 0.0005, + "step": 25408 + }, + { + "epoch": 0.49, + "learning_rate": 1.0152227097976778e-07, + "loss": 0.0008, + "step": 25409 + }, + { + "epoch": 0.49, + "learning_rate": 1.0151838763543163e-07, + "loss": 0.0006, + "step": 25410 + }, + { + "epoch": 0.49, + "learning_rate": 1.0151450429109549e-07, + "loss": 0.0006, + "step": 25411 + }, + { + "epoch": 0.49, + "learning_rate": 1.0151062094675935e-07, + "loss": 0.0382, + "step": 25412 + }, + { + "epoch": 0.49, + "learning_rate": 1.0150673760242321e-07, + "loss": 0.003, + "step": 25413 + }, + { + "epoch": 0.49, + "learning_rate": 1.0150285425808707e-07, + "loss": 0.0007, + "step": 25414 + }, + { + "epoch": 0.49, + "learning_rate": 1.0149897091375092e-07, + "loss": 0.0007, + "step": 25415 + }, + { + "epoch": 0.49, + "learning_rate": 1.0149508756941478e-07, + "loss": 0.0005, + "step": 25416 + }, + { + "epoch": 0.49, + "learning_rate": 1.0149120422507864e-07, + "loss": 0.0006, + "step": 25417 + }, + { + "epoch": 0.49, + "learning_rate": 1.014873208807425e-07, + "loss": 0.0005, + "step": 25418 + }, + { + "epoch": 0.49, + "learning_rate": 1.0148343753640636e-07, + "loss": 0.0106, + "step": 25419 + }, + { + "epoch": 0.49, + "learning_rate": 1.0147955419207022e-07, + "loss": 0.0006, + "step": 25420 + }, + { + "epoch": 0.49, + "learning_rate": 1.0147567084773407e-07, + "loss": 0.0009, + "step": 25421 + }, + { + "epoch": 0.49, + "learning_rate": 1.0147178750339793e-07, + "loss": 0.0007, + "step": 25422 + }, + { + "epoch": 0.49, + "learning_rate": 1.0146790415906179e-07, + "loss": 0.0008, + "step": 25423 + }, + { + "epoch": 0.49, + "learning_rate": 1.0146402081472565e-07, + "loss": 0.0005, + "step": 25424 + }, + { + "epoch": 0.49, + "learning_rate": 1.0146013747038948e-07, + "loss": 1.3014, + "step": 25425 + }, + { + "epoch": 0.49, + "learning_rate": 1.0145625412605334e-07, + "loss": 0.0006, + "step": 25426 + }, + { + "epoch": 0.49, + "learning_rate": 1.014523707817172e-07, + "loss": 0.0006, + "step": 25427 + }, + { + "epoch": 0.49, + "learning_rate": 1.0144848743738106e-07, + "loss": 0.0711, + "step": 25428 + }, + { + "epoch": 0.49, + "learning_rate": 1.0144460409304491e-07, + "loss": 0.0004, + "step": 25429 + }, + { + "epoch": 0.49, + "learning_rate": 1.0144072074870877e-07, + "loss": 0.0007, + "step": 25430 + }, + { + "epoch": 0.49, + "learning_rate": 1.0143683740437263e-07, + "loss": 0.0019, + "step": 25431 + }, + { + "epoch": 0.49, + "learning_rate": 1.0143295406003649e-07, + "loss": 0.0009, + "step": 25432 + }, + { + "epoch": 0.49, + "learning_rate": 1.0142907071570035e-07, + "loss": 0.0007, + "step": 25433 + }, + { + "epoch": 0.49, + "learning_rate": 1.014251873713642e-07, + "loss": 0.0005, + "step": 25434 + }, + { + "epoch": 0.49, + "learning_rate": 1.0142130402702806e-07, + "loss": 0.0032, + "step": 25435 + }, + { + "epoch": 0.49, + "learning_rate": 1.0141742068269192e-07, + "loss": 0.0049, + "step": 25436 + }, + { + "epoch": 0.49, + "learning_rate": 1.0141353733835578e-07, + "loss": 0.0006, + "step": 25437 + }, + { + "epoch": 0.49, + "learning_rate": 1.0140965399401964e-07, + "loss": 0.0007, + "step": 25438 + }, + { + "epoch": 0.49, + "learning_rate": 1.014057706496835e-07, + "loss": 0.0005, + "step": 25439 + }, + { + "epoch": 0.49, + "learning_rate": 1.0140188730534735e-07, + "loss": 0.0521, + "step": 25440 + }, + { + "epoch": 0.49, + "learning_rate": 1.0139800396101121e-07, + "loss": 0.0071, + "step": 25441 + }, + { + "epoch": 0.49, + "learning_rate": 1.0139412061667507e-07, + "loss": 0.0007, + "step": 25442 + }, + { + "epoch": 0.49, + "learning_rate": 1.0139023727233893e-07, + "loss": 0.0261, + "step": 25443 + }, + { + "epoch": 0.49, + "learning_rate": 1.0138635392800279e-07, + "loss": 0.0006, + "step": 25444 + }, + { + "epoch": 0.49, + "learning_rate": 1.0138247058366665e-07, + "loss": 0.0005, + "step": 25445 + }, + { + "epoch": 0.49, + "learning_rate": 1.013785872393305e-07, + "loss": 1.0673, + "step": 25446 + }, + { + "epoch": 0.49, + "learning_rate": 1.0137470389499436e-07, + "loss": 0.001, + "step": 25447 + }, + { + "epoch": 0.49, + "learning_rate": 1.0137082055065822e-07, + "loss": 0.0005, + "step": 25448 + }, + { + "epoch": 0.49, + "learning_rate": 1.0136693720632208e-07, + "loss": 0.0005, + "step": 25449 + }, + { + "epoch": 0.49, + "learning_rate": 1.0136305386198594e-07, + "loss": 0.0004, + "step": 25450 + }, + { + "epoch": 0.49, + "learning_rate": 1.013591705176498e-07, + "loss": 0.0005, + "step": 25451 + }, + { + "epoch": 0.49, + "learning_rate": 1.0135528717331365e-07, + "loss": 0.0051, + "step": 25452 + }, + { + "epoch": 0.49, + "learning_rate": 1.0135140382897751e-07, + "loss": 0.0008, + "step": 25453 + }, + { + "epoch": 0.49, + "learning_rate": 1.0134752048464137e-07, + "loss": 0.0008, + "step": 25454 + }, + { + "epoch": 0.49, + "learning_rate": 1.0134363714030523e-07, + "loss": 0.0017, + "step": 25455 + }, + { + "epoch": 0.49, + "learning_rate": 1.0133975379596909e-07, + "loss": 0.0009, + "step": 25456 + }, + { + "epoch": 0.49, + "learning_rate": 1.0133587045163294e-07, + "loss": 0.0006, + "step": 25457 + }, + { + "epoch": 0.49, + "learning_rate": 1.013319871072968e-07, + "loss": 0.0007, + "step": 25458 + }, + { + "epoch": 0.49, + "learning_rate": 1.0132810376296066e-07, + "loss": 0.0004, + "step": 25459 + }, + { + "epoch": 0.49, + "learning_rate": 1.0132422041862452e-07, + "loss": 0.0007, + "step": 25460 + }, + { + "epoch": 0.49, + "learning_rate": 1.0132033707428838e-07, + "loss": 0.0008, + "step": 25461 + }, + { + "epoch": 0.49, + "learning_rate": 1.0131645372995224e-07, + "loss": 0.0005, + "step": 25462 + }, + { + "epoch": 0.49, + "learning_rate": 1.013125703856161e-07, + "loss": 0.0007, + "step": 25463 + }, + { + "epoch": 0.49, + "learning_rate": 1.0130868704127995e-07, + "loss": 0.8266, + "step": 25464 + }, + { + "epoch": 0.49, + "learning_rate": 1.0130480369694381e-07, + "loss": 0.0007, + "step": 25465 + }, + { + "epoch": 0.49, + "learning_rate": 1.0130092035260767e-07, + "loss": 0.011, + "step": 25466 + }, + { + "epoch": 0.49, + "learning_rate": 1.0129703700827153e-07, + "loss": 0.0006, + "step": 25467 + }, + { + "epoch": 0.49, + "learning_rate": 1.0129315366393539e-07, + "loss": 0.0004, + "step": 25468 + }, + { + "epoch": 0.49, + "learning_rate": 1.0128927031959924e-07, + "loss": 0.001, + "step": 25469 + }, + { + "epoch": 0.49, + "learning_rate": 1.012853869752631e-07, + "loss": 0.6616, + "step": 25470 + }, + { + "epoch": 0.49, + "learning_rate": 1.0128150363092696e-07, + "loss": 0.2582, + "step": 25471 + }, + { + "epoch": 0.49, + "learning_rate": 1.0127762028659082e-07, + "loss": 0.0006, + "step": 25472 + }, + { + "epoch": 0.49, + "learning_rate": 1.0127373694225468e-07, + "loss": 0.0006, + "step": 25473 + }, + { + "epoch": 0.49, + "learning_rate": 1.0126985359791853e-07, + "loss": 0.0006, + "step": 25474 + }, + { + "epoch": 0.49, + "learning_rate": 1.0126597025358239e-07, + "loss": 0.0007, + "step": 25475 + }, + { + "epoch": 0.49, + "learning_rate": 1.0126208690924625e-07, + "loss": 0.0184, + "step": 25476 + }, + { + "epoch": 0.49, + "learning_rate": 1.0125820356491011e-07, + "loss": 0.5696, + "step": 25477 + }, + { + "epoch": 0.49, + "learning_rate": 1.0125432022057397e-07, + "loss": 0.0892, + "step": 25478 + }, + { + "epoch": 0.49, + "learning_rate": 1.0125043687623783e-07, + "loss": 0.0005, + "step": 25479 + }, + { + "epoch": 0.49, + "learning_rate": 1.0124655353190168e-07, + "loss": 0.0005, + "step": 25480 + }, + { + "epoch": 0.49, + "learning_rate": 1.0124267018756554e-07, + "loss": 0.0005, + "step": 25481 + }, + { + "epoch": 0.49, + "learning_rate": 1.012387868432294e-07, + "loss": 0.0005, + "step": 25482 + }, + { + "epoch": 0.49, + "learning_rate": 1.0123490349889323e-07, + "loss": 0.0006, + "step": 25483 + }, + { + "epoch": 0.49, + "learning_rate": 1.0123102015455709e-07, + "loss": 0.0004, + "step": 25484 + }, + { + "epoch": 0.49, + "learning_rate": 1.0122713681022095e-07, + "loss": 0.0005, + "step": 25485 + }, + { + "epoch": 0.49, + "learning_rate": 1.0122325346588481e-07, + "loss": 0.0006, + "step": 25486 + }, + { + "epoch": 0.49, + "learning_rate": 1.0121937012154867e-07, + "loss": 1.0229, + "step": 25487 + }, + { + "epoch": 0.49, + "learning_rate": 1.0121548677721252e-07, + "loss": 0.0006, + "step": 25488 + }, + { + "epoch": 0.49, + "learning_rate": 1.0121160343287638e-07, + "loss": 0.0006, + "step": 25489 + }, + { + "epoch": 0.49, + "learning_rate": 1.0120772008854024e-07, + "loss": 0.0007, + "step": 25490 + }, + { + "epoch": 0.49, + "learning_rate": 1.012038367442041e-07, + "loss": 0.0006, + "step": 25491 + }, + { + "epoch": 0.49, + "learning_rate": 1.0119995339986796e-07, + "loss": 0.5777, + "step": 25492 + }, + { + "epoch": 0.49, + "learning_rate": 1.0119607005553182e-07, + "loss": 0.0011, + "step": 25493 + }, + { + "epoch": 0.49, + "learning_rate": 1.0119218671119567e-07, + "loss": 0.0053, + "step": 25494 + }, + { + "epoch": 0.49, + "learning_rate": 1.0118830336685953e-07, + "loss": 0.0004, + "step": 25495 + }, + { + "epoch": 0.49, + "learning_rate": 1.0118442002252339e-07, + "loss": 0.0005, + "step": 25496 + }, + { + "epoch": 0.49, + "learning_rate": 1.0118053667818725e-07, + "loss": 0.0007, + "step": 25497 + }, + { + "epoch": 0.49, + "learning_rate": 1.011766533338511e-07, + "loss": 0.0006, + "step": 25498 + }, + { + "epoch": 0.49, + "learning_rate": 1.0117276998951496e-07, + "loss": 0.0004, + "step": 25499 + }, + { + "epoch": 0.49, + "learning_rate": 1.0116888664517882e-07, + "loss": 0.0266, + "step": 25500 + }, + { + "epoch": 0.49, + "learning_rate": 1.0116500330084268e-07, + "loss": 0.0005, + "step": 25501 + }, + { + "epoch": 0.49, + "learning_rate": 1.0116111995650654e-07, + "loss": 0.0005, + "step": 25502 + }, + { + "epoch": 0.49, + "learning_rate": 1.011572366121704e-07, + "loss": 0.0004, + "step": 25503 + }, + { + "epoch": 0.49, + "learning_rate": 1.0115335326783426e-07, + "loss": 0.0022, + "step": 25504 + }, + { + "epoch": 0.49, + "learning_rate": 1.0114946992349811e-07, + "loss": 0.6447, + "step": 25505 + }, + { + "epoch": 0.49, + "learning_rate": 1.0114558657916197e-07, + "loss": 0.986, + "step": 25506 + }, + { + "epoch": 0.49, + "learning_rate": 1.0114170323482583e-07, + "loss": 0.0006, + "step": 25507 + }, + { + "epoch": 0.49, + "learning_rate": 1.0113781989048969e-07, + "loss": 0.0006, + "step": 25508 + }, + { + "epoch": 0.49, + "learning_rate": 1.0113393654615355e-07, + "loss": 0.0006, + "step": 25509 + }, + { + "epoch": 0.49, + "learning_rate": 1.011300532018174e-07, + "loss": 0.0018, + "step": 25510 + }, + { + "epoch": 0.49, + "learning_rate": 1.0112616985748126e-07, + "loss": 0.0005, + "step": 25511 + }, + { + "epoch": 0.49, + "learning_rate": 1.0112228651314512e-07, + "loss": 0.0006, + "step": 25512 + }, + { + "epoch": 0.49, + "learning_rate": 1.0111840316880898e-07, + "loss": 0.0009, + "step": 25513 + }, + { + "epoch": 0.49, + "learning_rate": 1.0111451982447284e-07, + "loss": 0.0007, + "step": 25514 + }, + { + "epoch": 0.49, + "learning_rate": 1.011106364801367e-07, + "loss": 0.0007, + "step": 25515 + }, + { + "epoch": 0.49, + "learning_rate": 1.0110675313580055e-07, + "loss": 0.0006, + "step": 25516 + }, + { + "epoch": 0.49, + "learning_rate": 1.0110286979146441e-07, + "loss": 0.0005, + "step": 25517 + }, + { + "epoch": 0.49, + "learning_rate": 1.0109898644712827e-07, + "loss": 0.0007, + "step": 25518 + }, + { + "epoch": 0.5, + "learning_rate": 1.0109510310279213e-07, + "loss": 0.0031, + "step": 25519 + }, + { + "epoch": 0.5, + "learning_rate": 1.0109121975845599e-07, + "loss": 0.0005, + "step": 25520 + }, + { + "epoch": 0.5, + "learning_rate": 1.0108733641411983e-07, + "loss": 0.0007, + "step": 25521 + }, + { + "epoch": 0.5, + "learning_rate": 1.0108345306978369e-07, + "loss": 0.0005, + "step": 25522 + }, + { + "epoch": 0.5, + "learning_rate": 1.0107956972544755e-07, + "loss": 0.0005, + "step": 25523 + }, + { + "epoch": 0.5, + "learning_rate": 1.0107568638111141e-07, + "loss": 0.0017, + "step": 25524 + }, + { + "epoch": 0.5, + "learning_rate": 1.0107180303677527e-07, + "loss": 0.0014, + "step": 25525 + }, + { + "epoch": 0.5, + "learning_rate": 1.0106791969243912e-07, + "loss": 0.0005, + "step": 25526 + }, + { + "epoch": 0.5, + "learning_rate": 1.0106403634810298e-07, + "loss": 0.0009, + "step": 25527 + }, + { + "epoch": 0.5, + "learning_rate": 1.0106015300376684e-07, + "loss": 0.0006, + "step": 25528 + }, + { + "epoch": 0.5, + "learning_rate": 1.010562696594307e-07, + "loss": 0.0005, + "step": 25529 + }, + { + "epoch": 0.5, + "learning_rate": 1.0105238631509456e-07, + "loss": 0.0009, + "step": 25530 + }, + { + "epoch": 0.5, + "learning_rate": 1.0104850297075842e-07, + "loss": 0.0005, + "step": 25531 + }, + { + "epoch": 0.5, + "learning_rate": 1.0104461962642227e-07, + "loss": 0.0007, + "step": 25532 + }, + { + "epoch": 0.5, + "learning_rate": 1.0104073628208613e-07, + "loss": 0.0006, + "step": 25533 + }, + { + "epoch": 0.5, + "learning_rate": 1.0103685293774999e-07, + "loss": 0.0006, + "step": 25534 + }, + { + "epoch": 0.5, + "learning_rate": 1.0103296959341385e-07, + "loss": 0.0005, + "step": 25535 + }, + { + "epoch": 0.5, + "learning_rate": 1.010290862490777e-07, + "loss": 0.0005, + "step": 25536 + }, + { + "epoch": 0.5, + "learning_rate": 1.0102520290474156e-07, + "loss": 0.0011, + "step": 25537 + }, + { + "epoch": 0.5, + "learning_rate": 1.0102131956040542e-07, + "loss": 0.0007, + "step": 25538 + }, + { + "epoch": 0.5, + "learning_rate": 1.0101743621606928e-07, + "loss": 0.0006, + "step": 25539 + }, + { + "epoch": 0.5, + "learning_rate": 1.0101355287173314e-07, + "loss": 1.184, + "step": 25540 + }, + { + "epoch": 0.5, + "learning_rate": 1.0100966952739698e-07, + "loss": 0.0006, + "step": 25541 + }, + { + "epoch": 0.5, + "learning_rate": 1.0100578618306084e-07, + "loss": 0.0132, + "step": 25542 + }, + { + "epoch": 0.5, + "learning_rate": 1.010019028387247e-07, + "loss": 0.2585, + "step": 25543 + }, + { + "epoch": 0.5, + "learning_rate": 1.0099801949438856e-07, + "loss": 0.0005, + "step": 25544 + }, + { + "epoch": 0.5, + "learning_rate": 1.0099413615005242e-07, + "loss": 0.0008, + "step": 25545 + }, + { + "epoch": 0.5, + "learning_rate": 1.0099025280571628e-07, + "loss": 0.0005, + "step": 25546 + }, + { + "epoch": 0.5, + "learning_rate": 1.0098636946138013e-07, + "loss": 0.0005, + "step": 25547 + }, + { + "epoch": 0.5, + "learning_rate": 1.0098248611704399e-07, + "loss": 0.0004, + "step": 25548 + }, + { + "epoch": 0.5, + "learning_rate": 1.0097860277270785e-07, + "loss": 0.1548, + "step": 25549 + }, + { + "epoch": 0.5, + "learning_rate": 1.009747194283717e-07, + "loss": 0.0005, + "step": 25550 + }, + { + "epoch": 0.5, + "learning_rate": 1.0097083608403555e-07, + "loss": 0.0006, + "step": 25551 + }, + { + "epoch": 0.5, + "learning_rate": 1.0096695273969941e-07, + "loss": 0.0007, + "step": 25552 + }, + { + "epoch": 0.5, + "learning_rate": 1.0096306939536327e-07, + "loss": 0.0007, + "step": 25553 + }, + { + "epoch": 0.5, + "learning_rate": 1.0095918605102713e-07, + "loss": 0.0005, + "step": 25554 + }, + { + "epoch": 0.5, + "learning_rate": 1.0095530270669099e-07, + "loss": 0.0008, + "step": 25555 + }, + { + "epoch": 0.5, + "learning_rate": 1.0095141936235484e-07, + "loss": 0.0006, + "step": 25556 + }, + { + "epoch": 0.5, + "learning_rate": 1.009475360180187e-07, + "loss": 0.0008, + "step": 25557 + }, + { + "epoch": 0.5, + "learning_rate": 1.0094365267368256e-07, + "loss": 0.0006, + "step": 25558 + }, + { + "epoch": 0.5, + "learning_rate": 1.0093976932934642e-07, + "loss": 0.0029, + "step": 25559 + }, + { + "epoch": 0.5, + "learning_rate": 1.0093588598501028e-07, + "loss": 0.0007, + "step": 25560 + }, + { + "epoch": 0.5, + "learning_rate": 1.0093200264067414e-07, + "loss": 0.0005, + "step": 25561 + }, + { + "epoch": 0.5, + "learning_rate": 1.00928119296338e-07, + "loss": 0.0007, + "step": 25562 + }, + { + "epoch": 0.5, + "learning_rate": 1.0092423595200185e-07, + "loss": 0.0008, + "step": 25563 + }, + { + "epoch": 0.5, + "learning_rate": 1.0092035260766571e-07, + "loss": 0.0009, + "step": 25564 + }, + { + "epoch": 0.5, + "learning_rate": 1.0091646926332957e-07, + "loss": 0.0008, + "step": 25565 + }, + { + "epoch": 0.5, + "learning_rate": 1.0091258591899343e-07, + "loss": 0.0005, + "step": 25566 + }, + { + "epoch": 0.5, + "learning_rate": 1.0090870257465729e-07, + "loss": 0.0006, + "step": 25567 + }, + { + "epoch": 0.5, + "learning_rate": 1.0090481923032114e-07, + "loss": 1.2292, + "step": 25568 + }, + { + "epoch": 0.5, + "learning_rate": 1.00900935885985e-07, + "loss": 0.0007, + "step": 25569 + }, + { + "epoch": 0.5, + "learning_rate": 1.0089705254164886e-07, + "loss": 0.0005, + "step": 25570 + }, + { + "epoch": 0.5, + "learning_rate": 1.0089316919731272e-07, + "loss": 0.674, + "step": 25571 + }, + { + "epoch": 0.5, + "learning_rate": 1.0088928585297658e-07, + "loss": 0.0005, + "step": 25572 + }, + { + "epoch": 0.5, + "learning_rate": 1.0088540250864043e-07, + "loss": 0.0007, + "step": 25573 + }, + { + "epoch": 0.5, + "learning_rate": 1.0088151916430429e-07, + "loss": 0.0006, + "step": 25574 + }, + { + "epoch": 0.5, + "learning_rate": 1.0087763581996815e-07, + "loss": 0.0006, + "step": 25575 + }, + { + "epoch": 0.5, + "learning_rate": 1.0087375247563201e-07, + "loss": 0.0012, + "step": 25576 + }, + { + "epoch": 0.5, + "learning_rate": 1.0086986913129587e-07, + "loss": 0.0011, + "step": 25577 + }, + { + "epoch": 0.5, + "learning_rate": 1.0086598578695973e-07, + "loss": 0.0007, + "step": 25578 + }, + { + "epoch": 0.5, + "learning_rate": 1.0086210244262358e-07, + "loss": 0.0009, + "step": 25579 + }, + { + "epoch": 0.5, + "learning_rate": 1.0085821909828744e-07, + "loss": 0.0025, + "step": 25580 + }, + { + "epoch": 0.5, + "learning_rate": 1.008543357539513e-07, + "loss": 0.001, + "step": 25581 + }, + { + "epoch": 0.5, + "learning_rate": 1.0085045240961516e-07, + "loss": 0.0006, + "step": 25582 + }, + { + "epoch": 0.5, + "learning_rate": 1.0084656906527902e-07, + "loss": 0.0009, + "step": 25583 + }, + { + "epoch": 0.5, + "learning_rate": 1.0084268572094288e-07, + "loss": 0.0007, + "step": 25584 + }, + { + "epoch": 0.5, + "learning_rate": 1.0083880237660673e-07, + "loss": 0.0004, + "step": 25585 + }, + { + "epoch": 0.5, + "learning_rate": 1.0083491903227059e-07, + "loss": 0.0004, + "step": 25586 + }, + { + "epoch": 0.5, + "learning_rate": 1.0083103568793445e-07, + "loss": 0.0022, + "step": 25587 + }, + { + "epoch": 0.5, + "learning_rate": 1.0082715234359831e-07, + "loss": 0.0004, + "step": 25588 + }, + { + "epoch": 0.5, + "learning_rate": 1.0082326899926217e-07, + "loss": 0.0031, + "step": 25589 + }, + { + "epoch": 0.5, + "learning_rate": 1.0081938565492603e-07, + "loss": 0.0007, + "step": 25590 + }, + { + "epoch": 0.5, + "learning_rate": 1.0081550231058988e-07, + "loss": 0.0005, + "step": 25591 + }, + { + "epoch": 0.5, + "learning_rate": 1.0081161896625374e-07, + "loss": 0.0005, + "step": 25592 + }, + { + "epoch": 0.5, + "learning_rate": 1.008077356219176e-07, + "loss": 0.5076, + "step": 25593 + }, + { + "epoch": 0.5, + "learning_rate": 1.0080385227758146e-07, + "loss": 0.0494, + "step": 25594 + }, + { + "epoch": 0.5, + "learning_rate": 1.0079996893324532e-07, + "loss": 0.0007, + "step": 25595 + }, + { + "epoch": 0.5, + "learning_rate": 1.0079608558890917e-07, + "loss": 0.0008, + "step": 25596 + }, + { + "epoch": 0.5, + "learning_rate": 1.0079220224457303e-07, + "loss": 0.0075, + "step": 25597 + }, + { + "epoch": 0.5, + "learning_rate": 1.0078831890023689e-07, + "loss": 0.0006, + "step": 25598 + }, + { + "epoch": 0.5, + "learning_rate": 1.0078443555590072e-07, + "loss": 0.0004, + "step": 25599 + }, + { + "epoch": 0.5, + "learning_rate": 1.0078055221156458e-07, + "loss": 0.0006, + "step": 25600 + }, + { + "epoch": 0.5, + "learning_rate": 1.0077666886722844e-07, + "loss": 0.0007, + "step": 25601 + }, + { + "epoch": 0.5, + "learning_rate": 1.007727855228923e-07, + "loss": 0.0006, + "step": 25602 + }, + { + "epoch": 0.5, + "learning_rate": 1.0076890217855616e-07, + "loss": 0.0005, + "step": 25603 + }, + { + "epoch": 0.5, + "learning_rate": 1.0076501883422001e-07, + "loss": 0.0015, + "step": 25604 + }, + { + "epoch": 0.5, + "learning_rate": 1.0076113548988387e-07, + "loss": 0.1118, + "step": 25605 + }, + { + "epoch": 0.5, + "learning_rate": 1.0075725214554773e-07, + "loss": 0.0007, + "step": 25606 + }, + { + "epoch": 0.5, + "learning_rate": 1.0075336880121159e-07, + "loss": 0.0006, + "step": 25607 + }, + { + "epoch": 0.5, + "learning_rate": 1.0074948545687545e-07, + "loss": 0.0023, + "step": 25608 + }, + { + "epoch": 0.5, + "learning_rate": 1.007456021125393e-07, + "loss": 0.0698, + "step": 25609 + }, + { + "epoch": 0.5, + "learning_rate": 1.0074171876820316e-07, + "loss": 0.0006, + "step": 25610 + }, + { + "epoch": 0.5, + "learning_rate": 1.0073783542386702e-07, + "loss": 0.0006, + "step": 25611 + }, + { + "epoch": 0.5, + "learning_rate": 1.0073395207953088e-07, + "loss": 0.0068, + "step": 25612 + }, + { + "epoch": 0.5, + "learning_rate": 1.0073006873519474e-07, + "loss": 0.0011, + "step": 25613 + }, + { + "epoch": 0.5, + "learning_rate": 1.007261853908586e-07, + "loss": 0.0006, + "step": 25614 + }, + { + "epoch": 0.5, + "learning_rate": 1.0072230204652245e-07, + "loss": 0.0006, + "step": 25615 + }, + { + "epoch": 0.5, + "learning_rate": 1.0071841870218631e-07, + "loss": 0.0006, + "step": 25616 + }, + { + "epoch": 0.5, + "learning_rate": 1.0071453535785017e-07, + "loss": 0.0005, + "step": 25617 + }, + { + "epoch": 0.5, + "learning_rate": 1.0071065201351403e-07, + "loss": 0.0007, + "step": 25618 + }, + { + "epoch": 0.5, + "learning_rate": 1.0070676866917789e-07, + "loss": 0.0007, + "step": 25619 + }, + { + "epoch": 0.5, + "learning_rate": 1.0070288532484175e-07, + "loss": 0.001, + "step": 25620 + }, + { + "epoch": 0.5, + "learning_rate": 1.006990019805056e-07, + "loss": 0.0014, + "step": 25621 + }, + { + "epoch": 0.5, + "learning_rate": 1.0069511863616946e-07, + "loss": 0.2468, + "step": 25622 + }, + { + "epoch": 0.5, + "learning_rate": 1.0069123529183332e-07, + "loss": 0.0004, + "step": 25623 + }, + { + "epoch": 0.5, + "learning_rate": 1.0068735194749718e-07, + "loss": 0.0005, + "step": 25624 + }, + { + "epoch": 0.5, + "learning_rate": 1.0068346860316104e-07, + "loss": 0.0004, + "step": 25625 + }, + { + "epoch": 0.5, + "learning_rate": 1.006795852588249e-07, + "loss": 1.0114, + "step": 25626 + }, + { + "epoch": 0.5, + "learning_rate": 1.0067570191448875e-07, + "loss": 0.0005, + "step": 25627 + }, + { + "epoch": 0.5, + "learning_rate": 1.0067181857015261e-07, + "loss": 0.0007, + "step": 25628 + }, + { + "epoch": 0.5, + "learning_rate": 1.0066793522581647e-07, + "loss": 0.0005, + "step": 25629 + }, + { + "epoch": 0.5, + "learning_rate": 1.0066405188148033e-07, + "loss": 0.0005, + "step": 25630 + }, + { + "epoch": 0.5, + "learning_rate": 1.0066016853714419e-07, + "loss": 0.0006, + "step": 25631 + }, + { + "epoch": 0.5, + "learning_rate": 1.0065628519280804e-07, + "loss": 0.0007, + "step": 25632 + }, + { + "epoch": 0.5, + "learning_rate": 1.006524018484719e-07, + "loss": 0.0006, + "step": 25633 + }, + { + "epoch": 0.5, + "learning_rate": 1.0064851850413576e-07, + "loss": 0.0016, + "step": 25634 + }, + { + "epoch": 0.5, + "learning_rate": 1.0064463515979962e-07, + "loss": 0.0005, + "step": 25635 + }, + { + "epoch": 0.5, + "learning_rate": 1.0064075181546348e-07, + "loss": 0.0005, + "step": 25636 + }, + { + "epoch": 0.5, + "learning_rate": 1.0063686847112734e-07, + "loss": 0.0018, + "step": 25637 + }, + { + "epoch": 0.5, + "learning_rate": 1.006329851267912e-07, + "loss": 0.0006, + "step": 25638 + }, + { + "epoch": 0.5, + "learning_rate": 1.0062910178245505e-07, + "loss": 0.137, + "step": 25639 + }, + { + "epoch": 0.5, + "learning_rate": 1.0062521843811891e-07, + "loss": 0.0012, + "step": 25640 + }, + { + "epoch": 0.5, + "learning_rate": 1.0062133509378277e-07, + "loss": 0.0005, + "step": 25641 + }, + { + "epoch": 0.5, + "learning_rate": 1.0061745174944663e-07, + "loss": 0.0047, + "step": 25642 + }, + { + "epoch": 0.5, + "learning_rate": 1.0061356840511049e-07, + "loss": 0.0004, + "step": 25643 + }, + { + "epoch": 0.5, + "learning_rate": 1.0060968506077434e-07, + "loss": 0.0491, + "step": 25644 + }, + { + "epoch": 0.5, + "learning_rate": 1.006058017164382e-07, + "loss": 0.0005, + "step": 25645 + }, + { + "epoch": 0.5, + "learning_rate": 1.0060191837210206e-07, + "loss": 0.0009, + "step": 25646 + }, + { + "epoch": 0.5, + "learning_rate": 1.0059803502776592e-07, + "loss": 0.0004, + "step": 25647 + }, + { + "epoch": 0.5, + "learning_rate": 1.0059415168342978e-07, + "loss": 0.0006, + "step": 25648 + }, + { + "epoch": 0.5, + "learning_rate": 1.0059026833909363e-07, + "loss": 0.0011, + "step": 25649 + }, + { + "epoch": 0.5, + "learning_rate": 1.0058638499475749e-07, + "loss": 0.0004, + "step": 25650 + }, + { + "epoch": 0.5, + "learning_rate": 1.0058250165042135e-07, + "loss": 0.0005, + "step": 25651 + }, + { + "epoch": 0.5, + "learning_rate": 1.0057861830608521e-07, + "loss": 0.0011, + "step": 25652 + }, + { + "epoch": 0.5, + "learning_rate": 1.0057473496174907e-07, + "loss": 0.0012, + "step": 25653 + }, + { + "epoch": 0.5, + "learning_rate": 1.0057085161741293e-07, + "loss": 0.0006, + "step": 25654 + }, + { + "epoch": 0.5, + "learning_rate": 1.0056696827307678e-07, + "loss": 0.0005, + "step": 25655 + }, + { + "epoch": 0.5, + "learning_rate": 1.0056308492874064e-07, + "loss": 0.0005, + "step": 25656 + }, + { + "epoch": 0.5, + "learning_rate": 1.0055920158440447e-07, + "loss": 0.0004, + "step": 25657 + }, + { + "epoch": 0.5, + "learning_rate": 1.0055531824006833e-07, + "loss": 0.0006, + "step": 25658 + }, + { + "epoch": 0.5, + "learning_rate": 1.0055143489573219e-07, + "loss": 0.0005, + "step": 25659 + }, + { + "epoch": 0.5, + "learning_rate": 1.0054755155139605e-07, + "loss": 0.0007, + "step": 25660 + }, + { + "epoch": 0.5, + "learning_rate": 1.0054366820705991e-07, + "loss": 1.2438, + "step": 25661 + }, + { + "epoch": 0.5, + "learning_rate": 1.0053978486272377e-07, + "loss": 0.0005, + "step": 25662 + }, + { + "epoch": 0.5, + "learning_rate": 1.0053590151838762e-07, + "loss": 0.0007, + "step": 25663 + }, + { + "epoch": 0.5, + "learning_rate": 1.0053201817405148e-07, + "loss": 0.0006, + "step": 25664 + }, + { + "epoch": 0.5, + "learning_rate": 1.0052813482971534e-07, + "loss": 0.0009, + "step": 25665 + }, + { + "epoch": 0.5, + "learning_rate": 1.005242514853792e-07, + "loss": 0.0008, + "step": 25666 + }, + { + "epoch": 0.5, + "learning_rate": 1.0052036814104306e-07, + "loss": 0.0007, + "step": 25667 + }, + { + "epoch": 0.5, + "learning_rate": 1.0051648479670692e-07, + "loss": 0.0006, + "step": 25668 + }, + { + "epoch": 0.5, + "learning_rate": 1.0051260145237077e-07, + "loss": 0.0318, + "step": 25669 + }, + { + "epoch": 0.5, + "learning_rate": 1.0050871810803463e-07, + "loss": 0.9301, + "step": 25670 + }, + { + "epoch": 0.5, + "learning_rate": 1.0050483476369849e-07, + "loss": 0.001, + "step": 25671 + }, + { + "epoch": 0.5, + "learning_rate": 1.0050095141936235e-07, + "loss": 0.0005, + "step": 25672 + }, + { + "epoch": 0.5, + "learning_rate": 1.004970680750262e-07, + "loss": 0.0005, + "step": 25673 + }, + { + "epoch": 0.5, + "learning_rate": 1.0049318473069006e-07, + "loss": 0.0005, + "step": 25674 + }, + { + "epoch": 0.5, + "learning_rate": 1.0048930138635392e-07, + "loss": 0.0007, + "step": 25675 + }, + { + "epoch": 0.5, + "learning_rate": 1.0048541804201778e-07, + "loss": 0.001, + "step": 25676 + }, + { + "epoch": 0.5, + "learning_rate": 1.0048153469768164e-07, + "loss": 0.0005, + "step": 25677 + }, + { + "epoch": 0.5, + "learning_rate": 1.004776513533455e-07, + "loss": 0.0004, + "step": 25678 + }, + { + "epoch": 0.5, + "learning_rate": 1.0047376800900936e-07, + "loss": 0.0005, + "step": 25679 + }, + { + "epoch": 0.5, + "learning_rate": 1.0046988466467321e-07, + "loss": 0.0008, + "step": 25680 + }, + { + "epoch": 0.5, + "learning_rate": 1.0046600132033707e-07, + "loss": 0.0009, + "step": 25681 + }, + { + "epoch": 0.5, + "learning_rate": 1.0046211797600093e-07, + "loss": 0.0006, + "step": 25682 + }, + { + "epoch": 0.5, + "learning_rate": 1.0045823463166479e-07, + "loss": 0.2601, + "step": 25683 + }, + { + "epoch": 0.5, + "learning_rate": 1.0045435128732865e-07, + "loss": 0.0005, + "step": 25684 + }, + { + "epoch": 0.5, + "learning_rate": 1.004504679429925e-07, + "loss": 0.0007, + "step": 25685 + }, + { + "epoch": 0.5, + "learning_rate": 1.0044658459865636e-07, + "loss": 0.001, + "step": 25686 + }, + { + "epoch": 0.5, + "learning_rate": 1.0044270125432022e-07, + "loss": 0.6958, + "step": 25687 + }, + { + "epoch": 0.5, + "learning_rate": 1.0043881790998408e-07, + "loss": 0.0005, + "step": 25688 + }, + { + "epoch": 0.5, + "learning_rate": 1.0043493456564794e-07, + "loss": 0.0019, + "step": 25689 + }, + { + "epoch": 0.5, + "learning_rate": 1.004310512213118e-07, + "loss": 0.0006, + "step": 25690 + }, + { + "epoch": 0.5, + "learning_rate": 1.0042716787697565e-07, + "loss": 0.243, + "step": 25691 + }, + { + "epoch": 0.5, + "learning_rate": 1.0042328453263951e-07, + "loss": 0.0007, + "step": 25692 + }, + { + "epoch": 0.5, + "learning_rate": 1.0041940118830337e-07, + "loss": 0.0029, + "step": 25693 + }, + { + "epoch": 0.5, + "learning_rate": 1.0041551784396723e-07, + "loss": 0.0005, + "step": 25694 + }, + { + "epoch": 0.5, + "learning_rate": 1.0041163449963109e-07, + "loss": 0.0006, + "step": 25695 + }, + { + "epoch": 0.5, + "learning_rate": 1.0040775115529495e-07, + "loss": 0.0103, + "step": 25696 + }, + { + "epoch": 0.5, + "learning_rate": 1.004038678109588e-07, + "loss": 1.098, + "step": 25697 + }, + { + "epoch": 0.5, + "learning_rate": 1.0039998446662265e-07, + "loss": 0.0007, + "step": 25698 + }, + { + "epoch": 0.5, + "learning_rate": 1.0039610112228651e-07, + "loss": 0.0658, + "step": 25699 + }, + { + "epoch": 0.5, + "learning_rate": 1.0039221777795037e-07, + "loss": 0.0007, + "step": 25700 + }, + { + "epoch": 0.5, + "learning_rate": 1.0038833443361422e-07, + "loss": 0.0006, + "step": 25701 + }, + { + "epoch": 0.5, + "learning_rate": 1.0038445108927808e-07, + "loss": 0.0038, + "step": 25702 + }, + { + "epoch": 0.5, + "learning_rate": 1.0038056774494194e-07, + "loss": 0.013, + "step": 25703 + }, + { + "epoch": 0.5, + "learning_rate": 1.003766844006058e-07, + "loss": 0.0006, + "step": 25704 + }, + { + "epoch": 0.5, + "learning_rate": 1.0037280105626966e-07, + "loss": 0.0006, + "step": 25705 + }, + { + "epoch": 0.5, + "learning_rate": 1.0036891771193352e-07, + "loss": 0.0925, + "step": 25706 + }, + { + "epoch": 0.5, + "learning_rate": 1.0036503436759737e-07, + "loss": 0.0108, + "step": 25707 + }, + { + "epoch": 0.5, + "learning_rate": 1.0036115102326123e-07, + "loss": 1.0865, + "step": 25708 + }, + { + "epoch": 0.5, + "learning_rate": 1.0035726767892509e-07, + "loss": 0.0005, + "step": 25709 + }, + { + "epoch": 0.5, + "learning_rate": 1.0035338433458895e-07, + "loss": 0.0005, + "step": 25710 + }, + { + "epoch": 0.5, + "learning_rate": 1.003495009902528e-07, + "loss": 0.001, + "step": 25711 + }, + { + "epoch": 0.5, + "learning_rate": 1.0034561764591666e-07, + "loss": 0.7053, + "step": 25712 + }, + { + "epoch": 0.5, + "learning_rate": 1.0034173430158052e-07, + "loss": 0.0015, + "step": 25713 + }, + { + "epoch": 0.5, + "learning_rate": 1.0033785095724438e-07, + "loss": 0.0063, + "step": 25714 + }, + { + "epoch": 0.5, + "learning_rate": 1.0033396761290823e-07, + "loss": 0.0006, + "step": 25715 + }, + { + "epoch": 0.5, + "learning_rate": 1.0033008426857208e-07, + "loss": 0.0006, + "step": 25716 + }, + { + "epoch": 0.5, + "learning_rate": 1.0032620092423594e-07, + "loss": 0.0007, + "step": 25717 + }, + { + "epoch": 0.5, + "learning_rate": 1.003223175798998e-07, + "loss": 0.0005, + "step": 25718 + }, + { + "epoch": 0.5, + "learning_rate": 1.0031843423556366e-07, + "loss": 0.0007, + "step": 25719 + }, + { + "epoch": 0.5, + "learning_rate": 1.0031455089122752e-07, + "loss": 0.0006, + "step": 25720 + }, + { + "epoch": 0.5, + "learning_rate": 1.0031066754689138e-07, + "loss": 0.0007, + "step": 25721 + }, + { + "epoch": 0.5, + "learning_rate": 1.0030678420255523e-07, + "loss": 0.0009, + "step": 25722 + }, + { + "epoch": 0.5, + "learning_rate": 1.0030290085821909e-07, + "loss": 0.0007, + "step": 25723 + }, + { + "epoch": 0.5, + "learning_rate": 1.0029901751388295e-07, + "loss": 0.9142, + "step": 25724 + }, + { + "epoch": 0.5, + "learning_rate": 1.0029513416954681e-07, + "loss": 0.0007, + "step": 25725 + }, + { + "epoch": 0.5, + "learning_rate": 1.0029125082521067e-07, + "loss": 0.0007, + "step": 25726 + }, + { + "epoch": 0.5, + "learning_rate": 1.0028736748087451e-07, + "loss": 0.0391, + "step": 25727 + }, + { + "epoch": 0.5, + "learning_rate": 1.0028348413653837e-07, + "loss": 0.0005, + "step": 25728 + }, + { + "epoch": 0.5, + "learning_rate": 1.0027960079220223e-07, + "loss": 0.0007, + "step": 25729 + }, + { + "epoch": 0.5, + "learning_rate": 1.0027571744786609e-07, + "loss": 0.0005, + "step": 25730 + }, + { + "epoch": 0.5, + "learning_rate": 1.0027183410352994e-07, + "loss": 0.0007, + "step": 25731 + }, + { + "epoch": 0.5, + "learning_rate": 1.002679507591938e-07, + "loss": 0.0006, + "step": 25732 + }, + { + "epoch": 0.5, + "learning_rate": 1.0026406741485766e-07, + "loss": 0.0005, + "step": 25733 + }, + { + "epoch": 0.5, + "learning_rate": 1.0026018407052152e-07, + "loss": 0.0007, + "step": 25734 + }, + { + "epoch": 0.5, + "learning_rate": 1.0025630072618538e-07, + "loss": 0.001, + "step": 25735 + }, + { + "epoch": 0.5, + "learning_rate": 1.0025241738184924e-07, + "loss": 0.0004, + "step": 25736 + }, + { + "epoch": 0.5, + "learning_rate": 1.002485340375131e-07, + "loss": 0.0007, + "step": 25737 + }, + { + "epoch": 0.5, + "learning_rate": 1.0024465069317695e-07, + "loss": 0.0006, + "step": 25738 + }, + { + "epoch": 0.5, + "learning_rate": 1.0024076734884081e-07, + "loss": 0.0042, + "step": 25739 + }, + { + "epoch": 0.5, + "learning_rate": 1.0023688400450467e-07, + "loss": 0.0006, + "step": 25740 + }, + { + "epoch": 0.5, + "learning_rate": 1.0023300066016853e-07, + "loss": 0.0006, + "step": 25741 + }, + { + "epoch": 0.5, + "learning_rate": 1.0022911731583239e-07, + "loss": 0.0006, + "step": 25742 + }, + { + "epoch": 0.5, + "learning_rate": 1.0022523397149624e-07, + "loss": 0.0007, + "step": 25743 + }, + { + "epoch": 0.5, + "learning_rate": 1.002213506271601e-07, + "loss": 0.0007, + "step": 25744 + }, + { + "epoch": 0.5, + "learning_rate": 1.0021746728282396e-07, + "loss": 0.5041, + "step": 25745 + }, + { + "epoch": 0.5, + "learning_rate": 1.0021358393848782e-07, + "loss": 0.001, + "step": 25746 + }, + { + "epoch": 0.5, + "learning_rate": 1.0020970059415168e-07, + "loss": 0.0005, + "step": 25747 + }, + { + "epoch": 0.5, + "learning_rate": 1.0020581724981553e-07, + "loss": 0.8458, + "step": 25748 + }, + { + "epoch": 0.5, + "learning_rate": 1.0020193390547939e-07, + "loss": 0.0006, + "step": 25749 + }, + { + "epoch": 0.5, + "learning_rate": 1.0019805056114325e-07, + "loss": 0.0027, + "step": 25750 + }, + { + "epoch": 0.5, + "learning_rate": 1.0019416721680711e-07, + "loss": 0.0005, + "step": 25751 + }, + { + "epoch": 0.5, + "learning_rate": 1.0019028387247097e-07, + "loss": 0.0005, + "step": 25752 + }, + { + "epoch": 0.5, + "learning_rate": 1.0018640052813483e-07, + "loss": 0.0005, + "step": 25753 + }, + { + "epoch": 0.5, + "learning_rate": 1.0018251718379868e-07, + "loss": 0.0005, + "step": 25754 + }, + { + "epoch": 0.5, + "learning_rate": 1.0017863383946254e-07, + "loss": 0.0006, + "step": 25755 + }, + { + "epoch": 0.5, + "learning_rate": 1.001747504951264e-07, + "loss": 0.0006, + "step": 25756 + }, + { + "epoch": 0.5, + "learning_rate": 1.0017086715079026e-07, + "loss": 0.0008, + "step": 25757 + }, + { + "epoch": 0.5, + "learning_rate": 1.0016698380645412e-07, + "loss": 0.007, + "step": 25758 + }, + { + "epoch": 0.5, + "learning_rate": 1.0016310046211798e-07, + "loss": 0.0005, + "step": 25759 + }, + { + "epoch": 0.5, + "learning_rate": 1.0015921711778183e-07, + "loss": 0.0137, + "step": 25760 + }, + { + "epoch": 0.5, + "learning_rate": 1.0015533377344569e-07, + "loss": 0.0006, + "step": 25761 + }, + { + "epoch": 0.5, + "learning_rate": 1.0015145042910955e-07, + "loss": 0.0004, + "step": 25762 + }, + { + "epoch": 0.5, + "learning_rate": 1.0014756708477341e-07, + "loss": 0.0005, + "step": 25763 + }, + { + "epoch": 0.5, + "learning_rate": 1.0014368374043727e-07, + "loss": 0.0007, + "step": 25764 + }, + { + "epoch": 0.5, + "learning_rate": 1.0013980039610113e-07, + "loss": 0.0007, + "step": 25765 + }, + { + "epoch": 0.5, + "learning_rate": 1.0013591705176498e-07, + "loss": 0.0005, + "step": 25766 + }, + { + "epoch": 0.5, + "learning_rate": 1.0013203370742884e-07, + "loss": 0.0005, + "step": 25767 + }, + { + "epoch": 0.5, + "learning_rate": 1.001281503630927e-07, + "loss": 0.0005, + "step": 25768 + }, + { + "epoch": 0.5, + "learning_rate": 1.0012426701875656e-07, + "loss": 0.7447, + "step": 25769 + }, + { + "epoch": 0.5, + "learning_rate": 1.0012038367442042e-07, + "loss": 0.0063, + "step": 25770 + }, + { + "epoch": 0.5, + "learning_rate": 1.0011650033008427e-07, + "loss": 0.001, + "step": 25771 + }, + { + "epoch": 0.5, + "learning_rate": 1.0011261698574813e-07, + "loss": 0.0011, + "step": 25772 + }, + { + "epoch": 0.5, + "learning_rate": 1.0010873364141196e-07, + "loss": 0.0005, + "step": 25773 + }, + { + "epoch": 0.5, + "learning_rate": 1.0010485029707582e-07, + "loss": 0.0004, + "step": 25774 + }, + { + "epoch": 0.5, + "learning_rate": 1.0010096695273968e-07, + "loss": 0.0005, + "step": 25775 + }, + { + "epoch": 0.5, + "learning_rate": 1.0009708360840354e-07, + "loss": 0.001, + "step": 25776 + }, + { + "epoch": 0.5, + "learning_rate": 1.000932002640674e-07, + "loss": 0.0005, + "step": 25777 + }, + { + "epoch": 0.5, + "learning_rate": 1.0008931691973126e-07, + "loss": 0.0006, + "step": 25778 + }, + { + "epoch": 0.5, + "learning_rate": 1.0008543357539511e-07, + "loss": 0.0005, + "step": 25779 + }, + { + "epoch": 0.5, + "learning_rate": 1.0008155023105897e-07, + "loss": 0.0004, + "step": 25780 + }, + { + "epoch": 0.5, + "learning_rate": 1.0007766688672283e-07, + "loss": 0.0005, + "step": 25781 + }, + { + "epoch": 0.5, + "learning_rate": 1.0007378354238669e-07, + "loss": 0.0004, + "step": 25782 + }, + { + "epoch": 0.5, + "learning_rate": 1.0006990019805055e-07, + "loss": 0.0688, + "step": 25783 + }, + { + "epoch": 0.5, + "learning_rate": 1.000660168537144e-07, + "loss": 0.0006, + "step": 25784 + }, + { + "epoch": 0.5, + "learning_rate": 1.0006213350937826e-07, + "loss": 0.0005, + "step": 25785 + }, + { + "epoch": 0.5, + "learning_rate": 1.0005825016504212e-07, + "loss": 0.0005, + "step": 25786 + }, + { + "epoch": 0.5, + "learning_rate": 1.0005436682070598e-07, + "loss": 0.002, + "step": 25787 + }, + { + "epoch": 0.5, + "learning_rate": 1.0005048347636984e-07, + "loss": 0.0009, + "step": 25788 + }, + { + "epoch": 0.5, + "learning_rate": 1.000466001320337e-07, + "loss": 0.0008, + "step": 25789 + }, + { + "epoch": 0.5, + "learning_rate": 1.0004271678769755e-07, + "loss": 0.0006, + "step": 25790 + }, + { + "epoch": 0.5, + "learning_rate": 1.0003883344336141e-07, + "loss": 0.0019, + "step": 25791 + }, + { + "epoch": 0.5, + "learning_rate": 1.0003495009902527e-07, + "loss": 0.0004, + "step": 25792 + }, + { + "epoch": 0.5, + "learning_rate": 1.0003106675468913e-07, + "loss": 0.0006, + "step": 25793 + }, + { + "epoch": 0.5, + "learning_rate": 1.0002718341035299e-07, + "loss": 0.0136, + "step": 25794 + }, + { + "epoch": 0.5, + "learning_rate": 1.0002330006601685e-07, + "loss": 0.0005, + "step": 25795 + }, + { + "epoch": 0.5, + "learning_rate": 1.000194167216807e-07, + "loss": 0.0007, + "step": 25796 + }, + { + "epoch": 0.5, + "learning_rate": 1.0001553337734456e-07, + "loss": 0.0007, + "step": 25797 + }, + { + "epoch": 0.5, + "learning_rate": 1.0001165003300842e-07, + "loss": 0.0007, + "step": 25798 + }, + { + "epoch": 0.5, + "learning_rate": 1.0000776668867228e-07, + "loss": 0.0006, + "step": 25799 + }, + { + "epoch": 0.5, + "learning_rate": 1.0000388334433614e-07, + "loss": 0.0188, + "step": 25800 + }, + { + "epoch": 0.5, + "learning_rate": 1e-07, + "loss": 0.0277, + "step": 25801 + }, + { + "epoch": 0.5, + "learning_rate": 9.999611665566385e-08, + "loss": 0.0006, + "step": 25802 + }, + { + "epoch": 0.5, + "learning_rate": 9.999223331132771e-08, + "loss": 0.1249, + "step": 25803 + }, + { + "epoch": 0.5, + "learning_rate": 9.998834996699157e-08, + "loss": 0.0006, + "step": 25804 + }, + { + "epoch": 0.5, + "learning_rate": 9.998446662265543e-08, + "loss": 0.0011, + "step": 25805 + }, + { + "epoch": 0.5, + "learning_rate": 9.998058327831929e-08, + "loss": 0.0006, + "step": 25806 + }, + { + "epoch": 0.5, + "learning_rate": 9.997669993398314e-08, + "loss": 0.0006, + "step": 25807 + }, + { + "epoch": 0.5, + "learning_rate": 9.9972816589647e-08, + "loss": 0.0006, + "step": 25808 + }, + { + "epoch": 0.5, + "learning_rate": 9.996893324531086e-08, + "loss": 0.0005, + "step": 25809 + }, + { + "epoch": 0.5, + "learning_rate": 9.996504990097472e-08, + "loss": 0.0007, + "step": 25810 + }, + { + "epoch": 0.5, + "learning_rate": 9.996116655663858e-08, + "loss": 0.0102, + "step": 25811 + }, + { + "epoch": 0.5, + "learning_rate": 9.995728321230244e-08, + "loss": 0.0006, + "step": 25812 + }, + { + "epoch": 0.5, + "learning_rate": 9.99533998679663e-08, + "loss": 0.0007, + "step": 25813 + }, + { + "epoch": 0.5, + "learning_rate": 9.994951652363015e-08, + "loss": 0.0005, + "step": 25814 + }, + { + "epoch": 0.5, + "learning_rate": 9.994563317929401e-08, + "loss": 0.0007, + "step": 25815 + }, + { + "epoch": 0.5, + "learning_rate": 9.994174983495786e-08, + "loss": 0.0006, + "step": 25816 + }, + { + "epoch": 0.5, + "learning_rate": 9.993786649062171e-08, + "loss": 0.0006, + "step": 25817 + }, + { + "epoch": 0.5, + "learning_rate": 9.993398314628557e-08, + "loss": 0.0005, + "step": 25818 + }, + { + "epoch": 0.5, + "learning_rate": 9.993009980194943e-08, + "loss": 0.0004, + "step": 25819 + }, + { + "epoch": 0.5, + "learning_rate": 9.992621645761329e-08, + "loss": 0.0005, + "step": 25820 + }, + { + "epoch": 0.5, + "learning_rate": 9.992233311327715e-08, + "loss": 0.0013, + "step": 25821 + }, + { + "epoch": 0.5, + "learning_rate": 9.9918449768941e-08, + "loss": 0.0006, + "step": 25822 + }, + { + "epoch": 0.5, + "learning_rate": 9.991456642460486e-08, + "loss": 0.0005, + "step": 25823 + }, + { + "epoch": 0.5, + "learning_rate": 9.991068308026872e-08, + "loss": 0.0049, + "step": 25824 + }, + { + "epoch": 0.5, + "learning_rate": 9.990679973593258e-08, + "loss": 0.0005, + "step": 25825 + }, + { + "epoch": 0.5, + "learning_rate": 9.990291639159644e-08, + "loss": 0.0026, + "step": 25826 + }, + { + "epoch": 0.5, + "learning_rate": 9.98990330472603e-08, + "loss": 0.2083, + "step": 25827 + }, + { + "epoch": 0.5, + "learning_rate": 9.989514970292415e-08, + "loss": 0.0004, + "step": 25828 + }, + { + "epoch": 0.5, + "learning_rate": 9.989126635858801e-08, + "loss": 0.0008, + "step": 25829 + }, + { + "epoch": 0.5, + "learning_rate": 9.988738301425187e-08, + "loss": 0.0005, + "step": 25830 + }, + { + "epoch": 0.5, + "learning_rate": 9.988349966991573e-08, + "loss": 0.0413, + "step": 25831 + }, + { + "epoch": 0.5, + "learning_rate": 9.987961632557959e-08, + "loss": 0.0013, + "step": 25832 + }, + { + "epoch": 0.5, + "learning_rate": 9.987573298124345e-08, + "loss": 0.0077, + "step": 25833 + }, + { + "epoch": 0.5, + "learning_rate": 9.98718496369073e-08, + "loss": 0.0005, + "step": 25834 + }, + { + "epoch": 0.5, + "learning_rate": 9.986796629257116e-08, + "loss": 0.0039, + "step": 25835 + }, + { + "epoch": 0.5, + "learning_rate": 9.986408294823502e-08, + "loss": 0.0006, + "step": 25836 + }, + { + "epoch": 0.5, + "learning_rate": 9.986019960389888e-08, + "loss": 0.0009, + "step": 25837 + }, + { + "epoch": 0.5, + "learning_rate": 9.985631625956274e-08, + "loss": 0.0004, + "step": 25838 + }, + { + "epoch": 0.5, + "learning_rate": 9.98524329152266e-08, + "loss": 0.0006, + "step": 25839 + }, + { + "epoch": 0.5, + "learning_rate": 9.984854957089045e-08, + "loss": 0.0012, + "step": 25840 + }, + { + "epoch": 0.5, + "learning_rate": 9.984466622655431e-08, + "loss": 0.0014, + "step": 25841 + }, + { + "epoch": 0.5, + "learning_rate": 9.984078288221817e-08, + "loss": 0.0009, + "step": 25842 + }, + { + "epoch": 0.5, + "learning_rate": 9.983689953788203e-08, + "loss": 0.0005, + "step": 25843 + }, + { + "epoch": 0.5, + "learning_rate": 9.983301619354589e-08, + "loss": 0.0005, + "step": 25844 + }, + { + "epoch": 0.5, + "learning_rate": 9.982913284920973e-08, + "loss": 0.0006, + "step": 25845 + }, + { + "epoch": 0.5, + "learning_rate": 9.982524950487359e-08, + "loss": 0.0006, + "step": 25846 + }, + { + "epoch": 0.5, + "learning_rate": 9.982136616053745e-08, + "loss": 0.0009, + "step": 25847 + }, + { + "epoch": 0.5, + "learning_rate": 9.98174828162013e-08, + "loss": 0.0007, + "step": 25848 + }, + { + "epoch": 0.5, + "learning_rate": 9.981359947186516e-08, + "loss": 0.3107, + "step": 25849 + }, + { + "epoch": 0.5, + "learning_rate": 9.980971612752902e-08, + "loss": 0.0005, + "step": 25850 + }, + { + "epoch": 0.5, + "learning_rate": 9.980583278319288e-08, + "loss": 0.0005, + "step": 25851 + }, + { + "epoch": 0.5, + "learning_rate": 9.980194943885674e-08, + "loss": 0.0072, + "step": 25852 + }, + { + "epoch": 0.5, + "learning_rate": 9.97980660945206e-08, + "loss": 0.1104, + "step": 25853 + }, + { + "epoch": 0.5, + "learning_rate": 9.979418275018446e-08, + "loss": 0.0012, + "step": 25854 + }, + { + "epoch": 0.5, + "learning_rate": 9.979029940584831e-08, + "loss": 0.0046, + "step": 25855 + }, + { + "epoch": 0.5, + "learning_rate": 9.978641606151217e-08, + "loss": 0.0007, + "step": 25856 + }, + { + "epoch": 0.5, + "learning_rate": 9.978253271717603e-08, + "loss": 0.8755, + "step": 25857 + }, + { + "epoch": 0.5, + "learning_rate": 9.977864937283989e-08, + "loss": 0.0005, + "step": 25858 + }, + { + "epoch": 0.5, + "learning_rate": 9.977476602850375e-08, + "loss": 0.0005, + "step": 25859 + }, + { + "epoch": 0.5, + "learning_rate": 9.97708826841676e-08, + "loss": 0.0005, + "step": 25860 + }, + { + "epoch": 0.5, + "learning_rate": 9.976699933983146e-08, + "loss": 0.0006, + "step": 25861 + }, + { + "epoch": 0.5, + "learning_rate": 9.976311599549532e-08, + "loss": 0.6896, + "step": 25862 + }, + { + "epoch": 0.5, + "learning_rate": 9.975923265115918e-08, + "loss": 0.0007, + "step": 25863 + }, + { + "epoch": 0.5, + "learning_rate": 9.975534930682304e-08, + "loss": 0.0005, + "step": 25864 + }, + { + "epoch": 0.5, + "learning_rate": 9.97514659624869e-08, + "loss": 0.0005, + "step": 25865 + }, + { + "epoch": 0.5, + "learning_rate": 9.974758261815075e-08, + "loss": 0.0004, + "step": 25866 + }, + { + "epoch": 0.5, + "learning_rate": 9.974369927381461e-08, + "loss": 0.0067, + "step": 25867 + }, + { + "epoch": 0.5, + "learning_rate": 9.973981592947847e-08, + "loss": 0.0008, + "step": 25868 + }, + { + "epoch": 0.5, + "learning_rate": 9.973593258514233e-08, + "loss": 0.0004, + "step": 25869 + }, + { + "epoch": 0.5, + "learning_rate": 9.973204924080619e-08, + "loss": 0.0005, + "step": 25870 + }, + { + "epoch": 0.5, + "learning_rate": 9.972816589647005e-08, + "loss": 0.0042, + "step": 25871 + }, + { + "epoch": 0.5, + "learning_rate": 9.97242825521339e-08, + "loss": 0.0008, + "step": 25872 + }, + { + "epoch": 0.5, + "learning_rate": 9.972039920779776e-08, + "loss": 0.0012, + "step": 25873 + }, + { + "epoch": 0.5, + "learning_rate": 9.971651586346161e-08, + "loss": 0.0004, + "step": 25874 + }, + { + "epoch": 0.5, + "learning_rate": 9.971263251912547e-08, + "loss": 0.0006, + "step": 25875 + }, + { + "epoch": 0.5, + "learning_rate": 9.970874917478932e-08, + "loss": 0.0008, + "step": 25876 + }, + { + "epoch": 0.5, + "learning_rate": 9.970486583045318e-08, + "loss": 0.0037, + "step": 25877 + }, + { + "epoch": 0.5, + "learning_rate": 9.970098248611704e-08, + "loss": 0.0005, + "step": 25878 + }, + { + "epoch": 0.5, + "learning_rate": 9.96970991417809e-08, + "loss": 0.0006, + "step": 25879 + }, + { + "epoch": 0.5, + "learning_rate": 9.969321579744476e-08, + "loss": 0.016, + "step": 25880 + }, + { + "epoch": 0.5, + "learning_rate": 9.968933245310862e-08, + "loss": 0.0005, + "step": 25881 + }, + { + "epoch": 0.5, + "learning_rate": 9.968544910877247e-08, + "loss": 0.3153, + "step": 25882 + }, + { + "epoch": 0.5, + "learning_rate": 9.968156576443633e-08, + "loss": 0.0013, + "step": 25883 + }, + { + "epoch": 0.5, + "learning_rate": 9.967768242010019e-08, + "loss": 0.0055, + "step": 25884 + }, + { + "epoch": 0.5, + "learning_rate": 9.967379907576405e-08, + "loss": 0.491, + "step": 25885 + }, + { + "epoch": 0.5, + "learning_rate": 9.96699157314279e-08, + "loss": 0.0006, + "step": 25886 + }, + { + "epoch": 0.5, + "learning_rate": 9.966603238709176e-08, + "loss": 0.0007, + "step": 25887 + }, + { + "epoch": 0.5, + "learning_rate": 9.966214904275562e-08, + "loss": 0.3456, + "step": 25888 + }, + { + "epoch": 0.5, + "learning_rate": 9.965826569841948e-08, + "loss": 0.1281, + "step": 25889 + }, + { + "epoch": 0.5, + "learning_rate": 9.965438235408333e-08, + "loss": 0.0005, + "step": 25890 + }, + { + "epoch": 0.5, + "learning_rate": 9.965049900974718e-08, + "loss": 1.0457, + "step": 25891 + }, + { + "epoch": 0.5, + "learning_rate": 9.964661566541104e-08, + "loss": 0.0043, + "step": 25892 + }, + { + "epoch": 0.5, + "learning_rate": 9.96427323210749e-08, + "loss": 0.1293, + "step": 25893 + }, + { + "epoch": 0.5, + "learning_rate": 9.963884897673876e-08, + "loss": 0.5563, + "step": 25894 + }, + { + "epoch": 0.5, + "learning_rate": 9.963496563240262e-08, + "loss": 0.0005, + "step": 25895 + }, + { + "epoch": 0.5, + "learning_rate": 9.963108228806648e-08, + "loss": 0.0005, + "step": 25896 + }, + { + "epoch": 0.5, + "learning_rate": 9.962719894373033e-08, + "loss": 0.0005, + "step": 25897 + }, + { + "epoch": 0.5, + "learning_rate": 9.962331559939419e-08, + "loss": 0.0006, + "step": 25898 + }, + { + "epoch": 0.5, + "learning_rate": 9.961943225505805e-08, + "loss": 0.0005, + "step": 25899 + }, + { + "epoch": 0.5, + "learning_rate": 9.961554891072191e-08, + "loss": 0.0008, + "step": 25900 + }, + { + "epoch": 0.5, + "learning_rate": 9.961166556638577e-08, + "loss": 0.0006, + "step": 25901 + }, + { + "epoch": 0.5, + "learning_rate": 9.960778222204963e-08, + "loss": 0.0196, + "step": 25902 + }, + { + "epoch": 0.5, + "learning_rate": 9.960389887771348e-08, + "loss": 0.0003, + "step": 25903 + }, + { + "epoch": 0.5, + "learning_rate": 9.960001553337734e-08, + "loss": 0.0005, + "step": 25904 + }, + { + "epoch": 0.5, + "learning_rate": 9.959613218904119e-08, + "loss": 0.0007, + "step": 25905 + }, + { + "epoch": 0.5, + "learning_rate": 9.959224884470504e-08, + "loss": 0.0005, + "step": 25906 + }, + { + "epoch": 0.5, + "learning_rate": 9.95883655003689e-08, + "loss": 0.0121, + "step": 25907 + }, + { + "epoch": 0.5, + "learning_rate": 9.958448215603276e-08, + "loss": 0.0007, + "step": 25908 + }, + { + "epoch": 0.5, + "learning_rate": 9.958059881169662e-08, + "loss": 0.0005, + "step": 25909 + }, + { + "epoch": 0.5, + "learning_rate": 9.957671546736048e-08, + "loss": 0.031, + "step": 25910 + }, + { + "epoch": 0.5, + "learning_rate": 9.957283212302434e-08, + "loss": 0.0005, + "step": 25911 + }, + { + "epoch": 0.5, + "learning_rate": 9.95689487786882e-08, + "loss": 0.0005, + "step": 25912 + }, + { + "epoch": 0.5, + "learning_rate": 9.956506543435205e-08, + "loss": 0.0007, + "step": 25913 + }, + { + "epoch": 0.5, + "learning_rate": 9.956118209001591e-08, + "loss": 0.4957, + "step": 25914 + }, + { + "epoch": 0.5, + "learning_rate": 9.955729874567977e-08, + "loss": 0.0007, + "step": 25915 + }, + { + "epoch": 0.5, + "learning_rate": 9.955341540134363e-08, + "loss": 0.3238, + "step": 25916 + }, + { + "epoch": 0.5, + "learning_rate": 9.954953205700749e-08, + "loss": 0.0005, + "step": 25917 + }, + { + "epoch": 0.5, + "learning_rate": 9.954564871267134e-08, + "loss": 0.0007, + "step": 25918 + }, + { + "epoch": 0.5, + "learning_rate": 9.95417653683352e-08, + "loss": 0.0007, + "step": 25919 + }, + { + "epoch": 0.5, + "learning_rate": 9.953788202399906e-08, + "loss": 1.486, + "step": 25920 + }, + { + "epoch": 0.5, + "learning_rate": 9.953399867966292e-08, + "loss": 0.1494, + "step": 25921 + }, + { + "epoch": 0.5, + "learning_rate": 9.953011533532678e-08, + "loss": 0.0006, + "step": 25922 + }, + { + "epoch": 0.5, + "learning_rate": 9.952623199099064e-08, + "loss": 0.0142, + "step": 25923 + }, + { + "epoch": 0.5, + "learning_rate": 9.952234864665449e-08, + "loss": 0.0005, + "step": 25924 + }, + { + "epoch": 0.5, + "learning_rate": 9.951846530231835e-08, + "loss": 0.0006, + "step": 25925 + }, + { + "epoch": 0.5, + "learning_rate": 9.951458195798221e-08, + "loss": 0.0008, + "step": 25926 + }, + { + "epoch": 0.5, + "learning_rate": 9.951069861364607e-08, + "loss": 0.0007, + "step": 25927 + }, + { + "epoch": 0.5, + "learning_rate": 9.950681526930993e-08, + "loss": 0.0004, + "step": 25928 + }, + { + "epoch": 0.5, + "learning_rate": 9.950293192497378e-08, + "loss": 0.0005, + "step": 25929 + }, + { + "epoch": 0.5, + "learning_rate": 9.949904858063764e-08, + "loss": 0.0006, + "step": 25930 + }, + { + "epoch": 0.5, + "learning_rate": 9.94951652363015e-08, + "loss": 0.0006, + "step": 25931 + }, + { + "epoch": 0.5, + "learning_rate": 9.949128189196535e-08, + "loss": 0.0006, + "step": 25932 + }, + { + "epoch": 0.5, + "learning_rate": 9.94873985476292e-08, + "loss": 0.0006, + "step": 25933 + }, + { + "epoch": 0.5, + "learning_rate": 9.948351520329306e-08, + "loss": 0.0005, + "step": 25934 + }, + { + "epoch": 0.5, + "learning_rate": 9.947963185895692e-08, + "loss": 0.9796, + "step": 25935 + }, + { + "epoch": 0.5, + "learning_rate": 9.947574851462078e-08, + "loss": 0.0006, + "step": 25936 + }, + { + "epoch": 0.5, + "learning_rate": 9.947186517028464e-08, + "loss": 0.0013, + "step": 25937 + }, + { + "epoch": 0.5, + "learning_rate": 9.94679818259485e-08, + "loss": 0.0117, + "step": 25938 + }, + { + "epoch": 0.5, + "learning_rate": 9.946409848161235e-08, + "loss": 0.0005, + "step": 25939 + }, + { + "epoch": 0.5, + "learning_rate": 9.946021513727621e-08, + "loss": 0.0006, + "step": 25940 + }, + { + "epoch": 0.5, + "learning_rate": 9.945633179294007e-08, + "loss": 0.0011, + "step": 25941 + }, + { + "epoch": 0.5, + "learning_rate": 9.945244844860393e-08, + "loss": 0.0005, + "step": 25942 + }, + { + "epoch": 0.5, + "learning_rate": 9.944856510426779e-08, + "loss": 0.0006, + "step": 25943 + }, + { + "epoch": 0.5, + "learning_rate": 9.944468175993165e-08, + "loss": 0.0007, + "step": 25944 + }, + { + "epoch": 0.5, + "learning_rate": 9.94407984155955e-08, + "loss": 0.0007, + "step": 25945 + }, + { + "epoch": 0.5, + "learning_rate": 9.943691507125936e-08, + "loss": 0.0005, + "step": 25946 + }, + { + "epoch": 0.5, + "learning_rate": 9.943303172692322e-08, + "loss": 0.0005, + "step": 25947 + }, + { + "epoch": 0.5, + "learning_rate": 9.942914838258708e-08, + "loss": 0.0009, + "step": 25948 + }, + { + "epoch": 0.5, + "learning_rate": 9.942526503825094e-08, + "loss": 0.0008, + "step": 25949 + }, + { + "epoch": 0.5, + "learning_rate": 9.94213816939148e-08, + "loss": 0.0007, + "step": 25950 + }, + { + "epoch": 0.5, + "learning_rate": 9.941749834957865e-08, + "loss": 0.0006, + "step": 25951 + }, + { + "epoch": 0.5, + "learning_rate": 9.941361500524251e-08, + "loss": 0.3544, + "step": 25952 + }, + { + "epoch": 0.5, + "learning_rate": 9.940973166090637e-08, + "loss": 0.0004, + "step": 25953 + }, + { + "epoch": 0.5, + "learning_rate": 9.940584831657023e-08, + "loss": 0.0005, + "step": 25954 + }, + { + "epoch": 0.5, + "learning_rate": 9.940196497223409e-08, + "loss": 0.0006, + "step": 25955 + }, + { + "epoch": 0.5, + "learning_rate": 9.939808162789794e-08, + "loss": 0.0006, + "step": 25956 + }, + { + "epoch": 0.5, + "learning_rate": 9.93941982835618e-08, + "loss": 0.0006, + "step": 25957 + }, + { + "epoch": 0.5, + "learning_rate": 9.939031493922566e-08, + "loss": 0.0007, + "step": 25958 + }, + { + "epoch": 0.5, + "learning_rate": 9.938643159488952e-08, + "loss": 0.0134, + "step": 25959 + }, + { + "epoch": 0.5, + "learning_rate": 9.938254825055338e-08, + "loss": 0.0006, + "step": 25960 + }, + { + "epoch": 0.5, + "learning_rate": 9.937866490621722e-08, + "loss": 0.0006, + "step": 25961 + }, + { + "epoch": 0.5, + "learning_rate": 9.937478156188108e-08, + "loss": 0.0008, + "step": 25962 + }, + { + "epoch": 0.5, + "learning_rate": 9.937089821754494e-08, + "loss": 0.0006, + "step": 25963 + }, + { + "epoch": 0.5, + "learning_rate": 9.93670148732088e-08, + "loss": 0.0006, + "step": 25964 + }, + { + "epoch": 0.5, + "learning_rate": 9.936313152887265e-08, + "loss": 0.0004, + "step": 25965 + }, + { + "epoch": 0.5, + "learning_rate": 9.935924818453651e-08, + "loss": 0.0004, + "step": 25966 + }, + { + "epoch": 0.5, + "learning_rate": 9.935536484020037e-08, + "loss": 0.0006, + "step": 25967 + }, + { + "epoch": 0.5, + "learning_rate": 9.935148149586423e-08, + "loss": 0.0076, + "step": 25968 + }, + { + "epoch": 0.5, + "learning_rate": 9.934759815152809e-08, + "loss": 0.0005, + "step": 25969 + }, + { + "epoch": 0.5, + "learning_rate": 9.934371480719195e-08, + "loss": 0.0008, + "step": 25970 + }, + { + "epoch": 0.5, + "learning_rate": 9.93398314628558e-08, + "loss": 0.0008, + "step": 25971 + }, + { + "epoch": 0.5, + "learning_rate": 9.933594811851966e-08, + "loss": 0.0006, + "step": 25972 + }, + { + "epoch": 0.5, + "learning_rate": 9.933206477418352e-08, + "loss": 0.0006, + "step": 25973 + }, + { + "epoch": 0.5, + "learning_rate": 9.932818142984738e-08, + "loss": 0.0006, + "step": 25974 + }, + { + "epoch": 0.5, + "learning_rate": 9.932429808551124e-08, + "loss": 0.0006, + "step": 25975 + }, + { + "epoch": 0.5, + "learning_rate": 9.93204147411751e-08, + "loss": 0.4205, + "step": 25976 + }, + { + "epoch": 0.5, + "learning_rate": 9.931653139683895e-08, + "loss": 0.3927, + "step": 25977 + }, + { + "epoch": 0.5, + "learning_rate": 9.931264805250281e-08, + "loss": 0.0006, + "step": 25978 + }, + { + "epoch": 0.5, + "learning_rate": 9.930876470816667e-08, + "loss": 0.0006, + "step": 25979 + }, + { + "epoch": 0.5, + "learning_rate": 9.930488136383053e-08, + "loss": 0.1022, + "step": 25980 + }, + { + "epoch": 0.5, + "learning_rate": 9.930099801949439e-08, + "loss": 0.5045, + "step": 25981 + }, + { + "epoch": 0.5, + "learning_rate": 9.929711467515825e-08, + "loss": 0.0006, + "step": 25982 + }, + { + "epoch": 0.5, + "learning_rate": 9.92932313308221e-08, + "loss": 0.0007, + "step": 25983 + }, + { + "epoch": 0.5, + "learning_rate": 9.928934798648596e-08, + "loss": 0.0006, + "step": 25984 + }, + { + "epoch": 0.5, + "learning_rate": 9.928546464214982e-08, + "loss": 0.0005, + "step": 25985 + }, + { + "epoch": 0.5, + "learning_rate": 9.928158129781368e-08, + "loss": 0.0006, + "step": 25986 + }, + { + "epoch": 0.5, + "learning_rate": 9.927769795347754e-08, + "loss": 0.0007, + "step": 25987 + }, + { + "epoch": 0.5, + "learning_rate": 9.92738146091414e-08, + "loss": 0.0008, + "step": 25988 + }, + { + "epoch": 0.5, + "learning_rate": 9.926993126480525e-08, + "loss": 0.0121, + "step": 25989 + }, + { + "epoch": 0.5, + "learning_rate": 9.92660479204691e-08, + "loss": 0.0006, + "step": 25990 + }, + { + "epoch": 0.5, + "learning_rate": 9.926216457613296e-08, + "loss": 0.0004, + "step": 25991 + }, + { + "epoch": 0.5, + "learning_rate": 9.925828123179681e-08, + "loss": 0.0029, + "step": 25992 + }, + { + "epoch": 0.5, + "learning_rate": 9.925439788746067e-08, + "loss": 0.0008, + "step": 25993 + }, + { + "epoch": 0.5, + "learning_rate": 9.925051454312453e-08, + "loss": 0.0042, + "step": 25994 + }, + { + "epoch": 0.5, + "learning_rate": 9.924663119878839e-08, + "loss": 0.0006, + "step": 25995 + }, + { + "epoch": 0.5, + "learning_rate": 9.924274785445225e-08, + "loss": 0.0012, + "step": 25996 + }, + { + "epoch": 0.5, + "learning_rate": 9.92388645101161e-08, + "loss": 0.0004, + "step": 25997 + }, + { + "epoch": 0.5, + "learning_rate": 9.923498116577996e-08, + "loss": 0.0005, + "step": 25998 + }, + { + "epoch": 0.5, + "learning_rate": 9.923109782144382e-08, + "loss": 0.0005, + "step": 25999 + }, + { + "epoch": 0.5, + "learning_rate": 9.922721447710768e-08, + "loss": 0.0007, + "step": 26000 + }, + { + "epoch": 0.5, + "learning_rate": 9.922333113277154e-08, + "loss": 0.0005, + "step": 26001 + }, + { + "epoch": 0.5, + "learning_rate": 9.92194477884354e-08, + "loss": 0.0024, + "step": 26002 + }, + { + "epoch": 0.5, + "learning_rate": 9.921556444409925e-08, + "loss": 0.0054, + "step": 26003 + }, + { + "epoch": 0.5, + "learning_rate": 9.921168109976311e-08, + "loss": 0.0005, + "step": 26004 + }, + { + "epoch": 0.5, + "learning_rate": 9.920779775542697e-08, + "loss": 0.001, + "step": 26005 + }, + { + "epoch": 0.5, + "learning_rate": 9.920391441109083e-08, + "loss": 0.0005, + "step": 26006 + }, + { + "epoch": 0.5, + "learning_rate": 9.920003106675469e-08, + "loss": 0.0807, + "step": 26007 + }, + { + "epoch": 0.5, + "learning_rate": 9.919614772241855e-08, + "loss": 0.0005, + "step": 26008 + }, + { + "epoch": 0.5, + "learning_rate": 9.91922643780824e-08, + "loss": 0.0004, + "step": 26009 + }, + { + "epoch": 0.5, + "learning_rate": 9.918838103374626e-08, + "loss": 0.0009, + "step": 26010 + }, + { + "epoch": 0.5, + "learning_rate": 9.918449768941012e-08, + "loss": 0.0276, + "step": 26011 + }, + { + "epoch": 0.5, + "learning_rate": 9.918061434507398e-08, + "loss": 0.0006, + "step": 26012 + }, + { + "epoch": 0.5, + "learning_rate": 9.917673100073784e-08, + "loss": 0.0011, + "step": 26013 + }, + { + "epoch": 0.5, + "learning_rate": 9.91728476564017e-08, + "loss": 0.0005, + "step": 26014 + }, + { + "epoch": 0.5, + "learning_rate": 9.916896431206555e-08, + "loss": 0.0004, + "step": 26015 + }, + { + "epoch": 0.5, + "learning_rate": 9.916508096772941e-08, + "loss": 0.0006, + "step": 26016 + }, + { + "epoch": 0.5, + "learning_rate": 9.916119762339327e-08, + "loss": 0.0006, + "step": 26017 + }, + { + "epoch": 0.5, + "learning_rate": 9.915731427905713e-08, + "loss": 0.0006, + "step": 26018 + }, + { + "epoch": 0.5, + "learning_rate": 9.915343093472097e-08, + "loss": 0.0005, + "step": 26019 + }, + { + "epoch": 0.5, + "learning_rate": 9.914954759038483e-08, + "loss": 0.0005, + "step": 26020 + }, + { + "epoch": 0.5, + "learning_rate": 9.914566424604869e-08, + "loss": 0.0007, + "step": 26021 + }, + { + "epoch": 0.5, + "learning_rate": 9.914178090171255e-08, + "loss": 0.9884, + "step": 26022 + }, + { + "epoch": 0.5, + "learning_rate": 9.91378975573764e-08, + "loss": 0.0947, + "step": 26023 + }, + { + "epoch": 0.5, + "learning_rate": 9.913401421304026e-08, + "loss": 0.0006, + "step": 26024 + }, + { + "epoch": 0.5, + "learning_rate": 9.913013086870412e-08, + "loss": 0.0446, + "step": 26025 + }, + { + "epoch": 0.5, + "learning_rate": 9.912624752436798e-08, + "loss": 0.0006, + "step": 26026 + }, + { + "epoch": 0.5, + "learning_rate": 9.912236418003184e-08, + "loss": 0.0231, + "step": 26027 + }, + { + "epoch": 0.5, + "learning_rate": 9.91184808356957e-08, + "loss": 0.0007, + "step": 26028 + }, + { + "epoch": 0.5, + "learning_rate": 9.911459749135956e-08, + "loss": 0.0004, + "step": 26029 + }, + { + "epoch": 0.5, + "learning_rate": 9.911071414702341e-08, + "loss": 0.337, + "step": 26030 + }, + { + "epoch": 0.5, + "learning_rate": 9.910683080268727e-08, + "loss": 0.0006, + "step": 26031 + }, + { + "epoch": 0.5, + "learning_rate": 9.910294745835113e-08, + "loss": 0.0007, + "step": 26032 + }, + { + "epoch": 0.5, + "learning_rate": 9.909906411401499e-08, + "loss": 0.0008, + "step": 26033 + }, + { + "epoch": 0.51, + "learning_rate": 9.909518076967885e-08, + "loss": 0.0005, + "step": 26034 + }, + { + "epoch": 0.51, + "learning_rate": 9.90912974253427e-08, + "loss": 0.0006, + "step": 26035 + }, + { + "epoch": 0.51, + "learning_rate": 9.908741408100656e-08, + "loss": 0.0007, + "step": 26036 + }, + { + "epoch": 0.51, + "learning_rate": 9.908353073667042e-08, + "loss": 0.0118, + "step": 26037 + }, + { + "epoch": 0.51, + "learning_rate": 9.907964739233428e-08, + "loss": 0.0003, + "step": 26038 + }, + { + "epoch": 0.51, + "learning_rate": 9.907576404799814e-08, + "loss": 0.0006, + "step": 26039 + }, + { + "epoch": 0.51, + "learning_rate": 9.9071880703662e-08, + "loss": 0.0005, + "step": 26040 + }, + { + "epoch": 0.51, + "learning_rate": 9.906799735932585e-08, + "loss": 0.0022, + "step": 26041 + }, + { + "epoch": 0.51, + "learning_rate": 9.906411401498971e-08, + "loss": 0.0008, + "step": 26042 + }, + { + "epoch": 0.51, + "learning_rate": 9.906023067065357e-08, + "loss": 0.0011, + "step": 26043 + }, + { + "epoch": 0.51, + "learning_rate": 9.905634732631743e-08, + "loss": 0.3324, + "step": 26044 + }, + { + "epoch": 0.51, + "learning_rate": 9.905246398198129e-08, + "loss": 0.0008, + "step": 26045 + }, + { + "epoch": 0.51, + "learning_rate": 9.904858063764515e-08, + "loss": 0.0031, + "step": 26046 + }, + { + "epoch": 0.51, + "learning_rate": 9.9044697293309e-08, + "loss": 0.6934, + "step": 26047 + }, + { + "epoch": 0.51, + "learning_rate": 9.904081394897285e-08, + "loss": 0.0007, + "step": 26048 + }, + { + "epoch": 0.51, + "learning_rate": 9.903693060463671e-08, + "loss": 0.2128, + "step": 26049 + }, + { + "epoch": 0.51, + "learning_rate": 9.903304726030057e-08, + "loss": 0.0005, + "step": 26050 + }, + { + "epoch": 0.51, + "learning_rate": 9.902916391596442e-08, + "loss": 0.0005, + "step": 26051 + }, + { + "epoch": 0.51, + "learning_rate": 9.902528057162828e-08, + "loss": 0.0006, + "step": 26052 + }, + { + "epoch": 0.51, + "learning_rate": 9.902139722729214e-08, + "loss": 0.0008, + "step": 26053 + }, + { + "epoch": 0.51, + "learning_rate": 9.9017513882956e-08, + "loss": 0.0004, + "step": 26054 + }, + { + "epoch": 0.51, + "learning_rate": 9.901363053861986e-08, + "loss": 0.0005, + "step": 26055 + }, + { + "epoch": 0.51, + "learning_rate": 9.900974719428372e-08, + "loss": 0.001, + "step": 26056 + }, + { + "epoch": 0.51, + "learning_rate": 9.900586384994757e-08, + "loss": 0.0006, + "step": 26057 + }, + { + "epoch": 0.51, + "learning_rate": 9.900198050561143e-08, + "loss": 0.0007, + "step": 26058 + }, + { + "epoch": 0.51, + "learning_rate": 9.899809716127529e-08, + "loss": 0.0005, + "step": 26059 + }, + { + "epoch": 0.51, + "learning_rate": 9.899421381693915e-08, + "loss": 0.0009, + "step": 26060 + }, + { + "epoch": 0.51, + "learning_rate": 9.899033047260301e-08, + "loss": 0.0641, + "step": 26061 + }, + { + "epoch": 0.51, + "learning_rate": 9.898644712826686e-08, + "loss": 0.0007, + "step": 26062 + }, + { + "epoch": 0.51, + "learning_rate": 9.898256378393072e-08, + "loss": 0.0006, + "step": 26063 + }, + { + "epoch": 0.51, + "learning_rate": 9.897868043959458e-08, + "loss": 0.0056, + "step": 26064 + }, + { + "epoch": 0.51, + "learning_rate": 9.897479709525844e-08, + "loss": 0.0009, + "step": 26065 + }, + { + "epoch": 0.51, + "learning_rate": 9.89709137509223e-08, + "loss": 1.0343, + "step": 26066 + }, + { + "epoch": 0.51, + "learning_rate": 9.896703040658614e-08, + "loss": 0.0005, + "step": 26067 + }, + { + "epoch": 0.51, + "learning_rate": 9.896314706225e-08, + "loss": 0.0004, + "step": 26068 + }, + { + "epoch": 0.51, + "learning_rate": 9.895926371791386e-08, + "loss": 0.0006, + "step": 26069 + }, + { + "epoch": 0.51, + "learning_rate": 9.895538037357772e-08, + "loss": 0.0013, + "step": 26070 + }, + { + "epoch": 0.51, + "learning_rate": 9.895149702924158e-08, + "loss": 0.0008, + "step": 26071 + }, + { + "epoch": 0.51, + "learning_rate": 9.894761368490543e-08, + "loss": 0.0007, + "step": 26072 + }, + { + "epoch": 0.51, + "learning_rate": 9.894373034056929e-08, + "loss": 0.8047, + "step": 26073 + }, + { + "epoch": 0.51, + "learning_rate": 9.893984699623315e-08, + "loss": 0.0005, + "step": 26074 + }, + { + "epoch": 0.51, + "learning_rate": 9.893596365189701e-08, + "loss": 0.0006, + "step": 26075 + }, + { + "epoch": 0.51, + "learning_rate": 9.893208030756087e-08, + "loss": 0.0007, + "step": 26076 + }, + { + "epoch": 0.51, + "learning_rate": 9.892819696322473e-08, + "loss": 0.001, + "step": 26077 + }, + { + "epoch": 0.51, + "learning_rate": 9.892431361888858e-08, + "loss": 0.003, + "step": 26078 + }, + { + "epoch": 0.51, + "learning_rate": 9.892043027455244e-08, + "loss": 0.0883, + "step": 26079 + }, + { + "epoch": 0.51, + "learning_rate": 9.89165469302163e-08, + "loss": 0.0008, + "step": 26080 + }, + { + "epoch": 0.51, + "learning_rate": 9.891266358588016e-08, + "loss": 0.0007, + "step": 26081 + }, + { + "epoch": 0.51, + "learning_rate": 9.8908780241544e-08, + "loss": 0.0009, + "step": 26082 + }, + { + "epoch": 0.51, + "learning_rate": 9.890489689720786e-08, + "loss": 0.0041, + "step": 26083 + }, + { + "epoch": 0.51, + "learning_rate": 9.890101355287172e-08, + "loss": 0.0005, + "step": 26084 + }, + { + "epoch": 0.51, + "learning_rate": 9.889713020853558e-08, + "loss": 0.0006, + "step": 26085 + }, + { + "epoch": 0.51, + "learning_rate": 9.889324686419944e-08, + "loss": 0.0004, + "step": 26086 + }, + { + "epoch": 0.51, + "learning_rate": 9.88893635198633e-08, + "loss": 0.0006, + "step": 26087 + }, + { + "epoch": 0.51, + "learning_rate": 9.888548017552715e-08, + "loss": 0.0007, + "step": 26088 + }, + { + "epoch": 0.51, + "learning_rate": 9.888159683119101e-08, + "loss": 0.0004, + "step": 26089 + }, + { + "epoch": 0.51, + "learning_rate": 9.887771348685487e-08, + "loss": 0.0007, + "step": 26090 + }, + { + "epoch": 0.51, + "learning_rate": 9.887383014251873e-08, + "loss": 0.0007, + "step": 26091 + }, + { + "epoch": 0.51, + "learning_rate": 9.886994679818259e-08, + "loss": 0.0014, + "step": 26092 + }, + { + "epoch": 0.51, + "learning_rate": 9.886606345384644e-08, + "loss": 0.0079, + "step": 26093 + }, + { + "epoch": 0.51, + "learning_rate": 9.88621801095103e-08, + "loss": 0.0008, + "step": 26094 + }, + { + "epoch": 0.51, + "learning_rate": 9.885829676517416e-08, + "loss": 0.0005, + "step": 26095 + }, + { + "epoch": 0.51, + "learning_rate": 9.885441342083802e-08, + "loss": 0.001, + "step": 26096 + }, + { + "epoch": 0.51, + "learning_rate": 9.885053007650188e-08, + "loss": 0.0006, + "step": 26097 + }, + { + "epoch": 0.51, + "learning_rate": 9.884664673216574e-08, + "loss": 0.0024, + "step": 26098 + }, + { + "epoch": 0.51, + "learning_rate": 9.88427633878296e-08, + "loss": 0.0007, + "step": 26099 + }, + { + "epoch": 0.51, + "learning_rate": 9.883888004349345e-08, + "loss": 0.0005, + "step": 26100 + }, + { + "epoch": 0.51, + "learning_rate": 9.883499669915731e-08, + "loss": 0.0073, + "step": 26101 + }, + { + "epoch": 0.51, + "learning_rate": 9.883111335482117e-08, + "loss": 0.0008, + "step": 26102 + }, + { + "epoch": 0.51, + "learning_rate": 9.882723001048503e-08, + "loss": 0.0004, + "step": 26103 + }, + { + "epoch": 0.51, + "learning_rate": 9.882334666614888e-08, + "loss": 0.0004, + "step": 26104 + }, + { + "epoch": 0.51, + "learning_rate": 9.881946332181274e-08, + "loss": 0.0005, + "step": 26105 + }, + { + "epoch": 0.51, + "learning_rate": 9.881557997747659e-08, + "loss": 0.0005, + "step": 26106 + }, + { + "epoch": 0.51, + "learning_rate": 9.881169663314045e-08, + "loss": 0.0007, + "step": 26107 + }, + { + "epoch": 0.51, + "learning_rate": 9.88078132888043e-08, + "loss": 0.0006, + "step": 26108 + }, + { + "epoch": 0.51, + "learning_rate": 9.880392994446816e-08, + "loss": 0.0006, + "step": 26109 + }, + { + "epoch": 0.51, + "learning_rate": 9.880004660013202e-08, + "loss": 0.0006, + "step": 26110 + }, + { + "epoch": 0.51, + "learning_rate": 9.879616325579588e-08, + "loss": 0.0006, + "step": 26111 + }, + { + "epoch": 0.51, + "learning_rate": 9.879227991145974e-08, + "loss": 0.0006, + "step": 26112 + }, + { + "epoch": 0.51, + "learning_rate": 9.87883965671236e-08, + "loss": 0.0017, + "step": 26113 + }, + { + "epoch": 0.51, + "learning_rate": 9.878451322278745e-08, + "loss": 0.0006, + "step": 26114 + }, + { + "epoch": 0.51, + "learning_rate": 9.878062987845131e-08, + "loss": 0.0005, + "step": 26115 + }, + { + "epoch": 0.51, + "learning_rate": 9.877674653411517e-08, + "loss": 0.0514, + "step": 26116 + }, + { + "epoch": 0.51, + "learning_rate": 9.877286318977903e-08, + "loss": 0.0005, + "step": 26117 + }, + { + "epoch": 0.51, + "learning_rate": 9.876897984544289e-08, + "loss": 1.4862, + "step": 26118 + }, + { + "epoch": 0.51, + "learning_rate": 9.876509650110675e-08, + "loss": 0.0017, + "step": 26119 + }, + { + "epoch": 0.51, + "learning_rate": 9.87612131567706e-08, + "loss": 0.0004, + "step": 26120 + }, + { + "epoch": 0.51, + "learning_rate": 9.875732981243446e-08, + "loss": 0.0005, + "step": 26121 + }, + { + "epoch": 0.51, + "learning_rate": 9.875344646809832e-08, + "loss": 0.0006, + "step": 26122 + }, + { + "epoch": 0.51, + "learning_rate": 9.874956312376218e-08, + "loss": 0.0005, + "step": 26123 + }, + { + "epoch": 0.51, + "learning_rate": 9.874567977942604e-08, + "loss": 0.0014, + "step": 26124 + }, + { + "epoch": 0.51, + "learning_rate": 9.87417964350899e-08, + "loss": 0.0005, + "step": 26125 + }, + { + "epoch": 0.51, + "learning_rate": 9.873791309075375e-08, + "loss": 0.0233, + "step": 26126 + }, + { + "epoch": 0.51, + "learning_rate": 9.873402974641761e-08, + "loss": 0.0007, + "step": 26127 + }, + { + "epoch": 0.51, + "learning_rate": 9.873014640208147e-08, + "loss": 0.0005, + "step": 26128 + }, + { + "epoch": 0.51, + "learning_rate": 9.872626305774533e-08, + "loss": 0.0011, + "step": 26129 + }, + { + "epoch": 0.51, + "learning_rate": 9.872237971340919e-08, + "loss": 0.0005, + "step": 26130 + }, + { + "epoch": 0.51, + "learning_rate": 9.871849636907304e-08, + "loss": 0.0006, + "step": 26131 + }, + { + "epoch": 0.51, + "learning_rate": 9.87146130247369e-08, + "loss": 0.0005, + "step": 26132 + }, + { + "epoch": 0.51, + "learning_rate": 9.871072968040076e-08, + "loss": 0.8172, + "step": 26133 + }, + { + "epoch": 0.51, + "learning_rate": 9.870684633606462e-08, + "loss": 0.0006, + "step": 26134 + }, + { + "epoch": 0.51, + "learning_rate": 9.870296299172846e-08, + "loss": 0.0004, + "step": 26135 + }, + { + "epoch": 0.51, + "learning_rate": 9.869907964739232e-08, + "loss": 0.0005, + "step": 26136 + }, + { + "epoch": 0.51, + "learning_rate": 9.869519630305618e-08, + "loss": 0.0004, + "step": 26137 + }, + { + "epoch": 0.51, + "learning_rate": 9.869131295872004e-08, + "loss": 0.0005, + "step": 26138 + }, + { + "epoch": 0.51, + "learning_rate": 9.86874296143839e-08, + "loss": 0.0004, + "step": 26139 + }, + { + "epoch": 0.51, + "learning_rate": 9.868354627004776e-08, + "loss": 0.0008, + "step": 26140 + }, + { + "epoch": 0.51, + "learning_rate": 9.867966292571161e-08, + "loss": 0.0004, + "step": 26141 + }, + { + "epoch": 0.51, + "learning_rate": 9.867577958137547e-08, + "loss": 0.0005, + "step": 26142 + }, + { + "epoch": 0.51, + "learning_rate": 9.867189623703933e-08, + "loss": 0.0006, + "step": 26143 + }, + { + "epoch": 0.51, + "learning_rate": 9.866801289270319e-08, + "loss": 0.0005, + "step": 26144 + }, + { + "epoch": 0.51, + "learning_rate": 9.866412954836705e-08, + "loss": 0.0006, + "step": 26145 + }, + { + "epoch": 0.51, + "learning_rate": 9.86602462040309e-08, + "loss": 0.0006, + "step": 26146 + }, + { + "epoch": 0.51, + "learning_rate": 9.865636285969476e-08, + "loss": 0.0005, + "step": 26147 + }, + { + "epoch": 0.51, + "learning_rate": 9.865247951535862e-08, + "loss": 0.0004, + "step": 26148 + }, + { + "epoch": 0.51, + "learning_rate": 9.864859617102248e-08, + "loss": 0.1137, + "step": 26149 + }, + { + "epoch": 0.51, + "learning_rate": 9.864471282668634e-08, + "loss": 0.0005, + "step": 26150 + }, + { + "epoch": 0.51, + "learning_rate": 9.86408294823502e-08, + "loss": 0.0004, + "step": 26151 + }, + { + "epoch": 0.51, + "learning_rate": 9.863694613801405e-08, + "loss": 0.0006, + "step": 26152 + }, + { + "epoch": 0.51, + "learning_rate": 9.863306279367791e-08, + "loss": 0.0006, + "step": 26153 + }, + { + "epoch": 0.51, + "learning_rate": 9.862917944934177e-08, + "loss": 0.0012, + "step": 26154 + }, + { + "epoch": 0.51, + "learning_rate": 9.862529610500563e-08, + "loss": 0.0153, + "step": 26155 + }, + { + "epoch": 0.51, + "learning_rate": 9.862141276066949e-08, + "loss": 0.0006, + "step": 26156 + }, + { + "epoch": 0.51, + "learning_rate": 9.861752941633335e-08, + "loss": 0.0005, + "step": 26157 + }, + { + "epoch": 0.51, + "learning_rate": 9.86136460719972e-08, + "loss": 0.0003, + "step": 26158 + }, + { + "epoch": 0.51, + "learning_rate": 9.860976272766106e-08, + "loss": 0.0007, + "step": 26159 + }, + { + "epoch": 0.51, + "learning_rate": 9.860587938332492e-08, + "loss": 0.0005, + "step": 26160 + }, + { + "epoch": 0.51, + "learning_rate": 9.860199603898878e-08, + "loss": 0.0006, + "step": 26161 + }, + { + "epoch": 0.51, + "learning_rate": 9.859811269465264e-08, + "loss": 0.2932, + "step": 26162 + }, + { + "epoch": 0.51, + "learning_rate": 9.85942293503165e-08, + "loss": 0.0004, + "step": 26163 + }, + { + "epoch": 0.51, + "learning_rate": 9.859034600598034e-08, + "loss": 0.4753, + "step": 26164 + }, + { + "epoch": 0.51, + "learning_rate": 9.85864626616442e-08, + "loss": 0.0005, + "step": 26165 + }, + { + "epoch": 0.51, + "learning_rate": 9.858257931730806e-08, + "loss": 0.0005, + "step": 26166 + }, + { + "epoch": 0.51, + "learning_rate": 9.857869597297191e-08, + "loss": 0.0008, + "step": 26167 + }, + { + "epoch": 0.51, + "learning_rate": 9.857481262863577e-08, + "loss": 0.001, + "step": 26168 + }, + { + "epoch": 0.51, + "learning_rate": 9.857092928429963e-08, + "loss": 1.0228, + "step": 26169 + }, + { + "epoch": 0.51, + "learning_rate": 9.856704593996349e-08, + "loss": 0.0005, + "step": 26170 + }, + { + "epoch": 0.51, + "learning_rate": 9.856316259562735e-08, + "loss": 0.0004, + "step": 26171 + }, + { + "epoch": 0.51, + "learning_rate": 9.85592792512912e-08, + "loss": 0.6371, + "step": 26172 + }, + { + "epoch": 0.51, + "learning_rate": 9.855539590695506e-08, + "loss": 0.0041, + "step": 26173 + }, + { + "epoch": 0.51, + "learning_rate": 9.855151256261892e-08, + "loss": 0.0005, + "step": 26174 + }, + { + "epoch": 0.51, + "learning_rate": 9.854762921828278e-08, + "loss": 0.0008, + "step": 26175 + }, + { + "epoch": 0.51, + "learning_rate": 9.854374587394664e-08, + "loss": 0.0004, + "step": 26176 + }, + { + "epoch": 0.51, + "learning_rate": 9.85398625296105e-08, + "loss": 0.0006, + "step": 26177 + }, + { + "epoch": 0.51, + "learning_rate": 9.853597918527436e-08, + "loss": 0.002, + "step": 26178 + }, + { + "epoch": 0.51, + "learning_rate": 9.853209584093821e-08, + "loss": 0.0005, + "step": 26179 + }, + { + "epoch": 0.51, + "learning_rate": 9.852821249660207e-08, + "loss": 0.0007, + "step": 26180 + }, + { + "epoch": 0.51, + "learning_rate": 9.852432915226593e-08, + "loss": 0.0006, + "step": 26181 + }, + { + "epoch": 0.51, + "learning_rate": 9.852044580792979e-08, + "loss": 0.0008, + "step": 26182 + }, + { + "epoch": 0.51, + "learning_rate": 9.851656246359365e-08, + "loss": 0.0005, + "step": 26183 + }, + { + "epoch": 0.51, + "learning_rate": 9.85126791192575e-08, + "loss": 0.0004, + "step": 26184 + }, + { + "epoch": 0.51, + "learning_rate": 9.850879577492136e-08, + "loss": 0.0007, + "step": 26185 + }, + { + "epoch": 0.51, + "learning_rate": 9.850491243058522e-08, + "loss": 0.0007, + "step": 26186 + }, + { + "epoch": 0.51, + "learning_rate": 9.850102908624908e-08, + "loss": 0.0008, + "step": 26187 + }, + { + "epoch": 0.51, + "learning_rate": 9.849714574191294e-08, + "loss": 0.0005, + "step": 26188 + }, + { + "epoch": 0.51, + "learning_rate": 9.84932623975768e-08, + "loss": 0.0007, + "step": 26189 + }, + { + "epoch": 0.51, + "learning_rate": 9.848937905324065e-08, + "loss": 0.0006, + "step": 26190 + }, + { + "epoch": 0.51, + "learning_rate": 9.848549570890451e-08, + "loss": 0.0006, + "step": 26191 + }, + { + "epoch": 0.51, + "learning_rate": 9.848161236456837e-08, + "loss": 0.0004, + "step": 26192 + }, + { + "epoch": 0.51, + "learning_rate": 9.847772902023222e-08, + "loss": 0.0005, + "step": 26193 + }, + { + "epoch": 0.51, + "learning_rate": 9.847384567589607e-08, + "loss": 0.2863, + "step": 26194 + }, + { + "epoch": 0.51, + "learning_rate": 9.846996233155993e-08, + "loss": 0.0006, + "step": 26195 + }, + { + "epoch": 0.51, + "learning_rate": 9.846607898722379e-08, + "loss": 0.0004, + "step": 26196 + }, + { + "epoch": 0.51, + "learning_rate": 9.846219564288765e-08, + "loss": 0.0005, + "step": 26197 + }, + { + "epoch": 0.51, + "learning_rate": 9.845831229855151e-08, + "loss": 0.0005, + "step": 26198 + }, + { + "epoch": 0.51, + "learning_rate": 9.845442895421536e-08, + "loss": 0.0045, + "step": 26199 + }, + { + "epoch": 0.51, + "learning_rate": 9.845054560987922e-08, + "loss": 0.0006, + "step": 26200 + }, + { + "epoch": 0.51, + "learning_rate": 9.844666226554308e-08, + "loss": 0.0016, + "step": 26201 + }, + { + "epoch": 0.51, + "learning_rate": 9.844277892120694e-08, + "loss": 0.0005, + "step": 26202 + }, + { + "epoch": 0.51, + "learning_rate": 9.84388955768708e-08, + "loss": 0.0006, + "step": 26203 + }, + { + "epoch": 0.51, + "learning_rate": 9.843501223253466e-08, + "loss": 0.0008, + "step": 26204 + }, + { + "epoch": 0.51, + "learning_rate": 9.843112888819851e-08, + "loss": 0.0015, + "step": 26205 + }, + { + "epoch": 0.51, + "learning_rate": 9.842724554386237e-08, + "loss": 0.0005, + "step": 26206 + }, + { + "epoch": 0.51, + "learning_rate": 9.842336219952623e-08, + "loss": 0.0006, + "step": 26207 + }, + { + "epoch": 0.51, + "learning_rate": 9.841947885519009e-08, + "loss": 0.0007, + "step": 26208 + }, + { + "epoch": 0.51, + "learning_rate": 9.841559551085395e-08, + "loss": 0.0005, + "step": 26209 + }, + { + "epoch": 0.51, + "learning_rate": 9.84117121665178e-08, + "loss": 0.0356, + "step": 26210 + }, + { + "epoch": 0.51, + "learning_rate": 9.840782882218166e-08, + "loss": 0.0499, + "step": 26211 + }, + { + "epoch": 0.51, + "learning_rate": 9.840394547784552e-08, + "loss": 0.999, + "step": 26212 + }, + { + "epoch": 0.51, + "learning_rate": 9.840006213350938e-08, + "loss": 0.0005, + "step": 26213 + }, + { + "epoch": 0.51, + "learning_rate": 9.839617878917324e-08, + "loss": 0.0006, + "step": 26214 + }, + { + "epoch": 0.51, + "learning_rate": 9.83922954448371e-08, + "loss": 0.0004, + "step": 26215 + }, + { + "epoch": 0.51, + "learning_rate": 9.838841210050096e-08, + "loss": 0.0005, + "step": 26216 + }, + { + "epoch": 0.51, + "learning_rate": 9.838452875616481e-08, + "loss": 1.2516, + "step": 26217 + }, + { + "epoch": 0.51, + "learning_rate": 9.838064541182867e-08, + "loss": 0.0005, + "step": 26218 + }, + { + "epoch": 0.51, + "learning_rate": 9.837676206749253e-08, + "loss": 0.0033, + "step": 26219 + }, + { + "epoch": 0.51, + "learning_rate": 9.837287872315639e-08, + "loss": 0.0006, + "step": 26220 + }, + { + "epoch": 0.51, + "learning_rate": 9.836899537882025e-08, + "loss": 0.0005, + "step": 26221 + }, + { + "epoch": 0.51, + "learning_rate": 9.836511203448409e-08, + "loss": 0.0004, + "step": 26222 + }, + { + "epoch": 0.51, + "learning_rate": 9.836122869014795e-08, + "loss": 0.0923, + "step": 26223 + }, + { + "epoch": 0.51, + "learning_rate": 9.835734534581181e-08, + "loss": 0.0004, + "step": 26224 + }, + { + "epoch": 0.51, + "learning_rate": 9.835346200147567e-08, + "loss": 0.002, + "step": 26225 + }, + { + "epoch": 0.51, + "learning_rate": 9.834957865713952e-08, + "loss": 0.0005, + "step": 26226 + }, + { + "epoch": 0.51, + "learning_rate": 9.834569531280338e-08, + "loss": 0.0005, + "step": 26227 + }, + { + "epoch": 0.51, + "learning_rate": 9.834181196846724e-08, + "loss": 0.0005, + "step": 26228 + }, + { + "epoch": 0.51, + "learning_rate": 9.83379286241311e-08, + "loss": 0.0006, + "step": 26229 + }, + { + "epoch": 0.51, + "learning_rate": 9.833404527979496e-08, + "loss": 0.0004, + "step": 26230 + }, + { + "epoch": 0.51, + "learning_rate": 9.833016193545882e-08, + "loss": 0.0006, + "step": 26231 + }, + { + "epoch": 0.51, + "learning_rate": 9.832627859112267e-08, + "loss": 0.0005, + "step": 26232 + }, + { + "epoch": 0.51, + "learning_rate": 9.832239524678653e-08, + "loss": 0.0019, + "step": 26233 + }, + { + "epoch": 0.51, + "learning_rate": 9.831851190245039e-08, + "loss": 0.0006, + "step": 26234 + }, + { + "epoch": 0.51, + "learning_rate": 9.831462855811425e-08, + "loss": 0.0024, + "step": 26235 + }, + { + "epoch": 0.51, + "learning_rate": 9.831074521377811e-08, + "loss": 0.0017, + "step": 26236 + }, + { + "epoch": 0.51, + "learning_rate": 9.830686186944197e-08, + "loss": 0.0006, + "step": 26237 + }, + { + "epoch": 0.51, + "learning_rate": 9.830297852510582e-08, + "loss": 0.0005, + "step": 26238 + }, + { + "epoch": 0.51, + "learning_rate": 9.829909518076968e-08, + "loss": 0.0006, + "step": 26239 + }, + { + "epoch": 0.51, + "learning_rate": 9.829521183643354e-08, + "loss": 0.0005, + "step": 26240 + }, + { + "epoch": 0.51, + "learning_rate": 9.82913284920974e-08, + "loss": 0.0011, + "step": 26241 + }, + { + "epoch": 0.51, + "learning_rate": 9.828744514776126e-08, + "loss": 0.0006, + "step": 26242 + }, + { + "epoch": 0.51, + "learning_rate": 9.828356180342511e-08, + "loss": 0.0006, + "step": 26243 + }, + { + "epoch": 0.51, + "learning_rate": 9.827967845908896e-08, + "loss": 0.0004, + "step": 26244 + }, + { + "epoch": 0.51, + "learning_rate": 9.827579511475282e-08, + "loss": 0.0006, + "step": 26245 + }, + { + "epoch": 0.51, + "learning_rate": 9.827191177041668e-08, + "loss": 0.0007, + "step": 26246 + }, + { + "epoch": 0.51, + "learning_rate": 9.826802842608053e-08, + "loss": 0.0006, + "step": 26247 + }, + { + "epoch": 0.51, + "learning_rate": 9.826414508174439e-08, + "loss": 0.0024, + "step": 26248 + }, + { + "epoch": 0.51, + "learning_rate": 9.826026173740825e-08, + "loss": 0.0006, + "step": 26249 + }, + { + "epoch": 0.51, + "learning_rate": 9.825637839307211e-08, + "loss": 0.0004, + "step": 26250 + }, + { + "epoch": 0.51, + "learning_rate": 9.825249504873597e-08, + "loss": 0.0104, + "step": 26251 + }, + { + "epoch": 0.51, + "learning_rate": 9.824861170439983e-08, + "loss": 0.0005, + "step": 26252 + }, + { + "epoch": 0.51, + "learning_rate": 9.824472836006368e-08, + "loss": 1.4328, + "step": 26253 + }, + { + "epoch": 0.51, + "learning_rate": 9.824084501572754e-08, + "loss": 0.0004, + "step": 26254 + }, + { + "epoch": 0.51, + "learning_rate": 9.82369616713914e-08, + "loss": 0.3236, + "step": 26255 + }, + { + "epoch": 0.51, + "learning_rate": 9.823307832705526e-08, + "loss": 0.1914, + "step": 26256 + }, + { + "epoch": 0.51, + "learning_rate": 9.822919498271912e-08, + "loss": 0.0006, + "step": 26257 + }, + { + "epoch": 0.51, + "learning_rate": 9.822531163838297e-08, + "loss": 0.0201, + "step": 26258 + }, + { + "epoch": 0.51, + "learning_rate": 9.822142829404682e-08, + "loss": 0.0034, + "step": 26259 + }, + { + "epoch": 0.51, + "learning_rate": 9.821754494971068e-08, + "loss": 0.001, + "step": 26260 + }, + { + "epoch": 0.51, + "learning_rate": 9.821366160537454e-08, + "loss": 0.0006, + "step": 26261 + }, + { + "epoch": 0.51, + "learning_rate": 9.82097782610384e-08, + "loss": 0.0006, + "step": 26262 + }, + { + "epoch": 0.51, + "learning_rate": 9.820589491670225e-08, + "loss": 0.0005, + "step": 26263 + }, + { + "epoch": 0.51, + "learning_rate": 9.820201157236611e-08, + "loss": 0.0011, + "step": 26264 + }, + { + "epoch": 0.51, + "learning_rate": 9.819812822802997e-08, + "loss": 0.0005, + "step": 26265 + }, + { + "epoch": 0.51, + "learning_rate": 9.819424488369383e-08, + "loss": 0.0058, + "step": 26266 + }, + { + "epoch": 0.51, + "learning_rate": 9.819036153935769e-08, + "loss": 0.0012, + "step": 26267 + }, + { + "epoch": 0.51, + "learning_rate": 9.818647819502154e-08, + "loss": 0.0006, + "step": 26268 + }, + { + "epoch": 0.51, + "learning_rate": 9.81825948506854e-08, + "loss": 0.0006, + "step": 26269 + }, + { + "epoch": 0.51, + "learning_rate": 9.817871150634926e-08, + "loss": 0.0015, + "step": 26270 + }, + { + "epoch": 0.51, + "learning_rate": 9.817482816201312e-08, + "loss": 0.1331, + "step": 26271 + }, + { + "epoch": 0.51, + "learning_rate": 9.817094481767698e-08, + "loss": 0.0006, + "step": 26272 + }, + { + "epoch": 0.51, + "learning_rate": 9.816706147334084e-08, + "loss": 0.0004, + "step": 26273 + }, + { + "epoch": 0.51, + "learning_rate": 9.81631781290047e-08, + "loss": 0.0015, + "step": 26274 + }, + { + "epoch": 0.51, + "learning_rate": 9.815929478466855e-08, + "loss": 0.0339, + "step": 26275 + }, + { + "epoch": 0.51, + "learning_rate": 9.815541144033241e-08, + "loss": 0.0005, + "step": 26276 + }, + { + "epoch": 0.51, + "learning_rate": 9.815152809599627e-08, + "loss": 0.0005, + "step": 26277 + }, + { + "epoch": 0.51, + "learning_rate": 9.814764475166013e-08, + "loss": 0.1236, + "step": 26278 + }, + { + "epoch": 0.51, + "learning_rate": 9.814376140732398e-08, + "loss": 0.0005, + "step": 26279 + }, + { + "epoch": 0.51, + "learning_rate": 9.813987806298783e-08, + "loss": 0.0005, + "step": 26280 + }, + { + "epoch": 0.51, + "learning_rate": 9.813599471865169e-08, + "loss": 0.0004, + "step": 26281 + }, + { + "epoch": 0.51, + "learning_rate": 9.813211137431555e-08, + "loss": 0.0008, + "step": 26282 + }, + { + "epoch": 0.51, + "learning_rate": 9.81282280299794e-08, + "loss": 0.0038, + "step": 26283 + }, + { + "epoch": 0.51, + "learning_rate": 9.812434468564326e-08, + "loss": 0.0041, + "step": 26284 + }, + { + "epoch": 0.51, + "learning_rate": 9.812046134130712e-08, + "loss": 0.0005, + "step": 26285 + }, + { + "epoch": 0.51, + "learning_rate": 9.811657799697098e-08, + "loss": 0.2503, + "step": 26286 + }, + { + "epoch": 0.51, + "learning_rate": 9.811269465263484e-08, + "loss": 0.0005, + "step": 26287 + }, + { + "epoch": 0.51, + "learning_rate": 9.81088113082987e-08, + "loss": 0.0005, + "step": 26288 + }, + { + "epoch": 0.51, + "learning_rate": 9.810492796396255e-08, + "loss": 1.0577, + "step": 26289 + }, + { + "epoch": 0.51, + "learning_rate": 9.810104461962641e-08, + "loss": 0.0007, + "step": 26290 + }, + { + "epoch": 0.51, + "learning_rate": 9.809716127529027e-08, + "loss": 0.0007, + "step": 26291 + }, + { + "epoch": 0.51, + "learning_rate": 9.809327793095413e-08, + "loss": 0.0004, + "step": 26292 + }, + { + "epoch": 0.51, + "learning_rate": 9.808939458661799e-08, + "loss": 0.0004, + "step": 26293 + }, + { + "epoch": 0.51, + "learning_rate": 9.808551124228185e-08, + "loss": 0.0005, + "step": 26294 + }, + { + "epoch": 0.51, + "learning_rate": 9.80816278979457e-08, + "loss": 0.3565, + "step": 26295 + }, + { + "epoch": 0.51, + "learning_rate": 9.807774455360956e-08, + "loss": 0.0004, + "step": 26296 + }, + { + "epoch": 0.51, + "learning_rate": 9.807386120927342e-08, + "loss": 0.0072, + "step": 26297 + }, + { + "epoch": 0.51, + "learning_rate": 9.806997786493728e-08, + "loss": 0.0039, + "step": 26298 + }, + { + "epoch": 0.51, + "learning_rate": 9.806609452060114e-08, + "loss": 0.0005, + "step": 26299 + }, + { + "epoch": 0.51, + "learning_rate": 9.8062211176265e-08, + "loss": 0.0005, + "step": 26300 + }, + { + "epoch": 0.51, + "learning_rate": 9.805832783192885e-08, + "loss": 0.0162, + "step": 26301 + }, + { + "epoch": 0.51, + "learning_rate": 9.805444448759271e-08, + "loss": 0.0379, + "step": 26302 + }, + { + "epoch": 0.51, + "learning_rate": 9.805056114325657e-08, + "loss": 0.0007, + "step": 26303 + }, + { + "epoch": 0.51, + "learning_rate": 9.804667779892043e-08, + "loss": 0.0005, + "step": 26304 + }, + { + "epoch": 0.51, + "learning_rate": 9.804279445458429e-08, + "loss": 0.1834, + "step": 26305 + }, + { + "epoch": 0.51, + "learning_rate": 9.803891111024814e-08, + "loss": 0.0017, + "step": 26306 + }, + { + "epoch": 0.51, + "learning_rate": 9.8035027765912e-08, + "loss": 0.0005, + "step": 26307 + }, + { + "epoch": 0.51, + "learning_rate": 9.803114442157586e-08, + "loss": 0.0007, + "step": 26308 + }, + { + "epoch": 0.51, + "learning_rate": 9.80272610772397e-08, + "loss": 0.0006, + "step": 26309 + }, + { + "epoch": 0.51, + "learning_rate": 9.802337773290356e-08, + "loss": 0.0005, + "step": 26310 + }, + { + "epoch": 0.51, + "learning_rate": 9.801949438856742e-08, + "loss": 0.0011, + "step": 26311 + }, + { + "epoch": 0.51, + "learning_rate": 9.801561104423128e-08, + "loss": 0.0008, + "step": 26312 + }, + { + "epoch": 0.51, + "learning_rate": 9.801172769989514e-08, + "loss": 0.0024, + "step": 26313 + }, + { + "epoch": 0.51, + "learning_rate": 9.8007844355559e-08, + "loss": 0.0006, + "step": 26314 + }, + { + "epoch": 0.51, + "learning_rate": 9.800396101122286e-08, + "loss": 1.2232, + "step": 26315 + }, + { + "epoch": 0.51, + "learning_rate": 9.800007766688671e-08, + "loss": 0.0009, + "step": 26316 + }, + { + "epoch": 0.51, + "learning_rate": 9.799619432255057e-08, + "loss": 0.0005, + "step": 26317 + }, + { + "epoch": 0.51, + "learning_rate": 9.799231097821443e-08, + "loss": 0.01, + "step": 26318 + }, + { + "epoch": 0.51, + "learning_rate": 9.798842763387829e-08, + "loss": 0.0004, + "step": 26319 + }, + { + "epoch": 0.51, + "learning_rate": 9.798454428954215e-08, + "loss": 1.2253, + "step": 26320 + }, + { + "epoch": 0.51, + "learning_rate": 9.7980660945206e-08, + "loss": 0.0006, + "step": 26321 + }, + { + "epoch": 0.51, + "learning_rate": 9.797677760086986e-08, + "loss": 0.0005, + "step": 26322 + }, + { + "epoch": 0.51, + "learning_rate": 9.797289425653372e-08, + "loss": 0.0015, + "step": 26323 + }, + { + "epoch": 0.51, + "learning_rate": 9.796901091219758e-08, + "loss": 0.0005, + "step": 26324 + }, + { + "epoch": 0.51, + "learning_rate": 9.796512756786144e-08, + "loss": 0.0009, + "step": 26325 + }, + { + "epoch": 0.51, + "learning_rate": 9.79612442235253e-08, + "loss": 0.0006, + "step": 26326 + }, + { + "epoch": 0.51, + "learning_rate": 9.795736087918915e-08, + "loss": 0.0006, + "step": 26327 + }, + { + "epoch": 0.51, + "learning_rate": 9.795347753485301e-08, + "loss": 0.0005, + "step": 26328 + }, + { + "epoch": 0.51, + "learning_rate": 9.794959419051687e-08, + "loss": 0.5013, + "step": 26329 + }, + { + "epoch": 0.51, + "learning_rate": 9.794571084618073e-08, + "loss": 0.0005, + "step": 26330 + }, + { + "epoch": 0.51, + "learning_rate": 9.794182750184459e-08, + "loss": 0.0008, + "step": 26331 + }, + { + "epoch": 0.51, + "learning_rate": 9.793794415750845e-08, + "loss": 0.0006, + "step": 26332 + }, + { + "epoch": 0.51, + "learning_rate": 9.79340608131723e-08, + "loss": 0.0007, + "step": 26333 + }, + { + "epoch": 0.51, + "learning_rate": 9.793017746883616e-08, + "loss": 0.0285, + "step": 26334 + }, + { + "epoch": 0.51, + "learning_rate": 9.792629412450002e-08, + "loss": 0.0005, + "step": 26335 + }, + { + "epoch": 0.51, + "learning_rate": 9.792241078016388e-08, + "loss": 0.0005, + "step": 26336 + }, + { + "epoch": 0.51, + "learning_rate": 9.791852743582774e-08, + "loss": 0.0009, + "step": 26337 + }, + { + "epoch": 0.51, + "learning_rate": 9.791464409149158e-08, + "loss": 0.0005, + "step": 26338 + }, + { + "epoch": 0.51, + "learning_rate": 9.791076074715544e-08, + "loss": 0.0007, + "step": 26339 + }, + { + "epoch": 0.51, + "learning_rate": 9.79068774028193e-08, + "loss": 0.0006, + "step": 26340 + }, + { + "epoch": 0.51, + "learning_rate": 9.790299405848316e-08, + "loss": 0.0005, + "step": 26341 + }, + { + "epoch": 0.51, + "learning_rate": 9.789911071414701e-08, + "loss": 0.0004, + "step": 26342 + }, + { + "epoch": 0.51, + "learning_rate": 9.789522736981087e-08, + "loss": 0.0007, + "step": 26343 + }, + { + "epoch": 0.51, + "learning_rate": 9.789134402547473e-08, + "loss": 0.001, + "step": 26344 + }, + { + "epoch": 0.51, + "learning_rate": 9.788746068113859e-08, + "loss": 0.0011, + "step": 26345 + }, + { + "epoch": 0.51, + "learning_rate": 9.788357733680245e-08, + "loss": 0.0005, + "step": 26346 + }, + { + "epoch": 0.51, + "learning_rate": 9.78796939924663e-08, + "loss": 0.0006, + "step": 26347 + }, + { + "epoch": 0.51, + "learning_rate": 9.787581064813016e-08, + "loss": 0.6312, + "step": 26348 + }, + { + "epoch": 0.51, + "learning_rate": 9.787192730379402e-08, + "loss": 0.0005, + "step": 26349 + }, + { + "epoch": 0.51, + "learning_rate": 9.786804395945788e-08, + "loss": 0.0005, + "step": 26350 + }, + { + "epoch": 0.51, + "learning_rate": 9.786416061512174e-08, + "loss": 0.0021, + "step": 26351 + }, + { + "epoch": 0.51, + "learning_rate": 9.78602772707856e-08, + "loss": 0.0085, + "step": 26352 + }, + { + "epoch": 0.51, + "learning_rate": 9.785639392644946e-08, + "loss": 0.0007, + "step": 26353 + }, + { + "epoch": 0.51, + "learning_rate": 9.785251058211331e-08, + "loss": 0.0006, + "step": 26354 + }, + { + "epoch": 0.51, + "learning_rate": 9.784862723777717e-08, + "loss": 0.0006, + "step": 26355 + }, + { + "epoch": 0.51, + "learning_rate": 9.784474389344103e-08, + "loss": 0.0005, + "step": 26356 + }, + { + "epoch": 0.51, + "learning_rate": 9.784086054910489e-08, + "loss": 0.0017, + "step": 26357 + }, + { + "epoch": 0.51, + "learning_rate": 9.783697720476875e-08, + "loss": 0.0302, + "step": 26358 + }, + { + "epoch": 0.51, + "learning_rate": 9.78330938604326e-08, + "loss": 0.0006, + "step": 26359 + }, + { + "epoch": 0.51, + "learning_rate": 9.782921051609646e-08, + "loss": 0.0008, + "step": 26360 + }, + { + "epoch": 0.51, + "learning_rate": 9.782532717176032e-08, + "loss": 0.0004, + "step": 26361 + }, + { + "epoch": 0.51, + "learning_rate": 9.782144382742418e-08, + "loss": 0.0005, + "step": 26362 + }, + { + "epoch": 0.51, + "learning_rate": 9.781756048308804e-08, + "loss": 0.0005, + "step": 26363 + }, + { + "epoch": 0.51, + "learning_rate": 9.78136771387519e-08, + "loss": 1.0467, + "step": 26364 + }, + { + "epoch": 0.51, + "learning_rate": 9.780979379441575e-08, + "loss": 0.0004, + "step": 26365 + }, + { + "epoch": 0.51, + "learning_rate": 9.780591045007961e-08, + "loss": 0.002, + "step": 26366 + }, + { + "epoch": 0.51, + "learning_rate": 9.780202710574346e-08, + "loss": 0.0009, + "step": 26367 + }, + { + "epoch": 0.51, + "learning_rate": 9.779814376140732e-08, + "loss": 0.0007, + "step": 26368 + }, + { + "epoch": 0.51, + "learning_rate": 9.779426041707117e-08, + "loss": 0.0005, + "step": 26369 + }, + { + "epoch": 0.51, + "learning_rate": 9.779037707273503e-08, + "loss": 0.2048, + "step": 26370 + }, + { + "epoch": 0.51, + "learning_rate": 9.778649372839889e-08, + "loss": 0.0005, + "step": 26371 + }, + { + "epoch": 0.51, + "learning_rate": 9.778261038406275e-08, + "loss": 0.0253, + "step": 26372 + }, + { + "epoch": 0.51, + "learning_rate": 9.777872703972661e-08, + "loss": 0.0009, + "step": 26373 + }, + { + "epoch": 0.51, + "learning_rate": 9.777484369539047e-08, + "loss": 0.0006, + "step": 26374 + }, + { + "epoch": 0.51, + "learning_rate": 9.777096035105432e-08, + "loss": 0.0005, + "step": 26375 + }, + { + "epoch": 0.51, + "learning_rate": 9.776707700671818e-08, + "loss": 0.0073, + "step": 26376 + }, + { + "epoch": 0.51, + "learning_rate": 9.776319366238204e-08, + "loss": 0.0006, + "step": 26377 + }, + { + "epoch": 0.51, + "learning_rate": 9.77593103180459e-08, + "loss": 0.0017, + "step": 26378 + }, + { + "epoch": 0.51, + "learning_rate": 9.775542697370976e-08, + "loss": 0.0006, + "step": 26379 + }, + { + "epoch": 0.51, + "learning_rate": 9.775154362937361e-08, + "loss": 0.0005, + "step": 26380 + }, + { + "epoch": 0.51, + "learning_rate": 9.774766028503747e-08, + "loss": 0.0006, + "step": 26381 + }, + { + "epoch": 0.51, + "learning_rate": 9.774377694070133e-08, + "loss": 0.0004, + "step": 26382 + }, + { + "epoch": 0.51, + "learning_rate": 9.773989359636519e-08, + "loss": 0.0008, + "step": 26383 + }, + { + "epoch": 0.51, + "learning_rate": 9.773601025202905e-08, + "loss": 0.0009, + "step": 26384 + }, + { + "epoch": 0.51, + "learning_rate": 9.77321269076929e-08, + "loss": 0.001, + "step": 26385 + }, + { + "epoch": 0.51, + "learning_rate": 9.772824356335676e-08, + "loss": 0.0006, + "step": 26386 + }, + { + "epoch": 0.51, + "learning_rate": 9.772436021902062e-08, + "loss": 0.0005, + "step": 26387 + }, + { + "epoch": 0.51, + "learning_rate": 9.772047687468448e-08, + "loss": 0.001, + "step": 26388 + }, + { + "epoch": 0.51, + "learning_rate": 9.771659353034834e-08, + "loss": 0.0007, + "step": 26389 + }, + { + "epoch": 0.51, + "learning_rate": 9.77127101860122e-08, + "loss": 0.0005, + "step": 26390 + }, + { + "epoch": 0.51, + "learning_rate": 9.770882684167606e-08, + "loss": 0.0006, + "step": 26391 + }, + { + "epoch": 0.51, + "learning_rate": 9.770494349733991e-08, + "loss": 0.0008, + "step": 26392 + }, + { + "epoch": 0.51, + "learning_rate": 9.770106015300377e-08, + "loss": 0.0004, + "step": 26393 + }, + { + "epoch": 0.51, + "learning_rate": 9.769717680866763e-08, + "loss": 0.0004, + "step": 26394 + }, + { + "epoch": 0.51, + "learning_rate": 9.769329346433149e-08, + "loss": 0.0013, + "step": 26395 + }, + { + "epoch": 0.51, + "learning_rate": 9.768941011999533e-08, + "loss": 0.0016, + "step": 26396 + }, + { + "epoch": 0.51, + "learning_rate": 9.768552677565919e-08, + "loss": 0.0004, + "step": 26397 + }, + { + "epoch": 0.51, + "learning_rate": 9.768164343132305e-08, + "loss": 0.0013, + "step": 26398 + }, + { + "epoch": 0.51, + "learning_rate": 9.767776008698691e-08, + "loss": 0.0006, + "step": 26399 + }, + { + "epoch": 0.51, + "learning_rate": 9.767387674265077e-08, + "loss": 0.0006, + "step": 26400 + }, + { + "epoch": 0.51, + "learning_rate": 9.766999339831462e-08, + "loss": 0.0007, + "step": 26401 + }, + { + "epoch": 0.51, + "learning_rate": 9.766611005397848e-08, + "loss": 0.0007, + "step": 26402 + }, + { + "epoch": 0.51, + "learning_rate": 9.766222670964234e-08, + "loss": 0.001, + "step": 26403 + }, + { + "epoch": 0.51, + "learning_rate": 9.76583433653062e-08, + "loss": 0.0051, + "step": 26404 + }, + { + "epoch": 0.51, + "learning_rate": 9.765446002097006e-08, + "loss": 0.0005, + "step": 26405 + }, + { + "epoch": 0.51, + "learning_rate": 9.765057667663392e-08, + "loss": 0.0008, + "step": 26406 + }, + { + "epoch": 0.51, + "learning_rate": 9.764669333229777e-08, + "loss": 0.0006, + "step": 26407 + }, + { + "epoch": 0.51, + "learning_rate": 9.764280998796163e-08, + "loss": 0.0056, + "step": 26408 + }, + { + "epoch": 0.51, + "learning_rate": 9.763892664362549e-08, + "loss": 0.0028, + "step": 26409 + }, + { + "epoch": 0.51, + "learning_rate": 9.763504329928935e-08, + "loss": 0.0011, + "step": 26410 + }, + { + "epoch": 0.51, + "learning_rate": 9.763115995495321e-08, + "loss": 0.0086, + "step": 26411 + }, + { + "epoch": 0.51, + "learning_rate": 9.762727661061707e-08, + "loss": 0.0006, + "step": 26412 + }, + { + "epoch": 0.51, + "learning_rate": 9.762339326628092e-08, + "loss": 0.0006, + "step": 26413 + }, + { + "epoch": 0.51, + "learning_rate": 9.761950992194478e-08, + "loss": 0.0013, + "step": 26414 + }, + { + "epoch": 0.51, + "learning_rate": 9.761562657760864e-08, + "loss": 0.0006, + "step": 26415 + }, + { + "epoch": 0.51, + "learning_rate": 9.76117432332725e-08, + "loss": 0.0007, + "step": 26416 + }, + { + "epoch": 0.51, + "learning_rate": 9.760785988893636e-08, + "loss": 0.0009, + "step": 26417 + }, + { + "epoch": 0.51, + "learning_rate": 9.760397654460021e-08, + "loss": 0.0006, + "step": 26418 + }, + { + "epoch": 0.51, + "learning_rate": 9.760009320026407e-08, + "loss": 0.0011, + "step": 26419 + }, + { + "epoch": 0.51, + "learning_rate": 9.759620985592793e-08, + "loss": 0.0004, + "step": 26420 + }, + { + "epoch": 0.51, + "learning_rate": 9.759232651159178e-08, + "loss": 1.1901, + "step": 26421 + }, + { + "epoch": 0.51, + "learning_rate": 9.758844316725563e-08, + "loss": 0.0005, + "step": 26422 + }, + { + "epoch": 0.51, + "learning_rate": 9.758455982291949e-08, + "loss": 0.0185, + "step": 26423 + }, + { + "epoch": 0.51, + "learning_rate": 9.758067647858335e-08, + "loss": 0.0005, + "step": 26424 + }, + { + "epoch": 0.51, + "learning_rate": 9.757679313424721e-08, + "loss": 0.981, + "step": 26425 + }, + { + "epoch": 0.51, + "learning_rate": 9.757290978991107e-08, + "loss": 0.0006, + "step": 26426 + }, + { + "epoch": 0.51, + "learning_rate": 9.756902644557493e-08, + "loss": 0.0005, + "step": 26427 + }, + { + "epoch": 0.51, + "learning_rate": 9.756514310123878e-08, + "loss": 0.0008, + "step": 26428 + }, + { + "epoch": 0.51, + "learning_rate": 9.756125975690264e-08, + "loss": 0.0006, + "step": 26429 + }, + { + "epoch": 0.51, + "learning_rate": 9.75573764125665e-08, + "loss": 0.0005, + "step": 26430 + }, + { + "epoch": 0.51, + "learning_rate": 9.755349306823036e-08, + "loss": 0.0006, + "step": 26431 + }, + { + "epoch": 0.51, + "learning_rate": 9.754960972389422e-08, + "loss": 0.0008, + "step": 26432 + }, + { + "epoch": 0.51, + "learning_rate": 9.754572637955808e-08, + "loss": 0.0005, + "step": 26433 + }, + { + "epoch": 0.51, + "learning_rate": 9.754184303522193e-08, + "loss": 0.0006, + "step": 26434 + }, + { + "epoch": 0.51, + "learning_rate": 9.753795969088579e-08, + "loss": 0.0006, + "step": 26435 + }, + { + "epoch": 0.51, + "learning_rate": 9.753407634654964e-08, + "loss": 0.0005, + "step": 26436 + }, + { + "epoch": 0.51, + "learning_rate": 9.75301930022135e-08, + "loss": 0.0004, + "step": 26437 + }, + { + "epoch": 0.51, + "learning_rate": 9.752630965787735e-08, + "loss": 0.0005, + "step": 26438 + }, + { + "epoch": 0.51, + "learning_rate": 9.752242631354121e-08, + "loss": 0.0006, + "step": 26439 + }, + { + "epoch": 0.51, + "learning_rate": 9.751854296920507e-08, + "loss": 0.0009, + "step": 26440 + }, + { + "epoch": 0.51, + "learning_rate": 9.751465962486893e-08, + "loss": 0.0014, + "step": 26441 + }, + { + "epoch": 0.51, + "learning_rate": 9.751077628053279e-08, + "loss": 0.0005, + "step": 26442 + }, + { + "epoch": 0.51, + "learning_rate": 9.750689293619664e-08, + "loss": 0.0006, + "step": 26443 + }, + { + "epoch": 0.51, + "learning_rate": 9.75030095918605e-08, + "loss": 0.0366, + "step": 26444 + }, + { + "epoch": 0.51, + "learning_rate": 9.749912624752436e-08, + "loss": 1.011, + "step": 26445 + }, + { + "epoch": 0.51, + "learning_rate": 9.749524290318822e-08, + "loss": 0.0011, + "step": 26446 + }, + { + "epoch": 0.51, + "learning_rate": 9.749135955885208e-08, + "loss": 0.0007, + "step": 26447 + }, + { + "epoch": 0.51, + "learning_rate": 9.748747621451594e-08, + "loss": 0.0006, + "step": 26448 + }, + { + "epoch": 0.51, + "learning_rate": 9.74835928701798e-08, + "loss": 0.0004, + "step": 26449 + }, + { + "epoch": 0.51, + "learning_rate": 9.747970952584365e-08, + "loss": 0.0478, + "step": 26450 + }, + { + "epoch": 0.51, + "learning_rate": 9.747582618150751e-08, + "loss": 0.0006, + "step": 26451 + }, + { + "epoch": 0.51, + "learning_rate": 9.747194283717137e-08, + "loss": 0.0005, + "step": 26452 + }, + { + "epoch": 0.51, + "learning_rate": 9.746805949283523e-08, + "loss": 0.0005, + "step": 26453 + }, + { + "epoch": 0.51, + "learning_rate": 9.746417614849907e-08, + "loss": 0.5005, + "step": 26454 + }, + { + "epoch": 0.51, + "learning_rate": 9.746029280416293e-08, + "loss": 0.0006, + "step": 26455 + }, + { + "epoch": 0.51, + "learning_rate": 9.745640945982679e-08, + "loss": 0.0006, + "step": 26456 + }, + { + "epoch": 0.51, + "learning_rate": 9.745252611549065e-08, + "loss": 0.0004, + "step": 26457 + }, + { + "epoch": 0.51, + "learning_rate": 9.74486427711545e-08, + "loss": 0.0006, + "step": 26458 + }, + { + "epoch": 0.51, + "learning_rate": 9.744475942681836e-08, + "loss": 0.5003, + "step": 26459 + }, + { + "epoch": 0.51, + "learning_rate": 9.744087608248222e-08, + "loss": 0.0006, + "step": 26460 + }, + { + "epoch": 0.51, + "learning_rate": 9.743699273814608e-08, + "loss": 0.2931, + "step": 26461 + }, + { + "epoch": 0.51, + "learning_rate": 9.743310939380994e-08, + "loss": 0.0005, + "step": 26462 + }, + { + "epoch": 0.51, + "learning_rate": 9.74292260494738e-08, + "loss": 0.0005, + "step": 26463 + }, + { + "epoch": 0.51, + "learning_rate": 9.742534270513765e-08, + "loss": 0.0005, + "step": 26464 + }, + { + "epoch": 0.51, + "learning_rate": 9.742145936080151e-08, + "loss": 0.0009, + "step": 26465 + }, + { + "epoch": 0.51, + "learning_rate": 9.741757601646537e-08, + "loss": 0.0004, + "step": 26466 + }, + { + "epoch": 0.51, + "learning_rate": 9.741369267212923e-08, + "loss": 0.0035, + "step": 26467 + }, + { + "epoch": 0.51, + "learning_rate": 9.740980932779309e-08, + "loss": 0.0004, + "step": 26468 + }, + { + "epoch": 0.51, + "learning_rate": 9.740592598345695e-08, + "loss": 0.0007, + "step": 26469 + }, + { + "epoch": 0.51, + "learning_rate": 9.74020426391208e-08, + "loss": 0.0006, + "step": 26470 + }, + { + "epoch": 0.51, + "learning_rate": 9.739815929478466e-08, + "loss": 0.0004, + "step": 26471 + }, + { + "epoch": 0.51, + "learning_rate": 9.739427595044852e-08, + "loss": 0.4953, + "step": 26472 + }, + { + "epoch": 0.51, + "learning_rate": 9.739039260611238e-08, + "loss": 0.0028, + "step": 26473 + }, + { + "epoch": 0.51, + "learning_rate": 9.738650926177624e-08, + "loss": 0.0005, + "step": 26474 + }, + { + "epoch": 0.51, + "learning_rate": 9.73826259174401e-08, + "loss": 0.0006, + "step": 26475 + }, + { + "epoch": 0.51, + "learning_rate": 9.737874257310395e-08, + "loss": 0.0005, + "step": 26476 + }, + { + "epoch": 0.51, + "learning_rate": 9.737485922876781e-08, + "loss": 0.0004, + "step": 26477 + }, + { + "epoch": 0.51, + "learning_rate": 9.737097588443167e-08, + "loss": 0.2484, + "step": 26478 + }, + { + "epoch": 0.51, + "learning_rate": 9.736709254009553e-08, + "loss": 0.0007, + "step": 26479 + }, + { + "epoch": 0.51, + "learning_rate": 9.736320919575939e-08, + "loss": 0.0007, + "step": 26480 + }, + { + "epoch": 0.51, + "learning_rate": 9.735932585142324e-08, + "loss": 0.0006, + "step": 26481 + }, + { + "epoch": 0.51, + "learning_rate": 9.73554425070871e-08, + "loss": 0.0033, + "step": 26482 + }, + { + "epoch": 0.51, + "learning_rate": 9.735155916275095e-08, + "loss": 0.067, + "step": 26483 + }, + { + "epoch": 0.51, + "learning_rate": 9.73476758184148e-08, + "loss": 0.0004, + "step": 26484 + }, + { + "epoch": 0.51, + "learning_rate": 9.734379247407866e-08, + "loss": 0.0007, + "step": 26485 + }, + { + "epoch": 0.51, + "learning_rate": 9.733990912974252e-08, + "loss": 0.0006, + "step": 26486 + }, + { + "epoch": 0.51, + "learning_rate": 9.733602578540638e-08, + "loss": 0.9482, + "step": 26487 + }, + { + "epoch": 0.51, + "learning_rate": 9.733214244107024e-08, + "loss": 0.0006, + "step": 26488 + }, + { + "epoch": 0.51, + "learning_rate": 9.73282590967341e-08, + "loss": 0.5705, + "step": 26489 + }, + { + "epoch": 0.51, + "learning_rate": 9.732437575239796e-08, + "loss": 0.0018, + "step": 26490 + }, + { + "epoch": 0.51, + "learning_rate": 9.732049240806181e-08, + "loss": 0.0005, + "step": 26491 + }, + { + "epoch": 0.51, + "learning_rate": 9.731660906372567e-08, + "loss": 0.7916, + "step": 26492 + }, + { + "epoch": 0.51, + "learning_rate": 9.731272571938953e-08, + "loss": 0.0005, + "step": 26493 + }, + { + "epoch": 0.51, + "learning_rate": 9.730884237505339e-08, + "loss": 0.0011, + "step": 26494 + }, + { + "epoch": 0.51, + "learning_rate": 9.730495903071725e-08, + "loss": 0.005, + "step": 26495 + }, + { + "epoch": 0.51, + "learning_rate": 9.73010756863811e-08, + "loss": 0.001, + "step": 26496 + }, + { + "epoch": 0.51, + "learning_rate": 9.729719234204496e-08, + "loss": 0.0005, + "step": 26497 + }, + { + "epoch": 0.51, + "learning_rate": 9.729330899770882e-08, + "loss": 0.5846, + "step": 26498 + }, + { + "epoch": 0.51, + "learning_rate": 9.728942565337268e-08, + "loss": 0.0005, + "step": 26499 + }, + { + "epoch": 0.51, + "learning_rate": 9.728554230903654e-08, + "loss": 0.0007, + "step": 26500 + }, + { + "epoch": 0.51, + "learning_rate": 9.72816589647004e-08, + "loss": 0.0009, + "step": 26501 + }, + { + "epoch": 0.51, + "learning_rate": 9.727777562036425e-08, + "loss": 0.0005, + "step": 26502 + }, + { + "epoch": 0.51, + "learning_rate": 9.727389227602811e-08, + "loss": 0.0012, + "step": 26503 + }, + { + "epoch": 0.51, + "learning_rate": 9.727000893169197e-08, + "loss": 0.0005, + "step": 26504 + }, + { + "epoch": 0.51, + "learning_rate": 9.726612558735583e-08, + "loss": 0.0005, + "step": 26505 + }, + { + "epoch": 0.51, + "learning_rate": 9.726224224301969e-08, + "loss": 0.0005, + "step": 26506 + }, + { + "epoch": 0.51, + "learning_rate": 9.725835889868355e-08, + "loss": 0.0005, + "step": 26507 + }, + { + "epoch": 0.51, + "learning_rate": 9.72544755543474e-08, + "loss": 0.0012, + "step": 26508 + }, + { + "epoch": 0.51, + "learning_rate": 9.725059221001126e-08, + "loss": 0.0004, + "step": 26509 + }, + { + "epoch": 0.51, + "learning_rate": 9.724670886567512e-08, + "loss": 0.0006, + "step": 26510 + }, + { + "epoch": 0.51, + "learning_rate": 9.724282552133898e-08, + "loss": 0.0005, + "step": 26511 + }, + { + "epoch": 0.51, + "learning_rate": 9.723894217700282e-08, + "loss": 0.0005, + "step": 26512 + }, + { + "epoch": 0.51, + "learning_rate": 9.723505883266668e-08, + "loss": 0.0008, + "step": 26513 + }, + { + "epoch": 0.51, + "learning_rate": 9.723117548833054e-08, + "loss": 0.5176, + "step": 26514 + }, + { + "epoch": 0.51, + "learning_rate": 9.72272921439944e-08, + "loss": 0.0007, + "step": 26515 + }, + { + "epoch": 0.51, + "learning_rate": 9.722340879965826e-08, + "loss": 0.0005, + "step": 26516 + }, + { + "epoch": 0.51, + "learning_rate": 9.721952545532211e-08, + "loss": 1.3115, + "step": 26517 + }, + { + "epoch": 0.51, + "learning_rate": 9.721564211098597e-08, + "loss": 1.1983, + "step": 26518 + }, + { + "epoch": 0.51, + "learning_rate": 9.721175876664983e-08, + "loss": 0.0007, + "step": 26519 + }, + { + "epoch": 0.51, + "learning_rate": 9.720787542231369e-08, + "loss": 0.8727, + "step": 26520 + }, + { + "epoch": 0.51, + "learning_rate": 9.720399207797755e-08, + "loss": 0.0004, + "step": 26521 + }, + { + "epoch": 0.51, + "learning_rate": 9.72001087336414e-08, + "loss": 0.0005, + "step": 26522 + }, + { + "epoch": 0.51, + "learning_rate": 9.719622538930526e-08, + "loss": 0.0005, + "step": 26523 + }, + { + "epoch": 0.51, + "learning_rate": 9.719234204496912e-08, + "loss": 0.0225, + "step": 26524 + }, + { + "epoch": 0.51, + "learning_rate": 9.718845870063298e-08, + "loss": 0.0005, + "step": 26525 + }, + { + "epoch": 0.51, + "learning_rate": 9.718457535629684e-08, + "loss": 0.0006, + "step": 26526 + }, + { + "epoch": 0.51, + "learning_rate": 9.71806920119607e-08, + "loss": 0.0006, + "step": 26527 + }, + { + "epoch": 0.51, + "learning_rate": 9.717680866762456e-08, + "loss": 0.0004, + "step": 26528 + }, + { + "epoch": 0.51, + "learning_rate": 9.717292532328841e-08, + "loss": 0.0006, + "step": 26529 + }, + { + "epoch": 0.51, + "learning_rate": 9.716904197895227e-08, + "loss": 1.097, + "step": 26530 + }, + { + "epoch": 0.51, + "learning_rate": 9.716515863461613e-08, + "loss": 0.0005, + "step": 26531 + }, + { + "epoch": 0.51, + "learning_rate": 9.716127529027999e-08, + "loss": 0.0025, + "step": 26532 + }, + { + "epoch": 0.51, + "learning_rate": 9.715739194594385e-08, + "loss": 0.0007, + "step": 26533 + }, + { + "epoch": 0.51, + "learning_rate": 9.71535086016077e-08, + "loss": 0.0053, + "step": 26534 + }, + { + "epoch": 0.51, + "learning_rate": 9.714962525727156e-08, + "loss": 0.0008, + "step": 26535 + }, + { + "epoch": 0.51, + "learning_rate": 9.714574191293542e-08, + "loss": 0.0006, + "step": 26536 + }, + { + "epoch": 0.51, + "learning_rate": 9.714185856859928e-08, + "loss": 1.0612, + "step": 26537 + }, + { + "epoch": 0.51, + "learning_rate": 9.713797522426314e-08, + "loss": 0.4316, + "step": 26538 + }, + { + "epoch": 0.51, + "learning_rate": 9.7134091879927e-08, + "loss": 0.0379, + "step": 26539 + }, + { + "epoch": 0.51, + "learning_rate": 9.713020853559085e-08, + "loss": 0.0004, + "step": 26540 + }, + { + "epoch": 0.51, + "learning_rate": 9.71263251912547e-08, + "loss": 0.0006, + "step": 26541 + }, + { + "epoch": 0.51, + "learning_rate": 9.712244184691856e-08, + "loss": 0.0043, + "step": 26542 + }, + { + "epoch": 0.51, + "learning_rate": 9.711855850258242e-08, + "loss": 0.003, + "step": 26543 + }, + { + "epoch": 0.51, + "learning_rate": 9.711467515824627e-08, + "loss": 0.0005, + "step": 26544 + }, + { + "epoch": 0.51, + "learning_rate": 9.711079181391013e-08, + "loss": 0.0007, + "step": 26545 + }, + { + "epoch": 0.51, + "learning_rate": 9.710690846957399e-08, + "loss": 0.0005, + "step": 26546 + }, + { + "epoch": 0.51, + "learning_rate": 9.710302512523785e-08, + "loss": 0.4368, + "step": 26547 + }, + { + "epoch": 0.51, + "learning_rate": 9.709914178090171e-08, + "loss": 0.0009, + "step": 26548 + }, + { + "epoch": 0.51, + "learning_rate": 9.709525843656557e-08, + "loss": 0.0497, + "step": 26549 + }, + { + "epoch": 0.52, + "learning_rate": 9.709137509222942e-08, + "loss": 0.0004, + "step": 26550 + }, + { + "epoch": 0.52, + "learning_rate": 9.708749174789328e-08, + "loss": 1.2381, + "step": 26551 + }, + { + "epoch": 0.52, + "learning_rate": 9.708360840355714e-08, + "loss": 0.0008, + "step": 26552 + }, + { + "epoch": 0.52, + "learning_rate": 9.7079725059221e-08, + "loss": 0.0005, + "step": 26553 + }, + { + "epoch": 0.52, + "learning_rate": 9.707584171488486e-08, + "loss": 0.0036, + "step": 26554 + }, + { + "epoch": 0.52, + "learning_rate": 9.707195837054871e-08, + "loss": 0.0006, + "step": 26555 + }, + { + "epoch": 0.52, + "learning_rate": 9.706807502621257e-08, + "loss": 0.0007, + "step": 26556 + }, + { + "epoch": 0.52, + "learning_rate": 9.706419168187643e-08, + "loss": 0.0012, + "step": 26557 + }, + { + "epoch": 0.52, + "learning_rate": 9.706030833754029e-08, + "loss": 0.0006, + "step": 26558 + }, + { + "epoch": 0.52, + "learning_rate": 9.705642499320415e-08, + "loss": 0.0006, + "step": 26559 + }, + { + "epoch": 0.52, + "learning_rate": 9.7052541648868e-08, + "loss": 0.5198, + "step": 26560 + }, + { + "epoch": 0.52, + "learning_rate": 9.704865830453186e-08, + "loss": 0.1795, + "step": 26561 + }, + { + "epoch": 0.52, + "learning_rate": 9.704477496019572e-08, + "loss": 0.0003, + "step": 26562 + }, + { + "epoch": 0.52, + "learning_rate": 9.704089161585958e-08, + "loss": 0.5634, + "step": 26563 + }, + { + "epoch": 0.52, + "learning_rate": 9.703700827152344e-08, + "loss": 0.4547, + "step": 26564 + }, + { + "epoch": 0.52, + "learning_rate": 9.70331249271873e-08, + "loss": 0.0005, + "step": 26565 + }, + { + "epoch": 0.52, + "learning_rate": 9.702924158285116e-08, + "loss": 0.0632, + "step": 26566 + }, + { + "epoch": 0.52, + "learning_rate": 9.702535823851501e-08, + "loss": 0.0005, + "step": 26567 + }, + { + "epoch": 0.52, + "learning_rate": 9.702147489417887e-08, + "loss": 0.0008, + "step": 26568 + }, + { + "epoch": 0.52, + "learning_rate": 9.701759154984273e-08, + "loss": 0.0005, + "step": 26569 + }, + { + "epoch": 0.52, + "learning_rate": 9.701370820550658e-08, + "loss": 0.0005, + "step": 26570 + }, + { + "epoch": 0.52, + "learning_rate": 9.700982486117043e-08, + "loss": 0.0005, + "step": 26571 + }, + { + "epoch": 0.52, + "learning_rate": 9.700594151683429e-08, + "loss": 0.0005, + "step": 26572 + }, + { + "epoch": 0.52, + "learning_rate": 9.700205817249815e-08, + "loss": 0.0898, + "step": 26573 + }, + { + "epoch": 0.52, + "learning_rate": 9.699817482816201e-08, + "loss": 0.0005, + "step": 26574 + }, + { + "epoch": 0.52, + "learning_rate": 9.699429148382587e-08, + "loss": 0.0004, + "step": 26575 + }, + { + "epoch": 0.52, + "learning_rate": 9.699040813948972e-08, + "loss": 0.0004, + "step": 26576 + }, + { + "epoch": 0.52, + "learning_rate": 9.698652479515358e-08, + "loss": 0.0006, + "step": 26577 + }, + { + "epoch": 0.52, + "learning_rate": 9.698264145081744e-08, + "loss": 0.0004, + "step": 26578 + }, + { + "epoch": 0.52, + "learning_rate": 9.69787581064813e-08, + "loss": 0.0459, + "step": 26579 + }, + { + "epoch": 0.52, + "learning_rate": 9.697487476214516e-08, + "loss": 0.0004, + "step": 26580 + }, + { + "epoch": 0.52, + "learning_rate": 9.697099141780902e-08, + "loss": 0.0007, + "step": 26581 + }, + { + "epoch": 0.52, + "learning_rate": 9.696710807347287e-08, + "loss": 0.0007, + "step": 26582 + }, + { + "epoch": 0.52, + "learning_rate": 9.696322472913673e-08, + "loss": 0.0148, + "step": 26583 + }, + { + "epoch": 0.52, + "learning_rate": 9.695934138480059e-08, + "loss": 0.0005, + "step": 26584 + }, + { + "epoch": 0.52, + "learning_rate": 9.695545804046445e-08, + "loss": 0.0006, + "step": 26585 + }, + { + "epoch": 0.52, + "learning_rate": 9.695157469612831e-08, + "loss": 0.966, + "step": 26586 + }, + { + "epoch": 0.52, + "learning_rate": 9.694769135179217e-08, + "loss": 0.0022, + "step": 26587 + }, + { + "epoch": 0.52, + "learning_rate": 9.694380800745602e-08, + "loss": 0.0004, + "step": 26588 + }, + { + "epoch": 0.52, + "learning_rate": 9.693992466311988e-08, + "loss": 0.0005, + "step": 26589 + }, + { + "epoch": 0.52, + "learning_rate": 9.693604131878374e-08, + "loss": 0.0005, + "step": 26590 + }, + { + "epoch": 0.52, + "learning_rate": 9.69321579744476e-08, + "loss": 0.0155, + "step": 26591 + }, + { + "epoch": 0.52, + "learning_rate": 9.692827463011146e-08, + "loss": 0.0007, + "step": 26592 + }, + { + "epoch": 0.52, + "learning_rate": 9.692439128577531e-08, + "loss": 0.0011, + "step": 26593 + }, + { + "epoch": 0.52, + "learning_rate": 9.692050794143917e-08, + "loss": 0.0005, + "step": 26594 + }, + { + "epoch": 0.52, + "learning_rate": 9.691662459710303e-08, + "loss": 0.0006, + "step": 26595 + }, + { + "epoch": 0.52, + "learning_rate": 9.691274125276689e-08, + "loss": 0.0009, + "step": 26596 + }, + { + "epoch": 0.52, + "learning_rate": 9.690885790843075e-08, + "loss": 0.0005, + "step": 26597 + }, + { + "epoch": 0.52, + "learning_rate": 9.690497456409459e-08, + "loss": 0.0006, + "step": 26598 + }, + { + "epoch": 0.52, + "learning_rate": 9.690109121975845e-08, + "loss": 0.0004, + "step": 26599 + }, + { + "epoch": 0.52, + "learning_rate": 9.689720787542231e-08, + "loss": 0.0012, + "step": 26600 + }, + { + "epoch": 0.52, + "learning_rate": 9.689332453108617e-08, + "loss": 0.0005, + "step": 26601 + }, + { + "epoch": 0.52, + "learning_rate": 9.688944118675003e-08, + "loss": 0.0006, + "step": 26602 + }, + { + "epoch": 0.52, + "learning_rate": 9.688555784241388e-08, + "loss": 0.0006, + "step": 26603 + }, + { + "epoch": 0.52, + "learning_rate": 9.688167449807774e-08, + "loss": 0.0297, + "step": 26604 + }, + { + "epoch": 0.52, + "learning_rate": 9.68777911537416e-08, + "loss": 0.0009, + "step": 26605 + }, + { + "epoch": 0.52, + "learning_rate": 9.687390780940546e-08, + "loss": 0.0005, + "step": 26606 + }, + { + "epoch": 0.52, + "learning_rate": 9.687002446506932e-08, + "loss": 0.0005, + "step": 26607 + }, + { + "epoch": 0.52, + "learning_rate": 9.686614112073318e-08, + "loss": 0.0009, + "step": 26608 + }, + { + "epoch": 0.52, + "learning_rate": 9.686225777639703e-08, + "loss": 0.0023, + "step": 26609 + }, + { + "epoch": 0.52, + "learning_rate": 9.685837443206089e-08, + "loss": 0.0005, + "step": 26610 + }, + { + "epoch": 0.52, + "learning_rate": 9.685449108772475e-08, + "loss": 0.9049, + "step": 26611 + }, + { + "epoch": 0.52, + "learning_rate": 9.685060774338861e-08, + "loss": 1.2178, + "step": 26612 + }, + { + "epoch": 0.52, + "learning_rate": 9.684672439905245e-08, + "loss": 0.0006, + "step": 26613 + }, + { + "epoch": 0.52, + "learning_rate": 9.684284105471631e-08, + "loss": 0.0004, + "step": 26614 + }, + { + "epoch": 0.52, + "learning_rate": 9.683895771038017e-08, + "loss": 0.0066, + "step": 26615 + }, + { + "epoch": 0.52, + "learning_rate": 9.683507436604403e-08, + "loss": 0.0008, + "step": 26616 + }, + { + "epoch": 0.52, + "learning_rate": 9.683119102170789e-08, + "loss": 1.1375, + "step": 26617 + }, + { + "epoch": 0.52, + "learning_rate": 9.682730767737174e-08, + "loss": 0.0005, + "step": 26618 + }, + { + "epoch": 0.52, + "learning_rate": 9.68234243330356e-08, + "loss": 0.0006, + "step": 26619 + }, + { + "epoch": 0.52, + "learning_rate": 9.681954098869946e-08, + "loss": 0.0004, + "step": 26620 + }, + { + "epoch": 0.52, + "learning_rate": 9.681565764436332e-08, + "loss": 0.3875, + "step": 26621 + }, + { + "epoch": 0.52, + "learning_rate": 9.681177430002718e-08, + "loss": 0.0005, + "step": 26622 + }, + { + "epoch": 0.52, + "learning_rate": 9.680789095569104e-08, + "loss": 0.0007, + "step": 26623 + }, + { + "epoch": 0.52, + "learning_rate": 9.68040076113549e-08, + "loss": 0.0005, + "step": 26624 + }, + { + "epoch": 0.52, + "learning_rate": 9.680012426701875e-08, + "loss": 0.0006, + "step": 26625 + }, + { + "epoch": 0.52, + "learning_rate": 9.679624092268261e-08, + "loss": 0.0006, + "step": 26626 + }, + { + "epoch": 0.52, + "learning_rate": 9.679235757834647e-08, + "loss": 0.0006, + "step": 26627 + }, + { + "epoch": 0.52, + "learning_rate": 9.678847423401031e-08, + "loss": 0.0007, + "step": 26628 + }, + { + "epoch": 0.52, + "learning_rate": 9.678459088967417e-08, + "loss": 0.0013, + "step": 26629 + }, + { + "epoch": 0.52, + "learning_rate": 9.678070754533803e-08, + "loss": 0.0013, + "step": 26630 + }, + { + "epoch": 0.52, + "learning_rate": 9.677682420100189e-08, + "loss": 0.0009, + "step": 26631 + }, + { + "epoch": 0.52, + "learning_rate": 9.677294085666575e-08, + "loss": 0.0007, + "step": 26632 + }, + { + "epoch": 0.52, + "learning_rate": 9.67690575123296e-08, + "loss": 0.0006, + "step": 26633 + }, + { + "epoch": 0.52, + "learning_rate": 9.676517416799346e-08, + "loss": 0.0006, + "step": 26634 + }, + { + "epoch": 0.52, + "learning_rate": 9.676129082365732e-08, + "loss": 0.1432, + "step": 26635 + }, + { + "epoch": 0.52, + "learning_rate": 9.675740747932118e-08, + "loss": 0.0006, + "step": 26636 + }, + { + "epoch": 0.52, + "learning_rate": 9.675352413498504e-08, + "loss": 0.0004, + "step": 26637 + }, + { + "epoch": 0.52, + "learning_rate": 9.67496407906489e-08, + "loss": 0.0005, + "step": 26638 + }, + { + "epoch": 0.52, + "learning_rate": 9.674575744631275e-08, + "loss": 0.4346, + "step": 26639 + }, + { + "epoch": 0.52, + "learning_rate": 9.674187410197661e-08, + "loss": 0.0004, + "step": 26640 + }, + { + "epoch": 0.52, + "learning_rate": 9.673799075764047e-08, + "loss": 0.0004, + "step": 26641 + }, + { + "epoch": 0.52, + "learning_rate": 9.673410741330433e-08, + "loss": 0.0018, + "step": 26642 + }, + { + "epoch": 0.52, + "learning_rate": 9.673022406896819e-08, + "loss": 0.9896, + "step": 26643 + }, + { + "epoch": 0.52, + "learning_rate": 9.672634072463205e-08, + "loss": 0.0005, + "step": 26644 + }, + { + "epoch": 0.52, + "learning_rate": 9.67224573802959e-08, + "loss": 0.0004, + "step": 26645 + }, + { + "epoch": 0.52, + "learning_rate": 9.671857403595976e-08, + "loss": 0.0005, + "step": 26646 + }, + { + "epoch": 0.52, + "learning_rate": 9.671469069162362e-08, + "loss": 0.0007, + "step": 26647 + }, + { + "epoch": 0.52, + "learning_rate": 9.671080734728748e-08, + "loss": 0.0005, + "step": 26648 + }, + { + "epoch": 0.52, + "learning_rate": 9.670692400295134e-08, + "loss": 0.0007, + "step": 26649 + }, + { + "epoch": 0.52, + "learning_rate": 9.67030406586152e-08, + "loss": 0.0009, + "step": 26650 + }, + { + "epoch": 0.52, + "learning_rate": 9.669915731427905e-08, + "loss": 1.2749, + "step": 26651 + }, + { + "epoch": 0.52, + "learning_rate": 9.669527396994291e-08, + "loss": 0.0008, + "step": 26652 + }, + { + "epoch": 0.52, + "learning_rate": 9.669139062560677e-08, + "loss": 1.5479, + "step": 26653 + }, + { + "epoch": 0.52, + "learning_rate": 9.668750728127063e-08, + "loss": 0.0005, + "step": 26654 + }, + { + "epoch": 0.52, + "learning_rate": 9.668362393693449e-08, + "loss": 0.0006, + "step": 26655 + }, + { + "epoch": 0.52, + "learning_rate": 9.667974059259834e-08, + "loss": 0.0074, + "step": 26656 + }, + { + "epoch": 0.52, + "learning_rate": 9.667585724826219e-08, + "loss": 0.0534, + "step": 26657 + }, + { + "epoch": 0.52, + "learning_rate": 9.667197390392605e-08, + "loss": 0.0006, + "step": 26658 + }, + { + "epoch": 0.52, + "learning_rate": 9.66680905595899e-08, + "loss": 0.0005, + "step": 26659 + }, + { + "epoch": 0.52, + "learning_rate": 9.666420721525376e-08, + "loss": 0.0006, + "step": 26660 + }, + { + "epoch": 0.52, + "learning_rate": 9.666032387091762e-08, + "loss": 0.002, + "step": 26661 + }, + { + "epoch": 0.52, + "learning_rate": 9.665644052658148e-08, + "loss": 0.0006, + "step": 26662 + }, + { + "epoch": 0.52, + "learning_rate": 9.665255718224534e-08, + "loss": 0.0014, + "step": 26663 + }, + { + "epoch": 0.52, + "learning_rate": 9.66486738379092e-08, + "loss": 0.0007, + "step": 26664 + }, + { + "epoch": 0.52, + "learning_rate": 9.664479049357306e-08, + "loss": 0.0005, + "step": 26665 + }, + { + "epoch": 0.52, + "learning_rate": 9.664090714923691e-08, + "loss": 0.0005, + "step": 26666 + }, + { + "epoch": 0.52, + "learning_rate": 9.663702380490077e-08, + "loss": 0.0023, + "step": 26667 + }, + { + "epoch": 0.52, + "learning_rate": 9.663314046056463e-08, + "loss": 1.2213, + "step": 26668 + }, + { + "epoch": 0.52, + "learning_rate": 9.662925711622849e-08, + "loss": 0.001, + "step": 26669 + }, + { + "epoch": 0.52, + "learning_rate": 9.662537377189235e-08, + "loss": 1.0976, + "step": 26670 + }, + { + "epoch": 0.52, + "learning_rate": 9.66214904275562e-08, + "loss": 0.0006, + "step": 26671 + }, + { + "epoch": 0.52, + "learning_rate": 9.661760708322006e-08, + "loss": 0.0007, + "step": 26672 + }, + { + "epoch": 0.52, + "learning_rate": 9.661372373888392e-08, + "loss": 0.0005, + "step": 26673 + }, + { + "epoch": 0.52, + "learning_rate": 9.660984039454778e-08, + "loss": 0.0005, + "step": 26674 + }, + { + "epoch": 0.52, + "learning_rate": 9.660595705021164e-08, + "loss": 0.2774, + "step": 26675 + }, + { + "epoch": 0.52, + "learning_rate": 9.66020737058755e-08, + "loss": 0.0007, + "step": 26676 + }, + { + "epoch": 0.52, + "learning_rate": 9.659819036153935e-08, + "loss": 0.0005, + "step": 26677 + }, + { + "epoch": 0.52, + "learning_rate": 9.659430701720321e-08, + "loss": 0.0008, + "step": 26678 + }, + { + "epoch": 0.52, + "learning_rate": 9.659042367286707e-08, + "loss": 0.0005, + "step": 26679 + }, + { + "epoch": 0.52, + "learning_rate": 9.658654032853093e-08, + "loss": 0.0011, + "step": 26680 + }, + { + "epoch": 0.52, + "learning_rate": 9.658265698419479e-08, + "loss": 0.0126, + "step": 26681 + }, + { + "epoch": 0.52, + "learning_rate": 9.657877363985865e-08, + "loss": 0.0005, + "step": 26682 + }, + { + "epoch": 0.52, + "learning_rate": 9.65748902955225e-08, + "loss": 0.0026, + "step": 26683 + }, + { + "epoch": 0.52, + "learning_rate": 9.657100695118636e-08, + "loss": 0.0006, + "step": 26684 + }, + { + "epoch": 0.52, + "learning_rate": 9.656712360685022e-08, + "loss": 0.0006, + "step": 26685 + }, + { + "epoch": 0.52, + "learning_rate": 9.656324026251407e-08, + "loss": 0.0005, + "step": 26686 + }, + { + "epoch": 0.52, + "learning_rate": 9.655935691817792e-08, + "loss": 0.0005, + "step": 26687 + }, + { + "epoch": 0.52, + "learning_rate": 9.655547357384178e-08, + "loss": 0.0039, + "step": 26688 + }, + { + "epoch": 0.52, + "learning_rate": 9.655159022950564e-08, + "loss": 0.0007, + "step": 26689 + }, + { + "epoch": 0.52, + "learning_rate": 9.65477068851695e-08, + "loss": 0.0004, + "step": 26690 + }, + { + "epoch": 0.52, + "learning_rate": 9.654382354083336e-08, + "loss": 0.0112, + "step": 26691 + }, + { + "epoch": 0.52, + "learning_rate": 9.653994019649721e-08, + "loss": 0.0005, + "step": 26692 + }, + { + "epoch": 0.52, + "learning_rate": 9.653605685216107e-08, + "loss": 0.0003, + "step": 26693 + }, + { + "epoch": 0.52, + "learning_rate": 9.653217350782493e-08, + "loss": 0.0007, + "step": 26694 + }, + { + "epoch": 0.52, + "learning_rate": 9.652829016348879e-08, + "loss": 0.003, + "step": 26695 + }, + { + "epoch": 0.52, + "learning_rate": 9.652440681915265e-08, + "loss": 0.001, + "step": 26696 + }, + { + "epoch": 0.52, + "learning_rate": 9.65205234748165e-08, + "loss": 0.0006, + "step": 26697 + }, + { + "epoch": 0.52, + "learning_rate": 9.651664013048036e-08, + "loss": 0.0005, + "step": 26698 + }, + { + "epoch": 0.52, + "learning_rate": 9.651275678614422e-08, + "loss": 1.0817, + "step": 26699 + }, + { + "epoch": 0.52, + "learning_rate": 9.650887344180808e-08, + "loss": 0.0007, + "step": 26700 + }, + { + "epoch": 0.52, + "learning_rate": 9.650499009747194e-08, + "loss": 0.0006, + "step": 26701 + }, + { + "epoch": 0.52, + "learning_rate": 9.65011067531358e-08, + "loss": 0.0006, + "step": 26702 + }, + { + "epoch": 0.52, + "learning_rate": 9.649722340879966e-08, + "loss": 0.0006, + "step": 26703 + }, + { + "epoch": 0.52, + "learning_rate": 9.649334006446351e-08, + "loss": 0.0057, + "step": 26704 + }, + { + "epoch": 0.52, + "learning_rate": 9.648945672012737e-08, + "loss": 0.0004, + "step": 26705 + }, + { + "epoch": 0.52, + "learning_rate": 9.648557337579123e-08, + "loss": 0.0008, + "step": 26706 + }, + { + "epoch": 0.52, + "learning_rate": 9.648169003145509e-08, + "loss": 0.0027, + "step": 26707 + }, + { + "epoch": 0.52, + "learning_rate": 9.647780668711895e-08, + "loss": 0.0005, + "step": 26708 + }, + { + "epoch": 0.52, + "learning_rate": 9.64739233427828e-08, + "loss": 0.0007, + "step": 26709 + }, + { + "epoch": 0.52, + "learning_rate": 9.647003999844666e-08, + "loss": 0.0008, + "step": 26710 + }, + { + "epoch": 0.52, + "learning_rate": 9.646615665411052e-08, + "loss": 0.0005, + "step": 26711 + }, + { + "epoch": 0.52, + "learning_rate": 9.646227330977438e-08, + "loss": 0.0005, + "step": 26712 + }, + { + "epoch": 0.52, + "learning_rate": 9.645838996543824e-08, + "loss": 0.0005, + "step": 26713 + }, + { + "epoch": 0.52, + "learning_rate": 9.64545066211021e-08, + "loss": 0.0006, + "step": 26714 + }, + { + "epoch": 0.52, + "learning_rate": 9.645062327676594e-08, + "loss": 0.0006, + "step": 26715 + }, + { + "epoch": 0.52, + "learning_rate": 9.64467399324298e-08, + "loss": 0.0005, + "step": 26716 + }, + { + "epoch": 0.52, + "learning_rate": 9.644285658809366e-08, + "loss": 0.0323, + "step": 26717 + }, + { + "epoch": 0.52, + "learning_rate": 9.643897324375752e-08, + "loss": 0.0024, + "step": 26718 + }, + { + "epoch": 0.52, + "learning_rate": 9.643508989942137e-08, + "loss": 0.0014, + "step": 26719 + }, + { + "epoch": 0.52, + "learning_rate": 9.643120655508523e-08, + "loss": 0.0022, + "step": 26720 + }, + { + "epoch": 0.52, + "learning_rate": 9.642732321074909e-08, + "loss": 0.0004, + "step": 26721 + }, + { + "epoch": 0.52, + "learning_rate": 9.642343986641295e-08, + "loss": 0.0036, + "step": 26722 + }, + { + "epoch": 0.52, + "learning_rate": 9.641955652207681e-08, + "loss": 0.0004, + "step": 26723 + }, + { + "epoch": 0.52, + "learning_rate": 9.641567317774067e-08, + "loss": 0.518, + "step": 26724 + }, + { + "epoch": 0.52, + "learning_rate": 9.641178983340452e-08, + "loss": 0.0008, + "step": 26725 + }, + { + "epoch": 0.52, + "learning_rate": 9.640790648906838e-08, + "loss": 0.0006, + "step": 26726 + }, + { + "epoch": 0.52, + "learning_rate": 9.640402314473224e-08, + "loss": 0.0007, + "step": 26727 + }, + { + "epoch": 0.52, + "learning_rate": 9.64001398003961e-08, + "loss": 0.0006, + "step": 26728 + }, + { + "epoch": 0.52, + "learning_rate": 9.639625645605996e-08, + "loss": 0.5504, + "step": 26729 + }, + { + "epoch": 0.52, + "learning_rate": 9.639237311172381e-08, + "loss": 0.001, + "step": 26730 + }, + { + "epoch": 0.52, + "learning_rate": 9.638848976738767e-08, + "loss": 0.0005, + "step": 26731 + }, + { + "epoch": 0.52, + "learning_rate": 9.638460642305153e-08, + "loss": 0.0251, + "step": 26732 + }, + { + "epoch": 0.52, + "learning_rate": 9.638072307871539e-08, + "loss": 0.0006, + "step": 26733 + }, + { + "epoch": 0.52, + "learning_rate": 9.637683973437925e-08, + "loss": 0.0005, + "step": 26734 + }, + { + "epoch": 0.52, + "learning_rate": 9.63729563900431e-08, + "loss": 0.0003, + "step": 26735 + }, + { + "epoch": 0.52, + "learning_rate": 9.636907304570696e-08, + "loss": 0.004, + "step": 26736 + }, + { + "epoch": 0.52, + "learning_rate": 9.636518970137082e-08, + "loss": 0.0004, + "step": 26737 + }, + { + "epoch": 0.52, + "learning_rate": 9.636130635703468e-08, + "loss": 1.0339, + "step": 26738 + }, + { + "epoch": 0.52, + "learning_rate": 9.635742301269854e-08, + "loss": 0.0011, + "step": 26739 + }, + { + "epoch": 0.52, + "learning_rate": 9.63535396683624e-08, + "loss": 0.118, + "step": 26740 + }, + { + "epoch": 0.52, + "learning_rate": 9.634965632402626e-08, + "loss": 0.0008, + "step": 26741 + }, + { + "epoch": 0.52, + "learning_rate": 9.634577297969011e-08, + "loss": 0.0007, + "step": 26742 + }, + { + "epoch": 0.52, + "learning_rate": 9.634188963535397e-08, + "loss": 0.0007, + "step": 26743 + }, + { + "epoch": 0.52, + "learning_rate": 9.633800629101782e-08, + "loss": 0.0004, + "step": 26744 + }, + { + "epoch": 0.52, + "learning_rate": 9.633412294668168e-08, + "loss": 0.0006, + "step": 26745 + }, + { + "epoch": 0.52, + "learning_rate": 9.633023960234553e-08, + "loss": 0.0005, + "step": 26746 + }, + { + "epoch": 0.52, + "learning_rate": 9.632635625800939e-08, + "loss": 0.0005, + "step": 26747 + }, + { + "epoch": 0.52, + "learning_rate": 9.632247291367325e-08, + "loss": 0.8456, + "step": 26748 + }, + { + "epoch": 0.52, + "learning_rate": 9.631858956933711e-08, + "loss": 0.0007, + "step": 26749 + }, + { + "epoch": 0.52, + "learning_rate": 9.631470622500097e-08, + "loss": 0.0004, + "step": 26750 + }, + { + "epoch": 0.52, + "learning_rate": 9.631082288066482e-08, + "loss": 0.0006, + "step": 26751 + }, + { + "epoch": 0.52, + "learning_rate": 9.630693953632868e-08, + "loss": 0.0006, + "step": 26752 + }, + { + "epoch": 0.52, + "learning_rate": 9.630305619199254e-08, + "loss": 0.001, + "step": 26753 + }, + { + "epoch": 0.52, + "learning_rate": 9.62991728476564e-08, + "loss": 0.0005, + "step": 26754 + }, + { + "epoch": 0.52, + "learning_rate": 9.629528950332026e-08, + "loss": 0.0004, + "step": 26755 + }, + { + "epoch": 0.52, + "learning_rate": 9.629140615898412e-08, + "loss": 0.0006, + "step": 26756 + }, + { + "epoch": 0.52, + "learning_rate": 9.628752281464797e-08, + "loss": 0.0005, + "step": 26757 + }, + { + "epoch": 0.52, + "learning_rate": 9.628363947031183e-08, + "loss": 0.0004, + "step": 26758 + }, + { + "epoch": 0.52, + "learning_rate": 9.627975612597569e-08, + "loss": 0.0016, + "step": 26759 + }, + { + "epoch": 0.52, + "learning_rate": 9.627587278163955e-08, + "loss": 0.0006, + "step": 26760 + }, + { + "epoch": 0.52, + "learning_rate": 9.627198943730341e-08, + "loss": 0.0005, + "step": 26761 + }, + { + "epoch": 0.52, + "learning_rate": 9.626810609296727e-08, + "loss": 0.3211, + "step": 26762 + }, + { + "epoch": 0.52, + "learning_rate": 9.626422274863112e-08, + "loss": 0.7928, + "step": 26763 + }, + { + "epoch": 0.52, + "learning_rate": 9.626033940429498e-08, + "loss": 0.0004, + "step": 26764 + }, + { + "epoch": 0.52, + "learning_rate": 9.625645605995884e-08, + "loss": 0.0006, + "step": 26765 + }, + { + "epoch": 0.52, + "learning_rate": 9.62525727156227e-08, + "loss": 0.4866, + "step": 26766 + }, + { + "epoch": 0.52, + "learning_rate": 9.624868937128656e-08, + "loss": 0.0013, + "step": 26767 + }, + { + "epoch": 0.52, + "learning_rate": 9.624480602695041e-08, + "loss": 0.0006, + "step": 26768 + }, + { + "epoch": 0.52, + "learning_rate": 9.624092268261427e-08, + "loss": 0.0006, + "step": 26769 + }, + { + "epoch": 0.52, + "learning_rate": 9.623703933827813e-08, + "loss": 0.0007, + "step": 26770 + }, + { + "epoch": 0.52, + "learning_rate": 9.623315599394199e-08, + "loss": 0.0006, + "step": 26771 + }, + { + "epoch": 0.52, + "learning_rate": 9.622927264960585e-08, + "loss": 0.0006, + "step": 26772 + }, + { + "epoch": 0.52, + "learning_rate": 9.622538930526969e-08, + "loss": 0.0006, + "step": 26773 + }, + { + "epoch": 0.52, + "learning_rate": 9.622150596093355e-08, + "loss": 0.0006, + "step": 26774 + }, + { + "epoch": 0.52, + "learning_rate": 9.621762261659741e-08, + "loss": 0.0004, + "step": 26775 + }, + { + "epoch": 0.52, + "learning_rate": 9.621373927226127e-08, + "loss": 0.0005, + "step": 26776 + }, + { + "epoch": 0.52, + "learning_rate": 9.620985592792513e-08, + "loss": 0.0004, + "step": 26777 + }, + { + "epoch": 0.52, + "learning_rate": 9.620597258358898e-08, + "loss": 0.781, + "step": 26778 + }, + { + "epoch": 0.52, + "learning_rate": 9.620208923925284e-08, + "loss": 0.0005, + "step": 26779 + }, + { + "epoch": 0.52, + "learning_rate": 9.61982058949167e-08, + "loss": 0.0005, + "step": 26780 + }, + { + "epoch": 0.52, + "learning_rate": 9.619432255058056e-08, + "loss": 0.0006, + "step": 26781 + }, + { + "epoch": 0.52, + "learning_rate": 9.619043920624442e-08, + "loss": 0.6946, + "step": 26782 + }, + { + "epoch": 0.52, + "learning_rate": 9.618655586190828e-08, + "loss": 0.0006, + "step": 26783 + }, + { + "epoch": 0.52, + "learning_rate": 9.618267251757213e-08, + "loss": 0.0006, + "step": 26784 + }, + { + "epoch": 0.52, + "learning_rate": 9.617878917323599e-08, + "loss": 0.0004, + "step": 26785 + }, + { + "epoch": 0.52, + "learning_rate": 9.617490582889985e-08, + "loss": 0.0005, + "step": 26786 + }, + { + "epoch": 0.52, + "learning_rate": 9.617102248456371e-08, + "loss": 0.0005, + "step": 26787 + }, + { + "epoch": 0.52, + "learning_rate": 9.616713914022757e-08, + "loss": 0.0005, + "step": 26788 + }, + { + "epoch": 0.52, + "learning_rate": 9.616325579589142e-08, + "loss": 0.0007, + "step": 26789 + }, + { + "epoch": 0.52, + "learning_rate": 9.615937245155527e-08, + "loss": 0.0007, + "step": 26790 + }, + { + "epoch": 0.52, + "learning_rate": 9.615548910721913e-08, + "loss": 0.1451, + "step": 26791 + }, + { + "epoch": 0.52, + "learning_rate": 9.615160576288299e-08, + "loss": 0.0023, + "step": 26792 + }, + { + "epoch": 0.52, + "learning_rate": 9.614772241854684e-08, + "loss": 0.0008, + "step": 26793 + }, + { + "epoch": 0.52, + "learning_rate": 9.61438390742107e-08, + "loss": 0.0006, + "step": 26794 + }, + { + "epoch": 0.52, + "learning_rate": 9.613995572987456e-08, + "loss": 0.0005, + "step": 26795 + }, + { + "epoch": 0.52, + "learning_rate": 9.613607238553842e-08, + "loss": 0.0007, + "step": 26796 + }, + { + "epoch": 0.52, + "learning_rate": 9.613218904120228e-08, + "loss": 0.0016, + "step": 26797 + }, + { + "epoch": 0.52, + "learning_rate": 9.612830569686614e-08, + "loss": 0.4389, + "step": 26798 + }, + { + "epoch": 0.52, + "learning_rate": 9.612442235253e-08, + "loss": 0.0006, + "step": 26799 + }, + { + "epoch": 0.52, + "learning_rate": 9.612053900819385e-08, + "loss": 0.0019, + "step": 26800 + }, + { + "epoch": 0.52, + "learning_rate": 9.611665566385771e-08, + "loss": 0.0006, + "step": 26801 + }, + { + "epoch": 0.52, + "learning_rate": 9.611277231952157e-08, + "loss": 0.0225, + "step": 26802 + }, + { + "epoch": 0.52, + "learning_rate": 9.610888897518543e-08, + "loss": 0.0006, + "step": 26803 + }, + { + "epoch": 0.52, + "learning_rate": 9.610500563084927e-08, + "loss": 0.0392, + "step": 26804 + }, + { + "epoch": 0.52, + "learning_rate": 9.610112228651313e-08, + "loss": 0.0006, + "step": 26805 + }, + { + "epoch": 0.52, + "learning_rate": 9.609723894217699e-08, + "loss": 0.007, + "step": 26806 + }, + { + "epoch": 0.52, + "learning_rate": 9.609335559784085e-08, + "loss": 0.0005, + "step": 26807 + }, + { + "epoch": 0.52, + "learning_rate": 9.60894722535047e-08, + "loss": 0.0005, + "step": 26808 + }, + { + "epoch": 0.52, + "learning_rate": 9.608558890916856e-08, + "loss": 0.0006, + "step": 26809 + }, + { + "epoch": 0.52, + "learning_rate": 9.608170556483242e-08, + "loss": 0.0014, + "step": 26810 + }, + { + "epoch": 0.52, + "learning_rate": 9.607782222049628e-08, + "loss": 0.0006, + "step": 26811 + }, + { + "epoch": 0.52, + "learning_rate": 9.607393887616014e-08, + "loss": 0.0007, + "step": 26812 + }, + { + "epoch": 0.52, + "learning_rate": 9.6070055531824e-08, + "loss": 0.0004, + "step": 26813 + }, + { + "epoch": 0.52, + "learning_rate": 9.606617218748785e-08, + "loss": 0.8853, + "step": 26814 + }, + { + "epoch": 0.52, + "learning_rate": 9.606228884315171e-08, + "loss": 0.0522, + "step": 26815 + }, + { + "epoch": 0.52, + "learning_rate": 9.605840549881557e-08, + "loss": 0.0005, + "step": 26816 + }, + { + "epoch": 0.52, + "learning_rate": 9.605452215447943e-08, + "loss": 0.0004, + "step": 26817 + }, + { + "epoch": 0.52, + "learning_rate": 9.605063881014329e-08, + "loss": 0.0006, + "step": 26818 + }, + { + "epoch": 0.52, + "learning_rate": 9.604675546580715e-08, + "loss": 0.0019, + "step": 26819 + }, + { + "epoch": 0.52, + "learning_rate": 9.6042872121471e-08, + "loss": 0.0133, + "step": 26820 + }, + { + "epoch": 0.52, + "learning_rate": 9.603898877713486e-08, + "loss": 0.1681, + "step": 26821 + }, + { + "epoch": 0.52, + "learning_rate": 9.603510543279872e-08, + "loss": 0.0028, + "step": 26822 + }, + { + "epoch": 0.52, + "learning_rate": 9.603122208846258e-08, + "loss": 0.0009, + "step": 26823 + }, + { + "epoch": 0.52, + "learning_rate": 9.602733874412644e-08, + "loss": 0.0005, + "step": 26824 + }, + { + "epoch": 0.52, + "learning_rate": 9.60234553997903e-08, + "loss": 0.0009, + "step": 26825 + }, + { + "epoch": 0.52, + "learning_rate": 9.601957205545415e-08, + "loss": 0.0006, + "step": 26826 + }, + { + "epoch": 0.52, + "learning_rate": 9.601568871111801e-08, + "loss": 0.0009, + "step": 26827 + }, + { + "epoch": 0.52, + "learning_rate": 9.601180536678187e-08, + "loss": 0.3515, + "step": 26828 + }, + { + "epoch": 0.52, + "learning_rate": 9.600792202244573e-08, + "loss": 1.0089, + "step": 26829 + }, + { + "epoch": 0.52, + "learning_rate": 9.600403867810959e-08, + "loss": 0.0078, + "step": 26830 + }, + { + "epoch": 0.52, + "learning_rate": 9.600015533377343e-08, + "loss": 0.0006, + "step": 26831 + }, + { + "epoch": 0.52, + "learning_rate": 9.599627198943729e-08, + "loss": 0.0006, + "step": 26832 + }, + { + "epoch": 0.52, + "learning_rate": 9.599238864510115e-08, + "loss": 0.666, + "step": 26833 + }, + { + "epoch": 0.52, + "learning_rate": 9.5988505300765e-08, + "loss": 0.0005, + "step": 26834 + }, + { + "epoch": 0.52, + "learning_rate": 9.598462195642886e-08, + "loss": 0.0005, + "step": 26835 + }, + { + "epoch": 0.52, + "learning_rate": 9.598073861209272e-08, + "loss": 0.0008, + "step": 26836 + }, + { + "epoch": 0.52, + "learning_rate": 9.597685526775658e-08, + "loss": 0.0006, + "step": 26837 + }, + { + "epoch": 0.52, + "learning_rate": 9.597297192342044e-08, + "loss": 0.0005, + "step": 26838 + }, + { + "epoch": 0.52, + "learning_rate": 9.59690885790843e-08, + "loss": 0.0006, + "step": 26839 + }, + { + "epoch": 0.52, + "learning_rate": 9.596520523474816e-08, + "loss": 0.0005, + "step": 26840 + }, + { + "epoch": 0.52, + "learning_rate": 9.596132189041201e-08, + "loss": 0.0005, + "step": 26841 + }, + { + "epoch": 0.52, + "learning_rate": 9.595743854607587e-08, + "loss": 0.0311, + "step": 26842 + }, + { + "epoch": 0.52, + "learning_rate": 9.595355520173973e-08, + "loss": 0.0013, + "step": 26843 + }, + { + "epoch": 0.52, + "learning_rate": 9.594967185740359e-08, + "loss": 0.001, + "step": 26844 + }, + { + "epoch": 0.52, + "learning_rate": 9.594578851306745e-08, + "loss": 0.0021, + "step": 26845 + }, + { + "epoch": 0.52, + "learning_rate": 9.59419051687313e-08, + "loss": 0.0601, + "step": 26846 + }, + { + "epoch": 0.52, + "learning_rate": 9.593802182439516e-08, + "loss": 0.063, + "step": 26847 + }, + { + "epoch": 0.52, + "learning_rate": 9.593413848005902e-08, + "loss": 0.0007, + "step": 26848 + }, + { + "epoch": 0.52, + "learning_rate": 9.593025513572288e-08, + "loss": 0.0004, + "step": 26849 + }, + { + "epoch": 0.52, + "learning_rate": 9.592637179138674e-08, + "loss": 0.0005, + "step": 26850 + }, + { + "epoch": 0.52, + "learning_rate": 9.59224884470506e-08, + "loss": 0.0007, + "step": 26851 + }, + { + "epoch": 0.52, + "learning_rate": 9.591860510271445e-08, + "loss": 0.0006, + "step": 26852 + }, + { + "epoch": 0.52, + "learning_rate": 9.591472175837831e-08, + "loss": 0.0012, + "step": 26853 + }, + { + "epoch": 0.52, + "learning_rate": 9.591083841404217e-08, + "loss": 0.0005, + "step": 26854 + }, + { + "epoch": 0.52, + "learning_rate": 9.590695506970603e-08, + "loss": 0.436, + "step": 26855 + }, + { + "epoch": 0.52, + "learning_rate": 9.590307172536989e-08, + "loss": 0.0045, + "step": 26856 + }, + { + "epoch": 0.52, + "learning_rate": 9.589918838103375e-08, + "loss": 0.5526, + "step": 26857 + }, + { + "epoch": 0.52, + "learning_rate": 9.58953050366976e-08, + "loss": 0.0006, + "step": 26858 + }, + { + "epoch": 0.52, + "learning_rate": 9.589142169236146e-08, + "loss": 0.0005, + "step": 26859 + }, + { + "epoch": 0.52, + "learning_rate": 9.588753834802531e-08, + "loss": 1.0438, + "step": 26860 + }, + { + "epoch": 0.52, + "learning_rate": 9.588365500368917e-08, + "loss": 0.0005, + "step": 26861 + }, + { + "epoch": 0.52, + "learning_rate": 9.587977165935302e-08, + "loss": 0.0005, + "step": 26862 + }, + { + "epoch": 0.52, + "learning_rate": 9.587588831501688e-08, + "loss": 0.0007, + "step": 26863 + }, + { + "epoch": 0.52, + "learning_rate": 9.587200497068074e-08, + "loss": 0.0006, + "step": 26864 + }, + { + "epoch": 0.52, + "learning_rate": 9.58681216263446e-08, + "loss": 0.0003, + "step": 26865 + }, + { + "epoch": 0.52, + "learning_rate": 9.586423828200846e-08, + "loss": 0.0005, + "step": 26866 + }, + { + "epoch": 0.52, + "learning_rate": 9.586035493767231e-08, + "loss": 0.0011, + "step": 26867 + }, + { + "epoch": 0.52, + "learning_rate": 9.585647159333617e-08, + "loss": 0.0004, + "step": 26868 + }, + { + "epoch": 0.52, + "learning_rate": 9.585258824900003e-08, + "loss": 0.0012, + "step": 26869 + }, + { + "epoch": 0.52, + "learning_rate": 9.584870490466389e-08, + "loss": 0.0013, + "step": 26870 + }, + { + "epoch": 0.52, + "learning_rate": 9.584482156032775e-08, + "loss": 0.0005, + "step": 26871 + }, + { + "epoch": 0.52, + "learning_rate": 9.58409382159916e-08, + "loss": 0.5764, + "step": 26872 + }, + { + "epoch": 0.52, + "learning_rate": 9.583705487165546e-08, + "loss": 0.0012, + "step": 26873 + }, + { + "epoch": 0.52, + "learning_rate": 9.583317152731932e-08, + "loss": 0.0005, + "step": 26874 + }, + { + "epoch": 0.52, + "learning_rate": 9.582928818298318e-08, + "loss": 0.4013, + "step": 26875 + }, + { + "epoch": 0.52, + "learning_rate": 9.582540483864704e-08, + "loss": 0.0029, + "step": 26876 + }, + { + "epoch": 0.52, + "learning_rate": 9.58215214943109e-08, + "loss": 0.0005, + "step": 26877 + }, + { + "epoch": 0.52, + "learning_rate": 9.581763814997476e-08, + "loss": 0.0012, + "step": 26878 + }, + { + "epoch": 0.52, + "learning_rate": 9.581375480563861e-08, + "loss": 0.9438, + "step": 26879 + }, + { + "epoch": 0.52, + "learning_rate": 9.580987146130247e-08, + "loss": 0.0007, + "step": 26880 + }, + { + "epoch": 0.52, + "learning_rate": 9.580598811696633e-08, + "loss": 0.0006, + "step": 26881 + }, + { + "epoch": 0.52, + "learning_rate": 9.580210477263019e-08, + "loss": 0.0005, + "step": 26882 + }, + { + "epoch": 0.52, + "learning_rate": 9.579822142829405e-08, + "loss": 0.0006, + "step": 26883 + }, + { + "epoch": 0.52, + "learning_rate": 9.57943380839579e-08, + "loss": 0.0013, + "step": 26884 + }, + { + "epoch": 0.52, + "learning_rate": 9.579045473962176e-08, + "loss": 0.0009, + "step": 26885 + }, + { + "epoch": 0.52, + "learning_rate": 9.578657139528562e-08, + "loss": 0.197, + "step": 26886 + }, + { + "epoch": 0.52, + "learning_rate": 9.578268805094948e-08, + "loss": 0.0007, + "step": 26887 + }, + { + "epoch": 0.52, + "learning_rate": 9.577880470661334e-08, + "loss": 0.0006, + "step": 26888 + }, + { + "epoch": 0.52, + "learning_rate": 9.577492136227718e-08, + "loss": 0.0007, + "step": 26889 + }, + { + "epoch": 0.52, + "learning_rate": 9.577103801794104e-08, + "loss": 0.0063, + "step": 26890 + }, + { + "epoch": 0.52, + "learning_rate": 9.57671546736049e-08, + "loss": 0.0004, + "step": 26891 + }, + { + "epoch": 0.52, + "learning_rate": 9.576327132926876e-08, + "loss": 0.0005, + "step": 26892 + }, + { + "epoch": 0.52, + "learning_rate": 9.575938798493262e-08, + "loss": 0.0069, + "step": 26893 + }, + { + "epoch": 0.52, + "learning_rate": 9.575550464059647e-08, + "loss": 0.1993, + "step": 26894 + }, + { + "epoch": 0.52, + "learning_rate": 9.575162129626033e-08, + "loss": 0.0006, + "step": 26895 + }, + { + "epoch": 0.52, + "learning_rate": 9.574773795192419e-08, + "loss": 0.8877, + "step": 26896 + }, + { + "epoch": 0.52, + "learning_rate": 9.574385460758805e-08, + "loss": 0.0007, + "step": 26897 + }, + { + "epoch": 0.52, + "learning_rate": 9.573997126325191e-08, + "loss": 0.0007, + "step": 26898 + }, + { + "epoch": 0.52, + "learning_rate": 9.573608791891577e-08, + "loss": 0.0006, + "step": 26899 + }, + { + "epoch": 0.52, + "learning_rate": 9.573220457457962e-08, + "loss": 0.0005, + "step": 26900 + }, + { + "epoch": 0.52, + "learning_rate": 9.572832123024348e-08, + "loss": 0.0005, + "step": 26901 + }, + { + "epoch": 0.52, + "learning_rate": 9.572443788590734e-08, + "loss": 0.0009, + "step": 26902 + }, + { + "epoch": 0.52, + "learning_rate": 9.57205545415712e-08, + "loss": 0.6101, + "step": 26903 + }, + { + "epoch": 0.52, + "learning_rate": 9.571667119723506e-08, + "loss": 0.0004, + "step": 26904 + }, + { + "epoch": 0.52, + "learning_rate": 9.571278785289891e-08, + "loss": 0.0014, + "step": 26905 + }, + { + "epoch": 0.52, + "learning_rate": 9.570890450856277e-08, + "loss": 1.0903, + "step": 26906 + }, + { + "epoch": 0.52, + "learning_rate": 9.570502116422663e-08, + "loss": 0.0007, + "step": 26907 + }, + { + "epoch": 0.52, + "learning_rate": 9.570113781989049e-08, + "loss": 0.0007, + "step": 26908 + }, + { + "epoch": 0.52, + "learning_rate": 9.569725447555435e-08, + "loss": 0.0006, + "step": 26909 + }, + { + "epoch": 0.52, + "learning_rate": 9.56933711312182e-08, + "loss": 0.0006, + "step": 26910 + }, + { + "epoch": 0.52, + "learning_rate": 9.568948778688206e-08, + "loss": 0.0006, + "step": 26911 + }, + { + "epoch": 0.52, + "learning_rate": 9.568560444254592e-08, + "loss": 0.0009, + "step": 26912 + }, + { + "epoch": 0.52, + "learning_rate": 9.568172109820978e-08, + "loss": 0.001, + "step": 26913 + }, + { + "epoch": 0.52, + "learning_rate": 9.567783775387364e-08, + "loss": 0.0005, + "step": 26914 + }, + { + "epoch": 0.52, + "learning_rate": 9.56739544095375e-08, + "loss": 0.0004, + "step": 26915 + }, + { + "epoch": 0.52, + "learning_rate": 9.567007106520136e-08, + "loss": 0.46, + "step": 26916 + }, + { + "epoch": 0.52, + "learning_rate": 9.566618772086521e-08, + "loss": 0.0009, + "step": 26917 + }, + { + "epoch": 0.52, + "learning_rate": 9.566230437652906e-08, + "loss": 0.0007, + "step": 26918 + }, + { + "epoch": 0.52, + "learning_rate": 9.565842103219292e-08, + "loss": 0.001, + "step": 26919 + }, + { + "epoch": 0.52, + "learning_rate": 9.565453768785678e-08, + "loss": 0.047, + "step": 26920 + }, + { + "epoch": 0.52, + "learning_rate": 9.565065434352063e-08, + "loss": 0.0006, + "step": 26921 + }, + { + "epoch": 0.52, + "learning_rate": 9.564677099918449e-08, + "loss": 0.0006, + "step": 26922 + }, + { + "epoch": 0.52, + "learning_rate": 9.564288765484835e-08, + "loss": 0.0871, + "step": 26923 + }, + { + "epoch": 0.52, + "learning_rate": 9.563900431051221e-08, + "loss": 0.0004, + "step": 26924 + }, + { + "epoch": 0.52, + "learning_rate": 9.563512096617607e-08, + "loss": 0.4134, + "step": 26925 + }, + { + "epoch": 0.52, + "learning_rate": 9.563123762183992e-08, + "loss": 0.7802, + "step": 26926 + }, + { + "epoch": 0.52, + "learning_rate": 9.562735427750378e-08, + "loss": 0.0006, + "step": 26927 + }, + { + "epoch": 0.52, + "learning_rate": 9.562347093316764e-08, + "loss": 0.0006, + "step": 26928 + }, + { + "epoch": 0.52, + "learning_rate": 9.56195875888315e-08, + "loss": 0.0019, + "step": 26929 + }, + { + "epoch": 0.52, + "learning_rate": 9.561570424449536e-08, + "loss": 0.0013, + "step": 26930 + }, + { + "epoch": 0.52, + "learning_rate": 9.561182090015922e-08, + "loss": 0.0009, + "step": 26931 + }, + { + "epoch": 0.52, + "learning_rate": 9.560793755582307e-08, + "loss": 0.0004, + "step": 26932 + }, + { + "epoch": 0.52, + "learning_rate": 9.560405421148693e-08, + "loss": 0.0006, + "step": 26933 + }, + { + "epoch": 0.52, + "learning_rate": 9.560017086715079e-08, + "loss": 0.0005, + "step": 26934 + }, + { + "epoch": 0.52, + "learning_rate": 9.559628752281465e-08, + "loss": 0.7139, + "step": 26935 + }, + { + "epoch": 0.52, + "learning_rate": 9.559240417847851e-08, + "loss": 0.0006, + "step": 26936 + }, + { + "epoch": 0.52, + "learning_rate": 9.558852083414237e-08, + "loss": 0.0006, + "step": 26937 + }, + { + "epoch": 0.52, + "learning_rate": 9.558463748980622e-08, + "loss": 0.0006, + "step": 26938 + }, + { + "epoch": 0.52, + "learning_rate": 9.558075414547008e-08, + "loss": 0.8471, + "step": 26939 + }, + { + "epoch": 0.52, + "learning_rate": 9.557687080113394e-08, + "loss": 0.0007, + "step": 26940 + }, + { + "epoch": 0.52, + "learning_rate": 9.55729874567978e-08, + "loss": 0.0005, + "step": 26941 + }, + { + "epoch": 0.52, + "learning_rate": 9.556910411246166e-08, + "loss": 0.0293, + "step": 26942 + }, + { + "epoch": 0.52, + "learning_rate": 9.556522076812551e-08, + "loss": 0.0003, + "step": 26943 + }, + { + "epoch": 0.52, + "learning_rate": 9.556133742378937e-08, + "loss": 1.2603, + "step": 26944 + }, + { + "epoch": 0.52, + "learning_rate": 9.555745407945323e-08, + "loss": 0.098, + "step": 26945 + }, + { + "epoch": 0.52, + "learning_rate": 9.555357073511709e-08, + "loss": 0.0006, + "step": 26946 + }, + { + "epoch": 0.52, + "learning_rate": 9.554968739078093e-08, + "loss": 0.0007, + "step": 26947 + }, + { + "epoch": 0.52, + "learning_rate": 9.554580404644479e-08, + "loss": 0.0008, + "step": 26948 + }, + { + "epoch": 0.52, + "learning_rate": 9.554192070210865e-08, + "loss": 0.0005, + "step": 26949 + }, + { + "epoch": 0.52, + "learning_rate": 9.553803735777251e-08, + "loss": 0.0006, + "step": 26950 + }, + { + "epoch": 0.52, + "learning_rate": 9.553415401343637e-08, + "loss": 0.0042, + "step": 26951 + }, + { + "epoch": 0.52, + "learning_rate": 9.553027066910023e-08, + "loss": 0.0008, + "step": 26952 + }, + { + "epoch": 0.52, + "learning_rate": 9.552638732476408e-08, + "loss": 0.0007, + "step": 26953 + }, + { + "epoch": 0.52, + "learning_rate": 9.552250398042794e-08, + "loss": 0.3352, + "step": 26954 + }, + { + "epoch": 0.52, + "learning_rate": 9.55186206360918e-08, + "loss": 0.0006, + "step": 26955 + }, + { + "epoch": 0.52, + "learning_rate": 9.551473729175566e-08, + "loss": 0.0008, + "step": 26956 + }, + { + "epoch": 0.52, + "learning_rate": 9.551085394741952e-08, + "loss": 0.0005, + "step": 26957 + }, + { + "epoch": 0.52, + "learning_rate": 9.550697060308338e-08, + "loss": 0.0006, + "step": 26958 + }, + { + "epoch": 0.52, + "learning_rate": 9.550308725874723e-08, + "loss": 0.0011, + "step": 26959 + }, + { + "epoch": 0.52, + "learning_rate": 9.549920391441109e-08, + "loss": 0.0005, + "step": 26960 + }, + { + "epoch": 0.52, + "learning_rate": 9.549532057007495e-08, + "loss": 0.0005, + "step": 26961 + }, + { + "epoch": 0.52, + "learning_rate": 9.549143722573881e-08, + "loss": 0.0005, + "step": 26962 + }, + { + "epoch": 0.52, + "learning_rate": 9.548755388140267e-08, + "loss": 0.0005, + "step": 26963 + }, + { + "epoch": 0.52, + "learning_rate": 9.548367053706652e-08, + "loss": 0.5067, + "step": 26964 + }, + { + "epoch": 0.52, + "learning_rate": 9.547978719273038e-08, + "loss": 0.001, + "step": 26965 + }, + { + "epoch": 0.52, + "learning_rate": 9.547590384839424e-08, + "loss": 0.0004, + "step": 26966 + }, + { + "epoch": 0.52, + "learning_rate": 9.547202050405809e-08, + "loss": 0.0007, + "step": 26967 + }, + { + "epoch": 0.52, + "learning_rate": 9.546813715972194e-08, + "loss": 0.4315, + "step": 26968 + }, + { + "epoch": 0.52, + "learning_rate": 9.54642538153858e-08, + "loss": 0.0005, + "step": 26969 + }, + { + "epoch": 0.52, + "learning_rate": 9.546037047104966e-08, + "loss": 0.0004, + "step": 26970 + }, + { + "epoch": 0.52, + "learning_rate": 9.545648712671352e-08, + "loss": 0.0006, + "step": 26971 + }, + { + "epoch": 0.52, + "learning_rate": 9.545260378237738e-08, + "loss": 0.0611, + "step": 26972 + }, + { + "epoch": 0.52, + "learning_rate": 9.544872043804124e-08, + "loss": 0.0006, + "step": 26973 + }, + { + "epoch": 0.52, + "learning_rate": 9.54448370937051e-08, + "loss": 0.0005, + "step": 26974 + }, + { + "epoch": 0.52, + "learning_rate": 9.544095374936895e-08, + "loss": 0.0047, + "step": 26975 + }, + { + "epoch": 0.52, + "learning_rate": 9.543707040503281e-08, + "loss": 0.0006, + "step": 26976 + }, + { + "epoch": 0.52, + "learning_rate": 9.543318706069667e-08, + "loss": 0.0006, + "step": 26977 + }, + { + "epoch": 0.52, + "learning_rate": 9.542930371636053e-08, + "loss": 0.0006, + "step": 26978 + }, + { + "epoch": 0.52, + "learning_rate": 9.542542037202439e-08, + "loss": 0.2026, + "step": 26979 + }, + { + "epoch": 0.52, + "learning_rate": 9.542153702768824e-08, + "loss": 0.0004, + "step": 26980 + }, + { + "epoch": 0.52, + "learning_rate": 9.541765368335209e-08, + "loss": 0.001, + "step": 26981 + }, + { + "epoch": 0.52, + "learning_rate": 9.541377033901595e-08, + "loss": 0.0005, + "step": 26982 + }, + { + "epoch": 0.52, + "learning_rate": 9.54098869946798e-08, + "loss": 0.0005, + "step": 26983 + }, + { + "epoch": 0.52, + "learning_rate": 9.540600365034366e-08, + "loss": 0.0004, + "step": 26984 + }, + { + "epoch": 0.52, + "learning_rate": 9.540212030600752e-08, + "loss": 0.0006, + "step": 26985 + }, + { + "epoch": 0.52, + "learning_rate": 9.539823696167138e-08, + "loss": 0.0008, + "step": 26986 + }, + { + "epoch": 0.52, + "learning_rate": 9.539435361733524e-08, + "loss": 0.0005, + "step": 26987 + }, + { + "epoch": 0.52, + "learning_rate": 9.53904702729991e-08, + "loss": 0.0027, + "step": 26988 + }, + { + "epoch": 0.52, + "learning_rate": 9.538658692866295e-08, + "loss": 0.0029, + "step": 26989 + }, + { + "epoch": 0.52, + "learning_rate": 9.538270358432681e-08, + "loss": 0.0009, + "step": 26990 + }, + { + "epoch": 0.52, + "learning_rate": 9.537882023999067e-08, + "loss": 0.0005, + "step": 26991 + }, + { + "epoch": 0.52, + "learning_rate": 9.537493689565453e-08, + "loss": 0.0065, + "step": 26992 + }, + { + "epoch": 0.52, + "learning_rate": 9.537105355131839e-08, + "loss": 0.0006, + "step": 26993 + }, + { + "epoch": 0.52, + "learning_rate": 9.536717020698225e-08, + "loss": 0.0005, + "step": 26994 + }, + { + "epoch": 0.52, + "learning_rate": 9.53632868626461e-08, + "loss": 0.0004, + "step": 26995 + }, + { + "epoch": 0.52, + "learning_rate": 9.535940351830996e-08, + "loss": 0.001, + "step": 26996 + }, + { + "epoch": 0.52, + "learning_rate": 9.535552017397382e-08, + "loss": 0.001, + "step": 26997 + }, + { + "epoch": 0.52, + "learning_rate": 9.535163682963768e-08, + "loss": 0.0007, + "step": 26998 + }, + { + "epoch": 0.52, + "learning_rate": 9.534775348530154e-08, + "loss": 0.0004, + "step": 26999 + }, + { + "epoch": 0.52, + "learning_rate": 9.53438701409654e-08, + "loss": 0.0006, + "step": 27000 + }, + { + "epoch": 0.52, + "learning_rate": 9.533998679662925e-08, + "loss": 1.0876, + "step": 27001 + }, + { + "epoch": 0.52, + "learning_rate": 9.533610345229311e-08, + "loss": 0.0006, + "step": 27002 + }, + { + "epoch": 0.52, + "learning_rate": 9.533222010795697e-08, + "loss": 0.0005, + "step": 27003 + }, + { + "epoch": 0.52, + "learning_rate": 9.532833676362083e-08, + "loss": 0.0006, + "step": 27004 + }, + { + "epoch": 0.52, + "learning_rate": 9.532445341928467e-08, + "loss": 0.0006, + "step": 27005 + }, + { + "epoch": 0.52, + "learning_rate": 9.532057007494853e-08, + "loss": 0.0004, + "step": 27006 + }, + { + "epoch": 0.52, + "learning_rate": 9.531668673061239e-08, + "loss": 0.001, + "step": 27007 + }, + { + "epoch": 0.52, + "learning_rate": 9.531280338627625e-08, + "loss": 0.0005, + "step": 27008 + }, + { + "epoch": 0.52, + "learning_rate": 9.53089200419401e-08, + "loss": 0.0005, + "step": 27009 + }, + { + "epoch": 0.52, + "learning_rate": 9.530503669760396e-08, + "loss": 0.0007, + "step": 27010 + }, + { + "epoch": 0.52, + "learning_rate": 9.530115335326782e-08, + "loss": 0.0005, + "step": 27011 + }, + { + "epoch": 0.52, + "learning_rate": 9.529727000893168e-08, + "loss": 0.0028, + "step": 27012 + }, + { + "epoch": 0.52, + "learning_rate": 9.529338666459554e-08, + "loss": 0.4646, + "step": 27013 + }, + { + "epoch": 0.52, + "learning_rate": 9.52895033202594e-08, + "loss": 0.0006, + "step": 27014 + }, + { + "epoch": 0.52, + "learning_rate": 9.528561997592326e-08, + "loss": 0.0009, + "step": 27015 + }, + { + "epoch": 0.52, + "learning_rate": 9.528173663158711e-08, + "loss": 0.0069, + "step": 27016 + }, + { + "epoch": 0.52, + "learning_rate": 9.527785328725097e-08, + "loss": 0.0006, + "step": 27017 + }, + { + "epoch": 0.52, + "learning_rate": 9.527396994291483e-08, + "loss": 0.0004, + "step": 27018 + }, + { + "epoch": 0.52, + "learning_rate": 9.527008659857869e-08, + "loss": 0.152, + "step": 27019 + }, + { + "epoch": 0.52, + "learning_rate": 9.526620325424255e-08, + "loss": 0.0005, + "step": 27020 + }, + { + "epoch": 0.52, + "learning_rate": 9.52623199099064e-08, + "loss": 0.8312, + "step": 27021 + }, + { + "epoch": 0.52, + "learning_rate": 9.525843656557026e-08, + "loss": 0.0006, + "step": 27022 + }, + { + "epoch": 0.52, + "learning_rate": 9.525455322123412e-08, + "loss": 0.0008, + "step": 27023 + }, + { + "epoch": 0.52, + "learning_rate": 9.525066987689798e-08, + "loss": 0.0907, + "step": 27024 + }, + { + "epoch": 0.52, + "learning_rate": 9.524678653256184e-08, + "loss": 0.0006, + "step": 27025 + }, + { + "epoch": 0.52, + "learning_rate": 9.52429031882257e-08, + "loss": 0.0004, + "step": 27026 + }, + { + "epoch": 0.52, + "learning_rate": 9.523901984388955e-08, + "loss": 0.001, + "step": 27027 + }, + { + "epoch": 0.52, + "learning_rate": 9.523513649955341e-08, + "loss": 0.0005, + "step": 27028 + }, + { + "epoch": 0.52, + "learning_rate": 9.523125315521727e-08, + "loss": 0.0005, + "step": 27029 + }, + { + "epoch": 0.52, + "learning_rate": 9.522736981088113e-08, + "loss": 0.0006, + "step": 27030 + }, + { + "epoch": 0.52, + "learning_rate": 9.522348646654499e-08, + "loss": 0.0026, + "step": 27031 + }, + { + "epoch": 0.52, + "learning_rate": 9.521960312220885e-08, + "loss": 0.0013, + "step": 27032 + }, + { + "epoch": 0.52, + "learning_rate": 9.52157197778727e-08, + "loss": 0.0006, + "step": 27033 + }, + { + "epoch": 0.52, + "learning_rate": 9.521183643353655e-08, + "loss": 0.0537, + "step": 27034 + }, + { + "epoch": 0.52, + "learning_rate": 9.520795308920041e-08, + "loss": 0.0008, + "step": 27035 + }, + { + "epoch": 0.52, + "learning_rate": 9.520406974486427e-08, + "loss": 0.038, + "step": 27036 + }, + { + "epoch": 0.52, + "learning_rate": 9.520018640052812e-08, + "loss": 0.0438, + "step": 27037 + }, + { + "epoch": 0.52, + "learning_rate": 9.519630305619198e-08, + "loss": 0.0004, + "step": 27038 + }, + { + "epoch": 0.52, + "learning_rate": 9.519241971185584e-08, + "loss": 0.0006, + "step": 27039 + }, + { + "epoch": 0.52, + "learning_rate": 9.51885363675197e-08, + "loss": 0.0005, + "step": 27040 + }, + { + "epoch": 0.52, + "learning_rate": 9.518465302318356e-08, + "loss": 0.0008, + "step": 27041 + }, + { + "epoch": 0.52, + "learning_rate": 9.518076967884741e-08, + "loss": 0.0011, + "step": 27042 + }, + { + "epoch": 0.52, + "learning_rate": 9.517688633451127e-08, + "loss": 0.0011, + "step": 27043 + }, + { + "epoch": 0.52, + "learning_rate": 9.517300299017513e-08, + "loss": 0.0006, + "step": 27044 + }, + { + "epoch": 0.52, + "learning_rate": 9.516911964583899e-08, + "loss": 0.0006, + "step": 27045 + }, + { + "epoch": 0.52, + "learning_rate": 9.516523630150285e-08, + "loss": 0.0004, + "step": 27046 + }, + { + "epoch": 0.52, + "learning_rate": 9.51613529571667e-08, + "loss": 0.0006, + "step": 27047 + }, + { + "epoch": 0.52, + "learning_rate": 9.515746961283056e-08, + "loss": 0.0007, + "step": 27048 + }, + { + "epoch": 0.52, + "learning_rate": 9.515358626849442e-08, + "loss": 0.0006, + "step": 27049 + }, + { + "epoch": 0.52, + "learning_rate": 9.514970292415828e-08, + "loss": 0.0006, + "step": 27050 + }, + { + "epoch": 0.52, + "learning_rate": 9.514581957982214e-08, + "loss": 0.0007, + "step": 27051 + }, + { + "epoch": 0.52, + "learning_rate": 9.5141936235486e-08, + "loss": 0.0008, + "step": 27052 + }, + { + "epoch": 0.52, + "learning_rate": 9.513805289114986e-08, + "loss": 0.892, + "step": 27053 + }, + { + "epoch": 0.52, + "learning_rate": 9.513416954681371e-08, + "loss": 0.0011, + "step": 27054 + }, + { + "epoch": 0.52, + "learning_rate": 9.513028620247757e-08, + "loss": 0.0009, + "step": 27055 + }, + { + "epoch": 0.52, + "learning_rate": 9.512640285814143e-08, + "loss": 0.0098, + "step": 27056 + }, + { + "epoch": 0.52, + "learning_rate": 9.512251951380529e-08, + "loss": 0.0498, + "step": 27057 + }, + { + "epoch": 0.52, + "learning_rate": 9.511863616946915e-08, + "loss": 0.0006, + "step": 27058 + }, + { + "epoch": 0.52, + "learning_rate": 9.5114752825133e-08, + "loss": 0.0006, + "step": 27059 + }, + { + "epoch": 0.52, + "learning_rate": 9.511086948079686e-08, + "loss": 0.0005, + "step": 27060 + }, + { + "epoch": 0.52, + "learning_rate": 9.510698613646072e-08, + "loss": 0.0006, + "step": 27061 + }, + { + "epoch": 0.52, + "learning_rate": 9.510310279212458e-08, + "loss": 0.0008, + "step": 27062 + }, + { + "epoch": 0.52, + "learning_rate": 9.509921944778842e-08, + "loss": 0.0005, + "step": 27063 + }, + { + "epoch": 0.52, + "learning_rate": 9.509533610345228e-08, + "loss": 0.0006, + "step": 27064 + }, + { + "epoch": 0.53, + "learning_rate": 9.509145275911614e-08, + "loss": 0.0005, + "step": 27065 + }, + { + "epoch": 0.53, + "learning_rate": 9.508756941478e-08, + "loss": 0.0005, + "step": 27066 + }, + { + "epoch": 0.53, + "learning_rate": 9.508368607044386e-08, + "loss": 0.0012, + "step": 27067 + }, + { + "epoch": 0.53, + "learning_rate": 9.507980272610772e-08, + "loss": 0.0005, + "step": 27068 + }, + { + "epoch": 0.53, + "learning_rate": 9.507591938177157e-08, + "loss": 0.0004, + "step": 27069 + }, + { + "epoch": 0.53, + "learning_rate": 9.507203603743543e-08, + "loss": 0.0005, + "step": 27070 + }, + { + "epoch": 0.53, + "learning_rate": 9.506815269309929e-08, + "loss": 0.0004, + "step": 27071 + }, + { + "epoch": 0.53, + "learning_rate": 9.506426934876315e-08, + "loss": 0.0004, + "step": 27072 + }, + { + "epoch": 0.53, + "learning_rate": 9.506038600442701e-08, + "loss": 0.0597, + "step": 27073 + }, + { + "epoch": 0.53, + "learning_rate": 9.505650266009087e-08, + "loss": 0.0007, + "step": 27074 + }, + { + "epoch": 0.53, + "learning_rate": 9.505261931575472e-08, + "loss": 0.0005, + "step": 27075 + }, + { + "epoch": 0.53, + "learning_rate": 9.504873597141858e-08, + "loss": 0.0005, + "step": 27076 + }, + { + "epoch": 0.53, + "learning_rate": 9.504485262708244e-08, + "loss": 0.117, + "step": 27077 + }, + { + "epoch": 0.53, + "learning_rate": 9.50409692827463e-08, + "loss": 1.2692, + "step": 27078 + }, + { + "epoch": 0.53, + "learning_rate": 9.503708593841016e-08, + "loss": 0.0005, + "step": 27079 + }, + { + "epoch": 0.53, + "learning_rate": 9.503320259407401e-08, + "loss": 0.0005, + "step": 27080 + }, + { + "epoch": 0.53, + "learning_rate": 9.502931924973787e-08, + "loss": 0.0004, + "step": 27081 + }, + { + "epoch": 0.53, + "learning_rate": 9.502543590540173e-08, + "loss": 0.0007, + "step": 27082 + }, + { + "epoch": 0.53, + "learning_rate": 9.502155256106559e-08, + "loss": 0.0007, + "step": 27083 + }, + { + "epoch": 0.53, + "learning_rate": 9.501766921672945e-08, + "loss": 0.0005, + "step": 27084 + }, + { + "epoch": 0.53, + "learning_rate": 9.50137858723933e-08, + "loss": 0.0005, + "step": 27085 + }, + { + "epoch": 0.53, + "learning_rate": 9.500990252805716e-08, + "loss": 0.0003, + "step": 27086 + }, + { + "epoch": 0.53, + "learning_rate": 9.500601918372102e-08, + "loss": 0.0005, + "step": 27087 + }, + { + "epoch": 0.53, + "learning_rate": 9.500213583938488e-08, + "loss": 0.0007, + "step": 27088 + }, + { + "epoch": 0.53, + "learning_rate": 9.499825249504874e-08, + "loss": 0.0027, + "step": 27089 + }, + { + "epoch": 0.53, + "learning_rate": 9.49943691507126e-08, + "loss": 0.0006, + "step": 27090 + }, + { + "epoch": 0.53, + "learning_rate": 9.499048580637646e-08, + "loss": 0.1723, + "step": 27091 + }, + { + "epoch": 0.53, + "learning_rate": 9.49866024620403e-08, + "loss": 0.0006, + "step": 27092 + }, + { + "epoch": 0.53, + "learning_rate": 9.498271911770416e-08, + "loss": 0.0003, + "step": 27093 + }, + { + "epoch": 0.53, + "learning_rate": 9.497883577336802e-08, + "loss": 0.0004, + "step": 27094 + }, + { + "epoch": 0.53, + "learning_rate": 9.497495242903188e-08, + "loss": 0.0006, + "step": 27095 + }, + { + "epoch": 0.53, + "learning_rate": 9.497106908469573e-08, + "loss": 0.0008, + "step": 27096 + }, + { + "epoch": 0.53, + "learning_rate": 9.496718574035959e-08, + "loss": 0.0006, + "step": 27097 + }, + { + "epoch": 0.53, + "learning_rate": 9.496330239602345e-08, + "loss": 0.0005, + "step": 27098 + }, + { + "epoch": 0.53, + "learning_rate": 9.495941905168731e-08, + "loss": 0.0005, + "step": 27099 + }, + { + "epoch": 0.53, + "learning_rate": 9.495553570735117e-08, + "loss": 0.0011, + "step": 27100 + }, + { + "epoch": 0.53, + "learning_rate": 9.495165236301502e-08, + "loss": 0.0006, + "step": 27101 + }, + { + "epoch": 0.53, + "learning_rate": 9.494776901867888e-08, + "loss": 0.0005, + "step": 27102 + }, + { + "epoch": 0.53, + "learning_rate": 9.494388567434274e-08, + "loss": 0.0005, + "step": 27103 + }, + { + "epoch": 0.53, + "learning_rate": 9.49400023300066e-08, + "loss": 0.0005, + "step": 27104 + }, + { + "epoch": 0.53, + "learning_rate": 9.493611898567046e-08, + "loss": 0.0005, + "step": 27105 + }, + { + "epoch": 0.53, + "learning_rate": 9.493223564133432e-08, + "loss": 0.0005, + "step": 27106 + }, + { + "epoch": 0.53, + "learning_rate": 9.492835229699817e-08, + "loss": 0.0005, + "step": 27107 + }, + { + "epoch": 0.53, + "learning_rate": 9.492446895266203e-08, + "loss": 0.0008, + "step": 27108 + }, + { + "epoch": 0.53, + "learning_rate": 9.492058560832589e-08, + "loss": 0.0008, + "step": 27109 + }, + { + "epoch": 0.53, + "learning_rate": 9.491670226398975e-08, + "loss": 0.0018, + "step": 27110 + }, + { + "epoch": 0.53, + "learning_rate": 9.491281891965361e-08, + "loss": 0.0006, + "step": 27111 + }, + { + "epoch": 0.53, + "learning_rate": 9.490893557531747e-08, + "loss": 0.0009, + "step": 27112 + }, + { + "epoch": 0.53, + "learning_rate": 9.490505223098132e-08, + "loss": 0.0004, + "step": 27113 + }, + { + "epoch": 0.53, + "learning_rate": 9.490116888664518e-08, + "loss": 0.0005, + "step": 27114 + }, + { + "epoch": 0.53, + "learning_rate": 9.489728554230904e-08, + "loss": 0.0005, + "step": 27115 + }, + { + "epoch": 0.53, + "learning_rate": 9.48934021979729e-08, + "loss": 0.001, + "step": 27116 + }, + { + "epoch": 0.53, + "learning_rate": 9.488951885363676e-08, + "loss": 0.0007, + "step": 27117 + }, + { + "epoch": 0.53, + "learning_rate": 9.488563550930062e-08, + "loss": 0.0004, + "step": 27118 + }, + { + "epoch": 0.53, + "learning_rate": 9.488175216496447e-08, + "loss": 0.0007, + "step": 27119 + }, + { + "epoch": 0.53, + "learning_rate": 9.487786882062833e-08, + "loss": 0.0005, + "step": 27120 + }, + { + "epoch": 0.53, + "learning_rate": 9.487398547629218e-08, + "loss": 0.0006, + "step": 27121 + }, + { + "epoch": 0.53, + "learning_rate": 9.487010213195603e-08, + "loss": 0.0008, + "step": 27122 + }, + { + "epoch": 0.53, + "learning_rate": 9.486621878761989e-08, + "loss": 0.4087, + "step": 27123 + }, + { + "epoch": 0.53, + "learning_rate": 9.486233544328375e-08, + "loss": 0.0006, + "step": 27124 + }, + { + "epoch": 0.53, + "learning_rate": 9.485845209894761e-08, + "loss": 0.0173, + "step": 27125 + }, + { + "epoch": 0.53, + "learning_rate": 9.485456875461147e-08, + "loss": 0.0081, + "step": 27126 + }, + { + "epoch": 0.53, + "learning_rate": 9.485068541027533e-08, + "loss": 0.0006, + "step": 27127 + }, + { + "epoch": 0.53, + "learning_rate": 9.484680206593918e-08, + "loss": 0.0006, + "step": 27128 + }, + { + "epoch": 0.53, + "learning_rate": 9.484291872160304e-08, + "loss": 0.0003, + "step": 27129 + }, + { + "epoch": 0.53, + "learning_rate": 9.48390353772669e-08, + "loss": 0.0004, + "step": 27130 + }, + { + "epoch": 0.53, + "learning_rate": 9.483515203293076e-08, + "loss": 0.0007, + "step": 27131 + }, + { + "epoch": 0.53, + "learning_rate": 9.483126868859462e-08, + "loss": 0.0007, + "step": 27132 + }, + { + "epoch": 0.53, + "learning_rate": 9.482738534425848e-08, + "loss": 0.4096, + "step": 27133 + }, + { + "epoch": 0.53, + "learning_rate": 9.482350199992233e-08, + "loss": 0.0006, + "step": 27134 + }, + { + "epoch": 0.53, + "learning_rate": 9.481961865558619e-08, + "loss": 0.0006, + "step": 27135 + }, + { + "epoch": 0.53, + "learning_rate": 9.481573531125005e-08, + "loss": 0.0004, + "step": 27136 + }, + { + "epoch": 0.53, + "learning_rate": 9.481185196691391e-08, + "loss": 0.0116, + "step": 27137 + }, + { + "epoch": 0.53, + "learning_rate": 9.480796862257777e-08, + "loss": 0.0006, + "step": 27138 + }, + { + "epoch": 0.53, + "learning_rate": 9.480408527824162e-08, + "loss": 0.0006, + "step": 27139 + }, + { + "epoch": 0.53, + "learning_rate": 9.480020193390548e-08, + "loss": 0.0004, + "step": 27140 + }, + { + "epoch": 0.53, + "learning_rate": 9.479631858956934e-08, + "loss": 0.0005, + "step": 27141 + }, + { + "epoch": 0.53, + "learning_rate": 9.47924352452332e-08, + "loss": 0.0004, + "step": 27142 + }, + { + "epoch": 0.53, + "learning_rate": 9.478855190089706e-08, + "loss": 0.09, + "step": 27143 + }, + { + "epoch": 0.53, + "learning_rate": 9.47846685565609e-08, + "loss": 0.0028, + "step": 27144 + }, + { + "epoch": 0.53, + "learning_rate": 9.478078521222476e-08, + "loss": 0.0005, + "step": 27145 + }, + { + "epoch": 0.53, + "learning_rate": 9.477690186788862e-08, + "loss": 0.0003, + "step": 27146 + }, + { + "epoch": 0.53, + "learning_rate": 9.477301852355248e-08, + "loss": 0.0148, + "step": 27147 + }, + { + "epoch": 0.53, + "learning_rate": 9.476913517921634e-08, + "loss": 0.0012, + "step": 27148 + }, + { + "epoch": 0.53, + "learning_rate": 9.47652518348802e-08, + "loss": 0.2577, + "step": 27149 + }, + { + "epoch": 0.53, + "learning_rate": 9.476136849054405e-08, + "loss": 0.0332, + "step": 27150 + }, + { + "epoch": 0.53, + "learning_rate": 9.475748514620791e-08, + "loss": 0.9053, + "step": 27151 + }, + { + "epoch": 0.53, + "learning_rate": 9.475360180187177e-08, + "loss": 0.0006, + "step": 27152 + }, + { + "epoch": 0.53, + "learning_rate": 9.474971845753563e-08, + "loss": 0.1364, + "step": 27153 + }, + { + "epoch": 0.53, + "learning_rate": 9.474583511319949e-08, + "loss": 0.0005, + "step": 27154 + }, + { + "epoch": 0.53, + "learning_rate": 9.474195176886334e-08, + "loss": 0.0011, + "step": 27155 + }, + { + "epoch": 0.53, + "learning_rate": 9.47380684245272e-08, + "loss": 0.0033, + "step": 27156 + }, + { + "epoch": 0.53, + "learning_rate": 9.473418508019106e-08, + "loss": 0.0006, + "step": 27157 + }, + { + "epoch": 0.53, + "learning_rate": 9.47303017358549e-08, + "loss": 0.0005, + "step": 27158 + }, + { + "epoch": 0.53, + "learning_rate": 9.472641839151876e-08, + "loss": 0.0005, + "step": 27159 + }, + { + "epoch": 0.53, + "learning_rate": 9.472253504718262e-08, + "loss": 0.0007, + "step": 27160 + }, + { + "epoch": 0.53, + "learning_rate": 9.471865170284648e-08, + "loss": 0.0033, + "step": 27161 + }, + { + "epoch": 0.53, + "learning_rate": 9.471476835851034e-08, + "loss": 0.1539, + "step": 27162 + }, + { + "epoch": 0.53, + "learning_rate": 9.47108850141742e-08, + "loss": 0.0004, + "step": 27163 + }, + { + "epoch": 0.53, + "learning_rate": 9.470700166983805e-08, + "loss": 0.0005, + "step": 27164 + }, + { + "epoch": 0.53, + "learning_rate": 9.470311832550191e-08, + "loss": 0.0004, + "step": 27165 + }, + { + "epoch": 0.53, + "learning_rate": 9.469923498116577e-08, + "loss": 0.4348, + "step": 27166 + }, + { + "epoch": 0.53, + "learning_rate": 9.469535163682963e-08, + "loss": 0.0005, + "step": 27167 + }, + { + "epoch": 0.53, + "learning_rate": 9.469146829249349e-08, + "loss": 0.0012, + "step": 27168 + }, + { + "epoch": 0.53, + "learning_rate": 9.468758494815735e-08, + "loss": 0.0008, + "step": 27169 + }, + { + "epoch": 0.53, + "learning_rate": 9.46837016038212e-08, + "loss": 0.0005, + "step": 27170 + }, + { + "epoch": 0.53, + "learning_rate": 9.467981825948506e-08, + "loss": 0.0848, + "step": 27171 + }, + { + "epoch": 0.53, + "learning_rate": 9.467593491514892e-08, + "loss": 0.0005, + "step": 27172 + }, + { + "epoch": 0.53, + "learning_rate": 9.467205157081278e-08, + "loss": 0.0004, + "step": 27173 + }, + { + "epoch": 0.53, + "learning_rate": 9.466816822647664e-08, + "loss": 0.0005, + "step": 27174 + }, + { + "epoch": 0.53, + "learning_rate": 9.46642848821405e-08, + "loss": 0.0008, + "step": 27175 + }, + { + "epoch": 0.53, + "learning_rate": 9.466040153780435e-08, + "loss": 0.0261, + "step": 27176 + }, + { + "epoch": 0.53, + "learning_rate": 9.465651819346821e-08, + "loss": 0.0004, + "step": 27177 + }, + { + "epoch": 0.53, + "learning_rate": 9.465263484913207e-08, + "loss": 0.0004, + "step": 27178 + }, + { + "epoch": 0.53, + "learning_rate": 9.464875150479592e-08, + "loss": 0.0017, + "step": 27179 + }, + { + "epoch": 0.53, + "learning_rate": 9.464486816045977e-08, + "loss": 0.0006, + "step": 27180 + }, + { + "epoch": 0.53, + "learning_rate": 9.464098481612363e-08, + "loss": 0.0022, + "step": 27181 + }, + { + "epoch": 0.53, + "learning_rate": 9.463710147178749e-08, + "loss": 0.4468, + "step": 27182 + }, + { + "epoch": 0.53, + "learning_rate": 9.463321812745135e-08, + "loss": 0.9523, + "step": 27183 + }, + { + "epoch": 0.53, + "learning_rate": 9.46293347831152e-08, + "loss": 0.0005, + "step": 27184 + }, + { + "epoch": 0.53, + "learning_rate": 9.462545143877906e-08, + "loss": 0.5389, + "step": 27185 + }, + { + "epoch": 0.53, + "learning_rate": 9.462156809444292e-08, + "loss": 0.0006, + "step": 27186 + }, + { + "epoch": 0.53, + "learning_rate": 9.461768475010678e-08, + "loss": 0.0006, + "step": 27187 + }, + { + "epoch": 0.53, + "learning_rate": 9.461380140577064e-08, + "loss": 0.0004, + "step": 27188 + }, + { + "epoch": 0.53, + "learning_rate": 9.46099180614345e-08, + "loss": 0.0006, + "step": 27189 + }, + { + "epoch": 0.53, + "learning_rate": 9.460603471709836e-08, + "loss": 0.0006, + "step": 27190 + }, + { + "epoch": 0.53, + "learning_rate": 9.460215137276221e-08, + "loss": 0.8026, + "step": 27191 + }, + { + "epoch": 0.53, + "learning_rate": 9.459826802842607e-08, + "loss": 0.0005, + "step": 27192 + }, + { + "epoch": 0.53, + "learning_rate": 9.459438468408993e-08, + "loss": 0.0007, + "step": 27193 + }, + { + "epoch": 0.53, + "learning_rate": 9.459050133975379e-08, + "loss": 0.0006, + "step": 27194 + }, + { + "epoch": 0.53, + "learning_rate": 9.458661799541765e-08, + "loss": 0.0007, + "step": 27195 + }, + { + "epoch": 0.53, + "learning_rate": 9.45827346510815e-08, + "loss": 0.0006, + "step": 27196 + }, + { + "epoch": 0.53, + "learning_rate": 9.457885130674536e-08, + "loss": 0.0003, + "step": 27197 + }, + { + "epoch": 0.53, + "learning_rate": 9.457496796240922e-08, + "loss": 0.0006, + "step": 27198 + }, + { + "epoch": 0.53, + "learning_rate": 9.457108461807308e-08, + "loss": 0.0067, + "step": 27199 + }, + { + "epoch": 0.53, + "learning_rate": 9.456720127373694e-08, + "loss": 0.0005, + "step": 27200 + }, + { + "epoch": 0.53, + "learning_rate": 9.45633179294008e-08, + "loss": 0.962, + "step": 27201 + }, + { + "epoch": 0.53, + "learning_rate": 9.455943458506465e-08, + "loss": 0.0008, + "step": 27202 + }, + { + "epoch": 0.53, + "learning_rate": 9.455555124072851e-08, + "loss": 0.2333, + "step": 27203 + }, + { + "epoch": 0.53, + "learning_rate": 9.455166789639237e-08, + "loss": 0.0006, + "step": 27204 + }, + { + "epoch": 0.53, + "learning_rate": 9.454778455205623e-08, + "loss": 0.0004, + "step": 27205 + }, + { + "epoch": 0.53, + "learning_rate": 9.454390120772009e-08, + "loss": 0.0005, + "step": 27206 + }, + { + "epoch": 0.53, + "learning_rate": 9.454001786338395e-08, + "loss": 0.0005, + "step": 27207 + }, + { + "epoch": 0.53, + "learning_rate": 9.453613451904779e-08, + "loss": 0.0005, + "step": 27208 + }, + { + "epoch": 0.53, + "learning_rate": 9.453225117471165e-08, + "loss": 0.0006, + "step": 27209 + }, + { + "epoch": 0.53, + "learning_rate": 9.452836783037551e-08, + "loss": 0.0004, + "step": 27210 + }, + { + "epoch": 0.53, + "learning_rate": 9.452448448603937e-08, + "loss": 0.0043, + "step": 27211 + }, + { + "epoch": 0.53, + "learning_rate": 9.452060114170322e-08, + "loss": 0.0007, + "step": 27212 + }, + { + "epoch": 0.53, + "learning_rate": 9.451671779736708e-08, + "loss": 0.0003, + "step": 27213 + }, + { + "epoch": 0.53, + "learning_rate": 9.451283445303094e-08, + "loss": 0.0005, + "step": 27214 + }, + { + "epoch": 0.53, + "learning_rate": 9.45089511086948e-08, + "loss": 0.0006, + "step": 27215 + }, + { + "epoch": 0.53, + "learning_rate": 9.450506776435866e-08, + "loss": 0.0009, + "step": 27216 + }, + { + "epoch": 0.53, + "learning_rate": 9.450118442002252e-08, + "loss": 0.0005, + "step": 27217 + }, + { + "epoch": 0.53, + "learning_rate": 9.449730107568637e-08, + "loss": 0.0006, + "step": 27218 + }, + { + "epoch": 0.53, + "learning_rate": 9.449341773135023e-08, + "loss": 0.0005, + "step": 27219 + }, + { + "epoch": 0.53, + "learning_rate": 9.448953438701409e-08, + "loss": 0.0005, + "step": 27220 + }, + { + "epoch": 0.53, + "learning_rate": 9.448565104267795e-08, + "loss": 0.0007, + "step": 27221 + }, + { + "epoch": 0.53, + "learning_rate": 9.44817676983418e-08, + "loss": 0.0005, + "step": 27222 + }, + { + "epoch": 0.53, + "learning_rate": 9.447788435400566e-08, + "loss": 0.001, + "step": 27223 + }, + { + "epoch": 0.53, + "learning_rate": 9.447400100966952e-08, + "loss": 0.0008, + "step": 27224 + }, + { + "epoch": 0.53, + "learning_rate": 9.447011766533338e-08, + "loss": 0.0004, + "step": 27225 + }, + { + "epoch": 0.53, + "learning_rate": 9.446623432099724e-08, + "loss": 0.0004, + "step": 27226 + }, + { + "epoch": 0.53, + "learning_rate": 9.44623509766611e-08, + "loss": 0.1057, + "step": 27227 + }, + { + "epoch": 0.53, + "learning_rate": 9.445846763232496e-08, + "loss": 0.0005, + "step": 27228 + }, + { + "epoch": 0.53, + "learning_rate": 9.445458428798881e-08, + "loss": 1.2279, + "step": 27229 + }, + { + "epoch": 0.53, + "learning_rate": 9.445070094365267e-08, + "loss": 0.0005, + "step": 27230 + }, + { + "epoch": 0.53, + "learning_rate": 9.444681759931653e-08, + "loss": 0.0059, + "step": 27231 + }, + { + "epoch": 0.53, + "learning_rate": 9.444293425498039e-08, + "loss": 0.0004, + "step": 27232 + }, + { + "epoch": 0.53, + "learning_rate": 9.443905091064425e-08, + "loss": 0.0008, + "step": 27233 + }, + { + "epoch": 0.53, + "learning_rate": 9.44351675663081e-08, + "loss": 0.001, + "step": 27234 + }, + { + "epoch": 0.53, + "learning_rate": 9.443128422197196e-08, + "loss": 0.0007, + "step": 27235 + }, + { + "epoch": 0.53, + "learning_rate": 9.442740087763582e-08, + "loss": 0.0004, + "step": 27236 + }, + { + "epoch": 0.53, + "learning_rate": 9.442351753329967e-08, + "loss": 0.2721, + "step": 27237 + }, + { + "epoch": 0.53, + "learning_rate": 9.441963418896352e-08, + "loss": 0.0007, + "step": 27238 + }, + { + "epoch": 0.53, + "learning_rate": 9.441575084462738e-08, + "loss": 0.6691, + "step": 27239 + }, + { + "epoch": 0.53, + "learning_rate": 9.441186750029124e-08, + "loss": 0.0004, + "step": 27240 + }, + { + "epoch": 0.53, + "learning_rate": 9.44079841559551e-08, + "loss": 0.0014, + "step": 27241 + }, + { + "epoch": 0.53, + "learning_rate": 9.440410081161896e-08, + "loss": 1.0095, + "step": 27242 + }, + { + "epoch": 0.53, + "learning_rate": 9.440021746728282e-08, + "loss": 0.0006, + "step": 27243 + }, + { + "epoch": 0.53, + "learning_rate": 9.439633412294667e-08, + "loss": 0.0014, + "step": 27244 + }, + { + "epoch": 0.53, + "learning_rate": 9.439245077861053e-08, + "loss": 0.0008, + "step": 27245 + }, + { + "epoch": 0.53, + "learning_rate": 9.438856743427439e-08, + "loss": 0.0005, + "step": 27246 + }, + { + "epoch": 0.53, + "learning_rate": 9.438468408993825e-08, + "loss": 0.0008, + "step": 27247 + }, + { + "epoch": 0.53, + "learning_rate": 9.438080074560211e-08, + "loss": 0.0006, + "step": 27248 + }, + { + "epoch": 0.53, + "learning_rate": 9.437691740126597e-08, + "loss": 0.0007, + "step": 27249 + }, + { + "epoch": 0.53, + "learning_rate": 9.437303405692982e-08, + "loss": 0.4193, + "step": 27250 + }, + { + "epoch": 0.53, + "learning_rate": 9.436915071259368e-08, + "loss": 0.0037, + "step": 27251 + }, + { + "epoch": 0.53, + "learning_rate": 9.436526736825754e-08, + "loss": 0.0008, + "step": 27252 + }, + { + "epoch": 0.53, + "learning_rate": 9.43613840239214e-08, + "loss": 0.0008, + "step": 27253 + }, + { + "epoch": 0.53, + "learning_rate": 9.435750067958526e-08, + "loss": 0.0004, + "step": 27254 + }, + { + "epoch": 0.53, + "learning_rate": 9.435361733524912e-08, + "loss": 0.728, + "step": 27255 + }, + { + "epoch": 0.53, + "learning_rate": 9.434973399091297e-08, + "loss": 0.0006, + "step": 27256 + }, + { + "epoch": 0.53, + "learning_rate": 9.434585064657683e-08, + "loss": 0.0942, + "step": 27257 + }, + { + "epoch": 0.53, + "learning_rate": 9.434196730224069e-08, + "loss": 0.0004, + "step": 27258 + }, + { + "epoch": 0.53, + "learning_rate": 9.433808395790455e-08, + "loss": 0.0004, + "step": 27259 + }, + { + "epoch": 0.53, + "learning_rate": 9.43342006135684e-08, + "loss": 0.0007, + "step": 27260 + }, + { + "epoch": 0.53, + "learning_rate": 9.433031726923226e-08, + "loss": 0.0218, + "step": 27261 + }, + { + "epoch": 0.53, + "learning_rate": 9.432643392489612e-08, + "loss": 0.0006, + "step": 27262 + }, + { + "epoch": 0.53, + "learning_rate": 9.432255058055998e-08, + "loss": 0.0007, + "step": 27263 + }, + { + "epoch": 0.53, + "learning_rate": 9.431866723622384e-08, + "loss": 0.0005, + "step": 27264 + }, + { + "epoch": 0.53, + "learning_rate": 9.43147838918877e-08, + "loss": 0.0006, + "step": 27265 + }, + { + "epoch": 0.53, + "learning_rate": 9.431090054755154e-08, + "loss": 0.0006, + "step": 27266 + }, + { + "epoch": 0.53, + "learning_rate": 9.43070172032154e-08, + "loss": 0.0007, + "step": 27267 + }, + { + "epoch": 0.53, + "learning_rate": 9.430313385887926e-08, + "loss": 0.0004, + "step": 27268 + }, + { + "epoch": 0.53, + "learning_rate": 9.429925051454312e-08, + "loss": 0.0005, + "step": 27269 + }, + { + "epoch": 0.53, + "learning_rate": 9.429536717020698e-08, + "loss": 0.0004, + "step": 27270 + }, + { + "epoch": 0.53, + "learning_rate": 9.429148382587083e-08, + "loss": 0.0006, + "step": 27271 + }, + { + "epoch": 0.53, + "learning_rate": 9.428760048153469e-08, + "loss": 0.0013, + "step": 27272 + }, + { + "epoch": 0.53, + "learning_rate": 9.428371713719855e-08, + "loss": 0.0005, + "step": 27273 + }, + { + "epoch": 0.53, + "learning_rate": 9.427983379286241e-08, + "loss": 0.0008, + "step": 27274 + }, + { + "epoch": 0.53, + "learning_rate": 9.427595044852627e-08, + "loss": 0.0007, + "step": 27275 + }, + { + "epoch": 0.53, + "learning_rate": 9.427206710419013e-08, + "loss": 0.0006, + "step": 27276 + }, + { + "epoch": 0.53, + "learning_rate": 9.426818375985398e-08, + "loss": 0.0005, + "step": 27277 + }, + { + "epoch": 0.53, + "learning_rate": 9.426430041551784e-08, + "loss": 1.4093, + "step": 27278 + }, + { + "epoch": 0.53, + "learning_rate": 9.42604170711817e-08, + "loss": 0.0004, + "step": 27279 + }, + { + "epoch": 0.53, + "learning_rate": 9.425653372684556e-08, + "loss": 0.0004, + "step": 27280 + }, + { + "epoch": 0.53, + "learning_rate": 9.425265038250942e-08, + "loss": 0.0007, + "step": 27281 + }, + { + "epoch": 0.53, + "learning_rate": 9.424876703817327e-08, + "loss": 0.0007, + "step": 27282 + }, + { + "epoch": 0.53, + "learning_rate": 9.424488369383713e-08, + "loss": 0.0004, + "step": 27283 + }, + { + "epoch": 0.53, + "learning_rate": 9.424100034950099e-08, + "loss": 0.0005, + "step": 27284 + }, + { + "epoch": 0.53, + "learning_rate": 9.423711700516485e-08, + "loss": 0.0007, + "step": 27285 + }, + { + "epoch": 0.53, + "learning_rate": 9.423323366082871e-08, + "loss": 0.0005, + "step": 27286 + }, + { + "epoch": 0.53, + "learning_rate": 9.422935031649257e-08, + "loss": 1.2072, + "step": 27287 + }, + { + "epoch": 0.53, + "learning_rate": 9.422546697215642e-08, + "loss": 0.3432, + "step": 27288 + }, + { + "epoch": 0.53, + "learning_rate": 9.422158362782028e-08, + "loss": 0.0006, + "step": 27289 + }, + { + "epoch": 0.53, + "learning_rate": 9.421770028348414e-08, + "loss": 0.0052, + "step": 27290 + }, + { + "epoch": 0.53, + "learning_rate": 9.4213816939148e-08, + "loss": 0.0009, + "step": 27291 + }, + { + "epoch": 0.53, + "learning_rate": 9.420993359481186e-08, + "loss": 0.0006, + "step": 27292 + }, + { + "epoch": 0.53, + "learning_rate": 9.420605025047572e-08, + "loss": 0.0007, + "step": 27293 + }, + { + "epoch": 0.53, + "learning_rate": 9.420216690613957e-08, + "loss": 0.0004, + "step": 27294 + }, + { + "epoch": 0.53, + "learning_rate": 9.419828356180342e-08, + "loss": 0.0005, + "step": 27295 + }, + { + "epoch": 0.53, + "learning_rate": 9.419440021746728e-08, + "loss": 0.0006, + "step": 27296 + }, + { + "epoch": 0.53, + "learning_rate": 9.419051687313113e-08, + "loss": 0.0006, + "step": 27297 + }, + { + "epoch": 0.53, + "learning_rate": 9.418663352879499e-08, + "loss": 0.0006, + "step": 27298 + }, + { + "epoch": 0.53, + "learning_rate": 9.418275018445885e-08, + "loss": 0.0006, + "step": 27299 + }, + { + "epoch": 0.53, + "learning_rate": 9.417886684012271e-08, + "loss": 0.0005, + "step": 27300 + }, + { + "epoch": 0.53, + "learning_rate": 9.417498349578657e-08, + "loss": 0.0006, + "step": 27301 + }, + { + "epoch": 0.53, + "learning_rate": 9.417110015145043e-08, + "loss": 0.0007, + "step": 27302 + }, + { + "epoch": 0.53, + "learning_rate": 9.416721680711428e-08, + "loss": 0.0004, + "step": 27303 + }, + { + "epoch": 0.53, + "learning_rate": 9.416333346277814e-08, + "loss": 0.0008, + "step": 27304 + }, + { + "epoch": 0.53, + "learning_rate": 9.4159450118442e-08, + "loss": 0.1327, + "step": 27305 + }, + { + "epoch": 0.53, + "learning_rate": 9.415556677410586e-08, + "loss": 0.0005, + "step": 27306 + }, + { + "epoch": 0.53, + "learning_rate": 9.415168342976972e-08, + "loss": 0.0007, + "step": 27307 + }, + { + "epoch": 0.53, + "learning_rate": 9.414780008543358e-08, + "loss": 0.0004, + "step": 27308 + }, + { + "epoch": 0.53, + "learning_rate": 9.414391674109743e-08, + "loss": 0.0006, + "step": 27309 + }, + { + "epoch": 0.53, + "learning_rate": 9.414003339676129e-08, + "loss": 0.0005, + "step": 27310 + }, + { + "epoch": 0.53, + "learning_rate": 9.413615005242515e-08, + "loss": 0.0006, + "step": 27311 + }, + { + "epoch": 0.53, + "learning_rate": 9.413226670808901e-08, + "loss": 0.0149, + "step": 27312 + }, + { + "epoch": 0.53, + "learning_rate": 9.412838336375287e-08, + "loss": 0.2892, + "step": 27313 + }, + { + "epoch": 0.53, + "learning_rate": 9.412450001941673e-08, + "loss": 0.0006, + "step": 27314 + }, + { + "epoch": 0.53, + "learning_rate": 9.412061667508058e-08, + "loss": 0.0004, + "step": 27315 + }, + { + "epoch": 0.53, + "learning_rate": 9.411673333074444e-08, + "loss": 0.0005, + "step": 27316 + }, + { + "epoch": 0.53, + "learning_rate": 9.41128499864083e-08, + "loss": 0.0008, + "step": 27317 + }, + { + "epoch": 0.53, + "learning_rate": 9.410896664207216e-08, + "loss": 0.0005, + "step": 27318 + }, + { + "epoch": 0.53, + "learning_rate": 9.410508329773602e-08, + "loss": 0.0006, + "step": 27319 + }, + { + "epoch": 0.53, + "learning_rate": 9.410119995339987e-08, + "loss": 0.0005, + "step": 27320 + }, + { + "epoch": 0.53, + "learning_rate": 9.409731660906372e-08, + "loss": 0.0008, + "step": 27321 + }, + { + "epoch": 0.53, + "learning_rate": 9.409343326472758e-08, + "loss": 1.0883, + "step": 27322 + }, + { + "epoch": 0.53, + "learning_rate": 9.408954992039144e-08, + "loss": 0.0006, + "step": 27323 + }, + { + "epoch": 0.53, + "learning_rate": 9.40856665760553e-08, + "loss": 0.0004, + "step": 27324 + }, + { + "epoch": 0.53, + "learning_rate": 9.408178323171915e-08, + "loss": 0.0011, + "step": 27325 + }, + { + "epoch": 0.53, + "learning_rate": 9.407789988738301e-08, + "loss": 0.0009, + "step": 27326 + }, + { + "epoch": 0.53, + "learning_rate": 9.407401654304687e-08, + "loss": 0.0005, + "step": 27327 + }, + { + "epoch": 0.53, + "learning_rate": 9.407013319871073e-08, + "loss": 0.0008, + "step": 27328 + }, + { + "epoch": 0.53, + "learning_rate": 9.406624985437459e-08, + "loss": 0.0007, + "step": 27329 + }, + { + "epoch": 0.53, + "learning_rate": 9.406236651003844e-08, + "loss": 0.0006, + "step": 27330 + }, + { + "epoch": 0.53, + "learning_rate": 9.40584831657023e-08, + "loss": 0.0004, + "step": 27331 + }, + { + "epoch": 0.53, + "learning_rate": 9.405459982136616e-08, + "loss": 0.0004, + "step": 27332 + }, + { + "epoch": 0.53, + "learning_rate": 9.405071647703002e-08, + "loss": 0.0027, + "step": 27333 + }, + { + "epoch": 0.53, + "learning_rate": 9.404683313269388e-08, + "loss": 0.0007, + "step": 27334 + }, + { + "epoch": 0.53, + "learning_rate": 9.404294978835772e-08, + "loss": 0.0626, + "step": 27335 + }, + { + "epoch": 0.53, + "learning_rate": 9.403906644402158e-08, + "loss": 0.0006, + "step": 27336 + }, + { + "epoch": 0.53, + "learning_rate": 9.403518309968544e-08, + "loss": 0.0004, + "step": 27337 + }, + { + "epoch": 0.53, + "learning_rate": 9.40312997553493e-08, + "loss": 0.0006, + "step": 27338 + }, + { + "epoch": 0.53, + "learning_rate": 9.402741641101315e-08, + "loss": 0.0005, + "step": 27339 + }, + { + "epoch": 0.53, + "learning_rate": 9.402353306667701e-08, + "loss": 0.0004, + "step": 27340 + }, + { + "epoch": 0.53, + "learning_rate": 9.401964972234087e-08, + "loss": 0.001, + "step": 27341 + }, + { + "epoch": 0.53, + "learning_rate": 9.401576637800473e-08, + "loss": 0.02, + "step": 27342 + }, + { + "epoch": 0.53, + "learning_rate": 9.401188303366859e-08, + "loss": 0.0006, + "step": 27343 + }, + { + "epoch": 0.53, + "learning_rate": 9.400799968933245e-08, + "loss": 0.0007, + "step": 27344 + }, + { + "epoch": 0.53, + "learning_rate": 9.40041163449963e-08, + "loss": 0.0007, + "step": 27345 + }, + { + "epoch": 0.53, + "learning_rate": 9.400023300066016e-08, + "loss": 0.0008, + "step": 27346 + }, + { + "epoch": 0.53, + "learning_rate": 9.399634965632402e-08, + "loss": 0.0008, + "step": 27347 + }, + { + "epoch": 0.53, + "learning_rate": 9.399246631198788e-08, + "loss": 0.0004, + "step": 27348 + }, + { + "epoch": 0.53, + "learning_rate": 9.398858296765174e-08, + "loss": 0.9328, + "step": 27349 + }, + { + "epoch": 0.53, + "learning_rate": 9.39846996233156e-08, + "loss": 0.0008, + "step": 27350 + }, + { + "epoch": 0.53, + "learning_rate": 9.398081627897945e-08, + "loss": 0.0005, + "step": 27351 + }, + { + "epoch": 0.53, + "learning_rate": 9.397693293464331e-08, + "loss": 0.0007, + "step": 27352 + }, + { + "epoch": 0.53, + "learning_rate": 9.397304959030716e-08, + "loss": 0.0005, + "step": 27353 + }, + { + "epoch": 0.53, + "learning_rate": 9.396916624597102e-08, + "loss": 0.001, + "step": 27354 + }, + { + "epoch": 0.53, + "learning_rate": 9.396528290163487e-08, + "loss": 0.0005, + "step": 27355 + }, + { + "epoch": 0.53, + "learning_rate": 9.396139955729873e-08, + "loss": 0.0014, + "step": 27356 + }, + { + "epoch": 0.53, + "learning_rate": 9.395751621296259e-08, + "loss": 0.0007, + "step": 27357 + }, + { + "epoch": 0.53, + "learning_rate": 9.395363286862645e-08, + "loss": 0.0005, + "step": 27358 + }, + { + "epoch": 0.53, + "learning_rate": 9.39497495242903e-08, + "loss": 0.0032, + "step": 27359 + }, + { + "epoch": 0.53, + "learning_rate": 9.394586617995416e-08, + "loss": 0.0006, + "step": 27360 + }, + { + "epoch": 0.53, + "learning_rate": 9.394198283561802e-08, + "loss": 0.0007, + "step": 27361 + }, + { + "epoch": 0.53, + "learning_rate": 9.393809949128188e-08, + "loss": 0.0005, + "step": 27362 + }, + { + "epoch": 0.53, + "learning_rate": 9.393421614694574e-08, + "loss": 0.0018, + "step": 27363 + }, + { + "epoch": 0.53, + "learning_rate": 9.39303328026096e-08, + "loss": 0.0005, + "step": 27364 + }, + { + "epoch": 0.53, + "learning_rate": 9.392644945827346e-08, + "loss": 0.0005, + "step": 27365 + }, + { + "epoch": 0.53, + "learning_rate": 9.392256611393731e-08, + "loss": 0.0005, + "step": 27366 + }, + { + "epoch": 0.53, + "learning_rate": 9.391868276960117e-08, + "loss": 0.0005, + "step": 27367 + }, + { + "epoch": 0.53, + "learning_rate": 9.391479942526503e-08, + "loss": 0.0004, + "step": 27368 + }, + { + "epoch": 0.53, + "learning_rate": 9.391091608092889e-08, + "loss": 0.0005, + "step": 27369 + }, + { + "epoch": 0.53, + "learning_rate": 9.390703273659275e-08, + "loss": 0.0005, + "step": 27370 + }, + { + "epoch": 0.53, + "learning_rate": 9.39031493922566e-08, + "loss": 0.0008, + "step": 27371 + }, + { + "epoch": 0.53, + "learning_rate": 9.389926604792046e-08, + "loss": 1.1484, + "step": 27372 + }, + { + "epoch": 0.53, + "learning_rate": 9.389538270358432e-08, + "loss": 0.0005, + "step": 27373 + }, + { + "epoch": 0.53, + "learning_rate": 9.389149935924818e-08, + "loss": 0.0004, + "step": 27374 + }, + { + "epoch": 0.53, + "learning_rate": 9.388761601491204e-08, + "loss": 0.0007, + "step": 27375 + }, + { + "epoch": 0.53, + "learning_rate": 9.38837326705759e-08, + "loss": 0.0005, + "step": 27376 + }, + { + "epoch": 0.53, + "learning_rate": 9.387984932623975e-08, + "loss": 0.0006, + "step": 27377 + }, + { + "epoch": 0.53, + "learning_rate": 9.387596598190361e-08, + "loss": 0.0099, + "step": 27378 + }, + { + "epoch": 0.53, + "learning_rate": 9.387208263756747e-08, + "loss": 0.0008, + "step": 27379 + }, + { + "epoch": 0.53, + "learning_rate": 9.386819929323133e-08, + "loss": 0.0036, + "step": 27380 + }, + { + "epoch": 0.53, + "learning_rate": 9.386431594889519e-08, + "loss": 0.0006, + "step": 27381 + }, + { + "epoch": 0.53, + "learning_rate": 9.386043260455903e-08, + "loss": 1.0202, + "step": 27382 + }, + { + "epoch": 0.53, + "learning_rate": 9.385654926022289e-08, + "loss": 0.0013, + "step": 27383 + }, + { + "epoch": 0.53, + "learning_rate": 9.385266591588675e-08, + "loss": 1.2076, + "step": 27384 + }, + { + "epoch": 0.53, + "learning_rate": 9.384878257155061e-08, + "loss": 0.0008, + "step": 27385 + }, + { + "epoch": 0.53, + "learning_rate": 9.384489922721447e-08, + "loss": 0.0004, + "step": 27386 + }, + { + "epoch": 0.53, + "learning_rate": 9.384101588287832e-08, + "loss": 0.0007, + "step": 27387 + }, + { + "epoch": 0.53, + "learning_rate": 9.383713253854218e-08, + "loss": 0.0004, + "step": 27388 + }, + { + "epoch": 0.53, + "learning_rate": 9.383324919420604e-08, + "loss": 0.0007, + "step": 27389 + }, + { + "epoch": 0.53, + "learning_rate": 9.38293658498699e-08, + "loss": 0.0006, + "step": 27390 + }, + { + "epoch": 0.53, + "learning_rate": 9.382548250553376e-08, + "loss": 0.0004, + "step": 27391 + }, + { + "epoch": 0.53, + "learning_rate": 9.382159916119762e-08, + "loss": 0.0005, + "step": 27392 + }, + { + "epoch": 0.53, + "learning_rate": 9.381771581686147e-08, + "loss": 0.0006, + "step": 27393 + }, + { + "epoch": 0.53, + "learning_rate": 9.381383247252533e-08, + "loss": 1.2188, + "step": 27394 + }, + { + "epoch": 0.53, + "learning_rate": 9.380994912818919e-08, + "loss": 0.0024, + "step": 27395 + }, + { + "epoch": 0.53, + "learning_rate": 9.380606578385305e-08, + "loss": 0.0007, + "step": 27396 + }, + { + "epoch": 0.53, + "learning_rate": 9.38021824395169e-08, + "loss": 0.0176, + "step": 27397 + }, + { + "epoch": 0.53, + "learning_rate": 9.379829909518076e-08, + "loss": 0.0004, + "step": 27398 + }, + { + "epoch": 0.53, + "learning_rate": 9.379441575084462e-08, + "loss": 0.0009, + "step": 27399 + }, + { + "epoch": 0.53, + "learning_rate": 9.379053240650848e-08, + "loss": 0.0005, + "step": 27400 + }, + { + "epoch": 0.53, + "learning_rate": 9.378664906217234e-08, + "loss": 0.0007, + "step": 27401 + }, + { + "epoch": 0.53, + "learning_rate": 9.37827657178362e-08, + "loss": 0.0005, + "step": 27402 + }, + { + "epoch": 0.53, + "learning_rate": 9.377888237350006e-08, + "loss": 0.5335, + "step": 27403 + }, + { + "epoch": 0.53, + "learning_rate": 9.377499902916391e-08, + "loss": 0.5401, + "step": 27404 + }, + { + "epoch": 0.53, + "learning_rate": 9.377111568482777e-08, + "loss": 0.0007, + "step": 27405 + }, + { + "epoch": 0.53, + "learning_rate": 9.376723234049163e-08, + "loss": 0.0005, + "step": 27406 + }, + { + "epoch": 0.53, + "learning_rate": 9.376334899615549e-08, + "loss": 0.0005, + "step": 27407 + }, + { + "epoch": 0.53, + "learning_rate": 9.375946565181935e-08, + "loss": 1.0493, + "step": 27408 + }, + { + "epoch": 0.53, + "learning_rate": 9.37555823074832e-08, + "loss": 0.0006, + "step": 27409 + }, + { + "epoch": 0.53, + "learning_rate": 9.375169896314706e-08, + "loss": 0.0101, + "step": 27410 + }, + { + "epoch": 0.53, + "learning_rate": 9.374781561881091e-08, + "loss": 0.0005, + "step": 27411 + }, + { + "epoch": 0.53, + "learning_rate": 9.374393227447477e-08, + "loss": 0.0006, + "step": 27412 + }, + { + "epoch": 0.53, + "learning_rate": 9.374004893013863e-08, + "loss": 1.0342, + "step": 27413 + }, + { + "epoch": 0.53, + "learning_rate": 9.373616558580248e-08, + "loss": 0.0004, + "step": 27414 + }, + { + "epoch": 0.53, + "learning_rate": 9.373228224146634e-08, + "loss": 0.7052, + "step": 27415 + }, + { + "epoch": 0.53, + "learning_rate": 9.37283988971302e-08, + "loss": 0.0005, + "step": 27416 + }, + { + "epoch": 0.53, + "learning_rate": 9.372451555279406e-08, + "loss": 0.0221, + "step": 27417 + }, + { + "epoch": 0.53, + "learning_rate": 9.372063220845792e-08, + "loss": 0.0006, + "step": 27418 + }, + { + "epoch": 0.53, + "learning_rate": 9.371674886412177e-08, + "loss": 0.0007, + "step": 27419 + }, + { + "epoch": 0.53, + "learning_rate": 9.371286551978563e-08, + "loss": 0.0458, + "step": 27420 + }, + { + "epoch": 0.53, + "learning_rate": 9.370898217544949e-08, + "loss": 0.0015, + "step": 27421 + }, + { + "epoch": 0.53, + "learning_rate": 9.370509883111335e-08, + "loss": 0.001, + "step": 27422 + }, + { + "epoch": 0.53, + "learning_rate": 9.370121548677721e-08, + "loss": 0.0015, + "step": 27423 + }, + { + "epoch": 0.53, + "learning_rate": 9.369733214244107e-08, + "loss": 0.0006, + "step": 27424 + }, + { + "epoch": 0.53, + "learning_rate": 9.369344879810492e-08, + "loss": 0.0006, + "step": 27425 + }, + { + "epoch": 0.53, + "learning_rate": 9.368956545376878e-08, + "loss": 0.0006, + "step": 27426 + }, + { + "epoch": 0.53, + "learning_rate": 9.368568210943264e-08, + "loss": 0.0007, + "step": 27427 + }, + { + "epoch": 0.53, + "learning_rate": 9.36817987650965e-08, + "loss": 0.0004, + "step": 27428 + }, + { + "epoch": 0.53, + "learning_rate": 9.367791542076036e-08, + "loss": 0.0005, + "step": 27429 + }, + { + "epoch": 0.53, + "learning_rate": 9.367403207642422e-08, + "loss": 0.0005, + "step": 27430 + }, + { + "epoch": 0.53, + "learning_rate": 9.367014873208807e-08, + "loss": 0.6018, + "step": 27431 + }, + { + "epoch": 0.53, + "learning_rate": 9.366626538775193e-08, + "loss": 0.0053, + "step": 27432 + }, + { + "epoch": 0.53, + "learning_rate": 9.366238204341579e-08, + "loss": 0.0005, + "step": 27433 + }, + { + "epoch": 0.53, + "learning_rate": 9.365849869907965e-08, + "loss": 0.0005, + "step": 27434 + }, + { + "epoch": 0.53, + "learning_rate": 9.36546153547435e-08, + "loss": 1.122, + "step": 27435 + }, + { + "epoch": 0.53, + "learning_rate": 9.365073201040736e-08, + "loss": 0.0005, + "step": 27436 + }, + { + "epoch": 0.53, + "learning_rate": 9.364684866607122e-08, + "loss": 0.001, + "step": 27437 + }, + { + "epoch": 0.53, + "learning_rate": 9.364296532173508e-08, + "loss": 0.0006, + "step": 27438 + }, + { + "epoch": 0.53, + "learning_rate": 9.363908197739894e-08, + "loss": 0.0004, + "step": 27439 + }, + { + "epoch": 0.53, + "learning_rate": 9.363519863306278e-08, + "loss": 0.0004, + "step": 27440 + }, + { + "epoch": 0.53, + "learning_rate": 9.363131528872664e-08, + "loss": 0.0008, + "step": 27441 + }, + { + "epoch": 0.53, + "learning_rate": 9.36274319443905e-08, + "loss": 0.0006, + "step": 27442 + }, + { + "epoch": 0.53, + "learning_rate": 9.362354860005436e-08, + "loss": 0.0006, + "step": 27443 + }, + { + "epoch": 0.53, + "learning_rate": 9.361966525571822e-08, + "loss": 0.0043, + "step": 27444 + }, + { + "epoch": 0.53, + "learning_rate": 9.361578191138208e-08, + "loss": 0.0043, + "step": 27445 + }, + { + "epoch": 0.53, + "learning_rate": 9.361189856704593e-08, + "loss": 0.3844, + "step": 27446 + }, + { + "epoch": 0.53, + "learning_rate": 9.360801522270979e-08, + "loss": 0.0354, + "step": 27447 + }, + { + "epoch": 0.53, + "learning_rate": 9.360413187837365e-08, + "loss": 0.0005, + "step": 27448 + }, + { + "epoch": 0.53, + "learning_rate": 9.360024853403751e-08, + "loss": 0.0005, + "step": 27449 + }, + { + "epoch": 0.53, + "learning_rate": 9.359636518970137e-08, + "loss": 0.0024, + "step": 27450 + }, + { + "epoch": 0.53, + "learning_rate": 9.359248184536523e-08, + "loss": 0.0004, + "step": 27451 + }, + { + "epoch": 0.53, + "learning_rate": 9.358859850102908e-08, + "loss": 0.0004, + "step": 27452 + }, + { + "epoch": 0.53, + "learning_rate": 9.358471515669294e-08, + "loss": 0.0016, + "step": 27453 + }, + { + "epoch": 0.53, + "learning_rate": 9.35808318123568e-08, + "loss": 0.0005, + "step": 27454 + }, + { + "epoch": 0.53, + "learning_rate": 9.357694846802066e-08, + "loss": 0.0006, + "step": 27455 + }, + { + "epoch": 0.53, + "learning_rate": 9.357306512368452e-08, + "loss": 0.0006, + "step": 27456 + }, + { + "epoch": 0.53, + "learning_rate": 9.356918177934837e-08, + "loss": 0.0004, + "step": 27457 + }, + { + "epoch": 0.53, + "learning_rate": 9.356529843501223e-08, + "loss": 0.0008, + "step": 27458 + }, + { + "epoch": 0.53, + "learning_rate": 9.356141509067609e-08, + "loss": 0.0007, + "step": 27459 + }, + { + "epoch": 0.53, + "learning_rate": 9.355753174633995e-08, + "loss": 0.0005, + "step": 27460 + }, + { + "epoch": 0.53, + "learning_rate": 9.355364840200381e-08, + "loss": 0.3832, + "step": 27461 + }, + { + "epoch": 0.53, + "learning_rate": 9.354976505766767e-08, + "loss": 0.0005, + "step": 27462 + }, + { + "epoch": 0.53, + "learning_rate": 9.354588171333152e-08, + "loss": 0.0423, + "step": 27463 + }, + { + "epoch": 0.53, + "learning_rate": 9.354199836899538e-08, + "loss": 0.4952, + "step": 27464 + }, + { + "epoch": 0.53, + "learning_rate": 9.353811502465924e-08, + "loss": 0.0005, + "step": 27465 + }, + { + "epoch": 0.53, + "learning_rate": 9.35342316803231e-08, + "loss": 0.0006, + "step": 27466 + }, + { + "epoch": 0.53, + "learning_rate": 9.353034833598696e-08, + "loss": 0.0004, + "step": 27467 + }, + { + "epoch": 0.53, + "learning_rate": 9.352646499165082e-08, + "loss": 0.0011, + "step": 27468 + }, + { + "epoch": 0.53, + "learning_rate": 9.352258164731466e-08, + "loss": 0.0005, + "step": 27469 + }, + { + "epoch": 0.53, + "learning_rate": 9.351869830297852e-08, + "loss": 0.0018, + "step": 27470 + }, + { + "epoch": 0.53, + "learning_rate": 9.351481495864238e-08, + "loss": 0.0009, + "step": 27471 + }, + { + "epoch": 0.53, + "learning_rate": 9.351093161430624e-08, + "loss": 0.0005, + "step": 27472 + }, + { + "epoch": 0.53, + "learning_rate": 9.350704826997009e-08, + "loss": 0.0017, + "step": 27473 + }, + { + "epoch": 0.53, + "learning_rate": 9.350316492563395e-08, + "loss": 0.0008, + "step": 27474 + }, + { + "epoch": 0.53, + "learning_rate": 9.349928158129781e-08, + "loss": 0.0005, + "step": 27475 + }, + { + "epoch": 0.53, + "learning_rate": 9.349539823696167e-08, + "loss": 0.0007, + "step": 27476 + }, + { + "epoch": 0.53, + "learning_rate": 9.349151489262553e-08, + "loss": 0.0005, + "step": 27477 + }, + { + "epoch": 0.53, + "learning_rate": 9.348763154828938e-08, + "loss": 0.0004, + "step": 27478 + }, + { + "epoch": 0.53, + "learning_rate": 9.348374820395324e-08, + "loss": 0.0011, + "step": 27479 + }, + { + "epoch": 0.53, + "learning_rate": 9.34798648596171e-08, + "loss": 0.0041, + "step": 27480 + }, + { + "epoch": 0.53, + "learning_rate": 9.347598151528096e-08, + "loss": 0.0008, + "step": 27481 + }, + { + "epoch": 0.53, + "learning_rate": 9.347209817094482e-08, + "loss": 0.0004, + "step": 27482 + }, + { + "epoch": 0.53, + "learning_rate": 9.346821482660868e-08, + "loss": 0.5737, + "step": 27483 + }, + { + "epoch": 0.53, + "learning_rate": 9.346433148227253e-08, + "loss": 0.0005, + "step": 27484 + }, + { + "epoch": 0.53, + "learning_rate": 9.346044813793639e-08, + "loss": 0.0006, + "step": 27485 + }, + { + "epoch": 0.53, + "learning_rate": 9.345656479360025e-08, + "loss": 0.0004, + "step": 27486 + }, + { + "epoch": 0.53, + "learning_rate": 9.345268144926411e-08, + "loss": 0.0011, + "step": 27487 + }, + { + "epoch": 0.53, + "learning_rate": 9.344879810492797e-08, + "loss": 0.0005, + "step": 27488 + }, + { + "epoch": 0.53, + "learning_rate": 9.344491476059183e-08, + "loss": 0.0005, + "step": 27489 + }, + { + "epoch": 0.53, + "learning_rate": 9.344103141625568e-08, + "loss": 0.0006, + "step": 27490 + }, + { + "epoch": 0.53, + "learning_rate": 9.343714807191954e-08, + "loss": 0.0007, + "step": 27491 + }, + { + "epoch": 0.53, + "learning_rate": 9.34332647275834e-08, + "loss": 0.0007, + "step": 27492 + }, + { + "epoch": 0.53, + "learning_rate": 9.342938138324726e-08, + "loss": 0.0004, + "step": 27493 + }, + { + "epoch": 0.53, + "learning_rate": 9.342549803891112e-08, + "loss": 0.0004, + "step": 27494 + }, + { + "epoch": 0.53, + "learning_rate": 9.342161469457497e-08, + "loss": 0.7652, + "step": 27495 + }, + { + "epoch": 0.53, + "learning_rate": 9.341773135023883e-08, + "loss": 0.0015, + "step": 27496 + }, + { + "epoch": 0.53, + "learning_rate": 9.341384800590269e-08, + "loss": 0.0005, + "step": 27497 + }, + { + "epoch": 0.53, + "learning_rate": 9.340996466156654e-08, + "loss": 0.0006, + "step": 27498 + }, + { + "epoch": 0.53, + "learning_rate": 9.34060813172304e-08, + "loss": 0.0004, + "step": 27499 + }, + { + "epoch": 0.53, + "learning_rate": 9.340219797289425e-08, + "loss": 0.0007, + "step": 27500 + }, + { + "epoch": 0.53, + "learning_rate": 9.339831462855811e-08, + "loss": 0.0016, + "step": 27501 + }, + { + "epoch": 0.53, + "learning_rate": 9.339443128422197e-08, + "loss": 0.0004, + "step": 27502 + }, + { + "epoch": 0.53, + "learning_rate": 9.339054793988583e-08, + "loss": 0.0055, + "step": 27503 + }, + { + "epoch": 0.53, + "learning_rate": 9.338666459554969e-08, + "loss": 0.0007, + "step": 27504 + }, + { + "epoch": 0.53, + "learning_rate": 9.338278125121354e-08, + "loss": 0.0005, + "step": 27505 + }, + { + "epoch": 0.53, + "learning_rate": 9.33788979068774e-08, + "loss": 0.0005, + "step": 27506 + }, + { + "epoch": 0.53, + "learning_rate": 9.337501456254126e-08, + "loss": 0.0024, + "step": 27507 + }, + { + "epoch": 0.53, + "learning_rate": 9.337113121820512e-08, + "loss": 0.221, + "step": 27508 + }, + { + "epoch": 0.53, + "learning_rate": 9.336724787386898e-08, + "loss": 0.0005, + "step": 27509 + }, + { + "epoch": 0.53, + "learning_rate": 9.336336452953284e-08, + "loss": 0.0004, + "step": 27510 + }, + { + "epoch": 0.53, + "learning_rate": 9.335948118519669e-08, + "loss": 0.0004, + "step": 27511 + }, + { + "epoch": 0.53, + "learning_rate": 9.335559784086054e-08, + "loss": 0.0005, + "step": 27512 + }, + { + "epoch": 0.53, + "learning_rate": 9.33517144965244e-08, + "loss": 0.0004, + "step": 27513 + }, + { + "epoch": 0.53, + "learning_rate": 9.334783115218825e-08, + "loss": 0.0007, + "step": 27514 + }, + { + "epoch": 0.53, + "learning_rate": 9.334394780785211e-08, + "loss": 1.0365, + "step": 27515 + }, + { + "epoch": 0.53, + "learning_rate": 9.334006446351597e-08, + "loss": 0.0004, + "step": 27516 + }, + { + "epoch": 0.53, + "learning_rate": 9.333618111917983e-08, + "loss": 0.001, + "step": 27517 + }, + { + "epoch": 0.53, + "learning_rate": 9.333229777484369e-08, + "loss": 0.0005, + "step": 27518 + }, + { + "epoch": 0.53, + "learning_rate": 9.332841443050755e-08, + "loss": 0.0005, + "step": 27519 + }, + { + "epoch": 0.53, + "learning_rate": 9.33245310861714e-08, + "loss": 0.0005, + "step": 27520 + }, + { + "epoch": 0.53, + "learning_rate": 9.332064774183526e-08, + "loss": 0.0006, + "step": 27521 + }, + { + "epoch": 0.53, + "learning_rate": 9.331676439749912e-08, + "loss": 0.0006, + "step": 27522 + }, + { + "epoch": 0.53, + "learning_rate": 9.331288105316298e-08, + "loss": 0.0007, + "step": 27523 + }, + { + "epoch": 0.53, + "learning_rate": 9.330899770882684e-08, + "loss": 0.0009, + "step": 27524 + }, + { + "epoch": 0.53, + "learning_rate": 9.33051143644907e-08, + "loss": 0.0006, + "step": 27525 + }, + { + "epoch": 0.53, + "learning_rate": 9.330123102015455e-08, + "loss": 0.3707, + "step": 27526 + }, + { + "epoch": 0.53, + "learning_rate": 9.32973476758184e-08, + "loss": 0.0005, + "step": 27527 + }, + { + "epoch": 0.53, + "learning_rate": 9.329346433148226e-08, + "loss": 0.3284, + "step": 27528 + }, + { + "epoch": 0.53, + "learning_rate": 9.328958098714612e-08, + "loss": 0.0044, + "step": 27529 + }, + { + "epoch": 0.53, + "learning_rate": 9.328569764280997e-08, + "loss": 0.0005, + "step": 27530 + }, + { + "epoch": 0.53, + "learning_rate": 9.328181429847383e-08, + "loss": 0.0007, + "step": 27531 + }, + { + "epoch": 0.53, + "learning_rate": 9.327793095413769e-08, + "loss": 0.0005, + "step": 27532 + }, + { + "epoch": 0.53, + "learning_rate": 9.327404760980155e-08, + "loss": 0.0005, + "step": 27533 + }, + { + "epoch": 0.53, + "learning_rate": 9.32701642654654e-08, + "loss": 0.0014, + "step": 27534 + }, + { + "epoch": 0.53, + "learning_rate": 9.326628092112926e-08, + "loss": 0.0004, + "step": 27535 + }, + { + "epoch": 0.53, + "learning_rate": 9.326239757679312e-08, + "loss": 0.0008, + "step": 27536 + }, + { + "epoch": 0.53, + "learning_rate": 9.325851423245698e-08, + "loss": 0.0016, + "step": 27537 + }, + { + "epoch": 0.53, + "learning_rate": 9.325463088812084e-08, + "loss": 0.0061, + "step": 27538 + }, + { + "epoch": 0.53, + "learning_rate": 9.32507475437847e-08, + "loss": 0.0005, + "step": 27539 + }, + { + "epoch": 0.53, + "learning_rate": 9.324686419944856e-08, + "loss": 0.0005, + "step": 27540 + }, + { + "epoch": 0.53, + "learning_rate": 9.324298085511241e-08, + "loss": 0.0004, + "step": 27541 + }, + { + "epoch": 0.53, + "learning_rate": 9.323909751077627e-08, + "loss": 0.0353, + "step": 27542 + }, + { + "epoch": 0.53, + "learning_rate": 9.323521416644013e-08, + "loss": 0.0004, + "step": 27543 + }, + { + "epoch": 0.53, + "learning_rate": 9.323133082210399e-08, + "loss": 0.0005, + "step": 27544 + }, + { + "epoch": 0.53, + "learning_rate": 9.322744747776785e-08, + "loss": 0.0004, + "step": 27545 + }, + { + "epoch": 0.53, + "learning_rate": 9.32235641334317e-08, + "loss": 0.0008, + "step": 27546 + }, + { + "epoch": 0.53, + "learning_rate": 9.321968078909556e-08, + "loss": 0.0006, + "step": 27547 + }, + { + "epoch": 0.53, + "learning_rate": 9.321579744475942e-08, + "loss": 0.0005, + "step": 27548 + }, + { + "epoch": 0.53, + "learning_rate": 9.321191410042328e-08, + "loss": 0.1267, + "step": 27549 + }, + { + "epoch": 0.53, + "learning_rate": 9.320803075608714e-08, + "loss": 0.3082, + "step": 27550 + }, + { + "epoch": 0.53, + "learning_rate": 9.3204147411751e-08, + "loss": 1.136, + "step": 27551 + }, + { + "epoch": 0.53, + "learning_rate": 9.320026406741485e-08, + "loss": 0.0008, + "step": 27552 + }, + { + "epoch": 0.53, + "learning_rate": 9.319638072307871e-08, + "loss": 0.0004, + "step": 27553 + }, + { + "epoch": 0.53, + "learning_rate": 9.319249737874257e-08, + "loss": 0.0006, + "step": 27554 + }, + { + "epoch": 0.53, + "learning_rate": 9.318861403440643e-08, + "loss": 0.0009, + "step": 27555 + }, + { + "epoch": 0.53, + "learning_rate": 9.318473069007027e-08, + "loss": 0.0004, + "step": 27556 + }, + { + "epoch": 0.53, + "learning_rate": 9.318084734573413e-08, + "loss": 0.0009, + "step": 27557 + }, + { + "epoch": 0.53, + "learning_rate": 9.317696400139799e-08, + "loss": 0.0005, + "step": 27558 + }, + { + "epoch": 0.53, + "learning_rate": 9.317308065706185e-08, + "loss": 0.0009, + "step": 27559 + }, + { + "epoch": 0.53, + "learning_rate": 9.316919731272571e-08, + "loss": 0.0005, + "step": 27560 + }, + { + "epoch": 0.53, + "learning_rate": 9.316531396838957e-08, + "loss": 0.0006, + "step": 27561 + }, + { + "epoch": 0.53, + "learning_rate": 9.316143062405342e-08, + "loss": 0.0007, + "step": 27562 + }, + { + "epoch": 0.53, + "learning_rate": 9.315754727971728e-08, + "loss": 0.0014, + "step": 27563 + }, + { + "epoch": 0.53, + "learning_rate": 9.315366393538114e-08, + "loss": 0.0006, + "step": 27564 + }, + { + "epoch": 0.53, + "learning_rate": 9.3149780591045e-08, + "loss": 0.0005, + "step": 27565 + }, + { + "epoch": 0.53, + "learning_rate": 9.314589724670886e-08, + "loss": 0.0005, + "step": 27566 + }, + { + "epoch": 0.53, + "learning_rate": 9.314201390237272e-08, + "loss": 1.2197, + "step": 27567 + }, + { + "epoch": 0.53, + "learning_rate": 9.313813055803657e-08, + "loss": 0.0004, + "step": 27568 + }, + { + "epoch": 0.53, + "learning_rate": 9.313424721370043e-08, + "loss": 0.0005, + "step": 27569 + }, + { + "epoch": 0.53, + "learning_rate": 9.313036386936429e-08, + "loss": 0.0006, + "step": 27570 + }, + { + "epoch": 0.53, + "learning_rate": 9.312648052502815e-08, + "loss": 0.003, + "step": 27571 + }, + { + "epoch": 0.53, + "learning_rate": 9.3122597180692e-08, + "loss": 0.0006, + "step": 27572 + }, + { + "epoch": 0.53, + "learning_rate": 9.311871383635586e-08, + "loss": 0.0003, + "step": 27573 + }, + { + "epoch": 0.53, + "learning_rate": 9.311483049201972e-08, + "loss": 0.0006, + "step": 27574 + }, + { + "epoch": 0.53, + "learning_rate": 9.311094714768358e-08, + "loss": 0.0007, + "step": 27575 + }, + { + "epoch": 0.53, + "learning_rate": 9.310706380334744e-08, + "loss": 0.0005, + "step": 27576 + }, + { + "epoch": 0.53, + "learning_rate": 9.31031804590113e-08, + "loss": 0.0004, + "step": 27577 + }, + { + "epoch": 0.53, + "learning_rate": 9.309929711467516e-08, + "loss": 0.006, + "step": 27578 + }, + { + "epoch": 0.53, + "learning_rate": 9.309541377033901e-08, + "loss": 0.0006, + "step": 27579 + }, + { + "epoch": 0.53, + "learning_rate": 9.309153042600287e-08, + "loss": 0.0179, + "step": 27580 + }, + { + "epoch": 0.54, + "learning_rate": 9.308764708166673e-08, + "loss": 0.6569, + "step": 27581 + }, + { + "epoch": 0.54, + "learning_rate": 9.308376373733059e-08, + "loss": 0.0036, + "step": 27582 + }, + { + "epoch": 0.54, + "learning_rate": 9.307988039299445e-08, + "loss": 0.7794, + "step": 27583 + }, + { + "epoch": 0.54, + "learning_rate": 9.30759970486583e-08, + "loss": 0.0009, + "step": 27584 + }, + { + "epoch": 0.54, + "learning_rate": 9.307211370432215e-08, + "loss": 0.0005, + "step": 27585 + }, + { + "epoch": 0.54, + "learning_rate": 9.306823035998601e-08, + "loss": 0.0005, + "step": 27586 + }, + { + "epoch": 0.54, + "learning_rate": 9.306434701564987e-08, + "loss": 0.0009, + "step": 27587 + }, + { + "epoch": 0.54, + "learning_rate": 9.306046367131373e-08, + "loss": 0.0005, + "step": 27588 + }, + { + "epoch": 0.54, + "learning_rate": 9.305658032697758e-08, + "loss": 0.2102, + "step": 27589 + }, + { + "epoch": 0.54, + "learning_rate": 9.305269698264144e-08, + "loss": 0.0041, + "step": 27590 + }, + { + "epoch": 0.54, + "learning_rate": 9.30488136383053e-08, + "loss": 0.0005, + "step": 27591 + }, + { + "epoch": 0.54, + "learning_rate": 9.304493029396916e-08, + "loss": 1.0585, + "step": 27592 + }, + { + "epoch": 0.54, + "learning_rate": 9.304104694963302e-08, + "loss": 0.002, + "step": 27593 + }, + { + "epoch": 0.54, + "learning_rate": 9.303716360529687e-08, + "loss": 0.0005, + "step": 27594 + }, + { + "epoch": 0.54, + "learning_rate": 9.303328026096073e-08, + "loss": 0.0006, + "step": 27595 + }, + { + "epoch": 0.54, + "learning_rate": 9.302939691662459e-08, + "loss": 0.0004, + "step": 27596 + }, + { + "epoch": 0.54, + "learning_rate": 9.302551357228845e-08, + "loss": 0.0005, + "step": 27597 + }, + { + "epoch": 0.54, + "learning_rate": 9.302163022795231e-08, + "loss": 0.0006, + "step": 27598 + }, + { + "epoch": 0.54, + "learning_rate": 9.301774688361617e-08, + "loss": 0.8308, + "step": 27599 + }, + { + "epoch": 0.54, + "learning_rate": 9.301386353928002e-08, + "loss": 0.0006, + "step": 27600 + }, + { + "epoch": 0.54, + "learning_rate": 9.300998019494388e-08, + "loss": 0.0005, + "step": 27601 + }, + { + "epoch": 0.54, + "learning_rate": 9.300609685060774e-08, + "loss": 0.0004, + "step": 27602 + }, + { + "epoch": 0.54, + "learning_rate": 9.30022135062716e-08, + "loss": 1.0517, + "step": 27603 + }, + { + "epoch": 0.54, + "learning_rate": 9.299833016193546e-08, + "loss": 0.0006, + "step": 27604 + }, + { + "epoch": 0.54, + "learning_rate": 9.299444681759932e-08, + "loss": 0.0008, + "step": 27605 + }, + { + "epoch": 0.54, + "learning_rate": 9.299056347326317e-08, + "loss": 0.002, + "step": 27606 + }, + { + "epoch": 0.54, + "learning_rate": 9.298668012892703e-08, + "loss": 0.0005, + "step": 27607 + }, + { + "epoch": 0.54, + "learning_rate": 9.298279678459089e-08, + "loss": 0.0007, + "step": 27608 + }, + { + "epoch": 0.54, + "learning_rate": 9.297891344025475e-08, + "loss": 0.0005, + "step": 27609 + }, + { + "epoch": 0.54, + "learning_rate": 9.29750300959186e-08, + "loss": 0.0006, + "step": 27610 + }, + { + "epoch": 0.54, + "learning_rate": 9.297114675158246e-08, + "loss": 0.0016, + "step": 27611 + }, + { + "epoch": 0.54, + "learning_rate": 9.296726340724632e-08, + "loss": 0.0005, + "step": 27612 + }, + { + "epoch": 0.54, + "learning_rate": 9.296338006291018e-08, + "loss": 0.0004, + "step": 27613 + }, + { + "epoch": 0.54, + "learning_rate": 9.295949671857403e-08, + "loss": 0.0006, + "step": 27614 + }, + { + "epoch": 0.54, + "learning_rate": 9.295561337423788e-08, + "loss": 0.0008, + "step": 27615 + }, + { + "epoch": 0.54, + "learning_rate": 9.295173002990174e-08, + "loss": 0.2313, + "step": 27616 + }, + { + "epoch": 0.54, + "learning_rate": 9.29478466855656e-08, + "loss": 0.0006, + "step": 27617 + }, + { + "epoch": 0.54, + "learning_rate": 9.294396334122946e-08, + "loss": 0.0005, + "step": 27618 + }, + { + "epoch": 0.54, + "learning_rate": 9.294007999689332e-08, + "loss": 0.0004, + "step": 27619 + }, + { + "epoch": 0.54, + "learning_rate": 9.293619665255718e-08, + "loss": 0.0004, + "step": 27620 + }, + { + "epoch": 0.54, + "learning_rate": 9.293231330822103e-08, + "loss": 0.0005, + "step": 27621 + }, + { + "epoch": 0.54, + "learning_rate": 9.292842996388489e-08, + "loss": 0.0007, + "step": 27622 + }, + { + "epoch": 0.54, + "learning_rate": 9.292454661954875e-08, + "loss": 0.0072, + "step": 27623 + }, + { + "epoch": 0.54, + "learning_rate": 9.292066327521261e-08, + "loss": 0.0004, + "step": 27624 + }, + { + "epoch": 0.54, + "learning_rate": 9.291677993087647e-08, + "loss": 0.0004, + "step": 27625 + }, + { + "epoch": 0.54, + "learning_rate": 9.291289658654033e-08, + "loss": 0.0005, + "step": 27626 + }, + { + "epoch": 0.54, + "learning_rate": 9.290901324220418e-08, + "loss": 0.0418, + "step": 27627 + }, + { + "epoch": 0.54, + "learning_rate": 9.290512989786804e-08, + "loss": 0.0004, + "step": 27628 + }, + { + "epoch": 0.54, + "learning_rate": 9.29012465535319e-08, + "loss": 0.0005, + "step": 27629 + }, + { + "epoch": 0.54, + "learning_rate": 9.289736320919576e-08, + "loss": 0.0005, + "step": 27630 + }, + { + "epoch": 0.54, + "learning_rate": 9.289347986485962e-08, + "loss": 0.0006, + "step": 27631 + }, + { + "epoch": 0.54, + "learning_rate": 9.288959652052347e-08, + "loss": 0.0011, + "step": 27632 + }, + { + "epoch": 0.54, + "learning_rate": 9.288571317618733e-08, + "loss": 0.0006, + "step": 27633 + }, + { + "epoch": 0.54, + "learning_rate": 9.288182983185119e-08, + "loss": 0.0006, + "step": 27634 + }, + { + "epoch": 0.54, + "learning_rate": 9.287794648751505e-08, + "loss": 0.0003, + "step": 27635 + }, + { + "epoch": 0.54, + "learning_rate": 9.287406314317891e-08, + "loss": 0.0006, + "step": 27636 + }, + { + "epoch": 0.54, + "learning_rate": 9.287017979884277e-08, + "loss": 0.5381, + "step": 27637 + }, + { + "epoch": 0.54, + "learning_rate": 9.286629645450662e-08, + "loss": 0.0004, + "step": 27638 + }, + { + "epoch": 0.54, + "learning_rate": 9.286241311017048e-08, + "loss": 0.0007, + "step": 27639 + }, + { + "epoch": 0.54, + "learning_rate": 9.285852976583434e-08, + "loss": 0.0006, + "step": 27640 + }, + { + "epoch": 0.54, + "learning_rate": 9.28546464214982e-08, + "loss": 0.0006, + "step": 27641 + }, + { + "epoch": 0.54, + "learning_rate": 9.285076307716206e-08, + "loss": 0.0009, + "step": 27642 + }, + { + "epoch": 0.54, + "learning_rate": 9.28468797328259e-08, + "loss": 0.0027, + "step": 27643 + }, + { + "epoch": 0.54, + "learning_rate": 9.284299638848976e-08, + "loss": 0.0157, + "step": 27644 + }, + { + "epoch": 0.54, + "learning_rate": 9.283911304415362e-08, + "loss": 1.1532, + "step": 27645 + }, + { + "epoch": 0.54, + "learning_rate": 9.283522969981748e-08, + "loss": 0.0009, + "step": 27646 + }, + { + "epoch": 0.54, + "learning_rate": 9.283134635548134e-08, + "loss": 0.0005, + "step": 27647 + }, + { + "epoch": 0.54, + "learning_rate": 9.282746301114519e-08, + "loss": 0.0007, + "step": 27648 + }, + { + "epoch": 0.54, + "learning_rate": 9.282357966680905e-08, + "loss": 0.0005, + "step": 27649 + }, + { + "epoch": 0.54, + "learning_rate": 9.281969632247291e-08, + "loss": 0.0026, + "step": 27650 + }, + { + "epoch": 0.54, + "learning_rate": 9.281581297813677e-08, + "loss": 0.0037, + "step": 27651 + }, + { + "epoch": 0.54, + "learning_rate": 9.281192963380063e-08, + "loss": 0.0005, + "step": 27652 + }, + { + "epoch": 0.54, + "learning_rate": 9.280804628946448e-08, + "loss": 0.0003, + "step": 27653 + }, + { + "epoch": 0.54, + "learning_rate": 9.280416294512834e-08, + "loss": 0.0004, + "step": 27654 + }, + { + "epoch": 0.54, + "learning_rate": 9.28002796007922e-08, + "loss": 0.0006, + "step": 27655 + }, + { + "epoch": 0.54, + "learning_rate": 9.279639625645606e-08, + "loss": 0.0007, + "step": 27656 + }, + { + "epoch": 0.54, + "learning_rate": 9.279251291211992e-08, + "loss": 0.0011, + "step": 27657 + }, + { + "epoch": 0.54, + "learning_rate": 9.278862956778378e-08, + "loss": 0.0007, + "step": 27658 + }, + { + "epoch": 0.54, + "learning_rate": 9.278474622344763e-08, + "loss": 0.0027, + "step": 27659 + }, + { + "epoch": 0.54, + "learning_rate": 9.278086287911149e-08, + "loss": 0.0095, + "step": 27660 + }, + { + "epoch": 0.54, + "learning_rate": 9.277697953477535e-08, + "loss": 0.7416, + "step": 27661 + }, + { + "epoch": 0.54, + "learning_rate": 9.277309619043921e-08, + "loss": 0.446, + "step": 27662 + }, + { + "epoch": 0.54, + "learning_rate": 9.276921284610307e-08, + "loss": 0.0006, + "step": 27663 + }, + { + "epoch": 0.54, + "learning_rate": 9.276532950176693e-08, + "loss": 0.0004, + "step": 27664 + }, + { + "epoch": 0.54, + "learning_rate": 9.276144615743078e-08, + "loss": 0.0005, + "step": 27665 + }, + { + "epoch": 0.54, + "learning_rate": 9.275756281309464e-08, + "loss": 0.0005, + "step": 27666 + }, + { + "epoch": 0.54, + "learning_rate": 9.27536794687585e-08, + "loss": 0.0014, + "step": 27667 + }, + { + "epoch": 0.54, + "learning_rate": 9.274979612442236e-08, + "loss": 0.0005, + "step": 27668 + }, + { + "epoch": 0.54, + "learning_rate": 9.274591278008622e-08, + "loss": 0.0007, + "step": 27669 + }, + { + "epoch": 0.54, + "learning_rate": 9.274202943575007e-08, + "loss": 0.0004, + "step": 27670 + }, + { + "epoch": 0.54, + "learning_rate": 9.273814609141393e-08, + "loss": 0.0009, + "step": 27671 + }, + { + "epoch": 0.54, + "learning_rate": 9.273426274707778e-08, + "loss": 0.0008, + "step": 27672 + }, + { + "epoch": 0.54, + "learning_rate": 9.273037940274164e-08, + "loss": 0.0003, + "step": 27673 + }, + { + "epoch": 0.54, + "learning_rate": 9.27264960584055e-08, + "loss": 0.0008, + "step": 27674 + }, + { + "epoch": 0.54, + "learning_rate": 9.272261271406935e-08, + "loss": 0.0005, + "step": 27675 + }, + { + "epoch": 0.54, + "learning_rate": 9.271872936973321e-08, + "loss": 0.0005, + "step": 27676 + }, + { + "epoch": 0.54, + "learning_rate": 9.271484602539707e-08, + "loss": 0.0006, + "step": 27677 + }, + { + "epoch": 0.54, + "learning_rate": 9.271096268106093e-08, + "loss": 1.1833, + "step": 27678 + }, + { + "epoch": 0.54, + "learning_rate": 9.270707933672479e-08, + "loss": 0.1011, + "step": 27679 + }, + { + "epoch": 0.54, + "learning_rate": 9.270319599238864e-08, + "loss": 0.0006, + "step": 27680 + }, + { + "epoch": 0.54, + "learning_rate": 9.26993126480525e-08, + "loss": 0.001, + "step": 27681 + }, + { + "epoch": 0.54, + "learning_rate": 9.269542930371636e-08, + "loss": 0.0005, + "step": 27682 + }, + { + "epoch": 0.54, + "learning_rate": 9.269154595938022e-08, + "loss": 0.0019, + "step": 27683 + }, + { + "epoch": 0.54, + "learning_rate": 9.268766261504408e-08, + "loss": 0.0007, + "step": 27684 + }, + { + "epoch": 0.54, + "learning_rate": 9.268377927070794e-08, + "loss": 0.0007, + "step": 27685 + }, + { + "epoch": 0.54, + "learning_rate": 9.26798959263718e-08, + "loss": 0.8293, + "step": 27686 + }, + { + "epoch": 0.54, + "learning_rate": 9.267601258203565e-08, + "loss": 0.0313, + "step": 27687 + }, + { + "epoch": 0.54, + "learning_rate": 9.267212923769951e-08, + "loss": 0.0007, + "step": 27688 + }, + { + "epoch": 0.54, + "learning_rate": 9.266824589336335e-08, + "loss": 1.0567, + "step": 27689 + }, + { + "epoch": 0.54, + "learning_rate": 9.266436254902721e-08, + "loss": 0.0008, + "step": 27690 + }, + { + "epoch": 0.54, + "learning_rate": 9.266047920469107e-08, + "loss": 1.0349, + "step": 27691 + }, + { + "epoch": 0.54, + "learning_rate": 9.265659586035493e-08, + "loss": 0.0006, + "step": 27692 + }, + { + "epoch": 0.54, + "learning_rate": 9.265271251601879e-08, + "loss": 0.0009, + "step": 27693 + }, + { + "epoch": 0.54, + "learning_rate": 9.264882917168265e-08, + "loss": 0.1622, + "step": 27694 + }, + { + "epoch": 0.54, + "learning_rate": 9.26449458273465e-08, + "loss": 0.0008, + "step": 27695 + }, + { + "epoch": 0.54, + "learning_rate": 9.264106248301036e-08, + "loss": 0.0006, + "step": 27696 + }, + { + "epoch": 0.54, + "learning_rate": 9.263717913867422e-08, + "loss": 0.0007, + "step": 27697 + }, + { + "epoch": 0.54, + "learning_rate": 9.263329579433808e-08, + "loss": 0.0006, + "step": 27698 + }, + { + "epoch": 0.54, + "learning_rate": 9.262941245000194e-08, + "loss": 0.0005, + "step": 27699 + }, + { + "epoch": 0.54, + "learning_rate": 9.26255291056658e-08, + "loss": 0.0235, + "step": 27700 + }, + { + "epoch": 0.54, + "learning_rate": 9.262164576132965e-08, + "loss": 0.0026, + "step": 27701 + }, + { + "epoch": 0.54, + "learning_rate": 9.261776241699351e-08, + "loss": 0.0005, + "step": 27702 + }, + { + "epoch": 0.54, + "learning_rate": 9.261387907265737e-08, + "loss": 0.0005, + "step": 27703 + }, + { + "epoch": 0.54, + "learning_rate": 9.260999572832122e-08, + "loss": 0.6245, + "step": 27704 + }, + { + "epoch": 0.54, + "learning_rate": 9.260611238398507e-08, + "loss": 0.0005, + "step": 27705 + }, + { + "epoch": 0.54, + "learning_rate": 9.260222903964893e-08, + "loss": 0.0006, + "step": 27706 + }, + { + "epoch": 0.54, + "learning_rate": 9.259834569531279e-08, + "loss": 0.0767, + "step": 27707 + }, + { + "epoch": 0.54, + "learning_rate": 9.259446235097665e-08, + "loss": 0.0009, + "step": 27708 + }, + { + "epoch": 0.54, + "learning_rate": 9.25905790066405e-08, + "loss": 0.5869, + "step": 27709 + }, + { + "epoch": 0.54, + "learning_rate": 9.258669566230436e-08, + "loss": 0.0006, + "step": 27710 + }, + { + "epoch": 0.54, + "learning_rate": 9.258281231796822e-08, + "loss": 0.0004, + "step": 27711 + }, + { + "epoch": 0.54, + "learning_rate": 9.257892897363208e-08, + "loss": 0.6798, + "step": 27712 + }, + { + "epoch": 0.54, + "learning_rate": 9.257504562929594e-08, + "loss": 0.004, + "step": 27713 + }, + { + "epoch": 0.54, + "learning_rate": 9.25711622849598e-08, + "loss": 0.0004, + "step": 27714 + }, + { + "epoch": 0.54, + "learning_rate": 9.256727894062366e-08, + "loss": 0.0004, + "step": 27715 + }, + { + "epoch": 0.54, + "learning_rate": 9.256339559628751e-08, + "loss": 0.0005, + "step": 27716 + }, + { + "epoch": 0.54, + "learning_rate": 9.255951225195137e-08, + "loss": 0.0208, + "step": 27717 + }, + { + "epoch": 0.54, + "learning_rate": 9.255562890761523e-08, + "loss": 0.2905, + "step": 27718 + }, + { + "epoch": 0.54, + "learning_rate": 9.255174556327909e-08, + "loss": 0.0004, + "step": 27719 + }, + { + "epoch": 0.54, + "learning_rate": 9.254786221894295e-08, + "loss": 0.0004, + "step": 27720 + }, + { + "epoch": 0.54, + "learning_rate": 9.25439788746068e-08, + "loss": 0.0005, + "step": 27721 + }, + { + "epoch": 0.54, + "learning_rate": 9.254009553027066e-08, + "loss": 0.0004, + "step": 27722 + }, + { + "epoch": 0.54, + "learning_rate": 9.253621218593452e-08, + "loss": 0.0005, + "step": 27723 + }, + { + "epoch": 0.54, + "learning_rate": 9.253232884159838e-08, + "loss": 0.9943, + "step": 27724 + }, + { + "epoch": 0.54, + "learning_rate": 9.252844549726224e-08, + "loss": 0.0006, + "step": 27725 + }, + { + "epoch": 0.54, + "learning_rate": 9.25245621529261e-08, + "loss": 0.0006, + "step": 27726 + }, + { + "epoch": 0.54, + "learning_rate": 9.252067880858995e-08, + "loss": 0.0007, + "step": 27727 + }, + { + "epoch": 0.54, + "learning_rate": 9.251679546425381e-08, + "loss": 0.0304, + "step": 27728 + }, + { + "epoch": 0.54, + "learning_rate": 9.251291211991767e-08, + "loss": 0.0006, + "step": 27729 + }, + { + "epoch": 0.54, + "learning_rate": 9.250902877558152e-08, + "loss": 0.0005, + "step": 27730 + }, + { + "epoch": 0.54, + "learning_rate": 9.250514543124537e-08, + "loss": 0.0005, + "step": 27731 + }, + { + "epoch": 0.54, + "learning_rate": 9.250126208690923e-08, + "loss": 0.0005, + "step": 27732 + }, + { + "epoch": 0.54, + "learning_rate": 9.249737874257309e-08, + "loss": 0.0007, + "step": 27733 + }, + { + "epoch": 0.54, + "learning_rate": 9.249349539823695e-08, + "loss": 0.0006, + "step": 27734 + }, + { + "epoch": 0.54, + "learning_rate": 9.248961205390081e-08, + "loss": 0.0009, + "step": 27735 + }, + { + "epoch": 0.54, + "learning_rate": 9.248572870956467e-08, + "loss": 0.0486, + "step": 27736 + }, + { + "epoch": 0.54, + "learning_rate": 9.248184536522852e-08, + "loss": 0.0007, + "step": 27737 + }, + { + "epoch": 0.54, + "learning_rate": 9.247796202089238e-08, + "loss": 0.0007, + "step": 27738 + }, + { + "epoch": 0.54, + "learning_rate": 9.247407867655624e-08, + "loss": 0.0055, + "step": 27739 + }, + { + "epoch": 0.54, + "learning_rate": 9.24701953322201e-08, + "loss": 0.0006, + "step": 27740 + }, + { + "epoch": 0.54, + "learning_rate": 9.246631198788396e-08, + "loss": 0.0007, + "step": 27741 + }, + { + "epoch": 0.54, + "learning_rate": 9.246242864354782e-08, + "loss": 0.0006, + "step": 27742 + }, + { + "epoch": 0.54, + "learning_rate": 9.245854529921167e-08, + "loss": 0.0481, + "step": 27743 + }, + { + "epoch": 0.54, + "learning_rate": 9.245466195487553e-08, + "loss": 0.0005, + "step": 27744 + }, + { + "epoch": 0.54, + "learning_rate": 9.245077861053939e-08, + "loss": 0.0011, + "step": 27745 + }, + { + "epoch": 0.54, + "learning_rate": 9.244689526620325e-08, + "loss": 0.0004, + "step": 27746 + }, + { + "epoch": 0.54, + "learning_rate": 9.24430119218671e-08, + "loss": 0.0005, + "step": 27747 + }, + { + "epoch": 0.54, + "learning_rate": 9.243912857753096e-08, + "loss": 0.0004, + "step": 27748 + }, + { + "epoch": 0.54, + "learning_rate": 9.243524523319482e-08, + "loss": 0.0003, + "step": 27749 + }, + { + "epoch": 0.54, + "learning_rate": 9.243136188885868e-08, + "loss": 0.7196, + "step": 27750 + }, + { + "epoch": 0.54, + "learning_rate": 9.242747854452254e-08, + "loss": 0.0041, + "step": 27751 + }, + { + "epoch": 0.54, + "learning_rate": 9.24235952001864e-08, + "loss": 0.0006, + "step": 27752 + }, + { + "epoch": 0.54, + "learning_rate": 9.241971185585026e-08, + "loss": 0.2306, + "step": 27753 + }, + { + "epoch": 0.54, + "learning_rate": 9.241582851151411e-08, + "loss": 0.0017, + "step": 27754 + }, + { + "epoch": 0.54, + "learning_rate": 9.241194516717797e-08, + "loss": 0.0004, + "step": 27755 + }, + { + "epoch": 0.54, + "learning_rate": 9.240806182284183e-08, + "loss": 0.0006, + "step": 27756 + }, + { + "epoch": 0.54, + "learning_rate": 9.240417847850569e-08, + "loss": 0.0004, + "step": 27757 + }, + { + "epoch": 0.54, + "learning_rate": 9.240029513416955e-08, + "loss": 0.0005, + "step": 27758 + }, + { + "epoch": 0.54, + "learning_rate": 9.239641178983339e-08, + "loss": 0.0005, + "step": 27759 + }, + { + "epoch": 0.54, + "learning_rate": 9.239252844549725e-08, + "loss": 0.0004, + "step": 27760 + }, + { + "epoch": 0.54, + "learning_rate": 9.238864510116111e-08, + "loss": 0.0006, + "step": 27761 + }, + { + "epoch": 0.54, + "learning_rate": 9.238476175682497e-08, + "loss": 0.002, + "step": 27762 + }, + { + "epoch": 0.54, + "learning_rate": 9.238087841248883e-08, + "loss": 0.0046, + "step": 27763 + }, + { + "epoch": 0.54, + "learning_rate": 9.237699506815268e-08, + "loss": 0.0008, + "step": 27764 + }, + { + "epoch": 0.54, + "learning_rate": 9.237311172381654e-08, + "loss": 0.0004, + "step": 27765 + }, + { + "epoch": 0.54, + "learning_rate": 9.23692283794804e-08, + "loss": 0.0006, + "step": 27766 + }, + { + "epoch": 0.54, + "learning_rate": 9.236534503514426e-08, + "loss": 0.0006, + "step": 27767 + }, + { + "epoch": 0.54, + "learning_rate": 9.236146169080812e-08, + "loss": 0.0005, + "step": 27768 + }, + { + "epoch": 0.54, + "learning_rate": 9.235757834647197e-08, + "loss": 0.0005, + "step": 27769 + }, + { + "epoch": 0.54, + "learning_rate": 9.235369500213583e-08, + "loss": 0.0008, + "step": 27770 + }, + { + "epoch": 0.54, + "learning_rate": 9.234981165779969e-08, + "loss": 0.0005, + "step": 27771 + }, + { + "epoch": 0.54, + "learning_rate": 9.234592831346355e-08, + "loss": 0.0094, + "step": 27772 + }, + { + "epoch": 0.54, + "learning_rate": 9.234204496912741e-08, + "loss": 0.0011, + "step": 27773 + }, + { + "epoch": 0.54, + "learning_rate": 9.233816162479127e-08, + "loss": 0.0004, + "step": 27774 + }, + { + "epoch": 0.54, + "learning_rate": 9.233427828045512e-08, + "loss": 0.0004, + "step": 27775 + }, + { + "epoch": 0.54, + "learning_rate": 9.233039493611898e-08, + "loss": 0.0006, + "step": 27776 + }, + { + "epoch": 0.54, + "learning_rate": 9.232651159178284e-08, + "loss": 0.0007, + "step": 27777 + }, + { + "epoch": 0.54, + "learning_rate": 9.23226282474467e-08, + "loss": 0.0006, + "step": 27778 + }, + { + "epoch": 0.54, + "learning_rate": 9.231874490311056e-08, + "loss": 0.0006, + "step": 27779 + }, + { + "epoch": 0.54, + "learning_rate": 9.231486155877442e-08, + "loss": 0.0007, + "step": 27780 + }, + { + "epoch": 0.54, + "learning_rate": 9.231097821443827e-08, + "loss": 0.0005, + "step": 27781 + }, + { + "epoch": 0.54, + "learning_rate": 9.230709487010213e-08, + "loss": 0.2403, + "step": 27782 + }, + { + "epoch": 0.54, + "learning_rate": 9.230321152576599e-08, + "loss": 0.0004, + "step": 27783 + }, + { + "epoch": 0.54, + "learning_rate": 9.229932818142985e-08, + "loss": 0.0006, + "step": 27784 + }, + { + "epoch": 0.54, + "learning_rate": 9.229544483709371e-08, + "loss": 0.0011, + "step": 27785 + }, + { + "epoch": 0.54, + "learning_rate": 9.229156149275756e-08, + "loss": 0.0005, + "step": 27786 + }, + { + "epoch": 0.54, + "learning_rate": 9.228767814842142e-08, + "loss": 0.0003, + "step": 27787 + }, + { + "epoch": 0.54, + "learning_rate": 9.228379480408527e-08, + "loss": 0.0006, + "step": 27788 + }, + { + "epoch": 0.54, + "learning_rate": 9.227991145974913e-08, + "loss": 0.0004, + "step": 27789 + }, + { + "epoch": 0.54, + "learning_rate": 9.227602811541298e-08, + "loss": 0.0005, + "step": 27790 + }, + { + "epoch": 0.54, + "learning_rate": 9.227214477107684e-08, + "loss": 0.0004, + "step": 27791 + }, + { + "epoch": 0.54, + "learning_rate": 9.22682614267407e-08, + "loss": 0.0005, + "step": 27792 + }, + { + "epoch": 0.54, + "learning_rate": 9.226437808240456e-08, + "loss": 0.001, + "step": 27793 + }, + { + "epoch": 0.54, + "learning_rate": 9.226049473806842e-08, + "loss": 0.0006, + "step": 27794 + }, + { + "epoch": 0.54, + "learning_rate": 9.225661139373228e-08, + "loss": 0.0006, + "step": 27795 + }, + { + "epoch": 0.54, + "learning_rate": 9.225272804939613e-08, + "loss": 0.0005, + "step": 27796 + }, + { + "epoch": 0.54, + "learning_rate": 9.224884470505999e-08, + "loss": 0.0005, + "step": 27797 + }, + { + "epoch": 0.54, + "learning_rate": 9.224496136072385e-08, + "loss": 0.0007, + "step": 27798 + }, + { + "epoch": 0.54, + "learning_rate": 9.224107801638771e-08, + "loss": 0.0005, + "step": 27799 + }, + { + "epoch": 0.54, + "learning_rate": 9.223719467205157e-08, + "loss": 0.0004, + "step": 27800 + }, + { + "epoch": 0.54, + "learning_rate": 9.223331132771543e-08, + "loss": 0.0005, + "step": 27801 + }, + { + "epoch": 0.54, + "learning_rate": 9.222942798337928e-08, + "loss": 0.0007, + "step": 27802 + }, + { + "epoch": 0.54, + "learning_rate": 9.222554463904314e-08, + "loss": 0.0075, + "step": 27803 + }, + { + "epoch": 0.54, + "learning_rate": 9.2221661294707e-08, + "loss": 1.2937, + "step": 27804 + }, + { + "epoch": 0.54, + "learning_rate": 9.221777795037086e-08, + "loss": 0.0006, + "step": 27805 + }, + { + "epoch": 0.54, + "learning_rate": 9.221389460603472e-08, + "loss": 0.0005, + "step": 27806 + }, + { + "epoch": 0.54, + "learning_rate": 9.221001126169857e-08, + "loss": 0.0005, + "step": 27807 + }, + { + "epoch": 0.54, + "learning_rate": 9.220612791736243e-08, + "loss": 0.0071, + "step": 27808 + }, + { + "epoch": 0.54, + "learning_rate": 9.220224457302629e-08, + "loss": 0.0008, + "step": 27809 + }, + { + "epoch": 0.54, + "learning_rate": 9.219836122869015e-08, + "loss": 0.0005, + "step": 27810 + }, + { + "epoch": 0.54, + "learning_rate": 9.219447788435401e-08, + "loss": 0.0004, + "step": 27811 + }, + { + "epoch": 0.54, + "learning_rate": 9.219059454001787e-08, + "loss": 0.0046, + "step": 27812 + }, + { + "epoch": 0.54, + "learning_rate": 9.218671119568172e-08, + "loss": 0.0004, + "step": 27813 + }, + { + "epoch": 0.54, + "learning_rate": 9.218282785134558e-08, + "loss": 0.0005, + "step": 27814 + }, + { + "epoch": 0.54, + "learning_rate": 9.217894450700944e-08, + "loss": 0.0005, + "step": 27815 + }, + { + "epoch": 0.54, + "learning_rate": 9.21750611626733e-08, + "loss": 0.0007, + "step": 27816 + }, + { + "epoch": 0.54, + "learning_rate": 9.217117781833714e-08, + "loss": 0.0006, + "step": 27817 + }, + { + "epoch": 0.54, + "learning_rate": 9.2167294474001e-08, + "loss": 0.0006, + "step": 27818 + }, + { + "epoch": 0.54, + "learning_rate": 9.216341112966486e-08, + "loss": 0.0006, + "step": 27819 + }, + { + "epoch": 0.54, + "learning_rate": 9.215952778532872e-08, + "loss": 0.0028, + "step": 27820 + }, + { + "epoch": 0.54, + "learning_rate": 9.215564444099258e-08, + "loss": 0.0006, + "step": 27821 + }, + { + "epoch": 0.54, + "learning_rate": 9.215176109665644e-08, + "loss": 0.0006, + "step": 27822 + }, + { + "epoch": 0.54, + "learning_rate": 9.21478777523203e-08, + "loss": 0.0004, + "step": 27823 + }, + { + "epoch": 0.54, + "learning_rate": 9.214399440798415e-08, + "loss": 0.0011, + "step": 27824 + }, + { + "epoch": 0.54, + "learning_rate": 9.214011106364801e-08, + "loss": 0.0005, + "step": 27825 + }, + { + "epoch": 0.54, + "learning_rate": 9.213622771931187e-08, + "loss": 0.0008, + "step": 27826 + }, + { + "epoch": 0.54, + "learning_rate": 9.213234437497573e-08, + "loss": 0.0006, + "step": 27827 + }, + { + "epoch": 0.54, + "learning_rate": 9.212846103063958e-08, + "loss": 0.0007, + "step": 27828 + }, + { + "epoch": 0.54, + "learning_rate": 9.212457768630344e-08, + "loss": 0.0006, + "step": 27829 + }, + { + "epoch": 0.54, + "learning_rate": 9.21206943419673e-08, + "loss": 0.0006, + "step": 27830 + }, + { + "epoch": 0.54, + "learning_rate": 9.211681099763116e-08, + "loss": 0.0006, + "step": 27831 + }, + { + "epoch": 0.54, + "learning_rate": 9.211292765329502e-08, + "loss": 0.0004, + "step": 27832 + }, + { + "epoch": 0.54, + "learning_rate": 9.210904430895888e-08, + "loss": 0.0026, + "step": 27833 + }, + { + "epoch": 0.54, + "learning_rate": 9.210516096462273e-08, + "loss": 0.5319, + "step": 27834 + }, + { + "epoch": 0.54, + "learning_rate": 9.210127762028659e-08, + "loss": 0.0005, + "step": 27835 + }, + { + "epoch": 0.54, + "learning_rate": 9.209739427595045e-08, + "loss": 0.3321, + "step": 27836 + }, + { + "epoch": 0.54, + "learning_rate": 9.209351093161431e-08, + "loss": 0.0008, + "step": 27837 + }, + { + "epoch": 0.54, + "learning_rate": 9.208962758727817e-08, + "loss": 0.0009, + "step": 27838 + }, + { + "epoch": 0.54, + "learning_rate": 9.208574424294203e-08, + "loss": 0.0005, + "step": 27839 + }, + { + "epoch": 0.54, + "learning_rate": 9.208186089860588e-08, + "loss": 0.0005, + "step": 27840 + }, + { + "epoch": 0.54, + "learning_rate": 9.207797755426974e-08, + "loss": 0.0005, + "step": 27841 + }, + { + "epoch": 0.54, + "learning_rate": 9.20740942099336e-08, + "loss": 0.0004, + "step": 27842 + }, + { + "epoch": 0.54, + "learning_rate": 9.207021086559746e-08, + "loss": 0.0007, + "step": 27843 + }, + { + "epoch": 0.54, + "learning_rate": 9.206632752126132e-08, + "loss": 0.0007, + "step": 27844 + }, + { + "epoch": 0.54, + "learning_rate": 9.206244417692517e-08, + "loss": 0.0005, + "step": 27845 + }, + { + "epoch": 0.54, + "learning_rate": 9.205856083258902e-08, + "loss": 1.0437, + "step": 27846 + }, + { + "epoch": 0.54, + "learning_rate": 9.205467748825288e-08, + "loss": 0.0004, + "step": 27847 + }, + { + "epoch": 0.54, + "learning_rate": 9.205079414391674e-08, + "loss": 0.0005, + "step": 27848 + }, + { + "epoch": 0.54, + "learning_rate": 9.20469107995806e-08, + "loss": 0.0004, + "step": 27849 + }, + { + "epoch": 0.54, + "learning_rate": 9.204302745524445e-08, + "loss": 0.2045, + "step": 27850 + }, + { + "epoch": 0.54, + "learning_rate": 9.203914411090831e-08, + "loss": 0.0006, + "step": 27851 + }, + { + "epoch": 0.54, + "learning_rate": 9.203526076657217e-08, + "loss": 0.0005, + "step": 27852 + }, + { + "epoch": 0.54, + "learning_rate": 9.203137742223603e-08, + "loss": 0.1319, + "step": 27853 + }, + { + "epoch": 0.54, + "learning_rate": 9.202749407789989e-08, + "loss": 0.0003, + "step": 27854 + }, + { + "epoch": 0.54, + "learning_rate": 9.202361073356374e-08, + "loss": 0.0005, + "step": 27855 + }, + { + "epoch": 0.54, + "learning_rate": 9.20197273892276e-08, + "loss": 0.0931, + "step": 27856 + }, + { + "epoch": 0.54, + "learning_rate": 9.201584404489146e-08, + "loss": 0.7212, + "step": 27857 + }, + { + "epoch": 0.54, + "learning_rate": 9.201196070055532e-08, + "loss": 0.0006, + "step": 27858 + }, + { + "epoch": 0.54, + "learning_rate": 9.200807735621918e-08, + "loss": 0.5315, + "step": 27859 + }, + { + "epoch": 0.54, + "learning_rate": 9.200419401188304e-08, + "loss": 0.0004, + "step": 27860 + }, + { + "epoch": 0.54, + "learning_rate": 9.20003106675469e-08, + "loss": 0.8438, + "step": 27861 + }, + { + "epoch": 0.54, + "learning_rate": 9.199642732321075e-08, + "loss": 0.0005, + "step": 27862 + }, + { + "epoch": 0.54, + "learning_rate": 9.199254397887461e-08, + "loss": 0.0005, + "step": 27863 + }, + { + "epoch": 0.54, + "learning_rate": 9.198866063453847e-08, + "loss": 0.0939, + "step": 27864 + }, + { + "epoch": 0.54, + "learning_rate": 9.198477729020233e-08, + "loss": 0.0004, + "step": 27865 + }, + { + "epoch": 0.54, + "learning_rate": 9.198089394586617e-08, + "loss": 0.0005, + "step": 27866 + }, + { + "epoch": 0.54, + "learning_rate": 9.197701060153003e-08, + "loss": 0.0008, + "step": 27867 + }, + { + "epoch": 0.54, + "learning_rate": 9.197312725719389e-08, + "loss": 0.0009, + "step": 27868 + }, + { + "epoch": 0.54, + "learning_rate": 9.196924391285775e-08, + "loss": 0.0004, + "step": 27869 + }, + { + "epoch": 0.54, + "learning_rate": 9.19653605685216e-08, + "loss": 0.0005, + "step": 27870 + }, + { + "epoch": 0.54, + "learning_rate": 9.196147722418546e-08, + "loss": 0.0009, + "step": 27871 + }, + { + "epoch": 0.54, + "learning_rate": 9.195759387984932e-08, + "loss": 0.0006, + "step": 27872 + }, + { + "epoch": 0.54, + "learning_rate": 9.195371053551318e-08, + "loss": 0.0004, + "step": 27873 + }, + { + "epoch": 0.54, + "learning_rate": 9.194982719117704e-08, + "loss": 0.0006, + "step": 27874 + }, + { + "epoch": 0.54, + "learning_rate": 9.19459438468409e-08, + "loss": 0.0005, + "step": 27875 + }, + { + "epoch": 0.54, + "learning_rate": 9.194206050250475e-08, + "loss": 0.0006, + "step": 27876 + }, + { + "epoch": 0.54, + "learning_rate": 9.193817715816861e-08, + "loss": 0.0014, + "step": 27877 + }, + { + "epoch": 0.54, + "learning_rate": 9.193429381383247e-08, + "loss": 0.0006, + "step": 27878 + }, + { + "epoch": 0.54, + "learning_rate": 9.193041046949633e-08, + "loss": 0.0011, + "step": 27879 + }, + { + "epoch": 0.54, + "learning_rate": 9.192652712516019e-08, + "loss": 0.0004, + "step": 27880 + }, + { + "epoch": 0.54, + "learning_rate": 9.192264378082403e-08, + "loss": 0.0004, + "step": 27881 + }, + { + "epoch": 0.54, + "learning_rate": 9.191876043648789e-08, + "loss": 0.0222, + "step": 27882 + }, + { + "epoch": 0.54, + "learning_rate": 9.191487709215175e-08, + "loss": 0.0005, + "step": 27883 + }, + { + "epoch": 0.54, + "learning_rate": 9.191099374781561e-08, + "loss": 0.0005, + "step": 27884 + }, + { + "epoch": 0.54, + "learning_rate": 9.190711040347946e-08, + "loss": 0.0022, + "step": 27885 + }, + { + "epoch": 0.54, + "learning_rate": 9.190322705914332e-08, + "loss": 0.8288, + "step": 27886 + }, + { + "epoch": 0.54, + "learning_rate": 9.189934371480718e-08, + "loss": 0.0006, + "step": 27887 + }, + { + "epoch": 0.54, + "learning_rate": 9.189546037047104e-08, + "loss": 0.0006, + "step": 27888 + }, + { + "epoch": 0.54, + "learning_rate": 9.18915770261349e-08, + "loss": 0.0004, + "step": 27889 + }, + { + "epoch": 0.54, + "learning_rate": 9.188769368179876e-08, + "loss": 0.0008, + "step": 27890 + }, + { + "epoch": 0.54, + "learning_rate": 9.188381033746261e-08, + "loss": 0.0006, + "step": 27891 + }, + { + "epoch": 0.54, + "learning_rate": 9.187992699312647e-08, + "loss": 0.0007, + "step": 27892 + }, + { + "epoch": 0.54, + "learning_rate": 9.187604364879033e-08, + "loss": 0.0008, + "step": 27893 + }, + { + "epoch": 0.54, + "learning_rate": 9.187216030445419e-08, + "loss": 0.0006, + "step": 27894 + }, + { + "epoch": 0.54, + "learning_rate": 9.186827696011805e-08, + "loss": 0.0007, + "step": 27895 + }, + { + "epoch": 0.54, + "learning_rate": 9.18643936157819e-08, + "loss": 0.0007, + "step": 27896 + }, + { + "epoch": 0.54, + "learning_rate": 9.186051027144576e-08, + "loss": 0.0052, + "step": 27897 + }, + { + "epoch": 0.54, + "learning_rate": 9.185662692710962e-08, + "loss": 0.0006, + "step": 27898 + }, + { + "epoch": 0.54, + "learning_rate": 9.185274358277348e-08, + "loss": 0.0007, + "step": 27899 + }, + { + "epoch": 0.54, + "learning_rate": 9.184886023843734e-08, + "loss": 0.0005, + "step": 27900 + }, + { + "epoch": 0.54, + "learning_rate": 9.18449768941012e-08, + "loss": 0.7979, + "step": 27901 + }, + { + "epoch": 0.54, + "learning_rate": 9.184109354976506e-08, + "loss": 0.0005, + "step": 27902 + }, + { + "epoch": 0.54, + "learning_rate": 9.183721020542891e-08, + "loss": 0.0004, + "step": 27903 + }, + { + "epoch": 0.54, + "learning_rate": 9.183332686109276e-08, + "loss": 0.0008, + "step": 27904 + }, + { + "epoch": 0.54, + "learning_rate": 9.182944351675662e-08, + "loss": 0.1796, + "step": 27905 + }, + { + "epoch": 0.54, + "learning_rate": 9.182556017242047e-08, + "loss": 0.0006, + "step": 27906 + }, + { + "epoch": 0.54, + "learning_rate": 9.182167682808433e-08, + "loss": 0.001, + "step": 27907 + }, + { + "epoch": 0.54, + "learning_rate": 9.181779348374819e-08, + "loss": 0.0008, + "step": 27908 + }, + { + "epoch": 0.54, + "learning_rate": 9.181391013941205e-08, + "loss": 0.0007, + "step": 27909 + }, + { + "epoch": 0.54, + "learning_rate": 9.181002679507591e-08, + "loss": 0.0008, + "step": 27910 + }, + { + "epoch": 0.54, + "learning_rate": 9.180614345073977e-08, + "loss": 0.0006, + "step": 27911 + }, + { + "epoch": 0.54, + "learning_rate": 9.180226010640362e-08, + "loss": 0.0004, + "step": 27912 + }, + { + "epoch": 0.54, + "learning_rate": 9.179837676206748e-08, + "loss": 0.0006, + "step": 27913 + }, + { + "epoch": 0.54, + "learning_rate": 9.179449341773134e-08, + "loss": 0.0007, + "step": 27914 + }, + { + "epoch": 0.54, + "learning_rate": 9.17906100733952e-08, + "loss": 0.0006, + "step": 27915 + }, + { + "epoch": 0.54, + "learning_rate": 9.178672672905906e-08, + "loss": 0.0009, + "step": 27916 + }, + { + "epoch": 0.54, + "learning_rate": 9.178284338472292e-08, + "loss": 0.0003, + "step": 27917 + }, + { + "epoch": 0.54, + "learning_rate": 9.177896004038677e-08, + "loss": 0.0005, + "step": 27918 + }, + { + "epoch": 0.54, + "learning_rate": 9.177507669605063e-08, + "loss": 0.0004, + "step": 27919 + }, + { + "epoch": 0.54, + "learning_rate": 9.177119335171449e-08, + "loss": 0.0005, + "step": 27920 + }, + { + "epoch": 0.54, + "learning_rate": 9.176731000737835e-08, + "loss": 0.0012, + "step": 27921 + }, + { + "epoch": 0.54, + "learning_rate": 9.176342666304221e-08, + "loss": 0.0008, + "step": 27922 + }, + { + "epoch": 0.54, + "learning_rate": 9.175954331870606e-08, + "loss": 0.0005, + "step": 27923 + }, + { + "epoch": 0.54, + "learning_rate": 9.175565997436992e-08, + "loss": 0.0006, + "step": 27924 + }, + { + "epoch": 0.54, + "learning_rate": 9.175177663003378e-08, + "loss": 0.0005, + "step": 27925 + }, + { + "epoch": 0.54, + "learning_rate": 9.174789328569764e-08, + "loss": 0.0012, + "step": 27926 + }, + { + "epoch": 0.54, + "learning_rate": 9.17440099413615e-08, + "loss": 0.0009, + "step": 27927 + }, + { + "epoch": 0.54, + "learning_rate": 9.174012659702536e-08, + "loss": 0.0005, + "step": 27928 + }, + { + "epoch": 0.54, + "learning_rate": 9.173624325268921e-08, + "loss": 0.0005, + "step": 27929 + }, + { + "epoch": 0.54, + "learning_rate": 9.173235990835307e-08, + "loss": 0.0062, + "step": 27930 + }, + { + "epoch": 0.54, + "learning_rate": 9.172847656401693e-08, + "loss": 0.0139, + "step": 27931 + }, + { + "epoch": 0.54, + "learning_rate": 9.172459321968079e-08, + "loss": 0.0006, + "step": 27932 + }, + { + "epoch": 0.54, + "learning_rate": 9.172070987534463e-08, + "loss": 0.0006, + "step": 27933 + }, + { + "epoch": 0.54, + "learning_rate": 9.171682653100849e-08, + "loss": 0.0006, + "step": 27934 + }, + { + "epoch": 0.54, + "learning_rate": 9.171294318667235e-08, + "loss": 0.1003, + "step": 27935 + }, + { + "epoch": 0.54, + "learning_rate": 9.170905984233621e-08, + "loss": 0.0005, + "step": 27936 + }, + { + "epoch": 0.54, + "learning_rate": 9.170517649800007e-08, + "loss": 0.0009, + "step": 27937 + }, + { + "epoch": 0.54, + "learning_rate": 9.170129315366393e-08, + "loss": 0.0004, + "step": 27938 + }, + { + "epoch": 0.54, + "learning_rate": 9.169740980932778e-08, + "loss": 0.0023, + "step": 27939 + }, + { + "epoch": 0.54, + "learning_rate": 9.169352646499164e-08, + "loss": 0.0006, + "step": 27940 + }, + { + "epoch": 0.54, + "learning_rate": 9.16896431206555e-08, + "loss": 0.0005, + "step": 27941 + }, + { + "epoch": 0.54, + "learning_rate": 9.168575977631936e-08, + "loss": 0.0102, + "step": 27942 + }, + { + "epoch": 0.54, + "learning_rate": 9.168187643198322e-08, + "loss": 0.001, + "step": 27943 + }, + { + "epoch": 0.54, + "learning_rate": 9.167799308764707e-08, + "loss": 0.061, + "step": 27944 + }, + { + "epoch": 0.54, + "learning_rate": 9.167410974331093e-08, + "loss": 0.0006, + "step": 27945 + }, + { + "epoch": 0.54, + "learning_rate": 9.167022639897479e-08, + "loss": 0.0005, + "step": 27946 + }, + { + "epoch": 0.54, + "learning_rate": 9.166634305463865e-08, + "loss": 0.0008, + "step": 27947 + }, + { + "epoch": 0.54, + "learning_rate": 9.166245971030251e-08, + "loss": 0.0303, + "step": 27948 + }, + { + "epoch": 0.54, + "learning_rate": 9.165857636596637e-08, + "loss": 0.4272, + "step": 27949 + }, + { + "epoch": 0.54, + "learning_rate": 9.165469302163022e-08, + "loss": 0.0006, + "step": 27950 + }, + { + "epoch": 0.54, + "learning_rate": 9.165080967729408e-08, + "loss": 0.0007, + "step": 27951 + }, + { + "epoch": 0.54, + "learning_rate": 9.164692633295794e-08, + "loss": 0.0005, + "step": 27952 + }, + { + "epoch": 0.54, + "learning_rate": 9.16430429886218e-08, + "loss": 0.0005, + "step": 27953 + }, + { + "epoch": 0.54, + "learning_rate": 9.163915964428566e-08, + "loss": 0.0005, + "step": 27954 + }, + { + "epoch": 0.54, + "learning_rate": 9.163527629994952e-08, + "loss": 0.0007, + "step": 27955 + }, + { + "epoch": 0.54, + "learning_rate": 9.163139295561337e-08, + "loss": 0.0005, + "step": 27956 + }, + { + "epoch": 0.54, + "learning_rate": 9.162750961127723e-08, + "loss": 0.0009, + "step": 27957 + }, + { + "epoch": 0.54, + "learning_rate": 9.162362626694109e-08, + "loss": 0.0016, + "step": 27958 + }, + { + "epoch": 0.54, + "learning_rate": 9.161974292260495e-08, + "loss": 0.0006, + "step": 27959 + }, + { + "epoch": 0.54, + "learning_rate": 9.161585957826881e-08, + "loss": 0.0592, + "step": 27960 + }, + { + "epoch": 0.54, + "learning_rate": 9.161197623393267e-08, + "loss": 0.0008, + "step": 27961 + }, + { + "epoch": 0.54, + "learning_rate": 9.160809288959651e-08, + "loss": 0.0005, + "step": 27962 + }, + { + "epoch": 0.54, + "learning_rate": 9.160420954526037e-08, + "loss": 0.0005, + "step": 27963 + }, + { + "epoch": 0.54, + "learning_rate": 9.160032620092423e-08, + "loss": 0.0004, + "step": 27964 + }, + { + "epoch": 0.54, + "learning_rate": 9.159644285658808e-08, + "loss": 0.0004, + "step": 27965 + }, + { + "epoch": 0.54, + "learning_rate": 9.159255951225194e-08, + "loss": 0.1088, + "step": 27966 + }, + { + "epoch": 0.54, + "learning_rate": 9.15886761679158e-08, + "loss": 0.0006, + "step": 27967 + }, + { + "epoch": 0.54, + "learning_rate": 9.158479282357966e-08, + "loss": 0.0005, + "step": 27968 + }, + { + "epoch": 0.54, + "learning_rate": 9.158090947924352e-08, + "loss": 0.0004, + "step": 27969 + }, + { + "epoch": 0.54, + "learning_rate": 9.157702613490738e-08, + "loss": 0.0014, + "step": 27970 + }, + { + "epoch": 0.54, + "learning_rate": 9.157314279057123e-08, + "loss": 0.0067, + "step": 27971 + }, + { + "epoch": 0.54, + "learning_rate": 9.156925944623509e-08, + "loss": 1.0693, + "step": 27972 + }, + { + "epoch": 0.54, + "learning_rate": 9.156537610189895e-08, + "loss": 0.0007, + "step": 27973 + }, + { + "epoch": 0.54, + "learning_rate": 9.156149275756281e-08, + "loss": 0.016, + "step": 27974 + }, + { + "epoch": 0.54, + "learning_rate": 9.155760941322667e-08, + "loss": 0.0005, + "step": 27975 + }, + { + "epoch": 0.54, + "learning_rate": 9.155372606889053e-08, + "loss": 0.0005, + "step": 27976 + }, + { + "epoch": 0.54, + "learning_rate": 9.154984272455438e-08, + "loss": 0.0004, + "step": 27977 + }, + { + "epoch": 0.54, + "learning_rate": 9.154595938021824e-08, + "loss": 0.0014, + "step": 27978 + }, + { + "epoch": 0.54, + "learning_rate": 9.15420760358821e-08, + "loss": 0.0007, + "step": 27979 + }, + { + "epoch": 0.54, + "learning_rate": 9.153819269154596e-08, + "loss": 0.0005, + "step": 27980 + }, + { + "epoch": 0.54, + "learning_rate": 9.153430934720982e-08, + "loss": 0.0005, + "step": 27981 + }, + { + "epoch": 0.54, + "learning_rate": 9.153042600287367e-08, + "loss": 0.0005, + "step": 27982 + }, + { + "epoch": 0.54, + "learning_rate": 9.152654265853753e-08, + "loss": 0.0009, + "step": 27983 + }, + { + "epoch": 0.54, + "learning_rate": 9.152265931420139e-08, + "loss": 0.0008, + "step": 27984 + }, + { + "epoch": 0.54, + "learning_rate": 9.151877596986525e-08, + "loss": 0.0005, + "step": 27985 + }, + { + "epoch": 0.54, + "learning_rate": 9.151489262552911e-08, + "loss": 0.0008, + "step": 27986 + }, + { + "epoch": 0.54, + "learning_rate": 9.151100928119297e-08, + "loss": 0.0005, + "step": 27987 + }, + { + "epoch": 0.54, + "learning_rate": 9.150712593685682e-08, + "loss": 0.0005, + "step": 27988 + }, + { + "epoch": 0.54, + "learning_rate": 9.150324259252068e-08, + "loss": 0.0252, + "step": 27989 + }, + { + "epoch": 0.54, + "learning_rate": 9.149935924818454e-08, + "loss": 0.0005, + "step": 27990 + }, + { + "epoch": 0.54, + "learning_rate": 9.149547590384839e-08, + "loss": 0.0006, + "step": 27991 + }, + { + "epoch": 0.54, + "learning_rate": 9.149159255951224e-08, + "loss": 0.0039, + "step": 27992 + }, + { + "epoch": 0.54, + "learning_rate": 9.14877092151761e-08, + "loss": 0.0006, + "step": 27993 + }, + { + "epoch": 0.54, + "learning_rate": 9.148382587083996e-08, + "loss": 0.0005, + "step": 27994 + }, + { + "epoch": 0.54, + "learning_rate": 9.147994252650382e-08, + "loss": 0.0008, + "step": 27995 + }, + { + "epoch": 0.54, + "learning_rate": 9.147605918216768e-08, + "loss": 0.0006, + "step": 27996 + }, + { + "epoch": 0.54, + "learning_rate": 9.147217583783154e-08, + "loss": 0.0004, + "step": 27997 + }, + { + "epoch": 0.54, + "learning_rate": 9.14682924934954e-08, + "loss": 0.0006, + "step": 27998 + }, + { + "epoch": 0.54, + "learning_rate": 9.146440914915925e-08, + "loss": 0.0005, + "step": 27999 + }, + { + "epoch": 0.54, + "learning_rate": 9.146052580482311e-08, + "loss": 0.0006, + "step": 28000 + }, + { + "epoch": 0.54, + "learning_rate": 9.145664246048697e-08, + "loss": 0.001, + "step": 28001 + }, + { + "epoch": 0.54, + "learning_rate": 9.145275911615083e-08, + "loss": 0.9619, + "step": 28002 + }, + { + "epoch": 0.54, + "learning_rate": 9.144887577181468e-08, + "loss": 0.0004, + "step": 28003 + }, + { + "epoch": 0.54, + "learning_rate": 9.144499242747854e-08, + "loss": 0.0006, + "step": 28004 + }, + { + "epoch": 0.54, + "learning_rate": 9.14411090831424e-08, + "loss": 0.0005, + "step": 28005 + }, + { + "epoch": 0.54, + "learning_rate": 9.143722573880626e-08, + "loss": 0.0529, + "step": 28006 + }, + { + "epoch": 0.54, + "learning_rate": 9.143334239447012e-08, + "loss": 0.0006, + "step": 28007 + }, + { + "epoch": 0.54, + "learning_rate": 9.142945905013398e-08, + "loss": 0.0007, + "step": 28008 + }, + { + "epoch": 0.54, + "learning_rate": 9.142557570579783e-08, + "loss": 0.0006, + "step": 28009 + }, + { + "epoch": 0.54, + "learning_rate": 9.142169236146169e-08, + "loss": 0.0006, + "step": 28010 + }, + { + "epoch": 0.54, + "learning_rate": 9.141780901712555e-08, + "loss": 0.0013, + "step": 28011 + }, + { + "epoch": 0.54, + "learning_rate": 9.141392567278941e-08, + "loss": 0.001, + "step": 28012 + }, + { + "epoch": 0.54, + "learning_rate": 9.141004232845327e-08, + "loss": 0.0007, + "step": 28013 + }, + { + "epoch": 0.54, + "learning_rate": 9.140615898411713e-08, + "loss": 0.0004, + "step": 28014 + }, + { + "epoch": 0.54, + "learning_rate": 9.140227563978098e-08, + "loss": 0.0005, + "step": 28015 + }, + { + "epoch": 0.54, + "learning_rate": 9.139839229544484e-08, + "loss": 0.6087, + "step": 28016 + }, + { + "epoch": 0.54, + "learning_rate": 9.13945089511087e-08, + "loss": 0.0004, + "step": 28017 + }, + { + "epoch": 0.54, + "learning_rate": 9.139062560677256e-08, + "loss": 0.1117, + "step": 28018 + }, + { + "epoch": 0.54, + "learning_rate": 9.138674226243642e-08, + "loss": 0.0005, + "step": 28019 + }, + { + "epoch": 0.54, + "learning_rate": 9.138285891810026e-08, + "loss": 0.0006, + "step": 28020 + }, + { + "epoch": 0.54, + "learning_rate": 9.137897557376412e-08, + "loss": 0.2101, + "step": 28021 + }, + { + "epoch": 0.54, + "learning_rate": 9.137509222942798e-08, + "loss": 0.0004, + "step": 28022 + }, + { + "epoch": 0.54, + "learning_rate": 9.137120888509184e-08, + "loss": 0.0007, + "step": 28023 + }, + { + "epoch": 0.54, + "learning_rate": 9.13673255407557e-08, + "loss": 0.0009, + "step": 28024 + }, + { + "epoch": 0.54, + "learning_rate": 9.136344219641955e-08, + "loss": 0.0004, + "step": 28025 + }, + { + "epoch": 0.54, + "learning_rate": 9.135955885208341e-08, + "loss": 0.0006, + "step": 28026 + }, + { + "epoch": 0.54, + "learning_rate": 9.135567550774727e-08, + "loss": 0.0013, + "step": 28027 + }, + { + "epoch": 0.54, + "learning_rate": 9.135179216341113e-08, + "loss": 0.0005, + "step": 28028 + }, + { + "epoch": 0.54, + "learning_rate": 9.134790881907499e-08, + "loss": 0.0152, + "step": 28029 + }, + { + "epoch": 0.54, + "learning_rate": 9.134402547473884e-08, + "loss": 0.2702, + "step": 28030 + }, + { + "epoch": 0.54, + "learning_rate": 9.13401421304027e-08, + "loss": 0.0019, + "step": 28031 + }, + { + "epoch": 0.54, + "learning_rate": 9.133625878606656e-08, + "loss": 0.0006, + "step": 28032 + }, + { + "epoch": 0.54, + "learning_rate": 9.133237544173042e-08, + "loss": 0.0006, + "step": 28033 + }, + { + "epoch": 0.54, + "learning_rate": 9.132849209739428e-08, + "loss": 0.0005, + "step": 28034 + }, + { + "epoch": 0.54, + "learning_rate": 9.132460875305814e-08, + "loss": 0.0005, + "step": 28035 + }, + { + "epoch": 0.54, + "learning_rate": 9.1320725408722e-08, + "loss": 0.1963, + "step": 28036 + }, + { + "epoch": 0.54, + "learning_rate": 9.131684206438585e-08, + "loss": 0.0086, + "step": 28037 + }, + { + "epoch": 0.54, + "learning_rate": 9.131295872004971e-08, + "loss": 0.0009, + "step": 28038 + }, + { + "epoch": 0.54, + "learning_rate": 9.130907537571357e-08, + "loss": 0.001, + "step": 28039 + }, + { + "epoch": 0.54, + "learning_rate": 9.130519203137743e-08, + "loss": 0.0019, + "step": 28040 + }, + { + "epoch": 0.54, + "learning_rate": 9.130130868704128e-08, + "loss": 1.0138, + "step": 28041 + }, + { + "epoch": 0.54, + "learning_rate": 9.129742534270514e-08, + "loss": 0.0005, + "step": 28042 + }, + { + "epoch": 0.54, + "learning_rate": 9.129354199836899e-08, + "loss": 0.0006, + "step": 28043 + }, + { + "epoch": 0.54, + "learning_rate": 9.128965865403285e-08, + "loss": 0.0005, + "step": 28044 + }, + { + "epoch": 0.54, + "learning_rate": 9.12857753096967e-08, + "loss": 0.0006, + "step": 28045 + }, + { + "epoch": 0.54, + "learning_rate": 9.128189196536056e-08, + "loss": 0.0004, + "step": 28046 + }, + { + "epoch": 0.54, + "learning_rate": 9.127800862102442e-08, + "loss": 0.0005, + "step": 28047 + }, + { + "epoch": 0.54, + "learning_rate": 9.127412527668828e-08, + "loss": 0.0005, + "step": 28048 + }, + { + "epoch": 0.54, + "learning_rate": 9.127024193235214e-08, + "loss": 0.0012, + "step": 28049 + }, + { + "epoch": 0.54, + "learning_rate": 9.1266358588016e-08, + "loss": 0.0007, + "step": 28050 + }, + { + "epoch": 0.54, + "learning_rate": 9.126247524367985e-08, + "loss": 0.0006, + "step": 28051 + }, + { + "epoch": 0.54, + "learning_rate": 9.125859189934371e-08, + "loss": 0.0192, + "step": 28052 + }, + { + "epoch": 0.54, + "learning_rate": 9.125470855500757e-08, + "loss": 0.0005, + "step": 28053 + }, + { + "epoch": 0.54, + "learning_rate": 9.125082521067143e-08, + "loss": 0.0004, + "step": 28054 + }, + { + "epoch": 0.54, + "learning_rate": 9.124694186633529e-08, + "loss": 0.0003, + "step": 28055 + }, + { + "epoch": 0.54, + "learning_rate": 9.124305852199915e-08, + "loss": 0.0005, + "step": 28056 + }, + { + "epoch": 0.54, + "learning_rate": 9.1239175177663e-08, + "loss": 1.5315, + "step": 28057 + }, + { + "epoch": 0.54, + "learning_rate": 9.123529183332685e-08, + "loss": 0.0502, + "step": 28058 + }, + { + "epoch": 0.54, + "learning_rate": 9.123140848899071e-08, + "loss": 0.4699, + "step": 28059 + }, + { + "epoch": 0.54, + "learning_rate": 9.122752514465457e-08, + "loss": 0.0009, + "step": 28060 + }, + { + "epoch": 0.54, + "learning_rate": 9.122364180031842e-08, + "loss": 0.0407, + "step": 28061 + }, + { + "epoch": 0.54, + "learning_rate": 9.121975845598228e-08, + "loss": 0.0005, + "step": 28062 + }, + { + "epoch": 0.54, + "learning_rate": 9.121587511164614e-08, + "loss": 0.0007, + "step": 28063 + }, + { + "epoch": 0.54, + "learning_rate": 9.121199176731e-08, + "loss": 0.0007, + "step": 28064 + }, + { + "epoch": 0.54, + "learning_rate": 9.120810842297386e-08, + "loss": 0.0043, + "step": 28065 + }, + { + "epoch": 0.54, + "learning_rate": 9.120422507863771e-08, + "loss": 0.0009, + "step": 28066 + }, + { + "epoch": 0.54, + "learning_rate": 9.120034173430157e-08, + "loss": 0.0006, + "step": 28067 + }, + { + "epoch": 0.54, + "learning_rate": 9.119645838996543e-08, + "loss": 0.0587, + "step": 28068 + }, + { + "epoch": 0.54, + "learning_rate": 9.119257504562929e-08, + "loss": 0.0005, + "step": 28069 + }, + { + "epoch": 0.54, + "learning_rate": 9.118869170129315e-08, + "loss": 0.0005, + "step": 28070 + }, + { + "epoch": 0.54, + "learning_rate": 9.1184808356957e-08, + "loss": 0.0008, + "step": 28071 + }, + { + "epoch": 0.54, + "learning_rate": 9.118092501262086e-08, + "loss": 0.0005, + "step": 28072 + }, + { + "epoch": 0.54, + "learning_rate": 9.117704166828472e-08, + "loss": 0.0568, + "step": 28073 + }, + { + "epoch": 0.54, + "learning_rate": 9.117315832394858e-08, + "loss": 0.0006, + "step": 28074 + }, + { + "epoch": 0.54, + "learning_rate": 9.116927497961244e-08, + "loss": 0.7707, + "step": 28075 + }, + { + "epoch": 0.54, + "learning_rate": 9.11653916352763e-08, + "loss": 0.001, + "step": 28076 + }, + { + "epoch": 0.54, + "learning_rate": 9.116150829094016e-08, + "loss": 0.0005, + "step": 28077 + }, + { + "epoch": 0.54, + "learning_rate": 9.1157624946604e-08, + "loss": 0.0027, + "step": 28078 + }, + { + "epoch": 0.54, + "learning_rate": 9.115374160226786e-08, + "loss": 0.0004, + "step": 28079 + }, + { + "epoch": 0.54, + "learning_rate": 9.114985825793172e-08, + "loss": 0.0008, + "step": 28080 + }, + { + "epoch": 0.54, + "learning_rate": 9.114597491359557e-08, + "loss": 0.0057, + "step": 28081 + }, + { + "epoch": 0.54, + "learning_rate": 9.114209156925943e-08, + "loss": 0.0014, + "step": 28082 + }, + { + "epoch": 0.54, + "learning_rate": 9.113820822492329e-08, + "loss": 0.0006, + "step": 28083 + }, + { + "epoch": 0.54, + "learning_rate": 9.113432488058715e-08, + "loss": 0.0007, + "step": 28084 + }, + { + "epoch": 0.54, + "learning_rate": 9.113044153625101e-08, + "loss": 0.0007, + "step": 28085 + }, + { + "epoch": 0.54, + "learning_rate": 9.112655819191487e-08, + "loss": 0.0012, + "step": 28086 + }, + { + "epoch": 0.54, + "learning_rate": 9.112267484757872e-08, + "loss": 0.0005, + "step": 28087 + }, + { + "epoch": 0.54, + "learning_rate": 9.111879150324258e-08, + "loss": 0.5995, + "step": 28088 + }, + { + "epoch": 0.54, + "learning_rate": 9.111490815890644e-08, + "loss": 0.0006, + "step": 28089 + }, + { + "epoch": 0.54, + "learning_rate": 9.11110248145703e-08, + "loss": 0.002, + "step": 28090 + }, + { + "epoch": 0.54, + "learning_rate": 9.110714147023416e-08, + "loss": 0.0006, + "step": 28091 + }, + { + "epoch": 0.54, + "learning_rate": 9.110325812589802e-08, + "loss": 0.0005, + "step": 28092 + }, + { + "epoch": 0.54, + "learning_rate": 9.109937478156187e-08, + "loss": 0.0008, + "step": 28093 + }, + { + "epoch": 0.54, + "learning_rate": 9.109549143722573e-08, + "loss": 0.0004, + "step": 28094 + }, + { + "epoch": 0.54, + "learning_rate": 9.109160809288959e-08, + "loss": 0.0008, + "step": 28095 + }, + { + "epoch": 0.55, + "learning_rate": 9.108772474855345e-08, + "loss": 0.0091, + "step": 28096 + }, + { + "epoch": 0.55, + "learning_rate": 9.108384140421731e-08, + "loss": 0.9812, + "step": 28097 + }, + { + "epoch": 0.55, + "learning_rate": 9.107995805988117e-08, + "loss": 0.0008, + "step": 28098 + }, + { + "epoch": 0.55, + "learning_rate": 9.107607471554502e-08, + "loss": 0.0007, + "step": 28099 + }, + { + "epoch": 0.55, + "learning_rate": 9.107219137120888e-08, + "loss": 0.0004, + "step": 28100 + }, + { + "epoch": 0.55, + "learning_rate": 9.106830802687274e-08, + "loss": 0.0006, + "step": 28101 + }, + { + "epoch": 0.55, + "learning_rate": 9.10644246825366e-08, + "loss": 0.0006, + "step": 28102 + }, + { + "epoch": 0.55, + "learning_rate": 9.106054133820046e-08, + "loss": 0.0007, + "step": 28103 + }, + { + "epoch": 0.55, + "learning_rate": 9.105665799386431e-08, + "loss": 0.0006, + "step": 28104 + }, + { + "epoch": 0.55, + "learning_rate": 9.105277464952817e-08, + "loss": 0.0005, + "step": 28105 + }, + { + "epoch": 0.55, + "learning_rate": 9.104889130519203e-08, + "loss": 0.0007, + "step": 28106 + }, + { + "epoch": 0.55, + "learning_rate": 9.104500796085588e-08, + "loss": 0.0006, + "step": 28107 + }, + { + "epoch": 0.55, + "learning_rate": 9.104112461651973e-08, + "loss": 0.0005, + "step": 28108 + }, + { + "epoch": 0.55, + "learning_rate": 9.103724127218359e-08, + "loss": 0.0007, + "step": 28109 + }, + { + "epoch": 0.55, + "learning_rate": 9.103335792784745e-08, + "loss": 0.0005, + "step": 28110 + }, + { + "epoch": 0.55, + "learning_rate": 9.102947458351131e-08, + "loss": 0.0006, + "step": 28111 + }, + { + "epoch": 0.55, + "learning_rate": 9.102559123917517e-08, + "loss": 0.0004, + "step": 28112 + }, + { + "epoch": 0.55, + "learning_rate": 9.102170789483903e-08, + "loss": 0.361, + "step": 28113 + }, + { + "epoch": 0.55, + "learning_rate": 9.101782455050288e-08, + "loss": 0.0005, + "step": 28114 + }, + { + "epoch": 0.55, + "learning_rate": 9.101394120616674e-08, + "loss": 0.0004, + "step": 28115 + }, + { + "epoch": 0.55, + "learning_rate": 9.10100578618306e-08, + "loss": 0.0005, + "step": 28116 + }, + { + "epoch": 0.55, + "learning_rate": 9.100617451749446e-08, + "loss": 0.0006, + "step": 28117 + }, + { + "epoch": 0.55, + "learning_rate": 9.100229117315832e-08, + "loss": 0.0005, + "step": 28118 + }, + { + "epoch": 0.55, + "learning_rate": 9.099840782882217e-08, + "loss": 0.0007, + "step": 28119 + }, + { + "epoch": 0.55, + "learning_rate": 9.099452448448603e-08, + "loss": 0.0005, + "step": 28120 + }, + { + "epoch": 0.55, + "learning_rate": 9.099064114014989e-08, + "loss": 0.0005, + "step": 28121 + }, + { + "epoch": 0.55, + "learning_rate": 9.098675779581375e-08, + "loss": 1.1157, + "step": 28122 + }, + { + "epoch": 0.55, + "learning_rate": 9.098287445147761e-08, + "loss": 0.0005, + "step": 28123 + }, + { + "epoch": 0.55, + "learning_rate": 9.097899110714147e-08, + "loss": 0.0004, + "step": 28124 + }, + { + "epoch": 0.55, + "learning_rate": 9.097510776280532e-08, + "loss": 0.0004, + "step": 28125 + }, + { + "epoch": 0.55, + "learning_rate": 9.097122441846918e-08, + "loss": 0.0004, + "step": 28126 + }, + { + "epoch": 0.55, + "learning_rate": 9.096734107413304e-08, + "loss": 0.0709, + "step": 28127 + }, + { + "epoch": 0.55, + "learning_rate": 9.09634577297969e-08, + "loss": 0.0005, + "step": 28128 + }, + { + "epoch": 0.55, + "learning_rate": 9.095957438546076e-08, + "loss": 0.0006, + "step": 28129 + }, + { + "epoch": 0.55, + "learning_rate": 9.095569104112462e-08, + "loss": 0.0006, + "step": 28130 + }, + { + "epoch": 0.55, + "learning_rate": 9.095180769678847e-08, + "loss": 0.0006, + "step": 28131 + }, + { + "epoch": 0.55, + "learning_rate": 9.094792435245233e-08, + "loss": 0.0363, + "step": 28132 + }, + { + "epoch": 0.55, + "learning_rate": 9.094404100811619e-08, + "loss": 0.0006, + "step": 28133 + }, + { + "epoch": 0.55, + "learning_rate": 9.094015766378005e-08, + "loss": 0.0004, + "step": 28134 + }, + { + "epoch": 0.55, + "learning_rate": 9.093627431944391e-08, + "loss": 0.0005, + "step": 28135 + }, + { + "epoch": 0.55, + "learning_rate": 9.093239097510775e-08, + "loss": 0.7499, + "step": 28136 + }, + { + "epoch": 0.55, + "learning_rate": 9.092850763077161e-08, + "loss": 0.3827, + "step": 28137 + }, + { + "epoch": 0.55, + "learning_rate": 9.092462428643547e-08, + "loss": 0.0004, + "step": 28138 + }, + { + "epoch": 0.55, + "learning_rate": 9.092074094209933e-08, + "loss": 0.0005, + "step": 28139 + }, + { + "epoch": 0.55, + "learning_rate": 9.091685759776318e-08, + "loss": 0.0007, + "step": 28140 + }, + { + "epoch": 0.55, + "learning_rate": 9.091297425342704e-08, + "loss": 0.0005, + "step": 28141 + }, + { + "epoch": 0.55, + "learning_rate": 9.09090909090909e-08, + "loss": 0.5734, + "step": 28142 + }, + { + "epoch": 0.55, + "learning_rate": 9.090520756475476e-08, + "loss": 0.0006, + "step": 28143 + }, + { + "epoch": 0.55, + "learning_rate": 9.090132422041862e-08, + "loss": 0.0007, + "step": 28144 + }, + { + "epoch": 0.55, + "learning_rate": 9.089744087608248e-08, + "loss": 0.0005, + "step": 28145 + }, + { + "epoch": 0.55, + "learning_rate": 9.089355753174633e-08, + "loss": 0.0005, + "step": 28146 + }, + { + "epoch": 0.55, + "learning_rate": 9.088967418741019e-08, + "loss": 0.0006, + "step": 28147 + }, + { + "epoch": 0.55, + "learning_rate": 9.088579084307405e-08, + "loss": 0.0007, + "step": 28148 + }, + { + "epoch": 0.55, + "learning_rate": 9.088190749873791e-08, + "loss": 0.6499, + "step": 28149 + }, + { + "epoch": 0.55, + "learning_rate": 9.087802415440177e-08, + "loss": 0.0009, + "step": 28150 + }, + { + "epoch": 0.55, + "learning_rate": 9.087414081006563e-08, + "loss": 0.0006, + "step": 28151 + }, + { + "epoch": 0.55, + "learning_rate": 9.087025746572948e-08, + "loss": 0.0004, + "step": 28152 + }, + { + "epoch": 0.55, + "learning_rate": 9.086637412139334e-08, + "loss": 0.0006, + "step": 28153 + }, + { + "epoch": 0.55, + "learning_rate": 9.08624907770572e-08, + "loss": 0.6949, + "step": 28154 + }, + { + "epoch": 0.55, + "learning_rate": 9.085860743272106e-08, + "loss": 0.0007, + "step": 28155 + }, + { + "epoch": 0.55, + "learning_rate": 9.085472408838492e-08, + "loss": 0.0461, + "step": 28156 + }, + { + "epoch": 0.55, + "learning_rate": 9.085084074404878e-08, + "loss": 2.3416, + "step": 28157 + }, + { + "epoch": 0.55, + "learning_rate": 9.084695739971263e-08, + "loss": 0.0005, + "step": 28158 + }, + { + "epoch": 0.55, + "learning_rate": 9.084307405537649e-08, + "loss": 0.0004, + "step": 28159 + }, + { + "epoch": 0.55, + "learning_rate": 9.083919071104035e-08, + "loss": 0.0007, + "step": 28160 + }, + { + "epoch": 0.55, + "learning_rate": 9.083530736670421e-08, + "loss": 0.0006, + "step": 28161 + }, + { + "epoch": 0.55, + "learning_rate": 9.083142402236807e-08, + "loss": 0.0033, + "step": 28162 + }, + { + "epoch": 0.55, + "learning_rate": 9.082754067803192e-08, + "loss": 0.0472, + "step": 28163 + }, + { + "epoch": 0.55, + "learning_rate": 9.082365733369578e-08, + "loss": 0.0006, + "step": 28164 + }, + { + "epoch": 0.55, + "learning_rate": 9.081977398935963e-08, + "loss": 0.0006, + "step": 28165 + }, + { + "epoch": 0.55, + "learning_rate": 9.081589064502349e-08, + "loss": 0.0005, + "step": 28166 + }, + { + "epoch": 0.55, + "learning_rate": 9.081200730068734e-08, + "loss": 0.0008, + "step": 28167 + }, + { + "epoch": 0.55, + "learning_rate": 9.08081239563512e-08, + "loss": 0.0005, + "step": 28168 + }, + { + "epoch": 0.55, + "learning_rate": 9.080424061201506e-08, + "loss": 0.0006, + "step": 28169 + }, + { + "epoch": 0.55, + "learning_rate": 9.080035726767892e-08, + "loss": 0.0009, + "step": 28170 + }, + { + "epoch": 0.55, + "learning_rate": 9.079647392334278e-08, + "loss": 0.0006, + "step": 28171 + }, + { + "epoch": 0.55, + "learning_rate": 9.079259057900664e-08, + "loss": 0.0007, + "step": 28172 + }, + { + "epoch": 0.55, + "learning_rate": 9.07887072346705e-08, + "loss": 0.0009, + "step": 28173 + }, + { + "epoch": 0.55, + "learning_rate": 9.078482389033435e-08, + "loss": 0.0004, + "step": 28174 + }, + { + "epoch": 0.55, + "learning_rate": 9.078094054599821e-08, + "loss": 0.0009, + "step": 28175 + }, + { + "epoch": 0.55, + "learning_rate": 9.077705720166207e-08, + "loss": 0.0007, + "step": 28176 + }, + { + "epoch": 0.55, + "learning_rate": 9.077317385732593e-08, + "loss": 0.0004, + "step": 28177 + }, + { + "epoch": 0.55, + "learning_rate": 9.076929051298978e-08, + "loss": 0.0006, + "step": 28178 + }, + { + "epoch": 0.55, + "learning_rate": 9.076540716865364e-08, + "loss": 1.1835, + "step": 28179 + }, + { + "epoch": 0.55, + "learning_rate": 9.07615238243175e-08, + "loss": 0.0004, + "step": 28180 + }, + { + "epoch": 0.55, + "learning_rate": 9.075764047998136e-08, + "loss": 0.0008, + "step": 28181 + }, + { + "epoch": 0.55, + "learning_rate": 9.075375713564522e-08, + "loss": 0.0006, + "step": 28182 + }, + { + "epoch": 0.55, + "learning_rate": 9.074987379130908e-08, + "loss": 0.0008, + "step": 28183 + }, + { + "epoch": 0.55, + "learning_rate": 9.074599044697293e-08, + "loss": 0.0005, + "step": 28184 + }, + { + "epoch": 0.55, + "learning_rate": 9.074210710263679e-08, + "loss": 0.0005, + "step": 28185 + }, + { + "epoch": 0.55, + "learning_rate": 9.073822375830065e-08, + "loss": 0.0005, + "step": 28186 + }, + { + "epoch": 0.55, + "learning_rate": 9.073434041396451e-08, + "loss": 0.0009, + "step": 28187 + }, + { + "epoch": 0.55, + "learning_rate": 9.073045706962837e-08, + "loss": 0.001, + "step": 28188 + }, + { + "epoch": 0.55, + "learning_rate": 9.072657372529223e-08, + "loss": 0.0005, + "step": 28189 + }, + { + "epoch": 0.55, + "learning_rate": 9.072269038095608e-08, + "loss": 0.0004, + "step": 28190 + }, + { + "epoch": 0.55, + "learning_rate": 9.071880703661994e-08, + "loss": 0.0003, + "step": 28191 + }, + { + "epoch": 0.55, + "learning_rate": 9.07149236922838e-08, + "loss": 0.0008, + "step": 28192 + }, + { + "epoch": 0.55, + "learning_rate": 9.071104034794766e-08, + "loss": 0.6472, + "step": 28193 + }, + { + "epoch": 0.55, + "learning_rate": 9.07071570036115e-08, + "loss": 0.0019, + "step": 28194 + }, + { + "epoch": 0.55, + "learning_rate": 9.070327365927536e-08, + "loss": 0.0005, + "step": 28195 + }, + { + "epoch": 0.55, + "learning_rate": 9.069939031493922e-08, + "loss": 0.0005, + "step": 28196 + }, + { + "epoch": 0.55, + "learning_rate": 9.069550697060308e-08, + "loss": 0.0006, + "step": 28197 + }, + { + "epoch": 0.55, + "learning_rate": 9.069162362626694e-08, + "loss": 0.0009, + "step": 28198 + }, + { + "epoch": 0.55, + "learning_rate": 9.06877402819308e-08, + "loss": 0.0005, + "step": 28199 + }, + { + "epoch": 0.55, + "learning_rate": 9.068385693759465e-08, + "loss": 0.0004, + "step": 28200 + }, + { + "epoch": 0.55, + "learning_rate": 9.067997359325851e-08, + "loss": 0.0007, + "step": 28201 + }, + { + "epoch": 0.55, + "learning_rate": 9.067609024892237e-08, + "loss": 0.0007, + "step": 28202 + }, + { + "epoch": 0.55, + "learning_rate": 9.067220690458623e-08, + "loss": 0.0004, + "step": 28203 + }, + { + "epoch": 0.55, + "learning_rate": 9.066832356025009e-08, + "loss": 0.0005, + "step": 28204 + }, + { + "epoch": 0.55, + "learning_rate": 9.066444021591394e-08, + "loss": 0.0006, + "step": 28205 + }, + { + "epoch": 0.55, + "learning_rate": 9.06605568715778e-08, + "loss": 0.0005, + "step": 28206 + }, + { + "epoch": 0.55, + "learning_rate": 9.065667352724166e-08, + "loss": 0.0006, + "step": 28207 + }, + { + "epoch": 0.55, + "learning_rate": 9.065279018290552e-08, + "loss": 0.008, + "step": 28208 + }, + { + "epoch": 0.55, + "learning_rate": 9.064890683856938e-08, + "loss": 0.0006, + "step": 28209 + }, + { + "epoch": 0.55, + "learning_rate": 9.064502349423324e-08, + "loss": 0.0007, + "step": 28210 + }, + { + "epoch": 0.55, + "learning_rate": 9.06411401498971e-08, + "loss": 0.0006, + "step": 28211 + }, + { + "epoch": 0.55, + "learning_rate": 9.063725680556095e-08, + "loss": 0.0006, + "step": 28212 + }, + { + "epoch": 0.55, + "learning_rate": 9.063337346122481e-08, + "loss": 0.0006, + "step": 28213 + }, + { + "epoch": 0.55, + "learning_rate": 9.062949011688867e-08, + "loss": 0.0073, + "step": 28214 + }, + { + "epoch": 0.55, + "learning_rate": 9.062560677255253e-08, + "loss": 0.0007, + "step": 28215 + }, + { + "epoch": 0.55, + "learning_rate": 9.062172342821638e-08, + "loss": 0.0005, + "step": 28216 + }, + { + "epoch": 0.55, + "learning_rate": 9.061784008388024e-08, + "loss": 0.0005, + "step": 28217 + }, + { + "epoch": 0.55, + "learning_rate": 9.06139567395441e-08, + "loss": 0.0005, + "step": 28218 + }, + { + "epoch": 0.55, + "learning_rate": 9.061007339520796e-08, + "loss": 0.0006, + "step": 28219 + }, + { + "epoch": 0.55, + "learning_rate": 9.06061900508718e-08, + "loss": 0.0005, + "step": 28220 + }, + { + "epoch": 0.55, + "learning_rate": 9.060230670653566e-08, + "loss": 0.0005, + "step": 28221 + }, + { + "epoch": 0.55, + "learning_rate": 9.059842336219952e-08, + "loss": 0.0005, + "step": 28222 + }, + { + "epoch": 0.55, + "learning_rate": 9.059454001786338e-08, + "loss": 0.0006, + "step": 28223 + }, + { + "epoch": 0.55, + "learning_rate": 9.059065667352724e-08, + "loss": 0.063, + "step": 28224 + }, + { + "epoch": 0.55, + "learning_rate": 9.05867733291911e-08, + "loss": 0.0003, + "step": 28225 + }, + { + "epoch": 0.55, + "learning_rate": 9.058288998485495e-08, + "loss": 0.0021, + "step": 28226 + }, + { + "epoch": 0.55, + "learning_rate": 9.057900664051881e-08, + "loss": 0.0005, + "step": 28227 + }, + { + "epoch": 0.55, + "learning_rate": 9.057512329618267e-08, + "loss": 0.0006, + "step": 28228 + }, + { + "epoch": 0.55, + "learning_rate": 9.057123995184653e-08, + "loss": 0.0005, + "step": 28229 + }, + { + "epoch": 0.55, + "learning_rate": 9.056735660751039e-08, + "loss": 0.162, + "step": 28230 + }, + { + "epoch": 0.55, + "learning_rate": 9.056347326317425e-08, + "loss": 0.0005, + "step": 28231 + }, + { + "epoch": 0.55, + "learning_rate": 9.05595899188381e-08, + "loss": 0.0005, + "step": 28232 + }, + { + "epoch": 0.55, + "learning_rate": 9.055570657450196e-08, + "loss": 0.0006, + "step": 28233 + }, + { + "epoch": 0.55, + "learning_rate": 9.055182323016582e-08, + "loss": 0.0005, + "step": 28234 + }, + { + "epoch": 0.55, + "learning_rate": 9.054793988582967e-08, + "loss": 1.1092, + "step": 28235 + }, + { + "epoch": 0.55, + "learning_rate": 9.054405654149352e-08, + "loss": 0.0005, + "step": 28236 + }, + { + "epoch": 0.55, + "learning_rate": 9.054017319715738e-08, + "loss": 0.0004, + "step": 28237 + }, + { + "epoch": 0.55, + "learning_rate": 9.053628985282124e-08, + "loss": 0.0006, + "step": 28238 + }, + { + "epoch": 0.55, + "learning_rate": 9.05324065084851e-08, + "loss": 0.6521, + "step": 28239 + }, + { + "epoch": 0.55, + "learning_rate": 9.052852316414896e-08, + "loss": 0.0005, + "step": 28240 + }, + { + "epoch": 0.55, + "learning_rate": 9.052463981981281e-08, + "loss": 0.0005, + "step": 28241 + }, + { + "epoch": 0.55, + "learning_rate": 9.052075647547667e-08, + "loss": 0.0005, + "step": 28242 + }, + { + "epoch": 0.55, + "learning_rate": 9.051687313114053e-08, + "loss": 0.0007, + "step": 28243 + }, + { + "epoch": 0.55, + "learning_rate": 9.051298978680439e-08, + "loss": 0.5396, + "step": 28244 + }, + { + "epoch": 0.55, + "learning_rate": 9.050910644246825e-08, + "loss": 1.2053, + "step": 28245 + }, + { + "epoch": 0.55, + "learning_rate": 9.05052230981321e-08, + "loss": 0.0005, + "step": 28246 + }, + { + "epoch": 0.55, + "learning_rate": 9.050133975379596e-08, + "loss": 0.0005, + "step": 28247 + }, + { + "epoch": 0.55, + "learning_rate": 9.049745640945982e-08, + "loss": 0.0006, + "step": 28248 + }, + { + "epoch": 0.55, + "learning_rate": 9.049357306512368e-08, + "loss": 0.4797, + "step": 28249 + }, + { + "epoch": 0.55, + "learning_rate": 9.048968972078754e-08, + "loss": 0.0004, + "step": 28250 + }, + { + "epoch": 0.55, + "learning_rate": 9.04858063764514e-08, + "loss": 0.0009, + "step": 28251 + }, + { + "epoch": 0.55, + "learning_rate": 9.048192303211524e-08, + "loss": 0.0005, + "step": 28252 + }, + { + "epoch": 0.55, + "learning_rate": 9.04780396877791e-08, + "loss": 0.0012, + "step": 28253 + }, + { + "epoch": 0.55, + "learning_rate": 9.047415634344296e-08, + "loss": 0.1643, + "step": 28254 + }, + { + "epoch": 0.55, + "learning_rate": 9.047027299910682e-08, + "loss": 0.0013, + "step": 28255 + }, + { + "epoch": 0.55, + "learning_rate": 9.046638965477068e-08, + "loss": 0.9845, + "step": 28256 + }, + { + "epoch": 0.55, + "learning_rate": 9.046250631043453e-08, + "loss": 1.0205, + "step": 28257 + }, + { + "epoch": 0.55, + "learning_rate": 9.045862296609839e-08, + "loss": 0.0006, + "step": 28258 + }, + { + "epoch": 0.55, + "learning_rate": 9.045473962176225e-08, + "loss": 0.0008, + "step": 28259 + }, + { + "epoch": 0.55, + "learning_rate": 9.045085627742611e-08, + "loss": 0.0007, + "step": 28260 + }, + { + "epoch": 0.55, + "learning_rate": 9.044697293308997e-08, + "loss": 0.0006, + "step": 28261 + }, + { + "epoch": 0.55, + "learning_rate": 9.044308958875382e-08, + "loss": 0.6519, + "step": 28262 + }, + { + "epoch": 0.55, + "learning_rate": 9.043920624441768e-08, + "loss": 0.0006, + "step": 28263 + }, + { + "epoch": 0.55, + "learning_rate": 9.043532290008154e-08, + "loss": 0.0004, + "step": 28264 + }, + { + "epoch": 0.55, + "learning_rate": 9.04314395557454e-08, + "loss": 0.0039, + "step": 28265 + }, + { + "epoch": 0.55, + "learning_rate": 9.042755621140926e-08, + "loss": 0.0005, + "step": 28266 + }, + { + "epoch": 0.55, + "learning_rate": 9.042367286707312e-08, + "loss": 0.0007, + "step": 28267 + }, + { + "epoch": 0.55, + "learning_rate": 9.041978952273697e-08, + "loss": 0.0005, + "step": 28268 + }, + { + "epoch": 0.55, + "learning_rate": 9.041590617840083e-08, + "loss": 0.0004, + "step": 28269 + }, + { + "epoch": 0.55, + "learning_rate": 9.041202283406469e-08, + "loss": 0.3315, + "step": 28270 + }, + { + "epoch": 0.55, + "learning_rate": 9.040813948972855e-08, + "loss": 0.0005, + "step": 28271 + }, + { + "epoch": 0.55, + "learning_rate": 9.040425614539241e-08, + "loss": 0.1299, + "step": 28272 + }, + { + "epoch": 0.55, + "learning_rate": 9.040037280105627e-08, + "loss": 0.0987, + "step": 28273 + }, + { + "epoch": 0.55, + "learning_rate": 9.039648945672012e-08, + "loss": 0.0004, + "step": 28274 + }, + { + "epoch": 0.55, + "learning_rate": 9.039260611238398e-08, + "loss": 0.0025, + "step": 28275 + }, + { + "epoch": 0.55, + "learning_rate": 9.038872276804784e-08, + "loss": 0.0026, + "step": 28276 + }, + { + "epoch": 0.55, + "learning_rate": 9.03848394237117e-08, + "loss": 0.0176, + "step": 28277 + }, + { + "epoch": 0.55, + "learning_rate": 9.038095607937556e-08, + "loss": 0.0005, + "step": 28278 + }, + { + "epoch": 0.55, + "learning_rate": 9.037707273503941e-08, + "loss": 0.0004, + "step": 28279 + }, + { + "epoch": 0.55, + "learning_rate": 9.037318939070327e-08, + "loss": 0.0007, + "step": 28280 + }, + { + "epoch": 0.55, + "learning_rate": 9.036930604636712e-08, + "loss": 0.0005, + "step": 28281 + }, + { + "epoch": 0.55, + "learning_rate": 9.036542270203098e-08, + "loss": 0.0012, + "step": 28282 + }, + { + "epoch": 0.55, + "learning_rate": 9.036153935769483e-08, + "loss": 0.0111, + "step": 28283 + }, + { + "epoch": 0.55, + "learning_rate": 9.035765601335869e-08, + "loss": 0.0007, + "step": 28284 + }, + { + "epoch": 0.55, + "learning_rate": 9.035377266902255e-08, + "loss": 0.0004, + "step": 28285 + }, + { + "epoch": 0.55, + "learning_rate": 9.034988932468641e-08, + "loss": 0.0006, + "step": 28286 + }, + { + "epoch": 0.55, + "learning_rate": 9.034600598035027e-08, + "loss": 0.6095, + "step": 28287 + }, + { + "epoch": 0.55, + "learning_rate": 9.034212263601413e-08, + "loss": 0.0005, + "step": 28288 + }, + { + "epoch": 0.55, + "learning_rate": 9.033823929167798e-08, + "loss": 0.0004, + "step": 28289 + }, + { + "epoch": 0.55, + "learning_rate": 9.033435594734184e-08, + "loss": 0.0005, + "step": 28290 + }, + { + "epoch": 0.55, + "learning_rate": 9.03304726030057e-08, + "loss": 0.0006, + "step": 28291 + }, + { + "epoch": 0.55, + "learning_rate": 9.032658925866956e-08, + "loss": 0.1644, + "step": 28292 + }, + { + "epoch": 0.55, + "learning_rate": 9.032270591433342e-08, + "loss": 0.3665, + "step": 28293 + }, + { + "epoch": 0.55, + "learning_rate": 9.031882256999728e-08, + "loss": 0.0009, + "step": 28294 + }, + { + "epoch": 0.55, + "learning_rate": 9.031493922566113e-08, + "loss": 0.0006, + "step": 28295 + }, + { + "epoch": 0.55, + "learning_rate": 9.031105588132499e-08, + "loss": 0.0004, + "step": 28296 + }, + { + "epoch": 0.55, + "learning_rate": 9.030717253698885e-08, + "loss": 0.0006, + "step": 28297 + }, + { + "epoch": 0.55, + "learning_rate": 9.030328919265271e-08, + "loss": 0.0004, + "step": 28298 + }, + { + "epoch": 0.55, + "learning_rate": 9.029940584831657e-08, + "loss": 0.7663, + "step": 28299 + }, + { + "epoch": 0.55, + "learning_rate": 9.029552250398042e-08, + "loss": 0.0005, + "step": 28300 + }, + { + "epoch": 0.55, + "learning_rate": 9.029163915964428e-08, + "loss": 0.0007, + "step": 28301 + }, + { + "epoch": 0.55, + "learning_rate": 9.028775581530814e-08, + "loss": 0.0007, + "step": 28302 + }, + { + "epoch": 0.55, + "learning_rate": 9.0283872470972e-08, + "loss": 0.0007, + "step": 28303 + }, + { + "epoch": 0.55, + "learning_rate": 9.027998912663586e-08, + "loss": 0.3259, + "step": 28304 + }, + { + "epoch": 0.55, + "learning_rate": 9.027610578229972e-08, + "loss": 0.0007, + "step": 28305 + }, + { + "epoch": 0.55, + "learning_rate": 9.027222243796357e-08, + "loss": 0.0026, + "step": 28306 + }, + { + "epoch": 0.55, + "learning_rate": 9.026833909362743e-08, + "loss": 0.0012, + "step": 28307 + }, + { + "epoch": 0.55, + "learning_rate": 9.026445574929129e-08, + "loss": 0.0005, + "step": 28308 + }, + { + "epoch": 0.55, + "learning_rate": 9.026057240495515e-08, + "loss": 0.0007, + "step": 28309 + }, + { + "epoch": 0.55, + "learning_rate": 9.0256689060619e-08, + "loss": 0.0004, + "step": 28310 + }, + { + "epoch": 0.55, + "learning_rate": 9.025280571628285e-08, + "loss": 0.3409, + "step": 28311 + }, + { + "epoch": 0.55, + "learning_rate": 9.024892237194671e-08, + "loss": 0.0006, + "step": 28312 + }, + { + "epoch": 0.55, + "learning_rate": 9.024503902761057e-08, + "loss": 0.0004, + "step": 28313 + }, + { + "epoch": 0.55, + "learning_rate": 9.024115568327443e-08, + "loss": 0.0008, + "step": 28314 + }, + { + "epoch": 0.55, + "learning_rate": 9.023727233893828e-08, + "loss": 0.0004, + "step": 28315 + }, + { + "epoch": 0.55, + "learning_rate": 9.023338899460214e-08, + "loss": 0.037, + "step": 28316 + }, + { + "epoch": 0.55, + "learning_rate": 9.0229505650266e-08, + "loss": 0.0006, + "step": 28317 + }, + { + "epoch": 0.55, + "learning_rate": 9.022562230592986e-08, + "loss": 1.266, + "step": 28318 + }, + { + "epoch": 0.55, + "learning_rate": 9.022173896159372e-08, + "loss": 0.0004, + "step": 28319 + }, + { + "epoch": 0.55, + "learning_rate": 9.021785561725758e-08, + "loss": 0.0005, + "step": 28320 + }, + { + "epoch": 0.55, + "learning_rate": 9.021397227292143e-08, + "loss": 0.0875, + "step": 28321 + }, + { + "epoch": 0.55, + "learning_rate": 9.021008892858529e-08, + "loss": 0.001, + "step": 28322 + }, + { + "epoch": 0.55, + "learning_rate": 9.020620558424915e-08, + "loss": 0.0004, + "step": 28323 + }, + { + "epoch": 0.55, + "learning_rate": 9.020232223991301e-08, + "loss": 0.0004, + "step": 28324 + }, + { + "epoch": 0.55, + "learning_rate": 9.019843889557687e-08, + "loss": 0.0045, + "step": 28325 + }, + { + "epoch": 0.55, + "learning_rate": 9.019455555124073e-08, + "loss": 0.0004, + "step": 28326 + }, + { + "epoch": 0.55, + "learning_rate": 9.019067220690458e-08, + "loss": 0.0006, + "step": 28327 + }, + { + "epoch": 0.55, + "learning_rate": 9.018678886256844e-08, + "loss": 0.0005, + "step": 28328 + }, + { + "epoch": 0.55, + "learning_rate": 9.01829055182323e-08, + "loss": 0.0006, + "step": 28329 + }, + { + "epoch": 0.55, + "learning_rate": 9.017902217389616e-08, + "loss": 0.0006, + "step": 28330 + }, + { + "epoch": 0.55, + "learning_rate": 9.017513882956002e-08, + "loss": 0.677, + "step": 28331 + }, + { + "epoch": 0.55, + "learning_rate": 9.017125548522388e-08, + "loss": 0.0005, + "step": 28332 + }, + { + "epoch": 0.55, + "learning_rate": 9.016737214088773e-08, + "loss": 0.0004, + "step": 28333 + }, + { + "epoch": 0.55, + "learning_rate": 9.016348879655159e-08, + "loss": 0.0005, + "step": 28334 + }, + { + "epoch": 0.55, + "learning_rate": 9.015960545221545e-08, + "loss": 0.0005, + "step": 28335 + }, + { + "epoch": 0.55, + "learning_rate": 9.015572210787931e-08, + "loss": 0.0005, + "step": 28336 + }, + { + "epoch": 0.55, + "learning_rate": 9.015183876354317e-08, + "loss": 0.0003, + "step": 28337 + }, + { + "epoch": 0.55, + "learning_rate": 9.014795541920702e-08, + "loss": 1.2346, + "step": 28338 + }, + { + "epoch": 0.55, + "learning_rate": 9.014407207487087e-08, + "loss": 0.2689, + "step": 28339 + }, + { + "epoch": 0.55, + "learning_rate": 9.014018873053473e-08, + "loss": 0.0005, + "step": 28340 + }, + { + "epoch": 0.55, + "learning_rate": 9.013630538619859e-08, + "loss": 0.0006, + "step": 28341 + }, + { + "epoch": 0.55, + "learning_rate": 9.013242204186244e-08, + "loss": 0.0004, + "step": 28342 + }, + { + "epoch": 0.55, + "learning_rate": 9.01285386975263e-08, + "loss": 0.0004, + "step": 28343 + }, + { + "epoch": 0.55, + "learning_rate": 9.012465535319016e-08, + "loss": 0.0004, + "step": 28344 + }, + { + "epoch": 0.55, + "learning_rate": 9.012077200885402e-08, + "loss": 0.0006, + "step": 28345 + }, + { + "epoch": 0.55, + "learning_rate": 9.011688866451788e-08, + "loss": 0.0005, + "step": 28346 + }, + { + "epoch": 0.55, + "learning_rate": 9.011300532018174e-08, + "loss": 0.0006, + "step": 28347 + }, + { + "epoch": 0.55, + "learning_rate": 9.01091219758456e-08, + "loss": 0.0007, + "step": 28348 + }, + { + "epoch": 0.55, + "learning_rate": 9.010523863150945e-08, + "loss": 0.0005, + "step": 28349 + }, + { + "epoch": 0.55, + "learning_rate": 9.010135528717331e-08, + "loss": 0.0005, + "step": 28350 + }, + { + "epoch": 0.55, + "learning_rate": 9.009747194283717e-08, + "loss": 0.046, + "step": 28351 + }, + { + "epoch": 0.55, + "learning_rate": 9.009358859850103e-08, + "loss": 0.0005, + "step": 28352 + }, + { + "epoch": 0.55, + "learning_rate": 9.008970525416489e-08, + "loss": 0.0005, + "step": 28353 + }, + { + "epoch": 0.55, + "learning_rate": 9.008582190982874e-08, + "loss": 0.0004, + "step": 28354 + }, + { + "epoch": 0.55, + "learning_rate": 9.00819385654926e-08, + "loss": 0.0004, + "step": 28355 + }, + { + "epoch": 0.55, + "learning_rate": 9.007805522115646e-08, + "loss": 0.0017, + "step": 28356 + }, + { + "epoch": 0.55, + "learning_rate": 9.007417187682032e-08, + "loss": 0.0006, + "step": 28357 + }, + { + "epoch": 0.55, + "learning_rate": 9.007028853248418e-08, + "loss": 0.0006, + "step": 28358 + }, + { + "epoch": 0.55, + "learning_rate": 9.006640518814803e-08, + "loss": 0.001, + "step": 28359 + }, + { + "epoch": 0.55, + "learning_rate": 9.006252184381189e-08, + "loss": 0.0015, + "step": 28360 + }, + { + "epoch": 0.55, + "learning_rate": 9.005863849947575e-08, + "loss": 0.0006, + "step": 28361 + }, + { + "epoch": 0.55, + "learning_rate": 9.005475515513961e-08, + "loss": 0.0005, + "step": 28362 + }, + { + "epoch": 0.55, + "learning_rate": 9.005087181080347e-08, + "loss": 0.0164, + "step": 28363 + }, + { + "epoch": 0.55, + "learning_rate": 9.004698846646733e-08, + "loss": 0.0006, + "step": 28364 + }, + { + "epoch": 0.55, + "learning_rate": 9.004310512213118e-08, + "loss": 0.0014, + "step": 28365 + }, + { + "epoch": 0.55, + "learning_rate": 9.003922177779504e-08, + "loss": 1.2246, + "step": 28366 + }, + { + "epoch": 0.55, + "learning_rate": 9.00353384334589e-08, + "loss": 0.0016, + "step": 28367 + }, + { + "epoch": 0.55, + "learning_rate": 9.003145508912275e-08, + "loss": 0.0191, + "step": 28368 + }, + { + "epoch": 0.55, + "learning_rate": 9.00275717447866e-08, + "loss": 0.0004, + "step": 28369 + }, + { + "epoch": 0.55, + "learning_rate": 9.002368840045046e-08, + "loss": 0.0009, + "step": 28370 + }, + { + "epoch": 0.55, + "learning_rate": 9.001980505611432e-08, + "loss": 0.0008, + "step": 28371 + }, + { + "epoch": 0.55, + "learning_rate": 9.001592171177818e-08, + "loss": 0.0006, + "step": 28372 + }, + { + "epoch": 0.55, + "learning_rate": 9.001203836744204e-08, + "loss": 0.0005, + "step": 28373 + }, + { + "epoch": 0.55, + "learning_rate": 9.00081550231059e-08, + "loss": 0.0118, + "step": 28374 + }, + { + "epoch": 0.55, + "learning_rate": 9.000427167876975e-08, + "loss": 0.0004, + "step": 28375 + }, + { + "epoch": 0.55, + "learning_rate": 9.000038833443361e-08, + "loss": 0.0004, + "step": 28376 + }, + { + "epoch": 0.55, + "learning_rate": 8.999650499009747e-08, + "loss": 0.0008, + "step": 28377 + }, + { + "epoch": 0.55, + "learning_rate": 8.999262164576133e-08, + "loss": 0.002, + "step": 28378 + }, + { + "epoch": 0.55, + "learning_rate": 8.998873830142519e-08, + "loss": 0.0004, + "step": 28379 + }, + { + "epoch": 0.55, + "learning_rate": 8.998485495708904e-08, + "loss": 0.0005, + "step": 28380 + }, + { + "epoch": 0.55, + "learning_rate": 8.99809716127529e-08, + "loss": 0.0004, + "step": 28381 + }, + { + "epoch": 0.55, + "learning_rate": 8.997708826841676e-08, + "loss": 0.0005, + "step": 28382 + }, + { + "epoch": 0.55, + "learning_rate": 8.997320492408062e-08, + "loss": 0.0007, + "step": 28383 + }, + { + "epoch": 0.55, + "learning_rate": 8.996932157974448e-08, + "loss": 0.0007, + "step": 28384 + }, + { + "epoch": 0.55, + "learning_rate": 8.996543823540834e-08, + "loss": 0.0004, + "step": 28385 + }, + { + "epoch": 0.55, + "learning_rate": 8.99615548910722e-08, + "loss": 0.0007, + "step": 28386 + }, + { + "epoch": 0.55, + "learning_rate": 8.995767154673605e-08, + "loss": 0.0021, + "step": 28387 + }, + { + "epoch": 0.55, + "learning_rate": 8.995378820239991e-08, + "loss": 0.0004, + "step": 28388 + }, + { + "epoch": 0.55, + "learning_rate": 8.994990485806377e-08, + "loss": 0.0006, + "step": 28389 + }, + { + "epoch": 0.55, + "learning_rate": 8.994602151372763e-08, + "loss": 0.0077, + "step": 28390 + }, + { + "epoch": 0.55, + "learning_rate": 8.994213816939149e-08, + "loss": 0.0005, + "step": 28391 + }, + { + "epoch": 0.55, + "learning_rate": 8.993825482505534e-08, + "loss": 0.0007, + "step": 28392 + }, + { + "epoch": 0.55, + "learning_rate": 8.99343714807192e-08, + "loss": 0.0007, + "step": 28393 + }, + { + "epoch": 0.55, + "learning_rate": 8.993048813638306e-08, + "loss": 0.0006, + "step": 28394 + }, + { + "epoch": 0.55, + "learning_rate": 8.992660479204692e-08, + "loss": 0.0016, + "step": 28395 + }, + { + "epoch": 0.55, + "learning_rate": 8.992272144771078e-08, + "loss": 0.0006, + "step": 28396 + }, + { + "epoch": 0.55, + "learning_rate": 8.991883810337462e-08, + "loss": 0.0005, + "step": 28397 + }, + { + "epoch": 0.55, + "learning_rate": 8.991495475903848e-08, + "loss": 0.0116, + "step": 28398 + }, + { + "epoch": 0.55, + "learning_rate": 8.991107141470234e-08, + "loss": 0.0005, + "step": 28399 + }, + { + "epoch": 0.55, + "learning_rate": 8.99071880703662e-08, + "loss": 0.0007, + "step": 28400 + }, + { + "epoch": 0.55, + "learning_rate": 8.990330472603005e-08, + "loss": 0.0005, + "step": 28401 + }, + { + "epoch": 0.55, + "learning_rate": 8.989942138169391e-08, + "loss": 0.0004, + "step": 28402 + }, + { + "epoch": 0.55, + "learning_rate": 8.989553803735777e-08, + "loss": 0.0005, + "step": 28403 + }, + { + "epoch": 0.55, + "learning_rate": 8.989165469302163e-08, + "loss": 0.0006, + "step": 28404 + }, + { + "epoch": 0.55, + "learning_rate": 8.988777134868549e-08, + "loss": 0.0005, + "step": 28405 + }, + { + "epoch": 0.55, + "learning_rate": 8.988388800434935e-08, + "loss": 0.0005, + "step": 28406 + }, + { + "epoch": 0.55, + "learning_rate": 8.98800046600132e-08, + "loss": 0.0006, + "step": 28407 + }, + { + "epoch": 0.55, + "learning_rate": 8.987612131567706e-08, + "loss": 0.1386, + "step": 28408 + }, + { + "epoch": 0.55, + "learning_rate": 8.987223797134092e-08, + "loss": 0.0006, + "step": 28409 + }, + { + "epoch": 0.55, + "learning_rate": 8.986835462700478e-08, + "loss": 0.0005, + "step": 28410 + }, + { + "epoch": 0.55, + "learning_rate": 8.986447128266864e-08, + "loss": 0.0006, + "step": 28411 + }, + { + "epoch": 0.55, + "learning_rate": 8.986058793833248e-08, + "loss": 0.0006, + "step": 28412 + }, + { + "epoch": 0.55, + "learning_rate": 8.985670459399634e-08, + "loss": 0.0005, + "step": 28413 + }, + { + "epoch": 0.55, + "learning_rate": 8.98528212496602e-08, + "loss": 0.0667, + "step": 28414 + }, + { + "epoch": 0.55, + "learning_rate": 8.984893790532406e-08, + "loss": 0.0004, + "step": 28415 + }, + { + "epoch": 0.55, + "learning_rate": 8.984505456098791e-08, + "loss": 0.0005, + "step": 28416 + }, + { + "epoch": 0.55, + "learning_rate": 8.984117121665177e-08, + "loss": 0.3922, + "step": 28417 + }, + { + "epoch": 0.55, + "learning_rate": 8.983728787231563e-08, + "loss": 0.0007, + "step": 28418 + }, + { + "epoch": 0.55, + "learning_rate": 8.983340452797949e-08, + "loss": 0.0287, + "step": 28419 + }, + { + "epoch": 0.55, + "learning_rate": 8.982952118364335e-08, + "loss": 0.0008, + "step": 28420 + }, + { + "epoch": 0.55, + "learning_rate": 8.98256378393072e-08, + "loss": 0.0005, + "step": 28421 + }, + { + "epoch": 0.55, + "learning_rate": 8.982175449497106e-08, + "loss": 0.0005, + "step": 28422 + }, + { + "epoch": 0.55, + "learning_rate": 8.981787115063492e-08, + "loss": 0.0005, + "step": 28423 + }, + { + "epoch": 0.55, + "learning_rate": 8.981398780629878e-08, + "loss": 0.0007, + "step": 28424 + }, + { + "epoch": 0.55, + "learning_rate": 8.981010446196264e-08, + "loss": 0.0005, + "step": 28425 + }, + { + "epoch": 0.55, + "learning_rate": 8.98062211176265e-08, + "loss": 0.0005, + "step": 28426 + }, + { + "epoch": 0.55, + "learning_rate": 8.980233777329034e-08, + "loss": 0.0005, + "step": 28427 + }, + { + "epoch": 0.55, + "learning_rate": 8.97984544289542e-08, + "loss": 0.0004, + "step": 28428 + }, + { + "epoch": 0.55, + "learning_rate": 8.979457108461806e-08, + "loss": 0.0004, + "step": 28429 + }, + { + "epoch": 0.55, + "learning_rate": 8.979068774028192e-08, + "loss": 0.0005, + "step": 28430 + }, + { + "epoch": 0.55, + "learning_rate": 8.978680439594578e-08, + "loss": 0.0007, + "step": 28431 + }, + { + "epoch": 0.55, + "learning_rate": 8.978292105160963e-08, + "loss": 0.0005, + "step": 28432 + }, + { + "epoch": 0.55, + "learning_rate": 8.977903770727349e-08, + "loss": 0.0005, + "step": 28433 + }, + { + "epoch": 0.55, + "learning_rate": 8.977515436293735e-08, + "loss": 0.0006, + "step": 28434 + }, + { + "epoch": 0.55, + "learning_rate": 8.977127101860121e-08, + "loss": 1.1026, + "step": 28435 + }, + { + "epoch": 0.55, + "learning_rate": 8.976738767426507e-08, + "loss": 0.0007, + "step": 28436 + }, + { + "epoch": 0.55, + "learning_rate": 8.976350432992892e-08, + "loss": 0.0006, + "step": 28437 + }, + { + "epoch": 0.55, + "learning_rate": 8.975962098559278e-08, + "loss": 0.0007, + "step": 28438 + }, + { + "epoch": 0.55, + "learning_rate": 8.975573764125664e-08, + "loss": 0.0005, + "step": 28439 + }, + { + "epoch": 0.55, + "learning_rate": 8.97518542969205e-08, + "loss": 0.0005, + "step": 28440 + }, + { + "epoch": 0.55, + "learning_rate": 8.974797095258436e-08, + "loss": 0.0007, + "step": 28441 + }, + { + "epoch": 0.55, + "learning_rate": 8.974408760824822e-08, + "loss": 0.0009, + "step": 28442 + }, + { + "epoch": 0.55, + "learning_rate": 8.974020426391207e-08, + "loss": 0.0005, + "step": 28443 + }, + { + "epoch": 0.55, + "learning_rate": 8.973632091957593e-08, + "loss": 0.0011, + "step": 28444 + }, + { + "epoch": 0.55, + "learning_rate": 8.973243757523979e-08, + "loss": 0.0005, + "step": 28445 + }, + { + "epoch": 0.55, + "learning_rate": 8.972855423090365e-08, + "loss": 0.0005, + "step": 28446 + }, + { + "epoch": 0.55, + "learning_rate": 8.972467088656751e-08, + "loss": 0.0005, + "step": 28447 + }, + { + "epoch": 0.55, + "learning_rate": 8.972078754223137e-08, + "loss": 0.0006, + "step": 28448 + }, + { + "epoch": 0.55, + "learning_rate": 8.971690419789522e-08, + "loss": 0.0009, + "step": 28449 + }, + { + "epoch": 0.55, + "learning_rate": 8.971302085355908e-08, + "loss": 0.0004, + "step": 28450 + }, + { + "epoch": 0.55, + "learning_rate": 8.970913750922294e-08, + "loss": 0.0006, + "step": 28451 + }, + { + "epoch": 0.55, + "learning_rate": 8.97052541648868e-08, + "loss": 0.0059, + "step": 28452 + }, + { + "epoch": 0.55, + "learning_rate": 8.970137082055066e-08, + "loss": 0.0005, + "step": 28453 + }, + { + "epoch": 0.55, + "learning_rate": 8.969748747621451e-08, + "loss": 0.0005, + "step": 28454 + }, + { + "epoch": 0.55, + "learning_rate": 8.969360413187836e-08, + "loss": 0.0007, + "step": 28455 + }, + { + "epoch": 0.55, + "learning_rate": 8.968972078754222e-08, + "loss": 0.0004, + "step": 28456 + }, + { + "epoch": 0.55, + "learning_rate": 8.968583744320608e-08, + "loss": 0.0006, + "step": 28457 + }, + { + "epoch": 0.55, + "learning_rate": 8.968195409886993e-08, + "loss": 0.0005, + "step": 28458 + }, + { + "epoch": 0.55, + "learning_rate": 8.967807075453379e-08, + "loss": 0.0013, + "step": 28459 + }, + { + "epoch": 0.55, + "learning_rate": 8.967418741019765e-08, + "loss": 0.6726, + "step": 28460 + }, + { + "epoch": 0.55, + "learning_rate": 8.967030406586151e-08, + "loss": 0.0004, + "step": 28461 + }, + { + "epoch": 0.55, + "learning_rate": 8.966642072152537e-08, + "loss": 0.0008, + "step": 28462 + }, + { + "epoch": 0.55, + "learning_rate": 8.966253737718923e-08, + "loss": 0.0006, + "step": 28463 + }, + { + "epoch": 0.55, + "learning_rate": 8.965865403285308e-08, + "loss": 0.001, + "step": 28464 + }, + { + "epoch": 0.55, + "learning_rate": 8.965477068851694e-08, + "loss": 0.0006, + "step": 28465 + }, + { + "epoch": 0.55, + "learning_rate": 8.96508873441808e-08, + "loss": 0.2918, + "step": 28466 + }, + { + "epoch": 0.55, + "learning_rate": 8.964700399984466e-08, + "loss": 0.0006, + "step": 28467 + }, + { + "epoch": 0.55, + "learning_rate": 8.964312065550852e-08, + "loss": 1.194, + "step": 28468 + }, + { + "epoch": 0.55, + "learning_rate": 8.963923731117238e-08, + "loss": 0.0004, + "step": 28469 + }, + { + "epoch": 0.55, + "learning_rate": 8.963535396683623e-08, + "loss": 1.0622, + "step": 28470 + }, + { + "epoch": 0.55, + "learning_rate": 8.963147062250009e-08, + "loss": 0.2472, + "step": 28471 + }, + { + "epoch": 0.55, + "learning_rate": 8.962758727816395e-08, + "loss": 0.0008, + "step": 28472 + }, + { + "epoch": 0.55, + "learning_rate": 8.962370393382781e-08, + "loss": 0.6651, + "step": 28473 + }, + { + "epoch": 0.55, + "learning_rate": 8.961982058949167e-08, + "loss": 0.0117, + "step": 28474 + }, + { + "epoch": 0.55, + "learning_rate": 8.961593724515552e-08, + "loss": 0.0007, + "step": 28475 + }, + { + "epoch": 0.55, + "learning_rate": 8.961205390081938e-08, + "loss": 0.0008, + "step": 28476 + }, + { + "epoch": 0.55, + "learning_rate": 8.960817055648324e-08, + "loss": 0.0007, + "step": 28477 + }, + { + "epoch": 0.55, + "learning_rate": 8.96042872121471e-08, + "loss": 0.0009, + "step": 28478 + }, + { + "epoch": 0.55, + "learning_rate": 8.960040386781096e-08, + "loss": 0.0006, + "step": 28479 + }, + { + "epoch": 0.55, + "learning_rate": 8.959652052347482e-08, + "loss": 0.0004, + "step": 28480 + }, + { + "epoch": 0.55, + "learning_rate": 8.959263717913867e-08, + "loss": 0.0042, + "step": 28481 + }, + { + "epoch": 0.55, + "learning_rate": 8.958875383480253e-08, + "loss": 0.0006, + "step": 28482 + }, + { + "epoch": 0.55, + "learning_rate": 8.958487049046639e-08, + "loss": 0.0186, + "step": 28483 + }, + { + "epoch": 0.55, + "learning_rate": 8.958098714613024e-08, + "loss": 0.0005, + "step": 28484 + }, + { + "epoch": 0.55, + "learning_rate": 8.95771038017941e-08, + "loss": 0.0007, + "step": 28485 + }, + { + "epoch": 0.55, + "learning_rate": 8.957322045745795e-08, + "loss": 0.0009, + "step": 28486 + }, + { + "epoch": 0.55, + "learning_rate": 8.956933711312181e-08, + "loss": 0.0003, + "step": 28487 + }, + { + "epoch": 0.55, + "learning_rate": 8.956545376878567e-08, + "loss": 0.004, + "step": 28488 + }, + { + "epoch": 0.55, + "learning_rate": 8.956157042444953e-08, + "loss": 0.0004, + "step": 28489 + }, + { + "epoch": 0.55, + "learning_rate": 8.955768708011339e-08, + "loss": 1.1476, + "step": 28490 + }, + { + "epoch": 0.55, + "learning_rate": 8.955380373577724e-08, + "loss": 0.0005, + "step": 28491 + }, + { + "epoch": 0.55, + "learning_rate": 8.95499203914411e-08, + "loss": 0.0007, + "step": 28492 + }, + { + "epoch": 0.55, + "learning_rate": 8.954603704710496e-08, + "loss": 0.0006, + "step": 28493 + }, + { + "epoch": 0.55, + "learning_rate": 8.954215370276882e-08, + "loss": 0.0009, + "step": 28494 + }, + { + "epoch": 0.55, + "learning_rate": 8.953827035843268e-08, + "loss": 0.0005, + "step": 28495 + }, + { + "epoch": 0.55, + "learning_rate": 8.953438701409653e-08, + "loss": 0.0005, + "step": 28496 + }, + { + "epoch": 0.55, + "learning_rate": 8.953050366976039e-08, + "loss": 0.0008, + "step": 28497 + }, + { + "epoch": 0.55, + "learning_rate": 8.952662032542425e-08, + "loss": 0.0006, + "step": 28498 + }, + { + "epoch": 0.55, + "learning_rate": 8.952273698108811e-08, + "loss": 0.0019, + "step": 28499 + }, + { + "epoch": 0.55, + "learning_rate": 8.951885363675197e-08, + "loss": 0.001, + "step": 28500 + }, + { + "epoch": 0.55, + "learning_rate": 8.951497029241583e-08, + "loss": 0.0007, + "step": 28501 + }, + { + "epoch": 0.55, + "learning_rate": 8.951108694807968e-08, + "loss": 0.0005, + "step": 28502 + }, + { + "epoch": 0.55, + "learning_rate": 8.950720360374354e-08, + "loss": 0.0005, + "step": 28503 + }, + { + "epoch": 0.55, + "learning_rate": 8.95033202594074e-08, + "loss": 0.0005, + "step": 28504 + }, + { + "epoch": 0.55, + "learning_rate": 8.949943691507126e-08, + "loss": 0.0005, + "step": 28505 + }, + { + "epoch": 0.55, + "learning_rate": 8.949555357073512e-08, + "loss": 0.0008, + "step": 28506 + }, + { + "epoch": 0.55, + "learning_rate": 8.949167022639898e-08, + "loss": 0.0015, + "step": 28507 + }, + { + "epoch": 0.55, + "learning_rate": 8.948778688206283e-08, + "loss": 0.0006, + "step": 28508 + }, + { + "epoch": 0.55, + "learning_rate": 8.948390353772669e-08, + "loss": 0.0008, + "step": 28509 + }, + { + "epoch": 0.55, + "learning_rate": 8.948002019339055e-08, + "loss": 1.1303, + "step": 28510 + }, + { + "epoch": 0.55, + "learning_rate": 8.947613684905441e-08, + "loss": 0.0056, + "step": 28511 + }, + { + "epoch": 0.55, + "learning_rate": 8.947225350471827e-08, + "loss": 0.006, + "step": 28512 + }, + { + "epoch": 0.55, + "learning_rate": 8.946837016038211e-08, + "loss": 0.0005, + "step": 28513 + }, + { + "epoch": 0.55, + "learning_rate": 8.946448681604597e-08, + "loss": 0.0004, + "step": 28514 + }, + { + "epoch": 0.55, + "learning_rate": 8.946060347170983e-08, + "loss": 0.8885, + "step": 28515 + }, + { + "epoch": 0.55, + "learning_rate": 8.945672012737369e-08, + "loss": 0.0004, + "step": 28516 + }, + { + "epoch": 0.55, + "learning_rate": 8.945283678303754e-08, + "loss": 0.0005, + "step": 28517 + }, + { + "epoch": 0.55, + "learning_rate": 8.94489534387014e-08, + "loss": 0.0018, + "step": 28518 + }, + { + "epoch": 0.55, + "learning_rate": 8.944507009436526e-08, + "loss": 0.0172, + "step": 28519 + }, + { + "epoch": 0.55, + "learning_rate": 8.944118675002912e-08, + "loss": 0.0007, + "step": 28520 + }, + { + "epoch": 0.55, + "learning_rate": 8.943730340569298e-08, + "loss": 0.0006, + "step": 28521 + }, + { + "epoch": 0.55, + "learning_rate": 8.943342006135684e-08, + "loss": 0.0858, + "step": 28522 + }, + { + "epoch": 0.55, + "learning_rate": 8.94295367170207e-08, + "loss": 0.0007, + "step": 28523 + }, + { + "epoch": 0.55, + "learning_rate": 8.942565337268455e-08, + "loss": 0.0032, + "step": 28524 + }, + { + "epoch": 0.55, + "learning_rate": 8.942177002834841e-08, + "loss": 0.0005, + "step": 28525 + }, + { + "epoch": 0.55, + "learning_rate": 8.941788668401227e-08, + "loss": 1.2699, + "step": 28526 + }, + { + "epoch": 0.55, + "learning_rate": 8.941400333967613e-08, + "loss": 0.0005, + "step": 28527 + }, + { + "epoch": 0.55, + "learning_rate": 8.941011999533999e-08, + "loss": 0.049, + "step": 28528 + }, + { + "epoch": 0.55, + "learning_rate": 8.940623665100384e-08, + "loss": 0.0006, + "step": 28529 + }, + { + "epoch": 0.55, + "learning_rate": 8.94023533066677e-08, + "loss": 0.0004, + "step": 28530 + }, + { + "epoch": 0.55, + "learning_rate": 8.939846996233156e-08, + "loss": 0.0006, + "step": 28531 + }, + { + "epoch": 0.55, + "learning_rate": 8.939458661799542e-08, + "loss": 0.0006, + "step": 28532 + }, + { + "epoch": 0.55, + "learning_rate": 8.939070327365928e-08, + "loss": 0.0007, + "step": 28533 + }, + { + "epoch": 0.55, + "learning_rate": 8.938681992932313e-08, + "loss": 0.0009, + "step": 28534 + }, + { + "epoch": 0.55, + "learning_rate": 8.938293658498699e-08, + "loss": 0.0516, + "step": 28535 + }, + { + "epoch": 0.55, + "learning_rate": 8.937905324065085e-08, + "loss": 0.8403, + "step": 28536 + }, + { + "epoch": 0.55, + "learning_rate": 8.937516989631471e-08, + "loss": 0.0004, + "step": 28537 + }, + { + "epoch": 0.55, + "learning_rate": 8.937128655197857e-08, + "loss": 0.0007, + "step": 28538 + }, + { + "epoch": 0.55, + "learning_rate": 8.936740320764243e-08, + "loss": 0.0004, + "step": 28539 + }, + { + "epoch": 0.55, + "learning_rate": 8.936351986330628e-08, + "loss": 0.1432, + "step": 28540 + }, + { + "epoch": 0.55, + "learning_rate": 8.935963651897014e-08, + "loss": 0.0004, + "step": 28541 + }, + { + "epoch": 0.55, + "learning_rate": 8.935575317463399e-08, + "loss": 0.0006, + "step": 28542 + }, + { + "epoch": 0.55, + "learning_rate": 8.935186983029785e-08, + "loss": 0.0006, + "step": 28543 + }, + { + "epoch": 0.55, + "learning_rate": 8.93479864859617e-08, + "loss": 0.0004, + "step": 28544 + }, + { + "epoch": 0.55, + "learning_rate": 8.934410314162556e-08, + "loss": 0.0004, + "step": 28545 + }, + { + "epoch": 0.55, + "learning_rate": 8.934021979728942e-08, + "loss": 0.4014, + "step": 28546 + }, + { + "epoch": 0.55, + "learning_rate": 8.933633645295328e-08, + "loss": 0.0003, + "step": 28547 + }, + { + "epoch": 0.55, + "learning_rate": 8.933245310861714e-08, + "loss": 0.0006, + "step": 28548 + }, + { + "epoch": 0.55, + "learning_rate": 8.9328569764281e-08, + "loss": 0.0008, + "step": 28549 + }, + { + "epoch": 0.55, + "learning_rate": 8.932468641994485e-08, + "loss": 0.0004, + "step": 28550 + }, + { + "epoch": 0.55, + "learning_rate": 8.932080307560871e-08, + "loss": 0.2641, + "step": 28551 + }, + { + "epoch": 0.55, + "learning_rate": 8.931691973127257e-08, + "loss": 0.0005, + "step": 28552 + }, + { + "epoch": 0.55, + "learning_rate": 8.931303638693643e-08, + "loss": 0.0006, + "step": 28553 + }, + { + "epoch": 0.55, + "learning_rate": 8.930915304260029e-08, + "loss": 0.1021, + "step": 28554 + }, + { + "epoch": 0.55, + "learning_rate": 8.930526969826414e-08, + "loss": 0.0005, + "step": 28555 + }, + { + "epoch": 0.55, + "learning_rate": 8.9301386353928e-08, + "loss": 0.0006, + "step": 28556 + }, + { + "epoch": 0.55, + "learning_rate": 8.929750300959186e-08, + "loss": 0.0015, + "step": 28557 + }, + { + "epoch": 0.55, + "learning_rate": 8.929361966525572e-08, + "loss": 0.0014, + "step": 28558 + }, + { + "epoch": 0.55, + "learning_rate": 8.928973632091958e-08, + "loss": 0.002, + "step": 28559 + }, + { + "epoch": 0.55, + "learning_rate": 8.928585297658344e-08, + "loss": 0.2834, + "step": 28560 + }, + { + "epoch": 0.55, + "learning_rate": 8.92819696322473e-08, + "loss": 0.0012, + "step": 28561 + }, + { + "epoch": 0.55, + "learning_rate": 8.927808628791115e-08, + "loss": 0.0006, + "step": 28562 + }, + { + "epoch": 0.55, + "learning_rate": 8.927420294357501e-08, + "loss": 0.0004, + "step": 28563 + }, + { + "epoch": 0.55, + "learning_rate": 8.927031959923887e-08, + "loss": 0.0006, + "step": 28564 + }, + { + "epoch": 0.55, + "learning_rate": 8.926643625490273e-08, + "loss": 0.0006, + "step": 28565 + }, + { + "epoch": 0.55, + "learning_rate": 8.926255291056659e-08, + "loss": 0.0005, + "step": 28566 + }, + { + "epoch": 0.55, + "learning_rate": 8.925866956623044e-08, + "loss": 0.0009, + "step": 28567 + }, + { + "epoch": 0.55, + "learning_rate": 8.92547862218943e-08, + "loss": 0.0006, + "step": 28568 + }, + { + "epoch": 0.55, + "learning_rate": 8.925090287755816e-08, + "loss": 0.0008, + "step": 28569 + }, + { + "epoch": 0.55, + "learning_rate": 8.924701953322202e-08, + "loss": 0.0004, + "step": 28570 + }, + { + "epoch": 0.55, + "learning_rate": 8.924313618888586e-08, + "loss": 0.0006, + "step": 28571 + }, + { + "epoch": 0.55, + "learning_rate": 8.923925284454972e-08, + "loss": 0.1744, + "step": 28572 + }, + { + "epoch": 0.55, + "learning_rate": 8.923536950021358e-08, + "loss": 0.0006, + "step": 28573 + }, + { + "epoch": 0.55, + "learning_rate": 8.923148615587744e-08, + "loss": 0.0005, + "step": 28574 + }, + { + "epoch": 0.55, + "learning_rate": 8.92276028115413e-08, + "loss": 0.0007, + "step": 28575 + }, + { + "epoch": 0.55, + "learning_rate": 8.922371946720515e-08, + "loss": 0.1615, + "step": 28576 + }, + { + "epoch": 0.55, + "learning_rate": 8.921983612286901e-08, + "loss": 0.0006, + "step": 28577 + }, + { + "epoch": 0.55, + "learning_rate": 8.921595277853287e-08, + "loss": 0.0004, + "step": 28578 + }, + { + "epoch": 0.55, + "learning_rate": 8.921206943419673e-08, + "loss": 0.0006, + "step": 28579 + }, + { + "epoch": 0.55, + "learning_rate": 8.920818608986059e-08, + "loss": 0.0004, + "step": 28580 + }, + { + "epoch": 0.55, + "learning_rate": 8.920430274552445e-08, + "loss": 0.0006, + "step": 28581 + }, + { + "epoch": 0.55, + "learning_rate": 8.92004194011883e-08, + "loss": 0.0006, + "step": 28582 + }, + { + "epoch": 0.55, + "learning_rate": 8.919653605685216e-08, + "loss": 0.0007, + "step": 28583 + }, + { + "epoch": 0.55, + "learning_rate": 8.919265271251602e-08, + "loss": 0.0006, + "step": 28584 + }, + { + "epoch": 0.55, + "learning_rate": 8.918876936817988e-08, + "loss": 0.0005, + "step": 28585 + }, + { + "epoch": 0.55, + "learning_rate": 8.918488602384374e-08, + "loss": 1.2209, + "step": 28586 + }, + { + "epoch": 0.55, + "learning_rate": 8.91810026795076e-08, + "loss": 0.0008, + "step": 28587 + }, + { + "epoch": 0.55, + "learning_rate": 8.917711933517145e-08, + "loss": 0.0005, + "step": 28588 + }, + { + "epoch": 0.55, + "learning_rate": 8.91732359908353e-08, + "loss": 0.0826, + "step": 28589 + }, + { + "epoch": 0.55, + "learning_rate": 8.916935264649916e-08, + "loss": 0.0005, + "step": 28590 + }, + { + "epoch": 0.55, + "learning_rate": 8.916546930216301e-08, + "loss": 0.6506, + "step": 28591 + }, + { + "epoch": 0.55, + "learning_rate": 8.916158595782687e-08, + "loss": 0.0009, + "step": 28592 + }, + { + "epoch": 0.55, + "learning_rate": 8.915770261349073e-08, + "loss": 0.0007, + "step": 28593 + }, + { + "epoch": 0.55, + "learning_rate": 8.915381926915459e-08, + "loss": 0.0008, + "step": 28594 + }, + { + "epoch": 0.55, + "learning_rate": 8.914993592481845e-08, + "loss": 0.0312, + "step": 28595 + }, + { + "epoch": 0.55, + "learning_rate": 8.91460525804823e-08, + "loss": 0.0004, + "step": 28596 + }, + { + "epoch": 0.55, + "learning_rate": 8.914216923614616e-08, + "loss": 0.0004, + "step": 28597 + }, + { + "epoch": 0.55, + "learning_rate": 8.913828589181002e-08, + "loss": 0.0005, + "step": 28598 + }, + { + "epoch": 0.55, + "learning_rate": 8.913440254747388e-08, + "loss": 0.0011, + "step": 28599 + }, + { + "epoch": 0.55, + "learning_rate": 8.913051920313774e-08, + "loss": 0.0008, + "step": 28600 + }, + { + "epoch": 0.55, + "learning_rate": 8.91266358588016e-08, + "loss": 0.0005, + "step": 28601 + }, + { + "epoch": 0.55, + "learning_rate": 8.912275251446546e-08, + "loss": 0.0006, + "step": 28602 + }, + { + "epoch": 0.55, + "learning_rate": 8.911886917012931e-08, + "loss": 0.0007, + "step": 28603 + }, + { + "epoch": 0.55, + "learning_rate": 8.911498582579316e-08, + "loss": 0.0012, + "step": 28604 + }, + { + "epoch": 0.55, + "learning_rate": 8.911110248145702e-08, + "loss": 0.002, + "step": 28605 + }, + { + "epoch": 0.55, + "learning_rate": 8.910721913712088e-08, + "loss": 0.0006, + "step": 28606 + }, + { + "epoch": 0.55, + "learning_rate": 8.910333579278473e-08, + "loss": 0.0008, + "step": 28607 + }, + { + "epoch": 0.55, + "learning_rate": 8.909945244844859e-08, + "loss": 0.0004, + "step": 28608 + }, + { + "epoch": 0.55, + "learning_rate": 8.909556910411245e-08, + "loss": 0.0004, + "step": 28609 + }, + { + "epoch": 0.55, + "learning_rate": 8.909168575977631e-08, + "loss": 0.0004, + "step": 28610 + }, + { + "epoch": 0.55, + "learning_rate": 8.908780241544017e-08, + "loss": 0.0005, + "step": 28611 + }, + { + "epoch": 0.56, + "learning_rate": 8.908391907110402e-08, + "loss": 0.001, + "step": 28612 + }, + { + "epoch": 0.56, + "learning_rate": 8.908003572676788e-08, + "loss": 0.0005, + "step": 28613 + }, + { + "epoch": 0.56, + "learning_rate": 8.907615238243174e-08, + "loss": 0.3027, + "step": 28614 + }, + { + "epoch": 0.56, + "learning_rate": 8.90722690380956e-08, + "loss": 0.0007, + "step": 28615 + }, + { + "epoch": 0.56, + "learning_rate": 8.906838569375946e-08, + "loss": 0.0003, + "step": 28616 + }, + { + "epoch": 0.56, + "learning_rate": 8.906450234942332e-08, + "loss": 0.0006, + "step": 28617 + }, + { + "epoch": 0.56, + "learning_rate": 8.906061900508717e-08, + "loss": 0.001, + "step": 28618 + }, + { + "epoch": 0.56, + "learning_rate": 8.905673566075103e-08, + "loss": 0.0025, + "step": 28619 + }, + { + "epoch": 0.56, + "learning_rate": 8.905285231641489e-08, + "loss": 0.8396, + "step": 28620 + }, + { + "epoch": 0.56, + "learning_rate": 8.904896897207875e-08, + "loss": 0.0003, + "step": 28621 + }, + { + "epoch": 0.56, + "learning_rate": 8.904508562774261e-08, + "loss": 0.1461, + "step": 28622 + }, + { + "epoch": 0.56, + "learning_rate": 8.904120228340647e-08, + "loss": 0.0013, + "step": 28623 + }, + { + "epoch": 0.56, + "learning_rate": 8.903731893907032e-08, + "loss": 0.0006, + "step": 28624 + }, + { + "epoch": 0.56, + "learning_rate": 8.903343559473418e-08, + "loss": 0.0004, + "step": 28625 + }, + { + "epoch": 0.56, + "learning_rate": 8.902955225039804e-08, + "loss": 0.0004, + "step": 28626 + }, + { + "epoch": 0.56, + "learning_rate": 8.90256689060619e-08, + "loss": 0.0006, + "step": 28627 + }, + { + "epoch": 0.56, + "learning_rate": 8.902178556172576e-08, + "loss": 0.4577, + "step": 28628 + }, + { + "epoch": 0.56, + "learning_rate": 8.90179022173896e-08, + "loss": 0.0235, + "step": 28629 + }, + { + "epoch": 0.56, + "learning_rate": 8.901401887305346e-08, + "loss": 0.0008, + "step": 28630 + }, + { + "epoch": 0.56, + "learning_rate": 8.901013552871732e-08, + "loss": 0.0005, + "step": 28631 + }, + { + "epoch": 0.56, + "learning_rate": 8.900625218438118e-08, + "loss": 0.0042, + "step": 28632 + }, + { + "epoch": 0.56, + "learning_rate": 8.900236884004503e-08, + "loss": 0.0006, + "step": 28633 + }, + { + "epoch": 0.56, + "learning_rate": 8.899848549570889e-08, + "loss": 0.0006, + "step": 28634 + }, + { + "epoch": 0.56, + "learning_rate": 8.899460215137275e-08, + "loss": 0.004, + "step": 28635 + }, + { + "epoch": 0.56, + "learning_rate": 8.899071880703661e-08, + "loss": 0.0004, + "step": 28636 + }, + { + "epoch": 0.56, + "learning_rate": 8.898683546270047e-08, + "loss": 0.0007, + "step": 28637 + }, + { + "epoch": 0.56, + "learning_rate": 8.898295211836433e-08, + "loss": 0.0005, + "step": 28638 + }, + { + "epoch": 0.56, + "learning_rate": 8.897906877402818e-08, + "loss": 0.0008, + "step": 28639 + }, + { + "epoch": 0.56, + "learning_rate": 8.897518542969204e-08, + "loss": 0.0004, + "step": 28640 + }, + { + "epoch": 0.56, + "learning_rate": 8.89713020853559e-08, + "loss": 0.0005, + "step": 28641 + }, + { + "epoch": 0.56, + "learning_rate": 8.896741874101976e-08, + "loss": 0.0007, + "step": 28642 + }, + { + "epoch": 0.56, + "learning_rate": 8.896353539668362e-08, + "loss": 0.0009, + "step": 28643 + }, + { + "epoch": 0.56, + "learning_rate": 8.895965205234748e-08, + "loss": 0.0005, + "step": 28644 + }, + { + "epoch": 0.56, + "learning_rate": 8.895576870801133e-08, + "loss": 0.0006, + "step": 28645 + }, + { + "epoch": 0.56, + "learning_rate": 8.895188536367519e-08, + "loss": 0.0003, + "step": 28646 + }, + { + "epoch": 0.56, + "learning_rate": 8.894800201933905e-08, + "loss": 0.0004, + "step": 28647 + }, + { + "epoch": 0.56, + "learning_rate": 8.894411867500291e-08, + "loss": 0.0006, + "step": 28648 + }, + { + "epoch": 0.56, + "learning_rate": 8.894023533066677e-08, + "loss": 0.0005, + "step": 28649 + }, + { + "epoch": 0.56, + "learning_rate": 8.893635198633062e-08, + "loss": 0.0005, + "step": 28650 + }, + { + "epoch": 0.56, + "learning_rate": 8.893246864199448e-08, + "loss": 0.0007, + "step": 28651 + }, + { + "epoch": 0.56, + "learning_rate": 8.892858529765834e-08, + "loss": 0.0007, + "step": 28652 + }, + { + "epoch": 0.56, + "learning_rate": 8.89247019533222e-08, + "loss": 0.0599, + "step": 28653 + }, + { + "epoch": 0.56, + "learning_rate": 8.892081860898606e-08, + "loss": 0.0005, + "step": 28654 + }, + { + "epoch": 0.56, + "learning_rate": 8.891693526464992e-08, + "loss": 0.0006, + "step": 28655 + }, + { + "epoch": 0.56, + "learning_rate": 8.891305192031377e-08, + "loss": 0.0006, + "step": 28656 + }, + { + "epoch": 0.56, + "learning_rate": 8.890916857597763e-08, + "loss": 0.5775, + "step": 28657 + }, + { + "epoch": 0.56, + "learning_rate": 8.890528523164148e-08, + "loss": 0.0008, + "step": 28658 + }, + { + "epoch": 0.56, + "learning_rate": 8.890140188730534e-08, + "loss": 0.0005, + "step": 28659 + }, + { + "epoch": 0.56, + "learning_rate": 8.88975185429692e-08, + "loss": 0.0008, + "step": 28660 + }, + { + "epoch": 0.56, + "learning_rate": 8.889363519863305e-08, + "loss": 0.0005, + "step": 28661 + }, + { + "epoch": 0.56, + "learning_rate": 8.888975185429691e-08, + "loss": 0.0005, + "step": 28662 + }, + { + "epoch": 0.56, + "learning_rate": 8.888586850996077e-08, + "loss": 0.0005, + "step": 28663 + }, + { + "epoch": 0.56, + "learning_rate": 8.888198516562463e-08, + "loss": 0.0006, + "step": 28664 + }, + { + "epoch": 0.56, + "learning_rate": 8.887810182128849e-08, + "loss": 0.0004, + "step": 28665 + }, + { + "epoch": 0.56, + "learning_rate": 8.887421847695234e-08, + "loss": 0.0009, + "step": 28666 + }, + { + "epoch": 0.56, + "learning_rate": 8.88703351326162e-08, + "loss": 0.001, + "step": 28667 + }, + { + "epoch": 0.56, + "learning_rate": 8.886645178828006e-08, + "loss": 0.0004, + "step": 28668 + }, + { + "epoch": 0.56, + "learning_rate": 8.886256844394392e-08, + "loss": 0.0007, + "step": 28669 + }, + { + "epoch": 0.56, + "learning_rate": 8.885868509960778e-08, + "loss": 0.0005, + "step": 28670 + }, + { + "epoch": 0.56, + "learning_rate": 8.885480175527163e-08, + "loss": 0.0004, + "step": 28671 + }, + { + "epoch": 0.56, + "learning_rate": 8.885091841093549e-08, + "loss": 0.0005, + "step": 28672 + }, + { + "epoch": 0.56, + "learning_rate": 8.884703506659935e-08, + "loss": 0.0005, + "step": 28673 + }, + { + "epoch": 0.56, + "learning_rate": 8.884315172226321e-08, + "loss": 0.0134, + "step": 28674 + }, + { + "epoch": 0.56, + "learning_rate": 8.883926837792707e-08, + "loss": 0.993, + "step": 28675 + }, + { + "epoch": 0.56, + "learning_rate": 8.883538503359093e-08, + "loss": 0.0007, + "step": 28676 + }, + { + "epoch": 0.56, + "learning_rate": 8.883150168925478e-08, + "loss": 0.0005, + "step": 28677 + }, + { + "epoch": 0.56, + "learning_rate": 8.882761834491864e-08, + "loss": 0.0004, + "step": 28678 + }, + { + "epoch": 0.56, + "learning_rate": 8.88237350005825e-08, + "loss": 0.008, + "step": 28679 + }, + { + "epoch": 0.56, + "learning_rate": 8.881985165624636e-08, + "loss": 0.0056, + "step": 28680 + }, + { + "epoch": 0.56, + "learning_rate": 8.881596831191022e-08, + "loss": 0.0006, + "step": 28681 + }, + { + "epoch": 0.56, + "learning_rate": 8.881208496757408e-08, + "loss": 0.0012, + "step": 28682 + }, + { + "epoch": 0.56, + "learning_rate": 8.880820162323793e-08, + "loss": 0.0005, + "step": 28683 + }, + { + "epoch": 0.56, + "learning_rate": 8.880431827890179e-08, + "loss": 0.0006, + "step": 28684 + }, + { + "epoch": 0.56, + "learning_rate": 8.880043493456565e-08, + "loss": 0.0006, + "step": 28685 + }, + { + "epoch": 0.56, + "learning_rate": 8.879655159022951e-08, + "loss": 0.0008, + "step": 28686 + }, + { + "epoch": 0.56, + "learning_rate": 8.879266824589335e-08, + "loss": 0.3888, + "step": 28687 + }, + { + "epoch": 0.56, + "learning_rate": 8.878878490155721e-08, + "loss": 0.0005, + "step": 28688 + }, + { + "epoch": 0.56, + "learning_rate": 8.878490155722107e-08, + "loss": 0.0006, + "step": 28689 + }, + { + "epoch": 0.56, + "learning_rate": 8.878101821288493e-08, + "loss": 0.0005, + "step": 28690 + }, + { + "epoch": 0.56, + "learning_rate": 8.877713486854879e-08, + "loss": 0.0014, + "step": 28691 + }, + { + "epoch": 0.56, + "learning_rate": 8.877325152421264e-08, + "loss": 0.0004, + "step": 28692 + }, + { + "epoch": 0.56, + "learning_rate": 8.87693681798765e-08, + "loss": 0.0012, + "step": 28693 + }, + { + "epoch": 0.56, + "learning_rate": 8.876548483554036e-08, + "loss": 0.0008, + "step": 28694 + }, + { + "epoch": 0.56, + "learning_rate": 8.876160149120422e-08, + "loss": 0.0004, + "step": 28695 + }, + { + "epoch": 0.56, + "learning_rate": 8.875771814686808e-08, + "loss": 0.0005, + "step": 28696 + }, + { + "epoch": 0.56, + "learning_rate": 8.875383480253194e-08, + "loss": 0.0006, + "step": 28697 + }, + { + "epoch": 0.56, + "learning_rate": 8.87499514581958e-08, + "loss": 0.0003, + "step": 28698 + }, + { + "epoch": 0.56, + "learning_rate": 8.874606811385965e-08, + "loss": 0.0006, + "step": 28699 + }, + { + "epoch": 0.56, + "learning_rate": 8.874218476952351e-08, + "loss": 0.0006, + "step": 28700 + }, + { + "epoch": 0.56, + "learning_rate": 8.873830142518737e-08, + "loss": 0.0006, + "step": 28701 + }, + { + "epoch": 0.56, + "learning_rate": 8.873441808085123e-08, + "loss": 0.001, + "step": 28702 + }, + { + "epoch": 0.56, + "learning_rate": 8.873053473651509e-08, + "loss": 0.0005, + "step": 28703 + }, + { + "epoch": 0.56, + "learning_rate": 8.872665139217894e-08, + "loss": 0.0012, + "step": 28704 + }, + { + "epoch": 0.56, + "learning_rate": 8.87227680478428e-08, + "loss": 0.0116, + "step": 28705 + }, + { + "epoch": 0.56, + "learning_rate": 8.871888470350666e-08, + "loss": 0.0019, + "step": 28706 + }, + { + "epoch": 0.56, + "learning_rate": 8.871500135917052e-08, + "loss": 0.2142, + "step": 28707 + }, + { + "epoch": 0.56, + "learning_rate": 8.871111801483438e-08, + "loss": 0.0005, + "step": 28708 + }, + { + "epoch": 0.56, + "learning_rate": 8.870723467049823e-08, + "loss": 0.0011, + "step": 28709 + }, + { + "epoch": 0.56, + "learning_rate": 8.870335132616209e-08, + "loss": 0.5243, + "step": 28710 + }, + { + "epoch": 0.56, + "learning_rate": 8.869946798182595e-08, + "loss": 0.0005, + "step": 28711 + }, + { + "epoch": 0.56, + "learning_rate": 8.869558463748981e-08, + "loss": 0.007, + "step": 28712 + }, + { + "epoch": 0.56, + "learning_rate": 8.869170129315367e-08, + "loss": 0.178, + "step": 28713 + }, + { + "epoch": 0.56, + "learning_rate": 8.868781794881753e-08, + "loss": 0.0019, + "step": 28714 + }, + { + "epoch": 0.56, + "learning_rate": 8.868393460448138e-08, + "loss": 0.0005, + "step": 28715 + }, + { + "epoch": 0.56, + "learning_rate": 8.868005126014523e-08, + "loss": 0.0005, + "step": 28716 + }, + { + "epoch": 0.56, + "learning_rate": 8.867616791580909e-08, + "loss": 0.0006, + "step": 28717 + }, + { + "epoch": 0.56, + "learning_rate": 8.867228457147295e-08, + "loss": 0.0005, + "step": 28718 + }, + { + "epoch": 0.56, + "learning_rate": 8.86684012271368e-08, + "loss": 0.0005, + "step": 28719 + }, + { + "epoch": 0.56, + "learning_rate": 8.866451788280066e-08, + "loss": 0.582, + "step": 28720 + }, + { + "epoch": 0.56, + "learning_rate": 8.866063453846452e-08, + "loss": 0.0005, + "step": 28721 + }, + { + "epoch": 0.56, + "learning_rate": 8.865675119412838e-08, + "loss": 0.0006, + "step": 28722 + }, + { + "epoch": 0.56, + "learning_rate": 8.865286784979224e-08, + "loss": 0.8255, + "step": 28723 + }, + { + "epoch": 0.56, + "learning_rate": 8.86489845054561e-08, + "loss": 0.0007, + "step": 28724 + }, + { + "epoch": 0.56, + "learning_rate": 8.864510116111995e-08, + "loss": 0.0016, + "step": 28725 + }, + { + "epoch": 0.56, + "learning_rate": 8.864121781678381e-08, + "loss": 0.0005, + "step": 28726 + }, + { + "epoch": 0.56, + "learning_rate": 8.863733447244767e-08, + "loss": 0.0006, + "step": 28727 + }, + { + "epoch": 0.56, + "learning_rate": 8.863345112811153e-08, + "loss": 0.0004, + "step": 28728 + }, + { + "epoch": 0.56, + "learning_rate": 8.862956778377539e-08, + "loss": 0.0005, + "step": 28729 + }, + { + "epoch": 0.56, + "learning_rate": 8.862568443943924e-08, + "loss": 0.0006, + "step": 28730 + }, + { + "epoch": 0.56, + "learning_rate": 8.86218010951031e-08, + "loss": 0.0003, + "step": 28731 + }, + { + "epoch": 0.56, + "learning_rate": 8.861791775076696e-08, + "loss": 0.0009, + "step": 28732 + }, + { + "epoch": 0.56, + "learning_rate": 8.861403440643082e-08, + "loss": 0.0005, + "step": 28733 + }, + { + "epoch": 0.56, + "learning_rate": 8.861015106209468e-08, + "loss": 0.0004, + "step": 28734 + }, + { + "epoch": 0.56, + "learning_rate": 8.860626771775854e-08, + "loss": 0.001, + "step": 28735 + }, + { + "epoch": 0.56, + "learning_rate": 8.86023843734224e-08, + "loss": 0.0006, + "step": 28736 + }, + { + "epoch": 0.56, + "learning_rate": 8.859850102908625e-08, + "loss": 0.0016, + "step": 28737 + }, + { + "epoch": 0.56, + "learning_rate": 8.859461768475011e-08, + "loss": 0.5996, + "step": 28738 + }, + { + "epoch": 0.56, + "learning_rate": 8.859073434041397e-08, + "loss": 0.0004, + "step": 28739 + }, + { + "epoch": 0.56, + "learning_rate": 8.858685099607783e-08, + "loss": 0.1027, + "step": 28740 + }, + { + "epoch": 0.56, + "learning_rate": 8.858296765174169e-08, + "loss": 1.2398, + "step": 28741 + }, + { + "epoch": 0.56, + "learning_rate": 8.857908430740554e-08, + "loss": 0.0004, + "step": 28742 + }, + { + "epoch": 0.56, + "learning_rate": 8.85752009630694e-08, + "loss": 0.0004, + "step": 28743 + }, + { + "epoch": 0.56, + "learning_rate": 8.857131761873326e-08, + "loss": 0.0005, + "step": 28744 + }, + { + "epoch": 0.56, + "learning_rate": 8.85674342743971e-08, + "loss": 0.0007, + "step": 28745 + }, + { + "epoch": 0.56, + "learning_rate": 8.856355093006096e-08, + "loss": 0.0005, + "step": 28746 + }, + { + "epoch": 0.56, + "learning_rate": 8.855966758572482e-08, + "loss": 0.0007, + "step": 28747 + }, + { + "epoch": 0.56, + "learning_rate": 8.855578424138868e-08, + "loss": 0.0005, + "step": 28748 + }, + { + "epoch": 0.56, + "learning_rate": 8.855190089705254e-08, + "loss": 0.0008, + "step": 28749 + }, + { + "epoch": 0.56, + "learning_rate": 8.85480175527164e-08, + "loss": 0.0007, + "step": 28750 + }, + { + "epoch": 0.56, + "learning_rate": 8.854413420838025e-08, + "loss": 0.0007, + "step": 28751 + }, + { + "epoch": 0.56, + "learning_rate": 8.854025086404411e-08, + "loss": 0.0005, + "step": 28752 + }, + { + "epoch": 0.56, + "learning_rate": 8.853636751970797e-08, + "loss": 0.0006, + "step": 28753 + }, + { + "epoch": 0.56, + "learning_rate": 8.853248417537183e-08, + "loss": 0.0004, + "step": 28754 + }, + { + "epoch": 0.56, + "learning_rate": 8.852860083103569e-08, + "loss": 0.0026, + "step": 28755 + }, + { + "epoch": 0.56, + "learning_rate": 8.852471748669955e-08, + "loss": 0.0004, + "step": 28756 + }, + { + "epoch": 0.56, + "learning_rate": 8.85208341423634e-08, + "loss": 0.0008, + "step": 28757 + }, + { + "epoch": 0.56, + "learning_rate": 8.851695079802726e-08, + "loss": 0.0005, + "step": 28758 + }, + { + "epoch": 0.56, + "learning_rate": 8.851306745369112e-08, + "loss": 0.7598, + "step": 28759 + }, + { + "epoch": 0.56, + "learning_rate": 8.850918410935498e-08, + "loss": 0.0009, + "step": 28760 + }, + { + "epoch": 0.56, + "learning_rate": 8.850530076501884e-08, + "loss": 0.0004, + "step": 28761 + }, + { + "epoch": 0.56, + "learning_rate": 8.85014174206827e-08, + "loss": 0.0004, + "step": 28762 + }, + { + "epoch": 0.56, + "learning_rate": 8.849753407634655e-08, + "loss": 0.0007, + "step": 28763 + }, + { + "epoch": 0.56, + "learning_rate": 8.849365073201041e-08, + "loss": 1.2356, + "step": 28764 + }, + { + "epoch": 0.56, + "learning_rate": 8.848976738767427e-08, + "loss": 0.0005, + "step": 28765 + }, + { + "epoch": 0.56, + "learning_rate": 8.848588404333811e-08, + "loss": 0.0005, + "step": 28766 + }, + { + "epoch": 0.56, + "learning_rate": 8.848200069900197e-08, + "loss": 0.0007, + "step": 28767 + }, + { + "epoch": 0.56, + "learning_rate": 8.847811735466583e-08, + "loss": 0.0005, + "step": 28768 + }, + { + "epoch": 0.56, + "learning_rate": 8.847423401032969e-08, + "loss": 0.0004, + "step": 28769 + }, + { + "epoch": 0.56, + "learning_rate": 8.847035066599355e-08, + "loss": 0.0005, + "step": 28770 + }, + { + "epoch": 0.56, + "learning_rate": 8.84664673216574e-08, + "loss": 0.0004, + "step": 28771 + }, + { + "epoch": 0.56, + "learning_rate": 8.846258397732126e-08, + "loss": 0.0004, + "step": 28772 + }, + { + "epoch": 0.56, + "learning_rate": 8.845870063298512e-08, + "loss": 0.0006, + "step": 28773 + }, + { + "epoch": 0.56, + "learning_rate": 8.845481728864898e-08, + "loss": 0.0004, + "step": 28774 + }, + { + "epoch": 0.56, + "learning_rate": 8.845093394431284e-08, + "loss": 0.0005, + "step": 28775 + }, + { + "epoch": 0.56, + "learning_rate": 8.84470505999767e-08, + "loss": 0.0005, + "step": 28776 + }, + { + "epoch": 0.56, + "learning_rate": 8.844316725564056e-08, + "loss": 0.0389, + "step": 28777 + }, + { + "epoch": 0.56, + "learning_rate": 8.843928391130441e-08, + "loss": 0.0005, + "step": 28778 + }, + { + "epoch": 0.56, + "learning_rate": 8.843540056696827e-08, + "loss": 0.0004, + "step": 28779 + }, + { + "epoch": 0.56, + "learning_rate": 8.843151722263213e-08, + "loss": 0.0005, + "step": 28780 + }, + { + "epoch": 0.56, + "learning_rate": 8.842763387829598e-08, + "loss": 0.0008, + "step": 28781 + }, + { + "epoch": 0.56, + "learning_rate": 8.842375053395983e-08, + "loss": 0.0005, + "step": 28782 + }, + { + "epoch": 0.56, + "learning_rate": 8.841986718962369e-08, + "loss": 0.0004, + "step": 28783 + }, + { + "epoch": 0.56, + "learning_rate": 8.841598384528755e-08, + "loss": 0.0007, + "step": 28784 + }, + { + "epoch": 0.56, + "learning_rate": 8.841210050095141e-08, + "loss": 0.0325, + "step": 28785 + }, + { + "epoch": 0.56, + "learning_rate": 8.840821715661527e-08, + "loss": 0.9718, + "step": 28786 + }, + { + "epoch": 0.56, + "learning_rate": 8.840433381227912e-08, + "loss": 0.0006, + "step": 28787 + }, + { + "epoch": 0.56, + "learning_rate": 8.840045046794298e-08, + "loss": 0.0009, + "step": 28788 + }, + { + "epoch": 0.56, + "learning_rate": 8.839656712360684e-08, + "loss": 0.5255, + "step": 28789 + }, + { + "epoch": 0.56, + "learning_rate": 8.83926837792707e-08, + "loss": 0.0005, + "step": 28790 + }, + { + "epoch": 0.56, + "learning_rate": 8.838880043493456e-08, + "loss": 0.0006, + "step": 28791 + }, + { + "epoch": 0.56, + "learning_rate": 8.838491709059842e-08, + "loss": 0.0007, + "step": 28792 + }, + { + "epoch": 0.56, + "learning_rate": 8.838103374626227e-08, + "loss": 0.0013, + "step": 28793 + }, + { + "epoch": 0.56, + "learning_rate": 8.837715040192613e-08, + "loss": 0.5305, + "step": 28794 + }, + { + "epoch": 0.56, + "learning_rate": 8.837326705758999e-08, + "loss": 0.0014, + "step": 28795 + }, + { + "epoch": 0.56, + "learning_rate": 8.836938371325385e-08, + "loss": 0.0004, + "step": 28796 + }, + { + "epoch": 0.56, + "learning_rate": 8.836550036891771e-08, + "loss": 0.0005, + "step": 28797 + }, + { + "epoch": 0.56, + "learning_rate": 8.836161702458157e-08, + "loss": 0.0006, + "step": 28798 + }, + { + "epoch": 0.56, + "learning_rate": 8.835773368024542e-08, + "loss": 0.0014, + "step": 28799 + }, + { + "epoch": 0.56, + "learning_rate": 8.835385033590928e-08, + "loss": 0.0006, + "step": 28800 + }, + { + "epoch": 0.56, + "learning_rate": 8.834996699157314e-08, + "loss": 0.0007, + "step": 28801 + }, + { + "epoch": 0.56, + "learning_rate": 8.8346083647237e-08, + "loss": 0.0012, + "step": 28802 + }, + { + "epoch": 0.56, + "learning_rate": 8.834220030290084e-08, + "loss": 0.0005, + "step": 28803 + }, + { + "epoch": 0.56, + "learning_rate": 8.83383169585647e-08, + "loss": 0.6808, + "step": 28804 + }, + { + "epoch": 0.56, + "learning_rate": 8.833443361422856e-08, + "loss": 0.0004, + "step": 28805 + }, + { + "epoch": 0.56, + "learning_rate": 8.833055026989242e-08, + "loss": 0.7045, + "step": 28806 + }, + { + "epoch": 0.56, + "learning_rate": 8.832666692555628e-08, + "loss": 0.0007, + "step": 28807 + }, + { + "epoch": 0.56, + "learning_rate": 8.832278358122013e-08, + "loss": 0.1573, + "step": 28808 + }, + { + "epoch": 0.56, + "learning_rate": 8.831890023688399e-08, + "loss": 0.0005, + "step": 28809 + }, + { + "epoch": 0.56, + "learning_rate": 8.831501689254785e-08, + "loss": 0.0005, + "step": 28810 + }, + { + "epoch": 0.56, + "learning_rate": 8.831113354821171e-08, + "loss": 0.0006, + "step": 28811 + }, + { + "epoch": 0.56, + "learning_rate": 8.830725020387557e-08, + "loss": 0.0016, + "step": 28812 + }, + { + "epoch": 0.56, + "learning_rate": 8.830336685953943e-08, + "loss": 0.0007, + "step": 28813 + }, + { + "epoch": 0.56, + "learning_rate": 8.829948351520328e-08, + "loss": 0.0005, + "step": 28814 + }, + { + "epoch": 0.56, + "learning_rate": 8.829560017086714e-08, + "loss": 0.0005, + "step": 28815 + }, + { + "epoch": 0.56, + "learning_rate": 8.8291716826531e-08, + "loss": 0.0007, + "step": 28816 + }, + { + "epoch": 0.56, + "learning_rate": 8.828783348219486e-08, + "loss": 0.0004, + "step": 28817 + }, + { + "epoch": 0.56, + "learning_rate": 8.828395013785872e-08, + "loss": 0.0004, + "step": 28818 + }, + { + "epoch": 0.56, + "learning_rate": 8.828006679352258e-08, + "loss": 0.0047, + "step": 28819 + }, + { + "epoch": 0.56, + "learning_rate": 8.827618344918643e-08, + "loss": 0.0005, + "step": 28820 + }, + { + "epoch": 0.56, + "learning_rate": 8.827230010485029e-08, + "loss": 0.0007, + "step": 28821 + }, + { + "epoch": 0.56, + "learning_rate": 8.826841676051415e-08, + "loss": 0.0006, + "step": 28822 + }, + { + "epoch": 0.56, + "learning_rate": 8.826453341617801e-08, + "loss": 0.0011, + "step": 28823 + }, + { + "epoch": 0.56, + "learning_rate": 8.826065007184187e-08, + "loss": 0.0005, + "step": 28824 + }, + { + "epoch": 0.56, + "learning_rate": 8.825676672750572e-08, + "loss": 0.0004, + "step": 28825 + }, + { + "epoch": 0.56, + "learning_rate": 8.825288338316958e-08, + "loss": 0.0004, + "step": 28826 + }, + { + "epoch": 0.56, + "learning_rate": 8.824900003883344e-08, + "loss": 0.0009, + "step": 28827 + }, + { + "epoch": 0.56, + "learning_rate": 8.82451166944973e-08, + "loss": 0.0006, + "step": 28828 + }, + { + "epoch": 0.56, + "learning_rate": 8.824123335016116e-08, + "loss": 0.0008, + "step": 28829 + }, + { + "epoch": 0.56, + "learning_rate": 8.823735000582502e-08, + "loss": 0.0006, + "step": 28830 + }, + { + "epoch": 0.56, + "learning_rate": 8.823346666148887e-08, + "loss": 0.0006, + "step": 28831 + }, + { + "epoch": 0.56, + "learning_rate": 8.822958331715272e-08, + "loss": 0.0004, + "step": 28832 + }, + { + "epoch": 0.56, + "learning_rate": 8.822569997281658e-08, + "loss": 0.0008, + "step": 28833 + }, + { + "epoch": 0.56, + "learning_rate": 8.822181662848044e-08, + "loss": 0.0007, + "step": 28834 + }, + { + "epoch": 0.56, + "learning_rate": 8.82179332841443e-08, + "loss": 0.0004, + "step": 28835 + }, + { + "epoch": 0.56, + "learning_rate": 8.821404993980815e-08, + "loss": 0.0269, + "step": 28836 + }, + { + "epoch": 0.56, + "learning_rate": 8.821016659547201e-08, + "loss": 0.0004, + "step": 28837 + }, + { + "epoch": 0.56, + "learning_rate": 8.820628325113587e-08, + "loss": 0.3356, + "step": 28838 + }, + { + "epoch": 0.56, + "learning_rate": 8.820239990679973e-08, + "loss": 0.0008, + "step": 28839 + }, + { + "epoch": 0.56, + "learning_rate": 8.819851656246359e-08, + "loss": 0.0004, + "step": 28840 + }, + { + "epoch": 0.56, + "learning_rate": 8.819463321812744e-08, + "loss": 0.0005, + "step": 28841 + }, + { + "epoch": 0.56, + "learning_rate": 8.81907498737913e-08, + "loss": 0.001, + "step": 28842 + }, + { + "epoch": 0.56, + "learning_rate": 8.818686652945516e-08, + "loss": 0.0004, + "step": 28843 + }, + { + "epoch": 0.56, + "learning_rate": 8.818298318511902e-08, + "loss": 0.0006, + "step": 28844 + }, + { + "epoch": 0.56, + "learning_rate": 8.817909984078288e-08, + "loss": 0.0005, + "step": 28845 + }, + { + "epoch": 0.56, + "learning_rate": 8.817521649644673e-08, + "loss": 0.0012, + "step": 28846 + }, + { + "epoch": 0.56, + "learning_rate": 8.817133315211059e-08, + "loss": 0.0005, + "step": 28847 + }, + { + "epoch": 0.56, + "learning_rate": 8.816744980777445e-08, + "loss": 0.0008, + "step": 28848 + }, + { + "epoch": 0.56, + "learning_rate": 8.816356646343831e-08, + "loss": 0.0005, + "step": 28849 + }, + { + "epoch": 0.56, + "learning_rate": 8.815968311910217e-08, + "loss": 0.0051, + "step": 28850 + }, + { + "epoch": 0.56, + "learning_rate": 8.815579977476603e-08, + "loss": 0.0006, + "step": 28851 + }, + { + "epoch": 0.56, + "learning_rate": 8.815191643042988e-08, + "loss": 0.0004, + "step": 28852 + }, + { + "epoch": 0.56, + "learning_rate": 8.814803308609374e-08, + "loss": 0.0006, + "step": 28853 + }, + { + "epoch": 0.56, + "learning_rate": 8.81441497417576e-08, + "loss": 0.0005, + "step": 28854 + }, + { + "epoch": 0.56, + "learning_rate": 8.814026639742146e-08, + "loss": 0.0008, + "step": 28855 + }, + { + "epoch": 0.56, + "learning_rate": 8.813638305308532e-08, + "loss": 0.8654, + "step": 28856 + }, + { + "epoch": 0.56, + "learning_rate": 8.813249970874918e-08, + "loss": 0.0006, + "step": 28857 + }, + { + "epoch": 0.56, + "learning_rate": 8.812861636441303e-08, + "loss": 0.0006, + "step": 28858 + }, + { + "epoch": 0.56, + "learning_rate": 8.812473302007689e-08, + "loss": 0.0005, + "step": 28859 + }, + { + "epoch": 0.56, + "learning_rate": 8.812084967574075e-08, + "loss": 0.0007, + "step": 28860 + }, + { + "epoch": 0.56, + "learning_rate": 8.81169663314046e-08, + "loss": 0.0006, + "step": 28861 + }, + { + "epoch": 0.56, + "learning_rate": 8.811308298706845e-08, + "loss": 0.0008, + "step": 28862 + }, + { + "epoch": 0.56, + "learning_rate": 8.810919964273231e-08, + "loss": 0.0012, + "step": 28863 + }, + { + "epoch": 0.56, + "learning_rate": 8.810531629839617e-08, + "loss": 0.0005, + "step": 28864 + }, + { + "epoch": 0.56, + "learning_rate": 8.810143295406003e-08, + "loss": 0.0006, + "step": 28865 + }, + { + "epoch": 0.56, + "learning_rate": 8.809754960972389e-08, + "loss": 0.0005, + "step": 28866 + }, + { + "epoch": 0.56, + "learning_rate": 8.809366626538774e-08, + "loss": 0.3869, + "step": 28867 + }, + { + "epoch": 0.56, + "learning_rate": 8.80897829210516e-08, + "loss": 0.0005, + "step": 28868 + }, + { + "epoch": 0.56, + "learning_rate": 8.808589957671546e-08, + "loss": 0.0011, + "step": 28869 + }, + { + "epoch": 0.56, + "learning_rate": 8.808201623237932e-08, + "loss": 0.004, + "step": 28870 + }, + { + "epoch": 0.56, + "learning_rate": 8.807813288804318e-08, + "loss": 0.0085, + "step": 28871 + }, + { + "epoch": 0.56, + "learning_rate": 8.807424954370704e-08, + "loss": 0.0005, + "step": 28872 + }, + { + "epoch": 0.56, + "learning_rate": 8.80703661993709e-08, + "loss": 0.0007, + "step": 28873 + }, + { + "epoch": 0.56, + "learning_rate": 8.806648285503475e-08, + "loss": 0.0015, + "step": 28874 + }, + { + "epoch": 0.56, + "learning_rate": 8.806259951069861e-08, + "loss": 1.0803, + "step": 28875 + }, + { + "epoch": 0.56, + "learning_rate": 8.805871616636247e-08, + "loss": 0.0005, + "step": 28876 + }, + { + "epoch": 0.56, + "learning_rate": 8.805483282202633e-08, + "loss": 0.0008, + "step": 28877 + }, + { + "epoch": 0.56, + "learning_rate": 8.805094947769019e-08, + "loss": 0.0005, + "step": 28878 + }, + { + "epoch": 0.56, + "learning_rate": 8.804706613335404e-08, + "loss": 0.0003, + "step": 28879 + }, + { + "epoch": 0.56, + "learning_rate": 8.80431827890179e-08, + "loss": 0.0337, + "step": 28880 + }, + { + "epoch": 0.56, + "learning_rate": 8.803929944468176e-08, + "loss": 0.0004, + "step": 28881 + }, + { + "epoch": 0.56, + "learning_rate": 8.803541610034562e-08, + "loss": 0.0005, + "step": 28882 + }, + { + "epoch": 0.56, + "learning_rate": 8.803153275600948e-08, + "loss": 0.0005, + "step": 28883 + }, + { + "epoch": 0.56, + "learning_rate": 8.802764941167333e-08, + "loss": 0.0005, + "step": 28884 + }, + { + "epoch": 0.56, + "learning_rate": 8.802376606733719e-08, + "loss": 0.0024, + "step": 28885 + }, + { + "epoch": 0.56, + "learning_rate": 8.801988272300105e-08, + "loss": 0.0008, + "step": 28886 + }, + { + "epoch": 0.56, + "learning_rate": 8.801599937866491e-08, + "loss": 0.0009, + "step": 28887 + }, + { + "epoch": 0.56, + "learning_rate": 8.801211603432877e-08, + "loss": 0.0009, + "step": 28888 + }, + { + "epoch": 0.56, + "learning_rate": 8.800823268999263e-08, + "loss": 0.0004, + "step": 28889 + }, + { + "epoch": 0.56, + "learning_rate": 8.800434934565647e-08, + "loss": 0.0004, + "step": 28890 + }, + { + "epoch": 0.56, + "learning_rate": 8.800046600132033e-08, + "loss": 0.0005, + "step": 28891 + }, + { + "epoch": 0.56, + "learning_rate": 8.799658265698419e-08, + "loss": 0.0005, + "step": 28892 + }, + { + "epoch": 0.56, + "learning_rate": 8.799269931264805e-08, + "loss": 0.0004, + "step": 28893 + }, + { + "epoch": 0.56, + "learning_rate": 8.79888159683119e-08, + "loss": 0.0006, + "step": 28894 + }, + { + "epoch": 0.56, + "learning_rate": 8.798493262397576e-08, + "loss": 0.0012, + "step": 28895 + }, + { + "epoch": 0.56, + "learning_rate": 8.798104927963962e-08, + "loss": 0.0222, + "step": 28896 + }, + { + "epoch": 0.56, + "learning_rate": 8.797716593530348e-08, + "loss": 0.0007, + "step": 28897 + }, + { + "epoch": 0.56, + "learning_rate": 8.797328259096734e-08, + "loss": 0.0004, + "step": 28898 + }, + { + "epoch": 0.56, + "learning_rate": 8.79693992466312e-08, + "loss": 0.0004, + "step": 28899 + }, + { + "epoch": 0.56, + "learning_rate": 8.796551590229505e-08, + "loss": 0.0005, + "step": 28900 + }, + { + "epoch": 0.56, + "learning_rate": 8.796163255795891e-08, + "loss": 0.0007, + "step": 28901 + }, + { + "epoch": 0.56, + "learning_rate": 8.795774921362277e-08, + "loss": 0.0403, + "step": 28902 + }, + { + "epoch": 0.56, + "learning_rate": 8.795386586928663e-08, + "loss": 0.0344, + "step": 28903 + }, + { + "epoch": 0.56, + "learning_rate": 8.794998252495049e-08, + "loss": 0.0007, + "step": 28904 + }, + { + "epoch": 0.56, + "learning_rate": 8.794609918061434e-08, + "loss": 0.0005, + "step": 28905 + }, + { + "epoch": 0.56, + "learning_rate": 8.79422158362782e-08, + "loss": 0.0005, + "step": 28906 + }, + { + "epoch": 0.56, + "learning_rate": 8.793833249194206e-08, + "loss": 0.0005, + "step": 28907 + }, + { + "epoch": 0.56, + "learning_rate": 8.793444914760592e-08, + "loss": 0.0007, + "step": 28908 + }, + { + "epoch": 0.56, + "learning_rate": 8.793056580326978e-08, + "loss": 0.0748, + "step": 28909 + }, + { + "epoch": 0.56, + "learning_rate": 8.792668245893364e-08, + "loss": 0.0006, + "step": 28910 + }, + { + "epoch": 0.56, + "learning_rate": 8.79227991145975e-08, + "loss": 0.1431, + "step": 28911 + }, + { + "epoch": 0.56, + "learning_rate": 8.791891577026135e-08, + "loss": 0.3639, + "step": 28912 + }, + { + "epoch": 0.56, + "learning_rate": 8.791503242592521e-08, + "loss": 0.0005, + "step": 28913 + }, + { + "epoch": 0.56, + "learning_rate": 8.791114908158907e-08, + "loss": 0.0005, + "step": 28914 + }, + { + "epoch": 0.56, + "learning_rate": 8.790726573725293e-08, + "loss": 0.0004, + "step": 28915 + }, + { + "epoch": 0.56, + "learning_rate": 8.790338239291679e-08, + "loss": 0.0004, + "step": 28916 + }, + { + "epoch": 0.56, + "learning_rate": 8.789949904858064e-08, + "loss": 0.0006, + "step": 28917 + }, + { + "epoch": 0.56, + "learning_rate": 8.78956157042445e-08, + "loss": 0.0006, + "step": 28918 + }, + { + "epoch": 0.56, + "learning_rate": 8.789173235990835e-08, + "loss": 0.0919, + "step": 28919 + }, + { + "epoch": 0.56, + "learning_rate": 8.78878490155722e-08, + "loss": 0.0005, + "step": 28920 + }, + { + "epoch": 0.56, + "learning_rate": 8.788396567123606e-08, + "loss": 0.0266, + "step": 28921 + }, + { + "epoch": 0.56, + "learning_rate": 8.788008232689992e-08, + "loss": 0.7029, + "step": 28922 + }, + { + "epoch": 0.56, + "learning_rate": 8.787619898256378e-08, + "loss": 0.0006, + "step": 28923 + }, + { + "epoch": 0.56, + "learning_rate": 8.787231563822764e-08, + "loss": 0.0014, + "step": 28924 + }, + { + "epoch": 0.56, + "learning_rate": 8.78684322938915e-08, + "loss": 0.0004, + "step": 28925 + }, + { + "epoch": 0.56, + "learning_rate": 8.786454894955535e-08, + "loss": 0.3589, + "step": 28926 + }, + { + "epoch": 0.56, + "learning_rate": 8.786066560521921e-08, + "loss": 0.0004, + "step": 28927 + }, + { + "epoch": 0.56, + "learning_rate": 8.785678226088307e-08, + "loss": 0.0007, + "step": 28928 + }, + { + "epoch": 0.56, + "learning_rate": 8.785289891654693e-08, + "loss": 0.0006, + "step": 28929 + }, + { + "epoch": 0.56, + "learning_rate": 8.784901557221079e-08, + "loss": 0.0004, + "step": 28930 + }, + { + "epoch": 0.56, + "learning_rate": 8.784513222787465e-08, + "loss": 0.0005, + "step": 28931 + }, + { + "epoch": 0.56, + "learning_rate": 8.78412488835385e-08, + "loss": 0.0006, + "step": 28932 + }, + { + "epoch": 0.56, + "learning_rate": 8.783736553920236e-08, + "loss": 0.0005, + "step": 28933 + }, + { + "epoch": 0.56, + "learning_rate": 8.783348219486622e-08, + "loss": 0.0006, + "step": 28934 + }, + { + "epoch": 0.56, + "learning_rate": 8.782959885053008e-08, + "loss": 0.0539, + "step": 28935 + }, + { + "epoch": 0.56, + "learning_rate": 8.782571550619394e-08, + "loss": 0.0136, + "step": 28936 + }, + { + "epoch": 0.56, + "learning_rate": 8.78218321618578e-08, + "loss": 0.0004, + "step": 28937 + }, + { + "epoch": 0.56, + "learning_rate": 8.781794881752165e-08, + "loss": 0.0006, + "step": 28938 + }, + { + "epoch": 0.56, + "learning_rate": 8.781406547318551e-08, + "loss": 0.0006, + "step": 28939 + }, + { + "epoch": 0.56, + "learning_rate": 8.781018212884937e-08, + "loss": 0.0005, + "step": 28940 + }, + { + "epoch": 0.56, + "learning_rate": 8.780629878451323e-08, + "loss": 0.0005, + "step": 28941 + }, + { + "epoch": 0.56, + "learning_rate": 8.780241544017709e-08, + "loss": 0.0004, + "step": 28942 + }, + { + "epoch": 0.56, + "learning_rate": 8.779853209584093e-08, + "loss": 0.0005, + "step": 28943 + }, + { + "epoch": 0.56, + "learning_rate": 8.779464875150479e-08, + "loss": 0.0005, + "step": 28944 + }, + { + "epoch": 0.56, + "learning_rate": 8.779076540716865e-08, + "loss": 0.0007, + "step": 28945 + }, + { + "epoch": 0.56, + "learning_rate": 8.77868820628325e-08, + "loss": 0.0004, + "step": 28946 + }, + { + "epoch": 0.56, + "learning_rate": 8.778299871849636e-08, + "loss": 0.1396, + "step": 28947 + }, + { + "epoch": 0.56, + "learning_rate": 8.777911537416022e-08, + "loss": 0.0009, + "step": 28948 + }, + { + "epoch": 0.56, + "learning_rate": 8.777523202982408e-08, + "loss": 0.0386, + "step": 28949 + }, + { + "epoch": 0.56, + "learning_rate": 8.777134868548794e-08, + "loss": 0.0006, + "step": 28950 + }, + { + "epoch": 0.56, + "learning_rate": 8.77674653411518e-08, + "loss": 0.0004, + "step": 28951 + }, + { + "epoch": 0.56, + "learning_rate": 8.776358199681566e-08, + "loss": 0.0005, + "step": 28952 + }, + { + "epoch": 0.56, + "learning_rate": 8.775969865247951e-08, + "loss": 0.0005, + "step": 28953 + }, + { + "epoch": 0.56, + "learning_rate": 8.775581530814337e-08, + "loss": 0.0004, + "step": 28954 + }, + { + "epoch": 0.56, + "learning_rate": 8.775193196380723e-08, + "loss": 0.0006, + "step": 28955 + }, + { + "epoch": 0.56, + "learning_rate": 8.774804861947109e-08, + "loss": 0.0009, + "step": 28956 + }, + { + "epoch": 0.56, + "learning_rate": 8.774416527513495e-08, + "loss": 0.0009, + "step": 28957 + }, + { + "epoch": 0.56, + "learning_rate": 8.774028193079879e-08, + "loss": 0.0014, + "step": 28958 + }, + { + "epoch": 0.56, + "learning_rate": 8.773639858646265e-08, + "loss": 0.0004, + "step": 28959 + }, + { + "epoch": 0.56, + "learning_rate": 8.773251524212651e-08, + "loss": 0.0004, + "step": 28960 + }, + { + "epoch": 0.56, + "learning_rate": 8.772863189779037e-08, + "loss": 1.1964, + "step": 28961 + }, + { + "epoch": 0.56, + "learning_rate": 8.772474855345422e-08, + "loss": 0.7518, + "step": 28962 + }, + { + "epoch": 0.56, + "learning_rate": 8.772086520911808e-08, + "loss": 0.0005, + "step": 28963 + }, + { + "epoch": 0.56, + "learning_rate": 8.771698186478194e-08, + "loss": 0.0009, + "step": 28964 + }, + { + "epoch": 0.56, + "learning_rate": 8.77130985204458e-08, + "loss": 0.0004, + "step": 28965 + }, + { + "epoch": 0.56, + "learning_rate": 8.770921517610966e-08, + "loss": 0.0005, + "step": 28966 + }, + { + "epoch": 0.56, + "learning_rate": 8.770533183177352e-08, + "loss": 0.0005, + "step": 28967 + }, + { + "epoch": 0.56, + "learning_rate": 8.770144848743737e-08, + "loss": 0.0005, + "step": 28968 + }, + { + "epoch": 0.56, + "learning_rate": 8.769756514310123e-08, + "loss": 0.0005, + "step": 28969 + }, + { + "epoch": 0.56, + "learning_rate": 8.769368179876509e-08, + "loss": 0.0005, + "step": 28970 + }, + { + "epoch": 0.56, + "learning_rate": 8.768979845442895e-08, + "loss": 0.0006, + "step": 28971 + }, + { + "epoch": 0.56, + "learning_rate": 8.768591511009281e-08, + "loss": 0.8737, + "step": 28972 + }, + { + "epoch": 0.56, + "learning_rate": 8.768203176575667e-08, + "loss": 1.0576, + "step": 28973 + }, + { + "epoch": 0.56, + "learning_rate": 8.767814842142052e-08, + "loss": 0.0007, + "step": 28974 + }, + { + "epoch": 0.56, + "learning_rate": 8.767426507708438e-08, + "loss": 0.0004, + "step": 28975 + }, + { + "epoch": 0.56, + "learning_rate": 8.767038173274824e-08, + "loss": 0.0005, + "step": 28976 + }, + { + "epoch": 0.56, + "learning_rate": 8.766649838841209e-08, + "loss": 0.0006, + "step": 28977 + }, + { + "epoch": 0.56, + "learning_rate": 8.766261504407594e-08, + "loss": 0.0004, + "step": 28978 + }, + { + "epoch": 0.56, + "learning_rate": 8.76587316997398e-08, + "loss": 0.0005, + "step": 28979 + }, + { + "epoch": 0.56, + "learning_rate": 8.765484835540366e-08, + "loss": 1.2654, + "step": 28980 + }, + { + "epoch": 0.56, + "learning_rate": 8.765096501106752e-08, + "loss": 0.0008, + "step": 28981 + }, + { + "epoch": 0.56, + "learning_rate": 8.764708166673138e-08, + "loss": 0.0006, + "step": 28982 + }, + { + "epoch": 0.56, + "learning_rate": 8.764319832239523e-08, + "loss": 0.5205, + "step": 28983 + }, + { + "epoch": 0.56, + "learning_rate": 8.763931497805909e-08, + "loss": 0.0006, + "step": 28984 + }, + { + "epoch": 0.56, + "learning_rate": 8.763543163372295e-08, + "loss": 1.11, + "step": 28985 + }, + { + "epoch": 0.56, + "learning_rate": 8.763154828938681e-08, + "loss": 0.0005, + "step": 28986 + }, + { + "epoch": 0.56, + "learning_rate": 8.762766494505067e-08, + "loss": 0.1869, + "step": 28987 + }, + { + "epoch": 0.56, + "learning_rate": 8.762378160071453e-08, + "loss": 0.001, + "step": 28988 + }, + { + "epoch": 0.56, + "learning_rate": 8.761989825637838e-08, + "loss": 0.0007, + "step": 28989 + }, + { + "epoch": 0.56, + "learning_rate": 8.761601491204224e-08, + "loss": 0.0036, + "step": 28990 + }, + { + "epoch": 0.56, + "learning_rate": 8.76121315677061e-08, + "loss": 0.0005, + "step": 28991 + }, + { + "epoch": 0.56, + "learning_rate": 8.760824822336996e-08, + "loss": 0.0992, + "step": 28992 + }, + { + "epoch": 0.56, + "learning_rate": 8.760436487903382e-08, + "loss": 0.0005, + "step": 28993 + }, + { + "epoch": 0.56, + "learning_rate": 8.760048153469768e-08, + "loss": 0.0007, + "step": 28994 + }, + { + "epoch": 0.56, + "learning_rate": 8.759659819036153e-08, + "loss": 0.0007, + "step": 28995 + }, + { + "epoch": 0.56, + "learning_rate": 8.759271484602539e-08, + "loss": 0.0006, + "step": 28996 + }, + { + "epoch": 0.56, + "learning_rate": 8.758883150168925e-08, + "loss": 0.0005, + "step": 28997 + }, + { + "epoch": 0.56, + "learning_rate": 8.758494815735311e-08, + "loss": 0.0004, + "step": 28998 + }, + { + "epoch": 0.56, + "learning_rate": 8.758106481301697e-08, + "loss": 0.0008, + "step": 28999 + }, + { + "epoch": 0.56, + "learning_rate": 8.757718146868083e-08, + "loss": 0.0007, + "step": 29000 + }, + { + "epoch": 0.56, + "learning_rate": 8.757329812434468e-08, + "loss": 0.0006, + "step": 29001 + }, + { + "epoch": 0.56, + "learning_rate": 8.756941478000854e-08, + "loss": 0.0007, + "step": 29002 + }, + { + "epoch": 0.56, + "learning_rate": 8.75655314356724e-08, + "loss": 0.0005, + "step": 29003 + }, + { + "epoch": 0.56, + "learning_rate": 8.756164809133626e-08, + "loss": 0.0005, + "step": 29004 + }, + { + "epoch": 0.56, + "learning_rate": 8.755776474700012e-08, + "loss": 0.0005, + "step": 29005 + }, + { + "epoch": 0.56, + "learning_rate": 8.755388140266396e-08, + "loss": 0.0005, + "step": 29006 + }, + { + "epoch": 0.56, + "learning_rate": 8.754999805832782e-08, + "loss": 0.0007, + "step": 29007 + }, + { + "epoch": 0.56, + "learning_rate": 8.754611471399168e-08, + "loss": 0.0005, + "step": 29008 + }, + { + "epoch": 0.56, + "learning_rate": 8.754223136965554e-08, + "loss": 0.0006, + "step": 29009 + }, + { + "epoch": 0.56, + "learning_rate": 8.75383480253194e-08, + "loss": 0.0005, + "step": 29010 + }, + { + "epoch": 0.56, + "learning_rate": 8.753446468098325e-08, + "loss": 0.0084, + "step": 29011 + }, + { + "epoch": 0.56, + "learning_rate": 8.753058133664711e-08, + "loss": 0.0006, + "step": 29012 + }, + { + "epoch": 0.56, + "learning_rate": 8.752669799231097e-08, + "loss": 0.0005, + "step": 29013 + }, + { + "epoch": 0.56, + "learning_rate": 8.752281464797483e-08, + "loss": 0.0005, + "step": 29014 + }, + { + "epoch": 0.56, + "learning_rate": 8.751893130363869e-08, + "loss": 0.0007, + "step": 29015 + }, + { + "epoch": 0.56, + "learning_rate": 8.751504795930254e-08, + "loss": 0.0005, + "step": 29016 + }, + { + "epoch": 0.56, + "learning_rate": 8.75111646149664e-08, + "loss": 0.0005, + "step": 29017 + }, + { + "epoch": 0.56, + "learning_rate": 8.750728127063026e-08, + "loss": 1.307, + "step": 29018 + }, + { + "epoch": 0.56, + "learning_rate": 8.750339792629412e-08, + "loss": 0.0004, + "step": 29019 + }, + { + "epoch": 0.56, + "learning_rate": 8.749951458195798e-08, + "loss": 0.0006, + "step": 29020 + }, + { + "epoch": 0.56, + "learning_rate": 8.749563123762183e-08, + "loss": 0.0006, + "step": 29021 + }, + { + "epoch": 0.56, + "learning_rate": 8.749174789328569e-08, + "loss": 0.0005, + "step": 29022 + }, + { + "epoch": 0.56, + "learning_rate": 8.748786454894955e-08, + "loss": 0.002, + "step": 29023 + }, + { + "epoch": 0.56, + "learning_rate": 8.748398120461341e-08, + "loss": 0.0005, + "step": 29024 + }, + { + "epoch": 0.56, + "learning_rate": 8.748009786027727e-08, + "loss": 0.0005, + "step": 29025 + }, + { + "epoch": 0.56, + "learning_rate": 8.747621451594113e-08, + "loss": 0.0005, + "step": 29026 + }, + { + "epoch": 0.56, + "learning_rate": 8.747233117160498e-08, + "loss": 0.1903, + "step": 29027 + }, + { + "epoch": 0.56, + "learning_rate": 8.746844782726884e-08, + "loss": 0.0091, + "step": 29028 + }, + { + "epoch": 0.56, + "learning_rate": 8.74645644829327e-08, + "loss": 0.0006, + "step": 29029 + }, + { + "epoch": 0.56, + "learning_rate": 8.746068113859656e-08, + "loss": 0.4367, + "step": 29030 + }, + { + "epoch": 0.56, + "learning_rate": 8.745679779426042e-08, + "loss": 0.0006, + "step": 29031 + }, + { + "epoch": 0.56, + "learning_rate": 8.745291444992428e-08, + "loss": 0.0011, + "step": 29032 + }, + { + "epoch": 0.56, + "learning_rate": 8.744903110558813e-08, + "loss": 0.0008, + "step": 29033 + }, + { + "epoch": 0.56, + "learning_rate": 8.744514776125199e-08, + "loss": 0.0005, + "step": 29034 + }, + { + "epoch": 0.56, + "learning_rate": 8.744126441691584e-08, + "loss": 0.0005, + "step": 29035 + }, + { + "epoch": 0.56, + "learning_rate": 8.74373810725797e-08, + "loss": 0.0005, + "step": 29036 + }, + { + "epoch": 0.56, + "learning_rate": 8.743349772824355e-08, + "loss": 0.0068, + "step": 29037 + }, + { + "epoch": 0.56, + "learning_rate": 8.742961438390741e-08, + "loss": 0.0043, + "step": 29038 + }, + { + "epoch": 0.56, + "learning_rate": 8.742573103957127e-08, + "loss": 0.0005, + "step": 29039 + }, + { + "epoch": 0.56, + "learning_rate": 8.742184769523513e-08, + "loss": 0.0376, + "step": 29040 + }, + { + "epoch": 0.56, + "learning_rate": 8.741796435089899e-08, + "loss": 0.0004, + "step": 29041 + }, + { + "epoch": 0.56, + "learning_rate": 8.741408100656284e-08, + "loss": 0.0008, + "step": 29042 + }, + { + "epoch": 0.56, + "learning_rate": 8.74101976622267e-08, + "loss": 0.0005, + "step": 29043 + }, + { + "epoch": 0.56, + "learning_rate": 8.740631431789056e-08, + "loss": 0.0004, + "step": 29044 + }, + { + "epoch": 0.56, + "learning_rate": 8.740243097355442e-08, + "loss": 0.0004, + "step": 29045 + }, + { + "epoch": 0.56, + "learning_rate": 8.739854762921828e-08, + "loss": 0.0006, + "step": 29046 + }, + { + "epoch": 0.56, + "learning_rate": 8.739466428488214e-08, + "loss": 1.0511, + "step": 29047 + }, + { + "epoch": 0.56, + "learning_rate": 8.7390780940546e-08, + "loss": 0.0017, + "step": 29048 + }, + { + "epoch": 0.56, + "learning_rate": 8.738689759620985e-08, + "loss": 0.0011, + "step": 29049 + }, + { + "epoch": 0.56, + "learning_rate": 8.738301425187371e-08, + "loss": 0.0017, + "step": 29050 + }, + { + "epoch": 0.56, + "learning_rate": 8.737913090753757e-08, + "loss": 0.0004, + "step": 29051 + }, + { + "epoch": 0.56, + "learning_rate": 8.737524756320143e-08, + "loss": 0.0009, + "step": 29052 + }, + { + "epoch": 0.56, + "learning_rate": 8.737136421886529e-08, + "loss": 0.0007, + "step": 29053 + }, + { + "epoch": 0.56, + "learning_rate": 8.736748087452914e-08, + "loss": 0.0059, + "step": 29054 + }, + { + "epoch": 0.56, + "learning_rate": 8.7363597530193e-08, + "loss": 0.0014, + "step": 29055 + }, + { + "epoch": 0.56, + "learning_rate": 8.735971418585686e-08, + "loss": 0.0007, + "step": 29056 + }, + { + "epoch": 0.56, + "learning_rate": 8.735583084152072e-08, + "loss": 0.0007, + "step": 29057 + }, + { + "epoch": 0.56, + "learning_rate": 8.735194749718458e-08, + "loss": 0.0007, + "step": 29058 + }, + { + "epoch": 0.56, + "learning_rate": 8.734806415284843e-08, + "loss": 0.0042, + "step": 29059 + }, + { + "epoch": 0.56, + "learning_rate": 8.734418080851229e-08, + "loss": 0.0004, + "step": 29060 + }, + { + "epoch": 0.56, + "learning_rate": 8.734029746417615e-08, + "loss": 0.0004, + "step": 29061 + }, + { + "epoch": 0.56, + "learning_rate": 8.733641411984001e-08, + "loss": 0.6946, + "step": 29062 + }, + { + "epoch": 0.56, + "learning_rate": 8.733253077550387e-08, + "loss": 0.0003, + "step": 29063 + }, + { + "epoch": 0.56, + "learning_rate": 8.732864743116771e-08, + "loss": 0.0006, + "step": 29064 + }, + { + "epoch": 0.56, + "learning_rate": 8.732476408683157e-08, + "loss": 0.0005, + "step": 29065 + }, + { + "epoch": 0.56, + "learning_rate": 8.732088074249543e-08, + "loss": 0.0005, + "step": 29066 + }, + { + "epoch": 0.56, + "learning_rate": 8.731699739815929e-08, + "loss": 0.0005, + "step": 29067 + }, + { + "epoch": 0.56, + "learning_rate": 8.731311405382315e-08, + "loss": 0.0006, + "step": 29068 + }, + { + "epoch": 0.56, + "learning_rate": 8.7309230709487e-08, + "loss": 0.0005, + "step": 29069 + }, + { + "epoch": 0.56, + "learning_rate": 8.730534736515086e-08, + "loss": 0.0008, + "step": 29070 + }, + { + "epoch": 0.56, + "learning_rate": 8.730146402081472e-08, + "loss": 0.0008, + "step": 29071 + }, + { + "epoch": 0.56, + "learning_rate": 8.729758067647858e-08, + "loss": 0.714, + "step": 29072 + }, + { + "epoch": 0.56, + "learning_rate": 8.729369733214244e-08, + "loss": 0.0005, + "step": 29073 + }, + { + "epoch": 0.56, + "learning_rate": 8.72898139878063e-08, + "loss": 0.0006, + "step": 29074 + }, + { + "epoch": 0.56, + "learning_rate": 8.728593064347015e-08, + "loss": 0.0005, + "step": 29075 + }, + { + "epoch": 0.56, + "learning_rate": 8.728204729913401e-08, + "loss": 0.057, + "step": 29076 + }, + { + "epoch": 0.56, + "learning_rate": 8.727816395479787e-08, + "loss": 0.0004, + "step": 29077 + }, + { + "epoch": 0.56, + "learning_rate": 8.727428061046173e-08, + "loss": 0.0033, + "step": 29078 + }, + { + "epoch": 0.56, + "learning_rate": 8.727039726612559e-08, + "loss": 0.0005, + "step": 29079 + }, + { + "epoch": 0.56, + "learning_rate": 8.726651392178944e-08, + "loss": 0.0004, + "step": 29080 + }, + { + "epoch": 0.56, + "learning_rate": 8.72626305774533e-08, + "loss": 0.495, + "step": 29081 + }, + { + "epoch": 0.56, + "learning_rate": 8.725874723311716e-08, + "loss": 0.0008, + "step": 29082 + }, + { + "epoch": 0.56, + "learning_rate": 8.725486388878102e-08, + "loss": 0.0006, + "step": 29083 + }, + { + "epoch": 0.56, + "learning_rate": 8.725098054444488e-08, + "loss": 0.0008, + "step": 29084 + }, + { + "epoch": 0.56, + "learning_rate": 8.724709720010874e-08, + "loss": 0.0004, + "step": 29085 + }, + { + "epoch": 0.56, + "learning_rate": 8.72432138557726e-08, + "loss": 0.0004, + "step": 29086 + }, + { + "epoch": 0.56, + "learning_rate": 8.723933051143645e-08, + "loss": 0.0069, + "step": 29087 + }, + { + "epoch": 0.56, + "learning_rate": 8.723544716710031e-08, + "loss": 0.0055, + "step": 29088 + }, + { + "epoch": 0.56, + "learning_rate": 8.723156382276417e-08, + "loss": 0.0004, + "step": 29089 + }, + { + "epoch": 0.56, + "learning_rate": 8.722768047842803e-08, + "loss": 0.0004, + "step": 29090 + }, + { + "epoch": 0.56, + "learning_rate": 8.722379713409189e-08, + "loss": 0.0006, + "step": 29091 + }, + { + "epoch": 0.56, + "learning_rate": 8.721991378975574e-08, + "loss": 0.001, + "step": 29092 + }, + { + "epoch": 0.56, + "learning_rate": 8.721603044541959e-08, + "loss": 0.0005, + "step": 29093 + }, + { + "epoch": 0.56, + "learning_rate": 8.721214710108345e-08, + "loss": 0.0005, + "step": 29094 + }, + { + "epoch": 0.56, + "learning_rate": 8.72082637567473e-08, + "loss": 0.0009, + "step": 29095 + }, + { + "epoch": 0.56, + "learning_rate": 8.720438041241116e-08, + "loss": 0.0006, + "step": 29096 + }, + { + "epoch": 0.56, + "learning_rate": 8.720049706807502e-08, + "loss": 0.0005, + "step": 29097 + }, + { + "epoch": 0.56, + "learning_rate": 8.719661372373888e-08, + "loss": 0.0006, + "step": 29098 + }, + { + "epoch": 0.56, + "learning_rate": 8.719273037940274e-08, + "loss": 0.0014, + "step": 29099 + }, + { + "epoch": 0.56, + "learning_rate": 8.71888470350666e-08, + "loss": 0.029, + "step": 29100 + }, + { + "epoch": 0.56, + "learning_rate": 8.718496369073045e-08, + "loss": 0.0818, + "step": 29101 + }, + { + "epoch": 0.56, + "learning_rate": 8.718108034639431e-08, + "loss": 0.0005, + "step": 29102 + }, + { + "epoch": 0.56, + "learning_rate": 8.717719700205817e-08, + "loss": 0.0004, + "step": 29103 + }, + { + "epoch": 0.56, + "learning_rate": 8.717331365772203e-08, + "loss": 0.0006, + "step": 29104 + }, + { + "epoch": 0.56, + "learning_rate": 8.716943031338589e-08, + "loss": 0.0006, + "step": 29105 + }, + { + "epoch": 0.56, + "learning_rate": 8.716554696904975e-08, + "loss": 0.0004, + "step": 29106 + }, + { + "epoch": 0.56, + "learning_rate": 8.71616636247136e-08, + "loss": 0.0006, + "step": 29107 + }, + { + "epoch": 0.56, + "learning_rate": 8.715778028037746e-08, + "loss": 0.001, + "step": 29108 + }, + { + "epoch": 0.56, + "learning_rate": 8.715389693604132e-08, + "loss": 0.0005, + "step": 29109 + }, + { + "epoch": 0.56, + "learning_rate": 8.715001359170518e-08, + "loss": 0.0005, + "step": 29110 + }, + { + "epoch": 0.56, + "learning_rate": 8.714613024736904e-08, + "loss": 0.4538, + "step": 29111 + }, + { + "epoch": 0.56, + "learning_rate": 8.71422469030329e-08, + "loss": 0.0006, + "step": 29112 + }, + { + "epoch": 0.56, + "learning_rate": 8.713836355869675e-08, + "loss": 0.0006, + "step": 29113 + }, + { + "epoch": 0.56, + "learning_rate": 8.713448021436061e-08, + "loss": 0.0006, + "step": 29114 + }, + { + "epoch": 0.56, + "learning_rate": 8.713059687002447e-08, + "loss": 0.5452, + "step": 29115 + }, + { + "epoch": 0.56, + "learning_rate": 8.712671352568833e-08, + "loss": 0.001, + "step": 29116 + }, + { + "epoch": 0.56, + "learning_rate": 8.712283018135219e-08, + "loss": 0.0004, + "step": 29117 + }, + { + "epoch": 0.56, + "learning_rate": 8.711894683701604e-08, + "loss": 0.0023, + "step": 29118 + }, + { + "epoch": 0.56, + "learning_rate": 8.71150634926799e-08, + "loss": 0.0006, + "step": 29119 + }, + { + "epoch": 0.56, + "learning_rate": 8.711118014834375e-08, + "loss": 0.0005, + "step": 29120 + }, + { + "epoch": 0.56, + "learning_rate": 8.71072968040076e-08, + "loss": 0.0006, + "step": 29121 + }, + { + "epoch": 0.56, + "learning_rate": 8.710341345967146e-08, + "loss": 0.0003, + "step": 29122 + }, + { + "epoch": 0.56, + "learning_rate": 8.709953011533532e-08, + "loss": 0.0004, + "step": 29123 + }, + { + "epoch": 0.56, + "learning_rate": 8.709564677099918e-08, + "loss": 0.0514, + "step": 29124 + }, + { + "epoch": 0.56, + "learning_rate": 8.709176342666304e-08, + "loss": 0.0174, + "step": 29125 + }, + { + "epoch": 0.56, + "learning_rate": 8.70878800823269e-08, + "loss": 0.0009, + "step": 29126 + }, + { + "epoch": 0.57, + "learning_rate": 8.708399673799076e-08, + "loss": 0.001, + "step": 29127 + }, + { + "epoch": 0.57, + "learning_rate": 8.708011339365461e-08, + "loss": 0.0009, + "step": 29128 + }, + { + "epoch": 0.57, + "learning_rate": 8.707623004931847e-08, + "loss": 0.0004, + "step": 29129 + }, + { + "epoch": 0.57, + "learning_rate": 8.707234670498233e-08, + "loss": 0.0309, + "step": 29130 + }, + { + "epoch": 0.57, + "learning_rate": 8.706846336064619e-08, + "loss": 0.0004, + "step": 29131 + }, + { + "epoch": 0.57, + "learning_rate": 8.706458001631005e-08, + "loss": 0.0075, + "step": 29132 + }, + { + "epoch": 0.57, + "learning_rate": 8.70606966719739e-08, + "loss": 0.0009, + "step": 29133 + }, + { + "epoch": 0.57, + "learning_rate": 8.705681332763776e-08, + "loss": 0.316, + "step": 29134 + }, + { + "epoch": 0.57, + "learning_rate": 8.705292998330161e-08, + "loss": 0.0006, + "step": 29135 + }, + { + "epoch": 0.57, + "learning_rate": 8.704904663896547e-08, + "loss": 0.0004, + "step": 29136 + }, + { + "epoch": 0.57, + "learning_rate": 8.704516329462933e-08, + "loss": 0.8939, + "step": 29137 + }, + { + "epoch": 0.57, + "learning_rate": 8.704127995029318e-08, + "loss": 0.0009, + "step": 29138 + }, + { + "epoch": 0.57, + "learning_rate": 8.703739660595704e-08, + "loss": 0.0009, + "step": 29139 + }, + { + "epoch": 0.57, + "learning_rate": 8.70335132616209e-08, + "loss": 0.0005, + "step": 29140 + }, + { + "epoch": 0.57, + "learning_rate": 8.702962991728476e-08, + "loss": 1.529, + "step": 29141 + }, + { + "epoch": 0.57, + "learning_rate": 8.702574657294862e-08, + "loss": 0.005, + "step": 29142 + }, + { + "epoch": 0.57, + "learning_rate": 8.702186322861247e-08, + "loss": 0.0004, + "step": 29143 + }, + { + "epoch": 0.57, + "learning_rate": 8.701797988427633e-08, + "loss": 0.0006, + "step": 29144 + }, + { + "epoch": 0.57, + "learning_rate": 8.701409653994019e-08, + "loss": 0.0007, + "step": 29145 + }, + { + "epoch": 0.57, + "learning_rate": 8.701021319560405e-08, + "loss": 0.0017, + "step": 29146 + }, + { + "epoch": 0.57, + "learning_rate": 8.700632985126791e-08, + "loss": 0.0006, + "step": 29147 + }, + { + "epoch": 0.57, + "learning_rate": 8.700244650693177e-08, + "loss": 0.0005, + "step": 29148 + }, + { + "epoch": 0.57, + "learning_rate": 8.699856316259562e-08, + "loss": 0.0006, + "step": 29149 + }, + { + "epoch": 0.57, + "learning_rate": 8.699467981825948e-08, + "loss": 0.0005, + "step": 29150 + }, + { + "epoch": 0.57, + "learning_rate": 8.699079647392333e-08, + "loss": 0.009, + "step": 29151 + }, + { + "epoch": 0.57, + "learning_rate": 8.698691312958719e-08, + "loss": 0.0006, + "step": 29152 + }, + { + "epoch": 0.57, + "learning_rate": 8.698302978525104e-08, + "loss": 0.0004, + "step": 29153 + }, + { + "epoch": 0.57, + "learning_rate": 8.69791464409149e-08, + "loss": 1.1463, + "step": 29154 + }, + { + "epoch": 0.57, + "learning_rate": 8.697526309657876e-08, + "loss": 0.0005, + "step": 29155 + }, + { + "epoch": 0.57, + "learning_rate": 8.697137975224262e-08, + "loss": 0.0004, + "step": 29156 + }, + { + "epoch": 0.57, + "learning_rate": 8.696749640790648e-08, + "loss": 0.0005, + "step": 29157 + }, + { + "epoch": 0.57, + "learning_rate": 8.696361306357033e-08, + "loss": 0.0014, + "step": 29158 + }, + { + "epoch": 0.57, + "learning_rate": 8.695972971923419e-08, + "loss": 0.0005, + "step": 29159 + }, + { + "epoch": 0.57, + "learning_rate": 8.695584637489805e-08, + "loss": 0.6284, + "step": 29160 + }, + { + "epoch": 0.57, + "learning_rate": 8.695196303056191e-08, + "loss": 0.4498, + "step": 29161 + }, + { + "epoch": 0.57, + "learning_rate": 8.694807968622577e-08, + "loss": 0.0004, + "step": 29162 + }, + { + "epoch": 0.57, + "learning_rate": 8.694419634188963e-08, + "loss": 0.0006, + "step": 29163 + }, + { + "epoch": 0.57, + "learning_rate": 8.694031299755348e-08, + "loss": 0.0004, + "step": 29164 + }, + { + "epoch": 0.57, + "learning_rate": 8.693642965321734e-08, + "loss": 0.0005, + "step": 29165 + }, + { + "epoch": 0.57, + "learning_rate": 8.69325463088812e-08, + "loss": 0.0009, + "step": 29166 + }, + { + "epoch": 0.57, + "learning_rate": 8.692866296454506e-08, + "loss": 0.0005, + "step": 29167 + }, + { + "epoch": 0.57, + "learning_rate": 8.692477962020892e-08, + "loss": 0.0394, + "step": 29168 + }, + { + "epoch": 0.57, + "learning_rate": 8.692089627587278e-08, + "loss": 0.0006, + "step": 29169 + }, + { + "epoch": 0.57, + "learning_rate": 8.691701293153663e-08, + "loss": 0.0005, + "step": 29170 + }, + { + "epoch": 0.57, + "learning_rate": 8.691312958720049e-08, + "loss": 0.0031, + "step": 29171 + }, + { + "epoch": 0.57, + "learning_rate": 8.690924624286435e-08, + "loss": 0.0006, + "step": 29172 + }, + { + "epoch": 0.57, + "learning_rate": 8.690536289852821e-08, + "loss": 0.491, + "step": 29173 + }, + { + "epoch": 0.57, + "learning_rate": 8.690147955419207e-08, + "loss": 0.0008, + "step": 29174 + }, + { + "epoch": 0.57, + "learning_rate": 8.689759620985593e-08, + "loss": 0.0006, + "step": 29175 + }, + { + "epoch": 0.57, + "learning_rate": 8.689371286551978e-08, + "loss": 0.0344, + "step": 29176 + }, + { + "epoch": 0.57, + "learning_rate": 8.688982952118364e-08, + "loss": 0.0007, + "step": 29177 + }, + { + "epoch": 0.57, + "learning_rate": 8.68859461768475e-08, + "loss": 0.0004, + "step": 29178 + }, + { + "epoch": 0.57, + "learning_rate": 8.688206283251136e-08, + "loss": 0.0004, + "step": 29179 + }, + { + "epoch": 0.57, + "learning_rate": 8.68781794881752e-08, + "loss": 0.0015, + "step": 29180 + }, + { + "epoch": 0.57, + "learning_rate": 8.687429614383906e-08, + "loss": 0.0009, + "step": 29181 + }, + { + "epoch": 0.57, + "learning_rate": 8.687041279950292e-08, + "loss": 0.0007, + "step": 29182 + }, + { + "epoch": 0.57, + "learning_rate": 8.686652945516678e-08, + "loss": 0.6985, + "step": 29183 + }, + { + "epoch": 0.57, + "learning_rate": 8.686264611083064e-08, + "loss": 0.0009, + "step": 29184 + }, + { + "epoch": 0.57, + "learning_rate": 8.68587627664945e-08, + "loss": 0.0006, + "step": 29185 + }, + { + "epoch": 0.57, + "learning_rate": 8.685487942215835e-08, + "loss": 0.0005, + "step": 29186 + }, + { + "epoch": 0.57, + "learning_rate": 8.685099607782221e-08, + "loss": 0.0004, + "step": 29187 + }, + { + "epoch": 0.57, + "learning_rate": 8.684711273348607e-08, + "loss": 0.0006, + "step": 29188 + }, + { + "epoch": 0.57, + "learning_rate": 8.684322938914993e-08, + "loss": 0.0004, + "step": 29189 + }, + { + "epoch": 0.57, + "learning_rate": 8.683934604481379e-08, + "loss": 0.0006, + "step": 29190 + }, + { + "epoch": 0.57, + "learning_rate": 8.683546270047764e-08, + "loss": 0.002, + "step": 29191 + }, + { + "epoch": 0.57, + "learning_rate": 8.68315793561415e-08, + "loss": 1.176, + "step": 29192 + }, + { + "epoch": 0.57, + "learning_rate": 8.682769601180536e-08, + "loss": 0.0006, + "step": 29193 + }, + { + "epoch": 0.57, + "learning_rate": 8.682381266746922e-08, + "loss": 0.0005, + "step": 29194 + }, + { + "epoch": 0.57, + "learning_rate": 8.681992932313308e-08, + "loss": 0.0004, + "step": 29195 + }, + { + "epoch": 0.57, + "learning_rate": 8.681604597879694e-08, + "loss": 0.0006, + "step": 29196 + }, + { + "epoch": 0.57, + "learning_rate": 8.681216263446079e-08, + "loss": 0.0005, + "step": 29197 + }, + { + "epoch": 0.57, + "learning_rate": 8.680827929012465e-08, + "loss": 0.0005, + "step": 29198 + }, + { + "epoch": 0.57, + "learning_rate": 8.680439594578851e-08, + "loss": 0.6196, + "step": 29199 + }, + { + "epoch": 0.57, + "learning_rate": 8.680051260145237e-08, + "loss": 0.0027, + "step": 29200 + }, + { + "epoch": 0.57, + "learning_rate": 8.679662925711623e-08, + "loss": 0.0005, + "step": 29201 + }, + { + "epoch": 0.57, + "learning_rate": 8.679274591278008e-08, + "loss": 0.0005, + "step": 29202 + }, + { + "epoch": 0.57, + "learning_rate": 8.678886256844394e-08, + "loss": 0.5295, + "step": 29203 + }, + { + "epoch": 0.57, + "learning_rate": 8.67849792241078e-08, + "loss": 0.0006, + "step": 29204 + }, + { + "epoch": 0.57, + "learning_rate": 8.678109587977166e-08, + "loss": 0.0194, + "step": 29205 + }, + { + "epoch": 0.57, + "learning_rate": 8.677721253543552e-08, + "loss": 0.0005, + "step": 29206 + }, + { + "epoch": 0.57, + "learning_rate": 8.677332919109938e-08, + "loss": 0.0008, + "step": 29207 + }, + { + "epoch": 0.57, + "learning_rate": 8.676944584676323e-08, + "loss": 0.0007, + "step": 29208 + }, + { + "epoch": 0.57, + "learning_rate": 8.676556250242708e-08, + "loss": 0.0006, + "step": 29209 + }, + { + "epoch": 0.57, + "learning_rate": 8.676167915809094e-08, + "loss": 0.0015, + "step": 29210 + }, + { + "epoch": 0.57, + "learning_rate": 8.67577958137548e-08, + "loss": 0.0006, + "step": 29211 + }, + { + "epoch": 0.57, + "learning_rate": 8.675391246941865e-08, + "loss": 0.0006, + "step": 29212 + }, + { + "epoch": 0.57, + "learning_rate": 8.675002912508251e-08, + "loss": 0.0005, + "step": 29213 + }, + { + "epoch": 0.57, + "learning_rate": 8.674614578074637e-08, + "loss": 0.9787, + "step": 29214 + }, + { + "epoch": 0.57, + "learning_rate": 8.674226243641023e-08, + "loss": 0.0007, + "step": 29215 + }, + { + "epoch": 0.57, + "learning_rate": 8.673837909207409e-08, + "loss": 0.0007, + "step": 29216 + }, + { + "epoch": 0.57, + "learning_rate": 8.673449574773794e-08, + "loss": 0.0006, + "step": 29217 + }, + { + "epoch": 0.57, + "learning_rate": 8.67306124034018e-08, + "loss": 0.3657, + "step": 29218 + }, + { + "epoch": 0.57, + "learning_rate": 8.672672905906566e-08, + "loss": 0.0183, + "step": 29219 + }, + { + "epoch": 0.57, + "learning_rate": 8.672284571472952e-08, + "loss": 0.0006, + "step": 29220 + }, + { + "epoch": 0.57, + "learning_rate": 8.671896237039338e-08, + "loss": 0.0009, + "step": 29221 + }, + { + "epoch": 0.57, + "learning_rate": 8.671507902605724e-08, + "loss": 0.0007, + "step": 29222 + }, + { + "epoch": 0.57, + "learning_rate": 8.67111956817211e-08, + "loss": 0.0009, + "step": 29223 + }, + { + "epoch": 0.57, + "learning_rate": 8.670731233738495e-08, + "loss": 0.0005, + "step": 29224 + }, + { + "epoch": 0.57, + "learning_rate": 8.670342899304881e-08, + "loss": 0.0006, + "step": 29225 + }, + { + "epoch": 0.57, + "learning_rate": 8.669954564871267e-08, + "loss": 0.0004, + "step": 29226 + }, + { + "epoch": 0.57, + "learning_rate": 8.669566230437653e-08, + "loss": 0.0004, + "step": 29227 + }, + { + "epoch": 0.57, + "learning_rate": 8.669177896004039e-08, + "loss": 0.0006, + "step": 29228 + }, + { + "epoch": 0.57, + "learning_rate": 8.668789561570424e-08, + "loss": 0.0029, + "step": 29229 + }, + { + "epoch": 0.57, + "learning_rate": 8.66840122713681e-08, + "loss": 0.0005, + "step": 29230 + }, + { + "epoch": 0.57, + "learning_rate": 8.668012892703196e-08, + "loss": 0.0006, + "step": 29231 + }, + { + "epoch": 0.57, + "learning_rate": 8.667624558269582e-08, + "loss": 0.0006, + "step": 29232 + }, + { + "epoch": 0.57, + "learning_rate": 8.667236223835968e-08, + "loss": 0.001, + "step": 29233 + }, + { + "epoch": 0.57, + "learning_rate": 8.666847889402354e-08, + "loss": 0.0003, + "step": 29234 + }, + { + "epoch": 0.57, + "learning_rate": 8.666459554968739e-08, + "loss": 0.0004, + "step": 29235 + }, + { + "epoch": 0.57, + "learning_rate": 8.666071220535125e-08, + "loss": 0.0005, + "step": 29236 + }, + { + "epoch": 0.57, + "learning_rate": 8.665682886101511e-08, + "loss": 0.0005, + "step": 29237 + }, + { + "epoch": 0.57, + "learning_rate": 8.665294551667895e-08, + "loss": 0.0005, + "step": 29238 + }, + { + "epoch": 0.57, + "learning_rate": 8.664906217234281e-08, + "loss": 0.0004, + "step": 29239 + }, + { + "epoch": 0.57, + "learning_rate": 8.664517882800667e-08, + "loss": 0.0006, + "step": 29240 + }, + { + "epoch": 0.57, + "learning_rate": 8.664129548367053e-08, + "loss": 0.0005, + "step": 29241 + }, + { + "epoch": 0.57, + "learning_rate": 8.663741213933439e-08, + "loss": 0.0009, + "step": 29242 + }, + { + "epoch": 0.57, + "learning_rate": 8.663352879499825e-08, + "loss": 0.0678, + "step": 29243 + }, + { + "epoch": 0.57, + "learning_rate": 8.66296454506621e-08, + "loss": 0.7466, + "step": 29244 + }, + { + "epoch": 0.57, + "learning_rate": 8.662576210632596e-08, + "loss": 0.0006, + "step": 29245 + }, + { + "epoch": 0.57, + "learning_rate": 8.662187876198982e-08, + "loss": 0.0008, + "step": 29246 + }, + { + "epoch": 0.57, + "learning_rate": 8.661799541765368e-08, + "loss": 0.0007, + "step": 29247 + }, + { + "epoch": 0.57, + "learning_rate": 8.661411207331754e-08, + "loss": 0.0007, + "step": 29248 + }, + { + "epoch": 0.57, + "learning_rate": 8.66102287289814e-08, + "loss": 0.0007, + "step": 29249 + }, + { + "epoch": 0.57, + "learning_rate": 8.660634538464525e-08, + "loss": 0.0005, + "step": 29250 + }, + { + "epoch": 0.57, + "learning_rate": 8.660246204030911e-08, + "loss": 0.9673, + "step": 29251 + }, + { + "epoch": 0.57, + "learning_rate": 8.659857869597297e-08, + "loss": 0.0004, + "step": 29252 + }, + { + "epoch": 0.57, + "learning_rate": 8.659469535163683e-08, + "loss": 0.0005, + "step": 29253 + }, + { + "epoch": 0.57, + "learning_rate": 8.659081200730069e-08, + "loss": 0.0007, + "step": 29254 + }, + { + "epoch": 0.57, + "learning_rate": 8.658692866296454e-08, + "loss": 0.0006, + "step": 29255 + }, + { + "epoch": 0.57, + "learning_rate": 8.65830453186284e-08, + "loss": 0.0006, + "step": 29256 + }, + { + "epoch": 0.57, + "learning_rate": 8.657916197429226e-08, + "loss": 0.0005, + "step": 29257 + }, + { + "epoch": 0.57, + "learning_rate": 8.657527862995612e-08, + "loss": 0.0006, + "step": 29258 + }, + { + "epoch": 0.57, + "learning_rate": 8.657139528561998e-08, + "loss": 0.0016, + "step": 29259 + }, + { + "epoch": 0.57, + "learning_rate": 8.656751194128384e-08, + "loss": 0.8557, + "step": 29260 + }, + { + "epoch": 0.57, + "learning_rate": 8.65636285969477e-08, + "loss": 0.0007, + "step": 29261 + }, + { + "epoch": 0.57, + "learning_rate": 8.655974525261155e-08, + "loss": 1.0253, + "step": 29262 + }, + { + "epoch": 0.57, + "learning_rate": 8.655586190827541e-08, + "loss": 0.0005, + "step": 29263 + }, + { + "epoch": 0.57, + "learning_rate": 8.655197856393927e-08, + "loss": 0.0006, + "step": 29264 + }, + { + "epoch": 0.57, + "learning_rate": 8.654809521960313e-08, + "loss": 0.0005, + "step": 29265 + }, + { + "epoch": 0.57, + "learning_rate": 8.654421187526699e-08, + "loss": 0.3479, + "step": 29266 + }, + { + "epoch": 0.57, + "learning_rate": 8.654032853093083e-08, + "loss": 0.0006, + "step": 29267 + }, + { + "epoch": 0.57, + "learning_rate": 8.653644518659469e-08, + "loss": 0.0004, + "step": 29268 + }, + { + "epoch": 0.57, + "learning_rate": 8.653256184225855e-08, + "loss": 0.0003, + "step": 29269 + }, + { + "epoch": 0.57, + "learning_rate": 8.65286784979224e-08, + "loss": 0.002, + "step": 29270 + }, + { + "epoch": 0.57, + "learning_rate": 8.652479515358626e-08, + "loss": 0.0005, + "step": 29271 + }, + { + "epoch": 0.57, + "learning_rate": 8.652091180925012e-08, + "loss": 0.0006, + "step": 29272 + }, + { + "epoch": 0.57, + "learning_rate": 8.651702846491398e-08, + "loss": 0.0005, + "step": 29273 + }, + { + "epoch": 0.57, + "learning_rate": 8.651314512057784e-08, + "loss": 0.2684, + "step": 29274 + }, + { + "epoch": 0.57, + "learning_rate": 8.65092617762417e-08, + "loss": 0.0018, + "step": 29275 + }, + { + "epoch": 0.57, + "learning_rate": 8.650537843190555e-08, + "loss": 0.0008, + "step": 29276 + }, + { + "epoch": 0.57, + "learning_rate": 8.650149508756941e-08, + "loss": 0.0004, + "step": 29277 + }, + { + "epoch": 0.57, + "learning_rate": 8.649761174323327e-08, + "loss": 0.0006, + "step": 29278 + }, + { + "epoch": 0.57, + "learning_rate": 8.649372839889713e-08, + "loss": 0.0106, + "step": 29279 + }, + { + "epoch": 0.57, + "learning_rate": 8.648984505456099e-08, + "loss": 0.0011, + "step": 29280 + }, + { + "epoch": 0.57, + "learning_rate": 8.648596171022485e-08, + "loss": 0.001, + "step": 29281 + }, + { + "epoch": 0.57, + "learning_rate": 8.64820783658887e-08, + "loss": 0.0005, + "step": 29282 + }, + { + "epoch": 0.57, + "learning_rate": 8.647819502155256e-08, + "loss": 0.0006, + "step": 29283 + }, + { + "epoch": 0.57, + "learning_rate": 8.647431167721642e-08, + "loss": 0.0005, + "step": 29284 + }, + { + "epoch": 0.57, + "learning_rate": 8.647042833288028e-08, + "loss": 0.0004, + "step": 29285 + }, + { + "epoch": 0.57, + "learning_rate": 8.646654498854414e-08, + "loss": 0.0004, + "step": 29286 + }, + { + "epoch": 0.57, + "learning_rate": 8.6462661644208e-08, + "loss": 0.0007, + "step": 29287 + }, + { + "epoch": 0.57, + "learning_rate": 8.645877829987185e-08, + "loss": 0.784, + "step": 29288 + }, + { + "epoch": 0.57, + "learning_rate": 8.645489495553571e-08, + "loss": 0.0005, + "step": 29289 + }, + { + "epoch": 0.57, + "learning_rate": 8.645101161119957e-08, + "loss": 1.061, + "step": 29290 + }, + { + "epoch": 0.57, + "learning_rate": 8.644712826686343e-08, + "loss": 0.0977, + "step": 29291 + }, + { + "epoch": 0.57, + "learning_rate": 8.644324492252729e-08, + "loss": 0.0005, + "step": 29292 + }, + { + "epoch": 0.57, + "learning_rate": 8.643936157819115e-08, + "loss": 0.0005, + "step": 29293 + }, + { + "epoch": 0.57, + "learning_rate": 8.6435478233855e-08, + "loss": 0.0066, + "step": 29294 + }, + { + "epoch": 0.57, + "learning_rate": 8.643159488951886e-08, + "loss": 0.0005, + "step": 29295 + }, + { + "epoch": 0.57, + "learning_rate": 8.64277115451827e-08, + "loss": 0.0005, + "step": 29296 + }, + { + "epoch": 0.57, + "learning_rate": 8.642382820084656e-08, + "loss": 0.0005, + "step": 29297 + }, + { + "epoch": 0.57, + "learning_rate": 8.641994485651042e-08, + "loss": 0.0008, + "step": 29298 + }, + { + "epoch": 0.57, + "learning_rate": 8.641606151217428e-08, + "loss": 0.0006, + "step": 29299 + }, + { + "epoch": 0.57, + "learning_rate": 8.641217816783814e-08, + "loss": 0.0006, + "step": 29300 + }, + { + "epoch": 0.57, + "learning_rate": 8.6408294823502e-08, + "loss": 0.0015, + "step": 29301 + }, + { + "epoch": 0.57, + "learning_rate": 8.640441147916586e-08, + "loss": 0.0004, + "step": 29302 + }, + { + "epoch": 0.57, + "learning_rate": 8.640052813482971e-08, + "loss": 0.0005, + "step": 29303 + }, + { + "epoch": 0.57, + "learning_rate": 8.639664479049357e-08, + "loss": 0.0029, + "step": 29304 + }, + { + "epoch": 0.57, + "learning_rate": 8.639276144615743e-08, + "loss": 0.0005, + "step": 29305 + }, + { + "epoch": 0.57, + "learning_rate": 8.638887810182129e-08, + "loss": 0.0006, + "step": 29306 + }, + { + "epoch": 0.57, + "learning_rate": 8.638499475748515e-08, + "loss": 0.0005, + "step": 29307 + }, + { + "epoch": 0.57, + "learning_rate": 8.6381111413149e-08, + "loss": 0.0006, + "step": 29308 + }, + { + "epoch": 0.57, + "learning_rate": 8.637722806881286e-08, + "loss": 0.0008, + "step": 29309 + }, + { + "epoch": 0.57, + "learning_rate": 8.637334472447672e-08, + "loss": 0.0005, + "step": 29310 + }, + { + "epoch": 0.57, + "learning_rate": 8.636946138014058e-08, + "loss": 0.0012, + "step": 29311 + }, + { + "epoch": 0.57, + "learning_rate": 8.636557803580443e-08, + "loss": 0.001, + "step": 29312 + }, + { + "epoch": 0.57, + "learning_rate": 8.636169469146828e-08, + "loss": 0.0004, + "step": 29313 + }, + { + "epoch": 0.57, + "learning_rate": 8.635781134713214e-08, + "loss": 0.0004, + "step": 29314 + }, + { + "epoch": 0.57, + "learning_rate": 8.6353928002796e-08, + "loss": 0.0005, + "step": 29315 + }, + { + "epoch": 0.57, + "learning_rate": 8.635004465845986e-08, + "loss": 0.0005, + "step": 29316 + }, + { + "epoch": 0.57, + "learning_rate": 8.634616131412372e-08, + "loss": 0.0022, + "step": 29317 + }, + { + "epoch": 0.57, + "learning_rate": 8.634227796978757e-08, + "loss": 0.0005, + "step": 29318 + }, + { + "epoch": 0.57, + "learning_rate": 8.633839462545143e-08, + "loss": 0.0004, + "step": 29319 + }, + { + "epoch": 0.57, + "learning_rate": 8.633451128111529e-08, + "loss": 0.0014, + "step": 29320 + }, + { + "epoch": 0.57, + "learning_rate": 8.633062793677915e-08, + "loss": 0.0004, + "step": 29321 + }, + { + "epoch": 0.57, + "learning_rate": 8.632674459244301e-08, + "loss": 0.0005, + "step": 29322 + }, + { + "epoch": 0.57, + "learning_rate": 8.632286124810687e-08, + "loss": 0.0006, + "step": 29323 + }, + { + "epoch": 0.57, + "learning_rate": 8.631897790377072e-08, + "loss": 0.0006, + "step": 29324 + }, + { + "epoch": 0.57, + "learning_rate": 8.631509455943458e-08, + "loss": 0.0009, + "step": 29325 + }, + { + "epoch": 0.57, + "learning_rate": 8.631121121509843e-08, + "loss": 0.0012, + "step": 29326 + }, + { + "epoch": 0.57, + "learning_rate": 8.630732787076229e-08, + "loss": 0.0005, + "step": 29327 + }, + { + "epoch": 0.57, + "learning_rate": 8.630344452642614e-08, + "loss": 0.0005, + "step": 29328 + }, + { + "epoch": 0.57, + "learning_rate": 8.629956118209e-08, + "loss": 0.0007, + "step": 29329 + }, + { + "epoch": 0.57, + "learning_rate": 8.629567783775386e-08, + "loss": 0.0206, + "step": 29330 + }, + { + "epoch": 0.57, + "learning_rate": 8.629179449341772e-08, + "loss": 0.0006, + "step": 29331 + }, + { + "epoch": 0.57, + "learning_rate": 8.628791114908158e-08, + "loss": 0.0008, + "step": 29332 + }, + { + "epoch": 0.57, + "learning_rate": 8.628402780474544e-08, + "loss": 0.0086, + "step": 29333 + }, + { + "epoch": 0.57, + "learning_rate": 8.628014446040929e-08, + "loss": 0.0005, + "step": 29334 + }, + { + "epoch": 0.57, + "learning_rate": 8.627626111607315e-08, + "loss": 0.0006, + "step": 29335 + }, + { + "epoch": 0.57, + "learning_rate": 8.627237777173701e-08, + "loss": 0.0006, + "step": 29336 + }, + { + "epoch": 0.57, + "learning_rate": 8.626849442740087e-08, + "loss": 0.5948, + "step": 29337 + }, + { + "epoch": 0.57, + "learning_rate": 8.626461108306473e-08, + "loss": 0.0006, + "step": 29338 + }, + { + "epoch": 0.57, + "learning_rate": 8.626072773872858e-08, + "loss": 0.0004, + "step": 29339 + }, + { + "epoch": 0.57, + "learning_rate": 8.625684439439244e-08, + "loss": 0.0005, + "step": 29340 + }, + { + "epoch": 0.57, + "learning_rate": 8.62529610500563e-08, + "loss": 0.0006, + "step": 29341 + }, + { + "epoch": 0.57, + "learning_rate": 8.624907770572016e-08, + "loss": 0.0091, + "step": 29342 + }, + { + "epoch": 0.57, + "learning_rate": 8.624519436138402e-08, + "loss": 0.0004, + "step": 29343 + }, + { + "epoch": 0.57, + "learning_rate": 8.624131101704788e-08, + "loss": 0.0007, + "step": 29344 + }, + { + "epoch": 0.57, + "learning_rate": 8.623742767271173e-08, + "loss": 0.0005, + "step": 29345 + }, + { + "epoch": 0.57, + "learning_rate": 8.623354432837559e-08, + "loss": 0.0005, + "step": 29346 + }, + { + "epoch": 0.57, + "learning_rate": 8.622966098403945e-08, + "loss": 0.4281, + "step": 29347 + }, + { + "epoch": 0.57, + "learning_rate": 8.622577763970331e-08, + "loss": 0.0006, + "step": 29348 + }, + { + "epoch": 0.57, + "learning_rate": 8.622189429536717e-08, + "loss": 0.0006, + "step": 29349 + }, + { + "epoch": 0.57, + "learning_rate": 8.621801095103103e-08, + "loss": 0.0005, + "step": 29350 + }, + { + "epoch": 0.57, + "learning_rate": 8.621412760669488e-08, + "loss": 0.0007, + "step": 29351 + }, + { + "epoch": 0.57, + "learning_rate": 8.621024426235874e-08, + "loss": 0.0005, + "step": 29352 + }, + { + "epoch": 0.57, + "learning_rate": 8.62063609180226e-08, + "loss": 0.0006, + "step": 29353 + }, + { + "epoch": 0.57, + "learning_rate": 8.620247757368644e-08, + "loss": 0.0004, + "step": 29354 + }, + { + "epoch": 0.57, + "learning_rate": 8.61985942293503e-08, + "loss": 0.0004, + "step": 29355 + }, + { + "epoch": 0.57, + "learning_rate": 8.619471088501416e-08, + "loss": 0.0004, + "step": 29356 + }, + { + "epoch": 0.57, + "learning_rate": 8.619082754067802e-08, + "loss": 0.0004, + "step": 29357 + }, + { + "epoch": 0.57, + "learning_rate": 8.618694419634188e-08, + "loss": 0.0005, + "step": 29358 + }, + { + "epoch": 0.57, + "learning_rate": 8.618306085200574e-08, + "loss": 0.0092, + "step": 29359 + }, + { + "epoch": 0.57, + "learning_rate": 8.61791775076696e-08, + "loss": 0.0006, + "step": 29360 + }, + { + "epoch": 0.57, + "learning_rate": 8.617529416333345e-08, + "loss": 0.0006, + "step": 29361 + }, + { + "epoch": 0.57, + "learning_rate": 8.617141081899731e-08, + "loss": 0.0005, + "step": 29362 + }, + { + "epoch": 0.57, + "learning_rate": 8.616752747466117e-08, + "loss": 0.0608, + "step": 29363 + }, + { + "epoch": 0.57, + "learning_rate": 8.616364413032503e-08, + "loss": 0.0005, + "step": 29364 + }, + { + "epoch": 0.57, + "learning_rate": 8.615976078598889e-08, + "loss": 0.0045, + "step": 29365 + }, + { + "epoch": 0.57, + "learning_rate": 8.615587744165274e-08, + "loss": 0.0005, + "step": 29366 + }, + { + "epoch": 0.57, + "learning_rate": 8.61519940973166e-08, + "loss": 0.0009, + "step": 29367 + }, + { + "epoch": 0.57, + "learning_rate": 8.614811075298046e-08, + "loss": 0.0006, + "step": 29368 + }, + { + "epoch": 0.57, + "learning_rate": 8.614422740864432e-08, + "loss": 0.0004, + "step": 29369 + }, + { + "epoch": 0.57, + "learning_rate": 8.614034406430818e-08, + "loss": 0.0006, + "step": 29370 + }, + { + "epoch": 0.57, + "learning_rate": 8.613646071997204e-08, + "loss": 0.0238, + "step": 29371 + }, + { + "epoch": 0.57, + "learning_rate": 8.613257737563589e-08, + "loss": 0.0004, + "step": 29372 + }, + { + "epoch": 0.57, + "learning_rate": 8.612869403129975e-08, + "loss": 0.0008, + "step": 29373 + }, + { + "epoch": 0.57, + "learning_rate": 8.612481068696361e-08, + "loss": 0.0004, + "step": 29374 + }, + { + "epoch": 0.57, + "learning_rate": 8.612092734262747e-08, + "loss": 0.0007, + "step": 29375 + }, + { + "epoch": 0.57, + "learning_rate": 8.611704399829133e-08, + "loss": 0.0006, + "step": 29376 + }, + { + "epoch": 0.57, + "learning_rate": 8.611316065395518e-08, + "loss": 0.0007, + "step": 29377 + }, + { + "epoch": 0.57, + "learning_rate": 8.610927730961904e-08, + "loss": 0.02, + "step": 29378 + }, + { + "epoch": 0.57, + "learning_rate": 8.61053939652829e-08, + "loss": 0.0005, + "step": 29379 + }, + { + "epoch": 0.57, + "learning_rate": 8.610151062094676e-08, + "loss": 0.0014, + "step": 29380 + }, + { + "epoch": 0.57, + "learning_rate": 8.609762727661062e-08, + "loss": 0.0007, + "step": 29381 + }, + { + "epoch": 0.57, + "learning_rate": 8.609374393227448e-08, + "loss": 0.0005, + "step": 29382 + }, + { + "epoch": 0.57, + "learning_rate": 8.608986058793832e-08, + "loss": 0.0006, + "step": 29383 + }, + { + "epoch": 0.57, + "learning_rate": 8.608597724360218e-08, + "loss": 0.0004, + "step": 29384 + }, + { + "epoch": 0.57, + "learning_rate": 8.608209389926604e-08, + "loss": 0.0008, + "step": 29385 + }, + { + "epoch": 0.57, + "learning_rate": 8.60782105549299e-08, + "loss": 0.0007, + "step": 29386 + }, + { + "epoch": 0.57, + "learning_rate": 8.607432721059375e-08, + "loss": 0.0004, + "step": 29387 + }, + { + "epoch": 0.57, + "learning_rate": 8.607044386625761e-08, + "loss": 0.0004, + "step": 29388 + }, + { + "epoch": 0.57, + "learning_rate": 8.606656052192147e-08, + "loss": 0.0006, + "step": 29389 + }, + { + "epoch": 0.57, + "learning_rate": 8.606267717758533e-08, + "loss": 0.0045, + "step": 29390 + }, + { + "epoch": 0.57, + "learning_rate": 8.605879383324919e-08, + "loss": 0.0015, + "step": 29391 + }, + { + "epoch": 0.57, + "learning_rate": 8.605491048891305e-08, + "loss": 0.0005, + "step": 29392 + }, + { + "epoch": 0.57, + "learning_rate": 8.60510271445769e-08, + "loss": 0.0006, + "step": 29393 + }, + { + "epoch": 0.57, + "learning_rate": 8.604714380024076e-08, + "loss": 0.0004, + "step": 29394 + }, + { + "epoch": 0.57, + "learning_rate": 8.604326045590462e-08, + "loss": 0.0006, + "step": 29395 + }, + { + "epoch": 0.57, + "learning_rate": 8.603937711156848e-08, + "loss": 0.0005, + "step": 29396 + }, + { + "epoch": 0.57, + "learning_rate": 8.603549376723234e-08, + "loss": 0.0005, + "step": 29397 + }, + { + "epoch": 0.57, + "learning_rate": 8.60316104228962e-08, + "loss": 0.0005, + "step": 29398 + }, + { + "epoch": 0.57, + "learning_rate": 8.602772707856005e-08, + "loss": 0.37, + "step": 29399 + }, + { + "epoch": 0.57, + "learning_rate": 8.602384373422391e-08, + "loss": 0.0004, + "step": 29400 + }, + { + "epoch": 0.57, + "learning_rate": 8.601996038988777e-08, + "loss": 0.0005, + "step": 29401 + }, + { + "epoch": 0.57, + "learning_rate": 8.601607704555163e-08, + "loss": 0.0008, + "step": 29402 + }, + { + "epoch": 0.57, + "learning_rate": 8.601219370121549e-08, + "loss": 0.6022, + "step": 29403 + }, + { + "epoch": 0.57, + "learning_rate": 8.600831035687934e-08, + "loss": 0.0004, + "step": 29404 + }, + { + "epoch": 0.57, + "learning_rate": 8.60044270125432e-08, + "loss": 0.0006, + "step": 29405 + }, + { + "epoch": 0.57, + "learning_rate": 8.600054366820706e-08, + "loss": 0.0004, + "step": 29406 + }, + { + "epoch": 0.57, + "learning_rate": 8.599666032387092e-08, + "loss": 0.0004, + "step": 29407 + }, + { + "epoch": 0.57, + "learning_rate": 8.599277697953478e-08, + "loss": 0.0005, + "step": 29408 + }, + { + "epoch": 0.57, + "learning_rate": 8.598889363519864e-08, + "loss": 0.0005, + "step": 29409 + }, + { + "epoch": 0.57, + "learning_rate": 8.59850102908625e-08, + "loss": 0.0005, + "step": 29410 + }, + { + "epoch": 0.57, + "learning_rate": 8.598112694652635e-08, + "loss": 0.0006, + "step": 29411 + }, + { + "epoch": 0.57, + "learning_rate": 8.59772436021902e-08, + "loss": 0.0004, + "step": 29412 + }, + { + "epoch": 0.57, + "learning_rate": 8.597336025785405e-08, + "loss": 0.0007, + "step": 29413 + }, + { + "epoch": 0.57, + "learning_rate": 8.596947691351791e-08, + "loss": 0.0004, + "step": 29414 + }, + { + "epoch": 0.57, + "learning_rate": 8.596559356918177e-08, + "loss": 0.0005, + "step": 29415 + }, + { + "epoch": 0.57, + "learning_rate": 8.596171022484563e-08, + "loss": 0.0005, + "step": 29416 + }, + { + "epoch": 0.57, + "learning_rate": 8.595782688050949e-08, + "loss": 0.0013, + "step": 29417 + }, + { + "epoch": 0.57, + "learning_rate": 8.595394353617335e-08, + "loss": 0.0006, + "step": 29418 + }, + { + "epoch": 0.57, + "learning_rate": 8.59500601918372e-08, + "loss": 0.0007, + "step": 29419 + }, + { + "epoch": 0.57, + "learning_rate": 8.594617684750106e-08, + "loss": 0.0766, + "step": 29420 + }, + { + "epoch": 0.57, + "learning_rate": 8.594229350316492e-08, + "loss": 0.0006, + "step": 29421 + }, + { + "epoch": 0.57, + "learning_rate": 8.593841015882878e-08, + "loss": 0.0008, + "step": 29422 + }, + { + "epoch": 0.57, + "learning_rate": 8.593452681449264e-08, + "loss": 0.0005, + "step": 29423 + }, + { + "epoch": 0.57, + "learning_rate": 8.59306434701565e-08, + "loss": 0.014, + "step": 29424 + }, + { + "epoch": 0.57, + "learning_rate": 8.592676012582035e-08, + "loss": 0.0005, + "step": 29425 + }, + { + "epoch": 0.57, + "learning_rate": 8.592287678148421e-08, + "loss": 0.0004, + "step": 29426 + }, + { + "epoch": 0.57, + "learning_rate": 8.591899343714807e-08, + "loss": 0.001, + "step": 29427 + }, + { + "epoch": 0.57, + "learning_rate": 8.591511009281193e-08, + "loss": 0.7543, + "step": 29428 + }, + { + "epoch": 0.57, + "learning_rate": 8.591122674847579e-08, + "loss": 0.0004, + "step": 29429 + }, + { + "epoch": 0.57, + "learning_rate": 8.590734340413965e-08, + "loss": 0.0007, + "step": 29430 + }, + { + "epoch": 0.57, + "learning_rate": 8.59034600598035e-08, + "loss": 0.0008, + "step": 29431 + }, + { + "epoch": 0.57, + "learning_rate": 8.589957671546736e-08, + "loss": 0.0005, + "step": 29432 + }, + { + "epoch": 0.57, + "learning_rate": 8.589569337113122e-08, + "loss": 0.0007, + "step": 29433 + }, + { + "epoch": 0.57, + "learning_rate": 8.589181002679508e-08, + "loss": 0.0006, + "step": 29434 + }, + { + "epoch": 0.57, + "learning_rate": 8.588792668245894e-08, + "loss": 0.0004, + "step": 29435 + }, + { + "epoch": 0.57, + "learning_rate": 8.58840433381228e-08, + "loss": 0.0008, + "step": 29436 + }, + { + "epoch": 0.57, + "learning_rate": 8.588015999378665e-08, + "loss": 0.0004, + "step": 29437 + }, + { + "epoch": 0.57, + "learning_rate": 8.587627664945051e-08, + "loss": 0.0005, + "step": 29438 + }, + { + "epoch": 0.57, + "learning_rate": 8.587239330511437e-08, + "loss": 0.0004, + "step": 29439 + }, + { + "epoch": 0.57, + "learning_rate": 8.586850996077823e-08, + "loss": 0.0005, + "step": 29440 + }, + { + "epoch": 0.57, + "learning_rate": 8.586462661644207e-08, + "loss": 0.0005, + "step": 29441 + }, + { + "epoch": 0.57, + "learning_rate": 8.586074327210593e-08, + "loss": 0.0007, + "step": 29442 + }, + { + "epoch": 0.57, + "learning_rate": 8.585685992776979e-08, + "loss": 0.0005, + "step": 29443 + }, + { + "epoch": 0.57, + "learning_rate": 8.585297658343365e-08, + "loss": 0.4854, + "step": 29444 + }, + { + "epoch": 0.57, + "learning_rate": 8.58490932390975e-08, + "loss": 0.0003, + "step": 29445 + }, + { + "epoch": 0.57, + "learning_rate": 8.584520989476136e-08, + "loss": 0.0004, + "step": 29446 + }, + { + "epoch": 0.57, + "learning_rate": 8.584132655042522e-08, + "loss": 0.0004, + "step": 29447 + }, + { + "epoch": 0.57, + "learning_rate": 8.583744320608908e-08, + "loss": 0.0005, + "step": 29448 + }, + { + "epoch": 0.57, + "learning_rate": 8.583355986175294e-08, + "loss": 0.0005, + "step": 29449 + }, + { + "epoch": 0.57, + "learning_rate": 8.58296765174168e-08, + "loss": 0.0016, + "step": 29450 + }, + { + "epoch": 0.57, + "learning_rate": 8.582579317308065e-08, + "loss": 0.0005, + "step": 29451 + }, + { + "epoch": 0.57, + "learning_rate": 8.582190982874451e-08, + "loss": 1.1351, + "step": 29452 + }, + { + "epoch": 0.57, + "learning_rate": 8.581802648440837e-08, + "loss": 0.0004, + "step": 29453 + }, + { + "epoch": 0.57, + "learning_rate": 8.581414314007223e-08, + "loss": 0.0006, + "step": 29454 + }, + { + "epoch": 0.57, + "learning_rate": 8.581025979573609e-08, + "loss": 0.0005, + "step": 29455 + }, + { + "epoch": 0.57, + "learning_rate": 8.580637645139995e-08, + "loss": 0.0026, + "step": 29456 + }, + { + "epoch": 0.57, + "learning_rate": 8.58024931070638e-08, + "loss": 0.0007, + "step": 29457 + }, + { + "epoch": 0.57, + "learning_rate": 8.579860976272766e-08, + "loss": 0.0005, + "step": 29458 + }, + { + "epoch": 0.57, + "learning_rate": 8.579472641839152e-08, + "loss": 0.0006, + "step": 29459 + }, + { + "epoch": 0.57, + "learning_rate": 8.579084307405538e-08, + "loss": 0.0005, + "step": 29460 + }, + { + "epoch": 0.57, + "learning_rate": 8.578695972971924e-08, + "loss": 0.0004, + "step": 29461 + }, + { + "epoch": 0.57, + "learning_rate": 8.57830763853831e-08, + "loss": 0.0006, + "step": 29462 + }, + { + "epoch": 0.57, + "learning_rate": 8.577919304104695e-08, + "loss": 0.0005, + "step": 29463 + }, + { + "epoch": 0.57, + "learning_rate": 8.577530969671081e-08, + "loss": 0.0005, + "step": 29464 + }, + { + "epoch": 0.57, + "learning_rate": 8.577142635237467e-08, + "loss": 0.0005, + "step": 29465 + }, + { + "epoch": 0.57, + "learning_rate": 8.576754300803853e-08, + "loss": 0.0011, + "step": 29466 + }, + { + "epoch": 0.57, + "learning_rate": 8.576365966370239e-08, + "loss": 0.0005, + "step": 29467 + }, + { + "epoch": 0.57, + "learning_rate": 8.575977631936625e-08, + "loss": 0.0005, + "step": 29468 + }, + { + "epoch": 0.57, + "learning_rate": 8.57558929750301e-08, + "loss": 0.0163, + "step": 29469 + }, + { + "epoch": 0.57, + "learning_rate": 8.575200963069395e-08, + "loss": 0.0008, + "step": 29470 + }, + { + "epoch": 0.57, + "learning_rate": 8.574812628635781e-08, + "loss": 0.0005, + "step": 29471 + }, + { + "epoch": 0.57, + "learning_rate": 8.574424294202166e-08, + "loss": 0.0006, + "step": 29472 + }, + { + "epoch": 0.57, + "learning_rate": 8.574035959768552e-08, + "loss": 0.0804, + "step": 29473 + }, + { + "epoch": 0.57, + "learning_rate": 8.573647625334938e-08, + "loss": 0.0004, + "step": 29474 + }, + { + "epoch": 0.57, + "learning_rate": 8.573259290901324e-08, + "loss": 0.0053, + "step": 29475 + }, + { + "epoch": 0.57, + "learning_rate": 8.57287095646771e-08, + "loss": 0.0008, + "step": 29476 + }, + { + "epoch": 0.57, + "learning_rate": 8.572482622034096e-08, + "loss": 0.0006, + "step": 29477 + }, + { + "epoch": 0.57, + "learning_rate": 8.572094287600481e-08, + "loss": 0.0007, + "step": 29478 + }, + { + "epoch": 0.57, + "learning_rate": 8.571705953166867e-08, + "loss": 0.0005, + "step": 29479 + }, + { + "epoch": 0.57, + "learning_rate": 8.571317618733253e-08, + "loss": 0.0273, + "step": 29480 + }, + { + "epoch": 0.57, + "learning_rate": 8.570929284299639e-08, + "loss": 0.0005, + "step": 29481 + }, + { + "epoch": 0.57, + "learning_rate": 8.570540949866025e-08, + "loss": 0.0013, + "step": 29482 + }, + { + "epoch": 0.57, + "learning_rate": 8.57015261543241e-08, + "loss": 0.0006, + "step": 29483 + }, + { + "epoch": 0.57, + "learning_rate": 8.569764280998796e-08, + "loss": 0.1236, + "step": 29484 + }, + { + "epoch": 0.57, + "learning_rate": 8.569375946565182e-08, + "loss": 0.0008, + "step": 29485 + }, + { + "epoch": 0.57, + "learning_rate": 8.568987612131568e-08, + "loss": 0.0006, + "step": 29486 + }, + { + "epoch": 0.57, + "learning_rate": 8.568599277697954e-08, + "loss": 0.0004, + "step": 29487 + }, + { + "epoch": 0.57, + "learning_rate": 8.56821094326434e-08, + "loss": 0.0008, + "step": 29488 + }, + { + "epoch": 0.57, + "learning_rate": 8.567822608830724e-08, + "loss": 0.0032, + "step": 29489 + }, + { + "epoch": 0.57, + "learning_rate": 8.56743427439711e-08, + "loss": 0.0006, + "step": 29490 + }, + { + "epoch": 0.57, + "learning_rate": 8.567045939963496e-08, + "loss": 0.3961, + "step": 29491 + }, + { + "epoch": 0.57, + "learning_rate": 8.566657605529882e-08, + "loss": 0.0841, + "step": 29492 + }, + { + "epoch": 0.57, + "learning_rate": 8.566269271096267e-08, + "loss": 0.0012, + "step": 29493 + }, + { + "epoch": 0.57, + "learning_rate": 8.565880936662653e-08, + "loss": 0.3022, + "step": 29494 + }, + { + "epoch": 0.57, + "learning_rate": 8.565492602229039e-08, + "loss": 0.8021, + "step": 29495 + }, + { + "epoch": 0.57, + "learning_rate": 8.565104267795425e-08, + "loss": 0.0006, + "step": 29496 + }, + { + "epoch": 0.57, + "learning_rate": 8.564715933361811e-08, + "loss": 0.002, + "step": 29497 + }, + { + "epoch": 0.57, + "learning_rate": 8.564327598928197e-08, + "loss": 0.255, + "step": 29498 + }, + { + "epoch": 0.57, + "learning_rate": 8.563939264494582e-08, + "loss": 1.0598, + "step": 29499 + }, + { + "epoch": 0.57, + "learning_rate": 8.563550930060968e-08, + "loss": 0.0005, + "step": 29500 + }, + { + "epoch": 0.57, + "learning_rate": 8.563162595627354e-08, + "loss": 0.0018, + "step": 29501 + }, + { + "epoch": 0.57, + "learning_rate": 8.56277426119374e-08, + "loss": 0.0011, + "step": 29502 + }, + { + "epoch": 0.57, + "learning_rate": 8.562385926760124e-08, + "loss": 0.0019, + "step": 29503 + }, + { + "epoch": 0.57, + "learning_rate": 8.56199759232651e-08, + "loss": 0.0005, + "step": 29504 + }, + { + "epoch": 0.57, + "learning_rate": 8.561609257892896e-08, + "loss": 0.0006, + "step": 29505 + }, + { + "epoch": 0.57, + "learning_rate": 8.561220923459282e-08, + "loss": 0.0022, + "step": 29506 + }, + { + "epoch": 0.57, + "learning_rate": 8.560832589025668e-08, + "loss": 0.0005, + "step": 29507 + }, + { + "epoch": 0.57, + "learning_rate": 8.560444254592054e-08, + "loss": 0.0006, + "step": 29508 + }, + { + "epoch": 0.57, + "learning_rate": 8.56005592015844e-08, + "loss": 0.0005, + "step": 29509 + }, + { + "epoch": 0.57, + "learning_rate": 8.559667585724825e-08, + "loss": 0.2472, + "step": 29510 + }, + { + "epoch": 0.57, + "learning_rate": 8.559279251291211e-08, + "loss": 0.0007, + "step": 29511 + }, + { + "epoch": 0.57, + "learning_rate": 8.558890916857597e-08, + "loss": 0.0005, + "step": 29512 + }, + { + "epoch": 0.57, + "learning_rate": 8.558502582423983e-08, + "loss": 0.0011, + "step": 29513 + }, + { + "epoch": 0.57, + "learning_rate": 8.558114247990368e-08, + "loss": 0.001, + "step": 29514 + }, + { + "epoch": 0.57, + "learning_rate": 8.557725913556754e-08, + "loss": 0.0005, + "step": 29515 + }, + { + "epoch": 0.57, + "learning_rate": 8.55733757912314e-08, + "loss": 0.0004, + "step": 29516 + }, + { + "epoch": 0.57, + "learning_rate": 8.556949244689526e-08, + "loss": 0.0004, + "step": 29517 + }, + { + "epoch": 0.57, + "learning_rate": 8.556560910255912e-08, + "loss": 0.0007, + "step": 29518 + }, + { + "epoch": 0.57, + "learning_rate": 8.556172575822298e-08, + "loss": 0.0003, + "step": 29519 + }, + { + "epoch": 0.57, + "learning_rate": 8.555784241388683e-08, + "loss": 0.0018, + "step": 29520 + }, + { + "epoch": 0.57, + "learning_rate": 8.555395906955069e-08, + "loss": 0.0005, + "step": 29521 + }, + { + "epoch": 0.57, + "learning_rate": 8.555007572521455e-08, + "loss": 0.0006, + "step": 29522 + }, + { + "epoch": 0.57, + "learning_rate": 8.554619238087841e-08, + "loss": 0.0005, + "step": 29523 + }, + { + "epoch": 0.57, + "learning_rate": 8.554230903654227e-08, + "loss": 0.0007, + "step": 29524 + }, + { + "epoch": 0.57, + "learning_rate": 8.553842569220613e-08, + "loss": 0.0004, + "step": 29525 + }, + { + "epoch": 0.57, + "learning_rate": 8.553454234786998e-08, + "loss": 0.0004, + "step": 29526 + }, + { + "epoch": 0.57, + "learning_rate": 8.553065900353384e-08, + "loss": 0.0005, + "step": 29527 + }, + { + "epoch": 0.57, + "learning_rate": 8.552677565919769e-08, + "loss": 0.0692, + "step": 29528 + }, + { + "epoch": 0.57, + "learning_rate": 8.552289231486155e-08, + "loss": 0.0006, + "step": 29529 + }, + { + "epoch": 0.57, + "learning_rate": 8.55190089705254e-08, + "loss": 0.0005, + "step": 29530 + }, + { + "epoch": 0.57, + "learning_rate": 8.551512562618926e-08, + "loss": 0.0005, + "step": 29531 + }, + { + "epoch": 0.57, + "learning_rate": 8.551124228185312e-08, + "loss": 0.0006, + "step": 29532 + }, + { + "epoch": 0.57, + "learning_rate": 8.550735893751698e-08, + "loss": 0.027, + "step": 29533 + }, + { + "epoch": 0.57, + "learning_rate": 8.550347559318084e-08, + "loss": 0.0007, + "step": 29534 + }, + { + "epoch": 0.57, + "learning_rate": 8.54995922488447e-08, + "loss": 0.0007, + "step": 29535 + }, + { + "epoch": 0.57, + "learning_rate": 8.549570890450855e-08, + "loss": 0.0011, + "step": 29536 + }, + { + "epoch": 0.57, + "learning_rate": 8.549182556017241e-08, + "loss": 0.0007, + "step": 29537 + }, + { + "epoch": 0.57, + "learning_rate": 8.548794221583627e-08, + "loss": 0.0005, + "step": 29538 + }, + { + "epoch": 0.57, + "learning_rate": 8.548405887150013e-08, + "loss": 0.0005, + "step": 29539 + }, + { + "epoch": 0.57, + "learning_rate": 8.548017552716399e-08, + "loss": 0.0063, + "step": 29540 + }, + { + "epoch": 0.57, + "learning_rate": 8.547629218282784e-08, + "loss": 0.0004, + "step": 29541 + }, + { + "epoch": 0.57, + "learning_rate": 8.54724088384917e-08, + "loss": 0.0006, + "step": 29542 + }, + { + "epoch": 0.57, + "learning_rate": 8.546852549415556e-08, + "loss": 0.0005, + "step": 29543 + }, + { + "epoch": 0.57, + "learning_rate": 8.546464214981942e-08, + "loss": 0.0007, + "step": 29544 + }, + { + "epoch": 0.57, + "learning_rate": 8.546075880548328e-08, + "loss": 0.0005, + "step": 29545 + }, + { + "epoch": 0.57, + "learning_rate": 8.545687546114714e-08, + "loss": 0.0005, + "step": 29546 + }, + { + "epoch": 0.57, + "learning_rate": 8.5452992116811e-08, + "loss": 0.0006, + "step": 29547 + }, + { + "epoch": 0.57, + "learning_rate": 8.544910877247485e-08, + "loss": 0.0006, + "step": 29548 + }, + { + "epoch": 0.57, + "learning_rate": 8.544522542813871e-08, + "loss": 0.0006, + "step": 29549 + }, + { + "epoch": 0.57, + "learning_rate": 8.544134208380257e-08, + "loss": 0.0005, + "step": 29550 + }, + { + "epoch": 0.57, + "learning_rate": 8.543745873946643e-08, + "loss": 0.0004, + "step": 29551 + }, + { + "epoch": 0.57, + "learning_rate": 8.543357539513028e-08, + "loss": 0.0041, + "step": 29552 + }, + { + "epoch": 0.57, + "learning_rate": 8.542969205079414e-08, + "loss": 0.0005, + "step": 29553 + }, + { + "epoch": 0.57, + "learning_rate": 8.5425808706458e-08, + "loss": 0.0004, + "step": 29554 + }, + { + "epoch": 0.57, + "learning_rate": 8.542192536212186e-08, + "loss": 0.0008, + "step": 29555 + }, + { + "epoch": 0.57, + "learning_rate": 8.541804201778572e-08, + "loss": 0.0005, + "step": 29556 + }, + { + "epoch": 0.57, + "learning_rate": 8.541415867344956e-08, + "loss": 0.0006, + "step": 29557 + }, + { + "epoch": 0.57, + "learning_rate": 8.541027532911342e-08, + "loss": 0.0009, + "step": 29558 + }, + { + "epoch": 0.57, + "learning_rate": 8.540639198477728e-08, + "loss": 0.0005, + "step": 29559 + }, + { + "epoch": 0.57, + "learning_rate": 8.540250864044114e-08, + "loss": 0.0004, + "step": 29560 + }, + { + "epoch": 0.57, + "learning_rate": 8.5398625296105e-08, + "loss": 0.0086, + "step": 29561 + }, + { + "epoch": 0.57, + "learning_rate": 8.539474195176885e-08, + "loss": 0.0005, + "step": 29562 + }, + { + "epoch": 0.57, + "learning_rate": 8.539085860743271e-08, + "loss": 0.0007, + "step": 29563 + }, + { + "epoch": 0.57, + "learning_rate": 8.538697526309657e-08, + "loss": 0.0006, + "step": 29564 + }, + { + "epoch": 0.57, + "learning_rate": 8.538309191876043e-08, + "loss": 0.0006, + "step": 29565 + }, + { + "epoch": 0.57, + "learning_rate": 8.537920857442429e-08, + "loss": 0.0005, + "step": 29566 + }, + { + "epoch": 0.57, + "learning_rate": 8.537532523008815e-08, + "loss": 0.0008, + "step": 29567 + }, + { + "epoch": 0.57, + "learning_rate": 8.5371441885752e-08, + "loss": 0.0005, + "step": 29568 + }, + { + "epoch": 0.57, + "learning_rate": 8.536755854141586e-08, + "loss": 0.0004, + "step": 29569 + }, + { + "epoch": 0.57, + "learning_rate": 8.536367519707972e-08, + "loss": 0.0011, + "step": 29570 + }, + { + "epoch": 0.57, + "learning_rate": 8.535979185274358e-08, + "loss": 0.0007, + "step": 29571 + }, + { + "epoch": 0.57, + "learning_rate": 8.535590850840744e-08, + "loss": 0.0005, + "step": 29572 + }, + { + "epoch": 0.57, + "learning_rate": 8.53520251640713e-08, + "loss": 0.0004, + "step": 29573 + }, + { + "epoch": 0.57, + "learning_rate": 8.534814181973515e-08, + "loss": 0.0429, + "step": 29574 + }, + { + "epoch": 0.57, + "learning_rate": 8.534425847539901e-08, + "loss": 0.0008, + "step": 29575 + }, + { + "epoch": 0.57, + "learning_rate": 8.534037513106287e-08, + "loss": 0.0352, + "step": 29576 + }, + { + "epoch": 0.57, + "learning_rate": 8.533649178672673e-08, + "loss": 0.0004, + "step": 29577 + }, + { + "epoch": 0.57, + "learning_rate": 8.533260844239059e-08, + "loss": 0.9196, + "step": 29578 + }, + { + "epoch": 0.57, + "learning_rate": 8.532872509805444e-08, + "loss": 0.1494, + "step": 29579 + }, + { + "epoch": 0.57, + "learning_rate": 8.53248417537183e-08, + "loss": 0.0007, + "step": 29580 + }, + { + "epoch": 0.57, + "learning_rate": 8.532095840938216e-08, + "loss": 0.0014, + "step": 29581 + }, + { + "epoch": 0.57, + "learning_rate": 8.531707506504602e-08, + "loss": 0.0005, + "step": 29582 + }, + { + "epoch": 0.57, + "learning_rate": 8.531319172070988e-08, + "loss": 1.1251, + "step": 29583 + }, + { + "epoch": 0.57, + "learning_rate": 8.530930837637374e-08, + "loss": 0.002, + "step": 29584 + }, + { + "epoch": 0.57, + "learning_rate": 8.53054250320376e-08, + "loss": 0.0006, + "step": 29585 + }, + { + "epoch": 0.57, + "learning_rate": 8.530154168770144e-08, + "loss": 0.0089, + "step": 29586 + }, + { + "epoch": 0.57, + "learning_rate": 8.52976583433653e-08, + "loss": 0.0008, + "step": 29587 + }, + { + "epoch": 0.57, + "learning_rate": 8.529377499902916e-08, + "loss": 0.0015, + "step": 29588 + }, + { + "epoch": 0.57, + "learning_rate": 8.528989165469301e-08, + "loss": 0.9988, + "step": 29589 + }, + { + "epoch": 0.57, + "learning_rate": 8.528600831035687e-08, + "loss": 0.3609, + "step": 29590 + }, + { + "epoch": 0.57, + "learning_rate": 8.528212496602073e-08, + "loss": 0.0018, + "step": 29591 + }, + { + "epoch": 0.57, + "learning_rate": 8.527824162168459e-08, + "loss": 0.0005, + "step": 29592 + }, + { + "epoch": 0.57, + "learning_rate": 8.527435827734845e-08, + "loss": 0.1435, + "step": 29593 + }, + { + "epoch": 0.57, + "learning_rate": 8.52704749330123e-08, + "loss": 0.0005, + "step": 29594 + }, + { + "epoch": 0.57, + "learning_rate": 8.526659158867616e-08, + "loss": 0.0004, + "step": 29595 + }, + { + "epoch": 0.57, + "learning_rate": 8.526270824434002e-08, + "loss": 0.0004, + "step": 29596 + }, + { + "epoch": 0.57, + "learning_rate": 8.525882490000388e-08, + "loss": 0.0005, + "step": 29597 + }, + { + "epoch": 0.57, + "learning_rate": 8.525494155566774e-08, + "loss": 0.0004, + "step": 29598 + }, + { + "epoch": 0.57, + "learning_rate": 8.52510582113316e-08, + "loss": 0.0005, + "step": 29599 + }, + { + "epoch": 0.57, + "learning_rate": 8.524717486699545e-08, + "loss": 0.0004, + "step": 29600 + }, + { + "epoch": 0.57, + "learning_rate": 8.524329152265931e-08, + "loss": 0.0004, + "step": 29601 + }, + { + "epoch": 0.57, + "learning_rate": 8.523940817832317e-08, + "loss": 0.0007, + "step": 29602 + }, + { + "epoch": 0.57, + "learning_rate": 8.523552483398703e-08, + "loss": 0.0005, + "step": 29603 + }, + { + "epoch": 0.57, + "learning_rate": 8.523164148965089e-08, + "loss": 0.0008, + "step": 29604 + }, + { + "epoch": 0.57, + "learning_rate": 8.522775814531475e-08, + "loss": 0.0059, + "step": 29605 + }, + { + "epoch": 0.57, + "learning_rate": 8.52238748009786e-08, + "loss": 0.0004, + "step": 29606 + }, + { + "epoch": 0.57, + "learning_rate": 8.521999145664246e-08, + "loss": 0.0011, + "step": 29607 + }, + { + "epoch": 0.57, + "learning_rate": 8.521610811230632e-08, + "loss": 0.0005, + "step": 29608 + }, + { + "epoch": 0.57, + "learning_rate": 8.521222476797018e-08, + "loss": 0.0005, + "step": 29609 + }, + { + "epoch": 0.57, + "learning_rate": 8.520834142363404e-08, + "loss": 0.0005, + "step": 29610 + }, + { + "epoch": 0.57, + "learning_rate": 8.52044580792979e-08, + "loss": 0.0006, + "step": 29611 + }, + { + "epoch": 0.57, + "learning_rate": 8.520057473496175e-08, + "loss": 0.049, + "step": 29612 + }, + { + "epoch": 0.57, + "learning_rate": 8.519669139062561e-08, + "loss": 0.0006, + "step": 29613 + }, + { + "epoch": 0.57, + "learning_rate": 8.519280804628947e-08, + "loss": 0.0005, + "step": 29614 + }, + { + "epoch": 0.57, + "learning_rate": 8.518892470195331e-08, + "loss": 0.0003, + "step": 29615 + }, + { + "epoch": 0.57, + "learning_rate": 8.518504135761717e-08, + "loss": 0.0008, + "step": 29616 + }, + { + "epoch": 0.57, + "learning_rate": 8.518115801328103e-08, + "loss": 0.0006, + "step": 29617 + }, + { + "epoch": 0.57, + "learning_rate": 8.517727466894489e-08, + "loss": 0.0008, + "step": 29618 + }, + { + "epoch": 0.57, + "learning_rate": 8.517339132460875e-08, + "loss": 0.0006, + "step": 29619 + }, + { + "epoch": 0.57, + "learning_rate": 8.51695079802726e-08, + "loss": 0.0005, + "step": 29620 + }, + { + "epoch": 0.57, + "learning_rate": 8.516562463593646e-08, + "loss": 0.0007, + "step": 29621 + }, + { + "epoch": 0.57, + "learning_rate": 8.516174129160032e-08, + "loss": 0.0004, + "step": 29622 + }, + { + "epoch": 0.57, + "learning_rate": 8.515785794726418e-08, + "loss": 0.0006, + "step": 29623 + }, + { + "epoch": 0.57, + "learning_rate": 8.515397460292804e-08, + "loss": 0.0005, + "step": 29624 + }, + { + "epoch": 0.57, + "learning_rate": 8.51500912585919e-08, + "loss": 0.0011, + "step": 29625 + }, + { + "epoch": 0.57, + "learning_rate": 8.514620791425576e-08, + "loss": 0.0082, + "step": 29626 + }, + { + "epoch": 0.57, + "learning_rate": 8.514232456991961e-08, + "loss": 0.0006, + "step": 29627 + }, + { + "epoch": 0.57, + "learning_rate": 8.513844122558347e-08, + "loss": 0.0005, + "step": 29628 + }, + { + "epoch": 0.57, + "learning_rate": 8.513455788124733e-08, + "loss": 0.0008, + "step": 29629 + }, + { + "epoch": 0.57, + "learning_rate": 8.513067453691119e-08, + "loss": 0.0004, + "step": 29630 + }, + { + "epoch": 0.57, + "learning_rate": 8.512679119257505e-08, + "loss": 0.001, + "step": 29631 + }, + { + "epoch": 0.57, + "learning_rate": 8.51229078482389e-08, + "loss": 0.0007, + "step": 29632 + }, + { + "epoch": 0.57, + "learning_rate": 8.511902450390276e-08, + "loss": 0.0005, + "step": 29633 + }, + { + "epoch": 0.57, + "learning_rate": 8.511514115956662e-08, + "loss": 0.0006, + "step": 29634 + }, + { + "epoch": 0.57, + "learning_rate": 8.511125781523048e-08, + "loss": 0.0005, + "step": 29635 + }, + { + "epoch": 0.57, + "learning_rate": 8.510737447089434e-08, + "loss": 0.0005, + "step": 29636 + }, + { + "epoch": 0.57, + "learning_rate": 8.51034911265582e-08, + "loss": 0.0006, + "step": 29637 + }, + { + "epoch": 0.57, + "learning_rate": 8.509960778222205e-08, + "loss": 0.0413, + "step": 29638 + }, + { + "epoch": 0.57, + "learning_rate": 8.509572443788591e-08, + "loss": 0.0007, + "step": 29639 + }, + { + "epoch": 0.57, + "learning_rate": 8.509184109354977e-08, + "loss": 0.0004, + "step": 29640 + }, + { + "epoch": 0.57, + "learning_rate": 8.508795774921363e-08, + "loss": 0.0005, + "step": 29641 + }, + { + "epoch": 0.57, + "learning_rate": 8.508407440487749e-08, + "loss": 0.0005, + "step": 29642 + }, + { + "epoch": 0.58, + "learning_rate": 8.508019106054135e-08, + "loss": 0.0005, + "step": 29643 + }, + { + "epoch": 0.58, + "learning_rate": 8.507630771620519e-08, + "loss": 0.0005, + "step": 29644 + }, + { + "epoch": 0.58, + "learning_rate": 8.507242437186905e-08, + "loss": 0.0004, + "step": 29645 + }, + { + "epoch": 0.58, + "learning_rate": 8.506854102753291e-08, + "loss": 0.0006, + "step": 29646 + }, + { + "epoch": 0.58, + "learning_rate": 8.506465768319676e-08, + "loss": 0.0004, + "step": 29647 + }, + { + "epoch": 0.58, + "learning_rate": 8.506077433886062e-08, + "loss": 0.1298, + "step": 29648 + }, + { + "epoch": 0.58, + "learning_rate": 8.505689099452448e-08, + "loss": 0.0005, + "step": 29649 + }, + { + "epoch": 0.58, + "learning_rate": 8.505300765018834e-08, + "loss": 0.0023, + "step": 29650 + }, + { + "epoch": 0.58, + "learning_rate": 8.50491243058522e-08, + "loss": 0.0005, + "step": 29651 + }, + { + "epoch": 0.58, + "learning_rate": 8.504524096151606e-08, + "loss": 0.0004, + "step": 29652 + }, + { + "epoch": 0.58, + "learning_rate": 8.504135761717991e-08, + "loss": 0.0006, + "step": 29653 + }, + { + "epoch": 0.58, + "learning_rate": 8.503747427284377e-08, + "loss": 0.1896, + "step": 29654 + }, + { + "epoch": 0.58, + "learning_rate": 8.503359092850763e-08, + "loss": 0.6477, + "step": 29655 + }, + { + "epoch": 0.58, + "learning_rate": 8.502970758417149e-08, + "loss": 0.0006, + "step": 29656 + }, + { + "epoch": 0.58, + "learning_rate": 8.502582423983535e-08, + "loss": 1.1689, + "step": 29657 + }, + { + "epoch": 0.58, + "learning_rate": 8.50219408954992e-08, + "loss": 0.0011, + "step": 29658 + }, + { + "epoch": 0.58, + "learning_rate": 8.501805755116306e-08, + "loss": 0.0005, + "step": 29659 + }, + { + "epoch": 0.58, + "learning_rate": 8.501417420682692e-08, + "loss": 0.0006, + "step": 29660 + }, + { + "epoch": 0.58, + "learning_rate": 8.501029086249078e-08, + "loss": 0.0055, + "step": 29661 + }, + { + "epoch": 0.58, + "learning_rate": 8.500640751815464e-08, + "loss": 0.0013, + "step": 29662 + }, + { + "epoch": 0.58, + "learning_rate": 8.50025241738185e-08, + "loss": 0.0606, + "step": 29663 + }, + { + "epoch": 0.58, + "learning_rate": 8.499864082948236e-08, + "loss": 0.0005, + "step": 29664 + }, + { + "epoch": 0.58, + "learning_rate": 8.499475748514621e-08, + "loss": 0.0005, + "step": 29665 + }, + { + "epoch": 0.58, + "learning_rate": 8.499087414081006e-08, + "loss": 0.0007, + "step": 29666 + }, + { + "epoch": 0.58, + "learning_rate": 8.498699079647392e-08, + "loss": 0.0009, + "step": 29667 + }, + { + "epoch": 0.58, + "learning_rate": 8.498310745213777e-08, + "loss": 0.0006, + "step": 29668 + }, + { + "epoch": 0.58, + "learning_rate": 8.497922410780163e-08, + "loss": 0.0008, + "step": 29669 + }, + { + "epoch": 0.58, + "learning_rate": 8.497534076346549e-08, + "loss": 0.0005, + "step": 29670 + }, + { + "epoch": 0.58, + "learning_rate": 8.497145741912935e-08, + "loss": 0.0005, + "step": 29671 + }, + { + "epoch": 0.58, + "learning_rate": 8.496757407479321e-08, + "loss": 0.0008, + "step": 29672 + }, + { + "epoch": 0.58, + "learning_rate": 8.496369073045707e-08, + "loss": 0.0004, + "step": 29673 + }, + { + "epoch": 0.58, + "learning_rate": 8.495980738612092e-08, + "loss": 0.0007, + "step": 29674 + }, + { + "epoch": 0.58, + "learning_rate": 8.495592404178478e-08, + "loss": 0.0004, + "step": 29675 + }, + { + "epoch": 0.58, + "learning_rate": 8.495204069744864e-08, + "loss": 0.0004, + "step": 29676 + }, + { + "epoch": 0.58, + "learning_rate": 8.49481573531125e-08, + "loss": 0.0005, + "step": 29677 + }, + { + "epoch": 0.58, + "learning_rate": 8.494427400877636e-08, + "loss": 0.0007, + "step": 29678 + }, + { + "epoch": 0.58, + "learning_rate": 8.494039066444022e-08, + "loss": 0.0007, + "step": 29679 + }, + { + "epoch": 0.58, + "learning_rate": 8.493650732010406e-08, + "loss": 0.0004, + "step": 29680 + }, + { + "epoch": 0.58, + "learning_rate": 8.493262397576792e-08, + "loss": 0.2178, + "step": 29681 + }, + { + "epoch": 0.58, + "learning_rate": 8.492874063143178e-08, + "loss": 0.0004, + "step": 29682 + }, + { + "epoch": 0.58, + "learning_rate": 8.492485728709564e-08, + "loss": 0.005, + "step": 29683 + }, + { + "epoch": 0.58, + "learning_rate": 8.49209739427595e-08, + "loss": 0.0007, + "step": 29684 + }, + { + "epoch": 0.58, + "learning_rate": 8.491709059842335e-08, + "loss": 0.0005, + "step": 29685 + }, + { + "epoch": 0.58, + "learning_rate": 8.491320725408721e-08, + "loss": 0.0007, + "step": 29686 + }, + { + "epoch": 0.58, + "learning_rate": 8.490932390975107e-08, + "loss": 0.0022, + "step": 29687 + }, + { + "epoch": 0.58, + "learning_rate": 8.490544056541493e-08, + "loss": 0.0005, + "step": 29688 + }, + { + "epoch": 0.58, + "learning_rate": 8.490155722107878e-08, + "loss": 0.0012, + "step": 29689 + }, + { + "epoch": 0.58, + "learning_rate": 8.489767387674264e-08, + "loss": 0.0007, + "step": 29690 + }, + { + "epoch": 0.58, + "learning_rate": 8.48937905324065e-08, + "loss": 0.0003, + "step": 29691 + }, + { + "epoch": 0.58, + "learning_rate": 8.488990718807036e-08, + "loss": 0.0005, + "step": 29692 + }, + { + "epoch": 0.58, + "learning_rate": 8.488602384373422e-08, + "loss": 0.0004, + "step": 29693 + }, + { + "epoch": 0.58, + "learning_rate": 8.488214049939808e-08, + "loss": 0.0006, + "step": 29694 + }, + { + "epoch": 0.58, + "learning_rate": 8.487825715506193e-08, + "loss": 0.0007, + "step": 29695 + }, + { + "epoch": 0.58, + "learning_rate": 8.487437381072579e-08, + "loss": 0.0004, + "step": 29696 + }, + { + "epoch": 0.58, + "learning_rate": 8.487049046638965e-08, + "loss": 0.0007, + "step": 29697 + }, + { + "epoch": 0.58, + "learning_rate": 8.486660712205351e-08, + "loss": 0.0006, + "step": 29698 + }, + { + "epoch": 0.58, + "learning_rate": 8.486272377771737e-08, + "loss": 0.0005, + "step": 29699 + }, + { + "epoch": 0.58, + "learning_rate": 8.485884043338123e-08, + "loss": 0.0005, + "step": 29700 + }, + { + "epoch": 0.58, + "learning_rate": 8.485495708904508e-08, + "loss": 0.0005, + "step": 29701 + }, + { + "epoch": 0.58, + "learning_rate": 8.485107374470893e-08, + "loss": 0.0015, + "step": 29702 + }, + { + "epoch": 0.58, + "learning_rate": 8.484719040037279e-08, + "loss": 0.0006, + "step": 29703 + }, + { + "epoch": 0.58, + "learning_rate": 8.484330705603665e-08, + "loss": 0.0037, + "step": 29704 + }, + { + "epoch": 0.58, + "learning_rate": 8.48394237117005e-08, + "loss": 0.0005, + "step": 29705 + }, + { + "epoch": 0.58, + "learning_rate": 8.483554036736436e-08, + "loss": 0.0004, + "step": 29706 + }, + { + "epoch": 0.58, + "learning_rate": 8.483165702302822e-08, + "loss": 0.0008, + "step": 29707 + }, + { + "epoch": 0.58, + "learning_rate": 8.482777367869208e-08, + "loss": 0.0004, + "step": 29708 + }, + { + "epoch": 0.58, + "learning_rate": 8.482389033435594e-08, + "loss": 0.0007, + "step": 29709 + }, + { + "epoch": 0.58, + "learning_rate": 8.48200069900198e-08, + "loss": 0.0006, + "step": 29710 + }, + { + "epoch": 0.58, + "learning_rate": 8.481612364568365e-08, + "loss": 0.0099, + "step": 29711 + }, + { + "epoch": 0.58, + "learning_rate": 8.481224030134751e-08, + "loss": 0.0004, + "step": 29712 + }, + { + "epoch": 0.58, + "learning_rate": 8.480835695701137e-08, + "loss": 0.4007, + "step": 29713 + }, + { + "epoch": 0.58, + "learning_rate": 8.480447361267523e-08, + "loss": 0.0005, + "step": 29714 + }, + { + "epoch": 0.58, + "learning_rate": 8.480059026833909e-08, + "loss": 0.0007, + "step": 29715 + }, + { + "epoch": 0.58, + "learning_rate": 8.479670692400294e-08, + "loss": 0.0003, + "step": 29716 + }, + { + "epoch": 0.58, + "learning_rate": 8.47928235796668e-08, + "loss": 0.0006, + "step": 29717 + }, + { + "epoch": 0.58, + "learning_rate": 8.478894023533066e-08, + "loss": 0.0004, + "step": 29718 + }, + { + "epoch": 0.58, + "learning_rate": 8.478505689099452e-08, + "loss": 0.0007, + "step": 29719 + }, + { + "epoch": 0.58, + "learning_rate": 8.478117354665838e-08, + "loss": 0.0006, + "step": 29720 + }, + { + "epoch": 0.58, + "learning_rate": 8.477729020232224e-08, + "loss": 0.0004, + "step": 29721 + }, + { + "epoch": 0.58, + "learning_rate": 8.47734068579861e-08, + "loss": 0.0005, + "step": 29722 + }, + { + "epoch": 0.58, + "learning_rate": 8.476952351364995e-08, + "loss": 0.0015, + "step": 29723 + }, + { + "epoch": 0.58, + "learning_rate": 8.476564016931381e-08, + "loss": 0.0005, + "step": 29724 + }, + { + "epoch": 0.58, + "learning_rate": 8.476175682497767e-08, + "loss": 0.0007, + "step": 29725 + }, + { + "epoch": 0.58, + "learning_rate": 8.475787348064153e-08, + "loss": 0.0005, + "step": 29726 + }, + { + "epoch": 0.58, + "learning_rate": 8.475399013630538e-08, + "loss": 0.0005, + "step": 29727 + }, + { + "epoch": 0.58, + "learning_rate": 8.475010679196924e-08, + "loss": 0.0005, + "step": 29728 + }, + { + "epoch": 0.58, + "learning_rate": 8.47462234476331e-08, + "loss": 0.0005, + "step": 29729 + }, + { + "epoch": 0.58, + "learning_rate": 8.474234010329696e-08, + "loss": 0.3051, + "step": 29730 + }, + { + "epoch": 0.58, + "learning_rate": 8.47384567589608e-08, + "loss": 0.0004, + "step": 29731 + }, + { + "epoch": 0.58, + "learning_rate": 8.473457341462466e-08, + "loss": 0.0004, + "step": 29732 + }, + { + "epoch": 0.58, + "learning_rate": 8.473069007028852e-08, + "loss": 0.0063, + "step": 29733 + }, + { + "epoch": 0.58, + "learning_rate": 8.472680672595238e-08, + "loss": 0.0006, + "step": 29734 + }, + { + "epoch": 0.58, + "learning_rate": 8.472292338161624e-08, + "loss": 0.6605, + "step": 29735 + }, + { + "epoch": 0.58, + "learning_rate": 8.47190400372801e-08, + "loss": 0.0004, + "step": 29736 + }, + { + "epoch": 0.58, + "learning_rate": 8.471515669294395e-08, + "loss": 0.0007, + "step": 29737 + }, + { + "epoch": 0.58, + "learning_rate": 8.471127334860781e-08, + "loss": 0.0008, + "step": 29738 + }, + { + "epoch": 0.58, + "learning_rate": 8.470739000427167e-08, + "loss": 0.0005, + "step": 29739 + }, + { + "epoch": 0.58, + "learning_rate": 8.470350665993553e-08, + "loss": 0.0005, + "step": 29740 + }, + { + "epoch": 0.58, + "learning_rate": 8.469962331559939e-08, + "loss": 0.0005, + "step": 29741 + }, + { + "epoch": 0.58, + "learning_rate": 8.469573997126325e-08, + "loss": 0.0005, + "step": 29742 + }, + { + "epoch": 0.58, + "learning_rate": 8.46918566269271e-08, + "loss": 0.0006, + "step": 29743 + }, + { + "epoch": 0.58, + "learning_rate": 8.468797328259096e-08, + "loss": 0.0006, + "step": 29744 + }, + { + "epoch": 0.58, + "learning_rate": 8.468408993825482e-08, + "loss": 0.0005, + "step": 29745 + }, + { + "epoch": 0.58, + "learning_rate": 8.468020659391868e-08, + "loss": 0.4038, + "step": 29746 + }, + { + "epoch": 0.58, + "learning_rate": 8.467632324958254e-08, + "loss": 0.2579, + "step": 29747 + }, + { + "epoch": 0.58, + "learning_rate": 8.46724399052464e-08, + "loss": 0.0006, + "step": 29748 + }, + { + "epoch": 0.58, + "learning_rate": 8.466855656091025e-08, + "loss": 0.0005, + "step": 29749 + }, + { + "epoch": 0.58, + "learning_rate": 8.466467321657411e-08, + "loss": 0.0006, + "step": 29750 + }, + { + "epoch": 0.58, + "learning_rate": 8.466078987223797e-08, + "loss": 0.246, + "step": 29751 + }, + { + "epoch": 0.58, + "learning_rate": 8.465690652790183e-08, + "loss": 0.0004, + "step": 29752 + }, + { + "epoch": 0.58, + "learning_rate": 8.465302318356569e-08, + "loss": 0.0004, + "step": 29753 + }, + { + "epoch": 0.58, + "learning_rate": 8.464913983922954e-08, + "loss": 0.0005, + "step": 29754 + }, + { + "epoch": 0.58, + "learning_rate": 8.46452564948934e-08, + "loss": 0.0007, + "step": 29755 + }, + { + "epoch": 0.58, + "learning_rate": 8.464137315055726e-08, + "loss": 0.0013, + "step": 29756 + }, + { + "epoch": 0.58, + "learning_rate": 8.463748980622112e-08, + "loss": 0.0006, + "step": 29757 + }, + { + "epoch": 0.58, + "learning_rate": 8.463360646188498e-08, + "loss": 0.0005, + "step": 29758 + }, + { + "epoch": 0.58, + "learning_rate": 8.462972311754884e-08, + "loss": 0.0005, + "step": 29759 + }, + { + "epoch": 0.58, + "learning_rate": 8.462583977321268e-08, + "loss": 0.0004, + "step": 29760 + }, + { + "epoch": 0.58, + "learning_rate": 8.462195642887654e-08, + "loss": 0.0005, + "step": 29761 + }, + { + "epoch": 0.58, + "learning_rate": 8.46180730845404e-08, + "loss": 0.0007, + "step": 29762 + }, + { + "epoch": 0.58, + "learning_rate": 8.461418974020426e-08, + "loss": 0.0004, + "step": 29763 + }, + { + "epoch": 0.58, + "learning_rate": 8.461030639586811e-08, + "loss": 0.1034, + "step": 29764 + }, + { + "epoch": 0.58, + "learning_rate": 8.460642305153197e-08, + "loss": 1.1004, + "step": 29765 + }, + { + "epoch": 0.58, + "learning_rate": 8.460253970719583e-08, + "loss": 0.0004, + "step": 29766 + }, + { + "epoch": 0.58, + "learning_rate": 8.459865636285969e-08, + "loss": 0.0006, + "step": 29767 + }, + { + "epoch": 0.58, + "learning_rate": 8.459477301852355e-08, + "loss": 0.0011, + "step": 29768 + }, + { + "epoch": 0.58, + "learning_rate": 8.45908896741874e-08, + "loss": 0.1557, + "step": 29769 + }, + { + "epoch": 0.58, + "learning_rate": 8.458700632985126e-08, + "loss": 0.0006, + "step": 29770 + }, + { + "epoch": 0.58, + "learning_rate": 8.458312298551512e-08, + "loss": 0.1954, + "step": 29771 + }, + { + "epoch": 0.58, + "learning_rate": 8.457923964117898e-08, + "loss": 0.9135, + "step": 29772 + }, + { + "epoch": 0.58, + "learning_rate": 8.457535629684284e-08, + "loss": 0.0005, + "step": 29773 + }, + { + "epoch": 0.58, + "learning_rate": 8.45714729525067e-08, + "loss": 0.0005, + "step": 29774 + }, + { + "epoch": 0.58, + "learning_rate": 8.456758960817055e-08, + "loss": 0.0004, + "step": 29775 + }, + { + "epoch": 0.58, + "learning_rate": 8.456370626383441e-08, + "loss": 0.0005, + "step": 29776 + }, + { + "epoch": 0.58, + "learning_rate": 8.455982291949827e-08, + "loss": 0.001, + "step": 29777 + }, + { + "epoch": 0.58, + "learning_rate": 8.455593957516213e-08, + "loss": 0.0007, + "step": 29778 + }, + { + "epoch": 0.58, + "learning_rate": 8.455205623082599e-08, + "loss": 0.0007, + "step": 29779 + }, + { + "epoch": 0.58, + "learning_rate": 8.454817288648985e-08, + "loss": 0.876, + "step": 29780 + }, + { + "epoch": 0.58, + "learning_rate": 8.45442895421537e-08, + "loss": 0.0005, + "step": 29781 + }, + { + "epoch": 0.58, + "learning_rate": 8.454040619781756e-08, + "loss": 0.0005, + "step": 29782 + }, + { + "epoch": 0.58, + "learning_rate": 8.453652285348142e-08, + "loss": 0.0006, + "step": 29783 + }, + { + "epoch": 0.58, + "learning_rate": 8.453263950914528e-08, + "loss": 0.0004, + "step": 29784 + }, + { + "epoch": 0.58, + "learning_rate": 8.452875616480914e-08, + "loss": 0.3333, + "step": 29785 + }, + { + "epoch": 0.58, + "learning_rate": 8.4524872820473e-08, + "loss": 0.0005, + "step": 29786 + }, + { + "epoch": 0.58, + "learning_rate": 8.452098947613685e-08, + "loss": 0.0006, + "step": 29787 + }, + { + "epoch": 0.58, + "learning_rate": 8.451710613180071e-08, + "loss": 0.0008, + "step": 29788 + }, + { + "epoch": 0.58, + "learning_rate": 8.451322278746456e-08, + "loss": 0.005, + "step": 29789 + }, + { + "epoch": 0.58, + "learning_rate": 8.450933944312841e-08, + "loss": 0.0005, + "step": 29790 + }, + { + "epoch": 0.58, + "learning_rate": 8.450545609879227e-08, + "loss": 0.0006, + "step": 29791 + }, + { + "epoch": 0.58, + "learning_rate": 8.450157275445613e-08, + "loss": 0.0005, + "step": 29792 + }, + { + "epoch": 0.58, + "learning_rate": 8.449768941011999e-08, + "loss": 0.0008, + "step": 29793 + }, + { + "epoch": 0.58, + "learning_rate": 8.449380606578385e-08, + "loss": 0.0007, + "step": 29794 + }, + { + "epoch": 0.58, + "learning_rate": 8.44899227214477e-08, + "loss": 0.0007, + "step": 29795 + }, + { + "epoch": 0.58, + "learning_rate": 8.448603937711156e-08, + "loss": 0.0008, + "step": 29796 + }, + { + "epoch": 0.58, + "learning_rate": 8.448215603277542e-08, + "loss": 0.0005, + "step": 29797 + }, + { + "epoch": 0.58, + "learning_rate": 8.447827268843928e-08, + "loss": 0.0005, + "step": 29798 + }, + { + "epoch": 0.58, + "learning_rate": 8.447438934410314e-08, + "loss": 0.0004, + "step": 29799 + }, + { + "epoch": 0.58, + "learning_rate": 8.4470505999767e-08, + "loss": 0.0005, + "step": 29800 + }, + { + "epoch": 0.58, + "learning_rate": 8.446662265543086e-08, + "loss": 0.0005, + "step": 29801 + }, + { + "epoch": 0.58, + "learning_rate": 8.446273931109471e-08, + "loss": 0.0008, + "step": 29802 + }, + { + "epoch": 0.58, + "learning_rate": 8.445885596675857e-08, + "loss": 0.6603, + "step": 29803 + }, + { + "epoch": 0.58, + "learning_rate": 8.445497262242243e-08, + "loss": 0.0017, + "step": 29804 + }, + { + "epoch": 0.58, + "learning_rate": 8.445108927808629e-08, + "loss": 0.0006, + "step": 29805 + }, + { + "epoch": 0.58, + "learning_rate": 8.444720593375015e-08, + "loss": 0.0004, + "step": 29806 + }, + { + "epoch": 0.58, + "learning_rate": 8.4443322589414e-08, + "loss": 0.0014, + "step": 29807 + }, + { + "epoch": 0.58, + "learning_rate": 8.443943924507786e-08, + "loss": 0.0006, + "step": 29808 + }, + { + "epoch": 0.58, + "learning_rate": 8.443555590074172e-08, + "loss": 0.0007, + "step": 29809 + }, + { + "epoch": 0.58, + "learning_rate": 8.443167255640558e-08, + "loss": 0.0711, + "step": 29810 + }, + { + "epoch": 0.58, + "learning_rate": 8.442778921206944e-08, + "loss": 0.0004, + "step": 29811 + }, + { + "epoch": 0.58, + "learning_rate": 8.44239058677333e-08, + "loss": 0.001, + "step": 29812 + }, + { + "epoch": 0.58, + "learning_rate": 8.442002252339715e-08, + "loss": 0.0005, + "step": 29813 + }, + { + "epoch": 0.58, + "learning_rate": 8.441613917906101e-08, + "loss": 0.0004, + "step": 29814 + }, + { + "epoch": 0.58, + "learning_rate": 8.441225583472487e-08, + "loss": 0.0007, + "step": 29815 + }, + { + "epoch": 0.58, + "learning_rate": 8.440837249038873e-08, + "loss": 1.3089, + "step": 29816 + }, + { + "epoch": 0.58, + "learning_rate": 8.440448914605259e-08, + "loss": 0.0004, + "step": 29817 + }, + { + "epoch": 0.58, + "learning_rate": 8.440060580171643e-08, + "loss": 0.0005, + "step": 29818 + }, + { + "epoch": 0.58, + "learning_rate": 8.439672245738029e-08, + "loss": 0.0005, + "step": 29819 + }, + { + "epoch": 0.58, + "learning_rate": 8.439283911304415e-08, + "loss": 0.0369, + "step": 29820 + }, + { + "epoch": 0.58, + "learning_rate": 8.438895576870801e-08, + "loss": 0.4165, + "step": 29821 + }, + { + "epoch": 0.58, + "learning_rate": 8.438507242437187e-08, + "loss": 0.4472, + "step": 29822 + }, + { + "epoch": 0.58, + "learning_rate": 8.438118908003572e-08, + "loss": 0.0004, + "step": 29823 + }, + { + "epoch": 0.58, + "learning_rate": 8.437730573569958e-08, + "loss": 0.6245, + "step": 29824 + }, + { + "epoch": 0.58, + "learning_rate": 8.437342239136344e-08, + "loss": 0.0005, + "step": 29825 + }, + { + "epoch": 0.58, + "learning_rate": 8.43695390470273e-08, + "loss": 0.0022, + "step": 29826 + }, + { + "epoch": 0.58, + "learning_rate": 8.436565570269116e-08, + "loss": 0.0006, + "step": 29827 + }, + { + "epoch": 0.58, + "learning_rate": 8.436177235835501e-08, + "loss": 0.0007, + "step": 29828 + }, + { + "epoch": 0.58, + "learning_rate": 8.435788901401887e-08, + "loss": 0.0005, + "step": 29829 + }, + { + "epoch": 0.58, + "learning_rate": 8.435400566968273e-08, + "loss": 0.0004, + "step": 29830 + }, + { + "epoch": 0.58, + "learning_rate": 8.435012232534659e-08, + "loss": 0.0004, + "step": 29831 + }, + { + "epoch": 0.58, + "learning_rate": 8.434623898101045e-08, + "loss": 0.0007, + "step": 29832 + }, + { + "epoch": 0.58, + "learning_rate": 8.43423556366743e-08, + "loss": 0.0545, + "step": 29833 + }, + { + "epoch": 0.58, + "learning_rate": 8.433847229233816e-08, + "loss": 0.0406, + "step": 29834 + }, + { + "epoch": 0.58, + "learning_rate": 8.433458894800202e-08, + "loss": 0.0009, + "step": 29835 + }, + { + "epoch": 0.58, + "learning_rate": 8.433070560366588e-08, + "loss": 0.0003, + "step": 29836 + }, + { + "epoch": 0.58, + "learning_rate": 8.432682225932974e-08, + "loss": 0.0007, + "step": 29837 + }, + { + "epoch": 0.58, + "learning_rate": 8.43229389149936e-08, + "loss": 0.0005, + "step": 29838 + }, + { + "epoch": 0.58, + "learning_rate": 8.431905557065746e-08, + "loss": 0.0095, + "step": 29839 + }, + { + "epoch": 0.58, + "learning_rate": 8.431517222632131e-08, + "loss": 0.0003, + "step": 29840 + }, + { + "epoch": 0.58, + "learning_rate": 8.431128888198517e-08, + "loss": 0.0006, + "step": 29841 + }, + { + "epoch": 0.58, + "learning_rate": 8.430740553764903e-08, + "loss": 0.0005, + "step": 29842 + }, + { + "epoch": 0.58, + "learning_rate": 8.430352219331287e-08, + "loss": 0.7386, + "step": 29843 + }, + { + "epoch": 0.58, + "learning_rate": 8.429963884897673e-08, + "loss": 0.0005, + "step": 29844 + }, + { + "epoch": 0.58, + "learning_rate": 8.429575550464059e-08, + "loss": 0.7587, + "step": 29845 + }, + { + "epoch": 0.58, + "learning_rate": 8.429187216030445e-08, + "loss": 0.0538, + "step": 29846 + }, + { + "epoch": 0.58, + "learning_rate": 8.428798881596831e-08, + "loss": 0.0005, + "step": 29847 + }, + { + "epoch": 0.58, + "learning_rate": 8.428410547163217e-08, + "loss": 0.0007, + "step": 29848 + }, + { + "epoch": 0.58, + "learning_rate": 8.428022212729602e-08, + "loss": 0.0269, + "step": 29849 + }, + { + "epoch": 0.58, + "learning_rate": 8.427633878295988e-08, + "loss": 0.0005, + "step": 29850 + }, + { + "epoch": 0.58, + "learning_rate": 8.427245543862374e-08, + "loss": 0.0004, + "step": 29851 + }, + { + "epoch": 0.58, + "learning_rate": 8.42685720942876e-08, + "loss": 0.0005, + "step": 29852 + }, + { + "epoch": 0.58, + "learning_rate": 8.426468874995146e-08, + "loss": 0.0007, + "step": 29853 + }, + { + "epoch": 0.58, + "learning_rate": 8.426080540561532e-08, + "loss": 0.0008, + "step": 29854 + }, + { + "epoch": 0.58, + "learning_rate": 8.425692206127917e-08, + "loss": 0.2572, + "step": 29855 + }, + { + "epoch": 0.58, + "learning_rate": 8.425303871694303e-08, + "loss": 0.0005, + "step": 29856 + }, + { + "epoch": 0.58, + "learning_rate": 8.424915537260688e-08, + "loss": 0.0006, + "step": 29857 + }, + { + "epoch": 0.58, + "learning_rate": 8.424527202827074e-08, + "loss": 0.0005, + "step": 29858 + }, + { + "epoch": 0.58, + "learning_rate": 8.42413886839346e-08, + "loss": 0.0004, + "step": 29859 + }, + { + "epoch": 0.58, + "learning_rate": 8.423750533959845e-08, + "loss": 0.3324, + "step": 29860 + }, + { + "epoch": 0.58, + "learning_rate": 8.423362199526231e-08, + "loss": 0.0005, + "step": 29861 + }, + { + "epoch": 0.58, + "learning_rate": 8.422973865092617e-08, + "loss": 0.0005, + "step": 29862 + }, + { + "epoch": 0.58, + "learning_rate": 8.422585530659003e-08, + "loss": 0.0004, + "step": 29863 + }, + { + "epoch": 0.58, + "learning_rate": 8.422197196225388e-08, + "loss": 0.0006, + "step": 29864 + }, + { + "epoch": 0.58, + "learning_rate": 8.421808861791774e-08, + "loss": 0.0005, + "step": 29865 + }, + { + "epoch": 0.58, + "learning_rate": 8.42142052735816e-08, + "loss": 0.0004, + "step": 29866 + }, + { + "epoch": 0.58, + "learning_rate": 8.421032192924546e-08, + "loss": 0.0006, + "step": 29867 + }, + { + "epoch": 0.58, + "learning_rate": 8.420643858490932e-08, + "loss": 0.0007, + "step": 29868 + }, + { + "epoch": 0.58, + "learning_rate": 8.420255524057318e-08, + "loss": 0.0006, + "step": 29869 + }, + { + "epoch": 0.58, + "learning_rate": 8.419867189623703e-08, + "loss": 0.0088, + "step": 29870 + }, + { + "epoch": 0.58, + "learning_rate": 8.419478855190089e-08, + "loss": 1.0811, + "step": 29871 + }, + { + "epoch": 0.58, + "learning_rate": 8.419090520756475e-08, + "loss": 0.0006, + "step": 29872 + }, + { + "epoch": 0.58, + "learning_rate": 8.418702186322861e-08, + "loss": 0.0007, + "step": 29873 + }, + { + "epoch": 0.58, + "learning_rate": 8.418313851889247e-08, + "loss": 0.0004, + "step": 29874 + }, + { + "epoch": 0.58, + "learning_rate": 8.417925517455633e-08, + "loss": 0.0007, + "step": 29875 + }, + { + "epoch": 0.58, + "learning_rate": 8.417537183022017e-08, + "loss": 0.0005, + "step": 29876 + }, + { + "epoch": 0.58, + "learning_rate": 8.417148848588403e-08, + "loss": 0.0006, + "step": 29877 + }, + { + "epoch": 0.58, + "learning_rate": 8.416760514154789e-08, + "loss": 0.0093, + "step": 29878 + }, + { + "epoch": 0.58, + "learning_rate": 8.416372179721175e-08, + "loss": 0.0004, + "step": 29879 + }, + { + "epoch": 0.58, + "learning_rate": 8.41598384528756e-08, + "loss": 0.3391, + "step": 29880 + }, + { + "epoch": 0.58, + "learning_rate": 8.415595510853946e-08, + "loss": 0.0003, + "step": 29881 + }, + { + "epoch": 0.58, + "learning_rate": 8.415207176420332e-08, + "loss": 0.0005, + "step": 29882 + }, + { + "epoch": 0.58, + "learning_rate": 8.414818841986718e-08, + "loss": 0.0004, + "step": 29883 + }, + { + "epoch": 0.58, + "learning_rate": 8.414430507553104e-08, + "loss": 0.0006, + "step": 29884 + }, + { + "epoch": 0.58, + "learning_rate": 8.41404217311949e-08, + "loss": 0.0004, + "step": 29885 + }, + { + "epoch": 0.58, + "learning_rate": 8.413653838685875e-08, + "loss": 0.0006, + "step": 29886 + }, + { + "epoch": 0.58, + "learning_rate": 8.413265504252261e-08, + "loss": 0.0006, + "step": 29887 + }, + { + "epoch": 0.58, + "learning_rate": 8.412877169818647e-08, + "loss": 0.0005, + "step": 29888 + }, + { + "epoch": 0.58, + "learning_rate": 8.412488835385033e-08, + "loss": 0.9988, + "step": 29889 + }, + { + "epoch": 0.58, + "learning_rate": 8.412100500951419e-08, + "loss": 0.0005, + "step": 29890 + }, + { + "epoch": 0.58, + "learning_rate": 8.411712166517804e-08, + "loss": 0.0004, + "step": 29891 + }, + { + "epoch": 0.58, + "learning_rate": 8.41132383208419e-08, + "loss": 0.0008, + "step": 29892 + }, + { + "epoch": 0.58, + "learning_rate": 8.410935497650576e-08, + "loss": 0.0004, + "step": 29893 + }, + { + "epoch": 0.58, + "learning_rate": 8.410547163216962e-08, + "loss": 0.0005, + "step": 29894 + }, + { + "epoch": 0.58, + "learning_rate": 8.410158828783348e-08, + "loss": 0.0008, + "step": 29895 + }, + { + "epoch": 0.58, + "learning_rate": 8.409770494349734e-08, + "loss": 0.3252, + "step": 29896 + }, + { + "epoch": 0.58, + "learning_rate": 8.40938215991612e-08, + "loss": 0.0005, + "step": 29897 + }, + { + "epoch": 0.58, + "learning_rate": 8.408993825482505e-08, + "loss": 1.2666, + "step": 29898 + }, + { + "epoch": 0.58, + "learning_rate": 8.408605491048891e-08, + "loss": 0.0006, + "step": 29899 + }, + { + "epoch": 0.58, + "learning_rate": 8.408217156615277e-08, + "loss": 0.0005, + "step": 29900 + }, + { + "epoch": 0.58, + "learning_rate": 8.407828822181663e-08, + "loss": 0.0006, + "step": 29901 + }, + { + "epoch": 0.58, + "learning_rate": 8.407440487748048e-08, + "loss": 0.0004, + "step": 29902 + }, + { + "epoch": 0.58, + "learning_rate": 8.407052153314434e-08, + "loss": 0.0004, + "step": 29903 + }, + { + "epoch": 0.58, + "learning_rate": 8.40666381888082e-08, + "loss": 0.0005, + "step": 29904 + }, + { + "epoch": 0.58, + "learning_rate": 8.406275484447205e-08, + "loss": 0.9509, + "step": 29905 + }, + { + "epoch": 0.58, + "learning_rate": 8.40588715001359e-08, + "loss": 0.0006, + "step": 29906 + }, + { + "epoch": 0.58, + "learning_rate": 8.405498815579976e-08, + "loss": 0.0039, + "step": 29907 + }, + { + "epoch": 0.58, + "learning_rate": 8.405110481146362e-08, + "loss": 0.0005, + "step": 29908 + }, + { + "epoch": 0.58, + "learning_rate": 8.404722146712748e-08, + "loss": 0.0005, + "step": 29909 + }, + { + "epoch": 0.58, + "learning_rate": 8.404333812279134e-08, + "loss": 0.0005, + "step": 29910 + }, + { + "epoch": 0.58, + "learning_rate": 8.40394547784552e-08, + "loss": 0.0004, + "step": 29911 + }, + { + "epoch": 0.58, + "learning_rate": 8.403557143411905e-08, + "loss": 0.0004, + "step": 29912 + }, + { + "epoch": 0.58, + "learning_rate": 8.403168808978291e-08, + "loss": 0.0004, + "step": 29913 + }, + { + "epoch": 0.58, + "learning_rate": 8.402780474544677e-08, + "loss": 0.0004, + "step": 29914 + }, + { + "epoch": 0.58, + "learning_rate": 8.402392140111063e-08, + "loss": 0.0007, + "step": 29915 + }, + { + "epoch": 0.58, + "learning_rate": 8.402003805677449e-08, + "loss": 0.0008, + "step": 29916 + }, + { + "epoch": 0.58, + "learning_rate": 8.401615471243835e-08, + "loss": 0.0005, + "step": 29917 + }, + { + "epoch": 0.58, + "learning_rate": 8.40122713681022e-08, + "loss": 0.0006, + "step": 29918 + }, + { + "epoch": 0.58, + "learning_rate": 8.400838802376606e-08, + "loss": 0.0024, + "step": 29919 + }, + { + "epoch": 0.58, + "learning_rate": 8.400450467942992e-08, + "loss": 0.0005, + "step": 29920 + }, + { + "epoch": 0.58, + "learning_rate": 8.400062133509378e-08, + "loss": 0.1756, + "step": 29921 + }, + { + "epoch": 0.58, + "learning_rate": 8.399673799075764e-08, + "loss": 0.0022, + "step": 29922 + }, + { + "epoch": 0.58, + "learning_rate": 8.39928546464215e-08, + "loss": 0.0004, + "step": 29923 + }, + { + "epoch": 0.58, + "learning_rate": 8.398897130208535e-08, + "loss": 1.2812, + "step": 29924 + }, + { + "epoch": 0.58, + "learning_rate": 8.398508795774921e-08, + "loss": 0.0006, + "step": 29925 + }, + { + "epoch": 0.58, + "learning_rate": 8.398120461341307e-08, + "loss": 0.0007, + "step": 29926 + }, + { + "epoch": 0.58, + "learning_rate": 8.397732126907693e-08, + "loss": 0.0004, + "step": 29927 + }, + { + "epoch": 0.58, + "learning_rate": 8.397343792474079e-08, + "loss": 0.0022, + "step": 29928 + }, + { + "epoch": 0.58, + "learning_rate": 8.396955458040464e-08, + "loss": 0.0006, + "step": 29929 + }, + { + "epoch": 0.58, + "learning_rate": 8.39656712360685e-08, + "loss": 0.0006, + "step": 29930 + }, + { + "epoch": 0.58, + "learning_rate": 8.396178789173236e-08, + "loss": 0.0006, + "step": 29931 + }, + { + "epoch": 0.58, + "learning_rate": 8.395790454739622e-08, + "loss": 0.0004, + "step": 29932 + }, + { + "epoch": 0.58, + "learning_rate": 8.395402120306008e-08, + "loss": 0.0082, + "step": 29933 + }, + { + "epoch": 0.58, + "learning_rate": 8.395013785872392e-08, + "loss": 0.002, + "step": 29934 + }, + { + "epoch": 0.58, + "learning_rate": 8.394625451438778e-08, + "loss": 0.0005, + "step": 29935 + }, + { + "epoch": 0.58, + "learning_rate": 8.394237117005164e-08, + "loss": 0.0006, + "step": 29936 + }, + { + "epoch": 0.58, + "learning_rate": 8.39384878257155e-08, + "loss": 0.0007, + "step": 29937 + }, + { + "epoch": 0.58, + "learning_rate": 8.393460448137936e-08, + "loss": 0.0007, + "step": 29938 + }, + { + "epoch": 0.58, + "learning_rate": 8.393072113704321e-08, + "loss": 0.0003, + "step": 29939 + }, + { + "epoch": 0.58, + "learning_rate": 8.392683779270707e-08, + "loss": 0.5864, + "step": 29940 + }, + { + "epoch": 0.58, + "learning_rate": 8.392295444837093e-08, + "loss": 0.0006, + "step": 29941 + }, + { + "epoch": 0.58, + "learning_rate": 8.391907110403479e-08, + "loss": 0.0005, + "step": 29942 + }, + { + "epoch": 0.58, + "learning_rate": 8.391518775969865e-08, + "loss": 0.2585, + "step": 29943 + }, + { + "epoch": 0.58, + "learning_rate": 8.39113044153625e-08, + "loss": 0.0005, + "step": 29944 + }, + { + "epoch": 0.58, + "learning_rate": 8.390742107102636e-08, + "loss": 0.0006, + "step": 29945 + }, + { + "epoch": 0.58, + "learning_rate": 8.390353772669022e-08, + "loss": 0.0006, + "step": 29946 + }, + { + "epoch": 0.58, + "learning_rate": 8.389965438235408e-08, + "loss": 0.0004, + "step": 29947 + }, + { + "epoch": 0.58, + "learning_rate": 8.389577103801794e-08, + "loss": 0.0005, + "step": 29948 + }, + { + "epoch": 0.58, + "learning_rate": 8.38918876936818e-08, + "loss": 0.0006, + "step": 29949 + }, + { + "epoch": 0.58, + "learning_rate": 8.388800434934565e-08, + "loss": 0.0006, + "step": 29950 + }, + { + "epoch": 0.58, + "learning_rate": 8.388412100500951e-08, + "loss": 0.0008, + "step": 29951 + }, + { + "epoch": 0.58, + "learning_rate": 8.388023766067337e-08, + "loss": 0.0005, + "step": 29952 + }, + { + "epoch": 0.58, + "learning_rate": 8.387635431633723e-08, + "loss": 0.0017, + "step": 29953 + }, + { + "epoch": 0.58, + "learning_rate": 8.387247097200109e-08, + "loss": 0.0004, + "step": 29954 + }, + { + "epoch": 0.58, + "learning_rate": 8.386858762766495e-08, + "loss": 0.0007, + "step": 29955 + }, + { + "epoch": 0.58, + "learning_rate": 8.38647042833288e-08, + "loss": 0.0004, + "step": 29956 + }, + { + "epoch": 0.58, + "learning_rate": 8.386082093899266e-08, + "loss": 0.0008, + "step": 29957 + }, + { + "epoch": 0.58, + "learning_rate": 8.385693759465652e-08, + "loss": 0.0008, + "step": 29958 + }, + { + "epoch": 0.58, + "learning_rate": 8.385305425032038e-08, + "loss": 0.0005, + "step": 29959 + }, + { + "epoch": 0.58, + "learning_rate": 8.384917090598424e-08, + "loss": 0.0007, + "step": 29960 + }, + { + "epoch": 0.58, + "learning_rate": 8.38452875616481e-08, + "loss": 0.0005, + "step": 29961 + }, + { + "epoch": 0.58, + "learning_rate": 8.384140421731195e-08, + "loss": 0.0005, + "step": 29962 + }, + { + "epoch": 0.58, + "learning_rate": 8.38375208729758e-08, + "loss": 0.7359, + "step": 29963 + }, + { + "epoch": 0.58, + "learning_rate": 8.383363752863966e-08, + "loss": 0.0005, + "step": 29964 + }, + { + "epoch": 0.58, + "learning_rate": 8.382975418430351e-08, + "loss": 0.0006, + "step": 29965 + }, + { + "epoch": 0.58, + "learning_rate": 8.382587083996737e-08, + "loss": 0.0005, + "step": 29966 + }, + { + "epoch": 0.58, + "learning_rate": 8.382198749563123e-08, + "loss": 0.0005, + "step": 29967 + }, + { + "epoch": 0.58, + "learning_rate": 8.381810415129509e-08, + "loss": 0.0005, + "step": 29968 + }, + { + "epoch": 0.58, + "learning_rate": 8.381422080695895e-08, + "loss": 0.0004, + "step": 29969 + }, + { + "epoch": 0.58, + "learning_rate": 8.38103374626228e-08, + "loss": 0.0005, + "step": 29970 + }, + { + "epoch": 0.58, + "learning_rate": 8.380645411828666e-08, + "loss": 0.0005, + "step": 29971 + }, + { + "epoch": 0.58, + "learning_rate": 8.380257077395052e-08, + "loss": 0.0007, + "step": 29972 + }, + { + "epoch": 0.58, + "learning_rate": 8.379868742961438e-08, + "loss": 0.0006, + "step": 29973 + }, + { + "epoch": 0.58, + "learning_rate": 8.379480408527824e-08, + "loss": 0.0005, + "step": 29974 + }, + { + "epoch": 0.58, + "learning_rate": 8.37909207409421e-08, + "loss": 0.0004, + "step": 29975 + }, + { + "epoch": 0.58, + "learning_rate": 8.378703739660596e-08, + "loss": 0.0004, + "step": 29976 + }, + { + "epoch": 0.58, + "learning_rate": 8.378315405226981e-08, + "loss": 0.0006, + "step": 29977 + }, + { + "epoch": 0.58, + "learning_rate": 8.377927070793367e-08, + "loss": 0.0036, + "step": 29978 + }, + { + "epoch": 0.58, + "learning_rate": 8.377538736359753e-08, + "loss": 0.5667, + "step": 29979 + }, + { + "epoch": 0.58, + "learning_rate": 8.377150401926139e-08, + "loss": 0.0004, + "step": 29980 + }, + { + "epoch": 0.58, + "learning_rate": 8.376762067492525e-08, + "loss": 0.0006, + "step": 29981 + }, + { + "epoch": 0.58, + "learning_rate": 8.37637373305891e-08, + "loss": 0.0004, + "step": 29982 + }, + { + "epoch": 0.58, + "learning_rate": 8.375985398625296e-08, + "loss": 0.0005, + "step": 29983 + }, + { + "epoch": 0.58, + "learning_rate": 8.375597064191682e-08, + "loss": 0.2808, + "step": 29984 + }, + { + "epoch": 0.58, + "learning_rate": 8.375208729758068e-08, + "loss": 0.0004, + "step": 29985 + }, + { + "epoch": 0.58, + "learning_rate": 8.374820395324454e-08, + "loss": 0.0004, + "step": 29986 + }, + { + "epoch": 0.58, + "learning_rate": 8.37443206089084e-08, + "loss": 0.0004, + "step": 29987 + }, + { + "epoch": 0.58, + "learning_rate": 8.374043726457225e-08, + "loss": 0.0004, + "step": 29988 + }, + { + "epoch": 0.58, + "learning_rate": 8.373655392023611e-08, + "loss": 0.0006, + "step": 29989 + }, + { + "epoch": 0.58, + "learning_rate": 8.373267057589997e-08, + "loss": 0.0005, + "step": 29990 + }, + { + "epoch": 0.58, + "learning_rate": 8.372878723156383e-08, + "loss": 0.0004, + "step": 29991 + }, + { + "epoch": 0.58, + "learning_rate": 8.372490388722767e-08, + "loss": 0.0018, + "step": 29992 + }, + { + "epoch": 0.58, + "learning_rate": 8.372102054289153e-08, + "loss": 0.0032, + "step": 29993 + }, + { + "epoch": 0.58, + "learning_rate": 8.371713719855539e-08, + "loss": 0.0007, + "step": 29994 + }, + { + "epoch": 0.58, + "learning_rate": 8.371325385421925e-08, + "loss": 0.0004, + "step": 29995 + }, + { + "epoch": 0.58, + "learning_rate": 8.370937050988311e-08, + "loss": 0.0005, + "step": 29996 + }, + { + "epoch": 0.58, + "learning_rate": 8.370548716554697e-08, + "loss": 0.0007, + "step": 29997 + }, + { + "epoch": 0.58, + "learning_rate": 8.370160382121082e-08, + "loss": 0.0009, + "step": 29998 + }, + { + "epoch": 0.58, + "learning_rate": 8.369772047687468e-08, + "loss": 0.0025, + "step": 29999 + }, + { + "epoch": 0.58, + "learning_rate": 8.369383713253854e-08, + "loss": 0.0005, + "step": 30000 + }, + { + "epoch": 0.58, + "learning_rate": 8.36899537882024e-08, + "loss": 0.001, + "step": 30001 + }, + { + "epoch": 0.58, + "learning_rate": 8.368607044386626e-08, + "loss": 0.0007, + "step": 30002 + }, + { + "epoch": 0.58, + "learning_rate": 8.368218709953011e-08, + "loss": 0.0006, + "step": 30003 + }, + { + "epoch": 0.58, + "learning_rate": 8.367830375519397e-08, + "loss": 0.718, + "step": 30004 + }, + { + "epoch": 0.58, + "learning_rate": 8.367442041085783e-08, + "loss": 1.1258, + "step": 30005 + }, + { + "epoch": 0.58, + "learning_rate": 8.367053706652169e-08, + "loss": 0.0004, + "step": 30006 + }, + { + "epoch": 0.58, + "learning_rate": 8.366665372218555e-08, + "loss": 0.0312, + "step": 30007 + }, + { + "epoch": 0.58, + "learning_rate": 8.36627703778494e-08, + "loss": 1.3289, + "step": 30008 + }, + { + "epoch": 0.58, + "learning_rate": 8.365888703351326e-08, + "loss": 0.4889, + "step": 30009 + }, + { + "epoch": 0.58, + "learning_rate": 8.365500368917712e-08, + "loss": 0.0005, + "step": 30010 + }, + { + "epoch": 0.58, + "learning_rate": 8.365112034484098e-08, + "loss": 0.0005, + "step": 30011 + }, + { + "epoch": 0.58, + "learning_rate": 8.364723700050484e-08, + "loss": 0.0004, + "step": 30012 + }, + { + "epoch": 0.58, + "learning_rate": 8.36433536561687e-08, + "loss": 0.0006, + "step": 30013 + }, + { + "epoch": 0.58, + "learning_rate": 8.363947031183256e-08, + "loss": 0.0004, + "step": 30014 + }, + { + "epoch": 0.58, + "learning_rate": 8.363558696749641e-08, + "loss": 0.0005, + "step": 30015 + }, + { + "epoch": 0.58, + "learning_rate": 8.363170362316027e-08, + "loss": 0.0025, + "step": 30016 + }, + { + "epoch": 0.58, + "learning_rate": 8.362782027882413e-08, + "loss": 0.0004, + "step": 30017 + }, + { + "epoch": 0.58, + "learning_rate": 8.362393693448799e-08, + "loss": 0.0008, + "step": 30018 + }, + { + "epoch": 0.58, + "learning_rate": 8.362005359015185e-08, + "loss": 0.0005, + "step": 30019 + }, + { + "epoch": 0.58, + "learning_rate": 8.361617024581569e-08, + "loss": 0.0006, + "step": 30020 + }, + { + "epoch": 0.58, + "learning_rate": 8.361228690147955e-08, + "loss": 0.0005, + "step": 30021 + }, + { + "epoch": 0.58, + "learning_rate": 8.360840355714341e-08, + "loss": 0.0004, + "step": 30022 + }, + { + "epoch": 0.58, + "learning_rate": 8.360452021280727e-08, + "loss": 0.0006, + "step": 30023 + }, + { + "epoch": 0.58, + "learning_rate": 8.360063686847112e-08, + "loss": 0.0026, + "step": 30024 + }, + { + "epoch": 0.58, + "learning_rate": 8.359675352413498e-08, + "loss": 0.748, + "step": 30025 + }, + { + "epoch": 0.58, + "learning_rate": 8.359287017979884e-08, + "loss": 0.0008, + "step": 30026 + }, + { + "epoch": 0.58, + "learning_rate": 8.35889868354627e-08, + "loss": 0.0022, + "step": 30027 + }, + { + "epoch": 0.58, + "learning_rate": 8.358510349112656e-08, + "loss": 0.0095, + "step": 30028 + }, + { + "epoch": 0.58, + "learning_rate": 8.358122014679042e-08, + "loss": 0.0004, + "step": 30029 + }, + { + "epoch": 0.58, + "learning_rate": 8.357733680245427e-08, + "loss": 0.0005, + "step": 30030 + }, + { + "epoch": 0.58, + "learning_rate": 8.357345345811813e-08, + "loss": 0.0733, + "step": 30031 + }, + { + "epoch": 0.58, + "learning_rate": 8.356957011378199e-08, + "loss": 0.175, + "step": 30032 + }, + { + "epoch": 0.58, + "learning_rate": 8.356568676944585e-08, + "loss": 0.0005, + "step": 30033 + }, + { + "epoch": 0.58, + "learning_rate": 8.35618034251097e-08, + "loss": 0.0004, + "step": 30034 + }, + { + "epoch": 0.58, + "learning_rate": 8.355792008077355e-08, + "loss": 0.5971, + "step": 30035 + }, + { + "epoch": 0.58, + "learning_rate": 8.355403673643741e-08, + "loss": 0.0004, + "step": 30036 + }, + { + "epoch": 0.58, + "learning_rate": 8.355015339210127e-08, + "loss": 1.0462, + "step": 30037 + }, + { + "epoch": 0.58, + "learning_rate": 8.354627004776513e-08, + "loss": 0.0005, + "step": 30038 + }, + { + "epoch": 0.58, + "learning_rate": 8.354238670342899e-08, + "loss": 0.9891, + "step": 30039 + }, + { + "epoch": 0.58, + "learning_rate": 8.353850335909284e-08, + "loss": 0.8208, + "step": 30040 + }, + { + "epoch": 0.58, + "learning_rate": 8.35346200147567e-08, + "loss": 0.0242, + "step": 30041 + }, + { + "epoch": 0.58, + "learning_rate": 8.353073667042056e-08, + "loss": 0.0006, + "step": 30042 + }, + { + "epoch": 0.58, + "learning_rate": 8.352685332608442e-08, + "loss": 0.0005, + "step": 30043 + }, + { + "epoch": 0.58, + "learning_rate": 8.352296998174828e-08, + "loss": 0.0005, + "step": 30044 + }, + { + "epoch": 0.58, + "learning_rate": 8.351908663741213e-08, + "loss": 0.0004, + "step": 30045 + }, + { + "epoch": 0.58, + "learning_rate": 8.351520329307599e-08, + "loss": 1.1752, + "step": 30046 + }, + { + "epoch": 0.58, + "learning_rate": 8.351131994873985e-08, + "loss": 0.0005, + "step": 30047 + }, + { + "epoch": 0.58, + "learning_rate": 8.350743660440371e-08, + "loss": 0.0005, + "step": 30048 + }, + { + "epoch": 0.58, + "learning_rate": 8.350355326006757e-08, + "loss": 0.0005, + "step": 30049 + }, + { + "epoch": 0.58, + "learning_rate": 8.349966991573141e-08, + "loss": 0.0007, + "step": 30050 + }, + { + "epoch": 0.58, + "learning_rate": 8.349578657139527e-08, + "loss": 0.6182, + "step": 30051 + }, + { + "epoch": 0.58, + "learning_rate": 8.349190322705913e-08, + "loss": 0.0012, + "step": 30052 + }, + { + "epoch": 0.58, + "learning_rate": 8.348801988272299e-08, + "loss": 0.0004, + "step": 30053 + }, + { + "epoch": 0.58, + "learning_rate": 8.348413653838685e-08, + "loss": 0.0004, + "step": 30054 + }, + { + "epoch": 0.58, + "learning_rate": 8.34802531940507e-08, + "loss": 0.0026, + "step": 30055 + }, + { + "epoch": 0.58, + "learning_rate": 8.347636984971456e-08, + "loss": 0.0005, + "step": 30056 + }, + { + "epoch": 0.58, + "learning_rate": 8.347248650537842e-08, + "loss": 0.0007, + "step": 30057 + }, + { + "epoch": 0.58, + "learning_rate": 8.346860316104228e-08, + "loss": 0.0006, + "step": 30058 + }, + { + "epoch": 0.58, + "learning_rate": 8.346471981670614e-08, + "loss": 0.0007, + "step": 30059 + }, + { + "epoch": 0.58, + "learning_rate": 8.346083647237e-08, + "loss": 0.3131, + "step": 30060 + }, + { + "epoch": 0.58, + "learning_rate": 8.345695312803385e-08, + "loss": 1.1442, + "step": 30061 + }, + { + "epoch": 0.58, + "learning_rate": 8.345306978369771e-08, + "loss": 0.0005, + "step": 30062 + }, + { + "epoch": 0.58, + "learning_rate": 8.344918643936157e-08, + "loss": 0.0004, + "step": 30063 + }, + { + "epoch": 0.58, + "learning_rate": 8.344530309502543e-08, + "loss": 0.0004, + "step": 30064 + }, + { + "epoch": 0.58, + "learning_rate": 8.344141975068929e-08, + "loss": 0.0006, + "step": 30065 + }, + { + "epoch": 0.58, + "learning_rate": 8.343753640635314e-08, + "loss": 0.0004, + "step": 30066 + }, + { + "epoch": 0.58, + "learning_rate": 8.3433653062017e-08, + "loss": 0.0617, + "step": 30067 + }, + { + "epoch": 0.58, + "learning_rate": 8.342976971768086e-08, + "loss": 0.0005, + "step": 30068 + }, + { + "epoch": 0.58, + "learning_rate": 8.342588637334472e-08, + "loss": 0.0005, + "step": 30069 + }, + { + "epoch": 0.58, + "learning_rate": 8.342200302900858e-08, + "loss": 0.0005, + "step": 30070 + }, + { + "epoch": 0.58, + "learning_rate": 8.341811968467244e-08, + "loss": 0.0019, + "step": 30071 + }, + { + "epoch": 0.58, + "learning_rate": 8.34142363403363e-08, + "loss": 0.0011, + "step": 30072 + }, + { + "epoch": 0.58, + "learning_rate": 8.341035299600015e-08, + "loss": 0.0005, + "step": 30073 + }, + { + "epoch": 0.58, + "learning_rate": 8.340646965166401e-08, + "loss": 0.0004, + "step": 30074 + }, + { + "epoch": 0.58, + "learning_rate": 8.340258630732787e-08, + "loss": 0.0004, + "step": 30075 + }, + { + "epoch": 0.58, + "learning_rate": 8.339870296299173e-08, + "loss": 0.0003, + "step": 30076 + }, + { + "epoch": 0.58, + "learning_rate": 8.339481961865559e-08, + "loss": 0.037, + "step": 30077 + }, + { + "epoch": 0.58, + "learning_rate": 8.339093627431944e-08, + "loss": 0.0004, + "step": 30078 + }, + { + "epoch": 0.58, + "learning_rate": 8.338705292998329e-08, + "loss": 0.0004, + "step": 30079 + }, + { + "epoch": 0.58, + "learning_rate": 8.338316958564715e-08, + "loss": 0.0323, + "step": 30080 + }, + { + "epoch": 0.58, + "learning_rate": 8.3379286241311e-08, + "loss": 0.0005, + "step": 30081 + }, + { + "epoch": 0.58, + "learning_rate": 8.337540289697486e-08, + "loss": 0.0003, + "step": 30082 + }, + { + "epoch": 0.58, + "learning_rate": 8.337151955263872e-08, + "loss": 0.0007, + "step": 30083 + }, + { + "epoch": 0.58, + "learning_rate": 8.336763620830258e-08, + "loss": 1.128, + "step": 30084 + }, + { + "epoch": 0.58, + "learning_rate": 8.336375286396644e-08, + "loss": 0.0006, + "step": 30085 + }, + { + "epoch": 0.58, + "learning_rate": 8.33598695196303e-08, + "loss": 0.0007, + "step": 30086 + }, + { + "epoch": 0.58, + "learning_rate": 8.335598617529415e-08, + "loss": 0.0005, + "step": 30087 + }, + { + "epoch": 0.58, + "learning_rate": 8.335210283095801e-08, + "loss": 0.9436, + "step": 30088 + }, + { + "epoch": 0.58, + "learning_rate": 8.334821948662187e-08, + "loss": 0.0005, + "step": 30089 + }, + { + "epoch": 0.58, + "learning_rate": 8.334433614228573e-08, + "loss": 0.0014, + "step": 30090 + }, + { + "epoch": 0.58, + "learning_rate": 8.334045279794959e-08, + "loss": 0.0573, + "step": 30091 + }, + { + "epoch": 0.58, + "learning_rate": 8.333656945361345e-08, + "loss": 0.0006, + "step": 30092 + }, + { + "epoch": 0.58, + "learning_rate": 8.33326861092773e-08, + "loss": 0.0009, + "step": 30093 + }, + { + "epoch": 0.58, + "learning_rate": 8.332880276494116e-08, + "loss": 0.0004, + "step": 30094 + }, + { + "epoch": 0.58, + "learning_rate": 8.332491942060502e-08, + "loss": 0.0006, + "step": 30095 + }, + { + "epoch": 0.58, + "learning_rate": 8.332103607626888e-08, + "loss": 1.1364, + "step": 30096 + }, + { + "epoch": 0.58, + "learning_rate": 8.331715273193274e-08, + "loss": 0.0364, + "step": 30097 + }, + { + "epoch": 0.58, + "learning_rate": 8.33132693875966e-08, + "loss": 0.0005, + "step": 30098 + }, + { + "epoch": 0.58, + "learning_rate": 8.330938604326045e-08, + "loss": 0.0014, + "step": 30099 + }, + { + "epoch": 0.58, + "learning_rate": 8.330550269892431e-08, + "loss": 0.014, + "step": 30100 + }, + { + "epoch": 0.58, + "learning_rate": 8.330161935458817e-08, + "loss": 0.0006, + "step": 30101 + }, + { + "epoch": 0.58, + "learning_rate": 8.329773601025203e-08, + "loss": 0.0567, + "step": 30102 + }, + { + "epoch": 0.58, + "learning_rate": 8.329385266591589e-08, + "loss": 0.0008, + "step": 30103 + }, + { + "epoch": 0.58, + "learning_rate": 8.328996932157974e-08, + "loss": 0.0008, + "step": 30104 + }, + { + "epoch": 0.58, + "learning_rate": 8.32860859772436e-08, + "loss": 0.4215, + "step": 30105 + }, + { + "epoch": 0.58, + "learning_rate": 8.328220263290746e-08, + "loss": 0.0004, + "step": 30106 + }, + { + "epoch": 0.58, + "learning_rate": 8.327831928857132e-08, + "loss": 0.1893, + "step": 30107 + }, + { + "epoch": 0.58, + "learning_rate": 8.327443594423516e-08, + "loss": 0.0006, + "step": 30108 + }, + { + "epoch": 0.58, + "learning_rate": 8.327055259989902e-08, + "loss": 0.0009, + "step": 30109 + }, + { + "epoch": 0.58, + "learning_rate": 8.326666925556288e-08, + "loss": 0.0023, + "step": 30110 + }, + { + "epoch": 0.58, + "learning_rate": 8.326278591122674e-08, + "loss": 0.0008, + "step": 30111 + }, + { + "epoch": 0.58, + "learning_rate": 8.32589025668906e-08, + "loss": 0.0006, + "step": 30112 + }, + { + "epoch": 0.58, + "learning_rate": 8.325501922255446e-08, + "loss": 0.0004, + "step": 30113 + }, + { + "epoch": 0.58, + "learning_rate": 8.325113587821831e-08, + "loss": 0.0005, + "step": 30114 + }, + { + "epoch": 0.58, + "learning_rate": 8.324725253388217e-08, + "loss": 0.7406, + "step": 30115 + }, + { + "epoch": 0.58, + "learning_rate": 8.324336918954603e-08, + "loss": 0.001, + "step": 30116 + }, + { + "epoch": 0.58, + "learning_rate": 8.323948584520989e-08, + "loss": 0.0004, + "step": 30117 + }, + { + "epoch": 0.58, + "learning_rate": 8.323560250087375e-08, + "loss": 0.002, + "step": 30118 + }, + { + "epoch": 0.58, + "learning_rate": 8.32317191565376e-08, + "loss": 0.0004, + "step": 30119 + }, + { + "epoch": 0.58, + "learning_rate": 8.322783581220146e-08, + "loss": 0.6064, + "step": 30120 + }, + { + "epoch": 0.58, + "learning_rate": 8.322395246786532e-08, + "loss": 0.001, + "step": 30121 + }, + { + "epoch": 0.58, + "learning_rate": 8.322006912352918e-08, + "loss": 0.0006, + "step": 30122 + }, + { + "epoch": 0.58, + "learning_rate": 8.321618577919304e-08, + "loss": 0.0037, + "step": 30123 + }, + { + "epoch": 0.58, + "learning_rate": 8.32123024348569e-08, + "loss": 0.0007, + "step": 30124 + }, + { + "epoch": 0.58, + "learning_rate": 8.320841909052075e-08, + "loss": 0.0011, + "step": 30125 + }, + { + "epoch": 0.58, + "learning_rate": 8.320453574618461e-08, + "loss": 0.8483, + "step": 30126 + }, + { + "epoch": 0.58, + "learning_rate": 8.320065240184847e-08, + "loss": 0.001, + "step": 30127 + }, + { + "epoch": 0.58, + "learning_rate": 8.319676905751233e-08, + "loss": 0.0005, + "step": 30128 + }, + { + "epoch": 0.58, + "learning_rate": 8.319288571317619e-08, + "loss": 0.0004, + "step": 30129 + }, + { + "epoch": 0.58, + "learning_rate": 8.318900236884005e-08, + "loss": 0.0004, + "step": 30130 + }, + { + "epoch": 0.58, + "learning_rate": 8.31851190245039e-08, + "loss": 0.0006, + "step": 30131 + }, + { + "epoch": 0.58, + "learning_rate": 8.318123568016776e-08, + "loss": 0.0005, + "step": 30132 + }, + { + "epoch": 0.58, + "learning_rate": 8.317735233583162e-08, + "loss": 0.0005, + "step": 30133 + }, + { + "epoch": 0.58, + "learning_rate": 8.317346899149548e-08, + "loss": 0.0005, + "step": 30134 + }, + { + "epoch": 0.58, + "learning_rate": 8.316958564715934e-08, + "loss": 0.0003, + "step": 30135 + }, + { + "epoch": 0.58, + "learning_rate": 8.31657023028232e-08, + "loss": 1.1957, + "step": 30136 + }, + { + "epoch": 0.58, + "learning_rate": 8.316181895848704e-08, + "loss": 0.4265, + "step": 30137 + }, + { + "epoch": 0.58, + "learning_rate": 8.31579356141509e-08, + "loss": 0.0006, + "step": 30138 + }, + { + "epoch": 0.58, + "learning_rate": 8.315405226981476e-08, + "loss": 0.0005, + "step": 30139 + }, + { + "epoch": 0.58, + "learning_rate": 8.315016892547861e-08, + "loss": 0.0006, + "step": 30140 + }, + { + "epoch": 0.58, + "learning_rate": 8.314628558114247e-08, + "loss": 0.0004, + "step": 30141 + }, + { + "epoch": 0.58, + "learning_rate": 8.314240223680633e-08, + "loss": 0.0023, + "step": 30142 + }, + { + "epoch": 0.58, + "learning_rate": 8.313851889247019e-08, + "loss": 0.0006, + "step": 30143 + }, + { + "epoch": 0.58, + "learning_rate": 8.313463554813405e-08, + "loss": 0.0004, + "step": 30144 + }, + { + "epoch": 0.58, + "learning_rate": 8.31307522037979e-08, + "loss": 0.0008, + "step": 30145 + }, + { + "epoch": 0.58, + "learning_rate": 8.312686885946176e-08, + "loss": 0.0005, + "step": 30146 + }, + { + "epoch": 0.58, + "learning_rate": 8.312298551512562e-08, + "loss": 0.0005, + "step": 30147 + }, + { + "epoch": 0.58, + "learning_rate": 8.311910217078948e-08, + "loss": 0.0005, + "step": 30148 + }, + { + "epoch": 0.58, + "learning_rate": 8.311521882645334e-08, + "loss": 0.0004, + "step": 30149 + }, + { + "epoch": 0.58, + "learning_rate": 8.31113354821172e-08, + "loss": 0.6015, + "step": 30150 + }, + { + "epoch": 0.58, + "learning_rate": 8.310745213778106e-08, + "loss": 0.0006, + "step": 30151 + }, + { + "epoch": 0.58, + "learning_rate": 8.310356879344491e-08, + "loss": 0.227, + "step": 30152 + }, + { + "epoch": 0.58, + "learning_rate": 8.309968544910877e-08, + "loss": 0.0007, + "step": 30153 + }, + { + "epoch": 0.58, + "learning_rate": 8.309580210477263e-08, + "loss": 0.0005, + "step": 30154 + }, + { + "epoch": 0.58, + "learning_rate": 8.309191876043649e-08, + "loss": 0.002, + "step": 30155 + }, + { + "epoch": 0.58, + "learning_rate": 8.308803541610035e-08, + "loss": 0.0005, + "step": 30156 + }, + { + "epoch": 0.58, + "learning_rate": 8.30841520717642e-08, + "loss": 0.0128, + "step": 30157 + }, + { + "epoch": 0.59, + "learning_rate": 8.308026872742806e-08, + "loss": 0.0515, + "step": 30158 + }, + { + "epoch": 0.59, + "learning_rate": 8.307638538309192e-08, + "loss": 0.0006, + "step": 30159 + }, + { + "epoch": 0.59, + "learning_rate": 8.307250203875578e-08, + "loss": 0.0008, + "step": 30160 + }, + { + "epoch": 0.59, + "learning_rate": 8.306861869441964e-08, + "loss": 0.0005, + "step": 30161 + }, + { + "epoch": 0.59, + "learning_rate": 8.30647353500835e-08, + "loss": 0.0007, + "step": 30162 + }, + { + "epoch": 0.59, + "learning_rate": 8.306085200574735e-08, + "loss": 1.4469, + "step": 30163 + }, + { + "epoch": 0.59, + "learning_rate": 8.305696866141121e-08, + "loss": 0.0005, + "step": 30164 + }, + { + "epoch": 0.59, + "learning_rate": 8.305308531707507e-08, + "loss": 0.0019, + "step": 30165 + }, + { + "epoch": 0.59, + "learning_rate": 8.304920197273892e-08, + "loss": 0.0007, + "step": 30166 + }, + { + "epoch": 0.59, + "learning_rate": 8.304531862840277e-08, + "loss": 0.0217, + "step": 30167 + }, + { + "epoch": 0.59, + "learning_rate": 8.304143528406663e-08, + "loss": 0.0006, + "step": 30168 + }, + { + "epoch": 0.59, + "learning_rate": 8.303755193973049e-08, + "loss": 0.0007, + "step": 30169 + }, + { + "epoch": 0.59, + "learning_rate": 8.303366859539435e-08, + "loss": 0.0006, + "step": 30170 + }, + { + "epoch": 0.59, + "learning_rate": 8.302978525105821e-08, + "loss": 0.0044, + "step": 30171 + }, + { + "epoch": 0.59, + "learning_rate": 8.302590190672207e-08, + "loss": 0.8606, + "step": 30172 + }, + { + "epoch": 0.59, + "learning_rate": 8.302201856238592e-08, + "loss": 0.0297, + "step": 30173 + }, + { + "epoch": 0.59, + "learning_rate": 8.301813521804978e-08, + "loss": 0.0005, + "step": 30174 + }, + { + "epoch": 0.59, + "learning_rate": 8.301425187371364e-08, + "loss": 0.0008, + "step": 30175 + }, + { + "epoch": 0.59, + "learning_rate": 8.30103685293775e-08, + "loss": 0.0006, + "step": 30176 + }, + { + "epoch": 0.59, + "learning_rate": 8.300648518504136e-08, + "loss": 0.0018, + "step": 30177 + }, + { + "epoch": 0.59, + "learning_rate": 8.300260184070521e-08, + "loss": 0.0031, + "step": 30178 + }, + { + "epoch": 0.59, + "learning_rate": 8.299871849636907e-08, + "loss": 0.001, + "step": 30179 + }, + { + "epoch": 0.59, + "learning_rate": 8.299483515203293e-08, + "loss": 0.1239, + "step": 30180 + }, + { + "epoch": 0.59, + "learning_rate": 8.299095180769679e-08, + "loss": 0.0006, + "step": 30181 + }, + { + "epoch": 0.59, + "learning_rate": 8.298706846336065e-08, + "loss": 0.0013, + "step": 30182 + }, + { + "epoch": 0.59, + "learning_rate": 8.29831851190245e-08, + "loss": 0.0006, + "step": 30183 + }, + { + "epoch": 0.59, + "learning_rate": 8.297930177468836e-08, + "loss": 0.0005, + "step": 30184 + }, + { + "epoch": 0.59, + "learning_rate": 8.297541843035222e-08, + "loss": 0.0006, + "step": 30185 + }, + { + "epoch": 0.59, + "learning_rate": 8.297153508601608e-08, + "loss": 0.0005, + "step": 30186 + }, + { + "epoch": 0.59, + "learning_rate": 8.296765174167994e-08, + "loss": 0.0012, + "step": 30187 + }, + { + "epoch": 0.59, + "learning_rate": 8.29637683973438e-08, + "loss": 0.0006, + "step": 30188 + }, + { + "epoch": 0.59, + "learning_rate": 8.295988505300766e-08, + "loss": 0.0004, + "step": 30189 + }, + { + "epoch": 0.59, + "learning_rate": 8.295600170867151e-08, + "loss": 0.0128, + "step": 30190 + }, + { + "epoch": 0.59, + "learning_rate": 8.295211836433537e-08, + "loss": 0.0003, + "step": 30191 + }, + { + "epoch": 0.59, + "learning_rate": 8.294823501999923e-08, + "loss": 0.0005, + "step": 30192 + }, + { + "epoch": 0.59, + "learning_rate": 8.294435167566309e-08, + "loss": 0.0005, + "step": 30193 + }, + { + "epoch": 0.59, + "learning_rate": 8.294046833132695e-08, + "loss": 0.0005, + "step": 30194 + }, + { + "epoch": 0.59, + "learning_rate": 8.293658498699079e-08, + "loss": 0.0005, + "step": 30195 + }, + { + "epoch": 0.59, + "learning_rate": 8.293270164265465e-08, + "loss": 0.0004, + "step": 30196 + }, + { + "epoch": 0.59, + "learning_rate": 8.292881829831851e-08, + "loss": 0.0006, + "step": 30197 + }, + { + "epoch": 0.59, + "learning_rate": 8.292493495398237e-08, + "loss": 0.0006, + "step": 30198 + }, + { + "epoch": 0.59, + "learning_rate": 8.292105160964622e-08, + "loss": 0.0012, + "step": 30199 + }, + { + "epoch": 0.59, + "learning_rate": 8.291716826531008e-08, + "loss": 0.0006, + "step": 30200 + }, + { + "epoch": 0.59, + "learning_rate": 8.291328492097394e-08, + "loss": 0.0005, + "step": 30201 + }, + { + "epoch": 0.59, + "learning_rate": 8.29094015766378e-08, + "loss": 0.0008, + "step": 30202 + }, + { + "epoch": 0.59, + "learning_rate": 8.290551823230166e-08, + "loss": 1.0395, + "step": 30203 + }, + { + "epoch": 0.59, + "learning_rate": 8.290163488796552e-08, + "loss": 0.0005, + "step": 30204 + }, + { + "epoch": 0.59, + "learning_rate": 8.289775154362937e-08, + "loss": 0.0003, + "step": 30205 + }, + { + "epoch": 0.59, + "learning_rate": 8.289386819929323e-08, + "loss": 0.002, + "step": 30206 + }, + { + "epoch": 0.59, + "learning_rate": 8.288998485495709e-08, + "loss": 0.0004, + "step": 30207 + }, + { + "epoch": 0.59, + "learning_rate": 8.288610151062095e-08, + "loss": 0.0005, + "step": 30208 + }, + { + "epoch": 0.59, + "learning_rate": 8.288221816628481e-08, + "loss": 0.0006, + "step": 30209 + }, + { + "epoch": 0.59, + "learning_rate": 8.287833482194867e-08, + "loss": 0.0006, + "step": 30210 + }, + { + "epoch": 0.59, + "learning_rate": 8.287445147761251e-08, + "loss": 0.0005, + "step": 30211 + }, + { + "epoch": 0.59, + "learning_rate": 8.287056813327637e-08, + "loss": 0.0004, + "step": 30212 + }, + { + "epoch": 0.59, + "learning_rate": 8.286668478894023e-08, + "loss": 0.0003, + "step": 30213 + }, + { + "epoch": 0.59, + "learning_rate": 8.286280144460409e-08, + "loss": 0.0005, + "step": 30214 + }, + { + "epoch": 0.59, + "learning_rate": 8.285891810026794e-08, + "loss": 0.0004, + "step": 30215 + }, + { + "epoch": 0.59, + "learning_rate": 8.28550347559318e-08, + "loss": 0.0006, + "step": 30216 + }, + { + "epoch": 0.59, + "learning_rate": 8.285115141159566e-08, + "loss": 0.0005, + "step": 30217 + }, + { + "epoch": 0.59, + "learning_rate": 8.284726806725952e-08, + "loss": 0.5792, + "step": 30218 + }, + { + "epoch": 0.59, + "learning_rate": 8.284338472292338e-08, + "loss": 0.0017, + "step": 30219 + }, + { + "epoch": 0.59, + "learning_rate": 8.283950137858723e-08, + "loss": 0.5174, + "step": 30220 + }, + { + "epoch": 0.59, + "learning_rate": 8.283561803425109e-08, + "loss": 0.0007, + "step": 30221 + }, + { + "epoch": 0.59, + "learning_rate": 8.283173468991495e-08, + "loss": 0.0006, + "step": 30222 + }, + { + "epoch": 0.59, + "learning_rate": 8.282785134557881e-08, + "loss": 0.0004, + "step": 30223 + }, + { + "epoch": 0.59, + "learning_rate": 8.282396800124267e-08, + "loss": 0.0005, + "step": 30224 + }, + { + "epoch": 0.59, + "learning_rate": 8.282008465690653e-08, + "loss": 0.2964, + "step": 30225 + }, + { + "epoch": 0.59, + "learning_rate": 8.281620131257037e-08, + "loss": 0.565, + "step": 30226 + }, + { + "epoch": 0.59, + "learning_rate": 8.281231796823423e-08, + "loss": 0.0005, + "step": 30227 + }, + { + "epoch": 0.59, + "learning_rate": 8.280843462389809e-08, + "loss": 0.0636, + "step": 30228 + }, + { + "epoch": 0.59, + "learning_rate": 8.280455127956195e-08, + "loss": 0.0009, + "step": 30229 + }, + { + "epoch": 0.59, + "learning_rate": 8.28006679352258e-08, + "loss": 0.0006, + "step": 30230 + }, + { + "epoch": 0.59, + "learning_rate": 8.279678459088966e-08, + "loss": 0.0007, + "step": 30231 + }, + { + "epoch": 0.59, + "learning_rate": 8.279290124655352e-08, + "loss": 0.0006, + "step": 30232 + }, + { + "epoch": 0.59, + "learning_rate": 8.278901790221738e-08, + "loss": 0.0006, + "step": 30233 + }, + { + "epoch": 0.59, + "learning_rate": 8.278513455788124e-08, + "loss": 0.0003, + "step": 30234 + }, + { + "epoch": 0.59, + "learning_rate": 8.27812512135451e-08, + "loss": 0.0004, + "step": 30235 + }, + { + "epoch": 0.59, + "learning_rate": 8.277736786920895e-08, + "loss": 0.0007, + "step": 30236 + }, + { + "epoch": 0.59, + "learning_rate": 8.277348452487281e-08, + "loss": 0.0004, + "step": 30237 + }, + { + "epoch": 0.59, + "learning_rate": 8.276960118053667e-08, + "loss": 0.0006, + "step": 30238 + }, + { + "epoch": 0.59, + "learning_rate": 8.276571783620053e-08, + "loss": 0.0004, + "step": 30239 + }, + { + "epoch": 0.59, + "learning_rate": 8.276183449186439e-08, + "loss": 1.6943, + "step": 30240 + }, + { + "epoch": 0.59, + "learning_rate": 8.275795114752824e-08, + "loss": 0.0006, + "step": 30241 + }, + { + "epoch": 0.59, + "learning_rate": 8.27540678031921e-08, + "loss": 0.0008, + "step": 30242 + }, + { + "epoch": 0.59, + "learning_rate": 8.275018445885596e-08, + "loss": 0.0004, + "step": 30243 + }, + { + "epoch": 0.59, + "learning_rate": 8.274630111451982e-08, + "loss": 0.0004, + "step": 30244 + }, + { + "epoch": 0.59, + "learning_rate": 8.274241777018368e-08, + "loss": 0.0004, + "step": 30245 + }, + { + "epoch": 0.59, + "learning_rate": 8.273853442584754e-08, + "loss": 0.0004, + "step": 30246 + }, + { + "epoch": 0.59, + "learning_rate": 8.27346510815114e-08, + "loss": 0.0009, + "step": 30247 + }, + { + "epoch": 0.59, + "learning_rate": 8.273076773717525e-08, + "loss": 0.1115, + "step": 30248 + }, + { + "epoch": 0.59, + "learning_rate": 8.272688439283911e-08, + "loss": 0.0004, + "step": 30249 + }, + { + "epoch": 0.59, + "learning_rate": 8.272300104850297e-08, + "loss": 0.0004, + "step": 30250 + }, + { + "epoch": 0.59, + "learning_rate": 8.271911770416683e-08, + "loss": 0.0009, + "step": 30251 + }, + { + "epoch": 0.59, + "learning_rate": 8.271523435983069e-08, + "loss": 0.0003, + "step": 30252 + }, + { + "epoch": 0.59, + "learning_rate": 8.271135101549453e-08, + "loss": 0.0005, + "step": 30253 + }, + { + "epoch": 0.59, + "learning_rate": 8.270746767115839e-08, + "loss": 0.0894, + "step": 30254 + }, + { + "epoch": 0.59, + "learning_rate": 8.270358432682225e-08, + "loss": 0.0198, + "step": 30255 + }, + { + "epoch": 0.59, + "learning_rate": 8.26997009824861e-08, + "loss": 0.589, + "step": 30256 + }, + { + "epoch": 0.59, + "learning_rate": 8.269581763814996e-08, + "loss": 0.0007, + "step": 30257 + }, + { + "epoch": 0.59, + "learning_rate": 8.269193429381382e-08, + "loss": 0.0004, + "step": 30258 + }, + { + "epoch": 0.59, + "learning_rate": 8.268805094947768e-08, + "loss": 0.3262, + "step": 30259 + }, + { + "epoch": 0.59, + "learning_rate": 8.268416760514154e-08, + "loss": 0.0007, + "step": 30260 + }, + { + "epoch": 0.59, + "learning_rate": 8.26802842608054e-08, + "loss": 0.0005, + "step": 30261 + }, + { + "epoch": 0.59, + "learning_rate": 8.267640091646925e-08, + "loss": 0.0003, + "step": 30262 + }, + { + "epoch": 0.59, + "learning_rate": 8.267251757213311e-08, + "loss": 0.0227, + "step": 30263 + }, + { + "epoch": 0.59, + "learning_rate": 8.266863422779697e-08, + "loss": 0.0035, + "step": 30264 + }, + { + "epoch": 0.59, + "learning_rate": 8.266475088346083e-08, + "loss": 0.0006, + "step": 30265 + }, + { + "epoch": 0.59, + "learning_rate": 8.266086753912469e-08, + "loss": 0.0004, + "step": 30266 + }, + { + "epoch": 0.59, + "learning_rate": 8.265698419478855e-08, + "loss": 0.0005, + "step": 30267 + }, + { + "epoch": 0.59, + "learning_rate": 8.26531008504524e-08, + "loss": 0.0004, + "step": 30268 + }, + { + "epoch": 0.59, + "learning_rate": 8.264921750611626e-08, + "loss": 0.0033, + "step": 30269 + }, + { + "epoch": 0.59, + "learning_rate": 8.264533416178012e-08, + "loss": 0.0007, + "step": 30270 + }, + { + "epoch": 0.59, + "learning_rate": 8.264145081744398e-08, + "loss": 0.0006, + "step": 30271 + }, + { + "epoch": 0.59, + "learning_rate": 8.263756747310784e-08, + "loss": 0.0006, + "step": 30272 + }, + { + "epoch": 0.59, + "learning_rate": 8.26336841287717e-08, + "loss": 0.0004, + "step": 30273 + }, + { + "epoch": 0.59, + "learning_rate": 8.262980078443555e-08, + "loss": 0.0011, + "step": 30274 + }, + { + "epoch": 0.59, + "learning_rate": 8.262591744009941e-08, + "loss": 0.0005, + "step": 30275 + }, + { + "epoch": 0.59, + "learning_rate": 8.262203409576327e-08, + "loss": 0.0005, + "step": 30276 + }, + { + "epoch": 0.59, + "learning_rate": 8.261815075142713e-08, + "loss": 0.0003, + "step": 30277 + }, + { + "epoch": 0.59, + "learning_rate": 8.261426740709099e-08, + "loss": 0.001, + "step": 30278 + }, + { + "epoch": 0.59, + "learning_rate": 8.261038406275484e-08, + "loss": 0.0008, + "step": 30279 + }, + { + "epoch": 0.59, + "learning_rate": 8.26065007184187e-08, + "loss": 0.0004, + "step": 30280 + }, + { + "epoch": 0.59, + "learning_rate": 8.260261737408256e-08, + "loss": 0.0004, + "step": 30281 + }, + { + "epoch": 0.59, + "learning_rate": 8.25987340297464e-08, + "loss": 0.0004, + "step": 30282 + }, + { + "epoch": 0.59, + "learning_rate": 8.259485068541026e-08, + "loss": 0.0006, + "step": 30283 + }, + { + "epoch": 0.59, + "learning_rate": 8.259096734107412e-08, + "loss": 0.0005, + "step": 30284 + }, + { + "epoch": 0.59, + "learning_rate": 8.258708399673798e-08, + "loss": 0.0004, + "step": 30285 + }, + { + "epoch": 0.59, + "learning_rate": 8.258320065240184e-08, + "loss": 0.0003, + "step": 30286 + }, + { + "epoch": 0.59, + "learning_rate": 8.25793173080657e-08, + "loss": 0.0004, + "step": 30287 + }, + { + "epoch": 0.59, + "learning_rate": 8.257543396372956e-08, + "loss": 0.0006, + "step": 30288 + }, + { + "epoch": 0.59, + "learning_rate": 8.257155061939341e-08, + "loss": 0.0005, + "step": 30289 + }, + { + "epoch": 0.59, + "learning_rate": 8.256766727505727e-08, + "loss": 0.0005, + "step": 30290 + }, + { + "epoch": 0.59, + "learning_rate": 8.256378393072113e-08, + "loss": 0.0007, + "step": 30291 + }, + { + "epoch": 0.59, + "learning_rate": 8.255990058638499e-08, + "loss": 1.0138, + "step": 30292 + }, + { + "epoch": 0.59, + "learning_rate": 8.255601724204885e-08, + "loss": 0.0006, + "step": 30293 + }, + { + "epoch": 0.59, + "learning_rate": 8.25521338977127e-08, + "loss": 0.698, + "step": 30294 + }, + { + "epoch": 0.59, + "learning_rate": 8.254825055337656e-08, + "loss": 0.0007, + "step": 30295 + }, + { + "epoch": 0.59, + "learning_rate": 8.254436720904042e-08, + "loss": 0.0007, + "step": 30296 + }, + { + "epoch": 0.59, + "learning_rate": 8.254048386470428e-08, + "loss": 0.001, + "step": 30297 + }, + { + "epoch": 0.59, + "learning_rate": 8.253660052036814e-08, + "loss": 0.0004, + "step": 30298 + }, + { + "epoch": 0.59, + "learning_rate": 8.2532717176032e-08, + "loss": 0.0007, + "step": 30299 + }, + { + "epoch": 0.59, + "learning_rate": 8.252883383169585e-08, + "loss": 0.0073, + "step": 30300 + }, + { + "epoch": 0.59, + "learning_rate": 8.252495048735971e-08, + "loss": 0.0004, + "step": 30301 + }, + { + "epoch": 0.59, + "learning_rate": 8.252106714302357e-08, + "loss": 0.0007, + "step": 30302 + }, + { + "epoch": 0.59, + "learning_rate": 8.251718379868743e-08, + "loss": 0.0006, + "step": 30303 + }, + { + "epoch": 0.59, + "learning_rate": 8.251330045435129e-08, + "loss": 0.0005, + "step": 30304 + }, + { + "epoch": 0.59, + "learning_rate": 8.250941711001515e-08, + "loss": 0.0003, + "step": 30305 + }, + { + "epoch": 0.59, + "learning_rate": 8.2505533765679e-08, + "loss": 0.0091, + "step": 30306 + }, + { + "epoch": 0.59, + "learning_rate": 8.250165042134286e-08, + "loss": 0.2299, + "step": 30307 + }, + { + "epoch": 0.59, + "learning_rate": 8.249776707700672e-08, + "loss": 0.0005, + "step": 30308 + }, + { + "epoch": 0.59, + "learning_rate": 8.249388373267058e-08, + "loss": 0.0007, + "step": 30309 + }, + { + "epoch": 0.59, + "learning_rate": 8.249000038833444e-08, + "loss": 0.0006, + "step": 30310 + }, + { + "epoch": 0.59, + "learning_rate": 8.248611704399828e-08, + "loss": 0.0014, + "step": 30311 + }, + { + "epoch": 0.59, + "learning_rate": 8.248223369966214e-08, + "loss": 0.0005, + "step": 30312 + }, + { + "epoch": 0.59, + "learning_rate": 8.2478350355326e-08, + "loss": 0.0004, + "step": 30313 + }, + { + "epoch": 0.59, + "learning_rate": 8.247446701098986e-08, + "loss": 0.0006, + "step": 30314 + }, + { + "epoch": 0.59, + "learning_rate": 8.247058366665371e-08, + "loss": 0.0005, + "step": 30315 + }, + { + "epoch": 0.59, + "learning_rate": 8.246670032231757e-08, + "loss": 0.0005, + "step": 30316 + }, + { + "epoch": 0.59, + "learning_rate": 8.246281697798143e-08, + "loss": 0.0005, + "step": 30317 + }, + { + "epoch": 0.59, + "learning_rate": 8.245893363364529e-08, + "loss": 0.0006, + "step": 30318 + }, + { + "epoch": 0.59, + "learning_rate": 8.245505028930915e-08, + "loss": 1.1595, + "step": 30319 + }, + { + "epoch": 0.59, + "learning_rate": 8.2451166944973e-08, + "loss": 0.0006, + "step": 30320 + }, + { + "epoch": 0.59, + "learning_rate": 8.244728360063686e-08, + "loss": 0.0009, + "step": 30321 + }, + { + "epoch": 0.59, + "learning_rate": 8.244340025630072e-08, + "loss": 0.0517, + "step": 30322 + }, + { + "epoch": 0.59, + "learning_rate": 8.243951691196458e-08, + "loss": 0.0325, + "step": 30323 + }, + { + "epoch": 0.59, + "learning_rate": 8.243563356762844e-08, + "loss": 0.0005, + "step": 30324 + }, + { + "epoch": 0.59, + "learning_rate": 8.24317502232923e-08, + "loss": 0.0006, + "step": 30325 + }, + { + "epoch": 0.59, + "learning_rate": 8.242786687895616e-08, + "loss": 0.0024, + "step": 30326 + }, + { + "epoch": 0.59, + "learning_rate": 8.242398353462001e-08, + "loss": 0.5422, + "step": 30327 + }, + { + "epoch": 0.59, + "learning_rate": 8.242010019028387e-08, + "loss": 0.0005, + "step": 30328 + }, + { + "epoch": 0.59, + "learning_rate": 8.241621684594773e-08, + "loss": 0.0004, + "step": 30329 + }, + { + "epoch": 0.59, + "learning_rate": 8.241233350161159e-08, + "loss": 0.001, + "step": 30330 + }, + { + "epoch": 0.59, + "learning_rate": 8.240845015727545e-08, + "loss": 0.0005, + "step": 30331 + }, + { + "epoch": 0.59, + "learning_rate": 8.24045668129393e-08, + "loss": 0.0005, + "step": 30332 + }, + { + "epoch": 0.59, + "learning_rate": 8.240068346860316e-08, + "loss": 0.0004, + "step": 30333 + }, + { + "epoch": 0.59, + "learning_rate": 8.239680012426702e-08, + "loss": 0.0011, + "step": 30334 + }, + { + "epoch": 0.59, + "learning_rate": 8.239291677993088e-08, + "loss": 0.0005, + "step": 30335 + }, + { + "epoch": 0.59, + "learning_rate": 8.238903343559474e-08, + "loss": 0.0008, + "step": 30336 + }, + { + "epoch": 0.59, + "learning_rate": 8.23851500912586e-08, + "loss": 0.0005, + "step": 30337 + }, + { + "epoch": 0.59, + "learning_rate": 8.238126674692245e-08, + "loss": 0.0003, + "step": 30338 + }, + { + "epoch": 0.59, + "learning_rate": 8.237738340258631e-08, + "loss": 0.0006, + "step": 30339 + }, + { + "epoch": 0.59, + "learning_rate": 8.237350005825016e-08, + "loss": 0.0004, + "step": 30340 + }, + { + "epoch": 0.59, + "learning_rate": 8.236961671391402e-08, + "loss": 0.0014, + "step": 30341 + }, + { + "epoch": 0.59, + "learning_rate": 8.236573336957787e-08, + "loss": 0.0005, + "step": 30342 + }, + { + "epoch": 0.59, + "learning_rate": 8.236185002524173e-08, + "loss": 0.0006, + "step": 30343 + }, + { + "epoch": 0.59, + "learning_rate": 8.235796668090559e-08, + "loss": 0.0005, + "step": 30344 + }, + { + "epoch": 0.59, + "learning_rate": 8.235408333656945e-08, + "loss": 0.6127, + "step": 30345 + }, + { + "epoch": 0.59, + "learning_rate": 8.235019999223331e-08, + "loss": 0.0005, + "step": 30346 + }, + { + "epoch": 0.59, + "learning_rate": 8.234631664789717e-08, + "loss": 0.0004, + "step": 30347 + }, + { + "epoch": 0.59, + "learning_rate": 8.234243330356102e-08, + "loss": 1.2471, + "step": 30348 + }, + { + "epoch": 0.59, + "learning_rate": 8.233854995922488e-08, + "loss": 0.0007, + "step": 30349 + }, + { + "epoch": 0.59, + "learning_rate": 8.233466661488874e-08, + "loss": 0.0007, + "step": 30350 + }, + { + "epoch": 0.59, + "learning_rate": 8.23307832705526e-08, + "loss": 0.0021, + "step": 30351 + }, + { + "epoch": 0.59, + "learning_rate": 8.232689992621646e-08, + "loss": 1.1858, + "step": 30352 + }, + { + "epoch": 0.59, + "learning_rate": 8.232301658188031e-08, + "loss": 0.0028, + "step": 30353 + }, + { + "epoch": 0.59, + "learning_rate": 8.231913323754417e-08, + "loss": 0.0008, + "step": 30354 + }, + { + "epoch": 0.59, + "learning_rate": 8.231524989320803e-08, + "loss": 0.0014, + "step": 30355 + }, + { + "epoch": 0.59, + "learning_rate": 8.231136654887189e-08, + "loss": 0.5634, + "step": 30356 + }, + { + "epoch": 0.59, + "learning_rate": 8.230748320453575e-08, + "loss": 0.0356, + "step": 30357 + }, + { + "epoch": 0.59, + "learning_rate": 8.23035998601996e-08, + "loss": 1.1462, + "step": 30358 + }, + { + "epoch": 0.59, + "learning_rate": 8.229971651586346e-08, + "loss": 0.0009, + "step": 30359 + }, + { + "epoch": 0.59, + "learning_rate": 8.229583317152732e-08, + "loss": 0.0004, + "step": 30360 + }, + { + "epoch": 0.59, + "learning_rate": 8.229194982719118e-08, + "loss": 0.4897, + "step": 30361 + }, + { + "epoch": 0.59, + "learning_rate": 8.228806648285504e-08, + "loss": 0.0005, + "step": 30362 + }, + { + "epoch": 0.59, + "learning_rate": 8.22841831385189e-08, + "loss": 0.0005, + "step": 30363 + }, + { + "epoch": 0.59, + "learning_rate": 8.228029979418276e-08, + "loss": 0.0006, + "step": 30364 + }, + { + "epoch": 0.59, + "learning_rate": 8.227641644984661e-08, + "loss": 0.0004, + "step": 30365 + }, + { + "epoch": 0.59, + "learning_rate": 8.227253310551047e-08, + "loss": 0.0004, + "step": 30366 + }, + { + "epoch": 0.59, + "learning_rate": 8.226864976117433e-08, + "loss": 0.0011, + "step": 30367 + }, + { + "epoch": 0.59, + "learning_rate": 8.226476641683819e-08, + "loss": 0.0006, + "step": 30368 + }, + { + "epoch": 0.59, + "learning_rate": 8.226088307250203e-08, + "loss": 0.0004, + "step": 30369 + }, + { + "epoch": 0.59, + "learning_rate": 8.225699972816589e-08, + "loss": 0.0006, + "step": 30370 + }, + { + "epoch": 0.59, + "learning_rate": 8.225311638382975e-08, + "loss": 0.0014, + "step": 30371 + }, + { + "epoch": 0.59, + "learning_rate": 8.224923303949361e-08, + "loss": 0.0006, + "step": 30372 + }, + { + "epoch": 0.59, + "learning_rate": 8.224534969515747e-08, + "loss": 0.0008, + "step": 30373 + }, + { + "epoch": 0.59, + "learning_rate": 8.224146635082132e-08, + "loss": 1.3019, + "step": 30374 + }, + { + "epoch": 0.59, + "learning_rate": 8.223758300648518e-08, + "loss": 0.0005, + "step": 30375 + }, + { + "epoch": 0.59, + "learning_rate": 8.223369966214904e-08, + "loss": 0.0006, + "step": 30376 + }, + { + "epoch": 0.59, + "learning_rate": 8.22298163178129e-08, + "loss": 0.0005, + "step": 30377 + }, + { + "epoch": 0.59, + "learning_rate": 8.222593297347676e-08, + "loss": 0.0005, + "step": 30378 + }, + { + "epoch": 0.59, + "learning_rate": 8.222204962914062e-08, + "loss": 0.0047, + "step": 30379 + }, + { + "epoch": 0.59, + "learning_rate": 8.221816628480447e-08, + "loss": 0.0006, + "step": 30380 + }, + { + "epoch": 0.59, + "learning_rate": 8.221428294046833e-08, + "loss": 0.0007, + "step": 30381 + }, + { + "epoch": 0.59, + "learning_rate": 8.221039959613219e-08, + "loss": 0.0005, + "step": 30382 + }, + { + "epoch": 0.59, + "learning_rate": 8.220651625179605e-08, + "loss": 0.0007, + "step": 30383 + }, + { + "epoch": 0.59, + "learning_rate": 8.220263290745991e-08, + "loss": 0.0078, + "step": 30384 + }, + { + "epoch": 0.59, + "learning_rate": 8.219874956312377e-08, + "loss": 0.0004, + "step": 30385 + }, + { + "epoch": 0.59, + "learning_rate": 8.219486621878762e-08, + "loss": 0.0005, + "step": 30386 + }, + { + "epoch": 0.59, + "learning_rate": 8.219098287445148e-08, + "loss": 0.0017, + "step": 30387 + }, + { + "epoch": 0.59, + "learning_rate": 8.218709953011533e-08, + "loss": 0.0009, + "step": 30388 + }, + { + "epoch": 0.59, + "learning_rate": 8.218321618577919e-08, + "loss": 0.0007, + "step": 30389 + }, + { + "epoch": 0.59, + "learning_rate": 8.217933284144304e-08, + "loss": 0.0006, + "step": 30390 + }, + { + "epoch": 0.59, + "learning_rate": 8.21754494971069e-08, + "loss": 0.3893, + "step": 30391 + }, + { + "epoch": 0.59, + "learning_rate": 8.217156615277076e-08, + "loss": 0.0004, + "step": 30392 + }, + { + "epoch": 0.59, + "learning_rate": 8.216768280843462e-08, + "loss": 0.0004, + "step": 30393 + }, + { + "epoch": 0.59, + "learning_rate": 8.216379946409848e-08, + "loss": 0.0008, + "step": 30394 + }, + { + "epoch": 0.59, + "learning_rate": 8.215991611976233e-08, + "loss": 0.0008, + "step": 30395 + }, + { + "epoch": 0.59, + "learning_rate": 8.215603277542619e-08, + "loss": 0.243, + "step": 30396 + }, + { + "epoch": 0.59, + "learning_rate": 8.215214943109005e-08, + "loss": 0.0004, + "step": 30397 + }, + { + "epoch": 0.59, + "learning_rate": 8.214826608675391e-08, + "loss": 0.0006, + "step": 30398 + }, + { + "epoch": 0.59, + "learning_rate": 8.214438274241777e-08, + "loss": 0.0006, + "step": 30399 + }, + { + "epoch": 0.59, + "learning_rate": 8.214049939808163e-08, + "loss": 0.0005, + "step": 30400 + }, + { + "epoch": 0.59, + "learning_rate": 8.213661605374548e-08, + "loss": 0.0004, + "step": 30401 + }, + { + "epoch": 0.59, + "learning_rate": 8.213273270940934e-08, + "loss": 0.0005, + "step": 30402 + }, + { + "epoch": 0.59, + "learning_rate": 8.212884936507319e-08, + "loss": 0.0004, + "step": 30403 + }, + { + "epoch": 0.59, + "learning_rate": 8.212496602073705e-08, + "loss": 0.0005, + "step": 30404 + }, + { + "epoch": 0.59, + "learning_rate": 8.21210826764009e-08, + "loss": 0.0004, + "step": 30405 + }, + { + "epoch": 0.59, + "learning_rate": 8.211719933206476e-08, + "loss": 0.0046, + "step": 30406 + }, + { + "epoch": 0.59, + "learning_rate": 8.211331598772862e-08, + "loss": 0.0005, + "step": 30407 + }, + { + "epoch": 0.59, + "learning_rate": 8.210943264339248e-08, + "loss": 0.1159, + "step": 30408 + }, + { + "epoch": 0.59, + "learning_rate": 8.210554929905634e-08, + "loss": 0.0005, + "step": 30409 + }, + { + "epoch": 0.59, + "learning_rate": 8.21016659547202e-08, + "loss": 0.4052, + "step": 30410 + }, + { + "epoch": 0.59, + "learning_rate": 8.209778261038405e-08, + "loss": 0.4327, + "step": 30411 + }, + { + "epoch": 0.59, + "learning_rate": 8.209389926604791e-08, + "loss": 0.0009, + "step": 30412 + }, + { + "epoch": 0.59, + "learning_rate": 8.209001592171177e-08, + "loss": 0.0003, + "step": 30413 + }, + { + "epoch": 0.59, + "learning_rate": 8.208613257737563e-08, + "loss": 0.2158, + "step": 30414 + }, + { + "epoch": 0.59, + "learning_rate": 8.208224923303949e-08, + "loss": 0.0006, + "step": 30415 + }, + { + "epoch": 0.59, + "learning_rate": 8.207836588870334e-08, + "loss": 1.234, + "step": 30416 + }, + { + "epoch": 0.59, + "learning_rate": 8.20744825443672e-08, + "loss": 0.0006, + "step": 30417 + }, + { + "epoch": 0.59, + "learning_rate": 8.207059920003106e-08, + "loss": 0.0919, + "step": 30418 + }, + { + "epoch": 0.59, + "learning_rate": 8.206671585569492e-08, + "loss": 0.0003, + "step": 30419 + }, + { + "epoch": 0.59, + "learning_rate": 8.206283251135878e-08, + "loss": 0.0006, + "step": 30420 + }, + { + "epoch": 0.59, + "learning_rate": 8.205894916702264e-08, + "loss": 0.0004, + "step": 30421 + }, + { + "epoch": 0.59, + "learning_rate": 8.20550658226865e-08, + "loss": 0.0005, + "step": 30422 + }, + { + "epoch": 0.59, + "learning_rate": 8.205118247835035e-08, + "loss": 0.0005, + "step": 30423 + }, + { + "epoch": 0.59, + "learning_rate": 8.204729913401421e-08, + "loss": 1.1104, + "step": 30424 + }, + { + "epoch": 0.59, + "learning_rate": 8.204341578967807e-08, + "loss": 0.0004, + "step": 30425 + }, + { + "epoch": 0.59, + "learning_rate": 8.203953244534193e-08, + "loss": 0.0005, + "step": 30426 + }, + { + "epoch": 0.59, + "learning_rate": 8.203564910100577e-08, + "loss": 0.0004, + "step": 30427 + }, + { + "epoch": 0.59, + "learning_rate": 8.203176575666963e-08, + "loss": 0.0004, + "step": 30428 + }, + { + "epoch": 0.59, + "learning_rate": 8.202788241233349e-08, + "loss": 0.0006, + "step": 30429 + }, + { + "epoch": 0.59, + "learning_rate": 8.202399906799735e-08, + "loss": 0.0006, + "step": 30430 + }, + { + "epoch": 0.59, + "learning_rate": 8.20201157236612e-08, + "loss": 0.001, + "step": 30431 + }, + { + "epoch": 0.59, + "learning_rate": 8.201623237932506e-08, + "loss": 0.0006, + "step": 30432 + }, + { + "epoch": 0.59, + "learning_rate": 8.201234903498892e-08, + "loss": 0.0007, + "step": 30433 + }, + { + "epoch": 0.59, + "learning_rate": 8.200846569065278e-08, + "loss": 0.0008, + "step": 30434 + }, + { + "epoch": 0.59, + "learning_rate": 8.200458234631664e-08, + "loss": 0.0004, + "step": 30435 + }, + { + "epoch": 0.59, + "learning_rate": 8.20006990019805e-08, + "loss": 0.0005, + "step": 30436 + }, + { + "epoch": 0.59, + "learning_rate": 8.199681565764435e-08, + "loss": 0.0006, + "step": 30437 + }, + { + "epoch": 0.59, + "learning_rate": 8.199293231330821e-08, + "loss": 0.89, + "step": 30438 + }, + { + "epoch": 0.59, + "learning_rate": 8.198904896897207e-08, + "loss": 1.0632, + "step": 30439 + }, + { + "epoch": 0.59, + "learning_rate": 8.198516562463593e-08, + "loss": 0.0006, + "step": 30440 + }, + { + "epoch": 0.59, + "learning_rate": 8.198128228029979e-08, + "loss": 0.0007, + "step": 30441 + }, + { + "epoch": 0.59, + "learning_rate": 8.197739893596365e-08, + "loss": 0.0008, + "step": 30442 + }, + { + "epoch": 0.59, + "learning_rate": 8.19735155916275e-08, + "loss": 0.0005, + "step": 30443 + }, + { + "epoch": 0.59, + "learning_rate": 8.196963224729136e-08, + "loss": 0.0007, + "step": 30444 + }, + { + "epoch": 0.59, + "learning_rate": 8.196574890295522e-08, + "loss": 0.8917, + "step": 30445 + }, + { + "epoch": 0.59, + "learning_rate": 8.196186555861908e-08, + "loss": 0.0007, + "step": 30446 + }, + { + "epoch": 0.59, + "learning_rate": 8.195798221428294e-08, + "loss": 0.0005, + "step": 30447 + }, + { + "epoch": 0.59, + "learning_rate": 8.19540988699468e-08, + "loss": 1.1601, + "step": 30448 + }, + { + "epoch": 0.59, + "learning_rate": 8.195021552561065e-08, + "loss": 0.0005, + "step": 30449 + }, + { + "epoch": 0.59, + "learning_rate": 8.194633218127451e-08, + "loss": 0.0005, + "step": 30450 + }, + { + "epoch": 0.59, + "learning_rate": 8.194244883693837e-08, + "loss": 0.0872, + "step": 30451 + }, + { + "epoch": 0.59, + "learning_rate": 8.193856549260223e-08, + "loss": 0.0014, + "step": 30452 + }, + { + "epoch": 0.59, + "learning_rate": 8.193468214826609e-08, + "loss": 0.0003, + "step": 30453 + }, + { + "epoch": 0.59, + "learning_rate": 8.193079880392994e-08, + "loss": 0.0005, + "step": 30454 + }, + { + "epoch": 0.59, + "learning_rate": 8.19269154595938e-08, + "loss": 0.0005, + "step": 30455 + }, + { + "epoch": 0.59, + "learning_rate": 8.192303211525765e-08, + "loss": 0.0005, + "step": 30456 + }, + { + "epoch": 0.59, + "learning_rate": 8.19191487709215e-08, + "loss": 0.0004, + "step": 30457 + }, + { + "epoch": 0.59, + "learning_rate": 8.191526542658536e-08, + "loss": 0.0005, + "step": 30458 + }, + { + "epoch": 0.59, + "learning_rate": 8.191138208224922e-08, + "loss": 0.0005, + "step": 30459 + }, + { + "epoch": 0.59, + "learning_rate": 8.190749873791308e-08, + "loss": 0.0004, + "step": 30460 + }, + { + "epoch": 0.59, + "learning_rate": 8.190361539357694e-08, + "loss": 0.0006, + "step": 30461 + }, + { + "epoch": 0.59, + "learning_rate": 8.18997320492408e-08, + "loss": 0.0007, + "step": 30462 + }, + { + "epoch": 0.59, + "learning_rate": 8.189584870490466e-08, + "loss": 0.0006, + "step": 30463 + }, + { + "epoch": 0.59, + "learning_rate": 8.189196536056851e-08, + "loss": 0.0004, + "step": 30464 + }, + { + "epoch": 0.59, + "learning_rate": 8.188808201623237e-08, + "loss": 0.0005, + "step": 30465 + }, + { + "epoch": 0.59, + "learning_rate": 8.188419867189623e-08, + "loss": 0.0012, + "step": 30466 + }, + { + "epoch": 0.59, + "learning_rate": 8.188031532756009e-08, + "loss": 0.0009, + "step": 30467 + }, + { + "epoch": 0.59, + "learning_rate": 8.187643198322395e-08, + "loss": 0.0005, + "step": 30468 + }, + { + "epoch": 0.59, + "learning_rate": 8.18725486388878e-08, + "loss": 0.0005, + "step": 30469 + }, + { + "epoch": 0.59, + "learning_rate": 8.186866529455166e-08, + "loss": 0.0006, + "step": 30470 + }, + { + "epoch": 0.59, + "learning_rate": 8.186478195021552e-08, + "loss": 0.0024, + "step": 30471 + }, + { + "epoch": 0.59, + "learning_rate": 8.186089860587938e-08, + "loss": 0.0005, + "step": 30472 + }, + { + "epoch": 0.59, + "learning_rate": 8.185701526154324e-08, + "loss": 0.0527, + "step": 30473 + }, + { + "epoch": 0.59, + "learning_rate": 8.18531319172071e-08, + "loss": 0.0005, + "step": 30474 + }, + { + "epoch": 0.59, + "learning_rate": 8.184924857287095e-08, + "loss": 0.0005, + "step": 30475 + }, + { + "epoch": 0.59, + "learning_rate": 8.184536522853481e-08, + "loss": 0.0005, + "step": 30476 + }, + { + "epoch": 0.59, + "learning_rate": 8.184148188419867e-08, + "loss": 0.0012, + "step": 30477 + }, + { + "epoch": 0.59, + "learning_rate": 8.183759853986253e-08, + "loss": 0.001, + "step": 30478 + }, + { + "epoch": 0.59, + "learning_rate": 8.183371519552639e-08, + "loss": 0.0005, + "step": 30479 + }, + { + "epoch": 0.59, + "learning_rate": 8.182983185119025e-08, + "loss": 0.0007, + "step": 30480 + }, + { + "epoch": 0.59, + "learning_rate": 8.18259485068541e-08, + "loss": 0.0004, + "step": 30481 + }, + { + "epoch": 0.59, + "learning_rate": 8.182206516251796e-08, + "loss": 0.0013, + "step": 30482 + }, + { + "epoch": 0.59, + "learning_rate": 8.181818181818182e-08, + "loss": 0.0004, + "step": 30483 + }, + { + "epoch": 0.59, + "learning_rate": 8.181429847384568e-08, + "loss": 0.0006, + "step": 30484 + }, + { + "epoch": 0.59, + "learning_rate": 8.181041512950952e-08, + "loss": 0.0005, + "step": 30485 + }, + { + "epoch": 0.59, + "learning_rate": 8.180653178517338e-08, + "loss": 0.0007, + "step": 30486 + }, + { + "epoch": 0.59, + "learning_rate": 8.180264844083724e-08, + "loss": 0.0068, + "step": 30487 + }, + { + "epoch": 0.59, + "learning_rate": 8.17987650965011e-08, + "loss": 0.0004, + "step": 30488 + }, + { + "epoch": 0.59, + "learning_rate": 8.179488175216496e-08, + "loss": 0.0004, + "step": 30489 + }, + { + "epoch": 0.59, + "learning_rate": 8.179099840782881e-08, + "loss": 0.0004, + "step": 30490 + }, + { + "epoch": 0.59, + "learning_rate": 8.178711506349267e-08, + "loss": 0.0095, + "step": 30491 + }, + { + "epoch": 0.59, + "learning_rate": 8.178323171915653e-08, + "loss": 0.0005, + "step": 30492 + }, + { + "epoch": 0.59, + "learning_rate": 8.177934837482039e-08, + "loss": 0.0004, + "step": 30493 + }, + { + "epoch": 0.59, + "learning_rate": 8.177546503048425e-08, + "loss": 0.0007, + "step": 30494 + }, + { + "epoch": 0.59, + "learning_rate": 8.17715816861481e-08, + "loss": 0.0006, + "step": 30495 + }, + { + "epoch": 0.59, + "learning_rate": 8.176769834181196e-08, + "loss": 0.0003, + "step": 30496 + }, + { + "epoch": 0.59, + "learning_rate": 8.176381499747582e-08, + "loss": 0.0006, + "step": 30497 + }, + { + "epoch": 0.59, + "learning_rate": 8.175993165313968e-08, + "loss": 0.0018, + "step": 30498 + }, + { + "epoch": 0.59, + "learning_rate": 8.175604830880354e-08, + "loss": 0.0006, + "step": 30499 + }, + { + "epoch": 0.59, + "learning_rate": 8.17521649644674e-08, + "loss": 0.0007, + "step": 30500 + }, + { + "epoch": 0.59, + "learning_rate": 8.174828162013126e-08, + "loss": 0.0005, + "step": 30501 + }, + { + "epoch": 0.59, + "learning_rate": 8.174439827579511e-08, + "loss": 0.0006, + "step": 30502 + }, + { + "epoch": 0.59, + "learning_rate": 8.174051493145897e-08, + "loss": 1.0016, + "step": 30503 + }, + { + "epoch": 0.59, + "learning_rate": 8.173663158712283e-08, + "loss": 0.0005, + "step": 30504 + }, + { + "epoch": 0.59, + "learning_rate": 8.173274824278669e-08, + "loss": 0.0003, + "step": 30505 + }, + { + "epoch": 0.59, + "learning_rate": 8.172886489845055e-08, + "loss": 0.0006, + "step": 30506 + }, + { + "epoch": 0.59, + "learning_rate": 8.17249815541144e-08, + "loss": 0.0006, + "step": 30507 + }, + { + "epoch": 0.59, + "learning_rate": 8.172109820977826e-08, + "loss": 0.4864, + "step": 30508 + }, + { + "epoch": 0.59, + "learning_rate": 8.171721486544212e-08, + "loss": 0.0006, + "step": 30509 + }, + { + "epoch": 0.59, + "learning_rate": 8.171333152110598e-08, + "loss": 0.0012, + "step": 30510 + }, + { + "epoch": 0.59, + "learning_rate": 8.170944817676984e-08, + "loss": 0.0005, + "step": 30511 + }, + { + "epoch": 0.59, + "learning_rate": 8.17055648324337e-08, + "loss": 0.4475, + "step": 30512 + }, + { + "epoch": 0.59, + "learning_rate": 8.170168148809755e-08, + "loss": 0.0005, + "step": 30513 + }, + { + "epoch": 0.59, + "learning_rate": 8.16977981437614e-08, + "loss": 0.0032, + "step": 30514 + }, + { + "epoch": 0.59, + "learning_rate": 8.169391479942526e-08, + "loss": 0.0311, + "step": 30515 + }, + { + "epoch": 0.59, + "learning_rate": 8.169003145508912e-08, + "loss": 0.0128, + "step": 30516 + }, + { + "epoch": 0.59, + "learning_rate": 8.168614811075297e-08, + "loss": 0.0005, + "step": 30517 + }, + { + "epoch": 0.59, + "learning_rate": 8.168226476641683e-08, + "loss": 0.0005, + "step": 30518 + }, + { + "epoch": 0.59, + "learning_rate": 8.167838142208069e-08, + "loss": 0.0008, + "step": 30519 + }, + { + "epoch": 0.59, + "learning_rate": 8.167449807774455e-08, + "loss": 0.006, + "step": 30520 + }, + { + "epoch": 0.59, + "learning_rate": 8.167061473340841e-08, + "loss": 1.3721, + "step": 30521 + }, + { + "epoch": 0.59, + "learning_rate": 8.166673138907227e-08, + "loss": 0.0009, + "step": 30522 + }, + { + "epoch": 0.59, + "learning_rate": 8.166284804473612e-08, + "loss": 0.0005, + "step": 30523 + }, + { + "epoch": 0.59, + "learning_rate": 8.165896470039998e-08, + "loss": 0.0004, + "step": 30524 + }, + { + "epoch": 0.59, + "learning_rate": 8.165508135606384e-08, + "loss": 0.0005, + "step": 30525 + }, + { + "epoch": 0.59, + "learning_rate": 8.16511980117277e-08, + "loss": 0.0007, + "step": 30526 + }, + { + "epoch": 0.59, + "learning_rate": 8.164731466739156e-08, + "loss": 0.0005, + "step": 30527 + }, + { + "epoch": 0.59, + "learning_rate": 8.164343132305542e-08, + "loss": 0.001, + "step": 30528 + }, + { + "epoch": 0.59, + "learning_rate": 8.163954797871927e-08, + "loss": 0.0007, + "step": 30529 + }, + { + "epoch": 0.59, + "learning_rate": 8.163566463438313e-08, + "loss": 0.0005, + "step": 30530 + }, + { + "epoch": 0.59, + "learning_rate": 8.163178129004699e-08, + "loss": 0.0005, + "step": 30531 + }, + { + "epoch": 0.59, + "learning_rate": 8.162789794571085e-08, + "loss": 0.0007, + "step": 30532 + }, + { + "epoch": 0.59, + "learning_rate": 8.16240146013747e-08, + "loss": 0.0006, + "step": 30533 + }, + { + "epoch": 0.59, + "learning_rate": 8.162013125703856e-08, + "loss": 0.0005, + "step": 30534 + }, + { + "epoch": 0.59, + "learning_rate": 8.161624791270242e-08, + "loss": 0.0005, + "step": 30535 + }, + { + "epoch": 0.59, + "learning_rate": 8.161236456836628e-08, + "loss": 0.0009, + "step": 30536 + }, + { + "epoch": 0.59, + "learning_rate": 8.160848122403014e-08, + "loss": 0.0226, + "step": 30537 + }, + { + "epoch": 0.59, + "learning_rate": 8.1604597879694e-08, + "loss": 0.9676, + "step": 30538 + }, + { + "epoch": 0.59, + "learning_rate": 8.160071453535786e-08, + "loss": 0.0004, + "step": 30539 + }, + { + "epoch": 0.59, + "learning_rate": 8.159683119102171e-08, + "loss": 0.0005, + "step": 30540 + }, + { + "epoch": 0.59, + "learning_rate": 8.159294784668557e-08, + "loss": 0.0005, + "step": 30541 + }, + { + "epoch": 0.59, + "learning_rate": 8.158906450234943e-08, + "loss": 0.0008, + "step": 30542 + }, + { + "epoch": 0.59, + "learning_rate": 8.158518115801328e-08, + "loss": 0.0005, + "step": 30543 + }, + { + "epoch": 0.59, + "learning_rate": 8.158129781367713e-08, + "loss": 1.2591, + "step": 30544 + }, + { + "epoch": 0.59, + "learning_rate": 8.157741446934099e-08, + "loss": 0.0004, + "step": 30545 + }, + { + "epoch": 0.59, + "learning_rate": 8.157353112500485e-08, + "loss": 0.0011, + "step": 30546 + }, + { + "epoch": 0.59, + "learning_rate": 8.156964778066871e-08, + "loss": 0.0005, + "step": 30547 + }, + { + "epoch": 0.59, + "learning_rate": 8.156576443633257e-08, + "loss": 0.0005, + "step": 30548 + }, + { + "epoch": 0.59, + "learning_rate": 8.156188109199642e-08, + "loss": 0.0008, + "step": 30549 + }, + { + "epoch": 0.59, + "learning_rate": 8.155799774766028e-08, + "loss": 0.0004, + "step": 30550 + }, + { + "epoch": 0.59, + "learning_rate": 8.155411440332414e-08, + "loss": 0.0007, + "step": 30551 + }, + { + "epoch": 0.59, + "learning_rate": 8.1550231058988e-08, + "loss": 0.0006, + "step": 30552 + }, + { + "epoch": 0.59, + "learning_rate": 8.154634771465186e-08, + "loss": 0.0004, + "step": 30553 + }, + { + "epoch": 0.59, + "learning_rate": 8.154246437031572e-08, + "loss": 0.0012, + "step": 30554 + }, + { + "epoch": 0.59, + "learning_rate": 8.153858102597957e-08, + "loss": 0.0006, + "step": 30555 + }, + { + "epoch": 0.59, + "learning_rate": 8.153469768164343e-08, + "loss": 0.005, + "step": 30556 + }, + { + "epoch": 0.59, + "learning_rate": 8.153081433730729e-08, + "loss": 0.0019, + "step": 30557 + }, + { + "epoch": 0.59, + "learning_rate": 8.152693099297115e-08, + "loss": 0.0007, + "step": 30558 + }, + { + "epoch": 0.59, + "learning_rate": 8.152304764863501e-08, + "loss": 0.0004, + "step": 30559 + }, + { + "epoch": 0.59, + "learning_rate": 8.151916430429887e-08, + "loss": 0.0006, + "step": 30560 + }, + { + "epoch": 0.59, + "learning_rate": 8.151528095996272e-08, + "loss": 0.0013, + "step": 30561 + }, + { + "epoch": 0.59, + "learning_rate": 8.151139761562658e-08, + "loss": 0.0011, + "step": 30562 + }, + { + "epoch": 0.59, + "learning_rate": 8.150751427129044e-08, + "loss": 0.0004, + "step": 30563 + }, + { + "epoch": 0.59, + "learning_rate": 8.15036309269543e-08, + "loss": 0.0006, + "step": 30564 + }, + { + "epoch": 0.59, + "learning_rate": 8.149974758261814e-08, + "loss": 0.0005, + "step": 30565 + }, + { + "epoch": 0.59, + "learning_rate": 8.1495864238282e-08, + "loss": 0.0023, + "step": 30566 + }, + { + "epoch": 0.59, + "learning_rate": 8.149198089394586e-08, + "loss": 0.3377, + "step": 30567 + }, + { + "epoch": 0.59, + "learning_rate": 8.148809754960972e-08, + "loss": 0.0004, + "step": 30568 + }, + { + "epoch": 0.59, + "learning_rate": 8.148421420527358e-08, + "loss": 0.0007, + "step": 30569 + }, + { + "epoch": 0.59, + "learning_rate": 8.148033086093743e-08, + "loss": 0.0017, + "step": 30570 + }, + { + "epoch": 0.59, + "learning_rate": 8.147644751660129e-08, + "loss": 0.9647, + "step": 30571 + }, + { + "epoch": 0.59, + "learning_rate": 8.147256417226515e-08, + "loss": 0.006, + "step": 30572 + }, + { + "epoch": 0.59, + "learning_rate": 8.146868082792901e-08, + "loss": 0.2163, + "step": 30573 + }, + { + "epoch": 0.59, + "learning_rate": 8.146479748359287e-08, + "loss": 0.0006, + "step": 30574 + }, + { + "epoch": 0.59, + "learning_rate": 8.146091413925673e-08, + "loss": 0.0005, + "step": 30575 + }, + { + "epoch": 0.59, + "learning_rate": 8.145703079492058e-08, + "loss": 0.0004, + "step": 30576 + }, + { + "epoch": 0.59, + "learning_rate": 8.145314745058444e-08, + "loss": 0.0007, + "step": 30577 + }, + { + "epoch": 0.59, + "learning_rate": 8.14492641062483e-08, + "loss": 0.0005, + "step": 30578 + }, + { + "epoch": 0.59, + "learning_rate": 8.144538076191216e-08, + "loss": 0.0008, + "step": 30579 + }, + { + "epoch": 0.59, + "learning_rate": 8.1441497417576e-08, + "loss": 0.0005, + "step": 30580 + }, + { + "epoch": 0.59, + "learning_rate": 8.143761407323986e-08, + "loss": 0.0003, + "step": 30581 + }, + { + "epoch": 0.59, + "learning_rate": 8.143373072890372e-08, + "loss": 0.0005, + "step": 30582 + }, + { + "epoch": 0.59, + "learning_rate": 8.142984738456758e-08, + "loss": 0.0005, + "step": 30583 + }, + { + "epoch": 0.59, + "learning_rate": 8.142596404023144e-08, + "loss": 0.0005, + "step": 30584 + }, + { + "epoch": 0.59, + "learning_rate": 8.14220806958953e-08, + "loss": 0.0005, + "step": 30585 + }, + { + "epoch": 0.59, + "learning_rate": 8.141819735155915e-08, + "loss": 0.0007, + "step": 30586 + }, + { + "epoch": 0.59, + "learning_rate": 8.141431400722301e-08, + "loss": 0.3183, + "step": 30587 + }, + { + "epoch": 0.59, + "learning_rate": 8.141043066288687e-08, + "loss": 0.0036, + "step": 30588 + }, + { + "epoch": 0.59, + "learning_rate": 8.140654731855073e-08, + "loss": 0.0004, + "step": 30589 + }, + { + "epoch": 0.59, + "learning_rate": 8.140266397421459e-08, + "loss": 0.0006, + "step": 30590 + }, + { + "epoch": 0.59, + "learning_rate": 8.139878062987844e-08, + "loss": 0.0028, + "step": 30591 + }, + { + "epoch": 0.59, + "learning_rate": 8.13948972855423e-08, + "loss": 0.0005, + "step": 30592 + }, + { + "epoch": 0.59, + "learning_rate": 8.139101394120616e-08, + "loss": 0.0007, + "step": 30593 + }, + { + "epoch": 0.59, + "learning_rate": 8.138713059687002e-08, + "loss": 0.0003, + "step": 30594 + }, + { + "epoch": 0.59, + "learning_rate": 8.138324725253388e-08, + "loss": 0.0006, + "step": 30595 + }, + { + "epoch": 0.59, + "learning_rate": 8.137936390819774e-08, + "loss": 0.0004, + "step": 30596 + }, + { + "epoch": 0.59, + "learning_rate": 8.13754805638616e-08, + "loss": 0.5434, + "step": 30597 + }, + { + "epoch": 0.59, + "learning_rate": 8.137159721952545e-08, + "loss": 0.0004, + "step": 30598 + }, + { + "epoch": 0.59, + "learning_rate": 8.136771387518931e-08, + "loss": 0.5634, + "step": 30599 + }, + { + "epoch": 0.59, + "learning_rate": 8.136383053085317e-08, + "loss": 0.0004, + "step": 30600 + }, + { + "epoch": 0.59, + "learning_rate": 8.135994718651701e-08, + "loss": 0.0052, + "step": 30601 + }, + { + "epoch": 0.59, + "learning_rate": 8.135606384218087e-08, + "loss": 0.0008, + "step": 30602 + }, + { + "epoch": 0.59, + "learning_rate": 8.135218049784473e-08, + "loss": 0.0007, + "step": 30603 + }, + { + "epoch": 0.59, + "learning_rate": 8.134829715350859e-08, + "loss": 1.0958, + "step": 30604 + }, + { + "epoch": 0.59, + "learning_rate": 8.134441380917245e-08, + "loss": 0.1854, + "step": 30605 + }, + { + "epoch": 0.59, + "learning_rate": 8.13405304648363e-08, + "loss": 0.5244, + "step": 30606 + }, + { + "epoch": 0.59, + "learning_rate": 8.133664712050016e-08, + "loss": 0.0005, + "step": 30607 + }, + { + "epoch": 0.59, + "learning_rate": 8.133276377616402e-08, + "loss": 0.0006, + "step": 30608 + }, + { + "epoch": 0.59, + "learning_rate": 8.132888043182788e-08, + "loss": 0.0004, + "step": 30609 + }, + { + "epoch": 0.59, + "learning_rate": 8.132499708749174e-08, + "loss": 0.0006, + "step": 30610 + }, + { + "epoch": 0.59, + "learning_rate": 8.13211137431556e-08, + "loss": 0.0003, + "step": 30611 + }, + { + "epoch": 0.59, + "learning_rate": 8.131723039881945e-08, + "loss": 0.0007, + "step": 30612 + }, + { + "epoch": 0.59, + "learning_rate": 8.131334705448331e-08, + "loss": 0.0006, + "step": 30613 + }, + { + "epoch": 0.59, + "learning_rate": 8.130946371014717e-08, + "loss": 0.0024, + "step": 30614 + }, + { + "epoch": 0.59, + "learning_rate": 8.130558036581103e-08, + "loss": 0.0004, + "step": 30615 + }, + { + "epoch": 0.59, + "learning_rate": 8.130169702147489e-08, + "loss": 0.0011, + "step": 30616 + }, + { + "epoch": 0.59, + "learning_rate": 8.129781367713875e-08, + "loss": 0.0006, + "step": 30617 + }, + { + "epoch": 0.59, + "learning_rate": 8.12939303328026e-08, + "loss": 0.7161, + "step": 30618 + }, + { + "epoch": 0.59, + "learning_rate": 8.129004698846646e-08, + "loss": 0.0005, + "step": 30619 + }, + { + "epoch": 0.59, + "learning_rate": 8.128616364413032e-08, + "loss": 0.0015, + "step": 30620 + }, + { + "epoch": 0.59, + "learning_rate": 8.128228029979418e-08, + "loss": 0.0008, + "step": 30621 + }, + { + "epoch": 0.59, + "learning_rate": 8.127839695545804e-08, + "loss": 0.0005, + "step": 30622 + }, + { + "epoch": 0.59, + "learning_rate": 8.12745136111219e-08, + "loss": 0.0006, + "step": 30623 + }, + { + "epoch": 0.59, + "learning_rate": 8.127063026678575e-08, + "loss": 0.0006, + "step": 30624 + }, + { + "epoch": 0.59, + "learning_rate": 8.126674692244961e-08, + "loss": 0.0004, + "step": 30625 + }, + { + "epoch": 0.59, + "learning_rate": 8.126286357811347e-08, + "loss": 0.0006, + "step": 30626 + }, + { + "epoch": 0.59, + "learning_rate": 8.125898023377733e-08, + "loss": 0.0005, + "step": 30627 + }, + { + "epoch": 0.59, + "learning_rate": 8.125509688944119e-08, + "loss": 0.0492, + "step": 30628 + }, + { + "epoch": 0.59, + "learning_rate": 8.125121354510504e-08, + "loss": 0.0364, + "step": 30629 + }, + { + "epoch": 0.59, + "learning_rate": 8.124733020076889e-08, + "loss": 0.0004, + "step": 30630 + }, + { + "epoch": 0.59, + "learning_rate": 8.124344685643275e-08, + "loss": 0.0004, + "step": 30631 + }, + { + "epoch": 0.59, + "learning_rate": 8.12395635120966e-08, + "loss": 0.0004, + "step": 30632 + }, + { + "epoch": 0.59, + "learning_rate": 8.123568016776046e-08, + "loss": 0.0003, + "step": 30633 + }, + { + "epoch": 0.59, + "learning_rate": 8.123179682342432e-08, + "loss": 0.0004, + "step": 30634 + }, + { + "epoch": 0.59, + "learning_rate": 8.122791347908818e-08, + "loss": 0.0022, + "step": 30635 + }, + { + "epoch": 0.59, + "learning_rate": 8.122403013475204e-08, + "loss": 0.0004, + "step": 30636 + }, + { + "epoch": 0.59, + "learning_rate": 8.12201467904159e-08, + "loss": 0.0005, + "step": 30637 + }, + { + "epoch": 0.59, + "learning_rate": 8.121626344607976e-08, + "loss": 0.0007, + "step": 30638 + }, + { + "epoch": 0.59, + "learning_rate": 8.121238010174361e-08, + "loss": 0.0006, + "step": 30639 + }, + { + "epoch": 0.59, + "learning_rate": 8.120849675740747e-08, + "loss": 0.0004, + "step": 30640 + }, + { + "epoch": 0.59, + "learning_rate": 8.120461341307133e-08, + "loss": 0.0008, + "step": 30641 + }, + { + "epoch": 0.59, + "learning_rate": 8.120073006873519e-08, + "loss": 0.0004, + "step": 30642 + }, + { + "epoch": 0.59, + "learning_rate": 8.119684672439905e-08, + "loss": 0.0177, + "step": 30643 + }, + { + "epoch": 0.59, + "learning_rate": 8.11929633800629e-08, + "loss": 0.0007, + "step": 30644 + }, + { + "epoch": 0.59, + "learning_rate": 8.118908003572676e-08, + "loss": 0.0005, + "step": 30645 + }, + { + "epoch": 0.59, + "learning_rate": 8.118519669139062e-08, + "loss": 0.0005, + "step": 30646 + }, + { + "epoch": 0.59, + "learning_rate": 8.118131334705448e-08, + "loss": 0.0004, + "step": 30647 + }, + { + "epoch": 0.59, + "learning_rate": 8.117743000271834e-08, + "loss": 0.9809, + "step": 30648 + }, + { + "epoch": 0.59, + "learning_rate": 8.11735466583822e-08, + "loss": 0.0006, + "step": 30649 + }, + { + "epoch": 0.59, + "learning_rate": 8.116966331404605e-08, + "loss": 0.0006, + "step": 30650 + }, + { + "epoch": 0.59, + "learning_rate": 8.116577996970991e-08, + "loss": 0.0005, + "step": 30651 + }, + { + "epoch": 0.59, + "learning_rate": 8.116189662537377e-08, + "loss": 0.0004, + "step": 30652 + }, + { + "epoch": 0.59, + "learning_rate": 8.115801328103763e-08, + "loss": 0.0023, + "step": 30653 + }, + { + "epoch": 0.59, + "learning_rate": 8.115412993670149e-08, + "loss": 0.0003, + "step": 30654 + }, + { + "epoch": 0.59, + "learning_rate": 8.115024659236535e-08, + "loss": 1.103, + "step": 30655 + }, + { + "epoch": 0.59, + "learning_rate": 8.11463632480292e-08, + "loss": 0.2168, + "step": 30656 + }, + { + "epoch": 0.59, + "learning_rate": 8.114247990369306e-08, + "loss": 0.0005, + "step": 30657 + }, + { + "epoch": 0.59, + "learning_rate": 8.113859655935692e-08, + "loss": 0.0013, + "step": 30658 + }, + { + "epoch": 0.59, + "learning_rate": 8.113471321502077e-08, + "loss": 0.0009, + "step": 30659 + }, + { + "epoch": 0.59, + "learning_rate": 8.113082987068462e-08, + "loss": 0.0018, + "step": 30660 + }, + { + "epoch": 0.59, + "learning_rate": 8.112694652634848e-08, + "loss": 0.028, + "step": 30661 + }, + { + "epoch": 0.59, + "learning_rate": 8.112306318201234e-08, + "loss": 0.0003, + "step": 30662 + }, + { + "epoch": 0.59, + "learning_rate": 8.11191798376762e-08, + "loss": 0.0005, + "step": 30663 + }, + { + "epoch": 0.59, + "learning_rate": 8.111529649334006e-08, + "loss": 0.0004, + "step": 30664 + }, + { + "epoch": 0.59, + "learning_rate": 8.111141314900392e-08, + "loss": 0.0004, + "step": 30665 + }, + { + "epoch": 0.59, + "learning_rate": 8.110752980466777e-08, + "loss": 0.0005, + "step": 30666 + }, + { + "epoch": 0.59, + "learning_rate": 8.110364646033163e-08, + "loss": 0.0007, + "step": 30667 + }, + { + "epoch": 0.59, + "learning_rate": 8.109976311599549e-08, + "loss": 0.0004, + "step": 30668 + }, + { + "epoch": 0.59, + "learning_rate": 8.109587977165935e-08, + "loss": 0.0006, + "step": 30669 + }, + { + "epoch": 0.59, + "learning_rate": 8.10919964273232e-08, + "loss": 0.0078, + "step": 30670 + }, + { + "epoch": 0.59, + "learning_rate": 8.108811308298706e-08, + "loss": 0.0006, + "step": 30671 + }, + { + "epoch": 0.59, + "learning_rate": 8.108422973865092e-08, + "loss": 0.0005, + "step": 30672 + }, + { + "epoch": 0.59, + "learning_rate": 8.108034639431478e-08, + "loss": 0.0005, + "step": 30673 + }, + { + "epoch": 0.6, + "learning_rate": 8.107646304997864e-08, + "loss": 0.0004, + "step": 30674 + }, + { + "epoch": 0.6, + "learning_rate": 8.10725797056425e-08, + "loss": 0.0005, + "step": 30675 + }, + { + "epoch": 0.6, + "learning_rate": 8.106869636130636e-08, + "loss": 0.0006, + "step": 30676 + }, + { + "epoch": 0.6, + "learning_rate": 8.106481301697021e-08, + "loss": 0.0004, + "step": 30677 + }, + { + "epoch": 0.6, + "learning_rate": 8.106092967263407e-08, + "loss": 0.0012, + "step": 30678 + }, + { + "epoch": 0.6, + "learning_rate": 8.105704632829793e-08, + "loss": 0.0005, + "step": 30679 + }, + { + "epoch": 0.6, + "learning_rate": 8.105316298396179e-08, + "loss": 0.0004, + "step": 30680 + }, + { + "epoch": 0.6, + "learning_rate": 8.104927963962565e-08, + "loss": 0.001, + "step": 30681 + }, + { + "epoch": 0.6, + "learning_rate": 8.10453962952895e-08, + "loss": 0.0006, + "step": 30682 + }, + { + "epoch": 0.6, + "learning_rate": 8.104151295095336e-08, + "loss": 0.009, + "step": 30683 + }, + { + "epoch": 0.6, + "learning_rate": 8.103762960661722e-08, + "loss": 1.3234, + "step": 30684 + }, + { + "epoch": 0.6, + "learning_rate": 8.103374626228108e-08, + "loss": 0.0003, + "step": 30685 + }, + { + "epoch": 0.6, + "learning_rate": 8.102986291794494e-08, + "loss": 0.0006, + "step": 30686 + }, + { + "epoch": 0.6, + "learning_rate": 8.10259795736088e-08, + "loss": 0.0746, + "step": 30687 + }, + { + "epoch": 0.6, + "learning_rate": 8.102209622927264e-08, + "loss": 0.1147, + "step": 30688 + }, + { + "epoch": 0.6, + "learning_rate": 8.10182128849365e-08, + "loss": 0.0004, + "step": 30689 + }, + { + "epoch": 0.6, + "learning_rate": 8.101432954060036e-08, + "loss": 0.0007, + "step": 30690 + }, + { + "epoch": 0.6, + "learning_rate": 8.101044619626422e-08, + "loss": 0.0004, + "step": 30691 + }, + { + "epoch": 0.6, + "learning_rate": 8.100656285192807e-08, + "loss": 0.0068, + "step": 30692 + }, + { + "epoch": 0.6, + "learning_rate": 8.100267950759193e-08, + "loss": 0.0009, + "step": 30693 + }, + { + "epoch": 0.6, + "learning_rate": 8.099879616325579e-08, + "loss": 0.0003, + "step": 30694 + }, + { + "epoch": 0.6, + "learning_rate": 8.099491281891965e-08, + "loss": 0.0004, + "step": 30695 + }, + { + "epoch": 0.6, + "learning_rate": 8.099102947458351e-08, + "loss": 0.0006, + "step": 30696 + }, + { + "epoch": 0.6, + "learning_rate": 8.098714613024737e-08, + "loss": 0.0004, + "step": 30697 + }, + { + "epoch": 0.6, + "learning_rate": 8.098326278591122e-08, + "loss": 0.0005, + "step": 30698 + }, + { + "epoch": 0.6, + "learning_rate": 8.097937944157508e-08, + "loss": 0.0005, + "step": 30699 + }, + { + "epoch": 0.6, + "learning_rate": 8.097549609723894e-08, + "loss": 0.0004, + "step": 30700 + }, + { + "epoch": 0.6, + "learning_rate": 8.09716127529028e-08, + "loss": 0.0005, + "step": 30701 + }, + { + "epoch": 0.6, + "learning_rate": 8.096772940856666e-08, + "loss": 0.1217, + "step": 30702 + }, + { + "epoch": 0.6, + "learning_rate": 8.096384606423052e-08, + "loss": 0.0004, + "step": 30703 + }, + { + "epoch": 0.6, + "learning_rate": 8.095996271989437e-08, + "loss": 0.0004, + "step": 30704 + }, + { + "epoch": 0.6, + "learning_rate": 8.095607937555823e-08, + "loss": 0.0009, + "step": 30705 + }, + { + "epoch": 0.6, + "learning_rate": 8.095219603122209e-08, + "loss": 0.2429, + "step": 30706 + }, + { + "epoch": 0.6, + "learning_rate": 8.094831268688595e-08, + "loss": 0.0004, + "step": 30707 + }, + { + "epoch": 0.6, + "learning_rate": 8.09444293425498e-08, + "loss": 0.0007, + "step": 30708 + }, + { + "epoch": 0.6, + "learning_rate": 8.094054599821366e-08, + "loss": 0.0006, + "step": 30709 + }, + { + "epoch": 0.6, + "learning_rate": 8.093666265387752e-08, + "loss": 0.0404, + "step": 30710 + }, + { + "epoch": 0.6, + "learning_rate": 8.093277930954138e-08, + "loss": 0.0006, + "step": 30711 + }, + { + "epoch": 0.6, + "learning_rate": 8.092889596520524e-08, + "loss": 0.0004, + "step": 30712 + }, + { + "epoch": 0.6, + "learning_rate": 8.09250126208691e-08, + "loss": 0.0004, + "step": 30713 + }, + { + "epoch": 0.6, + "learning_rate": 8.092112927653296e-08, + "loss": 0.001, + "step": 30714 + }, + { + "epoch": 0.6, + "learning_rate": 8.091724593219681e-08, + "loss": 0.0007, + "step": 30715 + }, + { + "epoch": 0.6, + "learning_rate": 8.091336258786067e-08, + "loss": 0.0011, + "step": 30716 + }, + { + "epoch": 0.6, + "learning_rate": 8.090947924352452e-08, + "loss": 0.0004, + "step": 30717 + }, + { + "epoch": 0.6, + "learning_rate": 8.090559589918838e-08, + "loss": 0.2696, + "step": 30718 + }, + { + "epoch": 0.6, + "learning_rate": 8.090171255485223e-08, + "loss": 0.0005, + "step": 30719 + }, + { + "epoch": 0.6, + "learning_rate": 8.089782921051609e-08, + "loss": 0.0003, + "step": 30720 + }, + { + "epoch": 0.6, + "learning_rate": 8.089394586617995e-08, + "loss": 0.0005, + "step": 30721 + }, + { + "epoch": 0.6, + "learning_rate": 8.089006252184381e-08, + "loss": 0.0005, + "step": 30722 + }, + { + "epoch": 0.6, + "learning_rate": 8.088617917750767e-08, + "loss": 0.0005, + "step": 30723 + }, + { + "epoch": 0.6, + "learning_rate": 8.088229583317153e-08, + "loss": 0.0006, + "step": 30724 + }, + { + "epoch": 0.6, + "learning_rate": 8.087841248883538e-08, + "loss": 0.0152, + "step": 30725 + }, + { + "epoch": 0.6, + "learning_rate": 8.087452914449924e-08, + "loss": 0.0006, + "step": 30726 + }, + { + "epoch": 0.6, + "learning_rate": 8.08706458001631e-08, + "loss": 0.0005, + "step": 30727 + }, + { + "epoch": 0.6, + "learning_rate": 8.086676245582696e-08, + "loss": 0.4362, + "step": 30728 + }, + { + "epoch": 0.6, + "learning_rate": 8.086287911149082e-08, + "loss": 0.0004, + "step": 30729 + }, + { + "epoch": 0.6, + "learning_rate": 8.085899576715467e-08, + "loss": 0.0005, + "step": 30730 + }, + { + "epoch": 0.6, + "learning_rate": 8.085511242281853e-08, + "loss": 0.0006, + "step": 30731 + }, + { + "epoch": 0.6, + "learning_rate": 8.085122907848239e-08, + "loss": 0.0006, + "step": 30732 + }, + { + "epoch": 0.6, + "learning_rate": 8.084734573414625e-08, + "loss": 0.0003, + "step": 30733 + }, + { + "epoch": 0.6, + "learning_rate": 8.084346238981011e-08, + "loss": 0.0006, + "step": 30734 + }, + { + "epoch": 0.6, + "learning_rate": 8.083957904547397e-08, + "loss": 0.0005, + "step": 30735 + }, + { + "epoch": 0.6, + "learning_rate": 8.083569570113782e-08, + "loss": 0.0006, + "step": 30736 + }, + { + "epoch": 0.6, + "learning_rate": 8.083181235680168e-08, + "loss": 0.0004, + "step": 30737 + }, + { + "epoch": 0.6, + "learning_rate": 8.082792901246554e-08, + "loss": 0.0005, + "step": 30738 + }, + { + "epoch": 0.6, + "learning_rate": 8.08240456681294e-08, + "loss": 0.0007, + "step": 30739 + }, + { + "epoch": 0.6, + "learning_rate": 8.082016232379326e-08, + "loss": 0.0006, + "step": 30740 + }, + { + "epoch": 0.6, + "learning_rate": 8.081627897945712e-08, + "loss": 0.0005, + "step": 30741 + }, + { + "epoch": 0.6, + "learning_rate": 8.081239563512096e-08, + "loss": 0.0005, + "step": 30742 + }, + { + "epoch": 0.6, + "learning_rate": 8.080851229078482e-08, + "loss": 0.1528, + "step": 30743 + }, + { + "epoch": 0.6, + "learning_rate": 8.080462894644868e-08, + "loss": 0.0008, + "step": 30744 + }, + { + "epoch": 0.6, + "learning_rate": 8.080074560211253e-08, + "loss": 0.0008, + "step": 30745 + }, + { + "epoch": 0.6, + "learning_rate": 8.079686225777639e-08, + "loss": 0.0006, + "step": 30746 + }, + { + "epoch": 0.6, + "learning_rate": 8.079297891344025e-08, + "loss": 0.0005, + "step": 30747 + }, + { + "epoch": 0.6, + "learning_rate": 8.078909556910411e-08, + "loss": 0.0005, + "step": 30748 + }, + { + "epoch": 0.6, + "learning_rate": 8.078521222476797e-08, + "loss": 0.0006, + "step": 30749 + }, + { + "epoch": 0.6, + "learning_rate": 8.078132888043183e-08, + "loss": 0.0098, + "step": 30750 + }, + { + "epoch": 0.6, + "learning_rate": 8.077744553609568e-08, + "loss": 0.0005, + "step": 30751 + }, + { + "epoch": 0.6, + "learning_rate": 8.077356219175954e-08, + "loss": 0.041, + "step": 30752 + }, + { + "epoch": 0.6, + "learning_rate": 8.07696788474234e-08, + "loss": 0.2122, + "step": 30753 + }, + { + "epoch": 0.6, + "learning_rate": 8.076579550308726e-08, + "loss": 0.0005, + "step": 30754 + }, + { + "epoch": 0.6, + "learning_rate": 8.076191215875112e-08, + "loss": 0.0008, + "step": 30755 + }, + { + "epoch": 0.6, + "learning_rate": 8.075802881441498e-08, + "loss": 0.0004, + "step": 30756 + }, + { + "epoch": 0.6, + "learning_rate": 8.075414547007882e-08, + "loss": 0.0004, + "step": 30757 + }, + { + "epoch": 0.6, + "learning_rate": 8.075026212574268e-08, + "loss": 0.2741, + "step": 30758 + }, + { + "epoch": 0.6, + "learning_rate": 8.074637878140654e-08, + "loss": 0.0006, + "step": 30759 + }, + { + "epoch": 0.6, + "learning_rate": 8.07424954370704e-08, + "loss": 0.0004, + "step": 30760 + }, + { + "epoch": 0.6, + "learning_rate": 8.073861209273425e-08, + "loss": 0.0005, + "step": 30761 + }, + { + "epoch": 0.6, + "learning_rate": 8.073472874839811e-08, + "loss": 0.0005, + "step": 30762 + }, + { + "epoch": 0.6, + "learning_rate": 8.073084540406197e-08, + "loss": 0.0007, + "step": 30763 + }, + { + "epoch": 0.6, + "learning_rate": 8.072696205972583e-08, + "loss": 0.0008, + "step": 30764 + }, + { + "epoch": 0.6, + "learning_rate": 8.072307871538969e-08, + "loss": 0.0006, + "step": 30765 + }, + { + "epoch": 0.6, + "learning_rate": 8.071919537105354e-08, + "loss": 0.0005, + "step": 30766 + }, + { + "epoch": 0.6, + "learning_rate": 8.07153120267174e-08, + "loss": 0.0004, + "step": 30767 + }, + { + "epoch": 0.6, + "learning_rate": 8.071142868238126e-08, + "loss": 0.0005, + "step": 30768 + }, + { + "epoch": 0.6, + "learning_rate": 8.070754533804512e-08, + "loss": 0.0006, + "step": 30769 + }, + { + "epoch": 0.6, + "learning_rate": 8.070366199370898e-08, + "loss": 0.0004, + "step": 30770 + }, + { + "epoch": 0.6, + "learning_rate": 8.069977864937284e-08, + "loss": 0.0008, + "step": 30771 + }, + { + "epoch": 0.6, + "learning_rate": 8.06958953050367e-08, + "loss": 0.0004, + "step": 30772 + }, + { + "epoch": 0.6, + "learning_rate": 8.069201196070055e-08, + "loss": 0.0005, + "step": 30773 + }, + { + "epoch": 0.6, + "learning_rate": 8.068812861636441e-08, + "loss": 0.0006, + "step": 30774 + }, + { + "epoch": 0.6, + "learning_rate": 8.068424527202826e-08, + "loss": 0.0005, + "step": 30775 + }, + { + "epoch": 0.6, + "learning_rate": 8.068036192769211e-08, + "loss": 0.0004, + "step": 30776 + }, + { + "epoch": 0.6, + "learning_rate": 8.067647858335597e-08, + "loss": 0.0005, + "step": 30777 + }, + { + "epoch": 0.6, + "learning_rate": 8.067259523901983e-08, + "loss": 0.0006, + "step": 30778 + }, + { + "epoch": 0.6, + "learning_rate": 8.066871189468369e-08, + "loss": 0.0007, + "step": 30779 + }, + { + "epoch": 0.6, + "learning_rate": 8.066482855034755e-08, + "loss": 0.0007, + "step": 30780 + }, + { + "epoch": 0.6, + "learning_rate": 8.06609452060114e-08, + "loss": 0.0066, + "step": 30781 + }, + { + "epoch": 0.6, + "learning_rate": 8.065706186167526e-08, + "loss": 0.1402, + "step": 30782 + }, + { + "epoch": 0.6, + "learning_rate": 8.065317851733912e-08, + "loss": 0.0013, + "step": 30783 + }, + { + "epoch": 0.6, + "learning_rate": 8.064929517300298e-08, + "loss": 0.0049, + "step": 30784 + }, + { + "epoch": 0.6, + "learning_rate": 8.064541182866684e-08, + "loss": 0.0005, + "step": 30785 + }, + { + "epoch": 0.6, + "learning_rate": 8.06415284843307e-08, + "loss": 0.0005, + "step": 30786 + }, + { + "epoch": 0.6, + "learning_rate": 8.063764513999455e-08, + "loss": 0.0004, + "step": 30787 + }, + { + "epoch": 0.6, + "learning_rate": 8.063376179565841e-08, + "loss": 0.0007, + "step": 30788 + }, + { + "epoch": 0.6, + "learning_rate": 8.062987845132227e-08, + "loss": 0.0005, + "step": 30789 + }, + { + "epoch": 0.6, + "learning_rate": 8.062599510698613e-08, + "loss": 0.0005, + "step": 30790 + }, + { + "epoch": 0.6, + "learning_rate": 8.062211176264999e-08, + "loss": 0.0005, + "step": 30791 + }, + { + "epoch": 0.6, + "learning_rate": 8.061822841831385e-08, + "loss": 0.0004, + "step": 30792 + }, + { + "epoch": 0.6, + "learning_rate": 8.06143450739777e-08, + "loss": 0.0057, + "step": 30793 + }, + { + "epoch": 0.6, + "learning_rate": 8.061046172964156e-08, + "loss": 0.0031, + "step": 30794 + }, + { + "epoch": 0.6, + "learning_rate": 8.060657838530542e-08, + "loss": 0.0007, + "step": 30795 + }, + { + "epoch": 0.6, + "learning_rate": 8.060269504096928e-08, + "loss": 0.0008, + "step": 30796 + }, + { + "epoch": 0.6, + "learning_rate": 8.059881169663314e-08, + "loss": 0.5858, + "step": 30797 + }, + { + "epoch": 0.6, + "learning_rate": 8.0594928352297e-08, + "loss": 0.0006, + "step": 30798 + }, + { + "epoch": 0.6, + "learning_rate": 8.059104500796085e-08, + "loss": 0.0004, + "step": 30799 + }, + { + "epoch": 0.6, + "learning_rate": 8.058716166362471e-08, + "loss": 0.0005, + "step": 30800 + }, + { + "epoch": 0.6, + "learning_rate": 8.058327831928857e-08, + "loss": 0.2626, + "step": 30801 + }, + { + "epoch": 0.6, + "learning_rate": 8.057939497495243e-08, + "loss": 0.0004, + "step": 30802 + }, + { + "epoch": 0.6, + "learning_rate": 8.057551163061629e-08, + "loss": 0.0004, + "step": 30803 + }, + { + "epoch": 0.6, + "learning_rate": 8.057162828628013e-08, + "loss": 0.0012, + "step": 30804 + }, + { + "epoch": 0.6, + "learning_rate": 8.056774494194399e-08, + "loss": 0.001, + "step": 30805 + }, + { + "epoch": 0.6, + "learning_rate": 8.056386159760785e-08, + "loss": 0.0005, + "step": 30806 + }, + { + "epoch": 0.6, + "learning_rate": 8.05599782532717e-08, + "loss": 0.0005, + "step": 30807 + }, + { + "epoch": 0.6, + "learning_rate": 8.055609490893556e-08, + "loss": 0.0006, + "step": 30808 + }, + { + "epoch": 0.6, + "learning_rate": 8.055221156459942e-08, + "loss": 0.0006, + "step": 30809 + }, + { + "epoch": 0.6, + "learning_rate": 8.054832822026328e-08, + "loss": 0.0005, + "step": 30810 + }, + { + "epoch": 0.6, + "learning_rate": 8.054444487592714e-08, + "loss": 1.072, + "step": 30811 + }, + { + "epoch": 0.6, + "learning_rate": 8.0540561531591e-08, + "loss": 0.0004, + "step": 30812 + }, + { + "epoch": 0.6, + "learning_rate": 8.053667818725486e-08, + "loss": 0.0018, + "step": 30813 + }, + { + "epoch": 0.6, + "learning_rate": 8.053279484291871e-08, + "loss": 0.0005, + "step": 30814 + }, + { + "epoch": 0.6, + "learning_rate": 8.052891149858257e-08, + "loss": 0.0109, + "step": 30815 + }, + { + "epoch": 0.6, + "learning_rate": 8.052502815424643e-08, + "loss": 0.1729, + "step": 30816 + }, + { + "epoch": 0.6, + "learning_rate": 8.052114480991029e-08, + "loss": 0.0004, + "step": 30817 + }, + { + "epoch": 0.6, + "learning_rate": 8.051726146557415e-08, + "loss": 0.0005, + "step": 30818 + }, + { + "epoch": 0.6, + "learning_rate": 8.0513378121238e-08, + "loss": 0.0005, + "step": 30819 + }, + { + "epoch": 0.6, + "learning_rate": 8.050949477690186e-08, + "loss": 0.0005, + "step": 30820 + }, + { + "epoch": 0.6, + "learning_rate": 8.050561143256572e-08, + "loss": 0.0006, + "step": 30821 + }, + { + "epoch": 0.6, + "learning_rate": 8.050172808822958e-08, + "loss": 0.0005, + "step": 30822 + }, + { + "epoch": 0.6, + "learning_rate": 8.049784474389344e-08, + "loss": 0.0007, + "step": 30823 + }, + { + "epoch": 0.6, + "learning_rate": 8.04939613995573e-08, + "loss": 0.0029, + "step": 30824 + }, + { + "epoch": 0.6, + "learning_rate": 8.049007805522115e-08, + "loss": 0.0006, + "step": 30825 + }, + { + "epoch": 0.6, + "learning_rate": 8.048619471088501e-08, + "loss": 0.0004, + "step": 30826 + }, + { + "epoch": 0.6, + "learning_rate": 8.048231136654887e-08, + "loss": 0.0006, + "step": 30827 + }, + { + "epoch": 0.6, + "learning_rate": 8.047842802221273e-08, + "loss": 0.0005, + "step": 30828 + }, + { + "epoch": 0.6, + "learning_rate": 8.047454467787659e-08, + "loss": 0.0005, + "step": 30829 + }, + { + "epoch": 0.6, + "learning_rate": 8.047066133354045e-08, + "loss": 0.0005, + "step": 30830 + }, + { + "epoch": 0.6, + "learning_rate": 8.04667779892043e-08, + "loss": 1.0782, + "step": 30831 + }, + { + "epoch": 0.6, + "learning_rate": 8.046289464486816e-08, + "loss": 0.0005, + "step": 30832 + }, + { + "epoch": 0.6, + "learning_rate": 8.045901130053201e-08, + "loss": 0.0006, + "step": 30833 + }, + { + "epoch": 0.6, + "learning_rate": 8.045512795619587e-08, + "loss": 0.0006, + "step": 30834 + }, + { + "epoch": 0.6, + "learning_rate": 8.045124461185972e-08, + "loss": 0.0017, + "step": 30835 + }, + { + "epoch": 0.6, + "learning_rate": 8.044736126752358e-08, + "loss": 0.0728, + "step": 30836 + }, + { + "epoch": 0.6, + "learning_rate": 8.044347792318744e-08, + "loss": 0.0005, + "step": 30837 + }, + { + "epoch": 0.6, + "learning_rate": 8.04395945788513e-08, + "loss": 0.0004, + "step": 30838 + }, + { + "epoch": 0.6, + "learning_rate": 8.043571123451516e-08, + "loss": 0.0004, + "step": 30839 + }, + { + "epoch": 0.6, + "learning_rate": 8.043182789017902e-08, + "loss": 0.0003, + "step": 30840 + }, + { + "epoch": 0.6, + "learning_rate": 8.042794454584287e-08, + "loss": 0.0005, + "step": 30841 + }, + { + "epoch": 0.6, + "learning_rate": 8.042406120150673e-08, + "loss": 0.0005, + "step": 30842 + }, + { + "epoch": 0.6, + "learning_rate": 8.042017785717059e-08, + "loss": 0.0004, + "step": 30843 + }, + { + "epoch": 0.6, + "learning_rate": 8.041629451283445e-08, + "loss": 0.0005, + "step": 30844 + }, + { + "epoch": 0.6, + "learning_rate": 8.04124111684983e-08, + "loss": 0.0005, + "step": 30845 + }, + { + "epoch": 0.6, + "learning_rate": 8.040852782416216e-08, + "loss": 0.002, + "step": 30846 + }, + { + "epoch": 0.6, + "learning_rate": 8.040464447982602e-08, + "loss": 0.0006, + "step": 30847 + }, + { + "epoch": 0.6, + "learning_rate": 8.040076113548988e-08, + "loss": 0.0005, + "step": 30848 + }, + { + "epoch": 0.6, + "learning_rate": 8.039687779115374e-08, + "loss": 0.0004, + "step": 30849 + }, + { + "epoch": 0.6, + "learning_rate": 8.03929944468176e-08, + "loss": 0.0005, + "step": 30850 + }, + { + "epoch": 0.6, + "learning_rate": 8.038911110248146e-08, + "loss": 0.0006, + "step": 30851 + }, + { + "epoch": 0.6, + "learning_rate": 8.038522775814531e-08, + "loss": 0.0006, + "step": 30852 + }, + { + "epoch": 0.6, + "learning_rate": 8.038134441380917e-08, + "loss": 0.0112, + "step": 30853 + }, + { + "epoch": 0.6, + "learning_rate": 8.037746106947303e-08, + "loss": 0.0004, + "step": 30854 + }, + { + "epoch": 0.6, + "learning_rate": 8.037357772513689e-08, + "loss": 0.0006, + "step": 30855 + }, + { + "epoch": 0.6, + "learning_rate": 8.036969438080075e-08, + "loss": 0.0006, + "step": 30856 + }, + { + "epoch": 0.6, + "learning_rate": 8.03658110364646e-08, + "loss": 0.0007, + "step": 30857 + }, + { + "epoch": 0.6, + "learning_rate": 8.036192769212846e-08, + "loss": 0.0004, + "step": 30858 + }, + { + "epoch": 0.6, + "learning_rate": 8.035804434779232e-08, + "loss": 0.0004, + "step": 30859 + }, + { + "epoch": 0.6, + "learning_rate": 8.035416100345618e-08, + "loss": 0.0055, + "step": 30860 + }, + { + "epoch": 0.6, + "learning_rate": 8.035027765912004e-08, + "loss": 0.0004, + "step": 30861 + }, + { + "epoch": 0.6, + "learning_rate": 8.034639431478388e-08, + "loss": 0.0004, + "step": 30862 + }, + { + "epoch": 0.6, + "learning_rate": 8.034251097044774e-08, + "loss": 0.0007, + "step": 30863 + }, + { + "epoch": 0.6, + "learning_rate": 8.03386276261116e-08, + "loss": 0.0005, + "step": 30864 + }, + { + "epoch": 0.6, + "learning_rate": 8.033474428177546e-08, + "loss": 0.0004, + "step": 30865 + }, + { + "epoch": 0.6, + "learning_rate": 8.033086093743932e-08, + "loss": 0.0006, + "step": 30866 + }, + { + "epoch": 0.6, + "learning_rate": 8.032697759310317e-08, + "loss": 0.0005, + "step": 30867 + }, + { + "epoch": 0.6, + "learning_rate": 8.032309424876703e-08, + "loss": 0.0006, + "step": 30868 + }, + { + "epoch": 0.6, + "learning_rate": 8.031921090443089e-08, + "loss": 0.0005, + "step": 30869 + }, + { + "epoch": 0.6, + "learning_rate": 8.031532756009475e-08, + "loss": 0.0004, + "step": 30870 + }, + { + "epoch": 0.6, + "learning_rate": 8.031144421575861e-08, + "loss": 0.4654, + "step": 30871 + }, + { + "epoch": 0.6, + "learning_rate": 8.030756087142247e-08, + "loss": 0.0004, + "step": 30872 + }, + { + "epoch": 0.6, + "learning_rate": 8.030367752708632e-08, + "loss": 0.0006, + "step": 30873 + }, + { + "epoch": 0.6, + "learning_rate": 8.029979418275018e-08, + "loss": 0.3275, + "step": 30874 + }, + { + "epoch": 0.6, + "learning_rate": 8.029591083841404e-08, + "loss": 0.0005, + "step": 30875 + }, + { + "epoch": 0.6, + "learning_rate": 8.02920274940779e-08, + "loss": 0.0004, + "step": 30876 + }, + { + "epoch": 0.6, + "learning_rate": 8.028814414974176e-08, + "loss": 0.0004, + "step": 30877 + }, + { + "epoch": 0.6, + "learning_rate": 8.028426080540562e-08, + "loss": 0.0004, + "step": 30878 + }, + { + "epoch": 0.6, + "learning_rate": 8.028037746106947e-08, + "loss": 0.0005, + "step": 30879 + }, + { + "epoch": 0.6, + "learning_rate": 8.027649411673333e-08, + "loss": 0.0004, + "step": 30880 + }, + { + "epoch": 0.6, + "learning_rate": 8.027261077239719e-08, + "loss": 0.0008, + "step": 30881 + }, + { + "epoch": 0.6, + "learning_rate": 8.026872742806105e-08, + "loss": 0.0004, + "step": 30882 + }, + { + "epoch": 0.6, + "learning_rate": 8.02648440837249e-08, + "loss": 0.0007, + "step": 30883 + }, + { + "epoch": 0.6, + "learning_rate": 8.026096073938876e-08, + "loss": 0.0006, + "step": 30884 + }, + { + "epoch": 0.6, + "learning_rate": 8.025707739505262e-08, + "loss": 0.0005, + "step": 30885 + }, + { + "epoch": 0.6, + "learning_rate": 8.025319405071648e-08, + "loss": 0.0006, + "step": 30886 + }, + { + "epoch": 0.6, + "learning_rate": 8.024931070638034e-08, + "loss": 0.8777, + "step": 30887 + }, + { + "epoch": 0.6, + "learning_rate": 8.02454273620442e-08, + "loss": 0.0003, + "step": 30888 + }, + { + "epoch": 0.6, + "learning_rate": 8.024154401770806e-08, + "loss": 0.0013, + "step": 30889 + }, + { + "epoch": 0.6, + "learning_rate": 8.023766067337191e-08, + "loss": 0.0005, + "step": 30890 + }, + { + "epoch": 0.6, + "learning_rate": 8.023377732903576e-08, + "loss": 0.0008, + "step": 30891 + }, + { + "epoch": 0.6, + "learning_rate": 8.022989398469962e-08, + "loss": 0.0004, + "step": 30892 + }, + { + "epoch": 0.6, + "learning_rate": 8.022601064036348e-08, + "loss": 0.721, + "step": 30893 + }, + { + "epoch": 0.6, + "learning_rate": 8.022212729602733e-08, + "loss": 0.0004, + "step": 30894 + }, + { + "epoch": 0.6, + "learning_rate": 8.021824395169119e-08, + "loss": 0.0004, + "step": 30895 + }, + { + "epoch": 0.6, + "learning_rate": 8.021436060735505e-08, + "loss": 0.0005, + "step": 30896 + }, + { + "epoch": 0.6, + "learning_rate": 8.021047726301891e-08, + "loss": 0.0007, + "step": 30897 + }, + { + "epoch": 0.6, + "learning_rate": 8.020659391868277e-08, + "loss": 0.0004, + "step": 30898 + }, + { + "epoch": 0.6, + "learning_rate": 8.020271057434663e-08, + "loss": 0.0005, + "step": 30899 + }, + { + "epoch": 0.6, + "learning_rate": 8.019882723001048e-08, + "loss": 0.0008, + "step": 30900 + }, + { + "epoch": 0.6, + "learning_rate": 8.019494388567434e-08, + "loss": 0.0005, + "step": 30901 + }, + { + "epoch": 0.6, + "learning_rate": 8.01910605413382e-08, + "loss": 0.0004, + "step": 30902 + }, + { + "epoch": 0.6, + "learning_rate": 8.018717719700206e-08, + "loss": 0.0007, + "step": 30903 + }, + { + "epoch": 0.6, + "learning_rate": 8.018329385266592e-08, + "loss": 0.0005, + "step": 30904 + }, + { + "epoch": 0.6, + "learning_rate": 8.017941050832977e-08, + "loss": 0.0005, + "step": 30905 + }, + { + "epoch": 0.6, + "learning_rate": 8.017552716399363e-08, + "loss": 0.0006, + "step": 30906 + }, + { + "epoch": 0.6, + "learning_rate": 8.017164381965749e-08, + "loss": 0.0005, + "step": 30907 + }, + { + "epoch": 0.6, + "learning_rate": 8.016776047532135e-08, + "loss": 0.0007, + "step": 30908 + }, + { + "epoch": 0.6, + "learning_rate": 8.016387713098521e-08, + "loss": 0.0005, + "step": 30909 + }, + { + "epoch": 0.6, + "learning_rate": 8.015999378664907e-08, + "loss": 0.0005, + "step": 30910 + }, + { + "epoch": 0.6, + "learning_rate": 8.015611044231292e-08, + "loss": 0.0153, + "step": 30911 + }, + { + "epoch": 0.6, + "learning_rate": 8.015222709797678e-08, + "loss": 0.2772, + "step": 30912 + }, + { + "epoch": 0.6, + "learning_rate": 8.014834375364064e-08, + "loss": 0.0006, + "step": 30913 + }, + { + "epoch": 0.6, + "learning_rate": 8.01444604093045e-08, + "loss": 0.0003, + "step": 30914 + }, + { + "epoch": 0.6, + "learning_rate": 8.014057706496836e-08, + "loss": 0.0007, + "step": 30915 + }, + { + "epoch": 0.6, + "learning_rate": 8.013669372063222e-08, + "loss": 0.0006, + "step": 30916 + }, + { + "epoch": 0.6, + "learning_rate": 8.013281037629607e-08, + "loss": 0.0006, + "step": 30917 + }, + { + "epoch": 0.6, + "learning_rate": 8.012892703195993e-08, + "loss": 0.0003, + "step": 30918 + }, + { + "epoch": 0.6, + "learning_rate": 8.012504368762378e-08, + "loss": 0.0163, + "step": 30919 + }, + { + "epoch": 0.6, + "learning_rate": 8.012116034328764e-08, + "loss": 0.0004, + "step": 30920 + }, + { + "epoch": 0.6, + "learning_rate": 8.011727699895149e-08, + "loss": 0.0005, + "step": 30921 + }, + { + "epoch": 0.6, + "learning_rate": 8.011339365461535e-08, + "loss": 0.0011, + "step": 30922 + }, + { + "epoch": 0.6, + "learning_rate": 8.010951031027921e-08, + "loss": 0.0004, + "step": 30923 + }, + { + "epoch": 0.6, + "learning_rate": 8.010562696594307e-08, + "loss": 0.0006, + "step": 30924 + }, + { + "epoch": 0.6, + "learning_rate": 8.010174362160693e-08, + "loss": 0.0004, + "step": 30925 + }, + { + "epoch": 0.6, + "learning_rate": 8.009786027727078e-08, + "loss": 0.0007, + "step": 30926 + }, + { + "epoch": 0.6, + "learning_rate": 8.009397693293464e-08, + "loss": 0.0033, + "step": 30927 + }, + { + "epoch": 0.6, + "learning_rate": 8.00900935885985e-08, + "loss": 0.0005, + "step": 30928 + }, + { + "epoch": 0.6, + "learning_rate": 8.008621024426236e-08, + "loss": 0.0005, + "step": 30929 + }, + { + "epoch": 0.6, + "learning_rate": 8.008232689992622e-08, + "loss": 0.0004, + "step": 30930 + }, + { + "epoch": 0.6, + "learning_rate": 8.007844355559008e-08, + "loss": 0.0692, + "step": 30931 + }, + { + "epoch": 0.6, + "learning_rate": 8.007456021125393e-08, + "loss": 0.0007, + "step": 30932 + }, + { + "epoch": 0.6, + "learning_rate": 8.007067686691779e-08, + "loss": 0.0006, + "step": 30933 + }, + { + "epoch": 0.6, + "learning_rate": 8.006679352258164e-08, + "loss": 0.9686, + "step": 30934 + }, + { + "epoch": 0.6, + "learning_rate": 8.00629101782455e-08, + "loss": 0.0005, + "step": 30935 + }, + { + "epoch": 0.6, + "learning_rate": 8.005902683390935e-08, + "loss": 0.0003, + "step": 30936 + }, + { + "epoch": 0.6, + "learning_rate": 8.005514348957321e-08, + "loss": 0.0005, + "step": 30937 + }, + { + "epoch": 0.6, + "learning_rate": 8.005126014523707e-08, + "loss": 0.0006, + "step": 30938 + }, + { + "epoch": 0.6, + "learning_rate": 8.004737680090093e-08, + "loss": 0.0005, + "step": 30939 + }, + { + "epoch": 0.6, + "learning_rate": 8.004349345656479e-08, + "loss": 0.0005, + "step": 30940 + }, + { + "epoch": 0.6, + "learning_rate": 8.003961011222864e-08, + "loss": 0.0005, + "step": 30941 + }, + { + "epoch": 0.6, + "learning_rate": 8.00357267678925e-08, + "loss": 0.0005, + "step": 30942 + }, + { + "epoch": 0.6, + "learning_rate": 8.003184342355636e-08, + "loss": 0.0006, + "step": 30943 + }, + { + "epoch": 0.6, + "learning_rate": 8.002796007922022e-08, + "loss": 0.4755, + "step": 30944 + }, + { + "epoch": 0.6, + "learning_rate": 8.002407673488408e-08, + "loss": 0.0006, + "step": 30945 + }, + { + "epoch": 0.6, + "learning_rate": 8.002019339054794e-08, + "loss": 0.0004, + "step": 30946 + }, + { + "epoch": 0.6, + "learning_rate": 8.00163100462118e-08, + "loss": 0.0004, + "step": 30947 + }, + { + "epoch": 0.6, + "learning_rate": 8.001242670187565e-08, + "loss": 0.0004, + "step": 30948 + }, + { + "epoch": 0.6, + "learning_rate": 8.00085433575395e-08, + "loss": 0.0041, + "step": 30949 + }, + { + "epoch": 0.6, + "learning_rate": 8.000466001320336e-08, + "loss": 0.0004, + "step": 30950 + }, + { + "epoch": 0.6, + "learning_rate": 8.000077666886721e-08, + "loss": 0.0008, + "step": 30951 + }, + { + "epoch": 0.6, + "learning_rate": 7.999689332453107e-08, + "loss": 0.0005, + "step": 30952 + }, + { + "epoch": 0.6, + "learning_rate": 7.999300998019493e-08, + "loss": 0.1441, + "step": 30953 + }, + { + "epoch": 0.6, + "learning_rate": 7.998912663585879e-08, + "loss": 0.0025, + "step": 30954 + }, + { + "epoch": 0.6, + "learning_rate": 7.998524329152265e-08, + "loss": 0.4107, + "step": 30955 + }, + { + "epoch": 0.6, + "learning_rate": 7.99813599471865e-08, + "loss": 1.1476, + "step": 30956 + }, + { + "epoch": 0.6, + "learning_rate": 7.997747660285036e-08, + "loss": 0.0005, + "step": 30957 + }, + { + "epoch": 0.6, + "learning_rate": 7.997359325851422e-08, + "loss": 0.0019, + "step": 30958 + }, + { + "epoch": 0.6, + "learning_rate": 7.996970991417808e-08, + "loss": 0.0008, + "step": 30959 + }, + { + "epoch": 0.6, + "learning_rate": 7.996582656984194e-08, + "loss": 0.0008, + "step": 30960 + }, + { + "epoch": 0.6, + "learning_rate": 7.99619432255058e-08, + "loss": 0.0592, + "step": 30961 + }, + { + "epoch": 0.6, + "learning_rate": 7.995805988116965e-08, + "loss": 0.2027, + "step": 30962 + }, + { + "epoch": 0.6, + "learning_rate": 7.995417653683351e-08, + "loss": 0.0006, + "step": 30963 + }, + { + "epoch": 0.6, + "learning_rate": 7.995029319249737e-08, + "loss": 0.0006, + "step": 30964 + }, + { + "epoch": 0.6, + "learning_rate": 7.994640984816123e-08, + "loss": 0.7471, + "step": 30965 + }, + { + "epoch": 0.6, + "learning_rate": 7.994252650382509e-08, + "loss": 0.0252, + "step": 30966 + }, + { + "epoch": 0.6, + "learning_rate": 7.993864315948895e-08, + "loss": 0.0012, + "step": 30967 + }, + { + "epoch": 0.6, + "learning_rate": 7.99347598151528e-08, + "loss": 0.0006, + "step": 30968 + }, + { + "epoch": 0.6, + "learning_rate": 7.993087647081666e-08, + "loss": 0.126, + "step": 30969 + }, + { + "epoch": 0.6, + "learning_rate": 7.992699312648052e-08, + "loss": 0.0073, + "step": 30970 + }, + { + "epoch": 0.6, + "learning_rate": 7.992310978214438e-08, + "loss": 0.0007, + "step": 30971 + }, + { + "epoch": 0.6, + "learning_rate": 7.991922643780824e-08, + "loss": 0.0017, + "step": 30972 + }, + { + "epoch": 0.6, + "learning_rate": 7.99153430934721e-08, + "loss": 0.0029, + "step": 30973 + }, + { + "epoch": 0.6, + "learning_rate": 7.991145974913595e-08, + "loss": 0.0005, + "step": 30974 + }, + { + "epoch": 0.6, + "learning_rate": 7.990757640479981e-08, + "loss": 0.0005, + "step": 30975 + }, + { + "epoch": 0.6, + "learning_rate": 7.990369306046367e-08, + "loss": 0.0005, + "step": 30976 + }, + { + "epoch": 0.6, + "learning_rate": 7.989980971612753e-08, + "loss": 0.0007, + "step": 30977 + }, + { + "epoch": 0.6, + "learning_rate": 7.989592637179137e-08, + "loss": 0.0004, + "step": 30978 + }, + { + "epoch": 0.6, + "learning_rate": 7.989204302745523e-08, + "loss": 0.0005, + "step": 30979 + }, + { + "epoch": 0.6, + "learning_rate": 7.988815968311909e-08, + "loss": 0.0004, + "step": 30980 + }, + { + "epoch": 0.6, + "learning_rate": 7.988427633878295e-08, + "loss": 0.0005, + "step": 30981 + }, + { + "epoch": 0.6, + "learning_rate": 7.98803929944468e-08, + "loss": 0.0005, + "step": 30982 + }, + { + "epoch": 0.6, + "learning_rate": 7.987650965011066e-08, + "loss": 0.0708, + "step": 30983 + }, + { + "epoch": 0.6, + "learning_rate": 7.987262630577452e-08, + "loss": 0.0004, + "step": 30984 + }, + { + "epoch": 0.6, + "learning_rate": 7.986874296143838e-08, + "loss": 0.0004, + "step": 30985 + }, + { + "epoch": 0.6, + "learning_rate": 7.986485961710224e-08, + "loss": 0.0006, + "step": 30986 + }, + { + "epoch": 0.6, + "learning_rate": 7.98609762727661e-08, + "loss": 0.0008, + "step": 30987 + }, + { + "epoch": 0.6, + "learning_rate": 7.985709292842996e-08, + "loss": 0.0005, + "step": 30988 + }, + { + "epoch": 0.6, + "learning_rate": 7.985320958409381e-08, + "loss": 0.0008, + "step": 30989 + }, + { + "epoch": 0.6, + "learning_rate": 7.984932623975767e-08, + "loss": 0.0004, + "step": 30990 + }, + { + "epoch": 0.6, + "learning_rate": 7.984544289542153e-08, + "loss": 0.0007, + "step": 30991 + }, + { + "epoch": 0.6, + "learning_rate": 7.984155955108539e-08, + "loss": 0.0548, + "step": 30992 + }, + { + "epoch": 0.6, + "learning_rate": 7.983767620674925e-08, + "loss": 0.0004, + "step": 30993 + }, + { + "epoch": 0.6, + "learning_rate": 7.98337928624131e-08, + "loss": 0.0006, + "step": 30994 + }, + { + "epoch": 0.6, + "learning_rate": 7.982990951807696e-08, + "loss": 1.1409, + "step": 30995 + }, + { + "epoch": 0.6, + "learning_rate": 7.982602617374082e-08, + "loss": 0.102, + "step": 30996 + }, + { + "epoch": 0.6, + "learning_rate": 7.982214282940468e-08, + "loss": 0.0004, + "step": 30997 + }, + { + "epoch": 0.6, + "learning_rate": 7.981825948506854e-08, + "loss": 0.0005, + "step": 30998 + }, + { + "epoch": 0.6, + "learning_rate": 7.98143761407324e-08, + "loss": 0.0009, + "step": 30999 + }, + { + "epoch": 0.6, + "learning_rate": 7.981049279639625e-08, + "loss": 0.0004, + "step": 31000 + }, + { + "epoch": 0.6, + "learning_rate": 7.980660945206011e-08, + "loss": 0.0005, + "step": 31001 + }, + { + "epoch": 0.6, + "learning_rate": 7.980272610772397e-08, + "loss": 0.017, + "step": 31002 + }, + { + "epoch": 0.6, + "learning_rate": 7.979884276338783e-08, + "loss": 0.0005, + "step": 31003 + }, + { + "epoch": 0.6, + "learning_rate": 7.979495941905169e-08, + "loss": 0.0004, + "step": 31004 + }, + { + "epoch": 0.6, + "learning_rate": 7.979107607471555e-08, + "loss": 0.0003, + "step": 31005 + }, + { + "epoch": 0.6, + "learning_rate": 7.97871927303794e-08, + "loss": 0.0005, + "step": 31006 + }, + { + "epoch": 0.6, + "learning_rate": 7.978330938604325e-08, + "loss": 0.0006, + "step": 31007 + }, + { + "epoch": 0.6, + "learning_rate": 7.977942604170711e-08, + "loss": 0.0006, + "step": 31008 + }, + { + "epoch": 0.6, + "learning_rate": 7.977554269737097e-08, + "loss": 0.0004, + "step": 31009 + }, + { + "epoch": 0.6, + "learning_rate": 7.977165935303482e-08, + "loss": 0.0021, + "step": 31010 + }, + { + "epoch": 0.6, + "learning_rate": 7.976777600869868e-08, + "loss": 0.0005, + "step": 31011 + }, + { + "epoch": 0.6, + "learning_rate": 7.976389266436254e-08, + "loss": 0.7974, + "step": 31012 + }, + { + "epoch": 0.6, + "learning_rate": 7.97600093200264e-08, + "loss": 0.0008, + "step": 31013 + }, + { + "epoch": 0.6, + "learning_rate": 7.975612597569026e-08, + "loss": 0.0005, + "step": 31014 + }, + { + "epoch": 0.6, + "learning_rate": 7.975224263135412e-08, + "loss": 0.0006, + "step": 31015 + }, + { + "epoch": 0.6, + "learning_rate": 7.974835928701797e-08, + "loss": 0.0881, + "step": 31016 + }, + { + "epoch": 0.6, + "learning_rate": 7.974447594268183e-08, + "loss": 0.0006, + "step": 31017 + }, + { + "epoch": 0.6, + "learning_rate": 7.974059259834569e-08, + "loss": 0.0006, + "step": 31018 + }, + { + "epoch": 0.6, + "learning_rate": 7.973670925400955e-08, + "loss": 0.0006, + "step": 31019 + }, + { + "epoch": 0.6, + "learning_rate": 7.97328259096734e-08, + "loss": 0.0005, + "step": 31020 + }, + { + "epoch": 0.6, + "learning_rate": 7.972894256533726e-08, + "loss": 0.0007, + "step": 31021 + }, + { + "epoch": 0.6, + "learning_rate": 7.972505922100112e-08, + "loss": 0.0005, + "step": 31022 + }, + { + "epoch": 0.6, + "learning_rate": 7.972117587666498e-08, + "loss": 0.0013, + "step": 31023 + }, + { + "epoch": 0.6, + "learning_rate": 7.971729253232884e-08, + "loss": 0.0006, + "step": 31024 + }, + { + "epoch": 0.6, + "learning_rate": 7.97134091879927e-08, + "loss": 0.0004, + "step": 31025 + }, + { + "epoch": 0.6, + "learning_rate": 7.970952584365656e-08, + "loss": 0.0004, + "step": 31026 + }, + { + "epoch": 0.6, + "learning_rate": 7.970564249932041e-08, + "loss": 0.0006, + "step": 31027 + }, + { + "epoch": 0.6, + "learning_rate": 7.970175915498427e-08, + "loss": 0.0567, + "step": 31028 + }, + { + "epoch": 0.6, + "learning_rate": 7.969787581064813e-08, + "loss": 0.0006, + "step": 31029 + }, + { + "epoch": 0.6, + "learning_rate": 7.969399246631199e-08, + "loss": 0.0006, + "step": 31030 + }, + { + "epoch": 0.6, + "learning_rate": 7.969010912197585e-08, + "loss": 0.0012, + "step": 31031 + }, + { + "epoch": 0.6, + "learning_rate": 7.96862257776397e-08, + "loss": 0.0005, + "step": 31032 + }, + { + "epoch": 0.6, + "learning_rate": 7.968234243330356e-08, + "loss": 0.0006, + "step": 31033 + }, + { + "epoch": 0.6, + "learning_rate": 7.967845908896742e-08, + "loss": 0.0034, + "step": 31034 + }, + { + "epoch": 0.6, + "learning_rate": 7.967457574463128e-08, + "loss": 0.0006, + "step": 31035 + }, + { + "epoch": 0.6, + "learning_rate": 7.967069240029513e-08, + "loss": 0.0005, + "step": 31036 + }, + { + "epoch": 0.6, + "learning_rate": 7.966680905595898e-08, + "loss": 0.0004, + "step": 31037 + }, + { + "epoch": 0.6, + "learning_rate": 7.966292571162284e-08, + "loss": 0.0006, + "step": 31038 + }, + { + "epoch": 0.6, + "learning_rate": 7.96590423672867e-08, + "loss": 0.0004, + "step": 31039 + }, + { + "epoch": 0.6, + "learning_rate": 7.965515902295056e-08, + "loss": 0.0012, + "step": 31040 + }, + { + "epoch": 0.6, + "learning_rate": 7.965127567861442e-08, + "loss": 0.7588, + "step": 31041 + }, + { + "epoch": 0.6, + "learning_rate": 7.964739233427827e-08, + "loss": 0.0487, + "step": 31042 + }, + { + "epoch": 0.6, + "learning_rate": 7.964350898994213e-08, + "loss": 0.0005, + "step": 31043 + }, + { + "epoch": 0.6, + "learning_rate": 7.963962564560599e-08, + "loss": 0.0007, + "step": 31044 + }, + { + "epoch": 0.6, + "learning_rate": 7.963574230126985e-08, + "loss": 0.0007, + "step": 31045 + }, + { + "epoch": 0.6, + "learning_rate": 7.963185895693371e-08, + "loss": 0.0005, + "step": 31046 + }, + { + "epoch": 0.6, + "learning_rate": 7.962797561259757e-08, + "loss": 0.0005, + "step": 31047 + }, + { + "epoch": 0.6, + "learning_rate": 7.962409226826142e-08, + "loss": 0.0005, + "step": 31048 + }, + { + "epoch": 0.6, + "learning_rate": 7.962020892392528e-08, + "loss": 0.0006, + "step": 31049 + }, + { + "epoch": 0.6, + "learning_rate": 7.961632557958914e-08, + "loss": 0.0005, + "step": 31050 + }, + { + "epoch": 0.6, + "learning_rate": 7.9612442235253e-08, + "loss": 0.0089, + "step": 31051 + }, + { + "epoch": 0.6, + "learning_rate": 7.960855889091686e-08, + "loss": 0.0007, + "step": 31052 + }, + { + "epoch": 0.6, + "learning_rate": 7.960467554658072e-08, + "loss": 0.0007, + "step": 31053 + }, + { + "epoch": 0.6, + "learning_rate": 7.960079220224457e-08, + "loss": 0.0006, + "step": 31054 + }, + { + "epoch": 0.6, + "learning_rate": 7.959690885790843e-08, + "loss": 0.0006, + "step": 31055 + }, + { + "epoch": 0.6, + "learning_rate": 7.959302551357229e-08, + "loss": 0.0005, + "step": 31056 + }, + { + "epoch": 0.6, + "learning_rate": 7.958914216923615e-08, + "loss": 0.0008, + "step": 31057 + }, + { + "epoch": 0.6, + "learning_rate": 7.95852588249e-08, + "loss": 0.6147, + "step": 31058 + }, + { + "epoch": 0.6, + "learning_rate": 7.958137548056386e-08, + "loss": 0.0006, + "step": 31059 + }, + { + "epoch": 0.6, + "learning_rate": 7.957749213622772e-08, + "loss": 0.0003, + "step": 31060 + }, + { + "epoch": 0.6, + "learning_rate": 7.957360879189158e-08, + "loss": 0.0006, + "step": 31061 + }, + { + "epoch": 0.6, + "learning_rate": 7.956972544755544e-08, + "loss": 0.0007, + "step": 31062 + }, + { + "epoch": 0.6, + "learning_rate": 7.95658421032193e-08, + "loss": 0.0056, + "step": 31063 + }, + { + "epoch": 0.6, + "learning_rate": 7.956195875888316e-08, + "loss": 0.0006, + "step": 31064 + }, + { + "epoch": 0.6, + "learning_rate": 7.9558075414547e-08, + "loss": 0.0011, + "step": 31065 + }, + { + "epoch": 0.6, + "learning_rate": 7.955419207021086e-08, + "loss": 0.0005, + "step": 31066 + }, + { + "epoch": 0.6, + "learning_rate": 7.955030872587472e-08, + "loss": 0.0007, + "step": 31067 + }, + { + "epoch": 0.6, + "learning_rate": 7.954642538153858e-08, + "loss": 0.0004, + "step": 31068 + }, + { + "epoch": 0.6, + "learning_rate": 7.954254203720243e-08, + "loss": 0.0005, + "step": 31069 + }, + { + "epoch": 0.6, + "learning_rate": 7.953865869286629e-08, + "loss": 0.0004, + "step": 31070 + }, + { + "epoch": 0.6, + "learning_rate": 7.953477534853015e-08, + "loss": 0.3085, + "step": 31071 + }, + { + "epoch": 0.6, + "learning_rate": 7.953089200419401e-08, + "loss": 0.0021, + "step": 31072 + }, + { + "epoch": 0.6, + "learning_rate": 7.952700865985787e-08, + "loss": 0.0007, + "step": 31073 + }, + { + "epoch": 0.6, + "learning_rate": 7.952312531552173e-08, + "loss": 0.0005, + "step": 31074 + }, + { + "epoch": 0.6, + "learning_rate": 7.951924197118558e-08, + "loss": 0.0003, + "step": 31075 + }, + { + "epoch": 0.6, + "learning_rate": 7.951535862684944e-08, + "loss": 0.0006, + "step": 31076 + }, + { + "epoch": 0.6, + "learning_rate": 7.95114752825133e-08, + "loss": 0.0005, + "step": 31077 + }, + { + "epoch": 0.6, + "learning_rate": 7.950759193817716e-08, + "loss": 0.0006, + "step": 31078 + }, + { + "epoch": 0.6, + "learning_rate": 7.950370859384102e-08, + "loss": 0.0006, + "step": 31079 + }, + { + "epoch": 0.6, + "learning_rate": 7.949982524950487e-08, + "loss": 0.0006, + "step": 31080 + }, + { + "epoch": 0.6, + "learning_rate": 7.949594190516873e-08, + "loss": 0.0005, + "step": 31081 + }, + { + "epoch": 0.6, + "learning_rate": 7.949205856083259e-08, + "loss": 0.0012, + "step": 31082 + }, + { + "epoch": 0.6, + "learning_rate": 7.948817521649645e-08, + "loss": 0.0004, + "step": 31083 + }, + { + "epoch": 0.6, + "learning_rate": 7.948429187216031e-08, + "loss": 0.0011, + "step": 31084 + }, + { + "epoch": 0.6, + "learning_rate": 7.948040852782417e-08, + "loss": 0.0022, + "step": 31085 + }, + { + "epoch": 0.6, + "learning_rate": 7.947652518348802e-08, + "loss": 0.0005, + "step": 31086 + }, + { + "epoch": 0.6, + "learning_rate": 7.947264183915188e-08, + "loss": 0.0004, + "step": 31087 + }, + { + "epoch": 0.6, + "learning_rate": 7.946875849481574e-08, + "loss": 0.0008, + "step": 31088 + }, + { + "epoch": 0.6, + "learning_rate": 7.94648751504796e-08, + "loss": 0.0006, + "step": 31089 + }, + { + "epoch": 0.6, + "learning_rate": 7.946099180614346e-08, + "loss": 0.0018, + "step": 31090 + }, + { + "epoch": 0.6, + "learning_rate": 7.945710846180732e-08, + "loss": 0.0005, + "step": 31091 + }, + { + "epoch": 0.6, + "learning_rate": 7.945322511747117e-08, + "loss": 0.1402, + "step": 31092 + }, + { + "epoch": 0.6, + "learning_rate": 7.944934177313503e-08, + "loss": 0.0053, + "step": 31093 + }, + { + "epoch": 0.6, + "learning_rate": 7.944545842879888e-08, + "loss": 0.7246, + "step": 31094 + }, + { + "epoch": 0.6, + "learning_rate": 7.944157508446274e-08, + "loss": 0.0005, + "step": 31095 + }, + { + "epoch": 0.6, + "learning_rate": 7.94376917401266e-08, + "loss": 0.0004, + "step": 31096 + }, + { + "epoch": 0.6, + "learning_rate": 7.943380839579045e-08, + "loss": 0.003, + "step": 31097 + }, + { + "epoch": 0.6, + "learning_rate": 7.942992505145431e-08, + "loss": 0.0005, + "step": 31098 + }, + { + "epoch": 0.6, + "learning_rate": 7.942604170711817e-08, + "loss": 0.0007, + "step": 31099 + }, + { + "epoch": 0.6, + "learning_rate": 7.942215836278203e-08, + "loss": 0.0004, + "step": 31100 + }, + { + "epoch": 0.6, + "learning_rate": 7.941827501844588e-08, + "loss": 0.0011, + "step": 31101 + }, + { + "epoch": 0.6, + "learning_rate": 7.941439167410974e-08, + "loss": 0.0006, + "step": 31102 + }, + { + "epoch": 0.6, + "learning_rate": 7.94105083297736e-08, + "loss": 0.0012, + "step": 31103 + }, + { + "epoch": 0.6, + "learning_rate": 7.940662498543746e-08, + "loss": 0.0005, + "step": 31104 + }, + { + "epoch": 0.6, + "learning_rate": 7.940274164110132e-08, + "loss": 0.001, + "step": 31105 + }, + { + "epoch": 0.6, + "learning_rate": 7.939885829676518e-08, + "loss": 0.0005, + "step": 31106 + }, + { + "epoch": 0.6, + "learning_rate": 7.939497495242903e-08, + "loss": 0.0006, + "step": 31107 + }, + { + "epoch": 0.6, + "learning_rate": 7.939109160809289e-08, + "loss": 0.0007, + "step": 31108 + }, + { + "epoch": 0.6, + "learning_rate": 7.938720826375675e-08, + "loss": 0.0004, + "step": 31109 + }, + { + "epoch": 0.6, + "learning_rate": 7.938332491942061e-08, + "loss": 0.0008, + "step": 31110 + }, + { + "epoch": 0.6, + "learning_rate": 7.937944157508445e-08, + "loss": 0.0004, + "step": 31111 + }, + { + "epoch": 0.6, + "learning_rate": 7.937555823074831e-08, + "loss": 0.0008, + "step": 31112 + }, + { + "epoch": 0.6, + "learning_rate": 7.937167488641217e-08, + "loss": 0.0003, + "step": 31113 + }, + { + "epoch": 0.6, + "learning_rate": 7.936779154207603e-08, + "loss": 0.0007, + "step": 31114 + }, + { + "epoch": 0.6, + "learning_rate": 7.936390819773989e-08, + "loss": 0.0007, + "step": 31115 + }, + { + "epoch": 0.6, + "learning_rate": 7.936002485340375e-08, + "loss": 0.0005, + "step": 31116 + }, + { + "epoch": 0.6, + "learning_rate": 7.93561415090676e-08, + "loss": 0.0029, + "step": 31117 + }, + { + "epoch": 0.6, + "learning_rate": 7.935225816473146e-08, + "loss": 0.0008, + "step": 31118 + }, + { + "epoch": 0.6, + "learning_rate": 7.934837482039532e-08, + "loss": 0.0005, + "step": 31119 + }, + { + "epoch": 0.6, + "learning_rate": 7.934449147605918e-08, + "loss": 0.0006, + "step": 31120 + }, + { + "epoch": 0.6, + "learning_rate": 7.934060813172304e-08, + "loss": 0.0004, + "step": 31121 + }, + { + "epoch": 0.6, + "learning_rate": 7.93367247873869e-08, + "loss": 0.0004, + "step": 31122 + }, + { + "epoch": 0.6, + "learning_rate": 7.933284144305075e-08, + "loss": 0.0006, + "step": 31123 + }, + { + "epoch": 0.6, + "learning_rate": 7.932895809871461e-08, + "loss": 0.0005, + "step": 31124 + }, + { + "epoch": 0.6, + "learning_rate": 7.932507475437847e-08, + "loss": 0.0005, + "step": 31125 + }, + { + "epoch": 0.6, + "learning_rate": 7.932119141004231e-08, + "loss": 0.0005, + "step": 31126 + }, + { + "epoch": 0.6, + "learning_rate": 7.931730806570617e-08, + "loss": 0.0293, + "step": 31127 + }, + { + "epoch": 0.6, + "learning_rate": 7.931342472137003e-08, + "loss": 0.0293, + "step": 31128 + }, + { + "epoch": 0.6, + "learning_rate": 7.930954137703389e-08, + "loss": 0.0005, + "step": 31129 + }, + { + "epoch": 0.6, + "learning_rate": 7.930565803269775e-08, + "loss": 0.0004, + "step": 31130 + }, + { + "epoch": 0.6, + "learning_rate": 7.93017746883616e-08, + "loss": 0.0005, + "step": 31131 + }, + { + "epoch": 0.6, + "learning_rate": 7.929789134402546e-08, + "loss": 0.7106, + "step": 31132 + }, + { + "epoch": 0.6, + "learning_rate": 7.929400799968932e-08, + "loss": 0.0008, + "step": 31133 + }, + { + "epoch": 0.6, + "learning_rate": 7.929012465535318e-08, + "loss": 0.0004, + "step": 31134 + }, + { + "epoch": 0.6, + "learning_rate": 7.928624131101704e-08, + "loss": 0.0006, + "step": 31135 + }, + { + "epoch": 0.6, + "learning_rate": 7.92823579666809e-08, + "loss": 0.0006, + "step": 31136 + }, + { + "epoch": 0.6, + "learning_rate": 7.927847462234475e-08, + "loss": 0.0005, + "step": 31137 + }, + { + "epoch": 0.6, + "learning_rate": 7.927459127800861e-08, + "loss": 0.0005, + "step": 31138 + }, + { + "epoch": 0.6, + "learning_rate": 7.927070793367247e-08, + "loss": 0.0006, + "step": 31139 + }, + { + "epoch": 0.6, + "learning_rate": 7.926682458933633e-08, + "loss": 0.0003, + "step": 31140 + }, + { + "epoch": 0.6, + "learning_rate": 7.926294124500019e-08, + "loss": 0.0005, + "step": 31141 + }, + { + "epoch": 0.6, + "learning_rate": 7.925905790066405e-08, + "loss": 0.0004, + "step": 31142 + }, + { + "epoch": 0.6, + "learning_rate": 7.92551745563279e-08, + "loss": 0.0005, + "step": 31143 + }, + { + "epoch": 0.6, + "learning_rate": 7.925129121199176e-08, + "loss": 0.0005, + "step": 31144 + }, + { + "epoch": 0.6, + "learning_rate": 7.924740786765562e-08, + "loss": 0.0006, + "step": 31145 + }, + { + "epoch": 0.6, + "learning_rate": 7.924352452331948e-08, + "loss": 0.0005, + "step": 31146 + }, + { + "epoch": 0.6, + "learning_rate": 7.923964117898334e-08, + "loss": 0.039, + "step": 31147 + }, + { + "epoch": 0.6, + "learning_rate": 7.92357578346472e-08, + "loss": 0.0007, + "step": 31148 + }, + { + "epoch": 0.6, + "learning_rate": 7.923187449031105e-08, + "loss": 0.0003, + "step": 31149 + }, + { + "epoch": 0.6, + "learning_rate": 7.922799114597491e-08, + "loss": 0.0004, + "step": 31150 + }, + { + "epoch": 0.6, + "learning_rate": 7.922410780163877e-08, + "loss": 0.0004, + "step": 31151 + }, + { + "epoch": 0.6, + "learning_rate": 7.922022445730262e-08, + "loss": 0.7884, + "step": 31152 + }, + { + "epoch": 0.6, + "learning_rate": 7.921634111296647e-08, + "loss": 0.5727, + "step": 31153 + }, + { + "epoch": 0.6, + "learning_rate": 7.921245776863033e-08, + "loss": 0.0181, + "step": 31154 + }, + { + "epoch": 0.6, + "learning_rate": 7.920857442429419e-08, + "loss": 0.0005, + "step": 31155 + }, + { + "epoch": 0.6, + "learning_rate": 7.920469107995805e-08, + "loss": 0.0012, + "step": 31156 + }, + { + "epoch": 0.6, + "learning_rate": 7.92008077356219e-08, + "loss": 0.0007, + "step": 31157 + }, + { + "epoch": 0.6, + "learning_rate": 7.919692439128576e-08, + "loss": 0.4578, + "step": 31158 + }, + { + "epoch": 0.6, + "learning_rate": 7.919304104694962e-08, + "loss": 0.0004, + "step": 31159 + }, + { + "epoch": 0.6, + "learning_rate": 7.918915770261348e-08, + "loss": 0.0114, + "step": 31160 + }, + { + "epoch": 0.6, + "learning_rate": 7.918527435827734e-08, + "loss": 0.0005, + "step": 31161 + }, + { + "epoch": 0.6, + "learning_rate": 7.91813910139412e-08, + "loss": 0.0004, + "step": 31162 + }, + { + "epoch": 0.6, + "learning_rate": 7.917750766960506e-08, + "loss": 0.0005, + "step": 31163 + }, + { + "epoch": 0.6, + "learning_rate": 7.917362432526891e-08, + "loss": 0.0003, + "step": 31164 + }, + { + "epoch": 0.6, + "learning_rate": 7.916974098093277e-08, + "loss": 0.0003, + "step": 31165 + }, + { + "epoch": 0.6, + "learning_rate": 7.916585763659663e-08, + "loss": 0.0005, + "step": 31166 + }, + { + "epoch": 0.6, + "learning_rate": 7.916197429226049e-08, + "loss": 0.0005, + "step": 31167 + }, + { + "epoch": 0.6, + "learning_rate": 7.915809094792435e-08, + "loss": 0.0004, + "step": 31168 + }, + { + "epoch": 0.6, + "learning_rate": 7.91542076035882e-08, + "loss": 0.0053, + "step": 31169 + }, + { + "epoch": 0.6, + "learning_rate": 7.915032425925206e-08, + "loss": 0.0004, + "step": 31170 + }, + { + "epoch": 0.6, + "learning_rate": 7.914644091491592e-08, + "loss": 0.0004, + "step": 31171 + }, + { + "epoch": 0.6, + "learning_rate": 7.914255757057978e-08, + "loss": 0.0004, + "step": 31172 + }, + { + "epoch": 0.6, + "learning_rate": 7.913867422624364e-08, + "loss": 0.0004, + "step": 31173 + }, + { + "epoch": 0.6, + "learning_rate": 7.91347908819075e-08, + "loss": 0.0709, + "step": 31174 + }, + { + "epoch": 0.6, + "learning_rate": 7.913090753757135e-08, + "loss": 0.0004, + "step": 31175 + }, + { + "epoch": 0.6, + "learning_rate": 7.912702419323521e-08, + "loss": 0.0005, + "step": 31176 + }, + { + "epoch": 0.6, + "learning_rate": 7.912314084889907e-08, + "loss": 0.0098, + "step": 31177 + }, + { + "epoch": 0.6, + "learning_rate": 7.911925750456293e-08, + "loss": 0.0005, + "step": 31178 + }, + { + "epoch": 0.6, + "learning_rate": 7.911537416022679e-08, + "loss": 0.0004, + "step": 31179 + }, + { + "epoch": 0.6, + "learning_rate": 7.911149081589065e-08, + "loss": 0.0007, + "step": 31180 + }, + { + "epoch": 0.6, + "learning_rate": 7.910760747155449e-08, + "loss": 0.0005, + "step": 31181 + }, + { + "epoch": 0.6, + "learning_rate": 7.910372412721835e-08, + "loss": 0.0009, + "step": 31182 + }, + { + "epoch": 0.6, + "learning_rate": 7.909984078288221e-08, + "loss": 0.0004, + "step": 31183 + }, + { + "epoch": 0.6, + "learning_rate": 7.909595743854607e-08, + "loss": 0.0004, + "step": 31184 + }, + { + "epoch": 0.6, + "learning_rate": 7.909207409420992e-08, + "loss": 0.0006, + "step": 31185 + }, + { + "epoch": 0.6, + "learning_rate": 7.908819074987378e-08, + "loss": 0.0005, + "step": 31186 + }, + { + "epoch": 0.6, + "learning_rate": 7.908430740553764e-08, + "loss": 0.0004, + "step": 31187 + }, + { + "epoch": 0.6, + "learning_rate": 7.90804240612015e-08, + "loss": 0.0116, + "step": 31188 + }, + { + "epoch": 0.61, + "learning_rate": 7.907654071686536e-08, + "loss": 0.0004, + "step": 31189 + }, + { + "epoch": 0.61, + "learning_rate": 7.907265737252922e-08, + "loss": 0.2085, + "step": 31190 + }, + { + "epoch": 0.61, + "learning_rate": 7.906877402819307e-08, + "loss": 0.0004, + "step": 31191 + }, + { + "epoch": 0.61, + "learning_rate": 7.906489068385693e-08, + "loss": 0.0007, + "step": 31192 + }, + { + "epoch": 0.61, + "learning_rate": 7.906100733952079e-08, + "loss": 0.0003, + "step": 31193 + }, + { + "epoch": 0.61, + "learning_rate": 7.905712399518465e-08, + "loss": 0.0004, + "step": 31194 + }, + { + "epoch": 0.61, + "learning_rate": 7.905324065084851e-08, + "loss": 0.0008, + "step": 31195 + }, + { + "epoch": 0.61, + "learning_rate": 7.904935730651236e-08, + "loss": 0.0006, + "step": 31196 + }, + { + "epoch": 0.61, + "learning_rate": 7.904547396217622e-08, + "loss": 0.0003, + "step": 31197 + }, + { + "epoch": 0.61, + "learning_rate": 7.904159061784008e-08, + "loss": 0.0006, + "step": 31198 + }, + { + "epoch": 0.61, + "learning_rate": 7.903770727350394e-08, + "loss": 0.0006, + "step": 31199 + }, + { + "epoch": 0.61, + "learning_rate": 7.90338239291678e-08, + "loss": 0.0004, + "step": 31200 + }, + { + "epoch": 0.61, + "learning_rate": 7.902994058483166e-08, + "loss": 0.0008, + "step": 31201 + }, + { + "epoch": 0.61, + "learning_rate": 7.902605724049551e-08, + "loss": 0.0006, + "step": 31202 + }, + { + "epoch": 0.61, + "learning_rate": 7.902217389615937e-08, + "loss": 0.6258, + "step": 31203 + }, + { + "epoch": 0.61, + "learning_rate": 7.901829055182323e-08, + "loss": 0.0008, + "step": 31204 + }, + { + "epoch": 0.61, + "learning_rate": 7.901440720748709e-08, + "loss": 0.0007, + "step": 31205 + }, + { + "epoch": 0.61, + "learning_rate": 7.901052386315095e-08, + "loss": 0.0008, + "step": 31206 + }, + { + "epoch": 0.61, + "learning_rate": 7.90066405188148e-08, + "loss": 0.0004, + "step": 31207 + }, + { + "epoch": 0.61, + "learning_rate": 7.900275717447866e-08, + "loss": 0.0009, + "step": 31208 + }, + { + "epoch": 0.61, + "learning_rate": 7.899887383014252e-08, + "loss": 0.0067, + "step": 31209 + }, + { + "epoch": 0.61, + "learning_rate": 7.899499048580637e-08, + "loss": 0.0003, + "step": 31210 + }, + { + "epoch": 0.61, + "learning_rate": 7.899110714147023e-08, + "loss": 0.0004, + "step": 31211 + }, + { + "epoch": 0.61, + "learning_rate": 7.898722379713408e-08, + "loss": 0.0005, + "step": 31212 + }, + { + "epoch": 0.61, + "learning_rate": 7.898334045279794e-08, + "loss": 0.0005, + "step": 31213 + }, + { + "epoch": 0.61, + "learning_rate": 7.89794571084618e-08, + "loss": 0.454, + "step": 31214 + }, + { + "epoch": 0.61, + "learning_rate": 7.897557376412566e-08, + "loss": 0.0004, + "step": 31215 + }, + { + "epoch": 0.61, + "learning_rate": 7.897169041978952e-08, + "loss": 0.0004, + "step": 31216 + }, + { + "epoch": 0.61, + "learning_rate": 7.896780707545337e-08, + "loss": 0.0004, + "step": 31217 + }, + { + "epoch": 0.61, + "learning_rate": 7.896392373111723e-08, + "loss": 0.0007, + "step": 31218 + }, + { + "epoch": 0.61, + "learning_rate": 7.896004038678109e-08, + "loss": 0.0005, + "step": 31219 + }, + { + "epoch": 0.61, + "learning_rate": 7.895615704244495e-08, + "loss": 0.0004, + "step": 31220 + }, + { + "epoch": 0.61, + "learning_rate": 7.895227369810881e-08, + "loss": 0.0013, + "step": 31221 + }, + { + "epoch": 0.61, + "learning_rate": 7.894839035377267e-08, + "loss": 0.0185, + "step": 31222 + }, + { + "epoch": 0.61, + "learning_rate": 7.894450700943652e-08, + "loss": 0.0006, + "step": 31223 + }, + { + "epoch": 0.61, + "learning_rate": 7.894062366510038e-08, + "loss": 0.0006, + "step": 31224 + }, + { + "epoch": 0.61, + "learning_rate": 7.893674032076424e-08, + "loss": 1.3574, + "step": 31225 + }, + { + "epoch": 0.61, + "learning_rate": 7.89328569764281e-08, + "loss": 0.0005, + "step": 31226 + }, + { + "epoch": 0.61, + "learning_rate": 7.892897363209196e-08, + "loss": 0.0004, + "step": 31227 + }, + { + "epoch": 0.61, + "learning_rate": 7.892509028775582e-08, + "loss": 0.0003, + "step": 31228 + }, + { + "epoch": 0.61, + "learning_rate": 7.892120694341967e-08, + "loss": 1.1469, + "step": 31229 + }, + { + "epoch": 0.61, + "learning_rate": 7.891732359908353e-08, + "loss": 0.0007, + "step": 31230 + }, + { + "epoch": 0.61, + "learning_rate": 7.891344025474739e-08, + "loss": 0.0705, + "step": 31231 + }, + { + "epoch": 0.61, + "learning_rate": 7.890955691041125e-08, + "loss": 0.0005, + "step": 31232 + }, + { + "epoch": 0.61, + "learning_rate": 7.890567356607511e-08, + "loss": 0.0004, + "step": 31233 + }, + { + "epoch": 0.61, + "learning_rate": 7.890179022173896e-08, + "loss": 0.0005, + "step": 31234 + }, + { + "epoch": 0.61, + "learning_rate": 7.889790687740282e-08, + "loss": 0.0005, + "step": 31235 + }, + { + "epoch": 0.61, + "learning_rate": 7.889402353306668e-08, + "loss": 0.0034, + "step": 31236 + }, + { + "epoch": 0.61, + "learning_rate": 7.889014018873054e-08, + "loss": 0.0005, + "step": 31237 + }, + { + "epoch": 0.61, + "learning_rate": 7.88862568443944e-08, + "loss": 0.0005, + "step": 31238 + }, + { + "epoch": 0.61, + "learning_rate": 7.888237350005824e-08, + "loss": 0.0005, + "step": 31239 + }, + { + "epoch": 0.61, + "learning_rate": 7.88784901557221e-08, + "loss": 0.0003, + "step": 31240 + }, + { + "epoch": 0.61, + "learning_rate": 7.887460681138596e-08, + "loss": 0.0007, + "step": 31241 + }, + { + "epoch": 0.61, + "learning_rate": 7.887072346704982e-08, + "loss": 0.0004, + "step": 31242 + }, + { + "epoch": 0.61, + "learning_rate": 7.886684012271368e-08, + "loss": 0.0005, + "step": 31243 + }, + { + "epoch": 0.61, + "learning_rate": 7.886295677837753e-08, + "loss": 0.0004, + "step": 31244 + }, + { + "epoch": 0.61, + "learning_rate": 7.885907343404139e-08, + "loss": 0.0005, + "step": 31245 + }, + { + "epoch": 0.61, + "learning_rate": 7.885519008970525e-08, + "loss": 1.2805, + "step": 31246 + }, + { + "epoch": 0.61, + "learning_rate": 7.885130674536911e-08, + "loss": 0.9245, + "step": 31247 + }, + { + "epoch": 0.61, + "learning_rate": 7.884742340103297e-08, + "loss": 0.0204, + "step": 31248 + }, + { + "epoch": 0.61, + "learning_rate": 7.884354005669683e-08, + "loss": 0.0004, + "step": 31249 + }, + { + "epoch": 0.61, + "learning_rate": 7.883965671236068e-08, + "loss": 0.0006, + "step": 31250 + }, + { + "epoch": 0.61, + "learning_rate": 7.883577336802454e-08, + "loss": 0.0154, + "step": 31251 + }, + { + "epoch": 0.61, + "learning_rate": 7.88318900236884e-08, + "loss": 0.0004, + "step": 31252 + }, + { + "epoch": 0.61, + "learning_rate": 7.882800667935226e-08, + "loss": 0.013, + "step": 31253 + }, + { + "epoch": 0.61, + "learning_rate": 7.882412333501612e-08, + "loss": 0.0005, + "step": 31254 + }, + { + "epoch": 0.61, + "learning_rate": 7.882023999067997e-08, + "loss": 0.0003, + "step": 31255 + }, + { + "epoch": 0.61, + "learning_rate": 7.881635664634383e-08, + "loss": 0.0003, + "step": 31256 + }, + { + "epoch": 0.61, + "learning_rate": 7.881247330200769e-08, + "loss": 0.0004, + "step": 31257 + }, + { + "epoch": 0.61, + "learning_rate": 7.880858995767155e-08, + "loss": 0.0005, + "step": 31258 + }, + { + "epoch": 0.61, + "learning_rate": 7.880470661333541e-08, + "loss": 0.0004, + "step": 31259 + }, + { + "epoch": 0.61, + "learning_rate": 7.880082326899927e-08, + "loss": 0.0004, + "step": 31260 + }, + { + "epoch": 0.61, + "learning_rate": 7.879693992466312e-08, + "loss": 0.0005, + "step": 31261 + }, + { + "epoch": 0.61, + "learning_rate": 7.879305658032698e-08, + "loss": 0.0005, + "step": 31262 + }, + { + "epoch": 0.61, + "learning_rate": 7.878917323599084e-08, + "loss": 0.0006, + "step": 31263 + }, + { + "epoch": 0.61, + "learning_rate": 7.87852898916547e-08, + "loss": 0.0033, + "step": 31264 + }, + { + "epoch": 0.61, + "learning_rate": 7.878140654731856e-08, + "loss": 0.0004, + "step": 31265 + }, + { + "epoch": 0.61, + "learning_rate": 7.877752320298242e-08, + "loss": 0.0005, + "step": 31266 + }, + { + "epoch": 0.61, + "learning_rate": 7.877363985864627e-08, + "loss": 0.0006, + "step": 31267 + }, + { + "epoch": 0.61, + "learning_rate": 7.876975651431012e-08, + "loss": 0.0005, + "step": 31268 + }, + { + "epoch": 0.61, + "learning_rate": 7.876587316997398e-08, + "loss": 0.0107, + "step": 31269 + }, + { + "epoch": 0.61, + "learning_rate": 7.876198982563784e-08, + "loss": 0.0004, + "step": 31270 + }, + { + "epoch": 0.61, + "learning_rate": 7.87581064813017e-08, + "loss": 0.0005, + "step": 31271 + }, + { + "epoch": 0.61, + "learning_rate": 7.875422313696555e-08, + "loss": 0.0006, + "step": 31272 + }, + { + "epoch": 0.61, + "learning_rate": 7.875033979262941e-08, + "loss": 0.0006, + "step": 31273 + }, + { + "epoch": 0.61, + "learning_rate": 7.874645644829327e-08, + "loss": 0.0005, + "step": 31274 + }, + { + "epoch": 0.61, + "learning_rate": 7.874257310395713e-08, + "loss": 0.0017, + "step": 31275 + }, + { + "epoch": 0.61, + "learning_rate": 7.873868975962098e-08, + "loss": 0.0006, + "step": 31276 + }, + { + "epoch": 0.61, + "learning_rate": 7.873480641528484e-08, + "loss": 1.157, + "step": 31277 + }, + { + "epoch": 0.61, + "learning_rate": 7.87309230709487e-08, + "loss": 0.0005, + "step": 31278 + }, + { + "epoch": 0.61, + "learning_rate": 7.872703972661256e-08, + "loss": 0.4055, + "step": 31279 + }, + { + "epoch": 0.61, + "learning_rate": 7.872315638227642e-08, + "loss": 0.0004, + "step": 31280 + }, + { + "epoch": 0.61, + "learning_rate": 7.871927303794028e-08, + "loss": 1.0751, + "step": 31281 + }, + { + "epoch": 0.61, + "learning_rate": 7.871538969360413e-08, + "loss": 0.7471, + "step": 31282 + }, + { + "epoch": 0.61, + "learning_rate": 7.871150634926799e-08, + "loss": 0.0452, + "step": 31283 + }, + { + "epoch": 0.61, + "learning_rate": 7.870762300493185e-08, + "loss": 0.0005, + "step": 31284 + }, + { + "epoch": 0.61, + "learning_rate": 7.870373966059571e-08, + "loss": 0.0007, + "step": 31285 + }, + { + "epoch": 0.61, + "learning_rate": 7.869985631625957e-08, + "loss": 0.0006, + "step": 31286 + }, + { + "epoch": 0.61, + "learning_rate": 7.869597297192343e-08, + "loss": 0.1589, + "step": 31287 + }, + { + "epoch": 0.61, + "learning_rate": 7.869208962758727e-08, + "loss": 0.0006, + "step": 31288 + }, + { + "epoch": 0.61, + "learning_rate": 7.868820628325113e-08, + "loss": 0.5952, + "step": 31289 + }, + { + "epoch": 0.61, + "learning_rate": 7.868432293891499e-08, + "loss": 0.0011, + "step": 31290 + }, + { + "epoch": 0.61, + "learning_rate": 7.868043959457885e-08, + "loss": 0.0004, + "step": 31291 + }, + { + "epoch": 0.61, + "learning_rate": 7.86765562502427e-08, + "loss": 0.295, + "step": 31292 + }, + { + "epoch": 0.61, + "learning_rate": 7.867267290590656e-08, + "loss": 0.0004, + "step": 31293 + }, + { + "epoch": 0.61, + "learning_rate": 7.866878956157042e-08, + "loss": 0.0004, + "step": 31294 + }, + { + "epoch": 0.61, + "learning_rate": 7.866490621723428e-08, + "loss": 0.0005, + "step": 31295 + }, + { + "epoch": 0.61, + "learning_rate": 7.866102287289814e-08, + "loss": 0.9934, + "step": 31296 + }, + { + "epoch": 0.61, + "learning_rate": 7.8657139528562e-08, + "loss": 0.0011, + "step": 31297 + }, + { + "epoch": 0.61, + "learning_rate": 7.865325618422585e-08, + "loss": 0.0005, + "step": 31298 + }, + { + "epoch": 0.61, + "learning_rate": 7.864937283988971e-08, + "loss": 0.0005, + "step": 31299 + }, + { + "epoch": 0.61, + "learning_rate": 7.864548949555357e-08, + "loss": 0.0004, + "step": 31300 + }, + { + "epoch": 0.61, + "learning_rate": 7.864160615121743e-08, + "loss": 0.0005, + "step": 31301 + }, + { + "epoch": 0.61, + "learning_rate": 7.863772280688129e-08, + "loss": 0.0005, + "step": 31302 + }, + { + "epoch": 0.61, + "learning_rate": 7.863383946254513e-08, + "loss": 0.0007, + "step": 31303 + }, + { + "epoch": 0.61, + "learning_rate": 7.862995611820899e-08, + "loss": 0.0005, + "step": 31304 + }, + { + "epoch": 0.61, + "learning_rate": 7.862607277387285e-08, + "loss": 0.001, + "step": 31305 + }, + { + "epoch": 0.61, + "learning_rate": 7.86221894295367e-08, + "loss": 0.0016, + "step": 31306 + }, + { + "epoch": 0.61, + "learning_rate": 7.861830608520056e-08, + "loss": 0.0005, + "step": 31307 + }, + { + "epoch": 0.61, + "learning_rate": 7.861442274086442e-08, + "loss": 0.6777, + "step": 31308 + }, + { + "epoch": 0.61, + "learning_rate": 7.861053939652828e-08, + "loss": 0.0014, + "step": 31309 + }, + { + "epoch": 0.61, + "learning_rate": 7.860665605219214e-08, + "loss": 0.0005, + "step": 31310 + }, + { + "epoch": 0.61, + "learning_rate": 7.8602772707856e-08, + "loss": 0.0005, + "step": 31311 + }, + { + "epoch": 0.61, + "learning_rate": 7.859888936351986e-08, + "loss": 0.0008, + "step": 31312 + }, + { + "epoch": 0.61, + "learning_rate": 7.859500601918371e-08, + "loss": 0.0003, + "step": 31313 + }, + { + "epoch": 0.61, + "learning_rate": 7.859112267484757e-08, + "loss": 0.0005, + "step": 31314 + }, + { + "epoch": 0.61, + "learning_rate": 7.858723933051143e-08, + "loss": 0.0009, + "step": 31315 + }, + { + "epoch": 0.61, + "learning_rate": 7.858335598617529e-08, + "loss": 0.0007, + "step": 31316 + }, + { + "epoch": 0.61, + "learning_rate": 7.857947264183915e-08, + "loss": 0.0006, + "step": 31317 + }, + { + "epoch": 0.61, + "learning_rate": 7.8575589297503e-08, + "loss": 0.5351, + "step": 31318 + }, + { + "epoch": 0.61, + "learning_rate": 7.857170595316686e-08, + "loss": 0.0005, + "step": 31319 + }, + { + "epoch": 0.61, + "learning_rate": 7.856782260883072e-08, + "loss": 0.0005, + "step": 31320 + }, + { + "epoch": 0.61, + "learning_rate": 7.856393926449458e-08, + "loss": 0.0018, + "step": 31321 + }, + { + "epoch": 0.61, + "learning_rate": 7.856005592015844e-08, + "loss": 0.0006, + "step": 31322 + }, + { + "epoch": 0.61, + "learning_rate": 7.85561725758223e-08, + "loss": 0.0005, + "step": 31323 + }, + { + "epoch": 0.61, + "learning_rate": 7.855228923148615e-08, + "loss": 0.0006, + "step": 31324 + }, + { + "epoch": 0.61, + "learning_rate": 7.854840588715001e-08, + "loss": 0.0005, + "step": 31325 + }, + { + "epoch": 0.61, + "learning_rate": 7.854452254281386e-08, + "loss": 0.0005, + "step": 31326 + }, + { + "epoch": 0.61, + "learning_rate": 7.854063919847772e-08, + "loss": 0.0006, + "step": 31327 + }, + { + "epoch": 0.61, + "learning_rate": 7.853675585414157e-08, + "loss": 0.0059, + "step": 31328 + }, + { + "epoch": 0.61, + "learning_rate": 7.853287250980543e-08, + "loss": 0.0006, + "step": 31329 + }, + { + "epoch": 0.61, + "learning_rate": 7.852898916546929e-08, + "loss": 0.1019, + "step": 31330 + }, + { + "epoch": 0.61, + "learning_rate": 7.852510582113315e-08, + "loss": 0.0005, + "step": 31331 + }, + { + "epoch": 0.61, + "learning_rate": 7.852122247679701e-08, + "loss": 0.1189, + "step": 31332 + }, + { + "epoch": 0.61, + "learning_rate": 7.851733913246086e-08, + "loss": 0.0005, + "step": 31333 + }, + { + "epoch": 0.61, + "learning_rate": 7.851345578812472e-08, + "loss": 0.0007, + "step": 31334 + }, + { + "epoch": 0.61, + "learning_rate": 7.850957244378858e-08, + "loss": 0.0005, + "step": 31335 + }, + { + "epoch": 0.61, + "learning_rate": 7.850568909945244e-08, + "loss": 0.9337, + "step": 31336 + }, + { + "epoch": 0.61, + "learning_rate": 7.85018057551163e-08, + "loss": 0.489, + "step": 31337 + }, + { + "epoch": 0.61, + "learning_rate": 7.849792241078016e-08, + "loss": 0.0007, + "step": 31338 + }, + { + "epoch": 0.61, + "learning_rate": 7.849403906644401e-08, + "loss": 0.0004, + "step": 31339 + }, + { + "epoch": 0.61, + "learning_rate": 7.849015572210787e-08, + "loss": 0.0037, + "step": 31340 + }, + { + "epoch": 0.61, + "learning_rate": 7.848627237777173e-08, + "loss": 0.0037, + "step": 31341 + }, + { + "epoch": 0.61, + "learning_rate": 7.848238903343559e-08, + "loss": 0.0004, + "step": 31342 + }, + { + "epoch": 0.61, + "learning_rate": 7.847850568909945e-08, + "loss": 0.0003, + "step": 31343 + }, + { + "epoch": 0.61, + "learning_rate": 7.84746223447633e-08, + "loss": 0.0006, + "step": 31344 + }, + { + "epoch": 0.61, + "learning_rate": 7.847073900042716e-08, + "loss": 0.005, + "step": 31345 + }, + { + "epoch": 0.61, + "learning_rate": 7.846685565609102e-08, + "loss": 0.6778, + "step": 31346 + }, + { + "epoch": 0.61, + "learning_rate": 7.846297231175488e-08, + "loss": 0.0008, + "step": 31347 + }, + { + "epoch": 0.61, + "learning_rate": 7.845908896741874e-08, + "loss": 0.0005, + "step": 31348 + }, + { + "epoch": 0.61, + "learning_rate": 7.84552056230826e-08, + "loss": 0.0004, + "step": 31349 + }, + { + "epoch": 0.61, + "learning_rate": 7.845132227874646e-08, + "loss": 0.278, + "step": 31350 + }, + { + "epoch": 0.61, + "learning_rate": 7.844743893441031e-08, + "loss": 0.0005, + "step": 31351 + }, + { + "epoch": 0.61, + "learning_rate": 7.844355559007417e-08, + "loss": 0.0012, + "step": 31352 + }, + { + "epoch": 0.61, + "learning_rate": 7.843967224573803e-08, + "loss": 0.0005, + "step": 31353 + }, + { + "epoch": 0.61, + "learning_rate": 7.843578890140189e-08, + "loss": 0.0005, + "step": 31354 + }, + { + "epoch": 0.61, + "learning_rate": 7.843190555706573e-08, + "loss": 0.0006, + "step": 31355 + }, + { + "epoch": 0.61, + "learning_rate": 7.842802221272959e-08, + "loss": 0.0004, + "step": 31356 + }, + { + "epoch": 0.61, + "learning_rate": 7.842413886839345e-08, + "loss": 0.0004, + "step": 31357 + }, + { + "epoch": 0.61, + "learning_rate": 7.842025552405731e-08, + "loss": 1.1445, + "step": 31358 + }, + { + "epoch": 0.61, + "learning_rate": 7.841637217972117e-08, + "loss": 0.0006, + "step": 31359 + }, + { + "epoch": 0.61, + "learning_rate": 7.841248883538502e-08, + "loss": 0.1463, + "step": 31360 + }, + { + "epoch": 0.61, + "learning_rate": 7.840860549104888e-08, + "loss": 0.0006, + "step": 31361 + }, + { + "epoch": 0.61, + "learning_rate": 7.840472214671274e-08, + "loss": 0.0082, + "step": 31362 + }, + { + "epoch": 0.61, + "learning_rate": 7.84008388023766e-08, + "loss": 0.0004, + "step": 31363 + }, + { + "epoch": 0.61, + "learning_rate": 7.839695545804046e-08, + "loss": 0.0004, + "step": 31364 + }, + { + "epoch": 0.61, + "learning_rate": 7.839307211370432e-08, + "loss": 0.0004, + "step": 31365 + }, + { + "epoch": 0.61, + "learning_rate": 7.838918876936817e-08, + "loss": 0.1575, + "step": 31366 + }, + { + "epoch": 0.61, + "learning_rate": 7.838530542503203e-08, + "loss": 0.0008, + "step": 31367 + }, + { + "epoch": 0.61, + "learning_rate": 7.838142208069589e-08, + "loss": 0.0006, + "step": 31368 + }, + { + "epoch": 0.61, + "learning_rate": 7.837753873635975e-08, + "loss": 0.0005, + "step": 31369 + }, + { + "epoch": 0.61, + "learning_rate": 7.837365539202361e-08, + "loss": 0.0005, + "step": 31370 + }, + { + "epoch": 0.61, + "learning_rate": 7.836977204768747e-08, + "loss": 0.0004, + "step": 31371 + }, + { + "epoch": 0.61, + "learning_rate": 7.836588870335132e-08, + "loss": 0.0005, + "step": 31372 + }, + { + "epoch": 0.61, + "learning_rate": 7.836200535901518e-08, + "loss": 0.0004, + "step": 31373 + }, + { + "epoch": 0.61, + "learning_rate": 7.835812201467904e-08, + "loss": 0.0006, + "step": 31374 + }, + { + "epoch": 0.61, + "learning_rate": 7.83542386703429e-08, + "loss": 0.0007, + "step": 31375 + }, + { + "epoch": 0.61, + "learning_rate": 7.835035532600676e-08, + "loss": 0.0003, + "step": 31376 + }, + { + "epoch": 0.61, + "learning_rate": 7.834647198167061e-08, + "loss": 0.0005, + "step": 31377 + }, + { + "epoch": 0.61, + "learning_rate": 7.834258863733447e-08, + "loss": 0.0004, + "step": 31378 + }, + { + "epoch": 0.61, + "learning_rate": 7.833870529299833e-08, + "loss": 0.0025, + "step": 31379 + }, + { + "epoch": 0.61, + "learning_rate": 7.833482194866219e-08, + "loss": 0.0008, + "step": 31380 + }, + { + "epoch": 0.61, + "learning_rate": 7.833093860432605e-08, + "loss": 0.0004, + "step": 31381 + }, + { + "epoch": 0.61, + "learning_rate": 7.83270552599899e-08, + "loss": 0.0007, + "step": 31382 + }, + { + "epoch": 0.61, + "learning_rate": 7.832317191565376e-08, + "loss": 0.0005, + "step": 31383 + }, + { + "epoch": 0.61, + "learning_rate": 7.831928857131761e-08, + "loss": 1.5496, + "step": 31384 + }, + { + "epoch": 0.61, + "learning_rate": 7.831540522698147e-08, + "loss": 0.0004, + "step": 31385 + }, + { + "epoch": 0.61, + "learning_rate": 7.831152188264533e-08, + "loss": 0.0004, + "step": 31386 + }, + { + "epoch": 0.61, + "learning_rate": 7.830763853830918e-08, + "loss": 0.0018, + "step": 31387 + }, + { + "epoch": 0.61, + "learning_rate": 7.830375519397304e-08, + "loss": 0.0003, + "step": 31388 + }, + { + "epoch": 0.61, + "learning_rate": 7.82998718496369e-08, + "loss": 0.0005, + "step": 31389 + }, + { + "epoch": 0.61, + "learning_rate": 7.829598850530076e-08, + "loss": 0.0004, + "step": 31390 + }, + { + "epoch": 0.61, + "learning_rate": 7.829210516096462e-08, + "loss": 0.0015, + "step": 31391 + }, + { + "epoch": 0.61, + "learning_rate": 7.828822181662847e-08, + "loss": 0.0005, + "step": 31392 + }, + { + "epoch": 0.61, + "learning_rate": 7.828433847229233e-08, + "loss": 0.0032, + "step": 31393 + }, + { + "epoch": 0.61, + "learning_rate": 7.828045512795619e-08, + "loss": 0.0005, + "step": 31394 + }, + { + "epoch": 0.61, + "learning_rate": 7.827657178362005e-08, + "loss": 0.0007, + "step": 31395 + }, + { + "epoch": 0.61, + "learning_rate": 7.827268843928391e-08, + "loss": 0.0023, + "step": 31396 + }, + { + "epoch": 0.61, + "learning_rate": 7.826880509494777e-08, + "loss": 0.0098, + "step": 31397 + }, + { + "epoch": 0.61, + "learning_rate": 7.826492175061162e-08, + "loss": 0.0003, + "step": 31398 + }, + { + "epoch": 0.61, + "learning_rate": 7.826103840627548e-08, + "loss": 0.0006, + "step": 31399 + }, + { + "epoch": 0.61, + "learning_rate": 7.825715506193934e-08, + "loss": 0.0006, + "step": 31400 + }, + { + "epoch": 0.61, + "learning_rate": 7.82532717176032e-08, + "loss": 0.0004, + "step": 31401 + }, + { + "epoch": 0.61, + "learning_rate": 7.824938837326706e-08, + "loss": 0.2838, + "step": 31402 + }, + { + "epoch": 0.61, + "learning_rate": 7.824550502893092e-08, + "loss": 0.0027, + "step": 31403 + }, + { + "epoch": 0.61, + "learning_rate": 7.824162168459477e-08, + "loss": 0.0159, + "step": 31404 + }, + { + "epoch": 0.61, + "learning_rate": 7.823773834025863e-08, + "loss": 0.0004, + "step": 31405 + }, + { + "epoch": 0.61, + "learning_rate": 7.823385499592249e-08, + "loss": 0.0005, + "step": 31406 + }, + { + "epoch": 0.61, + "learning_rate": 7.822997165158635e-08, + "loss": 0.0004, + "step": 31407 + }, + { + "epoch": 0.61, + "learning_rate": 7.822608830725021e-08, + "loss": 0.0004, + "step": 31408 + }, + { + "epoch": 0.61, + "learning_rate": 7.822220496291407e-08, + "loss": 0.8154, + "step": 31409 + }, + { + "epoch": 0.61, + "learning_rate": 7.821832161857792e-08, + "loss": 0.0012, + "step": 31410 + }, + { + "epoch": 0.61, + "learning_rate": 7.821443827424178e-08, + "loss": 0.3223, + "step": 31411 + }, + { + "epoch": 0.61, + "learning_rate": 7.821055492990564e-08, + "loss": 0.0005, + "step": 31412 + }, + { + "epoch": 0.61, + "learning_rate": 7.820667158556948e-08, + "loss": 0.024, + "step": 31413 + }, + { + "epoch": 0.61, + "learning_rate": 7.820278824123334e-08, + "loss": 0.0004, + "step": 31414 + }, + { + "epoch": 0.61, + "learning_rate": 7.81989048968972e-08, + "loss": 0.0004, + "step": 31415 + }, + { + "epoch": 0.61, + "learning_rate": 7.819502155256106e-08, + "loss": 0.0005, + "step": 31416 + }, + { + "epoch": 0.61, + "learning_rate": 7.819113820822492e-08, + "loss": 0.0005, + "step": 31417 + }, + { + "epoch": 0.61, + "learning_rate": 7.818725486388878e-08, + "loss": 0.0009, + "step": 31418 + }, + { + "epoch": 0.61, + "learning_rate": 7.818337151955263e-08, + "loss": 0.0005, + "step": 31419 + }, + { + "epoch": 0.61, + "learning_rate": 7.817948817521649e-08, + "loss": 0.0017, + "step": 31420 + }, + { + "epoch": 0.61, + "learning_rate": 7.817560483088035e-08, + "loss": 0.0004, + "step": 31421 + }, + { + "epoch": 0.61, + "learning_rate": 7.817172148654421e-08, + "loss": 0.0005, + "step": 31422 + }, + { + "epoch": 0.61, + "learning_rate": 7.816783814220807e-08, + "loss": 0.076, + "step": 31423 + }, + { + "epoch": 0.61, + "learning_rate": 7.816395479787193e-08, + "loss": 0.0004, + "step": 31424 + }, + { + "epoch": 0.61, + "learning_rate": 7.816007145353578e-08, + "loss": 0.0004, + "step": 31425 + }, + { + "epoch": 0.61, + "learning_rate": 7.815618810919964e-08, + "loss": 0.0005, + "step": 31426 + }, + { + "epoch": 0.61, + "learning_rate": 7.81523047648635e-08, + "loss": 0.0005, + "step": 31427 + }, + { + "epoch": 0.61, + "learning_rate": 7.814842142052736e-08, + "loss": 0.0004, + "step": 31428 + }, + { + "epoch": 0.61, + "learning_rate": 7.814453807619122e-08, + "loss": 0.0007, + "step": 31429 + }, + { + "epoch": 0.61, + "learning_rate": 7.814065473185507e-08, + "loss": 0.0004, + "step": 31430 + }, + { + "epoch": 0.61, + "learning_rate": 7.813677138751893e-08, + "loss": 0.0005, + "step": 31431 + }, + { + "epoch": 0.61, + "learning_rate": 7.813288804318279e-08, + "loss": 0.0008, + "step": 31432 + }, + { + "epoch": 0.61, + "learning_rate": 7.812900469884665e-08, + "loss": 0.0004, + "step": 31433 + }, + { + "epoch": 0.61, + "learning_rate": 7.812512135451051e-08, + "loss": 0.002, + "step": 31434 + }, + { + "epoch": 0.61, + "learning_rate": 7.812123801017437e-08, + "loss": 0.0012, + "step": 31435 + }, + { + "epoch": 0.61, + "learning_rate": 7.811735466583822e-08, + "loss": 0.0004, + "step": 31436 + }, + { + "epoch": 0.61, + "learning_rate": 7.811347132150208e-08, + "loss": 0.0004, + "step": 31437 + }, + { + "epoch": 0.61, + "learning_rate": 7.810958797716594e-08, + "loss": 0.0106, + "step": 31438 + }, + { + "epoch": 0.61, + "learning_rate": 7.81057046328298e-08, + "loss": 1.0064, + "step": 31439 + }, + { + "epoch": 0.61, + "learning_rate": 7.810182128849366e-08, + "loss": 0.0005, + "step": 31440 + }, + { + "epoch": 0.61, + "learning_rate": 7.809793794415752e-08, + "loss": 0.0004, + "step": 31441 + }, + { + "epoch": 0.61, + "learning_rate": 7.809405459982136e-08, + "loss": 0.0005, + "step": 31442 + }, + { + "epoch": 0.61, + "learning_rate": 7.809017125548522e-08, + "loss": 0.0008, + "step": 31443 + }, + { + "epoch": 0.61, + "learning_rate": 7.808628791114908e-08, + "loss": 0.0005, + "step": 31444 + }, + { + "epoch": 0.61, + "learning_rate": 7.808240456681294e-08, + "loss": 0.0005, + "step": 31445 + }, + { + "epoch": 0.61, + "learning_rate": 7.80785212224768e-08, + "loss": 0.0006, + "step": 31446 + }, + { + "epoch": 0.61, + "learning_rate": 7.807463787814065e-08, + "loss": 0.0005, + "step": 31447 + }, + { + "epoch": 0.61, + "learning_rate": 7.807075453380451e-08, + "loss": 0.0003, + "step": 31448 + }, + { + "epoch": 0.61, + "learning_rate": 7.806687118946837e-08, + "loss": 0.2538, + "step": 31449 + }, + { + "epoch": 0.61, + "learning_rate": 7.806298784513223e-08, + "loss": 0.0006, + "step": 31450 + }, + { + "epoch": 0.61, + "learning_rate": 7.805910450079608e-08, + "loss": 0.0145, + "step": 31451 + }, + { + "epoch": 0.61, + "learning_rate": 7.805522115645994e-08, + "loss": 0.0005, + "step": 31452 + }, + { + "epoch": 0.61, + "learning_rate": 7.80513378121238e-08, + "loss": 0.0006, + "step": 31453 + }, + { + "epoch": 0.61, + "learning_rate": 7.804745446778766e-08, + "loss": 1.1135, + "step": 31454 + }, + { + "epoch": 0.61, + "learning_rate": 7.804357112345152e-08, + "loss": 0.0005, + "step": 31455 + }, + { + "epoch": 0.61, + "learning_rate": 7.803968777911538e-08, + "loss": 0.0004, + "step": 31456 + }, + { + "epoch": 0.61, + "learning_rate": 7.803580443477923e-08, + "loss": 0.0005, + "step": 31457 + }, + { + "epoch": 0.61, + "learning_rate": 7.803192109044309e-08, + "loss": 0.0005, + "step": 31458 + }, + { + "epoch": 0.61, + "learning_rate": 7.802803774610695e-08, + "loss": 0.0005, + "step": 31459 + }, + { + "epoch": 0.61, + "learning_rate": 7.802415440177081e-08, + "loss": 0.0004, + "step": 31460 + }, + { + "epoch": 0.61, + "learning_rate": 7.802027105743467e-08, + "loss": 0.0014, + "step": 31461 + }, + { + "epoch": 0.61, + "learning_rate": 7.801638771309853e-08, + "loss": 0.0009, + "step": 31462 + }, + { + "epoch": 0.61, + "learning_rate": 7.801250436876238e-08, + "loss": 0.0004, + "step": 31463 + }, + { + "epoch": 0.61, + "learning_rate": 7.800862102442624e-08, + "loss": 0.9768, + "step": 31464 + }, + { + "epoch": 0.61, + "learning_rate": 7.800473768009009e-08, + "loss": 0.0006, + "step": 31465 + }, + { + "epoch": 0.61, + "learning_rate": 7.800085433575395e-08, + "loss": 0.0005, + "step": 31466 + }, + { + "epoch": 0.61, + "learning_rate": 7.79969709914178e-08, + "loss": 0.0007, + "step": 31467 + }, + { + "epoch": 0.61, + "learning_rate": 7.799308764708166e-08, + "loss": 0.0005, + "step": 31468 + }, + { + "epoch": 0.61, + "learning_rate": 7.798920430274552e-08, + "loss": 0.0005, + "step": 31469 + }, + { + "epoch": 0.61, + "learning_rate": 7.798532095840938e-08, + "loss": 0.0004, + "step": 31470 + }, + { + "epoch": 0.61, + "learning_rate": 7.798143761407324e-08, + "loss": 0.0005, + "step": 31471 + }, + { + "epoch": 0.61, + "learning_rate": 7.79775542697371e-08, + "loss": 0.0004, + "step": 31472 + }, + { + "epoch": 0.61, + "learning_rate": 7.797367092540095e-08, + "loss": 0.0004, + "step": 31473 + }, + { + "epoch": 0.61, + "learning_rate": 7.796978758106481e-08, + "loss": 0.0007, + "step": 31474 + }, + { + "epoch": 0.61, + "learning_rate": 7.796590423672867e-08, + "loss": 0.0011, + "step": 31475 + }, + { + "epoch": 0.61, + "learning_rate": 7.796202089239253e-08, + "loss": 0.0006, + "step": 31476 + }, + { + "epoch": 0.61, + "learning_rate": 7.795813754805639e-08, + "loss": 0.0004, + "step": 31477 + }, + { + "epoch": 0.61, + "learning_rate": 7.795425420372024e-08, + "loss": 0.0003, + "step": 31478 + }, + { + "epoch": 0.61, + "learning_rate": 7.79503708593841e-08, + "loss": 0.0005, + "step": 31479 + }, + { + "epoch": 0.61, + "learning_rate": 7.794648751504795e-08, + "loss": 1.3375, + "step": 31480 + }, + { + "epoch": 0.61, + "learning_rate": 7.79426041707118e-08, + "loss": 0.0008, + "step": 31481 + }, + { + "epoch": 0.61, + "learning_rate": 7.793872082637566e-08, + "loss": 0.0005, + "step": 31482 + }, + { + "epoch": 0.61, + "learning_rate": 7.793483748203952e-08, + "loss": 0.0106, + "step": 31483 + }, + { + "epoch": 0.61, + "learning_rate": 7.793095413770338e-08, + "loss": 0.0004, + "step": 31484 + }, + { + "epoch": 0.61, + "learning_rate": 7.792707079336724e-08, + "loss": 0.0005, + "step": 31485 + }, + { + "epoch": 0.61, + "learning_rate": 7.79231874490311e-08, + "loss": 0.0007, + "step": 31486 + }, + { + "epoch": 0.61, + "learning_rate": 7.791930410469496e-08, + "loss": 0.0005, + "step": 31487 + }, + { + "epoch": 0.61, + "learning_rate": 7.791542076035881e-08, + "loss": 0.0008, + "step": 31488 + }, + { + "epoch": 0.61, + "learning_rate": 7.791153741602267e-08, + "loss": 0.0005, + "step": 31489 + }, + { + "epoch": 0.61, + "learning_rate": 7.790765407168653e-08, + "loss": 1.043, + "step": 31490 + }, + { + "epoch": 0.61, + "learning_rate": 7.790377072735039e-08, + "loss": 0.0008, + "step": 31491 + }, + { + "epoch": 0.61, + "learning_rate": 7.789988738301425e-08, + "loss": 0.0005, + "step": 31492 + }, + { + "epoch": 0.61, + "learning_rate": 7.78960040386781e-08, + "loss": 0.0004, + "step": 31493 + }, + { + "epoch": 0.61, + "learning_rate": 7.789212069434196e-08, + "loss": 0.0004, + "step": 31494 + }, + { + "epoch": 0.61, + "learning_rate": 7.788823735000582e-08, + "loss": 0.0426, + "step": 31495 + }, + { + "epoch": 0.61, + "learning_rate": 7.788435400566968e-08, + "loss": 0.005, + "step": 31496 + }, + { + "epoch": 0.61, + "learning_rate": 7.788047066133354e-08, + "loss": 0.001, + "step": 31497 + }, + { + "epoch": 0.61, + "learning_rate": 7.78765873169974e-08, + "loss": 0.0006, + "step": 31498 + }, + { + "epoch": 0.61, + "learning_rate": 7.787270397266125e-08, + "loss": 0.0005, + "step": 31499 + }, + { + "epoch": 0.61, + "learning_rate": 7.78688206283251e-08, + "loss": 0.0003, + "step": 31500 + }, + { + "epoch": 0.61, + "learning_rate": 7.786493728398896e-08, + "loss": 0.0004, + "step": 31501 + }, + { + "epoch": 0.61, + "learning_rate": 7.786105393965282e-08, + "loss": 0.0044, + "step": 31502 + }, + { + "epoch": 0.61, + "learning_rate": 7.785717059531667e-08, + "loss": 0.1661, + "step": 31503 + }, + { + "epoch": 0.61, + "learning_rate": 7.785328725098053e-08, + "loss": 0.0008, + "step": 31504 + }, + { + "epoch": 0.61, + "learning_rate": 7.784940390664439e-08, + "loss": 0.0006, + "step": 31505 + }, + { + "epoch": 0.61, + "learning_rate": 7.784552056230825e-08, + "loss": 0.0007, + "step": 31506 + }, + { + "epoch": 0.61, + "learning_rate": 7.784163721797211e-08, + "loss": 0.0036, + "step": 31507 + }, + { + "epoch": 0.61, + "learning_rate": 7.783775387363597e-08, + "loss": 0.0006, + "step": 31508 + }, + { + "epoch": 0.61, + "learning_rate": 7.783387052929982e-08, + "loss": 0.0006, + "step": 31509 + }, + { + "epoch": 0.61, + "learning_rate": 7.782998718496368e-08, + "loss": 0.0007, + "step": 31510 + }, + { + "epoch": 0.61, + "learning_rate": 7.782610384062754e-08, + "loss": 0.2713, + "step": 31511 + }, + { + "epoch": 0.61, + "learning_rate": 7.78222204962914e-08, + "loss": 0.0005, + "step": 31512 + }, + { + "epoch": 0.61, + "learning_rate": 7.781833715195526e-08, + "loss": 0.0008, + "step": 31513 + }, + { + "epoch": 0.61, + "learning_rate": 7.781445380761911e-08, + "loss": 0.0004, + "step": 31514 + }, + { + "epoch": 0.61, + "learning_rate": 7.781057046328297e-08, + "loss": 0.0006, + "step": 31515 + }, + { + "epoch": 0.61, + "learning_rate": 7.780668711894683e-08, + "loss": 0.0018, + "step": 31516 + }, + { + "epoch": 0.61, + "learning_rate": 7.780280377461069e-08, + "loss": 0.0004, + "step": 31517 + }, + { + "epoch": 0.61, + "learning_rate": 7.779892043027455e-08, + "loss": 0.0005, + "step": 31518 + }, + { + "epoch": 0.61, + "learning_rate": 7.77950370859384e-08, + "loss": 0.0005, + "step": 31519 + }, + { + "epoch": 0.61, + "learning_rate": 7.779115374160226e-08, + "loss": 0.0005, + "step": 31520 + }, + { + "epoch": 0.61, + "learning_rate": 7.778727039726612e-08, + "loss": 0.3107, + "step": 31521 + }, + { + "epoch": 0.61, + "learning_rate": 7.778338705292998e-08, + "loss": 0.0004, + "step": 31522 + }, + { + "epoch": 0.61, + "learning_rate": 7.777950370859384e-08, + "loss": 0.0004, + "step": 31523 + }, + { + "epoch": 0.61, + "learning_rate": 7.77756203642577e-08, + "loss": 0.0004, + "step": 31524 + }, + { + "epoch": 0.61, + "learning_rate": 7.777173701992156e-08, + "loss": 0.0004, + "step": 31525 + }, + { + "epoch": 0.61, + "learning_rate": 7.776785367558541e-08, + "loss": 0.0492, + "step": 31526 + }, + { + "epoch": 0.61, + "learning_rate": 7.776397033124927e-08, + "loss": 0.0005, + "step": 31527 + }, + { + "epoch": 0.61, + "learning_rate": 7.776008698691313e-08, + "loss": 0.0005, + "step": 31528 + }, + { + "epoch": 0.61, + "learning_rate": 7.775620364257697e-08, + "loss": 0.0007, + "step": 31529 + }, + { + "epoch": 0.61, + "learning_rate": 7.775232029824083e-08, + "loss": 0.0006, + "step": 31530 + }, + { + "epoch": 0.61, + "learning_rate": 7.774843695390469e-08, + "loss": 0.0004, + "step": 31531 + }, + { + "epoch": 0.61, + "learning_rate": 7.774455360956855e-08, + "loss": 0.0006, + "step": 31532 + }, + { + "epoch": 0.61, + "learning_rate": 7.774067026523241e-08, + "loss": 0.0006, + "step": 31533 + }, + { + "epoch": 0.61, + "learning_rate": 7.773678692089627e-08, + "loss": 0.0005, + "step": 31534 + }, + { + "epoch": 0.61, + "learning_rate": 7.773290357656012e-08, + "loss": 0.0004, + "step": 31535 + }, + { + "epoch": 0.61, + "learning_rate": 7.772902023222398e-08, + "loss": 0.0004, + "step": 31536 + }, + { + "epoch": 0.61, + "learning_rate": 7.772513688788784e-08, + "loss": 0.0006, + "step": 31537 + }, + { + "epoch": 0.61, + "learning_rate": 7.77212535435517e-08, + "loss": 0.0006, + "step": 31538 + }, + { + "epoch": 0.61, + "learning_rate": 7.771737019921556e-08, + "loss": 0.0005, + "step": 31539 + }, + { + "epoch": 0.61, + "learning_rate": 7.771348685487942e-08, + "loss": 0.0016, + "step": 31540 + }, + { + "epoch": 0.61, + "learning_rate": 7.770960351054327e-08, + "loss": 0.0007, + "step": 31541 + }, + { + "epoch": 0.61, + "learning_rate": 7.770572016620713e-08, + "loss": 0.0005, + "step": 31542 + }, + { + "epoch": 0.61, + "learning_rate": 7.770183682187099e-08, + "loss": 0.0006, + "step": 31543 + }, + { + "epoch": 0.61, + "learning_rate": 7.769795347753485e-08, + "loss": 0.272, + "step": 31544 + }, + { + "epoch": 0.61, + "learning_rate": 7.769407013319871e-08, + "loss": 0.0004, + "step": 31545 + }, + { + "epoch": 0.61, + "learning_rate": 7.769018678886257e-08, + "loss": 0.0004, + "step": 31546 + }, + { + "epoch": 0.61, + "learning_rate": 7.768630344452642e-08, + "loss": 0.0006, + "step": 31547 + }, + { + "epoch": 0.61, + "learning_rate": 7.768242010019028e-08, + "loss": 0.0005, + "step": 31548 + }, + { + "epoch": 0.61, + "learning_rate": 7.767853675585414e-08, + "loss": 0.0005, + "step": 31549 + }, + { + "epoch": 0.61, + "learning_rate": 7.7674653411518e-08, + "loss": 0.0347, + "step": 31550 + }, + { + "epoch": 0.61, + "learning_rate": 7.767077006718186e-08, + "loss": 0.0004, + "step": 31551 + }, + { + "epoch": 0.61, + "learning_rate": 7.766688672284571e-08, + "loss": 0.0006, + "step": 31552 + }, + { + "epoch": 0.61, + "learning_rate": 7.766300337850957e-08, + "loss": 0.0005, + "step": 31553 + }, + { + "epoch": 0.61, + "learning_rate": 7.765912003417343e-08, + "loss": 0.0004, + "step": 31554 + }, + { + "epoch": 0.61, + "learning_rate": 7.765523668983729e-08, + "loss": 0.0006, + "step": 31555 + }, + { + "epoch": 0.61, + "learning_rate": 7.765135334550115e-08, + "loss": 0.0017, + "step": 31556 + }, + { + "epoch": 0.61, + "learning_rate": 7.7647470001165e-08, + "loss": 0.0005, + "step": 31557 + }, + { + "epoch": 0.61, + "learning_rate": 7.764358665682885e-08, + "loss": 0.0005, + "step": 31558 + }, + { + "epoch": 0.61, + "learning_rate": 7.763970331249271e-08, + "loss": 0.0003, + "step": 31559 + }, + { + "epoch": 0.61, + "learning_rate": 7.763581996815657e-08, + "loss": 0.0004, + "step": 31560 + }, + { + "epoch": 0.61, + "learning_rate": 7.763193662382043e-08, + "loss": 0.0006, + "step": 31561 + }, + { + "epoch": 0.61, + "learning_rate": 7.762805327948428e-08, + "loss": 0.0918, + "step": 31562 + }, + { + "epoch": 0.61, + "learning_rate": 7.762416993514814e-08, + "loss": 0.0038, + "step": 31563 + }, + { + "epoch": 0.61, + "learning_rate": 7.7620286590812e-08, + "loss": 0.0016, + "step": 31564 + }, + { + "epoch": 0.61, + "learning_rate": 7.761640324647586e-08, + "loss": 0.0007, + "step": 31565 + }, + { + "epoch": 0.61, + "learning_rate": 7.761251990213972e-08, + "loss": 0.0003, + "step": 31566 + }, + { + "epoch": 0.61, + "learning_rate": 7.760863655780358e-08, + "loss": 0.0004, + "step": 31567 + }, + { + "epoch": 0.61, + "learning_rate": 7.760475321346743e-08, + "loss": 0.8729, + "step": 31568 + }, + { + "epoch": 0.61, + "learning_rate": 7.760086986913129e-08, + "loss": 0.0003, + "step": 31569 + }, + { + "epoch": 0.61, + "learning_rate": 7.759698652479515e-08, + "loss": 0.0005, + "step": 31570 + }, + { + "epoch": 0.61, + "learning_rate": 7.759310318045901e-08, + "loss": 0.0006, + "step": 31571 + }, + { + "epoch": 0.61, + "learning_rate": 7.758921983612287e-08, + "loss": 1.2331, + "step": 31572 + }, + { + "epoch": 0.61, + "learning_rate": 7.758533649178672e-08, + "loss": 0.0004, + "step": 31573 + }, + { + "epoch": 0.61, + "learning_rate": 7.758145314745058e-08, + "loss": 0.0007, + "step": 31574 + }, + { + "epoch": 0.61, + "learning_rate": 7.757756980311444e-08, + "loss": 0.0055, + "step": 31575 + }, + { + "epoch": 0.61, + "learning_rate": 7.75736864587783e-08, + "loss": 0.0005, + "step": 31576 + }, + { + "epoch": 0.61, + "learning_rate": 7.756980311444216e-08, + "loss": 0.0013, + "step": 31577 + }, + { + "epoch": 0.61, + "learning_rate": 7.756591977010602e-08, + "loss": 0.0005, + "step": 31578 + }, + { + "epoch": 0.61, + "learning_rate": 7.756203642576987e-08, + "loss": 0.0004, + "step": 31579 + }, + { + "epoch": 0.61, + "learning_rate": 7.755815308143373e-08, + "loss": 0.0003, + "step": 31580 + }, + { + "epoch": 0.61, + "learning_rate": 7.755426973709759e-08, + "loss": 0.0011, + "step": 31581 + }, + { + "epoch": 0.61, + "learning_rate": 7.755038639276145e-08, + "loss": 1.2404, + "step": 31582 + }, + { + "epoch": 0.61, + "learning_rate": 7.754650304842531e-08, + "loss": 0.0004, + "step": 31583 + }, + { + "epoch": 0.61, + "learning_rate": 7.754261970408917e-08, + "loss": 0.0005, + "step": 31584 + }, + { + "epoch": 0.61, + "learning_rate": 7.753873635975302e-08, + "loss": 0.1116, + "step": 31585 + }, + { + "epoch": 0.61, + "learning_rate": 7.753485301541688e-08, + "loss": 0.0004, + "step": 31586 + }, + { + "epoch": 0.61, + "learning_rate": 7.753096967108073e-08, + "loss": 0.0003, + "step": 31587 + }, + { + "epoch": 0.61, + "learning_rate": 7.752708632674458e-08, + "loss": 0.0004, + "step": 31588 + }, + { + "epoch": 0.61, + "learning_rate": 7.752320298240844e-08, + "loss": 0.0005, + "step": 31589 + }, + { + "epoch": 0.61, + "learning_rate": 7.75193196380723e-08, + "loss": 0.0005, + "step": 31590 + }, + { + "epoch": 0.61, + "learning_rate": 7.751543629373616e-08, + "loss": 0.0004, + "step": 31591 + }, + { + "epoch": 0.61, + "learning_rate": 7.751155294940002e-08, + "loss": 0.0147, + "step": 31592 + }, + { + "epoch": 0.61, + "learning_rate": 7.750766960506388e-08, + "loss": 0.0362, + "step": 31593 + }, + { + "epoch": 0.61, + "learning_rate": 7.750378626072773e-08, + "loss": 0.0004, + "step": 31594 + }, + { + "epoch": 0.61, + "learning_rate": 7.749990291639159e-08, + "loss": 0.0005, + "step": 31595 + }, + { + "epoch": 0.61, + "learning_rate": 7.749601957205545e-08, + "loss": 0.6254, + "step": 31596 + }, + { + "epoch": 0.61, + "learning_rate": 7.749213622771931e-08, + "loss": 0.0006, + "step": 31597 + }, + { + "epoch": 0.61, + "learning_rate": 7.748825288338317e-08, + "loss": 0.0005, + "step": 31598 + }, + { + "epoch": 0.61, + "learning_rate": 7.748436953904703e-08, + "loss": 0.0005, + "step": 31599 + }, + { + "epoch": 0.61, + "learning_rate": 7.748048619471088e-08, + "loss": 0.0012, + "step": 31600 + }, + { + "epoch": 0.61, + "learning_rate": 7.747660285037474e-08, + "loss": 0.0011, + "step": 31601 + }, + { + "epoch": 0.61, + "learning_rate": 7.74727195060386e-08, + "loss": 0.0006, + "step": 31602 + }, + { + "epoch": 0.61, + "learning_rate": 7.746883616170246e-08, + "loss": 0.0008, + "step": 31603 + }, + { + "epoch": 0.61, + "learning_rate": 7.746495281736632e-08, + "loss": 0.0005, + "step": 31604 + }, + { + "epoch": 0.61, + "learning_rate": 7.746106947303018e-08, + "loss": 0.0003, + "step": 31605 + }, + { + "epoch": 0.61, + "learning_rate": 7.745718612869403e-08, + "loss": 0.0004, + "step": 31606 + }, + { + "epoch": 0.61, + "learning_rate": 7.745330278435789e-08, + "loss": 0.0005, + "step": 31607 + }, + { + "epoch": 0.61, + "learning_rate": 7.744941944002175e-08, + "loss": 0.0004, + "step": 31608 + }, + { + "epoch": 0.61, + "learning_rate": 7.744553609568561e-08, + "loss": 0.0004, + "step": 31609 + }, + { + "epoch": 0.61, + "learning_rate": 7.744165275134947e-08, + "loss": 0.0004, + "step": 31610 + }, + { + "epoch": 0.61, + "learning_rate": 7.743776940701332e-08, + "loss": 0.0016, + "step": 31611 + }, + { + "epoch": 0.61, + "learning_rate": 7.743388606267718e-08, + "loss": 0.0005, + "step": 31612 + }, + { + "epoch": 0.61, + "learning_rate": 7.743000271834104e-08, + "loss": 0.0004, + "step": 31613 + }, + { + "epoch": 0.61, + "learning_rate": 7.74261193740049e-08, + "loss": 0.0005, + "step": 31614 + }, + { + "epoch": 0.61, + "learning_rate": 7.742223602966876e-08, + "loss": 0.0004, + "step": 31615 + }, + { + "epoch": 0.61, + "learning_rate": 7.74183526853326e-08, + "loss": 0.0112, + "step": 31616 + }, + { + "epoch": 0.61, + "learning_rate": 7.741446934099646e-08, + "loss": 0.0005, + "step": 31617 + }, + { + "epoch": 0.61, + "learning_rate": 7.741058599666032e-08, + "loss": 0.0009, + "step": 31618 + }, + { + "epoch": 0.61, + "learning_rate": 7.740670265232418e-08, + "loss": 0.0006, + "step": 31619 + }, + { + "epoch": 0.61, + "learning_rate": 7.740281930798804e-08, + "loss": 1.2584, + "step": 31620 + }, + { + "epoch": 0.61, + "learning_rate": 7.73989359636519e-08, + "loss": 0.0021, + "step": 31621 + }, + { + "epoch": 0.61, + "learning_rate": 7.739505261931575e-08, + "loss": 0.0005, + "step": 31622 + }, + { + "epoch": 0.61, + "learning_rate": 7.739116927497961e-08, + "loss": 0.0005, + "step": 31623 + }, + { + "epoch": 0.61, + "learning_rate": 7.738728593064347e-08, + "loss": 0.0481, + "step": 31624 + }, + { + "epoch": 0.61, + "learning_rate": 7.738340258630733e-08, + "loss": 0.0007, + "step": 31625 + }, + { + "epoch": 0.61, + "learning_rate": 7.737951924197118e-08, + "loss": 0.0004, + "step": 31626 + }, + { + "epoch": 0.61, + "learning_rate": 7.737563589763504e-08, + "loss": 0.0005, + "step": 31627 + }, + { + "epoch": 0.61, + "learning_rate": 7.73717525532989e-08, + "loss": 0.0005, + "step": 31628 + }, + { + "epoch": 0.61, + "learning_rate": 7.736786920896276e-08, + "loss": 0.0008, + "step": 31629 + }, + { + "epoch": 0.61, + "learning_rate": 7.736398586462662e-08, + "loss": 0.0005, + "step": 31630 + }, + { + "epoch": 0.61, + "learning_rate": 7.736010252029048e-08, + "loss": 0.006, + "step": 31631 + }, + { + "epoch": 0.61, + "learning_rate": 7.735621917595433e-08, + "loss": 0.0007, + "step": 31632 + }, + { + "epoch": 0.61, + "learning_rate": 7.735233583161819e-08, + "loss": 0.0005, + "step": 31633 + }, + { + "epoch": 0.61, + "learning_rate": 7.734845248728205e-08, + "loss": 0.0008, + "step": 31634 + }, + { + "epoch": 0.61, + "learning_rate": 7.734456914294591e-08, + "loss": 1.2805, + "step": 31635 + }, + { + "epoch": 0.61, + "learning_rate": 7.734068579860977e-08, + "loss": 0.0005, + "step": 31636 + }, + { + "epoch": 0.61, + "learning_rate": 7.733680245427363e-08, + "loss": 0.0005, + "step": 31637 + }, + { + "epoch": 0.61, + "learning_rate": 7.733291910993748e-08, + "loss": 0.0006, + "step": 31638 + }, + { + "epoch": 0.61, + "learning_rate": 7.732903576560134e-08, + "loss": 1.2029, + "step": 31639 + }, + { + "epoch": 0.61, + "learning_rate": 7.73251524212652e-08, + "loss": 0.0006, + "step": 31640 + }, + { + "epoch": 0.61, + "learning_rate": 7.732126907692906e-08, + "loss": 0.9079, + "step": 31641 + }, + { + "epoch": 0.61, + "learning_rate": 7.73173857325929e-08, + "loss": 0.0013, + "step": 31642 + }, + { + "epoch": 0.61, + "learning_rate": 7.731350238825676e-08, + "loss": 0.0005, + "step": 31643 + }, + { + "epoch": 0.61, + "learning_rate": 7.730961904392062e-08, + "loss": 0.0005, + "step": 31644 + }, + { + "epoch": 0.61, + "learning_rate": 7.730573569958448e-08, + "loss": 0.0175, + "step": 31645 + }, + { + "epoch": 0.61, + "learning_rate": 7.730185235524834e-08, + "loss": 0.0005, + "step": 31646 + }, + { + "epoch": 0.61, + "learning_rate": 7.72979690109122e-08, + "loss": 0.0004, + "step": 31647 + }, + { + "epoch": 0.61, + "learning_rate": 7.729408566657605e-08, + "loss": 0.0005, + "step": 31648 + }, + { + "epoch": 0.61, + "learning_rate": 7.729020232223991e-08, + "loss": 0.0004, + "step": 31649 + }, + { + "epoch": 0.61, + "learning_rate": 7.728631897790377e-08, + "loss": 0.0004, + "step": 31650 + }, + { + "epoch": 0.61, + "learning_rate": 7.728243563356763e-08, + "loss": 0.8539, + "step": 31651 + }, + { + "epoch": 0.61, + "learning_rate": 7.727855228923149e-08, + "loss": 0.0007, + "step": 31652 + }, + { + "epoch": 0.61, + "learning_rate": 7.727466894489534e-08, + "loss": 0.0005, + "step": 31653 + }, + { + "epoch": 0.61, + "learning_rate": 7.72707856005592e-08, + "loss": 0.0004, + "step": 31654 + }, + { + "epoch": 0.61, + "learning_rate": 7.726690225622306e-08, + "loss": 0.0027, + "step": 31655 + }, + { + "epoch": 0.61, + "learning_rate": 7.726301891188692e-08, + "loss": 0.0005, + "step": 31656 + }, + { + "epoch": 0.61, + "learning_rate": 7.725913556755076e-08, + "loss": 0.0004, + "step": 31657 + }, + { + "epoch": 0.61, + "learning_rate": 7.725525222321462e-08, + "loss": 0.0731, + "step": 31658 + }, + { + "epoch": 0.61, + "learning_rate": 7.725136887887848e-08, + "loss": 0.1065, + "step": 31659 + }, + { + "epoch": 0.61, + "learning_rate": 7.724748553454234e-08, + "loss": 0.0004, + "step": 31660 + }, + { + "epoch": 0.61, + "learning_rate": 7.72436021902062e-08, + "loss": 0.0006, + "step": 31661 + }, + { + "epoch": 0.61, + "learning_rate": 7.723971884587006e-08, + "loss": 1.0594, + "step": 31662 + }, + { + "epoch": 0.61, + "learning_rate": 7.723583550153391e-08, + "loss": 0.0005, + "step": 31663 + }, + { + "epoch": 0.61, + "learning_rate": 7.723195215719777e-08, + "loss": 0.002, + "step": 31664 + }, + { + "epoch": 0.61, + "learning_rate": 7.722806881286163e-08, + "loss": 0.0005, + "step": 31665 + }, + { + "epoch": 0.61, + "learning_rate": 7.722418546852549e-08, + "loss": 0.0004, + "step": 31666 + }, + { + "epoch": 0.61, + "learning_rate": 7.722030212418935e-08, + "loss": 0.0004, + "step": 31667 + }, + { + "epoch": 0.61, + "learning_rate": 7.72164187798532e-08, + "loss": 0.0004, + "step": 31668 + }, + { + "epoch": 0.61, + "learning_rate": 7.721253543551706e-08, + "loss": 0.0005, + "step": 31669 + }, + { + "epoch": 0.61, + "learning_rate": 7.720865209118092e-08, + "loss": 0.0005, + "step": 31670 + }, + { + "epoch": 0.61, + "learning_rate": 7.720476874684478e-08, + "loss": 0.0006, + "step": 31671 + }, + { + "epoch": 0.61, + "learning_rate": 7.720088540250864e-08, + "loss": 0.0004, + "step": 31672 + }, + { + "epoch": 0.61, + "learning_rate": 7.71970020581725e-08, + "loss": 0.0004, + "step": 31673 + }, + { + "epoch": 0.61, + "learning_rate": 7.719311871383634e-08, + "loss": 0.0004, + "step": 31674 + }, + { + "epoch": 0.61, + "learning_rate": 7.71892353695002e-08, + "loss": 0.0021, + "step": 31675 + }, + { + "epoch": 0.61, + "learning_rate": 7.718535202516406e-08, + "loss": 0.0007, + "step": 31676 + }, + { + "epoch": 0.61, + "learning_rate": 7.718146868082792e-08, + "loss": 0.0007, + "step": 31677 + }, + { + "epoch": 0.61, + "learning_rate": 7.717758533649177e-08, + "loss": 0.1159, + "step": 31678 + }, + { + "epoch": 0.61, + "learning_rate": 7.717370199215563e-08, + "loss": 0.0007, + "step": 31679 + }, + { + "epoch": 0.61, + "learning_rate": 7.716981864781949e-08, + "loss": 0.0003, + "step": 31680 + }, + { + "epoch": 0.61, + "learning_rate": 7.716593530348335e-08, + "loss": 0.0004, + "step": 31681 + }, + { + "epoch": 0.61, + "learning_rate": 7.716205195914721e-08, + "loss": 0.0005, + "step": 31682 + }, + { + "epoch": 0.61, + "learning_rate": 7.715816861481107e-08, + "loss": 0.0005, + "step": 31683 + }, + { + "epoch": 0.61, + "learning_rate": 7.715428527047492e-08, + "loss": 0.4677, + "step": 31684 + }, + { + "epoch": 0.61, + "learning_rate": 7.715040192613878e-08, + "loss": 0.0004, + "step": 31685 + }, + { + "epoch": 0.61, + "learning_rate": 7.714651858180264e-08, + "loss": 0.0004, + "step": 31686 + }, + { + "epoch": 0.61, + "learning_rate": 7.71426352374665e-08, + "loss": 1.343, + "step": 31687 + }, + { + "epoch": 0.61, + "learning_rate": 7.713875189313036e-08, + "loss": 0.0006, + "step": 31688 + }, + { + "epoch": 0.61, + "learning_rate": 7.713486854879421e-08, + "loss": 0.0004, + "step": 31689 + }, + { + "epoch": 0.61, + "learning_rate": 7.713098520445807e-08, + "loss": 0.1779, + "step": 31690 + }, + { + "epoch": 0.61, + "learning_rate": 7.712710186012193e-08, + "loss": 0.0005, + "step": 31691 + }, + { + "epoch": 0.61, + "learning_rate": 7.712321851578579e-08, + "loss": 0.0006, + "step": 31692 + }, + { + "epoch": 0.61, + "learning_rate": 7.711933517144965e-08, + "loss": 0.0005, + "step": 31693 + }, + { + "epoch": 0.61, + "learning_rate": 7.71154518271135e-08, + "loss": 0.0004, + "step": 31694 + }, + { + "epoch": 0.61, + "learning_rate": 7.711156848277736e-08, + "loss": 0.0007, + "step": 31695 + }, + { + "epoch": 0.61, + "learning_rate": 7.710768513844122e-08, + "loss": 0.0005, + "step": 31696 + }, + { + "epoch": 0.61, + "learning_rate": 7.710380179410508e-08, + "loss": 0.0005, + "step": 31697 + }, + { + "epoch": 0.61, + "learning_rate": 7.709991844976894e-08, + "loss": 0.0007, + "step": 31698 + }, + { + "epoch": 0.61, + "learning_rate": 7.70960351054328e-08, + "loss": 0.0003, + "step": 31699 + }, + { + "epoch": 0.61, + "learning_rate": 7.709215176109666e-08, + "loss": 0.0005, + "step": 31700 + }, + { + "epoch": 0.61, + "learning_rate": 7.708826841676051e-08, + "loss": 0.0004, + "step": 31701 + }, + { + "epoch": 0.61, + "learning_rate": 7.708438507242437e-08, + "loss": 0.0004, + "step": 31702 + }, + { + "epoch": 0.61, + "learning_rate": 7.708050172808822e-08, + "loss": 0.0005, + "step": 31703 + }, + { + "epoch": 0.61, + "learning_rate": 7.707661838375208e-08, + "loss": 0.1461, + "step": 31704 + }, + { + "epoch": 0.62, + "learning_rate": 7.707273503941593e-08, + "loss": 0.0004, + "step": 31705 + }, + { + "epoch": 0.62, + "learning_rate": 7.706885169507979e-08, + "loss": 0.0005, + "step": 31706 + }, + { + "epoch": 0.62, + "learning_rate": 7.706496835074365e-08, + "loss": 0.0009, + "step": 31707 + }, + { + "epoch": 0.62, + "learning_rate": 7.706108500640751e-08, + "loss": 0.0018, + "step": 31708 + }, + { + "epoch": 0.62, + "learning_rate": 7.705720166207137e-08, + "loss": 0.0004, + "step": 31709 + }, + { + "epoch": 0.62, + "learning_rate": 7.705331831773522e-08, + "loss": 0.0038, + "step": 31710 + }, + { + "epoch": 0.62, + "learning_rate": 7.704943497339908e-08, + "loss": 0.0007, + "step": 31711 + }, + { + "epoch": 0.62, + "learning_rate": 7.704555162906294e-08, + "loss": 0.0005, + "step": 31712 + }, + { + "epoch": 0.62, + "learning_rate": 7.70416682847268e-08, + "loss": 0.0006, + "step": 31713 + }, + { + "epoch": 0.62, + "learning_rate": 7.703778494039066e-08, + "loss": 0.0005, + "step": 31714 + }, + { + "epoch": 0.62, + "learning_rate": 7.703390159605452e-08, + "loss": 0.0006, + "step": 31715 + }, + { + "epoch": 0.62, + "learning_rate": 7.703001825171837e-08, + "loss": 0.0006, + "step": 31716 + }, + { + "epoch": 0.62, + "learning_rate": 7.702613490738223e-08, + "loss": 0.0004, + "step": 31717 + }, + { + "epoch": 0.62, + "learning_rate": 7.702225156304609e-08, + "loss": 0.2606, + "step": 31718 + }, + { + "epoch": 0.62, + "learning_rate": 7.701836821870995e-08, + "loss": 0.0004, + "step": 31719 + }, + { + "epoch": 0.62, + "learning_rate": 7.701448487437381e-08, + "loss": 0.0003, + "step": 31720 + }, + { + "epoch": 0.62, + "learning_rate": 7.701060153003767e-08, + "loss": 0.0005, + "step": 31721 + }, + { + "epoch": 0.62, + "learning_rate": 7.700671818570152e-08, + "loss": 0.0005, + "step": 31722 + }, + { + "epoch": 0.62, + "learning_rate": 7.700283484136538e-08, + "loss": 0.0385, + "step": 31723 + }, + { + "epoch": 0.62, + "learning_rate": 7.699895149702924e-08, + "loss": 0.0037, + "step": 31724 + }, + { + "epoch": 0.62, + "learning_rate": 7.69950681526931e-08, + "loss": 1.138, + "step": 31725 + }, + { + "epoch": 0.62, + "learning_rate": 7.699118480835696e-08, + "loss": 0.0006, + "step": 31726 + }, + { + "epoch": 0.62, + "learning_rate": 7.698730146402081e-08, + "loss": 0.0007, + "step": 31727 + }, + { + "epoch": 0.62, + "learning_rate": 7.698341811968467e-08, + "loss": 1.2249, + "step": 31728 + }, + { + "epoch": 0.62, + "learning_rate": 7.697953477534853e-08, + "loss": 0.0005, + "step": 31729 + }, + { + "epoch": 0.62, + "learning_rate": 7.697565143101239e-08, + "loss": 0.0004, + "step": 31730 + }, + { + "epoch": 0.62, + "learning_rate": 7.697176808667625e-08, + "loss": 0.0004, + "step": 31731 + }, + { + "epoch": 0.62, + "learning_rate": 7.696788474234009e-08, + "loss": 0.0004, + "step": 31732 + }, + { + "epoch": 0.62, + "learning_rate": 7.696400139800395e-08, + "loss": 0.0007, + "step": 31733 + }, + { + "epoch": 0.62, + "learning_rate": 7.696011805366781e-08, + "loss": 0.0005, + "step": 31734 + }, + { + "epoch": 0.62, + "learning_rate": 7.695623470933167e-08, + "loss": 0.0007, + "step": 31735 + }, + { + "epoch": 0.62, + "learning_rate": 7.695235136499553e-08, + "loss": 0.0006, + "step": 31736 + }, + { + "epoch": 0.62, + "learning_rate": 7.694846802065938e-08, + "loss": 0.0005, + "step": 31737 + }, + { + "epoch": 0.62, + "learning_rate": 7.694458467632324e-08, + "loss": 0.0004, + "step": 31738 + }, + { + "epoch": 0.62, + "learning_rate": 7.69407013319871e-08, + "loss": 0.0006, + "step": 31739 + }, + { + "epoch": 0.62, + "learning_rate": 7.693681798765096e-08, + "loss": 0.0006, + "step": 31740 + }, + { + "epoch": 0.62, + "learning_rate": 7.693293464331482e-08, + "loss": 0.0012, + "step": 31741 + }, + { + "epoch": 0.62, + "learning_rate": 7.692905129897868e-08, + "loss": 0.0005, + "step": 31742 + }, + { + "epoch": 0.62, + "learning_rate": 7.692516795464253e-08, + "loss": 1.1713, + "step": 31743 + }, + { + "epoch": 0.62, + "learning_rate": 7.692128461030639e-08, + "loss": 0.0004, + "step": 31744 + }, + { + "epoch": 0.62, + "learning_rate": 7.691740126597025e-08, + "loss": 0.0006, + "step": 31745 + }, + { + "epoch": 0.62, + "learning_rate": 7.691351792163411e-08, + "loss": 0.0006, + "step": 31746 + }, + { + "epoch": 0.62, + "learning_rate": 7.690963457729797e-08, + "loss": 0.0003, + "step": 31747 + }, + { + "epoch": 0.62, + "learning_rate": 7.690575123296182e-08, + "loss": 0.8294, + "step": 31748 + }, + { + "epoch": 0.62, + "learning_rate": 7.690186788862568e-08, + "loss": 0.0009, + "step": 31749 + }, + { + "epoch": 0.62, + "learning_rate": 7.689798454428954e-08, + "loss": 0.0004, + "step": 31750 + }, + { + "epoch": 0.62, + "learning_rate": 7.68941011999534e-08, + "loss": 0.0005, + "step": 31751 + }, + { + "epoch": 0.62, + "learning_rate": 7.689021785561726e-08, + "loss": 0.0006, + "step": 31752 + }, + { + "epoch": 0.62, + "learning_rate": 7.688633451128112e-08, + "loss": 0.1957, + "step": 31753 + }, + { + "epoch": 0.62, + "learning_rate": 7.688245116694497e-08, + "loss": 0.0004, + "step": 31754 + }, + { + "epoch": 0.62, + "learning_rate": 7.687856782260883e-08, + "loss": 0.0005, + "step": 31755 + }, + { + "epoch": 0.62, + "learning_rate": 7.687468447827269e-08, + "loss": 0.0004, + "step": 31756 + }, + { + "epoch": 0.62, + "learning_rate": 7.687080113393655e-08, + "loss": 0.0004, + "step": 31757 + }, + { + "epoch": 0.62, + "learning_rate": 7.686691778960041e-08, + "loss": 0.0014, + "step": 31758 + }, + { + "epoch": 0.62, + "learning_rate": 7.686303444526427e-08, + "loss": 0.0007, + "step": 31759 + }, + { + "epoch": 0.62, + "learning_rate": 7.685915110092812e-08, + "loss": 0.3172, + "step": 31760 + }, + { + "epoch": 0.62, + "learning_rate": 7.685526775659197e-08, + "loss": 0.0005, + "step": 31761 + }, + { + "epoch": 0.62, + "learning_rate": 7.685138441225583e-08, + "loss": 0.0003, + "step": 31762 + }, + { + "epoch": 0.62, + "learning_rate": 7.684750106791969e-08, + "loss": 0.0006, + "step": 31763 + }, + { + "epoch": 0.62, + "learning_rate": 7.684361772358354e-08, + "loss": 0.0005, + "step": 31764 + }, + { + "epoch": 0.62, + "learning_rate": 7.68397343792474e-08, + "loss": 0.0004, + "step": 31765 + }, + { + "epoch": 0.62, + "learning_rate": 7.683585103491126e-08, + "loss": 0.0006, + "step": 31766 + }, + { + "epoch": 0.62, + "learning_rate": 7.683196769057512e-08, + "loss": 0.0006, + "step": 31767 + }, + { + "epoch": 0.62, + "learning_rate": 7.682808434623898e-08, + "loss": 0.7322, + "step": 31768 + }, + { + "epoch": 0.62, + "learning_rate": 7.682420100190283e-08, + "loss": 0.0094, + "step": 31769 + }, + { + "epoch": 0.62, + "learning_rate": 7.682031765756669e-08, + "loss": 0.0004, + "step": 31770 + }, + { + "epoch": 0.62, + "learning_rate": 7.681643431323055e-08, + "loss": 0.0004, + "step": 31771 + }, + { + "epoch": 0.62, + "learning_rate": 7.681255096889441e-08, + "loss": 0.0005, + "step": 31772 + }, + { + "epoch": 0.62, + "learning_rate": 7.680866762455827e-08, + "loss": 0.4974, + "step": 31773 + }, + { + "epoch": 0.62, + "learning_rate": 7.680478428022213e-08, + "loss": 0.0004, + "step": 31774 + }, + { + "epoch": 0.62, + "learning_rate": 7.680090093588598e-08, + "loss": 0.0004, + "step": 31775 + }, + { + "epoch": 0.62, + "learning_rate": 7.679701759154984e-08, + "loss": 0.0004, + "step": 31776 + }, + { + "epoch": 0.62, + "learning_rate": 7.67931342472137e-08, + "loss": 0.0004, + "step": 31777 + }, + { + "epoch": 0.62, + "learning_rate": 7.678925090287756e-08, + "loss": 0.0006, + "step": 31778 + }, + { + "epoch": 0.62, + "learning_rate": 7.678536755854142e-08, + "loss": 0.0004, + "step": 31779 + }, + { + "epoch": 0.62, + "learning_rate": 7.678148421420528e-08, + "loss": 0.0008, + "step": 31780 + }, + { + "epoch": 0.62, + "learning_rate": 7.677760086986913e-08, + "loss": 0.0004, + "step": 31781 + }, + { + "epoch": 0.62, + "learning_rate": 7.677371752553299e-08, + "loss": 0.0006, + "step": 31782 + }, + { + "epoch": 0.62, + "learning_rate": 7.676983418119685e-08, + "loss": 0.0003, + "step": 31783 + }, + { + "epoch": 0.62, + "learning_rate": 7.676595083686071e-08, + "loss": 0.0005, + "step": 31784 + }, + { + "epoch": 0.62, + "learning_rate": 7.676206749252457e-08, + "loss": 0.0006, + "step": 31785 + }, + { + "epoch": 0.62, + "learning_rate": 7.675818414818842e-08, + "loss": 0.0005, + "step": 31786 + }, + { + "epoch": 0.62, + "learning_rate": 7.675430080385228e-08, + "loss": 0.0006, + "step": 31787 + }, + { + "epoch": 0.62, + "learning_rate": 7.675041745951614e-08, + "loss": 0.0007, + "step": 31788 + }, + { + "epoch": 0.62, + "learning_rate": 7.674653411518e-08, + "loss": 0.0004, + "step": 31789 + }, + { + "epoch": 0.62, + "learning_rate": 7.674265077084384e-08, + "loss": 0.0003, + "step": 31790 + }, + { + "epoch": 0.62, + "learning_rate": 7.67387674265077e-08, + "loss": 0.0007, + "step": 31791 + }, + { + "epoch": 0.62, + "learning_rate": 7.673488408217156e-08, + "loss": 0.0007, + "step": 31792 + }, + { + "epoch": 0.62, + "learning_rate": 7.673100073783542e-08, + "loss": 0.0006, + "step": 31793 + }, + { + "epoch": 0.62, + "learning_rate": 7.672711739349928e-08, + "loss": 0.0005, + "step": 31794 + }, + { + "epoch": 0.62, + "learning_rate": 7.672323404916314e-08, + "loss": 0.0007, + "step": 31795 + }, + { + "epoch": 0.62, + "learning_rate": 7.6719350704827e-08, + "loss": 0.0004, + "step": 31796 + }, + { + "epoch": 0.62, + "learning_rate": 7.671546736049085e-08, + "loss": 0.8131, + "step": 31797 + }, + { + "epoch": 0.62, + "learning_rate": 7.671158401615471e-08, + "loss": 0.0006, + "step": 31798 + }, + { + "epoch": 0.62, + "learning_rate": 7.670770067181857e-08, + "loss": 0.0005, + "step": 31799 + }, + { + "epoch": 0.62, + "learning_rate": 7.670381732748243e-08, + "loss": 0.0025, + "step": 31800 + }, + { + "epoch": 0.62, + "learning_rate": 7.669993398314629e-08, + "loss": 0.0006, + "step": 31801 + }, + { + "epoch": 0.62, + "learning_rate": 7.669605063881014e-08, + "loss": 0.0004, + "step": 31802 + }, + { + "epoch": 0.62, + "learning_rate": 7.6692167294474e-08, + "loss": 0.0004, + "step": 31803 + }, + { + "epoch": 0.62, + "learning_rate": 7.668828395013786e-08, + "loss": 0.0003, + "step": 31804 + }, + { + "epoch": 0.62, + "learning_rate": 7.668440060580172e-08, + "loss": 0.0019, + "step": 31805 + }, + { + "epoch": 0.62, + "learning_rate": 7.668051726146558e-08, + "loss": 0.0003, + "step": 31806 + }, + { + "epoch": 0.62, + "learning_rate": 7.667663391712943e-08, + "loss": 0.0005, + "step": 31807 + }, + { + "epoch": 0.62, + "learning_rate": 7.667275057279329e-08, + "loss": 1.0335, + "step": 31808 + }, + { + "epoch": 0.62, + "learning_rate": 7.666886722845715e-08, + "loss": 0.0005, + "step": 31809 + }, + { + "epoch": 0.62, + "learning_rate": 7.666498388412101e-08, + "loss": 0.0056, + "step": 31810 + }, + { + "epoch": 0.62, + "learning_rate": 7.666110053978487e-08, + "loss": 0.0007, + "step": 31811 + }, + { + "epoch": 0.62, + "learning_rate": 7.665721719544873e-08, + "loss": 0.0005, + "step": 31812 + }, + { + "epoch": 0.62, + "learning_rate": 7.665333385111258e-08, + "loss": 0.0005, + "step": 31813 + }, + { + "epoch": 0.62, + "learning_rate": 7.664945050677644e-08, + "loss": 0.0004, + "step": 31814 + }, + { + "epoch": 0.62, + "learning_rate": 7.66455671624403e-08, + "loss": 0.0006, + "step": 31815 + }, + { + "epoch": 0.62, + "learning_rate": 7.664168381810416e-08, + "loss": 0.0007, + "step": 31816 + }, + { + "epoch": 0.62, + "learning_rate": 7.663780047376802e-08, + "loss": 0.6388, + "step": 31817 + }, + { + "epoch": 0.62, + "learning_rate": 7.663391712943188e-08, + "loss": 0.0004, + "step": 31818 + }, + { + "epoch": 0.62, + "learning_rate": 7.663003378509572e-08, + "loss": 0.0004, + "step": 31819 + }, + { + "epoch": 0.62, + "learning_rate": 7.662615044075958e-08, + "loss": 0.7596, + "step": 31820 + }, + { + "epoch": 0.62, + "learning_rate": 7.662226709642344e-08, + "loss": 0.0006, + "step": 31821 + }, + { + "epoch": 0.62, + "learning_rate": 7.66183837520873e-08, + "loss": 0.0003, + "step": 31822 + }, + { + "epoch": 0.62, + "learning_rate": 7.661450040775115e-08, + "loss": 0.0006, + "step": 31823 + }, + { + "epoch": 0.62, + "learning_rate": 7.661061706341501e-08, + "loss": 0.0004, + "step": 31824 + }, + { + "epoch": 0.62, + "learning_rate": 7.660673371907887e-08, + "loss": 0.0005, + "step": 31825 + }, + { + "epoch": 0.62, + "learning_rate": 7.660285037474273e-08, + "loss": 0.0005, + "step": 31826 + }, + { + "epoch": 0.62, + "learning_rate": 7.659896703040659e-08, + "loss": 0.0004, + "step": 31827 + }, + { + "epoch": 0.62, + "learning_rate": 7.659508368607044e-08, + "loss": 0.0005, + "step": 31828 + }, + { + "epoch": 0.62, + "learning_rate": 7.65912003417343e-08, + "loss": 0.0005, + "step": 31829 + }, + { + "epoch": 0.62, + "learning_rate": 7.658731699739816e-08, + "loss": 0.0005, + "step": 31830 + }, + { + "epoch": 0.62, + "learning_rate": 7.658343365306202e-08, + "loss": 0.0004, + "step": 31831 + }, + { + "epoch": 0.62, + "learning_rate": 7.657955030872588e-08, + "loss": 0.0099, + "step": 31832 + }, + { + "epoch": 0.62, + "learning_rate": 7.657566696438974e-08, + "loss": 0.0276, + "step": 31833 + }, + { + "epoch": 0.62, + "learning_rate": 7.657178362005358e-08, + "loss": 0.0003, + "step": 31834 + }, + { + "epoch": 0.62, + "learning_rate": 7.656790027571744e-08, + "loss": 0.0004, + "step": 31835 + }, + { + "epoch": 0.62, + "learning_rate": 7.65640169313813e-08, + "loss": 0.0059, + "step": 31836 + }, + { + "epoch": 0.62, + "learning_rate": 7.656013358704516e-08, + "loss": 0.0005, + "step": 31837 + }, + { + "epoch": 0.62, + "learning_rate": 7.655625024270901e-08, + "loss": 0.0005, + "step": 31838 + }, + { + "epoch": 0.62, + "learning_rate": 7.655236689837287e-08, + "loss": 0.0009, + "step": 31839 + }, + { + "epoch": 0.62, + "learning_rate": 7.654848355403673e-08, + "loss": 0.0007, + "step": 31840 + }, + { + "epoch": 0.62, + "learning_rate": 7.654460020970059e-08, + "loss": 0.0006, + "step": 31841 + }, + { + "epoch": 0.62, + "learning_rate": 7.654071686536445e-08, + "loss": 0.0007, + "step": 31842 + }, + { + "epoch": 0.62, + "learning_rate": 7.65368335210283e-08, + "loss": 0.0005, + "step": 31843 + }, + { + "epoch": 0.62, + "learning_rate": 7.653295017669216e-08, + "loss": 0.0005, + "step": 31844 + }, + { + "epoch": 0.62, + "learning_rate": 7.652906683235602e-08, + "loss": 0.0008, + "step": 31845 + }, + { + "epoch": 0.62, + "learning_rate": 7.652518348801988e-08, + "loss": 0.0066, + "step": 31846 + }, + { + "epoch": 0.62, + "learning_rate": 7.652130014368374e-08, + "loss": 0.0005, + "step": 31847 + }, + { + "epoch": 0.62, + "learning_rate": 7.651741679934758e-08, + "loss": 1.3307, + "step": 31848 + }, + { + "epoch": 0.62, + "learning_rate": 7.651353345501144e-08, + "loss": 0.0007, + "step": 31849 + }, + { + "epoch": 0.62, + "learning_rate": 7.65096501106753e-08, + "loss": 0.0006, + "step": 31850 + }, + { + "epoch": 0.62, + "learning_rate": 7.650576676633916e-08, + "loss": 0.0005, + "step": 31851 + }, + { + "epoch": 0.62, + "learning_rate": 7.650188342200302e-08, + "loss": 0.0005, + "step": 31852 + }, + { + "epoch": 0.62, + "learning_rate": 7.649800007766687e-08, + "loss": 0.0005, + "step": 31853 + }, + { + "epoch": 0.62, + "learning_rate": 7.649411673333073e-08, + "loss": 0.0005, + "step": 31854 + }, + { + "epoch": 0.62, + "learning_rate": 7.649023338899459e-08, + "loss": 0.0006, + "step": 31855 + }, + { + "epoch": 0.62, + "learning_rate": 7.648635004465845e-08, + "loss": 0.0005, + "step": 31856 + }, + { + "epoch": 0.62, + "learning_rate": 7.648246670032231e-08, + "loss": 0.0007, + "step": 31857 + }, + { + "epoch": 0.62, + "learning_rate": 7.647858335598617e-08, + "loss": 0.0027, + "step": 31858 + }, + { + "epoch": 0.62, + "learning_rate": 7.647470001165002e-08, + "loss": 0.0023, + "step": 31859 + }, + { + "epoch": 0.62, + "learning_rate": 7.647081666731388e-08, + "loss": 0.003, + "step": 31860 + }, + { + "epoch": 0.62, + "learning_rate": 7.646693332297774e-08, + "loss": 0.0004, + "step": 31861 + }, + { + "epoch": 0.62, + "learning_rate": 7.64630499786416e-08, + "loss": 0.0004, + "step": 31862 + }, + { + "epoch": 0.62, + "learning_rate": 7.645916663430546e-08, + "loss": 0.0004, + "step": 31863 + }, + { + "epoch": 0.62, + "learning_rate": 7.645528328996931e-08, + "loss": 0.0005, + "step": 31864 + }, + { + "epoch": 0.62, + "learning_rate": 7.645139994563317e-08, + "loss": 0.002, + "step": 31865 + }, + { + "epoch": 0.62, + "learning_rate": 7.644751660129703e-08, + "loss": 0.0004, + "step": 31866 + }, + { + "epoch": 0.62, + "learning_rate": 7.644363325696089e-08, + "loss": 0.0004, + "step": 31867 + }, + { + "epoch": 0.62, + "learning_rate": 7.643974991262475e-08, + "loss": 0.0005, + "step": 31868 + }, + { + "epoch": 0.62, + "learning_rate": 7.64358665682886e-08, + "loss": 0.0004, + "step": 31869 + }, + { + "epoch": 0.62, + "learning_rate": 7.643198322395246e-08, + "loss": 0.0008, + "step": 31870 + }, + { + "epoch": 0.62, + "learning_rate": 7.642809987961632e-08, + "loss": 0.847, + "step": 31871 + }, + { + "epoch": 0.62, + "learning_rate": 7.642421653528018e-08, + "loss": 0.1743, + "step": 31872 + }, + { + "epoch": 0.62, + "learning_rate": 7.642033319094404e-08, + "loss": 0.0019, + "step": 31873 + }, + { + "epoch": 0.62, + "learning_rate": 7.64164498466079e-08, + "loss": 0.0004, + "step": 31874 + }, + { + "epoch": 0.62, + "learning_rate": 7.641256650227176e-08, + "loss": 0.6921, + "step": 31875 + }, + { + "epoch": 0.62, + "learning_rate": 7.640868315793561e-08, + "loss": 0.0004, + "step": 31876 + }, + { + "epoch": 0.62, + "learning_rate": 7.640479981359946e-08, + "loss": 0.0005, + "step": 31877 + }, + { + "epoch": 0.62, + "learning_rate": 7.640091646926332e-08, + "loss": 0.0006, + "step": 31878 + }, + { + "epoch": 0.62, + "learning_rate": 7.639703312492718e-08, + "loss": 0.0006, + "step": 31879 + }, + { + "epoch": 0.62, + "learning_rate": 7.639314978059103e-08, + "loss": 0.0006, + "step": 31880 + }, + { + "epoch": 0.62, + "learning_rate": 7.638926643625489e-08, + "loss": 0.0005, + "step": 31881 + }, + { + "epoch": 0.62, + "learning_rate": 7.638538309191875e-08, + "loss": 0.0005, + "step": 31882 + }, + { + "epoch": 0.62, + "learning_rate": 7.638149974758261e-08, + "loss": 0.0005, + "step": 31883 + }, + { + "epoch": 0.62, + "learning_rate": 7.637761640324647e-08, + "loss": 0.0005, + "step": 31884 + }, + { + "epoch": 0.62, + "learning_rate": 7.637373305891032e-08, + "loss": 0.0008, + "step": 31885 + }, + { + "epoch": 0.62, + "learning_rate": 7.636984971457418e-08, + "loss": 0.0005, + "step": 31886 + }, + { + "epoch": 0.62, + "learning_rate": 7.636596637023804e-08, + "loss": 1.0357, + "step": 31887 + }, + { + "epoch": 0.62, + "learning_rate": 7.63620830259019e-08, + "loss": 0.0006, + "step": 31888 + }, + { + "epoch": 0.62, + "learning_rate": 7.635819968156576e-08, + "loss": 0.0006, + "step": 31889 + }, + { + "epoch": 0.62, + "learning_rate": 7.635431633722962e-08, + "loss": 0.0005, + "step": 31890 + }, + { + "epoch": 0.62, + "learning_rate": 7.635043299289347e-08, + "loss": 1.0726, + "step": 31891 + }, + { + "epoch": 0.62, + "learning_rate": 7.634654964855733e-08, + "loss": 0.0008, + "step": 31892 + }, + { + "epoch": 0.62, + "learning_rate": 7.634266630422119e-08, + "loss": 0.0005, + "step": 31893 + }, + { + "epoch": 0.62, + "learning_rate": 7.633878295988505e-08, + "loss": 0.0005, + "step": 31894 + }, + { + "epoch": 0.62, + "learning_rate": 7.633489961554891e-08, + "loss": 0.0399, + "step": 31895 + }, + { + "epoch": 0.62, + "learning_rate": 7.633101627121277e-08, + "loss": 0.0004, + "step": 31896 + }, + { + "epoch": 0.62, + "learning_rate": 7.632713292687662e-08, + "loss": 0.0051, + "step": 31897 + }, + { + "epoch": 0.62, + "learning_rate": 7.632324958254048e-08, + "loss": 0.0005, + "step": 31898 + }, + { + "epoch": 0.62, + "learning_rate": 7.631936623820434e-08, + "loss": 0.0006, + "step": 31899 + }, + { + "epoch": 0.62, + "learning_rate": 7.63154828938682e-08, + "loss": 0.0009, + "step": 31900 + }, + { + "epoch": 0.62, + "learning_rate": 7.631159954953206e-08, + "loss": 0.0005, + "step": 31901 + }, + { + "epoch": 0.62, + "learning_rate": 7.630771620519591e-08, + "loss": 0.0005, + "step": 31902 + }, + { + "epoch": 0.62, + "learning_rate": 7.630383286085977e-08, + "loss": 0.0007, + "step": 31903 + }, + { + "epoch": 0.62, + "learning_rate": 7.629994951652363e-08, + "loss": 0.0007, + "step": 31904 + }, + { + "epoch": 0.62, + "learning_rate": 7.629606617218749e-08, + "loss": 0.7575, + "step": 31905 + }, + { + "epoch": 0.62, + "learning_rate": 7.629218282785133e-08, + "loss": 0.0008, + "step": 31906 + }, + { + "epoch": 0.62, + "learning_rate": 7.628829948351519e-08, + "loss": 0.0006, + "step": 31907 + }, + { + "epoch": 0.62, + "learning_rate": 7.628441613917905e-08, + "loss": 0.0008, + "step": 31908 + }, + { + "epoch": 0.62, + "learning_rate": 7.628053279484291e-08, + "loss": 0.0004, + "step": 31909 + }, + { + "epoch": 0.62, + "learning_rate": 7.627664945050677e-08, + "loss": 0.0006, + "step": 31910 + }, + { + "epoch": 0.62, + "learning_rate": 7.627276610617063e-08, + "loss": 0.0066, + "step": 31911 + }, + { + "epoch": 0.62, + "learning_rate": 7.626888276183448e-08, + "loss": 0.1847, + "step": 31912 + }, + { + "epoch": 0.62, + "learning_rate": 7.626499941749834e-08, + "loss": 0.0007, + "step": 31913 + }, + { + "epoch": 0.62, + "learning_rate": 7.62611160731622e-08, + "loss": 0.0007, + "step": 31914 + }, + { + "epoch": 0.62, + "learning_rate": 7.625723272882606e-08, + "loss": 0.0003, + "step": 31915 + }, + { + "epoch": 0.62, + "learning_rate": 7.625334938448992e-08, + "loss": 0.0003, + "step": 31916 + }, + { + "epoch": 0.62, + "learning_rate": 7.624946604015378e-08, + "loss": 0.0005, + "step": 31917 + }, + { + "epoch": 0.62, + "learning_rate": 7.624558269581763e-08, + "loss": 0.0005, + "step": 31918 + }, + { + "epoch": 0.62, + "learning_rate": 7.624169935148149e-08, + "loss": 0.0004, + "step": 31919 + }, + { + "epoch": 0.62, + "learning_rate": 7.623781600714535e-08, + "loss": 0.0006, + "step": 31920 + }, + { + "epoch": 0.62, + "learning_rate": 7.623393266280921e-08, + "loss": 0.0004, + "step": 31921 + }, + { + "epoch": 0.62, + "learning_rate": 7.623004931847307e-08, + "loss": 0.0015, + "step": 31922 + }, + { + "epoch": 0.62, + "learning_rate": 7.622616597413692e-08, + "loss": 0.0006, + "step": 31923 + }, + { + "epoch": 0.62, + "learning_rate": 7.622228262980078e-08, + "loss": 0.0005, + "step": 31924 + }, + { + "epoch": 0.62, + "learning_rate": 7.621839928546464e-08, + "loss": 0.0008, + "step": 31925 + }, + { + "epoch": 0.62, + "learning_rate": 7.62145159411285e-08, + "loss": 0.0006, + "step": 31926 + }, + { + "epoch": 0.62, + "learning_rate": 7.621063259679236e-08, + "loss": 0.0004, + "step": 31927 + }, + { + "epoch": 0.62, + "learning_rate": 7.620674925245622e-08, + "loss": 0.0006, + "step": 31928 + }, + { + "epoch": 0.62, + "learning_rate": 7.620286590812007e-08, + "loss": 0.0005, + "step": 31929 + }, + { + "epoch": 0.62, + "learning_rate": 7.619898256378393e-08, + "loss": 0.0005, + "step": 31930 + }, + { + "epoch": 0.62, + "learning_rate": 7.619509921944779e-08, + "loss": 0.0005, + "step": 31931 + }, + { + "epoch": 0.62, + "learning_rate": 7.619121587511165e-08, + "loss": 0.0006, + "step": 31932 + }, + { + "epoch": 0.62, + "learning_rate": 7.618733253077551e-08, + "loss": 0.666, + "step": 31933 + }, + { + "epoch": 0.62, + "learning_rate": 7.618344918643937e-08, + "loss": 0.0004, + "step": 31934 + }, + { + "epoch": 0.62, + "learning_rate": 7.617956584210321e-08, + "loss": 0.0005, + "step": 31935 + }, + { + "epoch": 0.62, + "learning_rate": 7.617568249776707e-08, + "loss": 0.0006, + "step": 31936 + }, + { + "epoch": 0.62, + "learning_rate": 7.617179915343093e-08, + "loss": 0.0005, + "step": 31937 + }, + { + "epoch": 0.62, + "learning_rate": 7.616791580909479e-08, + "loss": 0.0005, + "step": 31938 + }, + { + "epoch": 0.62, + "learning_rate": 7.616403246475864e-08, + "loss": 0.0005, + "step": 31939 + }, + { + "epoch": 0.62, + "learning_rate": 7.61601491204225e-08, + "loss": 0.0003, + "step": 31940 + }, + { + "epoch": 0.62, + "learning_rate": 7.615626577608636e-08, + "loss": 0.0004, + "step": 31941 + }, + { + "epoch": 0.62, + "learning_rate": 7.615238243175022e-08, + "loss": 0.0006, + "step": 31942 + }, + { + "epoch": 0.62, + "learning_rate": 7.614849908741408e-08, + "loss": 0.0004, + "step": 31943 + }, + { + "epoch": 0.62, + "learning_rate": 7.614461574307793e-08, + "loss": 0.0053, + "step": 31944 + }, + { + "epoch": 0.62, + "learning_rate": 7.614073239874179e-08, + "loss": 0.0004, + "step": 31945 + }, + { + "epoch": 0.62, + "learning_rate": 7.613684905440565e-08, + "loss": 0.0005, + "step": 31946 + }, + { + "epoch": 0.62, + "learning_rate": 7.613296571006951e-08, + "loss": 1.1821, + "step": 31947 + }, + { + "epoch": 0.62, + "learning_rate": 7.612908236573337e-08, + "loss": 0.0081, + "step": 31948 + }, + { + "epoch": 0.62, + "learning_rate": 7.612519902139723e-08, + "loss": 0.0005, + "step": 31949 + }, + { + "epoch": 0.62, + "learning_rate": 7.612131567706108e-08, + "loss": 0.0004, + "step": 31950 + }, + { + "epoch": 0.62, + "learning_rate": 7.611743233272494e-08, + "loss": 0.0015, + "step": 31951 + }, + { + "epoch": 0.62, + "learning_rate": 7.61135489883888e-08, + "loss": 0.0006, + "step": 31952 + }, + { + "epoch": 0.62, + "learning_rate": 7.610966564405266e-08, + "loss": 0.0004, + "step": 31953 + }, + { + "epoch": 0.62, + "learning_rate": 7.610578229971652e-08, + "loss": 0.0005, + "step": 31954 + }, + { + "epoch": 0.62, + "learning_rate": 7.610189895538038e-08, + "loss": 0.0004, + "step": 31955 + }, + { + "epoch": 0.62, + "learning_rate": 7.609801561104423e-08, + "loss": 0.0005, + "step": 31956 + }, + { + "epoch": 0.62, + "learning_rate": 7.609413226670809e-08, + "loss": 0.0005, + "step": 31957 + }, + { + "epoch": 0.62, + "learning_rate": 7.609024892237195e-08, + "loss": 0.0004, + "step": 31958 + }, + { + "epoch": 0.62, + "learning_rate": 7.608636557803581e-08, + "loss": 0.0005, + "step": 31959 + }, + { + "epoch": 0.62, + "learning_rate": 7.608248223369967e-08, + "loss": 0.0004, + "step": 31960 + }, + { + "epoch": 0.62, + "learning_rate": 7.607859888936352e-08, + "loss": 0.3164, + "step": 31961 + }, + { + "epoch": 0.62, + "learning_rate": 7.607471554502738e-08, + "loss": 0.001, + "step": 31962 + }, + { + "epoch": 0.62, + "learning_rate": 7.607083220069124e-08, + "loss": 0.0717, + "step": 31963 + }, + { + "epoch": 0.62, + "learning_rate": 7.606694885635509e-08, + "loss": 0.0371, + "step": 31964 + }, + { + "epoch": 0.62, + "learning_rate": 7.606306551201894e-08, + "loss": 0.0006, + "step": 31965 + }, + { + "epoch": 0.62, + "learning_rate": 7.60591821676828e-08, + "loss": 0.0006, + "step": 31966 + }, + { + "epoch": 0.62, + "learning_rate": 7.605529882334666e-08, + "loss": 0.0014, + "step": 31967 + }, + { + "epoch": 0.62, + "learning_rate": 7.605141547901052e-08, + "loss": 0.0005, + "step": 31968 + }, + { + "epoch": 0.62, + "learning_rate": 7.604753213467438e-08, + "loss": 0.0003, + "step": 31969 + }, + { + "epoch": 0.62, + "learning_rate": 7.604364879033824e-08, + "loss": 0.0007, + "step": 31970 + }, + { + "epoch": 0.62, + "learning_rate": 7.60397654460021e-08, + "loss": 0.0025, + "step": 31971 + }, + { + "epoch": 0.62, + "learning_rate": 7.603588210166595e-08, + "loss": 1.1361, + "step": 31972 + }, + { + "epoch": 0.62, + "learning_rate": 7.603199875732981e-08, + "loss": 0.0004, + "step": 31973 + }, + { + "epoch": 0.62, + "learning_rate": 7.602811541299367e-08, + "loss": 0.0008, + "step": 31974 + }, + { + "epoch": 0.62, + "learning_rate": 7.602423206865753e-08, + "loss": 0.0815, + "step": 31975 + }, + { + "epoch": 0.62, + "learning_rate": 7.602034872432139e-08, + "loss": 0.2727, + "step": 31976 + }, + { + "epoch": 0.62, + "learning_rate": 7.601646537998524e-08, + "loss": 0.7146, + "step": 31977 + }, + { + "epoch": 0.62, + "learning_rate": 7.60125820356491e-08, + "loss": 0.0004, + "step": 31978 + }, + { + "epoch": 0.62, + "learning_rate": 7.600869869131296e-08, + "loss": 0.5958, + "step": 31979 + }, + { + "epoch": 0.62, + "learning_rate": 7.600481534697682e-08, + "loss": 0.0004, + "step": 31980 + }, + { + "epoch": 0.62, + "learning_rate": 7.600093200264068e-08, + "loss": 0.0004, + "step": 31981 + }, + { + "epoch": 0.62, + "learning_rate": 7.599704865830453e-08, + "loss": 0.0005, + "step": 31982 + }, + { + "epoch": 0.62, + "learning_rate": 7.599316531396839e-08, + "loss": 0.0006, + "step": 31983 + }, + { + "epoch": 0.62, + "learning_rate": 7.598928196963225e-08, + "loss": 0.0159, + "step": 31984 + }, + { + "epoch": 0.62, + "learning_rate": 7.598539862529611e-08, + "loss": 0.0231, + "step": 31985 + }, + { + "epoch": 0.62, + "learning_rate": 7.598151528095997e-08, + "loss": 0.0004, + "step": 31986 + }, + { + "epoch": 0.62, + "learning_rate": 7.597763193662383e-08, + "loss": 0.001, + "step": 31987 + }, + { + "epoch": 0.62, + "learning_rate": 7.597374859228768e-08, + "loss": 1.0719, + "step": 31988 + }, + { + "epoch": 0.62, + "learning_rate": 7.596986524795154e-08, + "loss": 0.0005, + "step": 31989 + }, + { + "epoch": 0.62, + "learning_rate": 7.59659819036154e-08, + "loss": 0.1126, + "step": 31990 + }, + { + "epoch": 0.62, + "learning_rate": 7.596209855927926e-08, + "loss": 0.003, + "step": 31991 + }, + { + "epoch": 0.62, + "learning_rate": 7.595821521494312e-08, + "loss": 0.0005, + "step": 31992 + }, + { + "epoch": 0.62, + "learning_rate": 7.595433187060696e-08, + "loss": 0.0007, + "step": 31993 + }, + { + "epoch": 0.62, + "learning_rate": 7.595044852627082e-08, + "loss": 0.0417, + "step": 31994 + }, + { + "epoch": 0.62, + "learning_rate": 7.594656518193468e-08, + "loss": 0.0063, + "step": 31995 + }, + { + "epoch": 0.62, + "learning_rate": 7.594268183759854e-08, + "loss": 0.0385, + "step": 31996 + }, + { + "epoch": 0.62, + "learning_rate": 7.59387984932624e-08, + "loss": 0.0006, + "step": 31997 + }, + { + "epoch": 0.62, + "learning_rate": 7.593491514892625e-08, + "loss": 0.0006, + "step": 31998 + }, + { + "epoch": 0.62, + "learning_rate": 7.593103180459011e-08, + "loss": 0.0158, + "step": 31999 + }, + { + "epoch": 0.62, + "learning_rate": 7.592714846025397e-08, + "loss": 0.0003, + "step": 32000 + }, + { + "epoch": 0.62, + "learning_rate": 7.592326511591783e-08, + "loss": 0.0009, + "step": 32001 + }, + { + "epoch": 0.62, + "learning_rate": 7.591938177158169e-08, + "loss": 0.0005, + "step": 32002 + }, + { + "epoch": 0.62, + "learning_rate": 7.591549842724554e-08, + "loss": 0.0007, + "step": 32003 + }, + { + "epoch": 0.62, + "learning_rate": 7.59116150829094e-08, + "loss": 0.0005, + "step": 32004 + }, + { + "epoch": 0.62, + "learning_rate": 7.590773173857326e-08, + "loss": 0.0004, + "step": 32005 + }, + { + "epoch": 0.62, + "learning_rate": 7.590384839423712e-08, + "loss": 0.0007, + "step": 32006 + }, + { + "epoch": 0.62, + "learning_rate": 7.589996504990098e-08, + "loss": 0.0006, + "step": 32007 + }, + { + "epoch": 0.62, + "learning_rate": 7.589608170556484e-08, + "loss": 0.0005, + "step": 32008 + }, + { + "epoch": 0.62, + "learning_rate": 7.58921983612287e-08, + "loss": 0.0005, + "step": 32009 + }, + { + "epoch": 0.62, + "learning_rate": 7.588831501689255e-08, + "loss": 0.0063, + "step": 32010 + }, + { + "epoch": 0.62, + "learning_rate": 7.58844316725564e-08, + "loss": 0.0005, + "step": 32011 + }, + { + "epoch": 0.62, + "learning_rate": 7.588054832822026e-08, + "loss": 0.9084, + "step": 32012 + }, + { + "epoch": 0.62, + "learning_rate": 7.587666498388411e-08, + "loss": 0.0016, + "step": 32013 + }, + { + "epoch": 0.62, + "learning_rate": 7.587278163954797e-08, + "loss": 0.4438, + "step": 32014 + }, + { + "epoch": 0.62, + "learning_rate": 7.586889829521183e-08, + "loss": 0.0006, + "step": 32015 + }, + { + "epoch": 0.62, + "learning_rate": 7.586501495087569e-08, + "loss": 0.0117, + "step": 32016 + }, + { + "epoch": 0.62, + "learning_rate": 7.586113160653955e-08, + "loss": 0.0005, + "step": 32017 + }, + { + "epoch": 0.62, + "learning_rate": 7.58572482622034e-08, + "loss": 0.993, + "step": 32018 + }, + { + "epoch": 0.62, + "learning_rate": 7.585336491786726e-08, + "loss": 0.0004, + "step": 32019 + }, + { + "epoch": 0.62, + "learning_rate": 7.584948157353112e-08, + "loss": 0.0006, + "step": 32020 + }, + { + "epoch": 0.62, + "learning_rate": 7.584559822919498e-08, + "loss": 0.0134, + "step": 32021 + }, + { + "epoch": 0.62, + "learning_rate": 7.584171488485884e-08, + "loss": 0.0004, + "step": 32022 + }, + { + "epoch": 0.62, + "learning_rate": 7.58378315405227e-08, + "loss": 0.0005, + "step": 32023 + }, + { + "epoch": 0.62, + "learning_rate": 7.583394819618655e-08, + "loss": 0.0005, + "step": 32024 + }, + { + "epoch": 0.62, + "learning_rate": 7.58300648518504e-08, + "loss": 0.0614, + "step": 32025 + }, + { + "epoch": 0.62, + "learning_rate": 7.582618150751426e-08, + "loss": 0.0005, + "step": 32026 + }, + { + "epoch": 0.62, + "learning_rate": 7.582229816317812e-08, + "loss": 0.0009, + "step": 32027 + }, + { + "epoch": 0.62, + "learning_rate": 7.581841481884197e-08, + "loss": 0.0023, + "step": 32028 + }, + { + "epoch": 0.62, + "learning_rate": 7.581453147450583e-08, + "loss": 0.0005, + "step": 32029 + }, + { + "epoch": 0.62, + "learning_rate": 7.581064813016969e-08, + "loss": 0.318, + "step": 32030 + }, + { + "epoch": 0.62, + "learning_rate": 7.580676478583355e-08, + "loss": 0.0006, + "step": 32031 + }, + { + "epoch": 0.62, + "learning_rate": 7.580288144149741e-08, + "loss": 0.0005, + "step": 32032 + }, + { + "epoch": 0.62, + "learning_rate": 7.579899809716127e-08, + "loss": 0.0009, + "step": 32033 + }, + { + "epoch": 0.62, + "learning_rate": 7.579511475282512e-08, + "loss": 0.2816, + "step": 32034 + }, + { + "epoch": 0.62, + "learning_rate": 7.579123140848898e-08, + "loss": 0.0004, + "step": 32035 + }, + { + "epoch": 0.62, + "learning_rate": 7.578734806415284e-08, + "loss": 0.0463, + "step": 32036 + }, + { + "epoch": 0.62, + "learning_rate": 7.57834647198167e-08, + "loss": 0.0005, + "step": 32037 + }, + { + "epoch": 0.62, + "learning_rate": 7.577958137548056e-08, + "loss": 0.0004, + "step": 32038 + }, + { + "epoch": 0.62, + "learning_rate": 7.577569803114441e-08, + "loss": 0.0103, + "step": 32039 + }, + { + "epoch": 0.62, + "learning_rate": 7.577181468680827e-08, + "loss": 0.0006, + "step": 32040 + }, + { + "epoch": 0.62, + "learning_rate": 7.576793134247213e-08, + "loss": 0.0005, + "step": 32041 + }, + { + "epoch": 0.62, + "learning_rate": 7.576404799813599e-08, + "loss": 0.0006, + "step": 32042 + }, + { + "epoch": 0.62, + "learning_rate": 7.576016465379985e-08, + "loss": 0.0004, + "step": 32043 + }, + { + "epoch": 0.62, + "learning_rate": 7.57562813094637e-08, + "loss": 0.0005, + "step": 32044 + }, + { + "epoch": 0.62, + "learning_rate": 7.575239796512756e-08, + "loss": 0.0006, + "step": 32045 + }, + { + "epoch": 0.62, + "learning_rate": 7.574851462079142e-08, + "loss": 0.0004, + "step": 32046 + }, + { + "epoch": 0.62, + "learning_rate": 7.574463127645528e-08, + "loss": 0.0005, + "step": 32047 + }, + { + "epoch": 0.62, + "learning_rate": 7.574074793211914e-08, + "loss": 0.0005, + "step": 32048 + }, + { + "epoch": 0.62, + "learning_rate": 7.5736864587783e-08, + "loss": 0.0005, + "step": 32049 + }, + { + "epoch": 0.62, + "learning_rate": 7.573298124344686e-08, + "loss": 0.0008, + "step": 32050 + }, + { + "epoch": 0.62, + "learning_rate": 7.57290978991107e-08, + "loss": 0.0007, + "step": 32051 + }, + { + "epoch": 0.62, + "learning_rate": 7.572521455477456e-08, + "loss": 0.0014, + "step": 32052 + }, + { + "epoch": 0.62, + "learning_rate": 7.572133121043842e-08, + "loss": 0.0007, + "step": 32053 + }, + { + "epoch": 0.62, + "learning_rate": 7.571744786610228e-08, + "loss": 0.0005, + "step": 32054 + }, + { + "epoch": 0.62, + "learning_rate": 7.571356452176613e-08, + "loss": 0.0006, + "step": 32055 + }, + { + "epoch": 0.62, + "learning_rate": 7.570968117742999e-08, + "loss": 0.0006, + "step": 32056 + }, + { + "epoch": 0.62, + "learning_rate": 7.570579783309385e-08, + "loss": 0.0003, + "step": 32057 + }, + { + "epoch": 0.62, + "learning_rate": 7.570191448875771e-08, + "loss": 0.0004, + "step": 32058 + }, + { + "epoch": 0.62, + "learning_rate": 7.569803114442157e-08, + "loss": 0.2333, + "step": 32059 + }, + { + "epoch": 0.62, + "learning_rate": 7.569414780008542e-08, + "loss": 0.1675, + "step": 32060 + }, + { + "epoch": 0.62, + "learning_rate": 7.569026445574928e-08, + "loss": 0.0003, + "step": 32061 + }, + { + "epoch": 0.62, + "learning_rate": 7.568638111141314e-08, + "loss": 0.0011, + "step": 32062 + }, + { + "epoch": 0.62, + "learning_rate": 7.5682497767077e-08, + "loss": 0.0006, + "step": 32063 + }, + { + "epoch": 0.62, + "learning_rate": 7.567861442274086e-08, + "loss": 0.0004, + "step": 32064 + }, + { + "epoch": 0.62, + "learning_rate": 7.567473107840472e-08, + "loss": 0.0003, + "step": 32065 + }, + { + "epoch": 0.62, + "learning_rate": 7.567084773406857e-08, + "loss": 0.0006, + "step": 32066 + }, + { + "epoch": 0.62, + "learning_rate": 7.566696438973243e-08, + "loss": 0.0004, + "step": 32067 + }, + { + "epoch": 0.62, + "learning_rate": 7.566308104539629e-08, + "loss": 0.0004, + "step": 32068 + }, + { + "epoch": 0.62, + "learning_rate": 7.565919770106015e-08, + "loss": 0.0005, + "step": 32069 + }, + { + "epoch": 0.62, + "learning_rate": 7.565531435672401e-08, + "loss": 0.0004, + "step": 32070 + }, + { + "epoch": 0.62, + "learning_rate": 7.565143101238787e-08, + "loss": 0.0004, + "step": 32071 + }, + { + "epoch": 0.62, + "learning_rate": 7.564754766805172e-08, + "loss": 0.0005, + "step": 32072 + }, + { + "epoch": 0.62, + "learning_rate": 7.564366432371558e-08, + "loss": 0.0005, + "step": 32073 + }, + { + "epoch": 0.62, + "learning_rate": 7.563978097937944e-08, + "loss": 0.0022, + "step": 32074 + }, + { + "epoch": 0.62, + "learning_rate": 7.56358976350433e-08, + "loss": 0.0005, + "step": 32075 + }, + { + "epoch": 0.62, + "learning_rate": 7.563201429070716e-08, + "loss": 0.0004, + "step": 32076 + }, + { + "epoch": 0.62, + "learning_rate": 7.562813094637101e-08, + "loss": 0.0005, + "step": 32077 + }, + { + "epoch": 0.62, + "learning_rate": 7.562424760203487e-08, + "loss": 0.0005, + "step": 32078 + }, + { + "epoch": 0.62, + "learning_rate": 7.562036425769873e-08, + "loss": 0.0006, + "step": 32079 + }, + { + "epoch": 0.62, + "learning_rate": 7.561648091336258e-08, + "loss": 0.0005, + "step": 32080 + }, + { + "epoch": 0.62, + "learning_rate": 7.561259756902643e-08, + "loss": 0.4056, + "step": 32081 + }, + { + "epoch": 0.62, + "learning_rate": 7.560871422469029e-08, + "loss": 0.0054, + "step": 32082 + }, + { + "epoch": 0.62, + "learning_rate": 7.560483088035415e-08, + "loss": 0.0003, + "step": 32083 + }, + { + "epoch": 0.62, + "learning_rate": 7.560094753601801e-08, + "loss": 0.0004, + "step": 32084 + }, + { + "epoch": 0.62, + "learning_rate": 7.559706419168187e-08, + "loss": 0.0004, + "step": 32085 + }, + { + "epoch": 0.62, + "learning_rate": 7.559318084734573e-08, + "loss": 0.0005, + "step": 32086 + }, + { + "epoch": 0.62, + "learning_rate": 7.558929750300958e-08, + "loss": 0.0033, + "step": 32087 + }, + { + "epoch": 0.62, + "learning_rate": 7.558541415867344e-08, + "loss": 0.0005, + "step": 32088 + }, + { + "epoch": 0.62, + "learning_rate": 7.55815308143373e-08, + "loss": 0.0024, + "step": 32089 + }, + { + "epoch": 0.62, + "learning_rate": 7.557764747000116e-08, + "loss": 0.0009, + "step": 32090 + }, + { + "epoch": 0.62, + "learning_rate": 7.557376412566502e-08, + "loss": 0.0003, + "step": 32091 + }, + { + "epoch": 0.62, + "learning_rate": 7.556988078132888e-08, + "loss": 0.0004, + "step": 32092 + }, + { + "epoch": 0.62, + "learning_rate": 7.556599743699273e-08, + "loss": 0.0004, + "step": 32093 + }, + { + "epoch": 0.62, + "learning_rate": 7.556211409265659e-08, + "loss": 0.0412, + "step": 32094 + }, + { + "epoch": 0.62, + "learning_rate": 7.555823074832045e-08, + "loss": 0.0726, + "step": 32095 + }, + { + "epoch": 0.62, + "learning_rate": 7.555434740398431e-08, + "loss": 0.0005, + "step": 32096 + }, + { + "epoch": 0.62, + "learning_rate": 7.555046405964817e-08, + "loss": 0.0004, + "step": 32097 + }, + { + "epoch": 0.62, + "learning_rate": 7.554658071531202e-08, + "loss": 0.0003, + "step": 32098 + }, + { + "epoch": 0.62, + "learning_rate": 7.554269737097588e-08, + "loss": 0.0004, + "step": 32099 + }, + { + "epoch": 0.62, + "learning_rate": 7.553881402663974e-08, + "loss": 0.0004, + "step": 32100 + }, + { + "epoch": 0.62, + "learning_rate": 7.55349306823036e-08, + "loss": 0.0006, + "step": 32101 + }, + { + "epoch": 0.62, + "learning_rate": 7.553104733796746e-08, + "loss": 0.0006, + "step": 32102 + }, + { + "epoch": 0.62, + "learning_rate": 7.552716399363132e-08, + "loss": 0.0004, + "step": 32103 + }, + { + "epoch": 0.62, + "learning_rate": 7.552328064929517e-08, + "loss": 0.0004, + "step": 32104 + }, + { + "epoch": 0.62, + "learning_rate": 7.551939730495903e-08, + "loss": 0.0005, + "step": 32105 + }, + { + "epoch": 0.62, + "learning_rate": 7.551551396062289e-08, + "loss": 0.0004, + "step": 32106 + }, + { + "epoch": 0.62, + "learning_rate": 7.551163061628675e-08, + "loss": 0.0005, + "step": 32107 + }, + { + "epoch": 0.62, + "learning_rate": 7.550774727195061e-08, + "loss": 0.0004, + "step": 32108 + }, + { + "epoch": 0.62, + "learning_rate": 7.550386392761445e-08, + "loss": 0.0246, + "step": 32109 + }, + { + "epoch": 0.62, + "learning_rate": 7.549998058327831e-08, + "loss": 0.0012, + "step": 32110 + }, + { + "epoch": 0.62, + "learning_rate": 7.549609723894217e-08, + "loss": 0.0082, + "step": 32111 + }, + { + "epoch": 0.62, + "learning_rate": 7.549221389460603e-08, + "loss": 0.0009, + "step": 32112 + }, + { + "epoch": 0.62, + "learning_rate": 7.548833055026989e-08, + "loss": 0.0005, + "step": 32113 + }, + { + "epoch": 0.62, + "learning_rate": 7.548444720593374e-08, + "loss": 1.1023, + "step": 32114 + }, + { + "epoch": 0.62, + "learning_rate": 7.54805638615976e-08, + "loss": 0.0005, + "step": 32115 + }, + { + "epoch": 0.62, + "learning_rate": 7.547668051726146e-08, + "loss": 0.0008, + "step": 32116 + }, + { + "epoch": 0.62, + "learning_rate": 7.547279717292532e-08, + "loss": 0.0007, + "step": 32117 + }, + { + "epoch": 0.62, + "learning_rate": 7.546891382858918e-08, + "loss": 0.0004, + "step": 32118 + }, + { + "epoch": 0.62, + "learning_rate": 7.546503048425303e-08, + "loss": 0.0004, + "step": 32119 + }, + { + "epoch": 0.62, + "learning_rate": 7.546114713991689e-08, + "loss": 0.001, + "step": 32120 + }, + { + "epoch": 0.62, + "learning_rate": 7.545726379558075e-08, + "loss": 0.0007, + "step": 32121 + }, + { + "epoch": 0.62, + "learning_rate": 7.545338045124461e-08, + "loss": 0.0006, + "step": 32122 + }, + { + "epoch": 0.62, + "learning_rate": 7.544949710690847e-08, + "loss": 0.0005, + "step": 32123 + }, + { + "epoch": 0.62, + "learning_rate": 7.544561376257233e-08, + "loss": 0.0004, + "step": 32124 + }, + { + "epoch": 0.62, + "learning_rate": 7.544173041823618e-08, + "loss": 0.249, + "step": 32125 + }, + { + "epoch": 0.62, + "learning_rate": 7.543784707390004e-08, + "loss": 0.0004, + "step": 32126 + }, + { + "epoch": 0.62, + "learning_rate": 7.54339637295639e-08, + "loss": 0.0007, + "step": 32127 + }, + { + "epoch": 0.62, + "learning_rate": 7.543008038522776e-08, + "loss": 0.0077, + "step": 32128 + }, + { + "epoch": 0.62, + "learning_rate": 7.542619704089162e-08, + "loss": 0.0005, + "step": 32129 + }, + { + "epoch": 0.62, + "learning_rate": 7.542231369655548e-08, + "loss": 0.0006, + "step": 32130 + }, + { + "epoch": 0.62, + "learning_rate": 7.541843035221933e-08, + "loss": 0.0003, + "step": 32131 + }, + { + "epoch": 0.62, + "learning_rate": 7.541454700788319e-08, + "loss": 0.0004, + "step": 32132 + }, + { + "epoch": 0.62, + "learning_rate": 7.541066366354705e-08, + "loss": 0.0006, + "step": 32133 + }, + { + "epoch": 0.62, + "learning_rate": 7.540678031921091e-08, + "loss": 0.0006, + "step": 32134 + }, + { + "epoch": 0.62, + "learning_rate": 7.540289697487477e-08, + "loss": 0.0012, + "step": 32135 + }, + { + "epoch": 0.62, + "learning_rate": 7.539901363053862e-08, + "loss": 0.0096, + "step": 32136 + }, + { + "epoch": 0.62, + "learning_rate": 7.539513028620248e-08, + "loss": 0.0005, + "step": 32137 + }, + { + "epoch": 0.62, + "learning_rate": 7.539124694186633e-08, + "loss": 0.0004, + "step": 32138 + }, + { + "epoch": 0.62, + "learning_rate": 7.538736359753019e-08, + "loss": 0.0003, + "step": 32139 + }, + { + "epoch": 0.62, + "learning_rate": 7.538348025319404e-08, + "loss": 0.0004, + "step": 32140 + }, + { + "epoch": 0.62, + "learning_rate": 7.53795969088579e-08, + "loss": 0.0004, + "step": 32141 + }, + { + "epoch": 0.62, + "learning_rate": 7.537571356452176e-08, + "loss": 0.0677, + "step": 32142 + }, + { + "epoch": 0.62, + "learning_rate": 7.537183022018562e-08, + "loss": 0.0006, + "step": 32143 + }, + { + "epoch": 0.62, + "learning_rate": 7.536794687584948e-08, + "loss": 0.0006, + "step": 32144 + }, + { + "epoch": 0.62, + "learning_rate": 7.536406353151334e-08, + "loss": 0.0006, + "step": 32145 + }, + { + "epoch": 0.62, + "learning_rate": 7.53601801871772e-08, + "loss": 0.0006, + "step": 32146 + }, + { + "epoch": 0.62, + "learning_rate": 7.535629684284105e-08, + "loss": 0.0005, + "step": 32147 + }, + { + "epoch": 0.62, + "learning_rate": 7.535241349850491e-08, + "loss": 0.0004, + "step": 32148 + }, + { + "epoch": 0.62, + "learning_rate": 7.534853015416877e-08, + "loss": 0.0005, + "step": 32149 + }, + { + "epoch": 0.62, + "learning_rate": 7.534464680983263e-08, + "loss": 0.0005, + "step": 32150 + }, + { + "epoch": 0.62, + "learning_rate": 7.534076346549649e-08, + "loss": 0.0024, + "step": 32151 + }, + { + "epoch": 0.62, + "learning_rate": 7.533688012116034e-08, + "loss": 0.0011, + "step": 32152 + }, + { + "epoch": 0.62, + "learning_rate": 7.53329967768242e-08, + "loss": 0.025, + "step": 32153 + }, + { + "epoch": 0.62, + "learning_rate": 7.532911343248806e-08, + "loss": 0.0004, + "step": 32154 + }, + { + "epoch": 0.62, + "learning_rate": 7.532523008815192e-08, + "loss": 0.5996, + "step": 32155 + }, + { + "epoch": 0.62, + "learning_rate": 7.532134674381578e-08, + "loss": 0.1748, + "step": 32156 + }, + { + "epoch": 0.62, + "learning_rate": 7.531746339947963e-08, + "loss": 0.0005, + "step": 32157 + }, + { + "epoch": 0.62, + "learning_rate": 7.531358005514349e-08, + "loss": 0.0024, + "step": 32158 + }, + { + "epoch": 0.62, + "learning_rate": 7.530969671080735e-08, + "loss": 0.0004, + "step": 32159 + }, + { + "epoch": 0.62, + "learning_rate": 7.530581336647121e-08, + "loss": 0.0013, + "step": 32160 + }, + { + "epoch": 0.62, + "learning_rate": 7.530193002213507e-08, + "loss": 0.0005, + "step": 32161 + }, + { + "epoch": 0.62, + "learning_rate": 7.529804667779893e-08, + "loss": 0.0004, + "step": 32162 + }, + { + "epoch": 0.62, + "learning_rate": 7.529416333346278e-08, + "loss": 0.0092, + "step": 32163 + }, + { + "epoch": 0.62, + "learning_rate": 7.529027998912664e-08, + "loss": 0.0004, + "step": 32164 + }, + { + "epoch": 0.62, + "learning_rate": 7.52863966447905e-08, + "loss": 0.0008, + "step": 32165 + }, + { + "epoch": 0.62, + "learning_rate": 7.528251330045436e-08, + "loss": 0.0004, + "step": 32166 + }, + { + "epoch": 0.62, + "learning_rate": 7.52786299561182e-08, + "loss": 0.0005, + "step": 32167 + }, + { + "epoch": 0.62, + "learning_rate": 7.527474661178206e-08, + "loss": 0.0081, + "step": 32168 + }, + { + "epoch": 0.62, + "learning_rate": 7.527086326744592e-08, + "loss": 0.0005, + "step": 32169 + }, + { + "epoch": 0.62, + "learning_rate": 7.526697992310978e-08, + "loss": 0.0005, + "step": 32170 + }, + { + "epoch": 0.62, + "learning_rate": 7.526309657877364e-08, + "loss": 0.6296, + "step": 32171 + }, + { + "epoch": 0.62, + "learning_rate": 7.52592132344375e-08, + "loss": 0.1948, + "step": 32172 + }, + { + "epoch": 0.62, + "learning_rate": 7.525532989010135e-08, + "loss": 0.0004, + "step": 32173 + }, + { + "epoch": 0.62, + "learning_rate": 7.525144654576521e-08, + "loss": 0.0004, + "step": 32174 + }, + { + "epoch": 0.62, + "learning_rate": 7.524756320142907e-08, + "loss": 0.0005, + "step": 32175 + }, + { + "epoch": 0.62, + "learning_rate": 7.524367985709293e-08, + "loss": 0.0005, + "step": 32176 + }, + { + "epoch": 0.62, + "learning_rate": 7.523979651275679e-08, + "loss": 0.0004, + "step": 32177 + }, + { + "epoch": 0.62, + "learning_rate": 7.523591316842064e-08, + "loss": 0.0197, + "step": 32178 + }, + { + "epoch": 0.62, + "learning_rate": 7.52320298240845e-08, + "loss": 0.0004, + "step": 32179 + }, + { + "epoch": 0.62, + "learning_rate": 7.522814647974836e-08, + "loss": 0.0004, + "step": 32180 + }, + { + "epoch": 0.62, + "learning_rate": 7.522426313541222e-08, + "loss": 0.0008, + "step": 32181 + }, + { + "epoch": 0.62, + "learning_rate": 7.522037979107608e-08, + "loss": 0.0015, + "step": 32182 + }, + { + "epoch": 0.62, + "learning_rate": 7.521649644673994e-08, + "loss": 0.0116, + "step": 32183 + }, + { + "epoch": 0.62, + "learning_rate": 7.52126131024038e-08, + "loss": 0.0009, + "step": 32184 + }, + { + "epoch": 0.62, + "learning_rate": 7.520872975806765e-08, + "loss": 0.9978, + "step": 32185 + }, + { + "epoch": 0.62, + "learning_rate": 7.520484641373151e-08, + "loss": 0.0004, + "step": 32186 + }, + { + "epoch": 0.62, + "learning_rate": 7.520096306939537e-08, + "loss": 0.0004, + "step": 32187 + }, + { + "epoch": 0.62, + "learning_rate": 7.519707972505921e-08, + "loss": 0.0004, + "step": 32188 + }, + { + "epoch": 0.62, + "learning_rate": 7.519319638072307e-08, + "loss": 0.0005, + "step": 32189 + }, + { + "epoch": 0.62, + "learning_rate": 7.518931303638693e-08, + "loss": 0.0005, + "step": 32190 + }, + { + "epoch": 0.62, + "learning_rate": 7.518542969205079e-08, + "loss": 0.0004, + "step": 32191 + }, + { + "epoch": 0.62, + "learning_rate": 7.518154634771465e-08, + "loss": 0.0006, + "step": 32192 + }, + { + "epoch": 0.62, + "learning_rate": 7.51776630033785e-08, + "loss": 0.0004, + "step": 32193 + }, + { + "epoch": 0.62, + "learning_rate": 7.517377965904236e-08, + "loss": 0.0003, + "step": 32194 + }, + { + "epoch": 0.62, + "learning_rate": 7.516989631470622e-08, + "loss": 0.0005, + "step": 32195 + }, + { + "epoch": 0.62, + "learning_rate": 7.516601297037008e-08, + "loss": 0.0006, + "step": 32196 + }, + { + "epoch": 0.62, + "learning_rate": 7.516212962603394e-08, + "loss": 0.0003, + "step": 32197 + }, + { + "epoch": 0.62, + "learning_rate": 7.51582462816978e-08, + "loss": 0.0006, + "step": 32198 + }, + { + "epoch": 0.62, + "learning_rate": 7.515436293736165e-08, + "loss": 0.0005, + "step": 32199 + }, + { + "epoch": 0.62, + "learning_rate": 7.515047959302551e-08, + "loss": 0.0005, + "step": 32200 + }, + { + "epoch": 0.62, + "learning_rate": 7.514659624868937e-08, + "loss": 0.0006, + "step": 32201 + }, + { + "epoch": 0.62, + "learning_rate": 7.514271290435322e-08, + "loss": 0.0004, + "step": 32202 + }, + { + "epoch": 0.62, + "learning_rate": 7.513882956001707e-08, + "loss": 0.2581, + "step": 32203 + }, + { + "epoch": 0.62, + "learning_rate": 7.513494621568093e-08, + "loss": 0.0005, + "step": 32204 + }, + { + "epoch": 0.62, + "learning_rate": 7.513106287134479e-08, + "loss": 0.0004, + "step": 32205 + }, + { + "epoch": 0.62, + "learning_rate": 7.512717952700865e-08, + "loss": 0.0005, + "step": 32206 + }, + { + "epoch": 0.62, + "learning_rate": 7.512329618267251e-08, + "loss": 0.0004, + "step": 32207 + }, + { + "epoch": 0.62, + "learning_rate": 7.511941283833637e-08, + "loss": 0.0004, + "step": 32208 + }, + { + "epoch": 0.62, + "learning_rate": 7.511552949400022e-08, + "loss": 0.0004, + "step": 32209 + }, + { + "epoch": 0.62, + "learning_rate": 7.511164614966408e-08, + "loss": 0.0004, + "step": 32210 + }, + { + "epoch": 0.62, + "learning_rate": 7.510776280532794e-08, + "loss": 0.0004, + "step": 32211 + }, + { + "epoch": 0.62, + "learning_rate": 7.51038794609918e-08, + "loss": 0.0022, + "step": 32212 + }, + { + "epoch": 0.62, + "learning_rate": 7.509999611665566e-08, + "loss": 0.0005, + "step": 32213 + }, + { + "epoch": 0.62, + "learning_rate": 7.509611277231951e-08, + "loss": 0.0011, + "step": 32214 + }, + { + "epoch": 0.62, + "learning_rate": 7.509222942798337e-08, + "loss": 0.0004, + "step": 32215 + }, + { + "epoch": 0.62, + "learning_rate": 7.508834608364723e-08, + "loss": 0.0479, + "step": 32216 + }, + { + "epoch": 0.62, + "learning_rate": 7.508446273931109e-08, + "loss": 0.0004, + "step": 32217 + }, + { + "epoch": 0.62, + "learning_rate": 7.508057939497495e-08, + "loss": 0.0004, + "step": 32218 + }, + { + "epoch": 0.62, + "learning_rate": 7.50766960506388e-08, + "loss": 0.8428, + "step": 32219 + }, + { + "epoch": 0.62, + "learning_rate": 7.507281270630266e-08, + "loss": 0.0007, + "step": 32220 + }, + { + "epoch": 0.63, + "learning_rate": 7.506892936196652e-08, + "loss": 0.0005, + "step": 32221 + }, + { + "epoch": 0.63, + "learning_rate": 7.506504601763038e-08, + "loss": 0.0003, + "step": 32222 + }, + { + "epoch": 0.63, + "learning_rate": 7.506116267329424e-08, + "loss": 0.0037, + "step": 32223 + }, + { + "epoch": 0.63, + "learning_rate": 7.50572793289581e-08, + "loss": 0.0264, + "step": 32224 + }, + { + "epoch": 0.63, + "learning_rate": 7.505339598462194e-08, + "loss": 0.6609, + "step": 32225 + }, + { + "epoch": 0.63, + "learning_rate": 7.50495126402858e-08, + "loss": 0.8704, + "step": 32226 + }, + { + "epoch": 0.63, + "learning_rate": 7.504562929594966e-08, + "loss": 0.0006, + "step": 32227 + }, + { + "epoch": 0.63, + "learning_rate": 7.504174595161352e-08, + "loss": 0.0005, + "step": 32228 + }, + { + "epoch": 0.63, + "learning_rate": 7.503786260727738e-08, + "loss": 0.075, + "step": 32229 + }, + { + "epoch": 0.63, + "learning_rate": 7.503397926294123e-08, + "loss": 1.3779, + "step": 32230 + }, + { + "epoch": 0.63, + "learning_rate": 7.503009591860509e-08, + "loss": 0.0005, + "step": 32231 + }, + { + "epoch": 0.63, + "learning_rate": 7.502621257426895e-08, + "loss": 0.002, + "step": 32232 + }, + { + "epoch": 0.63, + "learning_rate": 7.502232922993281e-08, + "loss": 0.0251, + "step": 32233 + }, + { + "epoch": 0.63, + "learning_rate": 7.501844588559667e-08, + "loss": 0.0003, + "step": 32234 + }, + { + "epoch": 0.63, + "learning_rate": 7.501456254126052e-08, + "loss": 0.0006, + "step": 32235 + }, + { + "epoch": 0.63, + "learning_rate": 7.501067919692438e-08, + "loss": 0.0005, + "step": 32236 + }, + { + "epoch": 0.63, + "learning_rate": 7.500679585258824e-08, + "loss": 0.0005, + "step": 32237 + }, + { + "epoch": 0.63, + "learning_rate": 7.50029125082521e-08, + "loss": 0.0003, + "step": 32238 + }, + { + "epoch": 0.63, + "learning_rate": 7.499902916391596e-08, + "loss": 0.0006, + "step": 32239 + }, + { + "epoch": 0.63, + "learning_rate": 7.499514581957982e-08, + "loss": 0.0007, + "step": 32240 + }, + { + "epoch": 0.63, + "learning_rate": 7.499126247524367e-08, + "loss": 0.0005, + "step": 32241 + }, + { + "epoch": 0.63, + "learning_rate": 7.498737913090753e-08, + "loss": 0.0005, + "step": 32242 + }, + { + "epoch": 0.63, + "learning_rate": 7.498349578657139e-08, + "loss": 0.0004, + "step": 32243 + }, + { + "epoch": 0.63, + "learning_rate": 7.497961244223525e-08, + "loss": 0.0005, + "step": 32244 + }, + { + "epoch": 0.63, + "learning_rate": 7.497572909789911e-08, + "loss": 0.8495, + "step": 32245 + }, + { + "epoch": 0.63, + "learning_rate": 7.497184575356297e-08, + "loss": 0.0018, + "step": 32246 + }, + { + "epoch": 0.63, + "learning_rate": 7.496796240922682e-08, + "loss": 0.0005, + "step": 32247 + }, + { + "epoch": 0.63, + "learning_rate": 7.496407906489068e-08, + "loss": 0.0006, + "step": 32248 + }, + { + "epoch": 0.63, + "learning_rate": 7.496019572055454e-08, + "loss": 0.0076, + "step": 32249 + }, + { + "epoch": 0.63, + "learning_rate": 7.49563123762184e-08, + "loss": 0.0004, + "step": 32250 + }, + { + "epoch": 0.63, + "learning_rate": 7.495242903188226e-08, + "loss": 0.0007, + "step": 32251 + }, + { + "epoch": 0.63, + "learning_rate": 7.494854568754612e-08, + "loss": 0.5113, + "step": 32252 + }, + { + "epoch": 0.63, + "learning_rate": 7.494466234320997e-08, + "loss": 0.0005, + "step": 32253 + }, + { + "epoch": 0.63, + "learning_rate": 7.494077899887382e-08, + "loss": 0.0477, + "step": 32254 + }, + { + "epoch": 0.63, + "learning_rate": 7.493689565453768e-08, + "loss": 0.0005, + "step": 32255 + }, + { + "epoch": 0.63, + "learning_rate": 7.493301231020153e-08, + "loss": 0.0006, + "step": 32256 + }, + { + "epoch": 0.63, + "learning_rate": 7.492912896586539e-08, + "loss": 0.0005, + "step": 32257 + }, + { + "epoch": 0.63, + "learning_rate": 7.492524562152925e-08, + "loss": 0.0004, + "step": 32258 + }, + { + "epoch": 0.63, + "learning_rate": 7.492136227719311e-08, + "loss": 0.0003, + "step": 32259 + }, + { + "epoch": 0.63, + "learning_rate": 7.491747893285697e-08, + "loss": 0.0003, + "step": 32260 + }, + { + "epoch": 0.63, + "learning_rate": 7.491359558852083e-08, + "loss": 0.0012, + "step": 32261 + }, + { + "epoch": 0.63, + "learning_rate": 7.490971224418468e-08, + "loss": 0.0004, + "step": 32262 + }, + { + "epoch": 0.63, + "learning_rate": 7.490582889984854e-08, + "loss": 0.8115, + "step": 32263 + }, + { + "epoch": 0.63, + "learning_rate": 7.49019455555124e-08, + "loss": 0.0003, + "step": 32264 + }, + { + "epoch": 0.63, + "learning_rate": 7.489806221117626e-08, + "loss": 0.0004, + "step": 32265 + }, + { + "epoch": 0.63, + "learning_rate": 7.489417886684012e-08, + "loss": 0.0005, + "step": 32266 + }, + { + "epoch": 0.63, + "learning_rate": 7.489029552250398e-08, + "loss": 0.0107, + "step": 32267 + }, + { + "epoch": 0.63, + "learning_rate": 7.488641217816783e-08, + "loss": 0.0005, + "step": 32268 + }, + { + "epoch": 0.63, + "learning_rate": 7.488252883383169e-08, + "loss": 0.0005, + "step": 32269 + }, + { + "epoch": 0.63, + "learning_rate": 7.487864548949555e-08, + "loss": 0.0006, + "step": 32270 + }, + { + "epoch": 0.63, + "learning_rate": 7.487476214515941e-08, + "loss": 0.0004, + "step": 32271 + }, + { + "epoch": 0.63, + "learning_rate": 7.487087880082327e-08, + "loss": 0.0006, + "step": 32272 + }, + { + "epoch": 0.63, + "learning_rate": 7.486699545648712e-08, + "loss": 0.0004, + "step": 32273 + }, + { + "epoch": 0.63, + "learning_rate": 7.486311211215098e-08, + "loss": 0.0005, + "step": 32274 + }, + { + "epoch": 0.63, + "learning_rate": 7.485922876781484e-08, + "loss": 0.0005, + "step": 32275 + }, + { + "epoch": 0.63, + "learning_rate": 7.48553454234787e-08, + "loss": 0.0005, + "step": 32276 + }, + { + "epoch": 0.63, + "learning_rate": 7.485146207914256e-08, + "loss": 0.0006, + "step": 32277 + }, + { + "epoch": 0.63, + "learning_rate": 7.484757873480642e-08, + "loss": 0.0004, + "step": 32278 + }, + { + "epoch": 0.63, + "learning_rate": 7.484369539047027e-08, + "loss": 0.0006, + "step": 32279 + }, + { + "epoch": 0.63, + "learning_rate": 7.483981204613413e-08, + "loss": 0.0004, + "step": 32280 + }, + { + "epoch": 0.63, + "learning_rate": 7.483592870179799e-08, + "loss": 0.0005, + "step": 32281 + }, + { + "epoch": 0.63, + "learning_rate": 7.483204535746185e-08, + "loss": 0.0006, + "step": 32282 + }, + { + "epoch": 0.63, + "learning_rate": 7.48281620131257e-08, + "loss": 0.0006, + "step": 32283 + }, + { + "epoch": 0.63, + "learning_rate": 7.482427866878955e-08, + "loss": 0.0005, + "step": 32284 + }, + { + "epoch": 0.63, + "learning_rate": 7.482039532445341e-08, + "loss": 0.001, + "step": 32285 + }, + { + "epoch": 0.63, + "learning_rate": 7.481651198011727e-08, + "loss": 0.0014, + "step": 32286 + }, + { + "epoch": 0.63, + "learning_rate": 7.481262863578113e-08, + "loss": 0.0004, + "step": 32287 + }, + { + "epoch": 0.63, + "learning_rate": 7.480874529144499e-08, + "loss": 0.0018, + "step": 32288 + }, + { + "epoch": 0.63, + "learning_rate": 7.480486194710884e-08, + "loss": 0.0009, + "step": 32289 + }, + { + "epoch": 0.63, + "learning_rate": 7.48009786027727e-08, + "loss": 0.0004, + "step": 32290 + }, + { + "epoch": 0.63, + "learning_rate": 7.479709525843656e-08, + "loss": 0.0005, + "step": 32291 + }, + { + "epoch": 0.63, + "learning_rate": 7.479321191410042e-08, + "loss": 0.0005, + "step": 32292 + }, + { + "epoch": 0.63, + "learning_rate": 7.478932856976428e-08, + "loss": 0.7224, + "step": 32293 + }, + { + "epoch": 0.63, + "learning_rate": 7.478544522542813e-08, + "loss": 0.0004, + "step": 32294 + }, + { + "epoch": 0.63, + "learning_rate": 7.478156188109199e-08, + "loss": 0.0004, + "step": 32295 + }, + { + "epoch": 0.63, + "learning_rate": 7.477767853675585e-08, + "loss": 0.0007, + "step": 32296 + }, + { + "epoch": 0.63, + "learning_rate": 7.477379519241971e-08, + "loss": 0.0006, + "step": 32297 + }, + { + "epoch": 0.63, + "learning_rate": 7.476991184808357e-08, + "loss": 0.0004, + "step": 32298 + }, + { + "epoch": 0.63, + "learning_rate": 7.476602850374743e-08, + "loss": 0.0006, + "step": 32299 + }, + { + "epoch": 0.63, + "learning_rate": 7.476214515941128e-08, + "loss": 0.0009, + "step": 32300 + }, + { + "epoch": 0.63, + "learning_rate": 7.475826181507514e-08, + "loss": 0.0004, + "step": 32301 + }, + { + "epoch": 0.63, + "learning_rate": 7.4754378470739e-08, + "loss": 0.0004, + "step": 32302 + }, + { + "epoch": 0.63, + "learning_rate": 7.475049512640286e-08, + "loss": 0.0006, + "step": 32303 + }, + { + "epoch": 0.63, + "learning_rate": 7.474661178206672e-08, + "loss": 0.0005, + "step": 32304 + }, + { + "epoch": 0.63, + "learning_rate": 7.474272843773058e-08, + "loss": 1.3111, + "step": 32305 + }, + { + "epoch": 0.63, + "learning_rate": 7.473884509339443e-08, + "loss": 0.0005, + "step": 32306 + }, + { + "epoch": 0.63, + "learning_rate": 7.473496174905829e-08, + "loss": 0.0008, + "step": 32307 + }, + { + "epoch": 0.63, + "learning_rate": 7.473107840472215e-08, + "loss": 0.0005, + "step": 32308 + }, + { + "epoch": 0.63, + "learning_rate": 7.472719506038601e-08, + "loss": 0.0007, + "step": 32309 + }, + { + "epoch": 0.63, + "learning_rate": 7.472331171604987e-08, + "loss": 0.0004, + "step": 32310 + }, + { + "epoch": 0.63, + "learning_rate": 7.471942837171372e-08, + "loss": 0.7825, + "step": 32311 + }, + { + "epoch": 0.63, + "learning_rate": 7.471554502737757e-08, + "loss": 0.0003, + "step": 32312 + }, + { + "epoch": 0.63, + "learning_rate": 7.471166168304143e-08, + "loss": 0.0006, + "step": 32313 + }, + { + "epoch": 0.63, + "learning_rate": 7.470777833870529e-08, + "loss": 0.0009, + "step": 32314 + }, + { + "epoch": 0.63, + "learning_rate": 7.470389499436914e-08, + "loss": 0.0005, + "step": 32315 + }, + { + "epoch": 0.63, + "learning_rate": 7.4700011650033e-08, + "loss": 0.0004, + "step": 32316 + }, + { + "epoch": 0.63, + "learning_rate": 7.469612830569686e-08, + "loss": 0.0005, + "step": 32317 + }, + { + "epoch": 0.63, + "learning_rate": 7.469224496136072e-08, + "loss": 0.3338, + "step": 32318 + }, + { + "epoch": 0.63, + "learning_rate": 7.468836161702458e-08, + "loss": 0.0007, + "step": 32319 + }, + { + "epoch": 0.63, + "learning_rate": 7.468447827268844e-08, + "loss": 0.0004, + "step": 32320 + }, + { + "epoch": 0.63, + "learning_rate": 7.46805949283523e-08, + "loss": 0.0003, + "step": 32321 + }, + { + "epoch": 0.63, + "learning_rate": 7.467671158401615e-08, + "loss": 0.0004, + "step": 32322 + }, + { + "epoch": 0.63, + "learning_rate": 7.467282823968001e-08, + "loss": 0.0003, + "step": 32323 + }, + { + "epoch": 0.63, + "learning_rate": 7.466894489534387e-08, + "loss": 0.0006, + "step": 32324 + }, + { + "epoch": 0.63, + "learning_rate": 7.466506155100773e-08, + "loss": 0.0003, + "step": 32325 + }, + { + "epoch": 0.63, + "learning_rate": 7.466117820667159e-08, + "loss": 0.0003, + "step": 32326 + }, + { + "epoch": 0.63, + "learning_rate": 7.465729486233544e-08, + "loss": 0.0016, + "step": 32327 + }, + { + "epoch": 0.63, + "learning_rate": 7.46534115179993e-08, + "loss": 0.003, + "step": 32328 + }, + { + "epoch": 0.63, + "learning_rate": 7.464952817366316e-08, + "loss": 1.1354, + "step": 32329 + }, + { + "epoch": 0.63, + "learning_rate": 7.464564482932702e-08, + "loss": 0.0006, + "step": 32330 + }, + { + "epoch": 0.63, + "learning_rate": 7.464176148499088e-08, + "loss": 0.0005, + "step": 32331 + }, + { + "epoch": 0.63, + "learning_rate": 7.463787814065473e-08, + "loss": 0.0004, + "step": 32332 + }, + { + "epoch": 0.63, + "learning_rate": 7.463399479631859e-08, + "loss": 0.0004, + "step": 32333 + }, + { + "epoch": 0.63, + "learning_rate": 7.463011145198245e-08, + "loss": 0.0015, + "step": 32334 + }, + { + "epoch": 0.63, + "learning_rate": 7.462622810764631e-08, + "loss": 0.4651, + "step": 32335 + }, + { + "epoch": 0.63, + "learning_rate": 7.462234476331017e-08, + "loss": 0.0004, + "step": 32336 + }, + { + "epoch": 0.63, + "learning_rate": 7.461846141897403e-08, + "loss": 0.0005, + "step": 32337 + }, + { + "epoch": 0.63, + "learning_rate": 7.461457807463788e-08, + "loss": 0.0005, + "step": 32338 + }, + { + "epoch": 0.63, + "learning_rate": 7.461069473030174e-08, + "loss": 0.0003, + "step": 32339 + }, + { + "epoch": 0.63, + "learning_rate": 7.46068113859656e-08, + "loss": 0.0004, + "step": 32340 + }, + { + "epoch": 0.63, + "learning_rate": 7.460292804162945e-08, + "loss": 0.0174, + "step": 32341 + }, + { + "epoch": 0.63, + "learning_rate": 7.45990446972933e-08, + "loss": 0.0026, + "step": 32342 + }, + { + "epoch": 0.63, + "learning_rate": 7.459516135295716e-08, + "loss": 0.0004, + "step": 32343 + }, + { + "epoch": 0.63, + "learning_rate": 7.459127800862102e-08, + "loss": 0.1925, + "step": 32344 + }, + { + "epoch": 0.63, + "learning_rate": 7.458739466428488e-08, + "loss": 0.0003, + "step": 32345 + }, + { + "epoch": 0.63, + "learning_rate": 7.458351131994874e-08, + "loss": 0.0004, + "step": 32346 + }, + { + "epoch": 0.63, + "learning_rate": 7.45796279756126e-08, + "loss": 0.0005, + "step": 32347 + }, + { + "epoch": 0.63, + "learning_rate": 7.457574463127645e-08, + "loss": 1.1904, + "step": 32348 + }, + { + "epoch": 0.63, + "learning_rate": 7.457186128694031e-08, + "loss": 0.0003, + "step": 32349 + }, + { + "epoch": 0.63, + "learning_rate": 7.456797794260417e-08, + "loss": 0.0007, + "step": 32350 + }, + { + "epoch": 0.63, + "learning_rate": 7.456409459826803e-08, + "loss": 0.0006, + "step": 32351 + }, + { + "epoch": 0.63, + "learning_rate": 7.456021125393189e-08, + "loss": 0.0007, + "step": 32352 + }, + { + "epoch": 0.63, + "learning_rate": 7.455632790959574e-08, + "loss": 0.1849, + "step": 32353 + }, + { + "epoch": 0.63, + "learning_rate": 7.45524445652596e-08, + "loss": 0.0007, + "step": 32354 + }, + { + "epoch": 0.63, + "learning_rate": 7.454856122092346e-08, + "loss": 0.1681, + "step": 32355 + }, + { + "epoch": 0.63, + "learning_rate": 7.454467787658732e-08, + "loss": 0.0005, + "step": 32356 + }, + { + "epoch": 0.63, + "learning_rate": 7.454079453225118e-08, + "loss": 0.0029, + "step": 32357 + }, + { + "epoch": 0.63, + "learning_rate": 7.453691118791504e-08, + "loss": 0.0004, + "step": 32358 + }, + { + "epoch": 0.63, + "learning_rate": 7.45330278435789e-08, + "loss": 0.0025, + "step": 32359 + }, + { + "epoch": 0.63, + "learning_rate": 7.452914449924275e-08, + "loss": 0.0005, + "step": 32360 + }, + { + "epoch": 0.63, + "learning_rate": 7.452526115490661e-08, + "loss": 0.0034, + "step": 32361 + }, + { + "epoch": 0.63, + "learning_rate": 7.452137781057047e-08, + "loss": 0.0004, + "step": 32362 + }, + { + "epoch": 0.63, + "learning_rate": 7.451749446623433e-08, + "loss": 0.0004, + "step": 32363 + }, + { + "epoch": 0.63, + "learning_rate": 7.451361112189819e-08, + "loss": 0.0005, + "step": 32364 + }, + { + "epoch": 0.63, + "learning_rate": 7.450972777756203e-08, + "loss": 0.0005, + "step": 32365 + }, + { + "epoch": 0.63, + "learning_rate": 7.450584443322589e-08, + "loss": 0.0006, + "step": 32366 + }, + { + "epoch": 0.63, + "learning_rate": 7.450196108888975e-08, + "loss": 0.0005, + "step": 32367 + }, + { + "epoch": 0.63, + "learning_rate": 7.44980777445536e-08, + "loss": 1.4791, + "step": 32368 + }, + { + "epoch": 0.63, + "learning_rate": 7.449419440021746e-08, + "loss": 0.0333, + "step": 32369 + }, + { + "epoch": 0.63, + "learning_rate": 7.449031105588132e-08, + "loss": 0.0003, + "step": 32370 + }, + { + "epoch": 0.63, + "learning_rate": 7.448642771154518e-08, + "loss": 0.0222, + "step": 32371 + }, + { + "epoch": 0.63, + "learning_rate": 7.448254436720904e-08, + "loss": 0.0005, + "step": 32372 + }, + { + "epoch": 0.63, + "learning_rate": 7.44786610228729e-08, + "loss": 0.0004, + "step": 32373 + }, + { + "epoch": 0.63, + "learning_rate": 7.447477767853675e-08, + "loss": 0.0005, + "step": 32374 + }, + { + "epoch": 0.63, + "learning_rate": 7.447089433420061e-08, + "loss": 0.3331, + "step": 32375 + }, + { + "epoch": 0.63, + "learning_rate": 7.446701098986447e-08, + "loss": 0.0007, + "step": 32376 + }, + { + "epoch": 0.63, + "learning_rate": 7.446312764552833e-08, + "loss": 0.0005, + "step": 32377 + }, + { + "epoch": 0.63, + "learning_rate": 7.445924430119219e-08, + "loss": 0.0004, + "step": 32378 + }, + { + "epoch": 0.63, + "learning_rate": 7.445536095685603e-08, + "loss": 0.0008, + "step": 32379 + }, + { + "epoch": 0.63, + "learning_rate": 7.445147761251989e-08, + "loss": 0.0005, + "step": 32380 + }, + { + "epoch": 0.63, + "learning_rate": 7.444759426818375e-08, + "loss": 0.0005, + "step": 32381 + }, + { + "epoch": 0.63, + "learning_rate": 7.444371092384761e-08, + "loss": 0.0007, + "step": 32382 + }, + { + "epoch": 0.63, + "learning_rate": 7.443982757951147e-08, + "loss": 0.0004, + "step": 32383 + }, + { + "epoch": 0.63, + "learning_rate": 7.443594423517532e-08, + "loss": 0.0016, + "step": 32384 + }, + { + "epoch": 0.63, + "learning_rate": 7.443206089083918e-08, + "loss": 0.0003, + "step": 32385 + }, + { + "epoch": 0.63, + "learning_rate": 7.442817754650304e-08, + "loss": 0.0013, + "step": 32386 + }, + { + "epoch": 0.63, + "learning_rate": 7.44242942021669e-08, + "loss": 0.6385, + "step": 32387 + }, + { + "epoch": 0.63, + "learning_rate": 7.442041085783076e-08, + "loss": 2.3167, + "step": 32388 + }, + { + "epoch": 0.63, + "learning_rate": 7.441652751349462e-08, + "loss": 0.0004, + "step": 32389 + }, + { + "epoch": 0.63, + "learning_rate": 7.441264416915847e-08, + "loss": 0.0004, + "step": 32390 + }, + { + "epoch": 0.63, + "learning_rate": 7.440876082482233e-08, + "loss": 0.0004, + "step": 32391 + }, + { + "epoch": 0.63, + "learning_rate": 7.440487748048619e-08, + "loss": 0.0008, + "step": 32392 + }, + { + "epoch": 0.63, + "learning_rate": 7.440099413615005e-08, + "loss": 0.0004, + "step": 32393 + }, + { + "epoch": 0.63, + "learning_rate": 7.43971107918139e-08, + "loss": 0.0059, + "step": 32394 + }, + { + "epoch": 0.63, + "learning_rate": 7.439322744747776e-08, + "loss": 0.0004, + "step": 32395 + }, + { + "epoch": 0.63, + "learning_rate": 7.438934410314162e-08, + "loss": 0.0006, + "step": 32396 + }, + { + "epoch": 0.63, + "learning_rate": 7.438546075880548e-08, + "loss": 0.0004, + "step": 32397 + }, + { + "epoch": 0.63, + "learning_rate": 7.438157741446934e-08, + "loss": 0.2518, + "step": 32398 + }, + { + "epoch": 0.63, + "learning_rate": 7.437769407013318e-08, + "loss": 0.012, + "step": 32399 + }, + { + "epoch": 0.63, + "learning_rate": 7.437381072579704e-08, + "loss": 0.0005, + "step": 32400 + }, + { + "epoch": 0.63, + "learning_rate": 7.43699273814609e-08, + "loss": 0.8659, + "step": 32401 + }, + { + "epoch": 0.63, + "learning_rate": 7.436604403712476e-08, + "loss": 0.0008, + "step": 32402 + }, + { + "epoch": 0.63, + "learning_rate": 7.436216069278862e-08, + "loss": 0.0005, + "step": 32403 + }, + { + "epoch": 0.63, + "learning_rate": 7.435827734845248e-08, + "loss": 0.0004, + "step": 32404 + }, + { + "epoch": 0.63, + "learning_rate": 7.435439400411633e-08, + "loss": 0.0006, + "step": 32405 + }, + { + "epoch": 0.63, + "learning_rate": 7.435051065978019e-08, + "loss": 0.0004, + "step": 32406 + }, + { + "epoch": 0.63, + "learning_rate": 7.434662731544405e-08, + "loss": 0.0003, + "step": 32407 + }, + { + "epoch": 0.63, + "learning_rate": 7.434274397110791e-08, + "loss": 0.0008, + "step": 32408 + }, + { + "epoch": 0.63, + "learning_rate": 7.433886062677177e-08, + "loss": 0.0005, + "step": 32409 + }, + { + "epoch": 0.63, + "learning_rate": 7.433497728243562e-08, + "loss": 0.0009, + "step": 32410 + }, + { + "epoch": 0.63, + "learning_rate": 7.433109393809948e-08, + "loss": 0.0003, + "step": 32411 + }, + { + "epoch": 0.63, + "learning_rate": 7.432721059376334e-08, + "loss": 0.0067, + "step": 32412 + }, + { + "epoch": 0.63, + "learning_rate": 7.43233272494272e-08, + "loss": 0.0004, + "step": 32413 + }, + { + "epoch": 0.63, + "learning_rate": 7.431944390509106e-08, + "loss": 0.0011, + "step": 32414 + }, + { + "epoch": 0.63, + "learning_rate": 7.431556056075492e-08, + "loss": 0.0003, + "step": 32415 + }, + { + "epoch": 0.63, + "learning_rate": 7.431167721641877e-08, + "loss": 0.0027, + "step": 32416 + }, + { + "epoch": 0.63, + "learning_rate": 7.430779387208263e-08, + "loss": 0.0004, + "step": 32417 + }, + { + "epoch": 0.63, + "learning_rate": 7.430391052774649e-08, + "loss": 0.0015, + "step": 32418 + }, + { + "epoch": 0.63, + "learning_rate": 7.430002718341035e-08, + "loss": 1.1269, + "step": 32419 + }, + { + "epoch": 0.63, + "learning_rate": 7.429614383907421e-08, + "loss": 0.0004, + "step": 32420 + }, + { + "epoch": 0.63, + "learning_rate": 7.429226049473807e-08, + "loss": 0.0005, + "step": 32421 + }, + { + "epoch": 0.63, + "learning_rate": 7.428837715040192e-08, + "loss": 0.0005, + "step": 32422 + }, + { + "epoch": 0.63, + "learning_rate": 7.428449380606578e-08, + "loss": 0.0005, + "step": 32423 + }, + { + "epoch": 0.63, + "learning_rate": 7.428061046172964e-08, + "loss": 0.0004, + "step": 32424 + }, + { + "epoch": 0.63, + "learning_rate": 7.42767271173935e-08, + "loss": 0.0004, + "step": 32425 + }, + { + "epoch": 0.63, + "learning_rate": 7.427284377305736e-08, + "loss": 0.0006, + "step": 32426 + }, + { + "epoch": 0.63, + "learning_rate": 7.426896042872122e-08, + "loss": 0.0004, + "step": 32427 + }, + { + "epoch": 0.63, + "learning_rate": 7.426507708438506e-08, + "loss": 0.0006, + "step": 32428 + }, + { + "epoch": 0.63, + "learning_rate": 7.426119374004892e-08, + "loss": 0.0006, + "step": 32429 + }, + { + "epoch": 0.63, + "learning_rate": 7.425731039571278e-08, + "loss": 0.1101, + "step": 32430 + }, + { + "epoch": 0.63, + "learning_rate": 7.425342705137663e-08, + "loss": 0.0007, + "step": 32431 + }, + { + "epoch": 0.63, + "learning_rate": 7.424954370704049e-08, + "loss": 0.0011, + "step": 32432 + }, + { + "epoch": 0.63, + "learning_rate": 7.424566036270435e-08, + "loss": 0.0005, + "step": 32433 + }, + { + "epoch": 0.63, + "learning_rate": 7.424177701836821e-08, + "loss": 0.0021, + "step": 32434 + }, + { + "epoch": 0.63, + "learning_rate": 7.423789367403207e-08, + "loss": 0.0004, + "step": 32435 + }, + { + "epoch": 0.63, + "learning_rate": 7.423401032969593e-08, + "loss": 0.0004, + "step": 32436 + }, + { + "epoch": 0.63, + "learning_rate": 7.423012698535978e-08, + "loss": 0.0003, + "step": 32437 + }, + { + "epoch": 0.63, + "learning_rate": 7.422624364102364e-08, + "loss": 0.0003, + "step": 32438 + }, + { + "epoch": 0.63, + "learning_rate": 7.42223602966875e-08, + "loss": 0.0009, + "step": 32439 + }, + { + "epoch": 0.63, + "learning_rate": 7.421847695235136e-08, + "loss": 0.0008, + "step": 32440 + }, + { + "epoch": 0.63, + "learning_rate": 7.421459360801522e-08, + "loss": 0.1945, + "step": 32441 + }, + { + "epoch": 0.63, + "learning_rate": 7.421071026367908e-08, + "loss": 0.0004, + "step": 32442 + }, + { + "epoch": 0.63, + "learning_rate": 7.420682691934293e-08, + "loss": 0.0004, + "step": 32443 + }, + { + "epoch": 0.63, + "learning_rate": 7.420294357500679e-08, + "loss": 0.3728, + "step": 32444 + }, + { + "epoch": 0.63, + "learning_rate": 7.419906023067065e-08, + "loss": 0.0088, + "step": 32445 + }, + { + "epoch": 0.63, + "learning_rate": 7.419517688633451e-08, + "loss": 0.0006, + "step": 32446 + }, + { + "epoch": 0.63, + "learning_rate": 7.419129354199837e-08, + "loss": 0.0007, + "step": 32447 + }, + { + "epoch": 0.63, + "learning_rate": 7.418741019766223e-08, + "loss": 0.0006, + "step": 32448 + }, + { + "epoch": 0.63, + "learning_rate": 7.418352685332608e-08, + "loss": 0.0004, + "step": 32449 + }, + { + "epoch": 0.63, + "learning_rate": 7.417964350898994e-08, + "loss": 0.0004, + "step": 32450 + }, + { + "epoch": 0.63, + "learning_rate": 7.41757601646538e-08, + "loss": 0.0004, + "step": 32451 + }, + { + "epoch": 0.63, + "learning_rate": 7.417187682031766e-08, + "loss": 0.0004, + "step": 32452 + }, + { + "epoch": 0.63, + "learning_rate": 7.416799347598152e-08, + "loss": 0.0003, + "step": 32453 + }, + { + "epoch": 0.63, + "learning_rate": 7.416411013164537e-08, + "loss": 0.0005, + "step": 32454 + }, + { + "epoch": 0.63, + "learning_rate": 7.416022678730923e-08, + "loss": 0.0006, + "step": 32455 + }, + { + "epoch": 0.63, + "learning_rate": 7.415634344297309e-08, + "loss": 0.0004, + "step": 32456 + }, + { + "epoch": 0.63, + "learning_rate": 7.415246009863694e-08, + "loss": 0.0004, + "step": 32457 + }, + { + "epoch": 0.63, + "learning_rate": 7.41485767543008e-08, + "loss": 0.0003, + "step": 32458 + }, + { + "epoch": 0.63, + "learning_rate": 7.414469340996465e-08, + "loss": 0.0127, + "step": 32459 + }, + { + "epoch": 0.63, + "learning_rate": 7.414081006562851e-08, + "loss": 0.0007, + "step": 32460 + }, + { + "epoch": 0.63, + "learning_rate": 7.413692672129237e-08, + "loss": 0.0006, + "step": 32461 + }, + { + "epoch": 0.63, + "learning_rate": 7.413304337695623e-08, + "loss": 0.0004, + "step": 32462 + }, + { + "epoch": 0.63, + "learning_rate": 7.412916003262009e-08, + "loss": 0.0009, + "step": 32463 + }, + { + "epoch": 0.63, + "learning_rate": 7.412527668828394e-08, + "loss": 0.0004, + "step": 32464 + }, + { + "epoch": 0.63, + "learning_rate": 7.41213933439478e-08, + "loss": 0.0005, + "step": 32465 + }, + { + "epoch": 0.63, + "learning_rate": 7.411750999961166e-08, + "loss": 0.0005, + "step": 32466 + }, + { + "epoch": 0.63, + "learning_rate": 7.411362665527552e-08, + "loss": 0.0005, + "step": 32467 + }, + { + "epoch": 0.63, + "learning_rate": 7.410974331093938e-08, + "loss": 0.0004, + "step": 32468 + }, + { + "epoch": 0.63, + "learning_rate": 7.410585996660323e-08, + "loss": 0.0014, + "step": 32469 + }, + { + "epoch": 0.63, + "learning_rate": 7.410197662226709e-08, + "loss": 0.0006, + "step": 32470 + }, + { + "epoch": 0.63, + "learning_rate": 7.409809327793095e-08, + "loss": 0.0003, + "step": 32471 + }, + { + "epoch": 0.63, + "learning_rate": 7.409420993359481e-08, + "loss": 0.0004, + "step": 32472 + }, + { + "epoch": 0.63, + "learning_rate": 7.409032658925867e-08, + "loss": 0.0005, + "step": 32473 + }, + { + "epoch": 0.63, + "learning_rate": 7.408644324492253e-08, + "loss": 0.0004, + "step": 32474 + }, + { + "epoch": 0.63, + "learning_rate": 7.408255990058638e-08, + "loss": 0.0009, + "step": 32475 + }, + { + "epoch": 0.63, + "learning_rate": 7.407867655625024e-08, + "loss": 0.0005, + "step": 32476 + }, + { + "epoch": 0.63, + "learning_rate": 7.40747932119141e-08, + "loss": 0.0005, + "step": 32477 + }, + { + "epoch": 0.63, + "learning_rate": 7.407090986757796e-08, + "loss": 0.9997, + "step": 32478 + }, + { + "epoch": 0.63, + "learning_rate": 7.406702652324182e-08, + "loss": 0.0007, + "step": 32479 + }, + { + "epoch": 0.63, + "learning_rate": 7.406314317890568e-08, + "loss": 0.0009, + "step": 32480 + }, + { + "epoch": 0.63, + "learning_rate": 7.405925983456953e-08, + "loss": 0.0005, + "step": 32481 + }, + { + "epoch": 0.63, + "learning_rate": 7.405537649023339e-08, + "loss": 0.0011, + "step": 32482 + }, + { + "epoch": 0.63, + "learning_rate": 7.405149314589725e-08, + "loss": 0.0008, + "step": 32483 + }, + { + "epoch": 0.63, + "learning_rate": 7.404760980156111e-08, + "loss": 0.0207, + "step": 32484 + }, + { + "epoch": 0.63, + "learning_rate": 7.404372645722497e-08, + "loss": 0.001, + "step": 32485 + }, + { + "epoch": 0.63, + "learning_rate": 7.403984311288881e-08, + "loss": 0.0005, + "step": 32486 + }, + { + "epoch": 0.63, + "learning_rate": 7.403595976855267e-08, + "loss": 0.0004, + "step": 32487 + }, + { + "epoch": 0.63, + "learning_rate": 7.403207642421653e-08, + "loss": 0.036, + "step": 32488 + }, + { + "epoch": 0.63, + "learning_rate": 7.402819307988039e-08, + "loss": 0.2227, + "step": 32489 + }, + { + "epoch": 0.63, + "learning_rate": 7.402430973554424e-08, + "loss": 0.0378, + "step": 32490 + }, + { + "epoch": 0.63, + "learning_rate": 7.40204263912081e-08, + "loss": 0.0004, + "step": 32491 + }, + { + "epoch": 0.63, + "learning_rate": 7.401654304687196e-08, + "loss": 0.0003, + "step": 32492 + }, + { + "epoch": 0.63, + "learning_rate": 7.401265970253582e-08, + "loss": 0.0005, + "step": 32493 + }, + { + "epoch": 0.63, + "learning_rate": 7.400877635819968e-08, + "loss": 0.007, + "step": 32494 + }, + { + "epoch": 0.63, + "learning_rate": 7.400489301386354e-08, + "loss": 0.0003, + "step": 32495 + }, + { + "epoch": 0.63, + "learning_rate": 7.40010096695274e-08, + "loss": 0.0016, + "step": 32496 + }, + { + "epoch": 0.63, + "learning_rate": 7.399712632519125e-08, + "loss": 0.0005, + "step": 32497 + }, + { + "epoch": 0.63, + "learning_rate": 7.399324298085511e-08, + "loss": 0.0006, + "step": 32498 + }, + { + "epoch": 0.63, + "learning_rate": 7.398935963651897e-08, + "loss": 0.0003, + "step": 32499 + }, + { + "epoch": 0.63, + "learning_rate": 7.398547629218283e-08, + "loss": 0.0003, + "step": 32500 + }, + { + "epoch": 0.63, + "learning_rate": 7.398159294784669e-08, + "loss": 0.001, + "step": 32501 + }, + { + "epoch": 0.63, + "learning_rate": 7.397770960351054e-08, + "loss": 0.0008, + "step": 32502 + }, + { + "epoch": 0.63, + "learning_rate": 7.39738262591744e-08, + "loss": 0.0069, + "step": 32503 + }, + { + "epoch": 0.63, + "learning_rate": 7.396994291483826e-08, + "loss": 0.0004, + "step": 32504 + }, + { + "epoch": 0.63, + "learning_rate": 7.396605957050212e-08, + "loss": 0.067, + "step": 32505 + }, + { + "epoch": 0.63, + "learning_rate": 7.396217622616598e-08, + "loss": 0.0004, + "step": 32506 + }, + { + "epoch": 0.63, + "learning_rate": 7.395829288182983e-08, + "loss": 0.0004, + "step": 32507 + }, + { + "epoch": 0.63, + "learning_rate": 7.395440953749369e-08, + "loss": 0.0006, + "step": 32508 + }, + { + "epoch": 0.63, + "learning_rate": 7.395052619315755e-08, + "loss": 0.0326, + "step": 32509 + }, + { + "epoch": 0.63, + "learning_rate": 7.394664284882141e-08, + "loss": 0.2157, + "step": 32510 + }, + { + "epoch": 0.63, + "learning_rate": 7.394275950448527e-08, + "loss": 0.0003, + "step": 32511 + }, + { + "epoch": 0.63, + "learning_rate": 7.393887616014913e-08, + "loss": 0.0005, + "step": 32512 + }, + { + "epoch": 0.63, + "learning_rate": 7.393499281581298e-08, + "loss": 0.0018, + "step": 32513 + }, + { + "epoch": 0.63, + "learning_rate": 7.393110947147684e-08, + "loss": 0.0005, + "step": 32514 + }, + { + "epoch": 0.63, + "learning_rate": 7.392722612714069e-08, + "loss": 0.0006, + "step": 32515 + }, + { + "epoch": 0.63, + "learning_rate": 7.392334278280455e-08, + "loss": 0.0004, + "step": 32516 + }, + { + "epoch": 0.63, + "learning_rate": 7.39194594384684e-08, + "loss": 0.0013, + "step": 32517 + }, + { + "epoch": 0.63, + "learning_rate": 7.391557609413226e-08, + "loss": 0.0006, + "step": 32518 + }, + { + "epoch": 0.63, + "learning_rate": 7.391169274979612e-08, + "loss": 0.0005, + "step": 32519 + }, + { + "epoch": 0.63, + "learning_rate": 7.390780940545998e-08, + "loss": 0.0004, + "step": 32520 + }, + { + "epoch": 0.63, + "learning_rate": 7.390392606112384e-08, + "loss": 0.0005, + "step": 32521 + }, + { + "epoch": 0.63, + "learning_rate": 7.39000427167877e-08, + "loss": 0.0013, + "step": 32522 + }, + { + "epoch": 0.63, + "learning_rate": 7.389615937245155e-08, + "loss": 0.0004, + "step": 32523 + }, + { + "epoch": 0.63, + "learning_rate": 7.389227602811541e-08, + "loss": 0.0003, + "step": 32524 + }, + { + "epoch": 0.63, + "learning_rate": 7.388839268377927e-08, + "loss": 0.0005, + "step": 32525 + }, + { + "epoch": 0.63, + "learning_rate": 7.388450933944313e-08, + "loss": 0.0004, + "step": 32526 + }, + { + "epoch": 0.63, + "learning_rate": 7.388062599510699e-08, + "loss": 0.0006, + "step": 32527 + }, + { + "epoch": 0.63, + "learning_rate": 7.387674265077084e-08, + "loss": 0.0005, + "step": 32528 + }, + { + "epoch": 0.63, + "learning_rate": 7.38728593064347e-08, + "loss": 0.0089, + "step": 32529 + }, + { + "epoch": 0.63, + "learning_rate": 7.386897596209856e-08, + "loss": 0.0005, + "step": 32530 + }, + { + "epoch": 0.63, + "learning_rate": 7.386509261776242e-08, + "loss": 0.0004, + "step": 32531 + }, + { + "epoch": 0.63, + "learning_rate": 7.386120927342628e-08, + "loss": 0.047, + "step": 32532 + }, + { + "epoch": 0.63, + "learning_rate": 7.385732592909014e-08, + "loss": 0.0005, + "step": 32533 + }, + { + "epoch": 0.63, + "learning_rate": 7.3853442584754e-08, + "loss": 0.0004, + "step": 32534 + }, + { + "epoch": 0.63, + "learning_rate": 7.384955924041785e-08, + "loss": 0.0004, + "step": 32535 + }, + { + "epoch": 0.63, + "learning_rate": 7.384567589608171e-08, + "loss": 0.6108, + "step": 32536 + }, + { + "epoch": 0.63, + "learning_rate": 7.384179255174557e-08, + "loss": 0.0007, + "step": 32537 + }, + { + "epoch": 0.63, + "learning_rate": 7.383790920740943e-08, + "loss": 0.0245, + "step": 32538 + }, + { + "epoch": 0.63, + "learning_rate": 7.383402586307329e-08, + "loss": 0.0003, + "step": 32539 + }, + { + "epoch": 0.63, + "learning_rate": 7.383014251873714e-08, + "loss": 0.0006, + "step": 32540 + }, + { + "epoch": 0.63, + "learning_rate": 7.3826259174401e-08, + "loss": 1.1834, + "step": 32541 + }, + { + "epoch": 0.63, + "learning_rate": 7.382237583006485e-08, + "loss": 0.0005, + "step": 32542 + }, + { + "epoch": 0.63, + "learning_rate": 7.38184924857287e-08, + "loss": 0.0004, + "step": 32543 + }, + { + "epoch": 0.63, + "learning_rate": 7.381460914139256e-08, + "loss": 0.0312, + "step": 32544 + }, + { + "epoch": 0.63, + "learning_rate": 7.381072579705642e-08, + "loss": 0.0006, + "step": 32545 + }, + { + "epoch": 0.63, + "learning_rate": 7.380684245272028e-08, + "loss": 0.0003, + "step": 32546 + }, + { + "epoch": 0.63, + "learning_rate": 7.380295910838414e-08, + "loss": 0.0007, + "step": 32547 + }, + { + "epoch": 0.63, + "learning_rate": 7.3799075764048e-08, + "loss": 0.0004, + "step": 32548 + }, + { + "epoch": 0.63, + "learning_rate": 7.379519241971185e-08, + "loss": 0.0005, + "step": 32549 + }, + { + "epoch": 0.63, + "learning_rate": 7.379130907537571e-08, + "loss": 0.0005, + "step": 32550 + }, + { + "epoch": 0.63, + "learning_rate": 7.378742573103957e-08, + "loss": 0.0006, + "step": 32551 + }, + { + "epoch": 0.63, + "learning_rate": 7.378354238670343e-08, + "loss": 0.0004, + "step": 32552 + }, + { + "epoch": 0.63, + "learning_rate": 7.377965904236729e-08, + "loss": 0.0005, + "step": 32553 + }, + { + "epoch": 0.63, + "learning_rate": 7.377577569803115e-08, + "loss": 0.0004, + "step": 32554 + }, + { + "epoch": 0.63, + "learning_rate": 7.3771892353695e-08, + "loss": 0.0004, + "step": 32555 + }, + { + "epoch": 0.63, + "learning_rate": 7.376800900935885e-08, + "loss": 0.0296, + "step": 32556 + }, + { + "epoch": 0.63, + "learning_rate": 7.376412566502271e-08, + "loss": 0.0005, + "step": 32557 + }, + { + "epoch": 0.63, + "learning_rate": 7.376024232068657e-08, + "loss": 0.0005, + "step": 32558 + }, + { + "epoch": 0.63, + "learning_rate": 7.375635897635042e-08, + "loss": 0.003, + "step": 32559 + }, + { + "epoch": 0.63, + "learning_rate": 7.375247563201428e-08, + "loss": 0.001, + "step": 32560 + }, + { + "epoch": 0.63, + "learning_rate": 7.374859228767814e-08, + "loss": 0.0003, + "step": 32561 + }, + { + "epoch": 0.63, + "learning_rate": 7.3744708943342e-08, + "loss": 0.0005, + "step": 32562 + }, + { + "epoch": 0.63, + "learning_rate": 7.374082559900586e-08, + "loss": 0.0005, + "step": 32563 + }, + { + "epoch": 0.63, + "learning_rate": 7.373694225466972e-08, + "loss": 0.0005, + "step": 32564 + }, + { + "epoch": 0.63, + "learning_rate": 7.373305891033357e-08, + "loss": 0.0005, + "step": 32565 + }, + { + "epoch": 0.63, + "learning_rate": 7.372917556599743e-08, + "loss": 0.0003, + "step": 32566 + }, + { + "epoch": 0.63, + "learning_rate": 7.372529222166129e-08, + "loss": 0.0006, + "step": 32567 + }, + { + "epoch": 0.63, + "learning_rate": 7.372140887732515e-08, + "loss": 0.0005, + "step": 32568 + }, + { + "epoch": 0.63, + "learning_rate": 7.3717525532989e-08, + "loss": 0.0073, + "step": 32569 + }, + { + "epoch": 0.63, + "learning_rate": 7.371364218865286e-08, + "loss": 0.0006, + "step": 32570 + }, + { + "epoch": 0.63, + "learning_rate": 7.370975884431672e-08, + "loss": 0.0019, + "step": 32571 + }, + { + "epoch": 0.63, + "learning_rate": 7.370587549998058e-08, + "loss": 0.0004, + "step": 32572 + }, + { + "epoch": 0.63, + "learning_rate": 7.370199215564443e-08, + "loss": 0.1797, + "step": 32573 + }, + { + "epoch": 0.63, + "learning_rate": 7.369810881130828e-08, + "loss": 0.1325, + "step": 32574 + }, + { + "epoch": 0.63, + "learning_rate": 7.369422546697214e-08, + "loss": 0.0004, + "step": 32575 + }, + { + "epoch": 0.63, + "learning_rate": 7.3690342122636e-08, + "loss": 0.0005, + "step": 32576 + }, + { + "epoch": 0.63, + "learning_rate": 7.368645877829986e-08, + "loss": 0.0006, + "step": 32577 + }, + { + "epoch": 0.63, + "learning_rate": 7.368257543396372e-08, + "loss": 0.0006, + "step": 32578 + }, + { + "epoch": 0.63, + "learning_rate": 7.367869208962758e-08, + "loss": 0.0007, + "step": 32579 + }, + { + "epoch": 0.63, + "learning_rate": 7.367480874529143e-08, + "loss": 1.1455, + "step": 32580 + }, + { + "epoch": 0.63, + "learning_rate": 7.367092540095529e-08, + "loss": 0.0004, + "step": 32581 + }, + { + "epoch": 0.63, + "learning_rate": 7.366704205661915e-08, + "loss": 0.001, + "step": 32582 + }, + { + "epoch": 0.63, + "learning_rate": 7.366315871228301e-08, + "loss": 0.0005, + "step": 32583 + }, + { + "epoch": 0.63, + "learning_rate": 7.365927536794687e-08, + "loss": 0.0008, + "step": 32584 + }, + { + "epoch": 0.63, + "learning_rate": 7.365539202361073e-08, + "loss": 0.0004, + "step": 32585 + }, + { + "epoch": 0.63, + "learning_rate": 7.365150867927458e-08, + "loss": 0.0008, + "step": 32586 + }, + { + "epoch": 0.63, + "learning_rate": 7.364762533493844e-08, + "loss": 1.3933, + "step": 32587 + }, + { + "epoch": 0.63, + "learning_rate": 7.36437419906023e-08, + "loss": 0.0003, + "step": 32588 + }, + { + "epoch": 0.63, + "learning_rate": 7.363985864626616e-08, + "loss": 0.0005, + "step": 32589 + }, + { + "epoch": 0.63, + "learning_rate": 7.363597530193002e-08, + "loss": 0.0004, + "step": 32590 + }, + { + "epoch": 0.63, + "learning_rate": 7.363209195759387e-08, + "loss": 0.0005, + "step": 32591 + }, + { + "epoch": 0.63, + "learning_rate": 7.362820861325773e-08, + "loss": 0.0004, + "step": 32592 + }, + { + "epoch": 0.63, + "learning_rate": 7.362432526892159e-08, + "loss": 0.0006, + "step": 32593 + }, + { + "epoch": 0.63, + "learning_rate": 7.362044192458545e-08, + "loss": 0.0008, + "step": 32594 + }, + { + "epoch": 0.63, + "learning_rate": 7.361655858024931e-08, + "loss": 0.0003, + "step": 32595 + }, + { + "epoch": 0.63, + "learning_rate": 7.361267523591317e-08, + "loss": 0.0005, + "step": 32596 + }, + { + "epoch": 0.63, + "learning_rate": 7.360879189157702e-08, + "loss": 0.2104, + "step": 32597 + }, + { + "epoch": 0.63, + "learning_rate": 7.360490854724088e-08, + "loss": 0.0004, + "step": 32598 + }, + { + "epoch": 0.63, + "learning_rate": 7.360102520290474e-08, + "loss": 0.0007, + "step": 32599 + }, + { + "epoch": 0.63, + "learning_rate": 7.35971418585686e-08, + "loss": 0.0005, + "step": 32600 + }, + { + "epoch": 0.63, + "learning_rate": 7.359325851423246e-08, + "loss": 0.0513, + "step": 32601 + }, + { + "epoch": 0.63, + "learning_rate": 7.35893751698963e-08, + "loss": 0.0004, + "step": 32602 + }, + { + "epoch": 0.63, + "learning_rate": 7.358549182556016e-08, + "loss": 0.0004, + "step": 32603 + }, + { + "epoch": 0.63, + "learning_rate": 7.358160848122402e-08, + "loss": 0.2285, + "step": 32604 + }, + { + "epoch": 0.63, + "learning_rate": 7.357772513688788e-08, + "loss": 0.0027, + "step": 32605 + }, + { + "epoch": 0.63, + "learning_rate": 7.357384179255174e-08, + "loss": 0.0004, + "step": 32606 + }, + { + "epoch": 0.63, + "learning_rate": 7.356995844821559e-08, + "loss": 0.0008, + "step": 32607 + }, + { + "epoch": 0.63, + "learning_rate": 7.356607510387945e-08, + "loss": 0.0005, + "step": 32608 + }, + { + "epoch": 0.63, + "learning_rate": 7.356219175954331e-08, + "loss": 0.0005, + "step": 32609 + }, + { + "epoch": 0.63, + "learning_rate": 7.355830841520717e-08, + "loss": 0.0007, + "step": 32610 + }, + { + "epoch": 0.63, + "learning_rate": 7.355442507087103e-08, + "loss": 0.0005, + "step": 32611 + }, + { + "epoch": 0.63, + "learning_rate": 7.355054172653488e-08, + "loss": 0.0006, + "step": 32612 + }, + { + "epoch": 0.63, + "learning_rate": 7.354665838219874e-08, + "loss": 0.0008, + "step": 32613 + }, + { + "epoch": 0.63, + "learning_rate": 7.35427750378626e-08, + "loss": 0.0005, + "step": 32614 + }, + { + "epoch": 0.63, + "learning_rate": 7.353889169352646e-08, + "loss": 0.0004, + "step": 32615 + }, + { + "epoch": 0.63, + "learning_rate": 7.353500834919032e-08, + "loss": 0.0005, + "step": 32616 + }, + { + "epoch": 0.63, + "learning_rate": 7.353112500485418e-08, + "loss": 0.0004, + "step": 32617 + }, + { + "epoch": 0.63, + "learning_rate": 7.352724166051803e-08, + "loss": 0.0005, + "step": 32618 + }, + { + "epoch": 0.63, + "learning_rate": 7.352335831618189e-08, + "loss": 0.0004, + "step": 32619 + }, + { + "epoch": 0.63, + "learning_rate": 7.351947497184575e-08, + "loss": 0.0004, + "step": 32620 + }, + { + "epoch": 0.63, + "learning_rate": 7.351559162750961e-08, + "loss": 0.0031, + "step": 32621 + }, + { + "epoch": 0.63, + "learning_rate": 7.351170828317347e-08, + "loss": 0.0005, + "step": 32622 + }, + { + "epoch": 0.63, + "learning_rate": 7.350782493883733e-08, + "loss": 0.0003, + "step": 32623 + }, + { + "epoch": 0.63, + "learning_rate": 7.350394159450118e-08, + "loss": 0.0004, + "step": 32624 + }, + { + "epoch": 0.63, + "learning_rate": 7.350005825016504e-08, + "loss": 0.0005, + "step": 32625 + }, + { + "epoch": 0.63, + "learning_rate": 7.34961749058289e-08, + "loss": 0.0012, + "step": 32626 + }, + { + "epoch": 0.63, + "learning_rate": 7.349229156149276e-08, + "loss": 0.0004, + "step": 32627 + }, + { + "epoch": 0.63, + "learning_rate": 7.348840821715662e-08, + "loss": 0.0006, + "step": 32628 + }, + { + "epoch": 0.63, + "learning_rate": 7.348452487282047e-08, + "loss": 0.0004, + "step": 32629 + }, + { + "epoch": 0.63, + "learning_rate": 7.348064152848433e-08, + "loss": 0.0004, + "step": 32630 + }, + { + "epoch": 0.63, + "learning_rate": 7.347675818414818e-08, + "loss": 0.0004, + "step": 32631 + }, + { + "epoch": 0.63, + "learning_rate": 7.347287483981204e-08, + "loss": 0.087, + "step": 32632 + }, + { + "epoch": 0.63, + "learning_rate": 7.34689914954759e-08, + "loss": 0.0009, + "step": 32633 + }, + { + "epoch": 0.63, + "learning_rate": 7.346510815113975e-08, + "loss": 0.0013, + "step": 32634 + }, + { + "epoch": 0.63, + "learning_rate": 7.346122480680361e-08, + "loss": 0.0006, + "step": 32635 + }, + { + "epoch": 0.63, + "learning_rate": 7.345734146246747e-08, + "loss": 0.0006, + "step": 32636 + }, + { + "epoch": 0.63, + "learning_rate": 7.345345811813133e-08, + "loss": 0.0394, + "step": 32637 + }, + { + "epoch": 0.63, + "learning_rate": 7.344957477379519e-08, + "loss": 0.0005, + "step": 32638 + }, + { + "epoch": 0.63, + "learning_rate": 7.344569142945904e-08, + "loss": 0.06, + "step": 32639 + }, + { + "epoch": 0.63, + "learning_rate": 7.34418080851229e-08, + "loss": 0.0006, + "step": 32640 + }, + { + "epoch": 0.63, + "learning_rate": 7.343792474078676e-08, + "loss": 0.0004, + "step": 32641 + }, + { + "epoch": 0.63, + "learning_rate": 7.343404139645062e-08, + "loss": 0.0005, + "step": 32642 + }, + { + "epoch": 0.63, + "learning_rate": 7.343015805211448e-08, + "loss": 0.0004, + "step": 32643 + }, + { + "epoch": 0.63, + "learning_rate": 7.342627470777834e-08, + "loss": 0.0005, + "step": 32644 + }, + { + "epoch": 0.63, + "learning_rate": 7.342239136344219e-08, + "loss": 0.0004, + "step": 32645 + }, + { + "epoch": 0.63, + "learning_rate": 7.341850801910605e-08, + "loss": 0.0009, + "step": 32646 + }, + { + "epoch": 0.63, + "learning_rate": 7.341462467476991e-08, + "loss": 0.0004, + "step": 32647 + }, + { + "epoch": 0.63, + "learning_rate": 7.341074133043377e-08, + "loss": 0.0004, + "step": 32648 + }, + { + "epoch": 0.63, + "learning_rate": 7.340685798609763e-08, + "loss": 0.0005, + "step": 32649 + }, + { + "epoch": 0.63, + "learning_rate": 7.340297464176148e-08, + "loss": 0.0005, + "step": 32650 + }, + { + "epoch": 0.63, + "learning_rate": 7.339909129742534e-08, + "loss": 0.0048, + "step": 32651 + }, + { + "epoch": 0.63, + "learning_rate": 7.33952079530892e-08, + "loss": 0.0007, + "step": 32652 + }, + { + "epoch": 0.63, + "learning_rate": 7.339132460875306e-08, + "loss": 0.0118, + "step": 32653 + }, + { + "epoch": 0.63, + "learning_rate": 7.338744126441692e-08, + "loss": 0.0005, + "step": 32654 + }, + { + "epoch": 0.63, + "learning_rate": 7.338355792008078e-08, + "loss": 0.0003, + "step": 32655 + }, + { + "epoch": 0.63, + "learning_rate": 7.337967457574463e-08, + "loss": 0.0004, + "step": 32656 + }, + { + "epoch": 0.63, + "learning_rate": 7.337579123140849e-08, + "loss": 0.0111, + "step": 32657 + }, + { + "epoch": 0.63, + "learning_rate": 7.337190788707235e-08, + "loss": 1.1936, + "step": 32658 + }, + { + "epoch": 0.63, + "learning_rate": 7.336802454273621e-08, + "loss": 0.0004, + "step": 32659 + }, + { + "epoch": 0.63, + "learning_rate": 7.336414119840005e-08, + "loss": 0.0005, + "step": 32660 + }, + { + "epoch": 0.63, + "learning_rate": 7.336025785406391e-08, + "loss": 0.0005, + "step": 32661 + }, + { + "epoch": 0.63, + "learning_rate": 7.335637450972777e-08, + "loss": 0.0004, + "step": 32662 + }, + { + "epoch": 0.63, + "learning_rate": 7.335249116539163e-08, + "loss": 0.8897, + "step": 32663 + }, + { + "epoch": 0.63, + "learning_rate": 7.334860782105549e-08, + "loss": 0.0004, + "step": 32664 + }, + { + "epoch": 0.63, + "learning_rate": 7.334472447671934e-08, + "loss": 0.0005, + "step": 32665 + }, + { + "epoch": 0.63, + "learning_rate": 7.33408411323832e-08, + "loss": 0.0007, + "step": 32666 + }, + { + "epoch": 0.63, + "learning_rate": 7.333695778804706e-08, + "loss": 0.0006, + "step": 32667 + }, + { + "epoch": 0.63, + "learning_rate": 7.333307444371092e-08, + "loss": 0.2735, + "step": 32668 + }, + { + "epoch": 0.63, + "learning_rate": 7.332919109937478e-08, + "loss": 0.0008, + "step": 32669 + }, + { + "epoch": 0.63, + "learning_rate": 7.332530775503864e-08, + "loss": 0.0004, + "step": 32670 + }, + { + "epoch": 0.63, + "learning_rate": 7.33214244107025e-08, + "loss": 0.0006, + "step": 32671 + }, + { + "epoch": 0.63, + "learning_rate": 7.331754106636635e-08, + "loss": 0.0005, + "step": 32672 + }, + { + "epoch": 0.63, + "learning_rate": 7.331365772203021e-08, + "loss": 0.0006, + "step": 32673 + }, + { + "epoch": 0.63, + "learning_rate": 7.330977437769407e-08, + "loss": 0.0004, + "step": 32674 + }, + { + "epoch": 0.63, + "learning_rate": 7.330589103335793e-08, + "loss": 0.0004, + "step": 32675 + }, + { + "epoch": 0.63, + "learning_rate": 7.330200768902179e-08, + "loss": 0.0035, + "step": 32676 + }, + { + "epoch": 0.63, + "learning_rate": 7.329812434468564e-08, + "loss": 0.0006, + "step": 32677 + }, + { + "epoch": 0.63, + "learning_rate": 7.32942410003495e-08, + "loss": 0.0006, + "step": 32678 + }, + { + "epoch": 0.63, + "learning_rate": 7.329035765601336e-08, + "loss": 0.0003, + "step": 32679 + }, + { + "epoch": 0.63, + "learning_rate": 7.328647431167722e-08, + "loss": 0.0007, + "step": 32680 + }, + { + "epoch": 0.63, + "learning_rate": 7.328259096734108e-08, + "loss": 0.0055, + "step": 32681 + }, + { + "epoch": 0.63, + "learning_rate": 7.327870762300494e-08, + "loss": 0.0003, + "step": 32682 + }, + { + "epoch": 0.63, + "learning_rate": 7.327482427866879e-08, + "loss": 0.0004, + "step": 32683 + }, + { + "epoch": 0.63, + "learning_rate": 7.327094093433265e-08, + "loss": 0.0007, + "step": 32684 + }, + { + "epoch": 0.63, + "learning_rate": 7.326705758999651e-08, + "loss": 0.8073, + "step": 32685 + }, + { + "epoch": 0.63, + "learning_rate": 7.326317424566037e-08, + "loss": 0.0005, + "step": 32686 + }, + { + "epoch": 0.63, + "learning_rate": 7.325929090132423e-08, + "loss": 0.0005, + "step": 32687 + }, + { + "epoch": 0.63, + "learning_rate": 7.325540755698808e-08, + "loss": 0.0011, + "step": 32688 + }, + { + "epoch": 0.63, + "learning_rate": 7.325152421265193e-08, + "loss": 0.0005, + "step": 32689 + }, + { + "epoch": 0.63, + "learning_rate": 7.324764086831579e-08, + "loss": 0.0006, + "step": 32690 + }, + { + "epoch": 0.63, + "learning_rate": 7.324375752397965e-08, + "loss": 0.0008, + "step": 32691 + }, + { + "epoch": 0.63, + "learning_rate": 7.32398741796435e-08, + "loss": 0.5129, + "step": 32692 + }, + { + "epoch": 0.63, + "learning_rate": 7.323599083530736e-08, + "loss": 1.239, + "step": 32693 + }, + { + "epoch": 0.63, + "learning_rate": 7.323210749097122e-08, + "loss": 0.0004, + "step": 32694 + }, + { + "epoch": 0.63, + "learning_rate": 7.322822414663508e-08, + "loss": 0.0004, + "step": 32695 + }, + { + "epoch": 0.63, + "learning_rate": 7.322434080229894e-08, + "loss": 0.0004, + "step": 32696 + }, + { + "epoch": 0.63, + "learning_rate": 7.32204574579628e-08, + "loss": 0.0005, + "step": 32697 + }, + { + "epoch": 0.63, + "learning_rate": 7.321657411362665e-08, + "loss": 0.001, + "step": 32698 + }, + { + "epoch": 0.63, + "learning_rate": 7.321269076929051e-08, + "loss": 0.0005, + "step": 32699 + }, + { + "epoch": 0.63, + "learning_rate": 7.320880742495437e-08, + "loss": 0.0004, + "step": 32700 + }, + { + "epoch": 0.63, + "learning_rate": 7.320492408061823e-08, + "loss": 0.0005, + "step": 32701 + }, + { + "epoch": 0.63, + "learning_rate": 7.320104073628209e-08, + "loss": 0.0007, + "step": 32702 + }, + { + "epoch": 0.63, + "learning_rate": 7.319715739194594e-08, + "loss": 0.0011, + "step": 32703 + }, + { + "epoch": 0.63, + "learning_rate": 7.31932740476098e-08, + "loss": 0.0017, + "step": 32704 + }, + { + "epoch": 0.63, + "learning_rate": 7.318939070327366e-08, + "loss": 0.0067, + "step": 32705 + }, + { + "epoch": 0.63, + "learning_rate": 7.318550735893752e-08, + "loss": 0.1562, + "step": 32706 + }, + { + "epoch": 0.63, + "learning_rate": 7.318162401460138e-08, + "loss": 0.0006, + "step": 32707 + }, + { + "epoch": 0.63, + "learning_rate": 7.317774067026524e-08, + "loss": 0.0004, + "step": 32708 + }, + { + "epoch": 0.63, + "learning_rate": 7.31738573259291e-08, + "loss": 0.0005, + "step": 32709 + }, + { + "epoch": 0.63, + "learning_rate": 7.316997398159295e-08, + "loss": 0.0003, + "step": 32710 + }, + { + "epoch": 0.63, + "learning_rate": 7.316609063725681e-08, + "loss": 0.0006, + "step": 32711 + }, + { + "epoch": 0.63, + "learning_rate": 7.316220729292067e-08, + "loss": 0.1278, + "step": 32712 + }, + { + "epoch": 0.63, + "learning_rate": 7.315832394858453e-08, + "loss": 0.0009, + "step": 32713 + }, + { + "epoch": 0.63, + "learning_rate": 7.315444060424839e-08, + "loss": 0.0008, + "step": 32714 + }, + { + "epoch": 0.63, + "learning_rate": 7.315055725991224e-08, + "loss": 0.0005, + "step": 32715 + }, + { + "epoch": 0.63, + "learning_rate": 7.31466739155761e-08, + "loss": 0.0004, + "step": 32716 + }, + { + "epoch": 0.63, + "learning_rate": 7.314279057123996e-08, + "loss": 0.0004, + "step": 32717 + }, + { + "epoch": 0.63, + "learning_rate": 7.31389072269038e-08, + "loss": 0.0005, + "step": 32718 + }, + { + "epoch": 0.63, + "learning_rate": 7.313502388256766e-08, + "loss": 1.4313, + "step": 32719 + }, + { + "epoch": 0.63, + "learning_rate": 7.313114053823152e-08, + "loss": 0.5435, + "step": 32720 + }, + { + "epoch": 0.63, + "learning_rate": 7.312725719389538e-08, + "loss": 0.0006, + "step": 32721 + }, + { + "epoch": 0.63, + "learning_rate": 7.312337384955924e-08, + "loss": 1.1022, + "step": 32722 + }, + { + "epoch": 0.63, + "learning_rate": 7.31194905052231e-08, + "loss": 0.0005, + "step": 32723 + }, + { + "epoch": 0.63, + "learning_rate": 7.311560716088695e-08, + "loss": 0.0008, + "step": 32724 + }, + { + "epoch": 0.63, + "learning_rate": 7.311172381655081e-08, + "loss": 0.0005, + "step": 32725 + }, + { + "epoch": 0.63, + "learning_rate": 7.310784047221467e-08, + "loss": 0.0006, + "step": 32726 + }, + { + "epoch": 0.63, + "learning_rate": 7.310395712787853e-08, + "loss": 0.0008, + "step": 32727 + }, + { + "epoch": 0.63, + "learning_rate": 7.310007378354239e-08, + "loss": 0.4266, + "step": 32728 + }, + { + "epoch": 0.63, + "learning_rate": 7.309619043920625e-08, + "loss": 0.0003, + "step": 32729 + }, + { + "epoch": 0.63, + "learning_rate": 7.30923070948701e-08, + "loss": 0.4424, + "step": 32730 + }, + { + "epoch": 0.63, + "learning_rate": 7.308842375053396e-08, + "loss": 0.0822, + "step": 32731 + }, + { + "epoch": 0.63, + "learning_rate": 7.308454040619782e-08, + "loss": 0.0004, + "step": 32732 + }, + { + "epoch": 0.63, + "learning_rate": 7.308065706186167e-08, + "loss": 0.0004, + "step": 32733 + }, + { + "epoch": 0.63, + "learning_rate": 7.307677371752552e-08, + "loss": 0.0006, + "step": 32734 + }, + { + "epoch": 0.63, + "learning_rate": 7.307289037318938e-08, + "loss": 0.9909, + "step": 32735 + }, + { + "epoch": 0.64, + "learning_rate": 7.306900702885324e-08, + "loss": 0.0003, + "step": 32736 + }, + { + "epoch": 0.64, + "learning_rate": 7.30651236845171e-08, + "loss": 0.0005, + "step": 32737 + }, + { + "epoch": 0.64, + "learning_rate": 7.306124034018096e-08, + "loss": 0.0004, + "step": 32738 + }, + { + "epoch": 0.64, + "learning_rate": 7.305735699584482e-08, + "loss": 0.0006, + "step": 32739 + }, + { + "epoch": 0.64, + "learning_rate": 7.305347365150867e-08, + "loss": 0.0004, + "step": 32740 + }, + { + "epoch": 0.64, + "learning_rate": 7.304959030717253e-08, + "loss": 0.001, + "step": 32741 + }, + { + "epoch": 0.64, + "learning_rate": 7.304570696283639e-08, + "loss": 0.4662, + "step": 32742 + }, + { + "epoch": 0.64, + "learning_rate": 7.304182361850025e-08, + "loss": 0.2099, + "step": 32743 + }, + { + "epoch": 0.64, + "learning_rate": 7.30379402741641e-08, + "loss": 0.0006, + "step": 32744 + }, + { + "epoch": 0.64, + "learning_rate": 7.303405692982796e-08, + "loss": 0.1517, + "step": 32745 + }, + { + "epoch": 0.64, + "learning_rate": 7.303017358549182e-08, + "loss": 0.0007, + "step": 32746 + }, + { + "epoch": 0.64, + "learning_rate": 7.302629024115568e-08, + "loss": 0.0007, + "step": 32747 + }, + { + "epoch": 0.64, + "learning_rate": 7.302240689681953e-08, + "loss": 0.0005, + "step": 32748 + }, + { + "epoch": 0.64, + "learning_rate": 7.301852355248338e-08, + "loss": 0.0011, + "step": 32749 + }, + { + "epoch": 0.64, + "learning_rate": 7.301464020814724e-08, + "loss": 0.0017, + "step": 32750 + }, + { + "epoch": 0.64, + "learning_rate": 7.30107568638111e-08, + "loss": 0.0006, + "step": 32751 + }, + { + "epoch": 0.64, + "learning_rate": 7.300687351947496e-08, + "loss": 0.0004, + "step": 32752 + }, + { + "epoch": 0.64, + "learning_rate": 7.300299017513882e-08, + "loss": 0.0006, + "step": 32753 + }, + { + "epoch": 0.64, + "learning_rate": 7.299910683080268e-08, + "loss": 0.0005, + "step": 32754 + }, + { + "epoch": 0.64, + "learning_rate": 7.299522348646653e-08, + "loss": 0.0005, + "step": 32755 + }, + { + "epoch": 0.64, + "learning_rate": 7.299134014213039e-08, + "loss": 0.0006, + "step": 32756 + }, + { + "epoch": 0.64, + "learning_rate": 7.298745679779425e-08, + "loss": 0.0648, + "step": 32757 + }, + { + "epoch": 0.64, + "learning_rate": 7.298357345345811e-08, + "loss": 0.0005, + "step": 32758 + }, + { + "epoch": 0.64, + "learning_rate": 7.297969010912197e-08, + "loss": 0.0004, + "step": 32759 + }, + { + "epoch": 0.64, + "learning_rate": 7.297580676478583e-08, + "loss": 0.0005, + "step": 32760 + }, + { + "epoch": 0.64, + "learning_rate": 7.297192342044968e-08, + "loss": 0.0004, + "step": 32761 + }, + { + "epoch": 0.64, + "learning_rate": 7.296804007611354e-08, + "loss": 0.0004, + "step": 32762 + }, + { + "epoch": 0.64, + "learning_rate": 7.29641567317774e-08, + "loss": 0.0004, + "step": 32763 + }, + { + "epoch": 0.64, + "learning_rate": 7.296027338744126e-08, + "loss": 0.0075, + "step": 32764 + }, + { + "epoch": 0.64, + "learning_rate": 7.295639004310512e-08, + "loss": 0.0003, + "step": 32765 + }, + { + "epoch": 0.64, + "learning_rate": 7.295250669876897e-08, + "loss": 0.8888, + "step": 32766 + }, + { + "epoch": 0.64, + "learning_rate": 7.294862335443283e-08, + "loss": 0.6166, + "step": 32767 + }, + { + "epoch": 0.64, + "learning_rate": 7.294474001009669e-08, + "loss": 0.0006, + "step": 32768 + }, + { + "epoch": 0.64, + "learning_rate": 7.294085666576055e-08, + "loss": 0.0527, + "step": 32769 + }, + { + "epoch": 0.64, + "learning_rate": 7.293697332142441e-08, + "loss": 0.0006, + "step": 32770 + }, + { + "epoch": 0.64, + "learning_rate": 7.293308997708827e-08, + "loss": 0.0004, + "step": 32771 + }, + { + "epoch": 0.64, + "learning_rate": 7.292920663275212e-08, + "loss": 0.0005, + "step": 32772 + }, + { + "epoch": 0.64, + "learning_rate": 7.292532328841598e-08, + "loss": 0.0005, + "step": 32773 + }, + { + "epoch": 0.64, + "learning_rate": 7.292143994407984e-08, + "loss": 0.0326, + "step": 32774 + }, + { + "epoch": 0.64, + "learning_rate": 7.29175565997437e-08, + "loss": 0.4992, + "step": 32775 + }, + { + "epoch": 0.64, + "learning_rate": 7.291367325540754e-08, + "loss": 0.0013, + "step": 32776 + }, + { + "epoch": 0.64, + "learning_rate": 7.29097899110714e-08, + "loss": 0.0007, + "step": 32777 + }, + { + "epoch": 0.64, + "learning_rate": 7.290590656673526e-08, + "loss": 0.0232, + "step": 32778 + }, + { + "epoch": 0.64, + "learning_rate": 7.290202322239912e-08, + "loss": 0.0006, + "step": 32779 + }, + { + "epoch": 0.64, + "learning_rate": 7.289813987806298e-08, + "loss": 1.013, + "step": 32780 + }, + { + "epoch": 0.64, + "learning_rate": 7.289425653372684e-08, + "loss": 0.0005, + "step": 32781 + }, + { + "epoch": 0.64, + "learning_rate": 7.289037318939069e-08, + "loss": 0.0023, + "step": 32782 + }, + { + "epoch": 0.64, + "learning_rate": 7.288648984505455e-08, + "loss": 0.0783, + "step": 32783 + }, + { + "epoch": 0.64, + "learning_rate": 7.288260650071841e-08, + "loss": 0.0007, + "step": 32784 + }, + { + "epoch": 0.64, + "learning_rate": 7.287872315638227e-08, + "loss": 0.0005, + "step": 32785 + }, + { + "epoch": 0.64, + "learning_rate": 7.287483981204613e-08, + "loss": 0.1015, + "step": 32786 + }, + { + "epoch": 0.64, + "learning_rate": 7.287095646770998e-08, + "loss": 0.0016, + "step": 32787 + }, + { + "epoch": 0.64, + "learning_rate": 7.286707312337384e-08, + "loss": 0.0004, + "step": 32788 + }, + { + "epoch": 0.64, + "learning_rate": 7.28631897790377e-08, + "loss": 0.0003, + "step": 32789 + }, + { + "epoch": 0.64, + "learning_rate": 7.285930643470156e-08, + "loss": 0.0005, + "step": 32790 + }, + { + "epoch": 0.64, + "learning_rate": 7.285542309036542e-08, + "loss": 0.0004, + "step": 32791 + }, + { + "epoch": 0.64, + "learning_rate": 7.285153974602928e-08, + "loss": 0.0006, + "step": 32792 + }, + { + "epoch": 0.64, + "learning_rate": 7.284765640169313e-08, + "loss": 0.0004, + "step": 32793 + }, + { + "epoch": 0.64, + "learning_rate": 7.284377305735699e-08, + "loss": 0.0003, + "step": 32794 + }, + { + "epoch": 0.64, + "learning_rate": 7.283988971302085e-08, + "loss": 0.0004, + "step": 32795 + }, + { + "epoch": 0.64, + "learning_rate": 7.283600636868471e-08, + "loss": 0.0004, + "step": 32796 + }, + { + "epoch": 0.64, + "learning_rate": 7.283212302434857e-08, + "loss": 0.0007, + "step": 32797 + }, + { + "epoch": 0.64, + "learning_rate": 7.282823968001243e-08, + "loss": 0.0015, + "step": 32798 + }, + { + "epoch": 0.64, + "learning_rate": 7.282435633567628e-08, + "loss": 0.5854, + "step": 32799 + }, + { + "epoch": 0.64, + "learning_rate": 7.282047299134014e-08, + "loss": 0.0017, + "step": 32800 + }, + { + "epoch": 0.64, + "learning_rate": 7.2816589647004e-08, + "loss": 0.0032, + "step": 32801 + }, + { + "epoch": 0.64, + "learning_rate": 7.281270630266786e-08, + "loss": 0.0005, + "step": 32802 + }, + { + "epoch": 0.64, + "learning_rate": 7.280882295833172e-08, + "loss": 0.0006, + "step": 32803 + }, + { + "epoch": 0.64, + "learning_rate": 7.280493961399557e-08, + "loss": 0.5308, + "step": 32804 + }, + { + "epoch": 0.64, + "learning_rate": 7.280105626965942e-08, + "loss": 0.0004, + "step": 32805 + }, + { + "epoch": 0.64, + "learning_rate": 7.279717292532328e-08, + "loss": 0.0006, + "step": 32806 + }, + { + "epoch": 0.64, + "learning_rate": 7.279328958098714e-08, + "loss": 0.0004, + "step": 32807 + }, + { + "epoch": 0.64, + "learning_rate": 7.2789406236651e-08, + "loss": 0.0005, + "step": 32808 + }, + { + "epoch": 0.64, + "learning_rate": 7.278552289231485e-08, + "loss": 0.0003, + "step": 32809 + }, + { + "epoch": 0.64, + "learning_rate": 7.278163954797871e-08, + "loss": 0.0005, + "step": 32810 + }, + { + "epoch": 0.64, + "learning_rate": 7.277775620364257e-08, + "loss": 0.0005, + "step": 32811 + }, + { + "epoch": 0.64, + "learning_rate": 7.277387285930643e-08, + "loss": 0.0004, + "step": 32812 + }, + { + "epoch": 0.64, + "learning_rate": 7.276998951497029e-08, + "loss": 0.0005, + "step": 32813 + }, + { + "epoch": 0.64, + "learning_rate": 7.276610617063414e-08, + "loss": 0.0004, + "step": 32814 + }, + { + "epoch": 0.64, + "learning_rate": 7.2762222826298e-08, + "loss": 0.0004, + "step": 32815 + }, + { + "epoch": 0.64, + "learning_rate": 7.275833948196186e-08, + "loss": 0.9128, + "step": 32816 + }, + { + "epoch": 0.64, + "learning_rate": 7.275445613762572e-08, + "loss": 0.0004, + "step": 32817 + }, + { + "epoch": 0.64, + "learning_rate": 7.275057279328958e-08, + "loss": 0.0005, + "step": 32818 + }, + { + "epoch": 0.64, + "learning_rate": 7.274668944895344e-08, + "loss": 1.4225, + "step": 32819 + }, + { + "epoch": 0.64, + "learning_rate": 7.27428061046173e-08, + "loss": 0.0004, + "step": 32820 + }, + { + "epoch": 0.64, + "learning_rate": 7.273892276028115e-08, + "loss": 0.0006, + "step": 32821 + }, + { + "epoch": 0.64, + "learning_rate": 7.273503941594501e-08, + "loss": 0.0004, + "step": 32822 + }, + { + "epoch": 0.64, + "learning_rate": 7.273115607160887e-08, + "loss": 0.0006, + "step": 32823 + }, + { + "epoch": 0.64, + "learning_rate": 7.272727272727273e-08, + "loss": 0.0006, + "step": 32824 + }, + { + "epoch": 0.64, + "learning_rate": 7.272338938293658e-08, + "loss": 0.0004, + "step": 32825 + }, + { + "epoch": 0.64, + "learning_rate": 7.271950603860044e-08, + "loss": 0.0015, + "step": 32826 + }, + { + "epoch": 0.64, + "learning_rate": 7.27156226942643e-08, + "loss": 0.0006, + "step": 32827 + }, + { + "epoch": 0.64, + "learning_rate": 7.271173934992816e-08, + "loss": 0.0008, + "step": 32828 + }, + { + "epoch": 0.64, + "learning_rate": 7.270785600559202e-08, + "loss": 0.0004, + "step": 32829 + }, + { + "epoch": 0.64, + "learning_rate": 7.270397266125588e-08, + "loss": 0.0008, + "step": 32830 + }, + { + "epoch": 0.64, + "learning_rate": 7.270008931691973e-08, + "loss": 0.0004, + "step": 32831 + }, + { + "epoch": 0.64, + "learning_rate": 7.269620597258359e-08, + "loss": 0.0008, + "step": 32832 + }, + { + "epoch": 0.64, + "learning_rate": 7.269232262824745e-08, + "loss": 0.0005, + "step": 32833 + }, + { + "epoch": 0.64, + "learning_rate": 7.26884392839113e-08, + "loss": 0.0004, + "step": 32834 + }, + { + "epoch": 0.64, + "learning_rate": 7.268455593957515e-08, + "loss": 0.0004, + "step": 32835 + }, + { + "epoch": 0.64, + "learning_rate": 7.268067259523901e-08, + "loss": 0.0005, + "step": 32836 + }, + { + "epoch": 0.64, + "learning_rate": 7.267678925090287e-08, + "loss": 0.0006, + "step": 32837 + }, + { + "epoch": 0.64, + "learning_rate": 7.267290590656673e-08, + "loss": 0.0598, + "step": 32838 + }, + { + "epoch": 0.64, + "learning_rate": 7.266902256223059e-08, + "loss": 0.1539, + "step": 32839 + }, + { + "epoch": 0.64, + "learning_rate": 7.266513921789445e-08, + "loss": 0.0005, + "step": 32840 + }, + { + "epoch": 0.64, + "learning_rate": 7.26612558735583e-08, + "loss": 0.0035, + "step": 32841 + }, + { + "epoch": 0.64, + "learning_rate": 7.265737252922216e-08, + "loss": 0.0005, + "step": 32842 + }, + { + "epoch": 0.64, + "learning_rate": 7.265348918488602e-08, + "loss": 0.0006, + "step": 32843 + }, + { + "epoch": 0.64, + "learning_rate": 7.264960584054988e-08, + "loss": 0.0003, + "step": 32844 + }, + { + "epoch": 0.64, + "learning_rate": 7.264572249621374e-08, + "loss": 0.0003, + "step": 32845 + }, + { + "epoch": 0.64, + "learning_rate": 7.26418391518776e-08, + "loss": 0.0005, + "step": 32846 + }, + { + "epoch": 0.64, + "learning_rate": 7.263795580754145e-08, + "loss": 0.0007, + "step": 32847 + }, + { + "epoch": 0.64, + "learning_rate": 7.263407246320531e-08, + "loss": 0.0005, + "step": 32848 + }, + { + "epoch": 0.64, + "learning_rate": 7.263018911886917e-08, + "loss": 0.0003, + "step": 32849 + }, + { + "epoch": 0.64, + "learning_rate": 7.262630577453303e-08, + "loss": 0.0005, + "step": 32850 + }, + { + "epoch": 0.64, + "learning_rate": 7.262242243019689e-08, + "loss": 0.0007, + "step": 32851 + }, + { + "epoch": 0.64, + "learning_rate": 7.261853908586074e-08, + "loss": 0.0005, + "step": 32852 + }, + { + "epoch": 0.64, + "learning_rate": 7.26146557415246e-08, + "loss": 0.0003, + "step": 32853 + }, + { + "epoch": 0.64, + "learning_rate": 7.261077239718846e-08, + "loss": 0.0005, + "step": 32854 + }, + { + "epoch": 0.64, + "learning_rate": 7.260688905285232e-08, + "loss": 0.0023, + "step": 32855 + }, + { + "epoch": 0.64, + "learning_rate": 7.260300570851618e-08, + "loss": 0.0005, + "step": 32856 + }, + { + "epoch": 0.64, + "learning_rate": 7.259912236418004e-08, + "loss": 0.0004, + "step": 32857 + }, + { + "epoch": 0.64, + "learning_rate": 7.25952390198439e-08, + "loss": 0.0003, + "step": 32858 + }, + { + "epoch": 0.64, + "learning_rate": 7.259135567550775e-08, + "loss": 0.0013, + "step": 32859 + }, + { + "epoch": 0.64, + "learning_rate": 7.258747233117161e-08, + "loss": 0.0008, + "step": 32860 + }, + { + "epoch": 0.64, + "learning_rate": 7.258358898683547e-08, + "loss": 0.0007, + "step": 32861 + }, + { + "epoch": 0.64, + "learning_rate": 7.257970564249933e-08, + "loss": 0.0004, + "step": 32862 + }, + { + "epoch": 0.64, + "learning_rate": 7.257582229816317e-08, + "loss": 0.0004, + "step": 32863 + }, + { + "epoch": 0.64, + "learning_rate": 7.257193895382703e-08, + "loss": 0.0008, + "step": 32864 + }, + { + "epoch": 0.64, + "learning_rate": 7.256805560949089e-08, + "loss": 0.0004, + "step": 32865 + }, + { + "epoch": 0.64, + "learning_rate": 7.256417226515475e-08, + "loss": 0.2494, + "step": 32866 + }, + { + "epoch": 0.64, + "learning_rate": 7.25602889208186e-08, + "loss": 0.0004, + "step": 32867 + }, + { + "epoch": 0.64, + "learning_rate": 7.255640557648246e-08, + "loss": 0.0003, + "step": 32868 + }, + { + "epoch": 0.64, + "learning_rate": 7.255252223214632e-08, + "loss": 0.0005, + "step": 32869 + }, + { + "epoch": 0.64, + "learning_rate": 7.254863888781018e-08, + "loss": 0.0005, + "step": 32870 + }, + { + "epoch": 0.64, + "learning_rate": 7.254475554347404e-08, + "loss": 0.0319, + "step": 32871 + }, + { + "epoch": 0.64, + "learning_rate": 7.25408721991379e-08, + "loss": 0.5946, + "step": 32872 + }, + { + "epoch": 0.64, + "learning_rate": 7.253698885480175e-08, + "loss": 0.0004, + "step": 32873 + }, + { + "epoch": 0.64, + "learning_rate": 7.253310551046561e-08, + "loss": 0.0022, + "step": 32874 + }, + { + "epoch": 0.64, + "learning_rate": 7.252922216612947e-08, + "loss": 0.0005, + "step": 32875 + }, + { + "epoch": 0.64, + "learning_rate": 7.252533882179333e-08, + "loss": 0.2528, + "step": 32876 + }, + { + "epoch": 0.64, + "learning_rate": 7.252145547745719e-08, + "loss": 0.0004, + "step": 32877 + }, + { + "epoch": 0.64, + "learning_rate": 7.251757213312105e-08, + "loss": 0.0005, + "step": 32878 + }, + { + "epoch": 0.64, + "learning_rate": 7.25136887887849e-08, + "loss": 0.0004, + "step": 32879 + }, + { + "epoch": 0.64, + "learning_rate": 7.250980544444876e-08, + "loss": 0.0006, + "step": 32880 + }, + { + "epoch": 0.64, + "learning_rate": 7.250592210011262e-08, + "loss": 0.0009, + "step": 32881 + }, + { + "epoch": 0.64, + "learning_rate": 7.250203875577648e-08, + "loss": 0.001, + "step": 32882 + }, + { + "epoch": 0.64, + "learning_rate": 7.249815541144034e-08, + "loss": 0.0003, + "step": 32883 + }, + { + "epoch": 0.64, + "learning_rate": 7.24942720671042e-08, + "loss": 0.0004, + "step": 32884 + }, + { + "epoch": 0.64, + "learning_rate": 7.249038872276805e-08, + "loss": 0.6685, + "step": 32885 + }, + { + "epoch": 0.64, + "learning_rate": 7.248650537843191e-08, + "loss": 0.0004, + "step": 32886 + }, + { + "epoch": 0.64, + "learning_rate": 7.248262203409577e-08, + "loss": 0.0004, + "step": 32887 + }, + { + "epoch": 0.64, + "learning_rate": 7.247873868975963e-08, + "loss": 0.0006, + "step": 32888 + }, + { + "epoch": 0.64, + "learning_rate": 7.247485534542349e-08, + "loss": 0.0006, + "step": 32889 + }, + { + "epoch": 0.64, + "learning_rate": 7.247097200108734e-08, + "loss": 0.0051, + "step": 32890 + }, + { + "epoch": 0.64, + "learning_rate": 7.24670886567512e-08, + "loss": 0.0006, + "step": 32891 + }, + { + "epoch": 0.64, + "learning_rate": 7.246320531241505e-08, + "loss": 0.9981, + "step": 32892 + }, + { + "epoch": 0.64, + "learning_rate": 7.24593219680789e-08, + "loss": 0.0005, + "step": 32893 + }, + { + "epoch": 0.64, + "learning_rate": 7.245543862374276e-08, + "loss": 0.0007, + "step": 32894 + }, + { + "epoch": 0.64, + "learning_rate": 7.245155527940662e-08, + "loss": 0.0004, + "step": 32895 + }, + { + "epoch": 0.64, + "learning_rate": 7.244767193507048e-08, + "loss": 0.0004, + "step": 32896 + }, + { + "epoch": 0.64, + "learning_rate": 7.244378859073434e-08, + "loss": 0.0006, + "step": 32897 + }, + { + "epoch": 0.64, + "learning_rate": 7.24399052463982e-08, + "loss": 0.0005, + "step": 32898 + }, + { + "epoch": 0.64, + "learning_rate": 7.243602190206206e-08, + "loss": 0.0006, + "step": 32899 + }, + { + "epoch": 0.64, + "learning_rate": 7.243213855772591e-08, + "loss": 0.0003, + "step": 32900 + }, + { + "epoch": 0.64, + "learning_rate": 7.242825521338977e-08, + "loss": 0.0004, + "step": 32901 + }, + { + "epoch": 0.64, + "learning_rate": 7.242437186905363e-08, + "loss": 0.0985, + "step": 32902 + }, + { + "epoch": 0.64, + "learning_rate": 7.242048852471749e-08, + "loss": 0.0056, + "step": 32903 + }, + { + "epoch": 0.64, + "learning_rate": 7.241660518038135e-08, + "loss": 0.0004, + "step": 32904 + }, + { + "epoch": 0.64, + "learning_rate": 7.24127218360452e-08, + "loss": 0.0004, + "step": 32905 + }, + { + "epoch": 0.64, + "learning_rate": 7.240883849170906e-08, + "loss": 0.0009, + "step": 32906 + }, + { + "epoch": 0.64, + "learning_rate": 7.240495514737292e-08, + "loss": 1.2784, + "step": 32907 + }, + { + "epoch": 0.64, + "learning_rate": 7.240107180303678e-08, + "loss": 0.0006, + "step": 32908 + }, + { + "epoch": 0.64, + "learning_rate": 7.239718845870064e-08, + "loss": 0.0005, + "step": 32909 + }, + { + "epoch": 0.64, + "learning_rate": 7.239330511436448e-08, + "loss": 0.0007, + "step": 32910 + }, + { + "epoch": 0.64, + "learning_rate": 7.238942177002834e-08, + "loss": 0.0006, + "step": 32911 + }, + { + "epoch": 0.64, + "learning_rate": 7.23855384256922e-08, + "loss": 0.0017, + "step": 32912 + }, + { + "epoch": 0.64, + "learning_rate": 7.238165508135606e-08, + "loss": 0.5673, + "step": 32913 + }, + { + "epoch": 0.64, + "learning_rate": 7.237777173701992e-08, + "loss": 0.0005, + "step": 32914 + }, + { + "epoch": 0.64, + "learning_rate": 7.237388839268377e-08, + "loss": 0.0004, + "step": 32915 + }, + { + "epoch": 0.64, + "learning_rate": 7.237000504834763e-08, + "loss": 0.0008, + "step": 32916 + }, + { + "epoch": 0.64, + "learning_rate": 7.236612170401149e-08, + "loss": 0.0006, + "step": 32917 + }, + { + "epoch": 0.64, + "learning_rate": 7.236223835967535e-08, + "loss": 0.0004, + "step": 32918 + }, + { + "epoch": 0.64, + "learning_rate": 7.235835501533921e-08, + "loss": 0.0005, + "step": 32919 + }, + { + "epoch": 0.64, + "learning_rate": 7.235447167100306e-08, + "loss": 0.0008, + "step": 32920 + }, + { + "epoch": 0.64, + "learning_rate": 7.235058832666692e-08, + "loss": 0.0009, + "step": 32921 + }, + { + "epoch": 0.64, + "learning_rate": 7.234670498233078e-08, + "loss": 0.2581, + "step": 32922 + }, + { + "epoch": 0.64, + "learning_rate": 7.234282163799464e-08, + "loss": 0.0027, + "step": 32923 + }, + { + "epoch": 0.64, + "learning_rate": 7.23389382936585e-08, + "loss": 0.0005, + "step": 32924 + }, + { + "epoch": 0.64, + "learning_rate": 7.233505494932234e-08, + "loss": 0.0005, + "step": 32925 + }, + { + "epoch": 0.64, + "learning_rate": 7.23311716049862e-08, + "loss": 0.0005, + "step": 32926 + }, + { + "epoch": 0.64, + "learning_rate": 7.232728826065006e-08, + "loss": 0.0004, + "step": 32927 + }, + { + "epoch": 0.64, + "learning_rate": 7.232340491631392e-08, + "loss": 0.0006, + "step": 32928 + }, + { + "epoch": 0.64, + "learning_rate": 7.231952157197778e-08, + "loss": 0.0131, + "step": 32929 + }, + { + "epoch": 0.64, + "learning_rate": 7.231563822764163e-08, + "loss": 0.0008, + "step": 32930 + }, + { + "epoch": 0.64, + "learning_rate": 7.231175488330549e-08, + "loss": 0.0006, + "step": 32931 + }, + { + "epoch": 0.64, + "learning_rate": 7.230787153896935e-08, + "loss": 0.001, + "step": 32932 + }, + { + "epoch": 0.64, + "learning_rate": 7.230398819463321e-08, + "loss": 0.0006, + "step": 32933 + }, + { + "epoch": 0.64, + "learning_rate": 7.230010485029707e-08, + "loss": 0.0003, + "step": 32934 + }, + { + "epoch": 0.64, + "learning_rate": 7.229622150596093e-08, + "loss": 0.5365, + "step": 32935 + }, + { + "epoch": 0.64, + "learning_rate": 7.229233816162478e-08, + "loss": 0.0005, + "step": 32936 + }, + { + "epoch": 0.64, + "learning_rate": 7.228845481728864e-08, + "loss": 0.0005, + "step": 32937 + }, + { + "epoch": 0.64, + "learning_rate": 7.22845714729525e-08, + "loss": 0.0004, + "step": 32938 + }, + { + "epoch": 0.64, + "learning_rate": 7.228068812861636e-08, + "loss": 0.0005, + "step": 32939 + }, + { + "epoch": 0.64, + "learning_rate": 7.227680478428022e-08, + "loss": 1.9953, + "step": 32940 + }, + { + "epoch": 0.64, + "learning_rate": 7.227292143994407e-08, + "loss": 0.0005, + "step": 32941 + }, + { + "epoch": 0.64, + "learning_rate": 7.226903809560793e-08, + "loss": 0.0004, + "step": 32942 + }, + { + "epoch": 0.64, + "learning_rate": 7.226515475127179e-08, + "loss": 0.0006, + "step": 32943 + }, + { + "epoch": 0.64, + "learning_rate": 7.226127140693565e-08, + "loss": 0.0003, + "step": 32944 + }, + { + "epoch": 0.64, + "learning_rate": 7.225738806259951e-08, + "loss": 0.0074, + "step": 32945 + }, + { + "epoch": 0.64, + "learning_rate": 7.225350471826337e-08, + "loss": 0.0006, + "step": 32946 + }, + { + "epoch": 0.64, + "learning_rate": 7.224962137392722e-08, + "loss": 0.0004, + "step": 32947 + }, + { + "epoch": 0.64, + "learning_rate": 7.224573802959108e-08, + "loss": 0.0004, + "step": 32948 + }, + { + "epoch": 0.64, + "learning_rate": 7.224185468525494e-08, + "loss": 0.0006, + "step": 32949 + }, + { + "epoch": 0.64, + "learning_rate": 7.223797134091879e-08, + "loss": 0.0004, + "step": 32950 + }, + { + "epoch": 0.64, + "learning_rate": 7.223408799658264e-08, + "loss": 0.0004, + "step": 32951 + }, + { + "epoch": 0.64, + "learning_rate": 7.22302046522465e-08, + "loss": 0.0006, + "step": 32952 + }, + { + "epoch": 0.64, + "learning_rate": 7.222632130791036e-08, + "loss": 1.2954, + "step": 32953 + }, + { + "epoch": 0.64, + "learning_rate": 7.222243796357422e-08, + "loss": 0.0007, + "step": 32954 + }, + { + "epoch": 0.64, + "learning_rate": 7.221855461923808e-08, + "loss": 0.0004, + "step": 32955 + }, + { + "epoch": 0.64, + "learning_rate": 7.221467127490194e-08, + "loss": 0.0007, + "step": 32956 + }, + { + "epoch": 0.64, + "learning_rate": 7.22107879305658e-08, + "loss": 0.0004, + "step": 32957 + }, + { + "epoch": 0.64, + "learning_rate": 7.220690458622965e-08, + "loss": 0.0004, + "step": 32958 + }, + { + "epoch": 0.64, + "learning_rate": 7.220302124189351e-08, + "loss": 1.2718, + "step": 32959 + }, + { + "epoch": 0.64, + "learning_rate": 7.219913789755737e-08, + "loss": 0.0017, + "step": 32960 + }, + { + "epoch": 0.64, + "learning_rate": 7.219525455322123e-08, + "loss": 0.9043, + "step": 32961 + }, + { + "epoch": 0.64, + "learning_rate": 7.219137120888508e-08, + "loss": 0.0004, + "step": 32962 + }, + { + "epoch": 0.64, + "learning_rate": 7.218748786454894e-08, + "loss": 0.0005, + "step": 32963 + }, + { + "epoch": 0.64, + "learning_rate": 7.21836045202128e-08, + "loss": 0.0561, + "step": 32964 + }, + { + "epoch": 0.64, + "learning_rate": 7.217972117587666e-08, + "loss": 0.0004, + "step": 32965 + }, + { + "epoch": 0.64, + "learning_rate": 7.217583783154052e-08, + "loss": 0.0004, + "step": 32966 + }, + { + "epoch": 0.64, + "learning_rate": 7.217195448720438e-08, + "loss": 0.0081, + "step": 32967 + }, + { + "epoch": 0.64, + "learning_rate": 7.216807114286823e-08, + "loss": 0.0013, + "step": 32968 + }, + { + "epoch": 0.64, + "learning_rate": 7.216418779853209e-08, + "loss": 0.0005, + "step": 32969 + }, + { + "epoch": 0.64, + "learning_rate": 7.216030445419595e-08, + "loss": 0.008, + "step": 32970 + }, + { + "epoch": 0.64, + "learning_rate": 7.215642110985981e-08, + "loss": 0.0004, + "step": 32971 + }, + { + "epoch": 0.64, + "learning_rate": 7.215253776552367e-08, + "loss": 0.0005, + "step": 32972 + }, + { + "epoch": 0.64, + "learning_rate": 7.214865442118753e-08, + "loss": 0.0005, + "step": 32973 + }, + { + "epoch": 0.64, + "learning_rate": 7.214477107685138e-08, + "loss": 0.0036, + "step": 32974 + }, + { + "epoch": 0.64, + "learning_rate": 7.214088773251524e-08, + "loss": 0.0004, + "step": 32975 + }, + { + "epoch": 0.64, + "learning_rate": 7.21370043881791e-08, + "loss": 0.0005, + "step": 32976 + }, + { + "epoch": 0.64, + "learning_rate": 7.213312104384296e-08, + "loss": 0.0005, + "step": 32977 + }, + { + "epoch": 0.64, + "learning_rate": 7.212923769950682e-08, + "loss": 0.0003, + "step": 32978 + }, + { + "epoch": 0.64, + "learning_rate": 7.212535435517066e-08, + "loss": 0.0005, + "step": 32979 + }, + { + "epoch": 0.64, + "learning_rate": 7.212147101083452e-08, + "loss": 0.0005, + "step": 32980 + }, + { + "epoch": 0.64, + "learning_rate": 7.211758766649838e-08, + "loss": 0.0006, + "step": 32981 + }, + { + "epoch": 0.64, + "learning_rate": 7.211370432216224e-08, + "loss": 0.0042, + "step": 32982 + }, + { + "epoch": 0.64, + "learning_rate": 7.21098209778261e-08, + "loss": 0.0011, + "step": 32983 + }, + { + "epoch": 0.64, + "learning_rate": 7.210593763348995e-08, + "loss": 0.001, + "step": 32984 + }, + { + "epoch": 0.64, + "learning_rate": 7.210205428915381e-08, + "loss": 0.0006, + "step": 32985 + }, + { + "epoch": 0.64, + "learning_rate": 7.209817094481767e-08, + "loss": 0.0009, + "step": 32986 + }, + { + "epoch": 0.64, + "learning_rate": 7.209428760048153e-08, + "loss": 0.0008, + "step": 32987 + }, + { + "epoch": 0.64, + "learning_rate": 7.209040425614539e-08, + "loss": 0.0005, + "step": 32988 + }, + { + "epoch": 0.64, + "learning_rate": 7.208652091180924e-08, + "loss": 0.0005, + "step": 32989 + }, + { + "epoch": 0.64, + "learning_rate": 7.20826375674731e-08, + "loss": 0.0004, + "step": 32990 + }, + { + "epoch": 0.64, + "learning_rate": 7.207875422313696e-08, + "loss": 0.0171, + "step": 32991 + }, + { + "epoch": 0.64, + "learning_rate": 7.207487087880082e-08, + "loss": 0.0004, + "step": 32992 + }, + { + "epoch": 0.64, + "learning_rate": 7.207098753446468e-08, + "loss": 0.0004, + "step": 32993 + }, + { + "epoch": 0.64, + "learning_rate": 7.206710419012854e-08, + "loss": 0.5387, + "step": 32994 + }, + { + "epoch": 0.64, + "learning_rate": 7.20632208457924e-08, + "loss": 0.0006, + "step": 32995 + }, + { + "epoch": 0.64, + "learning_rate": 7.205933750145625e-08, + "loss": 0.0004, + "step": 32996 + }, + { + "epoch": 0.64, + "learning_rate": 7.205545415712011e-08, + "loss": 0.984, + "step": 32997 + }, + { + "epoch": 0.64, + "learning_rate": 7.205157081278397e-08, + "loss": 0.0005, + "step": 32998 + }, + { + "epoch": 0.64, + "learning_rate": 7.204768746844783e-08, + "loss": 0.0006, + "step": 32999 + }, + { + "epoch": 0.64, + "learning_rate": 7.204380412411168e-08, + "loss": 0.0004, + "step": 33000 + }, + { + "epoch": 0.64, + "learning_rate": 7.203992077977554e-08, + "loss": 0.0014, + "step": 33001 + }, + { + "epoch": 0.64, + "learning_rate": 7.20360374354394e-08, + "loss": 0.0005, + "step": 33002 + }, + { + "epoch": 0.64, + "learning_rate": 7.203215409110326e-08, + "loss": 0.0004, + "step": 33003 + }, + { + "epoch": 0.64, + "learning_rate": 7.202827074676712e-08, + "loss": 0.0004, + "step": 33004 + }, + { + "epoch": 0.64, + "learning_rate": 7.202438740243098e-08, + "loss": 0.0004, + "step": 33005 + }, + { + "epoch": 0.64, + "learning_rate": 7.202050405809483e-08, + "loss": 0.0004, + "step": 33006 + }, + { + "epoch": 0.64, + "learning_rate": 7.201662071375869e-08, + "loss": 0.0004, + "step": 33007 + }, + { + "epoch": 0.64, + "learning_rate": 7.201273736942254e-08, + "loss": 0.0009, + "step": 33008 + }, + { + "epoch": 0.64, + "learning_rate": 7.20088540250864e-08, + "loss": 0.0004, + "step": 33009 + }, + { + "epoch": 0.64, + "learning_rate": 7.200497068075025e-08, + "loss": 0.0008, + "step": 33010 + }, + { + "epoch": 0.64, + "learning_rate": 7.200108733641411e-08, + "loss": 0.0004, + "step": 33011 + }, + { + "epoch": 0.64, + "learning_rate": 7.199720399207797e-08, + "loss": 0.0005, + "step": 33012 + }, + { + "epoch": 0.64, + "learning_rate": 7.199332064774183e-08, + "loss": 0.0009, + "step": 33013 + }, + { + "epoch": 0.64, + "learning_rate": 7.198943730340569e-08, + "loss": 0.0005, + "step": 33014 + }, + { + "epoch": 0.64, + "learning_rate": 7.198555395906955e-08, + "loss": 0.0003, + "step": 33015 + }, + { + "epoch": 0.64, + "learning_rate": 7.19816706147334e-08, + "loss": 0.0006, + "step": 33016 + }, + { + "epoch": 0.64, + "learning_rate": 7.197778727039726e-08, + "loss": 0.0006, + "step": 33017 + }, + { + "epoch": 0.64, + "learning_rate": 7.197390392606112e-08, + "loss": 0.0115, + "step": 33018 + }, + { + "epoch": 0.64, + "learning_rate": 7.197002058172498e-08, + "loss": 0.0004, + "step": 33019 + }, + { + "epoch": 0.64, + "learning_rate": 7.196613723738884e-08, + "loss": 0.0006, + "step": 33020 + }, + { + "epoch": 0.64, + "learning_rate": 7.19622538930527e-08, + "loss": 0.0005, + "step": 33021 + }, + { + "epoch": 0.64, + "learning_rate": 7.195837054871655e-08, + "loss": 0.0004, + "step": 33022 + }, + { + "epoch": 0.64, + "learning_rate": 7.195448720438041e-08, + "loss": 0.0004, + "step": 33023 + }, + { + "epoch": 0.64, + "learning_rate": 7.195060386004427e-08, + "loss": 0.0005, + "step": 33024 + }, + { + "epoch": 0.64, + "learning_rate": 7.194672051570813e-08, + "loss": 0.0009, + "step": 33025 + }, + { + "epoch": 0.64, + "learning_rate": 7.194283717137199e-08, + "loss": 0.085, + "step": 33026 + }, + { + "epoch": 0.64, + "learning_rate": 7.193895382703584e-08, + "loss": 0.4113, + "step": 33027 + }, + { + "epoch": 0.64, + "learning_rate": 7.19350704826997e-08, + "loss": 0.0004, + "step": 33028 + }, + { + "epoch": 0.64, + "learning_rate": 7.193118713836356e-08, + "loss": 0.0005, + "step": 33029 + }, + { + "epoch": 0.64, + "learning_rate": 7.192730379402742e-08, + "loss": 0.0006, + "step": 33030 + }, + { + "epoch": 0.64, + "learning_rate": 7.192342044969128e-08, + "loss": 0.0009, + "step": 33031 + }, + { + "epoch": 0.64, + "learning_rate": 7.191953710535514e-08, + "loss": 0.0003, + "step": 33032 + }, + { + "epoch": 0.64, + "learning_rate": 7.1915653761019e-08, + "loss": 0.0004, + "step": 33033 + }, + { + "epoch": 0.64, + "learning_rate": 7.191177041668285e-08, + "loss": 0.0006, + "step": 33034 + }, + { + "epoch": 0.64, + "learning_rate": 7.190788707234671e-08, + "loss": 0.0004, + "step": 33035 + }, + { + "epoch": 0.64, + "learning_rate": 7.190400372801057e-08, + "loss": 0.0004, + "step": 33036 + }, + { + "epoch": 0.64, + "learning_rate": 7.190012038367441e-08, + "loss": 0.0005, + "step": 33037 + }, + { + "epoch": 0.64, + "learning_rate": 7.189623703933827e-08, + "loss": 0.0005, + "step": 33038 + }, + { + "epoch": 0.64, + "learning_rate": 7.189235369500213e-08, + "loss": 0.0008, + "step": 33039 + }, + { + "epoch": 0.64, + "learning_rate": 7.188847035066599e-08, + "loss": 0.1578, + "step": 33040 + }, + { + "epoch": 0.64, + "learning_rate": 7.188458700632985e-08, + "loss": 0.0006, + "step": 33041 + }, + { + "epoch": 0.64, + "learning_rate": 7.18807036619937e-08, + "loss": 0.0005, + "step": 33042 + }, + { + "epoch": 0.64, + "learning_rate": 7.187682031765756e-08, + "loss": 0.0004, + "step": 33043 + }, + { + "epoch": 0.64, + "learning_rate": 7.187293697332142e-08, + "loss": 0.0007, + "step": 33044 + }, + { + "epoch": 0.64, + "learning_rate": 7.186905362898528e-08, + "loss": 0.0014, + "step": 33045 + }, + { + "epoch": 0.64, + "learning_rate": 7.186517028464914e-08, + "loss": 0.0031, + "step": 33046 + }, + { + "epoch": 0.64, + "learning_rate": 7.1861286940313e-08, + "loss": 0.0004, + "step": 33047 + }, + { + "epoch": 0.64, + "learning_rate": 7.185740359597685e-08, + "loss": 0.002, + "step": 33048 + }, + { + "epoch": 0.64, + "learning_rate": 7.185352025164071e-08, + "loss": 0.0006, + "step": 33049 + }, + { + "epoch": 0.64, + "learning_rate": 7.184963690730457e-08, + "loss": 0.0005, + "step": 33050 + }, + { + "epoch": 0.64, + "learning_rate": 7.184575356296843e-08, + "loss": 0.1913, + "step": 33051 + }, + { + "epoch": 0.64, + "learning_rate": 7.184187021863229e-08, + "loss": 0.0004, + "step": 33052 + }, + { + "epoch": 0.64, + "learning_rate": 7.183798687429615e-08, + "loss": 0.0004, + "step": 33053 + }, + { + "epoch": 0.64, + "learning_rate": 7.183410352996e-08, + "loss": 0.0004, + "step": 33054 + }, + { + "epoch": 0.64, + "learning_rate": 7.183022018562386e-08, + "loss": 0.0005, + "step": 33055 + }, + { + "epoch": 0.64, + "learning_rate": 7.182633684128772e-08, + "loss": 0.0007, + "step": 33056 + }, + { + "epoch": 0.64, + "learning_rate": 7.182245349695158e-08, + "loss": 0.0007, + "step": 33057 + }, + { + "epoch": 0.64, + "learning_rate": 7.181857015261544e-08, + "loss": 0.006, + "step": 33058 + }, + { + "epoch": 0.64, + "learning_rate": 7.18146868082793e-08, + "loss": 0.0006, + "step": 33059 + }, + { + "epoch": 0.64, + "learning_rate": 7.181080346394315e-08, + "loss": 0.0007, + "step": 33060 + }, + { + "epoch": 0.64, + "learning_rate": 7.180692011960701e-08, + "loss": 0.0006, + "step": 33061 + }, + { + "epoch": 0.64, + "learning_rate": 7.180303677527087e-08, + "loss": 0.0232, + "step": 33062 + }, + { + "epoch": 0.64, + "learning_rate": 7.179915343093473e-08, + "loss": 0.0771, + "step": 33063 + }, + { + "epoch": 0.64, + "learning_rate": 7.179527008659859e-08, + "loss": 0.0004, + "step": 33064 + }, + { + "epoch": 0.64, + "learning_rate": 7.179138674226244e-08, + "loss": 0.0004, + "step": 33065 + }, + { + "epoch": 0.64, + "learning_rate": 7.178750339792629e-08, + "loss": 0.0303, + "step": 33066 + }, + { + "epoch": 0.64, + "learning_rate": 7.178362005359015e-08, + "loss": 0.0009, + "step": 33067 + }, + { + "epoch": 0.64, + "learning_rate": 7.1779736709254e-08, + "loss": 0.0004, + "step": 33068 + }, + { + "epoch": 0.64, + "learning_rate": 7.177585336491786e-08, + "loss": 0.0004, + "step": 33069 + }, + { + "epoch": 0.64, + "learning_rate": 7.177197002058172e-08, + "loss": 0.0004, + "step": 33070 + }, + { + "epoch": 0.64, + "learning_rate": 7.176808667624558e-08, + "loss": 0.0005, + "step": 33071 + }, + { + "epoch": 0.64, + "learning_rate": 7.176420333190944e-08, + "loss": 0.0009, + "step": 33072 + }, + { + "epoch": 0.64, + "learning_rate": 7.17603199875733e-08, + "loss": 0.0005, + "step": 33073 + }, + { + "epoch": 0.64, + "learning_rate": 7.175643664323716e-08, + "loss": 0.0018, + "step": 33074 + }, + { + "epoch": 0.64, + "learning_rate": 7.175255329890101e-08, + "loss": 0.0007, + "step": 33075 + }, + { + "epoch": 0.64, + "learning_rate": 7.174866995456487e-08, + "loss": 0.0005, + "step": 33076 + }, + { + "epoch": 0.64, + "learning_rate": 7.174478661022873e-08, + "loss": 0.0004, + "step": 33077 + }, + { + "epoch": 0.64, + "learning_rate": 7.174090326589259e-08, + "loss": 0.0006, + "step": 33078 + }, + { + "epoch": 0.64, + "learning_rate": 7.173701992155645e-08, + "loss": 0.001, + "step": 33079 + }, + { + "epoch": 0.64, + "learning_rate": 7.17331365772203e-08, + "loss": 0.0004, + "step": 33080 + }, + { + "epoch": 0.64, + "learning_rate": 7.172925323288416e-08, + "loss": 0.0006, + "step": 33081 + }, + { + "epoch": 0.64, + "learning_rate": 7.172536988854802e-08, + "loss": 0.0015, + "step": 33082 + }, + { + "epoch": 0.64, + "learning_rate": 7.172148654421188e-08, + "loss": 0.0005, + "step": 33083 + }, + { + "epoch": 0.64, + "learning_rate": 7.171760319987574e-08, + "loss": 0.0004, + "step": 33084 + }, + { + "epoch": 0.64, + "learning_rate": 7.17137198555396e-08, + "loss": 0.0003, + "step": 33085 + }, + { + "epoch": 0.64, + "learning_rate": 7.170983651120345e-08, + "loss": 0.0004, + "step": 33086 + }, + { + "epoch": 0.64, + "learning_rate": 7.17059531668673e-08, + "loss": 0.0005, + "step": 33087 + }, + { + "epoch": 0.64, + "learning_rate": 7.170206982253116e-08, + "loss": 0.0005, + "step": 33088 + }, + { + "epoch": 0.64, + "learning_rate": 7.169818647819502e-08, + "loss": 0.0006, + "step": 33089 + }, + { + "epoch": 0.64, + "learning_rate": 7.169430313385887e-08, + "loss": 0.0005, + "step": 33090 + }, + { + "epoch": 0.64, + "learning_rate": 7.169041978952273e-08, + "loss": 0.0005, + "step": 33091 + }, + { + "epoch": 0.64, + "learning_rate": 7.168653644518659e-08, + "loss": 0.0026, + "step": 33092 + }, + { + "epoch": 0.64, + "learning_rate": 7.168265310085045e-08, + "loss": 0.0073, + "step": 33093 + }, + { + "epoch": 0.64, + "learning_rate": 7.167876975651431e-08, + "loss": 0.0004, + "step": 33094 + }, + { + "epoch": 0.64, + "learning_rate": 7.167488641217817e-08, + "loss": 0.0005, + "step": 33095 + }, + { + "epoch": 0.64, + "learning_rate": 7.167100306784202e-08, + "loss": 0.0005, + "step": 33096 + }, + { + "epoch": 0.64, + "learning_rate": 7.166711972350588e-08, + "loss": 0.0015, + "step": 33097 + }, + { + "epoch": 0.64, + "learning_rate": 7.166323637916974e-08, + "loss": 0.0005, + "step": 33098 + }, + { + "epoch": 0.64, + "learning_rate": 7.16593530348336e-08, + "loss": 0.0005, + "step": 33099 + }, + { + "epoch": 0.64, + "learning_rate": 7.165546969049746e-08, + "loss": 0.0007, + "step": 33100 + }, + { + "epoch": 0.64, + "learning_rate": 7.165158634616131e-08, + "loss": 0.0004, + "step": 33101 + }, + { + "epoch": 0.64, + "learning_rate": 7.164770300182516e-08, + "loss": 0.0005, + "step": 33102 + }, + { + "epoch": 0.64, + "learning_rate": 7.164381965748902e-08, + "loss": 0.0005, + "step": 33103 + }, + { + "epoch": 0.64, + "learning_rate": 7.163993631315288e-08, + "loss": 0.0005, + "step": 33104 + }, + { + "epoch": 0.64, + "learning_rate": 7.163605296881673e-08, + "loss": 0.92, + "step": 33105 + }, + { + "epoch": 0.64, + "learning_rate": 7.163216962448059e-08, + "loss": 0.0005, + "step": 33106 + }, + { + "epoch": 0.64, + "learning_rate": 7.162828628014445e-08, + "loss": 1.982, + "step": 33107 + }, + { + "epoch": 0.64, + "learning_rate": 7.162440293580831e-08, + "loss": 0.0006, + "step": 33108 + }, + { + "epoch": 0.64, + "learning_rate": 7.162051959147217e-08, + "loss": 0.0023, + "step": 33109 + }, + { + "epoch": 0.64, + "learning_rate": 7.161663624713603e-08, + "loss": 0.0019, + "step": 33110 + }, + { + "epoch": 0.64, + "learning_rate": 7.161275290279988e-08, + "loss": 0.0007, + "step": 33111 + }, + { + "epoch": 0.64, + "learning_rate": 7.160886955846374e-08, + "loss": 0.0005, + "step": 33112 + }, + { + "epoch": 0.64, + "learning_rate": 7.16049862141276e-08, + "loss": 0.0005, + "step": 33113 + }, + { + "epoch": 0.64, + "learning_rate": 7.160110286979146e-08, + "loss": 0.0015, + "step": 33114 + }, + { + "epoch": 0.64, + "learning_rate": 7.159721952545532e-08, + "loss": 0.0004, + "step": 33115 + }, + { + "epoch": 0.64, + "learning_rate": 7.159333618111917e-08, + "loss": 1.2565, + "step": 33116 + }, + { + "epoch": 0.64, + "learning_rate": 7.158945283678303e-08, + "loss": 0.2376, + "step": 33117 + }, + { + "epoch": 0.64, + "learning_rate": 7.158556949244689e-08, + "loss": 0.0004, + "step": 33118 + }, + { + "epoch": 0.64, + "learning_rate": 7.158168614811075e-08, + "loss": 0.0004, + "step": 33119 + }, + { + "epoch": 0.64, + "learning_rate": 7.157780280377461e-08, + "loss": 0.0005, + "step": 33120 + }, + { + "epoch": 0.64, + "learning_rate": 7.157391945943847e-08, + "loss": 0.0003, + "step": 33121 + }, + { + "epoch": 0.64, + "learning_rate": 7.157003611510232e-08, + "loss": 0.0005, + "step": 33122 + }, + { + "epoch": 0.64, + "learning_rate": 7.156615277076618e-08, + "loss": 0.0006, + "step": 33123 + }, + { + "epoch": 0.64, + "learning_rate": 7.156226942643003e-08, + "loss": 0.0004, + "step": 33124 + }, + { + "epoch": 0.64, + "learning_rate": 7.155838608209389e-08, + "loss": 0.0006, + "step": 33125 + }, + { + "epoch": 0.64, + "learning_rate": 7.155450273775774e-08, + "loss": 0.0005, + "step": 33126 + }, + { + "epoch": 0.64, + "learning_rate": 7.15506193934216e-08, + "loss": 0.0005, + "step": 33127 + }, + { + "epoch": 0.64, + "learning_rate": 7.154673604908546e-08, + "loss": 0.0005, + "step": 33128 + }, + { + "epoch": 0.64, + "learning_rate": 7.154285270474932e-08, + "loss": 0.0006, + "step": 33129 + }, + { + "epoch": 0.64, + "learning_rate": 7.153896936041318e-08, + "loss": 0.0005, + "step": 33130 + }, + { + "epoch": 0.64, + "learning_rate": 7.153508601607704e-08, + "loss": 0.001, + "step": 33131 + }, + { + "epoch": 0.64, + "learning_rate": 7.15312026717409e-08, + "loss": 0.0007, + "step": 33132 + }, + { + "epoch": 0.64, + "learning_rate": 7.152731932740475e-08, + "loss": 0.0005, + "step": 33133 + }, + { + "epoch": 0.64, + "learning_rate": 7.152343598306861e-08, + "loss": 0.0003, + "step": 33134 + }, + { + "epoch": 0.64, + "learning_rate": 7.151955263873247e-08, + "loss": 0.0005, + "step": 33135 + }, + { + "epoch": 0.64, + "learning_rate": 7.151566929439633e-08, + "loss": 0.0005, + "step": 33136 + }, + { + "epoch": 0.64, + "learning_rate": 7.151178595006018e-08, + "loss": 0.0004, + "step": 33137 + }, + { + "epoch": 0.64, + "learning_rate": 7.150790260572404e-08, + "loss": 0.0008, + "step": 33138 + }, + { + "epoch": 0.64, + "learning_rate": 7.15040192613879e-08, + "loss": 0.0004, + "step": 33139 + }, + { + "epoch": 0.64, + "learning_rate": 7.150013591705176e-08, + "loss": 0.0005, + "step": 33140 + }, + { + "epoch": 0.64, + "learning_rate": 7.149625257271562e-08, + "loss": 0.0005, + "step": 33141 + }, + { + "epoch": 0.64, + "learning_rate": 7.149236922837948e-08, + "loss": 0.0004, + "step": 33142 + }, + { + "epoch": 0.64, + "learning_rate": 7.148848588404333e-08, + "loss": 0.0004, + "step": 33143 + }, + { + "epoch": 0.64, + "learning_rate": 7.148460253970719e-08, + "loss": 0.0005, + "step": 33144 + }, + { + "epoch": 0.64, + "learning_rate": 7.148071919537105e-08, + "loss": 0.0014, + "step": 33145 + }, + { + "epoch": 0.64, + "learning_rate": 7.147683585103491e-08, + "loss": 0.0003, + "step": 33146 + }, + { + "epoch": 0.64, + "learning_rate": 7.147295250669877e-08, + "loss": 1.2548, + "step": 33147 + }, + { + "epoch": 0.64, + "learning_rate": 7.146906916236263e-08, + "loss": 0.0018, + "step": 33148 + }, + { + "epoch": 0.64, + "learning_rate": 7.146518581802648e-08, + "loss": 0.0007, + "step": 33149 + }, + { + "epoch": 0.64, + "learning_rate": 7.146130247369034e-08, + "loss": 0.0023, + "step": 33150 + }, + { + "epoch": 0.64, + "learning_rate": 7.14574191293542e-08, + "loss": 0.0006, + "step": 33151 + }, + { + "epoch": 0.64, + "learning_rate": 7.145353578501806e-08, + "loss": 0.0005, + "step": 33152 + }, + { + "epoch": 0.64, + "learning_rate": 7.14496524406819e-08, + "loss": 0.0005, + "step": 33153 + }, + { + "epoch": 0.64, + "learning_rate": 7.144576909634576e-08, + "loss": 0.0003, + "step": 33154 + }, + { + "epoch": 0.64, + "learning_rate": 7.144188575200962e-08, + "loss": 0.0004, + "step": 33155 + }, + { + "epoch": 0.64, + "learning_rate": 7.143800240767348e-08, + "loss": 0.0008, + "step": 33156 + }, + { + "epoch": 0.64, + "learning_rate": 7.143411906333734e-08, + "loss": 0.0007, + "step": 33157 + }, + { + "epoch": 0.64, + "learning_rate": 7.14302357190012e-08, + "loss": 0.0006, + "step": 33158 + }, + { + "epoch": 0.64, + "learning_rate": 7.142635237466505e-08, + "loss": 0.7706, + "step": 33159 + }, + { + "epoch": 0.64, + "learning_rate": 7.142246903032891e-08, + "loss": 0.0003, + "step": 33160 + }, + { + "epoch": 0.64, + "learning_rate": 7.141858568599277e-08, + "loss": 0.0005, + "step": 33161 + }, + { + "epoch": 0.64, + "learning_rate": 7.141470234165663e-08, + "loss": 0.0005, + "step": 33162 + }, + { + "epoch": 0.64, + "learning_rate": 7.141081899732049e-08, + "loss": 0.0003, + "step": 33163 + }, + { + "epoch": 0.64, + "learning_rate": 7.140693565298434e-08, + "loss": 0.0004, + "step": 33164 + }, + { + "epoch": 0.64, + "learning_rate": 7.14030523086482e-08, + "loss": 0.0036, + "step": 33165 + }, + { + "epoch": 0.64, + "learning_rate": 7.139916896431206e-08, + "loss": 0.0005, + "step": 33166 + }, + { + "epoch": 0.64, + "learning_rate": 7.139528561997592e-08, + "loss": 0.0047, + "step": 33167 + }, + { + "epoch": 0.64, + "learning_rate": 7.139140227563978e-08, + "loss": 0.0099, + "step": 33168 + }, + { + "epoch": 0.64, + "learning_rate": 7.138751893130364e-08, + "loss": 0.0005, + "step": 33169 + }, + { + "epoch": 0.64, + "learning_rate": 7.13836355869675e-08, + "loss": 0.0006, + "step": 33170 + }, + { + "epoch": 0.64, + "learning_rate": 7.137975224263135e-08, + "loss": 0.0025, + "step": 33171 + }, + { + "epoch": 0.64, + "learning_rate": 7.137586889829521e-08, + "loss": 0.0007, + "step": 33172 + }, + { + "epoch": 0.64, + "learning_rate": 7.137198555395907e-08, + "loss": 0.0005, + "step": 33173 + }, + { + "epoch": 0.64, + "learning_rate": 7.136810220962293e-08, + "loss": 0.0022, + "step": 33174 + }, + { + "epoch": 0.64, + "learning_rate": 7.136421886528678e-08, + "loss": 0.3939, + "step": 33175 + }, + { + "epoch": 0.64, + "learning_rate": 7.136033552095064e-08, + "loss": 0.0004, + "step": 33176 + }, + { + "epoch": 0.64, + "learning_rate": 7.13564521766145e-08, + "loss": 0.0006, + "step": 33177 + }, + { + "epoch": 0.64, + "learning_rate": 7.135256883227836e-08, + "loss": 0.0003, + "step": 33178 + }, + { + "epoch": 0.64, + "learning_rate": 7.134868548794222e-08, + "loss": 0.0014, + "step": 33179 + }, + { + "epoch": 0.64, + "learning_rate": 7.134480214360608e-08, + "loss": 0.0007, + "step": 33180 + }, + { + "epoch": 0.64, + "learning_rate": 7.134091879926993e-08, + "loss": 0.0005, + "step": 33181 + }, + { + "epoch": 0.64, + "learning_rate": 7.133703545493378e-08, + "loss": 0.0008, + "step": 33182 + }, + { + "epoch": 0.64, + "learning_rate": 7.133315211059764e-08, + "loss": 0.0003, + "step": 33183 + }, + { + "epoch": 0.64, + "learning_rate": 7.13292687662615e-08, + "loss": 0.0005, + "step": 33184 + }, + { + "epoch": 0.64, + "learning_rate": 7.132538542192535e-08, + "loss": 0.0006, + "step": 33185 + }, + { + "epoch": 0.64, + "learning_rate": 7.132150207758921e-08, + "loss": 0.0107, + "step": 33186 + }, + { + "epoch": 0.64, + "learning_rate": 7.131761873325307e-08, + "loss": 0.0004, + "step": 33187 + }, + { + "epoch": 0.64, + "learning_rate": 7.131373538891693e-08, + "loss": 0.0005, + "step": 33188 + }, + { + "epoch": 0.64, + "learning_rate": 7.130985204458079e-08, + "loss": 0.0005, + "step": 33189 + }, + { + "epoch": 0.64, + "learning_rate": 7.130596870024465e-08, + "loss": 0.0004, + "step": 33190 + }, + { + "epoch": 0.64, + "learning_rate": 7.13020853559085e-08, + "loss": 0.0004, + "step": 33191 + }, + { + "epoch": 0.64, + "learning_rate": 7.129820201157236e-08, + "loss": 0.0005, + "step": 33192 + }, + { + "epoch": 0.64, + "learning_rate": 7.129431866723622e-08, + "loss": 0.0006, + "step": 33193 + }, + { + "epoch": 0.64, + "learning_rate": 7.129043532290008e-08, + "loss": 0.0005, + "step": 33194 + }, + { + "epoch": 0.64, + "learning_rate": 7.128655197856394e-08, + "loss": 0.0028, + "step": 33195 + }, + { + "epoch": 0.64, + "learning_rate": 7.12826686342278e-08, + "loss": 0.0003, + "step": 33196 + }, + { + "epoch": 0.64, + "learning_rate": 7.127878528989165e-08, + "loss": 0.0004, + "step": 33197 + }, + { + "epoch": 0.64, + "learning_rate": 7.127490194555551e-08, + "loss": 0.0007, + "step": 33198 + }, + { + "epoch": 0.64, + "learning_rate": 7.127101860121937e-08, + "loss": 0.0004, + "step": 33199 + }, + { + "epoch": 0.64, + "learning_rate": 7.126713525688323e-08, + "loss": 0.0401, + "step": 33200 + }, + { + "epoch": 0.64, + "learning_rate": 7.126325191254709e-08, + "loss": 0.016, + "step": 33201 + }, + { + "epoch": 0.64, + "learning_rate": 7.125936856821094e-08, + "loss": 0.2031, + "step": 33202 + }, + { + "epoch": 0.64, + "learning_rate": 7.12554852238748e-08, + "loss": 0.0005, + "step": 33203 + }, + { + "epoch": 0.64, + "learning_rate": 7.125160187953866e-08, + "loss": 0.0006, + "step": 33204 + }, + { + "epoch": 0.64, + "learning_rate": 7.124771853520252e-08, + "loss": 0.1365, + "step": 33205 + }, + { + "epoch": 0.64, + "learning_rate": 7.124383519086638e-08, + "loss": 0.0053, + "step": 33206 + }, + { + "epoch": 0.64, + "learning_rate": 7.123995184653024e-08, + "loss": 0.0004, + "step": 33207 + }, + { + "epoch": 0.64, + "learning_rate": 7.12360685021941e-08, + "loss": 0.0005, + "step": 33208 + }, + { + "epoch": 0.64, + "learning_rate": 7.123218515785795e-08, + "loss": 0.0015, + "step": 33209 + }, + { + "epoch": 0.64, + "learning_rate": 7.122830181352181e-08, + "loss": 0.0006, + "step": 33210 + }, + { + "epoch": 0.64, + "learning_rate": 7.122441846918566e-08, + "loss": 0.0004, + "step": 33211 + }, + { + "epoch": 0.64, + "learning_rate": 7.122053512484951e-08, + "loss": 0.8756, + "step": 33212 + }, + { + "epoch": 0.64, + "learning_rate": 7.121665178051337e-08, + "loss": 0.75, + "step": 33213 + }, + { + "epoch": 0.64, + "learning_rate": 7.121276843617723e-08, + "loss": 0.0042, + "step": 33214 + }, + { + "epoch": 0.64, + "learning_rate": 7.120888509184109e-08, + "loss": 0.0011, + "step": 33215 + }, + { + "epoch": 0.64, + "learning_rate": 7.120500174750495e-08, + "loss": 0.0005, + "step": 33216 + }, + { + "epoch": 0.64, + "learning_rate": 7.12011184031688e-08, + "loss": 0.0004, + "step": 33217 + }, + { + "epoch": 0.64, + "learning_rate": 7.119723505883266e-08, + "loss": 0.0006, + "step": 33218 + }, + { + "epoch": 0.64, + "learning_rate": 7.119335171449652e-08, + "loss": 0.6478, + "step": 33219 + }, + { + "epoch": 0.64, + "learning_rate": 7.118946837016038e-08, + "loss": 0.0005, + "step": 33220 + }, + { + "epoch": 0.64, + "learning_rate": 7.118558502582424e-08, + "loss": 0.0004, + "step": 33221 + }, + { + "epoch": 0.64, + "learning_rate": 7.11817016814881e-08, + "loss": 0.0005, + "step": 33222 + }, + { + "epoch": 0.64, + "learning_rate": 7.117781833715195e-08, + "loss": 0.0005, + "step": 33223 + }, + { + "epoch": 0.64, + "learning_rate": 7.117393499281581e-08, + "loss": 0.0005, + "step": 33224 + }, + { + "epoch": 0.64, + "learning_rate": 7.117005164847967e-08, + "loss": 0.0004, + "step": 33225 + }, + { + "epoch": 0.64, + "learning_rate": 7.116616830414353e-08, + "loss": 0.0003, + "step": 33226 + }, + { + "epoch": 0.64, + "learning_rate": 7.116228495980739e-08, + "loss": 0.0004, + "step": 33227 + }, + { + "epoch": 0.64, + "learning_rate": 7.115840161547125e-08, + "loss": 0.3749, + "step": 33228 + }, + { + "epoch": 0.64, + "learning_rate": 7.11545182711351e-08, + "loss": 0.0004, + "step": 33229 + }, + { + "epoch": 0.64, + "learning_rate": 7.115063492679896e-08, + "loss": 0.0005, + "step": 33230 + }, + { + "epoch": 0.64, + "learning_rate": 7.114675158246282e-08, + "loss": 0.0006, + "step": 33231 + }, + { + "epoch": 0.64, + "learning_rate": 7.114286823812668e-08, + "loss": 0.0005, + "step": 33232 + }, + { + "epoch": 0.64, + "learning_rate": 7.113898489379054e-08, + "loss": 0.0007, + "step": 33233 + }, + { + "epoch": 0.64, + "learning_rate": 7.11351015494544e-08, + "loss": 0.0028, + "step": 33234 + }, + { + "epoch": 0.64, + "learning_rate": 7.113121820511825e-08, + "loss": 0.0005, + "step": 33235 + }, + { + "epoch": 0.64, + "learning_rate": 7.112733486078211e-08, + "loss": 0.0011, + "step": 33236 + }, + { + "epoch": 0.64, + "learning_rate": 7.112345151644597e-08, + "loss": 0.0004, + "step": 33237 + }, + { + "epoch": 0.64, + "learning_rate": 7.111956817210983e-08, + "loss": 0.0004, + "step": 33238 + }, + { + "epoch": 0.64, + "learning_rate": 7.111568482777369e-08, + "loss": 0.0005, + "step": 33239 + }, + { + "epoch": 0.64, + "learning_rate": 7.111180148343753e-08, + "loss": 0.0007, + "step": 33240 + }, + { + "epoch": 0.64, + "learning_rate": 7.110791813910139e-08, + "loss": 0.0004, + "step": 33241 + }, + { + "epoch": 0.64, + "learning_rate": 7.110403479476525e-08, + "loss": 0.0005, + "step": 33242 + }, + { + "epoch": 0.64, + "learning_rate": 7.11001514504291e-08, + "loss": 0.0005, + "step": 33243 + }, + { + "epoch": 0.64, + "learning_rate": 7.109626810609296e-08, + "loss": 0.0005, + "step": 33244 + }, + { + "epoch": 0.64, + "learning_rate": 7.109238476175682e-08, + "loss": 0.0005, + "step": 33245 + }, + { + "epoch": 0.64, + "learning_rate": 7.108850141742068e-08, + "loss": 0.0015, + "step": 33246 + }, + { + "epoch": 0.64, + "learning_rate": 7.108461807308454e-08, + "loss": 0.0008, + "step": 33247 + }, + { + "epoch": 0.64, + "learning_rate": 7.10807347287484e-08, + "loss": 0.7712, + "step": 33248 + }, + { + "epoch": 0.64, + "learning_rate": 7.107685138441226e-08, + "loss": 0.0005, + "step": 33249 + }, + { + "epoch": 0.64, + "learning_rate": 7.107296804007611e-08, + "loss": 0.0005, + "step": 33250 + }, + { + "epoch": 0.64, + "learning_rate": 7.106908469573997e-08, + "loss": 0.0005, + "step": 33251 + }, + { + "epoch": 0.65, + "learning_rate": 7.106520135140383e-08, + "loss": 0.0005, + "step": 33252 + }, + { + "epoch": 0.65, + "learning_rate": 7.106131800706769e-08, + "loss": 0.0007, + "step": 33253 + }, + { + "epoch": 0.65, + "learning_rate": 7.105743466273155e-08, + "loss": 0.0003, + "step": 33254 + }, + { + "epoch": 0.65, + "learning_rate": 7.10535513183954e-08, + "loss": 0.0005, + "step": 33255 + }, + { + "epoch": 0.65, + "learning_rate": 7.104966797405926e-08, + "loss": 0.0005, + "step": 33256 + }, + { + "epoch": 0.65, + "learning_rate": 7.104578462972312e-08, + "loss": 0.726, + "step": 33257 + }, + { + "epoch": 0.65, + "learning_rate": 7.104190128538698e-08, + "loss": 0.0005, + "step": 33258 + }, + { + "epoch": 0.65, + "learning_rate": 7.103801794105084e-08, + "loss": 0.2924, + "step": 33259 + }, + { + "epoch": 0.65, + "learning_rate": 7.10341345967147e-08, + "loss": 0.0004, + "step": 33260 + }, + { + "epoch": 0.65, + "learning_rate": 7.103025125237855e-08, + "loss": 0.0005, + "step": 33261 + }, + { + "epoch": 0.65, + "learning_rate": 7.102636790804241e-08, + "loss": 0.0005, + "step": 33262 + }, + { + "epoch": 0.65, + "learning_rate": 7.102248456370627e-08, + "loss": 0.0006, + "step": 33263 + }, + { + "epoch": 0.65, + "learning_rate": 7.101860121937012e-08, + "loss": 0.0005, + "step": 33264 + }, + { + "epoch": 0.65, + "learning_rate": 7.101471787503397e-08, + "loss": 0.0005, + "step": 33265 + }, + { + "epoch": 0.65, + "learning_rate": 7.101083453069783e-08, + "loss": 0.0007, + "step": 33266 + }, + { + "epoch": 0.65, + "learning_rate": 7.100695118636169e-08, + "loss": 0.0004, + "step": 33267 + }, + { + "epoch": 0.65, + "learning_rate": 7.100306784202555e-08, + "loss": 0.0005, + "step": 33268 + }, + { + "epoch": 0.65, + "learning_rate": 7.099918449768941e-08, + "loss": 0.0008, + "step": 33269 + }, + { + "epoch": 0.65, + "learning_rate": 7.099530115335327e-08, + "loss": 0.0004, + "step": 33270 + }, + { + "epoch": 0.65, + "learning_rate": 7.099141780901712e-08, + "loss": 0.0006, + "step": 33271 + }, + { + "epoch": 0.65, + "learning_rate": 7.098753446468098e-08, + "loss": 0.0005, + "step": 33272 + }, + { + "epoch": 0.65, + "learning_rate": 7.098365112034484e-08, + "loss": 0.001, + "step": 33273 + }, + { + "epoch": 0.65, + "learning_rate": 7.09797677760087e-08, + "loss": 0.0016, + "step": 33274 + }, + { + "epoch": 0.65, + "learning_rate": 7.097588443167256e-08, + "loss": 0.0004, + "step": 33275 + }, + { + "epoch": 0.65, + "learning_rate": 7.097200108733641e-08, + "loss": 0.0005, + "step": 33276 + }, + { + "epoch": 0.65, + "learning_rate": 7.096811774300027e-08, + "loss": 0.0007, + "step": 33277 + }, + { + "epoch": 0.65, + "learning_rate": 7.096423439866413e-08, + "loss": 0.003, + "step": 33278 + }, + { + "epoch": 0.65, + "learning_rate": 7.096035105432798e-08, + "loss": 1.0425, + "step": 33279 + }, + { + "epoch": 0.65, + "learning_rate": 7.095646770999183e-08, + "loss": 0.0006, + "step": 33280 + }, + { + "epoch": 0.65, + "learning_rate": 7.095258436565569e-08, + "loss": 0.0006, + "step": 33281 + }, + { + "epoch": 0.65, + "learning_rate": 7.094870102131955e-08, + "loss": 0.0005, + "step": 33282 + }, + { + "epoch": 0.65, + "learning_rate": 7.094481767698341e-08, + "loss": 0.0004, + "step": 33283 + }, + { + "epoch": 0.65, + "learning_rate": 7.094093433264727e-08, + "loss": 0.0005, + "step": 33284 + }, + { + "epoch": 0.65, + "learning_rate": 7.093705098831113e-08, + "loss": 0.0004, + "step": 33285 + }, + { + "epoch": 0.65, + "learning_rate": 7.093316764397498e-08, + "loss": 0.0005, + "step": 33286 + }, + { + "epoch": 0.65, + "learning_rate": 7.092928429963884e-08, + "loss": 0.0007, + "step": 33287 + }, + { + "epoch": 0.65, + "learning_rate": 7.09254009553027e-08, + "loss": 0.1157, + "step": 33288 + }, + { + "epoch": 0.65, + "learning_rate": 7.092151761096656e-08, + "loss": 0.0019, + "step": 33289 + }, + { + "epoch": 0.65, + "learning_rate": 7.091763426663042e-08, + "loss": 0.0008, + "step": 33290 + }, + { + "epoch": 0.65, + "learning_rate": 7.091375092229428e-08, + "loss": 0.0005, + "step": 33291 + }, + { + "epoch": 0.65, + "learning_rate": 7.090986757795813e-08, + "loss": 0.0009, + "step": 33292 + }, + { + "epoch": 0.65, + "learning_rate": 7.090598423362199e-08, + "loss": 0.0006, + "step": 33293 + }, + { + "epoch": 0.65, + "learning_rate": 7.090210088928585e-08, + "loss": 0.0003, + "step": 33294 + }, + { + "epoch": 0.65, + "learning_rate": 7.089821754494971e-08, + "loss": 0.0005, + "step": 33295 + }, + { + "epoch": 0.65, + "learning_rate": 7.089433420061357e-08, + "loss": 0.0003, + "step": 33296 + }, + { + "epoch": 0.65, + "learning_rate": 7.089045085627742e-08, + "loss": 0.0008, + "step": 33297 + }, + { + "epoch": 0.65, + "learning_rate": 7.088656751194127e-08, + "loss": 0.0005, + "step": 33298 + }, + { + "epoch": 0.65, + "learning_rate": 7.088268416760513e-08, + "loss": 0.0004, + "step": 33299 + }, + { + "epoch": 0.65, + "learning_rate": 7.087880082326899e-08, + "loss": 0.0005, + "step": 33300 + }, + { + "epoch": 0.65, + "learning_rate": 7.087491747893284e-08, + "loss": 0.0005, + "step": 33301 + }, + { + "epoch": 0.65, + "learning_rate": 7.08710341345967e-08, + "loss": 0.0006, + "step": 33302 + }, + { + "epoch": 0.65, + "learning_rate": 7.086715079026056e-08, + "loss": 0.0005, + "step": 33303 + }, + { + "epoch": 0.65, + "learning_rate": 7.086326744592442e-08, + "loss": 0.0004, + "step": 33304 + }, + { + "epoch": 0.65, + "learning_rate": 7.085938410158828e-08, + "loss": 0.0022, + "step": 33305 + }, + { + "epoch": 0.65, + "learning_rate": 7.085550075725214e-08, + "loss": 0.0006, + "step": 33306 + }, + { + "epoch": 0.65, + "learning_rate": 7.0851617412916e-08, + "loss": 0.0013, + "step": 33307 + }, + { + "epoch": 0.65, + "learning_rate": 7.084773406857985e-08, + "loss": 0.0004, + "step": 33308 + }, + { + "epoch": 0.65, + "learning_rate": 7.084385072424371e-08, + "loss": 0.0075, + "step": 33309 + }, + { + "epoch": 0.65, + "learning_rate": 7.083996737990757e-08, + "loss": 0.0005, + "step": 33310 + }, + { + "epoch": 0.65, + "learning_rate": 7.083608403557143e-08, + "loss": 0.0006, + "step": 33311 + }, + { + "epoch": 0.65, + "learning_rate": 7.083220069123528e-08, + "loss": 0.0004, + "step": 33312 + }, + { + "epoch": 0.65, + "learning_rate": 7.082831734689914e-08, + "loss": 0.0009, + "step": 33313 + }, + { + "epoch": 0.65, + "learning_rate": 7.0824434002563e-08, + "loss": 0.0005, + "step": 33314 + }, + { + "epoch": 0.65, + "learning_rate": 7.082055065822686e-08, + "loss": 0.0004, + "step": 33315 + }, + { + "epoch": 0.65, + "learning_rate": 7.081666731389072e-08, + "loss": 0.0004, + "step": 33316 + }, + { + "epoch": 0.65, + "learning_rate": 7.081278396955458e-08, + "loss": 0.0009, + "step": 33317 + }, + { + "epoch": 0.65, + "learning_rate": 7.080890062521843e-08, + "loss": 0.0005, + "step": 33318 + }, + { + "epoch": 0.65, + "learning_rate": 7.080501728088229e-08, + "loss": 0.0003, + "step": 33319 + }, + { + "epoch": 0.65, + "learning_rate": 7.080113393654615e-08, + "loss": 0.0005, + "step": 33320 + }, + { + "epoch": 0.65, + "learning_rate": 7.079725059221001e-08, + "loss": 0.0005, + "step": 33321 + }, + { + "epoch": 0.65, + "learning_rate": 7.079336724787387e-08, + "loss": 0.0003, + "step": 33322 + }, + { + "epoch": 0.65, + "learning_rate": 7.078948390353773e-08, + "loss": 0.0013, + "step": 33323 + }, + { + "epoch": 0.65, + "learning_rate": 7.078560055920158e-08, + "loss": 0.0005, + "step": 33324 + }, + { + "epoch": 0.65, + "learning_rate": 7.078171721486544e-08, + "loss": 0.0004, + "step": 33325 + }, + { + "epoch": 0.65, + "learning_rate": 7.07778338705293e-08, + "loss": 0.0005, + "step": 33326 + }, + { + "epoch": 0.65, + "learning_rate": 7.077395052619315e-08, + "loss": 0.0007, + "step": 33327 + }, + { + "epoch": 0.65, + "learning_rate": 7.0770067181857e-08, + "loss": 0.3683, + "step": 33328 + }, + { + "epoch": 0.65, + "learning_rate": 7.076618383752086e-08, + "loss": 0.0004, + "step": 33329 + }, + { + "epoch": 0.65, + "learning_rate": 7.076230049318472e-08, + "loss": 0.0007, + "step": 33330 + }, + { + "epoch": 0.65, + "learning_rate": 7.075841714884858e-08, + "loss": 0.0004, + "step": 33331 + }, + { + "epoch": 0.65, + "learning_rate": 7.075453380451244e-08, + "loss": 0.0007, + "step": 33332 + }, + { + "epoch": 0.65, + "learning_rate": 7.07506504601763e-08, + "loss": 0.0007, + "step": 33333 + }, + { + "epoch": 0.65, + "learning_rate": 7.074676711584015e-08, + "loss": 0.0014, + "step": 33334 + }, + { + "epoch": 0.65, + "learning_rate": 7.074288377150401e-08, + "loss": 0.0005, + "step": 33335 + }, + { + "epoch": 0.65, + "learning_rate": 7.073900042716787e-08, + "loss": 0.0003, + "step": 33336 + }, + { + "epoch": 0.65, + "learning_rate": 7.073511708283173e-08, + "loss": 0.8421, + "step": 33337 + }, + { + "epoch": 0.65, + "learning_rate": 7.073123373849559e-08, + "loss": 0.0008, + "step": 33338 + }, + { + "epoch": 0.65, + "learning_rate": 7.072735039415944e-08, + "loss": 0.0005, + "step": 33339 + }, + { + "epoch": 0.65, + "learning_rate": 7.07234670498233e-08, + "loss": 0.0005, + "step": 33340 + }, + { + "epoch": 0.65, + "learning_rate": 7.071958370548716e-08, + "loss": 0.0005, + "step": 33341 + }, + { + "epoch": 0.65, + "learning_rate": 7.071570036115102e-08, + "loss": 0.0045, + "step": 33342 + }, + { + "epoch": 0.65, + "learning_rate": 7.071181701681488e-08, + "loss": 0.7652, + "step": 33343 + }, + { + "epoch": 0.65, + "learning_rate": 7.070793367247874e-08, + "loss": 0.0021, + "step": 33344 + }, + { + "epoch": 0.65, + "learning_rate": 7.07040503281426e-08, + "loss": 0.2438, + "step": 33345 + }, + { + "epoch": 0.65, + "learning_rate": 7.070016698380645e-08, + "loss": 0.0006, + "step": 33346 + }, + { + "epoch": 0.65, + "learning_rate": 7.069628363947031e-08, + "loss": 0.1265, + "step": 33347 + }, + { + "epoch": 0.65, + "learning_rate": 7.069240029513417e-08, + "loss": 0.0005, + "step": 33348 + }, + { + "epoch": 0.65, + "learning_rate": 7.068851695079803e-08, + "loss": 0.0564, + "step": 33349 + }, + { + "epoch": 0.65, + "learning_rate": 7.068463360646188e-08, + "loss": 0.0005, + "step": 33350 + }, + { + "epoch": 0.65, + "learning_rate": 7.068075026212574e-08, + "loss": 1.1352, + "step": 33351 + }, + { + "epoch": 0.65, + "learning_rate": 7.06768669177896e-08, + "loss": 0.0023, + "step": 33352 + }, + { + "epoch": 0.65, + "learning_rate": 7.067298357345346e-08, + "loss": 0.0005, + "step": 33353 + }, + { + "epoch": 0.65, + "learning_rate": 7.066910022911732e-08, + "loss": 0.0005, + "step": 33354 + }, + { + "epoch": 0.65, + "learning_rate": 7.066521688478118e-08, + "loss": 0.0003, + "step": 33355 + }, + { + "epoch": 0.65, + "learning_rate": 7.066133354044502e-08, + "loss": 0.0005, + "step": 33356 + }, + { + "epoch": 0.65, + "learning_rate": 7.065745019610888e-08, + "loss": 0.0008, + "step": 33357 + }, + { + "epoch": 0.65, + "learning_rate": 7.065356685177274e-08, + "loss": 0.092, + "step": 33358 + }, + { + "epoch": 0.65, + "learning_rate": 7.06496835074366e-08, + "loss": 0.0005, + "step": 33359 + }, + { + "epoch": 0.65, + "learning_rate": 7.064580016310045e-08, + "loss": 0.0006, + "step": 33360 + }, + { + "epoch": 0.65, + "learning_rate": 7.064191681876431e-08, + "loss": 0.0005, + "step": 33361 + }, + { + "epoch": 0.65, + "learning_rate": 7.063803347442817e-08, + "loss": 0.0003, + "step": 33362 + }, + { + "epoch": 0.65, + "learning_rate": 7.063415013009203e-08, + "loss": 0.0009, + "step": 33363 + }, + { + "epoch": 0.65, + "learning_rate": 7.063026678575589e-08, + "loss": 0.0006, + "step": 33364 + }, + { + "epoch": 0.65, + "learning_rate": 7.062638344141975e-08, + "loss": 1.0565, + "step": 33365 + }, + { + "epoch": 0.65, + "learning_rate": 7.06225000970836e-08, + "loss": 0.0011, + "step": 33366 + }, + { + "epoch": 0.65, + "learning_rate": 7.061861675274746e-08, + "loss": 0.0003, + "step": 33367 + }, + { + "epoch": 0.65, + "learning_rate": 7.061473340841132e-08, + "loss": 0.0004, + "step": 33368 + }, + { + "epoch": 0.65, + "learning_rate": 7.061085006407518e-08, + "loss": 0.0008, + "step": 33369 + }, + { + "epoch": 0.65, + "learning_rate": 7.060696671973904e-08, + "loss": 0.0005, + "step": 33370 + }, + { + "epoch": 0.65, + "learning_rate": 7.06030833754029e-08, + "loss": 0.0006, + "step": 33371 + }, + { + "epoch": 0.65, + "learning_rate": 7.059920003106675e-08, + "loss": 0.0008, + "step": 33372 + }, + { + "epoch": 0.65, + "learning_rate": 7.059531668673061e-08, + "loss": 0.001, + "step": 33373 + }, + { + "epoch": 0.65, + "learning_rate": 7.059143334239447e-08, + "loss": 0.0007, + "step": 33374 + }, + { + "epoch": 0.65, + "learning_rate": 7.058754999805833e-08, + "loss": 0.0009, + "step": 33375 + }, + { + "epoch": 0.65, + "learning_rate": 7.058366665372219e-08, + "loss": 0.0268, + "step": 33376 + }, + { + "epoch": 0.65, + "learning_rate": 7.057978330938604e-08, + "loss": 0.0004, + "step": 33377 + }, + { + "epoch": 0.65, + "learning_rate": 7.05758999650499e-08, + "loss": 0.0008, + "step": 33378 + }, + { + "epoch": 0.65, + "learning_rate": 7.057201662071376e-08, + "loss": 0.0004, + "step": 33379 + }, + { + "epoch": 0.65, + "learning_rate": 7.056813327637762e-08, + "loss": 0.0071, + "step": 33380 + }, + { + "epoch": 0.65, + "learning_rate": 7.056424993204148e-08, + "loss": 0.0006, + "step": 33381 + }, + { + "epoch": 0.65, + "learning_rate": 7.056036658770534e-08, + "loss": 0.0042, + "step": 33382 + }, + { + "epoch": 0.65, + "learning_rate": 7.05564832433692e-08, + "loss": 0.0005, + "step": 33383 + }, + { + "epoch": 0.65, + "learning_rate": 7.055259989903305e-08, + "loss": 0.001, + "step": 33384 + }, + { + "epoch": 0.65, + "learning_rate": 7.05487165546969e-08, + "loss": 0.0005, + "step": 33385 + }, + { + "epoch": 0.65, + "learning_rate": 7.054483321036076e-08, + "loss": 0.0004, + "step": 33386 + }, + { + "epoch": 0.65, + "learning_rate": 7.054094986602461e-08, + "loss": 0.0005, + "step": 33387 + }, + { + "epoch": 0.65, + "learning_rate": 7.053706652168847e-08, + "loss": 0.0005, + "step": 33388 + }, + { + "epoch": 0.65, + "learning_rate": 7.053318317735233e-08, + "loss": 0.0004, + "step": 33389 + }, + { + "epoch": 0.65, + "learning_rate": 7.052929983301619e-08, + "loss": 0.0007, + "step": 33390 + }, + { + "epoch": 0.65, + "learning_rate": 7.052541648868005e-08, + "loss": 0.0005, + "step": 33391 + }, + { + "epoch": 0.65, + "learning_rate": 7.05215331443439e-08, + "loss": 0.0064, + "step": 33392 + }, + { + "epoch": 0.65, + "learning_rate": 7.051764980000776e-08, + "loss": 0.0005, + "step": 33393 + }, + { + "epoch": 0.65, + "learning_rate": 7.051376645567162e-08, + "loss": 0.027, + "step": 33394 + }, + { + "epoch": 0.65, + "learning_rate": 7.050988311133548e-08, + "loss": 0.0004, + "step": 33395 + }, + { + "epoch": 0.65, + "learning_rate": 7.050599976699934e-08, + "loss": 0.0016, + "step": 33396 + }, + { + "epoch": 0.65, + "learning_rate": 7.05021164226632e-08, + "loss": 0.0006, + "step": 33397 + }, + { + "epoch": 0.65, + "learning_rate": 7.049823307832705e-08, + "loss": 0.459, + "step": 33398 + }, + { + "epoch": 0.65, + "learning_rate": 7.049434973399091e-08, + "loss": 0.0015, + "step": 33399 + }, + { + "epoch": 0.65, + "learning_rate": 7.049046638965477e-08, + "loss": 0.0103, + "step": 33400 + }, + { + "epoch": 0.65, + "learning_rate": 7.048658304531863e-08, + "loss": 0.0006, + "step": 33401 + }, + { + "epoch": 0.65, + "learning_rate": 7.048269970098249e-08, + "loss": 0.0005, + "step": 33402 + }, + { + "epoch": 0.65, + "learning_rate": 7.047881635664635e-08, + "loss": 0.0017, + "step": 33403 + }, + { + "epoch": 0.65, + "learning_rate": 7.04749330123102e-08, + "loss": 0.0005, + "step": 33404 + }, + { + "epoch": 0.65, + "learning_rate": 7.047104966797406e-08, + "loss": 0.0005, + "step": 33405 + }, + { + "epoch": 0.65, + "learning_rate": 7.046716632363792e-08, + "loss": 0.0004, + "step": 33406 + }, + { + "epoch": 0.65, + "learning_rate": 7.046328297930178e-08, + "loss": 0.0005, + "step": 33407 + }, + { + "epoch": 0.65, + "learning_rate": 7.045939963496564e-08, + "loss": 0.0004, + "step": 33408 + }, + { + "epoch": 0.65, + "learning_rate": 7.04555162906295e-08, + "loss": 0.0005, + "step": 33409 + }, + { + "epoch": 0.65, + "learning_rate": 7.045163294629335e-08, + "loss": 0.0004, + "step": 33410 + }, + { + "epoch": 0.65, + "learning_rate": 7.044774960195721e-08, + "loss": 0.0004, + "step": 33411 + }, + { + "epoch": 0.65, + "learning_rate": 7.044386625762107e-08, + "loss": 0.0005, + "step": 33412 + }, + { + "epoch": 0.65, + "learning_rate": 7.043998291328493e-08, + "loss": 0.0023, + "step": 33413 + }, + { + "epoch": 0.65, + "learning_rate": 7.043609956894877e-08, + "loss": 0.0005, + "step": 33414 + }, + { + "epoch": 0.65, + "learning_rate": 7.043221622461263e-08, + "loss": 0.0004, + "step": 33415 + }, + { + "epoch": 0.65, + "learning_rate": 7.042833288027649e-08, + "loss": 0.0008, + "step": 33416 + }, + { + "epoch": 0.65, + "learning_rate": 7.042444953594035e-08, + "loss": 0.0007, + "step": 33417 + }, + { + "epoch": 0.65, + "learning_rate": 7.04205661916042e-08, + "loss": 0.0016, + "step": 33418 + }, + { + "epoch": 0.65, + "learning_rate": 7.041668284726806e-08, + "loss": 0.0005, + "step": 33419 + }, + { + "epoch": 0.65, + "learning_rate": 7.041279950293192e-08, + "loss": 0.0004, + "step": 33420 + }, + { + "epoch": 0.65, + "learning_rate": 7.040891615859578e-08, + "loss": 0.0019, + "step": 33421 + }, + { + "epoch": 0.65, + "learning_rate": 7.040503281425964e-08, + "loss": 0.0004, + "step": 33422 + }, + { + "epoch": 0.65, + "learning_rate": 7.04011494699235e-08, + "loss": 0.0005, + "step": 33423 + }, + { + "epoch": 0.65, + "learning_rate": 7.039726612558736e-08, + "loss": 0.0004, + "step": 33424 + }, + { + "epoch": 0.65, + "learning_rate": 7.039338278125121e-08, + "loss": 0.0005, + "step": 33425 + }, + { + "epoch": 0.65, + "learning_rate": 7.038949943691507e-08, + "loss": 0.0005, + "step": 33426 + }, + { + "epoch": 0.65, + "learning_rate": 7.038561609257893e-08, + "loss": 0.0008, + "step": 33427 + }, + { + "epoch": 0.65, + "learning_rate": 7.038173274824279e-08, + "loss": 0.0004, + "step": 33428 + }, + { + "epoch": 0.65, + "learning_rate": 7.037784940390665e-08, + "loss": 0.0017, + "step": 33429 + }, + { + "epoch": 0.65, + "learning_rate": 7.03739660595705e-08, + "loss": 0.0003, + "step": 33430 + }, + { + "epoch": 0.65, + "learning_rate": 7.037008271523436e-08, + "loss": 0.0006, + "step": 33431 + }, + { + "epoch": 0.65, + "learning_rate": 7.036619937089822e-08, + "loss": 0.0056, + "step": 33432 + }, + { + "epoch": 0.65, + "learning_rate": 7.036231602656208e-08, + "loss": 0.0004, + "step": 33433 + }, + { + "epoch": 0.65, + "learning_rate": 7.035843268222594e-08, + "loss": 0.0003, + "step": 33434 + }, + { + "epoch": 0.65, + "learning_rate": 7.03545493378898e-08, + "loss": 0.0005, + "step": 33435 + }, + { + "epoch": 0.65, + "learning_rate": 7.035066599355365e-08, + "loss": 0.0005, + "step": 33436 + }, + { + "epoch": 0.65, + "learning_rate": 7.034678264921751e-08, + "loss": 0.0005, + "step": 33437 + }, + { + "epoch": 0.65, + "learning_rate": 7.034289930488137e-08, + "loss": 0.0005, + "step": 33438 + }, + { + "epoch": 0.65, + "learning_rate": 7.033901596054523e-08, + "loss": 0.0005, + "step": 33439 + }, + { + "epoch": 0.65, + "learning_rate": 7.033513261620909e-08, + "loss": 0.0005, + "step": 33440 + }, + { + "epoch": 0.65, + "learning_rate": 7.033124927187293e-08, + "loss": 0.0003, + "step": 33441 + }, + { + "epoch": 0.65, + "learning_rate": 7.032736592753679e-08, + "loss": 0.0057, + "step": 33442 + }, + { + "epoch": 0.65, + "learning_rate": 7.032348258320065e-08, + "loss": 0.0004, + "step": 33443 + }, + { + "epoch": 0.65, + "learning_rate": 7.031959923886451e-08, + "loss": 0.0006, + "step": 33444 + }, + { + "epoch": 0.65, + "learning_rate": 7.031571589452837e-08, + "loss": 0.0008, + "step": 33445 + }, + { + "epoch": 0.65, + "learning_rate": 7.031183255019222e-08, + "loss": 0.0003, + "step": 33446 + }, + { + "epoch": 0.65, + "learning_rate": 7.030794920585608e-08, + "loss": 0.0005, + "step": 33447 + }, + { + "epoch": 0.65, + "learning_rate": 7.030406586151994e-08, + "loss": 0.0004, + "step": 33448 + }, + { + "epoch": 0.65, + "learning_rate": 7.03001825171838e-08, + "loss": 0.0005, + "step": 33449 + }, + { + "epoch": 0.65, + "learning_rate": 7.029629917284766e-08, + "loss": 0.0009, + "step": 33450 + }, + { + "epoch": 0.65, + "learning_rate": 7.029241582851151e-08, + "loss": 0.0005, + "step": 33451 + }, + { + "epoch": 0.65, + "learning_rate": 7.028853248417537e-08, + "loss": 0.0004, + "step": 33452 + }, + { + "epoch": 0.65, + "learning_rate": 7.028464913983923e-08, + "loss": 0.0026, + "step": 33453 + }, + { + "epoch": 0.65, + "learning_rate": 7.028076579550309e-08, + "loss": 0.0027, + "step": 33454 + }, + { + "epoch": 0.65, + "learning_rate": 7.027688245116695e-08, + "loss": 0.0004, + "step": 33455 + }, + { + "epoch": 0.65, + "learning_rate": 7.027299910683079e-08, + "loss": 0.0004, + "step": 33456 + }, + { + "epoch": 0.65, + "learning_rate": 7.026911576249465e-08, + "loss": 0.0009, + "step": 33457 + }, + { + "epoch": 0.65, + "learning_rate": 7.026523241815851e-08, + "loss": 0.0072, + "step": 33458 + }, + { + "epoch": 0.65, + "learning_rate": 7.026134907382237e-08, + "loss": 0.0004, + "step": 33459 + }, + { + "epoch": 0.65, + "learning_rate": 7.025746572948623e-08, + "loss": 1.0938, + "step": 33460 + }, + { + "epoch": 0.65, + "learning_rate": 7.025358238515008e-08, + "loss": 0.0004, + "step": 33461 + }, + { + "epoch": 0.65, + "learning_rate": 7.024969904081394e-08, + "loss": 0.0006, + "step": 33462 + }, + { + "epoch": 0.65, + "learning_rate": 7.02458156964778e-08, + "loss": 0.4817, + "step": 33463 + }, + { + "epoch": 0.65, + "learning_rate": 7.024193235214166e-08, + "loss": 0.0004, + "step": 33464 + }, + { + "epoch": 0.65, + "learning_rate": 7.023804900780552e-08, + "loss": 0.0531, + "step": 33465 + }, + { + "epoch": 0.65, + "learning_rate": 7.023416566346938e-08, + "loss": 0.0006, + "step": 33466 + }, + { + "epoch": 0.65, + "learning_rate": 7.023028231913323e-08, + "loss": 0.0004, + "step": 33467 + }, + { + "epoch": 0.65, + "learning_rate": 7.022639897479709e-08, + "loss": 0.0004, + "step": 33468 + }, + { + "epoch": 0.65, + "learning_rate": 7.022251563046095e-08, + "loss": 0.0004, + "step": 33469 + }, + { + "epoch": 0.65, + "learning_rate": 7.021863228612481e-08, + "loss": 0.0008, + "step": 33470 + }, + { + "epoch": 0.65, + "learning_rate": 7.021474894178867e-08, + "loss": 0.0006, + "step": 33471 + }, + { + "epoch": 0.65, + "learning_rate": 7.021086559745251e-08, + "loss": 0.0008, + "step": 33472 + }, + { + "epoch": 0.65, + "learning_rate": 7.020698225311637e-08, + "loss": 0.0006, + "step": 33473 + }, + { + "epoch": 0.65, + "learning_rate": 7.020309890878023e-08, + "loss": 0.0003, + "step": 33474 + }, + { + "epoch": 0.65, + "learning_rate": 7.019921556444409e-08, + "loss": 0.8467, + "step": 33475 + }, + { + "epoch": 0.65, + "learning_rate": 7.019533222010794e-08, + "loss": 0.0005, + "step": 33476 + }, + { + "epoch": 0.65, + "learning_rate": 7.01914488757718e-08, + "loss": 0.0005, + "step": 33477 + }, + { + "epoch": 0.65, + "learning_rate": 7.018756553143566e-08, + "loss": 0.0005, + "step": 33478 + }, + { + "epoch": 0.65, + "learning_rate": 7.018368218709952e-08, + "loss": 0.0005, + "step": 33479 + }, + { + "epoch": 0.65, + "learning_rate": 7.017979884276338e-08, + "loss": 0.0005, + "step": 33480 + }, + { + "epoch": 0.65, + "learning_rate": 7.017591549842724e-08, + "loss": 0.0005, + "step": 33481 + }, + { + "epoch": 0.65, + "learning_rate": 7.01720321540911e-08, + "loss": 0.0004, + "step": 33482 + }, + { + "epoch": 0.65, + "learning_rate": 7.016814880975495e-08, + "loss": 0.0005, + "step": 33483 + }, + { + "epoch": 0.65, + "learning_rate": 7.016426546541881e-08, + "loss": 0.0004, + "step": 33484 + }, + { + "epoch": 0.65, + "learning_rate": 7.016038212108267e-08, + "loss": 0.0007, + "step": 33485 + }, + { + "epoch": 0.65, + "learning_rate": 7.015649877674653e-08, + "loss": 0.0005, + "step": 33486 + }, + { + "epoch": 0.65, + "learning_rate": 7.015261543241039e-08, + "loss": 0.0029, + "step": 33487 + }, + { + "epoch": 0.65, + "learning_rate": 7.014873208807424e-08, + "loss": 0.0005, + "step": 33488 + }, + { + "epoch": 0.65, + "learning_rate": 7.01448487437381e-08, + "loss": 0.0004, + "step": 33489 + }, + { + "epoch": 0.65, + "learning_rate": 7.014096539940196e-08, + "loss": 0.0004, + "step": 33490 + }, + { + "epoch": 0.65, + "learning_rate": 7.013708205506582e-08, + "loss": 0.0004, + "step": 33491 + }, + { + "epoch": 0.65, + "learning_rate": 7.013319871072968e-08, + "loss": 0.0008, + "step": 33492 + }, + { + "epoch": 0.65, + "learning_rate": 7.012931536639353e-08, + "loss": 0.0009, + "step": 33493 + }, + { + "epoch": 0.65, + "learning_rate": 7.012543202205739e-08, + "loss": 0.0006, + "step": 33494 + }, + { + "epoch": 0.65, + "learning_rate": 7.012154867772125e-08, + "loss": 0.0003, + "step": 33495 + }, + { + "epoch": 0.65, + "learning_rate": 7.011766533338511e-08, + "loss": 0.0004, + "step": 33496 + }, + { + "epoch": 0.65, + "learning_rate": 7.011378198904897e-08, + "loss": 0.0004, + "step": 33497 + }, + { + "epoch": 0.65, + "learning_rate": 7.010989864471283e-08, + "loss": 0.0007, + "step": 33498 + }, + { + "epoch": 0.65, + "learning_rate": 7.010601530037668e-08, + "loss": 0.0004, + "step": 33499 + }, + { + "epoch": 0.65, + "learning_rate": 7.010213195604054e-08, + "loss": 0.0021, + "step": 33500 + }, + { + "epoch": 0.65, + "learning_rate": 7.009824861170439e-08, + "loss": 0.0007, + "step": 33501 + }, + { + "epoch": 0.65, + "learning_rate": 7.009436526736825e-08, + "loss": 0.0004, + "step": 33502 + }, + { + "epoch": 0.65, + "learning_rate": 7.00904819230321e-08, + "loss": 0.0005, + "step": 33503 + }, + { + "epoch": 0.65, + "learning_rate": 7.008659857869596e-08, + "loss": 0.0005, + "step": 33504 + }, + { + "epoch": 0.65, + "learning_rate": 7.008271523435982e-08, + "loss": 0.0006, + "step": 33505 + }, + { + "epoch": 0.65, + "learning_rate": 7.007883189002368e-08, + "loss": 0.0006, + "step": 33506 + }, + { + "epoch": 0.65, + "learning_rate": 7.007494854568754e-08, + "loss": 0.0004, + "step": 33507 + }, + { + "epoch": 0.65, + "learning_rate": 7.00710652013514e-08, + "loss": 0.0004, + "step": 33508 + }, + { + "epoch": 0.65, + "learning_rate": 7.006718185701525e-08, + "loss": 0.0006, + "step": 33509 + }, + { + "epoch": 0.65, + "learning_rate": 7.006329851267911e-08, + "loss": 0.0004, + "step": 33510 + }, + { + "epoch": 0.65, + "learning_rate": 7.005941516834297e-08, + "loss": 0.5485, + "step": 33511 + }, + { + "epoch": 0.65, + "learning_rate": 7.005553182400683e-08, + "loss": 0.0004, + "step": 33512 + }, + { + "epoch": 0.65, + "learning_rate": 7.005164847967069e-08, + "loss": 0.674, + "step": 33513 + }, + { + "epoch": 0.65, + "learning_rate": 7.004776513533454e-08, + "loss": 0.0005, + "step": 33514 + }, + { + "epoch": 0.65, + "learning_rate": 7.00438817909984e-08, + "loss": 0.0005, + "step": 33515 + }, + { + "epoch": 0.65, + "learning_rate": 7.003999844666226e-08, + "loss": 0.1696, + "step": 33516 + }, + { + "epoch": 0.65, + "learning_rate": 7.003611510232612e-08, + "loss": 0.0004, + "step": 33517 + }, + { + "epoch": 0.65, + "learning_rate": 7.003223175798998e-08, + "loss": 0.0005, + "step": 33518 + }, + { + "epoch": 0.65, + "learning_rate": 7.002834841365384e-08, + "loss": 0.0294, + "step": 33519 + }, + { + "epoch": 0.65, + "learning_rate": 7.00244650693177e-08, + "loss": 0.0004, + "step": 33520 + }, + { + "epoch": 0.65, + "learning_rate": 7.002058172498155e-08, + "loss": 0.0151, + "step": 33521 + }, + { + "epoch": 0.65, + "learning_rate": 7.001669838064541e-08, + "loss": 0.0005, + "step": 33522 + }, + { + "epoch": 0.65, + "learning_rate": 7.001281503630927e-08, + "loss": 0.0005, + "step": 33523 + }, + { + "epoch": 0.65, + "learning_rate": 7.000893169197313e-08, + "loss": 0.0005, + "step": 33524 + }, + { + "epoch": 0.65, + "learning_rate": 7.000504834763699e-08, + "loss": 0.0005, + "step": 33525 + }, + { + "epoch": 0.65, + "learning_rate": 7.000116500330084e-08, + "loss": 0.0004, + "step": 33526 + }, + { + "epoch": 0.65, + "learning_rate": 6.99972816589647e-08, + "loss": 0.0006, + "step": 33527 + }, + { + "epoch": 0.65, + "learning_rate": 6.999339831462856e-08, + "loss": 0.0004, + "step": 33528 + }, + { + "epoch": 0.65, + "learning_rate": 6.998951497029242e-08, + "loss": 0.0004, + "step": 33529 + }, + { + "epoch": 0.65, + "learning_rate": 6.998563162595626e-08, + "loss": 0.0005, + "step": 33530 + }, + { + "epoch": 0.65, + "learning_rate": 6.998174828162012e-08, + "loss": 0.9944, + "step": 33531 + }, + { + "epoch": 0.65, + "learning_rate": 6.997786493728398e-08, + "loss": 0.0008, + "step": 33532 + }, + { + "epoch": 0.65, + "learning_rate": 6.997398159294784e-08, + "loss": 0.7245, + "step": 33533 + }, + { + "epoch": 0.65, + "learning_rate": 6.99700982486117e-08, + "loss": 0.0004, + "step": 33534 + }, + { + "epoch": 0.65, + "learning_rate": 6.996621490427555e-08, + "loss": 0.0005, + "step": 33535 + }, + { + "epoch": 0.65, + "learning_rate": 6.996233155993941e-08, + "loss": 0.3311, + "step": 33536 + }, + { + "epoch": 0.65, + "learning_rate": 6.995844821560327e-08, + "loss": 0.4407, + "step": 33537 + }, + { + "epoch": 0.65, + "learning_rate": 6.995456487126713e-08, + "loss": 0.0004, + "step": 33538 + }, + { + "epoch": 0.65, + "learning_rate": 6.995068152693099e-08, + "loss": 0.0005, + "step": 33539 + }, + { + "epoch": 0.65, + "learning_rate": 6.994679818259485e-08, + "loss": 0.3692, + "step": 33540 + }, + { + "epoch": 0.65, + "learning_rate": 6.99429148382587e-08, + "loss": 0.0005, + "step": 33541 + }, + { + "epoch": 0.65, + "learning_rate": 6.993903149392256e-08, + "loss": 0.4027, + "step": 33542 + }, + { + "epoch": 0.65, + "learning_rate": 6.993514814958642e-08, + "loss": 0.001, + "step": 33543 + }, + { + "epoch": 0.65, + "learning_rate": 6.993126480525028e-08, + "loss": 0.0005, + "step": 33544 + }, + { + "epoch": 0.65, + "learning_rate": 6.992738146091414e-08, + "loss": 0.0008, + "step": 33545 + }, + { + "epoch": 0.65, + "learning_rate": 6.9923498116578e-08, + "loss": 0.0004, + "step": 33546 + }, + { + "epoch": 0.65, + "learning_rate": 6.991961477224185e-08, + "loss": 0.0026, + "step": 33547 + }, + { + "epoch": 0.65, + "learning_rate": 6.991573142790571e-08, + "loss": 0.0005, + "step": 33548 + }, + { + "epoch": 0.65, + "learning_rate": 6.991184808356957e-08, + "loss": 0.0005, + "step": 33549 + }, + { + "epoch": 0.65, + "learning_rate": 6.990796473923343e-08, + "loss": 0.0006, + "step": 33550 + }, + { + "epoch": 0.65, + "learning_rate": 6.990408139489729e-08, + "loss": 0.0004, + "step": 33551 + }, + { + "epoch": 0.65, + "learning_rate": 6.990019805056114e-08, + "loss": 0.1816, + "step": 33552 + }, + { + "epoch": 0.65, + "learning_rate": 6.9896314706225e-08, + "loss": 0.2537, + "step": 33553 + }, + { + "epoch": 0.65, + "learning_rate": 6.989243136188886e-08, + "loss": 0.0003, + "step": 33554 + }, + { + "epoch": 0.65, + "learning_rate": 6.988854801755272e-08, + "loss": 0.0004, + "step": 33555 + }, + { + "epoch": 0.65, + "learning_rate": 6.988466467321658e-08, + "loss": 0.0005, + "step": 33556 + }, + { + "epoch": 0.65, + "learning_rate": 6.988078132888044e-08, + "loss": 0.0006, + "step": 33557 + }, + { + "epoch": 0.65, + "learning_rate": 6.98768979845443e-08, + "loss": 0.0006, + "step": 33558 + }, + { + "epoch": 0.65, + "learning_rate": 6.987301464020814e-08, + "loss": 0.001, + "step": 33559 + }, + { + "epoch": 0.65, + "learning_rate": 6.9869131295872e-08, + "loss": 0.0006, + "step": 33560 + }, + { + "epoch": 0.65, + "learning_rate": 6.986524795153586e-08, + "loss": 0.0005, + "step": 33561 + }, + { + "epoch": 0.65, + "learning_rate": 6.986136460719971e-08, + "loss": 0.0007, + "step": 33562 + }, + { + "epoch": 0.65, + "learning_rate": 6.985748126286357e-08, + "loss": 0.0005, + "step": 33563 + }, + { + "epoch": 0.65, + "learning_rate": 6.985359791852743e-08, + "loss": 0.0004, + "step": 33564 + }, + { + "epoch": 0.65, + "learning_rate": 6.984971457419129e-08, + "loss": 0.0004, + "step": 33565 + }, + { + "epoch": 0.65, + "learning_rate": 6.984583122985515e-08, + "loss": 1.3871, + "step": 33566 + }, + { + "epoch": 0.65, + "learning_rate": 6.9841947885519e-08, + "loss": 0.0005, + "step": 33567 + }, + { + "epoch": 0.65, + "learning_rate": 6.983806454118286e-08, + "loss": 0.0004, + "step": 33568 + }, + { + "epoch": 0.65, + "learning_rate": 6.983418119684672e-08, + "loss": 0.0004, + "step": 33569 + }, + { + "epoch": 0.65, + "learning_rate": 6.983029785251058e-08, + "loss": 0.0005, + "step": 33570 + }, + { + "epoch": 0.65, + "learning_rate": 6.982641450817444e-08, + "loss": 0.0005, + "step": 33571 + }, + { + "epoch": 0.65, + "learning_rate": 6.98225311638383e-08, + "loss": 0.0032, + "step": 33572 + }, + { + "epoch": 0.65, + "learning_rate": 6.981864781950215e-08, + "loss": 0.0007, + "step": 33573 + }, + { + "epoch": 0.65, + "learning_rate": 6.981476447516601e-08, + "loss": 0.0004, + "step": 33574 + }, + { + "epoch": 0.65, + "learning_rate": 6.981088113082987e-08, + "loss": 0.0005, + "step": 33575 + }, + { + "epoch": 0.65, + "learning_rate": 6.980699778649373e-08, + "loss": 1.1883, + "step": 33576 + }, + { + "epoch": 0.65, + "learning_rate": 6.980311444215759e-08, + "loss": 0.0005, + "step": 33577 + }, + { + "epoch": 0.65, + "learning_rate": 6.979923109782145e-08, + "loss": 0.0005, + "step": 33578 + }, + { + "epoch": 0.65, + "learning_rate": 6.97953477534853e-08, + "loss": 0.0006, + "step": 33579 + }, + { + "epoch": 0.65, + "learning_rate": 6.979146440914916e-08, + "loss": 0.0005, + "step": 33580 + }, + { + "epoch": 0.65, + "learning_rate": 6.978758106481302e-08, + "loss": 0.0025, + "step": 33581 + }, + { + "epoch": 0.65, + "learning_rate": 6.978369772047688e-08, + "loss": 0.0003, + "step": 33582 + }, + { + "epoch": 0.65, + "learning_rate": 6.977981437614074e-08, + "loss": 0.0004, + "step": 33583 + }, + { + "epoch": 0.65, + "learning_rate": 6.97759310318046e-08, + "loss": 0.0003, + "step": 33584 + }, + { + "epoch": 0.65, + "learning_rate": 6.977204768746845e-08, + "loss": 0.0006, + "step": 33585 + }, + { + "epoch": 0.65, + "learning_rate": 6.976816434313231e-08, + "loss": 0.0005, + "step": 33586 + }, + { + "epoch": 0.65, + "learning_rate": 6.976428099879617e-08, + "loss": 0.0004, + "step": 33587 + }, + { + "epoch": 0.65, + "learning_rate": 6.976039765446001e-08, + "loss": 0.0005, + "step": 33588 + }, + { + "epoch": 0.65, + "learning_rate": 6.975651431012387e-08, + "loss": 0.0022, + "step": 33589 + }, + { + "epoch": 0.65, + "learning_rate": 6.975263096578773e-08, + "loss": 0.0005, + "step": 33590 + }, + { + "epoch": 0.65, + "learning_rate": 6.974874762145159e-08, + "loss": 0.0005, + "step": 33591 + }, + { + "epoch": 0.65, + "learning_rate": 6.974486427711545e-08, + "loss": 0.0005, + "step": 33592 + }, + { + "epoch": 0.65, + "learning_rate": 6.97409809327793e-08, + "loss": 0.0004, + "step": 33593 + }, + { + "epoch": 0.65, + "learning_rate": 6.973709758844316e-08, + "loss": 0.0236, + "step": 33594 + }, + { + "epoch": 0.65, + "learning_rate": 6.973321424410702e-08, + "loss": 0.0004, + "step": 33595 + }, + { + "epoch": 0.65, + "learning_rate": 6.972933089977088e-08, + "loss": 1.3546, + "step": 33596 + }, + { + "epoch": 0.65, + "learning_rate": 6.972544755543474e-08, + "loss": 0.0006, + "step": 33597 + }, + { + "epoch": 0.65, + "learning_rate": 6.97215642110986e-08, + "loss": 0.0006, + "step": 33598 + }, + { + "epoch": 0.65, + "learning_rate": 6.971768086676246e-08, + "loss": 0.4379, + "step": 33599 + }, + { + "epoch": 0.65, + "learning_rate": 6.971379752242631e-08, + "loss": 0.0005, + "step": 33600 + }, + { + "epoch": 0.65, + "learning_rate": 6.970991417809017e-08, + "loss": 0.0005, + "step": 33601 + }, + { + "epoch": 0.65, + "learning_rate": 6.970603083375403e-08, + "loss": 0.0005, + "step": 33602 + }, + { + "epoch": 0.65, + "learning_rate": 6.970214748941789e-08, + "loss": 0.0003, + "step": 33603 + }, + { + "epoch": 0.65, + "learning_rate": 6.969826414508175e-08, + "loss": 0.0005, + "step": 33604 + }, + { + "epoch": 0.65, + "learning_rate": 6.96943808007456e-08, + "loss": 0.0003, + "step": 33605 + }, + { + "epoch": 0.65, + "learning_rate": 6.969049745640946e-08, + "loss": 0.0005, + "step": 33606 + }, + { + "epoch": 0.65, + "learning_rate": 6.968661411207332e-08, + "loss": 0.0006, + "step": 33607 + }, + { + "epoch": 0.65, + "learning_rate": 6.968273076773718e-08, + "loss": 0.0005, + "step": 33608 + }, + { + "epoch": 0.65, + "learning_rate": 6.967884742340104e-08, + "loss": 0.0269, + "step": 33609 + }, + { + "epoch": 0.65, + "learning_rate": 6.96749640790649e-08, + "loss": 0.0004, + "step": 33610 + }, + { + "epoch": 0.65, + "learning_rate": 6.967108073472875e-08, + "loss": 0.0008, + "step": 33611 + }, + { + "epoch": 0.65, + "learning_rate": 6.966719739039261e-08, + "loss": 0.0004, + "step": 33612 + }, + { + "epoch": 0.65, + "learning_rate": 6.966331404605647e-08, + "loss": 0.0036, + "step": 33613 + }, + { + "epoch": 0.65, + "learning_rate": 6.965943070172033e-08, + "loss": 0.0005, + "step": 33614 + }, + { + "epoch": 0.65, + "learning_rate": 6.965554735738419e-08, + "loss": 0.0006, + "step": 33615 + }, + { + "epoch": 0.65, + "learning_rate": 6.965166401304805e-08, + "loss": 0.0005, + "step": 33616 + }, + { + "epoch": 0.65, + "learning_rate": 6.964778066871189e-08, + "loss": 1.2956, + "step": 33617 + }, + { + "epoch": 0.65, + "learning_rate": 6.964389732437575e-08, + "loss": 0.0026, + "step": 33618 + }, + { + "epoch": 0.65, + "learning_rate": 6.964001398003961e-08, + "loss": 0.2632, + "step": 33619 + }, + { + "epoch": 0.65, + "learning_rate": 6.963613063570347e-08, + "loss": 0.0005, + "step": 33620 + }, + { + "epoch": 0.65, + "learning_rate": 6.963224729136732e-08, + "loss": 0.0005, + "step": 33621 + }, + { + "epoch": 0.65, + "learning_rate": 6.962836394703118e-08, + "loss": 0.0038, + "step": 33622 + }, + { + "epoch": 0.65, + "learning_rate": 6.962448060269504e-08, + "loss": 0.0004, + "step": 33623 + }, + { + "epoch": 0.65, + "learning_rate": 6.96205972583589e-08, + "loss": 0.0008, + "step": 33624 + }, + { + "epoch": 0.65, + "learning_rate": 6.961671391402276e-08, + "loss": 0.0006, + "step": 33625 + }, + { + "epoch": 0.65, + "learning_rate": 6.961283056968661e-08, + "loss": 0.0005, + "step": 33626 + }, + { + "epoch": 0.65, + "learning_rate": 6.960894722535047e-08, + "loss": 0.0004, + "step": 33627 + }, + { + "epoch": 0.65, + "learning_rate": 6.960506388101433e-08, + "loss": 0.0005, + "step": 33628 + }, + { + "epoch": 0.65, + "learning_rate": 6.960118053667819e-08, + "loss": 0.0005, + "step": 33629 + }, + { + "epoch": 0.65, + "learning_rate": 6.959729719234205e-08, + "loss": 0.064, + "step": 33630 + }, + { + "epoch": 0.65, + "learning_rate": 6.95934138480059e-08, + "loss": 0.0004, + "step": 33631 + }, + { + "epoch": 0.65, + "learning_rate": 6.958953050366976e-08, + "loss": 0.0004, + "step": 33632 + }, + { + "epoch": 0.65, + "learning_rate": 6.958564715933361e-08, + "loss": 0.0013, + "step": 33633 + }, + { + "epoch": 0.65, + "learning_rate": 6.958176381499747e-08, + "loss": 0.1083, + "step": 33634 + }, + { + "epoch": 0.65, + "learning_rate": 6.957788047066133e-08, + "loss": 0.0006, + "step": 33635 + }, + { + "epoch": 0.65, + "learning_rate": 6.957399712632518e-08, + "loss": 0.2587, + "step": 33636 + }, + { + "epoch": 0.65, + "learning_rate": 6.957011378198904e-08, + "loss": 0.0004, + "step": 33637 + }, + { + "epoch": 0.65, + "learning_rate": 6.95662304376529e-08, + "loss": 0.0004, + "step": 33638 + }, + { + "epoch": 0.65, + "learning_rate": 6.956234709331676e-08, + "loss": 0.0008, + "step": 33639 + }, + { + "epoch": 0.65, + "learning_rate": 6.955846374898062e-08, + "loss": 0.2349, + "step": 33640 + }, + { + "epoch": 0.65, + "learning_rate": 6.955458040464448e-08, + "loss": 0.0005, + "step": 33641 + }, + { + "epoch": 0.65, + "learning_rate": 6.955069706030833e-08, + "loss": 0.4461, + "step": 33642 + }, + { + "epoch": 0.65, + "learning_rate": 6.954681371597219e-08, + "loss": 0.0008, + "step": 33643 + }, + { + "epoch": 0.65, + "learning_rate": 6.954293037163605e-08, + "loss": 0.0004, + "step": 33644 + }, + { + "epoch": 0.65, + "learning_rate": 6.953904702729991e-08, + "loss": 0.0003, + "step": 33645 + }, + { + "epoch": 0.65, + "learning_rate": 6.953516368296377e-08, + "loss": 0.0004, + "step": 33646 + }, + { + "epoch": 0.65, + "learning_rate": 6.953128033862762e-08, + "loss": 0.0003, + "step": 33647 + }, + { + "epoch": 0.65, + "learning_rate": 6.952739699429147e-08, + "loss": 0.0005, + "step": 33648 + }, + { + "epoch": 0.65, + "learning_rate": 6.952351364995533e-08, + "loss": 0.0005, + "step": 33649 + }, + { + "epoch": 0.65, + "learning_rate": 6.951963030561919e-08, + "loss": 0.0004, + "step": 33650 + }, + { + "epoch": 0.65, + "learning_rate": 6.951574696128304e-08, + "loss": 0.0005, + "step": 33651 + }, + { + "epoch": 0.65, + "learning_rate": 6.95118636169469e-08, + "loss": 0.0047, + "step": 33652 + }, + { + "epoch": 0.65, + "learning_rate": 6.950798027261076e-08, + "loss": 0.0015, + "step": 33653 + }, + { + "epoch": 0.65, + "learning_rate": 6.950409692827462e-08, + "loss": 0.0003, + "step": 33654 + }, + { + "epoch": 0.65, + "learning_rate": 6.950021358393848e-08, + "loss": 0.0006, + "step": 33655 + }, + { + "epoch": 0.65, + "learning_rate": 6.949633023960234e-08, + "loss": 0.0011, + "step": 33656 + }, + { + "epoch": 0.65, + "learning_rate": 6.94924468952662e-08, + "loss": 0.0003, + "step": 33657 + }, + { + "epoch": 0.65, + "learning_rate": 6.948856355093005e-08, + "loss": 0.0005, + "step": 33658 + }, + { + "epoch": 0.65, + "learning_rate": 6.948468020659391e-08, + "loss": 0.0009, + "step": 33659 + }, + { + "epoch": 0.65, + "learning_rate": 6.948079686225777e-08, + "loss": 0.0004, + "step": 33660 + }, + { + "epoch": 0.65, + "learning_rate": 6.947691351792163e-08, + "loss": 1.2544, + "step": 33661 + }, + { + "epoch": 0.65, + "learning_rate": 6.947303017358549e-08, + "loss": 0.0017, + "step": 33662 + }, + { + "epoch": 0.65, + "learning_rate": 6.946914682924934e-08, + "loss": 0.0003, + "step": 33663 + }, + { + "epoch": 0.65, + "learning_rate": 6.94652634849132e-08, + "loss": 0.0008, + "step": 33664 + }, + { + "epoch": 0.65, + "learning_rate": 6.946138014057706e-08, + "loss": 0.0243, + "step": 33665 + }, + { + "epoch": 0.65, + "learning_rate": 6.945749679624092e-08, + "loss": 0.0005, + "step": 33666 + }, + { + "epoch": 0.65, + "learning_rate": 6.945361345190478e-08, + "loss": 0.0031, + "step": 33667 + }, + { + "epoch": 0.65, + "learning_rate": 6.944973010756863e-08, + "loss": 0.001, + "step": 33668 + }, + { + "epoch": 0.65, + "learning_rate": 6.944584676323249e-08, + "loss": 0.0005, + "step": 33669 + }, + { + "epoch": 0.65, + "learning_rate": 6.944196341889635e-08, + "loss": 0.0004, + "step": 33670 + }, + { + "epoch": 0.65, + "learning_rate": 6.943808007456021e-08, + "loss": 0.0004, + "step": 33671 + }, + { + "epoch": 0.65, + "learning_rate": 6.943419673022407e-08, + "loss": 0.0005, + "step": 33672 + }, + { + "epoch": 0.65, + "learning_rate": 6.943031338588793e-08, + "loss": 0.0003, + "step": 33673 + }, + { + "epoch": 0.65, + "learning_rate": 6.942643004155178e-08, + "loss": 0.0007, + "step": 33674 + }, + { + "epoch": 0.65, + "learning_rate": 6.942254669721563e-08, + "loss": 0.0005, + "step": 33675 + }, + { + "epoch": 0.65, + "learning_rate": 6.941866335287949e-08, + "loss": 0.0003, + "step": 33676 + }, + { + "epoch": 0.65, + "learning_rate": 6.941478000854335e-08, + "loss": 0.0017, + "step": 33677 + }, + { + "epoch": 0.65, + "learning_rate": 6.94108966642072e-08, + "loss": 0.0006, + "step": 33678 + }, + { + "epoch": 0.65, + "learning_rate": 6.940701331987106e-08, + "loss": 0.0003, + "step": 33679 + }, + { + "epoch": 0.65, + "learning_rate": 6.940312997553492e-08, + "loss": 0.0005, + "step": 33680 + }, + { + "epoch": 0.65, + "learning_rate": 6.939924663119878e-08, + "loss": 0.0005, + "step": 33681 + }, + { + "epoch": 0.65, + "learning_rate": 6.939536328686264e-08, + "loss": 0.0004, + "step": 33682 + }, + { + "epoch": 0.65, + "learning_rate": 6.93914799425265e-08, + "loss": 0.0004, + "step": 33683 + }, + { + "epoch": 0.65, + "learning_rate": 6.938759659819035e-08, + "loss": 0.0006, + "step": 33684 + }, + { + "epoch": 0.65, + "learning_rate": 6.938371325385421e-08, + "loss": 0.0004, + "step": 33685 + }, + { + "epoch": 0.65, + "learning_rate": 6.937982990951807e-08, + "loss": 0.0004, + "step": 33686 + }, + { + "epoch": 0.65, + "learning_rate": 6.937594656518193e-08, + "loss": 0.002, + "step": 33687 + }, + { + "epoch": 0.65, + "learning_rate": 6.937206322084579e-08, + "loss": 0.0004, + "step": 33688 + }, + { + "epoch": 0.65, + "learning_rate": 6.936817987650964e-08, + "loss": 0.0005, + "step": 33689 + }, + { + "epoch": 0.65, + "learning_rate": 6.93642965321735e-08, + "loss": 0.0019, + "step": 33690 + }, + { + "epoch": 0.65, + "learning_rate": 6.936041318783736e-08, + "loss": 0.0075, + "step": 33691 + }, + { + "epoch": 0.65, + "learning_rate": 6.935652984350122e-08, + "loss": 0.0004, + "step": 33692 + }, + { + "epoch": 0.65, + "learning_rate": 6.935264649916508e-08, + "loss": 0.0004, + "step": 33693 + }, + { + "epoch": 0.65, + "learning_rate": 6.934876315482894e-08, + "loss": 0.0003, + "step": 33694 + }, + { + "epoch": 0.65, + "learning_rate": 6.93448798104928e-08, + "loss": 0.0006, + "step": 33695 + }, + { + "epoch": 0.65, + "learning_rate": 6.934099646615665e-08, + "loss": 0.0003, + "step": 33696 + }, + { + "epoch": 0.65, + "learning_rate": 6.933711312182051e-08, + "loss": 0.0111, + "step": 33697 + }, + { + "epoch": 0.65, + "learning_rate": 6.933322977748437e-08, + "loss": 0.0003, + "step": 33698 + }, + { + "epoch": 0.65, + "learning_rate": 6.932934643314823e-08, + "loss": 0.0005, + "step": 33699 + }, + { + "epoch": 0.65, + "learning_rate": 6.932546308881209e-08, + "loss": 0.0016, + "step": 33700 + }, + { + "epoch": 0.65, + "learning_rate": 6.932157974447594e-08, + "loss": 0.0005, + "step": 33701 + }, + { + "epoch": 0.65, + "learning_rate": 6.93176964001398e-08, + "loss": 0.0004, + "step": 33702 + }, + { + "epoch": 0.65, + "learning_rate": 6.931381305580366e-08, + "loss": 0.0007, + "step": 33703 + }, + { + "epoch": 0.65, + "learning_rate": 6.93099297114675e-08, + "loss": 0.0004, + "step": 33704 + }, + { + "epoch": 0.65, + "learning_rate": 6.930604636713136e-08, + "loss": 0.0088, + "step": 33705 + }, + { + "epoch": 0.65, + "learning_rate": 6.930216302279522e-08, + "loss": 0.0052, + "step": 33706 + }, + { + "epoch": 0.65, + "learning_rate": 6.929827967845908e-08, + "loss": 0.0006, + "step": 33707 + }, + { + "epoch": 0.65, + "learning_rate": 6.929439633412294e-08, + "loss": 0.0004, + "step": 33708 + }, + { + "epoch": 0.65, + "learning_rate": 6.92905129897868e-08, + "loss": 0.0005, + "step": 33709 + }, + { + "epoch": 0.65, + "learning_rate": 6.928662964545065e-08, + "loss": 0.1407, + "step": 33710 + }, + { + "epoch": 0.65, + "learning_rate": 6.928274630111451e-08, + "loss": 0.0811, + "step": 33711 + }, + { + "epoch": 0.65, + "learning_rate": 6.927886295677837e-08, + "loss": 0.0056, + "step": 33712 + }, + { + "epoch": 0.65, + "learning_rate": 6.927497961244223e-08, + "loss": 0.0004, + "step": 33713 + }, + { + "epoch": 0.65, + "learning_rate": 6.927109626810609e-08, + "loss": 0.001, + "step": 33714 + }, + { + "epoch": 0.65, + "learning_rate": 6.926721292376995e-08, + "loss": 0.0005, + "step": 33715 + }, + { + "epoch": 0.65, + "learning_rate": 6.92633295794338e-08, + "loss": 0.0016, + "step": 33716 + }, + { + "epoch": 0.65, + "learning_rate": 6.925944623509766e-08, + "loss": 0.0003, + "step": 33717 + }, + { + "epoch": 0.65, + "learning_rate": 6.925556289076152e-08, + "loss": 0.0004, + "step": 33718 + }, + { + "epoch": 0.65, + "learning_rate": 6.925167954642538e-08, + "loss": 0.0004, + "step": 33719 + }, + { + "epoch": 0.65, + "learning_rate": 6.924779620208924e-08, + "loss": 0.8074, + "step": 33720 + }, + { + "epoch": 0.65, + "learning_rate": 6.92439128577531e-08, + "loss": 0.0004, + "step": 33721 + }, + { + "epoch": 0.65, + "learning_rate": 6.924002951341695e-08, + "loss": 0.0004, + "step": 33722 + }, + { + "epoch": 0.65, + "learning_rate": 6.923614616908081e-08, + "loss": 0.0003, + "step": 33723 + }, + { + "epoch": 0.65, + "learning_rate": 6.923226282474467e-08, + "loss": 0.0004, + "step": 33724 + }, + { + "epoch": 0.65, + "learning_rate": 6.922837948040853e-08, + "loss": 0.0007, + "step": 33725 + }, + { + "epoch": 0.65, + "learning_rate": 6.922449613607239e-08, + "loss": 0.0005, + "step": 33726 + }, + { + "epoch": 0.65, + "learning_rate": 6.922061279173624e-08, + "loss": 0.0006, + "step": 33727 + }, + { + "epoch": 0.65, + "learning_rate": 6.92167294474001e-08, + "loss": 0.2531, + "step": 33728 + }, + { + "epoch": 0.65, + "learning_rate": 6.921284610306396e-08, + "loss": 0.0004, + "step": 33729 + }, + { + "epoch": 0.65, + "learning_rate": 6.920896275872782e-08, + "loss": 0.0006, + "step": 33730 + }, + { + "epoch": 0.65, + "learning_rate": 6.920507941439168e-08, + "loss": 0.0009, + "step": 33731 + }, + { + "epoch": 0.65, + "learning_rate": 6.920119607005554e-08, + "loss": 0.0005, + "step": 33732 + }, + { + "epoch": 0.65, + "learning_rate": 6.919731272571938e-08, + "loss": 0.3571, + "step": 33733 + }, + { + "epoch": 0.65, + "learning_rate": 6.919342938138324e-08, + "loss": 0.0008, + "step": 33734 + }, + { + "epoch": 0.65, + "learning_rate": 6.91895460370471e-08, + "loss": 0.0004, + "step": 33735 + }, + { + "epoch": 0.65, + "learning_rate": 6.918566269271096e-08, + "loss": 0.0004, + "step": 33736 + }, + { + "epoch": 0.65, + "learning_rate": 6.918177934837481e-08, + "loss": 0.0004, + "step": 33737 + }, + { + "epoch": 0.65, + "learning_rate": 6.917789600403867e-08, + "loss": 0.0004, + "step": 33738 + }, + { + "epoch": 0.65, + "learning_rate": 6.917401265970253e-08, + "loss": 0.0006, + "step": 33739 + }, + { + "epoch": 0.65, + "learning_rate": 6.917012931536639e-08, + "loss": 0.0005, + "step": 33740 + }, + { + "epoch": 0.65, + "learning_rate": 6.916624597103025e-08, + "loss": 0.0003, + "step": 33741 + }, + { + "epoch": 0.65, + "learning_rate": 6.91623626266941e-08, + "loss": 0.7248, + "step": 33742 + }, + { + "epoch": 0.65, + "learning_rate": 6.915847928235796e-08, + "loss": 0.0004, + "step": 33743 + }, + { + "epoch": 0.65, + "learning_rate": 6.915459593802182e-08, + "loss": 0.3379, + "step": 33744 + }, + { + "epoch": 0.65, + "learning_rate": 6.915071259368568e-08, + "loss": 0.0004, + "step": 33745 + }, + { + "epoch": 0.65, + "learning_rate": 6.914682924934954e-08, + "loss": 0.0005, + "step": 33746 + }, + { + "epoch": 0.65, + "learning_rate": 6.91429459050134e-08, + "loss": 0.0004, + "step": 33747 + }, + { + "epoch": 0.65, + "learning_rate": 6.913906256067725e-08, + "loss": 0.0004, + "step": 33748 + }, + { + "epoch": 0.65, + "learning_rate": 6.913517921634111e-08, + "loss": 0.0008, + "step": 33749 + }, + { + "epoch": 0.65, + "learning_rate": 6.913129587200497e-08, + "loss": 0.0004, + "step": 33750 + }, + { + "epoch": 0.65, + "learning_rate": 6.912741252766883e-08, + "loss": 0.018, + "step": 33751 + }, + { + "epoch": 0.65, + "learning_rate": 6.912352918333269e-08, + "loss": 0.0005, + "step": 33752 + }, + { + "epoch": 0.65, + "learning_rate": 6.911964583899655e-08, + "loss": 0.0002, + "step": 33753 + }, + { + "epoch": 0.65, + "learning_rate": 6.91157624946604e-08, + "loss": 0.0004, + "step": 33754 + }, + { + "epoch": 0.65, + "learning_rate": 6.911187915032426e-08, + "loss": 0.0006, + "step": 33755 + }, + { + "epoch": 0.65, + "learning_rate": 6.910799580598812e-08, + "loss": 0.0009, + "step": 33756 + }, + { + "epoch": 0.65, + "learning_rate": 6.910411246165198e-08, + "loss": 0.0006, + "step": 33757 + }, + { + "epoch": 0.65, + "learning_rate": 6.910022911731584e-08, + "loss": 1.0533, + "step": 33758 + }, + { + "epoch": 0.65, + "learning_rate": 6.90963457729797e-08, + "loss": 0.0021, + "step": 33759 + }, + { + "epoch": 0.65, + "learning_rate": 6.909246242864355e-08, + "loss": 0.0006, + "step": 33760 + }, + { + "epoch": 0.65, + "learning_rate": 6.908857908430741e-08, + "loss": 0.0006, + "step": 33761 + }, + { + "epoch": 0.65, + "learning_rate": 6.908469573997126e-08, + "loss": 0.0003, + "step": 33762 + }, + { + "epoch": 0.65, + "learning_rate": 6.908081239563511e-08, + "loss": 0.0003, + "step": 33763 + }, + { + "epoch": 0.65, + "learning_rate": 6.907692905129897e-08, + "loss": 0.0006, + "step": 33764 + }, + { + "epoch": 0.65, + "learning_rate": 6.907304570696283e-08, + "loss": 1.0819, + "step": 33765 + }, + { + "epoch": 0.65, + "learning_rate": 6.906916236262669e-08, + "loss": 0.0007, + "step": 33766 + }, + { + "epoch": 0.66, + "learning_rate": 6.906527901829055e-08, + "loss": 0.0004, + "step": 33767 + }, + { + "epoch": 0.66, + "learning_rate": 6.90613956739544e-08, + "loss": 0.0004, + "step": 33768 + }, + { + "epoch": 0.66, + "learning_rate": 6.905751232961826e-08, + "loss": 0.0004, + "step": 33769 + }, + { + "epoch": 0.66, + "learning_rate": 6.905362898528212e-08, + "loss": 0.0008, + "step": 33770 + }, + { + "epoch": 0.66, + "learning_rate": 6.904974564094598e-08, + "loss": 0.0097, + "step": 33771 + }, + { + "epoch": 0.66, + "learning_rate": 6.904586229660984e-08, + "loss": 0.0004, + "step": 33772 + }, + { + "epoch": 0.66, + "learning_rate": 6.90419789522737e-08, + "loss": 0.0005, + "step": 33773 + }, + { + "epoch": 0.66, + "learning_rate": 6.903809560793756e-08, + "loss": 0.0017, + "step": 33774 + }, + { + "epoch": 0.66, + "learning_rate": 6.903421226360141e-08, + "loss": 0.0006, + "step": 33775 + }, + { + "epoch": 0.66, + "learning_rate": 6.903032891926527e-08, + "loss": 0.0006, + "step": 33776 + }, + { + "epoch": 0.66, + "learning_rate": 6.902644557492913e-08, + "loss": 0.0024, + "step": 33777 + }, + { + "epoch": 0.66, + "learning_rate": 6.902256223059299e-08, + "loss": 0.1205, + "step": 33778 + }, + { + "epoch": 0.66, + "learning_rate": 6.901867888625685e-08, + "loss": 0.0007, + "step": 33779 + }, + { + "epoch": 0.66, + "learning_rate": 6.90147955419207e-08, + "loss": 0.0004, + "step": 33780 + }, + { + "epoch": 0.66, + "learning_rate": 6.901091219758456e-08, + "loss": 0.0123, + "step": 33781 + }, + { + "epoch": 0.66, + "learning_rate": 6.900702885324842e-08, + "loss": 0.0005, + "step": 33782 + }, + { + "epoch": 0.66, + "learning_rate": 6.900314550891228e-08, + "loss": 0.0004, + "step": 33783 + }, + { + "epoch": 0.66, + "learning_rate": 6.899926216457614e-08, + "loss": 0.0005, + "step": 33784 + }, + { + "epoch": 0.66, + "learning_rate": 6.899537882024e-08, + "loss": 0.0003, + "step": 33785 + }, + { + "epoch": 0.66, + "learning_rate": 6.899149547590385e-08, + "loss": 0.0328, + "step": 33786 + }, + { + "epoch": 0.66, + "learning_rate": 6.898761213156771e-08, + "loss": 0.0004, + "step": 33787 + }, + { + "epoch": 0.66, + "learning_rate": 6.898372878723157e-08, + "loss": 0.0005, + "step": 33788 + }, + { + "epoch": 0.66, + "learning_rate": 6.897984544289543e-08, + "loss": 0.946, + "step": 33789 + }, + { + "epoch": 0.66, + "learning_rate": 6.897596209855929e-08, + "loss": 0.0061, + "step": 33790 + }, + { + "epoch": 0.66, + "learning_rate": 6.897207875422313e-08, + "loss": 0.0007, + "step": 33791 + }, + { + "epoch": 0.66, + "learning_rate": 6.896819540988699e-08, + "loss": 0.0005, + "step": 33792 + }, + { + "epoch": 0.66, + "learning_rate": 6.896431206555085e-08, + "loss": 0.0005, + "step": 33793 + }, + { + "epoch": 0.66, + "learning_rate": 6.896042872121471e-08, + "loss": 0.0015, + "step": 33794 + }, + { + "epoch": 0.66, + "learning_rate": 6.895654537687857e-08, + "loss": 0.0004, + "step": 33795 + }, + { + "epoch": 0.66, + "learning_rate": 6.895266203254242e-08, + "loss": 0.0004, + "step": 33796 + }, + { + "epoch": 0.66, + "learning_rate": 6.894877868820628e-08, + "loss": 0.0005, + "step": 33797 + }, + { + "epoch": 0.66, + "learning_rate": 6.894489534387014e-08, + "loss": 0.0004, + "step": 33798 + }, + { + "epoch": 0.66, + "learning_rate": 6.8941011999534e-08, + "loss": 0.0006, + "step": 33799 + }, + { + "epoch": 0.66, + "learning_rate": 6.893712865519786e-08, + "loss": 0.0004, + "step": 33800 + }, + { + "epoch": 0.66, + "learning_rate": 6.893324531086171e-08, + "loss": 0.0012, + "step": 33801 + }, + { + "epoch": 0.66, + "learning_rate": 6.892936196652557e-08, + "loss": 0.0004, + "step": 33802 + }, + { + "epoch": 0.66, + "learning_rate": 6.892547862218943e-08, + "loss": 0.2312, + "step": 33803 + }, + { + "epoch": 0.66, + "learning_rate": 6.892159527785329e-08, + "loss": 0.5875, + "step": 33804 + }, + { + "epoch": 0.66, + "learning_rate": 6.891771193351715e-08, + "loss": 0.0004, + "step": 33805 + }, + { + "epoch": 0.66, + "learning_rate": 6.8913828589181e-08, + "loss": 0.9873, + "step": 33806 + }, + { + "epoch": 0.66, + "learning_rate": 6.890994524484486e-08, + "loss": 0.001, + "step": 33807 + }, + { + "epoch": 0.66, + "learning_rate": 6.890606190050872e-08, + "loss": 0.0003, + "step": 33808 + }, + { + "epoch": 0.66, + "learning_rate": 6.890217855617258e-08, + "loss": 0.0005, + "step": 33809 + }, + { + "epoch": 0.66, + "learning_rate": 6.889829521183643e-08, + "loss": 0.0005, + "step": 33810 + }, + { + "epoch": 0.66, + "learning_rate": 6.889441186750028e-08, + "loss": 0.0004, + "step": 33811 + }, + { + "epoch": 0.66, + "learning_rate": 6.889052852316414e-08, + "loss": 0.0004, + "step": 33812 + }, + { + "epoch": 0.66, + "learning_rate": 6.8886645178828e-08, + "loss": 0.0004, + "step": 33813 + }, + { + "epoch": 0.66, + "learning_rate": 6.888276183449186e-08, + "loss": 0.0005, + "step": 33814 + }, + { + "epoch": 0.66, + "learning_rate": 6.887887849015572e-08, + "loss": 0.0004, + "step": 33815 + }, + { + "epoch": 0.66, + "learning_rate": 6.887499514581958e-08, + "loss": 0.001, + "step": 33816 + }, + { + "epoch": 0.66, + "learning_rate": 6.887111180148343e-08, + "loss": 0.0005, + "step": 33817 + }, + { + "epoch": 0.66, + "learning_rate": 6.886722845714729e-08, + "loss": 0.0041, + "step": 33818 + }, + { + "epoch": 0.66, + "learning_rate": 6.886334511281115e-08, + "loss": 0.0004, + "step": 33819 + }, + { + "epoch": 0.66, + "learning_rate": 6.885946176847501e-08, + "loss": 0.0005, + "step": 33820 + }, + { + "epoch": 0.66, + "learning_rate": 6.885557842413887e-08, + "loss": 0.5981, + "step": 33821 + }, + { + "epoch": 0.66, + "learning_rate": 6.885169507980272e-08, + "loss": 0.0467, + "step": 33822 + }, + { + "epoch": 0.66, + "learning_rate": 6.884781173546658e-08, + "loss": 0.0005, + "step": 33823 + }, + { + "epoch": 0.66, + "learning_rate": 6.884392839113044e-08, + "loss": 0.0004, + "step": 33824 + }, + { + "epoch": 0.66, + "learning_rate": 6.884004504679429e-08, + "loss": 0.0005, + "step": 33825 + }, + { + "epoch": 0.66, + "learning_rate": 6.883616170245814e-08, + "loss": 0.005, + "step": 33826 + }, + { + "epoch": 0.66, + "learning_rate": 6.8832278358122e-08, + "loss": 1.1667, + "step": 33827 + }, + { + "epoch": 0.66, + "learning_rate": 6.882839501378586e-08, + "loss": 0.0004, + "step": 33828 + }, + { + "epoch": 0.66, + "learning_rate": 6.882451166944972e-08, + "loss": 0.0005, + "step": 33829 + }, + { + "epoch": 0.66, + "learning_rate": 6.882062832511358e-08, + "loss": 0.0004, + "step": 33830 + }, + { + "epoch": 0.66, + "learning_rate": 6.881674498077744e-08, + "loss": 0.0004, + "step": 33831 + }, + { + "epoch": 0.66, + "learning_rate": 6.88128616364413e-08, + "loss": 0.472, + "step": 33832 + }, + { + "epoch": 0.66, + "learning_rate": 6.880897829210515e-08, + "loss": 0.0594, + "step": 33833 + }, + { + "epoch": 0.66, + "learning_rate": 6.880509494776901e-08, + "loss": 0.7393, + "step": 33834 + }, + { + "epoch": 0.66, + "learning_rate": 6.880121160343287e-08, + "loss": 0.2002, + "step": 33835 + }, + { + "epoch": 0.66, + "learning_rate": 6.879732825909673e-08, + "loss": 0.0005, + "step": 33836 + }, + { + "epoch": 0.66, + "learning_rate": 6.879344491476059e-08, + "loss": 0.0006, + "step": 33837 + }, + { + "epoch": 0.66, + "learning_rate": 6.878956157042444e-08, + "loss": 0.0008, + "step": 33838 + }, + { + "epoch": 0.66, + "learning_rate": 6.87856782260883e-08, + "loss": 0.0004, + "step": 33839 + }, + { + "epoch": 0.66, + "learning_rate": 6.878179488175216e-08, + "loss": 0.0003, + "step": 33840 + }, + { + "epoch": 0.66, + "learning_rate": 6.877791153741602e-08, + "loss": 0.0012, + "step": 33841 + }, + { + "epoch": 0.66, + "learning_rate": 6.877402819307988e-08, + "loss": 0.0006, + "step": 33842 + }, + { + "epoch": 0.66, + "learning_rate": 6.877014484874373e-08, + "loss": 0.0004, + "step": 33843 + }, + { + "epoch": 0.66, + "learning_rate": 6.876626150440759e-08, + "loss": 0.0006, + "step": 33844 + }, + { + "epoch": 0.66, + "learning_rate": 6.876237816007145e-08, + "loss": 0.0008, + "step": 33845 + }, + { + "epoch": 0.66, + "learning_rate": 6.875849481573531e-08, + "loss": 0.001, + "step": 33846 + }, + { + "epoch": 0.66, + "learning_rate": 6.875461147139917e-08, + "loss": 0.0007, + "step": 33847 + }, + { + "epoch": 0.66, + "learning_rate": 6.875072812706303e-08, + "loss": 0.7522, + "step": 33848 + }, + { + "epoch": 0.66, + "learning_rate": 6.874684478272687e-08, + "loss": 0.0009, + "step": 33849 + }, + { + "epoch": 0.66, + "learning_rate": 6.874296143839073e-08, + "loss": 0.0004, + "step": 33850 + }, + { + "epoch": 0.66, + "learning_rate": 6.873907809405459e-08, + "loss": 0.9955, + "step": 33851 + }, + { + "epoch": 0.66, + "learning_rate": 6.873519474971845e-08, + "loss": 0.0004, + "step": 33852 + }, + { + "epoch": 0.66, + "learning_rate": 6.87313114053823e-08, + "loss": 0.0004, + "step": 33853 + }, + { + "epoch": 0.66, + "learning_rate": 6.872742806104616e-08, + "loss": 0.0004, + "step": 33854 + }, + { + "epoch": 0.66, + "learning_rate": 6.872354471671002e-08, + "loss": 0.0005, + "step": 33855 + }, + { + "epoch": 0.66, + "learning_rate": 6.871966137237388e-08, + "loss": 0.0004, + "step": 33856 + }, + { + "epoch": 0.66, + "learning_rate": 6.871577802803774e-08, + "loss": 0.0005, + "step": 33857 + }, + { + "epoch": 0.66, + "learning_rate": 6.87118946837016e-08, + "loss": 0.0005, + "step": 33858 + }, + { + "epoch": 0.66, + "learning_rate": 6.870801133936545e-08, + "loss": 0.0006, + "step": 33859 + }, + { + "epoch": 0.66, + "learning_rate": 6.870412799502931e-08, + "loss": 0.0005, + "step": 33860 + }, + { + "epoch": 0.66, + "learning_rate": 6.870024465069317e-08, + "loss": 0.0005, + "step": 33861 + }, + { + "epoch": 0.66, + "learning_rate": 6.869636130635703e-08, + "loss": 0.0005, + "step": 33862 + }, + { + "epoch": 0.66, + "learning_rate": 6.869247796202089e-08, + "loss": 0.0005, + "step": 33863 + }, + { + "epoch": 0.66, + "learning_rate": 6.868859461768474e-08, + "loss": 0.0004, + "step": 33864 + }, + { + "epoch": 0.66, + "learning_rate": 6.86847112733486e-08, + "loss": 1.1001, + "step": 33865 + }, + { + "epoch": 0.66, + "learning_rate": 6.868082792901246e-08, + "loss": 0.0006, + "step": 33866 + }, + { + "epoch": 0.66, + "learning_rate": 6.867694458467632e-08, + "loss": 1.0373, + "step": 33867 + }, + { + "epoch": 0.66, + "learning_rate": 6.867306124034018e-08, + "loss": 0.0005, + "step": 33868 + }, + { + "epoch": 0.66, + "learning_rate": 6.866917789600404e-08, + "loss": 0.0009, + "step": 33869 + }, + { + "epoch": 0.66, + "learning_rate": 6.86652945516679e-08, + "loss": 0.0004, + "step": 33870 + }, + { + "epoch": 0.66, + "learning_rate": 6.866141120733175e-08, + "loss": 0.0005, + "step": 33871 + }, + { + "epoch": 0.66, + "learning_rate": 6.865752786299561e-08, + "loss": 0.0004, + "step": 33872 + }, + { + "epoch": 0.66, + "learning_rate": 6.865364451865947e-08, + "loss": 0.0005, + "step": 33873 + }, + { + "epoch": 0.66, + "learning_rate": 6.864976117432333e-08, + "loss": 0.0005, + "step": 33874 + }, + { + "epoch": 0.66, + "learning_rate": 6.864587782998719e-08, + "loss": 1.184, + "step": 33875 + }, + { + "epoch": 0.66, + "learning_rate": 6.864199448565104e-08, + "loss": 0.0007, + "step": 33876 + }, + { + "epoch": 0.66, + "learning_rate": 6.86381111413149e-08, + "loss": 0.0004, + "step": 33877 + }, + { + "epoch": 0.66, + "learning_rate": 6.863422779697875e-08, + "loss": 0.7359, + "step": 33878 + }, + { + "epoch": 0.66, + "learning_rate": 6.86303444526426e-08, + "loss": 0.0011, + "step": 33879 + }, + { + "epoch": 0.66, + "learning_rate": 6.862646110830646e-08, + "loss": 0.0005, + "step": 33880 + }, + { + "epoch": 0.66, + "learning_rate": 6.862257776397032e-08, + "loss": 0.1247, + "step": 33881 + }, + { + "epoch": 0.66, + "learning_rate": 6.861869441963418e-08, + "loss": 0.0005, + "step": 33882 + }, + { + "epoch": 0.66, + "learning_rate": 6.861481107529804e-08, + "loss": 0.0005, + "step": 33883 + }, + { + "epoch": 0.66, + "learning_rate": 6.86109277309619e-08, + "loss": 0.0004, + "step": 33884 + }, + { + "epoch": 0.66, + "learning_rate": 6.860704438662575e-08, + "loss": 0.0004, + "step": 33885 + }, + { + "epoch": 0.66, + "learning_rate": 6.860316104228961e-08, + "loss": 0.0005, + "step": 33886 + }, + { + "epoch": 0.66, + "learning_rate": 6.859927769795347e-08, + "loss": 0.4453, + "step": 33887 + }, + { + "epoch": 0.66, + "learning_rate": 6.859539435361733e-08, + "loss": 0.0007, + "step": 33888 + }, + { + "epoch": 0.66, + "learning_rate": 6.859151100928119e-08, + "loss": 0.0006, + "step": 33889 + }, + { + "epoch": 0.66, + "learning_rate": 6.858762766494505e-08, + "loss": 0.0003, + "step": 33890 + }, + { + "epoch": 0.66, + "learning_rate": 6.85837443206089e-08, + "loss": 0.0005, + "step": 33891 + }, + { + "epoch": 0.66, + "learning_rate": 6.857986097627276e-08, + "loss": 0.0021, + "step": 33892 + }, + { + "epoch": 0.66, + "learning_rate": 6.857597763193662e-08, + "loss": 0.0006, + "step": 33893 + }, + { + "epoch": 0.66, + "learning_rate": 6.857209428760048e-08, + "loss": 0.0003, + "step": 33894 + }, + { + "epoch": 0.66, + "learning_rate": 6.856821094326434e-08, + "loss": 0.0006, + "step": 33895 + }, + { + "epoch": 0.66, + "learning_rate": 6.85643275989282e-08, + "loss": 0.0012, + "step": 33896 + }, + { + "epoch": 0.66, + "learning_rate": 6.856044425459205e-08, + "loss": 0.0043, + "step": 33897 + }, + { + "epoch": 0.66, + "learning_rate": 6.855656091025591e-08, + "loss": 0.0005, + "step": 33898 + }, + { + "epoch": 0.66, + "learning_rate": 6.855267756591977e-08, + "loss": 0.0005, + "step": 33899 + }, + { + "epoch": 0.66, + "learning_rate": 6.854879422158363e-08, + "loss": 0.0006, + "step": 33900 + }, + { + "epoch": 0.66, + "learning_rate": 6.854491087724749e-08, + "loss": 0.0004, + "step": 33901 + }, + { + "epoch": 0.66, + "learning_rate": 6.854102753291134e-08, + "loss": 0.0005, + "step": 33902 + }, + { + "epoch": 0.66, + "learning_rate": 6.85371441885752e-08, + "loss": 0.0004, + "step": 33903 + }, + { + "epoch": 0.66, + "learning_rate": 6.853326084423906e-08, + "loss": 0.0005, + "step": 33904 + }, + { + "epoch": 0.66, + "learning_rate": 6.852937749990292e-08, + "loss": 0.0007, + "step": 33905 + }, + { + "epoch": 0.66, + "learning_rate": 6.852549415556678e-08, + "loss": 0.0007, + "step": 33906 + }, + { + "epoch": 0.66, + "learning_rate": 6.852161081123062e-08, + "loss": 0.1334, + "step": 33907 + }, + { + "epoch": 0.66, + "learning_rate": 6.851772746689448e-08, + "loss": 0.0004, + "step": 33908 + }, + { + "epoch": 0.66, + "learning_rate": 6.851384412255834e-08, + "loss": 0.0007, + "step": 33909 + }, + { + "epoch": 0.66, + "learning_rate": 6.85099607782222e-08, + "loss": 0.0007, + "step": 33910 + }, + { + "epoch": 0.66, + "learning_rate": 6.850607743388606e-08, + "loss": 0.0003, + "step": 33911 + }, + { + "epoch": 0.66, + "learning_rate": 6.850219408954991e-08, + "loss": 0.0007, + "step": 33912 + }, + { + "epoch": 0.66, + "learning_rate": 6.849831074521377e-08, + "loss": 0.0017, + "step": 33913 + }, + { + "epoch": 0.66, + "learning_rate": 6.849442740087763e-08, + "loss": 0.0006, + "step": 33914 + }, + { + "epoch": 0.66, + "learning_rate": 6.849054405654149e-08, + "loss": 0.0003, + "step": 33915 + }, + { + "epoch": 0.66, + "learning_rate": 6.848666071220535e-08, + "loss": 0.0004, + "step": 33916 + }, + { + "epoch": 0.66, + "learning_rate": 6.84827773678692e-08, + "loss": 0.0005, + "step": 33917 + }, + { + "epoch": 0.66, + "learning_rate": 6.847889402353306e-08, + "loss": 0.0941, + "step": 33918 + }, + { + "epoch": 0.66, + "learning_rate": 6.847501067919692e-08, + "loss": 0.0004, + "step": 33919 + }, + { + "epoch": 0.66, + "learning_rate": 6.847112733486078e-08, + "loss": 0.4562, + "step": 33920 + }, + { + "epoch": 0.66, + "learning_rate": 6.846724399052464e-08, + "loss": 0.0027, + "step": 33921 + }, + { + "epoch": 0.66, + "learning_rate": 6.84633606461885e-08, + "loss": 0.0004, + "step": 33922 + }, + { + "epoch": 0.66, + "learning_rate": 6.845947730185235e-08, + "loss": 0.1136, + "step": 33923 + }, + { + "epoch": 0.66, + "learning_rate": 6.845559395751621e-08, + "loss": 0.0005, + "step": 33924 + }, + { + "epoch": 0.66, + "learning_rate": 6.845171061318007e-08, + "loss": 0.0004, + "step": 33925 + }, + { + "epoch": 0.66, + "learning_rate": 6.844782726884393e-08, + "loss": 0.0006, + "step": 33926 + }, + { + "epoch": 0.66, + "learning_rate": 6.844394392450779e-08, + "loss": 0.0005, + "step": 33927 + }, + { + "epoch": 0.66, + "learning_rate": 6.844006058017165e-08, + "loss": 0.0004, + "step": 33928 + }, + { + "epoch": 0.66, + "learning_rate": 6.84361772358355e-08, + "loss": 0.0009, + "step": 33929 + }, + { + "epoch": 0.66, + "learning_rate": 6.843229389149936e-08, + "loss": 0.0003, + "step": 33930 + }, + { + "epoch": 0.66, + "learning_rate": 6.842841054716322e-08, + "loss": 0.0023, + "step": 33931 + }, + { + "epoch": 0.66, + "learning_rate": 6.842452720282708e-08, + "loss": 0.0004, + "step": 33932 + }, + { + "epoch": 0.66, + "learning_rate": 6.842064385849094e-08, + "loss": 0.0004, + "step": 33933 + }, + { + "epoch": 0.66, + "learning_rate": 6.84167605141548e-08, + "loss": 0.0005, + "step": 33934 + }, + { + "epoch": 0.66, + "learning_rate": 6.841287716981865e-08, + "loss": 0.0004, + "step": 33935 + }, + { + "epoch": 0.66, + "learning_rate": 6.84089938254825e-08, + "loss": 0.0005, + "step": 33936 + }, + { + "epoch": 0.66, + "learning_rate": 6.840511048114636e-08, + "loss": 0.933, + "step": 33937 + }, + { + "epoch": 0.66, + "learning_rate": 6.840122713681021e-08, + "loss": 0.0006, + "step": 33938 + }, + { + "epoch": 0.66, + "learning_rate": 6.839734379247407e-08, + "loss": 0.0007, + "step": 33939 + }, + { + "epoch": 0.66, + "learning_rate": 6.839346044813793e-08, + "loss": 0.0005, + "step": 33940 + }, + { + "epoch": 0.66, + "learning_rate": 6.838957710380179e-08, + "loss": 0.0005, + "step": 33941 + }, + { + "epoch": 0.66, + "learning_rate": 6.838569375946565e-08, + "loss": 0.0008, + "step": 33942 + }, + { + "epoch": 0.66, + "learning_rate": 6.83818104151295e-08, + "loss": 0.0008, + "step": 33943 + }, + { + "epoch": 0.66, + "learning_rate": 6.837792707079336e-08, + "loss": 0.0004, + "step": 33944 + }, + { + "epoch": 0.66, + "learning_rate": 6.837404372645722e-08, + "loss": 0.0016, + "step": 33945 + }, + { + "epoch": 0.66, + "learning_rate": 6.837016038212108e-08, + "loss": 0.001, + "step": 33946 + }, + { + "epoch": 0.66, + "learning_rate": 6.836627703778494e-08, + "loss": 0.0004, + "step": 33947 + }, + { + "epoch": 0.66, + "learning_rate": 6.83623936934488e-08, + "loss": 0.0006, + "step": 33948 + }, + { + "epoch": 0.66, + "learning_rate": 6.835851034911266e-08, + "loss": 0.0005, + "step": 33949 + }, + { + "epoch": 0.66, + "learning_rate": 6.835462700477651e-08, + "loss": 0.0182, + "step": 33950 + }, + { + "epoch": 0.66, + "learning_rate": 6.835074366044037e-08, + "loss": 0.0004, + "step": 33951 + }, + { + "epoch": 0.66, + "learning_rate": 6.834686031610423e-08, + "loss": 0.0004, + "step": 33952 + }, + { + "epoch": 0.66, + "learning_rate": 6.834297697176809e-08, + "loss": 0.0007, + "step": 33953 + }, + { + "epoch": 0.66, + "learning_rate": 6.833909362743195e-08, + "loss": 0.2906, + "step": 33954 + }, + { + "epoch": 0.66, + "learning_rate": 6.83352102830958e-08, + "loss": 0.0005, + "step": 33955 + }, + { + "epoch": 0.66, + "learning_rate": 6.833132693875966e-08, + "loss": 0.0021, + "step": 33956 + }, + { + "epoch": 0.66, + "learning_rate": 6.832744359442352e-08, + "loss": 0.0004, + "step": 33957 + }, + { + "epoch": 0.66, + "learning_rate": 6.832356025008738e-08, + "loss": 0.0005, + "step": 33958 + }, + { + "epoch": 0.66, + "learning_rate": 6.831967690575124e-08, + "loss": 0.0005, + "step": 33959 + }, + { + "epoch": 0.66, + "learning_rate": 6.83157935614151e-08, + "loss": 0.0004, + "step": 33960 + }, + { + "epoch": 0.66, + "learning_rate": 6.831191021707895e-08, + "loss": 0.0007, + "step": 33961 + }, + { + "epoch": 0.66, + "learning_rate": 6.830802687274281e-08, + "loss": 0.0005, + "step": 33962 + }, + { + "epoch": 0.66, + "learning_rate": 6.830414352840667e-08, + "loss": 0.0019, + "step": 33963 + }, + { + "epoch": 0.66, + "learning_rate": 6.830026018407053e-08, + "loss": 0.0041, + "step": 33964 + }, + { + "epoch": 0.66, + "learning_rate": 6.829637683973437e-08, + "loss": 0.0005, + "step": 33965 + }, + { + "epoch": 0.66, + "learning_rate": 6.829249349539823e-08, + "loss": 0.0005, + "step": 33966 + }, + { + "epoch": 0.66, + "learning_rate": 6.828861015106209e-08, + "loss": 0.0004, + "step": 33967 + }, + { + "epoch": 0.66, + "learning_rate": 6.828472680672595e-08, + "loss": 0.0004, + "step": 33968 + }, + { + "epoch": 0.66, + "learning_rate": 6.828084346238981e-08, + "loss": 0.0005, + "step": 33969 + }, + { + "epoch": 0.66, + "learning_rate": 6.827696011805367e-08, + "loss": 1.3217, + "step": 33970 + }, + { + "epoch": 0.66, + "learning_rate": 6.827307677371752e-08, + "loss": 0.0005, + "step": 33971 + }, + { + "epoch": 0.66, + "learning_rate": 6.826919342938138e-08, + "loss": 0.0006, + "step": 33972 + }, + { + "epoch": 0.66, + "learning_rate": 6.826531008504524e-08, + "loss": 0.0006, + "step": 33973 + }, + { + "epoch": 0.66, + "learning_rate": 6.82614267407091e-08, + "loss": 0.0005, + "step": 33974 + }, + { + "epoch": 0.66, + "learning_rate": 6.825754339637296e-08, + "loss": 0.0016, + "step": 33975 + }, + { + "epoch": 0.66, + "learning_rate": 6.825366005203682e-08, + "loss": 0.0005, + "step": 33976 + }, + { + "epoch": 0.66, + "learning_rate": 6.824977670770067e-08, + "loss": 0.0005, + "step": 33977 + }, + { + "epoch": 0.66, + "learning_rate": 6.824589336336453e-08, + "loss": 1.0392, + "step": 33978 + }, + { + "epoch": 0.66, + "learning_rate": 6.824201001902839e-08, + "loss": 0.0007, + "step": 33979 + }, + { + "epoch": 0.66, + "learning_rate": 6.823812667469225e-08, + "loss": 0.0004, + "step": 33980 + }, + { + "epoch": 0.66, + "learning_rate": 6.82342433303561e-08, + "loss": 0.0006, + "step": 33981 + }, + { + "epoch": 0.66, + "learning_rate": 6.823035998601996e-08, + "loss": 0.0005, + "step": 33982 + }, + { + "epoch": 0.66, + "learning_rate": 6.822647664168382e-08, + "loss": 0.0004, + "step": 33983 + }, + { + "epoch": 0.66, + "learning_rate": 6.822259329734768e-08, + "loss": 0.0004, + "step": 33984 + }, + { + "epoch": 0.66, + "learning_rate": 6.821870995301154e-08, + "loss": 0.0004, + "step": 33985 + }, + { + "epoch": 0.66, + "learning_rate": 6.82148266086754e-08, + "loss": 0.0012, + "step": 33986 + }, + { + "epoch": 0.66, + "learning_rate": 6.821094326433924e-08, + "loss": 0.0004, + "step": 33987 + }, + { + "epoch": 0.66, + "learning_rate": 6.82070599200031e-08, + "loss": 1.3543, + "step": 33988 + }, + { + "epoch": 0.66, + "learning_rate": 6.820317657566696e-08, + "loss": 0.0005, + "step": 33989 + }, + { + "epoch": 0.66, + "learning_rate": 6.819929323133082e-08, + "loss": 0.0005, + "step": 33990 + }, + { + "epoch": 0.66, + "learning_rate": 6.819540988699468e-08, + "loss": 0.0006, + "step": 33991 + }, + { + "epoch": 0.66, + "learning_rate": 6.819152654265853e-08, + "loss": 0.0015, + "step": 33992 + }, + { + "epoch": 0.66, + "learning_rate": 6.818764319832239e-08, + "loss": 0.0006, + "step": 33993 + }, + { + "epoch": 0.66, + "learning_rate": 6.818375985398625e-08, + "loss": 0.0005, + "step": 33994 + }, + { + "epoch": 0.66, + "learning_rate": 6.817987650965011e-08, + "loss": 0.0004, + "step": 33995 + }, + { + "epoch": 0.66, + "learning_rate": 6.817599316531397e-08, + "loss": 0.0005, + "step": 33996 + }, + { + "epoch": 0.66, + "learning_rate": 6.817210982097782e-08, + "loss": 0.0004, + "step": 33997 + }, + { + "epoch": 0.66, + "learning_rate": 6.816822647664168e-08, + "loss": 0.0007, + "step": 33998 + }, + { + "epoch": 0.66, + "learning_rate": 6.816434313230554e-08, + "loss": 0.0003, + "step": 33999 + }, + { + "epoch": 0.66, + "learning_rate": 6.81604597879694e-08, + "loss": 0.0003, + "step": 34000 + }, + { + "epoch": 0.66, + "learning_rate": 6.815657644363326e-08, + "loss": 0.0004, + "step": 34001 + }, + { + "epoch": 0.66, + "learning_rate": 6.81526930992971e-08, + "loss": 0.0007, + "step": 34002 + }, + { + "epoch": 0.66, + "learning_rate": 6.814880975496096e-08, + "loss": 0.0045, + "step": 34003 + }, + { + "epoch": 0.66, + "learning_rate": 6.814492641062482e-08, + "loss": 0.0005, + "step": 34004 + }, + { + "epoch": 0.66, + "learning_rate": 6.814104306628868e-08, + "loss": 0.0005, + "step": 34005 + }, + { + "epoch": 0.66, + "learning_rate": 6.813715972195254e-08, + "loss": 0.0006, + "step": 34006 + }, + { + "epoch": 0.66, + "learning_rate": 6.81332763776164e-08, + "loss": 0.7934, + "step": 34007 + }, + { + "epoch": 0.66, + "learning_rate": 6.812939303328025e-08, + "loss": 0.0005, + "step": 34008 + }, + { + "epoch": 0.66, + "learning_rate": 6.812550968894411e-08, + "loss": 0.0006, + "step": 34009 + }, + { + "epoch": 0.66, + "learning_rate": 6.812162634460797e-08, + "loss": 0.0005, + "step": 34010 + }, + { + "epoch": 0.66, + "learning_rate": 6.811774300027183e-08, + "loss": 0.0004, + "step": 34011 + }, + { + "epoch": 0.66, + "learning_rate": 6.811385965593569e-08, + "loss": 1.2073, + "step": 34012 + }, + { + "epoch": 0.66, + "learning_rate": 6.810997631159954e-08, + "loss": 0.0005, + "step": 34013 + }, + { + "epoch": 0.66, + "learning_rate": 6.81060929672634e-08, + "loss": 0.001, + "step": 34014 + }, + { + "epoch": 0.66, + "learning_rate": 6.810220962292726e-08, + "loss": 0.0004, + "step": 34015 + }, + { + "epoch": 0.66, + "learning_rate": 6.809832627859112e-08, + "loss": 0.0004, + "step": 34016 + }, + { + "epoch": 0.66, + "learning_rate": 6.809444293425498e-08, + "loss": 0.0006, + "step": 34017 + }, + { + "epoch": 0.66, + "learning_rate": 6.809055958991883e-08, + "loss": 0.0005, + "step": 34018 + }, + { + "epoch": 0.66, + "learning_rate": 6.808667624558269e-08, + "loss": 0.0008, + "step": 34019 + }, + { + "epoch": 0.66, + "learning_rate": 6.808279290124655e-08, + "loss": 0.0099, + "step": 34020 + }, + { + "epoch": 0.66, + "learning_rate": 6.807890955691041e-08, + "loss": 0.0007, + "step": 34021 + }, + { + "epoch": 0.66, + "learning_rate": 6.807502621257427e-08, + "loss": 0.0259, + "step": 34022 + }, + { + "epoch": 0.66, + "learning_rate": 6.807114286823811e-08, + "loss": 0.0005, + "step": 34023 + }, + { + "epoch": 0.66, + "learning_rate": 6.806725952390197e-08, + "loss": 0.0004, + "step": 34024 + }, + { + "epoch": 0.66, + "learning_rate": 6.806337617956583e-08, + "loss": 0.0006, + "step": 34025 + }, + { + "epoch": 0.66, + "learning_rate": 6.805949283522969e-08, + "loss": 0.0009, + "step": 34026 + }, + { + "epoch": 0.66, + "learning_rate": 6.805560949089355e-08, + "loss": 0.6889, + "step": 34027 + }, + { + "epoch": 0.66, + "learning_rate": 6.80517261465574e-08, + "loss": 0.0004, + "step": 34028 + }, + { + "epoch": 0.66, + "learning_rate": 6.804784280222126e-08, + "loss": 0.0004, + "step": 34029 + }, + { + "epoch": 0.66, + "learning_rate": 6.804395945788512e-08, + "loss": 0.0006, + "step": 34030 + }, + { + "epoch": 0.66, + "learning_rate": 6.804007611354898e-08, + "loss": 0.0006, + "step": 34031 + }, + { + "epoch": 0.66, + "learning_rate": 6.803619276921284e-08, + "loss": 0.0011, + "step": 34032 + }, + { + "epoch": 0.66, + "learning_rate": 6.80323094248767e-08, + "loss": 0.0045, + "step": 34033 + }, + { + "epoch": 0.66, + "learning_rate": 6.802842608054055e-08, + "loss": 0.0005, + "step": 34034 + }, + { + "epoch": 0.66, + "learning_rate": 6.802454273620441e-08, + "loss": 0.0167, + "step": 34035 + }, + { + "epoch": 0.66, + "learning_rate": 6.802065939186827e-08, + "loss": 0.0004, + "step": 34036 + }, + { + "epoch": 0.66, + "learning_rate": 6.801677604753213e-08, + "loss": 0.7623, + "step": 34037 + }, + { + "epoch": 0.66, + "learning_rate": 6.801289270319599e-08, + "loss": 0.0003, + "step": 34038 + }, + { + "epoch": 0.66, + "learning_rate": 6.800900935885984e-08, + "loss": 0.0005, + "step": 34039 + }, + { + "epoch": 0.66, + "learning_rate": 6.80051260145237e-08, + "loss": 0.0004, + "step": 34040 + }, + { + "epoch": 0.66, + "learning_rate": 6.800124267018756e-08, + "loss": 0.7456, + "step": 34041 + }, + { + "epoch": 0.66, + "learning_rate": 6.799735932585142e-08, + "loss": 0.0006, + "step": 34042 + }, + { + "epoch": 0.66, + "learning_rate": 6.799347598151528e-08, + "loss": 0.0005, + "step": 34043 + }, + { + "epoch": 0.66, + "learning_rate": 6.798959263717914e-08, + "loss": 0.0006, + "step": 34044 + }, + { + "epoch": 0.66, + "learning_rate": 6.7985709292843e-08, + "loss": 0.0003, + "step": 34045 + }, + { + "epoch": 0.66, + "learning_rate": 6.798182594850685e-08, + "loss": 0.0009, + "step": 34046 + }, + { + "epoch": 0.66, + "learning_rate": 6.797794260417071e-08, + "loss": 0.0004, + "step": 34047 + }, + { + "epoch": 0.66, + "learning_rate": 6.797405925983457e-08, + "loss": 0.0009, + "step": 34048 + }, + { + "epoch": 0.66, + "learning_rate": 6.797017591549843e-08, + "loss": 0.0004, + "step": 34049 + }, + { + "epoch": 0.66, + "learning_rate": 6.796629257116229e-08, + "loss": 0.4034, + "step": 34050 + }, + { + "epoch": 0.66, + "learning_rate": 6.796240922682614e-08, + "loss": 0.0004, + "step": 34051 + }, + { + "epoch": 0.66, + "learning_rate": 6.795852588248999e-08, + "loss": 0.0005, + "step": 34052 + }, + { + "epoch": 0.66, + "learning_rate": 6.795464253815385e-08, + "loss": 0.0019, + "step": 34053 + }, + { + "epoch": 0.66, + "learning_rate": 6.79507591938177e-08, + "loss": 0.0005, + "step": 34054 + }, + { + "epoch": 0.66, + "learning_rate": 6.794687584948156e-08, + "loss": 0.0007, + "step": 34055 + }, + { + "epoch": 0.66, + "learning_rate": 6.794299250514542e-08, + "loss": 0.0008, + "step": 34056 + }, + { + "epoch": 0.66, + "learning_rate": 6.793910916080928e-08, + "loss": 0.0005, + "step": 34057 + }, + { + "epoch": 0.66, + "learning_rate": 6.793522581647314e-08, + "loss": 0.0005, + "step": 34058 + }, + { + "epoch": 0.66, + "learning_rate": 6.7931342472137e-08, + "loss": 0.0004, + "step": 34059 + }, + { + "epoch": 0.66, + "learning_rate": 6.792745912780085e-08, + "loss": 0.0004, + "step": 34060 + }, + { + "epoch": 0.66, + "learning_rate": 6.792357578346471e-08, + "loss": 0.0096, + "step": 34061 + }, + { + "epoch": 0.66, + "learning_rate": 6.791969243912857e-08, + "loss": 0.0005, + "step": 34062 + }, + { + "epoch": 0.66, + "learning_rate": 6.791580909479243e-08, + "loss": 0.0004, + "step": 34063 + }, + { + "epoch": 0.66, + "learning_rate": 6.791192575045629e-08, + "loss": 0.0049, + "step": 34064 + }, + { + "epoch": 0.66, + "learning_rate": 6.790804240612015e-08, + "loss": 0.0005, + "step": 34065 + }, + { + "epoch": 0.66, + "learning_rate": 6.7904159061784e-08, + "loss": 0.0004, + "step": 34066 + }, + { + "epoch": 0.66, + "learning_rate": 6.790027571744786e-08, + "loss": 0.0006, + "step": 34067 + }, + { + "epoch": 0.66, + "learning_rate": 6.789639237311172e-08, + "loss": 0.0005, + "step": 34068 + }, + { + "epoch": 0.66, + "learning_rate": 6.789250902877558e-08, + "loss": 0.0005, + "step": 34069 + }, + { + "epoch": 0.66, + "learning_rate": 6.788862568443944e-08, + "loss": 0.0005, + "step": 34070 + }, + { + "epoch": 0.66, + "learning_rate": 6.78847423401033e-08, + "loss": 0.0004, + "step": 34071 + }, + { + "epoch": 0.66, + "learning_rate": 6.788085899576715e-08, + "loss": 0.0006, + "step": 34072 + }, + { + "epoch": 0.66, + "learning_rate": 6.787697565143101e-08, + "loss": 0.0006, + "step": 34073 + }, + { + "epoch": 0.66, + "learning_rate": 6.787309230709487e-08, + "loss": 0.0005, + "step": 34074 + }, + { + "epoch": 0.66, + "learning_rate": 6.786920896275873e-08, + "loss": 0.0005, + "step": 34075 + }, + { + "epoch": 0.66, + "learning_rate": 6.786532561842259e-08, + "loss": 0.0006, + "step": 34076 + }, + { + "epoch": 0.66, + "learning_rate": 6.786144227408644e-08, + "loss": 0.0006, + "step": 34077 + }, + { + "epoch": 0.66, + "learning_rate": 6.78575589297503e-08, + "loss": 0.0006, + "step": 34078 + }, + { + "epoch": 0.66, + "learning_rate": 6.785367558541416e-08, + "loss": 0.5531, + "step": 34079 + }, + { + "epoch": 0.66, + "learning_rate": 6.784979224107802e-08, + "loss": 0.0004, + "step": 34080 + }, + { + "epoch": 0.66, + "learning_rate": 6.784590889674186e-08, + "loss": 0.0023, + "step": 34081 + }, + { + "epoch": 0.66, + "learning_rate": 6.784202555240572e-08, + "loss": 0.0986, + "step": 34082 + }, + { + "epoch": 0.66, + "learning_rate": 6.783814220806958e-08, + "loss": 0.0006, + "step": 34083 + }, + { + "epoch": 0.66, + "learning_rate": 6.783425886373344e-08, + "loss": 0.0004, + "step": 34084 + }, + { + "epoch": 0.66, + "learning_rate": 6.78303755193973e-08, + "loss": 0.0006, + "step": 34085 + }, + { + "epoch": 0.66, + "learning_rate": 6.782649217506116e-08, + "loss": 0.0006, + "step": 34086 + }, + { + "epoch": 0.66, + "learning_rate": 6.782260883072501e-08, + "loss": 0.0006, + "step": 34087 + }, + { + "epoch": 0.66, + "learning_rate": 6.781872548638887e-08, + "loss": 0.0004, + "step": 34088 + }, + { + "epoch": 0.66, + "learning_rate": 6.781484214205273e-08, + "loss": 0.0005, + "step": 34089 + }, + { + "epoch": 0.66, + "learning_rate": 6.781095879771659e-08, + "loss": 0.0003, + "step": 34090 + }, + { + "epoch": 0.66, + "learning_rate": 6.780707545338045e-08, + "loss": 0.0094, + "step": 34091 + }, + { + "epoch": 0.66, + "learning_rate": 6.78031921090443e-08, + "loss": 0.0004, + "step": 34092 + }, + { + "epoch": 0.66, + "learning_rate": 6.779930876470816e-08, + "loss": 0.0007, + "step": 34093 + }, + { + "epoch": 0.66, + "learning_rate": 6.779542542037202e-08, + "loss": 0.0004, + "step": 34094 + }, + { + "epoch": 0.66, + "learning_rate": 6.779154207603588e-08, + "loss": 0.0008, + "step": 34095 + }, + { + "epoch": 0.66, + "learning_rate": 6.778765873169974e-08, + "loss": 0.1629, + "step": 34096 + }, + { + "epoch": 0.66, + "learning_rate": 6.77837753873636e-08, + "loss": 0.0003, + "step": 34097 + }, + { + "epoch": 0.66, + "learning_rate": 6.777989204302745e-08, + "loss": 0.0004, + "step": 34098 + }, + { + "epoch": 0.66, + "learning_rate": 6.777600869869131e-08, + "loss": 0.0033, + "step": 34099 + }, + { + "epoch": 0.66, + "learning_rate": 6.777212535435517e-08, + "loss": 0.0156, + "step": 34100 + }, + { + "epoch": 0.66, + "learning_rate": 6.776824201001903e-08, + "loss": 0.0005, + "step": 34101 + }, + { + "epoch": 0.66, + "learning_rate": 6.776435866568289e-08, + "loss": 0.0006, + "step": 34102 + }, + { + "epoch": 0.66, + "learning_rate": 6.776047532134675e-08, + "loss": 0.0004, + "step": 34103 + }, + { + "epoch": 0.66, + "learning_rate": 6.77565919770106e-08, + "loss": 0.0006, + "step": 34104 + }, + { + "epoch": 0.66, + "learning_rate": 6.775270863267446e-08, + "loss": 0.0005, + "step": 34105 + }, + { + "epoch": 0.66, + "learning_rate": 6.774882528833832e-08, + "loss": 0.005, + "step": 34106 + }, + { + "epoch": 0.66, + "learning_rate": 6.774494194400218e-08, + "loss": 0.0003, + "step": 34107 + }, + { + "epoch": 0.66, + "learning_rate": 6.774105859966604e-08, + "loss": 0.0017, + "step": 34108 + }, + { + "epoch": 0.66, + "learning_rate": 6.77371752553299e-08, + "loss": 0.294, + "step": 34109 + }, + { + "epoch": 0.66, + "learning_rate": 6.773329191099374e-08, + "loss": 0.0007, + "step": 34110 + }, + { + "epoch": 0.66, + "learning_rate": 6.77294085666576e-08, + "loss": 0.0004, + "step": 34111 + }, + { + "epoch": 0.66, + "learning_rate": 6.772552522232146e-08, + "loss": 0.0006, + "step": 34112 + }, + { + "epoch": 0.66, + "learning_rate": 6.772164187798532e-08, + "loss": 0.0005, + "step": 34113 + }, + { + "epoch": 0.66, + "learning_rate": 6.771775853364917e-08, + "loss": 0.003, + "step": 34114 + }, + { + "epoch": 0.66, + "learning_rate": 6.771387518931303e-08, + "loss": 0.0006, + "step": 34115 + }, + { + "epoch": 0.66, + "learning_rate": 6.770999184497689e-08, + "loss": 0.0006, + "step": 34116 + }, + { + "epoch": 0.66, + "learning_rate": 6.770610850064075e-08, + "loss": 0.8113, + "step": 34117 + }, + { + "epoch": 0.66, + "learning_rate": 6.77022251563046e-08, + "loss": 0.0004, + "step": 34118 + }, + { + "epoch": 0.66, + "learning_rate": 6.769834181196846e-08, + "loss": 0.0005, + "step": 34119 + }, + { + "epoch": 0.66, + "learning_rate": 6.769445846763232e-08, + "loss": 0.0004, + "step": 34120 + }, + { + "epoch": 0.66, + "learning_rate": 6.769057512329618e-08, + "loss": 0.0006, + "step": 34121 + }, + { + "epoch": 0.66, + "learning_rate": 6.768669177896004e-08, + "loss": 0.0005, + "step": 34122 + }, + { + "epoch": 0.66, + "learning_rate": 6.76828084346239e-08, + "loss": 0.0004, + "step": 34123 + }, + { + "epoch": 0.66, + "learning_rate": 6.767892509028776e-08, + "loss": 1.1969, + "step": 34124 + }, + { + "epoch": 0.66, + "learning_rate": 6.767504174595161e-08, + "loss": 0.0005, + "step": 34125 + }, + { + "epoch": 0.66, + "learning_rate": 6.767115840161547e-08, + "loss": 0.0007, + "step": 34126 + }, + { + "epoch": 0.66, + "learning_rate": 6.766727505727933e-08, + "loss": 0.0006, + "step": 34127 + }, + { + "epoch": 0.66, + "learning_rate": 6.766339171294319e-08, + "loss": 0.0009, + "step": 34128 + }, + { + "epoch": 0.66, + "learning_rate": 6.765950836860705e-08, + "loss": 0.0006, + "step": 34129 + }, + { + "epoch": 0.66, + "learning_rate": 6.76556250242709e-08, + "loss": 0.0006, + "step": 34130 + }, + { + "epoch": 0.66, + "learning_rate": 6.765174167993476e-08, + "loss": 0.0004, + "step": 34131 + }, + { + "epoch": 0.66, + "learning_rate": 6.764785833559862e-08, + "loss": 0.0003, + "step": 34132 + }, + { + "epoch": 0.66, + "learning_rate": 6.764397499126248e-08, + "loss": 0.0003, + "step": 34133 + }, + { + "epoch": 0.66, + "learning_rate": 6.764009164692634e-08, + "loss": 0.0005, + "step": 34134 + }, + { + "epoch": 0.66, + "learning_rate": 6.76362083025902e-08, + "loss": 0.0007, + "step": 34135 + }, + { + "epoch": 0.66, + "learning_rate": 6.763232495825405e-08, + "loss": 0.0006, + "step": 34136 + }, + { + "epoch": 0.66, + "learning_rate": 6.762844161391791e-08, + "loss": 0.0005, + "step": 34137 + }, + { + "epoch": 0.66, + "learning_rate": 6.762455826958177e-08, + "loss": 0.091, + "step": 34138 + }, + { + "epoch": 0.66, + "learning_rate": 6.762067492524562e-08, + "loss": 0.0004, + "step": 34139 + }, + { + "epoch": 0.66, + "learning_rate": 6.761679158090947e-08, + "loss": 0.0005, + "step": 34140 + }, + { + "epoch": 0.66, + "learning_rate": 6.761290823657333e-08, + "loss": 0.0004, + "step": 34141 + }, + { + "epoch": 0.66, + "learning_rate": 6.760902489223719e-08, + "loss": 0.0005, + "step": 34142 + }, + { + "epoch": 0.66, + "learning_rate": 6.760514154790105e-08, + "loss": 0.0206, + "step": 34143 + }, + { + "epoch": 0.66, + "learning_rate": 6.760125820356491e-08, + "loss": 0.0005, + "step": 34144 + }, + { + "epoch": 0.66, + "learning_rate": 6.759737485922877e-08, + "loss": 0.0034, + "step": 34145 + }, + { + "epoch": 0.66, + "learning_rate": 6.759349151489262e-08, + "loss": 0.0986, + "step": 34146 + }, + { + "epoch": 0.66, + "learning_rate": 6.758960817055648e-08, + "loss": 0.0004, + "step": 34147 + }, + { + "epoch": 0.66, + "learning_rate": 6.758572482622034e-08, + "loss": 0.0117, + "step": 34148 + }, + { + "epoch": 0.66, + "learning_rate": 6.75818414818842e-08, + "loss": 0.0003, + "step": 34149 + }, + { + "epoch": 0.66, + "learning_rate": 6.757795813754806e-08, + "loss": 0.0006, + "step": 34150 + }, + { + "epoch": 0.66, + "learning_rate": 6.757407479321192e-08, + "loss": 0.0005, + "step": 34151 + }, + { + "epoch": 0.66, + "learning_rate": 6.757019144887577e-08, + "loss": 0.0008, + "step": 34152 + }, + { + "epoch": 0.66, + "learning_rate": 6.756630810453963e-08, + "loss": 0.0007, + "step": 34153 + }, + { + "epoch": 0.66, + "learning_rate": 6.756242476020349e-08, + "loss": 0.1561, + "step": 34154 + }, + { + "epoch": 0.66, + "learning_rate": 6.755854141586735e-08, + "loss": 0.0006, + "step": 34155 + }, + { + "epoch": 0.66, + "learning_rate": 6.75546580715312e-08, + "loss": 0.0004, + "step": 34156 + }, + { + "epoch": 0.66, + "learning_rate": 6.755077472719506e-08, + "loss": 0.0004, + "step": 34157 + }, + { + "epoch": 0.66, + "learning_rate": 6.754689138285892e-08, + "loss": 0.0012, + "step": 34158 + }, + { + "epoch": 0.66, + "learning_rate": 6.754300803852278e-08, + "loss": 0.0004, + "step": 34159 + }, + { + "epoch": 0.66, + "learning_rate": 6.753912469418664e-08, + "loss": 0.0064, + "step": 34160 + }, + { + "epoch": 0.66, + "learning_rate": 6.75352413498505e-08, + "loss": 0.0004, + "step": 34161 + }, + { + "epoch": 0.66, + "learning_rate": 6.753135800551436e-08, + "loss": 0.0005, + "step": 34162 + }, + { + "epoch": 0.66, + "learning_rate": 6.752747466117821e-08, + "loss": 0.0004, + "step": 34163 + }, + { + "epoch": 0.66, + "learning_rate": 6.752359131684206e-08, + "loss": 0.0005, + "step": 34164 + }, + { + "epoch": 0.66, + "learning_rate": 6.751970797250592e-08, + "loss": 0.0007, + "step": 34165 + }, + { + "epoch": 0.66, + "learning_rate": 6.751582462816978e-08, + "loss": 0.0004, + "step": 34166 + }, + { + "epoch": 0.66, + "learning_rate": 6.751194128383363e-08, + "loss": 1.3159, + "step": 34167 + }, + { + "epoch": 0.66, + "learning_rate": 6.750805793949749e-08, + "loss": 0.0004, + "step": 34168 + }, + { + "epoch": 0.66, + "learning_rate": 6.750417459516135e-08, + "loss": 0.0004, + "step": 34169 + }, + { + "epoch": 0.66, + "learning_rate": 6.750029125082521e-08, + "loss": 0.0004, + "step": 34170 + }, + { + "epoch": 0.66, + "learning_rate": 6.749640790648907e-08, + "loss": 0.0003, + "step": 34171 + }, + { + "epoch": 0.66, + "learning_rate": 6.749252456215293e-08, + "loss": 0.0004, + "step": 34172 + }, + { + "epoch": 0.66, + "learning_rate": 6.748864121781678e-08, + "loss": 0.0005, + "step": 34173 + }, + { + "epoch": 0.66, + "learning_rate": 6.748475787348064e-08, + "loss": 0.0007, + "step": 34174 + }, + { + "epoch": 0.66, + "learning_rate": 6.74808745291445e-08, + "loss": 0.0012, + "step": 34175 + }, + { + "epoch": 0.66, + "learning_rate": 6.747699118480836e-08, + "loss": 0.0003, + "step": 34176 + }, + { + "epoch": 0.66, + "learning_rate": 6.747310784047222e-08, + "loss": 0.9606, + "step": 34177 + }, + { + "epoch": 0.66, + "learning_rate": 6.746922449613607e-08, + "loss": 0.0003, + "step": 34178 + }, + { + "epoch": 0.66, + "learning_rate": 6.746534115179992e-08, + "loss": 0.0152, + "step": 34179 + }, + { + "epoch": 0.66, + "learning_rate": 6.746145780746378e-08, + "loss": 0.0004, + "step": 34180 + }, + { + "epoch": 0.66, + "learning_rate": 6.745757446312764e-08, + "loss": 0.0003, + "step": 34181 + }, + { + "epoch": 0.66, + "learning_rate": 6.74536911187915e-08, + "loss": 0.0005, + "step": 34182 + }, + { + "epoch": 0.66, + "learning_rate": 6.744980777445535e-08, + "loss": 0.0016, + "step": 34183 + }, + { + "epoch": 0.66, + "learning_rate": 6.744592443011921e-08, + "loss": 0.0004, + "step": 34184 + }, + { + "epoch": 0.66, + "learning_rate": 6.744204108578307e-08, + "loss": 0.0004, + "step": 34185 + }, + { + "epoch": 0.66, + "learning_rate": 6.743815774144693e-08, + "loss": 0.0005, + "step": 34186 + }, + { + "epoch": 0.66, + "learning_rate": 6.743427439711079e-08, + "loss": 0.0005, + "step": 34187 + }, + { + "epoch": 0.66, + "learning_rate": 6.743039105277464e-08, + "loss": 0.0004, + "step": 34188 + }, + { + "epoch": 0.66, + "learning_rate": 6.74265077084385e-08, + "loss": 0.2857, + "step": 34189 + }, + { + "epoch": 0.66, + "learning_rate": 6.742262436410236e-08, + "loss": 0.0004, + "step": 34190 + }, + { + "epoch": 0.66, + "learning_rate": 6.741874101976622e-08, + "loss": 0.0004, + "step": 34191 + }, + { + "epoch": 0.66, + "learning_rate": 6.741485767543008e-08, + "loss": 0.0003, + "step": 34192 + }, + { + "epoch": 0.66, + "learning_rate": 6.741097433109393e-08, + "loss": 0.0005, + "step": 34193 + }, + { + "epoch": 0.66, + "learning_rate": 6.740709098675779e-08, + "loss": 0.0005, + "step": 34194 + }, + { + "epoch": 0.66, + "learning_rate": 6.740320764242165e-08, + "loss": 0.0006, + "step": 34195 + }, + { + "epoch": 0.66, + "learning_rate": 6.739932429808551e-08, + "loss": 0.0006, + "step": 34196 + }, + { + "epoch": 0.66, + "learning_rate": 6.739544095374935e-08, + "loss": 0.0004, + "step": 34197 + }, + { + "epoch": 0.66, + "learning_rate": 6.739155760941321e-08, + "loss": 0.0005, + "step": 34198 + }, + { + "epoch": 0.66, + "learning_rate": 6.738767426507707e-08, + "loss": 0.001, + "step": 34199 + }, + { + "epoch": 0.66, + "learning_rate": 6.738379092074093e-08, + "loss": 0.0008, + "step": 34200 + }, + { + "epoch": 0.66, + "learning_rate": 6.737990757640479e-08, + "loss": 0.2026, + "step": 34201 + }, + { + "epoch": 0.66, + "learning_rate": 6.737602423206865e-08, + "loss": 0.0004, + "step": 34202 + }, + { + "epoch": 0.66, + "learning_rate": 6.73721408877325e-08, + "loss": 0.0005, + "step": 34203 + }, + { + "epoch": 0.66, + "learning_rate": 6.736825754339636e-08, + "loss": 0.0004, + "step": 34204 + }, + { + "epoch": 0.66, + "learning_rate": 6.736437419906022e-08, + "loss": 0.3091, + "step": 34205 + }, + { + "epoch": 0.66, + "learning_rate": 6.736049085472408e-08, + "loss": 0.6195, + "step": 34206 + }, + { + "epoch": 0.66, + "learning_rate": 6.735660751038794e-08, + "loss": 0.1306, + "step": 34207 + }, + { + "epoch": 0.66, + "learning_rate": 6.73527241660518e-08, + "loss": 0.0005, + "step": 34208 + }, + { + "epoch": 0.66, + "learning_rate": 6.734884082171565e-08, + "loss": 0.0005, + "step": 34209 + }, + { + "epoch": 0.66, + "learning_rate": 6.734495747737951e-08, + "loss": 0.0003, + "step": 34210 + }, + { + "epoch": 0.66, + "learning_rate": 6.734107413304337e-08, + "loss": 0.0004, + "step": 34211 + }, + { + "epoch": 0.66, + "learning_rate": 6.733719078870723e-08, + "loss": 0.0006, + "step": 34212 + }, + { + "epoch": 0.66, + "learning_rate": 6.733330744437109e-08, + "loss": 0.0878, + "step": 34213 + }, + { + "epoch": 0.66, + "learning_rate": 6.732942410003494e-08, + "loss": 0.0003, + "step": 34214 + }, + { + "epoch": 0.66, + "learning_rate": 6.73255407556988e-08, + "loss": 0.0005, + "step": 34215 + }, + { + "epoch": 0.66, + "learning_rate": 6.732165741136266e-08, + "loss": 0.0003, + "step": 34216 + }, + { + "epoch": 0.66, + "learning_rate": 6.731777406702652e-08, + "loss": 0.0004, + "step": 34217 + }, + { + "epoch": 0.66, + "learning_rate": 6.731389072269038e-08, + "loss": 0.0016, + "step": 34218 + }, + { + "epoch": 0.66, + "learning_rate": 6.731000737835424e-08, + "loss": 0.0004, + "step": 34219 + }, + { + "epoch": 0.66, + "learning_rate": 6.73061240340181e-08, + "loss": 0.0004, + "step": 34220 + }, + { + "epoch": 0.66, + "learning_rate": 6.730224068968195e-08, + "loss": 0.0004, + "step": 34221 + }, + { + "epoch": 0.66, + "learning_rate": 6.729835734534581e-08, + "loss": 0.0241, + "step": 34222 + }, + { + "epoch": 0.66, + "learning_rate": 6.729447400100967e-08, + "loss": 0.0005, + "step": 34223 + }, + { + "epoch": 0.66, + "learning_rate": 6.729059065667353e-08, + "loss": 0.0007, + "step": 34224 + }, + { + "epoch": 0.66, + "learning_rate": 6.728670731233739e-08, + "loss": 0.0004, + "step": 34225 + }, + { + "epoch": 0.66, + "learning_rate": 6.728282396800123e-08, + "loss": 0.1138, + "step": 34226 + }, + { + "epoch": 0.66, + "learning_rate": 6.727894062366509e-08, + "loss": 0.0004, + "step": 34227 + }, + { + "epoch": 0.66, + "learning_rate": 6.727505727932895e-08, + "loss": 0.0004, + "step": 34228 + }, + { + "epoch": 0.66, + "learning_rate": 6.72711739349928e-08, + "loss": 0.0005, + "step": 34229 + }, + { + "epoch": 0.66, + "learning_rate": 6.726729059065666e-08, + "loss": 0.7051, + "step": 34230 + }, + { + "epoch": 0.66, + "learning_rate": 6.726340724632052e-08, + "loss": 0.0004, + "step": 34231 + }, + { + "epoch": 0.66, + "learning_rate": 6.725952390198438e-08, + "loss": 0.0006, + "step": 34232 + }, + { + "epoch": 0.66, + "learning_rate": 6.725564055764824e-08, + "loss": 0.0006, + "step": 34233 + }, + { + "epoch": 0.66, + "learning_rate": 6.72517572133121e-08, + "loss": 0.0004, + "step": 34234 + }, + { + "epoch": 0.66, + "learning_rate": 6.724787386897595e-08, + "loss": 0.0004, + "step": 34235 + }, + { + "epoch": 0.66, + "learning_rate": 6.724399052463981e-08, + "loss": 0.0005, + "step": 34236 + }, + { + "epoch": 0.66, + "learning_rate": 6.724010718030367e-08, + "loss": 0.0006, + "step": 34237 + }, + { + "epoch": 0.66, + "learning_rate": 6.723622383596753e-08, + "loss": 0.0006, + "step": 34238 + }, + { + "epoch": 0.66, + "learning_rate": 6.723234049163139e-08, + "loss": 0.0006, + "step": 34239 + }, + { + "epoch": 0.66, + "learning_rate": 6.722845714729525e-08, + "loss": 0.0004, + "step": 34240 + }, + { + "epoch": 0.66, + "learning_rate": 6.72245738029591e-08, + "loss": 0.0006, + "step": 34241 + }, + { + "epoch": 0.66, + "learning_rate": 6.722069045862296e-08, + "loss": 0.0006, + "step": 34242 + }, + { + "epoch": 0.66, + "learning_rate": 6.721680711428682e-08, + "loss": 0.003, + "step": 34243 + }, + { + "epoch": 0.66, + "learning_rate": 6.721292376995068e-08, + "loss": 0.0005, + "step": 34244 + }, + { + "epoch": 0.66, + "learning_rate": 6.720904042561454e-08, + "loss": 0.0005, + "step": 34245 + }, + { + "epoch": 0.66, + "learning_rate": 6.72051570812784e-08, + "loss": 0.0042, + "step": 34246 + }, + { + "epoch": 0.66, + "learning_rate": 6.720127373694225e-08, + "loss": 0.0004, + "step": 34247 + }, + { + "epoch": 0.66, + "learning_rate": 6.719739039260611e-08, + "loss": 0.0004, + "step": 34248 + }, + { + "epoch": 0.66, + "learning_rate": 6.719350704826997e-08, + "loss": 0.0005, + "step": 34249 + }, + { + "epoch": 0.66, + "learning_rate": 6.718962370393383e-08, + "loss": 0.0004, + "step": 34250 + }, + { + "epoch": 0.66, + "learning_rate": 6.718574035959769e-08, + "loss": 0.0008, + "step": 34251 + }, + { + "epoch": 0.66, + "learning_rate": 6.718185701526154e-08, + "loss": 0.0004, + "step": 34252 + }, + { + "epoch": 0.66, + "learning_rate": 6.71779736709254e-08, + "loss": 0.0004, + "step": 34253 + }, + { + "epoch": 0.66, + "learning_rate": 6.717409032658926e-08, + "loss": 0.0005, + "step": 34254 + }, + { + "epoch": 0.66, + "learning_rate": 6.71702069822531e-08, + "loss": 0.0006, + "step": 34255 + }, + { + "epoch": 0.66, + "learning_rate": 6.716632363791696e-08, + "loss": 0.0008, + "step": 34256 + }, + { + "epoch": 0.66, + "learning_rate": 6.716244029358082e-08, + "loss": 0.0004, + "step": 34257 + }, + { + "epoch": 0.66, + "learning_rate": 6.715855694924468e-08, + "loss": 0.0015, + "step": 34258 + }, + { + "epoch": 0.66, + "learning_rate": 6.715467360490854e-08, + "loss": 0.0007, + "step": 34259 + }, + { + "epoch": 0.66, + "learning_rate": 6.71507902605724e-08, + "loss": 0.0005, + "step": 34260 + }, + { + "epoch": 0.66, + "learning_rate": 6.714690691623626e-08, + "loss": 0.0004, + "step": 34261 + }, + { + "epoch": 0.66, + "learning_rate": 6.714302357190011e-08, + "loss": 0.0004, + "step": 34262 + }, + { + "epoch": 0.66, + "learning_rate": 6.713914022756397e-08, + "loss": 0.0257, + "step": 34263 + }, + { + "epoch": 0.66, + "learning_rate": 6.713525688322783e-08, + "loss": 0.5098, + "step": 34264 + }, + { + "epoch": 0.66, + "learning_rate": 6.713137353889169e-08, + "loss": 0.0009, + "step": 34265 + }, + { + "epoch": 0.66, + "learning_rate": 6.712749019455555e-08, + "loss": 0.4699, + "step": 34266 + }, + { + "epoch": 0.66, + "learning_rate": 6.71236068502194e-08, + "loss": 0.0005, + "step": 34267 + }, + { + "epoch": 0.66, + "learning_rate": 6.711972350588326e-08, + "loss": 0.0007, + "step": 34268 + }, + { + "epoch": 0.66, + "learning_rate": 6.711584016154712e-08, + "loss": 0.0007, + "step": 34269 + }, + { + "epoch": 0.66, + "learning_rate": 6.711195681721098e-08, + "loss": 0.0004, + "step": 34270 + }, + { + "epoch": 0.66, + "learning_rate": 6.710807347287484e-08, + "loss": 0.0011, + "step": 34271 + }, + { + "epoch": 0.66, + "learning_rate": 6.71041901285387e-08, + "loss": 0.0008, + "step": 34272 + }, + { + "epoch": 0.66, + "learning_rate": 6.710030678420255e-08, + "loss": 0.0004, + "step": 34273 + }, + { + "epoch": 0.66, + "learning_rate": 6.709642343986641e-08, + "loss": 0.0005, + "step": 34274 + }, + { + "epoch": 0.66, + "learning_rate": 6.709254009553027e-08, + "loss": 0.0006, + "step": 34275 + }, + { + "epoch": 0.66, + "learning_rate": 6.708865675119413e-08, + "loss": 0.0006, + "step": 34276 + }, + { + "epoch": 0.66, + "learning_rate": 6.708477340685799e-08, + "loss": 0.0012, + "step": 34277 + }, + { + "epoch": 0.66, + "learning_rate": 6.708089006252185e-08, + "loss": 0.0006, + "step": 34278 + }, + { + "epoch": 0.66, + "learning_rate": 6.70770067181857e-08, + "loss": 0.0004, + "step": 34279 + }, + { + "epoch": 0.66, + "learning_rate": 6.707312337384956e-08, + "loss": 0.0005, + "step": 34280 + }, + { + "epoch": 0.66, + "learning_rate": 6.706924002951342e-08, + "loss": 0.0004, + "step": 34281 + }, + { + "epoch": 0.66, + "learning_rate": 6.706535668517728e-08, + "loss": 0.0003, + "step": 34282 + }, + { + "epoch": 0.67, + "learning_rate": 6.706147334084114e-08, + "loss": 0.0007, + "step": 34283 + }, + { + "epoch": 0.67, + "learning_rate": 6.705758999650498e-08, + "loss": 0.0003, + "step": 34284 + }, + { + "epoch": 0.67, + "learning_rate": 6.705370665216884e-08, + "loss": 0.0004, + "step": 34285 + }, + { + "epoch": 0.67, + "learning_rate": 6.70498233078327e-08, + "loss": 0.1144, + "step": 34286 + }, + { + "epoch": 0.67, + "learning_rate": 6.704593996349656e-08, + "loss": 0.0003, + "step": 34287 + }, + { + "epoch": 0.67, + "learning_rate": 6.704205661916042e-08, + "loss": 0.0004, + "step": 34288 + }, + { + "epoch": 0.67, + "learning_rate": 6.703817327482427e-08, + "loss": 0.0004, + "step": 34289 + }, + { + "epoch": 0.67, + "learning_rate": 6.703428993048813e-08, + "loss": 0.0004, + "step": 34290 + }, + { + "epoch": 0.67, + "learning_rate": 6.703040658615199e-08, + "loss": 0.0006, + "step": 34291 + }, + { + "epoch": 0.67, + "learning_rate": 6.702652324181585e-08, + "loss": 0.0004, + "step": 34292 + }, + { + "epoch": 0.67, + "learning_rate": 6.70226398974797e-08, + "loss": 0.0004, + "step": 34293 + }, + { + "epoch": 0.67, + "learning_rate": 6.701875655314356e-08, + "loss": 0.0074, + "step": 34294 + }, + { + "epoch": 0.67, + "learning_rate": 6.701487320880742e-08, + "loss": 0.0213, + "step": 34295 + }, + { + "epoch": 0.67, + "learning_rate": 6.701098986447128e-08, + "loss": 0.0005, + "step": 34296 + }, + { + "epoch": 0.67, + "learning_rate": 6.700710652013514e-08, + "loss": 0.0006, + "step": 34297 + }, + { + "epoch": 0.67, + "learning_rate": 6.7003223175799e-08, + "loss": 0.0005, + "step": 34298 + }, + { + "epoch": 0.67, + "learning_rate": 6.699933983146286e-08, + "loss": 0.0151, + "step": 34299 + }, + { + "epoch": 0.67, + "learning_rate": 6.699545648712671e-08, + "loss": 0.0004, + "step": 34300 + }, + { + "epoch": 0.67, + "learning_rate": 6.699157314279057e-08, + "loss": 0.0005, + "step": 34301 + }, + { + "epoch": 0.67, + "learning_rate": 6.698768979845443e-08, + "loss": 0.0006, + "step": 34302 + }, + { + "epoch": 0.67, + "learning_rate": 6.698380645411829e-08, + "loss": 0.0004, + "step": 34303 + }, + { + "epoch": 0.67, + "learning_rate": 6.697992310978215e-08, + "loss": 0.0022, + "step": 34304 + }, + { + "epoch": 0.67, + "learning_rate": 6.6976039765446e-08, + "loss": 0.0004, + "step": 34305 + }, + { + "epoch": 0.67, + "learning_rate": 6.697215642110986e-08, + "loss": 0.0004, + "step": 34306 + }, + { + "epoch": 0.67, + "learning_rate": 6.696827307677372e-08, + "loss": 0.0004, + "step": 34307 + }, + { + "epoch": 0.67, + "learning_rate": 6.696438973243758e-08, + "loss": 0.0008, + "step": 34308 + }, + { + "epoch": 0.67, + "learning_rate": 6.696050638810144e-08, + "loss": 0.1121, + "step": 34309 + }, + { + "epoch": 0.67, + "learning_rate": 6.69566230437653e-08, + "loss": 0.0003, + "step": 34310 + }, + { + "epoch": 0.67, + "learning_rate": 6.695273969942915e-08, + "loss": 0.0264, + "step": 34311 + }, + { + "epoch": 0.67, + "learning_rate": 6.694885635509301e-08, + "loss": 0.6763, + "step": 34312 + }, + { + "epoch": 0.67, + "learning_rate": 6.694497301075686e-08, + "loss": 0.0005, + "step": 34313 + }, + { + "epoch": 0.67, + "learning_rate": 6.694108966642072e-08, + "loss": 0.0003, + "step": 34314 + }, + { + "epoch": 0.67, + "learning_rate": 6.693720632208457e-08, + "loss": 0.0004, + "step": 34315 + }, + { + "epoch": 0.67, + "learning_rate": 6.693332297774843e-08, + "loss": 0.0005, + "step": 34316 + }, + { + "epoch": 0.67, + "learning_rate": 6.692943963341229e-08, + "loss": 0.0006, + "step": 34317 + }, + { + "epoch": 0.67, + "learning_rate": 6.692555628907615e-08, + "loss": 0.0006, + "step": 34318 + }, + { + "epoch": 0.67, + "learning_rate": 6.692167294474001e-08, + "loss": 0.0005, + "step": 34319 + }, + { + "epoch": 0.67, + "learning_rate": 6.691778960040387e-08, + "loss": 0.0951, + "step": 34320 + }, + { + "epoch": 0.67, + "learning_rate": 6.691390625606772e-08, + "loss": 0.0004, + "step": 34321 + }, + { + "epoch": 0.67, + "learning_rate": 6.691002291173158e-08, + "loss": 0.0005, + "step": 34322 + }, + { + "epoch": 0.67, + "learning_rate": 6.690613956739544e-08, + "loss": 0.0004, + "step": 34323 + }, + { + "epoch": 0.67, + "learning_rate": 6.69022562230593e-08, + "loss": 0.0007, + "step": 34324 + }, + { + "epoch": 0.67, + "learning_rate": 6.689837287872316e-08, + "loss": 0.0005, + "step": 34325 + }, + { + "epoch": 0.67, + "learning_rate": 6.689448953438702e-08, + "loss": 0.0006, + "step": 34326 + }, + { + "epoch": 0.67, + "learning_rate": 6.689060619005087e-08, + "loss": 0.0004, + "step": 34327 + }, + { + "epoch": 0.67, + "learning_rate": 6.688672284571473e-08, + "loss": 0.0006, + "step": 34328 + }, + { + "epoch": 0.67, + "learning_rate": 6.688283950137859e-08, + "loss": 0.0003, + "step": 34329 + }, + { + "epoch": 0.67, + "learning_rate": 6.687895615704245e-08, + "loss": 1.3751, + "step": 34330 + }, + { + "epoch": 0.67, + "learning_rate": 6.68750728127063e-08, + "loss": 0.0005, + "step": 34331 + }, + { + "epoch": 0.67, + "learning_rate": 6.687118946837016e-08, + "loss": 0.815, + "step": 34332 + }, + { + "epoch": 0.67, + "learning_rate": 6.686730612403402e-08, + "loss": 0.0006, + "step": 34333 + }, + { + "epoch": 0.67, + "learning_rate": 6.686342277969788e-08, + "loss": 0.0005, + "step": 34334 + }, + { + "epoch": 0.67, + "learning_rate": 6.685953943536174e-08, + "loss": 0.0005, + "step": 34335 + }, + { + "epoch": 0.67, + "learning_rate": 6.68556560910256e-08, + "loss": 0.0004, + "step": 34336 + }, + { + "epoch": 0.67, + "learning_rate": 6.685177274668946e-08, + "loss": 0.0004, + "step": 34337 + }, + { + "epoch": 0.67, + "learning_rate": 6.684788940235331e-08, + "loss": 0.0011, + "step": 34338 + }, + { + "epoch": 0.67, + "learning_rate": 6.684400605801717e-08, + "loss": 0.0004, + "step": 34339 + }, + { + "epoch": 0.67, + "learning_rate": 6.684012271368103e-08, + "loss": 0.0005, + "step": 34340 + }, + { + "epoch": 0.67, + "learning_rate": 6.683623936934488e-08, + "loss": 0.0003, + "step": 34341 + }, + { + "epoch": 0.67, + "learning_rate": 6.683235602500873e-08, + "loss": 0.7435, + "step": 34342 + }, + { + "epoch": 0.67, + "learning_rate": 6.682847268067259e-08, + "loss": 0.0004, + "step": 34343 + }, + { + "epoch": 0.67, + "learning_rate": 6.682458933633645e-08, + "loss": 0.0043, + "step": 34344 + }, + { + "epoch": 0.67, + "learning_rate": 6.682070599200031e-08, + "loss": 0.0005, + "step": 34345 + }, + { + "epoch": 0.67, + "learning_rate": 6.681682264766417e-08, + "loss": 0.0006, + "step": 34346 + }, + { + "epoch": 0.67, + "learning_rate": 6.681293930332803e-08, + "loss": 0.0006, + "step": 34347 + }, + { + "epoch": 0.67, + "learning_rate": 6.680905595899188e-08, + "loss": 0.0005, + "step": 34348 + }, + { + "epoch": 0.67, + "learning_rate": 6.680517261465574e-08, + "loss": 0.0004, + "step": 34349 + }, + { + "epoch": 0.67, + "learning_rate": 6.68012892703196e-08, + "loss": 0.0004, + "step": 34350 + }, + { + "epoch": 0.67, + "learning_rate": 6.679740592598346e-08, + "loss": 0.0003, + "step": 34351 + }, + { + "epoch": 0.67, + "learning_rate": 6.679352258164732e-08, + "loss": 0.0004, + "step": 34352 + }, + { + "epoch": 0.67, + "learning_rate": 6.678963923731117e-08, + "loss": 0.0005, + "step": 34353 + }, + { + "epoch": 0.67, + "learning_rate": 6.678575589297503e-08, + "loss": 0.001, + "step": 34354 + }, + { + "epoch": 0.67, + "learning_rate": 6.678187254863889e-08, + "loss": 0.001, + "step": 34355 + }, + { + "epoch": 0.67, + "learning_rate": 6.677798920430274e-08, + "loss": 0.0007, + "step": 34356 + }, + { + "epoch": 0.67, + "learning_rate": 6.67741058599666e-08, + "loss": 0.0005, + "step": 34357 + }, + { + "epoch": 0.67, + "learning_rate": 6.677022251563045e-08, + "loss": 0.0017, + "step": 34358 + }, + { + "epoch": 0.67, + "learning_rate": 6.676633917129431e-08, + "loss": 0.0005, + "step": 34359 + }, + { + "epoch": 0.67, + "learning_rate": 6.676245582695817e-08, + "loss": 0.0004, + "step": 34360 + }, + { + "epoch": 0.67, + "learning_rate": 6.675857248262203e-08, + "loss": 0.0009, + "step": 34361 + }, + { + "epoch": 0.67, + "learning_rate": 6.675468913828589e-08, + "loss": 0.0004, + "step": 34362 + }, + { + "epoch": 0.67, + "learning_rate": 6.675080579394974e-08, + "loss": 0.0005, + "step": 34363 + }, + { + "epoch": 0.67, + "learning_rate": 6.67469224496136e-08, + "loss": 0.0005, + "step": 34364 + }, + { + "epoch": 0.67, + "learning_rate": 6.674303910527746e-08, + "loss": 0.0004, + "step": 34365 + }, + { + "epoch": 0.67, + "learning_rate": 6.673915576094132e-08, + "loss": 0.0009, + "step": 34366 + }, + { + "epoch": 0.67, + "learning_rate": 6.673527241660518e-08, + "loss": 0.0004, + "step": 34367 + }, + { + "epoch": 0.67, + "learning_rate": 6.673138907226904e-08, + "loss": 0.0004, + "step": 34368 + }, + { + "epoch": 0.67, + "learning_rate": 6.672750572793289e-08, + "loss": 0.0006, + "step": 34369 + }, + { + "epoch": 0.67, + "learning_rate": 6.672362238359675e-08, + "loss": 0.0046, + "step": 34370 + }, + { + "epoch": 0.67, + "learning_rate": 6.67197390392606e-08, + "loss": 0.0057, + "step": 34371 + }, + { + "epoch": 0.67, + "learning_rate": 6.671585569492445e-08, + "loss": 0.0005, + "step": 34372 + }, + { + "epoch": 0.67, + "learning_rate": 6.671197235058831e-08, + "loss": 0.0005, + "step": 34373 + }, + { + "epoch": 0.67, + "learning_rate": 6.670808900625217e-08, + "loss": 0.9866, + "step": 34374 + }, + { + "epoch": 0.67, + "learning_rate": 6.670420566191603e-08, + "loss": 0.0004, + "step": 34375 + }, + { + "epoch": 0.67, + "learning_rate": 6.670032231757989e-08, + "loss": 0.0003, + "step": 34376 + }, + { + "epoch": 0.67, + "learning_rate": 6.669643897324375e-08, + "loss": 0.0005, + "step": 34377 + }, + { + "epoch": 0.67, + "learning_rate": 6.66925556289076e-08, + "loss": 0.0004, + "step": 34378 + }, + { + "epoch": 0.67, + "learning_rate": 6.668867228457146e-08, + "loss": 0.0005, + "step": 34379 + }, + { + "epoch": 0.67, + "learning_rate": 6.668478894023532e-08, + "loss": 0.0006, + "step": 34380 + }, + { + "epoch": 0.67, + "learning_rate": 6.668090559589918e-08, + "loss": 0.0004, + "step": 34381 + }, + { + "epoch": 0.67, + "learning_rate": 6.667702225156304e-08, + "loss": 0.0005, + "step": 34382 + }, + { + "epoch": 0.67, + "learning_rate": 6.66731389072269e-08, + "loss": 0.0004, + "step": 34383 + }, + { + "epoch": 0.67, + "learning_rate": 6.666925556289075e-08, + "loss": 0.0004, + "step": 34384 + }, + { + "epoch": 0.67, + "learning_rate": 6.666537221855461e-08, + "loss": 0.0005, + "step": 34385 + }, + { + "epoch": 0.67, + "learning_rate": 6.666148887421847e-08, + "loss": 0.5653, + "step": 34386 + }, + { + "epoch": 0.67, + "learning_rate": 6.665760552988233e-08, + "loss": 0.0005, + "step": 34387 + }, + { + "epoch": 0.67, + "learning_rate": 6.665372218554619e-08, + "loss": 0.0003, + "step": 34388 + }, + { + "epoch": 0.67, + "learning_rate": 6.664983884121004e-08, + "loss": 0.0004, + "step": 34389 + }, + { + "epoch": 0.67, + "learning_rate": 6.66459554968739e-08, + "loss": 0.0034, + "step": 34390 + }, + { + "epoch": 0.67, + "learning_rate": 6.664207215253776e-08, + "loss": 0.0006, + "step": 34391 + }, + { + "epoch": 0.67, + "learning_rate": 6.663818880820162e-08, + "loss": 0.0006, + "step": 34392 + }, + { + "epoch": 0.67, + "learning_rate": 6.663430546386548e-08, + "loss": 0.0016, + "step": 34393 + }, + { + "epoch": 0.67, + "learning_rate": 6.663042211952934e-08, + "loss": 0.0005, + "step": 34394 + }, + { + "epoch": 0.67, + "learning_rate": 6.66265387751932e-08, + "loss": 0.0005, + "step": 34395 + }, + { + "epoch": 0.67, + "learning_rate": 6.662265543085705e-08, + "loss": 0.7242, + "step": 34396 + }, + { + "epoch": 0.67, + "learning_rate": 6.661877208652091e-08, + "loss": 0.0008, + "step": 34397 + }, + { + "epoch": 0.67, + "learning_rate": 6.661488874218477e-08, + "loss": 0.0003, + "step": 34398 + }, + { + "epoch": 0.67, + "learning_rate": 6.661100539784863e-08, + "loss": 0.0005, + "step": 34399 + }, + { + "epoch": 0.67, + "learning_rate": 6.660712205351247e-08, + "loss": 0.0004, + "step": 34400 + }, + { + "epoch": 0.67, + "learning_rate": 6.660323870917633e-08, + "loss": 0.0004, + "step": 34401 + }, + { + "epoch": 0.67, + "learning_rate": 6.659935536484019e-08, + "loss": 0.0004, + "step": 34402 + }, + { + "epoch": 0.67, + "learning_rate": 6.659547202050405e-08, + "loss": 0.0004, + "step": 34403 + }, + { + "epoch": 0.67, + "learning_rate": 6.65915886761679e-08, + "loss": 0.0004, + "step": 34404 + }, + { + "epoch": 0.67, + "learning_rate": 6.658770533183176e-08, + "loss": 0.0008, + "step": 34405 + }, + { + "epoch": 0.67, + "learning_rate": 6.658382198749562e-08, + "loss": 0.0004, + "step": 34406 + }, + { + "epoch": 0.67, + "learning_rate": 6.657993864315948e-08, + "loss": 0.0004, + "step": 34407 + }, + { + "epoch": 0.67, + "learning_rate": 6.657605529882334e-08, + "loss": 0.0005, + "step": 34408 + }, + { + "epoch": 0.67, + "learning_rate": 6.65721719544872e-08, + "loss": 0.0004, + "step": 34409 + }, + { + "epoch": 0.67, + "learning_rate": 6.656828861015105e-08, + "loss": 0.0007, + "step": 34410 + }, + { + "epoch": 0.67, + "learning_rate": 6.656440526581491e-08, + "loss": 0.0017, + "step": 34411 + }, + { + "epoch": 0.67, + "learning_rate": 6.656052192147877e-08, + "loss": 0.0005, + "step": 34412 + }, + { + "epoch": 0.67, + "learning_rate": 6.655663857714263e-08, + "loss": 0.0004, + "step": 34413 + }, + { + "epoch": 0.67, + "learning_rate": 6.655275523280649e-08, + "loss": 0.0009, + "step": 34414 + }, + { + "epoch": 0.67, + "learning_rate": 6.654887188847035e-08, + "loss": 0.0006, + "step": 34415 + }, + { + "epoch": 0.67, + "learning_rate": 6.65449885441342e-08, + "loss": 0.0004, + "step": 34416 + }, + { + "epoch": 0.67, + "learning_rate": 6.654110519979806e-08, + "loss": 0.0007, + "step": 34417 + }, + { + "epoch": 0.67, + "learning_rate": 6.653722185546192e-08, + "loss": 0.0004, + "step": 34418 + }, + { + "epoch": 0.67, + "learning_rate": 6.653333851112578e-08, + "loss": 0.0004, + "step": 34419 + }, + { + "epoch": 0.67, + "learning_rate": 6.652945516678964e-08, + "loss": 0.0004, + "step": 34420 + }, + { + "epoch": 0.67, + "learning_rate": 6.65255718224535e-08, + "loss": 0.0004, + "step": 34421 + }, + { + "epoch": 0.67, + "learning_rate": 6.652168847811735e-08, + "loss": 0.1546, + "step": 34422 + }, + { + "epoch": 0.67, + "learning_rate": 6.651780513378121e-08, + "loss": 0.0004, + "step": 34423 + }, + { + "epoch": 0.67, + "learning_rate": 6.651392178944507e-08, + "loss": 0.001, + "step": 34424 + }, + { + "epoch": 0.67, + "learning_rate": 6.651003844510893e-08, + "loss": 0.0003, + "step": 34425 + }, + { + "epoch": 0.67, + "learning_rate": 6.650615510077279e-08, + "loss": 1.0476, + "step": 34426 + }, + { + "epoch": 0.67, + "learning_rate": 6.650227175643665e-08, + "loss": 0.0003, + "step": 34427 + }, + { + "epoch": 0.67, + "learning_rate": 6.64983884121005e-08, + "loss": 0.0005, + "step": 34428 + }, + { + "epoch": 0.67, + "learning_rate": 6.649450506776435e-08, + "loss": 0.5803, + "step": 34429 + }, + { + "epoch": 0.67, + "learning_rate": 6.64906217234282e-08, + "loss": 0.0003, + "step": 34430 + }, + { + "epoch": 0.67, + "learning_rate": 6.648673837909206e-08, + "loss": 0.0006, + "step": 34431 + }, + { + "epoch": 0.67, + "learning_rate": 6.648285503475592e-08, + "loss": 0.0003, + "step": 34432 + }, + { + "epoch": 0.67, + "learning_rate": 6.647897169041978e-08, + "loss": 0.0005, + "step": 34433 + }, + { + "epoch": 0.67, + "learning_rate": 6.647508834608364e-08, + "loss": 0.0034, + "step": 34434 + }, + { + "epoch": 0.67, + "learning_rate": 6.64712050017475e-08, + "loss": 0.0005, + "step": 34435 + }, + { + "epoch": 0.67, + "learning_rate": 6.646732165741136e-08, + "loss": 0.5288, + "step": 34436 + }, + { + "epoch": 0.67, + "learning_rate": 6.646343831307521e-08, + "loss": 0.4281, + "step": 34437 + }, + { + "epoch": 0.67, + "learning_rate": 6.645955496873907e-08, + "loss": 0.0005, + "step": 34438 + }, + { + "epoch": 0.67, + "learning_rate": 6.645567162440293e-08, + "loss": 0.0003, + "step": 34439 + }, + { + "epoch": 0.67, + "learning_rate": 6.645178828006679e-08, + "loss": 0.0007, + "step": 34440 + }, + { + "epoch": 0.67, + "learning_rate": 6.644790493573065e-08, + "loss": 0.0005, + "step": 34441 + }, + { + "epoch": 0.67, + "learning_rate": 6.64440215913945e-08, + "loss": 0.0867, + "step": 34442 + }, + { + "epoch": 0.67, + "learning_rate": 6.644013824705836e-08, + "loss": 0.0005, + "step": 34443 + }, + { + "epoch": 0.67, + "learning_rate": 6.643625490272222e-08, + "loss": 0.0006, + "step": 34444 + }, + { + "epoch": 0.67, + "learning_rate": 6.643237155838608e-08, + "loss": 0.0004, + "step": 34445 + }, + { + "epoch": 0.67, + "learning_rate": 6.642848821404994e-08, + "loss": 0.0004, + "step": 34446 + }, + { + "epoch": 0.67, + "learning_rate": 6.64246048697138e-08, + "loss": 0.0004, + "step": 34447 + }, + { + "epoch": 0.67, + "learning_rate": 6.642072152537765e-08, + "loss": 0.0005, + "step": 34448 + }, + { + "epoch": 0.67, + "learning_rate": 6.641683818104151e-08, + "loss": 0.0006, + "step": 34449 + }, + { + "epoch": 0.67, + "learning_rate": 6.641295483670537e-08, + "loss": 0.0004, + "step": 34450 + }, + { + "epoch": 0.67, + "learning_rate": 6.640907149236923e-08, + "loss": 1.0958, + "step": 34451 + }, + { + "epoch": 0.67, + "learning_rate": 6.640518814803309e-08, + "loss": 0.0006, + "step": 34452 + }, + { + "epoch": 0.67, + "learning_rate": 6.640130480369695e-08, + "loss": 0.0004, + "step": 34453 + }, + { + "epoch": 0.67, + "learning_rate": 6.63974214593608e-08, + "loss": 0.0004, + "step": 34454 + }, + { + "epoch": 0.67, + "learning_rate": 6.639353811502466e-08, + "loss": 0.0007, + "step": 34455 + }, + { + "epoch": 0.67, + "learning_rate": 6.638965477068852e-08, + "loss": 0.0005, + "step": 34456 + }, + { + "epoch": 0.67, + "learning_rate": 6.638577142635238e-08, + "loss": 0.0005, + "step": 34457 + }, + { + "epoch": 0.67, + "learning_rate": 6.638188808201622e-08, + "loss": 0.0202, + "step": 34458 + }, + { + "epoch": 0.67, + "learning_rate": 6.637800473768008e-08, + "loss": 0.0005, + "step": 34459 + }, + { + "epoch": 0.67, + "learning_rate": 6.637412139334394e-08, + "loss": 0.1845, + "step": 34460 + }, + { + "epoch": 0.67, + "learning_rate": 6.63702380490078e-08, + "loss": 0.0023, + "step": 34461 + }, + { + "epoch": 0.67, + "learning_rate": 6.636635470467166e-08, + "loss": 0.0007, + "step": 34462 + }, + { + "epoch": 0.67, + "learning_rate": 6.636247136033552e-08, + "loss": 0.001, + "step": 34463 + }, + { + "epoch": 0.67, + "learning_rate": 6.635858801599937e-08, + "loss": 0.0007, + "step": 34464 + }, + { + "epoch": 0.67, + "learning_rate": 6.635470467166323e-08, + "loss": 0.0002, + "step": 34465 + }, + { + "epoch": 0.67, + "learning_rate": 6.635082132732709e-08, + "loss": 0.0005, + "step": 34466 + }, + { + "epoch": 0.67, + "learning_rate": 6.634693798299095e-08, + "loss": 0.0004, + "step": 34467 + }, + { + "epoch": 0.67, + "learning_rate": 6.63430546386548e-08, + "loss": 0.0005, + "step": 34468 + }, + { + "epoch": 0.67, + "learning_rate": 6.633917129431866e-08, + "loss": 0.0004, + "step": 34469 + }, + { + "epoch": 0.67, + "learning_rate": 6.633528794998252e-08, + "loss": 0.0005, + "step": 34470 + }, + { + "epoch": 0.67, + "learning_rate": 6.633140460564638e-08, + "loss": 0.0005, + "step": 34471 + }, + { + "epoch": 0.67, + "learning_rate": 6.632752126131024e-08, + "loss": 0.0007, + "step": 34472 + }, + { + "epoch": 0.67, + "learning_rate": 6.63236379169741e-08, + "loss": 0.0108, + "step": 34473 + }, + { + "epoch": 0.67, + "learning_rate": 6.631975457263796e-08, + "loss": 0.0045, + "step": 34474 + }, + { + "epoch": 0.67, + "learning_rate": 6.631587122830181e-08, + "loss": 0.0007, + "step": 34475 + }, + { + "epoch": 0.67, + "learning_rate": 6.631198788396567e-08, + "loss": 0.0004, + "step": 34476 + }, + { + "epoch": 0.67, + "learning_rate": 6.630810453962953e-08, + "loss": 0.0003, + "step": 34477 + }, + { + "epoch": 0.67, + "learning_rate": 6.630422119529339e-08, + "loss": 0.0006, + "step": 34478 + }, + { + "epoch": 0.67, + "learning_rate": 6.630033785095725e-08, + "loss": 0.0004, + "step": 34479 + }, + { + "epoch": 0.67, + "learning_rate": 6.62964545066211e-08, + "loss": 0.0007, + "step": 34480 + }, + { + "epoch": 0.67, + "learning_rate": 6.629257116228496e-08, + "loss": 0.0005, + "step": 34481 + }, + { + "epoch": 0.67, + "learning_rate": 6.628868781794882e-08, + "loss": 0.0006, + "step": 34482 + }, + { + "epoch": 0.67, + "learning_rate": 6.628480447361268e-08, + "loss": 0.0005, + "step": 34483 + }, + { + "epoch": 0.67, + "learning_rate": 6.628092112927654e-08, + "loss": 0.0005, + "step": 34484 + }, + { + "epoch": 0.67, + "learning_rate": 6.62770377849404e-08, + "loss": 0.0005, + "step": 34485 + }, + { + "epoch": 0.67, + "learning_rate": 6.627315444060425e-08, + "loss": 0.0004, + "step": 34486 + }, + { + "epoch": 0.67, + "learning_rate": 6.62692710962681e-08, + "loss": 0.0003, + "step": 34487 + }, + { + "epoch": 0.67, + "learning_rate": 6.626538775193196e-08, + "loss": 0.6057, + "step": 34488 + }, + { + "epoch": 0.67, + "learning_rate": 6.626150440759582e-08, + "loss": 0.0007, + "step": 34489 + }, + { + "epoch": 0.67, + "learning_rate": 6.625762106325967e-08, + "loss": 0.0005, + "step": 34490 + }, + { + "epoch": 0.67, + "learning_rate": 6.625373771892353e-08, + "loss": 0.0006, + "step": 34491 + }, + { + "epoch": 0.67, + "learning_rate": 6.624985437458739e-08, + "loss": 0.92, + "step": 34492 + }, + { + "epoch": 0.67, + "learning_rate": 6.624597103025125e-08, + "loss": 0.0005, + "step": 34493 + }, + { + "epoch": 0.67, + "learning_rate": 6.624208768591511e-08, + "loss": 0.0004, + "step": 34494 + }, + { + "epoch": 0.67, + "learning_rate": 6.623820434157897e-08, + "loss": 0.0005, + "step": 34495 + }, + { + "epoch": 0.67, + "learning_rate": 6.623432099724282e-08, + "loss": 0.0004, + "step": 34496 + }, + { + "epoch": 0.67, + "learning_rate": 6.623043765290668e-08, + "loss": 0.0025, + "step": 34497 + }, + { + "epoch": 0.67, + "learning_rate": 6.622655430857054e-08, + "loss": 0.0005, + "step": 34498 + }, + { + "epoch": 0.67, + "learning_rate": 6.62226709642344e-08, + "loss": 0.0004, + "step": 34499 + }, + { + "epoch": 0.67, + "learning_rate": 6.621878761989826e-08, + "loss": 0.0004, + "step": 34500 + }, + { + "epoch": 0.67, + "learning_rate": 6.621490427556212e-08, + "loss": 0.0003, + "step": 34501 + }, + { + "epoch": 0.67, + "learning_rate": 6.621102093122597e-08, + "loss": 0.0004, + "step": 34502 + }, + { + "epoch": 0.67, + "learning_rate": 6.620713758688983e-08, + "loss": 0.0004, + "step": 34503 + }, + { + "epoch": 0.67, + "learning_rate": 6.620325424255369e-08, + "loss": 0.0009, + "step": 34504 + }, + { + "epoch": 0.67, + "learning_rate": 6.619937089821755e-08, + "loss": 0.2097, + "step": 34505 + }, + { + "epoch": 0.67, + "learning_rate": 6.61954875538814e-08, + "loss": 0.0003, + "step": 34506 + }, + { + "epoch": 0.67, + "learning_rate": 6.619160420954526e-08, + "loss": 0.0005, + "step": 34507 + }, + { + "epoch": 0.67, + "learning_rate": 6.618772086520912e-08, + "loss": 0.0007, + "step": 34508 + }, + { + "epoch": 0.67, + "learning_rate": 6.618383752087298e-08, + "loss": 0.0004, + "step": 34509 + }, + { + "epoch": 0.67, + "learning_rate": 6.617995417653684e-08, + "loss": 0.0025, + "step": 34510 + }, + { + "epoch": 0.67, + "learning_rate": 6.61760708322007e-08, + "loss": 0.0003, + "step": 34511 + }, + { + "epoch": 0.67, + "learning_rate": 6.617218748786456e-08, + "loss": 0.0006, + "step": 34512 + }, + { + "epoch": 0.67, + "learning_rate": 6.616830414352841e-08, + "loss": 0.0905, + "step": 34513 + }, + { + "epoch": 0.67, + "learning_rate": 6.616442079919227e-08, + "loss": 0.0006, + "step": 34514 + }, + { + "epoch": 0.67, + "learning_rate": 6.616053745485613e-08, + "loss": 0.0003, + "step": 34515 + }, + { + "epoch": 0.67, + "learning_rate": 6.615665411051998e-08, + "loss": 0.0004, + "step": 34516 + }, + { + "epoch": 0.67, + "learning_rate": 6.615277076618383e-08, + "loss": 0.0005, + "step": 34517 + }, + { + "epoch": 0.67, + "learning_rate": 6.614888742184769e-08, + "loss": 0.0009, + "step": 34518 + }, + { + "epoch": 0.67, + "learning_rate": 6.614500407751155e-08, + "loss": 0.0004, + "step": 34519 + }, + { + "epoch": 0.67, + "learning_rate": 6.614112073317541e-08, + "loss": 0.0012, + "step": 34520 + }, + { + "epoch": 0.67, + "learning_rate": 6.613723738883927e-08, + "loss": 0.4527, + "step": 34521 + }, + { + "epoch": 0.67, + "learning_rate": 6.613335404450313e-08, + "loss": 0.038, + "step": 34522 + }, + { + "epoch": 0.67, + "learning_rate": 6.612947070016698e-08, + "loss": 0.0006, + "step": 34523 + }, + { + "epoch": 0.67, + "learning_rate": 6.612558735583084e-08, + "loss": 0.0003, + "step": 34524 + }, + { + "epoch": 0.67, + "learning_rate": 6.61217040114947e-08, + "loss": 0.0006, + "step": 34525 + }, + { + "epoch": 0.67, + "learning_rate": 6.611782066715856e-08, + "loss": 0.0005, + "step": 34526 + }, + { + "epoch": 0.67, + "learning_rate": 6.611393732282242e-08, + "loss": 0.001, + "step": 34527 + }, + { + "epoch": 0.67, + "learning_rate": 6.611005397848627e-08, + "loss": 0.0004, + "step": 34528 + }, + { + "epoch": 0.67, + "learning_rate": 6.610617063415013e-08, + "loss": 0.0004, + "step": 34529 + }, + { + "epoch": 0.67, + "learning_rate": 6.610228728981399e-08, + "loss": 0.0004, + "step": 34530 + }, + { + "epoch": 0.67, + "learning_rate": 6.609840394547785e-08, + "loss": 0.0004, + "step": 34531 + }, + { + "epoch": 0.67, + "learning_rate": 6.609452060114171e-08, + "loss": 0.0009, + "step": 34532 + }, + { + "epoch": 0.67, + "learning_rate": 6.609063725680555e-08, + "loss": 0.7448, + "step": 34533 + }, + { + "epoch": 0.67, + "learning_rate": 6.608675391246941e-08, + "loss": 0.0006, + "step": 34534 + }, + { + "epoch": 0.67, + "learning_rate": 6.608287056813327e-08, + "loss": 0.0004, + "step": 34535 + }, + { + "epoch": 0.67, + "learning_rate": 6.607898722379713e-08, + "loss": 0.0004, + "step": 34536 + }, + { + "epoch": 0.67, + "learning_rate": 6.607510387946099e-08, + "loss": 0.5461, + "step": 34537 + }, + { + "epoch": 0.67, + "learning_rate": 6.607122053512484e-08, + "loss": 0.0005, + "step": 34538 + }, + { + "epoch": 0.67, + "learning_rate": 6.60673371907887e-08, + "loss": 0.0043, + "step": 34539 + }, + { + "epoch": 0.67, + "learning_rate": 6.606345384645256e-08, + "loss": 0.0005, + "step": 34540 + }, + { + "epoch": 0.67, + "learning_rate": 6.605957050211642e-08, + "loss": 0.0006, + "step": 34541 + }, + { + "epoch": 0.67, + "learning_rate": 6.605568715778028e-08, + "loss": 0.0004, + "step": 34542 + }, + { + "epoch": 0.67, + "learning_rate": 6.605180381344414e-08, + "loss": 0.0003, + "step": 34543 + }, + { + "epoch": 0.67, + "learning_rate": 6.6047920469108e-08, + "loss": 0.0004, + "step": 34544 + }, + { + "epoch": 0.67, + "learning_rate": 6.604403712477185e-08, + "loss": 0.0003, + "step": 34545 + }, + { + "epoch": 0.67, + "learning_rate": 6.604015378043571e-08, + "loss": 0.0006, + "step": 34546 + }, + { + "epoch": 0.67, + "learning_rate": 6.603627043609955e-08, + "loss": 0.0003, + "step": 34547 + }, + { + "epoch": 0.67, + "learning_rate": 6.603238709176341e-08, + "loss": 0.0118, + "step": 34548 + }, + { + "epoch": 0.67, + "learning_rate": 6.602850374742727e-08, + "loss": 0.0005, + "step": 34549 + }, + { + "epoch": 0.67, + "learning_rate": 6.602462040309113e-08, + "loss": 0.0004, + "step": 34550 + }, + { + "epoch": 0.67, + "learning_rate": 6.602073705875499e-08, + "loss": 0.0003, + "step": 34551 + }, + { + "epoch": 0.67, + "learning_rate": 6.601685371441885e-08, + "loss": 0.0003, + "step": 34552 + }, + { + "epoch": 0.67, + "learning_rate": 6.60129703700827e-08, + "loss": 0.0425, + "step": 34553 + }, + { + "epoch": 0.67, + "learning_rate": 6.600908702574656e-08, + "loss": 0.0007, + "step": 34554 + }, + { + "epoch": 0.67, + "learning_rate": 6.600520368141042e-08, + "loss": 0.0015, + "step": 34555 + }, + { + "epoch": 0.67, + "learning_rate": 6.600132033707428e-08, + "loss": 0.0004, + "step": 34556 + }, + { + "epoch": 0.67, + "learning_rate": 6.599743699273814e-08, + "loss": 0.0004, + "step": 34557 + }, + { + "epoch": 0.67, + "learning_rate": 6.5993553648402e-08, + "loss": 0.0003, + "step": 34558 + }, + { + "epoch": 0.67, + "learning_rate": 6.598967030406585e-08, + "loss": 0.0004, + "step": 34559 + }, + { + "epoch": 0.67, + "learning_rate": 6.598578695972971e-08, + "loss": 0.0004, + "step": 34560 + }, + { + "epoch": 0.67, + "learning_rate": 6.598190361539357e-08, + "loss": 0.0005, + "step": 34561 + }, + { + "epoch": 0.67, + "learning_rate": 6.597802027105743e-08, + "loss": 0.0027, + "step": 34562 + }, + { + "epoch": 0.67, + "learning_rate": 6.597413692672129e-08, + "loss": 0.0005, + "step": 34563 + }, + { + "epoch": 0.67, + "learning_rate": 6.597025358238515e-08, + "loss": 0.0004, + "step": 34564 + }, + { + "epoch": 0.67, + "learning_rate": 6.5966370238049e-08, + "loss": 0.0007, + "step": 34565 + }, + { + "epoch": 0.67, + "learning_rate": 6.596248689371286e-08, + "loss": 0.0006, + "step": 34566 + }, + { + "epoch": 0.67, + "learning_rate": 6.595860354937672e-08, + "loss": 0.2194, + "step": 34567 + }, + { + "epoch": 0.67, + "learning_rate": 6.595472020504058e-08, + "loss": 0.0006, + "step": 34568 + }, + { + "epoch": 0.67, + "learning_rate": 6.595083686070444e-08, + "loss": 0.6194, + "step": 34569 + }, + { + "epoch": 0.67, + "learning_rate": 6.59469535163683e-08, + "loss": 0.0005, + "step": 34570 + }, + { + "epoch": 0.67, + "learning_rate": 6.594307017203215e-08, + "loss": 0.0006, + "step": 34571 + }, + { + "epoch": 0.67, + "learning_rate": 6.593918682769601e-08, + "loss": 0.0004, + "step": 34572 + }, + { + "epoch": 0.67, + "learning_rate": 6.593530348335987e-08, + "loss": 0.0004, + "step": 34573 + }, + { + "epoch": 0.67, + "learning_rate": 6.593142013902371e-08, + "loss": 0.0004, + "step": 34574 + }, + { + "epoch": 0.67, + "learning_rate": 6.592753679468757e-08, + "loss": 0.0005, + "step": 34575 + }, + { + "epoch": 0.67, + "learning_rate": 6.592365345035143e-08, + "loss": 0.0005, + "step": 34576 + }, + { + "epoch": 0.67, + "learning_rate": 6.591977010601529e-08, + "loss": 0.0006, + "step": 34577 + }, + { + "epoch": 0.67, + "learning_rate": 6.591588676167915e-08, + "loss": 0.0485, + "step": 34578 + }, + { + "epoch": 0.67, + "learning_rate": 6.5912003417343e-08, + "loss": 0.0004, + "step": 34579 + }, + { + "epoch": 0.67, + "learning_rate": 6.590812007300686e-08, + "loss": 0.0004, + "step": 34580 + }, + { + "epoch": 0.67, + "learning_rate": 6.590423672867072e-08, + "loss": 0.0003, + "step": 34581 + }, + { + "epoch": 0.67, + "learning_rate": 6.590035338433458e-08, + "loss": 0.0005, + "step": 34582 + }, + { + "epoch": 0.67, + "learning_rate": 6.589647003999844e-08, + "loss": 0.0003, + "step": 34583 + }, + { + "epoch": 0.67, + "learning_rate": 6.58925866956623e-08, + "loss": 0.0004, + "step": 34584 + }, + { + "epoch": 0.67, + "learning_rate": 6.588870335132615e-08, + "loss": 0.0004, + "step": 34585 + }, + { + "epoch": 0.67, + "learning_rate": 6.588482000699001e-08, + "loss": 0.69, + "step": 34586 + }, + { + "epoch": 0.67, + "learning_rate": 6.588093666265387e-08, + "loss": 0.0008, + "step": 34587 + }, + { + "epoch": 0.67, + "learning_rate": 6.587705331831773e-08, + "loss": 0.9682, + "step": 34588 + }, + { + "epoch": 0.67, + "learning_rate": 6.587316997398159e-08, + "loss": 0.0006, + "step": 34589 + }, + { + "epoch": 0.67, + "learning_rate": 6.586928662964545e-08, + "loss": 0.0005, + "step": 34590 + }, + { + "epoch": 0.67, + "learning_rate": 6.58654032853093e-08, + "loss": 0.0004, + "step": 34591 + }, + { + "epoch": 0.67, + "learning_rate": 6.586151994097316e-08, + "loss": 0.4271, + "step": 34592 + }, + { + "epoch": 0.67, + "learning_rate": 6.585763659663702e-08, + "loss": 0.0005, + "step": 34593 + }, + { + "epoch": 0.67, + "learning_rate": 6.585375325230088e-08, + "loss": 0.0005, + "step": 34594 + }, + { + "epoch": 0.67, + "learning_rate": 6.584986990796474e-08, + "loss": 0.4001, + "step": 34595 + }, + { + "epoch": 0.67, + "learning_rate": 6.58459865636286e-08, + "loss": 0.0003, + "step": 34596 + }, + { + "epoch": 0.67, + "learning_rate": 6.584210321929245e-08, + "loss": 0.0003, + "step": 34597 + }, + { + "epoch": 0.67, + "learning_rate": 6.583821987495631e-08, + "loss": 0.0006, + "step": 34598 + }, + { + "epoch": 0.67, + "learning_rate": 6.583433653062017e-08, + "loss": 0.0006, + "step": 34599 + }, + { + "epoch": 0.67, + "learning_rate": 6.583045318628403e-08, + "loss": 0.008, + "step": 34600 + }, + { + "epoch": 0.67, + "learning_rate": 6.582656984194789e-08, + "loss": 0.5447, + "step": 34601 + }, + { + "epoch": 0.67, + "learning_rate": 6.582268649761175e-08, + "loss": 0.1141, + "step": 34602 + }, + { + "epoch": 0.67, + "learning_rate": 6.581880315327559e-08, + "loss": 0.0003, + "step": 34603 + }, + { + "epoch": 0.67, + "learning_rate": 6.581491980893945e-08, + "loss": 0.0004, + "step": 34604 + }, + { + "epoch": 0.67, + "learning_rate": 6.581103646460331e-08, + "loss": 0.0004, + "step": 34605 + }, + { + "epoch": 0.67, + "learning_rate": 6.580715312026716e-08, + "loss": 0.0005, + "step": 34606 + }, + { + "epoch": 0.67, + "learning_rate": 6.580326977593102e-08, + "loss": 0.0006, + "step": 34607 + }, + { + "epoch": 0.67, + "learning_rate": 6.579938643159488e-08, + "loss": 1.0979, + "step": 34608 + }, + { + "epoch": 0.67, + "learning_rate": 6.579550308725874e-08, + "loss": 0.0004, + "step": 34609 + }, + { + "epoch": 0.67, + "learning_rate": 6.57916197429226e-08, + "loss": 0.0004, + "step": 34610 + }, + { + "epoch": 0.67, + "learning_rate": 6.578773639858646e-08, + "loss": 0.0003, + "step": 34611 + }, + { + "epoch": 0.67, + "learning_rate": 6.578385305425031e-08, + "loss": 0.0004, + "step": 34612 + }, + { + "epoch": 0.67, + "learning_rate": 6.577996970991417e-08, + "loss": 1.2849, + "step": 34613 + }, + { + "epoch": 0.67, + "learning_rate": 6.577608636557803e-08, + "loss": 0.0005, + "step": 34614 + }, + { + "epoch": 0.67, + "learning_rate": 6.577220302124189e-08, + "loss": 0.0004, + "step": 34615 + }, + { + "epoch": 0.67, + "learning_rate": 6.576831967690575e-08, + "loss": 0.0004, + "step": 34616 + }, + { + "epoch": 0.67, + "learning_rate": 6.57644363325696e-08, + "loss": 0.0005, + "step": 34617 + }, + { + "epoch": 0.67, + "learning_rate": 6.576055298823346e-08, + "loss": 0.0004, + "step": 34618 + }, + { + "epoch": 0.67, + "learning_rate": 6.575666964389732e-08, + "loss": 0.0005, + "step": 34619 + }, + { + "epoch": 0.67, + "learning_rate": 6.575278629956118e-08, + "loss": 0.1453, + "step": 34620 + }, + { + "epoch": 0.67, + "learning_rate": 6.574890295522504e-08, + "loss": 0.0005, + "step": 34621 + }, + { + "epoch": 0.67, + "learning_rate": 6.57450196108889e-08, + "loss": 0.0005, + "step": 34622 + }, + { + "epoch": 0.67, + "learning_rate": 6.574113626655276e-08, + "loss": 0.0004, + "step": 34623 + }, + { + "epoch": 0.67, + "learning_rate": 6.573725292221661e-08, + "loss": 0.0024, + "step": 34624 + }, + { + "epoch": 0.67, + "learning_rate": 6.573336957788047e-08, + "loss": 0.0003, + "step": 34625 + }, + { + "epoch": 0.67, + "learning_rate": 6.572948623354433e-08, + "loss": 0.0013, + "step": 34626 + }, + { + "epoch": 0.67, + "learning_rate": 6.572560288920819e-08, + "loss": 0.0004, + "step": 34627 + }, + { + "epoch": 0.67, + "learning_rate": 6.572171954487205e-08, + "loss": 0.0007, + "step": 34628 + }, + { + "epoch": 0.67, + "learning_rate": 6.57178362005359e-08, + "loss": 0.0027, + "step": 34629 + }, + { + "epoch": 0.67, + "learning_rate": 6.571395285619976e-08, + "loss": 0.0004, + "step": 34630 + }, + { + "epoch": 0.67, + "learning_rate": 6.571006951186362e-08, + "loss": 0.0004, + "step": 34631 + }, + { + "epoch": 0.67, + "learning_rate": 6.570618616752747e-08, + "loss": 0.0006, + "step": 34632 + }, + { + "epoch": 0.67, + "learning_rate": 6.570230282319132e-08, + "loss": 0.0004, + "step": 34633 + }, + { + "epoch": 0.67, + "learning_rate": 6.569841947885518e-08, + "loss": 0.0004, + "step": 34634 + }, + { + "epoch": 0.67, + "learning_rate": 6.569453613451904e-08, + "loss": 0.0003, + "step": 34635 + }, + { + "epoch": 0.67, + "learning_rate": 6.56906527901829e-08, + "loss": 0.001, + "step": 34636 + }, + { + "epoch": 0.67, + "learning_rate": 6.568676944584676e-08, + "loss": 0.0007, + "step": 34637 + }, + { + "epoch": 0.67, + "learning_rate": 6.568288610151062e-08, + "loss": 0.0005, + "step": 34638 + }, + { + "epoch": 0.67, + "learning_rate": 6.567900275717447e-08, + "loss": 0.0086, + "step": 34639 + }, + { + "epoch": 0.67, + "learning_rate": 6.567511941283833e-08, + "loss": 0.0004, + "step": 34640 + }, + { + "epoch": 0.67, + "learning_rate": 6.567123606850219e-08, + "loss": 0.0014, + "step": 34641 + }, + { + "epoch": 0.67, + "learning_rate": 6.566735272416605e-08, + "loss": 0.2687, + "step": 34642 + }, + { + "epoch": 0.67, + "learning_rate": 6.566346937982991e-08, + "loss": 0.0017, + "step": 34643 + }, + { + "epoch": 0.67, + "learning_rate": 6.565958603549376e-08, + "loss": 0.0006, + "step": 34644 + }, + { + "epoch": 0.67, + "learning_rate": 6.565570269115762e-08, + "loss": 0.0004, + "step": 34645 + }, + { + "epoch": 0.67, + "learning_rate": 6.565181934682148e-08, + "loss": 0.4842, + "step": 34646 + }, + { + "epoch": 0.67, + "learning_rate": 6.564793600248534e-08, + "loss": 0.0007, + "step": 34647 + }, + { + "epoch": 0.67, + "learning_rate": 6.56440526581492e-08, + "loss": 0.0005, + "step": 34648 + }, + { + "epoch": 0.67, + "learning_rate": 6.564016931381306e-08, + "loss": 0.0006, + "step": 34649 + }, + { + "epoch": 0.67, + "learning_rate": 6.563628596947691e-08, + "loss": 0.0007, + "step": 34650 + }, + { + "epoch": 0.67, + "learning_rate": 6.563240262514077e-08, + "loss": 0.0004, + "step": 34651 + }, + { + "epoch": 0.67, + "learning_rate": 6.562851928080463e-08, + "loss": 0.0005, + "step": 34652 + }, + { + "epoch": 0.67, + "learning_rate": 6.562463593646849e-08, + "loss": 0.0005, + "step": 34653 + }, + { + "epoch": 0.67, + "learning_rate": 6.562075259213235e-08, + "loss": 0.0037, + "step": 34654 + }, + { + "epoch": 0.67, + "learning_rate": 6.56168692477962e-08, + "loss": 0.0004, + "step": 34655 + }, + { + "epoch": 0.67, + "learning_rate": 6.561298590346006e-08, + "loss": 0.0005, + "step": 34656 + }, + { + "epoch": 0.67, + "learning_rate": 6.560910255912392e-08, + "loss": 0.0007, + "step": 34657 + }, + { + "epoch": 0.67, + "learning_rate": 6.560521921478778e-08, + "loss": 0.8593, + "step": 34658 + }, + { + "epoch": 0.67, + "learning_rate": 6.560133587045164e-08, + "loss": 0.0008, + "step": 34659 + }, + { + "epoch": 0.67, + "learning_rate": 6.55974525261155e-08, + "loss": 0.0035, + "step": 34660 + }, + { + "epoch": 0.67, + "learning_rate": 6.559356918177934e-08, + "loss": 0.0003, + "step": 34661 + }, + { + "epoch": 0.67, + "learning_rate": 6.55896858374432e-08, + "loss": 0.0005, + "step": 34662 + }, + { + "epoch": 0.67, + "learning_rate": 6.558580249310706e-08, + "loss": 0.0006, + "step": 34663 + }, + { + "epoch": 0.67, + "learning_rate": 6.558191914877092e-08, + "loss": 0.5935, + "step": 34664 + }, + { + "epoch": 0.67, + "learning_rate": 6.557803580443477e-08, + "loss": 1.0958, + "step": 34665 + }, + { + "epoch": 0.67, + "learning_rate": 6.557415246009863e-08, + "loss": 1.3687, + "step": 34666 + }, + { + "epoch": 0.67, + "learning_rate": 6.557026911576249e-08, + "loss": 0.8462, + "step": 34667 + }, + { + "epoch": 0.67, + "learning_rate": 6.556638577142635e-08, + "loss": 0.0005, + "step": 34668 + }, + { + "epoch": 0.67, + "learning_rate": 6.556250242709021e-08, + "loss": 0.0004, + "step": 34669 + }, + { + "epoch": 0.67, + "learning_rate": 6.555861908275407e-08, + "loss": 0.0005, + "step": 34670 + }, + { + "epoch": 0.67, + "learning_rate": 6.555473573841792e-08, + "loss": 0.0004, + "step": 34671 + }, + { + "epoch": 0.67, + "learning_rate": 6.555085239408178e-08, + "loss": 0.0004, + "step": 34672 + }, + { + "epoch": 0.67, + "learning_rate": 6.554696904974564e-08, + "loss": 0.0004, + "step": 34673 + }, + { + "epoch": 0.67, + "learning_rate": 6.55430857054095e-08, + "loss": 0.0042, + "step": 34674 + }, + { + "epoch": 0.67, + "learning_rate": 6.553920236107336e-08, + "loss": 0.0004, + "step": 34675 + }, + { + "epoch": 0.67, + "learning_rate": 6.553531901673722e-08, + "loss": 0.0004, + "step": 34676 + }, + { + "epoch": 0.67, + "learning_rate": 6.553143567240107e-08, + "loss": 0.0009, + "step": 34677 + }, + { + "epoch": 0.67, + "learning_rate": 6.552755232806493e-08, + "loss": 0.0004, + "step": 34678 + }, + { + "epoch": 0.67, + "learning_rate": 6.552366898372879e-08, + "loss": 0.0011, + "step": 34679 + }, + { + "epoch": 0.67, + "learning_rate": 6.551978563939265e-08, + "loss": 0.0028, + "step": 34680 + }, + { + "epoch": 0.67, + "learning_rate": 6.551590229505651e-08, + "loss": 0.0004, + "step": 34681 + }, + { + "epoch": 0.67, + "learning_rate": 6.551201895072036e-08, + "loss": 0.0005, + "step": 34682 + }, + { + "epoch": 0.67, + "learning_rate": 6.550813560638422e-08, + "loss": 0.0008, + "step": 34683 + }, + { + "epoch": 0.67, + "learning_rate": 6.550425226204808e-08, + "loss": 0.0032, + "step": 34684 + }, + { + "epoch": 0.67, + "learning_rate": 6.550036891771194e-08, + "loss": 0.0007, + "step": 34685 + }, + { + "epoch": 0.67, + "learning_rate": 6.54964855733758e-08, + "loss": 0.0005, + "step": 34686 + }, + { + "epoch": 0.67, + "learning_rate": 6.549260222903966e-08, + "loss": 0.0005, + "step": 34687 + }, + { + "epoch": 0.67, + "learning_rate": 6.548871888470351e-08, + "loss": 0.0005, + "step": 34688 + }, + { + "epoch": 0.67, + "learning_rate": 6.548483554036737e-08, + "loss": 0.0005, + "step": 34689 + }, + { + "epoch": 0.67, + "learning_rate": 6.548095219603122e-08, + "loss": 0.0005, + "step": 34690 + }, + { + "epoch": 0.67, + "learning_rate": 6.547706885169508e-08, + "loss": 0.0006, + "step": 34691 + }, + { + "epoch": 0.67, + "learning_rate": 6.547318550735893e-08, + "loss": 0.0005, + "step": 34692 + }, + { + "epoch": 0.67, + "learning_rate": 6.546930216302279e-08, + "loss": 0.0006, + "step": 34693 + }, + { + "epoch": 0.67, + "learning_rate": 6.546541881868665e-08, + "loss": 0.6302, + "step": 34694 + }, + { + "epoch": 0.67, + "learning_rate": 6.546153547435051e-08, + "loss": 0.8449, + "step": 34695 + }, + { + "epoch": 0.67, + "learning_rate": 6.545765213001437e-08, + "loss": 0.0004, + "step": 34696 + }, + { + "epoch": 0.67, + "learning_rate": 6.545376878567823e-08, + "loss": 0.0004, + "step": 34697 + }, + { + "epoch": 0.67, + "learning_rate": 6.544988544134208e-08, + "loss": 0.0004, + "step": 34698 + }, + { + "epoch": 0.67, + "learning_rate": 6.544600209700594e-08, + "loss": 0.0003, + "step": 34699 + }, + { + "epoch": 0.67, + "learning_rate": 6.54421187526698e-08, + "loss": 0.8838, + "step": 34700 + }, + { + "epoch": 0.67, + "learning_rate": 6.543823540833366e-08, + "loss": 0.0005, + "step": 34701 + }, + { + "epoch": 0.67, + "learning_rate": 6.543435206399752e-08, + "loss": 0.0005, + "step": 34702 + }, + { + "epoch": 0.67, + "learning_rate": 6.543046871966137e-08, + "loss": 0.0006, + "step": 34703 + }, + { + "epoch": 0.67, + "learning_rate": 6.542658537532523e-08, + "loss": 0.0004, + "step": 34704 + }, + { + "epoch": 0.67, + "learning_rate": 6.542270203098909e-08, + "loss": 0.0024, + "step": 34705 + }, + { + "epoch": 0.67, + "learning_rate": 6.541881868665295e-08, + "loss": 0.0006, + "step": 34706 + }, + { + "epoch": 0.67, + "learning_rate": 6.541493534231681e-08, + "loss": 0.0005, + "step": 34707 + }, + { + "epoch": 0.67, + "learning_rate": 6.541105199798067e-08, + "loss": 0.0004, + "step": 34708 + }, + { + "epoch": 0.67, + "learning_rate": 6.540716865364452e-08, + "loss": 0.0006, + "step": 34709 + }, + { + "epoch": 0.67, + "learning_rate": 6.540328530930837e-08, + "loss": 0.0009, + "step": 34710 + }, + { + "epoch": 0.67, + "learning_rate": 6.539940196497223e-08, + "loss": 0.0005, + "step": 34711 + }, + { + "epoch": 0.67, + "learning_rate": 6.539551862063609e-08, + "loss": 0.0007, + "step": 34712 + }, + { + "epoch": 0.67, + "learning_rate": 6.539163527629994e-08, + "loss": 0.002, + "step": 34713 + }, + { + "epoch": 0.67, + "learning_rate": 6.53877519319638e-08, + "loss": 0.0007, + "step": 34714 + }, + { + "epoch": 0.67, + "learning_rate": 6.538386858762766e-08, + "loss": 0.0003, + "step": 34715 + }, + { + "epoch": 0.67, + "learning_rate": 6.537998524329152e-08, + "loss": 0.0006, + "step": 34716 + }, + { + "epoch": 0.67, + "learning_rate": 6.537610189895538e-08, + "loss": 0.0005, + "step": 34717 + }, + { + "epoch": 0.67, + "learning_rate": 6.537221855461924e-08, + "loss": 0.5266, + "step": 34718 + }, + { + "epoch": 0.67, + "learning_rate": 6.53683352102831e-08, + "loss": 0.0004, + "step": 34719 + }, + { + "epoch": 0.67, + "learning_rate": 6.536445186594695e-08, + "loss": 0.0007, + "step": 34720 + }, + { + "epoch": 0.67, + "learning_rate": 6.536056852161081e-08, + "loss": 0.0016, + "step": 34721 + }, + { + "epoch": 0.67, + "learning_rate": 6.535668517727467e-08, + "loss": 0.0004, + "step": 34722 + }, + { + "epoch": 0.67, + "learning_rate": 6.535280183293853e-08, + "loss": 0.0108, + "step": 34723 + }, + { + "epoch": 0.67, + "learning_rate": 6.534891848860237e-08, + "loss": 0.0114, + "step": 34724 + }, + { + "epoch": 0.67, + "learning_rate": 6.534503514426623e-08, + "loss": 0.0007, + "step": 34725 + }, + { + "epoch": 0.67, + "learning_rate": 6.534115179993009e-08, + "loss": 0.0009, + "step": 34726 + }, + { + "epoch": 0.67, + "learning_rate": 6.533726845559395e-08, + "loss": 0.001, + "step": 34727 + }, + { + "epoch": 0.67, + "learning_rate": 6.53333851112578e-08, + "loss": 0.0008, + "step": 34728 + }, + { + "epoch": 0.67, + "learning_rate": 6.532950176692166e-08, + "loss": 0.0005, + "step": 34729 + }, + { + "epoch": 0.67, + "learning_rate": 6.532561842258552e-08, + "loss": 0.0004, + "step": 34730 + }, + { + "epoch": 0.67, + "learning_rate": 6.532173507824938e-08, + "loss": 0.0136, + "step": 34731 + }, + { + "epoch": 0.67, + "learning_rate": 6.531785173391324e-08, + "loss": 0.0004, + "step": 34732 + }, + { + "epoch": 0.67, + "learning_rate": 6.53139683895771e-08, + "loss": 0.0006, + "step": 34733 + }, + { + "epoch": 0.67, + "learning_rate": 6.531008504524095e-08, + "loss": 0.0008, + "step": 34734 + }, + { + "epoch": 0.67, + "learning_rate": 6.530620170090481e-08, + "loss": 0.0005, + "step": 34735 + }, + { + "epoch": 0.67, + "learning_rate": 6.530231835656867e-08, + "loss": 0.458, + "step": 34736 + }, + { + "epoch": 0.67, + "learning_rate": 6.529843501223253e-08, + "loss": 0.0006, + "step": 34737 + }, + { + "epoch": 0.67, + "learning_rate": 6.529455166789639e-08, + "loss": 0.0006, + "step": 34738 + }, + { + "epoch": 0.67, + "learning_rate": 6.529066832356025e-08, + "loss": 0.0009, + "step": 34739 + }, + { + "epoch": 0.67, + "learning_rate": 6.52867849792241e-08, + "loss": 0.0004, + "step": 34740 + }, + { + "epoch": 0.67, + "learning_rate": 6.528290163488796e-08, + "loss": 0.0006, + "step": 34741 + }, + { + "epoch": 0.67, + "learning_rate": 6.527901829055182e-08, + "loss": 0.0004, + "step": 34742 + }, + { + "epoch": 0.67, + "learning_rate": 6.527513494621568e-08, + "loss": 0.0005, + "step": 34743 + }, + { + "epoch": 0.67, + "learning_rate": 6.527125160187954e-08, + "loss": 0.0011, + "step": 34744 + }, + { + "epoch": 0.67, + "learning_rate": 6.52673682575434e-08, + "loss": 0.0006, + "step": 34745 + }, + { + "epoch": 0.67, + "learning_rate": 6.526348491320725e-08, + "loss": 0.1368, + "step": 34746 + }, + { + "epoch": 0.67, + "learning_rate": 6.525960156887111e-08, + "loss": 0.0004, + "step": 34747 + }, + { + "epoch": 0.67, + "learning_rate": 6.525571822453496e-08, + "loss": 0.0006, + "step": 34748 + }, + { + "epoch": 0.67, + "learning_rate": 6.525183488019881e-08, + "loss": 1.1429, + "step": 34749 + }, + { + "epoch": 0.67, + "learning_rate": 6.524795153586267e-08, + "loss": 0.0007, + "step": 34750 + }, + { + "epoch": 0.67, + "learning_rate": 6.524406819152653e-08, + "loss": 0.0004, + "step": 34751 + }, + { + "epoch": 0.67, + "learning_rate": 6.524018484719039e-08, + "loss": 0.0004, + "step": 34752 + }, + { + "epoch": 0.67, + "learning_rate": 6.523630150285425e-08, + "loss": 0.0006, + "step": 34753 + }, + { + "epoch": 0.67, + "learning_rate": 6.52324181585181e-08, + "loss": 0.0005, + "step": 34754 + }, + { + "epoch": 0.67, + "learning_rate": 6.522853481418196e-08, + "loss": 0.0005, + "step": 34755 + }, + { + "epoch": 0.67, + "learning_rate": 6.522465146984582e-08, + "loss": 0.0006, + "step": 34756 + }, + { + "epoch": 0.67, + "learning_rate": 6.522076812550968e-08, + "loss": 0.1507, + "step": 34757 + }, + { + "epoch": 0.67, + "learning_rate": 6.521688478117354e-08, + "loss": 0.0022, + "step": 34758 + }, + { + "epoch": 0.67, + "learning_rate": 6.52130014368374e-08, + "loss": 0.0004, + "step": 34759 + }, + { + "epoch": 0.67, + "learning_rate": 6.520911809250126e-08, + "loss": 0.0004, + "step": 34760 + }, + { + "epoch": 0.67, + "learning_rate": 6.520523474816511e-08, + "loss": 0.0022, + "step": 34761 + }, + { + "epoch": 0.67, + "learning_rate": 6.520135140382897e-08, + "loss": 0.0006, + "step": 34762 + }, + { + "epoch": 0.67, + "learning_rate": 6.519746805949283e-08, + "loss": 0.0051, + "step": 34763 + }, + { + "epoch": 0.67, + "learning_rate": 6.519358471515669e-08, + "loss": 0.0004, + "step": 34764 + }, + { + "epoch": 0.67, + "learning_rate": 6.518970137082055e-08, + "loss": 0.0005, + "step": 34765 + }, + { + "epoch": 0.67, + "learning_rate": 6.51858180264844e-08, + "loss": 0.0004, + "step": 34766 + }, + { + "epoch": 0.67, + "learning_rate": 6.518193468214826e-08, + "loss": 0.0004, + "step": 34767 + }, + { + "epoch": 0.67, + "learning_rate": 6.517805133781212e-08, + "loss": 0.0006, + "step": 34768 + }, + { + "epoch": 0.67, + "learning_rate": 6.517416799347598e-08, + "loss": 0.0007, + "step": 34769 + }, + { + "epoch": 0.67, + "learning_rate": 6.517028464913984e-08, + "loss": 0.0003, + "step": 34770 + }, + { + "epoch": 0.67, + "learning_rate": 6.51664013048037e-08, + "loss": 0.0006, + "step": 34771 + }, + { + "epoch": 0.67, + "learning_rate": 6.516251796046755e-08, + "loss": 0.0003, + "step": 34772 + }, + { + "epoch": 0.67, + "learning_rate": 6.515863461613141e-08, + "loss": 0.0004, + "step": 34773 + }, + { + "epoch": 0.67, + "learning_rate": 6.515475127179527e-08, + "loss": 0.0005, + "step": 34774 + }, + { + "epoch": 0.67, + "learning_rate": 6.515086792745913e-08, + "loss": 0.0004, + "step": 34775 + }, + { + "epoch": 0.67, + "learning_rate": 6.514698458312299e-08, + "loss": 0.0003, + "step": 34776 + }, + { + "epoch": 0.67, + "learning_rate": 6.514310123878683e-08, + "loss": 0.0006, + "step": 34777 + }, + { + "epoch": 0.67, + "learning_rate": 6.513921789445069e-08, + "loss": 0.0005, + "step": 34778 + }, + { + "epoch": 0.67, + "learning_rate": 6.513533455011455e-08, + "loss": 0.0004, + "step": 34779 + }, + { + "epoch": 0.67, + "learning_rate": 6.513145120577841e-08, + "loss": 0.001, + "step": 34780 + }, + { + "epoch": 0.67, + "learning_rate": 6.512756786144226e-08, + "loss": 0.0005, + "step": 34781 + }, + { + "epoch": 0.67, + "learning_rate": 6.512368451710612e-08, + "loss": 0.0004, + "step": 34782 + }, + { + "epoch": 0.67, + "learning_rate": 6.511980117276998e-08, + "loss": 0.0006, + "step": 34783 + }, + { + "epoch": 0.67, + "learning_rate": 6.511591782843384e-08, + "loss": 0.0004, + "step": 34784 + }, + { + "epoch": 0.67, + "learning_rate": 6.51120344840977e-08, + "loss": 0.9538, + "step": 34785 + }, + { + "epoch": 0.67, + "learning_rate": 6.510815113976156e-08, + "loss": 0.0005, + "step": 34786 + }, + { + "epoch": 0.67, + "learning_rate": 6.510426779542541e-08, + "loss": 1.1758, + "step": 34787 + }, + { + "epoch": 0.67, + "learning_rate": 6.510038445108927e-08, + "loss": 0.0004, + "step": 34788 + }, + { + "epoch": 0.67, + "learning_rate": 6.509650110675313e-08, + "loss": 0.0005, + "step": 34789 + }, + { + "epoch": 0.67, + "learning_rate": 6.509261776241699e-08, + "loss": 0.0005, + "step": 34790 + }, + { + "epoch": 0.67, + "learning_rate": 6.508873441808085e-08, + "loss": 1.0495, + "step": 34791 + }, + { + "epoch": 0.67, + "learning_rate": 6.50848510737447e-08, + "loss": 0.0008, + "step": 34792 + }, + { + "epoch": 0.67, + "learning_rate": 6.508096772940856e-08, + "loss": 0.0005, + "step": 34793 + }, + { + "epoch": 0.67, + "learning_rate": 6.507708438507242e-08, + "loss": 0.0208, + "step": 34794 + }, + { + "epoch": 0.67, + "learning_rate": 6.507320104073628e-08, + "loss": 0.0007, + "step": 34795 + }, + { + "epoch": 0.67, + "learning_rate": 6.506931769640014e-08, + "loss": 0.0004, + "step": 34796 + }, + { + "epoch": 0.67, + "learning_rate": 6.5065434352064e-08, + "loss": 0.0004, + "step": 34797 + }, + { + "epoch": 0.68, + "learning_rate": 6.506155100772786e-08, + "loss": 0.0006, + "step": 34798 + }, + { + "epoch": 0.68, + "learning_rate": 6.505766766339171e-08, + "loss": 0.001, + "step": 34799 + }, + { + "epoch": 0.68, + "learning_rate": 6.505378431905557e-08, + "loss": 0.0006, + "step": 34800 + }, + { + "epoch": 0.68, + "learning_rate": 6.504990097471943e-08, + "loss": 0.0005, + "step": 34801 + }, + { + "epoch": 0.68, + "learning_rate": 6.504601763038329e-08, + "loss": 0.0003, + "step": 34802 + }, + { + "epoch": 0.68, + "learning_rate": 6.504213428604715e-08, + "loss": 0.0005, + "step": 34803 + }, + { + "epoch": 0.68, + "learning_rate": 6.5038250941711e-08, + "loss": 0.0007, + "step": 34804 + }, + { + "epoch": 0.68, + "learning_rate": 6.503436759737486e-08, + "loss": 0.1503, + "step": 34805 + }, + { + "epoch": 0.68, + "learning_rate": 6.503048425303871e-08, + "loss": 0.0004, + "step": 34806 + }, + { + "epoch": 0.68, + "learning_rate": 6.502660090870257e-08, + "loss": 0.0004, + "step": 34807 + }, + { + "epoch": 0.68, + "learning_rate": 6.502271756436642e-08, + "loss": 0.0005, + "step": 34808 + }, + { + "epoch": 0.68, + "learning_rate": 6.501883422003028e-08, + "loss": 0.0004, + "step": 34809 + }, + { + "epoch": 0.68, + "learning_rate": 6.501495087569414e-08, + "loss": 0.0004, + "step": 34810 + }, + { + "epoch": 0.68, + "learning_rate": 6.5011067531358e-08, + "loss": 0.0005, + "step": 34811 + }, + { + "epoch": 0.68, + "learning_rate": 6.500718418702186e-08, + "loss": 0.0005, + "step": 34812 + }, + { + "epoch": 0.68, + "learning_rate": 6.500330084268572e-08, + "loss": 0.0005, + "step": 34813 + }, + { + "epoch": 0.68, + "learning_rate": 6.499941749834957e-08, + "loss": 0.0007, + "step": 34814 + }, + { + "epoch": 0.68, + "learning_rate": 6.499553415401343e-08, + "loss": 0.0003, + "step": 34815 + }, + { + "epoch": 0.68, + "learning_rate": 6.499165080967729e-08, + "loss": 0.0004, + "step": 34816 + }, + { + "epoch": 0.68, + "learning_rate": 6.498776746534115e-08, + "loss": 0.0007, + "step": 34817 + }, + { + "epoch": 0.68, + "learning_rate": 6.498388412100501e-08, + "loss": 0.0004, + "step": 34818 + }, + { + "epoch": 0.68, + "learning_rate": 6.498000077666887e-08, + "loss": 0.0005, + "step": 34819 + }, + { + "epoch": 0.68, + "learning_rate": 6.497611743233272e-08, + "loss": 0.0007, + "step": 34820 + }, + { + "epoch": 0.68, + "learning_rate": 6.497223408799658e-08, + "loss": 0.0004, + "step": 34821 + }, + { + "epoch": 0.68, + "learning_rate": 6.496835074366044e-08, + "loss": 0.0004, + "step": 34822 + }, + { + "epoch": 0.68, + "learning_rate": 6.49644673993243e-08, + "loss": 0.0005, + "step": 34823 + }, + { + "epoch": 0.68, + "learning_rate": 6.496058405498816e-08, + "loss": 0.0005, + "step": 34824 + }, + { + "epoch": 0.68, + "learning_rate": 6.495670071065201e-08, + "loss": 0.0006, + "step": 34825 + }, + { + "epoch": 0.68, + "learning_rate": 6.495281736631587e-08, + "loss": 0.0005, + "step": 34826 + }, + { + "epoch": 0.68, + "learning_rate": 6.494893402197973e-08, + "loss": 0.0005, + "step": 34827 + }, + { + "epoch": 0.68, + "learning_rate": 6.494505067764359e-08, + "loss": 0.0007, + "step": 34828 + }, + { + "epoch": 0.68, + "learning_rate": 6.494116733330745e-08, + "loss": 0.0004, + "step": 34829 + }, + { + "epoch": 0.68, + "learning_rate": 6.49372839889713e-08, + "loss": 0.0004, + "step": 34830 + }, + { + "epoch": 0.68, + "learning_rate": 6.493340064463516e-08, + "loss": 0.0004, + "step": 34831 + }, + { + "epoch": 0.68, + "learning_rate": 6.492951730029902e-08, + "loss": 0.0003, + "step": 34832 + }, + { + "epoch": 0.68, + "learning_rate": 6.492563395596288e-08, + "loss": 0.0003, + "step": 34833 + }, + { + "epoch": 0.68, + "learning_rate": 6.492175061162674e-08, + "loss": 0.0003, + "step": 34834 + }, + { + "epoch": 0.68, + "learning_rate": 6.491786726729058e-08, + "loss": 0.0004, + "step": 34835 + }, + { + "epoch": 0.68, + "learning_rate": 6.491398392295444e-08, + "loss": 0.0004, + "step": 34836 + }, + { + "epoch": 0.68, + "learning_rate": 6.49101005786183e-08, + "loss": 0.0004, + "step": 34837 + }, + { + "epoch": 0.68, + "learning_rate": 6.490621723428216e-08, + "loss": 0.0002, + "step": 34838 + }, + { + "epoch": 0.68, + "learning_rate": 6.490233388994602e-08, + "loss": 0.0003, + "step": 34839 + }, + { + "epoch": 0.68, + "learning_rate": 6.489845054560987e-08, + "loss": 0.0005, + "step": 34840 + }, + { + "epoch": 0.68, + "learning_rate": 6.489456720127373e-08, + "loss": 1.0824, + "step": 34841 + }, + { + "epoch": 0.68, + "learning_rate": 6.489068385693759e-08, + "loss": 0.0005, + "step": 34842 + }, + { + "epoch": 0.68, + "learning_rate": 6.488680051260145e-08, + "loss": 0.0005, + "step": 34843 + }, + { + "epoch": 0.68, + "learning_rate": 6.488291716826531e-08, + "loss": 0.0538, + "step": 34844 + }, + { + "epoch": 0.68, + "learning_rate": 6.487903382392917e-08, + "loss": 0.0005, + "step": 34845 + }, + { + "epoch": 0.68, + "learning_rate": 6.487515047959302e-08, + "loss": 0.0005, + "step": 34846 + }, + { + "epoch": 0.68, + "learning_rate": 6.487126713525688e-08, + "loss": 0.0003, + "step": 34847 + }, + { + "epoch": 0.68, + "learning_rate": 6.486738379092074e-08, + "loss": 0.3849, + "step": 34848 + }, + { + "epoch": 0.68, + "learning_rate": 6.48635004465846e-08, + "loss": 0.0031, + "step": 34849 + }, + { + "epoch": 0.68, + "learning_rate": 6.485961710224846e-08, + "loss": 0.0005, + "step": 34850 + }, + { + "epoch": 0.68, + "learning_rate": 6.485573375791232e-08, + "loss": 0.0007, + "step": 34851 + }, + { + "epoch": 0.68, + "learning_rate": 6.485185041357617e-08, + "loss": 0.0005, + "step": 34852 + }, + { + "epoch": 0.68, + "learning_rate": 6.484796706924003e-08, + "loss": 0.0004, + "step": 34853 + }, + { + "epoch": 0.68, + "learning_rate": 6.484408372490389e-08, + "loss": 0.0004, + "step": 34854 + }, + { + "epoch": 0.68, + "learning_rate": 6.484020038056775e-08, + "loss": 0.4666, + "step": 34855 + }, + { + "epoch": 0.68, + "learning_rate": 6.483631703623161e-08, + "loss": 0.0003, + "step": 34856 + }, + { + "epoch": 0.68, + "learning_rate": 6.483243369189547e-08, + "loss": 0.0005, + "step": 34857 + }, + { + "epoch": 0.68, + "learning_rate": 6.482855034755932e-08, + "loss": 0.0005, + "step": 34858 + }, + { + "epoch": 0.68, + "learning_rate": 6.482466700322318e-08, + "loss": 0.0006, + "step": 34859 + }, + { + "epoch": 0.68, + "learning_rate": 6.482078365888704e-08, + "loss": 0.0004, + "step": 34860 + }, + { + "epoch": 0.68, + "learning_rate": 6.48169003145509e-08, + "loss": 0.0005, + "step": 34861 + }, + { + "epoch": 0.68, + "learning_rate": 6.481301697021476e-08, + "loss": 0.229, + "step": 34862 + }, + { + "epoch": 0.68, + "learning_rate": 6.480913362587861e-08, + "loss": 0.0004, + "step": 34863 + }, + { + "epoch": 0.68, + "learning_rate": 6.480525028154246e-08, + "loss": 0.0007, + "step": 34864 + }, + { + "epoch": 0.68, + "learning_rate": 6.480136693720632e-08, + "loss": 0.0007, + "step": 34865 + }, + { + "epoch": 0.68, + "learning_rate": 6.479748359287018e-08, + "loss": 0.0017, + "step": 34866 + }, + { + "epoch": 0.68, + "learning_rate": 6.479360024853403e-08, + "loss": 0.0004, + "step": 34867 + }, + { + "epoch": 0.68, + "learning_rate": 6.478971690419789e-08, + "loss": 0.0005, + "step": 34868 + }, + { + "epoch": 0.68, + "learning_rate": 6.478583355986175e-08, + "loss": 0.0003, + "step": 34869 + }, + { + "epoch": 0.68, + "learning_rate": 6.478195021552561e-08, + "loss": 0.0361, + "step": 34870 + }, + { + "epoch": 0.68, + "learning_rate": 6.477806687118947e-08, + "loss": 0.3656, + "step": 34871 + }, + { + "epoch": 0.68, + "learning_rate": 6.477418352685333e-08, + "loss": 0.0007, + "step": 34872 + }, + { + "epoch": 0.68, + "learning_rate": 6.477030018251718e-08, + "loss": 0.0005, + "step": 34873 + }, + { + "epoch": 0.68, + "learning_rate": 6.476641683818104e-08, + "loss": 0.0006, + "step": 34874 + }, + { + "epoch": 0.68, + "learning_rate": 6.47625334938449e-08, + "loss": 0.0004, + "step": 34875 + }, + { + "epoch": 0.68, + "learning_rate": 6.475865014950876e-08, + "loss": 0.457, + "step": 34876 + }, + { + "epoch": 0.68, + "learning_rate": 6.475476680517262e-08, + "loss": 0.0005, + "step": 34877 + }, + { + "epoch": 0.68, + "learning_rate": 6.475088346083647e-08, + "loss": 0.0004, + "step": 34878 + }, + { + "epoch": 0.68, + "learning_rate": 6.474700011650033e-08, + "loss": 0.0003, + "step": 34879 + }, + { + "epoch": 0.68, + "learning_rate": 6.474311677216419e-08, + "loss": 0.0005, + "step": 34880 + }, + { + "epoch": 0.68, + "learning_rate": 6.473923342782805e-08, + "loss": 0.0004, + "step": 34881 + }, + { + "epoch": 0.68, + "learning_rate": 6.473535008349191e-08, + "loss": 0.0005, + "step": 34882 + }, + { + "epoch": 0.68, + "learning_rate": 6.473146673915577e-08, + "loss": 0.0004, + "step": 34883 + }, + { + "epoch": 0.68, + "learning_rate": 6.472758339481962e-08, + "loss": 0.0006, + "step": 34884 + }, + { + "epoch": 0.68, + "learning_rate": 6.472370005048348e-08, + "loss": 1.14, + "step": 34885 + }, + { + "epoch": 0.68, + "learning_rate": 6.471981670614734e-08, + "loss": 0.0005, + "step": 34886 + }, + { + "epoch": 0.68, + "learning_rate": 6.471593336181119e-08, + "loss": 0.0003, + "step": 34887 + }, + { + "epoch": 0.68, + "learning_rate": 6.471205001747504e-08, + "loss": 0.0305, + "step": 34888 + }, + { + "epoch": 0.68, + "learning_rate": 6.47081666731389e-08, + "loss": 0.0064, + "step": 34889 + }, + { + "epoch": 0.68, + "learning_rate": 6.470428332880276e-08, + "loss": 0.0005, + "step": 34890 + }, + { + "epoch": 0.68, + "learning_rate": 6.470039998446662e-08, + "loss": 0.0007, + "step": 34891 + }, + { + "epoch": 0.68, + "learning_rate": 6.469651664013048e-08, + "loss": 0.0004, + "step": 34892 + }, + { + "epoch": 0.68, + "learning_rate": 6.469263329579434e-08, + "loss": 0.0004, + "step": 34893 + }, + { + "epoch": 0.68, + "learning_rate": 6.46887499514582e-08, + "loss": 0.0004, + "step": 34894 + }, + { + "epoch": 0.68, + "learning_rate": 6.468486660712205e-08, + "loss": 0.0004, + "step": 34895 + }, + { + "epoch": 0.68, + "learning_rate": 6.468098326278591e-08, + "loss": 0.0004, + "step": 34896 + }, + { + "epoch": 0.68, + "learning_rate": 6.467709991844977e-08, + "loss": 0.0005, + "step": 34897 + }, + { + "epoch": 0.68, + "learning_rate": 6.467321657411363e-08, + "loss": 0.8703, + "step": 34898 + }, + { + "epoch": 0.68, + "learning_rate": 6.466933322977748e-08, + "loss": 0.0005, + "step": 34899 + }, + { + "epoch": 0.68, + "learning_rate": 6.466544988544134e-08, + "loss": 0.0017, + "step": 34900 + }, + { + "epoch": 0.68, + "learning_rate": 6.466156654110519e-08, + "loss": 0.0004, + "step": 34901 + }, + { + "epoch": 0.68, + "learning_rate": 6.465768319676905e-08, + "loss": 0.0011, + "step": 34902 + }, + { + "epoch": 0.68, + "learning_rate": 6.46537998524329e-08, + "loss": 0.0005, + "step": 34903 + }, + { + "epoch": 0.68, + "learning_rate": 6.464991650809676e-08, + "loss": 0.0005, + "step": 34904 + }, + { + "epoch": 0.68, + "learning_rate": 6.464603316376062e-08, + "loss": 0.0007, + "step": 34905 + }, + { + "epoch": 0.68, + "learning_rate": 6.464214981942448e-08, + "loss": 0.0019, + "step": 34906 + }, + { + "epoch": 0.68, + "learning_rate": 6.463826647508834e-08, + "loss": 0.0153, + "step": 34907 + }, + { + "epoch": 0.68, + "learning_rate": 6.46343831307522e-08, + "loss": 0.0005, + "step": 34908 + }, + { + "epoch": 0.68, + "learning_rate": 6.463049978641605e-08, + "loss": 0.0005, + "step": 34909 + }, + { + "epoch": 0.68, + "learning_rate": 6.462661644207991e-08, + "loss": 0.0003, + "step": 34910 + }, + { + "epoch": 0.68, + "learning_rate": 6.462273309774377e-08, + "loss": 0.0004, + "step": 34911 + }, + { + "epoch": 0.68, + "learning_rate": 6.461884975340763e-08, + "loss": 0.0038, + "step": 34912 + }, + { + "epoch": 0.68, + "learning_rate": 6.461496640907149e-08, + "loss": 0.0006, + "step": 34913 + }, + { + "epoch": 0.68, + "learning_rate": 6.461108306473535e-08, + "loss": 0.0006, + "step": 34914 + }, + { + "epoch": 0.68, + "learning_rate": 6.46071997203992e-08, + "loss": 0.0006, + "step": 34915 + }, + { + "epoch": 0.68, + "learning_rate": 6.460331637606306e-08, + "loss": 0.0003, + "step": 34916 + }, + { + "epoch": 0.68, + "learning_rate": 6.459943303172692e-08, + "loss": 0.0346, + "step": 34917 + }, + { + "epoch": 0.68, + "learning_rate": 6.459554968739078e-08, + "loss": 0.0004, + "step": 34918 + }, + { + "epoch": 0.68, + "learning_rate": 6.459166634305464e-08, + "loss": 0.0258, + "step": 34919 + }, + { + "epoch": 0.68, + "learning_rate": 6.45877829987185e-08, + "loss": 0.5263, + "step": 34920 + }, + { + "epoch": 0.68, + "learning_rate": 6.458389965438235e-08, + "loss": 0.0006, + "step": 34921 + }, + { + "epoch": 0.68, + "learning_rate": 6.45800163100462e-08, + "loss": 0.0011, + "step": 34922 + }, + { + "epoch": 0.68, + "learning_rate": 6.457613296571006e-08, + "loss": 0.0005, + "step": 34923 + }, + { + "epoch": 0.68, + "learning_rate": 6.457224962137391e-08, + "loss": 0.0733, + "step": 34924 + }, + { + "epoch": 0.68, + "learning_rate": 6.456836627703777e-08, + "loss": 0.001, + "step": 34925 + }, + { + "epoch": 0.68, + "learning_rate": 6.456448293270163e-08, + "loss": 0.0004, + "step": 34926 + }, + { + "epoch": 0.68, + "learning_rate": 6.456059958836549e-08, + "loss": 0.0005, + "step": 34927 + }, + { + "epoch": 0.68, + "learning_rate": 6.455671624402935e-08, + "loss": 0.0003, + "step": 34928 + }, + { + "epoch": 0.68, + "learning_rate": 6.45528328996932e-08, + "loss": 1.2512, + "step": 34929 + }, + { + "epoch": 0.68, + "learning_rate": 6.454894955535706e-08, + "loss": 0.0003, + "step": 34930 + }, + { + "epoch": 0.68, + "learning_rate": 6.454506621102092e-08, + "loss": 0.0006, + "step": 34931 + }, + { + "epoch": 0.68, + "learning_rate": 6.454118286668478e-08, + "loss": 0.0005, + "step": 34932 + }, + { + "epoch": 0.68, + "learning_rate": 6.453729952234864e-08, + "loss": 0.0005, + "step": 34933 + }, + { + "epoch": 0.68, + "learning_rate": 6.45334161780125e-08, + "loss": 0.0005, + "step": 34934 + }, + { + "epoch": 0.68, + "learning_rate": 6.452953283367636e-08, + "loss": 0.0005, + "step": 34935 + }, + { + "epoch": 0.68, + "learning_rate": 6.452564948934021e-08, + "loss": 0.0006, + "step": 34936 + }, + { + "epoch": 0.68, + "learning_rate": 6.452176614500407e-08, + "loss": 0.0004, + "step": 34937 + }, + { + "epoch": 0.68, + "learning_rate": 6.451788280066793e-08, + "loss": 0.0007, + "step": 34938 + }, + { + "epoch": 0.68, + "learning_rate": 6.451399945633179e-08, + "loss": 0.0004, + "step": 34939 + }, + { + "epoch": 0.68, + "learning_rate": 6.451011611199565e-08, + "loss": 0.0007, + "step": 34940 + }, + { + "epoch": 0.68, + "learning_rate": 6.45062327676595e-08, + "loss": 0.0057, + "step": 34941 + }, + { + "epoch": 0.68, + "learning_rate": 6.450234942332336e-08, + "loss": 0.0064, + "step": 34942 + }, + { + "epoch": 0.68, + "learning_rate": 6.449846607898722e-08, + "loss": 0.0005, + "step": 34943 + }, + { + "epoch": 0.68, + "learning_rate": 6.449458273465108e-08, + "loss": 0.5034, + "step": 34944 + }, + { + "epoch": 0.68, + "learning_rate": 6.449069939031494e-08, + "loss": 0.0004, + "step": 34945 + }, + { + "epoch": 0.68, + "learning_rate": 6.44868160459788e-08, + "loss": 0.0812, + "step": 34946 + }, + { + "epoch": 0.68, + "learning_rate": 6.448293270164265e-08, + "loss": 0.0004, + "step": 34947 + }, + { + "epoch": 0.68, + "learning_rate": 6.447904935730651e-08, + "loss": 0.0004, + "step": 34948 + }, + { + "epoch": 0.68, + "learning_rate": 6.447516601297037e-08, + "loss": 0.0004, + "step": 34949 + }, + { + "epoch": 0.68, + "learning_rate": 6.447128266863423e-08, + "loss": 0.0003, + "step": 34950 + }, + { + "epoch": 0.68, + "learning_rate": 6.446739932429807e-08, + "loss": 0.0004, + "step": 34951 + }, + { + "epoch": 0.68, + "learning_rate": 6.446351597996193e-08, + "loss": 0.0234, + "step": 34952 + }, + { + "epoch": 0.68, + "learning_rate": 6.445963263562579e-08, + "loss": 0.0004, + "step": 34953 + }, + { + "epoch": 0.68, + "learning_rate": 6.445574929128965e-08, + "loss": 0.0003, + "step": 34954 + }, + { + "epoch": 0.68, + "learning_rate": 6.445186594695351e-08, + "loss": 0.0005, + "step": 34955 + }, + { + "epoch": 0.68, + "learning_rate": 6.444798260261737e-08, + "loss": 0.0005, + "step": 34956 + }, + { + "epoch": 0.68, + "learning_rate": 6.444409925828122e-08, + "loss": 0.0003, + "step": 34957 + }, + { + "epoch": 0.68, + "learning_rate": 6.444021591394508e-08, + "loss": 1.1314, + "step": 34958 + }, + { + "epoch": 0.68, + "learning_rate": 6.443633256960894e-08, + "loss": 0.0005, + "step": 34959 + }, + { + "epoch": 0.68, + "learning_rate": 6.44324492252728e-08, + "loss": 0.0366, + "step": 34960 + }, + { + "epoch": 0.68, + "learning_rate": 6.442856588093666e-08, + "loss": 0.0004, + "step": 34961 + }, + { + "epoch": 0.68, + "learning_rate": 6.442468253660051e-08, + "loss": 0.0003, + "step": 34962 + }, + { + "epoch": 0.68, + "learning_rate": 6.442079919226437e-08, + "loss": 0.0004, + "step": 34963 + }, + { + "epoch": 0.68, + "learning_rate": 6.441691584792823e-08, + "loss": 0.0004, + "step": 34964 + }, + { + "epoch": 0.68, + "learning_rate": 6.441303250359209e-08, + "loss": 0.0003, + "step": 34965 + }, + { + "epoch": 0.68, + "learning_rate": 6.440914915925595e-08, + "loss": 0.2242, + "step": 34966 + }, + { + "epoch": 0.68, + "learning_rate": 6.44052658149198e-08, + "loss": 0.0006, + "step": 34967 + }, + { + "epoch": 0.68, + "learning_rate": 6.440138247058366e-08, + "loss": 0.0006, + "step": 34968 + }, + { + "epoch": 0.68, + "learning_rate": 6.439749912624752e-08, + "loss": 0.0004, + "step": 34969 + }, + { + "epoch": 0.68, + "learning_rate": 6.439361578191138e-08, + "loss": 0.0009, + "step": 34970 + }, + { + "epoch": 0.68, + "learning_rate": 6.438973243757524e-08, + "loss": 0.0005, + "step": 34971 + }, + { + "epoch": 0.68, + "learning_rate": 6.43858490932391e-08, + "loss": 0.0005, + "step": 34972 + }, + { + "epoch": 0.68, + "learning_rate": 6.438196574890296e-08, + "loss": 0.0555, + "step": 34973 + }, + { + "epoch": 0.68, + "learning_rate": 6.437808240456681e-08, + "loss": 0.0004, + "step": 34974 + }, + { + "epoch": 0.68, + "learning_rate": 6.437419906023067e-08, + "loss": 0.0005, + "step": 34975 + }, + { + "epoch": 0.68, + "learning_rate": 6.437031571589453e-08, + "loss": 0.0004, + "step": 34976 + }, + { + "epoch": 0.68, + "learning_rate": 6.436643237155839e-08, + "loss": 0.0008, + "step": 34977 + }, + { + "epoch": 0.68, + "learning_rate": 6.436254902722225e-08, + "loss": 0.0003, + "step": 34978 + }, + { + "epoch": 0.68, + "learning_rate": 6.43586656828861e-08, + "loss": 0.0004, + "step": 34979 + }, + { + "epoch": 0.68, + "learning_rate": 6.435478233854995e-08, + "loss": 0.0004, + "step": 34980 + }, + { + "epoch": 0.68, + "learning_rate": 6.435089899421381e-08, + "loss": 0.0004, + "step": 34981 + }, + { + "epoch": 0.68, + "learning_rate": 6.434701564987767e-08, + "loss": 0.0005, + "step": 34982 + }, + { + "epoch": 0.68, + "learning_rate": 6.434313230554152e-08, + "loss": 0.0013, + "step": 34983 + }, + { + "epoch": 0.68, + "learning_rate": 6.433924896120538e-08, + "loss": 0.0047, + "step": 34984 + }, + { + "epoch": 0.68, + "learning_rate": 6.433536561686924e-08, + "loss": 0.0005, + "step": 34985 + }, + { + "epoch": 0.68, + "learning_rate": 6.43314822725331e-08, + "loss": 0.0005, + "step": 34986 + }, + { + "epoch": 0.68, + "learning_rate": 6.432759892819696e-08, + "loss": 0.0005, + "step": 34987 + }, + { + "epoch": 0.68, + "learning_rate": 6.432371558386082e-08, + "loss": 1.1126, + "step": 34988 + }, + { + "epoch": 0.68, + "learning_rate": 6.431983223952467e-08, + "loss": 0.0007, + "step": 34989 + }, + { + "epoch": 0.68, + "learning_rate": 6.431594889518853e-08, + "loss": 0.0003, + "step": 34990 + }, + { + "epoch": 0.68, + "learning_rate": 6.431206555085239e-08, + "loss": 0.0008, + "step": 34991 + }, + { + "epoch": 0.68, + "learning_rate": 6.430818220651625e-08, + "loss": 0.0013, + "step": 34992 + }, + { + "epoch": 0.68, + "learning_rate": 6.430429886218011e-08, + "loss": 0.0005, + "step": 34993 + }, + { + "epoch": 0.68, + "learning_rate": 6.430041551784397e-08, + "loss": 0.0005, + "step": 34994 + }, + { + "epoch": 0.68, + "learning_rate": 6.429653217350782e-08, + "loss": 0.0004, + "step": 34995 + }, + { + "epoch": 0.68, + "learning_rate": 6.429264882917168e-08, + "loss": 0.0006, + "step": 34996 + }, + { + "epoch": 0.68, + "learning_rate": 6.428876548483554e-08, + "loss": 0.0005, + "step": 34997 + }, + { + "epoch": 0.68, + "learning_rate": 6.42848821404994e-08, + "loss": 0.0008, + "step": 34998 + }, + { + "epoch": 0.68, + "learning_rate": 6.428099879616326e-08, + "loss": 0.0006, + "step": 34999 + }, + { + "epoch": 0.68, + "learning_rate": 6.427711545182711e-08, + "loss": 0.0004, + "step": 35000 + }, + { + "epoch": 0.68, + "learning_rate": 6.427323210749097e-08, + "loss": 0.0003, + "step": 35001 + }, + { + "epoch": 0.68, + "learning_rate": 6.426934876315483e-08, + "loss": 0.0065, + "step": 35002 + }, + { + "epoch": 0.68, + "learning_rate": 6.426546541881869e-08, + "loss": 0.0003, + "step": 35003 + }, + { + "epoch": 0.68, + "learning_rate": 6.426158207448255e-08, + "loss": 1.1868, + "step": 35004 + }, + { + "epoch": 0.68, + "learning_rate": 6.42576987301464e-08, + "loss": 0.333, + "step": 35005 + }, + { + "epoch": 0.68, + "learning_rate": 6.425381538581026e-08, + "loss": 0.0004, + "step": 35006 + }, + { + "epoch": 0.68, + "learning_rate": 6.424993204147412e-08, + "loss": 0.0005, + "step": 35007 + }, + { + "epoch": 0.68, + "learning_rate": 6.424604869713798e-08, + "loss": 0.0004, + "step": 35008 + }, + { + "epoch": 0.68, + "learning_rate": 6.424216535280183e-08, + "loss": 0.0006, + "step": 35009 + }, + { + "epoch": 0.68, + "learning_rate": 6.423828200846568e-08, + "loss": 0.0005, + "step": 35010 + }, + { + "epoch": 0.68, + "learning_rate": 6.423439866412954e-08, + "loss": 0.7452, + "step": 35011 + }, + { + "epoch": 0.68, + "learning_rate": 6.42305153197934e-08, + "loss": 0.0012, + "step": 35012 + }, + { + "epoch": 0.68, + "learning_rate": 6.422663197545726e-08, + "loss": 0.8417, + "step": 35013 + }, + { + "epoch": 0.68, + "learning_rate": 6.422274863112112e-08, + "loss": 0.0033, + "step": 35014 + }, + { + "epoch": 0.68, + "learning_rate": 6.421886528678498e-08, + "loss": 1.2589, + "step": 35015 + }, + { + "epoch": 0.68, + "learning_rate": 6.421498194244883e-08, + "loss": 0.0004, + "step": 35016 + }, + { + "epoch": 0.68, + "learning_rate": 6.421109859811269e-08, + "loss": 0.0004, + "step": 35017 + }, + { + "epoch": 0.68, + "learning_rate": 6.420721525377655e-08, + "loss": 0.0004, + "step": 35018 + }, + { + "epoch": 0.68, + "learning_rate": 6.420333190944041e-08, + "loss": 0.0005, + "step": 35019 + }, + { + "epoch": 0.68, + "learning_rate": 6.419944856510427e-08, + "loss": 0.0005, + "step": 35020 + }, + { + "epoch": 0.68, + "learning_rate": 6.419556522076812e-08, + "loss": 0.0008, + "step": 35021 + }, + { + "epoch": 0.68, + "learning_rate": 6.419168187643198e-08, + "loss": 0.0005, + "step": 35022 + }, + { + "epoch": 0.68, + "learning_rate": 6.418779853209584e-08, + "loss": 0.0003, + "step": 35023 + }, + { + "epoch": 0.68, + "learning_rate": 6.41839151877597e-08, + "loss": 0.0004, + "step": 35024 + }, + { + "epoch": 0.68, + "learning_rate": 6.418003184342356e-08, + "loss": 0.0004, + "step": 35025 + }, + { + "epoch": 0.68, + "learning_rate": 6.417614849908742e-08, + "loss": 1.2362, + "step": 35026 + }, + { + "epoch": 0.68, + "learning_rate": 6.417226515475127e-08, + "loss": 0.0005, + "step": 35027 + }, + { + "epoch": 0.68, + "learning_rate": 6.416838181041513e-08, + "loss": 0.0004, + "step": 35028 + }, + { + "epoch": 0.68, + "learning_rate": 6.416449846607899e-08, + "loss": 0.0005, + "step": 35029 + }, + { + "epoch": 0.68, + "learning_rate": 6.416061512174285e-08, + "loss": 0.0005, + "step": 35030 + }, + { + "epoch": 0.68, + "learning_rate": 6.415673177740671e-08, + "loss": 0.0004, + "step": 35031 + }, + { + "epoch": 0.68, + "learning_rate": 6.415284843307057e-08, + "loss": 0.0004, + "step": 35032 + }, + { + "epoch": 0.68, + "learning_rate": 6.414896508873442e-08, + "loss": 0.0004, + "step": 35033 + }, + { + "epoch": 0.68, + "learning_rate": 6.414508174439828e-08, + "loss": 0.0005, + "step": 35034 + }, + { + "epoch": 0.68, + "learning_rate": 6.414119840006214e-08, + "loss": 0.0005, + "step": 35035 + }, + { + "epoch": 0.68, + "learning_rate": 6.4137315055726e-08, + "loss": 0.0005, + "step": 35036 + }, + { + "epoch": 0.68, + "learning_rate": 6.413343171138986e-08, + "loss": 0.8118, + "step": 35037 + }, + { + "epoch": 0.68, + "learning_rate": 6.41295483670537e-08, + "loss": 0.0005, + "step": 35038 + }, + { + "epoch": 0.68, + "learning_rate": 6.412566502271756e-08, + "loss": 0.0007, + "step": 35039 + }, + { + "epoch": 0.68, + "learning_rate": 6.412178167838142e-08, + "loss": 0.0004, + "step": 35040 + }, + { + "epoch": 0.68, + "learning_rate": 6.411789833404528e-08, + "loss": 0.0004, + "step": 35041 + }, + { + "epoch": 0.68, + "learning_rate": 6.411401498970913e-08, + "loss": 0.0039, + "step": 35042 + }, + { + "epoch": 0.68, + "learning_rate": 6.411013164537299e-08, + "loss": 0.0005, + "step": 35043 + }, + { + "epoch": 0.68, + "learning_rate": 6.410624830103685e-08, + "loss": 0.0004, + "step": 35044 + }, + { + "epoch": 0.68, + "learning_rate": 6.410236495670071e-08, + "loss": 0.0609, + "step": 35045 + }, + { + "epoch": 0.68, + "learning_rate": 6.409848161236457e-08, + "loss": 0.0005, + "step": 35046 + }, + { + "epoch": 0.68, + "learning_rate": 6.409459826802843e-08, + "loss": 0.0005, + "step": 35047 + }, + { + "epoch": 0.68, + "learning_rate": 6.409071492369228e-08, + "loss": 0.0005, + "step": 35048 + }, + { + "epoch": 0.68, + "learning_rate": 6.408683157935614e-08, + "loss": 0.0006, + "step": 35049 + }, + { + "epoch": 0.68, + "learning_rate": 6.408294823502e-08, + "loss": 0.0007, + "step": 35050 + }, + { + "epoch": 0.68, + "learning_rate": 6.407906489068386e-08, + "loss": 0.1977, + "step": 35051 + }, + { + "epoch": 0.68, + "learning_rate": 6.407518154634772e-08, + "loss": 0.0168, + "step": 35052 + }, + { + "epoch": 0.68, + "learning_rate": 6.407129820201158e-08, + "loss": 0.0003, + "step": 35053 + }, + { + "epoch": 0.68, + "learning_rate": 6.406741485767543e-08, + "loss": 0.0005, + "step": 35054 + }, + { + "epoch": 0.68, + "learning_rate": 6.406353151333929e-08, + "loss": 0.0355, + "step": 35055 + }, + { + "epoch": 0.68, + "learning_rate": 6.405964816900315e-08, + "loss": 0.0004, + "step": 35056 + }, + { + "epoch": 0.68, + "learning_rate": 6.405576482466701e-08, + "loss": 0.0016, + "step": 35057 + }, + { + "epoch": 0.68, + "learning_rate": 6.405188148033087e-08, + "loss": 0.095, + "step": 35058 + }, + { + "epoch": 0.68, + "learning_rate": 6.404799813599472e-08, + "loss": 0.0003, + "step": 35059 + }, + { + "epoch": 0.68, + "learning_rate": 6.404411479165858e-08, + "loss": 0.0004, + "step": 35060 + }, + { + "epoch": 0.68, + "learning_rate": 6.404023144732244e-08, + "loss": 0.0014, + "step": 35061 + }, + { + "epoch": 0.68, + "learning_rate": 6.40363481029863e-08, + "loss": 0.0004, + "step": 35062 + }, + { + "epoch": 0.68, + "learning_rate": 6.403246475865016e-08, + "loss": 0.0007, + "step": 35063 + }, + { + "epoch": 0.68, + "learning_rate": 6.4028581414314e-08, + "loss": 0.0003, + "step": 35064 + }, + { + "epoch": 0.68, + "learning_rate": 6.402469806997786e-08, + "loss": 0.0004, + "step": 35065 + }, + { + "epoch": 0.68, + "learning_rate": 6.402081472564172e-08, + "loss": 0.0038, + "step": 35066 + }, + { + "epoch": 0.68, + "learning_rate": 6.401693138130558e-08, + "loss": 0.0004, + "step": 35067 + }, + { + "epoch": 0.68, + "learning_rate": 6.401304803696944e-08, + "loss": 0.9448, + "step": 35068 + }, + { + "epoch": 0.68, + "learning_rate": 6.40091646926333e-08, + "loss": 0.0004, + "step": 35069 + }, + { + "epoch": 0.68, + "learning_rate": 6.400528134829715e-08, + "loss": 0.0011, + "step": 35070 + }, + { + "epoch": 0.68, + "learning_rate": 6.400139800396101e-08, + "loss": 1.0294, + "step": 35071 + }, + { + "epoch": 0.68, + "learning_rate": 6.399751465962487e-08, + "loss": 0.0004, + "step": 35072 + }, + { + "epoch": 0.68, + "learning_rate": 6.399363131528873e-08, + "loss": 0.0005, + "step": 35073 + }, + { + "epoch": 0.68, + "learning_rate": 6.398974797095258e-08, + "loss": 0.0006, + "step": 35074 + }, + { + "epoch": 0.68, + "learning_rate": 6.398586462661644e-08, + "loss": 0.0008, + "step": 35075 + }, + { + "epoch": 0.68, + "learning_rate": 6.39819812822803e-08, + "loss": 0.019, + "step": 35076 + }, + { + "epoch": 0.68, + "learning_rate": 6.397809793794416e-08, + "loss": 0.0004, + "step": 35077 + }, + { + "epoch": 0.68, + "learning_rate": 6.3974214593608e-08, + "loss": 0.7326, + "step": 35078 + }, + { + "epoch": 0.68, + "learning_rate": 6.397033124927186e-08, + "loss": 0.0004, + "step": 35079 + }, + { + "epoch": 0.68, + "learning_rate": 6.396644790493572e-08, + "loss": 0.0008, + "step": 35080 + }, + { + "epoch": 0.68, + "learning_rate": 6.396256456059958e-08, + "loss": 0.0003, + "step": 35081 + }, + { + "epoch": 0.68, + "learning_rate": 6.395868121626344e-08, + "loss": 0.0006, + "step": 35082 + }, + { + "epoch": 0.68, + "learning_rate": 6.39547978719273e-08, + "loss": 0.0005, + "step": 35083 + }, + { + "epoch": 0.68, + "learning_rate": 6.395091452759115e-08, + "loss": 0.0451, + "step": 35084 + }, + { + "epoch": 0.68, + "learning_rate": 6.394703118325501e-08, + "loss": 0.4083, + "step": 35085 + }, + { + "epoch": 0.68, + "learning_rate": 6.394314783891887e-08, + "loss": 0.0005, + "step": 35086 + }, + { + "epoch": 0.68, + "learning_rate": 6.393926449458273e-08, + "loss": 0.0005, + "step": 35087 + }, + { + "epoch": 0.68, + "learning_rate": 6.393538115024659e-08, + "loss": 0.0003, + "step": 35088 + }, + { + "epoch": 0.68, + "learning_rate": 6.393149780591045e-08, + "loss": 0.0006, + "step": 35089 + }, + { + "epoch": 0.68, + "learning_rate": 6.39276144615743e-08, + "loss": 0.0004, + "step": 35090 + }, + { + "epoch": 0.68, + "learning_rate": 6.392373111723816e-08, + "loss": 0.0005, + "step": 35091 + }, + { + "epoch": 0.68, + "learning_rate": 6.391984777290202e-08, + "loss": 0.0009, + "step": 35092 + }, + { + "epoch": 0.68, + "learning_rate": 6.391596442856588e-08, + "loss": 0.0003, + "step": 35093 + }, + { + "epoch": 0.68, + "learning_rate": 6.391208108422974e-08, + "loss": 0.0006, + "step": 35094 + }, + { + "epoch": 0.68, + "learning_rate": 6.39081977398936e-08, + "loss": 0.1387, + "step": 35095 + }, + { + "epoch": 0.68, + "learning_rate": 6.390431439555744e-08, + "loss": 0.0007, + "step": 35096 + }, + { + "epoch": 0.68, + "learning_rate": 6.39004310512213e-08, + "loss": 1.0977, + "step": 35097 + }, + { + "epoch": 0.68, + "learning_rate": 6.389654770688516e-08, + "loss": 0.0005, + "step": 35098 + }, + { + "epoch": 0.68, + "learning_rate": 6.389266436254901e-08, + "loss": 0.0004, + "step": 35099 + }, + { + "epoch": 0.68, + "learning_rate": 6.388878101821287e-08, + "loss": 0.0004, + "step": 35100 + }, + { + "epoch": 0.68, + "learning_rate": 6.388489767387673e-08, + "loss": 0.0007, + "step": 35101 + }, + { + "epoch": 0.68, + "learning_rate": 6.388101432954059e-08, + "loss": 0.0004, + "step": 35102 + }, + { + "epoch": 0.68, + "learning_rate": 6.387713098520445e-08, + "loss": 0.0004, + "step": 35103 + }, + { + "epoch": 0.68, + "learning_rate": 6.38732476408683e-08, + "loss": 0.0006, + "step": 35104 + }, + { + "epoch": 0.68, + "learning_rate": 6.386936429653216e-08, + "loss": 0.0004, + "step": 35105 + }, + { + "epoch": 0.68, + "learning_rate": 6.386548095219602e-08, + "loss": 0.0005, + "step": 35106 + }, + { + "epoch": 0.68, + "learning_rate": 6.386159760785988e-08, + "loss": 0.0004, + "step": 35107 + }, + { + "epoch": 0.68, + "learning_rate": 6.385771426352374e-08, + "loss": 0.0006, + "step": 35108 + }, + { + "epoch": 0.68, + "learning_rate": 6.38538309191876e-08, + "loss": 0.4302, + "step": 35109 + }, + { + "epoch": 0.68, + "learning_rate": 6.384994757485146e-08, + "loss": 1.1121, + "step": 35110 + }, + { + "epoch": 0.68, + "learning_rate": 6.384606423051531e-08, + "loss": 0.0006, + "step": 35111 + }, + { + "epoch": 0.68, + "learning_rate": 6.384218088617917e-08, + "loss": 0.0005, + "step": 35112 + }, + { + "epoch": 0.68, + "learning_rate": 6.383829754184303e-08, + "loss": 0.0005, + "step": 35113 + }, + { + "epoch": 0.68, + "learning_rate": 6.383441419750689e-08, + "loss": 0.0006, + "step": 35114 + }, + { + "epoch": 0.68, + "learning_rate": 6.383053085317075e-08, + "loss": 0.0301, + "step": 35115 + }, + { + "epoch": 0.68, + "learning_rate": 6.38266475088346e-08, + "loss": 0.0006, + "step": 35116 + }, + { + "epoch": 0.68, + "learning_rate": 6.382276416449846e-08, + "loss": 0.0006, + "step": 35117 + }, + { + "epoch": 0.68, + "learning_rate": 6.381888082016232e-08, + "loss": 0.0007, + "step": 35118 + }, + { + "epoch": 0.68, + "learning_rate": 6.381499747582618e-08, + "loss": 0.0004, + "step": 35119 + }, + { + "epoch": 0.68, + "learning_rate": 6.381111413149004e-08, + "loss": 0.0005, + "step": 35120 + }, + { + "epoch": 0.68, + "learning_rate": 6.38072307871539e-08, + "loss": 0.0016, + "step": 35121 + }, + { + "epoch": 0.68, + "learning_rate": 6.380334744281775e-08, + "loss": 0.0005, + "step": 35122 + }, + { + "epoch": 0.68, + "learning_rate": 6.379946409848161e-08, + "loss": 0.0007, + "step": 35123 + }, + { + "epoch": 0.68, + "learning_rate": 6.379558075414547e-08, + "loss": 0.0036, + "step": 35124 + }, + { + "epoch": 0.68, + "learning_rate": 6.379169740980932e-08, + "loss": 0.0005, + "step": 35125 + }, + { + "epoch": 0.68, + "learning_rate": 6.378781406547317e-08, + "loss": 0.0004, + "step": 35126 + }, + { + "epoch": 0.68, + "learning_rate": 6.378393072113703e-08, + "loss": 0.0008, + "step": 35127 + }, + { + "epoch": 0.68, + "learning_rate": 6.378004737680089e-08, + "loss": 0.0005, + "step": 35128 + }, + { + "epoch": 0.68, + "learning_rate": 6.377616403246475e-08, + "loss": 0.0004, + "step": 35129 + }, + { + "epoch": 0.68, + "learning_rate": 6.377228068812861e-08, + "loss": 0.0003, + "step": 35130 + }, + { + "epoch": 0.68, + "learning_rate": 6.376839734379247e-08, + "loss": 0.0004, + "step": 35131 + }, + { + "epoch": 0.68, + "learning_rate": 6.376451399945632e-08, + "loss": 0.0004, + "step": 35132 + }, + { + "epoch": 0.68, + "learning_rate": 6.376063065512018e-08, + "loss": 0.0007, + "step": 35133 + }, + { + "epoch": 0.68, + "learning_rate": 6.375674731078404e-08, + "loss": 0.0004, + "step": 35134 + }, + { + "epoch": 0.68, + "learning_rate": 6.37528639664479e-08, + "loss": 0.0005, + "step": 35135 + }, + { + "epoch": 0.68, + "learning_rate": 6.374898062211176e-08, + "loss": 0.0005, + "step": 35136 + }, + { + "epoch": 0.68, + "learning_rate": 6.374509727777561e-08, + "loss": 0.0004, + "step": 35137 + }, + { + "epoch": 0.68, + "learning_rate": 6.374121393343947e-08, + "loss": 0.0006, + "step": 35138 + }, + { + "epoch": 0.68, + "learning_rate": 6.373733058910333e-08, + "loss": 0.0023, + "step": 35139 + }, + { + "epoch": 0.68, + "learning_rate": 6.373344724476719e-08, + "loss": 0.0014, + "step": 35140 + }, + { + "epoch": 0.68, + "learning_rate": 6.372956390043105e-08, + "loss": 0.0005, + "step": 35141 + }, + { + "epoch": 0.68, + "learning_rate": 6.37256805560949e-08, + "loss": 0.0003, + "step": 35142 + }, + { + "epoch": 0.68, + "learning_rate": 6.372179721175876e-08, + "loss": 0.315, + "step": 35143 + }, + { + "epoch": 0.68, + "learning_rate": 6.371791386742262e-08, + "loss": 0.0004, + "step": 35144 + }, + { + "epoch": 0.68, + "learning_rate": 6.371403052308648e-08, + "loss": 0.0004, + "step": 35145 + }, + { + "epoch": 0.68, + "learning_rate": 6.371014717875034e-08, + "loss": 0.0004, + "step": 35146 + }, + { + "epoch": 0.68, + "learning_rate": 6.37062638344142e-08, + "loss": 0.0004, + "step": 35147 + }, + { + "epoch": 0.68, + "learning_rate": 6.370238049007806e-08, + "loss": 0.0004, + "step": 35148 + }, + { + "epoch": 0.68, + "learning_rate": 6.369849714574191e-08, + "loss": 0.0005, + "step": 35149 + }, + { + "epoch": 0.68, + "learning_rate": 6.369461380140577e-08, + "loss": 0.1136, + "step": 35150 + }, + { + "epoch": 0.68, + "learning_rate": 6.369073045706963e-08, + "loss": 0.0004, + "step": 35151 + }, + { + "epoch": 0.68, + "learning_rate": 6.368684711273349e-08, + "loss": 0.0009, + "step": 35152 + }, + { + "epoch": 0.68, + "learning_rate": 6.368296376839735e-08, + "loss": 0.0004, + "step": 35153 + }, + { + "epoch": 0.68, + "learning_rate": 6.367908042406119e-08, + "loss": 0.0004, + "step": 35154 + }, + { + "epoch": 0.68, + "learning_rate": 6.367519707972505e-08, + "loss": 0.0033, + "step": 35155 + }, + { + "epoch": 0.68, + "learning_rate": 6.367131373538891e-08, + "loss": 0.0003, + "step": 35156 + }, + { + "epoch": 0.68, + "learning_rate": 6.366743039105277e-08, + "loss": 1.2309, + "step": 35157 + }, + { + "epoch": 0.68, + "learning_rate": 6.366354704671662e-08, + "loss": 0.0005, + "step": 35158 + }, + { + "epoch": 0.68, + "learning_rate": 6.365966370238048e-08, + "loss": 0.0004, + "step": 35159 + }, + { + "epoch": 0.68, + "learning_rate": 6.365578035804434e-08, + "loss": 0.0005, + "step": 35160 + }, + { + "epoch": 0.68, + "learning_rate": 6.36518970137082e-08, + "loss": 0.0005, + "step": 35161 + }, + { + "epoch": 0.68, + "learning_rate": 6.364801366937206e-08, + "loss": 0.6128, + "step": 35162 + }, + { + "epoch": 0.68, + "learning_rate": 6.364413032503592e-08, + "loss": 0.0003, + "step": 35163 + }, + { + "epoch": 0.68, + "learning_rate": 6.364024698069977e-08, + "loss": 0.0004, + "step": 35164 + }, + { + "epoch": 0.68, + "learning_rate": 6.363636363636363e-08, + "loss": 0.0005, + "step": 35165 + }, + { + "epoch": 0.68, + "learning_rate": 6.363248029202749e-08, + "loss": 0.0004, + "step": 35166 + }, + { + "epoch": 0.68, + "learning_rate": 6.362859694769135e-08, + "loss": 0.0004, + "step": 35167 + }, + { + "epoch": 0.68, + "learning_rate": 6.362471360335521e-08, + "loss": 0.0003, + "step": 35168 + }, + { + "epoch": 0.68, + "learning_rate": 6.362083025901907e-08, + "loss": 0.0007, + "step": 35169 + }, + { + "epoch": 0.68, + "learning_rate": 6.361694691468292e-08, + "loss": 0.0005, + "step": 35170 + }, + { + "epoch": 0.68, + "learning_rate": 6.361306357034678e-08, + "loss": 0.0004, + "step": 35171 + }, + { + "epoch": 0.68, + "learning_rate": 6.360918022601064e-08, + "loss": 0.3972, + "step": 35172 + }, + { + "epoch": 0.68, + "learning_rate": 6.36052968816745e-08, + "loss": 0.0007, + "step": 35173 + }, + { + "epoch": 0.68, + "learning_rate": 6.360141353733836e-08, + "loss": 0.0365, + "step": 35174 + }, + { + "epoch": 0.68, + "learning_rate": 6.359753019300221e-08, + "loss": 0.0003, + "step": 35175 + }, + { + "epoch": 0.68, + "learning_rate": 6.359364684866607e-08, + "loss": 0.0004, + "step": 35176 + }, + { + "epoch": 0.68, + "learning_rate": 6.358976350432993e-08, + "loss": 0.0004, + "step": 35177 + }, + { + "epoch": 0.68, + "learning_rate": 6.358588015999379e-08, + "loss": 0.0005, + "step": 35178 + }, + { + "epoch": 0.68, + "learning_rate": 6.358199681565765e-08, + "loss": 0.0005, + "step": 35179 + }, + { + "epoch": 0.68, + "learning_rate": 6.35781134713215e-08, + "loss": 0.0013, + "step": 35180 + }, + { + "epoch": 0.68, + "learning_rate": 6.357423012698536e-08, + "loss": 0.0005, + "step": 35181 + }, + { + "epoch": 0.68, + "learning_rate": 6.357034678264922e-08, + "loss": 0.0007, + "step": 35182 + }, + { + "epoch": 0.68, + "learning_rate": 6.356646343831307e-08, + "loss": 0.0007, + "step": 35183 + }, + { + "epoch": 0.68, + "learning_rate": 6.356258009397693e-08, + "loss": 0.0005, + "step": 35184 + }, + { + "epoch": 0.68, + "learning_rate": 6.355869674964078e-08, + "loss": 1.2648, + "step": 35185 + }, + { + "epoch": 0.68, + "learning_rate": 6.355481340530464e-08, + "loss": 0.0003, + "step": 35186 + }, + { + "epoch": 0.68, + "learning_rate": 6.35509300609685e-08, + "loss": 0.0005, + "step": 35187 + }, + { + "epoch": 0.68, + "learning_rate": 6.354704671663236e-08, + "loss": 0.0009, + "step": 35188 + }, + { + "epoch": 0.68, + "learning_rate": 6.354316337229622e-08, + "loss": 0.0004, + "step": 35189 + }, + { + "epoch": 0.68, + "learning_rate": 6.353928002796008e-08, + "loss": 0.0003, + "step": 35190 + }, + { + "epoch": 0.68, + "learning_rate": 6.353539668362393e-08, + "loss": 0.0005, + "step": 35191 + }, + { + "epoch": 0.68, + "learning_rate": 6.353151333928779e-08, + "loss": 0.0118, + "step": 35192 + }, + { + "epoch": 0.68, + "learning_rate": 6.352762999495165e-08, + "loss": 0.0004, + "step": 35193 + }, + { + "epoch": 0.68, + "learning_rate": 6.352374665061551e-08, + "loss": 0.2683, + "step": 35194 + }, + { + "epoch": 0.68, + "learning_rate": 6.351986330627937e-08, + "loss": 0.0007, + "step": 35195 + }, + { + "epoch": 0.68, + "learning_rate": 6.351597996194322e-08, + "loss": 0.0004, + "step": 35196 + }, + { + "epoch": 0.68, + "learning_rate": 6.351209661760708e-08, + "loss": 0.0004, + "step": 35197 + }, + { + "epoch": 0.68, + "learning_rate": 6.350821327327094e-08, + "loss": 0.0004, + "step": 35198 + }, + { + "epoch": 0.68, + "learning_rate": 6.35043299289348e-08, + "loss": 1.2456, + "step": 35199 + }, + { + "epoch": 0.68, + "learning_rate": 6.350044658459866e-08, + "loss": 0.0004, + "step": 35200 + }, + { + "epoch": 0.68, + "learning_rate": 6.349656324026252e-08, + "loss": 0.0048, + "step": 35201 + }, + { + "epoch": 0.68, + "learning_rate": 6.349267989592637e-08, + "loss": 0.0004, + "step": 35202 + }, + { + "epoch": 0.68, + "learning_rate": 6.348879655159023e-08, + "loss": 0.0014, + "step": 35203 + }, + { + "epoch": 0.68, + "learning_rate": 6.348491320725409e-08, + "loss": 0.3648, + "step": 35204 + }, + { + "epoch": 0.68, + "learning_rate": 6.348102986291795e-08, + "loss": 0.001, + "step": 35205 + }, + { + "epoch": 0.68, + "learning_rate": 6.347714651858181e-08, + "loss": 0.0004, + "step": 35206 + }, + { + "epoch": 0.68, + "learning_rate": 6.347326317424567e-08, + "loss": 0.0059, + "step": 35207 + }, + { + "epoch": 0.68, + "learning_rate": 6.346937982990952e-08, + "loss": 0.8604, + "step": 35208 + }, + { + "epoch": 0.68, + "learning_rate": 6.346549648557338e-08, + "loss": 0.0006, + "step": 35209 + }, + { + "epoch": 0.68, + "learning_rate": 6.346161314123724e-08, + "loss": 0.0007, + "step": 35210 + }, + { + "epoch": 0.68, + "learning_rate": 6.34577297969011e-08, + "loss": 0.0004, + "step": 35211 + }, + { + "epoch": 0.68, + "learning_rate": 6.345384645256494e-08, + "loss": 0.0004, + "step": 35212 + }, + { + "epoch": 0.68, + "learning_rate": 6.34499631082288e-08, + "loss": 0.0019, + "step": 35213 + }, + { + "epoch": 0.68, + "learning_rate": 6.344607976389266e-08, + "loss": 0.0003, + "step": 35214 + }, + { + "epoch": 0.68, + "learning_rate": 6.344219641955652e-08, + "loss": 0.0004, + "step": 35215 + }, + { + "epoch": 0.68, + "learning_rate": 6.343831307522038e-08, + "loss": 0.0003, + "step": 35216 + }, + { + "epoch": 0.68, + "learning_rate": 6.343442973088423e-08, + "loss": 0.0006, + "step": 35217 + }, + { + "epoch": 0.68, + "learning_rate": 6.343054638654809e-08, + "loss": 0.0005, + "step": 35218 + }, + { + "epoch": 0.68, + "learning_rate": 6.342666304221195e-08, + "loss": 0.0006, + "step": 35219 + }, + { + "epoch": 0.68, + "learning_rate": 6.342277969787581e-08, + "loss": 0.0009, + "step": 35220 + }, + { + "epoch": 0.68, + "learning_rate": 6.341889635353967e-08, + "loss": 0.0017, + "step": 35221 + }, + { + "epoch": 0.68, + "learning_rate": 6.341501300920353e-08, + "loss": 0.0005, + "step": 35222 + }, + { + "epoch": 0.68, + "learning_rate": 6.341112966486738e-08, + "loss": 0.0278, + "step": 35223 + }, + { + "epoch": 0.68, + "learning_rate": 6.340724632053124e-08, + "loss": 0.0006, + "step": 35224 + }, + { + "epoch": 0.68, + "learning_rate": 6.34033629761951e-08, + "loss": 0.1616, + "step": 35225 + }, + { + "epoch": 0.68, + "learning_rate": 6.339947963185896e-08, + "loss": 0.0003, + "step": 35226 + }, + { + "epoch": 0.68, + "learning_rate": 6.339559628752282e-08, + "loss": 0.0004, + "step": 35227 + }, + { + "epoch": 0.68, + "learning_rate": 6.339171294318668e-08, + "loss": 0.0005, + "step": 35228 + }, + { + "epoch": 0.68, + "learning_rate": 6.338782959885053e-08, + "loss": 0.0019, + "step": 35229 + }, + { + "epoch": 0.68, + "learning_rate": 6.338394625451439e-08, + "loss": 0.0004, + "step": 35230 + }, + { + "epoch": 0.68, + "learning_rate": 6.338006291017825e-08, + "loss": 0.7791, + "step": 35231 + }, + { + "epoch": 0.68, + "learning_rate": 6.337617956584211e-08, + "loss": 0.0003, + "step": 35232 + }, + { + "epoch": 0.68, + "learning_rate": 6.337229622150597e-08, + "loss": 0.0006, + "step": 35233 + }, + { + "epoch": 0.68, + "learning_rate": 6.336841287716982e-08, + "loss": 0.0005, + "step": 35234 + }, + { + "epoch": 0.68, + "learning_rate": 6.336452953283368e-08, + "loss": 0.001, + "step": 35235 + }, + { + "epoch": 0.68, + "learning_rate": 6.336064618849754e-08, + "loss": 0.0003, + "step": 35236 + }, + { + "epoch": 0.68, + "learning_rate": 6.33567628441614e-08, + "loss": 0.0004, + "step": 35237 + }, + { + "epoch": 0.68, + "learning_rate": 6.335287949982526e-08, + "loss": 0.0011, + "step": 35238 + }, + { + "epoch": 0.68, + "learning_rate": 6.334899615548912e-08, + "loss": 0.0005, + "step": 35239 + }, + { + "epoch": 0.68, + "learning_rate": 6.334511281115297e-08, + "loss": 0.0005, + "step": 35240 + }, + { + "epoch": 0.68, + "learning_rate": 6.334122946681682e-08, + "loss": 0.0004, + "step": 35241 + }, + { + "epoch": 0.68, + "learning_rate": 6.333734612248068e-08, + "loss": 0.0006, + "step": 35242 + }, + { + "epoch": 0.68, + "learning_rate": 6.333346277814454e-08, + "loss": 0.0006, + "step": 35243 + }, + { + "epoch": 0.68, + "learning_rate": 6.33295794338084e-08, + "loss": 0.0005, + "step": 35244 + }, + { + "epoch": 0.68, + "learning_rate": 6.332569608947225e-08, + "loss": 0.0004, + "step": 35245 + }, + { + "epoch": 0.68, + "learning_rate": 6.332181274513611e-08, + "loss": 0.0004, + "step": 35246 + }, + { + "epoch": 0.68, + "learning_rate": 6.331792940079997e-08, + "loss": 0.0004, + "step": 35247 + }, + { + "epoch": 0.68, + "learning_rate": 6.331404605646383e-08, + "loss": 0.0005, + "step": 35248 + }, + { + "epoch": 0.68, + "learning_rate": 6.331016271212769e-08, + "loss": 0.0004, + "step": 35249 + }, + { + "epoch": 0.68, + "learning_rate": 6.330627936779154e-08, + "loss": 0.0003, + "step": 35250 + }, + { + "epoch": 0.68, + "learning_rate": 6.33023960234554e-08, + "loss": 0.0004, + "step": 35251 + }, + { + "epoch": 0.68, + "learning_rate": 6.329851267911926e-08, + "loss": 1.1998, + "step": 35252 + }, + { + "epoch": 0.68, + "learning_rate": 6.329462933478312e-08, + "loss": 0.0008, + "step": 35253 + }, + { + "epoch": 0.68, + "learning_rate": 6.329074599044698e-08, + "loss": 0.0006, + "step": 35254 + }, + { + "epoch": 0.68, + "learning_rate": 6.328686264611082e-08, + "loss": 0.319, + "step": 35255 + }, + { + "epoch": 0.68, + "learning_rate": 6.328297930177468e-08, + "loss": 0.0003, + "step": 35256 + }, + { + "epoch": 0.68, + "learning_rate": 6.327909595743854e-08, + "loss": 0.0009, + "step": 35257 + }, + { + "epoch": 0.68, + "learning_rate": 6.32752126131024e-08, + "loss": 0.0005, + "step": 35258 + }, + { + "epoch": 0.68, + "learning_rate": 6.327132926876625e-08, + "loss": 0.0004, + "step": 35259 + }, + { + "epoch": 0.68, + "learning_rate": 6.326744592443011e-08, + "loss": 0.0006, + "step": 35260 + }, + { + "epoch": 0.68, + "learning_rate": 6.326356258009397e-08, + "loss": 0.0004, + "step": 35261 + }, + { + "epoch": 0.68, + "learning_rate": 6.325967923575783e-08, + "loss": 0.0005, + "step": 35262 + }, + { + "epoch": 0.68, + "learning_rate": 6.325579589142169e-08, + "loss": 0.0005, + "step": 35263 + }, + { + "epoch": 0.68, + "learning_rate": 6.325191254708555e-08, + "loss": 0.0003, + "step": 35264 + }, + { + "epoch": 0.68, + "learning_rate": 6.32480292027494e-08, + "loss": 0.0005, + "step": 35265 + }, + { + "epoch": 0.68, + "learning_rate": 6.324414585841326e-08, + "loss": 0.0005, + "step": 35266 + }, + { + "epoch": 0.68, + "learning_rate": 6.324026251407712e-08, + "loss": 0.004, + "step": 35267 + }, + { + "epoch": 0.68, + "learning_rate": 6.323637916974098e-08, + "loss": 0.0004, + "step": 35268 + }, + { + "epoch": 0.68, + "learning_rate": 6.323249582540484e-08, + "loss": 0.0008, + "step": 35269 + }, + { + "epoch": 0.68, + "learning_rate": 6.322861248106868e-08, + "loss": 0.0003, + "step": 35270 + }, + { + "epoch": 0.68, + "learning_rate": 6.322472913673254e-08, + "loss": 0.0004, + "step": 35271 + }, + { + "epoch": 0.68, + "learning_rate": 6.32208457923964e-08, + "loss": 0.0004, + "step": 35272 + }, + { + "epoch": 0.68, + "learning_rate": 6.321696244806026e-08, + "loss": 0.0006, + "step": 35273 + }, + { + "epoch": 0.68, + "learning_rate": 6.321307910372411e-08, + "loss": 0.0056, + "step": 35274 + }, + { + "epoch": 0.68, + "learning_rate": 6.320919575938797e-08, + "loss": 0.0004, + "step": 35275 + }, + { + "epoch": 0.68, + "learning_rate": 6.320531241505183e-08, + "loss": 0.0005, + "step": 35276 + }, + { + "epoch": 0.68, + "learning_rate": 6.320142907071569e-08, + "loss": 0.0004, + "step": 35277 + }, + { + "epoch": 0.68, + "learning_rate": 6.319754572637955e-08, + "loss": 0.0004, + "step": 35278 + }, + { + "epoch": 0.68, + "learning_rate": 6.31936623820434e-08, + "loss": 0.0194, + "step": 35279 + }, + { + "epoch": 0.68, + "learning_rate": 6.318977903770726e-08, + "loss": 0.5561, + "step": 35280 + }, + { + "epoch": 0.68, + "learning_rate": 6.318589569337112e-08, + "loss": 0.0006, + "step": 35281 + }, + { + "epoch": 0.68, + "learning_rate": 6.318201234903498e-08, + "loss": 0.0007, + "step": 35282 + }, + { + "epoch": 0.68, + "learning_rate": 6.317812900469884e-08, + "loss": 0.001, + "step": 35283 + }, + { + "epoch": 0.68, + "learning_rate": 6.31742456603627e-08, + "loss": 0.0006, + "step": 35284 + }, + { + "epoch": 0.68, + "learning_rate": 6.317036231602656e-08, + "loss": 0.8078, + "step": 35285 + }, + { + "epoch": 0.68, + "learning_rate": 6.316647897169041e-08, + "loss": 0.0004, + "step": 35286 + }, + { + "epoch": 0.68, + "learning_rate": 6.316259562735427e-08, + "loss": 0.0003, + "step": 35287 + }, + { + "epoch": 0.68, + "learning_rate": 6.315871228301813e-08, + "loss": 0.0004, + "step": 35288 + }, + { + "epoch": 0.68, + "learning_rate": 6.315482893868199e-08, + "loss": 0.0003, + "step": 35289 + }, + { + "epoch": 0.68, + "learning_rate": 6.315094559434585e-08, + "loss": 0.1085, + "step": 35290 + }, + { + "epoch": 0.68, + "learning_rate": 6.31470622500097e-08, + "loss": 0.0003, + "step": 35291 + }, + { + "epoch": 0.68, + "learning_rate": 6.314317890567356e-08, + "loss": 0.0004, + "step": 35292 + }, + { + "epoch": 0.68, + "learning_rate": 6.313929556133742e-08, + "loss": 0.0004, + "step": 35293 + }, + { + "epoch": 0.68, + "learning_rate": 6.313541221700128e-08, + "loss": 0.0006, + "step": 35294 + }, + { + "epoch": 0.68, + "learning_rate": 6.313152887266514e-08, + "loss": 0.0005, + "step": 35295 + }, + { + "epoch": 0.68, + "learning_rate": 6.3127645528329e-08, + "loss": 0.0007, + "step": 35296 + }, + { + "epoch": 0.68, + "learning_rate": 6.312376218399285e-08, + "loss": 0.0006, + "step": 35297 + }, + { + "epoch": 0.68, + "learning_rate": 6.311987883965671e-08, + "loss": 1.0253, + "step": 35298 + }, + { + "epoch": 0.68, + "learning_rate": 6.311599549532056e-08, + "loss": 0.0003, + "step": 35299 + }, + { + "epoch": 0.68, + "learning_rate": 6.311211215098442e-08, + "loss": 0.0005, + "step": 35300 + }, + { + "epoch": 0.68, + "learning_rate": 6.310822880664827e-08, + "loss": 1.0343, + "step": 35301 + }, + { + "epoch": 0.68, + "learning_rate": 6.310434546231213e-08, + "loss": 0.0093, + "step": 35302 + }, + { + "epoch": 0.68, + "learning_rate": 6.310046211797599e-08, + "loss": 0.0004, + "step": 35303 + }, + { + "epoch": 0.68, + "learning_rate": 6.309657877363985e-08, + "loss": 0.0012, + "step": 35304 + }, + { + "epoch": 0.68, + "learning_rate": 6.309269542930371e-08, + "loss": 0.0004, + "step": 35305 + }, + { + "epoch": 0.68, + "learning_rate": 6.308881208496757e-08, + "loss": 0.2727, + "step": 35306 + }, + { + "epoch": 0.68, + "learning_rate": 6.308492874063142e-08, + "loss": 0.0005, + "step": 35307 + }, + { + "epoch": 0.68, + "learning_rate": 6.308104539629528e-08, + "loss": 0.001, + "step": 35308 + }, + { + "epoch": 0.68, + "learning_rate": 6.307716205195914e-08, + "loss": 0.0004, + "step": 35309 + }, + { + "epoch": 0.68, + "learning_rate": 6.3073278707623e-08, + "loss": 0.8686, + "step": 35310 + }, + { + "epoch": 0.68, + "learning_rate": 6.306939536328686e-08, + "loss": 0.0005, + "step": 35311 + }, + { + "epoch": 0.68, + "learning_rate": 6.306551201895071e-08, + "loss": 0.0005, + "step": 35312 + }, + { + "epoch": 0.68, + "learning_rate": 6.306162867461457e-08, + "loss": 0.0013, + "step": 35313 + }, + { + "epoch": 0.69, + "learning_rate": 6.305774533027843e-08, + "loss": 0.0014, + "step": 35314 + }, + { + "epoch": 0.69, + "learning_rate": 6.305386198594229e-08, + "loss": 0.0003, + "step": 35315 + }, + { + "epoch": 0.69, + "learning_rate": 6.304997864160615e-08, + "loss": 0.0004, + "step": 35316 + }, + { + "epoch": 0.69, + "learning_rate": 6.304609529727e-08, + "loss": 0.0004, + "step": 35317 + }, + { + "epoch": 0.69, + "learning_rate": 6.304221195293386e-08, + "loss": 0.0005, + "step": 35318 + }, + { + "epoch": 0.69, + "learning_rate": 6.303832860859772e-08, + "loss": 0.0005, + "step": 35319 + }, + { + "epoch": 0.69, + "learning_rate": 6.303444526426158e-08, + "loss": 0.3329, + "step": 35320 + }, + { + "epoch": 0.69, + "learning_rate": 6.303056191992544e-08, + "loss": 0.1079, + "step": 35321 + }, + { + "epoch": 0.69, + "learning_rate": 6.30266785755893e-08, + "loss": 0.0005, + "step": 35322 + }, + { + "epoch": 0.69, + "learning_rate": 6.302279523125316e-08, + "loss": 0.0005, + "step": 35323 + }, + { + "epoch": 0.69, + "learning_rate": 6.301891188691701e-08, + "loss": 0.0005, + "step": 35324 + }, + { + "epoch": 0.69, + "learning_rate": 6.301502854258087e-08, + "loss": 0.0004, + "step": 35325 + }, + { + "epoch": 0.69, + "learning_rate": 6.301114519824473e-08, + "loss": 0.0004, + "step": 35326 + }, + { + "epoch": 0.69, + "learning_rate": 6.300726185390859e-08, + "loss": 0.001, + "step": 35327 + }, + { + "epoch": 0.69, + "learning_rate": 6.300337850957243e-08, + "loss": 0.0018, + "step": 35328 + }, + { + "epoch": 0.69, + "learning_rate": 6.299949516523629e-08, + "loss": 0.0006, + "step": 35329 + }, + { + "epoch": 0.69, + "learning_rate": 6.299561182090015e-08, + "loss": 0.0005, + "step": 35330 + }, + { + "epoch": 0.69, + "learning_rate": 6.299172847656401e-08, + "loss": 0.0053, + "step": 35331 + }, + { + "epoch": 0.69, + "learning_rate": 6.298784513222787e-08, + "loss": 0.0006, + "step": 35332 + }, + { + "epoch": 0.69, + "learning_rate": 6.298396178789172e-08, + "loss": 0.0049, + "step": 35333 + }, + { + "epoch": 0.69, + "learning_rate": 6.298007844355558e-08, + "loss": 0.0005, + "step": 35334 + }, + { + "epoch": 0.69, + "learning_rate": 6.297619509921944e-08, + "loss": 0.0024, + "step": 35335 + }, + { + "epoch": 0.69, + "learning_rate": 6.29723117548833e-08, + "loss": 0.0004, + "step": 35336 + }, + { + "epoch": 0.69, + "learning_rate": 6.296842841054716e-08, + "loss": 0.0004, + "step": 35337 + }, + { + "epoch": 0.69, + "learning_rate": 6.296454506621102e-08, + "loss": 0.0004, + "step": 35338 + }, + { + "epoch": 0.69, + "learning_rate": 6.296066172187487e-08, + "loss": 0.0003, + "step": 35339 + }, + { + "epoch": 0.69, + "learning_rate": 6.295677837753873e-08, + "loss": 0.6085, + "step": 35340 + }, + { + "epoch": 0.69, + "learning_rate": 6.295289503320259e-08, + "loss": 0.0006, + "step": 35341 + }, + { + "epoch": 0.69, + "learning_rate": 6.294901168886645e-08, + "loss": 0.0004, + "step": 35342 + }, + { + "epoch": 0.69, + "learning_rate": 6.294512834453031e-08, + "loss": 0.0004, + "step": 35343 + }, + { + "epoch": 0.69, + "learning_rate": 6.294124500019417e-08, + "loss": 0.0004, + "step": 35344 + }, + { + "epoch": 0.69, + "learning_rate": 6.293736165585802e-08, + "loss": 0.4677, + "step": 35345 + }, + { + "epoch": 0.69, + "learning_rate": 6.293347831152188e-08, + "loss": 0.0006, + "step": 35346 + }, + { + "epoch": 0.69, + "learning_rate": 6.292959496718574e-08, + "loss": 0.0004, + "step": 35347 + }, + { + "epoch": 0.69, + "learning_rate": 6.29257116228496e-08, + "loss": 0.0026, + "step": 35348 + }, + { + "epoch": 0.69, + "learning_rate": 6.292182827851346e-08, + "loss": 0.001, + "step": 35349 + }, + { + "epoch": 0.69, + "learning_rate": 6.291794493417731e-08, + "loss": 0.001, + "step": 35350 + }, + { + "epoch": 0.69, + "learning_rate": 6.291406158984117e-08, + "loss": 0.0004, + "step": 35351 + }, + { + "epoch": 0.69, + "learning_rate": 6.291017824550503e-08, + "loss": 0.0003, + "step": 35352 + }, + { + "epoch": 0.69, + "learning_rate": 6.290629490116889e-08, + "loss": 0.0004, + "step": 35353 + }, + { + "epoch": 0.69, + "learning_rate": 6.290241155683275e-08, + "loss": 0.0004, + "step": 35354 + }, + { + "epoch": 0.69, + "learning_rate": 6.28985282124966e-08, + "loss": 0.0014, + "step": 35355 + }, + { + "epoch": 0.69, + "learning_rate": 6.289464486816046e-08, + "loss": 0.0013, + "step": 35356 + }, + { + "epoch": 0.69, + "learning_rate": 6.289076152382431e-08, + "loss": 0.0003, + "step": 35357 + }, + { + "epoch": 0.69, + "learning_rate": 6.288687817948817e-08, + "loss": 0.0006, + "step": 35358 + }, + { + "epoch": 0.69, + "learning_rate": 6.288299483515203e-08, + "loss": 0.0003, + "step": 35359 + }, + { + "epoch": 0.69, + "learning_rate": 6.287911149081588e-08, + "loss": 0.0004, + "step": 35360 + }, + { + "epoch": 0.69, + "learning_rate": 6.287522814647974e-08, + "loss": 0.0007, + "step": 35361 + }, + { + "epoch": 0.69, + "learning_rate": 6.28713448021436e-08, + "loss": 0.0006, + "step": 35362 + }, + { + "epoch": 0.69, + "learning_rate": 6.286746145780746e-08, + "loss": 0.0005, + "step": 35363 + }, + { + "epoch": 0.69, + "learning_rate": 6.286357811347132e-08, + "loss": 0.0004, + "step": 35364 + }, + { + "epoch": 0.69, + "learning_rate": 6.285969476913518e-08, + "loss": 0.946, + "step": 35365 + }, + { + "epoch": 0.69, + "learning_rate": 6.285581142479903e-08, + "loss": 0.0006, + "step": 35366 + }, + { + "epoch": 0.69, + "learning_rate": 6.285192808046289e-08, + "loss": 0.0004, + "step": 35367 + }, + { + "epoch": 0.69, + "learning_rate": 6.284804473612675e-08, + "loss": 0.0003, + "step": 35368 + }, + { + "epoch": 0.69, + "learning_rate": 6.284416139179061e-08, + "loss": 0.0004, + "step": 35369 + }, + { + "epoch": 0.69, + "learning_rate": 6.284027804745447e-08, + "loss": 0.0009, + "step": 35370 + }, + { + "epoch": 0.69, + "learning_rate": 6.283639470311832e-08, + "loss": 0.0004, + "step": 35371 + }, + { + "epoch": 0.69, + "learning_rate": 6.283251135878218e-08, + "loss": 0.0008, + "step": 35372 + }, + { + "epoch": 0.69, + "learning_rate": 6.282862801444604e-08, + "loss": 0.0004, + "step": 35373 + }, + { + "epoch": 0.69, + "learning_rate": 6.28247446701099e-08, + "loss": 0.0004, + "step": 35374 + }, + { + "epoch": 0.69, + "learning_rate": 6.282086132577376e-08, + "loss": 0.001, + "step": 35375 + }, + { + "epoch": 0.69, + "learning_rate": 6.281697798143762e-08, + "loss": 0.0004, + "step": 35376 + }, + { + "epoch": 0.69, + "learning_rate": 6.281309463710147e-08, + "loss": 0.0006, + "step": 35377 + }, + { + "epoch": 0.69, + "learning_rate": 6.280921129276533e-08, + "loss": 0.0005, + "step": 35378 + }, + { + "epoch": 0.69, + "learning_rate": 6.280532794842919e-08, + "loss": 0.0004, + "step": 35379 + }, + { + "epoch": 0.69, + "learning_rate": 6.280144460409305e-08, + "loss": 0.0006, + "step": 35380 + }, + { + "epoch": 0.69, + "learning_rate": 6.279756125975691e-08, + "loss": 0.0008, + "step": 35381 + }, + { + "epoch": 0.69, + "learning_rate": 6.279367791542077e-08, + "loss": 0.0008, + "step": 35382 + }, + { + "epoch": 0.69, + "learning_rate": 6.278979457108462e-08, + "loss": 0.001, + "step": 35383 + }, + { + "epoch": 0.69, + "learning_rate": 6.278591122674848e-08, + "loss": 0.0008, + "step": 35384 + }, + { + "epoch": 0.69, + "learning_rate": 6.278202788241234e-08, + "loss": 0.0007, + "step": 35385 + }, + { + "epoch": 0.69, + "learning_rate": 6.277814453807619e-08, + "loss": 0.0004, + "step": 35386 + }, + { + "epoch": 0.69, + "learning_rate": 6.277426119374004e-08, + "loss": 0.0004, + "step": 35387 + }, + { + "epoch": 0.69, + "learning_rate": 6.27703778494039e-08, + "loss": 0.0003, + "step": 35388 + }, + { + "epoch": 0.69, + "learning_rate": 6.276649450506776e-08, + "loss": 0.0006, + "step": 35389 + }, + { + "epoch": 0.69, + "learning_rate": 6.276261116073162e-08, + "loss": 1.5168, + "step": 35390 + }, + { + "epoch": 0.69, + "learning_rate": 6.275872781639548e-08, + "loss": 0.0003, + "step": 35391 + }, + { + "epoch": 0.69, + "learning_rate": 6.275484447205933e-08, + "loss": 0.0098, + "step": 35392 + }, + { + "epoch": 0.69, + "learning_rate": 6.275096112772319e-08, + "loss": 0.0005, + "step": 35393 + }, + { + "epoch": 0.69, + "learning_rate": 6.274707778338705e-08, + "loss": 0.0005, + "step": 35394 + }, + { + "epoch": 0.69, + "learning_rate": 6.274319443905091e-08, + "loss": 0.0004, + "step": 35395 + }, + { + "epoch": 0.69, + "learning_rate": 6.273931109471477e-08, + "loss": 0.0004, + "step": 35396 + }, + { + "epoch": 0.69, + "learning_rate": 6.273542775037863e-08, + "loss": 0.0008, + "step": 35397 + }, + { + "epoch": 0.69, + "learning_rate": 6.273154440604248e-08, + "loss": 0.0004, + "step": 35398 + }, + { + "epoch": 0.69, + "learning_rate": 6.272766106170634e-08, + "loss": 0.0005, + "step": 35399 + }, + { + "epoch": 0.69, + "learning_rate": 6.27237777173702e-08, + "loss": 0.0009, + "step": 35400 + }, + { + "epoch": 0.69, + "learning_rate": 6.271989437303406e-08, + "loss": 0.0007, + "step": 35401 + }, + { + "epoch": 0.69, + "learning_rate": 6.271601102869792e-08, + "loss": 0.0004, + "step": 35402 + }, + { + "epoch": 0.69, + "learning_rate": 6.271212768436178e-08, + "loss": 0.0801, + "step": 35403 + }, + { + "epoch": 0.69, + "learning_rate": 6.270824434002563e-08, + "loss": 0.0007, + "step": 35404 + }, + { + "epoch": 0.69, + "learning_rate": 6.270436099568949e-08, + "loss": 0.0004, + "step": 35405 + }, + { + "epoch": 0.69, + "learning_rate": 6.270047765135335e-08, + "loss": 0.0004, + "step": 35406 + }, + { + "epoch": 0.69, + "learning_rate": 6.269659430701721e-08, + "loss": 0.0006, + "step": 35407 + }, + { + "epoch": 0.69, + "learning_rate": 6.269271096268107e-08, + "loss": 0.0005, + "step": 35408 + }, + { + "epoch": 0.69, + "learning_rate": 6.268882761834492e-08, + "loss": 0.0005, + "step": 35409 + }, + { + "epoch": 0.69, + "learning_rate": 6.268494427400878e-08, + "loss": 0.0003, + "step": 35410 + }, + { + "epoch": 0.69, + "learning_rate": 6.268106092967264e-08, + "loss": 0.0005, + "step": 35411 + }, + { + "epoch": 0.69, + "learning_rate": 6.26771775853365e-08, + "loss": 0.0185, + "step": 35412 + }, + { + "epoch": 0.69, + "learning_rate": 6.267329424100036e-08, + "loss": 0.0005, + "step": 35413 + }, + { + "epoch": 0.69, + "learning_rate": 6.266941089666422e-08, + "loss": 0.0005, + "step": 35414 + }, + { + "epoch": 0.69, + "learning_rate": 6.266552755232806e-08, + "loss": 0.0004, + "step": 35415 + }, + { + "epoch": 0.69, + "learning_rate": 6.266164420799192e-08, + "loss": 0.0004, + "step": 35416 + }, + { + "epoch": 0.69, + "learning_rate": 6.265776086365578e-08, + "loss": 0.0004, + "step": 35417 + }, + { + "epoch": 0.69, + "learning_rate": 6.265387751931964e-08, + "loss": 0.0006, + "step": 35418 + }, + { + "epoch": 0.69, + "learning_rate": 6.26499941749835e-08, + "loss": 0.0008, + "step": 35419 + }, + { + "epoch": 0.69, + "learning_rate": 6.264611083064735e-08, + "loss": 0.0003, + "step": 35420 + }, + { + "epoch": 0.69, + "learning_rate": 6.264222748631121e-08, + "loss": 0.0005, + "step": 35421 + }, + { + "epoch": 0.69, + "learning_rate": 6.263834414197507e-08, + "loss": 0.0005, + "step": 35422 + }, + { + "epoch": 0.69, + "learning_rate": 6.263446079763893e-08, + "loss": 0.0003, + "step": 35423 + }, + { + "epoch": 0.69, + "learning_rate": 6.263057745330279e-08, + "loss": 0.0049, + "step": 35424 + }, + { + "epoch": 0.69, + "learning_rate": 6.262669410896664e-08, + "loss": 0.0013, + "step": 35425 + }, + { + "epoch": 0.69, + "learning_rate": 6.26228107646305e-08, + "loss": 0.0006, + "step": 35426 + }, + { + "epoch": 0.69, + "learning_rate": 6.261892742029436e-08, + "loss": 0.0004, + "step": 35427 + }, + { + "epoch": 0.69, + "learning_rate": 6.261504407595822e-08, + "loss": 0.0006, + "step": 35428 + }, + { + "epoch": 0.69, + "learning_rate": 6.261116073162208e-08, + "loss": 0.0006, + "step": 35429 + }, + { + "epoch": 0.69, + "learning_rate": 6.260727738728593e-08, + "loss": 0.0004, + "step": 35430 + }, + { + "epoch": 0.69, + "learning_rate": 6.260339404294979e-08, + "loss": 0.0003, + "step": 35431 + }, + { + "epoch": 0.69, + "learning_rate": 6.259951069861364e-08, + "loss": 0.0004, + "step": 35432 + }, + { + "epoch": 0.69, + "learning_rate": 6.25956273542775e-08, + "loss": 0.0011, + "step": 35433 + }, + { + "epoch": 0.69, + "learning_rate": 6.259174400994135e-08, + "loss": 0.0005, + "step": 35434 + }, + { + "epoch": 0.69, + "learning_rate": 6.258786066560521e-08, + "loss": 0.0006, + "step": 35435 + }, + { + "epoch": 0.69, + "learning_rate": 6.258397732126907e-08, + "loss": 0.0003, + "step": 35436 + }, + { + "epoch": 0.69, + "learning_rate": 6.258009397693293e-08, + "loss": 0.0005, + "step": 35437 + }, + { + "epoch": 0.69, + "learning_rate": 6.257621063259679e-08, + "loss": 0.0028, + "step": 35438 + }, + { + "epoch": 0.69, + "learning_rate": 6.257232728826065e-08, + "loss": 0.0004, + "step": 35439 + }, + { + "epoch": 0.69, + "learning_rate": 6.25684439439245e-08, + "loss": 0.0005, + "step": 35440 + }, + { + "epoch": 0.69, + "learning_rate": 6.256456059958836e-08, + "loss": 0.0006, + "step": 35441 + }, + { + "epoch": 0.69, + "learning_rate": 6.256067725525222e-08, + "loss": 0.0005, + "step": 35442 + }, + { + "epoch": 0.69, + "learning_rate": 6.255679391091608e-08, + "loss": 0.0004, + "step": 35443 + }, + { + "epoch": 0.69, + "learning_rate": 6.255291056657994e-08, + "loss": 0.0005, + "step": 35444 + }, + { + "epoch": 0.69, + "learning_rate": 6.25490272222438e-08, + "loss": 0.0007, + "step": 35445 + }, + { + "epoch": 0.69, + "learning_rate": 6.254514387790765e-08, + "loss": 0.0006, + "step": 35446 + }, + { + "epoch": 0.69, + "learning_rate": 6.25412605335715e-08, + "loss": 0.0057, + "step": 35447 + }, + { + "epoch": 0.69, + "learning_rate": 6.253737718923536e-08, + "loss": 0.0005, + "step": 35448 + }, + { + "epoch": 0.69, + "learning_rate": 6.253349384489921e-08, + "loss": 0.0005, + "step": 35449 + }, + { + "epoch": 0.69, + "learning_rate": 6.252961050056307e-08, + "loss": 0.0004, + "step": 35450 + }, + { + "epoch": 0.69, + "learning_rate": 6.252572715622693e-08, + "loss": 0.0004, + "step": 35451 + }, + { + "epoch": 0.69, + "learning_rate": 6.252184381189079e-08, + "loss": 0.0424, + "step": 35452 + }, + { + "epoch": 0.69, + "learning_rate": 6.251796046755465e-08, + "loss": 0.0005, + "step": 35453 + }, + { + "epoch": 0.69, + "learning_rate": 6.25140771232185e-08, + "loss": 0.0004, + "step": 35454 + }, + { + "epoch": 0.69, + "learning_rate": 6.251019377888236e-08, + "loss": 0.0004, + "step": 35455 + }, + { + "epoch": 0.69, + "learning_rate": 6.250631043454622e-08, + "loss": 0.0005, + "step": 35456 + }, + { + "epoch": 0.69, + "learning_rate": 6.250242709021008e-08, + "loss": 0.0197, + "step": 35457 + }, + { + "epoch": 0.69, + "learning_rate": 6.249854374587394e-08, + "loss": 0.0005, + "step": 35458 + }, + { + "epoch": 0.69, + "learning_rate": 6.24946604015378e-08, + "loss": 0.0004, + "step": 35459 + }, + { + "epoch": 0.69, + "learning_rate": 6.249077705720166e-08, + "loss": 0.0004, + "step": 35460 + }, + { + "epoch": 0.69, + "learning_rate": 6.248689371286551e-08, + "loss": 0.0003, + "step": 35461 + }, + { + "epoch": 0.69, + "learning_rate": 6.248301036852937e-08, + "loss": 0.0004, + "step": 35462 + }, + { + "epoch": 0.69, + "learning_rate": 6.247912702419323e-08, + "loss": 0.108, + "step": 35463 + }, + { + "epoch": 0.69, + "learning_rate": 6.247524367985709e-08, + "loss": 0.0007, + "step": 35464 + }, + { + "epoch": 0.69, + "learning_rate": 6.247136033552095e-08, + "loss": 0.0007, + "step": 35465 + }, + { + "epoch": 0.69, + "learning_rate": 6.24674769911848e-08, + "loss": 0.0005, + "step": 35466 + }, + { + "epoch": 0.69, + "learning_rate": 6.246359364684866e-08, + "loss": 1.0355, + "step": 35467 + }, + { + "epoch": 0.69, + "learning_rate": 6.245971030251252e-08, + "loss": 0.0005, + "step": 35468 + }, + { + "epoch": 0.69, + "learning_rate": 6.245582695817638e-08, + "loss": 0.0005, + "step": 35469 + }, + { + "epoch": 0.69, + "learning_rate": 6.245194361384024e-08, + "loss": 0.0005, + "step": 35470 + }, + { + "epoch": 0.69, + "learning_rate": 6.24480602695041e-08, + "loss": 0.0008, + "step": 35471 + }, + { + "epoch": 0.69, + "learning_rate": 6.244417692516795e-08, + "loss": 0.0004, + "step": 35472 + }, + { + "epoch": 0.69, + "learning_rate": 6.24402935808318e-08, + "loss": 0.0005, + "step": 35473 + }, + { + "epoch": 0.69, + "learning_rate": 6.243641023649566e-08, + "loss": 0.0011, + "step": 35474 + }, + { + "epoch": 0.69, + "learning_rate": 6.243252689215952e-08, + "loss": 0.0005, + "step": 35475 + }, + { + "epoch": 0.69, + "learning_rate": 6.242864354782337e-08, + "loss": 0.0005, + "step": 35476 + }, + { + "epoch": 0.69, + "learning_rate": 6.242476020348723e-08, + "loss": 0.8001, + "step": 35477 + }, + { + "epoch": 0.69, + "learning_rate": 6.242087685915109e-08, + "loss": 0.0011, + "step": 35478 + }, + { + "epoch": 0.69, + "learning_rate": 6.241699351481495e-08, + "loss": 0.0007, + "step": 35479 + }, + { + "epoch": 0.69, + "learning_rate": 6.241311017047881e-08, + "loss": 0.0008, + "step": 35480 + }, + { + "epoch": 0.69, + "learning_rate": 6.240922682614267e-08, + "loss": 0.0005, + "step": 35481 + }, + { + "epoch": 0.69, + "learning_rate": 6.240534348180652e-08, + "loss": 0.0003, + "step": 35482 + }, + { + "epoch": 0.69, + "learning_rate": 6.240146013747038e-08, + "loss": 0.0003, + "step": 35483 + }, + { + "epoch": 0.69, + "learning_rate": 6.239757679313424e-08, + "loss": 0.0004, + "step": 35484 + }, + { + "epoch": 0.69, + "learning_rate": 6.23936934487981e-08, + "loss": 0.0005, + "step": 35485 + }, + { + "epoch": 0.69, + "learning_rate": 6.238981010446196e-08, + "loss": 0.0004, + "step": 35486 + }, + { + "epoch": 0.69, + "learning_rate": 6.238592676012581e-08, + "loss": 0.0006, + "step": 35487 + }, + { + "epoch": 0.69, + "learning_rate": 6.238204341578967e-08, + "loss": 0.0005, + "step": 35488 + }, + { + "epoch": 0.69, + "learning_rate": 6.237816007145353e-08, + "loss": 0.0005, + "step": 35489 + }, + { + "epoch": 0.69, + "learning_rate": 6.237427672711739e-08, + "loss": 0.0004, + "step": 35490 + }, + { + "epoch": 0.69, + "learning_rate": 6.237039338278125e-08, + "loss": 0.6696, + "step": 35491 + }, + { + "epoch": 0.69, + "learning_rate": 6.23665100384451e-08, + "loss": 0.0005, + "step": 35492 + }, + { + "epoch": 0.69, + "learning_rate": 6.236262669410896e-08, + "loss": 0.0004, + "step": 35493 + }, + { + "epoch": 0.69, + "learning_rate": 6.235874334977282e-08, + "loss": 0.0005, + "step": 35494 + }, + { + "epoch": 0.69, + "learning_rate": 6.235486000543668e-08, + "loss": 0.0008, + "step": 35495 + }, + { + "epoch": 0.69, + "learning_rate": 6.235097666110054e-08, + "loss": 0.0005, + "step": 35496 + }, + { + "epoch": 0.69, + "learning_rate": 6.23470933167644e-08, + "loss": 0.0005, + "step": 35497 + }, + { + "epoch": 0.69, + "learning_rate": 6.234320997242826e-08, + "loss": 0.0004, + "step": 35498 + }, + { + "epoch": 0.69, + "learning_rate": 6.233932662809211e-08, + "loss": 0.0159, + "step": 35499 + }, + { + "epoch": 0.69, + "learning_rate": 6.233544328375597e-08, + "loss": 0.0004, + "step": 35500 + }, + { + "epoch": 0.69, + "learning_rate": 6.233155993941983e-08, + "loss": 0.0024, + "step": 35501 + }, + { + "epoch": 0.69, + "learning_rate": 6.232767659508368e-08, + "loss": 0.8483, + "step": 35502 + }, + { + "epoch": 0.69, + "learning_rate": 6.232379325074753e-08, + "loss": 0.6188, + "step": 35503 + }, + { + "epoch": 0.69, + "learning_rate": 6.231990990641139e-08, + "loss": 1.4885, + "step": 35504 + }, + { + "epoch": 0.69, + "learning_rate": 6.231602656207525e-08, + "loss": 0.0005, + "step": 35505 + }, + { + "epoch": 0.69, + "learning_rate": 6.231214321773911e-08, + "loss": 0.0457, + "step": 35506 + }, + { + "epoch": 0.69, + "learning_rate": 6.230825987340297e-08, + "loss": 0.0003, + "step": 35507 + }, + { + "epoch": 0.69, + "learning_rate": 6.230437652906682e-08, + "loss": 0.0004, + "step": 35508 + }, + { + "epoch": 0.69, + "learning_rate": 6.230049318473068e-08, + "loss": 0.0005, + "step": 35509 + }, + { + "epoch": 0.69, + "learning_rate": 6.229660984039454e-08, + "loss": 0.8768, + "step": 35510 + }, + { + "epoch": 0.69, + "learning_rate": 6.22927264960584e-08, + "loss": 0.0005, + "step": 35511 + }, + { + "epoch": 0.69, + "learning_rate": 6.228884315172226e-08, + "loss": 0.0003, + "step": 35512 + }, + { + "epoch": 0.69, + "learning_rate": 6.228495980738612e-08, + "loss": 0.0004, + "step": 35513 + }, + { + "epoch": 0.69, + "learning_rate": 6.228107646304997e-08, + "loss": 0.0004, + "step": 35514 + }, + { + "epoch": 0.69, + "learning_rate": 6.227719311871383e-08, + "loss": 0.0003, + "step": 35515 + }, + { + "epoch": 0.69, + "learning_rate": 6.227330977437769e-08, + "loss": 0.0003, + "step": 35516 + }, + { + "epoch": 0.69, + "learning_rate": 6.226942643004155e-08, + "loss": 0.0004, + "step": 35517 + }, + { + "epoch": 0.69, + "learning_rate": 6.226554308570541e-08, + "loss": 0.0005, + "step": 35518 + }, + { + "epoch": 0.69, + "learning_rate": 6.226165974136927e-08, + "loss": 0.0003, + "step": 35519 + }, + { + "epoch": 0.69, + "learning_rate": 6.225777639703312e-08, + "loss": 0.0003, + "step": 35520 + }, + { + "epoch": 0.69, + "learning_rate": 6.225389305269698e-08, + "loss": 0.0005, + "step": 35521 + }, + { + "epoch": 0.69, + "learning_rate": 6.225000970836084e-08, + "loss": 0.0012, + "step": 35522 + }, + { + "epoch": 0.69, + "learning_rate": 6.22461263640247e-08, + "loss": 0.0075, + "step": 35523 + }, + { + "epoch": 0.69, + "learning_rate": 6.224224301968856e-08, + "loss": 0.0005, + "step": 35524 + }, + { + "epoch": 0.69, + "learning_rate": 6.223835967535241e-08, + "loss": 0.0006, + "step": 35525 + }, + { + "epoch": 0.69, + "learning_rate": 6.223447633101627e-08, + "loss": 0.0005, + "step": 35526 + }, + { + "epoch": 0.69, + "learning_rate": 6.223059298668013e-08, + "loss": 0.0004, + "step": 35527 + }, + { + "epoch": 0.69, + "learning_rate": 6.222670964234399e-08, + "loss": 0.0004, + "step": 35528 + }, + { + "epoch": 0.69, + "learning_rate": 6.222282629800785e-08, + "loss": 0.0003, + "step": 35529 + }, + { + "epoch": 0.69, + "learning_rate": 6.22189429536717e-08, + "loss": 0.0004, + "step": 35530 + }, + { + "epoch": 0.69, + "learning_rate": 6.221505960933555e-08, + "loss": 0.0005, + "step": 35531 + }, + { + "epoch": 0.69, + "learning_rate": 6.221117626499941e-08, + "loss": 0.0004, + "step": 35532 + }, + { + "epoch": 0.69, + "learning_rate": 6.220729292066327e-08, + "loss": 0.0005, + "step": 35533 + }, + { + "epoch": 0.69, + "learning_rate": 6.220340957632713e-08, + "loss": 0.0006, + "step": 35534 + }, + { + "epoch": 0.69, + "learning_rate": 6.219952623199098e-08, + "loss": 0.0003, + "step": 35535 + }, + { + "epoch": 0.69, + "learning_rate": 6.219564288765484e-08, + "loss": 0.0003, + "step": 35536 + }, + { + "epoch": 0.69, + "learning_rate": 6.21917595433187e-08, + "loss": 0.0006, + "step": 35537 + }, + { + "epoch": 0.69, + "learning_rate": 6.218787619898256e-08, + "loss": 0.0005, + "step": 35538 + }, + { + "epoch": 0.69, + "learning_rate": 6.218399285464642e-08, + "loss": 0.0007, + "step": 35539 + }, + { + "epoch": 0.69, + "learning_rate": 6.218010951031028e-08, + "loss": 0.0216, + "step": 35540 + }, + { + "epoch": 0.69, + "learning_rate": 6.217622616597413e-08, + "loss": 0.0004, + "step": 35541 + }, + { + "epoch": 0.69, + "learning_rate": 6.217234282163799e-08, + "loss": 0.0709, + "step": 35542 + }, + { + "epoch": 0.69, + "learning_rate": 6.216845947730185e-08, + "loss": 0.0005, + "step": 35543 + }, + { + "epoch": 0.69, + "learning_rate": 6.216457613296571e-08, + "loss": 0.0004, + "step": 35544 + }, + { + "epoch": 0.69, + "learning_rate": 6.216069278862957e-08, + "loss": 0.001, + "step": 35545 + }, + { + "epoch": 0.69, + "learning_rate": 6.215680944429342e-08, + "loss": 0.0007, + "step": 35546 + }, + { + "epoch": 0.69, + "learning_rate": 6.215292609995728e-08, + "loss": 0.0007, + "step": 35547 + }, + { + "epoch": 0.69, + "learning_rate": 6.214904275562114e-08, + "loss": 0.2576, + "step": 35548 + }, + { + "epoch": 0.69, + "learning_rate": 6.2145159411285e-08, + "loss": 0.0007, + "step": 35549 + }, + { + "epoch": 0.69, + "learning_rate": 6.214127606694886e-08, + "loss": 0.0002, + "step": 35550 + }, + { + "epoch": 0.69, + "learning_rate": 6.213739272261272e-08, + "loss": 0.0003, + "step": 35551 + }, + { + "epoch": 0.69, + "learning_rate": 6.213350937827657e-08, + "loss": 0.0008, + "step": 35552 + }, + { + "epoch": 0.69, + "learning_rate": 6.212962603394043e-08, + "loss": 0.0006, + "step": 35553 + }, + { + "epoch": 0.69, + "learning_rate": 6.212574268960429e-08, + "loss": 0.0005, + "step": 35554 + }, + { + "epoch": 0.69, + "learning_rate": 6.212185934526815e-08, + "loss": 0.0004, + "step": 35555 + }, + { + "epoch": 0.69, + "learning_rate": 6.211797600093201e-08, + "loss": 0.0003, + "step": 35556 + }, + { + "epoch": 0.69, + "learning_rate": 6.211409265659587e-08, + "loss": 0.0016, + "step": 35557 + }, + { + "epoch": 0.69, + "learning_rate": 6.211020931225972e-08, + "loss": 0.0008, + "step": 35558 + }, + { + "epoch": 0.69, + "learning_rate": 6.210632596792358e-08, + "loss": 0.0104, + "step": 35559 + }, + { + "epoch": 0.69, + "learning_rate": 6.210244262358743e-08, + "loss": 0.0059, + "step": 35560 + }, + { + "epoch": 0.69, + "learning_rate": 6.209855927925129e-08, + "loss": 0.0003, + "step": 35561 + }, + { + "epoch": 0.69, + "learning_rate": 6.209467593491514e-08, + "loss": 0.0004, + "step": 35562 + }, + { + "epoch": 0.69, + "learning_rate": 6.2090792590579e-08, + "loss": 0.8907, + "step": 35563 + }, + { + "epoch": 0.69, + "learning_rate": 6.208690924624286e-08, + "loss": 0.0005, + "step": 35564 + }, + { + "epoch": 0.69, + "learning_rate": 6.208302590190672e-08, + "loss": 0.0004, + "step": 35565 + }, + { + "epoch": 0.69, + "learning_rate": 6.207914255757058e-08, + "loss": 0.0005, + "step": 35566 + }, + { + "epoch": 0.69, + "learning_rate": 6.207525921323443e-08, + "loss": 0.0005, + "step": 35567 + }, + { + "epoch": 0.69, + "learning_rate": 6.207137586889829e-08, + "loss": 0.0004, + "step": 35568 + }, + { + "epoch": 0.69, + "learning_rate": 6.206749252456215e-08, + "loss": 0.0004, + "step": 35569 + }, + { + "epoch": 0.69, + "learning_rate": 6.206360918022601e-08, + "loss": 0.0004, + "step": 35570 + }, + { + "epoch": 0.69, + "learning_rate": 6.205972583588987e-08, + "loss": 0.0006, + "step": 35571 + }, + { + "epoch": 0.69, + "learning_rate": 6.205584249155373e-08, + "loss": 0.0006, + "step": 35572 + }, + { + "epoch": 0.69, + "learning_rate": 6.205195914721758e-08, + "loss": 0.0004, + "step": 35573 + }, + { + "epoch": 0.69, + "learning_rate": 6.204807580288144e-08, + "loss": 0.0005, + "step": 35574 + }, + { + "epoch": 0.69, + "learning_rate": 6.20441924585453e-08, + "loss": 0.0005, + "step": 35575 + }, + { + "epoch": 0.69, + "learning_rate": 6.204030911420916e-08, + "loss": 0.0005, + "step": 35576 + }, + { + "epoch": 0.69, + "learning_rate": 6.203642576987302e-08, + "loss": 0.0007, + "step": 35577 + }, + { + "epoch": 0.69, + "learning_rate": 6.203254242553688e-08, + "loss": 0.6125, + "step": 35578 + }, + { + "epoch": 0.69, + "learning_rate": 6.202865908120073e-08, + "loss": 0.0005, + "step": 35579 + }, + { + "epoch": 0.69, + "learning_rate": 6.202477573686459e-08, + "loss": 0.5477, + "step": 35580 + }, + { + "epoch": 0.69, + "learning_rate": 6.202089239252845e-08, + "loss": 0.0005, + "step": 35581 + }, + { + "epoch": 0.69, + "learning_rate": 6.201700904819231e-08, + "loss": 0.0004, + "step": 35582 + }, + { + "epoch": 0.69, + "learning_rate": 6.201312570385617e-08, + "loss": 0.0067, + "step": 35583 + }, + { + "epoch": 0.69, + "learning_rate": 6.200924235952002e-08, + "loss": 0.001, + "step": 35584 + }, + { + "epoch": 0.69, + "learning_rate": 6.200535901518388e-08, + "loss": 0.0003, + "step": 35585 + }, + { + "epoch": 0.69, + "learning_rate": 6.200147567084774e-08, + "loss": 0.0003, + "step": 35586 + }, + { + "epoch": 0.69, + "learning_rate": 6.19975923265116e-08, + "loss": 0.0004, + "step": 35587 + }, + { + "epoch": 0.69, + "learning_rate": 6.199370898217546e-08, + "loss": 0.0141, + "step": 35588 + }, + { + "epoch": 0.69, + "learning_rate": 6.19898256378393e-08, + "loss": 0.0004, + "step": 35589 + }, + { + "epoch": 0.69, + "learning_rate": 6.198594229350316e-08, + "loss": 0.0341, + "step": 35590 + }, + { + "epoch": 0.69, + "learning_rate": 6.198205894916702e-08, + "loss": 0.001, + "step": 35591 + }, + { + "epoch": 0.69, + "learning_rate": 6.197817560483088e-08, + "loss": 0.0005, + "step": 35592 + }, + { + "epoch": 0.69, + "learning_rate": 6.197429226049474e-08, + "loss": 0.0003, + "step": 35593 + }, + { + "epoch": 0.69, + "learning_rate": 6.19704089161586e-08, + "loss": 0.0005, + "step": 35594 + }, + { + "epoch": 0.69, + "learning_rate": 6.196652557182245e-08, + "loss": 0.0005, + "step": 35595 + }, + { + "epoch": 0.69, + "learning_rate": 6.196264222748631e-08, + "loss": 0.0003, + "step": 35596 + }, + { + "epoch": 0.69, + "learning_rate": 6.195875888315017e-08, + "loss": 0.0006, + "step": 35597 + }, + { + "epoch": 0.69, + "learning_rate": 6.195487553881403e-08, + "loss": 0.0005, + "step": 35598 + }, + { + "epoch": 0.69, + "learning_rate": 6.195099219447789e-08, + "loss": 0.0011, + "step": 35599 + }, + { + "epoch": 0.69, + "learning_rate": 6.194710885014174e-08, + "loss": 0.0003, + "step": 35600 + }, + { + "epoch": 0.69, + "learning_rate": 6.19432255058056e-08, + "loss": 0.1081, + "step": 35601 + }, + { + "epoch": 0.69, + "learning_rate": 6.193934216146946e-08, + "loss": 0.0014, + "step": 35602 + }, + { + "epoch": 0.69, + "learning_rate": 6.193545881713332e-08, + "loss": 0.0004, + "step": 35603 + }, + { + "epoch": 0.69, + "learning_rate": 6.193157547279718e-08, + "loss": 0.0004, + "step": 35604 + }, + { + "epoch": 0.69, + "learning_rate": 6.192769212846103e-08, + "loss": 0.0003, + "step": 35605 + }, + { + "epoch": 0.69, + "learning_rate": 6.192380878412489e-08, + "loss": 0.0003, + "step": 35606 + }, + { + "epoch": 0.69, + "learning_rate": 6.191992543978875e-08, + "loss": 0.0005, + "step": 35607 + }, + { + "epoch": 0.69, + "learning_rate": 6.191604209545261e-08, + "loss": 0.8245, + "step": 35608 + }, + { + "epoch": 0.69, + "learning_rate": 6.191215875111645e-08, + "loss": 0.0004, + "step": 35609 + }, + { + "epoch": 0.69, + "learning_rate": 6.190827540678031e-08, + "loss": 0.0009, + "step": 35610 + }, + { + "epoch": 0.69, + "learning_rate": 6.190439206244417e-08, + "loss": 0.0005, + "step": 35611 + }, + { + "epoch": 0.69, + "learning_rate": 6.190050871810803e-08, + "loss": 0.017, + "step": 35612 + }, + { + "epoch": 0.69, + "learning_rate": 6.189662537377189e-08, + "loss": 0.0045, + "step": 35613 + }, + { + "epoch": 0.69, + "learning_rate": 6.189274202943575e-08, + "loss": 0.0003, + "step": 35614 + }, + { + "epoch": 0.69, + "learning_rate": 6.18888586850996e-08, + "loss": 0.0004, + "step": 35615 + }, + { + "epoch": 0.69, + "learning_rate": 6.188497534076346e-08, + "loss": 0.0005, + "step": 35616 + }, + { + "epoch": 0.69, + "learning_rate": 6.188109199642732e-08, + "loss": 0.027, + "step": 35617 + }, + { + "epoch": 0.69, + "learning_rate": 6.187720865209118e-08, + "loss": 0.5475, + "step": 35618 + }, + { + "epoch": 0.69, + "learning_rate": 6.187332530775504e-08, + "loss": 0.0007, + "step": 35619 + }, + { + "epoch": 0.69, + "learning_rate": 6.18694419634189e-08, + "loss": 0.001, + "step": 35620 + }, + { + "epoch": 0.69, + "learning_rate": 6.186555861908275e-08, + "loss": 0.0005, + "step": 35621 + }, + { + "epoch": 0.69, + "learning_rate": 6.186167527474661e-08, + "loss": 0.1819, + "step": 35622 + }, + { + "epoch": 0.69, + "learning_rate": 6.185779193041047e-08, + "loss": 0.0007, + "step": 35623 + }, + { + "epoch": 0.69, + "learning_rate": 6.185390858607431e-08, + "loss": 0.0004, + "step": 35624 + }, + { + "epoch": 0.69, + "learning_rate": 6.185002524173817e-08, + "loss": 0.0006, + "step": 35625 + }, + { + "epoch": 0.69, + "learning_rate": 6.184614189740203e-08, + "loss": 0.0004, + "step": 35626 + }, + { + "epoch": 0.69, + "learning_rate": 6.184225855306589e-08, + "loss": 0.0005, + "step": 35627 + }, + { + "epoch": 0.69, + "learning_rate": 6.183837520872975e-08, + "loss": 0.0004, + "step": 35628 + }, + { + "epoch": 0.69, + "learning_rate": 6.18344918643936e-08, + "loss": 0.0007, + "step": 35629 + }, + { + "epoch": 0.69, + "learning_rate": 6.183060852005746e-08, + "loss": 0.2847, + "step": 35630 + }, + { + "epoch": 0.69, + "learning_rate": 6.182672517572132e-08, + "loss": 0.0003, + "step": 35631 + }, + { + "epoch": 0.69, + "learning_rate": 6.182284183138518e-08, + "loss": 0.0005, + "step": 35632 + }, + { + "epoch": 0.69, + "learning_rate": 6.181895848704904e-08, + "loss": 0.294, + "step": 35633 + }, + { + "epoch": 0.69, + "learning_rate": 6.18150751427129e-08, + "loss": 0.0005, + "step": 35634 + }, + { + "epoch": 0.69, + "learning_rate": 6.181119179837676e-08, + "loss": 0.0013, + "step": 35635 + }, + { + "epoch": 0.69, + "learning_rate": 6.180730845404061e-08, + "loss": 0.0004, + "step": 35636 + }, + { + "epoch": 0.69, + "learning_rate": 6.180342510970447e-08, + "loss": 0.0003, + "step": 35637 + }, + { + "epoch": 0.69, + "learning_rate": 6.179954176536833e-08, + "loss": 0.0007, + "step": 35638 + }, + { + "epoch": 0.69, + "learning_rate": 6.179565842103219e-08, + "loss": 0.0004, + "step": 35639 + }, + { + "epoch": 0.69, + "learning_rate": 6.179177507669605e-08, + "loss": 0.9725, + "step": 35640 + }, + { + "epoch": 0.69, + "learning_rate": 6.17878917323599e-08, + "loss": 0.0005, + "step": 35641 + }, + { + "epoch": 0.69, + "learning_rate": 6.178400838802376e-08, + "loss": 0.0004, + "step": 35642 + }, + { + "epoch": 0.69, + "learning_rate": 6.178012504368762e-08, + "loss": 0.0052, + "step": 35643 + }, + { + "epoch": 0.69, + "learning_rate": 6.177624169935148e-08, + "loss": 0.0012, + "step": 35644 + }, + { + "epoch": 0.69, + "learning_rate": 6.177235835501534e-08, + "loss": 0.0008, + "step": 35645 + }, + { + "epoch": 0.69, + "learning_rate": 6.17684750106792e-08, + "loss": 0.3479, + "step": 35646 + }, + { + "epoch": 0.69, + "learning_rate": 6.176459166634304e-08, + "loss": 0.0005, + "step": 35647 + }, + { + "epoch": 0.69, + "learning_rate": 6.17607083220069e-08, + "loss": 0.0005, + "step": 35648 + }, + { + "epoch": 0.69, + "learning_rate": 6.175682497767076e-08, + "loss": 0.0003, + "step": 35649 + }, + { + "epoch": 0.69, + "learning_rate": 6.175294163333462e-08, + "loss": 0.0004, + "step": 35650 + }, + { + "epoch": 0.69, + "learning_rate": 6.174905828899847e-08, + "loss": 0.0006, + "step": 35651 + }, + { + "epoch": 0.69, + "learning_rate": 6.174517494466233e-08, + "loss": 0.0005, + "step": 35652 + }, + { + "epoch": 0.69, + "learning_rate": 6.174129160032619e-08, + "loss": 0.0004, + "step": 35653 + }, + { + "epoch": 0.69, + "learning_rate": 6.173740825599005e-08, + "loss": 0.0003, + "step": 35654 + }, + { + "epoch": 0.69, + "learning_rate": 6.173352491165391e-08, + "loss": 0.0009, + "step": 35655 + }, + { + "epoch": 0.69, + "learning_rate": 6.172964156731777e-08, + "loss": 0.0007, + "step": 35656 + }, + { + "epoch": 0.69, + "learning_rate": 6.172575822298162e-08, + "loss": 0.0003, + "step": 35657 + }, + { + "epoch": 0.69, + "learning_rate": 6.172187487864548e-08, + "loss": 0.0005, + "step": 35658 + }, + { + "epoch": 0.69, + "learning_rate": 6.171799153430934e-08, + "loss": 0.0007, + "step": 35659 + }, + { + "epoch": 0.69, + "learning_rate": 6.17141081899732e-08, + "loss": 0.8071, + "step": 35660 + }, + { + "epoch": 0.69, + "learning_rate": 6.171022484563706e-08, + "loss": 0.0003, + "step": 35661 + }, + { + "epoch": 0.69, + "learning_rate": 6.170634150130092e-08, + "loss": 0.0004, + "step": 35662 + }, + { + "epoch": 0.69, + "learning_rate": 6.170245815696477e-08, + "loss": 0.0009, + "step": 35663 + }, + { + "epoch": 0.69, + "learning_rate": 6.169857481262863e-08, + "loss": 0.0004, + "step": 35664 + }, + { + "epoch": 0.69, + "learning_rate": 6.169469146829249e-08, + "loss": 0.0004, + "step": 35665 + }, + { + "epoch": 0.69, + "learning_rate": 6.169080812395635e-08, + "loss": 0.0005, + "step": 35666 + }, + { + "epoch": 0.69, + "learning_rate": 6.16869247796202e-08, + "loss": 0.0004, + "step": 35667 + }, + { + "epoch": 0.69, + "learning_rate": 6.168304143528406e-08, + "loss": 0.0995, + "step": 35668 + }, + { + "epoch": 0.69, + "learning_rate": 6.167915809094792e-08, + "loss": 0.0004, + "step": 35669 + }, + { + "epoch": 0.69, + "learning_rate": 6.167527474661178e-08, + "loss": 0.0005, + "step": 35670 + }, + { + "epoch": 0.69, + "learning_rate": 6.167139140227564e-08, + "loss": 0.4452, + "step": 35671 + }, + { + "epoch": 0.69, + "learning_rate": 6.16675080579395e-08, + "loss": 0.0007, + "step": 35672 + }, + { + "epoch": 0.69, + "learning_rate": 6.166362471360336e-08, + "loss": 0.0004, + "step": 35673 + }, + { + "epoch": 0.69, + "learning_rate": 6.165974136926721e-08, + "loss": 0.0008, + "step": 35674 + }, + { + "epoch": 0.69, + "learning_rate": 6.165585802493107e-08, + "loss": 0.0003, + "step": 35675 + }, + { + "epoch": 0.69, + "learning_rate": 6.165197468059492e-08, + "loss": 0.0005, + "step": 35676 + }, + { + "epoch": 0.69, + "learning_rate": 6.164809133625878e-08, + "loss": 0.0006, + "step": 35677 + }, + { + "epoch": 0.69, + "learning_rate": 6.164420799192263e-08, + "loss": 0.0004, + "step": 35678 + }, + { + "epoch": 0.69, + "learning_rate": 6.164032464758649e-08, + "loss": 0.0004, + "step": 35679 + }, + { + "epoch": 0.69, + "learning_rate": 6.163644130325035e-08, + "loss": 0.0004, + "step": 35680 + }, + { + "epoch": 0.69, + "learning_rate": 6.163255795891421e-08, + "loss": 0.7009, + "step": 35681 + }, + { + "epoch": 0.69, + "learning_rate": 6.162867461457807e-08, + "loss": 0.0005, + "step": 35682 + }, + { + "epoch": 0.69, + "learning_rate": 6.162479127024192e-08, + "loss": 0.0006, + "step": 35683 + }, + { + "epoch": 0.69, + "learning_rate": 6.162090792590578e-08, + "loss": 0.0135, + "step": 35684 + }, + { + "epoch": 0.69, + "learning_rate": 6.161702458156964e-08, + "loss": 0.0005, + "step": 35685 + }, + { + "epoch": 0.69, + "learning_rate": 6.16131412372335e-08, + "loss": 0.0004, + "step": 35686 + }, + { + "epoch": 0.69, + "learning_rate": 6.160925789289736e-08, + "loss": 0.3386, + "step": 35687 + }, + { + "epoch": 0.69, + "learning_rate": 6.160537454856122e-08, + "loss": 0.5326, + "step": 35688 + }, + { + "epoch": 0.69, + "learning_rate": 6.160149120422507e-08, + "loss": 0.0006, + "step": 35689 + }, + { + "epoch": 0.69, + "learning_rate": 6.159760785988893e-08, + "loss": 0.0005, + "step": 35690 + }, + { + "epoch": 0.69, + "learning_rate": 6.159372451555279e-08, + "loss": 0.0014, + "step": 35691 + }, + { + "epoch": 0.69, + "learning_rate": 6.158984117121665e-08, + "loss": 0.0004, + "step": 35692 + }, + { + "epoch": 0.69, + "learning_rate": 6.158595782688051e-08, + "loss": 0.0005, + "step": 35693 + }, + { + "epoch": 0.69, + "learning_rate": 6.158207448254437e-08, + "loss": 0.0006, + "step": 35694 + }, + { + "epoch": 0.69, + "learning_rate": 6.157819113820822e-08, + "loss": 0.0012, + "step": 35695 + }, + { + "epoch": 0.69, + "learning_rate": 6.157430779387208e-08, + "loss": 0.0009, + "step": 35696 + }, + { + "epoch": 0.69, + "learning_rate": 6.157042444953594e-08, + "loss": 0.0017, + "step": 35697 + }, + { + "epoch": 0.69, + "learning_rate": 6.15665411051998e-08, + "loss": 0.0003, + "step": 35698 + }, + { + "epoch": 0.69, + "learning_rate": 6.156265776086366e-08, + "loss": 0.0005, + "step": 35699 + }, + { + "epoch": 0.69, + "learning_rate": 6.155877441652752e-08, + "loss": 0.0007, + "step": 35700 + }, + { + "epoch": 0.69, + "learning_rate": 6.155489107219137e-08, + "loss": 0.0005, + "step": 35701 + }, + { + "epoch": 0.69, + "learning_rate": 6.155100772785523e-08, + "loss": 0.0017, + "step": 35702 + }, + { + "epoch": 0.69, + "learning_rate": 6.154712438351909e-08, + "loss": 0.0006, + "step": 35703 + }, + { + "epoch": 0.69, + "learning_rate": 6.154324103918295e-08, + "loss": 0.0006, + "step": 35704 + }, + { + "epoch": 0.69, + "learning_rate": 6.153935769484679e-08, + "loss": 0.0003, + "step": 35705 + }, + { + "epoch": 0.69, + "learning_rate": 6.153547435051065e-08, + "loss": 0.0004, + "step": 35706 + }, + { + "epoch": 0.69, + "learning_rate": 6.153159100617451e-08, + "loss": 0.0005, + "step": 35707 + }, + { + "epoch": 0.69, + "learning_rate": 6.152770766183837e-08, + "loss": 0.0005, + "step": 35708 + }, + { + "epoch": 0.69, + "learning_rate": 6.152382431750223e-08, + "loss": 0.0005, + "step": 35709 + }, + { + "epoch": 0.69, + "learning_rate": 6.151994097316608e-08, + "loss": 0.0004, + "step": 35710 + }, + { + "epoch": 0.69, + "learning_rate": 6.151605762882994e-08, + "loss": 0.0004, + "step": 35711 + }, + { + "epoch": 0.69, + "learning_rate": 6.15121742844938e-08, + "loss": 0.0003, + "step": 35712 + }, + { + "epoch": 0.69, + "learning_rate": 6.150829094015766e-08, + "loss": 0.0005, + "step": 35713 + }, + { + "epoch": 0.69, + "learning_rate": 6.150440759582152e-08, + "loss": 1.1426, + "step": 35714 + }, + { + "epoch": 0.69, + "learning_rate": 6.150052425148538e-08, + "loss": 0.0005, + "step": 35715 + }, + { + "epoch": 0.69, + "learning_rate": 6.149664090714923e-08, + "loss": 0.0006, + "step": 35716 + }, + { + "epoch": 0.69, + "learning_rate": 6.149275756281309e-08, + "loss": 0.0004, + "step": 35717 + }, + { + "epoch": 0.69, + "learning_rate": 6.148887421847695e-08, + "loss": 0.0015, + "step": 35718 + }, + { + "epoch": 0.69, + "learning_rate": 6.148499087414081e-08, + "loss": 0.0005, + "step": 35719 + }, + { + "epoch": 0.69, + "learning_rate": 6.148110752980467e-08, + "loss": 0.0003, + "step": 35720 + }, + { + "epoch": 0.69, + "learning_rate": 6.147722418546852e-08, + "loss": 1.03, + "step": 35721 + }, + { + "epoch": 0.69, + "learning_rate": 6.147334084113238e-08, + "loss": 0.0004, + "step": 35722 + }, + { + "epoch": 0.69, + "learning_rate": 6.146945749679624e-08, + "loss": 0.0007, + "step": 35723 + }, + { + "epoch": 0.69, + "learning_rate": 6.14655741524601e-08, + "loss": 0.4092, + "step": 35724 + }, + { + "epoch": 0.69, + "learning_rate": 6.146169080812396e-08, + "loss": 0.0004, + "step": 35725 + }, + { + "epoch": 0.69, + "learning_rate": 6.145780746378782e-08, + "loss": 0.0005, + "step": 35726 + }, + { + "epoch": 0.69, + "learning_rate": 6.145392411945167e-08, + "loss": 0.3421, + "step": 35727 + }, + { + "epoch": 0.69, + "learning_rate": 6.145004077511553e-08, + "loss": 0.0005, + "step": 35728 + }, + { + "epoch": 0.69, + "learning_rate": 6.144615743077939e-08, + "loss": 0.0003, + "step": 35729 + }, + { + "epoch": 0.69, + "learning_rate": 6.144227408644325e-08, + "loss": 0.0005, + "step": 35730 + }, + { + "epoch": 0.69, + "learning_rate": 6.143839074210711e-08, + "loss": 1.0036, + "step": 35731 + }, + { + "epoch": 0.69, + "learning_rate": 6.143450739777097e-08, + "loss": 1.0346, + "step": 35732 + }, + { + "epoch": 0.69, + "learning_rate": 6.143062405343482e-08, + "loss": 0.0004, + "step": 35733 + }, + { + "epoch": 0.69, + "learning_rate": 6.142674070909867e-08, + "loss": 0.0009, + "step": 35734 + }, + { + "epoch": 0.69, + "learning_rate": 6.142285736476253e-08, + "loss": 0.0005, + "step": 35735 + }, + { + "epoch": 0.69, + "learning_rate": 6.141897402042639e-08, + "loss": 0.0005, + "step": 35736 + }, + { + "epoch": 0.69, + "learning_rate": 6.141509067609024e-08, + "loss": 1.2428, + "step": 35737 + }, + { + "epoch": 0.69, + "learning_rate": 6.14112073317541e-08, + "loss": 0.0004, + "step": 35738 + }, + { + "epoch": 0.69, + "learning_rate": 6.140732398741796e-08, + "loss": 0.0004, + "step": 35739 + }, + { + "epoch": 0.69, + "learning_rate": 6.140344064308182e-08, + "loss": 0.0012, + "step": 35740 + }, + { + "epoch": 0.69, + "learning_rate": 6.139955729874568e-08, + "loss": 0.0005, + "step": 35741 + }, + { + "epoch": 0.69, + "learning_rate": 6.139567395440953e-08, + "loss": 0.0003, + "step": 35742 + }, + { + "epoch": 0.69, + "learning_rate": 6.139179061007339e-08, + "loss": 0.0015, + "step": 35743 + }, + { + "epoch": 0.69, + "learning_rate": 6.138790726573725e-08, + "loss": 0.001, + "step": 35744 + }, + { + "epoch": 0.69, + "learning_rate": 6.138402392140111e-08, + "loss": 0.0006, + "step": 35745 + }, + { + "epoch": 0.69, + "learning_rate": 6.138014057706497e-08, + "loss": 0.0006, + "step": 35746 + }, + { + "epoch": 0.69, + "learning_rate": 6.137625723272883e-08, + "loss": 0.0005, + "step": 35747 + }, + { + "epoch": 0.69, + "learning_rate": 6.137237388839268e-08, + "loss": 0.0005, + "step": 35748 + }, + { + "epoch": 0.69, + "learning_rate": 6.136849054405654e-08, + "loss": 0.7194, + "step": 35749 + }, + { + "epoch": 0.69, + "learning_rate": 6.13646071997204e-08, + "loss": 0.0006, + "step": 35750 + }, + { + "epoch": 0.69, + "learning_rate": 6.136072385538426e-08, + "loss": 0.0006, + "step": 35751 + }, + { + "epoch": 0.69, + "learning_rate": 6.135684051104812e-08, + "loss": 0.0005, + "step": 35752 + }, + { + "epoch": 0.69, + "learning_rate": 6.135295716671198e-08, + "loss": 0.0016, + "step": 35753 + }, + { + "epoch": 0.69, + "learning_rate": 6.134907382237583e-08, + "loss": 0.04, + "step": 35754 + }, + { + "epoch": 0.69, + "learning_rate": 6.134519047803969e-08, + "loss": 0.0039, + "step": 35755 + }, + { + "epoch": 0.69, + "learning_rate": 6.134130713370355e-08, + "loss": 0.0005, + "step": 35756 + }, + { + "epoch": 0.69, + "learning_rate": 6.133742378936741e-08, + "loss": 0.0004, + "step": 35757 + }, + { + "epoch": 0.69, + "learning_rate": 6.133354044503127e-08, + "loss": 0.0004, + "step": 35758 + }, + { + "epoch": 0.69, + "learning_rate": 6.132965710069513e-08, + "loss": 0.0005, + "step": 35759 + }, + { + "epoch": 0.69, + "learning_rate": 6.132577375635898e-08, + "loss": 0.0006, + "step": 35760 + }, + { + "epoch": 0.69, + "learning_rate": 6.132189041202284e-08, + "loss": 0.0004, + "step": 35761 + }, + { + "epoch": 0.69, + "learning_rate": 6.13180070676867e-08, + "loss": 0.8848, + "step": 35762 + }, + { + "epoch": 0.69, + "learning_rate": 6.131412372335054e-08, + "loss": 0.1008, + "step": 35763 + }, + { + "epoch": 0.69, + "learning_rate": 6.13102403790144e-08, + "loss": 0.0005, + "step": 35764 + }, + { + "epoch": 0.69, + "learning_rate": 6.130635703467826e-08, + "loss": 0.0034, + "step": 35765 + }, + { + "epoch": 0.69, + "learning_rate": 6.130247369034212e-08, + "loss": 1.5365, + "step": 35766 + }, + { + "epoch": 0.69, + "learning_rate": 6.129859034600598e-08, + "loss": 0.0006, + "step": 35767 + }, + { + "epoch": 0.69, + "learning_rate": 6.129470700166984e-08, + "loss": 0.0005, + "step": 35768 + }, + { + "epoch": 0.69, + "learning_rate": 6.12908236573337e-08, + "loss": 0.0003, + "step": 35769 + }, + { + "epoch": 0.69, + "learning_rate": 6.128694031299755e-08, + "loss": 0.177, + "step": 35770 + }, + { + "epoch": 0.69, + "learning_rate": 6.128305696866141e-08, + "loss": 0.0028, + "step": 35771 + }, + { + "epoch": 0.69, + "learning_rate": 6.127917362432527e-08, + "loss": 0.0005, + "step": 35772 + }, + { + "epoch": 0.69, + "learning_rate": 6.127529027998913e-08, + "loss": 0.0004, + "step": 35773 + }, + { + "epoch": 0.69, + "learning_rate": 6.127140693565299e-08, + "loss": 0.0003, + "step": 35774 + }, + { + "epoch": 0.69, + "learning_rate": 6.126752359131684e-08, + "loss": 0.0152, + "step": 35775 + }, + { + "epoch": 0.69, + "learning_rate": 6.12636402469807e-08, + "loss": 0.0005, + "step": 35776 + }, + { + "epoch": 0.69, + "learning_rate": 6.125975690264456e-08, + "loss": 0.0028, + "step": 35777 + }, + { + "epoch": 0.69, + "learning_rate": 6.125587355830842e-08, + "loss": 0.0004, + "step": 35778 + }, + { + "epoch": 0.69, + "learning_rate": 6.125199021397228e-08, + "loss": 0.0003, + "step": 35779 + }, + { + "epoch": 0.69, + "learning_rate": 6.124810686963613e-08, + "loss": 0.0005, + "step": 35780 + }, + { + "epoch": 0.69, + "learning_rate": 6.124422352529999e-08, + "loss": 0.0004, + "step": 35781 + }, + { + "epoch": 0.69, + "learning_rate": 6.124034018096385e-08, + "loss": 0.0004, + "step": 35782 + }, + { + "epoch": 0.69, + "learning_rate": 6.123645683662771e-08, + "loss": 0.7709, + "step": 35783 + }, + { + "epoch": 0.69, + "learning_rate": 6.123257349229157e-08, + "loss": 0.0003, + "step": 35784 + }, + { + "epoch": 0.69, + "learning_rate": 6.122869014795543e-08, + "loss": 0.0004, + "step": 35785 + }, + { + "epoch": 0.69, + "learning_rate": 6.122480680361927e-08, + "loss": 0.0006, + "step": 35786 + }, + { + "epoch": 0.69, + "learning_rate": 6.122092345928313e-08, + "loss": 0.0005, + "step": 35787 + }, + { + "epoch": 0.69, + "learning_rate": 6.121704011494699e-08, + "loss": 0.0005, + "step": 35788 + }, + { + "epoch": 0.69, + "learning_rate": 6.121315677061085e-08, + "loss": 0.0004, + "step": 35789 + }, + { + "epoch": 0.69, + "learning_rate": 6.12092734262747e-08, + "loss": 0.0007, + "step": 35790 + }, + { + "epoch": 0.69, + "learning_rate": 6.120539008193856e-08, + "loss": 0.0291, + "step": 35791 + }, + { + "epoch": 0.69, + "learning_rate": 6.120150673760242e-08, + "loss": 0.0007, + "step": 35792 + }, + { + "epoch": 0.69, + "learning_rate": 6.119762339326628e-08, + "loss": 0.0008, + "step": 35793 + }, + { + "epoch": 0.69, + "learning_rate": 6.119374004893014e-08, + "loss": 0.0004, + "step": 35794 + }, + { + "epoch": 0.69, + "learning_rate": 6.1189856704594e-08, + "loss": 0.0004, + "step": 35795 + }, + { + "epoch": 0.69, + "learning_rate": 6.118597336025785e-08, + "loss": 0.0003, + "step": 35796 + }, + { + "epoch": 0.69, + "learning_rate": 6.118209001592171e-08, + "loss": 0.0008, + "step": 35797 + }, + { + "epoch": 0.69, + "learning_rate": 6.117820667158557e-08, + "loss": 0.0004, + "step": 35798 + }, + { + "epoch": 0.69, + "learning_rate": 6.117432332724943e-08, + "loss": 0.0012, + "step": 35799 + }, + { + "epoch": 0.69, + "learning_rate": 6.117043998291329e-08, + "loss": 0.0006, + "step": 35800 + }, + { + "epoch": 0.69, + "learning_rate": 6.116655663857713e-08, + "loss": 0.0004, + "step": 35801 + }, + { + "epoch": 0.69, + "learning_rate": 6.116267329424099e-08, + "loss": 0.7753, + "step": 35802 + }, + { + "epoch": 0.69, + "learning_rate": 6.115878994990485e-08, + "loss": 0.0012, + "step": 35803 + }, + { + "epoch": 0.69, + "learning_rate": 6.11549066055687e-08, + "loss": 0.0005, + "step": 35804 + }, + { + "epoch": 0.69, + "learning_rate": 6.115102326123256e-08, + "loss": 0.0005, + "step": 35805 + }, + { + "epoch": 0.69, + "learning_rate": 6.114713991689642e-08, + "loss": 0.0005, + "step": 35806 + }, + { + "epoch": 0.69, + "learning_rate": 6.114325657256028e-08, + "loss": 0.0003, + "step": 35807 + }, + { + "epoch": 0.69, + "learning_rate": 6.113937322822414e-08, + "loss": 0.0004, + "step": 35808 + }, + { + "epoch": 0.69, + "learning_rate": 6.1135489883888e-08, + "loss": 0.0032, + "step": 35809 + }, + { + "epoch": 0.69, + "learning_rate": 6.113160653955186e-08, + "loss": 0.0005, + "step": 35810 + }, + { + "epoch": 0.69, + "learning_rate": 6.112772319521571e-08, + "loss": 0.0005, + "step": 35811 + }, + { + "epoch": 0.69, + "learning_rate": 6.112383985087957e-08, + "loss": 0.0004, + "step": 35812 + }, + { + "epoch": 0.69, + "learning_rate": 6.111995650654343e-08, + "loss": 0.0054, + "step": 35813 + }, + { + "epoch": 0.69, + "learning_rate": 6.111607316220729e-08, + "loss": 0.0012, + "step": 35814 + }, + { + "epoch": 0.69, + "learning_rate": 6.111218981787115e-08, + "loss": 0.0007, + "step": 35815 + }, + { + "epoch": 0.69, + "learning_rate": 6.1108306473535e-08, + "loss": 0.0009, + "step": 35816 + }, + { + "epoch": 0.69, + "learning_rate": 6.110442312919886e-08, + "loss": 0.5615, + "step": 35817 + }, + { + "epoch": 0.69, + "learning_rate": 6.110053978486272e-08, + "loss": 0.0003, + "step": 35818 + }, + { + "epoch": 0.69, + "learning_rate": 6.109665644052658e-08, + "loss": 0.0004, + "step": 35819 + }, + { + "epoch": 0.69, + "learning_rate": 6.109277309619044e-08, + "loss": 0.0031, + "step": 35820 + }, + { + "epoch": 0.69, + "learning_rate": 6.108888975185428e-08, + "loss": 0.0005, + "step": 35821 + }, + { + "epoch": 0.69, + "learning_rate": 6.108500640751814e-08, + "loss": 0.0003, + "step": 35822 + }, + { + "epoch": 0.69, + "learning_rate": 6.1081123063182e-08, + "loss": 0.5458, + "step": 35823 + }, + { + "epoch": 0.69, + "learning_rate": 6.107723971884586e-08, + "loss": 0.0005, + "step": 35824 + }, + { + "epoch": 0.69, + "learning_rate": 6.107335637450972e-08, + "loss": 0.0043, + "step": 35825 + }, + { + "epoch": 0.69, + "learning_rate": 6.106947303017357e-08, + "loss": 0.0004, + "step": 35826 + }, + { + "epoch": 0.69, + "learning_rate": 6.106558968583743e-08, + "loss": 0.0118, + "step": 35827 + }, + { + "epoch": 0.69, + "learning_rate": 6.106170634150129e-08, + "loss": 0.0005, + "step": 35828 + }, + { + "epoch": 0.7, + "learning_rate": 6.105782299716515e-08, + "loss": 0.0458, + "step": 35829 + }, + { + "epoch": 0.7, + "learning_rate": 6.105393965282901e-08, + "loss": 0.0003, + "step": 35830 + }, + { + "epoch": 0.7, + "learning_rate": 6.105005630849287e-08, + "loss": 1.0373, + "step": 35831 + }, + { + "epoch": 0.7, + "learning_rate": 6.104617296415672e-08, + "loss": 0.0004, + "step": 35832 + }, + { + "epoch": 0.7, + "learning_rate": 6.104228961982058e-08, + "loss": 0.0005, + "step": 35833 + }, + { + "epoch": 0.7, + "learning_rate": 6.103840627548444e-08, + "loss": 0.0004, + "step": 35834 + }, + { + "epoch": 0.7, + "learning_rate": 6.10345229311483e-08, + "loss": 0.0003, + "step": 35835 + }, + { + "epoch": 0.7, + "learning_rate": 6.103063958681216e-08, + "loss": 0.0004, + "step": 35836 + }, + { + "epoch": 0.7, + "learning_rate": 6.102675624247602e-08, + "loss": 0.0004, + "step": 35837 + }, + { + "epoch": 0.7, + "learning_rate": 6.102287289813987e-08, + "loss": 0.0004, + "step": 35838 + }, + { + "epoch": 0.7, + "learning_rate": 6.101898955380373e-08, + "loss": 0.0055, + "step": 35839 + }, + { + "epoch": 0.7, + "learning_rate": 6.101510620946759e-08, + "loss": 0.0008, + "step": 35840 + }, + { + "epoch": 0.7, + "learning_rate": 6.101122286513145e-08, + "loss": 0.0011, + "step": 35841 + }, + { + "epoch": 0.7, + "learning_rate": 6.10073395207953e-08, + "loss": 0.2892, + "step": 35842 + }, + { + "epoch": 0.7, + "learning_rate": 6.100345617645916e-08, + "loss": 0.0005, + "step": 35843 + }, + { + "epoch": 0.7, + "learning_rate": 6.099957283212302e-08, + "loss": 0.0004, + "step": 35844 + }, + { + "epoch": 0.7, + "learning_rate": 6.099568948778688e-08, + "loss": 0.0004, + "step": 35845 + }, + { + "epoch": 0.7, + "learning_rate": 6.099180614345074e-08, + "loss": 0.0004, + "step": 35846 + }, + { + "epoch": 0.7, + "learning_rate": 6.09879227991146e-08, + "loss": 0.0005, + "step": 35847 + }, + { + "epoch": 0.7, + "learning_rate": 6.098403945477846e-08, + "loss": 0.3157, + "step": 35848 + }, + { + "epoch": 0.7, + "learning_rate": 6.098015611044231e-08, + "loss": 0.3887, + "step": 35849 + }, + { + "epoch": 0.7, + "learning_rate": 6.097627276610616e-08, + "loss": 0.3582, + "step": 35850 + }, + { + "epoch": 0.7, + "learning_rate": 6.097238942177002e-08, + "loss": 0.0005, + "step": 35851 + }, + { + "epoch": 0.7, + "learning_rate": 6.096850607743388e-08, + "loss": 0.0004, + "step": 35852 + }, + { + "epoch": 0.7, + "learning_rate": 6.096462273309773e-08, + "loss": 0.0007, + "step": 35853 + }, + { + "epoch": 0.7, + "learning_rate": 6.096073938876159e-08, + "loss": 1.067, + "step": 35854 + }, + { + "epoch": 0.7, + "learning_rate": 6.095685604442545e-08, + "loss": 0.0004, + "step": 35855 + }, + { + "epoch": 0.7, + "learning_rate": 6.095297270008931e-08, + "loss": 0.0005, + "step": 35856 + }, + { + "epoch": 0.7, + "learning_rate": 6.094908935575317e-08, + "loss": 0.0008, + "step": 35857 + }, + { + "epoch": 0.7, + "learning_rate": 6.094520601141703e-08, + "loss": 0.0008, + "step": 35858 + }, + { + "epoch": 0.7, + "learning_rate": 6.094132266708088e-08, + "loss": 0.0004, + "step": 35859 + }, + { + "epoch": 0.7, + "learning_rate": 6.093743932274474e-08, + "loss": 0.7163, + "step": 35860 + }, + { + "epoch": 0.7, + "learning_rate": 6.09335559784086e-08, + "loss": 0.0005, + "step": 35861 + }, + { + "epoch": 0.7, + "learning_rate": 6.092967263407246e-08, + "loss": 0.0005, + "step": 35862 + }, + { + "epoch": 0.7, + "learning_rate": 6.092578928973632e-08, + "loss": 0.0003, + "step": 35863 + }, + { + "epoch": 0.7, + "learning_rate": 6.092190594540017e-08, + "loss": 0.0005, + "step": 35864 + }, + { + "epoch": 0.7, + "learning_rate": 6.091802260106403e-08, + "loss": 0.0003, + "step": 35865 + }, + { + "epoch": 0.7, + "learning_rate": 6.091413925672789e-08, + "loss": 0.0004, + "step": 35866 + }, + { + "epoch": 0.7, + "learning_rate": 6.091025591239175e-08, + "loss": 0.0004, + "step": 35867 + }, + { + "epoch": 0.7, + "learning_rate": 6.090637256805561e-08, + "loss": 0.0004, + "step": 35868 + }, + { + "epoch": 0.7, + "learning_rate": 6.090248922371947e-08, + "loss": 0.0005, + "step": 35869 + }, + { + "epoch": 0.7, + "learning_rate": 6.089860587938332e-08, + "loss": 0.0003, + "step": 35870 + }, + { + "epoch": 0.7, + "learning_rate": 6.089472253504718e-08, + "loss": 0.0005, + "step": 35871 + }, + { + "epoch": 0.7, + "learning_rate": 6.089083919071104e-08, + "loss": 0.0004, + "step": 35872 + }, + { + "epoch": 0.7, + "learning_rate": 6.08869558463749e-08, + "loss": 0.0004, + "step": 35873 + }, + { + "epoch": 0.7, + "learning_rate": 6.088307250203876e-08, + "loss": 0.0005, + "step": 35874 + }, + { + "epoch": 0.7, + "learning_rate": 6.087918915770262e-08, + "loss": 0.0004, + "step": 35875 + }, + { + "epoch": 0.7, + "learning_rate": 6.087530581336647e-08, + "loss": 0.8855, + "step": 35876 + }, + { + "epoch": 0.7, + "learning_rate": 6.087142246903033e-08, + "loss": 0.0004, + "step": 35877 + }, + { + "epoch": 0.7, + "learning_rate": 6.086753912469419e-08, + "loss": 0.0003, + "step": 35878 + }, + { + "epoch": 0.7, + "learning_rate": 6.086365578035803e-08, + "loss": 0.0005, + "step": 35879 + }, + { + "epoch": 0.7, + "learning_rate": 6.085977243602189e-08, + "loss": 0.0004, + "step": 35880 + }, + { + "epoch": 0.7, + "learning_rate": 6.085588909168575e-08, + "loss": 0.0004, + "step": 35881 + }, + { + "epoch": 0.7, + "learning_rate": 6.085200574734961e-08, + "loss": 0.0004, + "step": 35882 + }, + { + "epoch": 0.7, + "learning_rate": 6.084812240301347e-08, + "loss": 0.0004, + "step": 35883 + }, + { + "epoch": 0.7, + "learning_rate": 6.084423905867733e-08, + "loss": 0.0406, + "step": 35884 + }, + { + "epoch": 0.7, + "learning_rate": 6.084035571434118e-08, + "loss": 0.0024, + "step": 35885 + }, + { + "epoch": 0.7, + "learning_rate": 6.083647237000504e-08, + "loss": 0.0006, + "step": 35886 + }, + { + "epoch": 0.7, + "learning_rate": 6.08325890256689e-08, + "loss": 0.0004, + "step": 35887 + }, + { + "epoch": 0.7, + "learning_rate": 6.082870568133276e-08, + "loss": 0.0003, + "step": 35888 + }, + { + "epoch": 0.7, + "learning_rate": 6.082482233699662e-08, + "loss": 0.0004, + "step": 35889 + }, + { + "epoch": 0.7, + "learning_rate": 6.082093899266048e-08, + "loss": 0.0006, + "step": 35890 + }, + { + "epoch": 0.7, + "learning_rate": 6.081705564832433e-08, + "loss": 0.0023, + "step": 35891 + }, + { + "epoch": 0.7, + "learning_rate": 6.081317230398819e-08, + "loss": 0.0004, + "step": 35892 + }, + { + "epoch": 0.7, + "learning_rate": 6.080928895965205e-08, + "loss": 0.0004, + "step": 35893 + }, + { + "epoch": 0.7, + "learning_rate": 6.080540561531591e-08, + "loss": 0.0004, + "step": 35894 + }, + { + "epoch": 0.7, + "learning_rate": 6.080152227097977e-08, + "loss": 0.0003, + "step": 35895 + }, + { + "epoch": 0.7, + "learning_rate": 6.079763892664363e-08, + "loss": 0.0004, + "step": 35896 + }, + { + "epoch": 0.7, + "learning_rate": 6.079375558230748e-08, + "loss": 0.0008, + "step": 35897 + }, + { + "epoch": 0.7, + "learning_rate": 6.078987223797134e-08, + "loss": 0.0004, + "step": 35898 + }, + { + "epoch": 0.7, + "learning_rate": 6.07859888936352e-08, + "loss": 0.0004, + "step": 35899 + }, + { + "epoch": 0.7, + "learning_rate": 6.078210554929906e-08, + "loss": 0.0006, + "step": 35900 + }, + { + "epoch": 0.7, + "learning_rate": 6.077822220496292e-08, + "loss": 0.0004, + "step": 35901 + }, + { + "epoch": 0.7, + "learning_rate": 6.077433886062677e-08, + "loss": 0.0003, + "step": 35902 + }, + { + "epoch": 0.7, + "learning_rate": 6.077045551629063e-08, + "loss": 0.0006, + "step": 35903 + }, + { + "epoch": 0.7, + "learning_rate": 6.076657217195449e-08, + "loss": 0.0004, + "step": 35904 + }, + { + "epoch": 0.7, + "learning_rate": 6.076268882761835e-08, + "loss": 0.0003, + "step": 35905 + }, + { + "epoch": 0.7, + "learning_rate": 6.075880548328221e-08, + "loss": 0.0005, + "step": 35906 + }, + { + "epoch": 0.7, + "learning_rate": 6.075492213894607e-08, + "loss": 0.0004, + "step": 35907 + }, + { + "epoch": 0.7, + "learning_rate": 6.075103879460991e-08, + "loss": 0.0006, + "step": 35908 + }, + { + "epoch": 0.7, + "learning_rate": 6.074715545027377e-08, + "loss": 0.0004, + "step": 35909 + }, + { + "epoch": 0.7, + "learning_rate": 6.074327210593763e-08, + "loss": 0.0006, + "step": 35910 + }, + { + "epoch": 0.7, + "learning_rate": 6.073938876160149e-08, + "loss": 0.0006, + "step": 35911 + }, + { + "epoch": 0.7, + "learning_rate": 6.073550541726534e-08, + "loss": 0.0009, + "step": 35912 + }, + { + "epoch": 0.7, + "learning_rate": 6.07316220729292e-08, + "loss": 0.0005, + "step": 35913 + }, + { + "epoch": 0.7, + "learning_rate": 6.072773872859306e-08, + "loss": 0.0006, + "step": 35914 + }, + { + "epoch": 0.7, + "learning_rate": 6.072385538425692e-08, + "loss": 0.0176, + "step": 35915 + }, + { + "epoch": 0.7, + "learning_rate": 6.071997203992078e-08, + "loss": 0.0004, + "step": 35916 + }, + { + "epoch": 0.7, + "learning_rate": 6.071608869558463e-08, + "loss": 0.0004, + "step": 35917 + }, + { + "epoch": 0.7, + "learning_rate": 6.071220535124849e-08, + "loss": 0.0004, + "step": 35918 + }, + { + "epoch": 0.7, + "learning_rate": 6.070832200691235e-08, + "loss": 0.4984, + "step": 35919 + }, + { + "epoch": 0.7, + "learning_rate": 6.070443866257621e-08, + "loss": 0.0003, + "step": 35920 + }, + { + "epoch": 0.7, + "learning_rate": 6.070055531824007e-08, + "loss": 0.0004, + "step": 35921 + }, + { + "epoch": 0.7, + "learning_rate": 6.069667197390393e-08, + "loss": 0.0004, + "step": 35922 + }, + { + "epoch": 0.7, + "learning_rate": 6.069278862956778e-08, + "loss": 0.6955, + "step": 35923 + }, + { + "epoch": 0.7, + "learning_rate": 6.068890528523164e-08, + "loss": 0.0004, + "step": 35924 + }, + { + "epoch": 0.7, + "learning_rate": 6.06850219408955e-08, + "loss": 0.0004, + "step": 35925 + }, + { + "epoch": 0.7, + "learning_rate": 6.068113859655936e-08, + "loss": 0.0006, + "step": 35926 + }, + { + "epoch": 0.7, + "learning_rate": 6.067725525222322e-08, + "loss": 0.0003, + "step": 35927 + }, + { + "epoch": 0.7, + "learning_rate": 6.067337190788708e-08, + "loss": 0.0006, + "step": 35928 + }, + { + "epoch": 0.7, + "learning_rate": 6.066948856355093e-08, + "loss": 0.0003, + "step": 35929 + }, + { + "epoch": 0.7, + "learning_rate": 6.066560521921479e-08, + "loss": 0.0005, + "step": 35930 + }, + { + "epoch": 0.7, + "learning_rate": 6.066172187487865e-08, + "loss": 0.0011, + "step": 35931 + }, + { + "epoch": 0.7, + "learning_rate": 6.065783853054251e-08, + "loss": 0.0039, + "step": 35932 + }, + { + "epoch": 0.7, + "learning_rate": 6.065395518620637e-08, + "loss": 0.0005, + "step": 35933 + }, + { + "epoch": 0.7, + "learning_rate": 6.065007184187023e-08, + "loss": 0.0003, + "step": 35934 + }, + { + "epoch": 0.7, + "learning_rate": 6.064618849753408e-08, + "loss": 0.0003, + "step": 35935 + }, + { + "epoch": 0.7, + "learning_rate": 6.064230515319794e-08, + "loss": 0.0005, + "step": 35936 + }, + { + "epoch": 0.7, + "learning_rate": 6.063842180886179e-08, + "loss": 0.0004, + "step": 35937 + }, + { + "epoch": 0.7, + "learning_rate": 6.063453846452564e-08, + "loss": 0.0006, + "step": 35938 + }, + { + "epoch": 0.7, + "learning_rate": 6.06306551201895e-08, + "loss": 0.0152, + "step": 35939 + }, + { + "epoch": 0.7, + "learning_rate": 6.062677177585336e-08, + "loss": 0.0004, + "step": 35940 + }, + { + "epoch": 0.7, + "learning_rate": 6.062288843151722e-08, + "loss": 0.0004, + "step": 35941 + }, + { + "epoch": 0.7, + "learning_rate": 6.061900508718108e-08, + "loss": 0.0003, + "step": 35942 + }, + { + "epoch": 0.7, + "learning_rate": 6.061512174284494e-08, + "loss": 0.0007, + "step": 35943 + }, + { + "epoch": 0.7, + "learning_rate": 6.06112383985088e-08, + "loss": 0.87, + "step": 35944 + }, + { + "epoch": 0.7, + "learning_rate": 6.060735505417265e-08, + "loss": 0.0004, + "step": 35945 + }, + { + "epoch": 0.7, + "learning_rate": 6.060347170983651e-08, + "loss": 0.2609, + "step": 35946 + }, + { + "epoch": 0.7, + "learning_rate": 6.059958836550037e-08, + "loss": 0.0033, + "step": 35947 + }, + { + "epoch": 0.7, + "learning_rate": 6.059570502116423e-08, + "loss": 0.0004, + "step": 35948 + }, + { + "epoch": 0.7, + "learning_rate": 6.059182167682809e-08, + "loss": 0.0006, + "step": 35949 + }, + { + "epoch": 0.7, + "learning_rate": 6.058793833249194e-08, + "loss": 0.0006, + "step": 35950 + }, + { + "epoch": 0.7, + "learning_rate": 6.05840549881558e-08, + "loss": 0.0004, + "step": 35951 + }, + { + "epoch": 0.7, + "learning_rate": 6.058017164381966e-08, + "loss": 0.0396, + "step": 35952 + }, + { + "epoch": 0.7, + "learning_rate": 6.057628829948352e-08, + "loss": 0.0006, + "step": 35953 + }, + { + "epoch": 0.7, + "learning_rate": 6.057240495514738e-08, + "loss": 0.0006, + "step": 35954 + }, + { + "epoch": 0.7, + "learning_rate": 6.056852161081124e-08, + "loss": 0.0004, + "step": 35955 + }, + { + "epoch": 0.7, + "learning_rate": 6.056463826647509e-08, + "loss": 0.0004, + "step": 35956 + }, + { + "epoch": 0.7, + "learning_rate": 6.056075492213895e-08, + "loss": 0.0284, + "step": 35957 + }, + { + "epoch": 0.7, + "learning_rate": 6.055687157780281e-08, + "loss": 0.0006, + "step": 35958 + }, + { + "epoch": 0.7, + "learning_rate": 6.055298823346667e-08, + "loss": 0.0004, + "step": 35959 + }, + { + "epoch": 0.7, + "learning_rate": 6.054910488913053e-08, + "loss": 0.0004, + "step": 35960 + }, + { + "epoch": 0.7, + "learning_rate": 6.054522154479438e-08, + "loss": 0.0007, + "step": 35961 + }, + { + "epoch": 0.7, + "learning_rate": 6.054133820045824e-08, + "loss": 0.0005, + "step": 35962 + }, + { + "epoch": 0.7, + "learning_rate": 6.053745485612209e-08, + "loss": 0.1386, + "step": 35963 + }, + { + "epoch": 0.7, + "learning_rate": 6.053357151178595e-08, + "loss": 0.0004, + "step": 35964 + }, + { + "epoch": 0.7, + "learning_rate": 6.05296881674498e-08, + "loss": 0.0008, + "step": 35965 + }, + { + "epoch": 0.7, + "learning_rate": 6.052580482311366e-08, + "loss": 0.0006, + "step": 35966 + }, + { + "epoch": 0.7, + "learning_rate": 6.052192147877752e-08, + "loss": 0.0022, + "step": 35967 + }, + { + "epoch": 0.7, + "learning_rate": 6.051803813444138e-08, + "loss": 0.0005, + "step": 35968 + }, + { + "epoch": 0.7, + "learning_rate": 6.051415479010524e-08, + "loss": 0.0005, + "step": 35969 + }, + { + "epoch": 0.7, + "learning_rate": 6.05102714457691e-08, + "loss": 0.0004, + "step": 35970 + }, + { + "epoch": 0.7, + "learning_rate": 6.050638810143295e-08, + "loss": 0.0004, + "step": 35971 + }, + { + "epoch": 0.7, + "learning_rate": 6.050250475709681e-08, + "loss": 0.0003, + "step": 35972 + }, + { + "epoch": 0.7, + "learning_rate": 6.049862141276067e-08, + "loss": 0.0006, + "step": 35973 + }, + { + "epoch": 0.7, + "learning_rate": 6.049473806842453e-08, + "loss": 0.9543, + "step": 35974 + }, + { + "epoch": 0.7, + "learning_rate": 6.049085472408839e-08, + "loss": 0.0003, + "step": 35975 + }, + { + "epoch": 0.7, + "learning_rate": 6.048697137975224e-08, + "loss": 0.0006, + "step": 35976 + }, + { + "epoch": 0.7, + "learning_rate": 6.04830880354161e-08, + "loss": 0.0005, + "step": 35977 + }, + { + "epoch": 0.7, + "learning_rate": 6.047920469107995e-08, + "loss": 0.0005, + "step": 35978 + }, + { + "epoch": 0.7, + "learning_rate": 6.04753213467438e-08, + "loss": 0.0041, + "step": 35979 + }, + { + "epoch": 0.7, + "learning_rate": 6.047143800240766e-08, + "loss": 0.0003, + "step": 35980 + }, + { + "epoch": 0.7, + "learning_rate": 6.046755465807152e-08, + "loss": 0.0004, + "step": 35981 + }, + { + "epoch": 0.7, + "learning_rate": 6.046367131373538e-08, + "loss": 0.0004, + "step": 35982 + }, + { + "epoch": 0.7, + "learning_rate": 6.045978796939924e-08, + "loss": 0.0005, + "step": 35983 + }, + { + "epoch": 0.7, + "learning_rate": 6.04559046250631e-08, + "loss": 0.0006, + "step": 35984 + }, + { + "epoch": 0.7, + "learning_rate": 6.045202128072696e-08, + "loss": 0.0003, + "step": 35985 + }, + { + "epoch": 0.7, + "learning_rate": 6.044813793639081e-08, + "loss": 0.0005, + "step": 35986 + }, + { + "epoch": 0.7, + "learning_rate": 6.044425459205467e-08, + "loss": 0.0004, + "step": 35987 + }, + { + "epoch": 0.7, + "learning_rate": 6.044037124771853e-08, + "loss": 0.0011, + "step": 35988 + }, + { + "epoch": 0.7, + "learning_rate": 6.043648790338239e-08, + "loss": 0.0006, + "step": 35989 + }, + { + "epoch": 0.7, + "learning_rate": 6.043260455904625e-08, + "loss": 0.0007, + "step": 35990 + }, + { + "epoch": 0.7, + "learning_rate": 6.04287212147101e-08, + "loss": 0.0005, + "step": 35991 + }, + { + "epoch": 0.7, + "learning_rate": 6.042483787037396e-08, + "loss": 0.0004, + "step": 35992 + }, + { + "epoch": 0.7, + "learning_rate": 6.042095452603782e-08, + "loss": 0.0009, + "step": 35993 + }, + { + "epoch": 0.7, + "learning_rate": 6.041707118170168e-08, + "loss": 0.0569, + "step": 35994 + }, + { + "epoch": 0.7, + "learning_rate": 6.041318783736553e-08, + "loss": 0.0008, + "step": 35995 + }, + { + "epoch": 0.7, + "learning_rate": 6.040930449302938e-08, + "loss": 0.1925, + "step": 35996 + }, + { + "epoch": 0.7, + "learning_rate": 6.040542114869324e-08, + "loss": 0.0004, + "step": 35997 + }, + { + "epoch": 0.7, + "learning_rate": 6.04015378043571e-08, + "loss": 0.002, + "step": 35998 + }, + { + "epoch": 0.7, + "learning_rate": 6.039765446002096e-08, + "loss": 0.0006, + "step": 35999 + }, + { + "epoch": 0.7, + "learning_rate": 6.039377111568482e-08, + "loss": 0.0003, + "step": 36000 + }, + { + "epoch": 0.7, + "learning_rate": 6.038988777134867e-08, + "loss": 0.0003, + "step": 36001 + }, + { + "epoch": 0.7, + "learning_rate": 6.038600442701253e-08, + "loss": 0.0003, + "step": 36002 + }, + { + "epoch": 0.7, + "learning_rate": 6.038212108267639e-08, + "loss": 0.0004, + "step": 36003 + }, + { + "epoch": 0.7, + "learning_rate": 6.037823773834025e-08, + "loss": 0.0007, + "step": 36004 + }, + { + "epoch": 0.7, + "learning_rate": 6.037435439400411e-08, + "loss": 0.0005, + "step": 36005 + }, + { + "epoch": 0.7, + "learning_rate": 6.037047104966797e-08, + "loss": 0.0004, + "step": 36006 + }, + { + "epoch": 0.7, + "learning_rate": 6.036658770533182e-08, + "loss": 0.0034, + "step": 36007 + }, + { + "epoch": 0.7, + "learning_rate": 6.036270436099568e-08, + "loss": 0.0006, + "step": 36008 + }, + { + "epoch": 0.7, + "learning_rate": 6.035882101665954e-08, + "loss": 0.0004, + "step": 36009 + }, + { + "epoch": 0.7, + "learning_rate": 6.03549376723234e-08, + "loss": 0.0003, + "step": 36010 + }, + { + "epoch": 0.7, + "learning_rate": 6.035105432798726e-08, + "loss": 0.0054, + "step": 36011 + }, + { + "epoch": 0.7, + "learning_rate": 6.034717098365112e-08, + "loss": 0.2447, + "step": 36012 + }, + { + "epoch": 0.7, + "learning_rate": 6.034328763931497e-08, + "loss": 0.0004, + "step": 36013 + }, + { + "epoch": 0.7, + "learning_rate": 6.033940429497883e-08, + "loss": 0.0004, + "step": 36014 + }, + { + "epoch": 0.7, + "learning_rate": 6.033552095064269e-08, + "loss": 0.0004, + "step": 36015 + }, + { + "epoch": 0.7, + "learning_rate": 6.033163760630655e-08, + "loss": 0.0003, + "step": 36016 + }, + { + "epoch": 0.7, + "learning_rate": 6.03277542619704e-08, + "loss": 0.0015, + "step": 36017 + }, + { + "epoch": 0.7, + "learning_rate": 6.032387091763426e-08, + "loss": 0.0012, + "step": 36018 + }, + { + "epoch": 0.7, + "learning_rate": 6.031998757329812e-08, + "loss": 0.4548, + "step": 36019 + }, + { + "epoch": 0.7, + "learning_rate": 6.031610422896198e-08, + "loss": 0.0003, + "step": 36020 + }, + { + "epoch": 0.7, + "learning_rate": 6.031222088462584e-08, + "loss": 0.0005, + "step": 36021 + }, + { + "epoch": 0.7, + "learning_rate": 6.03083375402897e-08, + "loss": 0.0007, + "step": 36022 + }, + { + "epoch": 0.7, + "learning_rate": 6.030445419595356e-08, + "loss": 0.0004, + "step": 36023 + }, + { + "epoch": 0.7, + "learning_rate": 6.03005708516174e-08, + "loss": 0.0004, + "step": 36024 + }, + { + "epoch": 0.7, + "learning_rate": 6.029668750728126e-08, + "loss": 0.0003, + "step": 36025 + }, + { + "epoch": 0.7, + "learning_rate": 6.029280416294512e-08, + "loss": 0.0004, + "step": 36026 + }, + { + "epoch": 0.7, + "learning_rate": 6.028892081860898e-08, + "loss": 0.0005, + "step": 36027 + }, + { + "epoch": 0.7, + "learning_rate": 6.028503747427283e-08, + "loss": 0.0005, + "step": 36028 + }, + { + "epoch": 0.7, + "learning_rate": 6.028115412993669e-08, + "loss": 0.0007, + "step": 36029 + }, + { + "epoch": 0.7, + "learning_rate": 6.027727078560055e-08, + "loss": 0.0004, + "step": 36030 + }, + { + "epoch": 0.7, + "learning_rate": 6.027338744126441e-08, + "loss": 0.0004, + "step": 36031 + }, + { + "epoch": 0.7, + "learning_rate": 6.026950409692827e-08, + "loss": 0.0004, + "step": 36032 + }, + { + "epoch": 0.7, + "learning_rate": 6.026562075259213e-08, + "loss": 0.0003, + "step": 36033 + }, + { + "epoch": 0.7, + "learning_rate": 6.026173740825598e-08, + "loss": 0.0003, + "step": 36034 + }, + { + "epoch": 0.7, + "learning_rate": 6.025785406391984e-08, + "loss": 0.0035, + "step": 36035 + }, + { + "epoch": 0.7, + "learning_rate": 6.02539707195837e-08, + "loss": 0.0005, + "step": 36036 + }, + { + "epoch": 0.7, + "learning_rate": 6.025008737524756e-08, + "loss": 0.5463, + "step": 36037 + }, + { + "epoch": 0.7, + "learning_rate": 6.024620403091142e-08, + "loss": 0.0005, + "step": 36038 + }, + { + "epoch": 0.7, + "learning_rate": 6.024232068657527e-08, + "loss": 0.0005, + "step": 36039 + }, + { + "epoch": 0.7, + "learning_rate": 6.023843734223913e-08, + "loss": 0.0004, + "step": 36040 + }, + { + "epoch": 0.7, + "learning_rate": 6.023455399790299e-08, + "loss": 0.0005, + "step": 36041 + }, + { + "epoch": 0.7, + "learning_rate": 6.023067065356685e-08, + "loss": 0.0004, + "step": 36042 + }, + { + "epoch": 0.7, + "learning_rate": 6.022678730923071e-08, + "loss": 0.3966, + "step": 36043 + }, + { + "epoch": 0.7, + "learning_rate": 6.022290396489457e-08, + "loss": 0.0011, + "step": 36044 + }, + { + "epoch": 0.7, + "learning_rate": 6.021902062055842e-08, + "loss": 0.9585, + "step": 36045 + }, + { + "epoch": 0.7, + "learning_rate": 6.021513727622228e-08, + "loss": 0.0008, + "step": 36046 + }, + { + "epoch": 0.7, + "learning_rate": 6.021125393188614e-08, + "loss": 0.0004, + "step": 36047 + }, + { + "epoch": 0.7, + "learning_rate": 6.020737058755e-08, + "loss": 0.0015, + "step": 36048 + }, + { + "epoch": 0.7, + "learning_rate": 6.020348724321386e-08, + "loss": 0.0007, + "step": 36049 + }, + { + "epoch": 0.7, + "learning_rate": 6.019960389887772e-08, + "loss": 1.0766, + "step": 36050 + }, + { + "epoch": 0.7, + "learning_rate": 6.019572055454157e-08, + "loss": 0.0056, + "step": 36051 + }, + { + "epoch": 0.7, + "learning_rate": 6.019183721020543e-08, + "loss": 0.0004, + "step": 36052 + }, + { + "epoch": 0.7, + "learning_rate": 6.018795386586928e-08, + "loss": 0.0004, + "step": 36053 + }, + { + "epoch": 0.7, + "learning_rate": 6.018407052153314e-08, + "loss": 0.0006, + "step": 36054 + }, + { + "epoch": 0.7, + "learning_rate": 6.018018717719699e-08, + "loss": 0.0004, + "step": 36055 + }, + { + "epoch": 0.7, + "learning_rate": 6.017630383286085e-08, + "loss": 0.0004, + "step": 36056 + }, + { + "epoch": 0.7, + "learning_rate": 6.017242048852471e-08, + "loss": 0.0157, + "step": 36057 + }, + { + "epoch": 0.7, + "learning_rate": 6.016853714418857e-08, + "loss": 0.0923, + "step": 36058 + }, + { + "epoch": 0.7, + "learning_rate": 6.016465379985243e-08, + "loss": 0.0004, + "step": 36059 + }, + { + "epoch": 0.7, + "learning_rate": 6.016077045551628e-08, + "loss": 0.2789, + "step": 36060 + }, + { + "epoch": 0.7, + "learning_rate": 6.015688711118014e-08, + "loss": 0.0005, + "step": 36061 + }, + { + "epoch": 0.7, + "learning_rate": 6.0153003766844e-08, + "loss": 0.0008, + "step": 36062 + }, + { + "epoch": 0.7, + "learning_rate": 6.014912042250786e-08, + "loss": 0.6866, + "step": 36063 + }, + { + "epoch": 0.7, + "learning_rate": 6.014523707817172e-08, + "loss": 0.0006, + "step": 36064 + }, + { + "epoch": 0.7, + "learning_rate": 6.014135373383558e-08, + "loss": 0.0067, + "step": 36065 + }, + { + "epoch": 0.7, + "learning_rate": 6.013747038949943e-08, + "loss": 0.0005, + "step": 36066 + }, + { + "epoch": 0.7, + "learning_rate": 6.013358704516329e-08, + "loss": 0.0004, + "step": 36067 + }, + { + "epoch": 0.7, + "learning_rate": 6.012970370082715e-08, + "loss": 1.559, + "step": 36068 + }, + { + "epoch": 0.7, + "learning_rate": 6.012582035649101e-08, + "loss": 0.0006, + "step": 36069 + }, + { + "epoch": 0.7, + "learning_rate": 6.012193701215487e-08, + "loss": 0.0006, + "step": 36070 + }, + { + "epoch": 0.7, + "learning_rate": 6.011805366781873e-08, + "loss": 0.0008, + "step": 36071 + }, + { + "epoch": 0.7, + "learning_rate": 6.011417032348258e-08, + "loss": 0.0006, + "step": 36072 + }, + { + "epoch": 0.7, + "learning_rate": 6.011028697914644e-08, + "loss": 0.0008, + "step": 36073 + }, + { + "epoch": 0.7, + "learning_rate": 6.01064036348103e-08, + "loss": 0.0004, + "step": 36074 + }, + { + "epoch": 0.7, + "learning_rate": 6.010252029047416e-08, + "loss": 0.0006, + "step": 36075 + }, + { + "epoch": 0.7, + "learning_rate": 6.009863694613802e-08, + "loss": 0.0007, + "step": 36076 + }, + { + "epoch": 0.7, + "learning_rate": 6.009475360180187e-08, + "loss": 0.001, + "step": 36077 + }, + { + "epoch": 0.7, + "learning_rate": 6.009087025746573e-08, + "loss": 0.0007, + "step": 36078 + }, + { + "epoch": 0.7, + "learning_rate": 6.008698691312959e-08, + "loss": 0.0004, + "step": 36079 + }, + { + "epoch": 0.7, + "learning_rate": 6.008310356879345e-08, + "loss": 0.0006, + "step": 36080 + }, + { + "epoch": 0.7, + "learning_rate": 6.007922022445731e-08, + "loss": 0.0003, + "step": 36081 + }, + { + "epoch": 0.7, + "learning_rate": 6.007533688012115e-08, + "loss": 0.0003, + "step": 36082 + }, + { + "epoch": 0.7, + "learning_rate": 6.007145353578501e-08, + "loss": 0.0003, + "step": 36083 + }, + { + "epoch": 0.7, + "learning_rate": 6.006757019144887e-08, + "loss": 0.0007, + "step": 36084 + }, + { + "epoch": 0.7, + "learning_rate": 6.006368684711273e-08, + "loss": 0.0007, + "step": 36085 + }, + { + "epoch": 0.7, + "learning_rate": 6.005980350277659e-08, + "loss": 0.0003, + "step": 36086 + }, + { + "epoch": 0.7, + "learning_rate": 6.005592015844044e-08, + "loss": 0.0004, + "step": 36087 + }, + { + "epoch": 0.7, + "learning_rate": 6.00520368141043e-08, + "loss": 0.0004, + "step": 36088 + }, + { + "epoch": 0.7, + "learning_rate": 6.004815346976816e-08, + "loss": 0.0005, + "step": 36089 + }, + { + "epoch": 0.7, + "learning_rate": 6.004427012543202e-08, + "loss": 0.0003, + "step": 36090 + }, + { + "epoch": 0.7, + "learning_rate": 6.004038678109588e-08, + "loss": 0.0763, + "step": 36091 + }, + { + "epoch": 0.7, + "learning_rate": 6.003650343675974e-08, + "loss": 0.0005, + "step": 36092 + }, + { + "epoch": 0.7, + "learning_rate": 6.003262009242359e-08, + "loss": 0.0008, + "step": 36093 + }, + { + "epoch": 0.7, + "learning_rate": 6.002873674808745e-08, + "loss": 0.0005, + "step": 36094 + }, + { + "epoch": 0.7, + "learning_rate": 6.002485340375131e-08, + "loss": 0.0005, + "step": 36095 + }, + { + "epoch": 0.7, + "learning_rate": 6.002097005941517e-08, + "loss": 0.0008, + "step": 36096 + }, + { + "epoch": 0.7, + "learning_rate": 6.001708671507903e-08, + "loss": 0.0003, + "step": 36097 + }, + { + "epoch": 0.7, + "learning_rate": 6.001320337074288e-08, + "loss": 0.0005, + "step": 36098 + }, + { + "epoch": 0.7, + "learning_rate": 6.000932002640674e-08, + "loss": 0.0004, + "step": 36099 + }, + { + "epoch": 0.7, + "learning_rate": 6.00054366820706e-08, + "loss": 0.001, + "step": 36100 + }, + { + "epoch": 0.7, + "learning_rate": 6.000155333773446e-08, + "loss": 0.0005, + "step": 36101 + }, + { + "epoch": 0.7, + "learning_rate": 5.999766999339832e-08, + "loss": 0.0003, + "step": 36102 + }, + { + "epoch": 0.7, + "learning_rate": 5.999378664906218e-08, + "loss": 0.0006, + "step": 36103 + }, + { + "epoch": 0.7, + "learning_rate": 5.998990330472603e-08, + "loss": 0.0014, + "step": 36104 + }, + { + "epoch": 0.7, + "learning_rate": 5.998601996038989e-08, + "loss": 0.002, + "step": 36105 + }, + { + "epoch": 0.7, + "learning_rate": 5.998213661605375e-08, + "loss": 0.4265, + "step": 36106 + }, + { + "epoch": 0.7, + "learning_rate": 5.997825327171761e-08, + "loss": 0.0017, + "step": 36107 + }, + { + "epoch": 0.7, + "learning_rate": 5.997436992738147e-08, + "loss": 0.0006, + "step": 36108 + }, + { + "epoch": 0.7, + "learning_rate": 5.997048658304533e-08, + "loss": 0.0005, + "step": 36109 + }, + { + "epoch": 0.7, + "learning_rate": 5.996660323870918e-08, + "loss": 0.0179, + "step": 36110 + }, + { + "epoch": 0.7, + "learning_rate": 5.996271989437303e-08, + "loss": 0.0006, + "step": 36111 + }, + { + "epoch": 0.7, + "learning_rate": 5.995883655003689e-08, + "loss": 1.7727, + "step": 36112 + }, + { + "epoch": 0.7, + "learning_rate": 5.995495320570074e-08, + "loss": 0.0007, + "step": 36113 + }, + { + "epoch": 0.7, + "learning_rate": 5.99510698613646e-08, + "loss": 0.0004, + "step": 36114 + }, + { + "epoch": 0.7, + "learning_rate": 5.994718651702846e-08, + "loss": 0.0012, + "step": 36115 + }, + { + "epoch": 0.7, + "learning_rate": 5.994330317269232e-08, + "loss": 0.0005, + "step": 36116 + }, + { + "epoch": 0.7, + "learning_rate": 5.993941982835618e-08, + "loss": 0.0004, + "step": 36117 + }, + { + "epoch": 0.7, + "learning_rate": 5.993553648402004e-08, + "loss": 0.0006, + "step": 36118 + }, + { + "epoch": 0.7, + "learning_rate": 5.99316531396839e-08, + "loss": 0.0007, + "step": 36119 + }, + { + "epoch": 0.7, + "learning_rate": 5.992776979534775e-08, + "loss": 0.0003, + "step": 36120 + }, + { + "epoch": 0.7, + "learning_rate": 5.992388645101161e-08, + "loss": 0.0004, + "step": 36121 + }, + { + "epoch": 0.7, + "learning_rate": 5.992000310667547e-08, + "loss": 0.0004, + "step": 36122 + }, + { + "epoch": 0.7, + "learning_rate": 5.991611976233933e-08, + "loss": 0.0004, + "step": 36123 + }, + { + "epoch": 0.7, + "learning_rate": 5.991223641800319e-08, + "loss": 0.0004, + "step": 36124 + }, + { + "epoch": 0.7, + "learning_rate": 5.990835307366704e-08, + "loss": 0.0005, + "step": 36125 + }, + { + "epoch": 0.7, + "learning_rate": 5.99044697293309e-08, + "loss": 0.012, + "step": 36126 + }, + { + "epoch": 0.7, + "learning_rate": 5.990058638499476e-08, + "loss": 0.0005, + "step": 36127 + }, + { + "epoch": 0.7, + "learning_rate": 5.989670304065862e-08, + "loss": 0.0006, + "step": 36128 + }, + { + "epoch": 0.7, + "learning_rate": 5.989281969632248e-08, + "loss": 0.0005, + "step": 36129 + }, + { + "epoch": 0.7, + "learning_rate": 5.988893635198634e-08, + "loss": 0.0004, + "step": 36130 + }, + { + "epoch": 0.7, + "learning_rate": 5.988505300765019e-08, + "loss": 0.0004, + "step": 36131 + }, + { + "epoch": 0.7, + "learning_rate": 5.988116966331405e-08, + "loss": 0.0004, + "step": 36132 + }, + { + "epoch": 0.7, + "learning_rate": 5.987728631897791e-08, + "loss": 0.0007, + "step": 36133 + }, + { + "epoch": 0.7, + "learning_rate": 5.987340297464177e-08, + "loss": 0.0011, + "step": 36134 + }, + { + "epoch": 0.7, + "learning_rate": 5.986951963030563e-08, + "loss": 0.0005, + "step": 36135 + }, + { + "epoch": 0.7, + "learning_rate": 5.986563628596948e-08, + "loss": 0.0004, + "step": 36136 + }, + { + "epoch": 0.7, + "learning_rate": 5.986175294163334e-08, + "loss": 0.0009, + "step": 36137 + }, + { + "epoch": 0.7, + "learning_rate": 5.98578695972972e-08, + "loss": 0.0006, + "step": 36138 + }, + { + "epoch": 0.7, + "learning_rate": 5.985398625296106e-08, + "loss": 0.0003, + "step": 36139 + }, + { + "epoch": 0.7, + "learning_rate": 5.98501029086249e-08, + "loss": 0.0006, + "step": 36140 + }, + { + "epoch": 0.7, + "learning_rate": 5.984621956428876e-08, + "loss": 0.0009, + "step": 36141 + }, + { + "epoch": 0.7, + "learning_rate": 5.984233621995262e-08, + "loss": 0.0005, + "step": 36142 + }, + { + "epoch": 0.7, + "learning_rate": 5.983845287561648e-08, + "loss": 0.0006, + "step": 36143 + }, + { + "epoch": 0.7, + "learning_rate": 5.983456953128034e-08, + "loss": 0.0004, + "step": 36144 + }, + { + "epoch": 0.7, + "learning_rate": 5.98306861869442e-08, + "loss": 0.0172, + "step": 36145 + }, + { + "epoch": 0.7, + "learning_rate": 5.982680284260805e-08, + "loss": 0.0847, + "step": 36146 + }, + { + "epoch": 0.7, + "learning_rate": 5.982291949827191e-08, + "loss": 0.0005, + "step": 36147 + }, + { + "epoch": 0.7, + "learning_rate": 5.981903615393577e-08, + "loss": 0.3126, + "step": 36148 + }, + { + "epoch": 0.7, + "learning_rate": 5.981515280959963e-08, + "loss": 0.537, + "step": 36149 + }, + { + "epoch": 0.7, + "learning_rate": 5.981126946526349e-08, + "loss": 0.0037, + "step": 36150 + }, + { + "epoch": 0.7, + "learning_rate": 5.980738612092735e-08, + "loss": 0.0005, + "step": 36151 + }, + { + "epoch": 0.7, + "learning_rate": 5.98035027765912e-08, + "loss": 0.2597, + "step": 36152 + }, + { + "epoch": 0.7, + "learning_rate": 5.979961943225506e-08, + "loss": 0.8978, + "step": 36153 + }, + { + "epoch": 0.7, + "learning_rate": 5.979573608791892e-08, + "loss": 0.0004, + "step": 36154 + }, + { + "epoch": 0.7, + "learning_rate": 5.979185274358276e-08, + "loss": 0.0004, + "step": 36155 + }, + { + "epoch": 0.7, + "learning_rate": 5.978796939924662e-08, + "loss": 0.001, + "step": 36156 + }, + { + "epoch": 0.7, + "learning_rate": 5.978408605491048e-08, + "loss": 0.0006, + "step": 36157 + }, + { + "epoch": 0.7, + "learning_rate": 5.978020271057434e-08, + "loss": 0.0006, + "step": 36158 + }, + { + "epoch": 0.7, + "learning_rate": 5.97763193662382e-08, + "loss": 0.0005, + "step": 36159 + }, + { + "epoch": 0.7, + "learning_rate": 5.977243602190206e-08, + "loss": 0.0003, + "step": 36160 + }, + { + "epoch": 0.7, + "learning_rate": 5.976855267756591e-08, + "loss": 0.0005, + "step": 36161 + }, + { + "epoch": 0.7, + "learning_rate": 5.976466933322977e-08, + "loss": 0.0004, + "step": 36162 + }, + { + "epoch": 0.7, + "learning_rate": 5.976078598889363e-08, + "loss": 0.0005, + "step": 36163 + }, + { + "epoch": 0.7, + "learning_rate": 5.975690264455749e-08, + "loss": 0.0004, + "step": 36164 + }, + { + "epoch": 0.7, + "learning_rate": 5.975301930022135e-08, + "loss": 0.0006, + "step": 36165 + }, + { + "epoch": 0.7, + "learning_rate": 5.97491359558852e-08, + "loss": 0.0006, + "step": 36166 + }, + { + "epoch": 0.7, + "learning_rate": 5.974525261154906e-08, + "loss": 0.0005, + "step": 36167 + }, + { + "epoch": 0.7, + "learning_rate": 5.974136926721292e-08, + "loss": 0.0004, + "step": 36168 + }, + { + "epoch": 0.7, + "learning_rate": 5.973748592287678e-08, + "loss": 0.0014, + "step": 36169 + }, + { + "epoch": 0.7, + "learning_rate": 5.973360257854063e-08, + "loss": 0.0018, + "step": 36170 + }, + { + "epoch": 0.7, + "learning_rate": 5.972971923420448e-08, + "loss": 0.0005, + "step": 36171 + }, + { + "epoch": 0.7, + "learning_rate": 5.972583588986834e-08, + "loss": 0.0024, + "step": 36172 + }, + { + "epoch": 0.7, + "learning_rate": 5.97219525455322e-08, + "loss": 0.0004, + "step": 36173 + }, + { + "epoch": 0.7, + "learning_rate": 5.971806920119606e-08, + "loss": 0.0004, + "step": 36174 + }, + { + "epoch": 0.7, + "learning_rate": 5.971418585685992e-08, + "loss": 0.0004, + "step": 36175 + }, + { + "epoch": 0.7, + "learning_rate": 5.971030251252377e-08, + "loss": 0.0007, + "step": 36176 + }, + { + "epoch": 0.7, + "learning_rate": 5.970641916818763e-08, + "loss": 0.0102, + "step": 36177 + }, + { + "epoch": 0.7, + "learning_rate": 5.970253582385149e-08, + "loss": 0.0004, + "step": 36178 + }, + { + "epoch": 0.7, + "learning_rate": 5.969865247951535e-08, + "loss": 0.0008, + "step": 36179 + }, + { + "epoch": 0.7, + "learning_rate": 5.969476913517921e-08, + "loss": 1.3688, + "step": 36180 + }, + { + "epoch": 0.7, + "learning_rate": 5.969088579084307e-08, + "loss": 0.0006, + "step": 36181 + }, + { + "epoch": 0.7, + "learning_rate": 5.968700244650692e-08, + "loss": 0.0409, + "step": 36182 + }, + { + "epoch": 0.7, + "learning_rate": 5.968311910217078e-08, + "loss": 0.0005, + "step": 36183 + }, + { + "epoch": 0.7, + "learning_rate": 5.967923575783464e-08, + "loss": 0.0006, + "step": 36184 + }, + { + "epoch": 0.7, + "learning_rate": 5.96753524134985e-08, + "loss": 0.0004, + "step": 36185 + }, + { + "epoch": 0.7, + "learning_rate": 5.967146906916236e-08, + "loss": 0.0005, + "step": 36186 + }, + { + "epoch": 0.7, + "learning_rate": 5.966758572482622e-08, + "loss": 1.0811, + "step": 36187 + }, + { + "epoch": 0.7, + "learning_rate": 5.966370238049007e-08, + "loss": 0.0006, + "step": 36188 + }, + { + "epoch": 0.7, + "learning_rate": 5.965981903615393e-08, + "loss": 0.0005, + "step": 36189 + }, + { + "epoch": 0.7, + "learning_rate": 5.965593569181779e-08, + "loss": 0.0004, + "step": 36190 + }, + { + "epoch": 0.7, + "learning_rate": 5.965205234748165e-08, + "loss": 0.0004, + "step": 36191 + }, + { + "epoch": 0.7, + "learning_rate": 5.96481690031455e-08, + "loss": 0.0027, + "step": 36192 + }, + { + "epoch": 0.7, + "learning_rate": 5.964428565880936e-08, + "loss": 0.0005, + "step": 36193 + }, + { + "epoch": 0.7, + "learning_rate": 5.964040231447322e-08, + "loss": 0.0006, + "step": 36194 + }, + { + "epoch": 0.7, + "learning_rate": 5.963651897013708e-08, + "loss": 0.0006, + "step": 36195 + }, + { + "epoch": 0.7, + "learning_rate": 5.963263562580094e-08, + "loss": 0.001, + "step": 36196 + }, + { + "epoch": 0.7, + "learning_rate": 5.96287522814648e-08, + "loss": 0.0005, + "step": 36197 + }, + { + "epoch": 0.7, + "learning_rate": 5.962486893712864e-08, + "loss": 0.0003, + "step": 36198 + }, + { + "epoch": 0.7, + "learning_rate": 5.96209855927925e-08, + "loss": 0.0003, + "step": 36199 + }, + { + "epoch": 0.7, + "learning_rate": 5.961710224845636e-08, + "loss": 0.0003, + "step": 36200 + }, + { + "epoch": 0.7, + "learning_rate": 5.961321890412022e-08, + "loss": 0.0003, + "step": 36201 + }, + { + "epoch": 0.7, + "learning_rate": 5.960933555978408e-08, + "loss": 0.0004, + "step": 36202 + }, + { + "epoch": 0.7, + "learning_rate": 5.960545221544793e-08, + "loss": 0.0003, + "step": 36203 + }, + { + "epoch": 0.7, + "learning_rate": 5.96015688711118e-08, + "loss": 0.0004, + "step": 36204 + }, + { + "epoch": 0.7, + "learning_rate": 5.959768552677566e-08, + "loss": 0.0004, + "step": 36205 + }, + { + "epoch": 0.7, + "learning_rate": 5.9593802182439515e-08, + "loss": 0.0005, + "step": 36206 + }, + { + "epoch": 0.7, + "learning_rate": 5.958991883810337e-08, + "loss": 0.0006, + "step": 36207 + }, + { + "epoch": 0.7, + "learning_rate": 5.9586035493767225e-08, + "loss": 0.3039, + "step": 36208 + }, + { + "epoch": 0.7, + "learning_rate": 5.9582152149431083e-08, + "loss": 0.0009, + "step": 36209 + }, + { + "epoch": 0.7, + "learning_rate": 5.957826880509494e-08, + "loss": 0.0006, + "step": 36210 + }, + { + "epoch": 0.7, + "learning_rate": 5.95743854607588e-08, + "loss": 0.0005, + "step": 36211 + }, + { + "epoch": 0.7, + "learning_rate": 5.957050211642266e-08, + "loss": 1.2276, + "step": 36212 + }, + { + "epoch": 0.7, + "learning_rate": 5.9566618772086516e-08, + "loss": 0.0004, + "step": 36213 + }, + { + "epoch": 0.7, + "learning_rate": 5.9562735427750375e-08, + "loss": 0.0004, + "step": 36214 + }, + { + "epoch": 0.7, + "learning_rate": 5.955885208341423e-08, + "loss": 0.0006, + "step": 36215 + }, + { + "epoch": 0.7, + "learning_rate": 5.955496873907809e-08, + "loss": 0.0004, + "step": 36216 + }, + { + "epoch": 0.7, + "learning_rate": 5.955108539474195e-08, + "loss": 0.0004, + "step": 36217 + }, + { + "epoch": 0.7, + "learning_rate": 5.954720205040581e-08, + "loss": 0.0004, + "step": 36218 + }, + { + "epoch": 0.7, + "learning_rate": 5.9543318706069666e-08, + "loss": 0.0006, + "step": 36219 + }, + { + "epoch": 0.7, + "learning_rate": 5.9539435361733524e-08, + "loss": 0.0005, + "step": 36220 + }, + { + "epoch": 0.7, + "learning_rate": 5.953555201739738e-08, + "loss": 0.0007, + "step": 36221 + }, + { + "epoch": 0.7, + "learning_rate": 5.953166867306124e-08, + "loss": 0.0006, + "step": 36222 + }, + { + "epoch": 0.7, + "learning_rate": 5.95277853287251e-08, + "loss": 0.0027, + "step": 36223 + }, + { + "epoch": 0.7, + "learning_rate": 5.952390198438896e-08, + "loss": 0.0005, + "step": 36224 + }, + { + "epoch": 0.7, + "learning_rate": 5.9520018640052815e-08, + "loss": 0.0747, + "step": 36225 + }, + { + "epoch": 0.7, + "learning_rate": 5.9516135295716674e-08, + "loss": 0.0006, + "step": 36226 + }, + { + "epoch": 0.7, + "learning_rate": 5.951225195138052e-08, + "loss": 0.0004, + "step": 36227 + }, + { + "epoch": 0.7, + "learning_rate": 5.950836860704438e-08, + "loss": 0.0004, + "step": 36228 + }, + { + "epoch": 0.7, + "learning_rate": 5.9504485262708235e-08, + "loss": 1.3311, + "step": 36229 + }, + { + "epoch": 0.7, + "learning_rate": 5.9500601918372093e-08, + "loss": 0.0004, + "step": 36230 + }, + { + "epoch": 0.7, + "learning_rate": 5.949671857403595e-08, + "loss": 0.0004, + "step": 36231 + }, + { + "epoch": 0.7, + "learning_rate": 5.949283522969981e-08, + "loss": 0.046, + "step": 36232 + }, + { + "epoch": 0.7, + "learning_rate": 5.948895188536367e-08, + "loss": 0.0004, + "step": 36233 + }, + { + "epoch": 0.7, + "learning_rate": 5.9485068541027526e-08, + "loss": 0.0005, + "step": 36234 + }, + { + "epoch": 0.7, + "learning_rate": 5.9481185196691385e-08, + "loss": 0.0006, + "step": 36235 + }, + { + "epoch": 0.7, + "learning_rate": 5.947730185235524e-08, + "loss": 0.0005, + "step": 36236 + }, + { + "epoch": 0.7, + "learning_rate": 5.94734185080191e-08, + "loss": 0.0869, + "step": 36237 + }, + { + "epoch": 0.7, + "learning_rate": 5.946953516368296e-08, + "loss": 0.0004, + "step": 36238 + }, + { + "epoch": 0.7, + "learning_rate": 5.946565181934682e-08, + "loss": 0.0005, + "step": 36239 + }, + { + "epoch": 0.7, + "learning_rate": 5.9461768475010676e-08, + "loss": 0.0003, + "step": 36240 + }, + { + "epoch": 0.7, + "learning_rate": 5.9457885130674534e-08, + "loss": 0.0013, + "step": 36241 + }, + { + "epoch": 0.7, + "learning_rate": 5.945400178633839e-08, + "loss": 0.0123, + "step": 36242 + }, + { + "epoch": 0.7, + "learning_rate": 5.945011844200225e-08, + "loss": 0.0087, + "step": 36243 + }, + { + "epoch": 0.7, + "learning_rate": 5.944623509766611e-08, + "loss": 0.0207, + "step": 36244 + }, + { + "epoch": 0.7, + "learning_rate": 5.944235175332997e-08, + "loss": 0.0004, + "step": 36245 + }, + { + "epoch": 0.7, + "learning_rate": 5.9438468408993825e-08, + "loss": 0.0005, + "step": 36246 + }, + { + "epoch": 0.7, + "learning_rate": 5.9434585064657684e-08, + "loss": 0.0004, + "step": 36247 + }, + { + "epoch": 0.7, + "learning_rate": 5.943070172032154e-08, + "loss": 0.0006, + "step": 36248 + }, + { + "epoch": 0.7, + "learning_rate": 5.94268183759854e-08, + "loss": 0.0008, + "step": 36249 + }, + { + "epoch": 0.7, + "learning_rate": 5.942293503164926e-08, + "loss": 1.0516, + "step": 36250 + }, + { + "epoch": 0.7, + "learning_rate": 5.9419051687313117e-08, + "loss": 0.0003, + "step": 36251 + }, + { + "epoch": 0.7, + "learning_rate": 5.9415168342976975e-08, + "loss": 0.0005, + "step": 36252 + }, + { + "epoch": 0.7, + "learning_rate": 5.941128499864083e-08, + "loss": 0.0008, + "step": 36253 + }, + { + "epoch": 0.7, + "learning_rate": 5.940740165430469e-08, + "loss": 0.0005, + "step": 36254 + }, + { + "epoch": 0.7, + "learning_rate": 5.940351830996855e-08, + "loss": 0.0003, + "step": 36255 + }, + { + "epoch": 0.7, + "learning_rate": 5.9399634965632395e-08, + "loss": 0.0005, + "step": 36256 + }, + { + "epoch": 0.7, + "learning_rate": 5.939575162129625e-08, + "loss": 0.0004, + "step": 36257 + }, + { + "epoch": 0.7, + "learning_rate": 5.939186827696011e-08, + "loss": 0.5546, + "step": 36258 + }, + { + "epoch": 0.7, + "learning_rate": 5.938798493262397e-08, + "loss": 0.0004, + "step": 36259 + }, + { + "epoch": 0.7, + "learning_rate": 5.938410158828783e-08, + "loss": 0.0004, + "step": 36260 + }, + { + "epoch": 0.7, + "learning_rate": 5.9380218243951686e-08, + "loss": 0.0006, + "step": 36261 + }, + { + "epoch": 0.7, + "learning_rate": 5.9376334899615544e-08, + "loss": 0.0004, + "step": 36262 + }, + { + "epoch": 0.7, + "learning_rate": 5.93724515552794e-08, + "loss": 0.0004, + "step": 36263 + }, + { + "epoch": 0.7, + "learning_rate": 5.936856821094326e-08, + "loss": 0.0005, + "step": 36264 + }, + { + "epoch": 0.7, + "learning_rate": 5.936468486660712e-08, + "loss": 0.0004, + "step": 36265 + }, + { + "epoch": 0.7, + "learning_rate": 5.936080152227098e-08, + "loss": 0.0004, + "step": 36266 + }, + { + "epoch": 0.7, + "learning_rate": 5.9356918177934835e-08, + "loss": 1.3479, + "step": 36267 + }, + { + "epoch": 0.7, + "learning_rate": 5.9353034833598693e-08, + "loss": 0.0006, + "step": 36268 + }, + { + "epoch": 0.7, + "learning_rate": 5.934915148926255e-08, + "loss": 0.0003, + "step": 36269 + }, + { + "epoch": 0.7, + "learning_rate": 5.934526814492641e-08, + "loss": 0.8099, + "step": 36270 + }, + { + "epoch": 0.7, + "learning_rate": 5.934138480059027e-08, + "loss": 0.0004, + "step": 36271 + }, + { + "epoch": 0.7, + "learning_rate": 5.9337501456254126e-08, + "loss": 0.0009, + "step": 36272 + }, + { + "epoch": 0.7, + "learning_rate": 5.9333618111917985e-08, + "loss": 0.0003, + "step": 36273 + }, + { + "epoch": 0.7, + "learning_rate": 5.932973476758184e-08, + "loss": 0.0006, + "step": 36274 + }, + { + "epoch": 0.7, + "learning_rate": 5.93258514232457e-08, + "loss": 0.0004, + "step": 36275 + }, + { + "epoch": 0.7, + "learning_rate": 5.932196807890956e-08, + "loss": 0.0005, + "step": 36276 + }, + { + "epoch": 0.7, + "learning_rate": 5.931808473457342e-08, + "loss": 0.0006, + "step": 36277 + }, + { + "epoch": 0.7, + "learning_rate": 5.9314201390237276e-08, + "loss": 0.0019, + "step": 36278 + }, + { + "epoch": 0.7, + "learning_rate": 5.9310318045901134e-08, + "loss": 0.0005, + "step": 36279 + }, + { + "epoch": 0.7, + "learning_rate": 5.930643470156499e-08, + "loss": 0.1357, + "step": 36280 + }, + { + "epoch": 0.7, + "learning_rate": 5.9302551357228844e-08, + "loss": 0.0003, + "step": 36281 + }, + { + "epoch": 0.7, + "learning_rate": 5.92986680128927e-08, + "loss": 0.0005, + "step": 36282 + }, + { + "epoch": 0.7, + "learning_rate": 5.929478466855656e-08, + "loss": 0.0005, + "step": 36283 + }, + { + "epoch": 0.7, + "learning_rate": 5.929090132422042e-08, + "loss": 0.0004, + "step": 36284 + }, + { + "epoch": 0.7, + "learning_rate": 5.928701797988427e-08, + "loss": 0.0006, + "step": 36285 + }, + { + "epoch": 0.7, + "learning_rate": 5.928313463554813e-08, + "loss": 0.0004, + "step": 36286 + }, + { + "epoch": 0.7, + "learning_rate": 5.927925129121199e-08, + "loss": 0.0006, + "step": 36287 + }, + { + "epoch": 0.7, + "learning_rate": 5.9275367946875845e-08, + "loss": 0.0023, + "step": 36288 + }, + { + "epoch": 0.7, + "learning_rate": 5.9271484602539703e-08, + "loss": 0.0005, + "step": 36289 + }, + { + "epoch": 0.7, + "learning_rate": 5.926760125820356e-08, + "loss": 0.0004, + "step": 36290 + }, + { + "epoch": 0.7, + "learning_rate": 5.926371791386742e-08, + "loss": 0.0004, + "step": 36291 + }, + { + "epoch": 0.7, + "learning_rate": 5.925983456953128e-08, + "loss": 0.0044, + "step": 36292 + }, + { + "epoch": 0.7, + "learning_rate": 5.9255951225195136e-08, + "loss": 0.0008, + "step": 36293 + }, + { + "epoch": 0.7, + "learning_rate": 5.9252067880858995e-08, + "loss": 0.0006, + "step": 36294 + }, + { + "epoch": 0.7, + "learning_rate": 5.9248184536522846e-08, + "loss": 0.0004, + "step": 36295 + }, + { + "epoch": 0.7, + "learning_rate": 5.9244301192186704e-08, + "loss": 0.0004, + "step": 36296 + }, + { + "epoch": 0.7, + "learning_rate": 5.924041784785056e-08, + "loss": 0.0006, + "step": 36297 + }, + { + "epoch": 0.7, + "learning_rate": 5.923653450351442e-08, + "loss": 0.0004, + "step": 36298 + }, + { + "epoch": 0.7, + "learning_rate": 5.923265115917828e-08, + "loss": 0.0009, + "step": 36299 + }, + { + "epoch": 0.7, + "learning_rate": 5.922876781484214e-08, + "loss": 0.0004, + "step": 36300 + }, + { + "epoch": 0.7, + "learning_rate": 5.9224884470505996e-08, + "loss": 0.0008, + "step": 36301 + }, + { + "epoch": 0.7, + "learning_rate": 5.9221001126169854e-08, + "loss": 0.0006, + "step": 36302 + }, + { + "epoch": 0.7, + "learning_rate": 5.921711778183371e-08, + "loss": 0.0006, + "step": 36303 + }, + { + "epoch": 0.7, + "learning_rate": 5.921323443749757e-08, + "loss": 0.0004, + "step": 36304 + }, + { + "epoch": 0.7, + "learning_rate": 5.920935109316143e-08, + "loss": 0.0005, + "step": 36305 + }, + { + "epoch": 0.7, + "learning_rate": 5.920546774882529e-08, + "loss": 0.0004, + "step": 36306 + }, + { + "epoch": 0.7, + "learning_rate": 5.9201584404489145e-08, + "loss": 0.0005, + "step": 36307 + }, + { + "epoch": 0.7, + "learning_rate": 5.9197701060153003e-08, + "loss": 0.0004, + "step": 36308 + }, + { + "epoch": 0.7, + "learning_rate": 5.919381771581686e-08, + "loss": 0.0004, + "step": 36309 + }, + { + "epoch": 0.7, + "learning_rate": 5.918993437148072e-08, + "loss": 0.0003, + "step": 36310 + }, + { + "epoch": 0.7, + "learning_rate": 5.918605102714458e-08, + "loss": 0.0009, + "step": 36311 + }, + { + "epoch": 0.7, + "learning_rate": 5.9182167682808436e-08, + "loss": 0.0004, + "step": 36312 + }, + { + "epoch": 0.7, + "learning_rate": 5.9178284338472295e-08, + "loss": 0.0004, + "step": 36313 + }, + { + "epoch": 0.7, + "learning_rate": 5.917440099413614e-08, + "loss": 0.0004, + "step": 36314 + }, + { + "epoch": 0.7, + "learning_rate": 5.91705176498e-08, + "loss": 0.0004, + "step": 36315 + }, + { + "epoch": 0.7, + "learning_rate": 5.9166634305463856e-08, + "loss": 0.0004, + "step": 36316 + }, + { + "epoch": 0.7, + "learning_rate": 5.9162750961127714e-08, + "loss": 0.0005, + "step": 36317 + }, + { + "epoch": 0.7, + "learning_rate": 5.915886761679157e-08, + "loss": 0.0004, + "step": 36318 + }, + { + "epoch": 0.7, + "learning_rate": 5.915498427245543e-08, + "loss": 0.0005, + "step": 36319 + }, + { + "epoch": 0.7, + "learning_rate": 5.915110092811929e-08, + "loss": 0.0005, + "step": 36320 + }, + { + "epoch": 0.7, + "learning_rate": 5.914721758378315e-08, + "loss": 0.0018, + "step": 36321 + }, + { + "epoch": 0.7, + "learning_rate": 5.9143334239447006e-08, + "loss": 0.0004, + "step": 36322 + }, + { + "epoch": 0.7, + "learning_rate": 5.9139450895110864e-08, + "loss": 0.242, + "step": 36323 + }, + { + "epoch": 0.7, + "learning_rate": 5.913556755077472e-08, + "loss": 0.0004, + "step": 36324 + }, + { + "epoch": 0.7, + "learning_rate": 5.913168420643858e-08, + "loss": 0.0076, + "step": 36325 + }, + { + "epoch": 0.7, + "learning_rate": 5.912780086210244e-08, + "loss": 0.0004, + "step": 36326 + }, + { + "epoch": 0.7, + "learning_rate": 5.91239175177663e-08, + "loss": 0.0006, + "step": 36327 + }, + { + "epoch": 0.7, + "learning_rate": 5.9120034173430155e-08, + "loss": 0.0004, + "step": 36328 + }, + { + "epoch": 0.7, + "learning_rate": 5.911615082909401e-08, + "loss": 0.0004, + "step": 36329 + }, + { + "epoch": 0.7, + "learning_rate": 5.911226748475787e-08, + "loss": 0.0009, + "step": 36330 + }, + { + "epoch": 0.7, + "learning_rate": 5.910838414042173e-08, + "loss": 0.0006, + "step": 36331 + }, + { + "epoch": 0.7, + "learning_rate": 5.910450079608559e-08, + "loss": 0.4943, + "step": 36332 + }, + { + "epoch": 0.7, + "learning_rate": 5.9100617451749446e-08, + "loss": 0.0799, + "step": 36333 + }, + { + "epoch": 0.7, + "learning_rate": 5.9096734107413304e-08, + "loss": 0.7224, + "step": 36334 + }, + { + "epoch": 0.7, + "learning_rate": 5.909285076307716e-08, + "loss": 0.0005, + "step": 36335 + }, + { + "epoch": 0.7, + "learning_rate": 5.908896741874102e-08, + "loss": 0.0005, + "step": 36336 + }, + { + "epoch": 0.7, + "learning_rate": 5.908508407440488e-08, + "loss": 0.0005, + "step": 36337 + }, + { + "epoch": 0.7, + "learning_rate": 5.908120073006874e-08, + "loss": 0.0005, + "step": 36338 + }, + { + "epoch": 0.7, + "learning_rate": 5.9077317385732596e-08, + "loss": 0.0871, + "step": 36339 + }, + { + "epoch": 0.7, + "learning_rate": 5.9073434041396454e-08, + "loss": 0.0291, + "step": 36340 + }, + { + "epoch": 0.7, + "learning_rate": 5.906955069706031e-08, + "loss": 0.0006, + "step": 36341 + }, + { + "epoch": 0.7, + "learning_rate": 5.906566735272417e-08, + "loss": 0.0005, + "step": 36342 + }, + { + "epoch": 0.7, + "learning_rate": 5.9061784008388015e-08, + "loss": 0.0003, + "step": 36343 + }, + { + "epoch": 0.7, + "learning_rate": 5.9057900664051874e-08, + "loss": 0.0004, + "step": 36344 + }, + { + "epoch": 0.71, + "learning_rate": 5.905401731971573e-08, + "loss": 0.0005, + "step": 36345 + }, + { + "epoch": 0.71, + "learning_rate": 5.905013397537959e-08, + "loss": 0.0005, + "step": 36346 + }, + { + "epoch": 0.71, + "learning_rate": 5.904625063104345e-08, + "loss": 0.0004, + "step": 36347 + }, + { + "epoch": 0.71, + "learning_rate": 5.9042367286707307e-08, + "loss": 1.1617, + "step": 36348 + }, + { + "epoch": 0.71, + "learning_rate": 5.9038483942371165e-08, + "loss": 0.0004, + "step": 36349 + }, + { + "epoch": 0.71, + "learning_rate": 5.903460059803502e-08, + "loss": 0.0005, + "step": 36350 + }, + { + "epoch": 0.71, + "learning_rate": 5.903071725369888e-08, + "loss": 0.0005, + "step": 36351 + }, + { + "epoch": 0.71, + "learning_rate": 5.902683390936274e-08, + "loss": 0.0011, + "step": 36352 + }, + { + "epoch": 0.71, + "learning_rate": 5.90229505650266e-08, + "loss": 0.0023, + "step": 36353 + }, + { + "epoch": 0.71, + "learning_rate": 5.9019067220690456e-08, + "loss": 0.0004, + "step": 36354 + }, + { + "epoch": 0.71, + "learning_rate": 5.9015183876354314e-08, + "loss": 0.0007, + "step": 36355 + }, + { + "epoch": 0.71, + "learning_rate": 5.901130053201817e-08, + "loss": 0.0005, + "step": 36356 + }, + { + "epoch": 0.71, + "learning_rate": 5.900741718768203e-08, + "loss": 0.0005, + "step": 36357 + }, + { + "epoch": 0.71, + "learning_rate": 5.900353384334589e-08, + "loss": 0.0004, + "step": 36358 + }, + { + "epoch": 0.71, + "learning_rate": 5.899965049900975e-08, + "loss": 0.0005, + "step": 36359 + }, + { + "epoch": 0.71, + "learning_rate": 5.8995767154673606e-08, + "loss": 0.0003, + "step": 36360 + }, + { + "epoch": 0.71, + "learning_rate": 5.8991883810337464e-08, + "loss": 0.0003, + "step": 36361 + }, + { + "epoch": 0.71, + "learning_rate": 5.898800046600132e-08, + "loss": 0.0004, + "step": 36362 + }, + { + "epoch": 0.71, + "learning_rate": 5.898411712166518e-08, + "loss": 0.0004, + "step": 36363 + }, + { + "epoch": 0.71, + "learning_rate": 5.898023377732904e-08, + "loss": 0.0004, + "step": 36364 + }, + { + "epoch": 0.71, + "learning_rate": 5.89763504329929e-08, + "loss": 0.0004, + "step": 36365 + }, + { + "epoch": 0.71, + "learning_rate": 5.8972467088656755e-08, + "loss": 0.0017, + "step": 36366 + }, + { + "epoch": 0.71, + "learning_rate": 5.896858374432061e-08, + "loss": 0.0005, + "step": 36367 + }, + { + "epoch": 0.71, + "learning_rate": 5.896470039998447e-08, + "loss": 0.0005, + "step": 36368 + }, + { + "epoch": 0.71, + "learning_rate": 5.896081705564832e-08, + "loss": 0.0003, + "step": 36369 + }, + { + "epoch": 0.71, + "learning_rate": 5.895693371131218e-08, + "loss": 0.0003, + "step": 36370 + }, + { + "epoch": 0.71, + "learning_rate": 5.895305036697604e-08, + "loss": 0.0004, + "step": 36371 + }, + { + "epoch": 0.71, + "learning_rate": 5.894916702263989e-08, + "loss": 0.2121, + "step": 36372 + }, + { + "epoch": 0.71, + "learning_rate": 5.894528367830375e-08, + "loss": 0.0003, + "step": 36373 + }, + { + "epoch": 0.71, + "learning_rate": 5.894140033396761e-08, + "loss": 0.0005, + "step": 36374 + }, + { + "epoch": 0.71, + "learning_rate": 5.8937516989631466e-08, + "loss": 0.0005, + "step": 36375 + }, + { + "epoch": 0.71, + "learning_rate": 5.8933633645295324e-08, + "loss": 0.0003, + "step": 36376 + }, + { + "epoch": 0.71, + "learning_rate": 5.892975030095918e-08, + "loss": 0.0004, + "step": 36377 + }, + { + "epoch": 0.71, + "learning_rate": 5.892586695662304e-08, + "loss": 0.0005, + "step": 36378 + }, + { + "epoch": 0.71, + "learning_rate": 5.89219836122869e-08, + "loss": 0.0985, + "step": 36379 + }, + { + "epoch": 0.71, + "learning_rate": 5.891810026795076e-08, + "loss": 0.0005, + "step": 36380 + }, + { + "epoch": 0.71, + "learning_rate": 5.8914216923614615e-08, + "loss": 0.0006, + "step": 36381 + }, + { + "epoch": 0.71, + "learning_rate": 5.8910333579278474e-08, + "loss": 0.0005, + "step": 36382 + }, + { + "epoch": 0.71, + "learning_rate": 5.890645023494233e-08, + "loss": 1.23, + "step": 36383 + }, + { + "epoch": 0.71, + "learning_rate": 5.8902566890606184e-08, + "loss": 0.0005, + "step": 36384 + }, + { + "epoch": 0.71, + "learning_rate": 5.889868354627004e-08, + "loss": 0.0006, + "step": 36385 + }, + { + "epoch": 0.71, + "learning_rate": 5.88948002019339e-08, + "loss": 0.0006, + "step": 36386 + }, + { + "epoch": 0.71, + "learning_rate": 5.889091685759776e-08, + "loss": 0.0004, + "step": 36387 + }, + { + "epoch": 0.71, + "learning_rate": 5.8887033513261617e-08, + "loss": 0.0003, + "step": 36388 + }, + { + "epoch": 0.71, + "learning_rate": 5.8883150168925475e-08, + "loss": 0.0011, + "step": 36389 + }, + { + "epoch": 0.71, + "learning_rate": 5.887926682458933e-08, + "loss": 0.0024, + "step": 36390 + }, + { + "epoch": 0.71, + "learning_rate": 5.887538348025319e-08, + "loss": 0.0006, + "step": 36391 + }, + { + "epoch": 0.71, + "learning_rate": 5.887150013591705e-08, + "loss": 0.0007, + "step": 36392 + }, + { + "epoch": 0.71, + "learning_rate": 5.886761679158091e-08, + "loss": 0.0006, + "step": 36393 + }, + { + "epoch": 0.71, + "learning_rate": 5.8863733447244766e-08, + "loss": 0.0005, + "step": 36394 + }, + { + "epoch": 0.71, + "learning_rate": 5.8859850102908624e-08, + "loss": 0.0004, + "step": 36395 + }, + { + "epoch": 0.71, + "learning_rate": 5.885596675857248e-08, + "loss": 0.0007, + "step": 36396 + }, + { + "epoch": 0.71, + "learning_rate": 5.885208341423634e-08, + "loss": 0.0003, + "step": 36397 + }, + { + "epoch": 0.71, + "learning_rate": 5.88482000699002e-08, + "loss": 0.0003, + "step": 36398 + }, + { + "epoch": 0.71, + "learning_rate": 5.884431672556406e-08, + "loss": 0.0004, + "step": 36399 + }, + { + "epoch": 0.71, + "learning_rate": 5.8840433381227916e-08, + "loss": 0.0006, + "step": 36400 + }, + { + "epoch": 0.71, + "learning_rate": 5.883655003689176e-08, + "loss": 0.0003, + "step": 36401 + }, + { + "epoch": 0.71, + "learning_rate": 5.883266669255562e-08, + "loss": 0.0004, + "step": 36402 + }, + { + "epoch": 0.71, + "learning_rate": 5.882878334821948e-08, + "loss": 0.0006, + "step": 36403 + }, + { + "epoch": 0.71, + "learning_rate": 5.8824900003883335e-08, + "loss": 0.0004, + "step": 36404 + }, + { + "epoch": 0.71, + "learning_rate": 5.8821016659547194e-08, + "loss": 0.0006, + "step": 36405 + }, + { + "epoch": 0.71, + "learning_rate": 5.881713331521105e-08, + "loss": 0.0004, + "step": 36406 + }, + { + "epoch": 0.71, + "learning_rate": 5.881324997087491e-08, + "loss": 0.0004, + "step": 36407 + }, + { + "epoch": 0.71, + "learning_rate": 5.880936662653877e-08, + "loss": 0.0003, + "step": 36408 + }, + { + "epoch": 0.71, + "learning_rate": 5.8805483282202626e-08, + "loss": 0.0385, + "step": 36409 + }, + { + "epoch": 0.71, + "learning_rate": 5.8801599937866485e-08, + "loss": 0.0006, + "step": 36410 + }, + { + "epoch": 0.71, + "learning_rate": 5.879771659353034e-08, + "loss": 0.2708, + "step": 36411 + }, + { + "epoch": 0.71, + "learning_rate": 5.87938332491942e-08, + "loss": 0.0003, + "step": 36412 + }, + { + "epoch": 0.71, + "learning_rate": 5.878994990485806e-08, + "loss": 0.0004, + "step": 36413 + }, + { + "epoch": 0.71, + "learning_rate": 5.878606656052192e-08, + "loss": 0.0005, + "step": 36414 + }, + { + "epoch": 0.71, + "learning_rate": 5.8782183216185776e-08, + "loss": 0.8403, + "step": 36415 + }, + { + "epoch": 0.71, + "learning_rate": 5.8778299871849634e-08, + "loss": 0.0004, + "step": 36416 + }, + { + "epoch": 0.71, + "learning_rate": 5.877441652751349e-08, + "loss": 0.0004, + "step": 36417 + }, + { + "epoch": 0.71, + "learning_rate": 5.877053318317735e-08, + "loss": 0.0004, + "step": 36418 + }, + { + "epoch": 0.71, + "learning_rate": 5.876664983884121e-08, + "loss": 0.0003, + "step": 36419 + }, + { + "epoch": 0.71, + "learning_rate": 5.876276649450507e-08, + "loss": 0.0003, + "step": 36420 + }, + { + "epoch": 0.71, + "learning_rate": 5.8758883150168925e-08, + "loss": 0.0004, + "step": 36421 + }, + { + "epoch": 0.71, + "learning_rate": 5.8754999805832784e-08, + "loss": 0.0708, + "step": 36422 + }, + { + "epoch": 0.71, + "learning_rate": 5.875111646149664e-08, + "loss": 0.0004, + "step": 36423 + }, + { + "epoch": 0.71, + "learning_rate": 5.87472331171605e-08, + "loss": 0.0113, + "step": 36424 + }, + { + "epoch": 0.71, + "learning_rate": 5.874334977282436e-08, + "loss": 0.2972, + "step": 36425 + }, + { + "epoch": 0.71, + "learning_rate": 5.8739466428488217e-08, + "loss": 0.0004, + "step": 36426 + }, + { + "epoch": 0.71, + "learning_rate": 5.8735583084152075e-08, + "loss": 0.0005, + "step": 36427 + }, + { + "epoch": 0.71, + "learning_rate": 5.873169973981593e-08, + "loss": 0.0004, + "step": 36428 + }, + { + "epoch": 0.71, + "learning_rate": 5.872781639547979e-08, + "loss": 0.0004, + "step": 36429 + }, + { + "epoch": 0.71, + "learning_rate": 5.8723933051143636e-08, + "loss": 1.2028, + "step": 36430 + }, + { + "epoch": 0.71, + "learning_rate": 5.8720049706807495e-08, + "loss": 0.0006, + "step": 36431 + }, + { + "epoch": 0.71, + "learning_rate": 5.871616636247135e-08, + "loss": 0.0015, + "step": 36432 + }, + { + "epoch": 0.71, + "learning_rate": 5.871228301813521e-08, + "loss": 0.0302, + "step": 36433 + }, + { + "epoch": 0.71, + "learning_rate": 5.870839967379907e-08, + "loss": 0.0006, + "step": 36434 + }, + { + "epoch": 0.71, + "learning_rate": 5.870451632946293e-08, + "loss": 0.0004, + "step": 36435 + }, + { + "epoch": 0.71, + "learning_rate": 5.8700632985126786e-08, + "loss": 0.0004, + "step": 36436 + }, + { + "epoch": 0.71, + "learning_rate": 5.8696749640790644e-08, + "loss": 0.0969, + "step": 36437 + }, + { + "epoch": 0.71, + "learning_rate": 5.86928662964545e-08, + "loss": 0.0048, + "step": 36438 + }, + { + "epoch": 0.71, + "learning_rate": 5.868898295211836e-08, + "loss": 0.001, + "step": 36439 + }, + { + "epoch": 0.71, + "learning_rate": 5.868509960778222e-08, + "loss": 0.0003, + "step": 36440 + }, + { + "epoch": 0.71, + "learning_rate": 5.868121626344608e-08, + "loss": 0.0006, + "step": 36441 + }, + { + "epoch": 0.71, + "learning_rate": 5.8677332919109935e-08, + "loss": 0.0007, + "step": 36442 + }, + { + "epoch": 0.71, + "learning_rate": 5.8673449574773794e-08, + "loss": 0.0006, + "step": 36443 + }, + { + "epoch": 0.71, + "learning_rate": 5.866956623043765e-08, + "loss": 1.0359, + "step": 36444 + }, + { + "epoch": 0.71, + "learning_rate": 5.866568288610151e-08, + "loss": 0.0007, + "step": 36445 + }, + { + "epoch": 0.71, + "learning_rate": 5.866179954176537e-08, + "loss": 0.0004, + "step": 36446 + }, + { + "epoch": 0.71, + "learning_rate": 5.8657916197429227e-08, + "loss": 0.0006, + "step": 36447 + }, + { + "epoch": 0.71, + "learning_rate": 5.8654032853093085e-08, + "loss": 0.0008, + "step": 36448 + }, + { + "epoch": 0.71, + "learning_rate": 5.865014950875694e-08, + "loss": 0.0004, + "step": 36449 + }, + { + "epoch": 0.71, + "learning_rate": 5.86462661644208e-08, + "loss": 0.0003, + "step": 36450 + }, + { + "epoch": 0.71, + "learning_rate": 5.864238282008466e-08, + "loss": 0.0006, + "step": 36451 + }, + { + "epoch": 0.71, + "learning_rate": 5.863849947574852e-08, + "loss": 0.0006, + "step": 36452 + }, + { + "epoch": 0.71, + "learning_rate": 5.8634616131412376e-08, + "loss": 0.0004, + "step": 36453 + }, + { + "epoch": 0.71, + "learning_rate": 5.8630732787076234e-08, + "loss": 0.0817, + "step": 36454 + }, + { + "epoch": 0.71, + "learning_rate": 5.862684944274009e-08, + "loss": 0.1529, + "step": 36455 + }, + { + "epoch": 0.71, + "learning_rate": 5.862296609840395e-08, + "loss": 0.1086, + "step": 36456 + }, + { + "epoch": 0.71, + "learning_rate": 5.861908275406781e-08, + "loss": 0.0004, + "step": 36457 + }, + { + "epoch": 0.71, + "learning_rate": 5.861519940973166e-08, + "loss": 0.0003, + "step": 36458 + }, + { + "epoch": 0.71, + "learning_rate": 5.861131606539551e-08, + "loss": 0.0013, + "step": 36459 + }, + { + "epoch": 0.71, + "learning_rate": 5.860743272105937e-08, + "loss": 0.0008, + "step": 36460 + }, + { + "epoch": 0.71, + "learning_rate": 5.860354937672323e-08, + "loss": 0.0008, + "step": 36461 + }, + { + "epoch": 0.71, + "learning_rate": 5.859966603238709e-08, + "loss": 0.0004, + "step": 36462 + }, + { + "epoch": 0.71, + "learning_rate": 5.8595782688050945e-08, + "loss": 0.0004, + "step": 36463 + }, + { + "epoch": 0.71, + "learning_rate": 5.8591899343714803e-08, + "loss": 0.0006, + "step": 36464 + }, + { + "epoch": 0.71, + "learning_rate": 5.858801599937866e-08, + "loss": 0.0005, + "step": 36465 + }, + { + "epoch": 0.71, + "learning_rate": 5.858413265504252e-08, + "loss": 0.0004, + "step": 36466 + }, + { + "epoch": 0.71, + "learning_rate": 5.858024931070638e-08, + "loss": 0.0006, + "step": 36467 + }, + { + "epoch": 0.71, + "learning_rate": 5.8576365966370236e-08, + "loss": 0.0004, + "step": 36468 + }, + { + "epoch": 0.71, + "learning_rate": 5.8572482622034095e-08, + "loss": 0.0003, + "step": 36469 + }, + { + "epoch": 0.71, + "learning_rate": 5.856859927769795e-08, + "loss": 0.0154, + "step": 36470 + }, + { + "epoch": 0.71, + "learning_rate": 5.856471593336181e-08, + "loss": 1.0613, + "step": 36471 + }, + { + "epoch": 0.71, + "learning_rate": 5.856083258902566e-08, + "loss": 0.0005, + "step": 36472 + }, + { + "epoch": 0.71, + "learning_rate": 5.855694924468952e-08, + "loss": 0.0004, + "step": 36473 + }, + { + "epoch": 0.71, + "learning_rate": 5.855306590035338e-08, + "loss": 0.0005, + "step": 36474 + }, + { + "epoch": 0.71, + "learning_rate": 5.854918255601724e-08, + "loss": 0.8621, + "step": 36475 + }, + { + "epoch": 0.71, + "learning_rate": 5.8545299211681096e-08, + "loss": 0.0007, + "step": 36476 + }, + { + "epoch": 0.71, + "learning_rate": 5.8541415867344954e-08, + "loss": 0.0012, + "step": 36477 + }, + { + "epoch": 0.71, + "learning_rate": 5.853753252300881e-08, + "loss": 0.0005, + "step": 36478 + }, + { + "epoch": 0.71, + "learning_rate": 5.853364917867267e-08, + "loss": 0.0003, + "step": 36479 + }, + { + "epoch": 0.71, + "learning_rate": 5.852976583433653e-08, + "loss": 0.0003, + "step": 36480 + }, + { + "epoch": 0.71, + "learning_rate": 5.852588249000039e-08, + "loss": 0.0004, + "step": 36481 + }, + { + "epoch": 0.71, + "learning_rate": 5.8521999145664245e-08, + "loss": 0.0006, + "step": 36482 + }, + { + "epoch": 0.71, + "learning_rate": 5.8518115801328103e-08, + "loss": 0.0004, + "step": 36483 + }, + { + "epoch": 0.71, + "learning_rate": 5.851423245699196e-08, + "loss": 0.0004, + "step": 36484 + }, + { + "epoch": 0.71, + "learning_rate": 5.851034911265582e-08, + "loss": 0.0007, + "step": 36485 + }, + { + "epoch": 0.71, + "learning_rate": 5.850646576831968e-08, + "loss": 0.0004, + "step": 36486 + }, + { + "epoch": 0.71, + "learning_rate": 5.8502582423983536e-08, + "loss": 0.0083, + "step": 36487 + }, + { + "epoch": 0.71, + "learning_rate": 5.849869907964738e-08, + "loss": 0.0006, + "step": 36488 + }, + { + "epoch": 0.71, + "learning_rate": 5.849481573531124e-08, + "loss": 0.0005, + "step": 36489 + }, + { + "epoch": 0.71, + "learning_rate": 5.84909323909751e-08, + "loss": 0.0004, + "step": 36490 + }, + { + "epoch": 0.71, + "learning_rate": 5.8487049046638956e-08, + "loss": 0.5285, + "step": 36491 + }, + { + "epoch": 0.71, + "learning_rate": 5.8483165702302814e-08, + "loss": 0.0073, + "step": 36492 + }, + { + "epoch": 0.71, + "learning_rate": 5.847928235796667e-08, + "loss": 0.0005, + "step": 36493 + }, + { + "epoch": 0.71, + "learning_rate": 5.847539901363053e-08, + "loss": 0.0005, + "step": 36494 + }, + { + "epoch": 0.71, + "learning_rate": 5.847151566929439e-08, + "loss": 0.0007, + "step": 36495 + }, + { + "epoch": 0.71, + "learning_rate": 5.846763232495825e-08, + "loss": 0.0006, + "step": 36496 + }, + { + "epoch": 0.71, + "learning_rate": 5.8463748980622106e-08, + "loss": 0.0004, + "step": 36497 + }, + { + "epoch": 0.71, + "learning_rate": 5.8459865636285964e-08, + "loss": 0.0005, + "step": 36498 + }, + { + "epoch": 0.71, + "learning_rate": 5.845598229194982e-08, + "loss": 0.0006, + "step": 36499 + }, + { + "epoch": 0.71, + "learning_rate": 5.845209894761368e-08, + "loss": 0.0003, + "step": 36500 + }, + { + "epoch": 0.71, + "learning_rate": 5.844821560327754e-08, + "loss": 0.0006, + "step": 36501 + }, + { + "epoch": 0.71, + "learning_rate": 5.84443322589414e-08, + "loss": 0.0003, + "step": 36502 + }, + { + "epoch": 0.71, + "learning_rate": 5.8440448914605255e-08, + "loss": 0.0008, + "step": 36503 + }, + { + "epoch": 0.71, + "learning_rate": 5.8436565570269113e-08, + "loss": 0.2186, + "step": 36504 + }, + { + "epoch": 0.71, + "learning_rate": 5.843268222593297e-08, + "loss": 0.9052, + "step": 36505 + }, + { + "epoch": 0.71, + "learning_rate": 5.842879888159683e-08, + "loss": 0.0004, + "step": 36506 + }, + { + "epoch": 0.71, + "learning_rate": 5.842491553726069e-08, + "loss": 0.0005, + "step": 36507 + }, + { + "epoch": 0.71, + "learning_rate": 5.8421032192924546e-08, + "loss": 0.039, + "step": 36508 + }, + { + "epoch": 0.71, + "learning_rate": 5.8417148848588405e-08, + "loss": 0.0004, + "step": 36509 + }, + { + "epoch": 0.71, + "learning_rate": 5.841326550425226e-08, + "loss": 0.0004, + "step": 36510 + }, + { + "epoch": 0.71, + "learning_rate": 5.840938215991612e-08, + "loss": 0.0003, + "step": 36511 + }, + { + "epoch": 0.71, + "learning_rate": 5.840549881557998e-08, + "loss": 0.0006, + "step": 36512 + }, + { + "epoch": 0.71, + "learning_rate": 5.840161547124384e-08, + "loss": 0.0006, + "step": 36513 + }, + { + "epoch": 0.71, + "learning_rate": 5.8397732126907696e-08, + "loss": 0.0003, + "step": 36514 + }, + { + "epoch": 0.71, + "learning_rate": 5.8393848782571554e-08, + "loss": 0.0004, + "step": 36515 + }, + { + "epoch": 0.71, + "learning_rate": 5.838996543823541e-08, + "loss": 0.0004, + "step": 36516 + }, + { + "epoch": 0.71, + "learning_rate": 5.838608209389926e-08, + "loss": 0.9437, + "step": 36517 + }, + { + "epoch": 0.71, + "learning_rate": 5.8382198749563116e-08, + "loss": 0.0007, + "step": 36518 + }, + { + "epoch": 0.71, + "learning_rate": 5.8378315405226974e-08, + "loss": 0.0006, + "step": 36519 + }, + { + "epoch": 0.71, + "learning_rate": 5.837443206089083e-08, + "loss": 0.0004, + "step": 36520 + }, + { + "epoch": 0.71, + "learning_rate": 5.837054871655469e-08, + "loss": 0.0005, + "step": 36521 + }, + { + "epoch": 0.71, + "learning_rate": 5.836666537221855e-08, + "loss": 0.0005, + "step": 36522 + }, + { + "epoch": 0.71, + "learning_rate": 5.836278202788241e-08, + "loss": 0.0007, + "step": 36523 + }, + { + "epoch": 0.71, + "learning_rate": 5.8358898683546265e-08, + "loss": 0.0005, + "step": 36524 + }, + { + "epoch": 0.71, + "learning_rate": 5.835501533921012e-08, + "loss": 0.0005, + "step": 36525 + }, + { + "epoch": 0.71, + "learning_rate": 5.835113199487398e-08, + "loss": 0.001, + "step": 36526 + }, + { + "epoch": 0.71, + "learning_rate": 5.834724865053784e-08, + "loss": 0.0004, + "step": 36527 + }, + { + "epoch": 0.71, + "learning_rate": 5.83433653062017e-08, + "loss": 0.0004, + "step": 36528 + }, + { + "epoch": 0.71, + "learning_rate": 5.8339481961865556e-08, + "loss": 0.0006, + "step": 36529 + }, + { + "epoch": 0.71, + "learning_rate": 5.8335598617529414e-08, + "loss": 0.0004, + "step": 36530 + }, + { + "epoch": 0.71, + "learning_rate": 5.833171527319327e-08, + "loss": 0.0007, + "step": 36531 + }, + { + "epoch": 0.71, + "learning_rate": 5.832783192885713e-08, + "loss": 0.0006, + "step": 36532 + }, + { + "epoch": 0.71, + "learning_rate": 5.832394858452099e-08, + "loss": 0.0005, + "step": 36533 + }, + { + "epoch": 0.71, + "learning_rate": 5.832006524018485e-08, + "loss": 0.0004, + "step": 36534 + }, + { + "epoch": 0.71, + "learning_rate": 5.8316181895848706e-08, + "loss": 0.0006, + "step": 36535 + }, + { + "epoch": 0.71, + "learning_rate": 5.8312298551512564e-08, + "loss": 0.0007, + "step": 36536 + }, + { + "epoch": 0.71, + "learning_rate": 5.830841520717642e-08, + "loss": 0.0006, + "step": 36537 + }, + { + "epoch": 0.71, + "learning_rate": 5.830453186284028e-08, + "loss": 0.2721, + "step": 36538 + }, + { + "epoch": 0.71, + "learning_rate": 5.830064851850414e-08, + "loss": 0.0006, + "step": 36539 + }, + { + "epoch": 0.71, + "learning_rate": 5.8296765174168e-08, + "loss": 0.0005, + "step": 36540 + }, + { + "epoch": 0.71, + "learning_rate": 5.8292881829831855e-08, + "loss": 0.0006, + "step": 36541 + }, + { + "epoch": 0.71, + "learning_rate": 5.8288998485495713e-08, + "loss": 0.0005, + "step": 36542 + }, + { + "epoch": 0.71, + "learning_rate": 5.828511514115957e-08, + "loss": 0.0042, + "step": 36543 + }, + { + "epoch": 0.71, + "learning_rate": 5.828123179682343e-08, + "loss": 0.0004, + "step": 36544 + }, + { + "epoch": 0.71, + "learning_rate": 5.827734845248729e-08, + "loss": 0.0004, + "step": 36545 + }, + { + "epoch": 0.71, + "learning_rate": 5.827346510815113e-08, + "loss": 0.0008, + "step": 36546 + }, + { + "epoch": 0.71, + "learning_rate": 5.826958176381499e-08, + "loss": 0.0003, + "step": 36547 + }, + { + "epoch": 0.71, + "learning_rate": 5.826569841947885e-08, + "loss": 0.0003, + "step": 36548 + }, + { + "epoch": 0.71, + "learning_rate": 5.826181507514271e-08, + "loss": 0.0005, + "step": 36549 + }, + { + "epoch": 0.71, + "learning_rate": 5.8257931730806566e-08, + "loss": 0.0004, + "step": 36550 + }, + { + "epoch": 0.71, + "learning_rate": 5.8254048386470424e-08, + "loss": 0.0004, + "step": 36551 + }, + { + "epoch": 0.71, + "learning_rate": 5.825016504213428e-08, + "loss": 0.0004, + "step": 36552 + }, + { + "epoch": 0.71, + "learning_rate": 5.824628169779814e-08, + "loss": 0.4276, + "step": 36553 + }, + { + "epoch": 0.71, + "learning_rate": 5.8242398353462e-08, + "loss": 0.3593, + "step": 36554 + }, + { + "epoch": 0.71, + "learning_rate": 5.823851500912586e-08, + "loss": 0.0006, + "step": 36555 + }, + { + "epoch": 0.71, + "learning_rate": 5.8234631664789716e-08, + "loss": 0.0005, + "step": 36556 + }, + { + "epoch": 0.71, + "learning_rate": 5.8230748320453574e-08, + "loss": 0.0004, + "step": 36557 + }, + { + "epoch": 0.71, + "learning_rate": 5.822686497611743e-08, + "loss": 0.0005, + "step": 36558 + }, + { + "epoch": 0.71, + "learning_rate": 5.822298163178129e-08, + "loss": 0.0004, + "step": 36559 + }, + { + "epoch": 0.71, + "learning_rate": 5.821909828744515e-08, + "loss": 0.4167, + "step": 36560 + }, + { + "epoch": 0.71, + "learning_rate": 5.8215214943109e-08, + "loss": 0.019, + "step": 36561 + }, + { + "epoch": 0.71, + "learning_rate": 5.821133159877286e-08, + "loss": 0.0003, + "step": 36562 + }, + { + "epoch": 0.71, + "learning_rate": 5.820744825443672e-08, + "loss": 0.0004, + "step": 36563 + }, + { + "epoch": 0.71, + "learning_rate": 5.8203564910100575e-08, + "loss": 0.0004, + "step": 36564 + }, + { + "epoch": 0.71, + "learning_rate": 5.819968156576443e-08, + "loss": 0.0005, + "step": 36565 + }, + { + "epoch": 0.71, + "learning_rate": 5.819579822142829e-08, + "loss": 0.0028, + "step": 36566 + }, + { + "epoch": 0.71, + "learning_rate": 5.819191487709215e-08, + "loss": 0.0003, + "step": 36567 + }, + { + "epoch": 0.71, + "learning_rate": 5.818803153275601e-08, + "loss": 0.005, + "step": 36568 + }, + { + "epoch": 0.71, + "learning_rate": 5.8184148188419866e-08, + "loss": 0.0005, + "step": 36569 + }, + { + "epoch": 0.71, + "learning_rate": 5.8180264844083724e-08, + "loss": 0.0005, + "step": 36570 + }, + { + "epoch": 0.71, + "learning_rate": 5.817638149974758e-08, + "loss": 0.0004, + "step": 36571 + }, + { + "epoch": 0.71, + "learning_rate": 5.817249815541144e-08, + "loss": 0.0003, + "step": 36572 + }, + { + "epoch": 0.71, + "learning_rate": 5.81686148110753e-08, + "loss": 0.0004, + "step": 36573 + }, + { + "epoch": 0.71, + "learning_rate": 5.816473146673916e-08, + "loss": 0.0004, + "step": 36574 + }, + { + "epoch": 0.71, + "learning_rate": 5.8160848122403e-08, + "loss": 0.0004, + "step": 36575 + }, + { + "epoch": 0.71, + "learning_rate": 5.815696477806686e-08, + "loss": 0.0004, + "step": 36576 + }, + { + "epoch": 0.71, + "learning_rate": 5.815308143373072e-08, + "loss": 0.0005, + "step": 36577 + }, + { + "epoch": 0.71, + "learning_rate": 5.814919808939458e-08, + "loss": 0.0004, + "step": 36578 + }, + { + "epoch": 0.71, + "learning_rate": 5.8145314745058435e-08, + "loss": 0.0005, + "step": 36579 + }, + { + "epoch": 0.71, + "learning_rate": 5.8141431400722294e-08, + "loss": 0.0004, + "step": 36580 + }, + { + "epoch": 0.71, + "learning_rate": 5.813754805638615e-08, + "loss": 0.0004, + "step": 36581 + }, + { + "epoch": 0.71, + "learning_rate": 5.813366471205001e-08, + "loss": 0.0005, + "step": 36582 + }, + { + "epoch": 0.71, + "learning_rate": 5.812978136771387e-08, + "loss": 0.0003, + "step": 36583 + }, + { + "epoch": 0.71, + "learning_rate": 5.8125898023377727e-08, + "loss": 0.001, + "step": 36584 + }, + { + "epoch": 0.71, + "learning_rate": 5.8122014679041585e-08, + "loss": 0.0019, + "step": 36585 + }, + { + "epoch": 0.71, + "learning_rate": 5.811813133470544e-08, + "loss": 0.0006, + "step": 36586 + }, + { + "epoch": 0.71, + "learning_rate": 5.81142479903693e-08, + "loss": 0.196, + "step": 36587 + }, + { + "epoch": 0.71, + "learning_rate": 5.811036464603316e-08, + "loss": 0.2041, + "step": 36588 + }, + { + "epoch": 0.71, + "learning_rate": 5.810648130169702e-08, + "loss": 0.0003, + "step": 36589 + }, + { + "epoch": 0.71, + "learning_rate": 5.8102597957360876e-08, + "loss": 0.0005, + "step": 36590 + }, + { + "epoch": 0.71, + "learning_rate": 5.8098714613024734e-08, + "loss": 0.0052, + "step": 36591 + }, + { + "epoch": 0.71, + "learning_rate": 5.809483126868859e-08, + "loss": 0.0007, + "step": 36592 + }, + { + "epoch": 0.71, + "learning_rate": 5.809094792435245e-08, + "loss": 0.0004, + "step": 36593 + }, + { + "epoch": 0.71, + "learning_rate": 5.808706458001631e-08, + "loss": 0.0005, + "step": 36594 + }, + { + "epoch": 0.71, + "learning_rate": 5.808318123568017e-08, + "loss": 0.0003, + "step": 36595 + }, + { + "epoch": 0.71, + "learning_rate": 5.8079297891344026e-08, + "loss": 0.0005, + "step": 36596 + }, + { + "epoch": 0.71, + "learning_rate": 5.8075414547007884e-08, + "loss": 0.0004, + "step": 36597 + }, + { + "epoch": 0.71, + "learning_rate": 5.807153120267174e-08, + "loss": 0.0004, + "step": 36598 + }, + { + "epoch": 0.71, + "learning_rate": 5.80676478583356e-08, + "loss": 0.0005, + "step": 36599 + }, + { + "epoch": 0.71, + "learning_rate": 5.806376451399946e-08, + "loss": 0.0004, + "step": 36600 + }, + { + "epoch": 0.71, + "learning_rate": 5.805988116966332e-08, + "loss": 0.0007, + "step": 36601 + }, + { + "epoch": 0.71, + "learning_rate": 5.8055997825327175e-08, + "loss": 0.0003, + "step": 36602 + }, + { + "epoch": 0.71, + "learning_rate": 5.805211448099103e-08, + "loss": 0.0006, + "step": 36603 + }, + { + "epoch": 0.71, + "learning_rate": 5.804823113665488e-08, + "loss": 0.0005, + "step": 36604 + }, + { + "epoch": 0.71, + "learning_rate": 5.8044347792318736e-08, + "loss": 0.0004, + "step": 36605 + }, + { + "epoch": 0.71, + "learning_rate": 5.8040464447982595e-08, + "loss": 1.1235, + "step": 36606 + }, + { + "epoch": 0.71, + "learning_rate": 5.803658110364645e-08, + "loss": 0.0005, + "step": 36607 + }, + { + "epoch": 0.71, + "learning_rate": 5.803269775931031e-08, + "loss": 0.0004, + "step": 36608 + }, + { + "epoch": 0.71, + "learning_rate": 5.802881441497417e-08, + "loss": 0.0005, + "step": 36609 + }, + { + "epoch": 0.71, + "learning_rate": 5.802493107063803e-08, + "loss": 0.0003, + "step": 36610 + }, + { + "epoch": 0.71, + "learning_rate": 5.8021047726301886e-08, + "loss": 0.7746, + "step": 36611 + }, + { + "epoch": 0.71, + "learning_rate": 5.8017164381965744e-08, + "loss": 0.0003, + "step": 36612 + }, + { + "epoch": 0.71, + "learning_rate": 5.80132810376296e-08, + "loss": 0.0005, + "step": 36613 + }, + { + "epoch": 0.71, + "learning_rate": 5.800939769329346e-08, + "loss": 0.0012, + "step": 36614 + }, + { + "epoch": 0.71, + "learning_rate": 5.800551434895732e-08, + "loss": 1.3036, + "step": 36615 + }, + { + "epoch": 0.71, + "learning_rate": 5.800163100462118e-08, + "loss": 0.0004, + "step": 36616 + }, + { + "epoch": 0.71, + "learning_rate": 5.7997747660285035e-08, + "loss": 0.003, + "step": 36617 + }, + { + "epoch": 0.71, + "learning_rate": 5.7993864315948894e-08, + "loss": 0.0007, + "step": 36618 + }, + { + "epoch": 0.71, + "learning_rate": 5.798998097161275e-08, + "loss": 0.0004, + "step": 36619 + }, + { + "epoch": 0.71, + "learning_rate": 5.798609762727661e-08, + "loss": 0.0006, + "step": 36620 + }, + { + "epoch": 0.71, + "learning_rate": 5.798221428294047e-08, + "loss": 0.0033, + "step": 36621 + }, + { + "epoch": 0.71, + "learning_rate": 5.7978330938604327e-08, + "loss": 0.3499, + "step": 36622 + }, + { + "epoch": 0.71, + "learning_rate": 5.7974447594268185e-08, + "loss": 0.0004, + "step": 36623 + }, + { + "epoch": 0.71, + "learning_rate": 5.797056424993204e-08, + "loss": 0.0005, + "step": 36624 + }, + { + "epoch": 0.71, + "learning_rate": 5.79666809055959e-08, + "loss": 0.0005, + "step": 36625 + }, + { + "epoch": 0.71, + "learning_rate": 5.796279756125976e-08, + "loss": 0.0003, + "step": 36626 + }, + { + "epoch": 0.71, + "learning_rate": 5.795891421692362e-08, + "loss": 0.9542, + "step": 36627 + }, + { + "epoch": 0.71, + "learning_rate": 5.7955030872587476e-08, + "loss": 0.0005, + "step": 36628 + }, + { + "epoch": 0.71, + "learning_rate": 5.7951147528251334e-08, + "loss": 0.0004, + "step": 36629 + }, + { + "epoch": 0.71, + "learning_rate": 5.794726418391519e-08, + "loss": 0.0005, + "step": 36630 + }, + { + "epoch": 0.71, + "learning_rate": 5.794338083957905e-08, + "loss": 0.0003, + "step": 36631 + }, + { + "epoch": 0.71, + "learning_rate": 5.793949749524291e-08, + "loss": 0.415, + "step": 36632 + }, + { + "epoch": 0.71, + "learning_rate": 5.7935614150906754e-08, + "loss": 0.0005, + "step": 36633 + }, + { + "epoch": 0.71, + "learning_rate": 5.793173080657061e-08, + "loss": 0.0004, + "step": 36634 + }, + { + "epoch": 0.71, + "learning_rate": 5.792784746223447e-08, + "loss": 0.0005, + "step": 36635 + }, + { + "epoch": 0.71, + "learning_rate": 5.792396411789833e-08, + "loss": 0.0005, + "step": 36636 + }, + { + "epoch": 0.71, + "learning_rate": 5.792008077356219e-08, + "loss": 0.0004, + "step": 36637 + }, + { + "epoch": 0.71, + "learning_rate": 5.7916197429226045e-08, + "loss": 0.0004, + "step": 36638 + }, + { + "epoch": 0.71, + "learning_rate": 5.7912314084889904e-08, + "loss": 0.0006, + "step": 36639 + }, + { + "epoch": 0.71, + "learning_rate": 5.790843074055376e-08, + "loss": 0.0004, + "step": 36640 + }, + { + "epoch": 0.71, + "learning_rate": 5.790454739621762e-08, + "loss": 1.0595, + "step": 36641 + }, + { + "epoch": 0.71, + "learning_rate": 5.790066405188148e-08, + "loss": 0.0004, + "step": 36642 + }, + { + "epoch": 0.71, + "learning_rate": 5.7896780707545337e-08, + "loss": 0.0005, + "step": 36643 + }, + { + "epoch": 0.71, + "learning_rate": 5.7892897363209195e-08, + "loss": 0.0004, + "step": 36644 + }, + { + "epoch": 0.71, + "learning_rate": 5.788901401887305e-08, + "loss": 0.0005, + "step": 36645 + }, + { + "epoch": 0.71, + "learning_rate": 5.788513067453691e-08, + "loss": 0.0004, + "step": 36646 + }, + { + "epoch": 0.71, + "learning_rate": 5.788124733020077e-08, + "loss": 0.0005, + "step": 36647 + }, + { + "epoch": 0.71, + "learning_rate": 5.787736398586463e-08, + "loss": 0.0004, + "step": 36648 + }, + { + "epoch": 0.71, + "learning_rate": 5.787348064152848e-08, + "loss": 0.0425, + "step": 36649 + }, + { + "epoch": 0.71, + "learning_rate": 5.786959729719234e-08, + "loss": 0.0005, + "step": 36650 + }, + { + "epoch": 0.71, + "learning_rate": 5.7865713952856196e-08, + "loss": 0.0036, + "step": 36651 + }, + { + "epoch": 0.71, + "learning_rate": 5.7861830608520054e-08, + "loss": 1.0922, + "step": 36652 + }, + { + "epoch": 0.71, + "learning_rate": 5.785794726418391e-08, + "loss": 0.0004, + "step": 36653 + }, + { + "epoch": 0.71, + "learning_rate": 5.785406391984777e-08, + "loss": 0.0005, + "step": 36654 + }, + { + "epoch": 0.71, + "learning_rate": 5.785018057551163e-08, + "loss": 1.2338, + "step": 36655 + }, + { + "epoch": 0.71, + "learning_rate": 5.784629723117549e-08, + "loss": 0.0005, + "step": 36656 + }, + { + "epoch": 0.71, + "learning_rate": 5.7842413886839345e-08, + "loss": 0.0003, + "step": 36657 + }, + { + "epoch": 0.71, + "learning_rate": 5.7838530542503204e-08, + "loss": 0.0008, + "step": 36658 + }, + { + "epoch": 0.71, + "learning_rate": 5.783464719816706e-08, + "loss": 0.0004, + "step": 36659 + }, + { + "epoch": 0.71, + "learning_rate": 5.783076385383092e-08, + "loss": 0.0005, + "step": 36660 + }, + { + "epoch": 0.71, + "learning_rate": 5.782688050949478e-08, + "loss": 0.0005, + "step": 36661 + }, + { + "epoch": 0.71, + "learning_rate": 5.782299716515863e-08, + "loss": 0.0004, + "step": 36662 + }, + { + "epoch": 0.71, + "learning_rate": 5.781911382082249e-08, + "loss": 0.0006, + "step": 36663 + }, + { + "epoch": 0.71, + "learning_rate": 5.781523047648634e-08, + "loss": 0.0004, + "step": 36664 + }, + { + "epoch": 0.71, + "learning_rate": 5.78113471321502e-08, + "loss": 0.0006, + "step": 36665 + }, + { + "epoch": 0.71, + "learning_rate": 5.7807463787814056e-08, + "loss": 0.0006, + "step": 36666 + }, + { + "epoch": 0.71, + "learning_rate": 5.7803580443477915e-08, + "loss": 0.0005, + "step": 36667 + }, + { + "epoch": 0.71, + "learning_rate": 5.779969709914177e-08, + "loss": 0.0005, + "step": 36668 + }, + { + "epoch": 0.71, + "learning_rate": 5.779581375480563e-08, + "loss": 0.035, + "step": 36669 + }, + { + "epoch": 0.71, + "learning_rate": 5.779193041046949e-08, + "loss": 0.0005, + "step": 36670 + }, + { + "epoch": 0.71, + "learning_rate": 5.778804706613335e-08, + "loss": 0.0003, + "step": 36671 + }, + { + "epoch": 0.71, + "learning_rate": 5.7784163721797206e-08, + "loss": 0.0003, + "step": 36672 + }, + { + "epoch": 0.71, + "learning_rate": 5.7780280377461064e-08, + "loss": 1.3945, + "step": 36673 + }, + { + "epoch": 0.71, + "learning_rate": 5.777639703312492e-08, + "loss": 0.0005, + "step": 36674 + }, + { + "epoch": 0.71, + "learning_rate": 5.777251368878878e-08, + "loss": 0.0007, + "step": 36675 + }, + { + "epoch": 0.71, + "learning_rate": 5.776863034445264e-08, + "loss": 0.0012, + "step": 36676 + }, + { + "epoch": 0.71, + "learning_rate": 5.77647470001165e-08, + "loss": 0.0003, + "step": 36677 + }, + { + "epoch": 0.71, + "learning_rate": 5.7760863655780355e-08, + "loss": 0.0006, + "step": 36678 + }, + { + "epoch": 0.71, + "learning_rate": 5.7756980311444213e-08, + "loss": 0.0007, + "step": 36679 + }, + { + "epoch": 0.71, + "learning_rate": 5.775309696710807e-08, + "loss": 0.0005, + "step": 36680 + }, + { + "epoch": 0.71, + "learning_rate": 5.774921362277193e-08, + "loss": 0.0006, + "step": 36681 + }, + { + "epoch": 0.71, + "learning_rate": 5.774533027843579e-08, + "loss": 0.0005, + "step": 36682 + }, + { + "epoch": 0.71, + "learning_rate": 5.7741446934099646e-08, + "loss": 0.0008, + "step": 36683 + }, + { + "epoch": 0.71, + "learning_rate": 5.7737563589763505e-08, + "loss": 0.0004, + "step": 36684 + }, + { + "epoch": 0.71, + "learning_rate": 5.773368024542736e-08, + "loss": 0.0005, + "step": 36685 + }, + { + "epoch": 0.71, + "learning_rate": 5.772979690109122e-08, + "loss": 0.4477, + "step": 36686 + }, + { + "epoch": 0.71, + "learning_rate": 5.772591355675508e-08, + "loss": 0.0007, + "step": 36687 + }, + { + "epoch": 0.71, + "learning_rate": 5.772203021241894e-08, + "loss": 0.0004, + "step": 36688 + }, + { + "epoch": 0.71, + "learning_rate": 5.7718146868082796e-08, + "loss": 0.0005, + "step": 36689 + }, + { + "epoch": 0.71, + "learning_rate": 5.7714263523746654e-08, + "loss": 1.1722, + "step": 36690 + }, + { + "epoch": 0.71, + "learning_rate": 5.77103801794105e-08, + "loss": 0.0004, + "step": 36691 + }, + { + "epoch": 0.71, + "learning_rate": 5.770649683507436e-08, + "loss": 0.0502, + "step": 36692 + }, + { + "epoch": 0.71, + "learning_rate": 5.7702613490738216e-08, + "loss": 0.0005, + "step": 36693 + }, + { + "epoch": 0.71, + "learning_rate": 5.7698730146402074e-08, + "loss": 0.0005, + "step": 36694 + }, + { + "epoch": 0.71, + "learning_rate": 5.769484680206593e-08, + "loss": 0.0006, + "step": 36695 + }, + { + "epoch": 0.71, + "learning_rate": 5.769096345772979e-08, + "loss": 0.0406, + "step": 36696 + }, + { + "epoch": 0.71, + "learning_rate": 5.768708011339365e-08, + "loss": 0.0272, + "step": 36697 + }, + { + "epoch": 0.71, + "learning_rate": 5.768319676905751e-08, + "loss": 0.0005, + "step": 36698 + }, + { + "epoch": 0.71, + "learning_rate": 5.7679313424721365e-08, + "loss": 0.0023, + "step": 36699 + }, + { + "epoch": 0.71, + "learning_rate": 5.7675430080385223e-08, + "loss": 0.0004, + "step": 36700 + }, + { + "epoch": 0.71, + "learning_rate": 5.767154673604908e-08, + "loss": 0.001, + "step": 36701 + }, + { + "epoch": 0.71, + "learning_rate": 5.766766339171294e-08, + "loss": 0.0006, + "step": 36702 + }, + { + "epoch": 0.71, + "learning_rate": 5.76637800473768e-08, + "loss": 0.0005, + "step": 36703 + }, + { + "epoch": 0.71, + "learning_rate": 5.7659896703040656e-08, + "loss": 0.0107, + "step": 36704 + }, + { + "epoch": 0.71, + "learning_rate": 5.7656013358704515e-08, + "loss": 0.0101, + "step": 36705 + }, + { + "epoch": 0.71, + "learning_rate": 5.765213001436837e-08, + "loss": 0.014, + "step": 36706 + }, + { + "epoch": 0.71, + "learning_rate": 5.764824667003223e-08, + "loss": 0.0006, + "step": 36707 + }, + { + "epoch": 0.71, + "learning_rate": 5.764436332569609e-08, + "loss": 0.0004, + "step": 36708 + }, + { + "epoch": 0.71, + "learning_rate": 5.764047998135995e-08, + "loss": 0.0005, + "step": 36709 + }, + { + "epoch": 0.71, + "learning_rate": 5.7636596637023806e-08, + "loss": 0.0004, + "step": 36710 + }, + { + "epoch": 0.71, + "learning_rate": 5.7632713292687664e-08, + "loss": 0.0006, + "step": 36711 + }, + { + "epoch": 0.71, + "learning_rate": 5.762882994835152e-08, + "loss": 0.0005, + "step": 36712 + }, + { + "epoch": 0.71, + "learning_rate": 5.762494660401538e-08, + "loss": 0.8495, + "step": 36713 + }, + { + "epoch": 0.71, + "learning_rate": 5.762106325967924e-08, + "loss": 0.0005, + "step": 36714 + }, + { + "epoch": 0.71, + "learning_rate": 5.76171799153431e-08, + "loss": 0.0004, + "step": 36715 + }, + { + "epoch": 0.71, + "learning_rate": 5.7613296571006955e-08, + "loss": 0.0005, + "step": 36716 + }, + { + "epoch": 0.71, + "learning_rate": 5.7609413226670814e-08, + "loss": 0.7468, + "step": 36717 + }, + { + "epoch": 0.71, + "learning_rate": 5.760552988233467e-08, + "loss": 0.5628, + "step": 36718 + }, + { + "epoch": 0.71, + "learning_rate": 5.760164653799853e-08, + "loss": 0.0005, + "step": 36719 + }, + { + "epoch": 0.71, + "learning_rate": 5.7597763193662375e-08, + "loss": 0.0004, + "step": 36720 + }, + { + "epoch": 0.71, + "learning_rate": 5.759387984932623e-08, + "loss": 0.0007, + "step": 36721 + }, + { + "epoch": 0.71, + "learning_rate": 5.758999650499009e-08, + "loss": 0.001, + "step": 36722 + }, + { + "epoch": 0.71, + "learning_rate": 5.758611316065395e-08, + "loss": 0.7829, + "step": 36723 + }, + { + "epoch": 0.71, + "learning_rate": 5.758222981631781e-08, + "loss": 0.0007, + "step": 36724 + }, + { + "epoch": 0.71, + "learning_rate": 5.7578346471981666e-08, + "loss": 0.0004, + "step": 36725 + }, + { + "epoch": 0.71, + "learning_rate": 5.7574463127645524e-08, + "loss": 0.0004, + "step": 36726 + }, + { + "epoch": 0.71, + "learning_rate": 5.757057978330938e-08, + "loss": 0.004, + "step": 36727 + }, + { + "epoch": 0.71, + "learning_rate": 5.756669643897324e-08, + "loss": 0.0006, + "step": 36728 + }, + { + "epoch": 0.71, + "learning_rate": 5.75628130946371e-08, + "loss": 0.0003, + "step": 36729 + }, + { + "epoch": 0.71, + "learning_rate": 5.755892975030096e-08, + "loss": 0.0005, + "step": 36730 + }, + { + "epoch": 0.71, + "learning_rate": 5.7555046405964816e-08, + "loss": 0.0004, + "step": 36731 + }, + { + "epoch": 0.71, + "learning_rate": 5.7551163061628674e-08, + "loss": 0.0005, + "step": 36732 + }, + { + "epoch": 0.71, + "learning_rate": 5.754727971729253e-08, + "loss": 0.0005, + "step": 36733 + }, + { + "epoch": 0.71, + "learning_rate": 5.754339637295639e-08, + "loss": 0.0004, + "step": 36734 + }, + { + "epoch": 0.71, + "learning_rate": 5.753951302862025e-08, + "loss": 0.0006, + "step": 36735 + }, + { + "epoch": 0.71, + "learning_rate": 5.753562968428411e-08, + "loss": 0.0004, + "step": 36736 + }, + { + "epoch": 0.71, + "learning_rate": 5.7531746339947965e-08, + "loss": 0.0005, + "step": 36737 + }, + { + "epoch": 0.71, + "learning_rate": 5.752786299561182e-08, + "loss": 0.8533, + "step": 36738 + }, + { + "epoch": 0.71, + "learning_rate": 5.7523979651275675e-08, + "loss": 0.0222, + "step": 36739 + }, + { + "epoch": 0.71, + "learning_rate": 5.752009630693953e-08, + "loss": 0.0003, + "step": 36740 + }, + { + "epoch": 0.71, + "learning_rate": 5.751621296260339e-08, + "loss": 0.0003, + "step": 36741 + }, + { + "epoch": 0.71, + "learning_rate": 5.751232961826725e-08, + "loss": 0.0005, + "step": 36742 + }, + { + "epoch": 0.71, + "learning_rate": 5.750844627393111e-08, + "loss": 0.0006, + "step": 36743 + }, + { + "epoch": 0.71, + "learning_rate": 5.7504562929594966e-08, + "loss": 0.0004, + "step": 36744 + }, + { + "epoch": 0.71, + "learning_rate": 5.7500679585258825e-08, + "loss": 0.9491, + "step": 36745 + }, + { + "epoch": 0.71, + "learning_rate": 5.749679624092268e-08, + "loss": 0.0009, + "step": 36746 + }, + { + "epoch": 0.71, + "learning_rate": 5.749291289658654e-08, + "loss": 0.0063, + "step": 36747 + }, + { + "epoch": 0.71, + "learning_rate": 5.74890295522504e-08, + "loss": 0.0006, + "step": 36748 + }, + { + "epoch": 0.71, + "learning_rate": 5.748514620791425e-08, + "loss": 0.0004, + "step": 36749 + }, + { + "epoch": 0.71, + "learning_rate": 5.748126286357811e-08, + "loss": 0.0004, + "step": 36750 + }, + { + "epoch": 0.71, + "learning_rate": 5.747737951924197e-08, + "loss": 0.0008, + "step": 36751 + }, + { + "epoch": 0.71, + "learning_rate": 5.747349617490582e-08, + "loss": 0.0005, + "step": 36752 + }, + { + "epoch": 0.71, + "learning_rate": 5.746961283056968e-08, + "loss": 0.0004, + "step": 36753 + }, + { + "epoch": 0.71, + "learning_rate": 5.7465729486233535e-08, + "loss": 0.0004, + "step": 36754 + }, + { + "epoch": 0.71, + "learning_rate": 5.7461846141897394e-08, + "loss": 0.0007, + "step": 36755 + }, + { + "epoch": 0.71, + "learning_rate": 5.745796279756125e-08, + "loss": 0.0006, + "step": 36756 + }, + { + "epoch": 0.71, + "learning_rate": 5.745407945322511e-08, + "loss": 0.0003, + "step": 36757 + }, + { + "epoch": 0.71, + "learning_rate": 5.745019610888897e-08, + "loss": 0.0004, + "step": 36758 + }, + { + "epoch": 0.71, + "learning_rate": 5.744631276455283e-08, + "loss": 0.0004, + "step": 36759 + }, + { + "epoch": 0.71, + "learning_rate": 5.7442429420216685e-08, + "loss": 0.0005, + "step": 36760 + }, + { + "epoch": 0.71, + "learning_rate": 5.743854607588054e-08, + "loss": 0.0003, + "step": 36761 + }, + { + "epoch": 0.71, + "learning_rate": 5.74346627315444e-08, + "loss": 0.0005, + "step": 36762 + }, + { + "epoch": 0.71, + "learning_rate": 5.743077938720826e-08, + "loss": 0.001, + "step": 36763 + }, + { + "epoch": 0.71, + "learning_rate": 5.742689604287212e-08, + "loss": 0.0003, + "step": 36764 + }, + { + "epoch": 0.71, + "learning_rate": 5.7423012698535976e-08, + "loss": 0.0004, + "step": 36765 + }, + { + "epoch": 0.71, + "learning_rate": 5.7419129354199834e-08, + "loss": 0.0005, + "step": 36766 + }, + { + "epoch": 0.71, + "learning_rate": 5.741524600986369e-08, + "loss": 0.0005, + "step": 36767 + }, + { + "epoch": 0.71, + "learning_rate": 5.741136266552755e-08, + "loss": 0.4178, + "step": 36768 + }, + { + "epoch": 0.71, + "learning_rate": 5.740747932119141e-08, + "loss": 0.0006, + "step": 36769 + }, + { + "epoch": 0.71, + "learning_rate": 5.740359597685527e-08, + "loss": 0.0006, + "step": 36770 + }, + { + "epoch": 0.71, + "learning_rate": 5.7399712632519126e-08, + "loss": 0.0003, + "step": 36771 + }, + { + "epoch": 0.71, + "learning_rate": 5.7395829288182984e-08, + "loss": 0.0005, + "step": 36772 + }, + { + "epoch": 0.71, + "learning_rate": 5.739194594384684e-08, + "loss": 0.0005, + "step": 36773 + }, + { + "epoch": 0.71, + "learning_rate": 5.73880625995107e-08, + "loss": 0.0008, + "step": 36774 + }, + { + "epoch": 0.71, + "learning_rate": 5.738417925517456e-08, + "loss": 0.0003, + "step": 36775 + }, + { + "epoch": 0.71, + "learning_rate": 5.738029591083842e-08, + "loss": 0.0004, + "step": 36776 + }, + { + "epoch": 0.71, + "learning_rate": 5.7376412566502275e-08, + "loss": 0.0004, + "step": 36777 + }, + { + "epoch": 0.71, + "learning_rate": 5.737252922216612e-08, + "loss": 0.0004, + "step": 36778 + }, + { + "epoch": 0.71, + "learning_rate": 5.736864587782998e-08, + "loss": 0.0004, + "step": 36779 + }, + { + "epoch": 0.71, + "learning_rate": 5.7364762533493837e-08, + "loss": 0.752, + "step": 36780 + }, + { + "epoch": 0.71, + "learning_rate": 5.7360879189157695e-08, + "loss": 0.0004, + "step": 36781 + }, + { + "epoch": 0.71, + "learning_rate": 5.735699584482155e-08, + "loss": 0.0003, + "step": 36782 + }, + { + "epoch": 0.71, + "learning_rate": 5.735311250048541e-08, + "loss": 0.0007, + "step": 36783 + }, + { + "epoch": 0.71, + "learning_rate": 5.734922915614927e-08, + "loss": 0.0004, + "step": 36784 + }, + { + "epoch": 0.71, + "learning_rate": 5.734534581181313e-08, + "loss": 1.0401, + "step": 36785 + }, + { + "epoch": 0.71, + "learning_rate": 5.7341462467476986e-08, + "loss": 0.3728, + "step": 36786 + }, + { + "epoch": 0.71, + "learning_rate": 5.7337579123140844e-08, + "loss": 0.0005, + "step": 36787 + }, + { + "epoch": 0.71, + "learning_rate": 5.73336957788047e-08, + "loss": 0.0004, + "step": 36788 + }, + { + "epoch": 0.71, + "learning_rate": 5.732981243446856e-08, + "loss": 0.06, + "step": 36789 + }, + { + "epoch": 0.71, + "learning_rate": 5.732592909013242e-08, + "loss": 0.0004, + "step": 36790 + }, + { + "epoch": 0.71, + "learning_rate": 5.732204574579628e-08, + "loss": 0.0004, + "step": 36791 + }, + { + "epoch": 0.71, + "learning_rate": 5.7318162401460136e-08, + "loss": 0.3382, + "step": 36792 + }, + { + "epoch": 0.71, + "learning_rate": 5.7314279057123994e-08, + "loss": 0.7111, + "step": 36793 + }, + { + "epoch": 0.71, + "learning_rate": 5.731039571278785e-08, + "loss": 0.0004, + "step": 36794 + }, + { + "epoch": 0.71, + "learning_rate": 5.730651236845171e-08, + "loss": 0.9122, + "step": 36795 + }, + { + "epoch": 0.71, + "learning_rate": 5.730262902411557e-08, + "loss": 0.0005, + "step": 36796 + }, + { + "epoch": 0.71, + "learning_rate": 5.729874567977943e-08, + "loss": 0.0008, + "step": 36797 + }, + { + "epoch": 0.71, + "learning_rate": 5.7294862335443285e-08, + "loss": 0.0008, + "step": 36798 + }, + { + "epoch": 0.71, + "learning_rate": 5.729097899110714e-08, + "loss": 0.0006, + "step": 36799 + }, + { + "epoch": 0.71, + "learning_rate": 5.7287095646771e-08, + "loss": 1.2542, + "step": 36800 + }, + { + "epoch": 0.71, + "learning_rate": 5.728321230243486e-08, + "loss": 0.0007, + "step": 36801 + }, + { + "epoch": 0.71, + "learning_rate": 5.727932895809872e-08, + "loss": 1.0391, + "step": 36802 + }, + { + "epoch": 0.71, + "learning_rate": 5.7275445613762576e-08, + "loss": 0.0006, + "step": 36803 + }, + { + "epoch": 0.71, + "learning_rate": 5.7271562269426434e-08, + "loss": 0.7116, + "step": 36804 + }, + { + "epoch": 0.71, + "learning_rate": 5.726767892509029e-08, + "loss": 0.5476, + "step": 36805 + }, + { + "epoch": 0.71, + "learning_rate": 5.726379558075415e-08, + "loss": 0.0004, + "step": 36806 + }, + { + "epoch": 0.71, + "learning_rate": 5.7259912236417996e-08, + "loss": 0.0027, + "step": 36807 + }, + { + "epoch": 0.71, + "learning_rate": 5.7256028892081854e-08, + "loss": 0.0006, + "step": 36808 + }, + { + "epoch": 0.71, + "learning_rate": 5.725214554774571e-08, + "loss": 0.0004, + "step": 36809 + }, + { + "epoch": 0.71, + "learning_rate": 5.724826220340957e-08, + "loss": 0.0008, + "step": 36810 + }, + { + "epoch": 0.71, + "learning_rate": 5.724437885907343e-08, + "loss": 0.0018, + "step": 36811 + }, + { + "epoch": 0.71, + "learning_rate": 5.724049551473729e-08, + "loss": 0.0191, + "step": 36812 + }, + { + "epoch": 0.71, + "learning_rate": 5.7236612170401145e-08, + "loss": 0.0005, + "step": 36813 + }, + { + "epoch": 0.71, + "learning_rate": 5.7232728826065004e-08, + "loss": 0.1113, + "step": 36814 + }, + { + "epoch": 0.71, + "learning_rate": 5.722884548172886e-08, + "loss": 0.0005, + "step": 36815 + }, + { + "epoch": 0.71, + "learning_rate": 5.722496213739272e-08, + "loss": 0.0004, + "step": 36816 + }, + { + "epoch": 0.71, + "learning_rate": 5.722107879305658e-08, + "loss": 0.0004, + "step": 36817 + }, + { + "epoch": 0.71, + "learning_rate": 5.7217195448720437e-08, + "loss": 0.0005, + "step": 36818 + }, + { + "epoch": 0.71, + "learning_rate": 5.7213312104384295e-08, + "loss": 0.0006, + "step": 36819 + }, + { + "epoch": 0.71, + "learning_rate": 5.720942876004815e-08, + "loss": 0.0005, + "step": 36820 + }, + { + "epoch": 0.71, + "learning_rate": 5.720554541571201e-08, + "loss": 0.0005, + "step": 36821 + }, + { + "epoch": 0.71, + "learning_rate": 5.720166207137587e-08, + "loss": 0.0004, + "step": 36822 + }, + { + "epoch": 0.71, + "learning_rate": 5.719777872703973e-08, + "loss": 0.0006, + "step": 36823 + }, + { + "epoch": 0.71, + "learning_rate": 5.7193895382703586e-08, + "loss": 0.0003, + "step": 36824 + }, + { + "epoch": 0.71, + "learning_rate": 5.7190012038367444e-08, + "loss": 0.0004, + "step": 36825 + }, + { + "epoch": 0.71, + "learning_rate": 5.7186128694031296e-08, + "loss": 0.0009, + "step": 36826 + }, + { + "epoch": 0.71, + "learning_rate": 5.7182245349695154e-08, + "loss": 0.0005, + "step": 36827 + }, + { + "epoch": 0.71, + "learning_rate": 5.717836200535901e-08, + "loss": 0.0005, + "step": 36828 + }, + { + "epoch": 0.71, + "learning_rate": 5.717447866102287e-08, + "loss": 0.0004, + "step": 36829 + }, + { + "epoch": 0.71, + "learning_rate": 5.717059531668673e-08, + "loss": 0.0016, + "step": 36830 + }, + { + "epoch": 0.71, + "learning_rate": 5.716671197235059e-08, + "loss": 0.0009, + "step": 36831 + }, + { + "epoch": 0.71, + "learning_rate": 5.7162828628014445e-08, + "loss": 0.0005, + "step": 36832 + }, + { + "epoch": 0.71, + "learning_rate": 5.7158945283678304e-08, + "loss": 0.0011, + "step": 36833 + }, + { + "epoch": 0.71, + "learning_rate": 5.715506193934216e-08, + "loss": 0.0005, + "step": 36834 + }, + { + "epoch": 0.71, + "learning_rate": 5.715117859500602e-08, + "loss": 0.0008, + "step": 36835 + }, + { + "epoch": 0.71, + "learning_rate": 5.714729525066987e-08, + "loss": 0.0011, + "step": 36836 + }, + { + "epoch": 0.71, + "learning_rate": 5.714341190633373e-08, + "loss": 0.0004, + "step": 36837 + }, + { + "epoch": 0.71, + "learning_rate": 5.713952856199759e-08, + "loss": 0.0004, + "step": 36838 + }, + { + "epoch": 0.71, + "learning_rate": 5.7135645217661447e-08, + "loss": 0.0005, + "step": 36839 + }, + { + "epoch": 0.71, + "learning_rate": 5.7131761873325305e-08, + "loss": 0.0003, + "step": 36840 + }, + { + "epoch": 0.71, + "learning_rate": 5.7127878528989156e-08, + "loss": 0.0005, + "step": 36841 + }, + { + "epoch": 0.71, + "learning_rate": 5.7123995184653015e-08, + "loss": 0.0007, + "step": 36842 + }, + { + "epoch": 0.71, + "learning_rate": 5.712011184031687e-08, + "loss": 0.0005, + "step": 36843 + }, + { + "epoch": 0.71, + "learning_rate": 5.711622849598073e-08, + "loss": 0.301, + "step": 36844 + }, + { + "epoch": 0.71, + "learning_rate": 5.711234515164459e-08, + "loss": 0.007, + "step": 36845 + }, + { + "epoch": 0.71, + "learning_rate": 5.710846180730845e-08, + "loss": 0.0005, + "step": 36846 + }, + { + "epoch": 0.71, + "learning_rate": 5.7104578462972306e-08, + "loss": 0.0005, + "step": 36847 + }, + { + "epoch": 0.71, + "learning_rate": 5.7100695118636164e-08, + "loss": 0.5131, + "step": 36848 + }, + { + "epoch": 0.71, + "learning_rate": 5.709681177430002e-08, + "loss": 2.0909, + "step": 36849 + }, + { + "epoch": 0.71, + "learning_rate": 5.709292842996388e-08, + "loss": 0.0028, + "step": 36850 + }, + { + "epoch": 0.71, + "learning_rate": 5.708904508562774e-08, + "loss": 0.0004, + "step": 36851 + }, + { + "epoch": 0.71, + "learning_rate": 5.70851617412916e-08, + "loss": 0.0005, + "step": 36852 + }, + { + "epoch": 0.71, + "learning_rate": 5.7081278396955455e-08, + "loss": 1.0728, + "step": 36853 + }, + { + "epoch": 0.71, + "learning_rate": 5.7077395052619314e-08, + "loss": 0.0003, + "step": 36854 + }, + { + "epoch": 0.71, + "learning_rate": 5.707351170828317e-08, + "loss": 0.0004, + "step": 36855 + }, + { + "epoch": 0.71, + "learning_rate": 5.706962836394703e-08, + "loss": 0.0003, + "step": 36856 + }, + { + "epoch": 0.71, + "learning_rate": 5.706574501961089e-08, + "loss": 0.0006, + "step": 36857 + }, + { + "epoch": 0.71, + "learning_rate": 5.7061861675274747e-08, + "loss": 0.1173, + "step": 36858 + }, + { + "epoch": 0.71, + "learning_rate": 5.7057978330938605e-08, + "loss": 0.0006, + "step": 36859 + }, + { + "epoch": 0.72, + "learning_rate": 5.705409498660246e-08, + "loss": 0.0005, + "step": 36860 + }, + { + "epoch": 0.72, + "learning_rate": 5.705021164226632e-08, + "loss": 0.0003, + "step": 36861 + }, + { + "epoch": 0.72, + "learning_rate": 5.704632829793018e-08, + "loss": 0.0007, + "step": 36862 + }, + { + "epoch": 0.72, + "learning_rate": 5.704244495359404e-08, + "loss": 0.0004, + "step": 36863 + }, + { + "epoch": 0.72, + "learning_rate": 5.7038561609257896e-08, + "loss": 0.0007, + "step": 36864 + }, + { + "epoch": 0.72, + "learning_rate": 5.703467826492174e-08, + "loss": 0.0005, + "step": 36865 + }, + { + "epoch": 0.72, + "learning_rate": 5.70307949205856e-08, + "loss": 0.0005, + "step": 36866 + }, + { + "epoch": 0.72, + "learning_rate": 5.702691157624946e-08, + "loss": 0.0004, + "step": 36867 + }, + { + "epoch": 0.72, + "learning_rate": 5.7023028231913316e-08, + "loss": 0.0006, + "step": 36868 + }, + { + "epoch": 0.72, + "learning_rate": 5.7019144887577174e-08, + "loss": 0.0004, + "step": 36869 + }, + { + "epoch": 0.72, + "learning_rate": 5.701526154324103e-08, + "loss": 0.0004, + "step": 36870 + }, + { + "epoch": 0.72, + "learning_rate": 5.701137819890489e-08, + "loss": 0.0031, + "step": 36871 + }, + { + "epoch": 0.72, + "learning_rate": 5.700749485456875e-08, + "loss": 0.001, + "step": 36872 + }, + { + "epoch": 0.72, + "learning_rate": 5.700361151023261e-08, + "loss": 0.2734, + "step": 36873 + }, + { + "epoch": 0.72, + "learning_rate": 5.6999728165896465e-08, + "loss": 0.0006, + "step": 36874 + }, + { + "epoch": 0.72, + "learning_rate": 5.6995844821560323e-08, + "loss": 0.0006, + "step": 36875 + }, + { + "epoch": 0.72, + "learning_rate": 5.699196147722418e-08, + "loss": 0.0009, + "step": 36876 + }, + { + "epoch": 0.72, + "learning_rate": 5.698807813288804e-08, + "loss": 0.0005, + "step": 36877 + }, + { + "epoch": 0.72, + "learning_rate": 5.69841947885519e-08, + "loss": 0.0005, + "step": 36878 + }, + { + "epoch": 0.72, + "learning_rate": 5.6980311444215756e-08, + "loss": 0.0004, + "step": 36879 + }, + { + "epoch": 0.72, + "learning_rate": 5.6976428099879615e-08, + "loss": 0.0004, + "step": 36880 + }, + { + "epoch": 0.72, + "learning_rate": 5.697254475554347e-08, + "loss": 0.0024, + "step": 36881 + }, + { + "epoch": 0.72, + "learning_rate": 5.696866141120733e-08, + "loss": 0.0004, + "step": 36882 + }, + { + "epoch": 0.72, + "learning_rate": 5.696477806687119e-08, + "loss": 0.0005, + "step": 36883 + }, + { + "epoch": 0.72, + "learning_rate": 5.696089472253505e-08, + "loss": 0.0005, + "step": 36884 + }, + { + "epoch": 0.72, + "learning_rate": 5.6957011378198906e-08, + "loss": 0.0004, + "step": 36885 + }, + { + "epoch": 0.72, + "learning_rate": 5.6953128033862764e-08, + "loss": 0.0006, + "step": 36886 + }, + { + "epoch": 0.72, + "learning_rate": 5.694924468952662e-08, + "loss": 0.7779, + "step": 36887 + }, + { + "epoch": 0.72, + "learning_rate": 5.694536134519048e-08, + "loss": 0.0005, + "step": 36888 + }, + { + "epoch": 0.72, + "learning_rate": 5.694147800085434e-08, + "loss": 0.0005, + "step": 36889 + }, + { + "epoch": 0.72, + "learning_rate": 5.69375946565182e-08, + "loss": 0.0005, + "step": 36890 + }, + { + "epoch": 0.72, + "learning_rate": 5.6933711312182055e-08, + "loss": 0.0048, + "step": 36891 + }, + { + "epoch": 0.72, + "learning_rate": 5.6929827967845914e-08, + "loss": 1.1372, + "step": 36892 + }, + { + "epoch": 0.72, + "learning_rate": 5.692594462350977e-08, + "loss": 0.0004, + "step": 36893 + }, + { + "epoch": 0.72, + "learning_rate": 5.692206127917362e-08, + "loss": 0.0013, + "step": 36894 + }, + { + "epoch": 0.72, + "learning_rate": 5.6918177934837475e-08, + "loss": 0.0008, + "step": 36895 + }, + { + "epoch": 0.72, + "learning_rate": 5.6914294590501333e-08, + "loss": 0.0006, + "step": 36896 + }, + { + "epoch": 0.72, + "learning_rate": 5.691041124616519e-08, + "loss": 1.2139, + "step": 36897 + }, + { + "epoch": 0.72, + "learning_rate": 5.690652790182905e-08, + "loss": 0.0004, + "step": 36898 + }, + { + "epoch": 0.72, + "learning_rate": 5.690264455749291e-08, + "loss": 0.0849, + "step": 36899 + }, + { + "epoch": 0.72, + "learning_rate": 5.6898761213156766e-08, + "loss": 0.0003, + "step": 36900 + }, + { + "epoch": 0.72, + "learning_rate": 5.6894877868820625e-08, + "loss": 0.0009, + "step": 36901 + }, + { + "epoch": 0.72, + "learning_rate": 5.689099452448448e-08, + "loss": 0.0338, + "step": 36902 + }, + { + "epoch": 0.72, + "learning_rate": 5.688711118014834e-08, + "loss": 0.0006, + "step": 36903 + }, + { + "epoch": 0.72, + "learning_rate": 5.68832278358122e-08, + "loss": 0.0278, + "step": 36904 + }, + { + "epoch": 0.72, + "learning_rate": 5.687934449147606e-08, + "loss": 0.0004, + "step": 36905 + }, + { + "epoch": 0.72, + "learning_rate": 5.6875461147139916e-08, + "loss": 0.0004, + "step": 36906 + }, + { + "epoch": 0.72, + "learning_rate": 5.6871577802803774e-08, + "loss": 0.0036, + "step": 36907 + }, + { + "epoch": 0.72, + "learning_rate": 5.686769445846763e-08, + "loss": 0.5038, + "step": 36908 + }, + { + "epoch": 0.72, + "learning_rate": 5.686381111413149e-08, + "loss": 0.0005, + "step": 36909 + }, + { + "epoch": 0.72, + "learning_rate": 5.685992776979535e-08, + "loss": 0.0003, + "step": 36910 + }, + { + "epoch": 0.72, + "learning_rate": 5.685604442545921e-08, + "loss": 0.0005, + "step": 36911 + }, + { + "epoch": 0.72, + "learning_rate": 5.6852161081123065e-08, + "loss": 0.0008, + "step": 36912 + }, + { + "epoch": 0.72, + "learning_rate": 5.6848277736786924e-08, + "loss": 0.0003, + "step": 36913 + }, + { + "epoch": 0.72, + "learning_rate": 5.684439439245078e-08, + "loss": 0.0016, + "step": 36914 + }, + { + "epoch": 0.72, + "learning_rate": 5.6840511048114633e-08, + "loss": 0.0003, + "step": 36915 + }, + { + "epoch": 0.72, + "learning_rate": 5.683662770377849e-08, + "loss": 0.0007, + "step": 36916 + }, + { + "epoch": 0.72, + "learning_rate": 5.683274435944235e-08, + "loss": 0.0005, + "step": 36917 + }, + { + "epoch": 0.72, + "learning_rate": 5.682886101510621e-08, + "loss": 0.0004, + "step": 36918 + }, + { + "epoch": 0.72, + "learning_rate": 5.6824977670770066e-08, + "loss": 0.0008, + "step": 36919 + }, + { + "epoch": 0.72, + "learning_rate": 5.6821094326433925e-08, + "loss": 0.0005, + "step": 36920 + }, + { + "epoch": 0.72, + "learning_rate": 5.681721098209778e-08, + "loss": 0.0005, + "step": 36921 + }, + { + "epoch": 0.72, + "learning_rate": 5.681332763776164e-08, + "loss": 0.0004, + "step": 36922 + }, + { + "epoch": 0.72, + "learning_rate": 5.680944429342549e-08, + "loss": 0.0006, + "step": 36923 + }, + { + "epoch": 0.72, + "learning_rate": 5.680556094908935e-08, + "loss": 0.0005, + "step": 36924 + }, + { + "epoch": 0.72, + "learning_rate": 5.680167760475321e-08, + "loss": 0.0007, + "step": 36925 + }, + { + "epoch": 0.72, + "learning_rate": 5.679779426041707e-08, + "loss": 0.0005, + "step": 36926 + }, + { + "epoch": 0.72, + "learning_rate": 5.6793910916080926e-08, + "loss": 0.0004, + "step": 36927 + }, + { + "epoch": 0.72, + "learning_rate": 5.6790027571744784e-08, + "loss": 0.0003, + "step": 36928 + }, + { + "epoch": 0.72, + "learning_rate": 5.6786144227408636e-08, + "loss": 0.0005, + "step": 36929 + }, + { + "epoch": 0.72, + "learning_rate": 5.6782260883072494e-08, + "loss": 0.0005, + "step": 36930 + }, + { + "epoch": 0.72, + "learning_rate": 5.677837753873635e-08, + "loss": 0.0006, + "step": 36931 + }, + { + "epoch": 0.72, + "learning_rate": 5.677449419440021e-08, + "loss": 1.1245, + "step": 36932 + }, + { + "epoch": 0.72, + "learning_rate": 5.677061085006407e-08, + "loss": 0.0006, + "step": 36933 + }, + { + "epoch": 0.72, + "learning_rate": 5.676672750572793e-08, + "loss": 0.0008, + "step": 36934 + }, + { + "epoch": 0.72, + "learning_rate": 5.6762844161391785e-08, + "loss": 0.0004, + "step": 36935 + }, + { + "epoch": 0.72, + "learning_rate": 5.6758960817055643e-08, + "loss": 0.0004, + "step": 36936 + }, + { + "epoch": 0.72, + "learning_rate": 5.67550774727195e-08, + "loss": 0.0004, + "step": 36937 + }, + { + "epoch": 0.72, + "learning_rate": 5.675119412838336e-08, + "loss": 0.0004, + "step": 36938 + }, + { + "epoch": 0.72, + "learning_rate": 5.674731078404722e-08, + "loss": 0.0007, + "step": 36939 + }, + { + "epoch": 0.72, + "learning_rate": 5.6743427439711076e-08, + "loss": 0.0003, + "step": 36940 + }, + { + "epoch": 0.72, + "learning_rate": 5.6739544095374935e-08, + "loss": 0.0004, + "step": 36941 + }, + { + "epoch": 0.72, + "learning_rate": 5.673566075103879e-08, + "loss": 0.0004, + "step": 36942 + }, + { + "epoch": 0.72, + "learning_rate": 5.673177740670265e-08, + "loss": 0.0006, + "step": 36943 + }, + { + "epoch": 0.72, + "learning_rate": 5.672789406236651e-08, + "loss": 0.0004, + "step": 36944 + }, + { + "epoch": 0.72, + "learning_rate": 5.672401071803037e-08, + "loss": 0.0005, + "step": 36945 + }, + { + "epoch": 0.72, + "learning_rate": 5.6720127373694226e-08, + "loss": 0.0004, + "step": 36946 + }, + { + "epoch": 0.72, + "learning_rate": 5.6716244029358084e-08, + "loss": 0.0004, + "step": 36947 + }, + { + "epoch": 0.72, + "learning_rate": 5.671236068502194e-08, + "loss": 0.0006, + "step": 36948 + }, + { + "epoch": 0.72, + "learning_rate": 5.67084773406858e-08, + "loss": 0.0004, + "step": 36949 + }, + { + "epoch": 0.72, + "learning_rate": 5.670459399634966e-08, + "loss": 0.0008, + "step": 36950 + }, + { + "epoch": 0.72, + "learning_rate": 5.670071065201352e-08, + "loss": 0.0004, + "step": 36951 + }, + { + "epoch": 0.72, + "learning_rate": 5.669682730767736e-08, + "loss": 0.0004, + "step": 36952 + }, + { + "epoch": 0.72, + "learning_rate": 5.669294396334122e-08, + "loss": 0.0003, + "step": 36953 + }, + { + "epoch": 0.72, + "learning_rate": 5.668906061900508e-08, + "loss": 0.0015, + "step": 36954 + }, + { + "epoch": 0.72, + "learning_rate": 5.668517727466894e-08, + "loss": 0.0019, + "step": 36955 + }, + { + "epoch": 0.72, + "learning_rate": 5.6681293930332795e-08, + "loss": 0.0621, + "step": 36956 + }, + { + "epoch": 0.72, + "learning_rate": 5.667741058599665e-08, + "loss": 0.0004, + "step": 36957 + }, + { + "epoch": 0.72, + "learning_rate": 5.667352724166051e-08, + "loss": 0.0021, + "step": 36958 + }, + { + "epoch": 0.72, + "learning_rate": 5.666964389732437e-08, + "loss": 0.0004, + "step": 36959 + }, + { + "epoch": 0.72, + "learning_rate": 5.666576055298823e-08, + "loss": 0.0004, + "step": 36960 + }, + { + "epoch": 0.72, + "learning_rate": 5.6661877208652086e-08, + "loss": 0.0004, + "step": 36961 + }, + { + "epoch": 0.72, + "learning_rate": 5.6657993864315944e-08, + "loss": 0.0005, + "step": 36962 + }, + { + "epoch": 0.72, + "learning_rate": 5.66541105199798e-08, + "loss": 0.0005, + "step": 36963 + }, + { + "epoch": 0.72, + "learning_rate": 5.665022717564366e-08, + "loss": 0.0004, + "step": 36964 + }, + { + "epoch": 0.72, + "learning_rate": 5.664634383130752e-08, + "loss": 0.0005, + "step": 36965 + }, + { + "epoch": 0.72, + "learning_rate": 5.664246048697138e-08, + "loss": 0.0004, + "step": 36966 + }, + { + "epoch": 0.72, + "learning_rate": 5.6638577142635236e-08, + "loss": 0.0005, + "step": 36967 + }, + { + "epoch": 0.72, + "learning_rate": 5.6634693798299094e-08, + "loss": 0.0004, + "step": 36968 + }, + { + "epoch": 0.72, + "learning_rate": 5.663081045396295e-08, + "loss": 0.0004, + "step": 36969 + }, + { + "epoch": 0.72, + "learning_rate": 5.662692710962681e-08, + "loss": 0.0022, + "step": 36970 + }, + { + "epoch": 0.72, + "learning_rate": 5.662304376529067e-08, + "loss": 0.0004, + "step": 36971 + }, + { + "epoch": 0.72, + "learning_rate": 5.661916042095453e-08, + "loss": 0.0004, + "step": 36972 + }, + { + "epoch": 0.72, + "learning_rate": 5.6615277076618385e-08, + "loss": 0.0005, + "step": 36973 + }, + { + "epoch": 0.72, + "learning_rate": 5.6611393732282243e-08, + "loss": 0.0004, + "step": 36974 + }, + { + "epoch": 0.72, + "learning_rate": 5.66075103879461e-08, + "loss": 0.0109, + "step": 36975 + }, + { + "epoch": 0.72, + "learning_rate": 5.660362704360996e-08, + "loss": 0.0007, + "step": 36976 + }, + { + "epoch": 0.72, + "learning_rate": 5.659974369927382e-08, + "loss": 0.0005, + "step": 36977 + }, + { + "epoch": 0.72, + "learning_rate": 5.6595860354937676e-08, + "loss": 0.0004, + "step": 36978 + }, + { + "epoch": 0.72, + "learning_rate": 5.6591977010601535e-08, + "loss": 0.0005, + "step": 36979 + }, + { + "epoch": 0.72, + "learning_rate": 5.658809366626539e-08, + "loss": 0.0005, + "step": 36980 + }, + { + "epoch": 0.72, + "learning_rate": 5.658421032192924e-08, + "loss": 0.0004, + "step": 36981 + }, + { + "epoch": 0.72, + "learning_rate": 5.6580326977593096e-08, + "loss": 0.0003, + "step": 36982 + }, + { + "epoch": 0.72, + "learning_rate": 5.6576443633256954e-08, + "loss": 0.76, + "step": 36983 + }, + { + "epoch": 0.72, + "learning_rate": 5.657256028892081e-08, + "loss": 0.0006, + "step": 36984 + }, + { + "epoch": 0.72, + "learning_rate": 5.656867694458467e-08, + "loss": 0.024, + "step": 36985 + }, + { + "epoch": 0.72, + "learning_rate": 5.656479360024853e-08, + "loss": 0.0005, + "step": 36986 + }, + { + "epoch": 0.72, + "learning_rate": 5.656091025591239e-08, + "loss": 0.0005, + "step": 36987 + }, + { + "epoch": 0.72, + "learning_rate": 5.6557026911576246e-08, + "loss": 0.0004, + "step": 36988 + }, + { + "epoch": 0.72, + "learning_rate": 5.6553143567240104e-08, + "loss": 0.0012, + "step": 36989 + }, + { + "epoch": 0.72, + "learning_rate": 5.654926022290396e-08, + "loss": 0.0004, + "step": 36990 + }, + { + "epoch": 0.72, + "learning_rate": 5.654537687856782e-08, + "loss": 0.001, + "step": 36991 + }, + { + "epoch": 0.72, + "learning_rate": 5.654149353423168e-08, + "loss": 0.9578, + "step": 36992 + }, + { + "epoch": 0.72, + "learning_rate": 5.653761018989554e-08, + "loss": 0.0019, + "step": 36993 + }, + { + "epoch": 0.72, + "learning_rate": 5.6533726845559395e-08, + "loss": 0.0005, + "step": 36994 + }, + { + "epoch": 0.72, + "learning_rate": 5.652984350122325e-08, + "loss": 0.0005, + "step": 36995 + }, + { + "epoch": 0.72, + "learning_rate": 5.652596015688711e-08, + "loss": 0.333, + "step": 36996 + }, + { + "epoch": 0.72, + "learning_rate": 5.652207681255097e-08, + "loss": 0.0007, + "step": 36997 + }, + { + "epoch": 0.72, + "learning_rate": 5.651819346821483e-08, + "loss": 0.0005, + "step": 36998 + }, + { + "epoch": 0.72, + "learning_rate": 5.6514310123878686e-08, + "loss": 0.0005, + "step": 36999 + }, + { + "epoch": 0.72, + "learning_rate": 5.6510426779542544e-08, + "loss": 0.0654, + "step": 37000 + }, + { + "epoch": 0.72, + "learning_rate": 5.65065434352064e-08, + "loss": 0.0508, + "step": 37001 + }, + { + "epoch": 0.72, + "learning_rate": 5.650266009087026e-08, + "loss": 0.0008, + "step": 37002 + }, + { + "epoch": 0.72, + "learning_rate": 5.649877674653411e-08, + "loss": 0.0004, + "step": 37003 + }, + { + "epoch": 0.72, + "learning_rate": 5.649489340219797e-08, + "loss": 0.001, + "step": 37004 + }, + { + "epoch": 0.72, + "learning_rate": 5.649101005786183e-08, + "loss": 0.0004, + "step": 37005 + }, + { + "epoch": 0.72, + "learning_rate": 5.648712671352569e-08, + "loss": 0.7417, + "step": 37006 + }, + { + "epoch": 0.72, + "learning_rate": 5.6483243369189546e-08, + "loss": 1.575, + "step": 37007 + }, + { + "epoch": 0.72, + "learning_rate": 5.6479360024853404e-08, + "loss": 0.0007, + "step": 37008 + }, + { + "epoch": 0.72, + "learning_rate": 5.647547668051726e-08, + "loss": 0.0005, + "step": 37009 + }, + { + "epoch": 0.72, + "learning_rate": 5.6471593336181114e-08, + "loss": 0.0007, + "step": 37010 + }, + { + "epoch": 0.72, + "learning_rate": 5.646770999184497e-08, + "loss": 0.0004, + "step": 37011 + }, + { + "epoch": 0.72, + "learning_rate": 5.646382664750883e-08, + "loss": 0.0005, + "step": 37012 + }, + { + "epoch": 0.72, + "learning_rate": 5.645994330317269e-08, + "loss": 0.0046, + "step": 37013 + }, + { + "epoch": 0.72, + "learning_rate": 5.6456059958836547e-08, + "loss": 0.0006, + "step": 37014 + }, + { + "epoch": 0.72, + "learning_rate": 5.6452176614500405e-08, + "loss": 0.2383, + "step": 37015 + }, + { + "epoch": 0.72, + "learning_rate": 5.644829327016426e-08, + "loss": 0.015, + "step": 37016 + }, + { + "epoch": 0.72, + "learning_rate": 5.644440992582812e-08, + "loss": 0.0022, + "step": 37017 + }, + { + "epoch": 0.72, + "learning_rate": 5.644052658149197e-08, + "loss": 0.0004, + "step": 37018 + }, + { + "epoch": 0.72, + "learning_rate": 5.643664323715583e-08, + "loss": 0.0009, + "step": 37019 + }, + { + "epoch": 0.72, + "learning_rate": 5.643275989281969e-08, + "loss": 0.0004, + "step": 37020 + }, + { + "epoch": 0.72, + "learning_rate": 5.642887654848355e-08, + "loss": 0.0005, + "step": 37021 + }, + { + "epoch": 0.72, + "learning_rate": 5.6424993204147406e-08, + "loss": 0.0003, + "step": 37022 + }, + { + "epoch": 0.72, + "learning_rate": 5.6421109859811264e-08, + "loss": 0.0006, + "step": 37023 + }, + { + "epoch": 0.72, + "learning_rate": 5.641722651547512e-08, + "loss": 0.0003, + "step": 37024 + }, + { + "epoch": 0.72, + "learning_rate": 5.641334317113898e-08, + "loss": 0.7143, + "step": 37025 + }, + { + "epoch": 0.72, + "learning_rate": 5.640945982680284e-08, + "loss": 0.0003, + "step": 37026 + }, + { + "epoch": 0.72, + "learning_rate": 5.64055764824667e-08, + "loss": 0.0007, + "step": 37027 + }, + { + "epoch": 0.72, + "learning_rate": 5.6401693138130555e-08, + "loss": 0.0003, + "step": 37028 + }, + { + "epoch": 0.72, + "learning_rate": 5.6397809793794414e-08, + "loss": 0.0005, + "step": 37029 + }, + { + "epoch": 0.72, + "learning_rate": 5.639392644945827e-08, + "loss": 0.0004, + "step": 37030 + }, + { + "epoch": 0.72, + "learning_rate": 5.639004310512213e-08, + "loss": 0.0003, + "step": 37031 + }, + { + "epoch": 0.72, + "learning_rate": 5.638615976078599e-08, + "loss": 0.0004, + "step": 37032 + }, + { + "epoch": 0.72, + "learning_rate": 5.6382276416449847e-08, + "loss": 0.0166, + "step": 37033 + }, + { + "epoch": 0.72, + "learning_rate": 5.6378393072113705e-08, + "loss": 0.0004, + "step": 37034 + }, + { + "epoch": 0.72, + "learning_rate": 5.637450972777756e-08, + "loss": 0.0005, + "step": 37035 + }, + { + "epoch": 0.72, + "learning_rate": 5.637062638344142e-08, + "loss": 0.0003, + "step": 37036 + }, + { + "epoch": 0.72, + "learning_rate": 5.636674303910528e-08, + "loss": 0.0005, + "step": 37037 + }, + { + "epoch": 0.72, + "learning_rate": 5.636285969476914e-08, + "loss": 0.0005, + "step": 37038 + }, + { + "epoch": 0.72, + "learning_rate": 5.635897635043298e-08, + "loss": 0.0004, + "step": 37039 + }, + { + "epoch": 0.72, + "learning_rate": 5.635509300609684e-08, + "loss": 0.0003, + "step": 37040 + }, + { + "epoch": 0.72, + "learning_rate": 5.63512096617607e-08, + "loss": 0.0004, + "step": 37041 + }, + { + "epoch": 0.72, + "learning_rate": 5.634732631742456e-08, + "loss": 0.0012, + "step": 37042 + }, + { + "epoch": 0.72, + "learning_rate": 5.6343442973088416e-08, + "loss": 0.0003, + "step": 37043 + }, + { + "epoch": 0.72, + "learning_rate": 5.6339559628752274e-08, + "loss": 0.0006, + "step": 37044 + }, + { + "epoch": 0.72, + "learning_rate": 5.633567628441613e-08, + "loss": 0.0004, + "step": 37045 + }, + { + "epoch": 0.72, + "learning_rate": 5.633179294007999e-08, + "loss": 0.0005, + "step": 37046 + }, + { + "epoch": 0.72, + "learning_rate": 5.632790959574385e-08, + "loss": 1.3745, + "step": 37047 + }, + { + "epoch": 0.72, + "learning_rate": 5.632402625140771e-08, + "loss": 0.0004, + "step": 37048 + }, + { + "epoch": 0.72, + "learning_rate": 5.6320142907071565e-08, + "loss": 0.0004, + "step": 37049 + }, + { + "epoch": 0.72, + "learning_rate": 5.6316259562735424e-08, + "loss": 0.0004, + "step": 37050 + }, + { + "epoch": 0.72, + "learning_rate": 5.631237621839928e-08, + "loss": 0.0004, + "step": 37051 + }, + { + "epoch": 0.72, + "learning_rate": 5.630849287406314e-08, + "loss": 0.9921, + "step": 37052 + }, + { + "epoch": 0.72, + "learning_rate": 5.6304609529727e-08, + "loss": 0.0004, + "step": 37053 + }, + { + "epoch": 0.72, + "learning_rate": 5.6300726185390857e-08, + "loss": 0.0004, + "step": 37054 + }, + { + "epoch": 0.72, + "learning_rate": 5.6296842841054715e-08, + "loss": 0.0005, + "step": 37055 + }, + { + "epoch": 0.72, + "learning_rate": 5.629295949671857e-08, + "loss": 0.0003, + "step": 37056 + }, + { + "epoch": 0.72, + "learning_rate": 5.628907615238243e-08, + "loss": 0.0006, + "step": 37057 + }, + { + "epoch": 0.72, + "learning_rate": 5.628519280804629e-08, + "loss": 0.0022, + "step": 37058 + }, + { + "epoch": 0.72, + "learning_rate": 5.628130946371015e-08, + "loss": 0.0075, + "step": 37059 + }, + { + "epoch": 0.72, + "learning_rate": 5.6277426119374006e-08, + "loss": 0.0006, + "step": 37060 + }, + { + "epoch": 0.72, + "learning_rate": 5.6273542775037864e-08, + "loss": 0.0003, + "step": 37061 + }, + { + "epoch": 0.72, + "learning_rate": 5.626965943070172e-08, + "loss": 0.0005, + "step": 37062 + }, + { + "epoch": 0.72, + "learning_rate": 5.626577608636558e-08, + "loss": 0.0005, + "step": 37063 + }, + { + "epoch": 0.72, + "learning_rate": 5.626189274202944e-08, + "loss": 0.0005, + "step": 37064 + }, + { + "epoch": 0.72, + "learning_rate": 5.62580093976933e-08, + "loss": 0.3621, + "step": 37065 + }, + { + "epoch": 0.72, + "learning_rate": 5.6254126053357156e-08, + "loss": 0.9314, + "step": 37066 + }, + { + "epoch": 0.72, + "learning_rate": 5.6250242709021014e-08, + "loss": 0.0005, + "step": 37067 + }, + { + "epoch": 0.72, + "learning_rate": 5.624635936468486e-08, + "loss": 0.0004, + "step": 37068 + }, + { + "epoch": 0.72, + "learning_rate": 5.624247602034872e-08, + "loss": 0.0005, + "step": 37069 + }, + { + "epoch": 0.72, + "learning_rate": 5.6238592676012575e-08, + "loss": 0.0004, + "step": 37070 + }, + { + "epoch": 0.72, + "learning_rate": 5.6234709331676434e-08, + "loss": 0.0004, + "step": 37071 + }, + { + "epoch": 0.72, + "learning_rate": 5.623082598734029e-08, + "loss": 0.0003, + "step": 37072 + }, + { + "epoch": 0.72, + "learning_rate": 5.622694264300415e-08, + "loss": 0.0004, + "step": 37073 + }, + { + "epoch": 0.72, + "learning_rate": 5.622305929866801e-08, + "loss": 0.0005, + "step": 37074 + }, + { + "epoch": 0.72, + "learning_rate": 5.6219175954331866e-08, + "loss": 1.0168, + "step": 37075 + }, + { + "epoch": 0.72, + "learning_rate": 5.6215292609995725e-08, + "loss": 0.0005, + "step": 37076 + }, + { + "epoch": 0.72, + "learning_rate": 5.621140926565958e-08, + "loss": 0.0006, + "step": 37077 + }, + { + "epoch": 0.72, + "learning_rate": 5.620752592132344e-08, + "loss": 0.0006, + "step": 37078 + }, + { + "epoch": 0.72, + "learning_rate": 5.62036425769873e-08, + "loss": 0.0003, + "step": 37079 + }, + { + "epoch": 0.72, + "learning_rate": 5.619975923265116e-08, + "loss": 0.0025, + "step": 37080 + }, + { + "epoch": 0.72, + "learning_rate": 5.6195875888315016e-08, + "loss": 0.0204, + "step": 37081 + }, + { + "epoch": 0.72, + "learning_rate": 5.6191992543978874e-08, + "loss": 0.0026, + "step": 37082 + }, + { + "epoch": 0.72, + "learning_rate": 5.618810919964273e-08, + "loss": 0.0007, + "step": 37083 + }, + { + "epoch": 0.72, + "learning_rate": 5.618422585530659e-08, + "loss": 0.0013, + "step": 37084 + }, + { + "epoch": 0.72, + "learning_rate": 5.618034251097045e-08, + "loss": 0.1018, + "step": 37085 + }, + { + "epoch": 0.72, + "learning_rate": 5.617645916663431e-08, + "loss": 0.5119, + "step": 37086 + }, + { + "epoch": 0.72, + "learning_rate": 5.6172575822298165e-08, + "loss": 0.0003, + "step": 37087 + }, + { + "epoch": 0.72, + "learning_rate": 5.6168692477962024e-08, + "loss": 0.0005, + "step": 37088 + }, + { + "epoch": 0.72, + "learning_rate": 5.616480913362588e-08, + "loss": 0.0003, + "step": 37089 + }, + { + "epoch": 0.72, + "learning_rate": 5.616092578928974e-08, + "loss": 0.0002, + "step": 37090 + }, + { + "epoch": 0.72, + "learning_rate": 5.61570424449536e-08, + "loss": 0.0004, + "step": 37091 + }, + { + "epoch": 0.72, + "learning_rate": 5.615315910061745e-08, + "loss": 0.0175, + "step": 37092 + }, + { + "epoch": 0.72, + "learning_rate": 5.614927575628131e-08, + "loss": 0.0009, + "step": 37093 + }, + { + "epoch": 0.72, + "learning_rate": 5.6145392411945167e-08, + "loss": 0.0008, + "step": 37094 + }, + { + "epoch": 0.72, + "learning_rate": 5.6141509067609025e-08, + "loss": 0.0005, + "step": 37095 + }, + { + "epoch": 0.72, + "learning_rate": 5.613762572327288e-08, + "loss": 0.0005, + "step": 37096 + }, + { + "epoch": 0.72, + "learning_rate": 5.6133742378936735e-08, + "loss": 0.0006, + "step": 37097 + }, + { + "epoch": 0.72, + "learning_rate": 5.612985903460059e-08, + "loss": 0.0005, + "step": 37098 + }, + { + "epoch": 0.72, + "learning_rate": 5.612597569026445e-08, + "loss": 0.0004, + "step": 37099 + }, + { + "epoch": 0.72, + "learning_rate": 5.612209234592831e-08, + "loss": 0.0004, + "step": 37100 + }, + { + "epoch": 0.72, + "learning_rate": 5.611820900159217e-08, + "loss": 0.0005, + "step": 37101 + }, + { + "epoch": 0.72, + "learning_rate": 5.6114325657256026e-08, + "loss": 0.0005, + "step": 37102 + }, + { + "epoch": 0.72, + "learning_rate": 5.6110442312919884e-08, + "loss": 0.003, + "step": 37103 + }, + { + "epoch": 0.72, + "learning_rate": 5.610655896858374e-08, + "loss": 0.4274, + "step": 37104 + }, + { + "epoch": 0.72, + "learning_rate": 5.61026756242476e-08, + "loss": 0.0003, + "step": 37105 + }, + { + "epoch": 0.72, + "learning_rate": 5.609879227991145e-08, + "loss": 0.596, + "step": 37106 + }, + { + "epoch": 0.72, + "learning_rate": 5.609490893557531e-08, + "loss": 0.0005, + "step": 37107 + }, + { + "epoch": 0.72, + "learning_rate": 5.609102559123917e-08, + "loss": 0.0004, + "step": 37108 + }, + { + "epoch": 0.72, + "learning_rate": 5.608714224690303e-08, + "loss": 0.0005, + "step": 37109 + }, + { + "epoch": 0.72, + "learning_rate": 5.6083258902566885e-08, + "loss": 0.0004, + "step": 37110 + }, + { + "epoch": 0.72, + "learning_rate": 5.6079375558230743e-08, + "loss": 0.0007, + "step": 37111 + }, + { + "epoch": 0.72, + "learning_rate": 5.60754922138946e-08, + "loss": 0.0004, + "step": 37112 + }, + { + "epoch": 0.72, + "learning_rate": 5.607160886955846e-08, + "loss": 0.0004, + "step": 37113 + }, + { + "epoch": 0.72, + "learning_rate": 5.606772552522232e-08, + "loss": 0.0005, + "step": 37114 + }, + { + "epoch": 0.72, + "learning_rate": 5.6063842180886176e-08, + "loss": 0.0966, + "step": 37115 + }, + { + "epoch": 0.72, + "learning_rate": 5.6059958836550035e-08, + "loss": 0.0003, + "step": 37116 + }, + { + "epoch": 0.72, + "learning_rate": 5.605607549221389e-08, + "loss": 0.0055, + "step": 37117 + }, + { + "epoch": 0.72, + "learning_rate": 5.605219214787775e-08, + "loss": 0.0004, + "step": 37118 + }, + { + "epoch": 0.72, + "learning_rate": 5.604830880354161e-08, + "loss": 0.0005, + "step": 37119 + }, + { + "epoch": 0.72, + "learning_rate": 5.604442545920547e-08, + "loss": 0.0004, + "step": 37120 + }, + { + "epoch": 0.72, + "learning_rate": 5.6040542114869326e-08, + "loss": 0.0003, + "step": 37121 + }, + { + "epoch": 0.72, + "learning_rate": 5.6036658770533184e-08, + "loss": 0.0004, + "step": 37122 + }, + { + "epoch": 0.72, + "learning_rate": 5.603277542619704e-08, + "loss": 0.0004, + "step": 37123 + }, + { + "epoch": 0.72, + "learning_rate": 5.60288920818609e-08, + "loss": 0.0004, + "step": 37124 + }, + { + "epoch": 0.72, + "learning_rate": 5.602500873752476e-08, + "loss": 0.0005, + "step": 37125 + }, + { + "epoch": 0.72, + "learning_rate": 5.6021125393188604e-08, + "loss": 0.0006, + "step": 37126 + }, + { + "epoch": 0.72, + "learning_rate": 5.601724204885246e-08, + "loss": 1.1169, + "step": 37127 + }, + { + "epoch": 0.72, + "learning_rate": 5.601335870451632e-08, + "loss": 0.0006, + "step": 37128 + }, + { + "epoch": 0.72, + "learning_rate": 5.600947536018018e-08, + "loss": 0.0005, + "step": 37129 + }, + { + "epoch": 0.72, + "learning_rate": 5.600559201584404e-08, + "loss": 0.0005, + "step": 37130 + }, + { + "epoch": 0.72, + "learning_rate": 5.6001708671507895e-08, + "loss": 0.0005, + "step": 37131 + }, + { + "epoch": 0.72, + "learning_rate": 5.5997825327171753e-08, + "loss": 0.8912, + "step": 37132 + }, + { + "epoch": 0.72, + "learning_rate": 5.599394198283561e-08, + "loss": 0.0083, + "step": 37133 + }, + { + "epoch": 0.72, + "learning_rate": 5.599005863849947e-08, + "loss": 0.0008, + "step": 37134 + }, + { + "epoch": 0.72, + "learning_rate": 5.598617529416333e-08, + "loss": 0.0005, + "step": 37135 + }, + { + "epoch": 0.72, + "learning_rate": 5.5982291949827186e-08, + "loss": 0.0004, + "step": 37136 + }, + { + "epoch": 0.72, + "learning_rate": 5.5978408605491045e-08, + "loss": 0.0004, + "step": 37137 + }, + { + "epoch": 0.72, + "learning_rate": 5.59745252611549e-08, + "loss": 0.0004, + "step": 37138 + }, + { + "epoch": 0.72, + "learning_rate": 5.597064191681876e-08, + "loss": 0.0005, + "step": 37139 + }, + { + "epoch": 0.72, + "learning_rate": 5.596675857248262e-08, + "loss": 0.0003, + "step": 37140 + }, + { + "epoch": 0.72, + "learning_rate": 5.596287522814648e-08, + "loss": 0.994, + "step": 37141 + }, + { + "epoch": 0.72, + "learning_rate": 5.5958991883810336e-08, + "loss": 0.0005, + "step": 37142 + }, + { + "epoch": 0.72, + "learning_rate": 5.5955108539474194e-08, + "loss": 0.0024, + "step": 37143 + }, + { + "epoch": 0.72, + "learning_rate": 5.595122519513805e-08, + "loss": 0.0005, + "step": 37144 + }, + { + "epoch": 0.72, + "learning_rate": 5.594734185080191e-08, + "loss": 0.0008, + "step": 37145 + }, + { + "epoch": 0.72, + "learning_rate": 5.594345850646577e-08, + "loss": 0.0006, + "step": 37146 + }, + { + "epoch": 0.72, + "learning_rate": 5.593957516212963e-08, + "loss": 0.0009, + "step": 37147 + }, + { + "epoch": 0.72, + "learning_rate": 5.5935691817793485e-08, + "loss": 0.0004, + "step": 37148 + }, + { + "epoch": 0.72, + "learning_rate": 5.5931808473457343e-08, + "loss": 0.0004, + "step": 37149 + }, + { + "epoch": 0.72, + "learning_rate": 5.59279251291212e-08, + "loss": 0.0006, + "step": 37150 + }, + { + "epoch": 0.72, + "learning_rate": 5.592404178478506e-08, + "loss": 0.0028, + "step": 37151 + }, + { + "epoch": 0.72, + "learning_rate": 5.592015844044892e-08, + "loss": 0.0005, + "step": 37152 + }, + { + "epoch": 0.72, + "learning_rate": 5.5916275096112776e-08, + "loss": 0.0005, + "step": 37153 + }, + { + "epoch": 0.72, + "learning_rate": 5.5912391751776635e-08, + "loss": 0.0021, + "step": 37154 + }, + { + "epoch": 0.72, + "learning_rate": 5.590850840744048e-08, + "loss": 0.0004, + "step": 37155 + }, + { + "epoch": 0.72, + "learning_rate": 5.590462506310434e-08, + "loss": 0.0004, + "step": 37156 + }, + { + "epoch": 0.72, + "learning_rate": 5.5900741718768196e-08, + "loss": 0.0014, + "step": 37157 + }, + { + "epoch": 0.72, + "learning_rate": 5.5896858374432054e-08, + "loss": 0.0009, + "step": 37158 + }, + { + "epoch": 0.72, + "learning_rate": 5.589297503009591e-08, + "loss": 0.0008, + "step": 37159 + }, + { + "epoch": 0.72, + "learning_rate": 5.588909168575977e-08, + "loss": 0.0005, + "step": 37160 + }, + { + "epoch": 0.72, + "learning_rate": 5.588520834142363e-08, + "loss": 0.0005, + "step": 37161 + }, + { + "epoch": 0.72, + "learning_rate": 5.588132499708749e-08, + "loss": 0.0009, + "step": 37162 + }, + { + "epoch": 0.72, + "learning_rate": 5.5877441652751346e-08, + "loss": 0.0007, + "step": 37163 + }, + { + "epoch": 0.72, + "learning_rate": 5.5873558308415204e-08, + "loss": 0.0004, + "step": 37164 + }, + { + "epoch": 0.72, + "learning_rate": 5.586967496407906e-08, + "loss": 0.0003, + "step": 37165 + }, + { + "epoch": 0.72, + "learning_rate": 5.586579161974292e-08, + "loss": 0.0004, + "step": 37166 + }, + { + "epoch": 0.72, + "learning_rate": 5.586190827540678e-08, + "loss": 0.0003, + "step": 37167 + }, + { + "epoch": 0.72, + "learning_rate": 5.585802493107064e-08, + "loss": 1.0117, + "step": 37168 + }, + { + "epoch": 0.72, + "learning_rate": 5.5854141586734495e-08, + "loss": 0.0006, + "step": 37169 + }, + { + "epoch": 0.72, + "learning_rate": 5.5850258242398353e-08, + "loss": 0.0004, + "step": 37170 + }, + { + "epoch": 0.72, + "learning_rate": 5.584637489806221e-08, + "loss": 0.1824, + "step": 37171 + }, + { + "epoch": 0.72, + "learning_rate": 5.584249155372607e-08, + "loss": 0.0004, + "step": 37172 + }, + { + "epoch": 0.72, + "learning_rate": 5.583860820938993e-08, + "loss": 0.001, + "step": 37173 + }, + { + "epoch": 0.72, + "learning_rate": 5.5834724865053786e-08, + "loss": 0.0005, + "step": 37174 + }, + { + "epoch": 0.72, + "learning_rate": 5.5830841520717645e-08, + "loss": 0.0006, + "step": 37175 + }, + { + "epoch": 0.72, + "learning_rate": 5.58269581763815e-08, + "loss": 0.9898, + "step": 37176 + }, + { + "epoch": 0.72, + "learning_rate": 5.582307483204536e-08, + "loss": 0.0962, + "step": 37177 + }, + { + "epoch": 0.72, + "learning_rate": 5.581919148770922e-08, + "loss": 0.3144, + "step": 37178 + }, + { + "epoch": 0.72, + "learning_rate": 5.581530814337308e-08, + "loss": 0.0007, + "step": 37179 + }, + { + "epoch": 0.72, + "learning_rate": 5.581142479903693e-08, + "loss": 0.0004, + "step": 37180 + }, + { + "epoch": 0.72, + "learning_rate": 5.580754145470079e-08, + "loss": 0.0006, + "step": 37181 + }, + { + "epoch": 0.72, + "learning_rate": 5.5803658110364646e-08, + "loss": 0.0004, + "step": 37182 + }, + { + "epoch": 0.72, + "learning_rate": 5.5799774766028504e-08, + "loss": 0.0005, + "step": 37183 + }, + { + "epoch": 0.72, + "learning_rate": 5.5795891421692356e-08, + "loss": 0.0005, + "step": 37184 + }, + { + "epoch": 0.72, + "learning_rate": 5.5792008077356214e-08, + "loss": 0.0004, + "step": 37185 + }, + { + "epoch": 0.72, + "learning_rate": 5.578812473302007e-08, + "loss": 0.0005, + "step": 37186 + }, + { + "epoch": 0.72, + "learning_rate": 5.578424138868393e-08, + "loss": 0.0004, + "step": 37187 + }, + { + "epoch": 0.72, + "learning_rate": 5.578035804434779e-08, + "loss": 0.358, + "step": 37188 + }, + { + "epoch": 0.72, + "learning_rate": 5.577647470001165e-08, + "loss": 0.0003, + "step": 37189 + }, + { + "epoch": 0.72, + "learning_rate": 5.5772591355675505e-08, + "loss": 0.0038, + "step": 37190 + }, + { + "epoch": 0.72, + "learning_rate": 5.576870801133936e-08, + "loss": 0.0004, + "step": 37191 + }, + { + "epoch": 0.72, + "learning_rate": 5.576482466700322e-08, + "loss": 1.0635, + "step": 37192 + }, + { + "epoch": 0.72, + "learning_rate": 5.576094132266708e-08, + "loss": 0.0075, + "step": 37193 + }, + { + "epoch": 0.72, + "learning_rate": 5.575705797833094e-08, + "loss": 0.0006, + "step": 37194 + }, + { + "epoch": 0.72, + "learning_rate": 5.575317463399479e-08, + "loss": 0.0008, + "step": 37195 + }, + { + "epoch": 0.72, + "learning_rate": 5.574929128965865e-08, + "loss": 0.0004, + "step": 37196 + }, + { + "epoch": 0.72, + "learning_rate": 5.5745407945322506e-08, + "loss": 0.0005, + "step": 37197 + }, + { + "epoch": 0.72, + "learning_rate": 5.5741524600986364e-08, + "loss": 0.0005, + "step": 37198 + }, + { + "epoch": 0.72, + "learning_rate": 5.573764125665022e-08, + "loss": 0.0004, + "step": 37199 + }, + { + "epoch": 0.72, + "learning_rate": 5.573375791231408e-08, + "loss": 0.0007, + "step": 37200 + }, + { + "epoch": 0.72, + "learning_rate": 5.572987456797794e-08, + "loss": 0.0004, + "step": 37201 + }, + { + "epoch": 0.72, + "learning_rate": 5.57259912236418e-08, + "loss": 0.0005, + "step": 37202 + }, + { + "epoch": 0.72, + "learning_rate": 5.5722107879305656e-08, + "loss": 0.0004, + "step": 37203 + }, + { + "epoch": 0.72, + "learning_rate": 5.5718224534969514e-08, + "loss": 0.0004, + "step": 37204 + }, + { + "epoch": 0.72, + "learning_rate": 5.571434119063337e-08, + "loss": 0.0003, + "step": 37205 + }, + { + "epoch": 0.72, + "learning_rate": 5.571045784629723e-08, + "loss": 0.0011, + "step": 37206 + }, + { + "epoch": 0.72, + "learning_rate": 5.570657450196109e-08, + "loss": 0.0004, + "step": 37207 + }, + { + "epoch": 0.72, + "learning_rate": 5.570269115762495e-08, + "loss": 0.0004, + "step": 37208 + }, + { + "epoch": 0.72, + "learning_rate": 5.5698807813288805e-08, + "loss": 0.0006, + "step": 37209 + }, + { + "epoch": 0.72, + "learning_rate": 5.569492446895266e-08, + "loss": 0.8063, + "step": 37210 + }, + { + "epoch": 0.72, + "learning_rate": 5.569104112461652e-08, + "loss": 0.0005, + "step": 37211 + }, + { + "epoch": 0.72, + "learning_rate": 5.568715778028038e-08, + "loss": 0.0004, + "step": 37212 + }, + { + "epoch": 0.72, + "learning_rate": 5.5683274435944225e-08, + "loss": 0.0006, + "step": 37213 + }, + { + "epoch": 0.72, + "learning_rate": 5.567939109160808e-08, + "loss": 0.0004, + "step": 37214 + }, + { + "epoch": 0.72, + "learning_rate": 5.567550774727194e-08, + "loss": 0.0002, + "step": 37215 + }, + { + "epoch": 0.72, + "learning_rate": 5.56716244029358e-08, + "loss": 0.0008, + "step": 37216 + }, + { + "epoch": 0.72, + "learning_rate": 5.566774105859966e-08, + "loss": 0.0004, + "step": 37217 + }, + { + "epoch": 0.72, + "learning_rate": 5.5663857714263516e-08, + "loss": 0.0004, + "step": 37218 + }, + { + "epoch": 0.72, + "learning_rate": 5.5659974369927374e-08, + "loss": 0.0077, + "step": 37219 + }, + { + "epoch": 0.72, + "learning_rate": 5.565609102559123e-08, + "loss": 0.5888, + "step": 37220 + }, + { + "epoch": 0.72, + "learning_rate": 5.565220768125509e-08, + "loss": 0.0006, + "step": 37221 + }, + { + "epoch": 0.72, + "learning_rate": 5.564832433691895e-08, + "loss": 0.0057, + "step": 37222 + }, + { + "epoch": 0.72, + "learning_rate": 5.564444099258281e-08, + "loss": 0.0004, + "step": 37223 + }, + { + "epoch": 0.72, + "learning_rate": 5.5640557648246665e-08, + "loss": 0.0006, + "step": 37224 + }, + { + "epoch": 0.72, + "learning_rate": 5.5636674303910524e-08, + "loss": 0.0004, + "step": 37225 + }, + { + "epoch": 0.72, + "learning_rate": 5.563279095957438e-08, + "loss": 0.0004, + "step": 37226 + }, + { + "epoch": 0.72, + "learning_rate": 5.562890761523824e-08, + "loss": 0.0004, + "step": 37227 + }, + { + "epoch": 0.72, + "learning_rate": 5.56250242709021e-08, + "loss": 0.0006, + "step": 37228 + }, + { + "epoch": 0.72, + "learning_rate": 5.562114092656596e-08, + "loss": 0.0005, + "step": 37229 + }, + { + "epoch": 0.72, + "learning_rate": 5.5617257582229815e-08, + "loss": 0.0004, + "step": 37230 + }, + { + "epoch": 0.72, + "learning_rate": 5.561337423789367e-08, + "loss": 0.0005, + "step": 37231 + }, + { + "epoch": 0.72, + "learning_rate": 5.560949089355753e-08, + "loss": 0.0005, + "step": 37232 + }, + { + "epoch": 0.72, + "learning_rate": 5.560560754922139e-08, + "loss": 0.0004, + "step": 37233 + }, + { + "epoch": 0.72, + "learning_rate": 5.560172420488525e-08, + "loss": 0.0007, + "step": 37234 + }, + { + "epoch": 0.72, + "learning_rate": 5.5597840860549106e-08, + "loss": 0.3731, + "step": 37235 + }, + { + "epoch": 0.72, + "learning_rate": 5.5593957516212964e-08, + "loss": 0.0005, + "step": 37236 + }, + { + "epoch": 0.72, + "learning_rate": 5.559007417187682e-08, + "loss": 0.0005, + "step": 37237 + }, + { + "epoch": 0.72, + "learning_rate": 5.558619082754068e-08, + "loss": 0.0006, + "step": 37238 + }, + { + "epoch": 0.72, + "learning_rate": 5.558230748320454e-08, + "loss": 0.0003, + "step": 37239 + }, + { + "epoch": 0.72, + "learning_rate": 5.55784241388684e-08, + "loss": 0.0003, + "step": 37240 + }, + { + "epoch": 0.72, + "learning_rate": 5.5574540794532256e-08, + "loss": 0.0014, + "step": 37241 + }, + { + "epoch": 0.72, + "learning_rate": 5.55706574501961e-08, + "loss": 0.0088, + "step": 37242 + }, + { + "epoch": 0.72, + "learning_rate": 5.556677410585996e-08, + "loss": 0.0012, + "step": 37243 + }, + { + "epoch": 0.72, + "learning_rate": 5.556289076152382e-08, + "loss": 0.0005, + "step": 37244 + }, + { + "epoch": 0.72, + "learning_rate": 5.5559007417187675e-08, + "loss": 0.0005, + "step": 37245 + }, + { + "epoch": 0.72, + "learning_rate": 5.5555124072851534e-08, + "loss": 0.0003, + "step": 37246 + }, + { + "epoch": 0.72, + "learning_rate": 5.555124072851539e-08, + "loss": 0.0005, + "step": 37247 + }, + { + "epoch": 0.72, + "learning_rate": 5.554735738417925e-08, + "loss": 0.0004, + "step": 37248 + }, + { + "epoch": 0.72, + "learning_rate": 5.554347403984311e-08, + "loss": 0.0004, + "step": 37249 + }, + { + "epoch": 0.72, + "learning_rate": 5.5539590695506967e-08, + "loss": 0.0004, + "step": 37250 + }, + { + "epoch": 0.72, + "learning_rate": 5.5535707351170825e-08, + "loss": 0.004, + "step": 37251 + }, + { + "epoch": 0.72, + "learning_rate": 5.553182400683468e-08, + "loss": 0.0003, + "step": 37252 + }, + { + "epoch": 0.72, + "learning_rate": 5.552794066249854e-08, + "loss": 0.0007, + "step": 37253 + }, + { + "epoch": 0.72, + "learning_rate": 5.55240573181624e-08, + "loss": 0.0004, + "step": 37254 + }, + { + "epoch": 0.72, + "learning_rate": 5.552017397382626e-08, + "loss": 0.0195, + "step": 37255 + }, + { + "epoch": 0.72, + "learning_rate": 5.5516290629490116e-08, + "loss": 0.0004, + "step": 37256 + }, + { + "epoch": 0.72, + "learning_rate": 5.5512407285153974e-08, + "loss": 0.0006, + "step": 37257 + }, + { + "epoch": 0.72, + "learning_rate": 5.550852394081783e-08, + "loss": 0.0005, + "step": 37258 + }, + { + "epoch": 0.72, + "learning_rate": 5.550464059648169e-08, + "loss": 0.0005, + "step": 37259 + }, + { + "epoch": 0.72, + "learning_rate": 5.550075725214555e-08, + "loss": 0.0004, + "step": 37260 + }, + { + "epoch": 0.72, + "learning_rate": 5.549687390780941e-08, + "loss": 0.0005, + "step": 37261 + }, + { + "epoch": 0.72, + "learning_rate": 5.5492990563473266e-08, + "loss": 0.0011, + "step": 37262 + }, + { + "epoch": 0.72, + "learning_rate": 5.5489107219137124e-08, + "loss": 0.0005, + "step": 37263 + }, + { + "epoch": 0.72, + "learning_rate": 5.548522387480098e-08, + "loss": 0.0004, + "step": 37264 + }, + { + "epoch": 0.72, + "learning_rate": 5.548134053046484e-08, + "loss": 0.0005, + "step": 37265 + }, + { + "epoch": 0.72, + "learning_rate": 5.54774571861287e-08, + "loss": 0.0004, + "step": 37266 + }, + { + "epoch": 0.72, + "learning_rate": 5.547357384179256e-08, + "loss": 0.0004, + "step": 37267 + }, + { + "epoch": 0.72, + "learning_rate": 5.5469690497456415e-08, + "loss": 0.0005, + "step": 37268 + }, + { + "epoch": 0.72, + "learning_rate": 5.5465807153120267e-08, + "loss": 0.0005, + "step": 37269 + }, + { + "epoch": 0.72, + "learning_rate": 5.5461923808784125e-08, + "loss": 0.0005, + "step": 37270 + }, + { + "epoch": 0.72, + "learning_rate": 5.5458040464447976e-08, + "loss": 0.5255, + "step": 37271 + }, + { + "epoch": 0.72, + "learning_rate": 5.5454157120111835e-08, + "loss": 0.0004, + "step": 37272 + }, + { + "epoch": 0.72, + "learning_rate": 5.545027377577569e-08, + "loss": 0.0006, + "step": 37273 + }, + { + "epoch": 0.72, + "learning_rate": 5.544639043143955e-08, + "loss": 0.001, + "step": 37274 + }, + { + "epoch": 0.72, + "learning_rate": 5.544250708710341e-08, + "loss": 0.0007, + "step": 37275 + }, + { + "epoch": 0.72, + "learning_rate": 5.543862374276727e-08, + "loss": 0.029, + "step": 37276 + }, + { + "epoch": 0.72, + "learning_rate": 5.5434740398431126e-08, + "loss": 0.0012, + "step": 37277 + }, + { + "epoch": 0.72, + "learning_rate": 5.5430857054094984e-08, + "loss": 0.0005, + "step": 37278 + }, + { + "epoch": 0.72, + "learning_rate": 5.542697370975884e-08, + "loss": 0.3654, + "step": 37279 + }, + { + "epoch": 0.72, + "learning_rate": 5.54230903654227e-08, + "loss": 0.0007, + "step": 37280 + }, + { + "epoch": 0.72, + "learning_rate": 5.541920702108656e-08, + "loss": 0.0007, + "step": 37281 + }, + { + "epoch": 0.72, + "learning_rate": 5.541532367675042e-08, + "loss": 0.0004, + "step": 37282 + }, + { + "epoch": 0.72, + "learning_rate": 5.541144033241427e-08, + "loss": 0.0008, + "step": 37283 + }, + { + "epoch": 0.72, + "learning_rate": 5.540755698807813e-08, + "loss": 0.0007, + "step": 37284 + }, + { + "epoch": 0.72, + "learning_rate": 5.5403673643741985e-08, + "loss": 0.0003, + "step": 37285 + }, + { + "epoch": 0.72, + "learning_rate": 5.5399790299405844e-08, + "loss": 0.0296, + "step": 37286 + }, + { + "epoch": 0.72, + "learning_rate": 5.53959069550697e-08, + "loss": 0.0004, + "step": 37287 + }, + { + "epoch": 0.72, + "learning_rate": 5.539202361073356e-08, + "loss": 0.0005, + "step": 37288 + }, + { + "epoch": 0.72, + "learning_rate": 5.538814026639742e-08, + "loss": 0.0874, + "step": 37289 + }, + { + "epoch": 0.72, + "learning_rate": 5.5384256922061277e-08, + "loss": 0.0015, + "step": 37290 + }, + { + "epoch": 0.72, + "learning_rate": 5.5380373577725135e-08, + "loss": 0.3057, + "step": 37291 + }, + { + "epoch": 0.72, + "learning_rate": 5.537649023338899e-08, + "loss": 0.0003, + "step": 37292 + }, + { + "epoch": 0.72, + "learning_rate": 5.537260688905285e-08, + "loss": 0.5285, + "step": 37293 + }, + { + "epoch": 0.72, + "learning_rate": 5.536872354471671e-08, + "loss": 0.0006, + "step": 37294 + }, + { + "epoch": 0.72, + "learning_rate": 5.536484020038057e-08, + "loss": 0.0005, + "step": 37295 + }, + { + "epoch": 0.72, + "learning_rate": 5.5360956856044426e-08, + "loss": 0.0005, + "step": 37296 + }, + { + "epoch": 0.72, + "learning_rate": 5.5357073511708284e-08, + "loss": 0.0004, + "step": 37297 + }, + { + "epoch": 0.72, + "learning_rate": 5.535319016737214e-08, + "loss": 0.0004, + "step": 37298 + }, + { + "epoch": 0.72, + "learning_rate": 5.5349306823036e-08, + "loss": 0.0004, + "step": 37299 + }, + { + "epoch": 0.72, + "learning_rate": 5.5345423478699846e-08, + "loss": 1.0281, + "step": 37300 + }, + { + "epoch": 0.72, + "learning_rate": 5.5341540134363704e-08, + "loss": 0.0004, + "step": 37301 + }, + { + "epoch": 0.72, + "learning_rate": 5.533765679002756e-08, + "loss": 0.0008, + "step": 37302 + }, + { + "epoch": 0.72, + "learning_rate": 5.533377344569142e-08, + "loss": 0.0003, + "step": 37303 + }, + { + "epoch": 0.72, + "learning_rate": 5.532989010135528e-08, + "loss": 0.0004, + "step": 37304 + }, + { + "epoch": 0.72, + "learning_rate": 5.532600675701914e-08, + "loss": 0.0004, + "step": 37305 + }, + { + "epoch": 0.72, + "learning_rate": 5.5322123412682995e-08, + "loss": 0.0004, + "step": 37306 + }, + { + "epoch": 0.72, + "learning_rate": 5.5318240068346853e-08, + "loss": 0.0005, + "step": 37307 + }, + { + "epoch": 0.72, + "learning_rate": 5.531435672401071e-08, + "loss": 0.0007, + "step": 37308 + }, + { + "epoch": 0.72, + "learning_rate": 5.531047337967457e-08, + "loss": 0.0004, + "step": 37309 + }, + { + "epoch": 0.72, + "learning_rate": 5.530659003533843e-08, + "loss": 0.0007, + "step": 37310 + }, + { + "epoch": 0.72, + "learning_rate": 5.5302706691002286e-08, + "loss": 0.0004, + "step": 37311 + }, + { + "epoch": 0.72, + "learning_rate": 5.5298823346666145e-08, + "loss": 0.0004, + "step": 37312 + }, + { + "epoch": 0.72, + "learning_rate": 5.529494000233e-08, + "loss": 0.001, + "step": 37313 + }, + { + "epoch": 0.72, + "learning_rate": 5.529105665799386e-08, + "loss": 0.001, + "step": 37314 + }, + { + "epoch": 0.72, + "learning_rate": 5.528717331365772e-08, + "loss": 0.0005, + "step": 37315 + }, + { + "epoch": 0.72, + "learning_rate": 5.528328996932158e-08, + "loss": 0.0007, + "step": 37316 + }, + { + "epoch": 0.72, + "learning_rate": 5.5279406624985436e-08, + "loss": 0.0004, + "step": 37317 + }, + { + "epoch": 0.72, + "learning_rate": 5.5275523280649294e-08, + "loss": 0.0149, + "step": 37318 + }, + { + "epoch": 0.72, + "learning_rate": 5.527163993631315e-08, + "loss": 0.0004, + "step": 37319 + }, + { + "epoch": 0.72, + "learning_rate": 5.526775659197701e-08, + "loss": 0.0004, + "step": 37320 + }, + { + "epoch": 0.72, + "learning_rate": 5.526387324764087e-08, + "loss": 0.0005, + "step": 37321 + }, + { + "epoch": 0.72, + "learning_rate": 5.525998990330473e-08, + "loss": 0.3423, + "step": 37322 + }, + { + "epoch": 0.72, + "learning_rate": 5.5256106558968585e-08, + "loss": 0.0003, + "step": 37323 + }, + { + "epoch": 0.72, + "learning_rate": 5.5252223214632444e-08, + "loss": 0.0005, + "step": 37324 + }, + { + "epoch": 0.72, + "learning_rate": 5.52483398702963e-08, + "loss": 0.0022, + "step": 37325 + }, + { + "epoch": 0.72, + "learning_rate": 5.524445652596016e-08, + "loss": 0.0004, + "step": 37326 + }, + { + "epoch": 0.72, + "learning_rate": 5.524057318162402e-08, + "loss": 0.0005, + "step": 37327 + }, + { + "epoch": 0.72, + "learning_rate": 5.5236689837287877e-08, + "loss": 1.0607, + "step": 37328 + }, + { + "epoch": 0.72, + "learning_rate": 5.523280649295172e-08, + "loss": 0.0013, + "step": 37329 + }, + { + "epoch": 0.72, + "learning_rate": 5.522892314861558e-08, + "loss": 0.0005, + "step": 37330 + }, + { + "epoch": 0.72, + "learning_rate": 5.522503980427944e-08, + "loss": 0.0005, + "step": 37331 + }, + { + "epoch": 0.72, + "learning_rate": 5.5221156459943296e-08, + "loss": 0.0007, + "step": 37332 + }, + { + "epoch": 0.72, + "learning_rate": 5.5217273115607155e-08, + "loss": 0.0004, + "step": 37333 + }, + { + "epoch": 0.72, + "learning_rate": 5.521338977127101e-08, + "loss": 0.0019, + "step": 37334 + }, + { + "epoch": 0.72, + "learning_rate": 5.520950642693487e-08, + "loss": 0.0004, + "step": 37335 + }, + { + "epoch": 0.72, + "learning_rate": 5.520562308259873e-08, + "loss": 0.0004, + "step": 37336 + }, + { + "epoch": 0.72, + "learning_rate": 5.520173973826259e-08, + "loss": 0.0003, + "step": 37337 + }, + { + "epoch": 0.72, + "learning_rate": 5.5197856393926446e-08, + "loss": 0.0006, + "step": 37338 + }, + { + "epoch": 0.72, + "learning_rate": 5.5193973049590304e-08, + "loss": 0.0009, + "step": 37339 + }, + { + "epoch": 0.72, + "learning_rate": 5.519008970525416e-08, + "loss": 0.0004, + "step": 37340 + }, + { + "epoch": 0.72, + "learning_rate": 5.518620636091802e-08, + "loss": 0.5557, + "step": 37341 + }, + { + "epoch": 0.72, + "learning_rate": 5.518232301658188e-08, + "loss": 0.0004, + "step": 37342 + }, + { + "epoch": 0.72, + "learning_rate": 5.517843967224574e-08, + "loss": 0.0006, + "step": 37343 + }, + { + "epoch": 0.72, + "learning_rate": 5.5174556327909595e-08, + "loss": 0.0007, + "step": 37344 + }, + { + "epoch": 0.72, + "learning_rate": 5.5170672983573453e-08, + "loss": 0.0044, + "step": 37345 + }, + { + "epoch": 0.72, + "learning_rate": 5.516678963923731e-08, + "loss": 0.0278, + "step": 37346 + }, + { + "epoch": 0.72, + "learning_rate": 5.516290629490117e-08, + "loss": 0.0005, + "step": 37347 + }, + { + "epoch": 0.72, + "learning_rate": 5.515902295056503e-08, + "loss": 0.0004, + "step": 37348 + }, + { + "epoch": 0.72, + "learning_rate": 5.5155139606228886e-08, + "loss": 0.0008, + "step": 37349 + }, + { + "epoch": 0.72, + "learning_rate": 5.5151256261892745e-08, + "loss": 0.7676, + "step": 37350 + }, + { + "epoch": 0.72, + "learning_rate": 5.51473729175566e-08, + "loss": 0.0005, + "step": 37351 + }, + { + "epoch": 0.72, + "learning_rate": 5.514348957322046e-08, + "loss": 0.0006, + "step": 37352 + }, + { + "epoch": 0.72, + "learning_rate": 5.513960622888432e-08, + "loss": 0.0006, + "step": 37353 + }, + { + "epoch": 0.72, + "learning_rate": 5.513572288454818e-08, + "loss": 0.0005, + "step": 37354 + }, + { + "epoch": 0.72, + "learning_rate": 5.5131839540212036e-08, + "loss": 0.0026, + "step": 37355 + }, + { + "epoch": 0.72, + "learning_rate": 5.5127956195875894e-08, + "loss": 0.0003, + "step": 37356 + }, + { + "epoch": 0.72, + "learning_rate": 5.5124072851539746e-08, + "loss": 0.0008, + "step": 37357 + }, + { + "epoch": 0.72, + "learning_rate": 5.51201895072036e-08, + "loss": 0.0005, + "step": 37358 + }, + { + "epoch": 0.72, + "learning_rate": 5.5116306162867456e-08, + "loss": 0.0524, + "step": 37359 + }, + { + "epoch": 0.72, + "learning_rate": 5.5112422818531314e-08, + "loss": 0.3834, + "step": 37360 + }, + { + "epoch": 0.72, + "learning_rate": 5.510853947419517e-08, + "loss": 0.8081, + "step": 37361 + }, + { + "epoch": 0.72, + "learning_rate": 5.510465612985903e-08, + "loss": 0.3438, + "step": 37362 + }, + { + "epoch": 0.72, + "learning_rate": 5.510077278552289e-08, + "loss": 0.0005, + "step": 37363 + }, + { + "epoch": 0.72, + "learning_rate": 5.509688944118675e-08, + "loss": 0.0007, + "step": 37364 + }, + { + "epoch": 0.72, + "learning_rate": 5.5093006096850605e-08, + "loss": 0.0005, + "step": 37365 + }, + { + "epoch": 0.72, + "learning_rate": 5.5089122752514463e-08, + "loss": 0.0004, + "step": 37366 + }, + { + "epoch": 0.72, + "learning_rate": 5.508523940817832e-08, + "loss": 0.0007, + "step": 37367 + }, + { + "epoch": 0.72, + "learning_rate": 5.508135606384218e-08, + "loss": 0.0004, + "step": 37368 + }, + { + "epoch": 0.72, + "learning_rate": 5.507747271950604e-08, + "loss": 0.0006, + "step": 37369 + }, + { + "epoch": 0.72, + "learning_rate": 5.5073589375169896e-08, + "loss": 0.0004, + "step": 37370 + }, + { + "epoch": 0.72, + "learning_rate": 5.5069706030833755e-08, + "loss": 0.0003, + "step": 37371 + }, + { + "epoch": 0.72, + "learning_rate": 5.5065822686497606e-08, + "loss": 0.3705, + "step": 37372 + }, + { + "epoch": 0.72, + "learning_rate": 5.5061939342161464e-08, + "loss": 0.0004, + "step": 37373 + }, + { + "epoch": 0.72, + "learning_rate": 5.505805599782532e-08, + "loss": 0.0007, + "step": 37374 + }, + { + "epoch": 0.72, + "learning_rate": 5.505417265348918e-08, + "loss": 0.2638, + "step": 37375 + }, + { + "epoch": 0.73, + "learning_rate": 5.505028930915304e-08, + "loss": 0.0005, + "step": 37376 + }, + { + "epoch": 0.73, + "learning_rate": 5.50464059648169e-08, + "loss": 0.2323, + "step": 37377 + }, + { + "epoch": 0.73, + "learning_rate": 5.5042522620480756e-08, + "loss": 0.0012, + "step": 37378 + }, + { + "epoch": 0.73, + "learning_rate": 5.5038639276144614e-08, + "loss": 0.0003, + "step": 37379 + }, + { + "epoch": 0.73, + "learning_rate": 5.503475593180847e-08, + "loss": 0.0004, + "step": 37380 + }, + { + "epoch": 0.73, + "learning_rate": 5.503087258747233e-08, + "loss": 0.0004, + "step": 37381 + }, + { + "epoch": 0.73, + "learning_rate": 5.502698924313619e-08, + "loss": 0.0004, + "step": 37382 + }, + { + "epoch": 0.73, + "learning_rate": 5.502310589880005e-08, + "loss": 0.0002, + "step": 37383 + }, + { + "epoch": 0.73, + "learning_rate": 5.5019222554463905e-08, + "loss": 0.0005, + "step": 37384 + }, + { + "epoch": 0.73, + "learning_rate": 5.5015339210127763e-08, + "loss": 0.0005, + "step": 37385 + }, + { + "epoch": 0.73, + "learning_rate": 5.501145586579162e-08, + "loss": 0.0405, + "step": 37386 + }, + { + "epoch": 0.73, + "learning_rate": 5.5007572521455467e-08, + "loss": 0.0022, + "step": 37387 + }, + { + "epoch": 0.73, + "learning_rate": 5.5003689177119325e-08, + "loss": 0.0003, + "step": 37388 + }, + { + "epoch": 0.73, + "learning_rate": 5.499980583278318e-08, + "loss": 0.0003, + "step": 37389 + }, + { + "epoch": 0.73, + "learning_rate": 5.499592248844704e-08, + "loss": 0.0005, + "step": 37390 + }, + { + "epoch": 0.73, + "learning_rate": 5.49920391441109e-08, + "loss": 0.0004, + "step": 37391 + }, + { + "epoch": 0.73, + "learning_rate": 5.498815579977476e-08, + "loss": 0.0018, + "step": 37392 + }, + { + "epoch": 0.73, + "learning_rate": 5.4984272455438616e-08, + "loss": 0.0011, + "step": 37393 + }, + { + "epoch": 0.73, + "learning_rate": 5.4980389111102474e-08, + "loss": 0.0003, + "step": 37394 + }, + { + "epoch": 0.73, + "learning_rate": 5.497650576676633e-08, + "loss": 0.0029, + "step": 37395 + }, + { + "epoch": 0.73, + "learning_rate": 5.497262242243019e-08, + "loss": 0.0004, + "step": 37396 + }, + { + "epoch": 0.73, + "learning_rate": 5.496873907809405e-08, + "loss": 0.0007, + "step": 37397 + }, + { + "epoch": 0.73, + "learning_rate": 5.496485573375791e-08, + "loss": 0.0003, + "step": 37398 + }, + { + "epoch": 0.73, + "learning_rate": 5.4960972389421766e-08, + "loss": 0.0004, + "step": 37399 + }, + { + "epoch": 0.73, + "learning_rate": 5.4957089045085624e-08, + "loss": 0.0009, + "step": 37400 + }, + { + "epoch": 0.73, + "learning_rate": 5.495320570074948e-08, + "loss": 0.0005, + "step": 37401 + }, + { + "epoch": 0.73, + "learning_rate": 5.494932235641334e-08, + "loss": 0.0008, + "step": 37402 + }, + { + "epoch": 0.73, + "learning_rate": 5.49454390120772e-08, + "loss": 0.0052, + "step": 37403 + }, + { + "epoch": 0.73, + "learning_rate": 5.494155566774106e-08, + "loss": 0.0005, + "step": 37404 + }, + { + "epoch": 0.73, + "learning_rate": 5.4937672323404915e-08, + "loss": 0.0003, + "step": 37405 + }, + { + "epoch": 0.73, + "learning_rate": 5.493378897906877e-08, + "loss": 0.0066, + "step": 37406 + }, + { + "epoch": 0.73, + "learning_rate": 5.492990563473263e-08, + "loss": 0.0004, + "step": 37407 + }, + { + "epoch": 0.73, + "learning_rate": 5.492602229039649e-08, + "loss": 0.0004, + "step": 37408 + }, + { + "epoch": 0.73, + "learning_rate": 5.492213894606035e-08, + "loss": 0.0004, + "step": 37409 + }, + { + "epoch": 0.73, + "learning_rate": 5.4918255601724206e-08, + "loss": 0.0005, + "step": 37410 + }, + { + "epoch": 0.73, + "learning_rate": 5.4914372257388065e-08, + "loss": 0.0005, + "step": 37411 + }, + { + "epoch": 0.73, + "learning_rate": 5.491048891305192e-08, + "loss": 0.0008, + "step": 37412 + }, + { + "epoch": 0.73, + "learning_rate": 5.490660556871578e-08, + "loss": 0.0005, + "step": 37413 + }, + { + "epoch": 0.73, + "learning_rate": 5.490272222437964e-08, + "loss": 0.0004, + "step": 37414 + }, + { + "epoch": 0.73, + "learning_rate": 5.48988388800435e-08, + "loss": 0.0006, + "step": 37415 + }, + { + "epoch": 0.73, + "learning_rate": 5.489495553570734e-08, + "loss": 0.0005, + "step": 37416 + }, + { + "epoch": 0.73, + "learning_rate": 5.48910721913712e-08, + "loss": 0.0005, + "step": 37417 + }, + { + "epoch": 0.73, + "learning_rate": 5.488718884703506e-08, + "loss": 0.0016, + "step": 37418 + }, + { + "epoch": 0.73, + "learning_rate": 5.488330550269892e-08, + "loss": 0.0004, + "step": 37419 + }, + { + "epoch": 0.73, + "learning_rate": 5.4879422158362775e-08, + "loss": 0.0012, + "step": 37420 + }, + { + "epoch": 0.73, + "learning_rate": 5.4875538814026634e-08, + "loss": 0.0005, + "step": 37421 + }, + { + "epoch": 0.73, + "learning_rate": 5.487165546969049e-08, + "loss": 0.0003, + "step": 37422 + }, + { + "epoch": 0.73, + "learning_rate": 5.486777212535435e-08, + "loss": 0.0007, + "step": 37423 + }, + { + "epoch": 0.73, + "learning_rate": 5.486388878101821e-08, + "loss": 0.0004, + "step": 37424 + }, + { + "epoch": 0.73, + "learning_rate": 5.486000543668207e-08, + "loss": 0.0008, + "step": 37425 + }, + { + "epoch": 0.73, + "learning_rate": 5.4856122092345925e-08, + "loss": 0.0005, + "step": 37426 + }, + { + "epoch": 0.73, + "learning_rate": 5.485223874800978e-08, + "loss": 0.0007, + "step": 37427 + }, + { + "epoch": 0.73, + "learning_rate": 5.484835540367364e-08, + "loss": 0.0007, + "step": 37428 + }, + { + "epoch": 0.73, + "learning_rate": 5.48444720593375e-08, + "loss": 0.0005, + "step": 37429 + }, + { + "epoch": 0.73, + "learning_rate": 5.484058871500136e-08, + "loss": 0.0003, + "step": 37430 + }, + { + "epoch": 0.73, + "learning_rate": 5.4836705370665216e-08, + "loss": 0.0003, + "step": 37431 + }, + { + "epoch": 0.73, + "learning_rate": 5.4832822026329074e-08, + "loss": 0.0006, + "step": 37432 + }, + { + "epoch": 0.73, + "learning_rate": 5.482893868199293e-08, + "loss": 0.0138, + "step": 37433 + }, + { + "epoch": 0.73, + "learning_rate": 5.482505533765679e-08, + "loss": 0.0003, + "step": 37434 + }, + { + "epoch": 0.73, + "learning_rate": 5.482117199332065e-08, + "loss": 0.0005, + "step": 37435 + }, + { + "epoch": 0.73, + "learning_rate": 5.481728864898451e-08, + "loss": 0.0014, + "step": 37436 + }, + { + "epoch": 0.73, + "learning_rate": 5.4813405304648366e-08, + "loss": 0.7284, + "step": 37437 + }, + { + "epoch": 0.73, + "learning_rate": 5.4809521960312224e-08, + "loss": 0.0006, + "step": 37438 + }, + { + "epoch": 0.73, + "learning_rate": 5.480563861597608e-08, + "loss": 0.0006, + "step": 37439 + }, + { + "epoch": 0.73, + "learning_rate": 5.480175527163994e-08, + "loss": 0.0015, + "step": 37440 + }, + { + "epoch": 0.73, + "learning_rate": 5.47978719273038e-08, + "loss": 0.0005, + "step": 37441 + }, + { + "epoch": 0.73, + "learning_rate": 5.479398858296766e-08, + "loss": 0.7766, + "step": 37442 + }, + { + "epoch": 0.73, + "learning_rate": 5.4790105238631515e-08, + "loss": 0.0029, + "step": 37443 + }, + { + "epoch": 0.73, + "learning_rate": 5.4786221894295373e-08, + "loss": 1.2239, + "step": 37444 + }, + { + "epoch": 0.73, + "learning_rate": 5.478233854995922e-08, + "loss": 0.0004, + "step": 37445 + }, + { + "epoch": 0.73, + "learning_rate": 5.4778455205623077e-08, + "loss": 0.0004, + "step": 37446 + }, + { + "epoch": 0.73, + "learning_rate": 5.4774571861286935e-08, + "loss": 0.0003, + "step": 37447 + }, + { + "epoch": 0.73, + "learning_rate": 5.477068851695079e-08, + "loss": 0.1046, + "step": 37448 + }, + { + "epoch": 0.73, + "learning_rate": 5.476680517261465e-08, + "loss": 0.0004, + "step": 37449 + }, + { + "epoch": 0.73, + "learning_rate": 5.476292182827851e-08, + "loss": 0.0005, + "step": 37450 + }, + { + "epoch": 0.73, + "learning_rate": 5.475903848394237e-08, + "loss": 0.0004, + "step": 37451 + }, + { + "epoch": 0.73, + "learning_rate": 5.4755155139606226e-08, + "loss": 0.0008, + "step": 37452 + }, + { + "epoch": 0.73, + "learning_rate": 5.4751271795270084e-08, + "loss": 0.0004, + "step": 37453 + }, + { + "epoch": 0.73, + "learning_rate": 5.474738845093394e-08, + "loss": 0.0004, + "step": 37454 + }, + { + "epoch": 0.73, + "learning_rate": 5.47435051065978e-08, + "loss": 0.0005, + "step": 37455 + }, + { + "epoch": 0.73, + "learning_rate": 5.473962176226166e-08, + "loss": 0.0003, + "step": 37456 + }, + { + "epoch": 0.73, + "learning_rate": 5.473573841792552e-08, + "loss": 0.0003, + "step": 37457 + }, + { + "epoch": 0.73, + "learning_rate": 5.4731855073589376e-08, + "loss": 0.0545, + "step": 37458 + }, + { + "epoch": 0.73, + "learning_rate": 5.4727971729253234e-08, + "loss": 0.0004, + "step": 37459 + }, + { + "epoch": 0.73, + "learning_rate": 5.4724088384917085e-08, + "loss": 0.0007, + "step": 37460 + }, + { + "epoch": 0.73, + "learning_rate": 5.4720205040580944e-08, + "loss": 0.6257, + "step": 37461 + }, + { + "epoch": 0.73, + "learning_rate": 5.47163216962448e-08, + "loss": 0.0017, + "step": 37462 + }, + { + "epoch": 0.73, + "learning_rate": 5.471243835190866e-08, + "loss": 0.0921, + "step": 37463 + }, + { + "epoch": 0.73, + "learning_rate": 5.470855500757252e-08, + "loss": 0.0004, + "step": 37464 + }, + { + "epoch": 0.73, + "learning_rate": 5.4704671663236377e-08, + "loss": 0.0004, + "step": 37465 + }, + { + "epoch": 0.73, + "learning_rate": 5.4700788318900235e-08, + "loss": 0.0004, + "step": 37466 + }, + { + "epoch": 0.73, + "learning_rate": 5.469690497456409e-08, + "loss": 0.0068, + "step": 37467 + }, + { + "epoch": 0.73, + "learning_rate": 5.469302163022795e-08, + "loss": 1.1151, + "step": 37468 + }, + { + "epoch": 0.73, + "learning_rate": 5.468913828589181e-08, + "loss": 0.0004, + "step": 37469 + }, + { + "epoch": 0.73, + "learning_rate": 5.468525494155567e-08, + "loss": 0.0007, + "step": 37470 + }, + { + "epoch": 0.73, + "learning_rate": 5.4681371597219526e-08, + "loss": 0.0004, + "step": 37471 + }, + { + "epoch": 0.73, + "learning_rate": 5.4677488252883384e-08, + "loss": 0.0007, + "step": 37472 + }, + { + "epoch": 0.73, + "learning_rate": 5.467360490854724e-08, + "loss": 0.0008, + "step": 37473 + }, + { + "epoch": 0.73, + "learning_rate": 5.4669721564211094e-08, + "loss": 0.0005, + "step": 37474 + }, + { + "epoch": 0.73, + "learning_rate": 5.4665838219874946e-08, + "loss": 0.0004, + "step": 37475 + }, + { + "epoch": 0.73, + "learning_rate": 5.4661954875538804e-08, + "loss": 0.0008, + "step": 37476 + }, + { + "epoch": 0.73, + "learning_rate": 5.465807153120266e-08, + "loss": 0.0004, + "step": 37477 + }, + { + "epoch": 0.73, + "learning_rate": 5.465418818686652e-08, + "loss": 0.0005, + "step": 37478 + }, + { + "epoch": 0.73, + "learning_rate": 5.465030484253038e-08, + "loss": 0.0003, + "step": 37479 + }, + { + "epoch": 0.73, + "learning_rate": 5.464642149819424e-08, + "loss": 0.0004, + "step": 37480 + }, + { + "epoch": 0.73, + "learning_rate": 5.4642538153858095e-08, + "loss": 0.0005, + "step": 37481 + }, + { + "epoch": 0.73, + "learning_rate": 5.4638654809521954e-08, + "loss": 0.003, + "step": 37482 + }, + { + "epoch": 0.73, + "learning_rate": 5.463477146518581e-08, + "loss": 0.0006, + "step": 37483 + }, + { + "epoch": 0.73, + "learning_rate": 5.463088812084967e-08, + "loss": 0.0006, + "step": 37484 + }, + { + "epoch": 0.73, + "learning_rate": 5.462700477651353e-08, + "loss": 0.0005, + "step": 37485 + }, + { + "epoch": 0.73, + "learning_rate": 5.4623121432177387e-08, + "loss": 0.0006, + "step": 37486 + }, + { + "epoch": 0.73, + "learning_rate": 5.4619238087841245e-08, + "loss": 0.0004, + "step": 37487 + }, + { + "epoch": 0.73, + "learning_rate": 5.46153547435051e-08, + "loss": 0.0004, + "step": 37488 + }, + { + "epoch": 0.73, + "learning_rate": 5.461147139916896e-08, + "loss": 0.0003, + "step": 37489 + }, + { + "epoch": 0.73, + "learning_rate": 5.460758805483282e-08, + "loss": 0.0006, + "step": 37490 + }, + { + "epoch": 0.73, + "learning_rate": 5.460370471049668e-08, + "loss": 0.0003, + "step": 37491 + }, + { + "epoch": 0.73, + "learning_rate": 5.4599821366160536e-08, + "loss": 0.0006, + "step": 37492 + }, + { + "epoch": 0.73, + "learning_rate": 5.4595938021824394e-08, + "loss": 0.0004, + "step": 37493 + }, + { + "epoch": 0.73, + "learning_rate": 5.459205467748825e-08, + "loss": 0.0004, + "step": 37494 + }, + { + "epoch": 0.73, + "learning_rate": 5.458817133315211e-08, + "loss": 0.0005, + "step": 37495 + }, + { + "epoch": 0.73, + "learning_rate": 5.458428798881597e-08, + "loss": 0.0013, + "step": 37496 + }, + { + "epoch": 0.73, + "learning_rate": 5.458040464447983e-08, + "loss": 0.0004, + "step": 37497 + }, + { + "epoch": 0.73, + "learning_rate": 5.4576521300143685e-08, + "loss": 0.0005, + "step": 37498 + }, + { + "epoch": 0.73, + "learning_rate": 5.4572637955807544e-08, + "loss": 0.0004, + "step": 37499 + }, + { + "epoch": 0.73, + "learning_rate": 5.45687546114714e-08, + "loss": 0.0007, + "step": 37500 + }, + { + "epoch": 0.73, + "learning_rate": 5.456487126713526e-08, + "loss": 0.0004, + "step": 37501 + }, + { + "epoch": 0.73, + "learning_rate": 5.456098792279912e-08, + "loss": 0.0005, + "step": 37502 + }, + { + "epoch": 0.73, + "learning_rate": 5.4557104578462963e-08, + "loss": 0.0005, + "step": 37503 + }, + { + "epoch": 0.73, + "learning_rate": 5.455322123412682e-08, + "loss": 0.0007, + "step": 37504 + }, + { + "epoch": 0.73, + "learning_rate": 5.454933788979068e-08, + "loss": 0.0004, + "step": 37505 + }, + { + "epoch": 0.73, + "learning_rate": 5.454545454545454e-08, + "loss": 0.0006, + "step": 37506 + }, + { + "epoch": 0.73, + "learning_rate": 5.4541571201118396e-08, + "loss": 0.0004, + "step": 37507 + }, + { + "epoch": 0.73, + "learning_rate": 5.4537687856782255e-08, + "loss": 0.0004, + "step": 37508 + }, + { + "epoch": 0.73, + "learning_rate": 5.453380451244611e-08, + "loss": 0.0006, + "step": 37509 + }, + { + "epoch": 0.73, + "learning_rate": 5.452992116810997e-08, + "loss": 0.0004, + "step": 37510 + }, + { + "epoch": 0.73, + "learning_rate": 5.452603782377383e-08, + "loss": 0.0004, + "step": 37511 + }, + { + "epoch": 0.73, + "learning_rate": 5.452215447943769e-08, + "loss": 0.0005, + "step": 37512 + }, + { + "epoch": 0.73, + "learning_rate": 5.4518271135101546e-08, + "loss": 0.0003, + "step": 37513 + }, + { + "epoch": 0.73, + "learning_rate": 5.4514387790765404e-08, + "loss": 0.0004, + "step": 37514 + }, + { + "epoch": 0.73, + "learning_rate": 5.451050444642926e-08, + "loss": 0.0006, + "step": 37515 + }, + { + "epoch": 0.73, + "learning_rate": 5.450662110209312e-08, + "loss": 0.0004, + "step": 37516 + }, + { + "epoch": 0.73, + "learning_rate": 5.450273775775698e-08, + "loss": 0.3158, + "step": 37517 + }, + { + "epoch": 0.73, + "learning_rate": 5.449885441342084e-08, + "loss": 0.0014, + "step": 37518 + }, + { + "epoch": 0.73, + "learning_rate": 5.4494971069084695e-08, + "loss": 0.0004, + "step": 37519 + }, + { + "epoch": 0.73, + "learning_rate": 5.4491087724748554e-08, + "loss": 0.0005, + "step": 37520 + }, + { + "epoch": 0.73, + "learning_rate": 5.448720438041241e-08, + "loss": 0.0005, + "step": 37521 + }, + { + "epoch": 0.73, + "learning_rate": 5.448332103607627e-08, + "loss": 0.0006, + "step": 37522 + }, + { + "epoch": 0.73, + "learning_rate": 5.447943769174013e-08, + "loss": 0.0004, + "step": 37523 + }, + { + "epoch": 0.73, + "learning_rate": 5.4475554347403987e-08, + "loss": 0.0237, + "step": 37524 + }, + { + "epoch": 0.73, + "learning_rate": 5.4471671003067845e-08, + "loss": 0.0006, + "step": 37525 + }, + { + "epoch": 0.73, + "learning_rate": 5.44677876587317e-08, + "loss": 0.0005, + "step": 37526 + }, + { + "epoch": 0.73, + "learning_rate": 5.446390431439556e-08, + "loss": 0.0004, + "step": 37527 + }, + { + "epoch": 0.73, + "learning_rate": 5.446002097005942e-08, + "loss": 0.0006, + "step": 37528 + }, + { + "epoch": 0.73, + "learning_rate": 5.445613762572328e-08, + "loss": 0.0005, + "step": 37529 + }, + { + "epoch": 0.73, + "learning_rate": 5.4452254281387136e-08, + "loss": 0.0006, + "step": 37530 + }, + { + "epoch": 0.73, + "learning_rate": 5.4448370937050994e-08, + "loss": 0.1932, + "step": 37531 + }, + { + "epoch": 0.73, + "learning_rate": 5.444448759271484e-08, + "loss": 0.0245, + "step": 37532 + }, + { + "epoch": 0.73, + "learning_rate": 5.44406042483787e-08, + "loss": 0.0005, + "step": 37533 + }, + { + "epoch": 0.73, + "learning_rate": 5.4436720904042556e-08, + "loss": 0.0005, + "step": 37534 + }, + { + "epoch": 0.73, + "learning_rate": 5.4432837559706414e-08, + "loss": 0.0006, + "step": 37535 + }, + { + "epoch": 0.73, + "learning_rate": 5.442895421537027e-08, + "loss": 0.0005, + "step": 37536 + }, + { + "epoch": 0.73, + "learning_rate": 5.442507087103413e-08, + "loss": 0.0013, + "step": 37537 + }, + { + "epoch": 0.73, + "learning_rate": 5.442118752669799e-08, + "loss": 0.0004, + "step": 37538 + }, + { + "epoch": 0.73, + "learning_rate": 5.441730418236185e-08, + "loss": 0.4473, + "step": 37539 + }, + { + "epoch": 0.73, + "learning_rate": 5.4413420838025705e-08, + "loss": 0.0005, + "step": 37540 + }, + { + "epoch": 0.73, + "learning_rate": 5.4409537493689563e-08, + "loss": 0.0004, + "step": 37541 + }, + { + "epoch": 0.73, + "learning_rate": 5.440565414935342e-08, + "loss": 0.0004, + "step": 37542 + }, + { + "epoch": 0.73, + "learning_rate": 5.440177080501728e-08, + "loss": 0.473, + "step": 37543 + }, + { + "epoch": 0.73, + "learning_rate": 5.439788746068114e-08, + "loss": 0.0003, + "step": 37544 + }, + { + "epoch": 0.73, + "learning_rate": 5.4394004116344996e-08, + "loss": 0.0004, + "step": 37545 + }, + { + "epoch": 0.73, + "learning_rate": 5.4390120772008855e-08, + "loss": 0.0006, + "step": 37546 + }, + { + "epoch": 0.73, + "learning_rate": 5.438623742767271e-08, + "loss": 0.0003, + "step": 37547 + }, + { + "epoch": 0.73, + "learning_rate": 5.438235408333657e-08, + "loss": 0.0003, + "step": 37548 + }, + { + "epoch": 0.73, + "learning_rate": 5.437847073900042e-08, + "loss": 0.0005, + "step": 37549 + }, + { + "epoch": 0.73, + "learning_rate": 5.437458739466428e-08, + "loss": 0.0007, + "step": 37550 + }, + { + "epoch": 0.73, + "learning_rate": 5.437070405032814e-08, + "loss": 0.0003, + "step": 37551 + }, + { + "epoch": 0.73, + "learning_rate": 5.4366820705992e-08, + "loss": 0.0005, + "step": 37552 + }, + { + "epoch": 0.73, + "learning_rate": 5.4362937361655856e-08, + "loss": 0.0802, + "step": 37553 + }, + { + "epoch": 0.73, + "learning_rate": 5.4359054017319714e-08, + "loss": 0.0006, + "step": 37554 + }, + { + "epoch": 0.73, + "learning_rate": 5.435517067298357e-08, + "loss": 0.0006, + "step": 37555 + }, + { + "epoch": 0.73, + "learning_rate": 5.435128732864743e-08, + "loss": 0.0006, + "step": 37556 + }, + { + "epoch": 0.73, + "learning_rate": 5.434740398431129e-08, + "loss": 0.1687, + "step": 37557 + }, + { + "epoch": 0.73, + "learning_rate": 5.434352063997515e-08, + "loss": 0.0003, + "step": 37558 + }, + { + "epoch": 0.73, + "learning_rate": 5.4339637295639005e-08, + "loss": 0.1411, + "step": 37559 + }, + { + "epoch": 0.73, + "learning_rate": 5.4335753951302864e-08, + "loss": 0.0003, + "step": 37560 + }, + { + "epoch": 0.73, + "learning_rate": 5.4331870606966715e-08, + "loss": 0.0003, + "step": 37561 + }, + { + "epoch": 0.73, + "learning_rate": 5.4327987262630573e-08, + "loss": 0.0007, + "step": 37562 + }, + { + "epoch": 0.73, + "learning_rate": 5.4324103918294425e-08, + "loss": 0.0005, + "step": 37563 + }, + { + "epoch": 0.73, + "learning_rate": 5.432022057395828e-08, + "loss": 0.0005, + "step": 37564 + }, + { + "epoch": 0.73, + "learning_rate": 5.431633722962214e-08, + "loss": 0.0004, + "step": 37565 + }, + { + "epoch": 0.73, + "learning_rate": 5.4312453885286e-08, + "loss": 0.0004, + "step": 37566 + }, + { + "epoch": 0.73, + "learning_rate": 5.430857054094986e-08, + "loss": 0.0006, + "step": 37567 + }, + { + "epoch": 0.73, + "learning_rate": 5.4304687196613716e-08, + "loss": 0.0004, + "step": 37568 + }, + { + "epoch": 0.73, + "learning_rate": 5.4300803852277574e-08, + "loss": 0.0004, + "step": 37569 + }, + { + "epoch": 0.73, + "learning_rate": 5.429692050794143e-08, + "loss": 0.0005, + "step": 37570 + }, + { + "epoch": 0.73, + "learning_rate": 5.429303716360529e-08, + "loss": 0.0005, + "step": 37571 + }, + { + "epoch": 0.73, + "learning_rate": 5.428915381926915e-08, + "loss": 0.9415, + "step": 37572 + }, + { + "epoch": 0.73, + "learning_rate": 5.428527047493301e-08, + "loss": 0.0004, + "step": 37573 + }, + { + "epoch": 0.73, + "learning_rate": 5.4281387130596866e-08, + "loss": 0.0004, + "step": 37574 + }, + { + "epoch": 0.73, + "learning_rate": 5.4277503786260724e-08, + "loss": 0.0004, + "step": 37575 + }, + { + "epoch": 0.73, + "learning_rate": 5.427362044192458e-08, + "loss": 0.0003, + "step": 37576 + }, + { + "epoch": 0.73, + "learning_rate": 5.426973709758844e-08, + "loss": 0.0005, + "step": 37577 + }, + { + "epoch": 0.73, + "learning_rate": 5.42658537532523e-08, + "loss": 0.0196, + "step": 37578 + }, + { + "epoch": 0.73, + "learning_rate": 5.426197040891616e-08, + "loss": 0.0006, + "step": 37579 + }, + { + "epoch": 0.73, + "learning_rate": 5.4258087064580015e-08, + "loss": 0.0007, + "step": 37580 + }, + { + "epoch": 0.73, + "learning_rate": 5.4254203720243873e-08, + "loss": 0.0006, + "step": 37581 + }, + { + "epoch": 0.73, + "learning_rate": 5.425032037590773e-08, + "loss": 0.0004, + "step": 37582 + }, + { + "epoch": 0.73, + "learning_rate": 5.424643703157159e-08, + "loss": 0.0003, + "step": 37583 + }, + { + "epoch": 0.73, + "learning_rate": 5.424255368723545e-08, + "loss": 0.0009, + "step": 37584 + }, + { + "epoch": 0.73, + "learning_rate": 5.4238670342899306e-08, + "loss": 0.0005, + "step": 37585 + }, + { + "epoch": 0.73, + "learning_rate": 5.4234786998563165e-08, + "loss": 0.0004, + "step": 37586 + }, + { + "epoch": 0.73, + "learning_rate": 5.423090365422702e-08, + "loss": 0.0004, + "step": 37587 + }, + { + "epoch": 0.73, + "learning_rate": 5.422702030989088e-08, + "loss": 0.0005, + "step": 37588 + }, + { + "epoch": 0.73, + "learning_rate": 5.422313696555474e-08, + "loss": 0.0168, + "step": 37589 + }, + { + "epoch": 0.73, + "learning_rate": 5.4219253621218584e-08, + "loss": 0.0004, + "step": 37590 + }, + { + "epoch": 0.73, + "learning_rate": 5.421537027688244e-08, + "loss": 0.0032, + "step": 37591 + }, + { + "epoch": 0.73, + "learning_rate": 5.42114869325463e-08, + "loss": 0.0006, + "step": 37592 + }, + { + "epoch": 0.73, + "learning_rate": 5.420760358821016e-08, + "loss": 0.0004, + "step": 37593 + }, + { + "epoch": 0.73, + "learning_rate": 5.420372024387402e-08, + "loss": 0.0006, + "step": 37594 + }, + { + "epoch": 0.73, + "learning_rate": 5.4199836899537876e-08, + "loss": 0.0006, + "step": 37595 + }, + { + "epoch": 0.73, + "learning_rate": 5.4195953555201734e-08, + "loss": 0.0004, + "step": 37596 + }, + { + "epoch": 0.73, + "learning_rate": 5.419207021086559e-08, + "loss": 0.0003, + "step": 37597 + }, + { + "epoch": 0.73, + "learning_rate": 5.418818686652945e-08, + "loss": 0.335, + "step": 37598 + }, + { + "epoch": 0.73, + "learning_rate": 5.418430352219331e-08, + "loss": 0.0004, + "step": 37599 + }, + { + "epoch": 0.73, + "learning_rate": 5.418042017785717e-08, + "loss": 0.0009, + "step": 37600 + }, + { + "epoch": 0.73, + "learning_rate": 5.4176536833521025e-08, + "loss": 0.0005, + "step": 37601 + }, + { + "epoch": 0.73, + "learning_rate": 5.417265348918488e-08, + "loss": 0.0003, + "step": 37602 + }, + { + "epoch": 0.73, + "learning_rate": 5.416877014484874e-08, + "loss": 0.0017, + "step": 37603 + }, + { + "epoch": 0.73, + "learning_rate": 5.41648868005126e-08, + "loss": 0.0013, + "step": 37604 + }, + { + "epoch": 0.73, + "learning_rate": 5.416100345617646e-08, + "loss": 0.0003, + "step": 37605 + }, + { + "epoch": 0.73, + "learning_rate": 5.4157120111840316e-08, + "loss": 0.0009, + "step": 37606 + }, + { + "epoch": 0.73, + "learning_rate": 5.4153236767504175e-08, + "loss": 0.0008, + "step": 37607 + }, + { + "epoch": 0.73, + "learning_rate": 5.414935342316803e-08, + "loss": 0.0029, + "step": 37608 + }, + { + "epoch": 0.73, + "learning_rate": 5.414547007883189e-08, + "loss": 0.0152, + "step": 37609 + }, + { + "epoch": 0.73, + "learning_rate": 5.414158673449575e-08, + "loss": 0.0007, + "step": 37610 + }, + { + "epoch": 0.73, + "learning_rate": 5.413770339015961e-08, + "loss": 0.006, + "step": 37611 + }, + { + "epoch": 0.73, + "learning_rate": 5.4133820045823466e-08, + "loss": 0.0004, + "step": 37612 + }, + { + "epoch": 0.73, + "learning_rate": 5.4129936701487324e-08, + "loss": 0.0046, + "step": 37613 + }, + { + "epoch": 0.73, + "learning_rate": 5.412605335715118e-08, + "loss": 0.0016, + "step": 37614 + }, + { + "epoch": 0.73, + "learning_rate": 5.412217001281504e-08, + "loss": 0.0005, + "step": 37615 + }, + { + "epoch": 0.73, + "learning_rate": 5.41182866684789e-08, + "loss": 0.0004, + "step": 37616 + }, + { + "epoch": 0.73, + "learning_rate": 5.411440332414276e-08, + "loss": 0.0006, + "step": 37617 + }, + { + "epoch": 0.73, + "learning_rate": 5.4110519979806615e-08, + "loss": 0.0003, + "step": 37618 + }, + { + "epoch": 0.73, + "learning_rate": 5.410663663547046e-08, + "loss": 0.0007, + "step": 37619 + }, + { + "epoch": 0.73, + "learning_rate": 5.410275329113432e-08, + "loss": 0.0006, + "step": 37620 + }, + { + "epoch": 0.73, + "learning_rate": 5.409886994679818e-08, + "loss": 0.0004, + "step": 37621 + }, + { + "epoch": 0.73, + "learning_rate": 5.4094986602462035e-08, + "loss": 0.0004, + "step": 37622 + }, + { + "epoch": 0.73, + "learning_rate": 5.409110325812589e-08, + "loss": 0.0003, + "step": 37623 + }, + { + "epoch": 0.73, + "learning_rate": 5.408721991378975e-08, + "loss": 0.0006, + "step": 37624 + }, + { + "epoch": 0.73, + "learning_rate": 5.408333656945361e-08, + "loss": 0.0006, + "step": 37625 + }, + { + "epoch": 0.73, + "learning_rate": 5.407945322511747e-08, + "loss": 0.0003, + "step": 37626 + }, + { + "epoch": 0.73, + "learning_rate": 5.4075569880781326e-08, + "loss": 0.0031, + "step": 37627 + }, + { + "epoch": 0.73, + "learning_rate": 5.4071686536445184e-08, + "loss": 0.0004, + "step": 37628 + }, + { + "epoch": 0.73, + "learning_rate": 5.406780319210904e-08, + "loss": 0.0005, + "step": 37629 + }, + { + "epoch": 0.73, + "learning_rate": 5.40639198477729e-08, + "loss": 0.445, + "step": 37630 + }, + { + "epoch": 0.73, + "learning_rate": 5.406003650343676e-08, + "loss": 0.0006, + "step": 37631 + }, + { + "epoch": 0.73, + "learning_rate": 5.405615315910062e-08, + "loss": 0.0005, + "step": 37632 + }, + { + "epoch": 0.73, + "learning_rate": 5.4052269814764476e-08, + "loss": 0.001, + "step": 37633 + }, + { + "epoch": 0.73, + "learning_rate": 5.4048386470428334e-08, + "loss": 0.0004, + "step": 37634 + }, + { + "epoch": 0.73, + "learning_rate": 5.404450312609219e-08, + "loss": 0.0005, + "step": 37635 + }, + { + "epoch": 0.73, + "learning_rate": 5.404061978175605e-08, + "loss": 0.0004, + "step": 37636 + }, + { + "epoch": 0.73, + "learning_rate": 5.40367364374199e-08, + "loss": 0.0003, + "step": 37637 + }, + { + "epoch": 0.73, + "learning_rate": 5.403285309308376e-08, + "loss": 0.0003, + "step": 37638 + }, + { + "epoch": 0.73, + "learning_rate": 5.402896974874762e-08, + "loss": 0.0004, + "step": 37639 + }, + { + "epoch": 0.73, + "learning_rate": 5.402508640441148e-08, + "loss": 0.0003, + "step": 37640 + }, + { + "epoch": 0.73, + "learning_rate": 5.4021203060075335e-08, + "loss": 0.0005, + "step": 37641 + }, + { + "epoch": 0.73, + "learning_rate": 5.401731971573919e-08, + "loss": 0.0005, + "step": 37642 + }, + { + "epoch": 0.73, + "learning_rate": 5.401343637140305e-08, + "loss": 0.0006, + "step": 37643 + }, + { + "epoch": 0.73, + "learning_rate": 5.400955302706691e-08, + "loss": 0.0006, + "step": 37644 + }, + { + "epoch": 0.73, + "learning_rate": 5.400566968273077e-08, + "loss": 0.0152, + "step": 37645 + }, + { + "epoch": 0.73, + "learning_rate": 5.4001786338394626e-08, + "loss": 0.0004, + "step": 37646 + }, + { + "epoch": 0.73, + "learning_rate": 5.3997902994058484e-08, + "loss": 0.0005, + "step": 37647 + }, + { + "epoch": 0.73, + "learning_rate": 5.3994019649722336e-08, + "loss": 0.0004, + "step": 37648 + }, + { + "epoch": 0.73, + "learning_rate": 5.3990136305386194e-08, + "loss": 0.0004, + "step": 37649 + }, + { + "epoch": 0.73, + "learning_rate": 5.398625296105005e-08, + "loss": 0.004, + "step": 37650 + }, + { + "epoch": 0.73, + "learning_rate": 5.398236961671391e-08, + "loss": 0.0005, + "step": 37651 + }, + { + "epoch": 0.73, + "learning_rate": 5.397848627237776e-08, + "loss": 0.0004, + "step": 37652 + }, + { + "epoch": 0.73, + "learning_rate": 5.397460292804162e-08, + "loss": 0.0004, + "step": 37653 + }, + { + "epoch": 0.73, + "learning_rate": 5.397071958370548e-08, + "loss": 0.0006, + "step": 37654 + }, + { + "epoch": 0.73, + "learning_rate": 5.396683623936934e-08, + "loss": 0.0004, + "step": 37655 + }, + { + "epoch": 0.73, + "learning_rate": 5.3962952895033195e-08, + "loss": 0.0005, + "step": 37656 + }, + { + "epoch": 0.73, + "learning_rate": 5.3959069550697054e-08, + "loss": 0.0009, + "step": 37657 + }, + { + "epoch": 0.73, + "learning_rate": 5.395518620636091e-08, + "loss": 0.0005, + "step": 37658 + }, + { + "epoch": 0.73, + "learning_rate": 5.395130286202477e-08, + "loss": 0.0005, + "step": 37659 + }, + { + "epoch": 0.73, + "learning_rate": 5.394741951768863e-08, + "loss": 0.0003, + "step": 37660 + }, + { + "epoch": 0.73, + "learning_rate": 5.3943536173352487e-08, + "loss": 0.0004, + "step": 37661 + }, + { + "epoch": 0.73, + "learning_rate": 5.3939652829016345e-08, + "loss": 0.0034, + "step": 37662 + }, + { + "epoch": 0.73, + "learning_rate": 5.39357694846802e-08, + "loss": 0.0022, + "step": 37663 + }, + { + "epoch": 0.73, + "learning_rate": 5.393188614034406e-08, + "loss": 0.0004, + "step": 37664 + }, + { + "epoch": 0.73, + "learning_rate": 5.392800279600792e-08, + "loss": 0.168, + "step": 37665 + }, + { + "epoch": 0.73, + "learning_rate": 5.392411945167178e-08, + "loss": 0.0006, + "step": 37666 + }, + { + "epoch": 0.73, + "learning_rate": 5.3920236107335636e-08, + "loss": 0.0009, + "step": 37667 + }, + { + "epoch": 0.73, + "learning_rate": 5.3916352762999494e-08, + "loss": 0.0004, + "step": 37668 + }, + { + "epoch": 0.73, + "learning_rate": 5.391246941866335e-08, + "loss": 0.0004, + "step": 37669 + }, + { + "epoch": 0.73, + "learning_rate": 5.390858607432721e-08, + "loss": 0.2491, + "step": 37670 + }, + { + "epoch": 0.73, + "learning_rate": 5.390470272999107e-08, + "loss": 0.0005, + "step": 37671 + }, + { + "epoch": 0.73, + "learning_rate": 5.390081938565493e-08, + "loss": 0.0005, + "step": 37672 + }, + { + "epoch": 0.73, + "learning_rate": 5.3896936041318786e-08, + "loss": 0.0005, + "step": 37673 + }, + { + "epoch": 0.73, + "learning_rate": 5.3893052696982644e-08, + "loss": 0.0005, + "step": 37674 + }, + { + "epoch": 0.73, + "learning_rate": 5.38891693526465e-08, + "loss": 0.0004, + "step": 37675 + }, + { + "epoch": 0.73, + "learning_rate": 5.388528600831036e-08, + "loss": 0.0006, + "step": 37676 + }, + { + "epoch": 0.73, + "learning_rate": 5.3881402663974205e-08, + "loss": 0.0005, + "step": 37677 + }, + { + "epoch": 0.73, + "learning_rate": 5.3877519319638064e-08, + "loss": 0.0005, + "step": 37678 + }, + { + "epoch": 0.73, + "learning_rate": 5.387363597530192e-08, + "loss": 0.0006, + "step": 37679 + }, + { + "epoch": 0.73, + "learning_rate": 5.386975263096578e-08, + "loss": 0.0004, + "step": 37680 + }, + { + "epoch": 0.73, + "learning_rate": 5.386586928662964e-08, + "loss": 0.0133, + "step": 37681 + }, + { + "epoch": 0.73, + "learning_rate": 5.3861985942293497e-08, + "loss": 0.0004, + "step": 37682 + }, + { + "epoch": 0.73, + "learning_rate": 5.3858102597957355e-08, + "loss": 0.0004, + "step": 37683 + }, + { + "epoch": 0.73, + "learning_rate": 5.385421925362121e-08, + "loss": 0.0003, + "step": 37684 + }, + { + "epoch": 0.73, + "learning_rate": 5.385033590928507e-08, + "loss": 0.0004, + "step": 37685 + }, + { + "epoch": 0.73, + "learning_rate": 5.384645256494893e-08, + "loss": 0.0005, + "step": 37686 + }, + { + "epoch": 0.73, + "learning_rate": 5.384256922061279e-08, + "loss": 0.0004, + "step": 37687 + }, + { + "epoch": 0.73, + "learning_rate": 5.3838685876276646e-08, + "loss": 0.0002, + "step": 37688 + }, + { + "epoch": 0.73, + "learning_rate": 5.3834802531940504e-08, + "loss": 0.0005, + "step": 37689 + }, + { + "epoch": 0.73, + "learning_rate": 5.383091918760436e-08, + "loss": 0.0006, + "step": 37690 + }, + { + "epoch": 0.73, + "learning_rate": 5.382703584326822e-08, + "loss": 0.0046, + "step": 37691 + }, + { + "epoch": 0.73, + "learning_rate": 5.382315249893208e-08, + "loss": 0.0005, + "step": 37692 + }, + { + "epoch": 0.73, + "learning_rate": 5.381926915459594e-08, + "loss": 0.0009, + "step": 37693 + }, + { + "epoch": 0.73, + "learning_rate": 5.3815385810259795e-08, + "loss": 0.0005, + "step": 37694 + }, + { + "epoch": 0.73, + "learning_rate": 5.3811502465923654e-08, + "loss": 0.0004, + "step": 37695 + }, + { + "epoch": 0.73, + "learning_rate": 5.380761912158751e-08, + "loss": 0.0003, + "step": 37696 + }, + { + "epoch": 0.73, + "learning_rate": 5.380373577725137e-08, + "loss": 0.0108, + "step": 37697 + }, + { + "epoch": 0.73, + "learning_rate": 5.379985243291523e-08, + "loss": 0.0005, + "step": 37698 + }, + { + "epoch": 0.73, + "learning_rate": 5.3795969088579087e-08, + "loss": 0.0006, + "step": 37699 + }, + { + "epoch": 0.73, + "learning_rate": 5.3792085744242945e-08, + "loss": 0.0006, + "step": 37700 + }, + { + "epoch": 0.73, + "learning_rate": 5.37882023999068e-08, + "loss": 0.0004, + "step": 37701 + }, + { + "epoch": 0.73, + "learning_rate": 5.378431905557066e-08, + "loss": 0.0005, + "step": 37702 + }, + { + "epoch": 0.73, + "learning_rate": 5.378043571123452e-08, + "loss": 0.0004, + "step": 37703 + }, + { + "epoch": 0.73, + "learning_rate": 5.377655236689838e-08, + "loss": 0.0005, + "step": 37704 + }, + { + "epoch": 0.73, + "learning_rate": 5.3772669022562236e-08, + "loss": 0.0004, + "step": 37705 + }, + { + "epoch": 0.73, + "learning_rate": 5.376878567822608e-08, + "loss": 0.0004, + "step": 37706 + }, + { + "epoch": 0.73, + "learning_rate": 5.376490233388994e-08, + "loss": 0.0004, + "step": 37707 + }, + { + "epoch": 0.73, + "learning_rate": 5.37610189895538e-08, + "loss": 0.0012, + "step": 37708 + }, + { + "epoch": 0.73, + "learning_rate": 5.3757135645217656e-08, + "loss": 0.0004, + "step": 37709 + }, + { + "epoch": 0.73, + "learning_rate": 5.3753252300881514e-08, + "loss": 0.0003, + "step": 37710 + }, + { + "epoch": 0.73, + "learning_rate": 5.374936895654537e-08, + "loss": 0.0004, + "step": 37711 + }, + { + "epoch": 0.73, + "learning_rate": 5.374548561220923e-08, + "loss": 0.0003, + "step": 37712 + }, + { + "epoch": 0.73, + "learning_rate": 5.374160226787309e-08, + "loss": 0.0006, + "step": 37713 + }, + { + "epoch": 0.73, + "learning_rate": 5.373771892353695e-08, + "loss": 0.0003, + "step": 37714 + }, + { + "epoch": 0.73, + "learning_rate": 5.3733835579200805e-08, + "loss": 0.0004, + "step": 37715 + }, + { + "epoch": 0.73, + "learning_rate": 5.3729952234864664e-08, + "loss": 1.0947, + "step": 37716 + }, + { + "epoch": 0.73, + "learning_rate": 5.372606889052852e-08, + "loss": 0.0003, + "step": 37717 + }, + { + "epoch": 0.73, + "learning_rate": 5.372218554619238e-08, + "loss": 0.0005, + "step": 37718 + }, + { + "epoch": 0.73, + "learning_rate": 5.371830220185624e-08, + "loss": 0.0003, + "step": 37719 + }, + { + "epoch": 0.73, + "learning_rate": 5.3714418857520097e-08, + "loss": 0.0005, + "step": 37720 + }, + { + "epoch": 0.73, + "learning_rate": 5.3710535513183955e-08, + "loss": 0.0005, + "step": 37721 + }, + { + "epoch": 0.73, + "learning_rate": 5.370665216884781e-08, + "loss": 0.0004, + "step": 37722 + }, + { + "epoch": 0.73, + "learning_rate": 5.370276882451167e-08, + "loss": 0.0004, + "step": 37723 + }, + { + "epoch": 0.73, + "learning_rate": 5.369888548017553e-08, + "loss": 0.5156, + "step": 37724 + }, + { + "epoch": 0.73, + "learning_rate": 5.369500213583939e-08, + "loss": 0.0005, + "step": 37725 + }, + { + "epoch": 0.73, + "learning_rate": 5.369111879150324e-08, + "loss": 0.0143, + "step": 37726 + }, + { + "epoch": 0.73, + "learning_rate": 5.36872354471671e-08, + "loss": 0.0006, + "step": 37727 + }, + { + "epoch": 0.73, + "learning_rate": 5.3683352102830956e-08, + "loss": 0.0007, + "step": 37728 + }, + { + "epoch": 0.73, + "learning_rate": 5.3679468758494814e-08, + "loss": 0.0004, + "step": 37729 + }, + { + "epoch": 0.73, + "learning_rate": 5.367558541415867e-08, + "loss": 0.0004, + "step": 37730 + }, + { + "epoch": 0.73, + "learning_rate": 5.367170206982253e-08, + "loss": 0.0008, + "step": 37731 + }, + { + "epoch": 0.73, + "learning_rate": 5.366781872548639e-08, + "loss": 0.0004, + "step": 37732 + }, + { + "epoch": 0.73, + "learning_rate": 5.366393538115025e-08, + "loss": 0.0004, + "step": 37733 + }, + { + "epoch": 0.73, + "learning_rate": 5.3660052036814105e-08, + "loss": 0.7249, + "step": 37734 + }, + { + "epoch": 0.73, + "learning_rate": 5.365616869247796e-08, + "loss": 0.0008, + "step": 37735 + }, + { + "epoch": 0.73, + "learning_rate": 5.3652285348141815e-08, + "loss": 0.0005, + "step": 37736 + }, + { + "epoch": 0.73, + "learning_rate": 5.3648402003805673e-08, + "loss": 0.0004, + "step": 37737 + }, + { + "epoch": 0.73, + "learning_rate": 5.364451865946953e-08, + "loss": 0.0004, + "step": 37738 + }, + { + "epoch": 0.73, + "learning_rate": 5.364063531513339e-08, + "loss": 0.0007, + "step": 37739 + }, + { + "epoch": 0.73, + "learning_rate": 5.363675197079724e-08, + "loss": 0.0005, + "step": 37740 + }, + { + "epoch": 0.73, + "learning_rate": 5.36328686264611e-08, + "loss": 0.0006, + "step": 37741 + }, + { + "epoch": 0.73, + "learning_rate": 5.362898528212496e-08, + "loss": 0.0918, + "step": 37742 + }, + { + "epoch": 0.73, + "learning_rate": 5.3625101937788816e-08, + "loss": 0.0007, + "step": 37743 + }, + { + "epoch": 0.73, + "learning_rate": 5.3621218593452675e-08, + "loss": 0.0006, + "step": 37744 + }, + { + "epoch": 0.73, + "learning_rate": 5.361733524911653e-08, + "loss": 0.0004, + "step": 37745 + }, + { + "epoch": 0.73, + "learning_rate": 5.361345190478039e-08, + "loss": 0.0004, + "step": 37746 + }, + { + "epoch": 0.73, + "learning_rate": 5.360956856044425e-08, + "loss": 0.0002, + "step": 37747 + }, + { + "epoch": 0.73, + "learning_rate": 5.360568521610811e-08, + "loss": 0.0003, + "step": 37748 + }, + { + "epoch": 0.73, + "learning_rate": 5.3601801871771966e-08, + "loss": 0.0005, + "step": 37749 + }, + { + "epoch": 0.73, + "learning_rate": 5.3597918527435824e-08, + "loss": 0.0005, + "step": 37750 + }, + { + "epoch": 0.73, + "learning_rate": 5.359403518309968e-08, + "loss": 0.0029, + "step": 37751 + }, + { + "epoch": 0.73, + "learning_rate": 5.359015183876354e-08, + "loss": 0.0003, + "step": 37752 + }, + { + "epoch": 0.73, + "learning_rate": 5.35862684944274e-08, + "loss": 0.0006, + "step": 37753 + }, + { + "epoch": 0.73, + "learning_rate": 5.358238515009126e-08, + "loss": 0.0003, + "step": 37754 + }, + { + "epoch": 0.73, + "learning_rate": 5.3578501805755115e-08, + "loss": 0.0016, + "step": 37755 + }, + { + "epoch": 0.73, + "learning_rate": 5.3574618461418974e-08, + "loss": 0.0004, + "step": 37756 + }, + { + "epoch": 0.73, + "learning_rate": 5.357073511708283e-08, + "loss": 0.0011, + "step": 37757 + }, + { + "epoch": 0.73, + "learning_rate": 5.356685177274669e-08, + "loss": 0.9617, + "step": 37758 + }, + { + "epoch": 0.73, + "learning_rate": 5.356296842841055e-08, + "loss": 0.0035, + "step": 37759 + }, + { + "epoch": 0.73, + "learning_rate": 5.3559085084074407e-08, + "loss": 0.0244, + "step": 37760 + }, + { + "epoch": 0.73, + "learning_rate": 5.3555201739738265e-08, + "loss": 0.0005, + "step": 37761 + }, + { + "epoch": 0.73, + "learning_rate": 5.355131839540212e-08, + "loss": 0.0004, + "step": 37762 + }, + { + "epoch": 0.73, + "learning_rate": 5.354743505106598e-08, + "loss": 1.011, + "step": 37763 + }, + { + "epoch": 0.73, + "learning_rate": 5.3543551706729826e-08, + "loss": 0.0008, + "step": 37764 + }, + { + "epoch": 0.73, + "learning_rate": 5.3539668362393684e-08, + "loss": 0.0007, + "step": 37765 + }, + { + "epoch": 0.73, + "learning_rate": 5.353578501805754e-08, + "loss": 0.0005, + "step": 37766 + }, + { + "epoch": 0.73, + "learning_rate": 5.35319016737214e-08, + "loss": 0.0003, + "step": 37767 + }, + { + "epoch": 0.73, + "learning_rate": 5.352801832938526e-08, + "loss": 0.0447, + "step": 37768 + }, + { + "epoch": 0.73, + "learning_rate": 5.352413498504912e-08, + "loss": 0.0006, + "step": 37769 + }, + { + "epoch": 0.73, + "learning_rate": 5.3520251640712976e-08, + "loss": 0.0005, + "step": 37770 + }, + { + "epoch": 0.73, + "learning_rate": 5.3516368296376834e-08, + "loss": 0.0004, + "step": 37771 + }, + { + "epoch": 0.73, + "learning_rate": 5.351248495204069e-08, + "loss": 0.0004, + "step": 37772 + }, + { + "epoch": 0.73, + "learning_rate": 5.350860160770455e-08, + "loss": 0.008, + "step": 37773 + }, + { + "epoch": 0.73, + "learning_rate": 5.350471826336841e-08, + "loss": 0.0005, + "step": 37774 + }, + { + "epoch": 0.73, + "learning_rate": 5.350083491903227e-08, + "loss": 0.0004, + "step": 37775 + }, + { + "epoch": 0.73, + "learning_rate": 5.3496951574696125e-08, + "loss": 0.0006, + "step": 37776 + }, + { + "epoch": 0.73, + "learning_rate": 5.3493068230359983e-08, + "loss": 0.0004, + "step": 37777 + }, + { + "epoch": 0.73, + "learning_rate": 5.348918488602384e-08, + "loss": 0.0003, + "step": 37778 + }, + { + "epoch": 0.73, + "learning_rate": 5.34853015416877e-08, + "loss": 0.0004, + "step": 37779 + }, + { + "epoch": 0.73, + "learning_rate": 5.348141819735156e-08, + "loss": 0.0006, + "step": 37780 + }, + { + "epoch": 0.73, + "learning_rate": 5.3477534853015416e-08, + "loss": 0.0003, + "step": 37781 + }, + { + "epoch": 0.73, + "learning_rate": 5.3473651508679275e-08, + "loss": 0.0004, + "step": 37782 + }, + { + "epoch": 0.73, + "learning_rate": 5.346976816434313e-08, + "loss": 0.0005, + "step": 37783 + }, + { + "epoch": 0.73, + "learning_rate": 5.346588482000699e-08, + "loss": 0.0003, + "step": 37784 + }, + { + "epoch": 0.73, + "learning_rate": 5.346200147567085e-08, + "loss": 0.0004, + "step": 37785 + }, + { + "epoch": 0.73, + "learning_rate": 5.345811813133471e-08, + "loss": 0.0008, + "step": 37786 + }, + { + "epoch": 0.73, + "learning_rate": 5.3454234786998566e-08, + "loss": 0.0004, + "step": 37787 + }, + { + "epoch": 0.73, + "learning_rate": 5.3450351442662424e-08, + "loss": 0.0005, + "step": 37788 + }, + { + "epoch": 0.73, + "learning_rate": 5.344646809832628e-08, + "loss": 0.0004, + "step": 37789 + }, + { + "epoch": 0.73, + "learning_rate": 5.344258475399014e-08, + "loss": 0.0006, + "step": 37790 + }, + { + "epoch": 0.73, + "learning_rate": 5.3438701409654e-08, + "loss": 0.0003, + "step": 37791 + }, + { + "epoch": 0.73, + "learning_rate": 5.343481806531786e-08, + "loss": 0.0026, + "step": 37792 + }, + { + "epoch": 0.73, + "learning_rate": 5.34309347209817e-08, + "loss": 0.0003, + "step": 37793 + }, + { + "epoch": 0.73, + "learning_rate": 5.342705137664556e-08, + "loss": 0.0003, + "step": 37794 + }, + { + "epoch": 0.73, + "learning_rate": 5.342316803230942e-08, + "loss": 0.0005, + "step": 37795 + }, + { + "epoch": 0.73, + "learning_rate": 5.341928468797328e-08, + "loss": 0.0005, + "step": 37796 + }, + { + "epoch": 0.73, + "learning_rate": 5.3415401343637135e-08, + "loss": 0.0002, + "step": 37797 + }, + { + "epoch": 0.73, + "learning_rate": 5.3411517999300993e-08, + "loss": 1.2887, + "step": 37798 + }, + { + "epoch": 0.73, + "learning_rate": 5.340763465496485e-08, + "loss": 0.5935, + "step": 37799 + }, + { + "epoch": 0.73, + "learning_rate": 5.340375131062871e-08, + "loss": 0.0003, + "step": 37800 + }, + { + "epoch": 0.73, + "learning_rate": 5.339986796629257e-08, + "loss": 0.0004, + "step": 37801 + }, + { + "epoch": 0.73, + "learning_rate": 5.3395984621956426e-08, + "loss": 0.0005, + "step": 37802 + }, + { + "epoch": 0.73, + "learning_rate": 5.3392101277620285e-08, + "loss": 0.0324, + "step": 37803 + }, + { + "epoch": 0.73, + "learning_rate": 5.338821793328414e-08, + "loss": 0.0004, + "step": 37804 + }, + { + "epoch": 0.73, + "learning_rate": 5.3384334588948e-08, + "loss": 0.7179, + "step": 37805 + }, + { + "epoch": 0.73, + "learning_rate": 5.338045124461186e-08, + "loss": 0.0005, + "step": 37806 + }, + { + "epoch": 0.73, + "learning_rate": 5.337656790027572e-08, + "loss": 0.0005, + "step": 37807 + }, + { + "epoch": 0.73, + "learning_rate": 5.3372684555939576e-08, + "loss": 0.9331, + "step": 37808 + }, + { + "epoch": 0.73, + "learning_rate": 5.3368801211603434e-08, + "loss": 0.0004, + "step": 37809 + }, + { + "epoch": 0.73, + "learning_rate": 5.336491786726729e-08, + "loss": 0.0038, + "step": 37810 + }, + { + "epoch": 0.73, + "learning_rate": 5.336103452293115e-08, + "loss": 0.0005, + "step": 37811 + }, + { + "epoch": 0.73, + "learning_rate": 5.335715117859501e-08, + "loss": 0.0004, + "step": 37812 + }, + { + "epoch": 0.73, + "learning_rate": 5.335326783425887e-08, + "loss": 0.0004, + "step": 37813 + }, + { + "epoch": 0.73, + "learning_rate": 5.334938448992272e-08, + "loss": 0.0023, + "step": 37814 + }, + { + "epoch": 0.73, + "learning_rate": 5.334550114558658e-08, + "loss": 0.5399, + "step": 37815 + }, + { + "epoch": 0.73, + "learning_rate": 5.3341617801250435e-08, + "loss": 0.0004, + "step": 37816 + }, + { + "epoch": 0.73, + "learning_rate": 5.3337734456914293e-08, + "loss": 0.0004, + "step": 37817 + }, + { + "epoch": 0.73, + "learning_rate": 5.333385111257815e-08, + "loss": 0.0004, + "step": 37818 + }, + { + "epoch": 0.73, + "learning_rate": 5.332996776824201e-08, + "loss": 0.0004, + "step": 37819 + }, + { + "epoch": 0.73, + "learning_rate": 5.332608442390587e-08, + "loss": 0.006, + "step": 37820 + }, + { + "epoch": 0.73, + "learning_rate": 5.3322201079569726e-08, + "loss": 0.0003, + "step": 37821 + }, + { + "epoch": 0.73, + "learning_rate": 5.331831773523358e-08, + "loss": 0.0004, + "step": 37822 + }, + { + "epoch": 0.73, + "learning_rate": 5.3314434390897436e-08, + "loss": 0.5481, + "step": 37823 + }, + { + "epoch": 0.73, + "learning_rate": 5.3310551046561294e-08, + "loss": 0.0005, + "step": 37824 + }, + { + "epoch": 0.73, + "learning_rate": 5.330666770222515e-08, + "loss": 0.0005, + "step": 37825 + }, + { + "epoch": 0.73, + "learning_rate": 5.330278435788901e-08, + "loss": 1.325, + "step": 37826 + }, + { + "epoch": 0.73, + "learning_rate": 5.329890101355287e-08, + "loss": 0.0004, + "step": 37827 + }, + { + "epoch": 0.73, + "learning_rate": 5.329501766921673e-08, + "loss": 0.0004, + "step": 37828 + }, + { + "epoch": 0.73, + "learning_rate": 5.329113432488058e-08, + "loss": 0.0003, + "step": 37829 + }, + { + "epoch": 0.73, + "learning_rate": 5.328725098054444e-08, + "loss": 0.0004, + "step": 37830 + }, + { + "epoch": 0.73, + "learning_rate": 5.3283367636208296e-08, + "loss": 0.0005, + "step": 37831 + }, + { + "epoch": 0.73, + "learning_rate": 5.3279484291872154e-08, + "loss": 0.0004, + "step": 37832 + }, + { + "epoch": 0.73, + "learning_rate": 5.327560094753601e-08, + "loss": 0.0007, + "step": 37833 + }, + { + "epoch": 0.73, + "learning_rate": 5.327171760319987e-08, + "loss": 0.0004, + "step": 37834 + }, + { + "epoch": 0.73, + "learning_rate": 5.326783425886373e-08, + "loss": 0.0005, + "step": 37835 + }, + { + "epoch": 0.73, + "learning_rate": 5.326395091452759e-08, + "loss": 0.0003, + "step": 37836 + }, + { + "epoch": 0.73, + "learning_rate": 5.3260067570191445e-08, + "loss": 0.0006, + "step": 37837 + }, + { + "epoch": 0.73, + "learning_rate": 5.32561842258553e-08, + "loss": 0.0003, + "step": 37838 + }, + { + "epoch": 0.73, + "learning_rate": 5.325230088151916e-08, + "loss": 0.0006, + "step": 37839 + }, + { + "epoch": 0.73, + "learning_rate": 5.324841753718302e-08, + "loss": 0.0006, + "step": 37840 + }, + { + "epoch": 0.73, + "learning_rate": 5.324453419284688e-08, + "loss": 0.0008, + "step": 37841 + }, + { + "epoch": 0.73, + "learning_rate": 5.3240650848510736e-08, + "loss": 0.0063, + "step": 37842 + }, + { + "epoch": 0.73, + "learning_rate": 5.3236767504174594e-08, + "loss": 0.5697, + "step": 37843 + }, + { + "epoch": 0.73, + "learning_rate": 5.323288415983845e-08, + "loss": 1.097, + "step": 37844 + }, + { + "epoch": 0.73, + "learning_rate": 5.322900081550231e-08, + "loss": 0.0005, + "step": 37845 + }, + { + "epoch": 0.73, + "learning_rate": 5.322511747116617e-08, + "loss": 0.0004, + "step": 37846 + }, + { + "epoch": 0.73, + "learning_rate": 5.322123412683003e-08, + "loss": 0.0019, + "step": 37847 + }, + { + "epoch": 0.73, + "learning_rate": 5.3217350782493886e-08, + "loss": 0.0014, + "step": 37848 + }, + { + "epoch": 0.73, + "learning_rate": 5.3213467438157744e-08, + "loss": 0.0004, + "step": 37849 + }, + { + "epoch": 0.73, + "learning_rate": 5.32095840938216e-08, + "loss": 0.0007, + "step": 37850 + }, + { + "epoch": 0.73, + "learning_rate": 5.320570074948545e-08, + "loss": 0.0006, + "step": 37851 + }, + { + "epoch": 0.73, + "learning_rate": 5.3201817405149305e-08, + "loss": 0.0006, + "step": 37852 + }, + { + "epoch": 0.73, + "learning_rate": 5.3197934060813164e-08, + "loss": 0.0004, + "step": 37853 + }, + { + "epoch": 0.73, + "learning_rate": 5.319405071647702e-08, + "loss": 0.0006, + "step": 37854 + }, + { + "epoch": 0.73, + "learning_rate": 5.319016737214088e-08, + "loss": 0.0006, + "step": 37855 + }, + { + "epoch": 0.73, + "learning_rate": 5.318628402780474e-08, + "loss": 0.3137, + "step": 37856 + }, + { + "epoch": 0.73, + "learning_rate": 5.3182400683468597e-08, + "loss": 0.0004, + "step": 37857 + }, + { + "epoch": 0.73, + "learning_rate": 5.3178517339132455e-08, + "loss": 0.0005, + "step": 37858 + }, + { + "epoch": 0.73, + "learning_rate": 5.317463399479631e-08, + "loss": 0.0005, + "step": 37859 + }, + { + "epoch": 0.73, + "learning_rate": 5.317075065046017e-08, + "loss": 0.0004, + "step": 37860 + }, + { + "epoch": 0.73, + "learning_rate": 5.316686730612403e-08, + "loss": 0.0003, + "step": 37861 + }, + { + "epoch": 0.73, + "learning_rate": 5.316298396178789e-08, + "loss": 0.0519, + "step": 37862 + }, + { + "epoch": 0.73, + "learning_rate": 5.3159100617451746e-08, + "loss": 0.0009, + "step": 37863 + }, + { + "epoch": 0.73, + "learning_rate": 5.3155217273115604e-08, + "loss": 0.0008, + "step": 37864 + }, + { + "epoch": 0.73, + "learning_rate": 5.315133392877946e-08, + "loss": 0.0004, + "step": 37865 + }, + { + "epoch": 0.73, + "learning_rate": 5.314745058444332e-08, + "loss": 0.0005, + "step": 37866 + }, + { + "epoch": 0.73, + "learning_rate": 5.314356724010718e-08, + "loss": 0.0005, + "step": 37867 + }, + { + "epoch": 0.73, + "learning_rate": 5.313968389577104e-08, + "loss": 0.0006, + "step": 37868 + }, + { + "epoch": 0.73, + "learning_rate": 5.3135800551434896e-08, + "loss": 0.0883, + "step": 37869 + }, + { + "epoch": 0.73, + "learning_rate": 5.3131917207098754e-08, + "loss": 0.0012, + "step": 37870 + }, + { + "epoch": 0.73, + "learning_rate": 5.312803386276261e-08, + "loss": 0.004, + "step": 37871 + }, + { + "epoch": 0.73, + "learning_rate": 5.312415051842647e-08, + "loss": 0.0006, + "step": 37872 + }, + { + "epoch": 0.73, + "learning_rate": 5.312026717409033e-08, + "loss": 0.0004, + "step": 37873 + }, + { + "epoch": 0.73, + "learning_rate": 5.311638382975419e-08, + "loss": 0.0004, + "step": 37874 + }, + { + "epoch": 0.73, + "learning_rate": 5.3112500485418045e-08, + "loss": 0.0011, + "step": 37875 + }, + { + "epoch": 0.73, + "learning_rate": 5.31086171410819e-08, + "loss": 0.0078, + "step": 37876 + }, + { + "epoch": 0.73, + "learning_rate": 5.310473379674576e-08, + "loss": 0.0004, + "step": 37877 + }, + { + "epoch": 0.73, + "learning_rate": 5.310085045240962e-08, + "loss": 0.0005, + "step": 37878 + }, + { + "epoch": 0.73, + "learning_rate": 5.309696710807348e-08, + "loss": 0.0004, + "step": 37879 + }, + { + "epoch": 0.73, + "learning_rate": 5.309308376373732e-08, + "loss": 0.0004, + "step": 37880 + }, + { + "epoch": 0.73, + "learning_rate": 5.308920041940118e-08, + "loss": 0.0004, + "step": 37881 + }, + { + "epoch": 0.73, + "learning_rate": 5.308531707506504e-08, + "loss": 0.0008, + "step": 37882 + }, + { + "epoch": 0.73, + "learning_rate": 5.30814337307289e-08, + "loss": 0.3199, + "step": 37883 + }, + { + "epoch": 0.73, + "learning_rate": 5.3077550386392756e-08, + "loss": 0.0005, + "step": 37884 + }, + { + "epoch": 0.73, + "learning_rate": 5.3073667042056614e-08, + "loss": 0.0004, + "step": 37885 + }, + { + "epoch": 0.73, + "learning_rate": 5.306978369772047e-08, + "loss": 0.0052, + "step": 37886 + }, + { + "epoch": 0.73, + "learning_rate": 5.306590035338433e-08, + "loss": 0.0003, + "step": 37887 + }, + { + "epoch": 0.73, + "learning_rate": 5.306201700904819e-08, + "loss": 0.0027, + "step": 37888 + }, + { + "epoch": 0.73, + "learning_rate": 5.305813366471205e-08, + "loss": 0.0027, + "step": 37889 + }, + { + "epoch": 0.73, + "learning_rate": 5.3054250320375905e-08, + "loss": 0.0003, + "step": 37890 + }, + { + "epoch": 0.74, + "learning_rate": 5.3050366976039764e-08, + "loss": 0.0003, + "step": 37891 + }, + { + "epoch": 0.74, + "learning_rate": 5.304648363170362e-08, + "loss": 0.0005, + "step": 37892 + }, + { + "epoch": 0.74, + "learning_rate": 5.304260028736748e-08, + "loss": 0.0003, + "step": 37893 + }, + { + "epoch": 0.74, + "learning_rate": 5.303871694303134e-08, + "loss": 0.0004, + "step": 37894 + }, + { + "epoch": 0.74, + "learning_rate": 5.30348335986952e-08, + "loss": 0.017, + "step": 37895 + }, + { + "epoch": 0.74, + "learning_rate": 5.3030950254359055e-08, + "loss": 0.0004, + "step": 37896 + }, + { + "epoch": 0.74, + "learning_rate": 5.302706691002291e-08, + "loss": 0.0004, + "step": 37897 + }, + { + "epoch": 0.74, + "learning_rate": 5.302318356568677e-08, + "loss": 0.0005, + "step": 37898 + }, + { + "epoch": 0.74, + "learning_rate": 5.301930022135063e-08, + "loss": 0.0005, + "step": 37899 + }, + { + "epoch": 0.74, + "learning_rate": 5.301541687701449e-08, + "loss": 0.0005, + "step": 37900 + }, + { + "epoch": 0.74, + "learning_rate": 5.3011533532678346e-08, + "loss": 0.0048, + "step": 37901 + }, + { + "epoch": 0.74, + "learning_rate": 5.3007650188342204e-08, + "loss": 0.0004, + "step": 37902 + }, + { + "epoch": 0.74, + "learning_rate": 5.3003766844006056e-08, + "loss": 0.0008, + "step": 37903 + }, + { + "epoch": 0.74, + "learning_rate": 5.2999883499669914e-08, + "loss": 0.0006, + "step": 37904 + }, + { + "epoch": 0.74, + "learning_rate": 5.299600015533377e-08, + "loss": 0.0004, + "step": 37905 + }, + { + "epoch": 0.74, + "learning_rate": 5.299211681099763e-08, + "loss": 0.0791, + "step": 37906 + }, + { + "epoch": 0.74, + "learning_rate": 5.298823346666149e-08, + "loss": 0.0004, + "step": 37907 + }, + { + "epoch": 0.74, + "learning_rate": 5.298435012232535e-08, + "loss": 0.0005, + "step": 37908 + }, + { + "epoch": 0.74, + "learning_rate": 5.29804667779892e-08, + "loss": 0.0006, + "step": 37909 + }, + { + "epoch": 0.74, + "learning_rate": 5.297658343365306e-08, + "loss": 0.0004, + "step": 37910 + }, + { + "epoch": 0.74, + "learning_rate": 5.2972700089316915e-08, + "loss": 0.0003, + "step": 37911 + }, + { + "epoch": 0.74, + "learning_rate": 5.2968816744980774e-08, + "loss": 0.0004, + "step": 37912 + }, + { + "epoch": 0.74, + "learning_rate": 5.296493340064463e-08, + "loss": 0.0004, + "step": 37913 + }, + { + "epoch": 0.74, + "learning_rate": 5.296105005630849e-08, + "loss": 0.0006, + "step": 37914 + }, + { + "epoch": 0.74, + "learning_rate": 5.295716671197235e-08, + "loss": 0.0004, + "step": 37915 + }, + { + "epoch": 0.74, + "learning_rate": 5.2953283367636207e-08, + "loss": 0.0006, + "step": 37916 + }, + { + "epoch": 0.74, + "learning_rate": 5.294940002330006e-08, + "loss": 0.0005, + "step": 37917 + }, + { + "epoch": 0.74, + "learning_rate": 5.2945516678963916e-08, + "loss": 0.0007, + "step": 37918 + }, + { + "epoch": 0.74, + "learning_rate": 5.2941633334627775e-08, + "loss": 0.0111, + "step": 37919 + }, + { + "epoch": 0.74, + "learning_rate": 5.293774999029163e-08, + "loss": 0.0004, + "step": 37920 + }, + { + "epoch": 0.74, + "learning_rate": 5.293386664595549e-08, + "loss": 0.0004, + "step": 37921 + }, + { + "epoch": 0.74, + "learning_rate": 5.292998330161935e-08, + "loss": 0.0004, + "step": 37922 + }, + { + "epoch": 0.74, + "learning_rate": 5.292609995728321e-08, + "loss": 0.0005, + "step": 37923 + }, + { + "epoch": 0.74, + "learning_rate": 5.2922216612947066e-08, + "loss": 0.0005, + "step": 37924 + }, + { + "epoch": 0.74, + "learning_rate": 5.2918333268610924e-08, + "loss": 0.0005, + "step": 37925 + }, + { + "epoch": 0.74, + "learning_rate": 5.291444992427478e-08, + "loss": 0.0029, + "step": 37926 + }, + { + "epoch": 0.74, + "learning_rate": 5.291056657993864e-08, + "loss": 0.0006, + "step": 37927 + }, + { + "epoch": 0.74, + "learning_rate": 5.29066832356025e-08, + "loss": 0.0008, + "step": 37928 + }, + { + "epoch": 0.74, + "learning_rate": 5.290279989126636e-08, + "loss": 0.0003, + "step": 37929 + }, + { + "epoch": 0.74, + "learning_rate": 5.2898916546930215e-08, + "loss": 0.0004, + "step": 37930 + }, + { + "epoch": 0.74, + "learning_rate": 5.2895033202594074e-08, + "loss": 0.0003, + "step": 37931 + }, + { + "epoch": 0.74, + "learning_rate": 5.289114985825793e-08, + "loss": 0.7795, + "step": 37932 + }, + { + "epoch": 0.74, + "learning_rate": 5.288726651392179e-08, + "loss": 0.0006, + "step": 37933 + }, + { + "epoch": 0.74, + "learning_rate": 5.288338316958565e-08, + "loss": 0.0011, + "step": 37934 + }, + { + "epoch": 0.74, + "learning_rate": 5.2879499825249507e-08, + "loss": 0.0003, + "step": 37935 + }, + { + "epoch": 0.74, + "learning_rate": 5.2875616480913365e-08, + "loss": 0.0004, + "step": 37936 + }, + { + "epoch": 0.74, + "learning_rate": 5.287173313657722e-08, + "loss": 0.0006, + "step": 37937 + }, + { + "epoch": 0.74, + "learning_rate": 5.286784979224107e-08, + "loss": 0.0042, + "step": 37938 + }, + { + "epoch": 0.74, + "learning_rate": 5.2863966447904926e-08, + "loss": 0.0005, + "step": 37939 + }, + { + "epoch": 0.74, + "learning_rate": 5.2860083103568785e-08, + "loss": 0.0021, + "step": 37940 + }, + { + "epoch": 0.74, + "learning_rate": 5.285619975923264e-08, + "loss": 0.0005, + "step": 37941 + }, + { + "epoch": 0.74, + "learning_rate": 5.28523164148965e-08, + "loss": 0.0003, + "step": 37942 + }, + { + "epoch": 0.74, + "learning_rate": 5.284843307056036e-08, + "loss": 0.0004, + "step": 37943 + }, + { + "epoch": 0.74, + "learning_rate": 5.284454972622422e-08, + "loss": 0.0004, + "step": 37944 + }, + { + "epoch": 0.74, + "learning_rate": 5.2840666381888076e-08, + "loss": 0.0003, + "step": 37945 + }, + { + "epoch": 0.74, + "learning_rate": 5.2836783037551934e-08, + "loss": 0.0003, + "step": 37946 + }, + { + "epoch": 0.74, + "learning_rate": 5.283289969321579e-08, + "loss": 0.0004, + "step": 37947 + }, + { + "epoch": 0.74, + "learning_rate": 5.282901634887965e-08, + "loss": 0.0007, + "step": 37948 + }, + { + "epoch": 0.74, + "learning_rate": 5.282513300454351e-08, + "loss": 0.0003, + "step": 37949 + }, + { + "epoch": 0.74, + "learning_rate": 5.282124966020737e-08, + "loss": 0.0005, + "step": 37950 + }, + { + "epoch": 0.74, + "learning_rate": 5.2817366315871225e-08, + "loss": 0.0005, + "step": 37951 + }, + { + "epoch": 0.74, + "learning_rate": 5.2813482971535084e-08, + "loss": 0.0004, + "step": 37952 + }, + { + "epoch": 0.74, + "learning_rate": 5.280959962719894e-08, + "loss": 0.0053, + "step": 37953 + }, + { + "epoch": 0.74, + "learning_rate": 5.28057162828628e-08, + "loss": 0.0004, + "step": 37954 + }, + { + "epoch": 0.74, + "learning_rate": 5.280183293852666e-08, + "loss": 0.0045, + "step": 37955 + }, + { + "epoch": 0.74, + "learning_rate": 5.2797949594190517e-08, + "loss": 0.0004, + "step": 37956 + }, + { + "epoch": 0.74, + "learning_rate": 5.2794066249854375e-08, + "loss": 0.5307, + "step": 37957 + }, + { + "epoch": 0.74, + "learning_rate": 5.279018290551823e-08, + "loss": 0.0005, + "step": 37958 + }, + { + "epoch": 0.74, + "learning_rate": 5.278629956118209e-08, + "loss": 0.0004, + "step": 37959 + }, + { + "epoch": 0.74, + "learning_rate": 5.278241621684595e-08, + "loss": 0.0099, + "step": 37960 + }, + { + "epoch": 0.74, + "learning_rate": 5.277853287250981e-08, + "loss": 0.0004, + "step": 37961 + }, + { + "epoch": 0.74, + "learning_rate": 5.2774649528173666e-08, + "loss": 0.0005, + "step": 37962 + }, + { + "epoch": 0.74, + "learning_rate": 5.2770766183837524e-08, + "loss": 0.0004, + "step": 37963 + }, + { + "epoch": 0.74, + "learning_rate": 5.276688283950138e-08, + "loss": 0.0003, + "step": 37964 + }, + { + "epoch": 0.74, + "learning_rate": 5.276299949516524e-08, + "loss": 0.0004, + "step": 37965 + }, + { + "epoch": 0.74, + "learning_rate": 5.27591161508291e-08, + "loss": 0.0002, + "step": 37966 + }, + { + "epoch": 0.74, + "learning_rate": 5.2755232806492944e-08, + "loss": 0.0004, + "step": 37967 + }, + { + "epoch": 0.74, + "learning_rate": 5.27513494621568e-08, + "loss": 1.3451, + "step": 37968 + }, + { + "epoch": 0.74, + "learning_rate": 5.274746611782066e-08, + "loss": 0.0022, + "step": 37969 + }, + { + "epoch": 0.74, + "learning_rate": 5.274358277348452e-08, + "loss": 0.0008, + "step": 37970 + }, + { + "epoch": 0.74, + "learning_rate": 5.273969942914838e-08, + "loss": 0.038, + "step": 37971 + }, + { + "epoch": 0.74, + "learning_rate": 5.2735816084812235e-08, + "loss": 0.0004, + "step": 37972 + }, + { + "epoch": 0.74, + "learning_rate": 5.2731932740476093e-08, + "loss": 0.0005, + "step": 37973 + }, + { + "epoch": 0.74, + "learning_rate": 5.272804939613995e-08, + "loss": 0.0004, + "step": 37974 + }, + { + "epoch": 0.74, + "learning_rate": 5.272416605180381e-08, + "loss": 0.0002, + "step": 37975 + }, + { + "epoch": 0.74, + "learning_rate": 5.272028270746767e-08, + "loss": 0.0003, + "step": 37976 + }, + { + "epoch": 0.74, + "learning_rate": 5.2716399363131526e-08, + "loss": 0.0005, + "step": 37977 + }, + { + "epoch": 0.74, + "learning_rate": 5.2712516018795385e-08, + "loss": 0.0012, + "step": 37978 + }, + { + "epoch": 0.74, + "learning_rate": 5.270863267445924e-08, + "loss": 0.0005, + "step": 37979 + }, + { + "epoch": 0.74, + "learning_rate": 5.27047493301231e-08, + "loss": 0.0005, + "step": 37980 + }, + { + "epoch": 0.74, + "learning_rate": 5.270086598578696e-08, + "loss": 0.0004, + "step": 37981 + }, + { + "epoch": 0.74, + "learning_rate": 5.269698264145082e-08, + "loss": 0.0004, + "step": 37982 + }, + { + "epoch": 0.74, + "learning_rate": 5.2693099297114676e-08, + "loss": 0.0005, + "step": 37983 + }, + { + "epoch": 0.74, + "learning_rate": 5.2689215952778534e-08, + "loss": 0.3485, + "step": 37984 + }, + { + "epoch": 0.74, + "learning_rate": 5.268533260844239e-08, + "loss": 0.4195, + "step": 37985 + }, + { + "epoch": 0.74, + "learning_rate": 5.268144926410625e-08, + "loss": 0.972, + "step": 37986 + }, + { + "epoch": 0.74, + "learning_rate": 5.267756591977011e-08, + "loss": 0.0004, + "step": 37987 + }, + { + "epoch": 0.74, + "learning_rate": 5.267368257543397e-08, + "loss": 0.0004, + "step": 37988 + }, + { + "epoch": 0.74, + "learning_rate": 5.2669799231097825e-08, + "loss": 0.0013, + "step": 37989 + }, + { + "epoch": 0.74, + "learning_rate": 5.2665915886761684e-08, + "loss": 0.0004, + "step": 37990 + }, + { + "epoch": 0.74, + "learning_rate": 5.2662032542425535e-08, + "loss": 0.0004, + "step": 37991 + }, + { + "epoch": 0.74, + "learning_rate": 5.2658149198089393e-08, + "loss": 0.0005, + "step": 37992 + }, + { + "epoch": 0.74, + "learning_rate": 5.265426585375325e-08, + "loss": 0.0008, + "step": 37993 + }, + { + "epoch": 0.74, + "learning_rate": 5.265038250941711e-08, + "loss": 1.1526, + "step": 37994 + }, + { + "epoch": 0.74, + "learning_rate": 5.264649916508097e-08, + "loss": 0.0007, + "step": 37995 + }, + { + "epoch": 0.74, + "learning_rate": 5.264261582074482e-08, + "loss": 0.0004, + "step": 37996 + }, + { + "epoch": 0.74, + "learning_rate": 5.263873247640868e-08, + "loss": 0.0004, + "step": 37997 + }, + { + "epoch": 0.74, + "learning_rate": 5.2634849132072536e-08, + "loss": 0.0005, + "step": 37998 + }, + { + "epoch": 0.74, + "learning_rate": 5.2630965787736395e-08, + "loss": 0.0014, + "step": 37999 + }, + { + "epoch": 0.74, + "learning_rate": 5.262708244340025e-08, + "loss": 0.0004, + "step": 38000 + }, + { + "epoch": 0.74, + "learning_rate": 5.262319909906411e-08, + "loss": 0.0052, + "step": 38001 + }, + { + "epoch": 0.74, + "learning_rate": 5.261931575472797e-08, + "loss": 0.3815, + "step": 38002 + }, + { + "epoch": 0.74, + "learning_rate": 5.261543241039183e-08, + "loss": 0.1467, + "step": 38003 + }, + { + "epoch": 0.74, + "learning_rate": 5.2611549066055686e-08, + "loss": 0.0005, + "step": 38004 + }, + { + "epoch": 0.74, + "learning_rate": 5.2607665721719544e-08, + "loss": 0.0005, + "step": 38005 + }, + { + "epoch": 0.74, + "learning_rate": 5.2603782377383396e-08, + "loss": 0.0004, + "step": 38006 + }, + { + "epoch": 0.74, + "learning_rate": 5.2599899033047254e-08, + "loss": 0.1118, + "step": 38007 + }, + { + "epoch": 0.74, + "learning_rate": 5.259601568871111e-08, + "loss": 0.1039, + "step": 38008 + }, + { + "epoch": 0.74, + "learning_rate": 5.259213234437497e-08, + "loss": 0.0004, + "step": 38009 + }, + { + "epoch": 0.74, + "learning_rate": 5.258824900003883e-08, + "loss": 0.0003, + "step": 38010 + }, + { + "epoch": 0.74, + "learning_rate": 5.258436565570269e-08, + "loss": 0.0004, + "step": 38011 + }, + { + "epoch": 0.74, + "learning_rate": 5.2580482311366545e-08, + "loss": 0.0005, + "step": 38012 + }, + { + "epoch": 0.74, + "learning_rate": 5.2576598967030403e-08, + "loss": 0.0004, + "step": 38013 + }, + { + "epoch": 0.74, + "learning_rate": 5.257271562269426e-08, + "loss": 0.0005, + "step": 38014 + }, + { + "epoch": 0.74, + "learning_rate": 5.256883227835812e-08, + "loss": 0.0088, + "step": 38015 + }, + { + "epoch": 0.74, + "learning_rate": 5.256494893402198e-08, + "loss": 0.0024, + "step": 38016 + }, + { + "epoch": 0.74, + "learning_rate": 5.2561065589685836e-08, + "loss": 0.0389, + "step": 38017 + }, + { + "epoch": 0.74, + "learning_rate": 5.2557182245349695e-08, + "loss": 0.0005, + "step": 38018 + }, + { + "epoch": 0.74, + "learning_rate": 5.255329890101355e-08, + "loss": 0.0004, + "step": 38019 + }, + { + "epoch": 0.74, + "learning_rate": 5.254941555667741e-08, + "loss": 0.0005, + "step": 38020 + }, + { + "epoch": 0.74, + "learning_rate": 5.254553221234127e-08, + "loss": 0.0012, + "step": 38021 + }, + { + "epoch": 0.74, + "learning_rate": 5.254164886800513e-08, + "loss": 0.0005, + "step": 38022 + }, + { + "epoch": 0.74, + "learning_rate": 5.2537765523668986e-08, + "loss": 0.0006, + "step": 38023 + }, + { + "epoch": 0.74, + "learning_rate": 5.2533882179332844e-08, + "loss": 0.0006, + "step": 38024 + }, + { + "epoch": 0.74, + "learning_rate": 5.252999883499669e-08, + "loss": 0.0003, + "step": 38025 + }, + { + "epoch": 0.74, + "learning_rate": 5.252611549066055e-08, + "loss": 0.0005, + "step": 38026 + }, + { + "epoch": 0.74, + "learning_rate": 5.2522232146324406e-08, + "loss": 0.0004, + "step": 38027 + }, + { + "epoch": 0.74, + "learning_rate": 5.2518348801988264e-08, + "loss": 0.0035, + "step": 38028 + }, + { + "epoch": 0.74, + "learning_rate": 5.251446545765212e-08, + "loss": 0.0003, + "step": 38029 + }, + { + "epoch": 0.74, + "learning_rate": 5.251058211331598e-08, + "loss": 0.205, + "step": 38030 + }, + { + "epoch": 0.74, + "learning_rate": 5.250669876897984e-08, + "loss": 0.0004, + "step": 38031 + }, + { + "epoch": 0.74, + "learning_rate": 5.25028154246437e-08, + "loss": 0.0006, + "step": 38032 + }, + { + "epoch": 0.74, + "learning_rate": 5.2498932080307555e-08, + "loss": 0.0004, + "step": 38033 + }, + { + "epoch": 0.74, + "learning_rate": 5.249504873597141e-08, + "loss": 0.0006, + "step": 38034 + }, + { + "epoch": 0.74, + "learning_rate": 5.249116539163527e-08, + "loss": 0.0003, + "step": 38035 + }, + { + "epoch": 0.74, + "learning_rate": 5.248728204729913e-08, + "loss": 0.0004, + "step": 38036 + }, + { + "epoch": 0.74, + "learning_rate": 5.248339870296299e-08, + "loss": 0.0006, + "step": 38037 + }, + { + "epoch": 0.74, + "learning_rate": 5.2479515358626846e-08, + "loss": 0.3501, + "step": 38038 + }, + { + "epoch": 0.74, + "learning_rate": 5.2475632014290704e-08, + "loss": 0.0003, + "step": 38039 + }, + { + "epoch": 0.74, + "learning_rate": 5.247174866995456e-08, + "loss": 0.0005, + "step": 38040 + }, + { + "epoch": 0.74, + "learning_rate": 5.246786532561842e-08, + "loss": 0.0027, + "step": 38041 + }, + { + "epoch": 0.74, + "learning_rate": 5.246398198128228e-08, + "loss": 0.0006, + "step": 38042 + }, + { + "epoch": 0.74, + "learning_rate": 5.246009863694614e-08, + "loss": 0.1915, + "step": 38043 + }, + { + "epoch": 0.74, + "learning_rate": 5.2456215292609996e-08, + "loss": 0.0006, + "step": 38044 + }, + { + "epoch": 0.74, + "learning_rate": 5.2452331948273854e-08, + "loss": 0.0007, + "step": 38045 + }, + { + "epoch": 0.74, + "learning_rate": 5.244844860393771e-08, + "loss": 0.0005, + "step": 38046 + }, + { + "epoch": 0.74, + "learning_rate": 5.244456525960157e-08, + "loss": 0.0047, + "step": 38047 + }, + { + "epoch": 0.74, + "learning_rate": 5.244068191526543e-08, + "loss": 0.0005, + "step": 38048 + }, + { + "epoch": 0.74, + "learning_rate": 5.243679857092929e-08, + "loss": 0.0004, + "step": 38049 + }, + { + "epoch": 0.74, + "learning_rate": 5.2432915226593145e-08, + "loss": 0.0004, + "step": 38050 + }, + { + "epoch": 0.74, + "learning_rate": 5.2429031882257003e-08, + "loss": 0.0004, + "step": 38051 + }, + { + "epoch": 0.74, + "learning_rate": 5.242514853792086e-08, + "loss": 0.0007, + "step": 38052 + }, + { + "epoch": 0.74, + "learning_rate": 5.242126519358472e-08, + "loss": 0.0006, + "step": 38053 + }, + { + "epoch": 0.74, + "learning_rate": 5.2417381849248565e-08, + "loss": 1.1335, + "step": 38054 + }, + { + "epoch": 0.74, + "learning_rate": 5.241349850491242e-08, + "loss": 0.0004, + "step": 38055 + }, + { + "epoch": 0.74, + "learning_rate": 5.240961516057628e-08, + "loss": 0.0004, + "step": 38056 + }, + { + "epoch": 0.74, + "learning_rate": 5.240573181624014e-08, + "loss": 0.6531, + "step": 38057 + }, + { + "epoch": 0.74, + "learning_rate": 5.2401848471904e-08, + "loss": 0.0004, + "step": 38058 + }, + { + "epoch": 0.74, + "learning_rate": 5.2397965127567856e-08, + "loss": 0.6273, + "step": 38059 + }, + { + "epoch": 0.74, + "learning_rate": 5.2394081783231714e-08, + "loss": 0.0004, + "step": 38060 + }, + { + "epoch": 0.74, + "learning_rate": 5.239019843889557e-08, + "loss": 0.0005, + "step": 38061 + }, + { + "epoch": 0.74, + "learning_rate": 5.238631509455943e-08, + "loss": 0.0004, + "step": 38062 + }, + { + "epoch": 0.74, + "learning_rate": 5.238243175022329e-08, + "loss": 0.0003, + "step": 38063 + }, + { + "epoch": 0.74, + "learning_rate": 5.237854840588715e-08, + "loss": 0.6047, + "step": 38064 + }, + { + "epoch": 0.74, + "learning_rate": 5.2374665061551006e-08, + "loss": 0.0022, + "step": 38065 + }, + { + "epoch": 0.74, + "learning_rate": 5.2370781717214864e-08, + "loss": 0.3808, + "step": 38066 + }, + { + "epoch": 0.74, + "learning_rate": 5.236689837287872e-08, + "loss": 0.0006, + "step": 38067 + }, + { + "epoch": 0.74, + "learning_rate": 5.236301502854258e-08, + "loss": 0.0005, + "step": 38068 + }, + { + "epoch": 0.74, + "learning_rate": 5.235913168420644e-08, + "loss": 0.0008, + "step": 38069 + }, + { + "epoch": 0.74, + "learning_rate": 5.23552483398703e-08, + "loss": 0.0003, + "step": 38070 + }, + { + "epoch": 0.74, + "learning_rate": 5.2351364995534155e-08, + "loss": 0.0004, + "step": 38071 + }, + { + "epoch": 0.74, + "learning_rate": 5.234748165119801e-08, + "loss": 0.0005, + "step": 38072 + }, + { + "epoch": 0.74, + "learning_rate": 5.234359830686187e-08, + "loss": 0.0004, + "step": 38073 + }, + { + "epoch": 0.74, + "learning_rate": 5.233971496252573e-08, + "loss": 0.0003, + "step": 38074 + }, + { + "epoch": 0.74, + "learning_rate": 5.233583161818959e-08, + "loss": 0.0003, + "step": 38075 + }, + { + "epoch": 0.74, + "learning_rate": 5.2331948273853446e-08, + "loss": 0.0003, + "step": 38076 + }, + { + "epoch": 0.74, + "learning_rate": 5.2328064929517305e-08, + "loss": 0.033, + "step": 38077 + }, + { + "epoch": 0.74, + "learning_rate": 5.232418158518116e-08, + "loss": 0.0005, + "step": 38078 + }, + { + "epoch": 0.74, + "learning_rate": 5.232029824084502e-08, + "loss": 0.0005, + "step": 38079 + }, + { + "epoch": 0.74, + "learning_rate": 5.231641489650887e-08, + "loss": 0.0003, + "step": 38080 + }, + { + "epoch": 0.74, + "learning_rate": 5.231253155217273e-08, + "loss": 0.0004, + "step": 38081 + }, + { + "epoch": 0.74, + "learning_rate": 5.230864820783659e-08, + "loss": 0.0004, + "step": 38082 + }, + { + "epoch": 0.74, + "learning_rate": 5.230476486350044e-08, + "loss": 0.0005, + "step": 38083 + }, + { + "epoch": 0.74, + "learning_rate": 5.23008815191643e-08, + "loss": 0.0005, + "step": 38084 + }, + { + "epoch": 0.74, + "learning_rate": 5.229699817482816e-08, + "loss": 0.0004, + "step": 38085 + }, + { + "epoch": 0.74, + "learning_rate": 5.2293114830492015e-08, + "loss": 0.0005, + "step": 38086 + }, + { + "epoch": 0.74, + "learning_rate": 5.2289231486155874e-08, + "loss": 0.0005, + "step": 38087 + }, + { + "epoch": 0.74, + "learning_rate": 5.228534814181973e-08, + "loss": 0.0003, + "step": 38088 + }, + { + "epoch": 0.74, + "learning_rate": 5.228146479748359e-08, + "loss": 0.0005, + "step": 38089 + }, + { + "epoch": 0.74, + "learning_rate": 5.227758145314745e-08, + "loss": 0.0005, + "step": 38090 + }, + { + "epoch": 0.74, + "learning_rate": 5.227369810881131e-08, + "loss": 0.0009, + "step": 38091 + }, + { + "epoch": 0.74, + "learning_rate": 5.2269814764475165e-08, + "loss": 0.0022, + "step": 38092 + }, + { + "epoch": 0.74, + "learning_rate": 5.226593142013902e-08, + "loss": 0.0004, + "step": 38093 + }, + { + "epoch": 0.74, + "learning_rate": 5.2262048075802875e-08, + "loss": 0.0006, + "step": 38094 + }, + { + "epoch": 0.74, + "learning_rate": 5.225816473146673e-08, + "loss": 0.0004, + "step": 38095 + }, + { + "epoch": 0.74, + "learning_rate": 5.225428138713059e-08, + "loss": 0.0005, + "step": 38096 + }, + { + "epoch": 0.74, + "learning_rate": 5.225039804279445e-08, + "loss": 0.0008, + "step": 38097 + }, + { + "epoch": 0.74, + "learning_rate": 5.224651469845831e-08, + "loss": 1.2005, + "step": 38098 + }, + { + "epoch": 0.74, + "learning_rate": 5.2242631354122166e-08, + "loss": 0.001, + "step": 38099 + }, + { + "epoch": 0.74, + "learning_rate": 5.2238748009786024e-08, + "loss": 0.0006, + "step": 38100 + }, + { + "epoch": 0.74, + "learning_rate": 5.223486466544988e-08, + "loss": 0.0004, + "step": 38101 + }, + { + "epoch": 0.74, + "learning_rate": 5.223098132111374e-08, + "loss": 0.5789, + "step": 38102 + }, + { + "epoch": 0.74, + "learning_rate": 5.22270979767776e-08, + "loss": 0.0006, + "step": 38103 + }, + { + "epoch": 0.74, + "learning_rate": 5.222321463244146e-08, + "loss": 0.0005, + "step": 38104 + }, + { + "epoch": 0.74, + "learning_rate": 5.2219331288105316e-08, + "loss": 0.0005, + "step": 38105 + }, + { + "epoch": 0.74, + "learning_rate": 5.2215447943769174e-08, + "loss": 0.0007, + "step": 38106 + }, + { + "epoch": 0.74, + "learning_rate": 5.221156459943303e-08, + "loss": 0.0004, + "step": 38107 + }, + { + "epoch": 0.74, + "learning_rate": 5.220768125509689e-08, + "loss": 0.0003, + "step": 38108 + }, + { + "epoch": 0.74, + "learning_rate": 5.220379791076075e-08, + "loss": 0.0007, + "step": 38109 + }, + { + "epoch": 0.74, + "learning_rate": 5.219991456642461e-08, + "loss": 0.0004, + "step": 38110 + }, + { + "epoch": 0.74, + "learning_rate": 5.2196031222088465e-08, + "loss": 0.3326, + "step": 38111 + }, + { + "epoch": 0.74, + "learning_rate": 5.219214787775231e-08, + "loss": 0.916, + "step": 38112 + }, + { + "epoch": 0.74, + "learning_rate": 5.218826453341617e-08, + "loss": 0.1377, + "step": 38113 + }, + { + "epoch": 0.74, + "learning_rate": 5.2184381189080026e-08, + "loss": 0.0092, + "step": 38114 + }, + { + "epoch": 0.74, + "learning_rate": 5.2180497844743885e-08, + "loss": 0.0005, + "step": 38115 + }, + { + "epoch": 0.74, + "learning_rate": 5.217661450040774e-08, + "loss": 1.4348, + "step": 38116 + }, + { + "epoch": 0.74, + "learning_rate": 5.21727311560716e-08, + "loss": 0.0005, + "step": 38117 + }, + { + "epoch": 0.74, + "learning_rate": 5.216884781173546e-08, + "loss": 0.0004, + "step": 38118 + }, + { + "epoch": 0.74, + "learning_rate": 5.216496446739932e-08, + "loss": 0.2606, + "step": 38119 + }, + { + "epoch": 0.74, + "learning_rate": 5.2161081123063176e-08, + "loss": 0.0004, + "step": 38120 + }, + { + "epoch": 0.74, + "learning_rate": 5.2157197778727034e-08, + "loss": 0.0004, + "step": 38121 + }, + { + "epoch": 0.74, + "learning_rate": 5.215331443439089e-08, + "loss": 0.0003, + "step": 38122 + }, + { + "epoch": 0.74, + "learning_rate": 5.214943109005475e-08, + "loss": 0.0007, + "step": 38123 + }, + { + "epoch": 0.74, + "learning_rate": 5.214554774571861e-08, + "loss": 0.879, + "step": 38124 + }, + { + "epoch": 0.74, + "learning_rate": 5.214166440138247e-08, + "loss": 0.0003, + "step": 38125 + }, + { + "epoch": 0.74, + "learning_rate": 5.2137781057046325e-08, + "loss": 0.0004, + "step": 38126 + }, + { + "epoch": 0.74, + "learning_rate": 5.2133897712710184e-08, + "loss": 0.0211, + "step": 38127 + }, + { + "epoch": 0.74, + "learning_rate": 5.213001436837404e-08, + "loss": 0.0007, + "step": 38128 + }, + { + "epoch": 0.74, + "learning_rate": 5.21261310240379e-08, + "loss": 0.0004, + "step": 38129 + }, + { + "epoch": 0.74, + "learning_rate": 5.212224767970176e-08, + "loss": 0.0783, + "step": 38130 + }, + { + "epoch": 0.74, + "learning_rate": 5.2118364335365617e-08, + "loss": 0.0004, + "step": 38131 + }, + { + "epoch": 0.74, + "learning_rate": 5.2114480991029475e-08, + "loss": 0.0003, + "step": 38132 + }, + { + "epoch": 0.74, + "learning_rate": 5.211059764669333e-08, + "loss": 0.0037, + "step": 38133 + }, + { + "epoch": 0.74, + "learning_rate": 5.210671430235719e-08, + "loss": 0.0004, + "step": 38134 + }, + { + "epoch": 0.74, + "learning_rate": 5.210283095802105e-08, + "loss": 0.0007, + "step": 38135 + }, + { + "epoch": 0.74, + "learning_rate": 5.209894761368491e-08, + "loss": 0.0007, + "step": 38136 + }, + { + "epoch": 0.74, + "learning_rate": 5.2095064269348766e-08, + "loss": 1.284, + "step": 38137 + }, + { + "epoch": 0.74, + "learning_rate": 5.2091180925012624e-08, + "loss": 0.0004, + "step": 38138 + }, + { + "epoch": 0.74, + "learning_rate": 5.208729758067648e-08, + "loss": 0.0005, + "step": 38139 + }, + { + "epoch": 0.74, + "learning_rate": 5.208341423634034e-08, + "loss": 0.0005, + "step": 38140 + }, + { + "epoch": 0.74, + "learning_rate": 5.2079530892004186e-08, + "loss": 0.0005, + "step": 38141 + }, + { + "epoch": 0.74, + "learning_rate": 5.2075647547668044e-08, + "loss": 0.0005, + "step": 38142 + }, + { + "epoch": 0.74, + "learning_rate": 5.20717642033319e-08, + "loss": 0.0108, + "step": 38143 + }, + { + "epoch": 0.74, + "learning_rate": 5.206788085899576e-08, + "loss": 0.0006, + "step": 38144 + }, + { + "epoch": 0.74, + "learning_rate": 5.206399751465962e-08, + "loss": 0.6207, + "step": 38145 + }, + { + "epoch": 0.74, + "learning_rate": 5.206011417032348e-08, + "loss": 0.0006, + "step": 38146 + }, + { + "epoch": 0.74, + "learning_rate": 5.2056230825987335e-08, + "loss": 0.0004, + "step": 38147 + }, + { + "epoch": 0.74, + "learning_rate": 5.2052347481651194e-08, + "loss": 0.0007, + "step": 38148 + }, + { + "epoch": 0.74, + "learning_rate": 5.204846413731505e-08, + "loss": 0.0004, + "step": 38149 + }, + { + "epoch": 0.74, + "learning_rate": 5.204458079297891e-08, + "loss": 0.0004, + "step": 38150 + }, + { + "epoch": 0.74, + "learning_rate": 5.204069744864277e-08, + "loss": 0.0003, + "step": 38151 + }, + { + "epoch": 0.74, + "learning_rate": 5.2036814104306627e-08, + "loss": 0.0006, + "step": 38152 + }, + { + "epoch": 0.74, + "learning_rate": 5.2032930759970485e-08, + "loss": 0.0149, + "step": 38153 + }, + { + "epoch": 0.74, + "learning_rate": 5.202904741563434e-08, + "loss": 0.0008, + "step": 38154 + }, + { + "epoch": 0.74, + "learning_rate": 5.20251640712982e-08, + "loss": 0.0004, + "step": 38155 + }, + { + "epoch": 0.74, + "learning_rate": 5.202128072696206e-08, + "loss": 0.0722, + "step": 38156 + }, + { + "epoch": 0.74, + "learning_rate": 5.201739738262592e-08, + "loss": 0.0005, + "step": 38157 + }, + { + "epoch": 0.74, + "learning_rate": 5.2013514038289776e-08, + "loss": 0.0944, + "step": 38158 + }, + { + "epoch": 0.74, + "learning_rate": 5.2009630693953634e-08, + "loss": 0.0005, + "step": 38159 + }, + { + "epoch": 0.74, + "learning_rate": 5.200574734961749e-08, + "loss": 0.0011, + "step": 38160 + }, + { + "epoch": 0.74, + "learning_rate": 5.200186400528135e-08, + "loss": 0.0005, + "step": 38161 + }, + { + "epoch": 0.74, + "learning_rate": 5.199798066094521e-08, + "loss": 0.0005, + "step": 38162 + }, + { + "epoch": 0.74, + "learning_rate": 5.199409731660907e-08, + "loss": 0.0004, + "step": 38163 + }, + { + "epoch": 0.74, + "learning_rate": 5.1990213972272925e-08, + "loss": 0.0004, + "step": 38164 + }, + { + "epoch": 0.74, + "learning_rate": 5.1986330627936784e-08, + "loss": 0.0003, + "step": 38165 + }, + { + "epoch": 0.74, + "learning_rate": 5.198244728360064e-08, + "loss": 0.0008, + "step": 38166 + }, + { + "epoch": 0.74, + "learning_rate": 5.19785639392645e-08, + "loss": 0.0006, + "step": 38167 + }, + { + "epoch": 0.74, + "learning_rate": 5.197468059492835e-08, + "loss": 0.0006, + "step": 38168 + }, + { + "epoch": 0.74, + "learning_rate": 5.197079725059221e-08, + "loss": 0.0004, + "step": 38169 + }, + { + "epoch": 0.74, + "learning_rate": 5.196691390625606e-08, + "loss": 0.0005, + "step": 38170 + }, + { + "epoch": 0.74, + "learning_rate": 5.196303056191992e-08, + "loss": 0.0006, + "step": 38171 + }, + { + "epoch": 0.74, + "learning_rate": 5.195914721758378e-08, + "loss": 0.0004, + "step": 38172 + }, + { + "epoch": 0.74, + "learning_rate": 5.1955263873247636e-08, + "loss": 0.0004, + "step": 38173 + }, + { + "epoch": 0.74, + "learning_rate": 5.1951380528911495e-08, + "loss": 0.0005, + "step": 38174 + }, + { + "epoch": 0.74, + "learning_rate": 5.194749718457535e-08, + "loss": 0.0005, + "step": 38175 + }, + { + "epoch": 0.74, + "learning_rate": 5.194361384023921e-08, + "loss": 0.0006, + "step": 38176 + }, + { + "epoch": 0.74, + "learning_rate": 5.193973049590307e-08, + "loss": 0.0006, + "step": 38177 + }, + { + "epoch": 0.74, + "learning_rate": 5.193584715156693e-08, + "loss": 0.0004, + "step": 38178 + }, + { + "epoch": 0.74, + "learning_rate": 5.1931963807230786e-08, + "loss": 0.0005, + "step": 38179 + }, + { + "epoch": 0.74, + "learning_rate": 5.1928080462894644e-08, + "loss": 0.0005, + "step": 38180 + }, + { + "epoch": 0.74, + "learning_rate": 5.19241971185585e-08, + "loss": 0.0005, + "step": 38181 + }, + { + "epoch": 0.74, + "learning_rate": 5.192031377422236e-08, + "loss": 0.0009, + "step": 38182 + }, + { + "epoch": 0.74, + "learning_rate": 5.191643042988621e-08, + "loss": 0.0004, + "step": 38183 + }, + { + "epoch": 0.74, + "learning_rate": 5.191254708555007e-08, + "loss": 0.0003, + "step": 38184 + }, + { + "epoch": 0.74, + "learning_rate": 5.190866374121393e-08, + "loss": 0.0004, + "step": 38185 + }, + { + "epoch": 0.74, + "learning_rate": 5.190478039687779e-08, + "loss": 0.0004, + "step": 38186 + }, + { + "epoch": 0.74, + "learning_rate": 5.1900897052541645e-08, + "loss": 0.0063, + "step": 38187 + }, + { + "epoch": 0.74, + "learning_rate": 5.1897013708205503e-08, + "loss": 0.0689, + "step": 38188 + }, + { + "epoch": 0.74, + "learning_rate": 5.189313036386936e-08, + "loss": 0.3791, + "step": 38189 + }, + { + "epoch": 0.74, + "learning_rate": 5.188924701953322e-08, + "loss": 0.0005, + "step": 38190 + }, + { + "epoch": 0.74, + "learning_rate": 5.188536367519708e-08, + "loss": 0.0006, + "step": 38191 + }, + { + "epoch": 0.74, + "learning_rate": 5.1881480330860936e-08, + "loss": 0.0006, + "step": 38192 + }, + { + "epoch": 0.74, + "learning_rate": 5.1877596986524795e-08, + "loss": 0.0005, + "step": 38193 + }, + { + "epoch": 0.74, + "learning_rate": 5.187371364218865e-08, + "loss": 0.0003, + "step": 38194 + }, + { + "epoch": 0.74, + "learning_rate": 5.186983029785251e-08, + "loss": 0.0003, + "step": 38195 + }, + { + "epoch": 0.74, + "learning_rate": 5.186594695351637e-08, + "loss": 0.0004, + "step": 38196 + }, + { + "epoch": 0.74, + "learning_rate": 5.186206360918023e-08, + "loss": 0.0005, + "step": 38197 + }, + { + "epoch": 0.74, + "learning_rate": 5.1858180264844086e-08, + "loss": 0.1767, + "step": 38198 + }, + { + "epoch": 0.74, + "learning_rate": 5.185429692050793e-08, + "loss": 0.0007, + "step": 38199 + }, + { + "epoch": 0.74, + "learning_rate": 5.185041357617179e-08, + "loss": 0.0019, + "step": 38200 + }, + { + "epoch": 0.74, + "learning_rate": 5.184653023183565e-08, + "loss": 0.0003, + "step": 38201 + }, + { + "epoch": 0.74, + "learning_rate": 5.1842646887499506e-08, + "loss": 0.0004, + "step": 38202 + }, + { + "epoch": 0.74, + "learning_rate": 5.1838763543163364e-08, + "loss": 0.4725, + "step": 38203 + }, + { + "epoch": 0.74, + "learning_rate": 5.183488019882722e-08, + "loss": 0.0003, + "step": 38204 + }, + { + "epoch": 0.74, + "learning_rate": 5.183099685449108e-08, + "loss": 0.0004, + "step": 38205 + }, + { + "epoch": 0.74, + "learning_rate": 5.182711351015494e-08, + "loss": 0.0008, + "step": 38206 + }, + { + "epoch": 0.74, + "learning_rate": 5.18232301658188e-08, + "loss": 0.0008, + "step": 38207 + }, + { + "epoch": 0.74, + "learning_rate": 5.1819346821482655e-08, + "loss": 0.0004, + "step": 38208 + }, + { + "epoch": 0.74, + "learning_rate": 5.1815463477146513e-08, + "loss": 0.0004, + "step": 38209 + }, + { + "epoch": 0.74, + "learning_rate": 5.181158013281037e-08, + "loss": 0.0005, + "step": 38210 + }, + { + "epoch": 0.74, + "learning_rate": 5.180769678847423e-08, + "loss": 0.0008, + "step": 38211 + }, + { + "epoch": 0.74, + "learning_rate": 5.180381344413809e-08, + "loss": 0.0004, + "step": 38212 + }, + { + "epoch": 0.74, + "learning_rate": 5.1799930099801946e-08, + "loss": 0.0004, + "step": 38213 + }, + { + "epoch": 0.74, + "learning_rate": 5.1796046755465805e-08, + "loss": 0.0003, + "step": 38214 + }, + { + "epoch": 0.74, + "learning_rate": 5.179216341112966e-08, + "loss": 0.0005, + "step": 38215 + }, + { + "epoch": 0.74, + "learning_rate": 5.178828006679352e-08, + "loss": 0.0004, + "step": 38216 + }, + { + "epoch": 0.74, + "learning_rate": 5.178439672245738e-08, + "loss": 0.0009, + "step": 38217 + }, + { + "epoch": 0.74, + "learning_rate": 5.178051337812124e-08, + "loss": 0.0004, + "step": 38218 + }, + { + "epoch": 0.74, + "learning_rate": 5.1776630033785096e-08, + "loss": 0.0005, + "step": 38219 + }, + { + "epoch": 0.74, + "learning_rate": 5.1772746689448954e-08, + "loss": 0.0003, + "step": 38220 + }, + { + "epoch": 0.74, + "learning_rate": 5.176886334511281e-08, + "loss": 0.0004, + "step": 38221 + }, + { + "epoch": 0.74, + "learning_rate": 5.176498000077667e-08, + "loss": 0.0003, + "step": 38222 + }, + { + "epoch": 0.74, + "learning_rate": 5.176109665644053e-08, + "loss": 0.0004, + "step": 38223 + }, + { + "epoch": 0.74, + "learning_rate": 5.175721331210439e-08, + "loss": 0.0901, + "step": 38224 + }, + { + "epoch": 0.74, + "learning_rate": 5.1753329967768245e-08, + "loss": 0.0003, + "step": 38225 + }, + { + "epoch": 0.74, + "learning_rate": 5.1749446623432104e-08, + "loss": 2.0631, + "step": 38226 + }, + { + "epoch": 0.74, + "learning_rate": 5.174556327909596e-08, + "loss": 0.0007, + "step": 38227 + }, + { + "epoch": 0.74, + "learning_rate": 5.174167993475981e-08, + "loss": 0.0004, + "step": 38228 + }, + { + "epoch": 0.74, + "learning_rate": 5.1737796590423665e-08, + "loss": 0.0004, + "step": 38229 + }, + { + "epoch": 0.74, + "learning_rate": 5.173391324608752e-08, + "loss": 0.3526, + "step": 38230 + }, + { + "epoch": 0.74, + "learning_rate": 5.173002990175138e-08, + "loss": 0.0004, + "step": 38231 + }, + { + "epoch": 0.74, + "learning_rate": 5.172614655741524e-08, + "loss": 0.0003, + "step": 38232 + }, + { + "epoch": 0.74, + "learning_rate": 5.17222632130791e-08, + "loss": 0.0213, + "step": 38233 + }, + { + "epoch": 0.74, + "learning_rate": 5.1718379868742956e-08, + "loss": 0.0066, + "step": 38234 + }, + { + "epoch": 0.74, + "learning_rate": 5.1714496524406814e-08, + "loss": 0.0003, + "step": 38235 + }, + { + "epoch": 0.74, + "learning_rate": 5.171061318007067e-08, + "loss": 0.0007, + "step": 38236 + }, + { + "epoch": 0.74, + "learning_rate": 5.170672983573453e-08, + "loss": 0.0005, + "step": 38237 + }, + { + "epoch": 0.74, + "learning_rate": 5.170284649139839e-08, + "loss": 0.7666, + "step": 38238 + }, + { + "epoch": 0.74, + "learning_rate": 5.169896314706225e-08, + "loss": 0.0005, + "step": 38239 + }, + { + "epoch": 0.74, + "learning_rate": 5.1695079802726106e-08, + "loss": 0.0005, + "step": 38240 + }, + { + "epoch": 0.74, + "learning_rate": 5.1691196458389964e-08, + "loss": 0.0004, + "step": 38241 + }, + { + "epoch": 0.74, + "learning_rate": 5.168731311405382e-08, + "loss": 0.0004, + "step": 38242 + }, + { + "epoch": 0.74, + "learning_rate": 5.168342976971768e-08, + "loss": 0.0005, + "step": 38243 + }, + { + "epoch": 0.74, + "learning_rate": 5.167954642538154e-08, + "loss": 0.0007, + "step": 38244 + }, + { + "epoch": 0.74, + "learning_rate": 5.16756630810454e-08, + "loss": 0.0004, + "step": 38245 + }, + { + "epoch": 0.74, + "learning_rate": 5.1671779736709255e-08, + "loss": 0.0004, + "step": 38246 + }, + { + "epoch": 0.74, + "learning_rate": 5.1667896392373113e-08, + "loss": 0.0003, + "step": 38247 + }, + { + "epoch": 0.74, + "learning_rate": 5.166401304803697e-08, + "loss": 0.0003, + "step": 38248 + }, + { + "epoch": 0.74, + "learning_rate": 5.166012970370083e-08, + "loss": 0.0005, + "step": 38249 + }, + { + "epoch": 0.74, + "learning_rate": 5.165624635936469e-08, + "loss": 0.0004, + "step": 38250 + }, + { + "epoch": 0.74, + "learning_rate": 5.1652363015028546e-08, + "loss": 0.0007, + "step": 38251 + }, + { + "epoch": 0.74, + "learning_rate": 5.1648479670692405e-08, + "loss": 0.0004, + "step": 38252 + }, + { + "epoch": 0.74, + "learning_rate": 5.164459632635626e-08, + "loss": 0.0055, + "step": 38253 + }, + { + "epoch": 0.74, + "learning_rate": 5.164071298202012e-08, + "loss": 0.0003, + "step": 38254 + }, + { + "epoch": 0.74, + "learning_rate": 5.163682963768398e-08, + "loss": 0.0023, + "step": 38255 + }, + { + "epoch": 0.74, + "learning_rate": 5.163294629334784e-08, + "loss": 0.0003, + "step": 38256 + }, + { + "epoch": 0.74, + "learning_rate": 5.162906294901168e-08, + "loss": 0.0004, + "step": 38257 + }, + { + "epoch": 0.74, + "learning_rate": 5.162517960467554e-08, + "loss": 0.0003, + "step": 38258 + }, + { + "epoch": 0.74, + "learning_rate": 5.16212962603394e-08, + "loss": 0.0044, + "step": 38259 + }, + { + "epoch": 0.74, + "learning_rate": 5.161741291600326e-08, + "loss": 0.001, + "step": 38260 + }, + { + "epoch": 0.74, + "learning_rate": 5.1613529571667116e-08, + "loss": 0.0023, + "step": 38261 + }, + { + "epoch": 0.74, + "learning_rate": 5.1609646227330974e-08, + "loss": 0.0004, + "step": 38262 + }, + { + "epoch": 0.74, + "learning_rate": 5.160576288299483e-08, + "loss": 0.0004, + "step": 38263 + }, + { + "epoch": 0.74, + "learning_rate": 5.160187953865869e-08, + "loss": 0.0003, + "step": 38264 + }, + { + "epoch": 0.74, + "learning_rate": 5.159799619432255e-08, + "loss": 0.0004, + "step": 38265 + }, + { + "epoch": 0.74, + "learning_rate": 5.159411284998641e-08, + "loss": 0.0006, + "step": 38266 + }, + { + "epoch": 0.74, + "learning_rate": 5.1590229505650265e-08, + "loss": 1.0845, + "step": 38267 + }, + { + "epoch": 0.74, + "learning_rate": 5.158634616131412e-08, + "loss": 0.0009, + "step": 38268 + }, + { + "epoch": 0.74, + "learning_rate": 5.158246281697798e-08, + "loss": 0.0004, + "step": 38269 + }, + { + "epoch": 0.74, + "learning_rate": 5.157857947264184e-08, + "loss": 0.0004, + "step": 38270 + }, + { + "epoch": 0.74, + "learning_rate": 5.157469612830569e-08, + "loss": 0.6231, + "step": 38271 + }, + { + "epoch": 0.74, + "learning_rate": 5.157081278396955e-08, + "loss": 0.0003, + "step": 38272 + }, + { + "epoch": 0.74, + "learning_rate": 5.156692943963341e-08, + "loss": 0.3547, + "step": 38273 + }, + { + "epoch": 0.74, + "learning_rate": 5.1563046095297266e-08, + "loss": 0.0006, + "step": 38274 + }, + { + "epoch": 0.74, + "learning_rate": 5.1559162750961124e-08, + "loss": 0.0004, + "step": 38275 + }, + { + "epoch": 0.74, + "learning_rate": 5.155527940662498e-08, + "loss": 0.0004, + "step": 38276 + }, + { + "epoch": 0.74, + "learning_rate": 5.155139606228884e-08, + "loss": 0.0028, + "step": 38277 + }, + { + "epoch": 0.74, + "learning_rate": 5.15475127179527e-08, + "loss": 1.2955, + "step": 38278 + }, + { + "epoch": 0.74, + "learning_rate": 5.154362937361656e-08, + "loss": 0.0005, + "step": 38279 + }, + { + "epoch": 0.74, + "learning_rate": 5.1539746029280416e-08, + "loss": 0.0015, + "step": 38280 + }, + { + "epoch": 0.74, + "learning_rate": 5.1535862684944274e-08, + "loss": 0.0004, + "step": 38281 + }, + { + "epoch": 0.74, + "learning_rate": 5.153197934060813e-08, + "loss": 0.0004, + "step": 38282 + }, + { + "epoch": 0.74, + "learning_rate": 5.152809599627199e-08, + "loss": 0.0004, + "step": 38283 + }, + { + "epoch": 0.74, + "learning_rate": 5.152421265193585e-08, + "loss": 0.0006, + "step": 38284 + }, + { + "epoch": 0.74, + "learning_rate": 5.152032930759971e-08, + "loss": 0.0004, + "step": 38285 + }, + { + "epoch": 0.74, + "learning_rate": 5.151644596326355e-08, + "loss": 0.0004, + "step": 38286 + }, + { + "epoch": 0.74, + "learning_rate": 5.151256261892741e-08, + "loss": 0.0008, + "step": 38287 + }, + { + "epoch": 0.74, + "learning_rate": 5.150867927459127e-08, + "loss": 0.026, + "step": 38288 + }, + { + "epoch": 0.74, + "learning_rate": 5.1504795930255127e-08, + "loss": 0.0003, + "step": 38289 + }, + { + "epoch": 0.74, + "learning_rate": 5.1500912585918985e-08, + "loss": 0.0007, + "step": 38290 + }, + { + "epoch": 0.74, + "learning_rate": 5.149702924158284e-08, + "loss": 0.0009, + "step": 38291 + }, + { + "epoch": 0.74, + "learning_rate": 5.14931458972467e-08, + "loss": 0.0004, + "step": 38292 + }, + { + "epoch": 0.74, + "learning_rate": 5.148926255291056e-08, + "loss": 0.0006, + "step": 38293 + }, + { + "epoch": 0.74, + "learning_rate": 5.148537920857442e-08, + "loss": 0.1977, + "step": 38294 + }, + { + "epoch": 0.74, + "learning_rate": 5.1481495864238276e-08, + "loss": 0.0005, + "step": 38295 + }, + { + "epoch": 0.74, + "learning_rate": 5.1477612519902134e-08, + "loss": 0.0028, + "step": 38296 + }, + { + "epoch": 0.74, + "learning_rate": 5.147372917556599e-08, + "loss": 0.0004, + "step": 38297 + }, + { + "epoch": 0.74, + "learning_rate": 5.146984583122985e-08, + "loss": 0.0006, + "step": 38298 + }, + { + "epoch": 0.74, + "learning_rate": 5.146596248689371e-08, + "loss": 0.0003, + "step": 38299 + }, + { + "epoch": 0.74, + "learning_rate": 5.146207914255757e-08, + "loss": 0.0009, + "step": 38300 + }, + { + "epoch": 0.74, + "learning_rate": 5.1458195798221426e-08, + "loss": 0.0006, + "step": 38301 + }, + { + "epoch": 0.74, + "learning_rate": 5.1454312453885284e-08, + "loss": 0.1528, + "step": 38302 + }, + { + "epoch": 0.74, + "learning_rate": 5.145042910954914e-08, + "loss": 0.0012, + "step": 38303 + }, + { + "epoch": 0.74, + "learning_rate": 5.1446545765213e-08, + "loss": 0.0003, + "step": 38304 + }, + { + "epoch": 0.74, + "learning_rate": 5.144266242087686e-08, + "loss": 0.0004, + "step": 38305 + }, + { + "epoch": 0.74, + "learning_rate": 5.143877907654072e-08, + "loss": 0.0004, + "step": 38306 + }, + { + "epoch": 0.74, + "learning_rate": 5.1434895732204575e-08, + "loss": 0.0005, + "step": 38307 + }, + { + "epoch": 0.74, + "learning_rate": 5.143101238786843e-08, + "loss": 0.0435, + "step": 38308 + }, + { + "epoch": 0.74, + "learning_rate": 5.142712904353229e-08, + "loss": 0.0002, + "step": 38309 + }, + { + "epoch": 0.74, + "learning_rate": 5.142324569919615e-08, + "loss": 0.0004, + "step": 38310 + }, + { + "epoch": 0.74, + "learning_rate": 5.141936235486001e-08, + "loss": 0.0003, + "step": 38311 + }, + { + "epoch": 0.74, + "learning_rate": 5.1415479010523866e-08, + "loss": 0.0004, + "step": 38312 + }, + { + "epoch": 0.74, + "learning_rate": 5.1411595666187724e-08, + "loss": 0.0004, + "step": 38313 + }, + { + "epoch": 0.74, + "learning_rate": 5.140771232185158e-08, + "loss": 0.0004, + "step": 38314 + }, + { + "epoch": 0.74, + "learning_rate": 5.140382897751543e-08, + "loss": 0.0005, + "step": 38315 + }, + { + "epoch": 0.74, + "learning_rate": 5.1399945633179286e-08, + "loss": 0.0044, + "step": 38316 + }, + { + "epoch": 0.74, + "learning_rate": 5.1396062288843144e-08, + "loss": 0.0004, + "step": 38317 + }, + { + "epoch": 0.74, + "learning_rate": 5.1392178944507e-08, + "loss": 0.0011, + "step": 38318 + }, + { + "epoch": 0.74, + "learning_rate": 5.138829560017086e-08, + "loss": 0.0006, + "step": 38319 + }, + { + "epoch": 0.74, + "learning_rate": 5.138441225583472e-08, + "loss": 0.5943, + "step": 38320 + }, + { + "epoch": 0.74, + "learning_rate": 5.138052891149858e-08, + "loss": 0.0178, + "step": 38321 + }, + { + "epoch": 0.74, + "learning_rate": 5.1376645567162435e-08, + "loss": 0.0006, + "step": 38322 + }, + { + "epoch": 0.74, + "learning_rate": 5.1372762222826294e-08, + "loss": 1.4605, + "step": 38323 + }, + { + "epoch": 0.74, + "learning_rate": 5.136887887849015e-08, + "loss": 0.0002, + "step": 38324 + }, + { + "epoch": 0.74, + "learning_rate": 5.136499553415401e-08, + "loss": 0.0004, + "step": 38325 + }, + { + "epoch": 0.74, + "learning_rate": 5.136111218981787e-08, + "loss": 0.0004, + "step": 38326 + }, + { + "epoch": 0.74, + "learning_rate": 5.1357228845481727e-08, + "loss": 0.0005, + "step": 38327 + }, + { + "epoch": 0.74, + "learning_rate": 5.1353345501145585e-08, + "loss": 0.0004, + "step": 38328 + }, + { + "epoch": 0.74, + "learning_rate": 5.134946215680944e-08, + "loss": 0.0005, + "step": 38329 + }, + { + "epoch": 0.74, + "learning_rate": 5.13455788124733e-08, + "loss": 0.0004, + "step": 38330 + }, + { + "epoch": 0.74, + "learning_rate": 5.134169546813716e-08, + "loss": 0.0005, + "step": 38331 + }, + { + "epoch": 0.74, + "learning_rate": 5.133781212380102e-08, + "loss": 0.0005, + "step": 38332 + }, + { + "epoch": 0.74, + "learning_rate": 5.1333928779464876e-08, + "loss": 0.0005, + "step": 38333 + }, + { + "epoch": 0.74, + "learning_rate": 5.1330045435128734e-08, + "loss": 0.0006, + "step": 38334 + }, + { + "epoch": 0.74, + "learning_rate": 5.132616209079259e-08, + "loss": 0.0005, + "step": 38335 + }, + { + "epoch": 0.74, + "learning_rate": 5.132227874645645e-08, + "loss": 0.0005, + "step": 38336 + }, + { + "epoch": 0.74, + "learning_rate": 5.131839540212031e-08, + "loss": 0.0005, + "step": 38337 + }, + { + "epoch": 0.74, + "learning_rate": 5.131451205778417e-08, + "loss": 0.0004, + "step": 38338 + }, + { + "epoch": 0.74, + "learning_rate": 5.1310628713448026e-08, + "loss": 0.0003, + "step": 38339 + }, + { + "epoch": 0.74, + "learning_rate": 5.1306745369111884e-08, + "loss": 0.0006, + "step": 38340 + }, + { + "epoch": 0.74, + "learning_rate": 5.130286202477574e-08, + "loss": 0.0006, + "step": 38341 + }, + { + "epoch": 0.74, + "learning_rate": 5.12989786804396e-08, + "loss": 0.0004, + "step": 38342 + }, + { + "epoch": 0.74, + "learning_rate": 5.129509533610346e-08, + "loss": 0.0007, + "step": 38343 + }, + { + "epoch": 0.74, + "learning_rate": 5.1291211991767304e-08, + "loss": 0.0003, + "step": 38344 + }, + { + "epoch": 0.74, + "learning_rate": 5.128732864743116e-08, + "loss": 0.0016, + "step": 38345 + }, + { + "epoch": 0.74, + "learning_rate": 5.128344530309502e-08, + "loss": 0.0004, + "step": 38346 + }, + { + "epoch": 0.74, + "learning_rate": 5.127956195875888e-08, + "loss": 0.0004, + "step": 38347 + }, + { + "epoch": 0.74, + "learning_rate": 5.1275678614422737e-08, + "loss": 0.0005, + "step": 38348 + }, + { + "epoch": 0.74, + "learning_rate": 5.1271795270086595e-08, + "loss": 0.0006, + "step": 38349 + }, + { + "epoch": 0.74, + "learning_rate": 5.126791192575045e-08, + "loss": 0.0005, + "step": 38350 + }, + { + "epoch": 0.74, + "learning_rate": 5.126402858141431e-08, + "loss": 0.0005, + "step": 38351 + }, + { + "epoch": 0.74, + "learning_rate": 5.126014523707817e-08, + "loss": 0.0004, + "step": 38352 + }, + { + "epoch": 0.74, + "learning_rate": 5.125626189274203e-08, + "loss": 0.9332, + "step": 38353 + }, + { + "epoch": 0.74, + "learning_rate": 5.1252378548405886e-08, + "loss": 0.0057, + "step": 38354 + }, + { + "epoch": 0.74, + "learning_rate": 5.1248495204069744e-08, + "loss": 0.0006, + "step": 38355 + }, + { + "epoch": 0.74, + "learning_rate": 5.12446118597336e-08, + "loss": 0.6384, + "step": 38356 + }, + { + "epoch": 0.74, + "learning_rate": 5.124072851539746e-08, + "loss": 0.0003, + "step": 38357 + }, + { + "epoch": 0.74, + "learning_rate": 5.123684517106132e-08, + "loss": 0.0004, + "step": 38358 + }, + { + "epoch": 0.74, + "learning_rate": 5.123296182672518e-08, + "loss": 0.0013, + "step": 38359 + }, + { + "epoch": 0.74, + "learning_rate": 5.122907848238903e-08, + "loss": 0.0003, + "step": 38360 + }, + { + "epoch": 0.74, + "learning_rate": 5.122519513805289e-08, + "loss": 0.0003, + "step": 38361 + }, + { + "epoch": 0.74, + "learning_rate": 5.1221311793716745e-08, + "loss": 0.2777, + "step": 38362 + }, + { + "epoch": 0.74, + "learning_rate": 5.1217428449380604e-08, + "loss": 0.0004, + "step": 38363 + }, + { + "epoch": 0.74, + "learning_rate": 5.121354510504446e-08, + "loss": 0.0003, + "step": 38364 + }, + { + "epoch": 0.74, + "learning_rate": 5.120966176070832e-08, + "loss": 0.0005, + "step": 38365 + }, + { + "epoch": 0.74, + "learning_rate": 5.120577841637218e-08, + "loss": 0.0005, + "step": 38366 + }, + { + "epoch": 0.74, + "learning_rate": 5.1201895072036037e-08, + "loss": 0.8775, + "step": 38367 + }, + { + "epoch": 0.74, + "learning_rate": 5.1198011727699895e-08, + "loss": 0.0005, + "step": 38368 + }, + { + "epoch": 0.74, + "learning_rate": 5.119412838336375e-08, + "loss": 0.0006, + "step": 38369 + }, + { + "epoch": 0.74, + "learning_rate": 5.119024503902761e-08, + "loss": 0.0006, + "step": 38370 + }, + { + "epoch": 0.74, + "learning_rate": 5.118636169469147e-08, + "loss": 0.0293, + "step": 38371 + }, + { + "epoch": 0.74, + "learning_rate": 5.118247835035533e-08, + "loss": 0.0004, + "step": 38372 + }, + { + "epoch": 0.74, + "learning_rate": 5.117859500601918e-08, + "loss": 0.0004, + "step": 38373 + }, + { + "epoch": 0.74, + "learning_rate": 5.117471166168303e-08, + "loss": 0.0951, + "step": 38374 + }, + { + "epoch": 0.74, + "learning_rate": 5.117082831734689e-08, + "loss": 0.3156, + "step": 38375 + }, + { + "epoch": 0.74, + "learning_rate": 5.116694497301075e-08, + "loss": 0.0007, + "step": 38376 + }, + { + "epoch": 0.74, + "learning_rate": 5.1163061628674606e-08, + "loss": 0.775, + "step": 38377 + }, + { + "epoch": 0.74, + "learning_rate": 5.1159178284338464e-08, + "loss": 0.0144, + "step": 38378 + }, + { + "epoch": 0.74, + "learning_rate": 5.115529494000232e-08, + "loss": 0.0004, + "step": 38379 + }, + { + "epoch": 0.74, + "learning_rate": 5.115141159566618e-08, + "loss": 0.6018, + "step": 38380 + }, + { + "epoch": 0.74, + "learning_rate": 5.114752825133004e-08, + "loss": 0.0006, + "step": 38381 + }, + { + "epoch": 0.74, + "learning_rate": 5.11436449069939e-08, + "loss": 0.0004, + "step": 38382 + }, + { + "epoch": 0.74, + "learning_rate": 5.1139761562657755e-08, + "loss": 0.0005, + "step": 38383 + }, + { + "epoch": 0.74, + "learning_rate": 5.1135878218321613e-08, + "loss": 0.0003, + "step": 38384 + }, + { + "epoch": 0.74, + "learning_rate": 5.113199487398547e-08, + "loss": 0.0007, + "step": 38385 + }, + { + "epoch": 0.74, + "learning_rate": 5.112811152964933e-08, + "loss": 0.0005, + "step": 38386 + }, + { + "epoch": 0.74, + "learning_rate": 5.112422818531319e-08, + "loss": 0.001, + "step": 38387 + }, + { + "epoch": 0.74, + "learning_rate": 5.1120344840977046e-08, + "loss": 0.0004, + "step": 38388 + }, + { + "epoch": 0.74, + "learning_rate": 5.1116461496640905e-08, + "loss": 0.0004, + "step": 38389 + }, + { + "epoch": 0.74, + "learning_rate": 5.111257815230476e-08, + "loss": 0.2336, + "step": 38390 + }, + { + "epoch": 0.74, + "learning_rate": 5.110869480796862e-08, + "loss": 0.0004, + "step": 38391 + }, + { + "epoch": 0.74, + "learning_rate": 5.110481146363248e-08, + "loss": 0.0028, + "step": 38392 + }, + { + "epoch": 0.74, + "learning_rate": 5.110092811929634e-08, + "loss": 0.0005, + "step": 38393 + }, + { + "epoch": 0.74, + "learning_rate": 5.1097044774960196e-08, + "loss": 0.6553, + "step": 38394 + }, + { + "epoch": 0.74, + "learning_rate": 5.1093161430624054e-08, + "loss": 0.1222, + "step": 38395 + }, + { + "epoch": 0.74, + "learning_rate": 5.108927808628791e-08, + "loss": 0.0004, + "step": 38396 + }, + { + "epoch": 0.74, + "learning_rate": 5.108539474195177e-08, + "loss": 0.0004, + "step": 38397 + }, + { + "epoch": 0.74, + "learning_rate": 5.108151139761563e-08, + "loss": 0.8955, + "step": 38398 + }, + { + "epoch": 0.74, + "learning_rate": 5.107762805327949e-08, + "loss": 0.0004, + "step": 38399 + }, + { + "epoch": 0.74, + "learning_rate": 5.1073744708943345e-08, + "loss": 0.0004, + "step": 38400 + }, + { + "epoch": 0.74, + "learning_rate": 5.1069861364607204e-08, + "loss": 0.5266, + "step": 38401 + }, + { + "epoch": 0.74, + "learning_rate": 5.106597802027105e-08, + "loss": 0.0372, + "step": 38402 + }, + { + "epoch": 0.74, + "learning_rate": 5.106209467593491e-08, + "loss": 0.0005, + "step": 38403 + }, + { + "epoch": 0.74, + "learning_rate": 5.1058211331598765e-08, + "loss": 0.0012, + "step": 38404 + }, + { + "epoch": 0.74, + "learning_rate": 5.1054327987262623e-08, + "loss": 0.0005, + "step": 38405 + }, + { + "epoch": 0.74, + "learning_rate": 5.105044464292648e-08, + "loss": 0.0004, + "step": 38406 + }, + { + "epoch": 0.75, + "learning_rate": 5.104656129859034e-08, + "loss": 0.0005, + "step": 38407 + }, + { + "epoch": 0.75, + "learning_rate": 5.10426779542542e-08, + "loss": 0.0004, + "step": 38408 + }, + { + "epoch": 0.75, + "learning_rate": 5.1038794609918056e-08, + "loss": 0.0003, + "step": 38409 + }, + { + "epoch": 0.75, + "learning_rate": 5.1034911265581915e-08, + "loss": 0.0006, + "step": 38410 + }, + { + "epoch": 0.75, + "learning_rate": 5.103102792124577e-08, + "loss": 0.0003, + "step": 38411 + }, + { + "epoch": 0.75, + "learning_rate": 5.102714457690963e-08, + "loss": 0.0005, + "step": 38412 + }, + { + "epoch": 0.75, + "learning_rate": 5.102326123257349e-08, + "loss": 0.001, + "step": 38413 + }, + { + "epoch": 0.75, + "learning_rate": 5.101937788823735e-08, + "loss": 0.0003, + "step": 38414 + }, + { + "epoch": 0.75, + "learning_rate": 5.1015494543901206e-08, + "loss": 0.0004, + "step": 38415 + }, + { + "epoch": 0.75, + "learning_rate": 5.1011611199565064e-08, + "loss": 1.2927, + "step": 38416 + }, + { + "epoch": 0.75, + "learning_rate": 5.100772785522892e-08, + "loss": 0.0003, + "step": 38417 + }, + { + "epoch": 0.75, + "learning_rate": 5.100384451089278e-08, + "loss": 0.0003, + "step": 38418 + }, + { + "epoch": 0.75, + "learning_rate": 5.099996116655664e-08, + "loss": 0.0004, + "step": 38419 + }, + { + "epoch": 0.75, + "learning_rate": 5.09960778222205e-08, + "loss": 0.0004, + "step": 38420 + }, + { + "epoch": 0.75, + "learning_rate": 5.0992194477884355e-08, + "loss": 1.1788, + "step": 38421 + }, + { + "epoch": 0.75, + "learning_rate": 5.0988311133548214e-08, + "loss": 0.0006, + "step": 38422 + }, + { + "epoch": 0.75, + "learning_rate": 5.098442778921207e-08, + "loss": 0.0006, + "step": 38423 + }, + { + "epoch": 0.75, + "learning_rate": 5.098054444487593e-08, + "loss": 0.0003, + "step": 38424 + }, + { + "epoch": 0.75, + "learning_rate": 5.097666110053979e-08, + "loss": 0.1023, + "step": 38425 + }, + { + "epoch": 0.75, + "learning_rate": 5.0972777756203646e-08, + "loss": 0.0004, + "step": 38426 + }, + { + "epoch": 0.75, + "learning_rate": 5.0968894411867505e-08, + "loss": 0.0003, + "step": 38427 + }, + { + "epoch": 0.75, + "learning_rate": 5.096501106753136e-08, + "loss": 0.0003, + "step": 38428 + }, + { + "epoch": 0.75, + "learning_rate": 5.096112772319522e-08, + "loss": 0.0004, + "step": 38429 + }, + { + "epoch": 0.75, + "learning_rate": 5.095724437885908e-08, + "loss": 0.0006, + "step": 38430 + }, + { + "epoch": 0.75, + "learning_rate": 5.0953361034522924e-08, + "loss": 0.0004, + "step": 38431 + }, + { + "epoch": 0.75, + "learning_rate": 5.094947769018678e-08, + "loss": 0.0006, + "step": 38432 + }, + { + "epoch": 0.75, + "learning_rate": 5.094559434585064e-08, + "loss": 0.0005, + "step": 38433 + }, + { + "epoch": 0.75, + "learning_rate": 5.09417110015145e-08, + "loss": 0.0004, + "step": 38434 + }, + { + "epoch": 0.75, + "learning_rate": 5.093782765717836e-08, + "loss": 0.0003, + "step": 38435 + }, + { + "epoch": 0.75, + "learning_rate": 5.0933944312842216e-08, + "loss": 0.0003, + "step": 38436 + }, + { + "epoch": 0.75, + "learning_rate": 5.0930060968506074e-08, + "loss": 0.0005, + "step": 38437 + }, + { + "epoch": 0.75, + "learning_rate": 5.092617762416993e-08, + "loss": 0.0009, + "step": 38438 + }, + { + "epoch": 0.75, + "learning_rate": 5.092229427983379e-08, + "loss": 0.0005, + "step": 38439 + }, + { + "epoch": 0.75, + "learning_rate": 5.091841093549765e-08, + "loss": 0.0004, + "step": 38440 + }, + { + "epoch": 0.75, + "learning_rate": 5.091452759116151e-08, + "loss": 0.4281, + "step": 38441 + }, + { + "epoch": 0.75, + "learning_rate": 5.0910644246825365e-08, + "loss": 0.0004, + "step": 38442 + }, + { + "epoch": 0.75, + "learning_rate": 5.0906760902489223e-08, + "loss": 0.0005, + "step": 38443 + }, + { + "epoch": 0.75, + "learning_rate": 5.090287755815308e-08, + "loss": 0.0006, + "step": 38444 + }, + { + "epoch": 0.75, + "learning_rate": 5.089899421381694e-08, + "loss": 0.0006, + "step": 38445 + }, + { + "epoch": 0.75, + "learning_rate": 5.08951108694808e-08, + "loss": 0.0005, + "step": 38446 + }, + { + "epoch": 0.75, + "learning_rate": 5.0891227525144656e-08, + "loss": 0.0004, + "step": 38447 + }, + { + "epoch": 0.75, + "learning_rate": 5.088734418080851e-08, + "loss": 0.0005, + "step": 38448 + }, + { + "epoch": 0.75, + "learning_rate": 5.0883460836472366e-08, + "loss": 0.0018, + "step": 38449 + }, + { + "epoch": 0.75, + "learning_rate": 5.0879577492136225e-08, + "loss": 0.6179, + "step": 38450 + }, + { + "epoch": 0.75, + "learning_rate": 5.087569414780008e-08, + "loss": 0.0004, + "step": 38451 + }, + { + "epoch": 0.75, + "learning_rate": 5.087181080346394e-08, + "loss": 0.0004, + "step": 38452 + }, + { + "epoch": 0.75, + "learning_rate": 5.08679274591278e-08, + "loss": 0.0005, + "step": 38453 + }, + { + "epoch": 0.75, + "learning_rate": 5.086404411479166e-08, + "loss": 0.0005, + "step": 38454 + }, + { + "epoch": 0.75, + "learning_rate": 5.0860160770455516e-08, + "loss": 0.0004, + "step": 38455 + }, + { + "epoch": 0.75, + "learning_rate": 5.0856277426119374e-08, + "loss": 0.0005, + "step": 38456 + }, + { + "epoch": 0.75, + "learning_rate": 5.085239408178323e-08, + "loss": 0.0003, + "step": 38457 + }, + { + "epoch": 0.75, + "learning_rate": 5.084851073744709e-08, + "loss": 0.0004, + "step": 38458 + }, + { + "epoch": 0.75, + "learning_rate": 5.084462739311095e-08, + "loss": 0.0004, + "step": 38459 + }, + { + "epoch": 0.75, + "learning_rate": 5.08407440487748e-08, + "loss": 0.071, + "step": 38460 + }, + { + "epoch": 0.75, + "learning_rate": 5.083686070443866e-08, + "loss": 0.0003, + "step": 38461 + }, + { + "epoch": 0.75, + "learning_rate": 5.083297736010252e-08, + "loss": 0.0003, + "step": 38462 + }, + { + "epoch": 0.75, + "learning_rate": 5.082909401576637e-08, + "loss": 0.0008, + "step": 38463 + }, + { + "epoch": 0.75, + "learning_rate": 5.082521067143023e-08, + "loss": 0.0005, + "step": 38464 + }, + { + "epoch": 0.75, + "learning_rate": 5.0821327327094085e-08, + "loss": 0.0003, + "step": 38465 + }, + { + "epoch": 0.75, + "learning_rate": 5.081744398275794e-08, + "loss": 0.0003, + "step": 38466 + }, + { + "epoch": 0.75, + "learning_rate": 5.08135606384218e-08, + "loss": 0.0004, + "step": 38467 + }, + { + "epoch": 0.75, + "learning_rate": 5.080967729408566e-08, + "loss": 0.0004, + "step": 38468 + }, + { + "epoch": 0.75, + "learning_rate": 5.080579394974952e-08, + "loss": 0.0006, + "step": 38469 + }, + { + "epoch": 0.75, + "learning_rate": 5.0801910605413376e-08, + "loss": 0.0005, + "step": 38470 + }, + { + "epoch": 0.75, + "learning_rate": 5.0798027261077234e-08, + "loss": 0.0004, + "step": 38471 + }, + { + "epoch": 0.75, + "learning_rate": 5.079414391674109e-08, + "loss": 0.0003, + "step": 38472 + }, + { + "epoch": 0.75, + "learning_rate": 5.079026057240495e-08, + "loss": 0.0542, + "step": 38473 + }, + { + "epoch": 0.75, + "learning_rate": 5.078637722806881e-08, + "loss": 0.0005, + "step": 38474 + }, + { + "epoch": 0.75, + "learning_rate": 5.078249388373267e-08, + "loss": 0.0005, + "step": 38475 + }, + { + "epoch": 0.75, + "learning_rate": 5.0778610539396526e-08, + "loss": 0.0004, + "step": 38476 + }, + { + "epoch": 0.75, + "learning_rate": 5.0774727195060384e-08, + "loss": 0.0523, + "step": 38477 + }, + { + "epoch": 0.75, + "learning_rate": 5.077084385072424e-08, + "loss": 0.3848, + "step": 38478 + }, + { + "epoch": 0.75, + "learning_rate": 5.07669605063881e-08, + "loss": 0.0003, + "step": 38479 + }, + { + "epoch": 0.75, + "learning_rate": 5.076307716205196e-08, + "loss": 0.0004, + "step": 38480 + }, + { + "epoch": 0.75, + "learning_rate": 5.075919381771582e-08, + "loss": 0.0005, + "step": 38481 + }, + { + "epoch": 0.75, + "learning_rate": 5.0755310473379675e-08, + "loss": 0.0005, + "step": 38482 + }, + { + "epoch": 0.75, + "learning_rate": 5.0751427129043533e-08, + "loss": 0.001, + "step": 38483 + }, + { + "epoch": 0.75, + "learning_rate": 5.074754378470739e-08, + "loss": 0.0006, + "step": 38484 + }, + { + "epoch": 0.75, + "learning_rate": 5.074366044037125e-08, + "loss": 0.0006, + "step": 38485 + }, + { + "epoch": 0.75, + "learning_rate": 5.073977709603511e-08, + "loss": 0.0003, + "step": 38486 + }, + { + "epoch": 0.75, + "learning_rate": 5.0735893751698966e-08, + "loss": 0.0009, + "step": 38487 + }, + { + "epoch": 0.75, + "learning_rate": 5.0732010407362825e-08, + "loss": 0.0583, + "step": 38488 + }, + { + "epoch": 0.75, + "learning_rate": 5.072812706302667e-08, + "loss": 0.0707, + "step": 38489 + }, + { + "epoch": 0.75, + "learning_rate": 5.072424371869053e-08, + "loss": 0.0005, + "step": 38490 + }, + { + "epoch": 0.75, + "learning_rate": 5.0720360374354386e-08, + "loss": 0.8553, + "step": 38491 + }, + { + "epoch": 0.75, + "learning_rate": 5.0716477030018244e-08, + "loss": 0.0003, + "step": 38492 + }, + { + "epoch": 0.75, + "learning_rate": 5.07125936856821e-08, + "loss": 0.0005, + "step": 38493 + }, + { + "epoch": 0.75, + "learning_rate": 5.070871034134596e-08, + "loss": 0.0054, + "step": 38494 + }, + { + "epoch": 0.75, + "learning_rate": 5.070482699700982e-08, + "loss": 0.0005, + "step": 38495 + }, + { + "epoch": 0.75, + "learning_rate": 5.070094365267368e-08, + "loss": 0.0004, + "step": 38496 + }, + { + "epoch": 0.75, + "learning_rate": 5.0697060308337536e-08, + "loss": 0.0006, + "step": 38497 + }, + { + "epoch": 0.75, + "learning_rate": 5.0693176964001394e-08, + "loss": 0.0004, + "step": 38498 + }, + { + "epoch": 0.75, + "learning_rate": 5.068929361966525e-08, + "loss": 0.0066, + "step": 38499 + }, + { + "epoch": 0.75, + "learning_rate": 5.068541027532911e-08, + "loss": 0.0006, + "step": 38500 + }, + { + "epoch": 0.75, + "learning_rate": 5.068152693099297e-08, + "loss": 0.0004, + "step": 38501 + }, + { + "epoch": 0.75, + "learning_rate": 5.067764358665683e-08, + "loss": 0.0003, + "step": 38502 + }, + { + "epoch": 0.75, + "learning_rate": 5.0673760242320685e-08, + "loss": 0.0014, + "step": 38503 + }, + { + "epoch": 0.75, + "learning_rate": 5.066987689798454e-08, + "loss": 0.0003, + "step": 38504 + }, + { + "epoch": 0.75, + "learning_rate": 5.06659935536484e-08, + "loss": 0.0007, + "step": 38505 + }, + { + "epoch": 0.75, + "learning_rate": 5.066211020931226e-08, + "loss": 0.0004, + "step": 38506 + }, + { + "epoch": 0.75, + "learning_rate": 5.065822686497612e-08, + "loss": 0.003, + "step": 38507 + }, + { + "epoch": 0.75, + "learning_rate": 5.0654343520639976e-08, + "loss": 0.0005, + "step": 38508 + }, + { + "epoch": 0.75, + "learning_rate": 5.0650460176303834e-08, + "loss": 1.1974, + "step": 38509 + }, + { + "epoch": 0.75, + "learning_rate": 5.064657683196769e-08, + "loss": 0.0003, + "step": 38510 + }, + { + "epoch": 0.75, + "learning_rate": 5.064269348763155e-08, + "loss": 0.0006, + "step": 38511 + }, + { + "epoch": 0.75, + "learning_rate": 5.063881014329541e-08, + "loss": 0.0634, + "step": 38512 + }, + { + "epoch": 0.75, + "learning_rate": 5.063492679895927e-08, + "loss": 0.0008, + "step": 38513 + }, + { + "epoch": 0.75, + "learning_rate": 5.0631043454623126e-08, + "loss": 0.0005, + "step": 38514 + }, + { + "epoch": 0.75, + "learning_rate": 5.0627160110286984e-08, + "loss": 0.0003, + "step": 38515 + }, + { + "epoch": 0.75, + "learning_rate": 5.062327676595084e-08, + "loss": 0.0004, + "step": 38516 + }, + { + "epoch": 0.75, + "learning_rate": 5.06193934216147e-08, + "loss": 0.0003, + "step": 38517 + }, + { + "epoch": 0.75, + "learning_rate": 5.0615510077278545e-08, + "loss": 0.0004, + "step": 38518 + }, + { + "epoch": 0.75, + "learning_rate": 5.0611626732942404e-08, + "loss": 0.0006, + "step": 38519 + }, + { + "epoch": 0.75, + "learning_rate": 5.060774338860626e-08, + "loss": 0.0008, + "step": 38520 + }, + { + "epoch": 0.75, + "learning_rate": 5.060386004427012e-08, + "loss": 0.0004, + "step": 38521 + }, + { + "epoch": 0.75, + "learning_rate": 5.059997669993398e-08, + "loss": 0.0004, + "step": 38522 + }, + { + "epoch": 0.75, + "learning_rate": 5.0596093355597837e-08, + "loss": 0.0003, + "step": 38523 + }, + { + "epoch": 0.75, + "learning_rate": 5.0592210011261695e-08, + "loss": 0.0006, + "step": 38524 + }, + { + "epoch": 0.75, + "learning_rate": 5.058832666692555e-08, + "loss": 0.0006, + "step": 38525 + }, + { + "epoch": 0.75, + "learning_rate": 5.058444332258941e-08, + "loss": 0.0005, + "step": 38526 + }, + { + "epoch": 0.75, + "learning_rate": 5.058055997825327e-08, + "loss": 0.0004, + "step": 38527 + }, + { + "epoch": 0.75, + "learning_rate": 5.057667663391713e-08, + "loss": 0.0004, + "step": 38528 + }, + { + "epoch": 0.75, + "learning_rate": 5.0572793289580986e-08, + "loss": 0.2313, + "step": 38529 + }, + { + "epoch": 0.75, + "learning_rate": 5.0568909945244844e-08, + "loss": 0.0004, + "step": 38530 + }, + { + "epoch": 0.75, + "learning_rate": 5.05650266009087e-08, + "loss": 0.0005, + "step": 38531 + }, + { + "epoch": 0.75, + "learning_rate": 5.056114325657256e-08, + "loss": 0.0005, + "step": 38532 + }, + { + "epoch": 0.75, + "learning_rate": 5.055725991223642e-08, + "loss": 0.0006, + "step": 38533 + }, + { + "epoch": 0.75, + "learning_rate": 5.055337656790028e-08, + "loss": 0.0005, + "step": 38534 + }, + { + "epoch": 0.75, + "learning_rate": 5.0549493223564136e-08, + "loss": 0.0005, + "step": 38535 + }, + { + "epoch": 0.75, + "learning_rate": 5.0545609879227994e-08, + "loss": 0.0004, + "step": 38536 + }, + { + "epoch": 0.75, + "learning_rate": 5.0541726534891845e-08, + "loss": 0.0004, + "step": 38537 + }, + { + "epoch": 0.75, + "learning_rate": 5.0537843190555704e-08, + "loss": 0.0003, + "step": 38538 + }, + { + "epoch": 0.75, + "learning_rate": 5.053395984621956e-08, + "loss": 0.0035, + "step": 38539 + }, + { + "epoch": 0.75, + "learning_rate": 5.053007650188342e-08, + "loss": 1.2804, + "step": 38540 + }, + { + "epoch": 0.75, + "learning_rate": 5.052619315754728e-08, + "loss": 0.0005, + "step": 38541 + }, + { + "epoch": 0.75, + "learning_rate": 5.0522309813211137e-08, + "loss": 0.0007, + "step": 38542 + }, + { + "epoch": 0.75, + "learning_rate": 5.0518426468874995e-08, + "loss": 0.0004, + "step": 38543 + }, + { + "epoch": 0.75, + "learning_rate": 5.051454312453885e-08, + "loss": 0.0008, + "step": 38544 + }, + { + "epoch": 0.75, + "learning_rate": 5.051065978020271e-08, + "loss": 0.0004, + "step": 38545 + }, + { + "epoch": 0.75, + "learning_rate": 5.050677643586657e-08, + "loss": 0.0006, + "step": 38546 + }, + { + "epoch": 0.75, + "learning_rate": 5.050289309153042e-08, + "loss": 0.0004, + "step": 38547 + }, + { + "epoch": 0.75, + "learning_rate": 5.049900974719428e-08, + "loss": 0.0004, + "step": 38548 + }, + { + "epoch": 0.75, + "learning_rate": 5.049512640285814e-08, + "loss": 0.0004, + "step": 38549 + }, + { + "epoch": 0.75, + "learning_rate": 5.0491243058521996e-08, + "loss": 0.4383, + "step": 38550 + }, + { + "epoch": 0.75, + "learning_rate": 5.048735971418585e-08, + "loss": 1.069, + "step": 38551 + }, + { + "epoch": 0.75, + "learning_rate": 5.0483476369849706e-08, + "loss": 0.0037, + "step": 38552 + }, + { + "epoch": 0.75, + "learning_rate": 5.0479593025513564e-08, + "loss": 0.0005, + "step": 38553 + }, + { + "epoch": 0.75, + "learning_rate": 5.047570968117742e-08, + "loss": 0.0007, + "step": 38554 + }, + { + "epoch": 0.75, + "learning_rate": 5.047182633684128e-08, + "loss": 0.0017, + "step": 38555 + }, + { + "epoch": 0.75, + "learning_rate": 5.046794299250514e-08, + "loss": 0.0007, + "step": 38556 + }, + { + "epoch": 0.75, + "learning_rate": 5.0464059648169e-08, + "loss": 0.0005, + "step": 38557 + }, + { + "epoch": 0.75, + "learning_rate": 5.0460176303832855e-08, + "loss": 1.05, + "step": 38558 + }, + { + "epoch": 0.75, + "learning_rate": 5.0456292959496714e-08, + "loss": 0.0003, + "step": 38559 + }, + { + "epoch": 0.75, + "learning_rate": 5.045240961516057e-08, + "loss": 0.0005, + "step": 38560 + }, + { + "epoch": 0.75, + "learning_rate": 5.044852627082443e-08, + "loss": 0.0257, + "step": 38561 + }, + { + "epoch": 0.75, + "learning_rate": 5.044464292648829e-08, + "loss": 0.0015, + "step": 38562 + }, + { + "epoch": 0.75, + "learning_rate": 5.0440759582152147e-08, + "loss": 0.0004, + "step": 38563 + }, + { + "epoch": 0.75, + "learning_rate": 5.0436876237816005e-08, + "loss": 0.006, + "step": 38564 + }, + { + "epoch": 0.75, + "learning_rate": 5.043299289347986e-08, + "loss": 0.0003, + "step": 38565 + }, + { + "epoch": 0.75, + "learning_rate": 5.042910954914372e-08, + "loss": 0.0005, + "step": 38566 + }, + { + "epoch": 0.75, + "learning_rate": 5.042522620480758e-08, + "loss": 0.0011, + "step": 38567 + }, + { + "epoch": 0.75, + "learning_rate": 5.042134286047144e-08, + "loss": 0.0017, + "step": 38568 + }, + { + "epoch": 0.75, + "learning_rate": 5.0417459516135296e-08, + "loss": 0.0007, + "step": 38569 + }, + { + "epoch": 0.75, + "learning_rate": 5.0413576171799154e-08, + "loss": 0.0005, + "step": 38570 + }, + { + "epoch": 0.75, + "learning_rate": 5.040969282746301e-08, + "loss": 0.0006, + "step": 38571 + }, + { + "epoch": 0.75, + "learning_rate": 5.040580948312687e-08, + "loss": 0.0004, + "step": 38572 + }, + { + "epoch": 0.75, + "learning_rate": 5.040192613879073e-08, + "loss": 0.0005, + "step": 38573 + }, + { + "epoch": 0.75, + "learning_rate": 5.039804279445459e-08, + "loss": 0.018, + "step": 38574 + }, + { + "epoch": 0.75, + "learning_rate": 5.0394159450118445e-08, + "loss": 0.0006, + "step": 38575 + }, + { + "epoch": 0.75, + "learning_rate": 5.039027610578229e-08, + "loss": 1.1989, + "step": 38576 + }, + { + "epoch": 0.75, + "learning_rate": 5.038639276144615e-08, + "loss": 0.0004, + "step": 38577 + }, + { + "epoch": 0.75, + "learning_rate": 5.038250941711001e-08, + "loss": 0.0003, + "step": 38578 + }, + { + "epoch": 0.75, + "learning_rate": 5.0378626072773865e-08, + "loss": 0.0008, + "step": 38579 + }, + { + "epoch": 0.75, + "learning_rate": 5.0374742728437723e-08, + "loss": 0.0004, + "step": 38580 + }, + { + "epoch": 0.75, + "learning_rate": 5.037085938410158e-08, + "loss": 0.0005, + "step": 38581 + }, + { + "epoch": 0.75, + "learning_rate": 5.036697603976544e-08, + "loss": 0.0003, + "step": 38582 + }, + { + "epoch": 0.75, + "learning_rate": 5.03630926954293e-08, + "loss": 0.0005, + "step": 38583 + }, + { + "epoch": 0.75, + "learning_rate": 5.0359209351093156e-08, + "loss": 0.0021, + "step": 38584 + }, + { + "epoch": 0.75, + "learning_rate": 5.0355326006757015e-08, + "loss": 0.0007, + "step": 38585 + }, + { + "epoch": 0.75, + "learning_rate": 5.035144266242087e-08, + "loss": 0.0006, + "step": 38586 + }, + { + "epoch": 0.75, + "learning_rate": 5.034755931808473e-08, + "loss": 0.0004, + "step": 38587 + }, + { + "epoch": 0.75, + "learning_rate": 5.034367597374859e-08, + "loss": 1.8332, + "step": 38588 + }, + { + "epoch": 0.75, + "learning_rate": 5.033979262941245e-08, + "loss": 0.7605, + "step": 38589 + }, + { + "epoch": 0.75, + "learning_rate": 5.0335909285076306e-08, + "loss": 0.0005, + "step": 38590 + }, + { + "epoch": 0.75, + "learning_rate": 5.0332025940740164e-08, + "loss": 0.0004, + "step": 38591 + }, + { + "epoch": 0.75, + "learning_rate": 5.032814259640402e-08, + "loss": 0.0004, + "step": 38592 + }, + { + "epoch": 0.75, + "learning_rate": 5.032425925206788e-08, + "loss": 0.0004, + "step": 38593 + }, + { + "epoch": 0.75, + "learning_rate": 5.032037590773174e-08, + "loss": 0.0004, + "step": 38594 + }, + { + "epoch": 0.75, + "learning_rate": 5.03164925633956e-08, + "loss": 0.0014, + "step": 38595 + }, + { + "epoch": 0.75, + "learning_rate": 5.0312609219059455e-08, + "loss": 0.0005, + "step": 38596 + }, + { + "epoch": 0.75, + "learning_rate": 5.0308725874723314e-08, + "loss": 0.0004, + "step": 38597 + }, + { + "epoch": 0.75, + "learning_rate": 5.030484253038717e-08, + "loss": 0.0005, + "step": 38598 + }, + { + "epoch": 0.75, + "learning_rate": 5.030095918605103e-08, + "loss": 0.0018, + "step": 38599 + }, + { + "epoch": 0.75, + "learning_rate": 5.029707584171489e-08, + "loss": 0.0005, + "step": 38600 + }, + { + "epoch": 0.75, + "learning_rate": 5.0293192497378747e-08, + "loss": 0.0004, + "step": 38601 + }, + { + "epoch": 0.75, + "learning_rate": 5.0289309153042605e-08, + "loss": 0.0004, + "step": 38602 + }, + { + "epoch": 0.75, + "learning_rate": 5.028542580870646e-08, + "loss": 0.0007, + "step": 38603 + }, + { + "epoch": 0.75, + "learning_rate": 5.028154246437032e-08, + "loss": 0.0003, + "step": 38604 + }, + { + "epoch": 0.75, + "learning_rate": 5.0277659120034166e-08, + "loss": 0.0004, + "step": 38605 + }, + { + "epoch": 0.75, + "learning_rate": 5.0273775775698025e-08, + "loss": 0.0006, + "step": 38606 + }, + { + "epoch": 0.75, + "learning_rate": 5.026989243136188e-08, + "loss": 0.0004, + "step": 38607 + }, + { + "epoch": 0.75, + "learning_rate": 5.026600908702574e-08, + "loss": 0.0945, + "step": 38608 + }, + { + "epoch": 0.75, + "learning_rate": 5.02621257426896e-08, + "loss": 0.0004, + "step": 38609 + }, + { + "epoch": 0.75, + "learning_rate": 5.025824239835346e-08, + "loss": 0.0004, + "step": 38610 + }, + { + "epoch": 0.75, + "learning_rate": 5.0254359054017316e-08, + "loss": 0.0006, + "step": 38611 + }, + { + "epoch": 0.75, + "learning_rate": 5.0250475709681174e-08, + "loss": 0.0005, + "step": 38612 + }, + { + "epoch": 0.75, + "learning_rate": 5.024659236534503e-08, + "loss": 0.0004, + "step": 38613 + }, + { + "epoch": 0.75, + "learning_rate": 5.024270902100889e-08, + "loss": 0.0005, + "step": 38614 + }, + { + "epoch": 0.75, + "learning_rate": 5.023882567667275e-08, + "loss": 0.0004, + "step": 38615 + }, + { + "epoch": 0.75, + "learning_rate": 5.023494233233661e-08, + "loss": 0.0007, + "step": 38616 + }, + { + "epoch": 0.75, + "learning_rate": 5.0231058988000465e-08, + "loss": 0.0005, + "step": 38617 + }, + { + "epoch": 0.75, + "learning_rate": 5.0227175643664324e-08, + "loss": 0.0004, + "step": 38618 + }, + { + "epoch": 0.75, + "learning_rate": 5.022329229932818e-08, + "loss": 0.0004, + "step": 38619 + }, + { + "epoch": 0.75, + "learning_rate": 5.021940895499204e-08, + "loss": 0.0005, + "step": 38620 + }, + { + "epoch": 0.75, + "learning_rate": 5.02155256106559e-08, + "loss": 0.0004, + "step": 38621 + }, + { + "epoch": 0.75, + "learning_rate": 5.0211642266319757e-08, + "loss": 0.0004, + "step": 38622 + }, + { + "epoch": 0.75, + "learning_rate": 5.0207758921983615e-08, + "loss": 0.0005, + "step": 38623 + }, + { + "epoch": 0.75, + "learning_rate": 5.020387557764747e-08, + "loss": 0.0003, + "step": 38624 + }, + { + "epoch": 0.75, + "learning_rate": 5.0199992233311325e-08, + "loss": 0.0004, + "step": 38625 + }, + { + "epoch": 0.75, + "learning_rate": 5.019610888897518e-08, + "loss": 0.0005, + "step": 38626 + }, + { + "epoch": 0.75, + "learning_rate": 5.019222554463904e-08, + "loss": 0.0012, + "step": 38627 + }, + { + "epoch": 0.75, + "learning_rate": 5.01883422003029e-08, + "loss": 0.0005, + "step": 38628 + }, + { + "epoch": 0.75, + "learning_rate": 5.018445885596676e-08, + "loss": 0.0004, + "step": 38629 + }, + { + "epoch": 0.75, + "learning_rate": 5.0180575511630616e-08, + "loss": 0.0004, + "step": 38630 + }, + { + "epoch": 0.75, + "learning_rate": 5.0176692167294474e-08, + "loss": 0.0078, + "step": 38631 + }, + { + "epoch": 0.75, + "learning_rate": 5.017280882295833e-08, + "loss": 0.0003, + "step": 38632 + }, + { + "epoch": 0.75, + "learning_rate": 5.016892547862219e-08, + "loss": 0.0004, + "step": 38633 + }, + { + "epoch": 0.75, + "learning_rate": 5.016504213428604e-08, + "loss": 0.0006, + "step": 38634 + }, + { + "epoch": 0.75, + "learning_rate": 5.01611587899499e-08, + "loss": 0.002, + "step": 38635 + }, + { + "epoch": 0.75, + "learning_rate": 5.015727544561376e-08, + "loss": 0.0005, + "step": 38636 + }, + { + "epoch": 0.75, + "learning_rate": 5.015339210127762e-08, + "loss": 0.3585, + "step": 38637 + }, + { + "epoch": 0.75, + "learning_rate": 5.0149508756941475e-08, + "loss": 0.0003, + "step": 38638 + }, + { + "epoch": 0.75, + "learning_rate": 5.0145625412605333e-08, + "loss": 0.0004, + "step": 38639 + }, + { + "epoch": 0.75, + "learning_rate": 5.0141742068269185e-08, + "loss": 0.0004, + "step": 38640 + }, + { + "epoch": 0.75, + "learning_rate": 5.013785872393304e-08, + "loss": 0.2768, + "step": 38641 + }, + { + "epoch": 0.75, + "learning_rate": 5.01339753795969e-08, + "loss": 0.0004, + "step": 38642 + }, + { + "epoch": 0.75, + "learning_rate": 5.013009203526076e-08, + "loss": 0.0003, + "step": 38643 + }, + { + "epoch": 0.75, + "learning_rate": 5.012620869092462e-08, + "loss": 0.0033, + "step": 38644 + }, + { + "epoch": 0.75, + "learning_rate": 5.0122325346588476e-08, + "loss": 0.0003, + "step": 38645 + }, + { + "epoch": 0.75, + "learning_rate": 5.0118442002252335e-08, + "loss": 0.0007, + "step": 38646 + }, + { + "epoch": 0.75, + "learning_rate": 5.011455865791619e-08, + "loss": 0.9952, + "step": 38647 + }, + { + "epoch": 0.75, + "learning_rate": 5.011067531358005e-08, + "loss": 0.0004, + "step": 38648 + }, + { + "epoch": 0.75, + "learning_rate": 5.010679196924391e-08, + "loss": 0.0003, + "step": 38649 + }, + { + "epoch": 0.75, + "learning_rate": 5.010290862490777e-08, + "loss": 0.0003, + "step": 38650 + }, + { + "epoch": 0.75, + "learning_rate": 5.0099025280571626e-08, + "loss": 0.0007, + "step": 38651 + }, + { + "epoch": 0.75, + "learning_rate": 5.0095141936235484e-08, + "loss": 0.001, + "step": 38652 + }, + { + "epoch": 0.75, + "learning_rate": 5.009125859189934e-08, + "loss": 0.0005, + "step": 38653 + }, + { + "epoch": 0.75, + "learning_rate": 5.00873752475632e-08, + "loss": 0.0004, + "step": 38654 + }, + { + "epoch": 0.75, + "learning_rate": 5.008349190322706e-08, + "loss": 0.0005, + "step": 38655 + }, + { + "epoch": 0.75, + "learning_rate": 5.007960855889092e-08, + "loss": 0.0006, + "step": 38656 + }, + { + "epoch": 0.75, + "learning_rate": 5.0075725214554775e-08, + "loss": 0.0004, + "step": 38657 + }, + { + "epoch": 0.75, + "learning_rate": 5.0071841870218633e-08, + "loss": 0.0004, + "step": 38658 + }, + { + "epoch": 0.75, + "learning_rate": 5.006795852588249e-08, + "loss": 0.0003, + "step": 38659 + }, + { + "epoch": 0.75, + "learning_rate": 5.006407518154635e-08, + "loss": 0.0006, + "step": 38660 + }, + { + "epoch": 0.75, + "learning_rate": 5.006019183721021e-08, + "loss": 0.0005, + "step": 38661 + }, + { + "epoch": 0.75, + "learning_rate": 5.0056308492874066e-08, + "loss": 0.001, + "step": 38662 + }, + { + "epoch": 0.75, + "learning_rate": 5.005242514853791e-08, + "loss": 0.0004, + "step": 38663 + }, + { + "epoch": 0.75, + "learning_rate": 5.004854180420177e-08, + "loss": 0.0004, + "step": 38664 + }, + { + "epoch": 0.75, + "learning_rate": 5.004465845986563e-08, + "loss": 0.0004, + "step": 38665 + }, + { + "epoch": 0.75, + "learning_rate": 5.0040775115529486e-08, + "loss": 0.5159, + "step": 38666 + }, + { + "epoch": 0.75, + "learning_rate": 5.0036891771193344e-08, + "loss": 0.0164, + "step": 38667 + }, + { + "epoch": 0.75, + "learning_rate": 5.00330084268572e-08, + "loss": 0.0005, + "step": 38668 + }, + { + "epoch": 0.75, + "learning_rate": 5.002912508252106e-08, + "loss": 0.0034, + "step": 38669 + }, + { + "epoch": 0.75, + "learning_rate": 5.002524173818492e-08, + "loss": 0.0003, + "step": 38670 + }, + { + "epoch": 0.75, + "learning_rate": 5.002135839384878e-08, + "loss": 0.0003, + "step": 38671 + }, + { + "epoch": 0.75, + "learning_rate": 5.0017475049512636e-08, + "loss": 0.8922, + "step": 38672 + }, + { + "epoch": 0.75, + "learning_rate": 5.0013591705176494e-08, + "loss": 0.0005, + "step": 38673 + }, + { + "epoch": 0.75, + "learning_rate": 5.000970836084035e-08, + "loss": 0.0004, + "step": 38674 + }, + { + "epoch": 0.75, + "learning_rate": 5.000582501650421e-08, + "loss": 0.0005, + "step": 38675 + }, + { + "epoch": 0.75, + "learning_rate": 5.000194167216807e-08, + "loss": 0.0006, + "step": 38676 + }, + { + "epoch": 0.75, + "learning_rate": 4.999805832783193e-08, + "loss": 0.0016, + "step": 38677 + }, + { + "epoch": 0.75, + "learning_rate": 4.9994174983495785e-08, + "loss": 0.1216, + "step": 38678 + }, + { + "epoch": 0.75, + "learning_rate": 4.9990291639159643e-08, + "loss": 0.0003, + "step": 38679 + }, + { + "epoch": 0.75, + "learning_rate": 4.99864082948235e-08, + "loss": 0.0003, + "step": 38680 + }, + { + "epoch": 0.75, + "learning_rate": 4.998252495048736e-08, + "loss": 0.0005, + "step": 38681 + }, + { + "epoch": 0.75, + "learning_rate": 4.997864160615122e-08, + "loss": 0.0005, + "step": 38682 + }, + { + "epoch": 0.75, + "learning_rate": 4.9974758261815076e-08, + "loss": 1.2846, + "step": 38683 + }, + { + "epoch": 0.75, + "learning_rate": 4.997087491747893e-08, + "loss": 0.0004, + "step": 38684 + }, + { + "epoch": 0.75, + "learning_rate": 4.9966991573142786e-08, + "loss": 0.0003, + "step": 38685 + }, + { + "epoch": 0.75, + "learning_rate": 4.9963108228806644e-08, + "loss": 0.0032, + "step": 38686 + }, + { + "epoch": 0.75, + "learning_rate": 4.99592248844705e-08, + "loss": 0.0004, + "step": 38687 + }, + { + "epoch": 0.75, + "learning_rate": 4.995534154013436e-08, + "loss": 0.0003, + "step": 38688 + }, + { + "epoch": 0.75, + "learning_rate": 4.995145819579822e-08, + "loss": 0.0007, + "step": 38689 + }, + { + "epoch": 0.75, + "learning_rate": 4.994757485146208e-08, + "loss": 0.0003, + "step": 38690 + }, + { + "epoch": 0.75, + "learning_rate": 4.9943691507125936e-08, + "loss": 0.0005, + "step": 38691 + }, + { + "epoch": 0.75, + "learning_rate": 4.9939808162789794e-08, + "loss": 0.0005, + "step": 38692 + }, + { + "epoch": 0.75, + "learning_rate": 4.993592481845365e-08, + "loss": 0.0004, + "step": 38693 + }, + { + "epoch": 0.75, + "learning_rate": 4.993204147411751e-08, + "loss": 0.0021, + "step": 38694 + }, + { + "epoch": 0.75, + "learning_rate": 4.992815812978137e-08, + "loss": 0.0003, + "step": 38695 + }, + { + "epoch": 0.75, + "learning_rate": 4.992427478544523e-08, + "loss": 0.0003, + "step": 38696 + }, + { + "epoch": 0.75, + "learning_rate": 4.9920391441109085e-08, + "loss": 0.0009, + "step": 38697 + }, + { + "epoch": 0.75, + "learning_rate": 4.9916508096772943e-08, + "loss": 0.926, + "step": 38698 + }, + { + "epoch": 0.75, + "learning_rate": 4.9912624752436795e-08, + "loss": 0.0004, + "step": 38699 + }, + { + "epoch": 0.75, + "learning_rate": 4.990874140810065e-08, + "loss": 0.0003, + "step": 38700 + }, + { + "epoch": 0.75, + "learning_rate": 4.990485806376451e-08, + "loss": 0.0007, + "step": 38701 + }, + { + "epoch": 0.75, + "learning_rate": 4.990097471942837e-08, + "loss": 0.0004, + "step": 38702 + }, + { + "epoch": 0.75, + "learning_rate": 4.989709137509223e-08, + "loss": 0.0003, + "step": 38703 + }, + { + "epoch": 0.75, + "learning_rate": 4.9893208030756086e-08, + "loss": 0.0425, + "step": 38704 + }, + { + "epoch": 0.75, + "learning_rate": 4.9889324686419944e-08, + "loss": 0.0012, + "step": 38705 + }, + { + "epoch": 0.75, + "learning_rate": 4.98854413420838e-08, + "loss": 0.002, + "step": 38706 + }, + { + "epoch": 0.75, + "learning_rate": 4.988155799774766e-08, + "loss": 0.0003, + "step": 38707 + }, + { + "epoch": 0.75, + "learning_rate": 4.987767465341152e-08, + "loss": 0.0004, + "step": 38708 + }, + { + "epoch": 0.75, + "learning_rate": 4.987379130907538e-08, + "loss": 0.0005, + "step": 38709 + }, + { + "epoch": 0.75, + "learning_rate": 4.9869907964739236e-08, + "loss": 0.0004, + "step": 38710 + }, + { + "epoch": 0.75, + "learning_rate": 4.9866024620403094e-08, + "loss": 0.0008, + "step": 38711 + }, + { + "epoch": 0.75, + "learning_rate": 4.986214127606695e-08, + "loss": 0.0003, + "step": 38712 + }, + { + "epoch": 0.75, + "learning_rate": 4.9858257931730804e-08, + "loss": 0.0006, + "step": 38713 + }, + { + "epoch": 0.75, + "learning_rate": 4.985437458739466e-08, + "loss": 0.0004, + "step": 38714 + }, + { + "epoch": 0.75, + "learning_rate": 4.985049124305852e-08, + "loss": 0.0011, + "step": 38715 + }, + { + "epoch": 0.75, + "learning_rate": 4.984660789872238e-08, + "loss": 0.0004, + "step": 38716 + }, + { + "epoch": 0.75, + "learning_rate": 4.984272455438624e-08, + "loss": 0.0005, + "step": 38717 + }, + { + "epoch": 0.75, + "learning_rate": 4.9838841210050095e-08, + "loss": 0.0004, + "step": 38718 + }, + { + "epoch": 0.75, + "learning_rate": 4.983495786571395e-08, + "loss": 0.0004, + "step": 38719 + }, + { + "epoch": 0.75, + "learning_rate": 4.983107452137781e-08, + "loss": 0.001, + "step": 38720 + }, + { + "epoch": 0.75, + "learning_rate": 4.982719117704166e-08, + "loss": 0.0004, + "step": 38721 + }, + { + "epoch": 0.75, + "learning_rate": 4.982330783270552e-08, + "loss": 0.0004, + "step": 38722 + }, + { + "epoch": 0.75, + "learning_rate": 4.981942448836938e-08, + "loss": 0.0009, + "step": 38723 + }, + { + "epoch": 0.75, + "learning_rate": 4.981554114403324e-08, + "loss": 0.0005, + "step": 38724 + }, + { + "epoch": 0.75, + "learning_rate": 4.9811657799697096e-08, + "loss": 0.0003, + "step": 38725 + }, + { + "epoch": 0.75, + "learning_rate": 4.9807774455360954e-08, + "loss": 0.0005, + "step": 38726 + }, + { + "epoch": 0.75, + "learning_rate": 4.980389111102481e-08, + "loss": 0.0004, + "step": 38727 + }, + { + "epoch": 0.75, + "learning_rate": 4.980000776668867e-08, + "loss": 0.0007, + "step": 38728 + }, + { + "epoch": 0.75, + "learning_rate": 4.979612442235252e-08, + "loss": 0.0053, + "step": 38729 + }, + { + "epoch": 0.75, + "learning_rate": 4.979224107801638e-08, + "loss": 1.2806, + "step": 38730 + }, + { + "epoch": 0.75, + "learning_rate": 4.978835773368024e-08, + "loss": 0.0004, + "step": 38731 + }, + { + "epoch": 0.75, + "learning_rate": 4.97844743893441e-08, + "loss": 0.0008, + "step": 38732 + }, + { + "epoch": 0.75, + "learning_rate": 4.9780591045007955e-08, + "loss": 0.0011, + "step": 38733 + }, + { + "epoch": 0.75, + "learning_rate": 4.9776707700671814e-08, + "loss": 0.0005, + "step": 38734 + }, + { + "epoch": 0.75, + "learning_rate": 4.977282435633567e-08, + "loss": 0.0004, + "step": 38735 + }, + { + "epoch": 0.75, + "learning_rate": 4.976894101199953e-08, + "loss": 0.0005, + "step": 38736 + }, + { + "epoch": 0.75, + "learning_rate": 4.976505766766339e-08, + "loss": 0.0009, + "step": 38737 + }, + { + "epoch": 0.75, + "learning_rate": 4.9761174323327247e-08, + "loss": 0.0249, + "step": 38738 + }, + { + "epoch": 0.75, + "learning_rate": 4.9757290978991105e-08, + "loss": 0.1858, + "step": 38739 + }, + { + "epoch": 0.75, + "learning_rate": 4.975340763465496e-08, + "loss": 0.0006, + "step": 38740 + }, + { + "epoch": 0.75, + "learning_rate": 4.974952429031882e-08, + "loss": 0.0003, + "step": 38741 + }, + { + "epoch": 0.75, + "learning_rate": 4.974564094598267e-08, + "loss": 0.0027, + "step": 38742 + }, + { + "epoch": 0.75, + "learning_rate": 4.974175760164653e-08, + "loss": 0.0009, + "step": 38743 + }, + { + "epoch": 0.75, + "learning_rate": 4.973787425731039e-08, + "loss": 0.0004, + "step": 38744 + }, + { + "epoch": 0.75, + "learning_rate": 4.973399091297425e-08, + "loss": 0.0027, + "step": 38745 + }, + { + "epoch": 0.75, + "learning_rate": 4.9730107568638106e-08, + "loss": 0.0003, + "step": 38746 + }, + { + "epoch": 0.75, + "learning_rate": 4.9726224224301964e-08, + "loss": 0.0006, + "step": 38747 + }, + { + "epoch": 0.75, + "learning_rate": 4.972234087996582e-08, + "loss": 0.0005, + "step": 38748 + }, + { + "epoch": 0.75, + "learning_rate": 4.971845753562968e-08, + "loss": 0.0005, + "step": 38749 + }, + { + "epoch": 0.75, + "learning_rate": 4.971457419129354e-08, + "loss": 0.0004, + "step": 38750 + }, + { + "epoch": 0.75, + "learning_rate": 4.97106908469574e-08, + "loss": 0.0004, + "step": 38751 + }, + { + "epoch": 0.75, + "learning_rate": 4.9706807502621255e-08, + "loss": 0.0005, + "step": 38752 + }, + { + "epoch": 0.75, + "learning_rate": 4.9702924158285114e-08, + "loss": 0.0004, + "step": 38753 + }, + { + "epoch": 0.75, + "learning_rate": 4.969904081394897e-08, + "loss": 0.0004, + "step": 38754 + }, + { + "epoch": 0.75, + "learning_rate": 4.969515746961283e-08, + "loss": 0.0016, + "step": 38755 + }, + { + "epoch": 0.75, + "learning_rate": 4.969127412527669e-08, + "loss": 0.0012, + "step": 38756 + }, + { + "epoch": 0.75, + "learning_rate": 4.968739078094054e-08, + "loss": 0.0004, + "step": 38757 + }, + { + "epoch": 0.75, + "learning_rate": 4.96835074366044e-08, + "loss": 0.0005, + "step": 38758 + }, + { + "epoch": 0.75, + "learning_rate": 4.9679624092268257e-08, + "loss": 0.0004, + "step": 38759 + }, + { + "epoch": 0.75, + "learning_rate": 4.9675740747932115e-08, + "loss": 0.0006, + "step": 38760 + }, + { + "epoch": 0.75, + "learning_rate": 4.967185740359597e-08, + "loss": 0.0017, + "step": 38761 + }, + { + "epoch": 0.75, + "learning_rate": 4.966797405925983e-08, + "loss": 0.0006, + "step": 38762 + }, + { + "epoch": 0.75, + "learning_rate": 4.966409071492369e-08, + "loss": 0.0003, + "step": 38763 + }, + { + "epoch": 0.75, + "learning_rate": 4.966020737058755e-08, + "loss": 0.0005, + "step": 38764 + }, + { + "epoch": 0.75, + "learning_rate": 4.9656324026251406e-08, + "loss": 0.0059, + "step": 38765 + }, + { + "epoch": 0.75, + "learning_rate": 4.9652440681915264e-08, + "loss": 0.0056, + "step": 38766 + }, + { + "epoch": 0.75, + "learning_rate": 4.964855733757912e-08, + "loss": 0.6792, + "step": 38767 + }, + { + "epoch": 0.75, + "learning_rate": 4.964467399324298e-08, + "loss": 0.001, + "step": 38768 + }, + { + "epoch": 0.75, + "learning_rate": 4.964079064890684e-08, + "loss": 0.0003, + "step": 38769 + }, + { + "epoch": 0.75, + "learning_rate": 4.96369073045707e-08, + "loss": 0.0005, + "step": 38770 + }, + { + "epoch": 0.75, + "learning_rate": 4.963302396023455e-08, + "loss": 0.0035, + "step": 38771 + }, + { + "epoch": 0.75, + "learning_rate": 4.962914061589841e-08, + "loss": 0.6516, + "step": 38772 + }, + { + "epoch": 0.75, + "learning_rate": 4.9625257271562265e-08, + "loss": 0.0005, + "step": 38773 + }, + { + "epoch": 0.75, + "learning_rate": 4.9621373927226124e-08, + "loss": 0.0007, + "step": 38774 + }, + { + "epoch": 0.75, + "learning_rate": 4.961749058288998e-08, + "loss": 0.0004, + "step": 38775 + }, + { + "epoch": 0.75, + "learning_rate": 4.961360723855384e-08, + "loss": 1.2482, + "step": 38776 + }, + { + "epoch": 0.75, + "learning_rate": 4.96097238942177e-08, + "loss": 0.0005, + "step": 38777 + }, + { + "epoch": 0.75, + "learning_rate": 4.9605840549881557e-08, + "loss": 0.0024, + "step": 38778 + }, + { + "epoch": 0.75, + "learning_rate": 4.9601957205545415e-08, + "loss": 0.0005, + "step": 38779 + }, + { + "epoch": 0.75, + "learning_rate": 4.959807386120927e-08, + "loss": 0.0004, + "step": 38780 + }, + { + "epoch": 0.75, + "learning_rate": 4.959419051687313e-08, + "loss": 0.0004, + "step": 38781 + }, + { + "epoch": 0.75, + "learning_rate": 4.959030717253699e-08, + "loss": 0.0003, + "step": 38782 + }, + { + "epoch": 0.75, + "learning_rate": 4.958642382820085e-08, + "loss": 0.5364, + "step": 38783 + }, + { + "epoch": 0.75, + "learning_rate": 4.9582540483864706e-08, + "loss": 0.0004, + "step": 38784 + }, + { + "epoch": 0.75, + "learning_rate": 4.9578657139528564e-08, + "loss": 0.0004, + "step": 38785 + }, + { + "epoch": 0.75, + "learning_rate": 4.9574773795192416e-08, + "loss": 0.0004, + "step": 38786 + }, + { + "epoch": 0.75, + "learning_rate": 4.9570890450856274e-08, + "loss": 0.0005, + "step": 38787 + }, + { + "epoch": 0.75, + "learning_rate": 4.956700710652013e-08, + "loss": 0.9676, + "step": 38788 + }, + { + "epoch": 0.75, + "learning_rate": 4.956312376218399e-08, + "loss": 0.0005, + "step": 38789 + }, + { + "epoch": 0.75, + "learning_rate": 4.955924041784785e-08, + "loss": 0.8653, + "step": 38790 + }, + { + "epoch": 0.75, + "learning_rate": 4.955535707351171e-08, + "loss": 0.0045, + "step": 38791 + }, + { + "epoch": 0.75, + "learning_rate": 4.9551473729175565e-08, + "loss": 0.0003, + "step": 38792 + }, + { + "epoch": 0.75, + "learning_rate": 4.9547590384839424e-08, + "loss": 0.0004, + "step": 38793 + }, + { + "epoch": 0.75, + "learning_rate": 4.954370704050328e-08, + "loss": 0.0006, + "step": 38794 + }, + { + "epoch": 0.75, + "learning_rate": 4.953982369616714e-08, + "loss": 0.0005, + "step": 38795 + }, + { + "epoch": 0.75, + "learning_rate": 4.9535940351831e-08, + "loss": 0.0006, + "step": 38796 + }, + { + "epoch": 0.75, + "learning_rate": 4.9532057007494857e-08, + "loss": 0.0008, + "step": 38797 + }, + { + "epoch": 0.75, + "learning_rate": 4.9528173663158715e-08, + "loss": 0.0005, + "step": 38798 + }, + { + "epoch": 0.75, + "learning_rate": 4.952429031882257e-08, + "loss": 0.0004, + "step": 38799 + }, + { + "epoch": 0.75, + "learning_rate": 4.9520406974486425e-08, + "loss": 0.0004, + "step": 38800 + }, + { + "epoch": 0.75, + "learning_rate": 4.951652363015028e-08, + "loss": 0.0005, + "step": 38801 + }, + { + "epoch": 0.75, + "learning_rate": 4.951264028581414e-08, + "loss": 0.0004, + "step": 38802 + }, + { + "epoch": 0.75, + "learning_rate": 4.9508756941478e-08, + "loss": 0.0104, + "step": 38803 + }, + { + "epoch": 0.75, + "learning_rate": 4.950487359714186e-08, + "loss": 0.0095, + "step": 38804 + }, + { + "epoch": 0.75, + "learning_rate": 4.9500990252805716e-08, + "loss": 0.0942, + "step": 38805 + }, + { + "epoch": 0.75, + "learning_rate": 4.9497106908469574e-08, + "loss": 0.0005, + "step": 38806 + }, + { + "epoch": 0.75, + "learning_rate": 4.949322356413343e-08, + "loss": 0.0004, + "step": 38807 + }, + { + "epoch": 0.75, + "learning_rate": 4.948934021979729e-08, + "loss": 0.0009, + "step": 38808 + }, + { + "epoch": 0.75, + "learning_rate": 4.948545687546115e-08, + "loss": 0.0004, + "step": 38809 + }, + { + "epoch": 0.75, + "learning_rate": 4.9481573531125e-08, + "loss": 0.0003, + "step": 38810 + }, + { + "epoch": 0.75, + "learning_rate": 4.947769018678886e-08, + "loss": 0.0008, + "step": 38811 + }, + { + "epoch": 0.75, + "learning_rate": 4.947380684245272e-08, + "loss": 0.0004, + "step": 38812 + }, + { + "epoch": 0.75, + "learning_rate": 4.9469923498116575e-08, + "loss": 0.0005, + "step": 38813 + }, + { + "epoch": 0.75, + "learning_rate": 4.9466040153780434e-08, + "loss": 0.0002, + "step": 38814 + }, + { + "epoch": 0.75, + "learning_rate": 4.946215680944429e-08, + "loss": 0.0023, + "step": 38815 + }, + { + "epoch": 0.75, + "learning_rate": 4.945827346510815e-08, + "loss": 0.0005, + "step": 38816 + }, + { + "epoch": 0.75, + "learning_rate": 4.9454390120772e-08, + "loss": 0.0003, + "step": 38817 + }, + { + "epoch": 0.75, + "learning_rate": 4.945050677643586e-08, + "loss": 0.0005, + "step": 38818 + }, + { + "epoch": 0.75, + "learning_rate": 4.944662343209972e-08, + "loss": 0.0005, + "step": 38819 + }, + { + "epoch": 0.75, + "learning_rate": 4.9442740087763576e-08, + "loss": 0.0522, + "step": 38820 + }, + { + "epoch": 0.75, + "learning_rate": 4.9438856743427435e-08, + "loss": 0.0005, + "step": 38821 + }, + { + "epoch": 0.75, + "learning_rate": 4.943497339909129e-08, + "loss": 0.0065, + "step": 38822 + }, + { + "epoch": 0.75, + "learning_rate": 4.943109005475515e-08, + "loss": 0.001, + "step": 38823 + }, + { + "epoch": 0.75, + "learning_rate": 4.942720671041901e-08, + "loss": 0.0011, + "step": 38824 + }, + { + "epoch": 0.75, + "learning_rate": 4.942332336608287e-08, + "loss": 0.0022, + "step": 38825 + }, + { + "epoch": 0.75, + "learning_rate": 4.9419440021746726e-08, + "loss": 0.0003, + "step": 38826 + }, + { + "epoch": 0.75, + "learning_rate": 4.9415556677410584e-08, + "loss": 0.0005, + "step": 38827 + }, + { + "epoch": 0.75, + "learning_rate": 4.941167333307444e-08, + "loss": 0.0003, + "step": 38828 + }, + { + "epoch": 0.75, + "learning_rate": 4.9407789988738294e-08, + "loss": 0.0592, + "step": 38829 + }, + { + "epoch": 0.75, + "learning_rate": 4.940390664440215e-08, + "loss": 0.3468, + "step": 38830 + }, + { + "epoch": 0.75, + "learning_rate": 4.940002330006601e-08, + "loss": 0.0006, + "step": 38831 + }, + { + "epoch": 0.75, + "learning_rate": 4.939613995572987e-08, + "loss": 0.0004, + "step": 38832 + }, + { + "epoch": 0.75, + "learning_rate": 4.939225661139373e-08, + "loss": 0.0003, + "step": 38833 + }, + { + "epoch": 0.75, + "learning_rate": 4.9388373267057585e-08, + "loss": 0.0003, + "step": 38834 + }, + { + "epoch": 0.75, + "learning_rate": 4.9384489922721443e-08, + "loss": 0.0003, + "step": 38835 + }, + { + "epoch": 0.75, + "learning_rate": 4.93806065783853e-08, + "loss": 0.0005, + "step": 38836 + }, + { + "epoch": 0.75, + "learning_rate": 4.937672323404916e-08, + "loss": 0.0061, + "step": 38837 + }, + { + "epoch": 0.75, + "learning_rate": 4.937283988971302e-08, + "loss": 0.0005, + "step": 38838 + }, + { + "epoch": 0.75, + "learning_rate": 4.9368956545376876e-08, + "loss": 0.0031, + "step": 38839 + }, + { + "epoch": 0.75, + "learning_rate": 4.9365073201040735e-08, + "loss": 0.0004, + "step": 38840 + }, + { + "epoch": 0.75, + "learning_rate": 4.936118985670459e-08, + "loss": 0.0446, + "step": 38841 + }, + { + "epoch": 0.75, + "learning_rate": 4.935730651236845e-08, + "loss": 0.0007, + "step": 38842 + }, + { + "epoch": 0.75, + "learning_rate": 4.935342316803231e-08, + "loss": 0.8474, + "step": 38843 + }, + { + "epoch": 0.75, + "learning_rate": 4.934953982369616e-08, + "loss": 0.0165, + "step": 38844 + }, + { + "epoch": 0.75, + "learning_rate": 4.934565647936002e-08, + "loss": 0.0004, + "step": 38845 + }, + { + "epoch": 0.75, + "learning_rate": 4.934177313502388e-08, + "loss": 0.0004, + "step": 38846 + }, + { + "epoch": 0.75, + "learning_rate": 4.9337889790687736e-08, + "loss": 0.0003, + "step": 38847 + }, + { + "epoch": 0.75, + "learning_rate": 4.9334006446351594e-08, + "loss": 0.516, + "step": 38848 + }, + { + "epoch": 0.75, + "learning_rate": 4.933012310201545e-08, + "loss": 0.0002, + "step": 38849 + }, + { + "epoch": 0.75, + "learning_rate": 4.932623975767931e-08, + "loss": 0.0006, + "step": 38850 + }, + { + "epoch": 0.75, + "learning_rate": 4.932235641334317e-08, + "loss": 0.0006, + "step": 38851 + }, + { + "epoch": 0.75, + "learning_rate": 4.931847306900703e-08, + "loss": 0.0003, + "step": 38852 + }, + { + "epoch": 0.75, + "learning_rate": 4.9314589724670885e-08, + "loss": 0.002, + "step": 38853 + }, + { + "epoch": 0.75, + "learning_rate": 4.9310706380334743e-08, + "loss": 0.0016, + "step": 38854 + }, + { + "epoch": 0.75, + "learning_rate": 4.93068230359986e-08, + "loss": 0.0004, + "step": 38855 + }, + { + "epoch": 0.75, + "learning_rate": 4.930293969166246e-08, + "loss": 0.0004, + "step": 38856 + }, + { + "epoch": 0.75, + "learning_rate": 4.929905634732632e-08, + "loss": 0.0004, + "step": 38857 + }, + { + "epoch": 0.75, + "learning_rate": 4.929517300299017e-08, + "loss": 0.0005, + "step": 38858 + }, + { + "epoch": 0.75, + "learning_rate": 4.929128965865403e-08, + "loss": 0.0008, + "step": 38859 + }, + { + "epoch": 0.75, + "learning_rate": 4.9287406314317886e-08, + "loss": 0.8095, + "step": 38860 + }, + { + "epoch": 0.75, + "learning_rate": 4.9283522969981745e-08, + "loss": 0.0003, + "step": 38861 + }, + { + "epoch": 0.75, + "learning_rate": 4.92796396256456e-08, + "loss": 0.0008, + "step": 38862 + }, + { + "epoch": 0.75, + "learning_rate": 4.927575628130946e-08, + "loss": 0.0004, + "step": 38863 + }, + { + "epoch": 0.75, + "learning_rate": 4.927187293697332e-08, + "loss": 0.0007, + "step": 38864 + }, + { + "epoch": 0.75, + "learning_rate": 4.926798959263718e-08, + "loss": 0.0004, + "step": 38865 + }, + { + "epoch": 0.75, + "learning_rate": 4.9264106248301036e-08, + "loss": 0.6537, + "step": 38866 + }, + { + "epoch": 0.75, + "learning_rate": 4.9260222903964894e-08, + "loss": 0.0004, + "step": 38867 + }, + { + "epoch": 0.75, + "learning_rate": 4.925633955962875e-08, + "loss": 0.0004, + "step": 38868 + }, + { + "epoch": 0.75, + "learning_rate": 4.925245621529261e-08, + "loss": 0.0005, + "step": 38869 + }, + { + "epoch": 0.75, + "learning_rate": 4.924857287095647e-08, + "loss": 0.0003, + "step": 38870 + }, + { + "epoch": 0.75, + "learning_rate": 4.924468952662033e-08, + "loss": 0.0005, + "step": 38871 + }, + { + "epoch": 0.75, + "learning_rate": 4.9240806182284185e-08, + "loss": 0.0024, + "step": 38872 + }, + { + "epoch": 0.75, + "learning_rate": 4.923692283794804e-08, + "loss": 0.0009, + "step": 38873 + }, + { + "epoch": 0.75, + "learning_rate": 4.9233039493611895e-08, + "loss": 0.0005, + "step": 38874 + }, + { + "epoch": 0.75, + "learning_rate": 4.9229156149275753e-08, + "loss": 0.0003, + "step": 38875 + }, + { + "epoch": 0.75, + "learning_rate": 4.922527280493961e-08, + "loss": 0.0006, + "step": 38876 + }, + { + "epoch": 0.75, + "learning_rate": 4.922138946060347e-08, + "loss": 0.0004, + "step": 38877 + }, + { + "epoch": 0.75, + "learning_rate": 4.921750611626733e-08, + "loss": 0.0004, + "step": 38878 + }, + { + "epoch": 0.75, + "learning_rate": 4.9213622771931186e-08, + "loss": 0.0004, + "step": 38879 + }, + { + "epoch": 0.75, + "learning_rate": 4.9209739427595045e-08, + "loss": 0.0003, + "step": 38880 + }, + { + "epoch": 0.75, + "learning_rate": 4.92058560832589e-08, + "loss": 0.5163, + "step": 38881 + }, + { + "epoch": 0.75, + "learning_rate": 4.920197273892276e-08, + "loss": 0.0006, + "step": 38882 + }, + { + "epoch": 0.75, + "learning_rate": 4.919808939458662e-08, + "loss": 0.0004, + "step": 38883 + }, + { + "epoch": 0.75, + "learning_rate": 4.919420605025048e-08, + "loss": 0.0017, + "step": 38884 + }, + { + "epoch": 0.75, + "learning_rate": 4.9190322705914336e-08, + "loss": 0.0005, + "step": 38885 + }, + { + "epoch": 0.75, + "learning_rate": 4.9186439361578194e-08, + "loss": 0.0004, + "step": 38886 + }, + { + "epoch": 0.75, + "learning_rate": 4.9182556017242046e-08, + "loss": 0.0003, + "step": 38887 + }, + { + "epoch": 0.75, + "learning_rate": 4.9178672672905904e-08, + "loss": 0.0005, + "step": 38888 + }, + { + "epoch": 0.75, + "learning_rate": 4.917478932856976e-08, + "loss": 0.0003, + "step": 38889 + }, + { + "epoch": 0.75, + "learning_rate": 4.917090598423362e-08, + "loss": 0.0006, + "step": 38890 + }, + { + "epoch": 0.75, + "learning_rate": 4.916702263989748e-08, + "loss": 0.0005, + "step": 38891 + }, + { + "epoch": 0.75, + "learning_rate": 4.916313929556134e-08, + "loss": 0.0004, + "step": 38892 + }, + { + "epoch": 0.75, + "learning_rate": 4.9159255951225195e-08, + "loss": 0.0004, + "step": 38893 + }, + { + "epoch": 0.75, + "learning_rate": 4.9155372606889053e-08, + "loss": 0.0006, + "step": 38894 + }, + { + "epoch": 0.75, + "learning_rate": 4.915148926255291e-08, + "loss": 0.0004, + "step": 38895 + }, + { + "epoch": 0.75, + "learning_rate": 4.914760591821677e-08, + "loss": 0.0084, + "step": 38896 + }, + { + "epoch": 0.75, + "learning_rate": 4.914372257388063e-08, + "loss": 0.0003, + "step": 38897 + }, + { + "epoch": 0.75, + "learning_rate": 4.913983922954448e-08, + "loss": 0.0012, + "step": 38898 + }, + { + "epoch": 0.75, + "learning_rate": 4.913595588520834e-08, + "loss": 0.0004, + "step": 38899 + }, + { + "epoch": 0.75, + "learning_rate": 4.9132072540872196e-08, + "loss": 0.0003, + "step": 38900 + }, + { + "epoch": 0.75, + "learning_rate": 4.9128189196536054e-08, + "loss": 0.0005, + "step": 38901 + }, + { + "epoch": 0.75, + "learning_rate": 4.912430585219991e-08, + "loss": 0.0004, + "step": 38902 + }, + { + "epoch": 0.75, + "learning_rate": 4.912042250786377e-08, + "loss": 0.0006, + "step": 38903 + }, + { + "epoch": 0.75, + "learning_rate": 4.911653916352763e-08, + "loss": 0.0003, + "step": 38904 + }, + { + "epoch": 0.75, + "learning_rate": 4.911265581919149e-08, + "loss": 0.0004, + "step": 38905 + }, + { + "epoch": 0.75, + "learning_rate": 4.910877247485534e-08, + "loss": 0.0006, + "step": 38906 + }, + { + "epoch": 0.75, + "learning_rate": 4.91048891305192e-08, + "loss": 0.0005, + "step": 38907 + }, + { + "epoch": 0.75, + "learning_rate": 4.9101005786183056e-08, + "loss": 0.0005, + "step": 38908 + }, + { + "epoch": 0.75, + "learning_rate": 4.9097122441846914e-08, + "loss": 0.0006, + "step": 38909 + }, + { + "epoch": 0.75, + "learning_rate": 4.909323909751077e-08, + "loss": 0.0004, + "step": 38910 + }, + { + "epoch": 0.75, + "learning_rate": 4.908935575317463e-08, + "loss": 0.0005, + "step": 38911 + }, + { + "epoch": 0.75, + "learning_rate": 4.908547240883849e-08, + "loss": 0.0005, + "step": 38912 + }, + { + "epoch": 0.75, + "learning_rate": 4.908158906450235e-08, + "loss": 0.0011, + "step": 38913 + }, + { + "epoch": 0.75, + "learning_rate": 4.9077705720166205e-08, + "loss": 0.0003, + "step": 38914 + }, + { + "epoch": 0.75, + "learning_rate": 4.907382237583006e-08, + "loss": 0.0005, + "step": 38915 + }, + { + "epoch": 0.75, + "learning_rate": 4.9069939031493915e-08, + "loss": 0.0005, + "step": 38916 + }, + { + "epoch": 0.75, + "learning_rate": 4.906605568715777e-08, + "loss": 0.6075, + "step": 38917 + }, + { + "epoch": 0.75, + "learning_rate": 4.906217234282163e-08, + "loss": 0.0003, + "step": 38918 + }, + { + "epoch": 0.75, + "learning_rate": 4.905828899848549e-08, + "loss": 0.0003, + "step": 38919 + }, + { + "epoch": 0.75, + "learning_rate": 4.905440565414935e-08, + "loss": 0.7593, + "step": 38920 + }, + { + "epoch": 0.75, + "learning_rate": 4.9050522309813206e-08, + "loss": 0.0004, + "step": 38921 + }, + { + "epoch": 0.76, + "learning_rate": 4.9046638965477064e-08, + "loss": 0.0004, + "step": 38922 + }, + { + "epoch": 0.76, + "learning_rate": 4.904275562114092e-08, + "loss": 0.0005, + "step": 38923 + }, + { + "epoch": 0.76, + "learning_rate": 4.903887227680478e-08, + "loss": 0.0005, + "step": 38924 + }, + { + "epoch": 0.76, + "learning_rate": 4.903498893246864e-08, + "loss": 0.0205, + "step": 38925 + }, + { + "epoch": 0.76, + "learning_rate": 4.90311055881325e-08, + "loss": 0.0004, + "step": 38926 + }, + { + "epoch": 0.76, + "learning_rate": 4.9027222243796356e-08, + "loss": 0.0035, + "step": 38927 + }, + { + "epoch": 0.76, + "learning_rate": 4.9023338899460214e-08, + "loss": 0.0005, + "step": 38928 + }, + { + "epoch": 0.76, + "learning_rate": 4.901945555512407e-08, + "loss": 0.0003, + "step": 38929 + }, + { + "epoch": 0.76, + "learning_rate": 4.901557221078793e-08, + "loss": 0.0005, + "step": 38930 + }, + { + "epoch": 0.76, + "learning_rate": 4.901168886645178e-08, + "loss": 1.027, + "step": 38931 + }, + { + "epoch": 0.76, + "learning_rate": 4.900780552211564e-08, + "loss": 0.0414, + "step": 38932 + }, + { + "epoch": 0.76, + "learning_rate": 4.90039221777795e-08, + "loss": 0.0006, + "step": 38933 + }, + { + "epoch": 0.76, + "learning_rate": 4.9000038833443357e-08, + "loss": 0.0023, + "step": 38934 + }, + { + "epoch": 0.76, + "learning_rate": 4.8996155489107215e-08, + "loss": 1.0722, + "step": 38935 + }, + { + "epoch": 0.76, + "learning_rate": 4.899227214477107e-08, + "loss": 0.0004, + "step": 38936 + }, + { + "epoch": 0.76, + "learning_rate": 4.898838880043493e-08, + "loss": 0.0004, + "step": 38937 + }, + { + "epoch": 0.76, + "learning_rate": 4.898450545609879e-08, + "loss": 0.0004, + "step": 38938 + }, + { + "epoch": 0.76, + "learning_rate": 4.898062211176265e-08, + "loss": 0.0003, + "step": 38939 + }, + { + "epoch": 0.76, + "learning_rate": 4.8976738767426506e-08, + "loss": 0.5731, + "step": 38940 + }, + { + "epoch": 0.76, + "learning_rate": 4.8972855423090364e-08, + "loss": 0.0005, + "step": 38941 + }, + { + "epoch": 0.76, + "learning_rate": 4.896897207875422e-08, + "loss": 0.0004, + "step": 38942 + }, + { + "epoch": 0.76, + "learning_rate": 4.896508873441808e-08, + "loss": 0.0004, + "step": 38943 + }, + { + "epoch": 0.76, + "learning_rate": 4.896120539008194e-08, + "loss": 0.0003, + "step": 38944 + }, + { + "epoch": 0.76, + "learning_rate": 4.895732204574579e-08, + "loss": 0.0003, + "step": 38945 + }, + { + "epoch": 0.76, + "learning_rate": 4.895343870140965e-08, + "loss": 0.0004, + "step": 38946 + }, + { + "epoch": 0.76, + "learning_rate": 4.894955535707351e-08, + "loss": 0.7, + "step": 38947 + }, + { + "epoch": 0.76, + "learning_rate": 4.8945672012737365e-08, + "loss": 0.0016, + "step": 38948 + }, + { + "epoch": 0.76, + "learning_rate": 4.8941788668401224e-08, + "loss": 0.0004, + "step": 38949 + }, + { + "epoch": 0.76, + "learning_rate": 4.893790532406508e-08, + "loss": 0.0022, + "step": 38950 + }, + { + "epoch": 0.76, + "learning_rate": 4.893402197972894e-08, + "loss": 0.7087, + "step": 38951 + }, + { + "epoch": 0.76, + "learning_rate": 4.89301386353928e-08, + "loss": 0.0004, + "step": 38952 + }, + { + "epoch": 0.76, + "learning_rate": 4.892625529105666e-08, + "loss": 0.0006, + "step": 38953 + }, + { + "epoch": 0.76, + "learning_rate": 4.8922371946720515e-08, + "loss": 0.0006, + "step": 38954 + }, + { + "epoch": 0.76, + "learning_rate": 4.891848860238437e-08, + "loss": 0.0005, + "step": 38955 + }, + { + "epoch": 0.76, + "learning_rate": 4.891460525804823e-08, + "loss": 0.0008, + "step": 38956 + }, + { + "epoch": 0.76, + "learning_rate": 4.891072191371209e-08, + "loss": 0.0573, + "step": 38957 + }, + { + "epoch": 0.76, + "learning_rate": 4.890683856937595e-08, + "loss": 0.0003, + "step": 38958 + }, + { + "epoch": 0.76, + "learning_rate": 4.8902955225039806e-08, + "loss": 0.2521, + "step": 38959 + }, + { + "epoch": 0.76, + "learning_rate": 4.889907188070366e-08, + "loss": 0.2105, + "step": 38960 + }, + { + "epoch": 0.76, + "learning_rate": 4.8895188536367516e-08, + "loss": 0.0037, + "step": 38961 + }, + { + "epoch": 0.76, + "learning_rate": 4.8891305192031374e-08, + "loss": 0.0003, + "step": 38962 + }, + { + "epoch": 0.76, + "learning_rate": 4.888742184769523e-08, + "loss": 0.0004, + "step": 38963 + }, + { + "epoch": 0.76, + "learning_rate": 4.888353850335909e-08, + "loss": 0.0005, + "step": 38964 + }, + { + "epoch": 0.76, + "learning_rate": 4.887965515902295e-08, + "loss": 0.0006, + "step": 38965 + }, + { + "epoch": 0.76, + "learning_rate": 4.887577181468681e-08, + "loss": 0.0018, + "step": 38966 + }, + { + "epoch": 0.76, + "learning_rate": 4.8871888470350666e-08, + "loss": 0.0003, + "step": 38967 + }, + { + "epoch": 0.76, + "learning_rate": 4.8868005126014524e-08, + "loss": 0.0004, + "step": 38968 + }, + { + "epoch": 0.76, + "learning_rate": 4.886412178167838e-08, + "loss": 0.0004, + "step": 38969 + }, + { + "epoch": 0.76, + "learning_rate": 4.886023843734224e-08, + "loss": 0.0005, + "step": 38970 + }, + { + "epoch": 0.76, + "learning_rate": 4.88563550930061e-08, + "loss": 0.0007, + "step": 38971 + }, + { + "epoch": 0.76, + "learning_rate": 4.885247174866996e-08, + "loss": 0.0004, + "step": 38972 + }, + { + "epoch": 0.76, + "learning_rate": 4.8848588404333815e-08, + "loss": 0.0003, + "step": 38973 + }, + { + "epoch": 0.76, + "learning_rate": 4.8844705059997667e-08, + "loss": 0.0004, + "step": 38974 + }, + { + "epoch": 0.76, + "learning_rate": 4.8840821715661525e-08, + "loss": 0.0055, + "step": 38975 + }, + { + "epoch": 0.76, + "learning_rate": 4.883693837132538e-08, + "loss": 0.0004, + "step": 38976 + }, + { + "epoch": 0.76, + "learning_rate": 4.883305502698924e-08, + "loss": 1.043, + "step": 38977 + }, + { + "epoch": 0.76, + "learning_rate": 4.88291716826531e-08, + "loss": 0.0005, + "step": 38978 + }, + { + "epoch": 0.76, + "learning_rate": 4.882528833831696e-08, + "loss": 0.0073, + "step": 38979 + }, + { + "epoch": 0.76, + "learning_rate": 4.8821404993980816e-08, + "loss": 0.5317, + "step": 38980 + }, + { + "epoch": 0.76, + "learning_rate": 4.8817521649644674e-08, + "loss": 0.0005, + "step": 38981 + }, + { + "epoch": 0.76, + "learning_rate": 4.881363830530853e-08, + "loss": 0.0006, + "step": 38982 + }, + { + "epoch": 0.76, + "learning_rate": 4.880975496097239e-08, + "loss": 0.0007, + "step": 38983 + }, + { + "epoch": 0.76, + "learning_rate": 4.880587161663625e-08, + "loss": 0.0006, + "step": 38984 + }, + { + "epoch": 0.76, + "learning_rate": 4.880198827230011e-08, + "loss": 0.0004, + "step": 38985 + }, + { + "epoch": 0.76, + "learning_rate": 4.8798104927963966e-08, + "loss": 1.0264, + "step": 38986 + }, + { + "epoch": 0.76, + "learning_rate": 4.879422158362782e-08, + "loss": 0.0004, + "step": 38987 + }, + { + "epoch": 0.76, + "learning_rate": 4.8790338239291675e-08, + "loss": 0.0035, + "step": 38988 + }, + { + "epoch": 0.76, + "learning_rate": 4.8786454894955534e-08, + "loss": 0.0006, + "step": 38989 + }, + { + "epoch": 0.76, + "learning_rate": 4.878257155061939e-08, + "loss": 0.0004, + "step": 38990 + }, + { + "epoch": 0.76, + "learning_rate": 4.877868820628325e-08, + "loss": 0.0005, + "step": 38991 + }, + { + "epoch": 0.76, + "learning_rate": 4.877480486194711e-08, + "loss": 0.0004, + "step": 38992 + }, + { + "epoch": 0.76, + "learning_rate": 4.8770921517610967e-08, + "loss": 0.0005, + "step": 38993 + }, + { + "epoch": 0.76, + "learning_rate": 4.876703817327482e-08, + "loss": 0.0005, + "step": 38994 + }, + { + "epoch": 0.76, + "learning_rate": 4.8763154828938677e-08, + "loss": 0.0003, + "step": 38995 + }, + { + "epoch": 0.76, + "learning_rate": 4.8759271484602535e-08, + "loss": 0.0005, + "step": 38996 + }, + { + "epoch": 0.76, + "learning_rate": 4.875538814026639e-08, + "loss": 0.0005, + "step": 38997 + }, + { + "epoch": 0.76, + "learning_rate": 4.875150479593025e-08, + "loss": 0.0006, + "step": 38998 + }, + { + "epoch": 0.76, + "learning_rate": 4.874762145159411e-08, + "loss": 0.0003, + "step": 38999 + }, + { + "epoch": 0.76, + "learning_rate": 4.874373810725797e-08, + "loss": 0.0004, + "step": 39000 + }, + { + "epoch": 0.76, + "learning_rate": 4.8739854762921826e-08, + "loss": 0.0004, + "step": 39001 + }, + { + "epoch": 0.76, + "learning_rate": 4.8735971418585684e-08, + "loss": 0.0005, + "step": 39002 + }, + { + "epoch": 0.76, + "learning_rate": 4.8732088074249536e-08, + "loss": 0.0123, + "step": 39003 + }, + { + "epoch": 0.76, + "learning_rate": 4.8728204729913394e-08, + "loss": 0.001, + "step": 39004 + }, + { + "epoch": 0.76, + "learning_rate": 4.872432138557725e-08, + "loss": 0.0006, + "step": 39005 + }, + { + "epoch": 0.76, + "learning_rate": 4.872043804124111e-08, + "loss": 0.0003, + "step": 39006 + }, + { + "epoch": 0.76, + "learning_rate": 4.871655469690497e-08, + "loss": 0.0004, + "step": 39007 + }, + { + "epoch": 0.76, + "learning_rate": 4.871267135256883e-08, + "loss": 0.0006, + "step": 39008 + }, + { + "epoch": 0.76, + "learning_rate": 4.8708788008232685e-08, + "loss": 0.0006, + "step": 39009 + }, + { + "epoch": 0.76, + "learning_rate": 4.8704904663896544e-08, + "loss": 0.0004, + "step": 39010 + }, + { + "epoch": 0.76, + "learning_rate": 4.87010213195604e-08, + "loss": 0.0005, + "step": 39011 + }, + { + "epoch": 0.76, + "learning_rate": 4.869713797522426e-08, + "loss": 0.464, + "step": 39012 + }, + { + "epoch": 0.76, + "learning_rate": 4.869325463088812e-08, + "loss": 0.0003, + "step": 39013 + }, + { + "epoch": 0.76, + "learning_rate": 4.8689371286551977e-08, + "loss": 0.9024, + "step": 39014 + }, + { + "epoch": 0.76, + "learning_rate": 4.8685487942215835e-08, + "loss": 0.0004, + "step": 39015 + }, + { + "epoch": 0.76, + "learning_rate": 4.868160459787969e-08, + "loss": 0.0004, + "step": 39016 + }, + { + "epoch": 0.76, + "learning_rate": 4.867772125354355e-08, + "loss": 0.0005, + "step": 39017 + }, + { + "epoch": 0.76, + "learning_rate": 4.86738379092074e-08, + "loss": 1.2742, + "step": 39018 + }, + { + "epoch": 0.76, + "learning_rate": 4.866995456487126e-08, + "loss": 0.0002, + "step": 39019 + }, + { + "epoch": 0.76, + "learning_rate": 4.866607122053512e-08, + "loss": 0.0004, + "step": 39020 + }, + { + "epoch": 0.76, + "learning_rate": 4.866218787619898e-08, + "loss": 0.0015, + "step": 39021 + }, + { + "epoch": 0.76, + "learning_rate": 4.8658304531862836e-08, + "loss": 0.0004, + "step": 39022 + }, + { + "epoch": 0.76, + "learning_rate": 4.8654421187526694e-08, + "loss": 0.0006, + "step": 39023 + }, + { + "epoch": 0.76, + "learning_rate": 4.865053784319055e-08, + "loss": 0.0003, + "step": 39024 + }, + { + "epoch": 0.76, + "learning_rate": 4.864665449885441e-08, + "loss": 0.2243, + "step": 39025 + }, + { + "epoch": 0.76, + "learning_rate": 4.864277115451827e-08, + "loss": 0.0007, + "step": 39026 + }, + { + "epoch": 0.76, + "learning_rate": 4.863888781018213e-08, + "loss": 0.0005, + "step": 39027 + }, + { + "epoch": 0.76, + "learning_rate": 4.8635004465845985e-08, + "loss": 1.1318, + "step": 39028 + }, + { + "epoch": 0.76, + "learning_rate": 4.8631121121509844e-08, + "loss": 0.0004, + "step": 39029 + }, + { + "epoch": 0.76, + "learning_rate": 4.86272377771737e-08, + "loss": 0.0004, + "step": 39030 + }, + { + "epoch": 0.76, + "learning_rate": 4.862335443283756e-08, + "loss": 0.0005, + "step": 39031 + }, + { + "epoch": 0.76, + "learning_rate": 4.861947108850141e-08, + "loss": 0.0005, + "step": 39032 + }, + { + "epoch": 0.76, + "learning_rate": 4.861558774416527e-08, + "loss": 0.0004, + "step": 39033 + }, + { + "epoch": 0.76, + "learning_rate": 4.861170439982913e-08, + "loss": 0.0005, + "step": 39034 + }, + { + "epoch": 0.76, + "learning_rate": 4.8607821055492986e-08, + "loss": 0.0005, + "step": 39035 + }, + { + "epoch": 0.76, + "learning_rate": 4.8603937711156845e-08, + "loss": 0.0004, + "step": 39036 + }, + { + "epoch": 0.76, + "learning_rate": 4.86000543668207e-08, + "loss": 0.0004, + "step": 39037 + }, + { + "epoch": 0.76, + "learning_rate": 4.859617102248456e-08, + "loss": 0.0009, + "step": 39038 + }, + { + "epoch": 0.76, + "learning_rate": 4.859228767814842e-08, + "loss": 0.0003, + "step": 39039 + }, + { + "epoch": 0.76, + "learning_rate": 4.858840433381228e-08, + "loss": 0.0006, + "step": 39040 + }, + { + "epoch": 0.76, + "learning_rate": 4.8584520989476136e-08, + "loss": 0.0045, + "step": 39041 + }, + { + "epoch": 0.76, + "learning_rate": 4.8580637645139994e-08, + "loss": 0.92, + "step": 39042 + }, + { + "epoch": 0.76, + "learning_rate": 4.857675430080385e-08, + "loss": 0.0004, + "step": 39043 + }, + { + "epoch": 0.76, + "learning_rate": 4.857287095646771e-08, + "loss": 0.3364, + "step": 39044 + }, + { + "epoch": 0.76, + "learning_rate": 4.856898761213157e-08, + "loss": 0.0003, + "step": 39045 + }, + { + "epoch": 0.76, + "learning_rate": 4.856510426779543e-08, + "loss": 0.0043, + "step": 39046 + }, + { + "epoch": 0.76, + "learning_rate": 4.856122092345928e-08, + "loss": 0.0005, + "step": 39047 + }, + { + "epoch": 0.76, + "learning_rate": 4.855733757912314e-08, + "loss": 0.0007, + "step": 39048 + }, + { + "epoch": 0.76, + "learning_rate": 4.8553454234786995e-08, + "loss": 0.0005, + "step": 39049 + }, + { + "epoch": 0.76, + "learning_rate": 4.8549570890450853e-08, + "loss": 0.0004, + "step": 39050 + }, + { + "epoch": 0.76, + "learning_rate": 4.854568754611471e-08, + "loss": 0.0004, + "step": 39051 + }, + { + "epoch": 0.76, + "learning_rate": 4.854180420177857e-08, + "loss": 0.0004, + "step": 39052 + }, + { + "epoch": 0.76, + "learning_rate": 4.853792085744243e-08, + "loss": 0.0005, + "step": 39053 + }, + { + "epoch": 0.76, + "learning_rate": 4.8534037513106286e-08, + "loss": 0.0004, + "step": 39054 + }, + { + "epoch": 0.76, + "learning_rate": 4.8530154168770145e-08, + "loss": 0.0211, + "step": 39055 + }, + { + "epoch": 0.76, + "learning_rate": 4.8526270824434e-08, + "loss": 0.0006, + "step": 39056 + }, + { + "epoch": 0.76, + "learning_rate": 4.852238748009786e-08, + "loss": 0.0005, + "step": 39057 + }, + { + "epoch": 0.76, + "learning_rate": 4.851850413576172e-08, + "loss": 0.002, + "step": 39058 + }, + { + "epoch": 0.76, + "learning_rate": 4.851462079142558e-08, + "loss": 0.0004, + "step": 39059 + }, + { + "epoch": 0.76, + "learning_rate": 4.8510737447089436e-08, + "loss": 0.0003, + "step": 39060 + }, + { + "epoch": 0.76, + "learning_rate": 4.850685410275329e-08, + "loss": 0.0003, + "step": 39061 + }, + { + "epoch": 0.76, + "learning_rate": 4.8502970758417146e-08, + "loss": 0.0005, + "step": 39062 + }, + { + "epoch": 0.76, + "learning_rate": 4.8499087414081004e-08, + "loss": 1.1531, + "step": 39063 + }, + { + "epoch": 0.76, + "learning_rate": 4.849520406974486e-08, + "loss": 0.0004, + "step": 39064 + }, + { + "epoch": 0.76, + "learning_rate": 4.849132072540872e-08, + "loss": 0.0023, + "step": 39065 + }, + { + "epoch": 0.76, + "learning_rate": 4.848743738107258e-08, + "loss": 0.0021, + "step": 39066 + }, + { + "epoch": 0.76, + "learning_rate": 4.848355403673644e-08, + "loss": 0.0007, + "step": 39067 + }, + { + "epoch": 0.76, + "learning_rate": 4.8479670692400295e-08, + "loss": 0.0005, + "step": 39068 + }, + { + "epoch": 0.76, + "learning_rate": 4.8475787348064153e-08, + "loss": 0.0005, + "step": 39069 + }, + { + "epoch": 0.76, + "learning_rate": 4.847190400372801e-08, + "loss": 0.0131, + "step": 39070 + }, + { + "epoch": 0.76, + "learning_rate": 4.846802065939187e-08, + "loss": 0.0005, + "step": 39071 + }, + { + "epoch": 0.76, + "learning_rate": 4.846413731505573e-08, + "loss": 0.0004, + "step": 39072 + }, + { + "epoch": 0.76, + "learning_rate": 4.8460253970719586e-08, + "loss": 0.0005, + "step": 39073 + }, + { + "epoch": 0.76, + "learning_rate": 4.8456370626383445e-08, + "loss": 0.0004, + "step": 39074 + }, + { + "epoch": 0.76, + "learning_rate": 4.8452487282047296e-08, + "loss": 0.0005, + "step": 39075 + }, + { + "epoch": 0.76, + "learning_rate": 4.8448603937711155e-08, + "loss": 0.0006, + "step": 39076 + }, + { + "epoch": 0.76, + "learning_rate": 4.844472059337501e-08, + "loss": 0.0003, + "step": 39077 + }, + { + "epoch": 0.76, + "learning_rate": 4.844083724903887e-08, + "loss": 0.0005, + "step": 39078 + }, + { + "epoch": 0.76, + "learning_rate": 4.843695390470273e-08, + "loss": 0.0007, + "step": 39079 + }, + { + "epoch": 0.76, + "learning_rate": 4.843307056036659e-08, + "loss": 0.0937, + "step": 39080 + }, + { + "epoch": 0.76, + "learning_rate": 4.8429187216030446e-08, + "loss": 0.0008, + "step": 39081 + }, + { + "epoch": 0.76, + "learning_rate": 4.8425303871694304e-08, + "loss": 0.0004, + "step": 39082 + }, + { + "epoch": 0.76, + "learning_rate": 4.8421420527358156e-08, + "loss": 0.0004, + "step": 39083 + }, + { + "epoch": 0.76, + "learning_rate": 4.8417537183022014e-08, + "loss": 0.0003, + "step": 39084 + }, + { + "epoch": 0.76, + "learning_rate": 4.841365383868587e-08, + "loss": 0.7328, + "step": 39085 + }, + { + "epoch": 0.76, + "learning_rate": 4.840977049434973e-08, + "loss": 0.0003, + "step": 39086 + }, + { + "epoch": 0.76, + "learning_rate": 4.840588715001359e-08, + "loss": 0.0911, + "step": 39087 + }, + { + "epoch": 0.76, + "learning_rate": 4.840200380567745e-08, + "loss": 0.0004, + "step": 39088 + }, + { + "epoch": 0.76, + "learning_rate": 4.8398120461341305e-08, + "loss": 0.0005, + "step": 39089 + }, + { + "epoch": 0.76, + "learning_rate": 4.839423711700516e-08, + "loss": 0.0005, + "step": 39090 + }, + { + "epoch": 0.76, + "learning_rate": 4.8390353772669015e-08, + "loss": 0.0026, + "step": 39091 + }, + { + "epoch": 0.76, + "learning_rate": 4.838647042833287e-08, + "loss": 0.0003, + "step": 39092 + }, + { + "epoch": 0.76, + "learning_rate": 4.838258708399673e-08, + "loss": 0.0013, + "step": 39093 + }, + { + "epoch": 0.76, + "learning_rate": 4.837870373966059e-08, + "loss": 0.0006, + "step": 39094 + }, + { + "epoch": 0.76, + "learning_rate": 4.837482039532445e-08, + "loss": 0.0003, + "step": 39095 + }, + { + "epoch": 0.76, + "learning_rate": 4.8370937050988306e-08, + "loss": 0.0006, + "step": 39096 + }, + { + "epoch": 0.76, + "learning_rate": 4.8367053706652164e-08, + "loss": 0.0002, + "step": 39097 + }, + { + "epoch": 0.76, + "learning_rate": 4.836317036231602e-08, + "loss": 0.0005, + "step": 39098 + }, + { + "epoch": 0.76, + "learning_rate": 4.835928701797988e-08, + "loss": 0.0004, + "step": 39099 + }, + { + "epoch": 0.76, + "learning_rate": 4.835540367364374e-08, + "loss": 0.0004, + "step": 39100 + }, + { + "epoch": 0.76, + "learning_rate": 4.83515203293076e-08, + "loss": 0.0003, + "step": 39101 + }, + { + "epoch": 0.76, + "learning_rate": 4.8347636984971456e-08, + "loss": 0.0006, + "step": 39102 + }, + { + "epoch": 0.76, + "learning_rate": 4.8343753640635314e-08, + "loss": 0.0005, + "step": 39103 + }, + { + "epoch": 0.76, + "learning_rate": 4.833987029629917e-08, + "loss": 0.0005, + "step": 39104 + }, + { + "epoch": 0.76, + "learning_rate": 4.8335986951963024e-08, + "loss": 0.0004, + "step": 39105 + }, + { + "epoch": 0.76, + "learning_rate": 4.833210360762688e-08, + "loss": 0.0003, + "step": 39106 + }, + { + "epoch": 0.76, + "learning_rate": 4.832822026329074e-08, + "loss": 0.0005, + "step": 39107 + }, + { + "epoch": 0.76, + "learning_rate": 4.83243369189546e-08, + "loss": 0.0003, + "step": 39108 + }, + { + "epoch": 0.76, + "learning_rate": 4.832045357461846e-08, + "loss": 0.0328, + "step": 39109 + }, + { + "epoch": 0.76, + "learning_rate": 4.8316570230282315e-08, + "loss": 0.0015, + "step": 39110 + }, + { + "epoch": 0.76, + "learning_rate": 4.831268688594617e-08, + "loss": 0.0072, + "step": 39111 + }, + { + "epoch": 0.76, + "learning_rate": 4.830880354161003e-08, + "loss": 0.0005, + "step": 39112 + }, + { + "epoch": 0.76, + "learning_rate": 4.830492019727389e-08, + "loss": 0.1041, + "step": 39113 + }, + { + "epoch": 0.76, + "learning_rate": 4.830103685293775e-08, + "loss": 0.099, + "step": 39114 + }, + { + "epoch": 0.76, + "learning_rate": 4.8297153508601606e-08, + "loss": 0.0004, + "step": 39115 + }, + { + "epoch": 0.76, + "learning_rate": 4.8293270164265465e-08, + "loss": 0.0005, + "step": 39116 + }, + { + "epoch": 0.76, + "learning_rate": 4.828938681992932e-08, + "loss": 0.8478, + "step": 39117 + }, + { + "epoch": 0.76, + "learning_rate": 4.828550347559318e-08, + "loss": 0.0003, + "step": 39118 + }, + { + "epoch": 0.76, + "learning_rate": 4.828162013125703e-08, + "loss": 0.0006, + "step": 39119 + }, + { + "epoch": 0.76, + "learning_rate": 4.827773678692089e-08, + "loss": 0.0005, + "step": 39120 + }, + { + "epoch": 0.76, + "learning_rate": 4.827385344258475e-08, + "loss": 0.0005, + "step": 39121 + }, + { + "epoch": 0.76, + "learning_rate": 4.826997009824861e-08, + "loss": 0.0018, + "step": 39122 + }, + { + "epoch": 0.76, + "learning_rate": 4.8266086753912466e-08, + "loss": 0.0005, + "step": 39123 + }, + { + "epoch": 0.76, + "learning_rate": 4.8262203409576324e-08, + "loss": 0.0004, + "step": 39124 + }, + { + "epoch": 0.76, + "learning_rate": 4.825832006524018e-08, + "loss": 0.0009, + "step": 39125 + }, + { + "epoch": 0.76, + "learning_rate": 4.825443672090404e-08, + "loss": 0.0004, + "step": 39126 + }, + { + "epoch": 0.76, + "learning_rate": 4.82505533765679e-08, + "loss": 0.0004, + "step": 39127 + }, + { + "epoch": 0.76, + "learning_rate": 4.824667003223176e-08, + "loss": 0.0005, + "step": 39128 + }, + { + "epoch": 0.76, + "learning_rate": 4.8242786687895615e-08, + "loss": 0.0005, + "step": 39129 + }, + { + "epoch": 0.76, + "learning_rate": 4.8238903343559473e-08, + "loss": 0.0004, + "step": 39130 + }, + { + "epoch": 0.76, + "learning_rate": 4.823501999922333e-08, + "loss": 0.0005, + "step": 39131 + }, + { + "epoch": 0.76, + "learning_rate": 4.823113665488719e-08, + "loss": 0.5798, + "step": 39132 + }, + { + "epoch": 0.76, + "learning_rate": 4.822725331055105e-08, + "loss": 0.5063, + "step": 39133 + }, + { + "epoch": 0.76, + "learning_rate": 4.82233699662149e-08, + "loss": 0.0004, + "step": 39134 + }, + { + "epoch": 0.76, + "learning_rate": 4.821948662187876e-08, + "loss": 0.0004, + "step": 39135 + }, + { + "epoch": 0.76, + "learning_rate": 4.8215603277542616e-08, + "loss": 0.0005, + "step": 39136 + }, + { + "epoch": 0.76, + "learning_rate": 4.8211719933206474e-08, + "loss": 0.0005, + "step": 39137 + }, + { + "epoch": 0.76, + "learning_rate": 4.820783658887033e-08, + "loss": 0.0005, + "step": 39138 + }, + { + "epoch": 0.76, + "learning_rate": 4.820395324453419e-08, + "loss": 0.0005, + "step": 39139 + }, + { + "epoch": 0.76, + "learning_rate": 4.820006990019805e-08, + "loss": 0.0006, + "step": 39140 + }, + { + "epoch": 0.76, + "learning_rate": 4.819618655586191e-08, + "loss": 0.0005, + "step": 39141 + }, + { + "epoch": 0.76, + "learning_rate": 4.8192303211525766e-08, + "loss": 0.0004, + "step": 39142 + }, + { + "epoch": 0.76, + "learning_rate": 4.8188419867189624e-08, + "loss": 0.0005, + "step": 39143 + }, + { + "epoch": 0.76, + "learning_rate": 4.818453652285348e-08, + "loss": 0.0006, + "step": 39144 + }, + { + "epoch": 0.76, + "learning_rate": 4.818065317851734e-08, + "loss": 0.0005, + "step": 39145 + }, + { + "epoch": 0.76, + "learning_rate": 4.81767698341812e-08, + "loss": 0.0004, + "step": 39146 + }, + { + "epoch": 0.76, + "learning_rate": 4.817288648984506e-08, + "loss": 0.0003, + "step": 39147 + }, + { + "epoch": 0.76, + "learning_rate": 4.816900314550891e-08, + "loss": 0.0005, + "step": 39148 + }, + { + "epoch": 0.76, + "learning_rate": 4.816511980117277e-08, + "loss": 0.0005, + "step": 39149 + }, + { + "epoch": 0.76, + "learning_rate": 4.8161236456836625e-08, + "loss": 0.0012, + "step": 39150 + }, + { + "epoch": 0.76, + "learning_rate": 4.815735311250048e-08, + "loss": 0.0004, + "step": 39151 + }, + { + "epoch": 0.76, + "learning_rate": 4.815346976816434e-08, + "loss": 0.0004, + "step": 39152 + }, + { + "epoch": 0.76, + "learning_rate": 4.81495864238282e-08, + "loss": 0.0005, + "step": 39153 + }, + { + "epoch": 0.76, + "learning_rate": 4.814570307949206e-08, + "loss": 0.0004, + "step": 39154 + }, + { + "epoch": 0.76, + "learning_rate": 4.8141819735155916e-08, + "loss": 0.0032, + "step": 39155 + }, + { + "epoch": 0.76, + "learning_rate": 4.8137936390819774e-08, + "loss": 0.0005, + "step": 39156 + }, + { + "epoch": 0.76, + "learning_rate": 4.813405304648363e-08, + "loss": 0.0005, + "step": 39157 + }, + { + "epoch": 0.76, + "learning_rate": 4.813016970214749e-08, + "loss": 0.0003, + "step": 39158 + }, + { + "epoch": 0.76, + "learning_rate": 4.812628635781135e-08, + "loss": 0.0004, + "step": 39159 + }, + { + "epoch": 0.76, + "learning_rate": 4.812240301347521e-08, + "loss": 0.0003, + "step": 39160 + }, + { + "epoch": 0.76, + "learning_rate": 4.8118519669139066e-08, + "loss": 0.0007, + "step": 39161 + }, + { + "epoch": 0.76, + "learning_rate": 4.8114636324802924e-08, + "loss": 0.0005, + "step": 39162 + }, + { + "epoch": 0.76, + "learning_rate": 4.8110752980466776e-08, + "loss": 0.0028, + "step": 39163 + }, + { + "epoch": 0.76, + "learning_rate": 4.8106869636130634e-08, + "loss": 0.0005, + "step": 39164 + }, + { + "epoch": 0.76, + "learning_rate": 4.810298629179449e-08, + "loss": 0.3555, + "step": 39165 + }, + { + "epoch": 0.76, + "learning_rate": 4.809910294745835e-08, + "loss": 0.0006, + "step": 39166 + }, + { + "epoch": 0.76, + "learning_rate": 4.809521960312221e-08, + "loss": 0.0004, + "step": 39167 + }, + { + "epoch": 0.76, + "learning_rate": 4.809133625878607e-08, + "loss": 0.0006, + "step": 39168 + }, + { + "epoch": 0.76, + "learning_rate": 4.8087452914449925e-08, + "loss": 0.0079, + "step": 39169 + }, + { + "epoch": 0.76, + "learning_rate": 4.808356957011378e-08, + "loss": 0.0005, + "step": 39170 + }, + { + "epoch": 0.76, + "learning_rate": 4.8079686225777635e-08, + "loss": 0.0003, + "step": 39171 + }, + { + "epoch": 0.76, + "learning_rate": 4.807580288144149e-08, + "loss": 0.0004, + "step": 39172 + }, + { + "epoch": 0.76, + "learning_rate": 4.807191953710535e-08, + "loss": 0.0005, + "step": 39173 + }, + { + "epoch": 0.76, + "learning_rate": 4.806803619276921e-08, + "loss": 0.0004, + "step": 39174 + }, + { + "epoch": 0.76, + "learning_rate": 4.806415284843307e-08, + "loss": 0.0004, + "step": 39175 + }, + { + "epoch": 0.76, + "learning_rate": 4.8060269504096926e-08, + "loss": 0.0005, + "step": 39176 + }, + { + "epoch": 0.76, + "learning_rate": 4.8056386159760784e-08, + "loss": 0.0005, + "step": 39177 + }, + { + "epoch": 0.76, + "learning_rate": 4.8052502815424636e-08, + "loss": 0.0005, + "step": 39178 + }, + { + "epoch": 0.76, + "learning_rate": 4.8048619471088494e-08, + "loss": 0.0003, + "step": 39179 + }, + { + "epoch": 0.76, + "learning_rate": 4.804473612675235e-08, + "loss": 0.0003, + "step": 39180 + }, + { + "epoch": 0.76, + "learning_rate": 4.804085278241621e-08, + "loss": 0.0008, + "step": 39181 + }, + { + "epoch": 0.76, + "learning_rate": 4.803696943808007e-08, + "loss": 0.0003, + "step": 39182 + }, + { + "epoch": 0.76, + "learning_rate": 4.803308609374393e-08, + "loss": 0.1917, + "step": 39183 + }, + { + "epoch": 0.76, + "learning_rate": 4.8029202749407785e-08, + "loss": 0.0003, + "step": 39184 + }, + { + "epoch": 0.76, + "learning_rate": 4.8025319405071644e-08, + "loss": 0.0004, + "step": 39185 + }, + { + "epoch": 0.76, + "learning_rate": 4.80214360607355e-08, + "loss": 0.0619, + "step": 39186 + }, + { + "epoch": 0.76, + "learning_rate": 4.801755271639936e-08, + "loss": 0.4385, + "step": 39187 + }, + { + "epoch": 0.76, + "learning_rate": 4.801366937206322e-08, + "loss": 0.2152, + "step": 39188 + }, + { + "epoch": 0.76, + "learning_rate": 4.8009786027727077e-08, + "loss": 0.0006, + "step": 39189 + }, + { + "epoch": 0.76, + "learning_rate": 4.8005902683390935e-08, + "loss": 0.0004, + "step": 39190 + }, + { + "epoch": 0.76, + "learning_rate": 4.800201933905479e-08, + "loss": 0.0003, + "step": 39191 + }, + { + "epoch": 0.76, + "learning_rate": 4.7998135994718645e-08, + "loss": 0.0004, + "step": 39192 + }, + { + "epoch": 0.76, + "learning_rate": 4.79942526503825e-08, + "loss": 0.0003, + "step": 39193 + }, + { + "epoch": 0.76, + "learning_rate": 4.799036930604636e-08, + "loss": 0.0042, + "step": 39194 + }, + { + "epoch": 0.76, + "learning_rate": 4.798648596171022e-08, + "loss": 0.2721, + "step": 39195 + }, + { + "epoch": 0.76, + "learning_rate": 4.798260261737408e-08, + "loss": 0.0019, + "step": 39196 + }, + { + "epoch": 0.76, + "learning_rate": 4.7978719273037936e-08, + "loss": 0.0007, + "step": 39197 + }, + { + "epoch": 0.76, + "learning_rate": 4.7974835928701794e-08, + "loss": 0.0004, + "step": 39198 + }, + { + "epoch": 0.76, + "learning_rate": 4.797095258436565e-08, + "loss": 0.0004, + "step": 39199 + }, + { + "epoch": 0.76, + "learning_rate": 4.796706924002951e-08, + "loss": 0.0004, + "step": 39200 + }, + { + "epoch": 0.76, + "learning_rate": 4.796318589569337e-08, + "loss": 0.0003, + "step": 39201 + }, + { + "epoch": 0.76, + "learning_rate": 4.795930255135723e-08, + "loss": 0.0005, + "step": 39202 + }, + { + "epoch": 0.76, + "learning_rate": 4.7955419207021085e-08, + "loss": 0.0003, + "step": 39203 + }, + { + "epoch": 0.76, + "learning_rate": 4.7951535862684944e-08, + "loss": 0.0005, + "step": 39204 + }, + { + "epoch": 0.76, + "learning_rate": 4.79476525183488e-08, + "loss": 0.0005, + "step": 39205 + }, + { + "epoch": 0.76, + "learning_rate": 4.7943769174012654e-08, + "loss": 0.0004, + "step": 39206 + }, + { + "epoch": 0.76, + "learning_rate": 4.793988582967651e-08, + "loss": 0.3805, + "step": 39207 + }, + { + "epoch": 0.76, + "learning_rate": 4.793600248534037e-08, + "loss": 0.0004, + "step": 39208 + }, + { + "epoch": 0.76, + "learning_rate": 4.793211914100423e-08, + "loss": 0.0003, + "step": 39209 + }, + { + "epoch": 0.76, + "learning_rate": 4.7928235796668087e-08, + "loss": 0.0004, + "step": 39210 + }, + { + "epoch": 0.76, + "learning_rate": 4.7924352452331945e-08, + "loss": 0.0015, + "step": 39211 + }, + { + "epoch": 0.76, + "learning_rate": 4.79204691079958e-08, + "loss": 0.0005, + "step": 39212 + }, + { + "epoch": 0.76, + "learning_rate": 4.791658576365966e-08, + "loss": 0.0006, + "step": 39213 + }, + { + "epoch": 0.76, + "learning_rate": 4.791270241932352e-08, + "loss": 0.0004, + "step": 39214 + }, + { + "epoch": 0.76, + "learning_rate": 4.790881907498738e-08, + "loss": 0.0003, + "step": 39215 + }, + { + "epoch": 0.76, + "learning_rate": 4.7904935730651236e-08, + "loss": 0.0012, + "step": 39216 + }, + { + "epoch": 0.76, + "learning_rate": 4.7901052386315094e-08, + "loss": 0.0006, + "step": 39217 + }, + { + "epoch": 0.76, + "learning_rate": 4.789716904197895e-08, + "loss": 0.0004, + "step": 39218 + }, + { + "epoch": 0.76, + "learning_rate": 4.789328569764281e-08, + "loss": 0.0004, + "step": 39219 + }, + { + "epoch": 0.76, + "learning_rate": 4.788940235330667e-08, + "loss": 0.0005, + "step": 39220 + }, + { + "epoch": 0.76, + "learning_rate": 4.788551900897052e-08, + "loss": 0.0005, + "step": 39221 + }, + { + "epoch": 0.76, + "learning_rate": 4.788163566463438e-08, + "loss": 0.3061, + "step": 39222 + }, + { + "epoch": 0.76, + "learning_rate": 4.787775232029824e-08, + "loss": 0.0004, + "step": 39223 + }, + { + "epoch": 0.76, + "learning_rate": 4.7873868975962095e-08, + "loss": 0.0004, + "step": 39224 + }, + { + "epoch": 0.76, + "learning_rate": 4.7869985631625954e-08, + "loss": 0.001, + "step": 39225 + }, + { + "epoch": 0.76, + "learning_rate": 4.786610228728981e-08, + "loss": 0.0003, + "step": 39226 + }, + { + "epoch": 0.76, + "learning_rate": 4.786221894295367e-08, + "loss": 0.0026, + "step": 39227 + }, + { + "epoch": 0.76, + "learning_rate": 4.785833559861753e-08, + "loss": 0.0003, + "step": 39228 + }, + { + "epoch": 0.76, + "learning_rate": 4.7854452254281387e-08, + "loss": 0.0004, + "step": 39229 + }, + { + "epoch": 0.76, + "learning_rate": 4.7850568909945245e-08, + "loss": 0.0006, + "step": 39230 + }, + { + "epoch": 0.76, + "learning_rate": 4.78466855656091e-08, + "loss": 0.0006, + "step": 39231 + }, + { + "epoch": 0.76, + "learning_rate": 4.784280222127296e-08, + "loss": 0.0004, + "step": 39232 + }, + { + "epoch": 0.76, + "learning_rate": 4.783891887693682e-08, + "loss": 0.0005, + "step": 39233 + }, + { + "epoch": 0.76, + "learning_rate": 4.783503553260068e-08, + "loss": 0.0005, + "step": 39234 + }, + { + "epoch": 0.76, + "learning_rate": 4.783115218826453e-08, + "loss": 0.0003, + "step": 39235 + }, + { + "epoch": 0.76, + "learning_rate": 4.782726884392839e-08, + "loss": 0.0004, + "step": 39236 + }, + { + "epoch": 0.76, + "learning_rate": 4.7823385499592246e-08, + "loss": 0.0005, + "step": 39237 + }, + { + "epoch": 0.76, + "learning_rate": 4.7819502155256104e-08, + "loss": 0.0004, + "step": 39238 + }, + { + "epoch": 0.76, + "learning_rate": 4.781561881091996e-08, + "loss": 0.0005, + "step": 39239 + }, + { + "epoch": 0.76, + "learning_rate": 4.781173546658382e-08, + "loss": 0.0004, + "step": 39240 + }, + { + "epoch": 0.76, + "learning_rate": 4.780785212224768e-08, + "loss": 0.0003, + "step": 39241 + }, + { + "epoch": 0.76, + "learning_rate": 4.780396877791154e-08, + "loss": 0.0004, + "step": 39242 + }, + { + "epoch": 0.76, + "learning_rate": 4.7800085433575395e-08, + "loss": 0.0006, + "step": 39243 + }, + { + "epoch": 0.76, + "learning_rate": 4.7796202089239254e-08, + "loss": 0.0257, + "step": 39244 + }, + { + "epoch": 0.76, + "learning_rate": 4.779231874490311e-08, + "loss": 0.0004, + "step": 39245 + }, + { + "epoch": 0.76, + "learning_rate": 4.778843540056697e-08, + "loss": 0.0005, + "step": 39246 + }, + { + "epoch": 0.76, + "learning_rate": 4.778455205623083e-08, + "loss": 0.0005, + "step": 39247 + }, + { + "epoch": 0.76, + "learning_rate": 4.7780668711894687e-08, + "loss": 0.01, + "step": 39248 + }, + { + "epoch": 0.76, + "learning_rate": 4.7776785367558545e-08, + "loss": 0.0006, + "step": 39249 + }, + { + "epoch": 0.76, + "learning_rate": 4.7772902023222396e-08, + "loss": 0.0004, + "step": 39250 + }, + { + "epoch": 0.76, + "learning_rate": 4.7769018678886255e-08, + "loss": 0.0006, + "step": 39251 + }, + { + "epoch": 0.76, + "learning_rate": 4.776513533455011e-08, + "loss": 0.0005, + "step": 39252 + }, + { + "epoch": 0.76, + "learning_rate": 4.776125199021397e-08, + "loss": 0.0003, + "step": 39253 + }, + { + "epoch": 0.76, + "learning_rate": 4.775736864587783e-08, + "loss": 0.0189, + "step": 39254 + }, + { + "epoch": 0.76, + "learning_rate": 4.775348530154169e-08, + "loss": 1.427, + "step": 39255 + }, + { + "epoch": 0.76, + "learning_rate": 4.7749601957205546e-08, + "loss": 0.0004, + "step": 39256 + }, + { + "epoch": 0.76, + "learning_rate": 4.7745718612869404e-08, + "loss": 0.0003, + "step": 39257 + }, + { + "epoch": 0.76, + "learning_rate": 4.774183526853326e-08, + "loss": 0.0007, + "step": 39258 + }, + { + "epoch": 0.76, + "learning_rate": 4.773795192419712e-08, + "loss": 0.0005, + "step": 39259 + }, + { + "epoch": 0.76, + "learning_rate": 4.773406857986097e-08, + "loss": 0.0005, + "step": 39260 + }, + { + "epoch": 0.76, + "learning_rate": 4.773018523552483e-08, + "loss": 0.0004, + "step": 39261 + }, + { + "epoch": 0.76, + "learning_rate": 4.772630189118869e-08, + "loss": 0.0005, + "step": 39262 + }, + { + "epoch": 0.76, + "learning_rate": 4.772241854685255e-08, + "loss": 0.0004, + "step": 39263 + }, + { + "epoch": 0.76, + "learning_rate": 4.7718535202516405e-08, + "loss": 0.0006, + "step": 39264 + }, + { + "epoch": 0.76, + "learning_rate": 4.7714651858180264e-08, + "loss": 0.0005, + "step": 39265 + }, + { + "epoch": 0.76, + "learning_rate": 4.771076851384412e-08, + "loss": 0.0004, + "step": 39266 + }, + { + "epoch": 0.76, + "learning_rate": 4.7706885169507973e-08, + "loss": 0.0011, + "step": 39267 + }, + { + "epoch": 0.76, + "learning_rate": 4.770300182517183e-08, + "loss": 0.0004, + "step": 39268 + }, + { + "epoch": 0.76, + "learning_rate": 4.769911848083569e-08, + "loss": 0.0004, + "step": 39269 + }, + { + "epoch": 0.76, + "learning_rate": 4.769523513649955e-08, + "loss": 0.0003, + "step": 39270 + }, + { + "epoch": 0.76, + "learning_rate": 4.7691351792163406e-08, + "loss": 0.3432, + "step": 39271 + }, + { + "epoch": 0.76, + "learning_rate": 4.7687468447827265e-08, + "loss": 0.0005, + "step": 39272 + }, + { + "epoch": 0.76, + "learning_rate": 4.768358510349112e-08, + "loss": 0.0004, + "step": 39273 + }, + { + "epoch": 0.76, + "learning_rate": 4.767970175915498e-08, + "loss": 0.0005, + "step": 39274 + }, + { + "epoch": 0.76, + "learning_rate": 4.767581841481884e-08, + "loss": 0.0004, + "step": 39275 + }, + { + "epoch": 0.76, + "learning_rate": 4.76719350704827e-08, + "loss": 0.0005, + "step": 39276 + }, + { + "epoch": 0.76, + "learning_rate": 4.7668051726146556e-08, + "loss": 0.0005, + "step": 39277 + }, + { + "epoch": 0.76, + "learning_rate": 4.7664168381810414e-08, + "loss": 0.8678, + "step": 39278 + }, + { + "epoch": 0.76, + "learning_rate": 4.7660285037474266e-08, + "loss": 0.0004, + "step": 39279 + }, + { + "epoch": 0.76, + "learning_rate": 4.7656401693138124e-08, + "loss": 0.0003, + "step": 39280 + }, + { + "epoch": 0.76, + "learning_rate": 4.765251834880198e-08, + "loss": 0.0005, + "step": 39281 + }, + { + "epoch": 0.76, + "learning_rate": 4.764863500446584e-08, + "loss": 0.0004, + "step": 39282 + }, + { + "epoch": 0.76, + "learning_rate": 4.76447516601297e-08, + "loss": 0.0082, + "step": 39283 + }, + { + "epoch": 0.76, + "learning_rate": 4.764086831579356e-08, + "loss": 0.0004, + "step": 39284 + }, + { + "epoch": 0.76, + "learning_rate": 4.7636984971457415e-08, + "loss": 0.001, + "step": 39285 + }, + { + "epoch": 0.76, + "learning_rate": 4.7633101627121273e-08, + "loss": 0.0008, + "step": 39286 + }, + { + "epoch": 0.76, + "learning_rate": 4.762921828278513e-08, + "loss": 0.0007, + "step": 39287 + }, + { + "epoch": 0.76, + "learning_rate": 4.762533493844899e-08, + "loss": 0.0008, + "step": 39288 + }, + { + "epoch": 0.76, + "learning_rate": 4.762145159411285e-08, + "loss": 0.0013, + "step": 39289 + }, + { + "epoch": 0.76, + "learning_rate": 4.7617568249776706e-08, + "loss": 0.6726, + "step": 39290 + }, + { + "epoch": 0.76, + "learning_rate": 4.7613684905440565e-08, + "loss": 0.0004, + "step": 39291 + }, + { + "epoch": 0.76, + "learning_rate": 4.760980156110442e-08, + "loss": 0.0011, + "step": 39292 + }, + { + "epoch": 0.76, + "learning_rate": 4.7605918216768274e-08, + "loss": 0.0004, + "step": 39293 + }, + { + "epoch": 0.76, + "learning_rate": 4.760203487243213e-08, + "loss": 0.0005, + "step": 39294 + }, + { + "epoch": 0.76, + "learning_rate": 4.759815152809599e-08, + "loss": 0.0005, + "step": 39295 + }, + { + "epoch": 0.76, + "learning_rate": 4.759426818375985e-08, + "loss": 0.0003, + "step": 39296 + }, + { + "epoch": 0.76, + "learning_rate": 4.759038483942371e-08, + "loss": 0.0005, + "step": 39297 + }, + { + "epoch": 0.76, + "learning_rate": 4.7586501495087566e-08, + "loss": 0.0006, + "step": 39298 + }, + { + "epoch": 0.76, + "learning_rate": 4.7582618150751424e-08, + "loss": 0.8946, + "step": 39299 + }, + { + "epoch": 0.76, + "learning_rate": 4.757873480641528e-08, + "loss": 0.0004, + "step": 39300 + }, + { + "epoch": 0.76, + "learning_rate": 4.757485146207914e-08, + "loss": 0.6095, + "step": 39301 + }, + { + "epoch": 0.76, + "learning_rate": 4.7570968117743e-08, + "loss": 0.0005, + "step": 39302 + }, + { + "epoch": 0.76, + "learning_rate": 4.756708477340686e-08, + "loss": 0.0031, + "step": 39303 + }, + { + "epoch": 0.76, + "learning_rate": 4.7563201429070715e-08, + "loss": 0.0004, + "step": 39304 + }, + { + "epoch": 0.76, + "learning_rate": 4.7559318084734573e-08, + "loss": 0.0004, + "step": 39305 + }, + { + "epoch": 0.76, + "learning_rate": 4.755543474039843e-08, + "loss": 0.0094, + "step": 39306 + }, + { + "epoch": 0.76, + "learning_rate": 4.755155139606229e-08, + "loss": 0.0005, + "step": 39307 + }, + { + "epoch": 0.76, + "learning_rate": 4.754766805172614e-08, + "loss": 0.0004, + "step": 39308 + }, + { + "epoch": 0.76, + "learning_rate": 4.754378470739e-08, + "loss": 0.0004, + "step": 39309 + }, + { + "epoch": 0.76, + "learning_rate": 4.753990136305386e-08, + "loss": 0.0006, + "step": 39310 + }, + { + "epoch": 0.76, + "learning_rate": 4.7536018018717716e-08, + "loss": 0.0703, + "step": 39311 + }, + { + "epoch": 0.76, + "learning_rate": 4.7532134674381575e-08, + "loss": 0.9479, + "step": 39312 + }, + { + "epoch": 0.76, + "learning_rate": 4.752825133004543e-08, + "loss": 0.0006, + "step": 39313 + }, + { + "epoch": 0.76, + "learning_rate": 4.752436798570929e-08, + "loss": 0.0004, + "step": 39314 + }, + { + "epoch": 0.76, + "learning_rate": 4.752048464137315e-08, + "loss": 0.0012, + "step": 39315 + }, + { + "epoch": 0.76, + "learning_rate": 4.751660129703701e-08, + "loss": 0.7468, + "step": 39316 + }, + { + "epoch": 0.76, + "learning_rate": 4.7512717952700866e-08, + "loss": 0.0004, + "step": 39317 + }, + { + "epoch": 0.76, + "learning_rate": 4.7508834608364724e-08, + "loss": 0.1371, + "step": 39318 + }, + { + "epoch": 0.76, + "learning_rate": 4.750495126402858e-08, + "loss": 0.0003, + "step": 39319 + }, + { + "epoch": 0.76, + "learning_rate": 4.750106791969244e-08, + "loss": 0.0004, + "step": 39320 + }, + { + "epoch": 0.76, + "learning_rate": 4.74971845753563e-08, + "loss": 0.0004, + "step": 39321 + }, + { + "epoch": 0.76, + "learning_rate": 4.749330123102015e-08, + "loss": 0.0006, + "step": 39322 + }, + { + "epoch": 0.76, + "learning_rate": 4.748941788668401e-08, + "loss": 0.0004, + "step": 39323 + }, + { + "epoch": 0.76, + "learning_rate": 4.748553454234787e-08, + "loss": 0.0007, + "step": 39324 + }, + { + "epoch": 0.76, + "learning_rate": 4.7481651198011725e-08, + "loss": 0.3435, + "step": 39325 + }, + { + "epoch": 0.76, + "learning_rate": 4.7477767853675583e-08, + "loss": 1.1607, + "step": 39326 + }, + { + "epoch": 0.76, + "learning_rate": 4.747388450933944e-08, + "loss": 0.0005, + "step": 39327 + }, + { + "epoch": 0.76, + "learning_rate": 4.74700011650033e-08, + "loss": 0.0004, + "step": 39328 + }, + { + "epoch": 0.76, + "learning_rate": 4.746611782066716e-08, + "loss": 0.0004, + "step": 39329 + }, + { + "epoch": 0.76, + "learning_rate": 4.7462234476331016e-08, + "loss": 0.0003, + "step": 39330 + }, + { + "epoch": 0.76, + "learning_rate": 4.7458351131994875e-08, + "loss": 0.0009, + "step": 39331 + }, + { + "epoch": 0.76, + "learning_rate": 4.745446778765873e-08, + "loss": 0.0004, + "step": 39332 + }, + { + "epoch": 0.76, + "learning_rate": 4.745058444332259e-08, + "loss": 0.0004, + "step": 39333 + }, + { + "epoch": 0.76, + "learning_rate": 4.744670109898645e-08, + "loss": 0.0006, + "step": 39334 + }, + { + "epoch": 0.76, + "learning_rate": 4.744281775465031e-08, + "loss": 0.0005, + "step": 39335 + }, + { + "epoch": 0.76, + "learning_rate": 4.7438934410314166e-08, + "loss": 0.0007, + "step": 39336 + }, + { + "epoch": 0.76, + "learning_rate": 4.743505106597802e-08, + "loss": 0.0005, + "step": 39337 + }, + { + "epoch": 0.76, + "learning_rate": 4.7431167721641876e-08, + "loss": 0.0006, + "step": 39338 + }, + { + "epoch": 0.76, + "learning_rate": 4.7427284377305734e-08, + "loss": 0.0007, + "step": 39339 + }, + { + "epoch": 0.76, + "learning_rate": 4.742340103296959e-08, + "loss": 0.0005, + "step": 39340 + }, + { + "epoch": 0.76, + "learning_rate": 4.741951768863345e-08, + "loss": 0.0005, + "step": 39341 + }, + { + "epoch": 0.76, + "learning_rate": 4.741563434429731e-08, + "loss": 0.0004, + "step": 39342 + }, + { + "epoch": 0.76, + "learning_rate": 4.741175099996117e-08, + "loss": 0.5949, + "step": 39343 + }, + { + "epoch": 0.76, + "learning_rate": 4.7407867655625025e-08, + "loss": 0.0003, + "step": 39344 + }, + { + "epoch": 0.76, + "learning_rate": 4.7403984311288883e-08, + "loss": 0.5965, + "step": 39345 + }, + { + "epoch": 0.76, + "learning_rate": 4.740010096695274e-08, + "loss": 0.0003, + "step": 39346 + }, + { + "epoch": 0.76, + "learning_rate": 4.73962176226166e-08, + "loss": 0.0003, + "step": 39347 + }, + { + "epoch": 0.76, + "learning_rate": 4.739233427828045e-08, + "loss": 0.0005, + "step": 39348 + }, + { + "epoch": 0.76, + "learning_rate": 4.738845093394431e-08, + "loss": 0.0006, + "step": 39349 + }, + { + "epoch": 0.76, + "learning_rate": 4.738456758960817e-08, + "loss": 0.0003, + "step": 39350 + }, + { + "epoch": 0.76, + "learning_rate": 4.7380684245272026e-08, + "loss": 0.0003, + "step": 39351 + }, + { + "epoch": 0.76, + "learning_rate": 4.7376800900935884e-08, + "loss": 0.0003, + "step": 39352 + }, + { + "epoch": 0.76, + "learning_rate": 4.737291755659974e-08, + "loss": 0.0093, + "step": 39353 + }, + { + "epoch": 0.76, + "learning_rate": 4.73690342122636e-08, + "loss": 0.0008, + "step": 39354 + }, + { + "epoch": 0.76, + "learning_rate": 4.736515086792745e-08, + "loss": 0.8929, + "step": 39355 + }, + { + "epoch": 0.76, + "learning_rate": 4.736126752359131e-08, + "loss": 0.0015, + "step": 39356 + }, + { + "epoch": 0.76, + "learning_rate": 4.735738417925517e-08, + "loss": 0.0005, + "step": 39357 + }, + { + "epoch": 0.76, + "learning_rate": 4.735350083491903e-08, + "loss": 0.0005, + "step": 39358 + }, + { + "epoch": 0.76, + "learning_rate": 4.7349617490582886e-08, + "loss": 0.0008, + "step": 39359 + }, + { + "epoch": 0.76, + "learning_rate": 4.7345734146246744e-08, + "loss": 0.0016, + "step": 39360 + }, + { + "epoch": 0.76, + "learning_rate": 4.73418508019106e-08, + "loss": 0.0024, + "step": 39361 + }, + { + "epoch": 0.76, + "learning_rate": 4.733796745757446e-08, + "loss": 0.0004, + "step": 39362 + }, + { + "epoch": 0.76, + "learning_rate": 4.733408411323832e-08, + "loss": 0.0004, + "step": 39363 + }, + { + "epoch": 0.76, + "learning_rate": 4.733020076890218e-08, + "loss": 0.0005, + "step": 39364 + }, + { + "epoch": 0.76, + "learning_rate": 4.7326317424566035e-08, + "loss": 0.0003, + "step": 39365 + }, + { + "epoch": 0.76, + "learning_rate": 4.7322434080229887e-08, + "loss": 0.0004, + "step": 39366 + }, + { + "epoch": 0.76, + "learning_rate": 4.7318550735893745e-08, + "loss": 0.0003, + "step": 39367 + }, + { + "epoch": 0.76, + "learning_rate": 4.73146673915576e-08, + "loss": 0.0005, + "step": 39368 + }, + { + "epoch": 0.76, + "learning_rate": 4.731078404722146e-08, + "loss": 0.9653, + "step": 39369 + }, + { + "epoch": 0.76, + "learning_rate": 4.730690070288532e-08, + "loss": 0.0003, + "step": 39370 + }, + { + "epoch": 0.76, + "learning_rate": 4.730301735854918e-08, + "loss": 0.0003, + "step": 39371 + }, + { + "epoch": 0.76, + "learning_rate": 4.7299134014213036e-08, + "loss": 0.0003, + "step": 39372 + }, + { + "epoch": 0.76, + "learning_rate": 4.7295250669876894e-08, + "loss": 0.0004, + "step": 39373 + }, + { + "epoch": 0.76, + "learning_rate": 4.729136732554075e-08, + "loss": 0.0004, + "step": 39374 + }, + { + "epoch": 0.76, + "learning_rate": 4.728748398120461e-08, + "loss": 0.0004, + "step": 39375 + }, + { + "epoch": 0.76, + "learning_rate": 4.728360063686847e-08, + "loss": 0.0008, + "step": 39376 + }, + { + "epoch": 0.76, + "learning_rate": 4.727971729253233e-08, + "loss": 0.0868, + "step": 39377 + }, + { + "epoch": 0.76, + "learning_rate": 4.7275833948196186e-08, + "loss": 0.0002, + "step": 39378 + }, + { + "epoch": 0.76, + "learning_rate": 4.7271950603860044e-08, + "loss": 0.0005, + "step": 39379 + }, + { + "epoch": 0.76, + "learning_rate": 4.7268067259523895e-08, + "loss": 0.0005, + "step": 39380 + }, + { + "epoch": 0.76, + "learning_rate": 4.7264183915187754e-08, + "loss": 0.0006, + "step": 39381 + }, + { + "epoch": 0.76, + "learning_rate": 4.726030057085161e-08, + "loss": 0.0003, + "step": 39382 + }, + { + "epoch": 0.76, + "learning_rate": 4.725641722651547e-08, + "loss": 0.0005, + "step": 39383 + }, + { + "epoch": 0.76, + "learning_rate": 4.725253388217933e-08, + "loss": 0.0005, + "step": 39384 + }, + { + "epoch": 0.76, + "learning_rate": 4.7248650537843187e-08, + "loss": 0.0003, + "step": 39385 + }, + { + "epoch": 0.76, + "learning_rate": 4.7244767193507045e-08, + "loss": 0.0007, + "step": 39386 + }, + { + "epoch": 0.76, + "learning_rate": 4.72408838491709e-08, + "loss": 0.0004, + "step": 39387 + }, + { + "epoch": 0.76, + "learning_rate": 4.723700050483476e-08, + "loss": 0.0005, + "step": 39388 + }, + { + "epoch": 0.76, + "learning_rate": 4.723311716049862e-08, + "loss": 0.014, + "step": 39389 + }, + { + "epoch": 0.76, + "learning_rate": 4.722923381616248e-08, + "loss": 0.0006, + "step": 39390 + }, + { + "epoch": 0.76, + "learning_rate": 4.7225350471826336e-08, + "loss": 0.3913, + "step": 39391 + }, + { + "epoch": 0.76, + "learning_rate": 4.7221467127490194e-08, + "loss": 0.0004, + "step": 39392 + }, + { + "epoch": 0.76, + "learning_rate": 4.721758378315405e-08, + "loss": 0.0004, + "step": 39393 + }, + { + "epoch": 0.76, + "learning_rate": 4.721370043881791e-08, + "loss": 0.0003, + "step": 39394 + }, + { + "epoch": 0.76, + "learning_rate": 4.720981709448176e-08, + "loss": 0.0004, + "step": 39395 + }, + { + "epoch": 0.76, + "learning_rate": 4.720593375014562e-08, + "loss": 0.0004, + "step": 39396 + }, + { + "epoch": 0.76, + "learning_rate": 4.720205040580948e-08, + "loss": 0.0004, + "step": 39397 + }, + { + "epoch": 0.76, + "learning_rate": 4.719816706147334e-08, + "loss": 0.0003, + "step": 39398 + }, + { + "epoch": 0.76, + "learning_rate": 4.7194283717137195e-08, + "loss": 0.0004, + "step": 39399 + }, + { + "epoch": 0.76, + "learning_rate": 4.7190400372801054e-08, + "loss": 0.0004, + "step": 39400 + }, + { + "epoch": 0.76, + "learning_rate": 4.718651702846491e-08, + "loss": 0.0003, + "step": 39401 + }, + { + "epoch": 0.76, + "learning_rate": 4.718263368412877e-08, + "loss": 0.0004, + "step": 39402 + }, + { + "epoch": 0.76, + "learning_rate": 4.717875033979263e-08, + "loss": 0.0003, + "step": 39403 + }, + { + "epoch": 0.76, + "learning_rate": 4.7174866995456487e-08, + "loss": 0.0003, + "step": 39404 + }, + { + "epoch": 0.76, + "learning_rate": 4.7170983651120345e-08, + "loss": 0.0013, + "step": 39405 + }, + { + "epoch": 0.76, + "learning_rate": 4.71671003067842e-08, + "loss": 0.6296, + "step": 39406 + }, + { + "epoch": 0.76, + "learning_rate": 4.716321696244806e-08, + "loss": 0.0003, + "step": 39407 + }, + { + "epoch": 0.76, + "learning_rate": 4.715933361811192e-08, + "loss": 0.0005, + "step": 39408 + }, + { + "epoch": 0.76, + "learning_rate": 4.715545027377577e-08, + "loss": 0.0003, + "step": 39409 + }, + { + "epoch": 0.76, + "learning_rate": 4.715156692943963e-08, + "loss": 1.2937, + "step": 39410 + }, + { + "epoch": 0.76, + "learning_rate": 4.714768358510349e-08, + "loss": 0.0006, + "step": 39411 + }, + { + "epoch": 0.76, + "learning_rate": 4.7143800240767346e-08, + "loss": 0.0004, + "step": 39412 + }, + { + "epoch": 0.76, + "learning_rate": 4.7139916896431204e-08, + "loss": 0.0005, + "step": 39413 + }, + { + "epoch": 0.76, + "learning_rate": 4.713603355209506e-08, + "loss": 0.0003, + "step": 39414 + }, + { + "epoch": 0.76, + "learning_rate": 4.713215020775892e-08, + "loss": 0.0448, + "step": 39415 + }, + { + "epoch": 0.76, + "learning_rate": 4.712826686342278e-08, + "loss": 0.0003, + "step": 39416 + }, + { + "epoch": 0.76, + "learning_rate": 4.712438351908664e-08, + "loss": 0.3568, + "step": 39417 + }, + { + "epoch": 0.76, + "learning_rate": 4.7120500174750495e-08, + "loss": 0.0005, + "step": 39418 + }, + { + "epoch": 0.76, + "learning_rate": 4.7116616830414354e-08, + "loss": 0.0003, + "step": 39419 + }, + { + "epoch": 0.76, + "learning_rate": 4.711273348607821e-08, + "loss": 0.0006, + "step": 39420 + }, + { + "epoch": 0.76, + "learning_rate": 4.710885014174207e-08, + "loss": 0.0004, + "step": 39421 + }, + { + "epoch": 0.76, + "learning_rate": 4.710496679740593e-08, + "loss": 0.0004, + "step": 39422 + }, + { + "epoch": 0.76, + "learning_rate": 4.710108345306979e-08, + "loss": 1.1926, + "step": 39423 + }, + { + "epoch": 0.76, + "learning_rate": 4.709720010873364e-08, + "loss": 0.0006, + "step": 39424 + }, + { + "epoch": 0.76, + "learning_rate": 4.7093316764397497e-08, + "loss": 0.0005, + "step": 39425 + }, + { + "epoch": 0.76, + "learning_rate": 4.7089433420061355e-08, + "loss": 0.0005, + "step": 39426 + }, + { + "epoch": 0.76, + "learning_rate": 4.708555007572521e-08, + "loss": 0.0003, + "step": 39427 + }, + { + "epoch": 0.76, + "learning_rate": 4.708166673138907e-08, + "loss": 0.334, + "step": 39428 + }, + { + "epoch": 0.76, + "learning_rate": 4.707778338705293e-08, + "loss": 0.0006, + "step": 39429 + }, + { + "epoch": 0.76, + "learning_rate": 4.707390004271679e-08, + "loss": 0.0003, + "step": 39430 + }, + { + "epoch": 0.76, + "learning_rate": 4.7070016698380646e-08, + "loss": 0.0003, + "step": 39431 + }, + { + "epoch": 0.76, + "learning_rate": 4.7066133354044504e-08, + "loss": 0.0003, + "step": 39432 + }, + { + "epoch": 0.76, + "learning_rate": 4.706225000970836e-08, + "loss": 0.0005, + "step": 39433 + }, + { + "epoch": 0.76, + "learning_rate": 4.705836666537222e-08, + "loss": 0.0009, + "step": 39434 + }, + { + "epoch": 0.76, + "learning_rate": 4.705448332103608e-08, + "loss": 0.0006, + "step": 39435 + }, + { + "epoch": 0.76, + "learning_rate": 4.705059997669994e-08, + "loss": 0.0006, + "step": 39436 + }, + { + "epoch": 0.76, + "learning_rate": 4.704671663236379e-08, + "loss": 0.0005, + "step": 39437 + }, + { + "epoch": 0.77, + "learning_rate": 4.704283328802765e-08, + "loss": 0.9051, + "step": 39438 + }, + { + "epoch": 0.77, + "learning_rate": 4.7038949943691505e-08, + "loss": 0.0005, + "step": 39439 + }, + { + "epoch": 0.77, + "learning_rate": 4.7035066599355364e-08, + "loss": 0.0005, + "step": 39440 + }, + { + "epoch": 0.77, + "learning_rate": 4.703118325501922e-08, + "loss": 0.0004, + "step": 39441 + }, + { + "epoch": 0.77, + "learning_rate": 4.702729991068308e-08, + "loss": 0.0004, + "step": 39442 + }, + { + "epoch": 0.77, + "learning_rate": 4.702341656634694e-08, + "loss": 0.0007, + "step": 39443 + }, + { + "epoch": 0.77, + "learning_rate": 4.701953322201079e-08, + "loss": 0.1847, + "step": 39444 + }, + { + "epoch": 0.77, + "learning_rate": 4.701564987767465e-08, + "loss": 0.0005, + "step": 39445 + }, + { + "epoch": 0.77, + "learning_rate": 4.7011766533338506e-08, + "loss": 0.0173, + "step": 39446 + }, + { + "epoch": 0.77, + "learning_rate": 4.7007883189002365e-08, + "loss": 0.5366, + "step": 39447 + }, + { + "epoch": 0.77, + "learning_rate": 4.700399984466622e-08, + "loss": 0.0005, + "step": 39448 + }, + { + "epoch": 0.77, + "learning_rate": 4.700011650033008e-08, + "loss": 0.0022, + "step": 39449 + }, + { + "epoch": 0.77, + "learning_rate": 4.699623315599394e-08, + "loss": 0.0003, + "step": 39450 + }, + { + "epoch": 0.77, + "learning_rate": 4.69923498116578e-08, + "loss": 0.0004, + "step": 39451 + }, + { + "epoch": 0.77, + "learning_rate": 4.6988466467321656e-08, + "loss": 0.1465, + "step": 39452 + }, + { + "epoch": 0.77, + "learning_rate": 4.698458312298551e-08, + "loss": 0.0123, + "step": 39453 + }, + { + "epoch": 0.77, + "learning_rate": 4.6980699778649366e-08, + "loss": 0.0003, + "step": 39454 + }, + { + "epoch": 0.77, + "learning_rate": 4.6976816434313224e-08, + "loss": 0.0008, + "step": 39455 + }, + { + "epoch": 0.77, + "learning_rate": 4.697293308997708e-08, + "loss": 0.0005, + "step": 39456 + }, + { + "epoch": 0.77, + "learning_rate": 4.696904974564094e-08, + "loss": 0.0005, + "step": 39457 + }, + { + "epoch": 0.77, + "learning_rate": 4.69651664013048e-08, + "loss": 0.3551, + "step": 39458 + }, + { + "epoch": 0.77, + "learning_rate": 4.696128305696866e-08, + "loss": 0.0015, + "step": 39459 + }, + { + "epoch": 0.77, + "learning_rate": 4.6957399712632515e-08, + "loss": 0.0002, + "step": 39460 + }, + { + "epoch": 0.77, + "learning_rate": 4.6953516368296374e-08, + "loss": 0.1425, + "step": 39461 + }, + { + "epoch": 0.77, + "learning_rate": 4.694963302396023e-08, + "loss": 0.0007, + "step": 39462 + }, + { + "epoch": 0.77, + "learning_rate": 4.694574967962409e-08, + "loss": 0.0005, + "step": 39463 + }, + { + "epoch": 0.77, + "learning_rate": 4.694186633528795e-08, + "loss": 0.0005, + "step": 39464 + }, + { + "epoch": 0.77, + "learning_rate": 4.6937982990951806e-08, + "loss": 0.4802, + "step": 39465 + }, + { + "epoch": 0.77, + "learning_rate": 4.6934099646615665e-08, + "loss": 0.0004, + "step": 39466 + }, + { + "epoch": 0.77, + "learning_rate": 4.6930216302279516e-08, + "loss": 0.0009, + "step": 39467 + }, + { + "epoch": 0.77, + "learning_rate": 4.6926332957943375e-08, + "loss": 0.0005, + "step": 39468 + }, + { + "epoch": 0.77, + "learning_rate": 4.692244961360723e-08, + "loss": 0.0004, + "step": 39469 + }, + { + "epoch": 0.77, + "learning_rate": 4.691856626927109e-08, + "loss": 0.0004, + "step": 39470 + }, + { + "epoch": 0.77, + "learning_rate": 4.691468292493495e-08, + "loss": 1.2369, + "step": 39471 + }, + { + "epoch": 0.77, + "learning_rate": 4.691079958059881e-08, + "loss": 0.0003, + "step": 39472 + }, + { + "epoch": 0.77, + "learning_rate": 4.6906916236262666e-08, + "loss": 0.0005, + "step": 39473 + }, + { + "epoch": 0.77, + "learning_rate": 4.6903032891926524e-08, + "loss": 1.0663, + "step": 39474 + }, + { + "epoch": 0.77, + "learning_rate": 4.689914954759038e-08, + "loss": 0.0004, + "step": 39475 + }, + { + "epoch": 0.77, + "learning_rate": 4.689526620325424e-08, + "loss": 0.0003, + "step": 39476 + }, + { + "epoch": 0.77, + "learning_rate": 4.68913828589181e-08, + "loss": 0.0003, + "step": 39477 + }, + { + "epoch": 0.77, + "learning_rate": 4.688749951458196e-08, + "loss": 0.0005, + "step": 39478 + }, + { + "epoch": 0.77, + "learning_rate": 4.6883616170245815e-08, + "loss": 0.0005, + "step": 39479 + }, + { + "epoch": 0.77, + "learning_rate": 4.6879732825909674e-08, + "loss": 0.0006, + "step": 39480 + }, + { + "epoch": 0.77, + "learning_rate": 4.687584948157353e-08, + "loss": 0.0006, + "step": 39481 + }, + { + "epoch": 0.77, + "learning_rate": 4.6871966137237383e-08, + "loss": 0.0005, + "step": 39482 + }, + { + "epoch": 0.77, + "learning_rate": 4.686808279290124e-08, + "loss": 0.0004, + "step": 39483 + }, + { + "epoch": 0.77, + "learning_rate": 4.68641994485651e-08, + "loss": 0.0007, + "step": 39484 + }, + { + "epoch": 0.77, + "learning_rate": 4.686031610422896e-08, + "loss": 0.0005, + "step": 39485 + }, + { + "epoch": 0.77, + "learning_rate": 4.6856432759892816e-08, + "loss": 0.002, + "step": 39486 + }, + { + "epoch": 0.77, + "learning_rate": 4.6852549415556675e-08, + "loss": 0.0011, + "step": 39487 + }, + { + "epoch": 0.77, + "learning_rate": 4.684866607122053e-08, + "loss": 0.7505, + "step": 39488 + }, + { + "epoch": 0.77, + "learning_rate": 4.684478272688439e-08, + "loss": 0.0009, + "step": 39489 + }, + { + "epoch": 0.77, + "learning_rate": 4.684089938254825e-08, + "loss": 0.0004, + "step": 39490 + }, + { + "epoch": 0.77, + "learning_rate": 4.683701603821211e-08, + "loss": 0.0005, + "step": 39491 + }, + { + "epoch": 0.77, + "learning_rate": 4.6833132693875966e-08, + "loss": 0.0007, + "step": 39492 + }, + { + "epoch": 0.77, + "learning_rate": 4.6829249349539824e-08, + "loss": 0.0003, + "step": 39493 + }, + { + "epoch": 0.77, + "learning_rate": 4.682536600520368e-08, + "loss": 0.0004, + "step": 39494 + }, + { + "epoch": 0.77, + "learning_rate": 4.682148266086754e-08, + "loss": 0.0004, + "step": 39495 + }, + { + "epoch": 0.77, + "learning_rate": 4.681759931653139e-08, + "loss": 0.0003, + "step": 39496 + }, + { + "epoch": 0.77, + "learning_rate": 4.681371597219525e-08, + "loss": 0.0005, + "step": 39497 + }, + { + "epoch": 0.77, + "learning_rate": 4.680983262785911e-08, + "loss": 0.0006, + "step": 39498 + }, + { + "epoch": 0.77, + "learning_rate": 4.680594928352297e-08, + "loss": 0.0141, + "step": 39499 + }, + { + "epoch": 0.77, + "learning_rate": 4.6802065939186825e-08, + "loss": 0.0004, + "step": 39500 + }, + { + "epoch": 0.77, + "learning_rate": 4.6798182594850683e-08, + "loss": 0.0005, + "step": 39501 + }, + { + "epoch": 0.77, + "learning_rate": 4.679429925051454e-08, + "loss": 0.0003, + "step": 39502 + }, + { + "epoch": 0.77, + "learning_rate": 4.67904159061784e-08, + "loss": 0.0004, + "step": 39503 + }, + { + "epoch": 0.77, + "learning_rate": 4.678653256184226e-08, + "loss": 0.4108, + "step": 39504 + }, + { + "epoch": 0.77, + "learning_rate": 4.6782649217506116e-08, + "loss": 0.0004, + "step": 39505 + }, + { + "epoch": 0.77, + "learning_rate": 4.6778765873169975e-08, + "loss": 0.0182, + "step": 39506 + }, + { + "epoch": 0.77, + "learning_rate": 4.677488252883383e-08, + "loss": 0.0007, + "step": 39507 + }, + { + "epoch": 0.77, + "learning_rate": 4.677099918449769e-08, + "loss": 0.0321, + "step": 39508 + }, + { + "epoch": 0.77, + "learning_rate": 4.676711584016155e-08, + "loss": 0.0004, + "step": 39509 + }, + { + "epoch": 0.77, + "learning_rate": 4.676323249582541e-08, + "loss": 0.0003, + "step": 39510 + }, + { + "epoch": 0.77, + "learning_rate": 4.675934915148926e-08, + "loss": 0.0158, + "step": 39511 + }, + { + "epoch": 0.77, + "learning_rate": 4.675546580715312e-08, + "loss": 0.0005, + "step": 39512 + }, + { + "epoch": 0.77, + "learning_rate": 4.6751582462816976e-08, + "loss": 0.0003, + "step": 39513 + }, + { + "epoch": 0.77, + "learning_rate": 4.6747699118480834e-08, + "loss": 0.0004, + "step": 39514 + }, + { + "epoch": 0.77, + "learning_rate": 4.674381577414469e-08, + "loss": 0.0006, + "step": 39515 + }, + { + "epoch": 0.77, + "learning_rate": 4.673993242980855e-08, + "loss": 0.0004, + "step": 39516 + }, + { + "epoch": 0.77, + "learning_rate": 4.673604908547241e-08, + "loss": 0.213, + "step": 39517 + }, + { + "epoch": 0.77, + "learning_rate": 4.673216574113627e-08, + "loss": 0.0004, + "step": 39518 + }, + { + "epoch": 0.77, + "learning_rate": 4.6728282396800125e-08, + "loss": 0.0004, + "step": 39519 + }, + { + "epoch": 0.77, + "learning_rate": 4.6724399052463983e-08, + "loss": 0.0004, + "step": 39520 + }, + { + "epoch": 0.77, + "learning_rate": 4.672051570812784e-08, + "loss": 0.0004, + "step": 39521 + }, + { + "epoch": 0.77, + "learning_rate": 4.67166323637917e-08, + "loss": 0.0003, + "step": 39522 + }, + { + "epoch": 0.77, + "learning_rate": 4.671274901945556e-08, + "loss": 0.002, + "step": 39523 + }, + { + "epoch": 0.77, + "learning_rate": 4.6708865675119416e-08, + "loss": 0.0005, + "step": 39524 + }, + { + "epoch": 0.77, + "learning_rate": 4.670498233078327e-08, + "loss": 0.0004, + "step": 39525 + }, + { + "epoch": 0.77, + "learning_rate": 4.6701098986447126e-08, + "loss": 0.0004, + "step": 39526 + }, + { + "epoch": 0.77, + "learning_rate": 4.6697215642110985e-08, + "loss": 0.0009, + "step": 39527 + }, + { + "epoch": 0.77, + "learning_rate": 4.669333229777484e-08, + "loss": 0.0005, + "step": 39528 + }, + { + "epoch": 0.77, + "learning_rate": 4.66894489534387e-08, + "loss": 0.4187, + "step": 39529 + }, + { + "epoch": 0.77, + "learning_rate": 4.668556560910256e-08, + "loss": 0.0003, + "step": 39530 + }, + { + "epoch": 0.77, + "learning_rate": 4.668168226476642e-08, + "loss": 0.0003, + "step": 39531 + }, + { + "epoch": 0.77, + "learning_rate": 4.667779892043027e-08, + "loss": 0.0004, + "step": 39532 + }, + { + "epoch": 0.77, + "learning_rate": 4.667391557609413e-08, + "loss": 0.0007, + "step": 39533 + }, + { + "epoch": 0.77, + "learning_rate": 4.6670032231757986e-08, + "loss": 0.0004, + "step": 39534 + }, + { + "epoch": 0.77, + "learning_rate": 4.6666148887421844e-08, + "loss": 0.0002, + "step": 39535 + }, + { + "epoch": 0.77, + "learning_rate": 4.66622655430857e-08, + "loss": 0.0004, + "step": 39536 + }, + { + "epoch": 0.77, + "learning_rate": 4.665838219874956e-08, + "loss": 0.0004, + "step": 39537 + }, + { + "epoch": 0.77, + "learning_rate": 4.665449885441342e-08, + "loss": 0.0082, + "step": 39538 + }, + { + "epoch": 0.77, + "learning_rate": 4.665061551007728e-08, + "loss": 0.0006, + "step": 39539 + }, + { + "epoch": 0.77, + "learning_rate": 4.664673216574113e-08, + "loss": 0.0004, + "step": 39540 + }, + { + "epoch": 0.77, + "learning_rate": 4.664284882140499e-08, + "loss": 0.0764, + "step": 39541 + }, + { + "epoch": 0.77, + "learning_rate": 4.6638965477068845e-08, + "loss": 0.0004, + "step": 39542 + }, + { + "epoch": 0.77, + "learning_rate": 4.66350821327327e-08, + "loss": 0.0006, + "step": 39543 + }, + { + "epoch": 0.77, + "learning_rate": 4.663119878839656e-08, + "loss": 0.0003, + "step": 39544 + }, + { + "epoch": 0.77, + "learning_rate": 4.662731544406042e-08, + "loss": 0.0003, + "step": 39545 + }, + { + "epoch": 0.77, + "learning_rate": 4.662343209972428e-08, + "loss": 0.0007, + "step": 39546 + }, + { + "epoch": 0.77, + "learning_rate": 4.6619548755388136e-08, + "loss": 0.0004, + "step": 39547 + }, + { + "epoch": 0.77, + "learning_rate": 4.6615665411051994e-08, + "loss": 0.1323, + "step": 39548 + }, + { + "epoch": 0.77, + "learning_rate": 4.661178206671585e-08, + "loss": 0.0004, + "step": 39549 + }, + { + "epoch": 0.77, + "learning_rate": 4.660789872237971e-08, + "loss": 0.0006, + "step": 39550 + }, + { + "epoch": 0.77, + "learning_rate": 4.660401537804357e-08, + "loss": 0.0005, + "step": 39551 + }, + { + "epoch": 0.77, + "learning_rate": 4.660013203370743e-08, + "loss": 0.0004, + "step": 39552 + }, + { + "epoch": 0.77, + "learning_rate": 4.6596248689371286e-08, + "loss": 0.0004, + "step": 39553 + }, + { + "epoch": 0.77, + "learning_rate": 4.659236534503514e-08, + "loss": 0.0004, + "step": 39554 + }, + { + "epoch": 0.77, + "learning_rate": 4.6588482000698996e-08, + "loss": 0.0005, + "step": 39555 + }, + { + "epoch": 0.77, + "learning_rate": 4.6584598656362854e-08, + "loss": 0.0003, + "step": 39556 + }, + { + "epoch": 0.77, + "learning_rate": 4.658071531202671e-08, + "loss": 0.0004, + "step": 39557 + }, + { + "epoch": 0.77, + "learning_rate": 4.657683196769057e-08, + "loss": 0.0004, + "step": 39558 + }, + { + "epoch": 0.77, + "learning_rate": 4.657294862335443e-08, + "loss": 0.0003, + "step": 39559 + }, + { + "epoch": 0.77, + "learning_rate": 4.656906527901829e-08, + "loss": 0.0007, + "step": 39560 + }, + { + "epoch": 0.77, + "learning_rate": 4.6565181934682145e-08, + "loss": 0.0008, + "step": 39561 + }, + { + "epoch": 0.77, + "learning_rate": 4.6561298590346e-08, + "loss": 0.0163, + "step": 39562 + }, + { + "epoch": 0.77, + "learning_rate": 4.655741524600986e-08, + "loss": 0.0007, + "step": 39563 + }, + { + "epoch": 0.77, + "learning_rate": 4.655353190167372e-08, + "loss": 0.0004, + "step": 39564 + }, + { + "epoch": 0.77, + "learning_rate": 4.654964855733758e-08, + "loss": 0.0823, + "step": 39565 + }, + { + "epoch": 0.77, + "learning_rate": 4.6545765213001436e-08, + "loss": 0.0005, + "step": 39566 + }, + { + "epoch": 0.77, + "learning_rate": 4.6541881868665294e-08, + "loss": 0.0004, + "step": 39567 + }, + { + "epoch": 0.77, + "learning_rate": 4.653799852432915e-08, + "loss": 0.0004, + "step": 39568 + }, + { + "epoch": 0.77, + "learning_rate": 4.6534115179993004e-08, + "loss": 0.0005, + "step": 39569 + }, + { + "epoch": 0.77, + "learning_rate": 4.653023183565686e-08, + "loss": 0.0003, + "step": 39570 + }, + { + "epoch": 0.77, + "learning_rate": 4.652634849132072e-08, + "loss": 0.0004, + "step": 39571 + }, + { + "epoch": 0.77, + "learning_rate": 4.652246514698458e-08, + "loss": 0.0005, + "step": 39572 + }, + { + "epoch": 0.77, + "learning_rate": 4.651858180264844e-08, + "loss": 0.0005, + "step": 39573 + }, + { + "epoch": 0.77, + "learning_rate": 4.6514698458312296e-08, + "loss": 0.0011, + "step": 39574 + }, + { + "epoch": 0.77, + "learning_rate": 4.6510815113976154e-08, + "loss": 0.0005, + "step": 39575 + }, + { + "epoch": 0.77, + "learning_rate": 4.650693176964001e-08, + "loss": 0.0005, + "step": 39576 + }, + { + "epoch": 0.77, + "learning_rate": 4.650304842530387e-08, + "loss": 0.0152, + "step": 39577 + }, + { + "epoch": 0.77, + "learning_rate": 4.649916508096773e-08, + "loss": 0.0003, + "step": 39578 + }, + { + "epoch": 0.77, + "learning_rate": 4.649528173663159e-08, + "loss": 0.0004, + "step": 39579 + }, + { + "epoch": 0.77, + "learning_rate": 4.6491398392295445e-08, + "loss": 0.0017, + "step": 39580 + }, + { + "epoch": 0.77, + "learning_rate": 4.64875150479593e-08, + "loss": 0.0399, + "step": 39581 + }, + { + "epoch": 0.77, + "learning_rate": 4.648363170362316e-08, + "loss": 0.0003, + "step": 39582 + }, + { + "epoch": 0.77, + "learning_rate": 4.647974835928701e-08, + "loss": 0.0006, + "step": 39583 + }, + { + "epoch": 0.77, + "learning_rate": 4.647586501495087e-08, + "loss": 0.0007, + "step": 39584 + }, + { + "epoch": 0.77, + "learning_rate": 4.647198167061473e-08, + "loss": 0.0667, + "step": 39585 + }, + { + "epoch": 0.77, + "learning_rate": 4.646809832627859e-08, + "loss": 0.0005, + "step": 39586 + }, + { + "epoch": 0.77, + "learning_rate": 4.6464214981942446e-08, + "loss": 0.0004, + "step": 39587 + }, + { + "epoch": 0.77, + "learning_rate": 4.6460331637606304e-08, + "loss": 0.0005, + "step": 39588 + }, + { + "epoch": 0.77, + "learning_rate": 4.645644829327016e-08, + "loss": 0.0004, + "step": 39589 + }, + { + "epoch": 0.77, + "learning_rate": 4.645256494893402e-08, + "loss": 0.0007, + "step": 39590 + }, + { + "epoch": 0.77, + "learning_rate": 4.644868160459788e-08, + "loss": 0.0009, + "step": 39591 + }, + { + "epoch": 0.77, + "learning_rate": 4.644479826026174e-08, + "loss": 0.0016, + "step": 39592 + }, + { + "epoch": 0.77, + "learning_rate": 4.6440914915925596e-08, + "loss": 0.0006, + "step": 39593 + }, + { + "epoch": 0.77, + "learning_rate": 4.6437031571589454e-08, + "loss": 0.0004, + "step": 39594 + }, + { + "epoch": 0.77, + "learning_rate": 4.643314822725331e-08, + "loss": 0.0003, + "step": 39595 + }, + { + "epoch": 0.77, + "learning_rate": 4.642926488291717e-08, + "loss": 0.0004, + "step": 39596 + }, + { + "epoch": 0.77, + "learning_rate": 4.642538153858103e-08, + "loss": 0.0317, + "step": 39597 + }, + { + "epoch": 0.77, + "learning_rate": 4.642149819424488e-08, + "loss": 0.0004, + "step": 39598 + }, + { + "epoch": 0.77, + "learning_rate": 4.641761484990874e-08, + "loss": 1.1951, + "step": 39599 + }, + { + "epoch": 0.77, + "learning_rate": 4.6413731505572597e-08, + "loss": 0.0004, + "step": 39600 + }, + { + "epoch": 0.77, + "learning_rate": 4.6409848161236455e-08, + "loss": 0.0005, + "step": 39601 + }, + { + "epoch": 0.77, + "learning_rate": 4.640596481690031e-08, + "loss": 0.0007, + "step": 39602 + }, + { + "epoch": 0.77, + "learning_rate": 4.640208147256417e-08, + "loss": 0.0005, + "step": 39603 + }, + { + "epoch": 0.77, + "learning_rate": 4.639819812822803e-08, + "loss": 0.0002, + "step": 39604 + }, + { + "epoch": 0.77, + "learning_rate": 4.639431478389189e-08, + "loss": 0.0004, + "step": 39605 + }, + { + "epoch": 0.77, + "learning_rate": 4.6390431439555746e-08, + "loss": 0.0005, + "step": 39606 + }, + { + "epoch": 0.77, + "learning_rate": 4.6386548095219604e-08, + "loss": 0.0004, + "step": 39607 + }, + { + "epoch": 0.77, + "learning_rate": 4.638266475088346e-08, + "loss": 0.0016, + "step": 39608 + }, + { + "epoch": 0.77, + "learning_rate": 4.637878140654732e-08, + "loss": 0.0003, + "step": 39609 + }, + { + "epoch": 0.77, + "learning_rate": 4.637489806221118e-08, + "loss": 0.0017, + "step": 39610 + }, + { + "epoch": 0.77, + "learning_rate": 4.637101471787504e-08, + "loss": 0.4123, + "step": 39611 + }, + { + "epoch": 0.77, + "learning_rate": 4.636713137353889e-08, + "loss": 0.002, + "step": 39612 + }, + { + "epoch": 0.77, + "learning_rate": 4.636324802920275e-08, + "loss": 0.0004, + "step": 39613 + }, + { + "epoch": 0.77, + "learning_rate": 4.6359364684866605e-08, + "loss": 0.0005, + "step": 39614 + }, + { + "epoch": 0.77, + "learning_rate": 4.6355481340530464e-08, + "loss": 0.6423, + "step": 39615 + }, + { + "epoch": 0.77, + "learning_rate": 4.635159799619432e-08, + "loss": 0.0005, + "step": 39616 + }, + { + "epoch": 0.77, + "learning_rate": 4.634771465185818e-08, + "loss": 0.0004, + "step": 39617 + }, + { + "epoch": 0.77, + "learning_rate": 4.634383130752204e-08, + "loss": 0.0092, + "step": 39618 + }, + { + "epoch": 0.77, + "learning_rate": 4.63399479631859e-08, + "loss": 0.0006, + "step": 39619 + }, + { + "epoch": 0.77, + "learning_rate": 4.6336064618849755e-08, + "loss": 0.0004, + "step": 39620 + }, + { + "epoch": 0.77, + "learning_rate": 4.6332181274513607e-08, + "loss": 0.0004, + "step": 39621 + }, + { + "epoch": 0.77, + "learning_rate": 4.6328297930177465e-08, + "loss": 0.0005, + "step": 39622 + }, + { + "epoch": 0.77, + "learning_rate": 4.632441458584132e-08, + "loss": 0.0005, + "step": 39623 + }, + { + "epoch": 0.77, + "learning_rate": 4.632053124150518e-08, + "loss": 0.0003, + "step": 39624 + }, + { + "epoch": 0.77, + "learning_rate": 4.631664789716904e-08, + "loss": 0.0004, + "step": 39625 + }, + { + "epoch": 0.77, + "learning_rate": 4.63127645528329e-08, + "loss": 0.0004, + "step": 39626 + }, + { + "epoch": 0.77, + "learning_rate": 4.6308881208496756e-08, + "loss": 0.0032, + "step": 39627 + }, + { + "epoch": 0.77, + "learning_rate": 4.630499786416061e-08, + "loss": 0.0006, + "step": 39628 + }, + { + "epoch": 0.77, + "learning_rate": 4.6301114519824466e-08, + "loss": 0.0004, + "step": 39629 + }, + { + "epoch": 0.77, + "learning_rate": 4.6297231175488324e-08, + "loss": 0.0037, + "step": 39630 + }, + { + "epoch": 0.77, + "learning_rate": 4.629334783115218e-08, + "loss": 0.0004, + "step": 39631 + }, + { + "epoch": 0.77, + "learning_rate": 4.628946448681604e-08, + "loss": 0.121, + "step": 39632 + }, + { + "epoch": 0.77, + "learning_rate": 4.62855811424799e-08, + "loss": 0.0005, + "step": 39633 + }, + { + "epoch": 0.77, + "learning_rate": 4.628169779814376e-08, + "loss": 0.0008, + "step": 39634 + }, + { + "epoch": 0.77, + "learning_rate": 4.6277814453807615e-08, + "loss": 0.0003, + "step": 39635 + }, + { + "epoch": 0.77, + "learning_rate": 4.6273931109471474e-08, + "loss": 0.0005, + "step": 39636 + }, + { + "epoch": 0.77, + "learning_rate": 4.627004776513533e-08, + "loss": 0.0026, + "step": 39637 + }, + { + "epoch": 0.77, + "learning_rate": 4.626616442079919e-08, + "loss": 0.0003, + "step": 39638 + }, + { + "epoch": 0.77, + "learning_rate": 4.626228107646305e-08, + "loss": 0.0003, + "step": 39639 + }, + { + "epoch": 0.77, + "learning_rate": 4.6258397732126907e-08, + "loss": 0.0003, + "step": 39640 + }, + { + "epoch": 0.77, + "learning_rate": 4.625451438779076e-08, + "loss": 0.0004, + "step": 39641 + }, + { + "epoch": 0.77, + "learning_rate": 4.6250631043454616e-08, + "loss": 0.0023, + "step": 39642 + }, + { + "epoch": 0.77, + "learning_rate": 4.6246747699118475e-08, + "loss": 0.0004, + "step": 39643 + }, + { + "epoch": 0.77, + "learning_rate": 4.624286435478233e-08, + "loss": 0.0003, + "step": 39644 + }, + { + "epoch": 0.77, + "learning_rate": 4.623898101044619e-08, + "loss": 0.0018, + "step": 39645 + }, + { + "epoch": 0.77, + "learning_rate": 4.623509766611005e-08, + "loss": 0.0007, + "step": 39646 + }, + { + "epoch": 0.77, + "learning_rate": 4.623121432177391e-08, + "loss": 0.1255, + "step": 39647 + }, + { + "epoch": 0.77, + "learning_rate": 4.6227330977437766e-08, + "loss": 0.0005, + "step": 39648 + }, + { + "epoch": 0.77, + "learning_rate": 4.6223447633101624e-08, + "loss": 0.0005, + "step": 39649 + }, + { + "epoch": 0.77, + "learning_rate": 4.621956428876548e-08, + "loss": 0.0004, + "step": 39650 + }, + { + "epoch": 0.77, + "learning_rate": 4.621568094442934e-08, + "loss": 0.0005, + "step": 39651 + }, + { + "epoch": 0.77, + "learning_rate": 4.62117976000932e-08, + "loss": 0.0003, + "step": 39652 + }, + { + "epoch": 0.77, + "learning_rate": 4.620791425575706e-08, + "loss": 0.0008, + "step": 39653 + }, + { + "epoch": 0.77, + "learning_rate": 4.6204030911420915e-08, + "loss": 0.0005, + "step": 39654 + }, + { + "epoch": 0.77, + "learning_rate": 4.6200147567084774e-08, + "loss": 0.0009, + "step": 39655 + }, + { + "epoch": 0.77, + "learning_rate": 4.6196264222748625e-08, + "loss": 0.0005, + "step": 39656 + }, + { + "epoch": 0.77, + "learning_rate": 4.6192380878412484e-08, + "loss": 0.0004, + "step": 39657 + }, + { + "epoch": 0.77, + "learning_rate": 4.618849753407634e-08, + "loss": 0.0006, + "step": 39658 + }, + { + "epoch": 0.77, + "learning_rate": 4.61846141897402e-08, + "loss": 0.0006, + "step": 39659 + }, + { + "epoch": 0.77, + "learning_rate": 4.618073084540406e-08, + "loss": 0.0003, + "step": 39660 + }, + { + "epoch": 0.77, + "learning_rate": 4.6176847501067917e-08, + "loss": 0.0014, + "step": 39661 + }, + { + "epoch": 0.77, + "learning_rate": 4.6172964156731775e-08, + "loss": 0.0004, + "step": 39662 + }, + { + "epoch": 0.77, + "learning_rate": 4.616908081239563e-08, + "loss": 0.0007, + "step": 39663 + }, + { + "epoch": 0.77, + "learning_rate": 4.616519746805949e-08, + "loss": 0.0006, + "step": 39664 + }, + { + "epoch": 0.77, + "learning_rate": 4.616131412372335e-08, + "loss": 0.0003, + "step": 39665 + }, + { + "epoch": 0.77, + "learning_rate": 4.615743077938721e-08, + "loss": 0.0003, + "step": 39666 + }, + { + "epoch": 0.77, + "learning_rate": 4.6153547435051066e-08, + "loss": 0.0003, + "step": 39667 + }, + { + "epoch": 0.77, + "learning_rate": 4.6149664090714924e-08, + "loss": 0.0018, + "step": 39668 + }, + { + "epoch": 0.77, + "learning_rate": 4.614578074637878e-08, + "loss": 0.0006, + "step": 39669 + }, + { + "epoch": 0.77, + "learning_rate": 4.6141897402042634e-08, + "loss": 0.0005, + "step": 39670 + }, + { + "epoch": 0.77, + "learning_rate": 4.613801405770649e-08, + "loss": 0.7134, + "step": 39671 + }, + { + "epoch": 0.77, + "learning_rate": 4.613413071337035e-08, + "loss": 0.0005, + "step": 39672 + }, + { + "epoch": 0.77, + "learning_rate": 4.613024736903421e-08, + "loss": 0.0004, + "step": 39673 + }, + { + "epoch": 0.77, + "learning_rate": 4.612636402469807e-08, + "loss": 0.0004, + "step": 39674 + }, + { + "epoch": 0.77, + "learning_rate": 4.6122480680361925e-08, + "loss": 0.0004, + "step": 39675 + }, + { + "epoch": 0.77, + "learning_rate": 4.6118597336025784e-08, + "loss": 0.0004, + "step": 39676 + }, + { + "epoch": 0.77, + "learning_rate": 4.611471399168964e-08, + "loss": 0.0008, + "step": 39677 + }, + { + "epoch": 0.77, + "learning_rate": 4.61108306473535e-08, + "loss": 0.0004, + "step": 39678 + }, + { + "epoch": 0.77, + "learning_rate": 4.610694730301736e-08, + "loss": 0.0003, + "step": 39679 + }, + { + "epoch": 0.77, + "learning_rate": 4.6103063958681217e-08, + "loss": 0.0013, + "step": 39680 + }, + { + "epoch": 0.77, + "learning_rate": 4.6099180614345075e-08, + "loss": 0.3549, + "step": 39681 + }, + { + "epoch": 0.77, + "learning_rate": 4.609529727000893e-08, + "loss": 1.2153, + "step": 39682 + }, + { + "epoch": 0.77, + "learning_rate": 4.609141392567279e-08, + "loss": 0.0004, + "step": 39683 + }, + { + "epoch": 0.77, + "learning_rate": 4.608753058133665e-08, + "loss": 0.0004, + "step": 39684 + }, + { + "epoch": 0.77, + "learning_rate": 4.60836472370005e-08, + "loss": 0.5452, + "step": 39685 + }, + { + "epoch": 0.77, + "learning_rate": 4.607976389266436e-08, + "loss": 0.0005, + "step": 39686 + }, + { + "epoch": 0.77, + "learning_rate": 4.607588054832822e-08, + "loss": 0.0004, + "step": 39687 + }, + { + "epoch": 0.77, + "learning_rate": 4.6071997203992076e-08, + "loss": 0.0005, + "step": 39688 + }, + { + "epoch": 0.77, + "learning_rate": 4.6068113859655934e-08, + "loss": 0.0003, + "step": 39689 + }, + { + "epoch": 0.77, + "learning_rate": 4.606423051531979e-08, + "loss": 0.0005, + "step": 39690 + }, + { + "epoch": 0.77, + "learning_rate": 4.606034717098365e-08, + "loss": 0.0026, + "step": 39691 + }, + { + "epoch": 0.77, + "learning_rate": 4.605646382664751e-08, + "loss": 0.0004, + "step": 39692 + }, + { + "epoch": 0.77, + "learning_rate": 4.605258048231137e-08, + "loss": 0.0004, + "step": 39693 + }, + { + "epoch": 0.77, + "learning_rate": 4.6048697137975225e-08, + "loss": 0.001, + "step": 39694 + }, + { + "epoch": 0.77, + "learning_rate": 4.6044813793639084e-08, + "loss": 0.0007, + "step": 39695 + }, + { + "epoch": 0.77, + "learning_rate": 4.604093044930294e-08, + "loss": 0.0005, + "step": 39696 + }, + { + "epoch": 0.77, + "learning_rate": 4.60370471049668e-08, + "loss": 0.0003, + "step": 39697 + }, + { + "epoch": 0.77, + "learning_rate": 4.603316376063066e-08, + "loss": 0.0004, + "step": 39698 + }, + { + "epoch": 0.77, + "learning_rate": 4.602928041629451e-08, + "loss": 0.0004, + "step": 39699 + }, + { + "epoch": 0.77, + "learning_rate": 4.602539707195837e-08, + "loss": 0.0007, + "step": 39700 + }, + { + "epoch": 0.77, + "learning_rate": 4.6021513727622226e-08, + "loss": 0.7215, + "step": 39701 + }, + { + "epoch": 0.77, + "learning_rate": 4.6017630383286085e-08, + "loss": 0.0002, + "step": 39702 + }, + { + "epoch": 0.77, + "learning_rate": 4.601374703894994e-08, + "loss": 0.0004, + "step": 39703 + }, + { + "epoch": 0.77, + "learning_rate": 4.60098636946138e-08, + "loss": 0.0004, + "step": 39704 + }, + { + "epoch": 0.77, + "learning_rate": 4.600598035027766e-08, + "loss": 0.0002, + "step": 39705 + }, + { + "epoch": 0.77, + "learning_rate": 4.600209700594152e-08, + "loss": 0.0004, + "step": 39706 + }, + { + "epoch": 0.77, + "learning_rate": 4.5998213661605376e-08, + "loss": 0.0003, + "step": 39707 + }, + { + "epoch": 0.77, + "learning_rate": 4.5994330317269234e-08, + "loss": 0.0003, + "step": 39708 + }, + { + "epoch": 0.77, + "learning_rate": 4.5990446972933086e-08, + "loss": 0.0003, + "step": 39709 + }, + { + "epoch": 0.77, + "learning_rate": 4.5986563628596944e-08, + "loss": 0.0006, + "step": 39710 + }, + { + "epoch": 0.77, + "learning_rate": 4.59826802842608e-08, + "loss": 0.0004, + "step": 39711 + }, + { + "epoch": 0.77, + "learning_rate": 4.597879693992466e-08, + "loss": 0.0003, + "step": 39712 + }, + { + "epoch": 0.77, + "learning_rate": 4.597491359558852e-08, + "loss": 0.0202, + "step": 39713 + }, + { + "epoch": 0.77, + "learning_rate": 4.597103025125238e-08, + "loss": 0.0004, + "step": 39714 + }, + { + "epoch": 0.77, + "learning_rate": 4.5967146906916235e-08, + "loss": 0.0004, + "step": 39715 + }, + { + "epoch": 0.77, + "learning_rate": 4.5963263562580093e-08, + "loss": 1.1299, + "step": 39716 + }, + { + "epoch": 0.77, + "learning_rate": 4.5959380218243945e-08, + "loss": 0.0007, + "step": 39717 + }, + { + "epoch": 0.77, + "learning_rate": 4.5955496873907803e-08, + "loss": 0.0003, + "step": 39718 + }, + { + "epoch": 0.77, + "learning_rate": 4.595161352957166e-08, + "loss": 0.0004, + "step": 39719 + }, + { + "epoch": 0.77, + "learning_rate": 4.594773018523552e-08, + "loss": 0.7365, + "step": 39720 + }, + { + "epoch": 0.77, + "learning_rate": 4.594384684089938e-08, + "loss": 0.0005, + "step": 39721 + }, + { + "epoch": 0.77, + "learning_rate": 4.5939963496563236e-08, + "loss": 0.0004, + "step": 39722 + }, + { + "epoch": 0.77, + "learning_rate": 4.5936080152227095e-08, + "loss": 0.0151, + "step": 39723 + }, + { + "epoch": 0.77, + "learning_rate": 4.593219680789095e-08, + "loss": 0.0027, + "step": 39724 + }, + { + "epoch": 0.77, + "learning_rate": 4.592831346355481e-08, + "loss": 0.0004, + "step": 39725 + }, + { + "epoch": 0.77, + "learning_rate": 4.592443011921867e-08, + "loss": 0.0008, + "step": 39726 + }, + { + "epoch": 0.77, + "learning_rate": 4.592054677488253e-08, + "loss": 0.0005, + "step": 39727 + }, + { + "epoch": 0.77, + "learning_rate": 4.591666343054638e-08, + "loss": 0.0005, + "step": 39728 + }, + { + "epoch": 0.77, + "learning_rate": 4.591278008621024e-08, + "loss": 0.0003, + "step": 39729 + }, + { + "epoch": 0.77, + "learning_rate": 4.5908896741874096e-08, + "loss": 0.0005, + "step": 39730 + }, + { + "epoch": 0.77, + "learning_rate": 4.5905013397537954e-08, + "loss": 0.0003, + "step": 39731 + }, + { + "epoch": 0.77, + "learning_rate": 4.590113005320181e-08, + "loss": 0.0004, + "step": 39732 + }, + { + "epoch": 0.77, + "learning_rate": 4.589724670886567e-08, + "loss": 0.0004, + "step": 39733 + }, + { + "epoch": 0.77, + "learning_rate": 4.589336336452953e-08, + "loss": 0.0012, + "step": 39734 + }, + { + "epoch": 0.77, + "learning_rate": 4.588948002019339e-08, + "loss": 0.0005, + "step": 39735 + }, + { + "epoch": 0.77, + "learning_rate": 4.5885596675857245e-08, + "loss": 0.0004, + "step": 39736 + }, + { + "epoch": 0.77, + "learning_rate": 4.5881713331521103e-08, + "loss": 0.0005, + "step": 39737 + }, + { + "epoch": 0.77, + "learning_rate": 4.587782998718496e-08, + "loss": 0.0005, + "step": 39738 + }, + { + "epoch": 0.77, + "learning_rate": 4.587394664284882e-08, + "loss": 0.0005, + "step": 39739 + }, + { + "epoch": 0.77, + "learning_rate": 4.587006329851268e-08, + "loss": 0.0033, + "step": 39740 + }, + { + "epoch": 0.77, + "learning_rate": 4.5866179954176536e-08, + "loss": 0.001, + "step": 39741 + }, + { + "epoch": 0.77, + "learning_rate": 4.5862296609840395e-08, + "loss": 0.0003, + "step": 39742 + }, + { + "epoch": 0.77, + "learning_rate": 4.5858413265504246e-08, + "loss": 0.0004, + "step": 39743 + }, + { + "epoch": 0.77, + "learning_rate": 4.5854529921168104e-08, + "loss": 0.0004, + "step": 39744 + }, + { + "epoch": 0.77, + "learning_rate": 4.585064657683196e-08, + "loss": 0.0003, + "step": 39745 + }, + { + "epoch": 0.77, + "learning_rate": 4.584676323249582e-08, + "loss": 0.0003, + "step": 39746 + }, + { + "epoch": 0.77, + "learning_rate": 4.584287988815968e-08, + "loss": 0.0002, + "step": 39747 + }, + { + "epoch": 0.77, + "learning_rate": 4.583899654382354e-08, + "loss": 0.0005, + "step": 39748 + }, + { + "epoch": 0.77, + "learning_rate": 4.5835113199487396e-08, + "loss": 0.0005, + "step": 39749 + }, + { + "epoch": 0.77, + "learning_rate": 4.5831229855151254e-08, + "loss": 0.0003, + "step": 39750 + }, + { + "epoch": 0.77, + "learning_rate": 4.582734651081511e-08, + "loss": 0.0005, + "step": 39751 + }, + { + "epoch": 0.77, + "learning_rate": 4.582346316647897e-08, + "loss": 0.0003, + "step": 39752 + }, + { + "epoch": 0.77, + "learning_rate": 4.581957982214283e-08, + "loss": 0.0004, + "step": 39753 + }, + { + "epoch": 0.77, + "learning_rate": 4.581569647780669e-08, + "loss": 0.0004, + "step": 39754 + }, + { + "epoch": 0.77, + "learning_rate": 4.5811813133470545e-08, + "loss": 0.0003, + "step": 39755 + }, + { + "epoch": 0.77, + "learning_rate": 4.5807929789134403e-08, + "loss": 0.0005, + "step": 39756 + }, + { + "epoch": 0.77, + "learning_rate": 4.5804046444798255e-08, + "loss": 0.0003, + "step": 39757 + }, + { + "epoch": 0.77, + "learning_rate": 4.580016310046211e-08, + "loss": 0.0034, + "step": 39758 + }, + { + "epoch": 0.77, + "learning_rate": 4.579627975612597e-08, + "loss": 0.0002, + "step": 39759 + }, + { + "epoch": 0.77, + "learning_rate": 4.579239641178983e-08, + "loss": 0.0004, + "step": 39760 + }, + { + "epoch": 0.77, + "learning_rate": 4.578851306745369e-08, + "loss": 0.0004, + "step": 39761 + }, + { + "epoch": 0.77, + "learning_rate": 4.5784629723117546e-08, + "loss": 0.0005, + "step": 39762 + }, + { + "epoch": 0.77, + "learning_rate": 4.5780746378781404e-08, + "loss": 0.0086, + "step": 39763 + }, + { + "epoch": 0.77, + "learning_rate": 4.577686303444526e-08, + "loss": 0.2216, + "step": 39764 + }, + { + "epoch": 0.77, + "learning_rate": 4.577297969010912e-08, + "loss": 0.0004, + "step": 39765 + }, + { + "epoch": 0.77, + "learning_rate": 4.576909634577298e-08, + "loss": 0.0004, + "step": 39766 + }, + { + "epoch": 0.77, + "learning_rate": 4.576521300143684e-08, + "loss": 0.0003, + "step": 39767 + }, + { + "epoch": 0.77, + "learning_rate": 4.5761329657100696e-08, + "loss": 0.09, + "step": 39768 + }, + { + "epoch": 0.77, + "learning_rate": 4.5757446312764554e-08, + "loss": 0.0003, + "step": 39769 + }, + { + "epoch": 0.77, + "learning_rate": 4.575356296842841e-08, + "loss": 0.0111, + "step": 39770 + }, + { + "epoch": 0.77, + "learning_rate": 4.574967962409227e-08, + "loss": 0.0018, + "step": 39771 + }, + { + "epoch": 0.77, + "learning_rate": 4.574579627975612e-08, + "loss": 0.3275, + "step": 39772 + }, + { + "epoch": 0.77, + "learning_rate": 4.574191293541998e-08, + "loss": 0.0005, + "step": 39773 + }, + { + "epoch": 0.77, + "learning_rate": 4.573802959108384e-08, + "loss": 0.0004, + "step": 39774 + }, + { + "epoch": 0.77, + "learning_rate": 4.57341462467477e-08, + "loss": 0.0005, + "step": 39775 + }, + { + "epoch": 0.77, + "learning_rate": 4.5730262902411555e-08, + "loss": 0.0003, + "step": 39776 + }, + { + "epoch": 0.77, + "learning_rate": 4.572637955807541e-08, + "loss": 0.0003, + "step": 39777 + }, + { + "epoch": 0.77, + "learning_rate": 4.572249621373927e-08, + "loss": 0.0003, + "step": 39778 + }, + { + "epoch": 0.77, + "learning_rate": 4.571861286940313e-08, + "loss": 0.0004, + "step": 39779 + }, + { + "epoch": 0.77, + "learning_rate": 4.571472952506699e-08, + "loss": 0.0077, + "step": 39780 + }, + { + "epoch": 0.77, + "learning_rate": 4.5710846180730846e-08, + "loss": 0.0005, + "step": 39781 + }, + { + "epoch": 0.77, + "learning_rate": 4.5706962836394705e-08, + "loss": 0.0015, + "step": 39782 + }, + { + "epoch": 0.77, + "learning_rate": 4.570307949205856e-08, + "loss": 0.0005, + "step": 39783 + }, + { + "epoch": 0.77, + "learning_rate": 4.569919614772242e-08, + "loss": 0.0003, + "step": 39784 + }, + { + "epoch": 0.77, + "learning_rate": 4.569531280338628e-08, + "loss": 0.0004, + "step": 39785 + }, + { + "epoch": 0.77, + "learning_rate": 4.569142945905013e-08, + "loss": 0.0004, + "step": 39786 + }, + { + "epoch": 0.77, + "learning_rate": 4.568754611471399e-08, + "loss": 0.0082, + "step": 39787 + }, + { + "epoch": 0.77, + "learning_rate": 4.568366277037785e-08, + "loss": 0.0004, + "step": 39788 + }, + { + "epoch": 0.77, + "learning_rate": 4.5679779426041706e-08, + "loss": 0.0003, + "step": 39789 + }, + { + "epoch": 0.77, + "learning_rate": 4.5675896081705564e-08, + "loss": 0.0006, + "step": 39790 + }, + { + "epoch": 0.77, + "learning_rate": 4.567201273736942e-08, + "loss": 0.0005, + "step": 39791 + }, + { + "epoch": 0.77, + "learning_rate": 4.566812939303328e-08, + "loss": 0.0009, + "step": 39792 + }, + { + "epoch": 0.77, + "learning_rate": 4.566424604869714e-08, + "loss": 0.0006, + "step": 39793 + }, + { + "epoch": 0.77, + "learning_rate": 4.5660362704361e-08, + "loss": 0.0005, + "step": 39794 + }, + { + "epoch": 0.77, + "learning_rate": 4.5656479360024855e-08, + "loss": 0.0003, + "step": 39795 + }, + { + "epoch": 0.77, + "learning_rate": 4.5652596015688713e-08, + "loss": 0.0005, + "step": 39796 + }, + { + "epoch": 0.77, + "learning_rate": 4.564871267135257e-08, + "loss": 0.0015, + "step": 39797 + }, + { + "epoch": 0.77, + "learning_rate": 4.564482932701642e-08, + "loss": 0.0003, + "step": 39798 + }, + { + "epoch": 0.77, + "learning_rate": 4.564094598268028e-08, + "loss": 0.0021, + "step": 39799 + }, + { + "epoch": 0.77, + "learning_rate": 4.563706263834414e-08, + "loss": 0.0053, + "step": 39800 + }, + { + "epoch": 0.77, + "learning_rate": 4.5633179294008e-08, + "loss": 0.0005, + "step": 39801 + }, + { + "epoch": 0.77, + "learning_rate": 4.5629295949671856e-08, + "loss": 0.0067, + "step": 39802 + }, + { + "epoch": 0.77, + "learning_rate": 4.5625412605335714e-08, + "loss": 0.0004, + "step": 39803 + }, + { + "epoch": 0.77, + "learning_rate": 4.562152926099957e-08, + "loss": 0.0004, + "step": 39804 + }, + { + "epoch": 0.77, + "learning_rate": 4.5617645916663424e-08, + "loss": 0.0006, + "step": 39805 + }, + { + "epoch": 0.77, + "learning_rate": 4.561376257232728e-08, + "loss": 0.0004, + "step": 39806 + }, + { + "epoch": 0.77, + "learning_rate": 4.560987922799114e-08, + "loss": 0.0005, + "step": 39807 + }, + { + "epoch": 0.77, + "learning_rate": 4.5605995883655e-08, + "loss": 0.0004, + "step": 39808 + }, + { + "epoch": 0.77, + "learning_rate": 4.560211253931886e-08, + "loss": 0.0115, + "step": 39809 + }, + { + "epoch": 0.77, + "learning_rate": 4.5598229194982715e-08, + "loss": 0.0004, + "step": 39810 + }, + { + "epoch": 0.77, + "learning_rate": 4.5594345850646574e-08, + "loss": 0.0003, + "step": 39811 + }, + { + "epoch": 0.77, + "learning_rate": 4.559046250631043e-08, + "loss": 0.0004, + "step": 39812 + }, + { + "epoch": 0.77, + "learning_rate": 4.558657916197429e-08, + "loss": 0.0003, + "step": 39813 + }, + { + "epoch": 0.77, + "learning_rate": 4.558269581763815e-08, + "loss": 0.0004, + "step": 39814 + }, + { + "epoch": 0.77, + "learning_rate": 4.5578812473302e-08, + "loss": 0.0005, + "step": 39815 + }, + { + "epoch": 0.77, + "learning_rate": 4.557492912896586e-08, + "loss": 0.0005, + "step": 39816 + }, + { + "epoch": 0.77, + "learning_rate": 4.5571045784629717e-08, + "loss": 0.0007, + "step": 39817 + }, + { + "epoch": 0.77, + "learning_rate": 4.5567162440293575e-08, + "loss": 0.0003, + "step": 39818 + }, + { + "epoch": 0.77, + "learning_rate": 4.556327909595743e-08, + "loss": 0.0003, + "step": 39819 + }, + { + "epoch": 0.77, + "learning_rate": 4.555939575162129e-08, + "loss": 0.0004, + "step": 39820 + }, + { + "epoch": 0.77, + "learning_rate": 4.555551240728515e-08, + "loss": 0.0004, + "step": 39821 + }, + { + "epoch": 0.77, + "learning_rate": 4.555162906294901e-08, + "loss": 0.0004, + "step": 39822 + }, + { + "epoch": 0.77, + "learning_rate": 4.5547745718612866e-08, + "loss": 0.0107, + "step": 39823 + }, + { + "epoch": 0.77, + "learning_rate": 4.5543862374276724e-08, + "loss": 0.001, + "step": 39824 + }, + { + "epoch": 0.77, + "learning_rate": 4.553997902994058e-08, + "loss": 0.0007, + "step": 39825 + }, + { + "epoch": 0.77, + "learning_rate": 4.553609568560444e-08, + "loss": 0.0003, + "step": 39826 + }, + { + "epoch": 0.77, + "learning_rate": 4.55322123412683e-08, + "loss": 1.4234, + "step": 39827 + }, + { + "epoch": 0.77, + "learning_rate": 4.552832899693216e-08, + "loss": 0.0022, + "step": 39828 + }, + { + "epoch": 0.77, + "learning_rate": 4.5524445652596016e-08, + "loss": 0.0017, + "step": 39829 + }, + { + "epoch": 0.77, + "learning_rate": 4.552056230825987e-08, + "loss": 0.0004, + "step": 39830 + }, + { + "epoch": 0.77, + "learning_rate": 4.5516678963923725e-08, + "loss": 0.0003, + "step": 39831 + }, + { + "epoch": 0.77, + "learning_rate": 4.5512795619587584e-08, + "loss": 0.0006, + "step": 39832 + }, + { + "epoch": 0.77, + "learning_rate": 4.550891227525144e-08, + "loss": 0.0003, + "step": 39833 + }, + { + "epoch": 0.77, + "learning_rate": 4.55050289309153e-08, + "loss": 0.0005, + "step": 39834 + }, + { + "epoch": 0.77, + "learning_rate": 4.550114558657916e-08, + "loss": 0.0003, + "step": 39835 + }, + { + "epoch": 0.77, + "learning_rate": 4.5497262242243017e-08, + "loss": 0.0003, + "step": 39836 + }, + { + "epoch": 0.77, + "learning_rate": 4.5493378897906875e-08, + "loss": 0.9019, + "step": 39837 + }, + { + "epoch": 0.77, + "learning_rate": 4.548949555357073e-08, + "loss": 0.0004, + "step": 39838 + }, + { + "epoch": 0.77, + "learning_rate": 4.548561220923459e-08, + "loss": 0.0004, + "step": 39839 + }, + { + "epoch": 0.77, + "learning_rate": 4.548172886489845e-08, + "loss": 0.0002, + "step": 39840 + }, + { + "epoch": 0.77, + "learning_rate": 4.547784552056231e-08, + "loss": 0.0003, + "step": 39841 + }, + { + "epoch": 0.77, + "learning_rate": 4.5473962176226166e-08, + "loss": 0.005, + "step": 39842 + }, + { + "epoch": 0.77, + "learning_rate": 4.5470078831890024e-08, + "loss": 0.0003, + "step": 39843 + }, + { + "epoch": 0.77, + "learning_rate": 4.5466195487553876e-08, + "loss": 0.0396, + "step": 39844 + }, + { + "epoch": 0.77, + "learning_rate": 4.5462312143217734e-08, + "loss": 0.0004, + "step": 39845 + }, + { + "epoch": 0.77, + "learning_rate": 4.545842879888159e-08, + "loss": 0.0004, + "step": 39846 + }, + { + "epoch": 0.77, + "learning_rate": 4.545454545454545e-08, + "loss": 0.0005, + "step": 39847 + }, + { + "epoch": 0.77, + "learning_rate": 4.545066211020931e-08, + "loss": 0.0003, + "step": 39848 + }, + { + "epoch": 0.77, + "learning_rate": 4.544677876587317e-08, + "loss": 0.0004, + "step": 39849 + }, + { + "epoch": 0.77, + "learning_rate": 4.5442895421537025e-08, + "loss": 0.0004, + "step": 39850 + }, + { + "epoch": 0.77, + "learning_rate": 4.5439012077200884e-08, + "loss": 0.0003, + "step": 39851 + }, + { + "epoch": 0.77, + "learning_rate": 4.543512873286474e-08, + "loss": 0.0004, + "step": 39852 + }, + { + "epoch": 0.77, + "learning_rate": 4.54312453885286e-08, + "loss": 0.0003, + "step": 39853 + }, + { + "epoch": 0.77, + "learning_rate": 4.542736204419246e-08, + "loss": 0.0006, + "step": 39854 + }, + { + "epoch": 0.77, + "learning_rate": 4.5423478699856317e-08, + "loss": 0.0006, + "step": 39855 + }, + { + "epoch": 0.77, + "learning_rate": 4.5419595355520175e-08, + "loss": 1.1542, + "step": 39856 + }, + { + "epoch": 0.77, + "learning_rate": 4.541571201118403e-08, + "loss": 0.0004, + "step": 39857 + }, + { + "epoch": 0.77, + "learning_rate": 4.541182866684789e-08, + "loss": 0.0003, + "step": 39858 + }, + { + "epoch": 0.77, + "learning_rate": 4.540794532251174e-08, + "loss": 0.0002, + "step": 39859 + }, + { + "epoch": 0.77, + "learning_rate": 4.54040619781756e-08, + "loss": 0.0004, + "step": 39860 + }, + { + "epoch": 0.77, + "learning_rate": 4.540017863383946e-08, + "loss": 0.0004, + "step": 39861 + }, + { + "epoch": 0.77, + "learning_rate": 4.539629528950332e-08, + "loss": 0.0005, + "step": 39862 + }, + { + "epoch": 0.77, + "learning_rate": 4.5392411945167176e-08, + "loss": 0.0003, + "step": 39863 + }, + { + "epoch": 0.77, + "learning_rate": 4.5388528600831034e-08, + "loss": 0.0005, + "step": 39864 + }, + { + "epoch": 0.77, + "learning_rate": 4.538464525649489e-08, + "loss": 0.0003, + "step": 39865 + }, + { + "epoch": 0.77, + "learning_rate": 4.538076191215875e-08, + "loss": 0.0006, + "step": 39866 + }, + { + "epoch": 0.77, + "learning_rate": 4.537687856782261e-08, + "loss": 0.0003, + "step": 39867 + }, + { + "epoch": 0.77, + "learning_rate": 4.537299522348647e-08, + "loss": 0.0004, + "step": 39868 + }, + { + "epoch": 0.77, + "learning_rate": 4.5369111879150325e-08, + "loss": 0.0007, + "step": 39869 + }, + { + "epoch": 0.77, + "learning_rate": 4.5365228534814184e-08, + "loss": 0.0006, + "step": 39870 + }, + { + "epoch": 0.77, + "learning_rate": 4.536134519047804e-08, + "loss": 0.0005, + "step": 39871 + }, + { + "epoch": 0.77, + "learning_rate": 4.53574618461419e-08, + "loss": 0.0005, + "step": 39872 + }, + { + "epoch": 0.77, + "learning_rate": 4.535357850180575e-08, + "loss": 0.0004, + "step": 39873 + }, + { + "epoch": 0.77, + "learning_rate": 4.534969515746961e-08, + "loss": 0.0004, + "step": 39874 + }, + { + "epoch": 0.77, + "learning_rate": 4.534581181313347e-08, + "loss": 0.0004, + "step": 39875 + }, + { + "epoch": 0.77, + "learning_rate": 4.5341928468797327e-08, + "loss": 0.0142, + "step": 39876 + }, + { + "epoch": 0.77, + "learning_rate": 4.5338045124461185e-08, + "loss": 0.0006, + "step": 39877 + }, + { + "epoch": 0.77, + "learning_rate": 4.533416178012504e-08, + "loss": 0.0014, + "step": 39878 + }, + { + "epoch": 0.77, + "learning_rate": 4.53302784357889e-08, + "loss": 0.0003, + "step": 39879 + }, + { + "epoch": 0.77, + "learning_rate": 4.532639509145276e-08, + "loss": 0.0003, + "step": 39880 + }, + { + "epoch": 0.77, + "learning_rate": 4.532251174711662e-08, + "loss": 0.0004, + "step": 39881 + }, + { + "epoch": 0.77, + "learning_rate": 4.5318628402780476e-08, + "loss": 1.1102, + "step": 39882 + }, + { + "epoch": 0.77, + "learning_rate": 4.5314745058444334e-08, + "loss": 0.0003, + "step": 39883 + }, + { + "epoch": 0.77, + "learning_rate": 4.531086171410819e-08, + "loss": 0.0003, + "step": 39884 + }, + { + "epoch": 0.77, + "learning_rate": 4.530697836977205e-08, + "loss": 0.0979, + "step": 39885 + }, + { + "epoch": 0.77, + "learning_rate": 4.53030950254359e-08, + "loss": 0.0003, + "step": 39886 + }, + { + "epoch": 0.77, + "learning_rate": 4.529921168109976e-08, + "loss": 0.0017, + "step": 39887 + }, + { + "epoch": 0.77, + "learning_rate": 4.529532833676362e-08, + "loss": 0.0004, + "step": 39888 + }, + { + "epoch": 0.77, + "learning_rate": 4.529144499242748e-08, + "loss": 0.095, + "step": 39889 + }, + { + "epoch": 0.77, + "learning_rate": 4.5287561648091335e-08, + "loss": 0.0004, + "step": 39890 + }, + { + "epoch": 0.77, + "learning_rate": 4.5283678303755194e-08, + "loss": 0.0003, + "step": 39891 + }, + { + "epoch": 0.77, + "learning_rate": 4.527979495941905e-08, + "loss": 0.0005, + "step": 39892 + }, + { + "epoch": 0.77, + "learning_rate": 4.527591161508291e-08, + "loss": 0.0021, + "step": 39893 + }, + { + "epoch": 0.77, + "learning_rate": 4.527202827074676e-08, + "loss": 0.0005, + "step": 39894 + }, + { + "epoch": 0.77, + "learning_rate": 4.526814492641062e-08, + "loss": 0.0062, + "step": 39895 + }, + { + "epoch": 0.77, + "learning_rate": 4.526426158207448e-08, + "loss": 0.0004, + "step": 39896 + }, + { + "epoch": 0.77, + "learning_rate": 4.5260378237738336e-08, + "loss": 0.0005, + "step": 39897 + }, + { + "epoch": 0.77, + "learning_rate": 4.5256494893402195e-08, + "loss": 0.0004, + "step": 39898 + }, + { + "epoch": 0.77, + "learning_rate": 4.525261154906605e-08, + "loss": 0.0005, + "step": 39899 + }, + { + "epoch": 0.77, + "learning_rate": 4.524872820472991e-08, + "loss": 0.0005, + "step": 39900 + }, + { + "epoch": 0.77, + "learning_rate": 4.524484486039377e-08, + "loss": 0.0004, + "step": 39901 + }, + { + "epoch": 0.77, + "learning_rate": 4.524096151605762e-08, + "loss": 0.0004, + "step": 39902 + }, + { + "epoch": 0.77, + "learning_rate": 4.523707817172148e-08, + "loss": 0.0004, + "step": 39903 + }, + { + "epoch": 0.77, + "learning_rate": 4.523319482738534e-08, + "loss": 0.0003, + "step": 39904 + }, + { + "epoch": 0.77, + "learning_rate": 4.5229311483049196e-08, + "loss": 0.0004, + "step": 39905 + }, + { + "epoch": 0.77, + "learning_rate": 4.5225428138713054e-08, + "loss": 0.0003, + "step": 39906 + }, + { + "epoch": 0.77, + "learning_rate": 4.522154479437691e-08, + "loss": 0.0004, + "step": 39907 + }, + { + "epoch": 0.77, + "learning_rate": 4.521766145004077e-08, + "loss": 0.0004, + "step": 39908 + }, + { + "epoch": 0.77, + "learning_rate": 4.521377810570463e-08, + "loss": 0.0006, + "step": 39909 + }, + { + "epoch": 0.77, + "learning_rate": 4.520989476136849e-08, + "loss": 0.0006, + "step": 39910 + }, + { + "epoch": 0.77, + "learning_rate": 4.5206011417032345e-08, + "loss": 0.0003, + "step": 39911 + }, + { + "epoch": 0.77, + "learning_rate": 4.5202128072696203e-08, + "loss": 0.0004, + "step": 39912 + }, + { + "epoch": 0.77, + "learning_rate": 4.519824472836006e-08, + "loss": 0.0003, + "step": 39913 + }, + { + "epoch": 0.77, + "learning_rate": 4.519436138402392e-08, + "loss": 0.0006, + "step": 39914 + }, + { + "epoch": 0.77, + "learning_rate": 4.519047803968778e-08, + "loss": 0.0004, + "step": 39915 + }, + { + "epoch": 0.77, + "learning_rate": 4.5186594695351636e-08, + "loss": 0.0005, + "step": 39916 + }, + { + "epoch": 0.77, + "learning_rate": 4.518271135101549e-08, + "loss": 0.0003, + "step": 39917 + }, + { + "epoch": 0.77, + "learning_rate": 4.5178828006679346e-08, + "loss": 0.0006, + "step": 39918 + }, + { + "epoch": 0.77, + "learning_rate": 4.5174944662343205e-08, + "loss": 0.0004, + "step": 39919 + }, + { + "epoch": 0.77, + "learning_rate": 4.517106131800706e-08, + "loss": 0.0006, + "step": 39920 + }, + { + "epoch": 0.77, + "learning_rate": 4.516717797367092e-08, + "loss": 1.587, + "step": 39921 + }, + { + "epoch": 0.77, + "learning_rate": 4.516329462933478e-08, + "loss": 1.0078, + "step": 39922 + }, + { + "epoch": 0.77, + "learning_rate": 4.515941128499864e-08, + "loss": 0.0004, + "step": 39923 + }, + { + "epoch": 0.77, + "learning_rate": 4.5155527940662496e-08, + "loss": 0.0005, + "step": 39924 + }, + { + "epoch": 0.77, + "learning_rate": 4.5151644596326354e-08, + "loss": 0.0004, + "step": 39925 + }, + { + "epoch": 0.77, + "learning_rate": 4.514776125199021e-08, + "loss": 0.0005, + "step": 39926 + }, + { + "epoch": 0.77, + "learning_rate": 4.514387790765407e-08, + "loss": 0.0004, + "step": 39927 + }, + { + "epoch": 0.77, + "learning_rate": 4.513999456331793e-08, + "loss": 0.0005, + "step": 39928 + }, + { + "epoch": 0.77, + "learning_rate": 4.513611121898179e-08, + "loss": 0.1833, + "step": 39929 + }, + { + "epoch": 0.77, + "learning_rate": 4.5132227874645645e-08, + "loss": 0.0007, + "step": 39930 + }, + { + "epoch": 0.77, + "learning_rate": 4.51283445303095e-08, + "loss": 0.0004, + "step": 39931 + }, + { + "epoch": 0.77, + "learning_rate": 4.5124461185973355e-08, + "loss": 0.0003, + "step": 39932 + }, + { + "epoch": 0.77, + "learning_rate": 4.5120577841637213e-08, + "loss": 0.0002, + "step": 39933 + }, + { + "epoch": 0.77, + "learning_rate": 4.511669449730107e-08, + "loss": 0.0004, + "step": 39934 + }, + { + "epoch": 0.77, + "learning_rate": 4.511281115296493e-08, + "loss": 0.0004, + "step": 39935 + }, + { + "epoch": 0.77, + "learning_rate": 4.510892780862879e-08, + "loss": 0.0004, + "step": 39936 + }, + { + "epoch": 0.77, + "learning_rate": 4.5105044464292646e-08, + "loss": 0.0004, + "step": 39937 + }, + { + "epoch": 0.77, + "learning_rate": 4.5101161119956505e-08, + "loss": 0.0004, + "step": 39938 + }, + { + "epoch": 0.77, + "learning_rate": 4.509727777562036e-08, + "loss": 0.0003, + "step": 39939 + }, + { + "epoch": 0.77, + "learning_rate": 4.509339443128422e-08, + "loss": 0.0004, + "step": 39940 + }, + { + "epoch": 0.77, + "learning_rate": 4.508951108694808e-08, + "loss": 0.0062, + "step": 39941 + }, + { + "epoch": 0.77, + "learning_rate": 4.508562774261194e-08, + "loss": 0.0002, + "step": 39942 + }, + { + "epoch": 0.77, + "learning_rate": 4.5081744398275796e-08, + "loss": 1.3888, + "step": 39943 + }, + { + "epoch": 0.77, + "learning_rate": 4.5077861053939654e-08, + "loss": 0.0004, + "step": 39944 + }, + { + "epoch": 0.77, + "learning_rate": 4.507397770960351e-08, + "loss": 0.001, + "step": 39945 + }, + { + "epoch": 0.77, + "learning_rate": 4.5070094365267364e-08, + "loss": 1.2491, + "step": 39946 + }, + { + "epoch": 0.77, + "learning_rate": 4.506621102093122e-08, + "loss": 0.0006, + "step": 39947 + }, + { + "epoch": 0.77, + "learning_rate": 4.506232767659508e-08, + "loss": 0.0013, + "step": 39948 + }, + { + "epoch": 0.77, + "learning_rate": 4.505844433225894e-08, + "loss": 0.0098, + "step": 39949 + }, + { + "epoch": 0.77, + "learning_rate": 4.50545609879228e-08, + "loss": 0.0005, + "step": 39950 + }, + { + "epoch": 0.77, + "learning_rate": 4.5050677643586655e-08, + "loss": 0.0003, + "step": 39951 + }, + { + "epoch": 0.77, + "learning_rate": 4.5046794299250513e-08, + "loss": 0.0004, + "step": 39952 + }, + { + "epoch": 0.78, + "learning_rate": 4.504291095491437e-08, + "loss": 0.0003, + "step": 39953 + }, + { + "epoch": 0.78, + "learning_rate": 4.503902761057823e-08, + "loss": 0.0004, + "step": 39954 + }, + { + "epoch": 0.78, + "learning_rate": 4.503514426624209e-08, + "loss": 0.9279, + "step": 39955 + }, + { + "epoch": 0.78, + "learning_rate": 4.5031260921905946e-08, + "loss": 0.0004, + "step": 39956 + }, + { + "epoch": 0.78, + "learning_rate": 4.5027377577569805e-08, + "loss": 0.0005, + "step": 39957 + }, + { + "epoch": 0.78, + "learning_rate": 4.502349423323366e-08, + "loss": 0.0005, + "step": 39958 + }, + { + "epoch": 0.78, + "learning_rate": 4.501961088889752e-08, + "loss": 0.0003, + "step": 39959 + }, + { + "epoch": 0.78, + "learning_rate": 4.501572754456137e-08, + "loss": 0.0005, + "step": 39960 + }, + { + "epoch": 0.78, + "learning_rate": 4.501184420022523e-08, + "loss": 0.0052, + "step": 39961 + }, + { + "epoch": 0.78, + "learning_rate": 4.500796085588909e-08, + "loss": 0.001, + "step": 39962 + }, + { + "epoch": 0.78, + "learning_rate": 4.500407751155295e-08, + "loss": 0.0005, + "step": 39963 + }, + { + "epoch": 0.78, + "learning_rate": 4.5000194167216806e-08, + "loss": 0.0005, + "step": 39964 + }, + { + "epoch": 0.78, + "learning_rate": 4.4996310822880664e-08, + "loss": 0.7405, + "step": 39965 + }, + { + "epoch": 0.78, + "learning_rate": 4.499242747854452e-08, + "loss": 0.2258, + "step": 39966 + }, + { + "epoch": 0.78, + "learning_rate": 4.498854413420838e-08, + "loss": 0.0005, + "step": 39967 + }, + { + "epoch": 0.78, + "learning_rate": 4.498466078987224e-08, + "loss": 0.0008, + "step": 39968 + }, + { + "epoch": 0.78, + "learning_rate": 4.49807774455361e-08, + "loss": 0.0005, + "step": 39969 + }, + { + "epoch": 0.78, + "learning_rate": 4.4976894101199955e-08, + "loss": 0.0011, + "step": 39970 + }, + { + "epoch": 0.78, + "learning_rate": 4.4973010756863813e-08, + "loss": 0.1289, + "step": 39971 + }, + { + "epoch": 0.78, + "learning_rate": 4.496912741252767e-08, + "loss": 0.0005, + "step": 39972 + }, + { + "epoch": 0.78, + "learning_rate": 4.496524406819153e-08, + "loss": 0.0006, + "step": 39973 + }, + { + "epoch": 0.78, + "learning_rate": 4.496136072385539e-08, + "loss": 0.0007, + "step": 39974 + }, + { + "epoch": 0.78, + "learning_rate": 4.495747737951924e-08, + "loss": 0.0005, + "step": 39975 + }, + { + "epoch": 0.78, + "learning_rate": 4.49535940351831e-08, + "loss": 0.0004, + "step": 39976 + }, + { + "epoch": 0.78, + "learning_rate": 4.4949710690846956e-08, + "loss": 0.0004, + "step": 39977 + }, + { + "epoch": 0.78, + "learning_rate": 4.4945827346510815e-08, + "loss": 0.0004, + "step": 39978 + }, + { + "epoch": 0.78, + "learning_rate": 4.494194400217467e-08, + "loss": 0.0004, + "step": 39979 + }, + { + "epoch": 0.78, + "learning_rate": 4.493806065783853e-08, + "loss": 0.0006, + "step": 39980 + }, + { + "epoch": 0.78, + "learning_rate": 4.493417731350239e-08, + "loss": 0.0003, + "step": 39981 + }, + { + "epoch": 0.78, + "learning_rate": 4.493029396916624e-08, + "loss": 0.0003, + "step": 39982 + }, + { + "epoch": 0.78, + "learning_rate": 4.49264106248301e-08, + "loss": 0.0004, + "step": 39983 + }, + { + "epoch": 0.78, + "learning_rate": 4.492252728049396e-08, + "loss": 0.0005, + "step": 39984 + }, + { + "epoch": 0.78, + "learning_rate": 4.4918643936157816e-08, + "loss": 0.0004, + "step": 39985 + }, + { + "epoch": 0.78, + "learning_rate": 4.4914760591821674e-08, + "loss": 1.14, + "step": 39986 + }, + { + "epoch": 0.78, + "learning_rate": 4.491087724748553e-08, + "loss": 0.0005, + "step": 39987 + }, + { + "epoch": 0.78, + "learning_rate": 4.490699390314939e-08, + "loss": 0.0025, + "step": 39988 + }, + { + "epoch": 0.78, + "learning_rate": 4.490311055881325e-08, + "loss": 0.0004, + "step": 39989 + }, + { + "epoch": 0.78, + "learning_rate": 4.48992272144771e-08, + "loss": 0.0003, + "step": 39990 + }, + { + "epoch": 0.78, + "learning_rate": 4.489534387014096e-08, + "loss": 0.0005, + "step": 39991 + }, + { + "epoch": 0.78, + "learning_rate": 4.489146052580482e-08, + "loss": 0.0015, + "step": 39992 + }, + { + "epoch": 0.78, + "learning_rate": 4.4887577181468675e-08, + "loss": 0.0004, + "step": 39993 + }, + { + "epoch": 0.78, + "learning_rate": 4.488369383713253e-08, + "loss": 0.0035, + "step": 39994 + }, + { + "epoch": 0.78, + "learning_rate": 4.487981049279639e-08, + "loss": 0.0004, + "step": 39995 + }, + { + "epoch": 0.78, + "learning_rate": 4.487592714846025e-08, + "loss": 0.0004, + "step": 39996 + }, + { + "epoch": 0.78, + "learning_rate": 4.487204380412411e-08, + "loss": 0.0004, + "step": 39997 + }, + { + "epoch": 0.78, + "learning_rate": 4.4868160459787966e-08, + "loss": 0.3625, + "step": 39998 + }, + { + "epoch": 0.78, + "learning_rate": 4.4864277115451824e-08, + "loss": 0.0004, + "step": 39999 + }, + { + "epoch": 0.78, + "learning_rate": 4.486039377111568e-08, + "loss": 0.0004, + "step": 40000 + }, + { + "epoch": 0.78, + "learning_rate": 4.485651042677954e-08, + "loss": 0.0003, + "step": 40001 + }, + { + "epoch": 0.78, + "learning_rate": 4.48526270824434e-08, + "loss": 0.0004, + "step": 40002 + }, + { + "epoch": 0.78, + "learning_rate": 4.484874373810726e-08, + "loss": 0.0005, + "step": 40003 + }, + { + "epoch": 0.78, + "learning_rate": 4.484486039377111e-08, + "loss": 0.0006, + "step": 40004 + }, + { + "epoch": 0.78, + "learning_rate": 4.484097704943497e-08, + "loss": 0.0005, + "step": 40005 + }, + { + "epoch": 0.78, + "learning_rate": 4.4837093705098826e-08, + "loss": 0.7568, + "step": 40006 + }, + { + "epoch": 0.78, + "learning_rate": 4.4833210360762684e-08, + "loss": 0.3418, + "step": 40007 + }, + { + "epoch": 0.78, + "learning_rate": 4.482932701642654e-08, + "loss": 0.0008, + "step": 40008 + }, + { + "epoch": 0.78, + "learning_rate": 4.48254436720904e-08, + "loss": 0.0006, + "step": 40009 + }, + { + "epoch": 0.78, + "learning_rate": 4.482156032775426e-08, + "loss": 0.0005, + "step": 40010 + }, + { + "epoch": 0.78, + "learning_rate": 4.481767698341812e-08, + "loss": 0.0003, + "step": 40011 + }, + { + "epoch": 0.78, + "learning_rate": 4.4813793639081975e-08, + "loss": 1.1857, + "step": 40012 + }, + { + "epoch": 0.78, + "learning_rate": 4.480991029474583e-08, + "loss": 0.0006, + "step": 40013 + }, + { + "epoch": 0.78, + "learning_rate": 4.480602695040969e-08, + "loss": 0.0007, + "step": 40014 + }, + { + "epoch": 0.78, + "learning_rate": 4.480214360607355e-08, + "loss": 0.0005, + "step": 40015 + }, + { + "epoch": 0.78, + "learning_rate": 4.479826026173741e-08, + "loss": 0.0057, + "step": 40016 + }, + { + "epoch": 0.78, + "learning_rate": 4.4794376917401266e-08, + "loss": 1.2381, + "step": 40017 + }, + { + "epoch": 0.78, + "learning_rate": 4.479049357306512e-08, + "loss": 0.0005, + "step": 40018 + }, + { + "epoch": 0.78, + "learning_rate": 4.4786610228728976e-08, + "loss": 1.0476, + "step": 40019 + }, + { + "epoch": 0.78, + "learning_rate": 4.4782726884392834e-08, + "loss": 0.0005, + "step": 40020 + }, + { + "epoch": 0.78, + "learning_rate": 4.477884354005669e-08, + "loss": 0.0003, + "step": 40021 + }, + { + "epoch": 0.78, + "learning_rate": 4.477496019572055e-08, + "loss": 0.9177, + "step": 40022 + }, + { + "epoch": 0.78, + "learning_rate": 4.477107685138441e-08, + "loss": 0.0005, + "step": 40023 + }, + { + "epoch": 0.78, + "learning_rate": 4.476719350704827e-08, + "loss": 0.0284, + "step": 40024 + }, + { + "epoch": 0.78, + "learning_rate": 4.4763310162712126e-08, + "loss": 0.0005, + "step": 40025 + }, + { + "epoch": 0.78, + "learning_rate": 4.4759426818375984e-08, + "loss": 0.0007, + "step": 40026 + }, + { + "epoch": 0.78, + "learning_rate": 4.475554347403984e-08, + "loss": 0.0005, + "step": 40027 + }, + { + "epoch": 0.78, + "learning_rate": 4.47516601297037e-08, + "loss": 0.0008, + "step": 40028 + }, + { + "epoch": 0.78, + "learning_rate": 4.474777678536756e-08, + "loss": 0.0012, + "step": 40029 + }, + { + "epoch": 0.78, + "learning_rate": 4.474389344103142e-08, + "loss": 0.0004, + "step": 40030 + }, + { + "epoch": 0.78, + "learning_rate": 4.4740010096695275e-08, + "loss": 0.0005, + "step": 40031 + }, + { + "epoch": 0.78, + "learning_rate": 4.473612675235913e-08, + "loss": 0.7044, + "step": 40032 + }, + { + "epoch": 0.78, + "learning_rate": 4.4732243408022985e-08, + "loss": 0.0005, + "step": 40033 + }, + { + "epoch": 0.78, + "learning_rate": 4.472836006368684e-08, + "loss": 0.0004, + "step": 40034 + }, + { + "epoch": 0.78, + "learning_rate": 4.47244767193507e-08, + "loss": 0.0004, + "step": 40035 + }, + { + "epoch": 0.78, + "learning_rate": 4.472059337501456e-08, + "loss": 0.0005, + "step": 40036 + }, + { + "epoch": 0.78, + "learning_rate": 4.471671003067842e-08, + "loss": 0.0005, + "step": 40037 + }, + { + "epoch": 0.78, + "learning_rate": 4.4712826686342276e-08, + "loss": 0.004, + "step": 40038 + }, + { + "epoch": 0.78, + "learning_rate": 4.4708943342006134e-08, + "loss": 0.0004, + "step": 40039 + }, + { + "epoch": 0.78, + "learning_rate": 4.470505999766999e-08, + "loss": 0.0005, + "step": 40040 + }, + { + "epoch": 0.78, + "learning_rate": 4.470117665333385e-08, + "loss": 0.0047, + "step": 40041 + }, + { + "epoch": 0.78, + "learning_rate": 4.469729330899771e-08, + "loss": 0.0004, + "step": 40042 + }, + { + "epoch": 0.78, + "learning_rate": 4.469340996466157e-08, + "loss": 0.0675, + "step": 40043 + }, + { + "epoch": 0.78, + "learning_rate": 4.4689526620325426e-08, + "loss": 0.0006, + "step": 40044 + }, + { + "epoch": 0.78, + "learning_rate": 4.4685643275989284e-08, + "loss": 0.0004, + "step": 40045 + }, + { + "epoch": 0.78, + "learning_rate": 4.468175993165314e-08, + "loss": 0.0005, + "step": 40046 + }, + { + "epoch": 0.78, + "learning_rate": 4.4677876587316994e-08, + "loss": 0.0003, + "step": 40047 + }, + { + "epoch": 0.78, + "learning_rate": 4.467399324298085e-08, + "loss": 0.0004, + "step": 40048 + }, + { + "epoch": 0.78, + "learning_rate": 4.467010989864471e-08, + "loss": 0.0004, + "step": 40049 + }, + { + "epoch": 0.78, + "learning_rate": 4.466622655430857e-08, + "loss": 0.0154, + "step": 40050 + }, + { + "epoch": 0.78, + "learning_rate": 4.4662343209972427e-08, + "loss": 0.0005, + "step": 40051 + }, + { + "epoch": 0.78, + "learning_rate": 4.4658459865636285e-08, + "loss": 0.0004, + "step": 40052 + }, + { + "epoch": 0.78, + "learning_rate": 4.465457652130014e-08, + "loss": 0.0073, + "step": 40053 + }, + { + "epoch": 0.78, + "learning_rate": 4.4650693176964e-08, + "loss": 0.0005, + "step": 40054 + }, + { + "epoch": 0.78, + "learning_rate": 4.464680983262786e-08, + "loss": 0.004, + "step": 40055 + }, + { + "epoch": 0.78, + "learning_rate": 4.464292648829172e-08, + "loss": 0.0004, + "step": 40056 + }, + { + "epoch": 0.78, + "learning_rate": 4.4639043143955576e-08, + "loss": 0.0004, + "step": 40057 + }, + { + "epoch": 0.78, + "learning_rate": 4.4635159799619434e-08, + "loss": 0.0005, + "step": 40058 + }, + { + "epoch": 0.78, + "learning_rate": 4.463127645528329e-08, + "loss": 0.0005, + "step": 40059 + }, + { + "epoch": 0.78, + "learning_rate": 4.462739311094715e-08, + "loss": 0.0004, + "step": 40060 + }, + { + "epoch": 0.78, + "learning_rate": 4.462350976661101e-08, + "loss": 0.0004, + "step": 40061 + }, + { + "epoch": 0.78, + "learning_rate": 4.461962642227486e-08, + "loss": 0.0007, + "step": 40062 + }, + { + "epoch": 0.78, + "learning_rate": 4.461574307793872e-08, + "loss": 0.0004, + "step": 40063 + }, + { + "epoch": 0.78, + "learning_rate": 4.461185973360258e-08, + "loss": 0.0299, + "step": 40064 + }, + { + "epoch": 0.78, + "learning_rate": 4.4607976389266435e-08, + "loss": 0.0003, + "step": 40065 + }, + { + "epoch": 0.78, + "learning_rate": 4.4604093044930294e-08, + "loss": 0.0005, + "step": 40066 + }, + { + "epoch": 0.78, + "learning_rate": 4.460020970059415e-08, + "loss": 0.0003, + "step": 40067 + }, + { + "epoch": 0.78, + "learning_rate": 4.459632635625801e-08, + "loss": 0.0008, + "step": 40068 + }, + { + "epoch": 0.78, + "learning_rate": 4.459244301192187e-08, + "loss": 0.0005, + "step": 40069 + }, + { + "epoch": 0.78, + "learning_rate": 4.4588559667585727e-08, + "loss": 0.0005, + "step": 40070 + }, + { + "epoch": 0.78, + "learning_rate": 4.458467632324958e-08, + "loss": 0.0004, + "step": 40071 + }, + { + "epoch": 0.78, + "learning_rate": 4.4580792978913437e-08, + "loss": 0.3035, + "step": 40072 + }, + { + "epoch": 0.78, + "learning_rate": 4.4576909634577295e-08, + "loss": 0.0004, + "step": 40073 + }, + { + "epoch": 0.78, + "learning_rate": 4.457302629024115e-08, + "loss": 0.003, + "step": 40074 + }, + { + "epoch": 0.78, + "learning_rate": 4.456914294590501e-08, + "loss": 0.0004, + "step": 40075 + }, + { + "epoch": 0.78, + "learning_rate": 4.456525960156887e-08, + "loss": 0.0004, + "step": 40076 + }, + { + "epoch": 0.78, + "learning_rate": 4.456137625723273e-08, + "loss": 2.0468, + "step": 40077 + }, + { + "epoch": 0.78, + "learning_rate": 4.455749291289658e-08, + "loss": 0.0004, + "step": 40078 + }, + { + "epoch": 0.78, + "learning_rate": 4.455360956856044e-08, + "loss": 0.0003, + "step": 40079 + }, + { + "epoch": 0.78, + "learning_rate": 4.4549726224224296e-08, + "loss": 0.0004, + "step": 40080 + }, + { + "epoch": 0.78, + "learning_rate": 4.4545842879888154e-08, + "loss": 0.0491, + "step": 40081 + }, + { + "epoch": 0.78, + "learning_rate": 4.454195953555201e-08, + "loss": 0.0002, + "step": 40082 + }, + { + "epoch": 0.78, + "learning_rate": 4.453807619121587e-08, + "loss": 0.0238, + "step": 40083 + }, + { + "epoch": 0.78, + "learning_rate": 4.453419284687973e-08, + "loss": 0.0005, + "step": 40084 + }, + { + "epoch": 0.78, + "learning_rate": 4.453030950254359e-08, + "loss": 0.0005, + "step": 40085 + }, + { + "epoch": 0.78, + "learning_rate": 4.4526426158207445e-08, + "loss": 0.0005, + "step": 40086 + }, + { + "epoch": 0.78, + "learning_rate": 4.4522542813871304e-08, + "loss": 0.0005, + "step": 40087 + }, + { + "epoch": 0.78, + "learning_rate": 4.451865946953516e-08, + "loss": 0.0006, + "step": 40088 + }, + { + "epoch": 0.78, + "learning_rate": 4.451477612519902e-08, + "loss": 0.0004, + "step": 40089 + }, + { + "epoch": 0.78, + "learning_rate": 4.451089278086288e-08, + "loss": 0.0003, + "step": 40090 + }, + { + "epoch": 0.78, + "learning_rate": 4.450700943652673e-08, + "loss": 0.0004, + "step": 40091 + }, + { + "epoch": 0.78, + "learning_rate": 4.450312609219059e-08, + "loss": 0.0005, + "step": 40092 + }, + { + "epoch": 0.78, + "learning_rate": 4.4499242747854446e-08, + "loss": 0.0005, + "step": 40093 + }, + { + "epoch": 0.78, + "learning_rate": 4.4495359403518305e-08, + "loss": 0.4942, + "step": 40094 + }, + { + "epoch": 0.78, + "learning_rate": 4.449147605918216e-08, + "loss": 0.382, + "step": 40095 + }, + { + "epoch": 0.78, + "learning_rate": 4.448759271484602e-08, + "loss": 0.0004, + "step": 40096 + }, + { + "epoch": 0.78, + "learning_rate": 4.448370937050988e-08, + "loss": 0.0003, + "step": 40097 + }, + { + "epoch": 0.78, + "learning_rate": 4.447982602617374e-08, + "loss": 0.0005, + "step": 40098 + }, + { + "epoch": 0.78, + "learning_rate": 4.4475942681837596e-08, + "loss": 0.0002, + "step": 40099 + }, + { + "epoch": 0.78, + "learning_rate": 4.4472059337501454e-08, + "loss": 0.0004, + "step": 40100 + }, + { + "epoch": 0.78, + "learning_rate": 4.446817599316531e-08, + "loss": 0.0003, + "step": 40101 + }, + { + "epoch": 0.78, + "learning_rate": 4.446429264882917e-08, + "loss": 0.0008, + "step": 40102 + }, + { + "epoch": 0.78, + "learning_rate": 4.446040930449303e-08, + "loss": 0.0005, + "step": 40103 + }, + { + "epoch": 0.78, + "learning_rate": 4.445652596015689e-08, + "loss": 0.0004, + "step": 40104 + }, + { + "epoch": 0.78, + "learning_rate": 4.445264261582074e-08, + "loss": 0.0004, + "step": 40105 + }, + { + "epoch": 0.78, + "learning_rate": 4.44487592714846e-08, + "loss": 0.7383, + "step": 40106 + }, + { + "epoch": 0.78, + "learning_rate": 4.4444875927148455e-08, + "loss": 0.0003, + "step": 40107 + }, + { + "epoch": 0.78, + "learning_rate": 4.4440992582812313e-08, + "loss": 0.0003, + "step": 40108 + }, + { + "epoch": 0.78, + "learning_rate": 4.443710923847617e-08, + "loss": 0.0002, + "step": 40109 + }, + { + "epoch": 0.78, + "learning_rate": 4.443322589414003e-08, + "loss": 0.0004, + "step": 40110 + }, + { + "epoch": 0.78, + "learning_rate": 4.442934254980389e-08, + "loss": 0.0011, + "step": 40111 + }, + { + "epoch": 0.78, + "learning_rate": 4.4425459205467746e-08, + "loss": 0.0004, + "step": 40112 + }, + { + "epoch": 0.78, + "learning_rate": 4.4421575861131605e-08, + "loss": 0.0012, + "step": 40113 + }, + { + "epoch": 0.78, + "learning_rate": 4.441769251679546e-08, + "loss": 0.0004, + "step": 40114 + }, + { + "epoch": 0.78, + "learning_rate": 4.441380917245932e-08, + "loss": 0.0003, + "step": 40115 + }, + { + "epoch": 0.78, + "learning_rate": 4.440992582812318e-08, + "loss": 0.0004, + "step": 40116 + }, + { + "epoch": 0.78, + "learning_rate": 4.440604248378704e-08, + "loss": 0.0003, + "step": 40117 + }, + { + "epoch": 0.78, + "learning_rate": 4.4402159139450896e-08, + "loss": 0.0004, + "step": 40118 + }, + { + "epoch": 0.78, + "learning_rate": 4.4398275795114754e-08, + "loss": 0.0004, + "step": 40119 + }, + { + "epoch": 0.78, + "learning_rate": 4.4394392450778606e-08, + "loss": 0.0003, + "step": 40120 + }, + { + "epoch": 0.78, + "learning_rate": 4.4390509106442464e-08, + "loss": 0.0004, + "step": 40121 + }, + { + "epoch": 0.78, + "learning_rate": 4.438662576210632e-08, + "loss": 0.0004, + "step": 40122 + }, + { + "epoch": 0.78, + "learning_rate": 4.438274241777018e-08, + "loss": 0.0003, + "step": 40123 + }, + { + "epoch": 0.78, + "learning_rate": 4.437885907343404e-08, + "loss": 0.0004, + "step": 40124 + }, + { + "epoch": 0.78, + "learning_rate": 4.43749757290979e-08, + "loss": 0.0044, + "step": 40125 + }, + { + "epoch": 0.78, + "learning_rate": 4.4371092384761755e-08, + "loss": 0.0004, + "step": 40126 + }, + { + "epoch": 0.78, + "learning_rate": 4.4367209040425614e-08, + "loss": 0.0005, + "step": 40127 + }, + { + "epoch": 0.78, + "learning_rate": 4.436332569608947e-08, + "loss": 0.0004, + "step": 40128 + }, + { + "epoch": 0.78, + "learning_rate": 4.435944235175333e-08, + "loss": 0.0005, + "step": 40129 + }, + { + "epoch": 0.78, + "learning_rate": 4.435555900741719e-08, + "loss": 0.0004, + "step": 40130 + }, + { + "epoch": 0.78, + "learning_rate": 4.4351675663081046e-08, + "loss": 0.0005, + "step": 40131 + }, + { + "epoch": 0.78, + "learning_rate": 4.4347792318744905e-08, + "loss": 0.0424, + "step": 40132 + }, + { + "epoch": 0.78, + "learning_rate": 4.434390897440876e-08, + "loss": 0.0004, + "step": 40133 + }, + { + "epoch": 0.78, + "learning_rate": 4.4340025630072615e-08, + "loss": 0.0002, + "step": 40134 + }, + { + "epoch": 0.78, + "learning_rate": 4.433614228573647e-08, + "loss": 0.0004, + "step": 40135 + }, + { + "epoch": 0.78, + "learning_rate": 4.433225894140033e-08, + "loss": 0.7565, + "step": 40136 + }, + { + "epoch": 0.78, + "learning_rate": 4.432837559706419e-08, + "loss": 0.0004, + "step": 40137 + }, + { + "epoch": 0.78, + "learning_rate": 4.432449225272805e-08, + "loss": 0.0005, + "step": 40138 + }, + { + "epoch": 0.78, + "learning_rate": 4.4320608908391906e-08, + "loss": 0.0003, + "step": 40139 + }, + { + "epoch": 0.78, + "learning_rate": 4.4316725564055764e-08, + "loss": 0.0007, + "step": 40140 + }, + { + "epoch": 0.78, + "learning_rate": 4.431284221971962e-08, + "loss": 0.0004, + "step": 40141 + }, + { + "epoch": 0.78, + "learning_rate": 4.430895887538348e-08, + "loss": 0.0026, + "step": 40142 + }, + { + "epoch": 0.78, + "learning_rate": 4.430507553104734e-08, + "loss": 0.0004, + "step": 40143 + }, + { + "epoch": 0.78, + "learning_rate": 4.43011921867112e-08, + "loss": 0.0639, + "step": 40144 + }, + { + "epoch": 0.78, + "learning_rate": 4.4297308842375055e-08, + "loss": 0.0006, + "step": 40145 + }, + { + "epoch": 0.78, + "learning_rate": 4.4293425498038914e-08, + "loss": 0.0004, + "step": 40146 + }, + { + "epoch": 0.78, + "learning_rate": 4.428954215370277e-08, + "loss": 0.0007, + "step": 40147 + }, + { + "epoch": 0.78, + "learning_rate": 4.428565880936663e-08, + "loss": 0.0007, + "step": 40148 + }, + { + "epoch": 0.78, + "learning_rate": 4.428177546503048e-08, + "loss": 0.0007, + "step": 40149 + }, + { + "epoch": 0.78, + "learning_rate": 4.427789212069434e-08, + "loss": 0.0004, + "step": 40150 + }, + { + "epoch": 0.78, + "learning_rate": 4.42740087763582e-08, + "loss": 0.0008, + "step": 40151 + }, + { + "epoch": 0.78, + "learning_rate": 4.4270125432022056e-08, + "loss": 0.0003, + "step": 40152 + }, + { + "epoch": 0.78, + "learning_rate": 4.4266242087685915e-08, + "loss": 0.0004, + "step": 40153 + }, + { + "epoch": 0.78, + "learning_rate": 4.426235874334977e-08, + "loss": 0.0005, + "step": 40154 + }, + { + "epoch": 0.78, + "learning_rate": 4.425847539901363e-08, + "loss": 0.0005, + "step": 40155 + }, + { + "epoch": 0.78, + "learning_rate": 4.425459205467749e-08, + "loss": 0.0003, + "step": 40156 + }, + { + "epoch": 0.78, + "learning_rate": 4.425070871034135e-08, + "loss": 0.0003, + "step": 40157 + }, + { + "epoch": 0.78, + "learning_rate": 4.4246825366005206e-08, + "loss": 0.0004, + "step": 40158 + }, + { + "epoch": 0.78, + "learning_rate": 4.424294202166906e-08, + "loss": 0.0004, + "step": 40159 + }, + { + "epoch": 0.78, + "learning_rate": 4.4239058677332916e-08, + "loss": 0.0005, + "step": 40160 + }, + { + "epoch": 0.78, + "learning_rate": 4.4235175332996774e-08, + "loss": 0.0004, + "step": 40161 + }, + { + "epoch": 0.78, + "learning_rate": 4.423129198866063e-08, + "loss": 0.0004, + "step": 40162 + }, + { + "epoch": 0.78, + "learning_rate": 4.422740864432449e-08, + "loss": 0.0003, + "step": 40163 + }, + { + "epoch": 0.78, + "learning_rate": 4.422352529998835e-08, + "loss": 0.0006, + "step": 40164 + }, + { + "epoch": 0.78, + "learning_rate": 4.421964195565221e-08, + "loss": 0.0003, + "step": 40165 + }, + { + "epoch": 0.78, + "learning_rate": 4.4215758611316065e-08, + "loss": 0.0004, + "step": 40166 + }, + { + "epoch": 0.78, + "learning_rate": 4.421187526697992e-08, + "loss": 0.0003, + "step": 40167 + }, + { + "epoch": 0.78, + "learning_rate": 4.4207991922643775e-08, + "loss": 0.1737, + "step": 40168 + }, + { + "epoch": 0.78, + "learning_rate": 4.420410857830763e-08, + "loss": 0.0006, + "step": 40169 + }, + { + "epoch": 0.78, + "learning_rate": 4.420022523397149e-08, + "loss": 0.0006, + "step": 40170 + }, + { + "epoch": 0.78, + "learning_rate": 4.419634188963535e-08, + "loss": 0.0004, + "step": 40171 + }, + { + "epoch": 0.78, + "learning_rate": 4.419245854529921e-08, + "loss": 0.0003, + "step": 40172 + }, + { + "epoch": 0.78, + "learning_rate": 4.4188575200963066e-08, + "loss": 0.0003, + "step": 40173 + }, + { + "epoch": 0.78, + "learning_rate": 4.4184691856626925e-08, + "loss": 0.0004, + "step": 40174 + }, + { + "epoch": 0.78, + "learning_rate": 4.418080851229078e-08, + "loss": 0.0003, + "step": 40175 + }, + { + "epoch": 0.78, + "learning_rate": 4.417692516795464e-08, + "loss": 0.0004, + "step": 40176 + }, + { + "epoch": 0.78, + "learning_rate": 4.41730418236185e-08, + "loss": 0.0003, + "step": 40177 + }, + { + "epoch": 0.78, + "learning_rate": 4.416915847928235e-08, + "loss": 0.2117, + "step": 40178 + }, + { + "epoch": 0.78, + "learning_rate": 4.416527513494621e-08, + "loss": 0.0255, + "step": 40179 + }, + { + "epoch": 0.78, + "learning_rate": 4.416139179061007e-08, + "loss": 0.0004, + "step": 40180 + }, + { + "epoch": 0.78, + "learning_rate": 4.4157508446273926e-08, + "loss": 0.0003, + "step": 40181 + }, + { + "epoch": 0.78, + "learning_rate": 4.4153625101937784e-08, + "loss": 0.0004, + "step": 40182 + }, + { + "epoch": 0.78, + "learning_rate": 4.414974175760164e-08, + "loss": 0.0003, + "step": 40183 + }, + { + "epoch": 0.78, + "learning_rate": 4.41458584132655e-08, + "loss": 0.0003, + "step": 40184 + }, + { + "epoch": 0.78, + "learning_rate": 4.414197506892936e-08, + "loss": 0.0005, + "step": 40185 + }, + { + "epoch": 0.78, + "learning_rate": 4.413809172459322e-08, + "loss": 0.0004, + "step": 40186 + }, + { + "epoch": 0.78, + "learning_rate": 4.4134208380257075e-08, + "loss": 0.1602, + "step": 40187 + }, + { + "epoch": 0.78, + "learning_rate": 4.4130325035920933e-08, + "loss": 0.0005, + "step": 40188 + }, + { + "epoch": 0.78, + "learning_rate": 4.412644169158479e-08, + "loss": 0.0006, + "step": 40189 + }, + { + "epoch": 0.78, + "learning_rate": 4.412255834724865e-08, + "loss": 0.0005, + "step": 40190 + }, + { + "epoch": 0.78, + "learning_rate": 4.411867500291251e-08, + "loss": 0.0005, + "step": 40191 + }, + { + "epoch": 0.78, + "learning_rate": 4.411479165857636e-08, + "loss": 0.0004, + "step": 40192 + }, + { + "epoch": 0.78, + "learning_rate": 4.411090831424022e-08, + "loss": 0.0004, + "step": 40193 + }, + { + "epoch": 0.78, + "learning_rate": 4.4107024969904076e-08, + "loss": 0.061, + "step": 40194 + }, + { + "epoch": 0.78, + "learning_rate": 4.4103141625567934e-08, + "loss": 0.0003, + "step": 40195 + }, + { + "epoch": 0.78, + "learning_rate": 4.409925828123179e-08, + "loss": 0.0005, + "step": 40196 + }, + { + "epoch": 0.78, + "learning_rate": 4.409537493689565e-08, + "loss": 0.0007, + "step": 40197 + }, + { + "epoch": 0.78, + "learning_rate": 4.409149159255951e-08, + "loss": 0.0005, + "step": 40198 + }, + { + "epoch": 0.78, + "learning_rate": 4.408760824822337e-08, + "loss": 0.0003, + "step": 40199 + }, + { + "epoch": 0.78, + "learning_rate": 4.4083724903887226e-08, + "loss": 0.0004, + "step": 40200 + }, + { + "epoch": 0.78, + "learning_rate": 4.4079841559551084e-08, + "loss": 0.0003, + "step": 40201 + }, + { + "epoch": 0.78, + "learning_rate": 4.407595821521494e-08, + "loss": 0.0003, + "step": 40202 + }, + { + "epoch": 0.78, + "learning_rate": 4.40720748708788e-08, + "loss": 0.0003, + "step": 40203 + }, + { + "epoch": 0.78, + "learning_rate": 4.406819152654266e-08, + "loss": 0.0005, + "step": 40204 + }, + { + "epoch": 0.78, + "learning_rate": 4.406430818220652e-08, + "loss": 0.0003, + "step": 40205 + }, + { + "epoch": 0.78, + "learning_rate": 4.4060424837870375e-08, + "loss": 0.0005, + "step": 40206 + }, + { + "epoch": 0.78, + "learning_rate": 4.405654149353423e-08, + "loss": 0.0003, + "step": 40207 + }, + { + "epoch": 0.78, + "learning_rate": 4.4052658149198085e-08, + "loss": 0.0003, + "step": 40208 + }, + { + "epoch": 0.78, + "learning_rate": 4.404877480486194e-08, + "loss": 0.0003, + "step": 40209 + }, + { + "epoch": 0.78, + "learning_rate": 4.40448914605258e-08, + "loss": 0.2167, + "step": 40210 + }, + { + "epoch": 0.78, + "learning_rate": 4.404100811618966e-08, + "loss": 0.0005, + "step": 40211 + }, + { + "epoch": 0.78, + "learning_rate": 4.403712477185352e-08, + "loss": 0.0004, + "step": 40212 + }, + { + "epoch": 0.78, + "learning_rate": 4.4033241427517376e-08, + "loss": 0.0004, + "step": 40213 + }, + { + "epoch": 0.78, + "learning_rate": 4.4029358083181234e-08, + "loss": 0.0004, + "step": 40214 + }, + { + "epoch": 0.78, + "learning_rate": 4.402547473884509e-08, + "loss": 0.0004, + "step": 40215 + }, + { + "epoch": 0.78, + "learning_rate": 4.402159139450895e-08, + "loss": 0.0003, + "step": 40216 + }, + { + "epoch": 0.78, + "learning_rate": 4.401770805017281e-08, + "loss": 0.0064, + "step": 40217 + }, + { + "epoch": 0.78, + "learning_rate": 4.401382470583667e-08, + "loss": 0.0004, + "step": 40218 + }, + { + "epoch": 0.78, + "learning_rate": 4.4009941361500526e-08, + "loss": 0.0003, + "step": 40219 + }, + { + "epoch": 0.78, + "learning_rate": 4.4006058017164384e-08, + "loss": 0.0007, + "step": 40220 + }, + { + "epoch": 0.78, + "learning_rate": 4.4002174672828236e-08, + "loss": 0.0005, + "step": 40221 + }, + { + "epoch": 0.78, + "learning_rate": 4.3998291328492094e-08, + "loss": 0.0005, + "step": 40222 + }, + { + "epoch": 0.78, + "learning_rate": 4.399440798415595e-08, + "loss": 0.0003, + "step": 40223 + }, + { + "epoch": 0.78, + "learning_rate": 4.399052463981981e-08, + "loss": 0.0004, + "step": 40224 + }, + { + "epoch": 0.78, + "learning_rate": 4.398664129548367e-08, + "loss": 0.0006, + "step": 40225 + }, + { + "epoch": 0.78, + "learning_rate": 4.398275795114753e-08, + "loss": 0.1267, + "step": 40226 + }, + { + "epoch": 0.78, + "learning_rate": 4.3978874606811385e-08, + "loss": 0.0004, + "step": 40227 + }, + { + "epoch": 0.78, + "learning_rate": 4.397499126247524e-08, + "loss": 0.0006, + "step": 40228 + }, + { + "epoch": 0.78, + "learning_rate": 4.39711079181391e-08, + "loss": 0.0007, + "step": 40229 + }, + { + "epoch": 0.78, + "learning_rate": 4.396722457380296e-08, + "loss": 0.0004, + "step": 40230 + }, + { + "epoch": 0.78, + "learning_rate": 4.396334122946682e-08, + "loss": 0.0004, + "step": 40231 + }, + { + "epoch": 0.78, + "learning_rate": 4.3959457885130676e-08, + "loss": 0.0184, + "step": 40232 + }, + { + "epoch": 0.78, + "learning_rate": 4.3955574540794534e-08, + "loss": 0.0004, + "step": 40233 + }, + { + "epoch": 0.78, + "learning_rate": 4.395169119645839e-08, + "loss": 0.0365, + "step": 40234 + }, + { + "epoch": 0.78, + "learning_rate": 4.394780785212225e-08, + "loss": 0.0008, + "step": 40235 + }, + { + "epoch": 0.78, + "learning_rate": 4.39439245077861e-08, + "loss": 0.0004, + "step": 40236 + }, + { + "epoch": 0.78, + "learning_rate": 4.394004116344996e-08, + "loss": 0.0004, + "step": 40237 + }, + { + "epoch": 0.78, + "learning_rate": 4.393615781911382e-08, + "loss": 0.002, + "step": 40238 + }, + { + "epoch": 0.78, + "learning_rate": 4.393227447477768e-08, + "loss": 0.0007, + "step": 40239 + }, + { + "epoch": 0.78, + "learning_rate": 4.3928391130441536e-08, + "loss": 0.0005, + "step": 40240 + }, + { + "epoch": 0.78, + "learning_rate": 4.3924507786105394e-08, + "loss": 0.8181, + "step": 40241 + }, + { + "epoch": 0.78, + "learning_rate": 4.392062444176925e-08, + "loss": 0.0036, + "step": 40242 + }, + { + "epoch": 0.78, + "learning_rate": 4.391674109743311e-08, + "loss": 0.0003, + "step": 40243 + }, + { + "epoch": 0.78, + "learning_rate": 4.391285775309697e-08, + "loss": 0.0006, + "step": 40244 + }, + { + "epoch": 0.78, + "learning_rate": 4.390897440876083e-08, + "loss": 0.0005, + "step": 40245 + }, + { + "epoch": 0.78, + "learning_rate": 4.3905091064424685e-08, + "loss": 0.0004, + "step": 40246 + }, + { + "epoch": 0.78, + "learning_rate": 4.390120772008854e-08, + "loss": 0.0003, + "step": 40247 + }, + { + "epoch": 0.78, + "learning_rate": 4.3897324375752395e-08, + "loss": 0.0004, + "step": 40248 + }, + { + "epoch": 0.78, + "learning_rate": 4.389344103141625e-08, + "loss": 0.0005, + "step": 40249 + }, + { + "epoch": 0.78, + "learning_rate": 4.388955768708011e-08, + "loss": 0.0007, + "step": 40250 + }, + { + "epoch": 0.78, + "learning_rate": 4.388567434274397e-08, + "loss": 0.0006, + "step": 40251 + }, + { + "epoch": 0.78, + "learning_rate": 4.388179099840783e-08, + "loss": 0.0005, + "step": 40252 + }, + { + "epoch": 0.78, + "learning_rate": 4.3877907654071686e-08, + "loss": 0.0005, + "step": 40253 + }, + { + "epoch": 0.78, + "learning_rate": 4.3874024309735544e-08, + "loss": 0.0054, + "step": 40254 + }, + { + "epoch": 0.78, + "learning_rate": 4.3870140965399396e-08, + "loss": 0.7294, + "step": 40255 + }, + { + "epoch": 0.78, + "learning_rate": 4.3866257621063254e-08, + "loss": 0.0035, + "step": 40256 + }, + { + "epoch": 0.78, + "learning_rate": 4.386237427672711e-08, + "loss": 0.0006, + "step": 40257 + }, + { + "epoch": 0.78, + "learning_rate": 4.385849093239097e-08, + "loss": 0.0004, + "step": 40258 + }, + { + "epoch": 0.78, + "learning_rate": 4.385460758805483e-08, + "loss": 0.0004, + "step": 40259 + }, + { + "epoch": 0.78, + "learning_rate": 4.385072424371869e-08, + "loss": 0.0003, + "step": 40260 + }, + { + "epoch": 0.78, + "learning_rate": 4.3846840899382545e-08, + "loss": 0.0005, + "step": 40261 + }, + { + "epoch": 0.78, + "learning_rate": 4.3842957555046404e-08, + "loss": 0.0003, + "step": 40262 + }, + { + "epoch": 0.78, + "learning_rate": 4.383907421071026e-08, + "loss": 0.0004, + "step": 40263 + }, + { + "epoch": 0.78, + "learning_rate": 4.383519086637412e-08, + "loss": 0.0004, + "step": 40264 + }, + { + "epoch": 0.78, + "learning_rate": 4.383130752203797e-08, + "loss": 0.0004, + "step": 40265 + }, + { + "epoch": 0.78, + "learning_rate": 4.382742417770183e-08, + "loss": 0.0003, + "step": 40266 + }, + { + "epoch": 0.78, + "learning_rate": 4.382354083336569e-08, + "loss": 0.0003, + "step": 40267 + }, + { + "epoch": 0.78, + "learning_rate": 4.3819657489029547e-08, + "loss": 0.0003, + "step": 40268 + }, + { + "epoch": 0.78, + "learning_rate": 4.3815774144693405e-08, + "loss": 0.0005, + "step": 40269 + }, + { + "epoch": 0.78, + "learning_rate": 4.381189080035726e-08, + "loss": 0.0004, + "step": 40270 + }, + { + "epoch": 0.78, + "learning_rate": 4.380800745602112e-08, + "loss": 0.0004, + "step": 40271 + }, + { + "epoch": 0.78, + "learning_rate": 4.380412411168498e-08, + "loss": 0.5521, + "step": 40272 + }, + { + "epoch": 0.78, + "learning_rate": 4.380024076734884e-08, + "loss": 0.0004, + "step": 40273 + }, + { + "epoch": 0.78, + "learning_rate": 4.3796357423012696e-08, + "loss": 0.0004, + "step": 40274 + }, + { + "epoch": 0.78, + "learning_rate": 4.3792474078676554e-08, + "loss": 0.4136, + "step": 40275 + }, + { + "epoch": 0.78, + "learning_rate": 4.378859073434041e-08, + "loss": 0.0138, + "step": 40276 + }, + { + "epoch": 0.78, + "learning_rate": 4.378470739000427e-08, + "loss": 0.0023, + "step": 40277 + }, + { + "epoch": 0.78, + "learning_rate": 4.378082404566813e-08, + "loss": 0.001, + "step": 40278 + }, + { + "epoch": 0.78, + "learning_rate": 4.377694070133198e-08, + "loss": 0.0005, + "step": 40279 + }, + { + "epoch": 0.78, + "learning_rate": 4.377305735699584e-08, + "loss": 0.0005, + "step": 40280 + }, + { + "epoch": 0.78, + "learning_rate": 4.37691740126597e-08, + "loss": 0.0005, + "step": 40281 + }, + { + "epoch": 0.78, + "learning_rate": 4.3765290668323555e-08, + "loss": 0.0005, + "step": 40282 + }, + { + "epoch": 0.78, + "learning_rate": 4.3761407323987414e-08, + "loss": 0.0009, + "step": 40283 + }, + { + "epoch": 0.78, + "learning_rate": 4.375752397965127e-08, + "loss": 0.764, + "step": 40284 + }, + { + "epoch": 0.78, + "learning_rate": 4.375364063531513e-08, + "loss": 0.0004, + "step": 40285 + }, + { + "epoch": 0.78, + "learning_rate": 4.374975729097899e-08, + "loss": 0.0007, + "step": 40286 + }, + { + "epoch": 0.78, + "learning_rate": 4.3745873946642847e-08, + "loss": 0.0006, + "step": 40287 + }, + { + "epoch": 0.78, + "learning_rate": 4.3741990602306705e-08, + "loss": 0.0005, + "step": 40288 + }, + { + "epoch": 0.78, + "learning_rate": 4.373810725797056e-08, + "loss": 0.0004, + "step": 40289 + }, + { + "epoch": 0.78, + "learning_rate": 4.373422391363442e-08, + "loss": 0.0064, + "step": 40290 + }, + { + "epoch": 0.78, + "learning_rate": 4.373034056929828e-08, + "loss": 0.0004, + "step": 40291 + }, + { + "epoch": 0.78, + "learning_rate": 4.372645722496214e-08, + "loss": 0.0004, + "step": 40292 + }, + { + "epoch": 0.78, + "learning_rate": 4.3722573880625996e-08, + "loss": 0.0004, + "step": 40293 + }, + { + "epoch": 0.78, + "learning_rate": 4.371869053628985e-08, + "loss": 0.0005, + "step": 40294 + }, + { + "epoch": 0.78, + "learning_rate": 4.3714807191953706e-08, + "loss": 0.0004, + "step": 40295 + }, + { + "epoch": 0.78, + "learning_rate": 4.3710923847617564e-08, + "loss": 0.0003, + "step": 40296 + }, + { + "epoch": 0.78, + "learning_rate": 4.370704050328142e-08, + "loss": 0.0003, + "step": 40297 + }, + { + "epoch": 0.78, + "learning_rate": 4.370315715894528e-08, + "loss": 0.0006, + "step": 40298 + }, + { + "epoch": 0.78, + "learning_rate": 4.369927381460914e-08, + "loss": 0.0013, + "step": 40299 + }, + { + "epoch": 0.78, + "learning_rate": 4.3695390470273e-08, + "loss": 0.4359, + "step": 40300 + }, + { + "epoch": 0.78, + "learning_rate": 4.3691507125936855e-08, + "loss": 0.0003, + "step": 40301 + }, + { + "epoch": 0.78, + "learning_rate": 4.3687623781600714e-08, + "loss": 0.0006, + "step": 40302 + }, + { + "epoch": 0.78, + "learning_rate": 4.368374043726457e-08, + "loss": 0.0004, + "step": 40303 + }, + { + "epoch": 0.78, + "learning_rate": 4.367985709292843e-08, + "loss": 0.0005, + "step": 40304 + }, + { + "epoch": 0.78, + "learning_rate": 4.367597374859229e-08, + "loss": 0.0004, + "step": 40305 + }, + { + "epoch": 0.78, + "learning_rate": 4.3672090404256147e-08, + "loss": 0.0006, + "step": 40306 + }, + { + "epoch": 0.78, + "learning_rate": 4.3668207059920005e-08, + "loss": 0.0004, + "step": 40307 + }, + { + "epoch": 0.78, + "learning_rate": 4.3664323715583856e-08, + "loss": 0.0007, + "step": 40308 + }, + { + "epoch": 0.78, + "learning_rate": 4.3660440371247715e-08, + "loss": 0.0006, + "step": 40309 + }, + { + "epoch": 0.78, + "learning_rate": 4.365655702691157e-08, + "loss": 0.0004, + "step": 40310 + }, + { + "epoch": 0.78, + "learning_rate": 4.365267368257543e-08, + "loss": 0.0005, + "step": 40311 + }, + { + "epoch": 0.78, + "learning_rate": 4.364879033823929e-08, + "loss": 0.0005, + "step": 40312 + }, + { + "epoch": 0.78, + "learning_rate": 4.364490699390315e-08, + "loss": 0.0004, + "step": 40313 + }, + { + "epoch": 0.78, + "learning_rate": 4.3641023649567006e-08, + "loss": 0.0004, + "step": 40314 + }, + { + "epoch": 0.78, + "learning_rate": 4.3637140305230864e-08, + "loss": 0.0003, + "step": 40315 + }, + { + "epoch": 0.78, + "learning_rate": 4.363325696089472e-08, + "loss": 0.0004, + "step": 40316 + }, + { + "epoch": 0.78, + "learning_rate": 4.362937361655858e-08, + "loss": 0.0007, + "step": 40317 + }, + { + "epoch": 0.78, + "learning_rate": 4.362549027222244e-08, + "loss": 0.0021, + "step": 40318 + }, + { + "epoch": 0.78, + "learning_rate": 4.36216069278863e-08, + "loss": 0.0006, + "step": 40319 + }, + { + "epoch": 0.78, + "learning_rate": 4.3617723583550155e-08, + "loss": 0.0003, + "step": 40320 + }, + { + "epoch": 0.78, + "learning_rate": 4.3613840239214014e-08, + "loss": 0.0004, + "step": 40321 + }, + { + "epoch": 0.78, + "learning_rate": 4.360995689487787e-08, + "loss": 0.001, + "step": 40322 + }, + { + "epoch": 0.78, + "learning_rate": 4.3606073550541724e-08, + "loss": 0.0004, + "step": 40323 + }, + { + "epoch": 0.78, + "learning_rate": 4.360219020620558e-08, + "loss": 0.0022, + "step": 40324 + }, + { + "epoch": 0.78, + "learning_rate": 4.359830686186944e-08, + "loss": 0.0004, + "step": 40325 + }, + { + "epoch": 0.78, + "learning_rate": 4.35944235175333e-08, + "loss": 0.0004, + "step": 40326 + }, + { + "epoch": 0.78, + "learning_rate": 4.3590540173197156e-08, + "loss": 0.9312, + "step": 40327 + }, + { + "epoch": 0.78, + "learning_rate": 4.3586656828861015e-08, + "loss": 0.0005, + "step": 40328 + }, + { + "epoch": 0.78, + "learning_rate": 4.358277348452487e-08, + "loss": 0.0006, + "step": 40329 + }, + { + "epoch": 0.78, + "learning_rate": 4.357889014018873e-08, + "loss": 0.0003, + "step": 40330 + }, + { + "epoch": 0.78, + "learning_rate": 4.357500679585259e-08, + "loss": 0.0784, + "step": 40331 + }, + { + "epoch": 0.78, + "learning_rate": 4.357112345151645e-08, + "loss": 0.0003, + "step": 40332 + }, + { + "epoch": 0.78, + "learning_rate": 4.3567240107180306e-08, + "loss": 0.0006, + "step": 40333 + }, + { + "epoch": 0.78, + "learning_rate": 4.3563356762844164e-08, + "loss": 0.0005, + "step": 40334 + }, + { + "epoch": 0.78, + "learning_rate": 4.355947341850802e-08, + "loss": 0.0007, + "step": 40335 + }, + { + "epoch": 0.78, + "learning_rate": 4.3555590074171874e-08, + "loss": 0.0004, + "step": 40336 + }, + { + "epoch": 0.78, + "learning_rate": 4.355170672983573e-08, + "loss": 0.0004, + "step": 40337 + }, + { + "epoch": 0.78, + "learning_rate": 4.354782338549959e-08, + "loss": 0.0005, + "step": 40338 + }, + { + "epoch": 0.78, + "learning_rate": 4.354394004116345e-08, + "loss": 0.0004, + "step": 40339 + }, + { + "epoch": 0.78, + "learning_rate": 4.354005669682731e-08, + "loss": 0.0003, + "step": 40340 + }, + { + "epoch": 0.78, + "learning_rate": 4.3536173352491165e-08, + "loss": 0.0004, + "step": 40341 + }, + { + "epoch": 0.78, + "learning_rate": 4.3532290008155024e-08, + "loss": 0.0004, + "step": 40342 + }, + { + "epoch": 0.78, + "learning_rate": 4.352840666381888e-08, + "loss": 1.1537, + "step": 40343 + }, + { + "epoch": 0.78, + "learning_rate": 4.3524523319482733e-08, + "loss": 0.0091, + "step": 40344 + }, + { + "epoch": 0.78, + "learning_rate": 4.352063997514659e-08, + "loss": 0.0003, + "step": 40345 + }, + { + "epoch": 0.78, + "learning_rate": 4.351675663081045e-08, + "loss": 0.0004, + "step": 40346 + }, + { + "epoch": 0.78, + "learning_rate": 4.351287328647431e-08, + "loss": 0.0004, + "step": 40347 + }, + { + "epoch": 0.78, + "learning_rate": 4.3508989942138166e-08, + "loss": 0.0009, + "step": 40348 + }, + { + "epoch": 0.78, + "learning_rate": 4.3505106597802025e-08, + "loss": 0.0003, + "step": 40349 + }, + { + "epoch": 0.78, + "learning_rate": 4.350122325346588e-08, + "loss": 0.0003, + "step": 40350 + }, + { + "epoch": 0.78, + "learning_rate": 4.349733990912974e-08, + "loss": 0.0002, + "step": 40351 + }, + { + "epoch": 0.78, + "learning_rate": 4.349345656479359e-08, + "loss": 0.0004, + "step": 40352 + }, + { + "epoch": 0.78, + "learning_rate": 4.348957322045745e-08, + "loss": 0.0004, + "step": 40353 + }, + { + "epoch": 0.78, + "learning_rate": 4.348568987612131e-08, + "loss": 0.0004, + "step": 40354 + }, + { + "epoch": 0.78, + "learning_rate": 4.348180653178517e-08, + "loss": 0.0003, + "step": 40355 + }, + { + "epoch": 0.78, + "learning_rate": 4.3477923187449026e-08, + "loss": 0.0025, + "step": 40356 + }, + { + "epoch": 0.78, + "learning_rate": 4.3474039843112884e-08, + "loss": 0.0004, + "step": 40357 + }, + { + "epoch": 0.78, + "learning_rate": 4.347015649877674e-08, + "loss": 0.0005, + "step": 40358 + }, + { + "epoch": 0.78, + "learning_rate": 4.34662731544406e-08, + "loss": 0.0003, + "step": 40359 + }, + { + "epoch": 0.78, + "learning_rate": 4.346238981010446e-08, + "loss": 0.0005, + "step": 40360 + }, + { + "epoch": 0.78, + "learning_rate": 4.345850646576832e-08, + "loss": 0.0113, + "step": 40361 + }, + { + "epoch": 0.78, + "learning_rate": 4.3454623121432175e-08, + "loss": 0.3658, + "step": 40362 + }, + { + "epoch": 0.78, + "learning_rate": 4.3450739777096033e-08, + "loss": 0.0003, + "step": 40363 + }, + { + "epoch": 0.78, + "learning_rate": 4.344685643275989e-08, + "loss": 0.0008, + "step": 40364 + }, + { + "epoch": 0.78, + "learning_rate": 4.344297308842375e-08, + "loss": 0.0004, + "step": 40365 + }, + { + "epoch": 0.78, + "learning_rate": 4.34390897440876e-08, + "loss": 0.0003, + "step": 40366 + }, + { + "epoch": 0.78, + "learning_rate": 4.343520639975146e-08, + "loss": 0.0006, + "step": 40367 + }, + { + "epoch": 0.78, + "learning_rate": 4.343132305541532e-08, + "loss": 0.0009, + "step": 40368 + }, + { + "epoch": 0.78, + "learning_rate": 4.3427439711079176e-08, + "loss": 0.0004, + "step": 40369 + }, + { + "epoch": 0.78, + "learning_rate": 4.3423556366743035e-08, + "loss": 0.0004, + "step": 40370 + }, + { + "epoch": 0.78, + "learning_rate": 4.341967302240689e-08, + "loss": 0.0004, + "step": 40371 + }, + { + "epoch": 0.78, + "learning_rate": 4.341578967807075e-08, + "loss": 0.0004, + "step": 40372 + }, + { + "epoch": 0.78, + "learning_rate": 4.341190633373461e-08, + "loss": 0.0004, + "step": 40373 + }, + { + "epoch": 0.78, + "learning_rate": 4.340802298939847e-08, + "loss": 0.0004, + "step": 40374 + }, + { + "epoch": 0.78, + "learning_rate": 4.3404139645062326e-08, + "loss": 0.0003, + "step": 40375 + }, + { + "epoch": 0.78, + "learning_rate": 4.3400256300726184e-08, + "loss": 0.0004, + "step": 40376 + }, + { + "epoch": 0.78, + "learning_rate": 4.339637295639004e-08, + "loss": 0.1451, + "step": 40377 + }, + { + "epoch": 0.78, + "learning_rate": 4.33924896120539e-08, + "loss": 0.0005, + "step": 40378 + }, + { + "epoch": 0.78, + "learning_rate": 4.338860626771776e-08, + "loss": 0.0003, + "step": 40379 + }, + { + "epoch": 0.78, + "learning_rate": 4.338472292338162e-08, + "loss": 0.0005, + "step": 40380 + }, + { + "epoch": 0.78, + "learning_rate": 4.338083957904547e-08, + "loss": 0.0006, + "step": 40381 + }, + { + "epoch": 0.78, + "learning_rate": 4.337695623470933e-08, + "loss": 0.0003, + "step": 40382 + }, + { + "epoch": 0.78, + "learning_rate": 4.3373072890373185e-08, + "loss": 0.0004, + "step": 40383 + }, + { + "epoch": 0.78, + "learning_rate": 4.3369189546037043e-08, + "loss": 0.0012, + "step": 40384 + }, + { + "epoch": 0.78, + "learning_rate": 4.33653062017009e-08, + "loss": 0.0009, + "step": 40385 + }, + { + "epoch": 0.78, + "learning_rate": 4.336142285736476e-08, + "loss": 0.0006, + "step": 40386 + }, + { + "epoch": 0.78, + "learning_rate": 4.335753951302862e-08, + "loss": 0.0003, + "step": 40387 + }, + { + "epoch": 0.78, + "learning_rate": 4.3353656168692476e-08, + "loss": 0.0003, + "step": 40388 + }, + { + "epoch": 0.78, + "learning_rate": 4.3349772824356335e-08, + "loss": 0.0003, + "step": 40389 + }, + { + "epoch": 0.78, + "learning_rate": 4.334588948002019e-08, + "loss": 0.0003, + "step": 40390 + }, + { + "epoch": 0.78, + "learning_rate": 4.334200613568405e-08, + "loss": 0.0003, + "step": 40391 + }, + { + "epoch": 0.78, + "learning_rate": 4.333812279134791e-08, + "loss": 0.0005, + "step": 40392 + }, + { + "epoch": 0.78, + "learning_rate": 4.333423944701177e-08, + "loss": 0.0005, + "step": 40393 + }, + { + "epoch": 0.78, + "learning_rate": 4.3330356102675626e-08, + "loss": 0.0003, + "step": 40394 + }, + { + "epoch": 0.78, + "learning_rate": 4.332647275833948e-08, + "loss": 0.0003, + "step": 40395 + }, + { + "epoch": 0.78, + "learning_rate": 4.3322589414003336e-08, + "loss": 0.0005, + "step": 40396 + }, + { + "epoch": 0.78, + "learning_rate": 4.3318706069667194e-08, + "loss": 0.0005, + "step": 40397 + }, + { + "epoch": 0.78, + "learning_rate": 4.331482272533105e-08, + "loss": 0.0029, + "step": 40398 + }, + { + "epoch": 0.78, + "learning_rate": 4.331093938099491e-08, + "loss": 0.0003, + "step": 40399 + }, + { + "epoch": 0.78, + "learning_rate": 4.330705603665877e-08, + "loss": 0.0003, + "step": 40400 + }, + { + "epoch": 0.78, + "learning_rate": 4.330317269232263e-08, + "loss": 0.01, + "step": 40401 + }, + { + "epoch": 0.78, + "learning_rate": 4.3299289347986485e-08, + "loss": 0.0004, + "step": 40402 + }, + { + "epoch": 0.78, + "learning_rate": 4.3295406003650343e-08, + "loss": 0.0004, + "step": 40403 + }, + { + "epoch": 0.78, + "learning_rate": 4.32915226593142e-08, + "loss": 0.1001, + "step": 40404 + }, + { + "epoch": 0.78, + "learning_rate": 4.328763931497806e-08, + "loss": 0.0003, + "step": 40405 + }, + { + "epoch": 0.78, + "learning_rate": 4.328375597064192e-08, + "loss": 0.0053, + "step": 40406 + }, + { + "epoch": 0.78, + "learning_rate": 4.3279872626305776e-08, + "loss": 0.0003, + "step": 40407 + }, + { + "epoch": 0.78, + "learning_rate": 4.3275989281969635e-08, + "loss": 0.1698, + "step": 40408 + }, + { + "epoch": 0.78, + "learning_rate": 4.327210593763349e-08, + "loss": 0.0005, + "step": 40409 + }, + { + "epoch": 0.78, + "learning_rate": 4.3268222593297344e-08, + "loss": 0.0019, + "step": 40410 + }, + { + "epoch": 0.78, + "learning_rate": 4.32643392489612e-08, + "loss": 0.0007, + "step": 40411 + }, + { + "epoch": 0.78, + "learning_rate": 4.326045590462506e-08, + "loss": 0.0003, + "step": 40412 + }, + { + "epoch": 0.78, + "learning_rate": 4.325657256028892e-08, + "loss": 0.0003, + "step": 40413 + }, + { + "epoch": 0.78, + "learning_rate": 4.325268921595278e-08, + "loss": 0.0004, + "step": 40414 + }, + { + "epoch": 0.78, + "learning_rate": 4.3248805871616636e-08, + "loss": 0.0405, + "step": 40415 + }, + { + "epoch": 0.78, + "learning_rate": 4.3244922527280494e-08, + "loss": 0.0005, + "step": 40416 + }, + { + "epoch": 0.78, + "learning_rate": 4.324103918294435e-08, + "loss": 0.0004, + "step": 40417 + }, + { + "epoch": 0.78, + "learning_rate": 4.323715583860821e-08, + "loss": 0.0004, + "step": 40418 + }, + { + "epoch": 0.78, + "learning_rate": 4.323327249427207e-08, + "loss": 0.0011, + "step": 40419 + }, + { + "epoch": 0.78, + "learning_rate": 4.322938914993593e-08, + "loss": 0.0035, + "step": 40420 + }, + { + "epoch": 0.78, + "learning_rate": 4.3225505805599785e-08, + "loss": 0.0005, + "step": 40421 + }, + { + "epoch": 0.78, + "learning_rate": 4.3221622461263643e-08, + "loss": 0.0003, + "step": 40422 + }, + { + "epoch": 0.78, + "learning_rate": 4.32177391169275e-08, + "loss": 0.7919, + "step": 40423 + }, + { + "epoch": 0.78, + "learning_rate": 4.321385577259135e-08, + "loss": 0.182, + "step": 40424 + }, + { + "epoch": 0.78, + "learning_rate": 4.320997242825521e-08, + "loss": 0.0005, + "step": 40425 + }, + { + "epoch": 0.78, + "learning_rate": 4.320608908391907e-08, + "loss": 0.0003, + "step": 40426 + }, + { + "epoch": 0.78, + "learning_rate": 4.320220573958293e-08, + "loss": 0.0014, + "step": 40427 + }, + { + "epoch": 0.78, + "learning_rate": 4.3198322395246786e-08, + "loss": 0.0005, + "step": 40428 + }, + { + "epoch": 0.78, + "learning_rate": 4.3194439050910644e-08, + "loss": 0.0006, + "step": 40429 + }, + { + "epoch": 0.78, + "learning_rate": 4.31905557065745e-08, + "loss": 0.0006, + "step": 40430 + }, + { + "epoch": 0.78, + "learning_rate": 4.318667236223836e-08, + "loss": 0.2942, + "step": 40431 + }, + { + "epoch": 0.78, + "learning_rate": 4.318278901790221e-08, + "loss": 0.0004, + "step": 40432 + }, + { + "epoch": 0.78, + "learning_rate": 4.317890567356607e-08, + "loss": 0.0006, + "step": 40433 + }, + { + "epoch": 0.78, + "learning_rate": 4.317502232922993e-08, + "loss": 0.0036, + "step": 40434 + }, + { + "epoch": 0.78, + "learning_rate": 4.317113898489379e-08, + "loss": 0.0005, + "step": 40435 + }, + { + "epoch": 0.78, + "learning_rate": 4.3167255640557646e-08, + "loss": 0.0004, + "step": 40436 + }, + { + "epoch": 0.78, + "learning_rate": 4.3163372296221504e-08, + "loss": 0.0004, + "step": 40437 + }, + { + "epoch": 0.78, + "learning_rate": 4.315948895188536e-08, + "loss": 0.0003, + "step": 40438 + }, + { + "epoch": 0.78, + "learning_rate": 4.3155605607549214e-08, + "loss": 0.0005, + "step": 40439 + }, + { + "epoch": 0.78, + "learning_rate": 4.315172226321307e-08, + "loss": 0.0004, + "step": 40440 + }, + { + "epoch": 0.78, + "learning_rate": 4.314783891887693e-08, + "loss": 0.0004, + "step": 40441 + }, + { + "epoch": 0.78, + "learning_rate": 4.314395557454079e-08, + "loss": 0.0007, + "step": 40442 + }, + { + "epoch": 0.78, + "learning_rate": 4.3140072230204647e-08, + "loss": 0.0003, + "step": 40443 + }, + { + "epoch": 0.78, + "learning_rate": 4.3136188885868505e-08, + "loss": 0.0004, + "step": 40444 + }, + { + "epoch": 0.78, + "learning_rate": 4.313230554153236e-08, + "loss": 0.0003, + "step": 40445 + }, + { + "epoch": 0.78, + "learning_rate": 4.312842219719622e-08, + "loss": 0.0004, + "step": 40446 + }, + { + "epoch": 0.78, + "learning_rate": 4.312453885286008e-08, + "loss": 0.011, + "step": 40447 + }, + { + "epoch": 0.78, + "learning_rate": 4.312065550852394e-08, + "loss": 0.0602, + "step": 40448 + }, + { + "epoch": 0.78, + "learning_rate": 4.3116772164187796e-08, + "loss": 0.0004, + "step": 40449 + }, + { + "epoch": 0.78, + "learning_rate": 4.3112888819851654e-08, + "loss": 0.0004, + "step": 40450 + }, + { + "epoch": 0.78, + "learning_rate": 4.310900547551551e-08, + "loss": 0.0007, + "step": 40451 + }, + { + "epoch": 0.78, + "learning_rate": 4.310512213117937e-08, + "loss": 0.0005, + "step": 40452 + }, + { + "epoch": 0.78, + "learning_rate": 4.310123878684322e-08, + "loss": 0.2239, + "step": 40453 + }, + { + "epoch": 0.78, + "learning_rate": 4.309735544250708e-08, + "loss": 0.0004, + "step": 40454 + }, + { + "epoch": 0.78, + "learning_rate": 4.309347209817094e-08, + "loss": 0.0004, + "step": 40455 + }, + { + "epoch": 0.78, + "learning_rate": 4.30895887538348e-08, + "loss": 0.0003, + "step": 40456 + }, + { + "epoch": 0.78, + "learning_rate": 4.3085705409498655e-08, + "loss": 0.0007, + "step": 40457 + }, + { + "epoch": 0.78, + "learning_rate": 4.3081822065162514e-08, + "loss": 0.0004, + "step": 40458 + }, + { + "epoch": 0.78, + "learning_rate": 4.307793872082637e-08, + "loss": 0.368, + "step": 40459 + }, + { + "epoch": 0.78, + "learning_rate": 4.307405537649023e-08, + "loss": 0.0012, + "step": 40460 + }, + { + "epoch": 0.78, + "learning_rate": 4.307017203215409e-08, + "loss": 0.0012, + "step": 40461 + }, + { + "epoch": 0.78, + "learning_rate": 4.3066288687817947e-08, + "loss": 0.0004, + "step": 40462 + }, + { + "epoch": 0.78, + "learning_rate": 4.3062405343481805e-08, + "loss": 0.0004, + "step": 40463 + }, + { + "epoch": 0.78, + "learning_rate": 4.305852199914566e-08, + "loss": 0.6552, + "step": 40464 + }, + { + "epoch": 0.78, + "learning_rate": 4.305463865480952e-08, + "loss": 0.0004, + "step": 40465 + }, + { + "epoch": 0.78, + "learning_rate": 4.305075531047338e-08, + "loss": 0.0004, + "step": 40466 + }, + { + "epoch": 0.78, + "learning_rate": 4.304687196613724e-08, + "loss": 0.1782, + "step": 40467 + }, + { + "epoch": 0.78, + "learning_rate": 4.304298862180109e-08, + "loss": 0.0004, + "step": 40468 + }, + { + "epoch": 0.79, + "learning_rate": 4.303910527746495e-08, + "loss": 0.0005, + "step": 40469 + }, + { + "epoch": 0.79, + "learning_rate": 4.3035221933128806e-08, + "loss": 0.0004, + "step": 40470 + }, + { + "epoch": 0.79, + "learning_rate": 4.3031338588792664e-08, + "loss": 0.5648, + "step": 40471 + }, + { + "epoch": 0.79, + "learning_rate": 4.302745524445652e-08, + "loss": 0.0004, + "step": 40472 + }, + { + "epoch": 0.79, + "learning_rate": 4.302357190012038e-08, + "loss": 0.0007, + "step": 40473 + }, + { + "epoch": 0.79, + "learning_rate": 4.301968855578424e-08, + "loss": 0.0003, + "step": 40474 + }, + { + "epoch": 0.79, + "learning_rate": 4.30158052114481e-08, + "loss": 0.0005, + "step": 40475 + }, + { + "epoch": 0.79, + "learning_rate": 4.3011921867111955e-08, + "loss": 0.0005, + "step": 40476 + }, + { + "epoch": 0.79, + "learning_rate": 4.3008038522775814e-08, + "loss": 0.0043, + "step": 40477 + }, + { + "epoch": 0.79, + "learning_rate": 4.300415517843967e-08, + "loss": 0.001, + "step": 40478 + }, + { + "epoch": 0.79, + "learning_rate": 4.300027183410353e-08, + "loss": 0.0005, + "step": 40479 + }, + { + "epoch": 0.79, + "learning_rate": 4.299638848976739e-08, + "loss": 0.0356, + "step": 40480 + }, + { + "epoch": 0.79, + "learning_rate": 4.299250514543125e-08, + "loss": 0.0004, + "step": 40481 + }, + { + "epoch": 0.79, + "learning_rate": 4.29886218010951e-08, + "loss": 0.0006, + "step": 40482 + }, + { + "epoch": 0.79, + "learning_rate": 4.2984738456758957e-08, + "loss": 0.349, + "step": 40483 + }, + { + "epoch": 0.79, + "learning_rate": 4.2980855112422815e-08, + "loss": 0.0003, + "step": 40484 + }, + { + "epoch": 0.79, + "learning_rate": 4.297697176808667e-08, + "loss": 0.0004, + "step": 40485 + }, + { + "epoch": 0.79, + "learning_rate": 4.297308842375053e-08, + "loss": 0.0004, + "step": 40486 + }, + { + "epoch": 0.79, + "learning_rate": 4.296920507941439e-08, + "loss": 0.0006, + "step": 40487 + }, + { + "epoch": 0.79, + "learning_rate": 4.296532173507825e-08, + "loss": 0.0004, + "step": 40488 + }, + { + "epoch": 0.79, + "learning_rate": 4.2961438390742106e-08, + "loss": 0.0004, + "step": 40489 + }, + { + "epoch": 0.79, + "learning_rate": 4.2957555046405964e-08, + "loss": 0.0009, + "step": 40490 + }, + { + "epoch": 0.79, + "learning_rate": 4.295367170206982e-08, + "loss": 0.0005, + "step": 40491 + }, + { + "epoch": 0.79, + "learning_rate": 4.294978835773368e-08, + "loss": 0.0004, + "step": 40492 + }, + { + "epoch": 0.79, + "learning_rate": 4.294590501339754e-08, + "loss": 0.0005, + "step": 40493 + }, + { + "epoch": 0.79, + "learning_rate": 4.29420216690614e-08, + "loss": 0.0005, + "step": 40494 + }, + { + "epoch": 0.79, + "learning_rate": 4.2938138324725256e-08, + "loss": 0.0003, + "step": 40495 + }, + { + "epoch": 0.79, + "learning_rate": 4.2934254980389114e-08, + "loss": 0.0003, + "step": 40496 + }, + { + "epoch": 0.79, + "learning_rate": 4.2930371636052965e-08, + "loss": 0.0003, + "step": 40497 + }, + { + "epoch": 0.79, + "learning_rate": 4.2926488291716824e-08, + "loss": 0.0006, + "step": 40498 + }, + { + "epoch": 0.79, + "learning_rate": 4.292260494738068e-08, + "loss": 0.0053, + "step": 40499 + }, + { + "epoch": 0.79, + "learning_rate": 4.291872160304454e-08, + "loss": 0.0009, + "step": 40500 + }, + { + "epoch": 0.79, + "learning_rate": 4.29148382587084e-08, + "loss": 0.0282, + "step": 40501 + }, + { + "epoch": 0.79, + "learning_rate": 4.2910954914372257e-08, + "loss": 0.0006, + "step": 40502 + }, + { + "epoch": 0.79, + "learning_rate": 4.2907071570036115e-08, + "loss": 0.0076, + "step": 40503 + }, + { + "epoch": 0.79, + "learning_rate": 4.290318822569997e-08, + "loss": 0.0004, + "step": 40504 + }, + { + "epoch": 0.79, + "learning_rate": 4.289930488136383e-08, + "loss": 0.0003, + "step": 40505 + }, + { + "epoch": 0.79, + "learning_rate": 4.289542153702769e-08, + "loss": 0.0003, + "step": 40506 + }, + { + "epoch": 0.79, + "learning_rate": 4.289153819269155e-08, + "loss": 0.0557, + "step": 40507 + }, + { + "epoch": 0.79, + "learning_rate": 4.2887654848355406e-08, + "loss": 0.0005, + "step": 40508 + }, + { + "epoch": 0.79, + "learning_rate": 4.2883771504019264e-08, + "loss": 0.0004, + "step": 40509 + }, + { + "epoch": 0.79, + "learning_rate": 4.287988815968312e-08, + "loss": 0.0004, + "step": 40510 + }, + { + "epoch": 0.79, + "learning_rate": 4.2876004815346974e-08, + "loss": 0.0003, + "step": 40511 + }, + { + "epoch": 0.79, + "learning_rate": 4.287212147101083e-08, + "loss": 0.0004, + "step": 40512 + }, + { + "epoch": 0.79, + "learning_rate": 4.286823812667469e-08, + "loss": 0.0007, + "step": 40513 + }, + { + "epoch": 0.79, + "learning_rate": 4.286435478233855e-08, + "loss": 0.0004, + "step": 40514 + }, + { + "epoch": 0.79, + "learning_rate": 4.286047143800241e-08, + "loss": 0.0007, + "step": 40515 + }, + { + "epoch": 0.79, + "learning_rate": 4.2856588093666265e-08, + "loss": 0.0004, + "step": 40516 + }, + { + "epoch": 0.79, + "learning_rate": 4.2852704749330124e-08, + "loss": 0.0007, + "step": 40517 + }, + { + "epoch": 0.79, + "learning_rate": 4.284882140499398e-08, + "loss": 0.0003, + "step": 40518 + }, + { + "epoch": 0.79, + "learning_rate": 4.284493806065784e-08, + "loss": 0.0003, + "step": 40519 + }, + { + "epoch": 0.79, + "learning_rate": 4.28410547163217e-08, + "loss": 0.0007, + "step": 40520 + }, + { + "epoch": 0.79, + "learning_rate": 4.283717137198555e-08, + "loss": 0.0007, + "step": 40521 + }, + { + "epoch": 0.79, + "learning_rate": 4.283328802764941e-08, + "loss": 0.0004, + "step": 40522 + }, + { + "epoch": 0.79, + "learning_rate": 4.2829404683313267e-08, + "loss": 0.0004, + "step": 40523 + }, + { + "epoch": 0.79, + "learning_rate": 4.2825521338977125e-08, + "loss": 0.0004, + "step": 40524 + }, + { + "epoch": 0.79, + "learning_rate": 4.282163799464098e-08, + "loss": 0.0006, + "step": 40525 + }, + { + "epoch": 0.79, + "learning_rate": 4.281775465030484e-08, + "loss": 0.0004, + "step": 40526 + }, + { + "epoch": 0.79, + "learning_rate": 4.28138713059687e-08, + "loss": 0.0003, + "step": 40527 + }, + { + "epoch": 0.79, + "learning_rate": 4.280998796163255e-08, + "loss": 0.0014, + "step": 40528 + }, + { + "epoch": 0.79, + "learning_rate": 4.280610461729641e-08, + "loss": 0.0003, + "step": 40529 + }, + { + "epoch": 0.79, + "learning_rate": 4.280222127296027e-08, + "loss": 0.0005, + "step": 40530 + }, + { + "epoch": 0.79, + "learning_rate": 4.2798337928624126e-08, + "loss": 0.0004, + "step": 40531 + }, + { + "epoch": 0.79, + "learning_rate": 4.2794454584287984e-08, + "loss": 0.001, + "step": 40532 + }, + { + "epoch": 0.79, + "learning_rate": 4.279057123995184e-08, + "loss": 0.0004, + "step": 40533 + }, + { + "epoch": 0.79, + "learning_rate": 4.27866878956157e-08, + "loss": 0.0004, + "step": 40534 + }, + { + "epoch": 0.79, + "learning_rate": 4.278280455127956e-08, + "loss": 0.0321, + "step": 40535 + }, + { + "epoch": 0.79, + "learning_rate": 4.277892120694342e-08, + "loss": 0.0003, + "step": 40536 + }, + { + "epoch": 0.79, + "learning_rate": 4.2775037862607275e-08, + "loss": 0.0004, + "step": 40537 + }, + { + "epoch": 0.79, + "learning_rate": 4.2771154518271134e-08, + "loss": 0.0004, + "step": 40538 + }, + { + "epoch": 0.79, + "learning_rate": 4.276727117393499e-08, + "loss": 0.0004, + "step": 40539 + }, + { + "epoch": 0.79, + "learning_rate": 4.2763387829598843e-08, + "loss": 0.0004, + "step": 40540 + }, + { + "epoch": 0.79, + "learning_rate": 4.27595044852627e-08, + "loss": 0.0006, + "step": 40541 + }, + { + "epoch": 0.79, + "learning_rate": 4.275562114092656e-08, + "loss": 0.0003, + "step": 40542 + }, + { + "epoch": 0.79, + "learning_rate": 4.275173779659042e-08, + "loss": 0.0004, + "step": 40543 + }, + { + "epoch": 0.79, + "learning_rate": 4.2747854452254276e-08, + "loss": 0.0003, + "step": 40544 + }, + { + "epoch": 0.79, + "learning_rate": 4.2743971107918135e-08, + "loss": 0.0004, + "step": 40545 + }, + { + "epoch": 0.79, + "learning_rate": 4.274008776358199e-08, + "loss": 0.9763, + "step": 40546 + }, + { + "epoch": 0.79, + "learning_rate": 4.273620441924585e-08, + "loss": 0.0004, + "step": 40547 + }, + { + "epoch": 0.79, + "learning_rate": 4.273232107490971e-08, + "loss": 0.0003, + "step": 40548 + }, + { + "epoch": 0.79, + "learning_rate": 4.272843773057357e-08, + "loss": 0.0004, + "step": 40549 + }, + { + "epoch": 0.79, + "learning_rate": 4.2724554386237426e-08, + "loss": 0.0003, + "step": 40550 + }, + { + "epoch": 0.79, + "learning_rate": 4.2720671041901284e-08, + "loss": 0.0292, + "step": 40551 + }, + { + "epoch": 0.79, + "learning_rate": 4.271678769756514e-08, + "loss": 0.0005, + "step": 40552 + }, + { + "epoch": 0.79, + "learning_rate": 4.2712904353229e-08, + "loss": 0.0006, + "step": 40553 + }, + { + "epoch": 0.79, + "learning_rate": 4.270902100889286e-08, + "loss": 0.0004, + "step": 40554 + }, + { + "epoch": 0.79, + "learning_rate": 4.270513766455671e-08, + "loss": 1.1877, + "step": 40555 + }, + { + "epoch": 0.79, + "learning_rate": 4.270125432022057e-08, + "loss": 0.8861, + "step": 40556 + }, + { + "epoch": 0.79, + "learning_rate": 4.269737097588443e-08, + "loss": 0.0003, + "step": 40557 + }, + { + "epoch": 0.79, + "learning_rate": 4.2693487631548285e-08, + "loss": 0.0004, + "step": 40558 + }, + { + "epoch": 0.79, + "learning_rate": 4.2689604287212143e-08, + "loss": 0.0003, + "step": 40559 + }, + { + "epoch": 0.79, + "learning_rate": 4.2685720942876e-08, + "loss": 0.0005, + "step": 40560 + }, + { + "epoch": 0.79, + "learning_rate": 4.268183759853986e-08, + "loss": 0.0003, + "step": 40561 + }, + { + "epoch": 0.79, + "learning_rate": 4.267795425420372e-08, + "loss": 0.0003, + "step": 40562 + }, + { + "epoch": 0.79, + "learning_rate": 4.2674070909867576e-08, + "loss": 0.0004, + "step": 40563 + }, + { + "epoch": 0.79, + "learning_rate": 4.2670187565531435e-08, + "loss": 0.0009, + "step": 40564 + }, + { + "epoch": 0.79, + "learning_rate": 4.266630422119529e-08, + "loss": 0.0005, + "step": 40565 + }, + { + "epoch": 0.79, + "learning_rate": 4.266242087685915e-08, + "loss": 0.0004, + "step": 40566 + }, + { + "epoch": 0.79, + "learning_rate": 4.265853753252301e-08, + "loss": 0.0003, + "step": 40567 + }, + { + "epoch": 0.79, + "learning_rate": 4.265465418818687e-08, + "loss": 0.0004, + "step": 40568 + }, + { + "epoch": 0.79, + "learning_rate": 4.265077084385072e-08, + "loss": 0.0002, + "step": 40569 + }, + { + "epoch": 0.79, + "learning_rate": 4.264688749951458e-08, + "loss": 0.0007, + "step": 40570 + }, + { + "epoch": 0.79, + "learning_rate": 4.2643004155178436e-08, + "loss": 0.0008, + "step": 40571 + }, + { + "epoch": 0.79, + "learning_rate": 4.2639120810842294e-08, + "loss": 0.0004, + "step": 40572 + }, + { + "epoch": 0.79, + "learning_rate": 4.263523746650615e-08, + "loss": 0.0005, + "step": 40573 + }, + { + "epoch": 0.79, + "learning_rate": 4.263135412217001e-08, + "loss": 0.0004, + "step": 40574 + }, + { + "epoch": 0.79, + "learning_rate": 4.262747077783387e-08, + "loss": 0.0005, + "step": 40575 + }, + { + "epoch": 0.79, + "learning_rate": 4.262358743349773e-08, + "loss": 0.0004, + "step": 40576 + }, + { + "epoch": 0.79, + "learning_rate": 4.2619704089161585e-08, + "loss": 0.0003, + "step": 40577 + }, + { + "epoch": 0.79, + "learning_rate": 4.2615820744825443e-08, + "loss": 0.0014, + "step": 40578 + }, + { + "epoch": 0.79, + "learning_rate": 4.26119374004893e-08, + "loss": 0.0005, + "step": 40579 + }, + { + "epoch": 0.79, + "learning_rate": 4.260805405615316e-08, + "loss": 0.0003, + "step": 40580 + }, + { + "epoch": 0.79, + "learning_rate": 4.260417071181702e-08, + "loss": 0.0004, + "step": 40581 + }, + { + "epoch": 0.79, + "learning_rate": 4.2600287367480876e-08, + "loss": 0.0005, + "step": 40582 + }, + { + "epoch": 0.79, + "learning_rate": 4.2596404023144735e-08, + "loss": 0.0004, + "step": 40583 + }, + { + "epoch": 0.79, + "learning_rate": 4.2592520678808586e-08, + "loss": 0.0004, + "step": 40584 + }, + { + "epoch": 0.79, + "learning_rate": 4.2588637334472445e-08, + "loss": 0.0003, + "step": 40585 + }, + { + "epoch": 0.79, + "learning_rate": 4.25847539901363e-08, + "loss": 0.0013, + "step": 40586 + }, + { + "epoch": 0.79, + "learning_rate": 4.258087064580016e-08, + "loss": 0.0003, + "step": 40587 + }, + { + "epoch": 0.79, + "learning_rate": 4.257698730146402e-08, + "loss": 0.0005, + "step": 40588 + }, + { + "epoch": 0.79, + "learning_rate": 4.257310395712788e-08, + "loss": 0.0005, + "step": 40589 + }, + { + "epoch": 0.79, + "learning_rate": 4.2569220612791736e-08, + "loss": 0.0006, + "step": 40590 + }, + { + "epoch": 0.79, + "learning_rate": 4.2565337268455594e-08, + "loss": 0.0003, + "step": 40591 + }, + { + "epoch": 0.79, + "learning_rate": 4.256145392411945e-08, + "loss": 0.0002, + "step": 40592 + }, + { + "epoch": 0.79, + "learning_rate": 4.255757057978331e-08, + "loss": 0.0778, + "step": 40593 + }, + { + "epoch": 0.79, + "learning_rate": 4.255368723544717e-08, + "loss": 0.0005, + "step": 40594 + }, + { + "epoch": 0.79, + "learning_rate": 4.254980389111103e-08, + "loss": 0.0014, + "step": 40595 + }, + { + "epoch": 0.79, + "learning_rate": 4.2545920546774885e-08, + "loss": 0.0009, + "step": 40596 + }, + { + "epoch": 0.79, + "learning_rate": 4.2542037202438744e-08, + "loss": 0.0014, + "step": 40597 + }, + { + "epoch": 0.79, + "learning_rate": 4.2538153858102595e-08, + "loss": 0.0005, + "step": 40598 + }, + { + "epoch": 0.79, + "learning_rate": 4.2534270513766453e-08, + "loss": 0.0004, + "step": 40599 + }, + { + "epoch": 0.79, + "learning_rate": 4.253038716943031e-08, + "loss": 0.0005, + "step": 40600 + }, + { + "epoch": 0.79, + "learning_rate": 4.252650382509417e-08, + "loss": 0.001, + "step": 40601 + }, + { + "epoch": 0.79, + "learning_rate": 4.252262048075803e-08, + "loss": 0.0006, + "step": 40602 + }, + { + "epoch": 0.79, + "learning_rate": 4.2518737136421886e-08, + "loss": 0.5815, + "step": 40603 + }, + { + "epoch": 0.79, + "learning_rate": 4.2514853792085745e-08, + "loss": 0.0007, + "step": 40604 + }, + { + "epoch": 0.79, + "learning_rate": 4.25109704477496e-08, + "loss": 0.0004, + "step": 40605 + }, + { + "epoch": 0.79, + "learning_rate": 4.250708710341346e-08, + "loss": 0.0005, + "step": 40606 + }, + { + "epoch": 0.79, + "learning_rate": 4.250320375907732e-08, + "loss": 0.0004, + "step": 40607 + }, + { + "epoch": 0.79, + "learning_rate": 4.249932041474118e-08, + "loss": 0.0004, + "step": 40608 + }, + { + "epoch": 0.79, + "learning_rate": 4.249543707040503e-08, + "loss": 0.0005, + "step": 40609 + }, + { + "epoch": 0.79, + "learning_rate": 4.249155372606889e-08, + "loss": 0.0004, + "step": 40610 + }, + { + "epoch": 0.79, + "learning_rate": 4.2487670381732746e-08, + "loss": 0.0004, + "step": 40611 + }, + { + "epoch": 0.79, + "learning_rate": 4.2483787037396604e-08, + "loss": 0.0004, + "step": 40612 + }, + { + "epoch": 0.79, + "learning_rate": 4.247990369306046e-08, + "loss": 0.0004, + "step": 40613 + }, + { + "epoch": 0.79, + "learning_rate": 4.247602034872432e-08, + "loss": 0.0167, + "step": 40614 + }, + { + "epoch": 0.79, + "learning_rate": 4.247213700438818e-08, + "loss": 0.0004, + "step": 40615 + }, + { + "epoch": 0.79, + "learning_rate": 4.246825366005203e-08, + "loss": 0.0003, + "step": 40616 + }, + { + "epoch": 0.79, + "learning_rate": 4.246437031571589e-08, + "loss": 0.0008, + "step": 40617 + }, + { + "epoch": 0.79, + "learning_rate": 4.246048697137975e-08, + "loss": 0.0003, + "step": 40618 + }, + { + "epoch": 0.79, + "learning_rate": 4.2456603627043605e-08, + "loss": 0.0005, + "step": 40619 + }, + { + "epoch": 0.79, + "learning_rate": 4.245272028270746e-08, + "loss": 0.0004, + "step": 40620 + }, + { + "epoch": 0.79, + "learning_rate": 4.244883693837132e-08, + "loss": 0.0006, + "step": 40621 + }, + { + "epoch": 0.79, + "learning_rate": 4.244495359403518e-08, + "loss": 0.0048, + "step": 40622 + }, + { + "epoch": 0.79, + "learning_rate": 4.244107024969904e-08, + "loss": 0.0006, + "step": 40623 + }, + { + "epoch": 0.79, + "learning_rate": 4.2437186905362896e-08, + "loss": 0.0003, + "step": 40624 + }, + { + "epoch": 0.79, + "learning_rate": 4.2433303561026754e-08, + "loss": 0.0004, + "step": 40625 + }, + { + "epoch": 0.79, + "learning_rate": 4.242942021669061e-08, + "loss": 0.0004, + "step": 40626 + }, + { + "epoch": 0.79, + "learning_rate": 4.2425536872354464e-08, + "loss": 0.0005, + "step": 40627 + }, + { + "epoch": 0.79, + "learning_rate": 4.242165352801832e-08, + "loss": 0.9378, + "step": 40628 + }, + { + "epoch": 0.79, + "learning_rate": 4.241777018368218e-08, + "loss": 1.0597, + "step": 40629 + }, + { + "epoch": 0.79, + "learning_rate": 4.241388683934604e-08, + "loss": 0.0005, + "step": 40630 + }, + { + "epoch": 0.79, + "learning_rate": 4.24100034950099e-08, + "loss": 0.0006, + "step": 40631 + }, + { + "epoch": 0.79, + "learning_rate": 4.2406120150673756e-08, + "loss": 0.0004, + "step": 40632 + }, + { + "epoch": 0.79, + "learning_rate": 4.2402236806337614e-08, + "loss": 0.0004, + "step": 40633 + }, + { + "epoch": 0.79, + "learning_rate": 4.239835346200147e-08, + "loss": 0.0011, + "step": 40634 + }, + { + "epoch": 0.79, + "learning_rate": 4.239447011766533e-08, + "loss": 0.0004, + "step": 40635 + }, + { + "epoch": 0.79, + "learning_rate": 4.239058677332919e-08, + "loss": 0.4847, + "step": 40636 + }, + { + "epoch": 0.79, + "learning_rate": 4.238670342899305e-08, + "loss": 0.6546, + "step": 40637 + }, + { + "epoch": 0.79, + "learning_rate": 4.2382820084656905e-08, + "loss": 0.8635, + "step": 40638 + }, + { + "epoch": 0.79, + "learning_rate": 4.237893674032076e-08, + "loss": 0.0004, + "step": 40639 + }, + { + "epoch": 0.79, + "learning_rate": 4.237505339598462e-08, + "loss": 0.0004, + "step": 40640 + }, + { + "epoch": 0.79, + "learning_rate": 4.237117005164848e-08, + "loss": 0.0005, + "step": 40641 + }, + { + "epoch": 0.79, + "learning_rate": 4.236728670731233e-08, + "loss": 0.0006, + "step": 40642 + }, + { + "epoch": 0.79, + "learning_rate": 4.236340336297619e-08, + "loss": 0.0004, + "step": 40643 + }, + { + "epoch": 0.79, + "learning_rate": 4.235952001864005e-08, + "loss": 0.0005, + "step": 40644 + }, + { + "epoch": 0.79, + "learning_rate": 4.2355636674303906e-08, + "loss": 0.0006, + "step": 40645 + }, + { + "epoch": 0.79, + "learning_rate": 4.2351753329967764e-08, + "loss": 0.0005, + "step": 40646 + }, + { + "epoch": 0.79, + "learning_rate": 4.234786998563162e-08, + "loss": 0.0004, + "step": 40647 + }, + { + "epoch": 0.79, + "learning_rate": 4.234398664129548e-08, + "loss": 0.0003, + "step": 40648 + }, + { + "epoch": 0.79, + "learning_rate": 4.234010329695934e-08, + "loss": 0.0004, + "step": 40649 + }, + { + "epoch": 0.79, + "learning_rate": 4.23362199526232e-08, + "loss": 0.0003, + "step": 40650 + }, + { + "epoch": 0.79, + "learning_rate": 4.2332336608287056e-08, + "loss": 0.0003, + "step": 40651 + }, + { + "epoch": 0.79, + "learning_rate": 4.2328453263950914e-08, + "loss": 0.0017, + "step": 40652 + }, + { + "epoch": 0.79, + "learning_rate": 4.232456991961477e-08, + "loss": 0.0003, + "step": 40653 + }, + { + "epoch": 0.79, + "learning_rate": 4.232068657527863e-08, + "loss": 0.0004, + "step": 40654 + }, + { + "epoch": 0.79, + "learning_rate": 4.231680323094249e-08, + "loss": 0.0044, + "step": 40655 + }, + { + "epoch": 0.79, + "learning_rate": 4.231291988660634e-08, + "loss": 0.0003, + "step": 40656 + }, + { + "epoch": 0.79, + "learning_rate": 4.23090365422702e-08, + "loss": 0.0004, + "step": 40657 + }, + { + "epoch": 0.79, + "learning_rate": 4.230515319793406e-08, + "loss": 0.001, + "step": 40658 + }, + { + "epoch": 0.79, + "learning_rate": 4.2301269853597915e-08, + "loss": 0.0005, + "step": 40659 + }, + { + "epoch": 0.79, + "learning_rate": 4.229738650926177e-08, + "loss": 0.0003, + "step": 40660 + }, + { + "epoch": 0.79, + "learning_rate": 4.229350316492563e-08, + "loss": 0.0006, + "step": 40661 + }, + { + "epoch": 0.79, + "learning_rate": 4.228961982058949e-08, + "loss": 0.0003, + "step": 40662 + }, + { + "epoch": 0.79, + "learning_rate": 4.228573647625335e-08, + "loss": 0.0003, + "step": 40663 + }, + { + "epoch": 0.79, + "learning_rate": 4.2281853131917206e-08, + "loss": 0.0004, + "step": 40664 + }, + { + "epoch": 0.79, + "learning_rate": 4.2277969787581064e-08, + "loss": 0.0004, + "step": 40665 + }, + { + "epoch": 0.79, + "learning_rate": 4.227408644324492e-08, + "loss": 0.0009, + "step": 40666 + }, + { + "epoch": 0.79, + "learning_rate": 4.227020309890878e-08, + "loss": 0.0003, + "step": 40667 + }, + { + "epoch": 0.79, + "learning_rate": 4.226631975457264e-08, + "loss": 0.0004, + "step": 40668 + }, + { + "epoch": 0.79, + "learning_rate": 4.22624364102365e-08, + "loss": 0.0003, + "step": 40669 + }, + { + "epoch": 0.79, + "learning_rate": 4.2258553065900356e-08, + "loss": 0.0004, + "step": 40670 + }, + { + "epoch": 0.79, + "learning_rate": 4.225466972156421e-08, + "loss": 0.0003, + "step": 40671 + }, + { + "epoch": 0.79, + "learning_rate": 4.2250786377228066e-08, + "loss": 0.0004, + "step": 40672 + }, + { + "epoch": 0.79, + "learning_rate": 4.2246903032891924e-08, + "loss": 0.2447, + "step": 40673 + }, + { + "epoch": 0.79, + "learning_rate": 4.224301968855578e-08, + "loss": 0.0005, + "step": 40674 + }, + { + "epoch": 0.79, + "learning_rate": 4.223913634421964e-08, + "loss": 0.0005, + "step": 40675 + }, + { + "epoch": 0.79, + "learning_rate": 4.22352529998835e-08, + "loss": 0.0006, + "step": 40676 + }, + { + "epoch": 0.79, + "learning_rate": 4.223136965554736e-08, + "loss": 0.0003, + "step": 40677 + }, + { + "epoch": 0.79, + "learning_rate": 4.2227486311211215e-08, + "loss": 0.0006, + "step": 40678 + }, + { + "epoch": 0.79, + "learning_rate": 4.222360296687507e-08, + "loss": 0.0006, + "step": 40679 + }, + { + "epoch": 0.79, + "learning_rate": 4.221971962253893e-08, + "loss": 0.0006, + "step": 40680 + }, + { + "epoch": 0.79, + "learning_rate": 4.221583627820279e-08, + "loss": 0.0003, + "step": 40681 + }, + { + "epoch": 0.79, + "learning_rate": 4.221195293386665e-08, + "loss": 0.0418, + "step": 40682 + }, + { + "epoch": 0.79, + "learning_rate": 4.2208069589530506e-08, + "loss": 1.9182, + "step": 40683 + }, + { + "epoch": 0.79, + "learning_rate": 4.2204186245194364e-08, + "loss": 0.0004, + "step": 40684 + }, + { + "epoch": 0.79, + "learning_rate": 4.2200302900858216e-08, + "loss": 0.0005, + "step": 40685 + }, + { + "epoch": 0.79, + "learning_rate": 4.2196419556522074e-08, + "loss": 0.0055, + "step": 40686 + }, + { + "epoch": 0.79, + "learning_rate": 4.219253621218593e-08, + "loss": 0.0004, + "step": 40687 + }, + { + "epoch": 0.79, + "learning_rate": 4.218865286784979e-08, + "loss": 0.0007, + "step": 40688 + }, + { + "epoch": 0.79, + "learning_rate": 4.218476952351365e-08, + "loss": 0.0004, + "step": 40689 + }, + { + "epoch": 0.79, + "learning_rate": 4.218088617917751e-08, + "loss": 0.0003, + "step": 40690 + }, + { + "epoch": 0.79, + "learning_rate": 4.2177002834841366e-08, + "loss": 0.0006, + "step": 40691 + }, + { + "epoch": 0.79, + "learning_rate": 4.2173119490505224e-08, + "loss": 0.0016, + "step": 40692 + }, + { + "epoch": 0.79, + "learning_rate": 4.216923614616908e-08, + "loss": 0.0005, + "step": 40693 + }, + { + "epoch": 0.79, + "learning_rate": 4.216535280183294e-08, + "loss": 0.0008, + "step": 40694 + }, + { + "epoch": 0.79, + "learning_rate": 4.21614694574968e-08, + "loss": 0.0033, + "step": 40695 + }, + { + "epoch": 0.79, + "learning_rate": 4.215758611316066e-08, + "loss": 0.0012, + "step": 40696 + }, + { + "epoch": 0.79, + "learning_rate": 4.2153702768824515e-08, + "loss": 0.0005, + "step": 40697 + }, + { + "epoch": 0.79, + "learning_rate": 4.2149819424488367e-08, + "loss": 0.0005, + "step": 40698 + }, + { + "epoch": 0.79, + "learning_rate": 4.2145936080152225e-08, + "loss": 0.0005, + "step": 40699 + }, + { + "epoch": 0.79, + "learning_rate": 4.214205273581608e-08, + "loss": 0.0003, + "step": 40700 + }, + { + "epoch": 0.79, + "learning_rate": 4.213816939147994e-08, + "loss": 0.0005, + "step": 40701 + }, + { + "epoch": 0.79, + "learning_rate": 4.21342860471438e-08, + "loss": 0.919, + "step": 40702 + }, + { + "epoch": 0.79, + "learning_rate": 4.213040270280766e-08, + "loss": 0.0004, + "step": 40703 + }, + { + "epoch": 0.79, + "learning_rate": 4.2126519358471516e-08, + "loss": 0.0003, + "step": 40704 + }, + { + "epoch": 0.79, + "learning_rate": 4.212263601413537e-08, + "loss": 0.0003, + "step": 40705 + }, + { + "epoch": 0.79, + "learning_rate": 4.2118752669799226e-08, + "loss": 0.8161, + "step": 40706 + }, + { + "epoch": 0.79, + "learning_rate": 4.2114869325463084e-08, + "loss": 0.0125, + "step": 40707 + }, + { + "epoch": 0.79, + "learning_rate": 4.211098598112694e-08, + "loss": 0.9832, + "step": 40708 + }, + { + "epoch": 0.79, + "learning_rate": 4.21071026367908e-08, + "loss": 0.0003, + "step": 40709 + }, + { + "epoch": 0.79, + "learning_rate": 4.210321929245466e-08, + "loss": 0.0045, + "step": 40710 + }, + { + "epoch": 0.79, + "learning_rate": 4.209933594811852e-08, + "loss": 0.0021, + "step": 40711 + }, + { + "epoch": 0.79, + "learning_rate": 4.2095452603782375e-08, + "loss": 0.0007, + "step": 40712 + }, + { + "epoch": 0.79, + "learning_rate": 4.2091569259446234e-08, + "loss": 0.0011, + "step": 40713 + }, + { + "epoch": 0.79, + "learning_rate": 4.2087685915110085e-08, + "loss": 0.0007, + "step": 40714 + }, + { + "epoch": 0.79, + "learning_rate": 4.2083802570773944e-08, + "loss": 0.0066, + "step": 40715 + }, + { + "epoch": 0.79, + "learning_rate": 4.20799192264378e-08, + "loss": 0.0004, + "step": 40716 + }, + { + "epoch": 0.79, + "learning_rate": 4.207603588210166e-08, + "loss": 0.0004, + "step": 40717 + }, + { + "epoch": 0.79, + "learning_rate": 4.207215253776552e-08, + "loss": 0.0003, + "step": 40718 + }, + { + "epoch": 0.79, + "learning_rate": 4.2068269193429377e-08, + "loss": 0.0005, + "step": 40719 + }, + { + "epoch": 0.79, + "learning_rate": 4.2064385849093235e-08, + "loss": 0.0004, + "step": 40720 + }, + { + "epoch": 0.79, + "learning_rate": 4.206050250475709e-08, + "loss": 0.0005, + "step": 40721 + }, + { + "epoch": 0.79, + "learning_rate": 4.205661916042095e-08, + "loss": 0.0004, + "step": 40722 + }, + { + "epoch": 0.79, + "learning_rate": 4.205273581608481e-08, + "loss": 0.1411, + "step": 40723 + }, + { + "epoch": 0.79, + "learning_rate": 4.204885247174867e-08, + "loss": 0.0004, + "step": 40724 + }, + { + "epoch": 0.79, + "learning_rate": 4.2044969127412526e-08, + "loss": 0.0005, + "step": 40725 + }, + { + "epoch": 0.79, + "learning_rate": 4.2041085783076384e-08, + "loss": 0.0003, + "step": 40726 + }, + { + "epoch": 0.79, + "learning_rate": 4.203720243874024e-08, + "loss": 0.0004, + "step": 40727 + }, + { + "epoch": 0.79, + "learning_rate": 4.20333190944041e-08, + "loss": 0.0003, + "step": 40728 + }, + { + "epoch": 0.79, + "learning_rate": 4.202943575006795e-08, + "loss": 0.0005, + "step": 40729 + }, + { + "epoch": 0.79, + "learning_rate": 4.202555240573181e-08, + "loss": 0.0005, + "step": 40730 + }, + { + "epoch": 0.79, + "learning_rate": 4.202166906139567e-08, + "loss": 0.0006, + "step": 40731 + }, + { + "epoch": 0.79, + "learning_rate": 4.201778571705953e-08, + "loss": 0.1443, + "step": 40732 + }, + { + "epoch": 0.79, + "learning_rate": 4.2013902372723385e-08, + "loss": 0.6772, + "step": 40733 + }, + { + "epoch": 0.79, + "learning_rate": 4.2010019028387244e-08, + "loss": 0.0003, + "step": 40734 + }, + { + "epoch": 0.79, + "learning_rate": 4.20061356840511e-08, + "loss": 0.0004, + "step": 40735 + }, + { + "epoch": 0.79, + "learning_rate": 4.200225233971496e-08, + "loss": 0.0004, + "step": 40736 + }, + { + "epoch": 0.79, + "learning_rate": 4.199836899537882e-08, + "loss": 0.0004, + "step": 40737 + }, + { + "epoch": 0.79, + "learning_rate": 4.1994485651042677e-08, + "loss": 1.3653, + "step": 40738 + }, + { + "epoch": 0.79, + "learning_rate": 4.1990602306706535e-08, + "loss": 1.136, + "step": 40739 + }, + { + "epoch": 0.79, + "learning_rate": 4.198671896237039e-08, + "loss": 0.0006, + "step": 40740 + }, + { + "epoch": 0.79, + "learning_rate": 4.198283561803425e-08, + "loss": 0.0062, + "step": 40741 + }, + { + "epoch": 0.79, + "learning_rate": 4.197895227369811e-08, + "loss": 0.0003, + "step": 40742 + }, + { + "epoch": 0.79, + "learning_rate": 4.197506892936196e-08, + "loss": 0.0005, + "step": 40743 + }, + { + "epoch": 0.79, + "learning_rate": 4.197118558502582e-08, + "loss": 0.0002, + "step": 40744 + }, + { + "epoch": 0.79, + "learning_rate": 4.196730224068968e-08, + "loss": 0.0004, + "step": 40745 + }, + { + "epoch": 0.79, + "learning_rate": 4.1963418896353536e-08, + "loss": 0.0004, + "step": 40746 + }, + { + "epoch": 0.79, + "learning_rate": 4.1959535552017394e-08, + "loss": 0.0004, + "step": 40747 + }, + { + "epoch": 0.79, + "learning_rate": 4.195565220768125e-08, + "loss": 0.0004, + "step": 40748 + }, + { + "epoch": 0.79, + "learning_rate": 4.195176886334511e-08, + "loss": 0.0003, + "step": 40749 + }, + { + "epoch": 0.79, + "learning_rate": 4.194788551900897e-08, + "loss": 0.1005, + "step": 40750 + }, + { + "epoch": 0.79, + "learning_rate": 4.194400217467283e-08, + "loss": 0.0005, + "step": 40751 + }, + { + "epoch": 0.79, + "learning_rate": 4.1940118830336685e-08, + "loss": 0.0003, + "step": 40752 + }, + { + "epoch": 0.79, + "learning_rate": 4.1936235486000544e-08, + "loss": 0.0004, + "step": 40753 + }, + { + "epoch": 0.79, + "learning_rate": 4.19323521416644e-08, + "loss": 0.4286, + "step": 40754 + }, + { + "epoch": 0.79, + "learning_rate": 4.192846879732826e-08, + "loss": 0.0005, + "step": 40755 + }, + { + "epoch": 0.79, + "learning_rate": 4.192458545299212e-08, + "loss": 0.0005, + "step": 40756 + }, + { + "epoch": 0.79, + "learning_rate": 4.1920702108655977e-08, + "loss": 0.1536, + "step": 40757 + }, + { + "epoch": 0.79, + "learning_rate": 4.191681876431983e-08, + "loss": 0.0004, + "step": 40758 + }, + { + "epoch": 0.79, + "learning_rate": 4.1912935419983686e-08, + "loss": 0.0004, + "step": 40759 + }, + { + "epoch": 0.79, + "learning_rate": 4.1909052075647545e-08, + "loss": 0.0004, + "step": 40760 + }, + { + "epoch": 0.79, + "learning_rate": 4.19051687313114e-08, + "loss": 0.0071, + "step": 40761 + }, + { + "epoch": 0.79, + "learning_rate": 4.190128538697526e-08, + "loss": 0.0003, + "step": 40762 + }, + { + "epoch": 0.79, + "learning_rate": 4.189740204263912e-08, + "loss": 0.2798, + "step": 40763 + }, + { + "epoch": 0.79, + "learning_rate": 4.189351869830298e-08, + "loss": 0.0006, + "step": 40764 + }, + { + "epoch": 0.79, + "learning_rate": 4.1889635353966836e-08, + "loss": 0.0004, + "step": 40765 + }, + { + "epoch": 0.79, + "learning_rate": 4.1885752009630694e-08, + "loss": 0.0005, + "step": 40766 + }, + { + "epoch": 0.79, + "learning_rate": 4.188186866529455e-08, + "loss": 0.0005, + "step": 40767 + }, + { + "epoch": 0.79, + "learning_rate": 4.187798532095841e-08, + "loss": 0.0003, + "step": 40768 + }, + { + "epoch": 0.79, + "learning_rate": 4.187410197662227e-08, + "loss": 0.0006, + "step": 40769 + }, + { + "epoch": 0.79, + "learning_rate": 4.187021863228613e-08, + "loss": 0.8821, + "step": 40770 + }, + { + "epoch": 0.79, + "learning_rate": 4.1866335287949985e-08, + "loss": 0.0004, + "step": 40771 + }, + { + "epoch": 0.79, + "learning_rate": 4.186245194361384e-08, + "loss": 0.0006, + "step": 40772 + }, + { + "epoch": 0.79, + "learning_rate": 4.1858568599277695e-08, + "loss": 0.2264, + "step": 40773 + }, + { + "epoch": 0.79, + "learning_rate": 4.1854685254941553e-08, + "loss": 0.0003, + "step": 40774 + }, + { + "epoch": 0.79, + "learning_rate": 4.185080191060541e-08, + "loss": 0.0003, + "step": 40775 + }, + { + "epoch": 0.79, + "learning_rate": 4.184691856626927e-08, + "loss": 0.0004, + "step": 40776 + }, + { + "epoch": 0.79, + "learning_rate": 4.184303522193313e-08, + "loss": 0.0004, + "step": 40777 + }, + { + "epoch": 0.79, + "learning_rate": 4.1839151877596986e-08, + "loss": 0.6486, + "step": 40778 + }, + { + "epoch": 0.79, + "learning_rate": 4.1835268533260845e-08, + "loss": 0.0005, + "step": 40779 + }, + { + "epoch": 0.79, + "learning_rate": 4.18313851889247e-08, + "loss": 0.7295, + "step": 40780 + }, + { + "epoch": 0.79, + "learning_rate": 4.182750184458856e-08, + "loss": 1.0218, + "step": 40781 + }, + { + "epoch": 0.79, + "learning_rate": 4.182361850025242e-08, + "loss": 0.0005, + "step": 40782 + }, + { + "epoch": 0.79, + "learning_rate": 4.181973515591628e-08, + "loss": 0.0003, + "step": 40783 + }, + { + "epoch": 0.79, + "learning_rate": 4.1815851811580136e-08, + "loss": 0.0182, + "step": 40784 + }, + { + "epoch": 0.79, + "learning_rate": 4.1811968467243994e-08, + "loss": 0.0005, + "step": 40785 + }, + { + "epoch": 0.79, + "learning_rate": 4.1808085122907846e-08, + "loss": 0.0005, + "step": 40786 + }, + { + "epoch": 0.79, + "learning_rate": 4.1804201778571704e-08, + "loss": 0.0005, + "step": 40787 + }, + { + "epoch": 0.79, + "learning_rate": 4.180031843423556e-08, + "loss": 0.0005, + "step": 40788 + }, + { + "epoch": 0.79, + "learning_rate": 4.179643508989942e-08, + "loss": 0.0004, + "step": 40789 + }, + { + "epoch": 0.79, + "learning_rate": 4.179255174556328e-08, + "loss": 0.0009, + "step": 40790 + }, + { + "epoch": 0.79, + "learning_rate": 4.178866840122714e-08, + "loss": 0.0004, + "step": 40791 + }, + { + "epoch": 0.79, + "learning_rate": 4.1784785056890995e-08, + "loss": 0.0004, + "step": 40792 + }, + { + "epoch": 0.79, + "learning_rate": 4.178090171255485e-08, + "loss": 0.0039, + "step": 40793 + }, + { + "epoch": 0.79, + "learning_rate": 4.1777018368218705e-08, + "loss": 0.0004, + "step": 40794 + }, + { + "epoch": 0.79, + "learning_rate": 4.1773135023882563e-08, + "loss": 0.0009, + "step": 40795 + }, + { + "epoch": 0.79, + "learning_rate": 4.176925167954642e-08, + "loss": 0.0004, + "step": 40796 + }, + { + "epoch": 0.79, + "learning_rate": 4.176536833521028e-08, + "loss": 0.0006, + "step": 40797 + }, + { + "epoch": 0.79, + "learning_rate": 4.176148499087414e-08, + "loss": 0.0007, + "step": 40798 + }, + { + "epoch": 0.79, + "learning_rate": 4.1757601646537996e-08, + "loss": 0.0005, + "step": 40799 + }, + { + "epoch": 0.79, + "learning_rate": 4.1753718302201855e-08, + "loss": 0.0004, + "step": 40800 + }, + { + "epoch": 0.79, + "learning_rate": 4.1749834957865706e-08, + "loss": 0.0004, + "step": 40801 + }, + { + "epoch": 0.79, + "learning_rate": 4.1745951613529564e-08, + "loss": 0.0926, + "step": 40802 + }, + { + "epoch": 0.79, + "learning_rate": 4.174206826919342e-08, + "loss": 0.0003, + "step": 40803 + }, + { + "epoch": 0.79, + "learning_rate": 4.173818492485728e-08, + "loss": 0.0004, + "step": 40804 + }, + { + "epoch": 0.79, + "learning_rate": 4.173430158052114e-08, + "loss": 0.0004, + "step": 40805 + }, + { + "epoch": 0.79, + "learning_rate": 4.1730418236185e-08, + "loss": 0.6492, + "step": 40806 + }, + { + "epoch": 0.79, + "learning_rate": 4.1726534891848856e-08, + "loss": 0.0007, + "step": 40807 + }, + { + "epoch": 0.79, + "learning_rate": 4.1722651547512714e-08, + "loss": 0.0005, + "step": 40808 + }, + { + "epoch": 0.79, + "learning_rate": 4.171876820317657e-08, + "loss": 0.0005, + "step": 40809 + }, + { + "epoch": 0.79, + "learning_rate": 4.171488485884043e-08, + "loss": 0.5089, + "step": 40810 + }, + { + "epoch": 0.79, + "learning_rate": 4.171100151450429e-08, + "loss": 0.0005, + "step": 40811 + }, + { + "epoch": 0.79, + "learning_rate": 4.170711817016815e-08, + "loss": 0.0003, + "step": 40812 + }, + { + "epoch": 0.79, + "learning_rate": 4.1703234825832005e-08, + "loss": 0.0004, + "step": 40813 + }, + { + "epoch": 0.79, + "learning_rate": 4.1699351481495863e-08, + "loss": 0.0002, + "step": 40814 + }, + { + "epoch": 0.79, + "learning_rate": 4.169546813715972e-08, + "loss": 0.0014, + "step": 40815 + }, + { + "epoch": 0.79, + "learning_rate": 4.169158479282357e-08, + "loss": 0.0003, + "step": 40816 + }, + { + "epoch": 0.79, + "learning_rate": 4.168770144848743e-08, + "loss": 0.0013, + "step": 40817 + }, + { + "epoch": 0.79, + "learning_rate": 4.168381810415129e-08, + "loss": 0.001, + "step": 40818 + }, + { + "epoch": 0.79, + "learning_rate": 4.167993475981515e-08, + "loss": 0.0005, + "step": 40819 + }, + { + "epoch": 0.79, + "learning_rate": 4.1676051415479006e-08, + "loss": 0.0003, + "step": 40820 + }, + { + "epoch": 0.79, + "learning_rate": 4.1672168071142864e-08, + "loss": 0.0004, + "step": 40821 + }, + { + "epoch": 0.79, + "learning_rate": 4.166828472680672e-08, + "loss": 0.0009, + "step": 40822 + }, + { + "epoch": 0.79, + "learning_rate": 4.166440138247058e-08, + "loss": 0.0004, + "step": 40823 + }, + { + "epoch": 0.79, + "learning_rate": 4.166051803813444e-08, + "loss": 0.001, + "step": 40824 + }, + { + "epoch": 0.79, + "learning_rate": 4.16566346937983e-08, + "loss": 0.0005, + "step": 40825 + }, + { + "epoch": 0.79, + "learning_rate": 4.1652751349462156e-08, + "loss": 1.0079, + "step": 40826 + }, + { + "epoch": 0.79, + "learning_rate": 4.1648868005126014e-08, + "loss": 0.001, + "step": 40827 + }, + { + "epoch": 0.79, + "learning_rate": 4.164498466078987e-08, + "loss": 0.0004, + "step": 40828 + }, + { + "epoch": 0.79, + "learning_rate": 4.164110131645373e-08, + "loss": 0.0003, + "step": 40829 + }, + { + "epoch": 0.79, + "learning_rate": 4.163721797211758e-08, + "loss": 0.0004, + "step": 40830 + }, + { + "epoch": 0.79, + "learning_rate": 4.163333462778144e-08, + "loss": 0.0002, + "step": 40831 + }, + { + "epoch": 0.79, + "learning_rate": 4.16294512834453e-08, + "loss": 0.0009, + "step": 40832 + }, + { + "epoch": 0.79, + "learning_rate": 4.162556793910916e-08, + "loss": 0.0003, + "step": 40833 + }, + { + "epoch": 0.79, + "learning_rate": 4.1621684594773015e-08, + "loss": 0.0005, + "step": 40834 + }, + { + "epoch": 0.79, + "learning_rate": 4.161780125043687e-08, + "loss": 0.0003, + "step": 40835 + }, + { + "epoch": 0.79, + "learning_rate": 4.161391790610073e-08, + "loss": 0.0004, + "step": 40836 + }, + { + "epoch": 0.79, + "learning_rate": 4.161003456176459e-08, + "loss": 1.7965, + "step": 40837 + }, + { + "epoch": 0.79, + "learning_rate": 4.160615121742845e-08, + "loss": 0.0003, + "step": 40838 + }, + { + "epoch": 0.79, + "learning_rate": 4.1602267873092306e-08, + "loss": 0.0005, + "step": 40839 + }, + { + "epoch": 0.79, + "learning_rate": 4.1598384528756165e-08, + "loss": 1.2768, + "step": 40840 + }, + { + "epoch": 0.79, + "learning_rate": 4.159450118442002e-08, + "loss": 0.0005, + "step": 40841 + }, + { + "epoch": 0.79, + "learning_rate": 4.159061784008388e-08, + "loss": 0.0005, + "step": 40842 + }, + { + "epoch": 0.79, + "learning_rate": 4.158673449574774e-08, + "loss": 0.0005, + "step": 40843 + }, + { + "epoch": 0.79, + "learning_rate": 4.15828511514116e-08, + "loss": 0.0005, + "step": 40844 + }, + { + "epoch": 0.79, + "learning_rate": 4.157896780707545e-08, + "loss": 0.0003, + "step": 40845 + }, + { + "epoch": 0.79, + "learning_rate": 4.157508446273931e-08, + "loss": 0.0004, + "step": 40846 + }, + { + "epoch": 0.79, + "learning_rate": 4.1571201118403166e-08, + "loss": 0.0005, + "step": 40847 + }, + { + "epoch": 0.79, + "learning_rate": 4.1567317774067024e-08, + "loss": 0.0007, + "step": 40848 + }, + { + "epoch": 0.79, + "learning_rate": 4.156343442973088e-08, + "loss": 0.0003, + "step": 40849 + }, + { + "epoch": 0.79, + "learning_rate": 4.155955108539474e-08, + "loss": 0.0005, + "step": 40850 + }, + { + "epoch": 0.79, + "learning_rate": 4.15556677410586e-08, + "loss": 0.0017, + "step": 40851 + }, + { + "epoch": 0.79, + "learning_rate": 4.155178439672246e-08, + "loss": 0.0004, + "step": 40852 + }, + { + "epoch": 0.79, + "learning_rate": 4.1547901052386315e-08, + "loss": 0.0509, + "step": 40853 + }, + { + "epoch": 0.79, + "learning_rate": 4.1544017708050173e-08, + "loss": 0.0005, + "step": 40854 + }, + { + "epoch": 0.79, + "learning_rate": 4.154013436371403e-08, + "loss": 0.0004, + "step": 40855 + }, + { + "epoch": 0.79, + "learning_rate": 4.153625101937789e-08, + "loss": 0.0003, + "step": 40856 + }, + { + "epoch": 0.79, + "learning_rate": 4.153236767504175e-08, + "loss": 0.0009, + "step": 40857 + }, + { + "epoch": 0.79, + "learning_rate": 4.1528484330705606e-08, + "loss": 0.0006, + "step": 40858 + }, + { + "epoch": 0.79, + "learning_rate": 4.152460098636946e-08, + "loss": 0.0003, + "step": 40859 + }, + { + "epoch": 0.79, + "learning_rate": 4.1520717642033316e-08, + "loss": 0.0228, + "step": 40860 + }, + { + "epoch": 0.79, + "learning_rate": 4.1516834297697174e-08, + "loss": 0.0004, + "step": 40861 + }, + { + "epoch": 0.79, + "learning_rate": 4.151295095336103e-08, + "loss": 0.0003, + "step": 40862 + }, + { + "epoch": 0.79, + "learning_rate": 4.150906760902489e-08, + "loss": 0.0005, + "step": 40863 + }, + { + "epoch": 0.79, + "learning_rate": 4.150518426468875e-08, + "loss": 0.0003, + "step": 40864 + }, + { + "epoch": 0.79, + "learning_rate": 4.150130092035261e-08, + "loss": 0.0003, + "step": 40865 + }, + { + "epoch": 0.79, + "learning_rate": 4.1497417576016466e-08, + "loss": 0.0003, + "step": 40866 + }, + { + "epoch": 0.79, + "learning_rate": 4.1493534231680324e-08, + "loss": 0.0003, + "step": 40867 + }, + { + "epoch": 0.79, + "learning_rate": 4.148965088734418e-08, + "loss": 0.0008, + "step": 40868 + }, + { + "epoch": 0.79, + "learning_rate": 4.148576754300804e-08, + "loss": 0.0005, + "step": 40869 + }, + { + "epoch": 0.79, + "learning_rate": 4.14818841986719e-08, + "loss": 0.0003, + "step": 40870 + }, + { + "epoch": 0.79, + "learning_rate": 4.147800085433576e-08, + "loss": 0.1407, + "step": 40871 + }, + { + "epoch": 0.79, + "learning_rate": 4.1474117509999615e-08, + "loss": 0.0003, + "step": 40872 + }, + { + "epoch": 0.79, + "learning_rate": 4.1470234165663473e-08, + "loss": 0.0004, + "step": 40873 + }, + { + "epoch": 0.79, + "learning_rate": 4.1466350821327325e-08, + "loss": 0.0004, + "step": 40874 + }, + { + "epoch": 0.79, + "learning_rate": 4.146246747699118e-08, + "loss": 0.0024, + "step": 40875 + }, + { + "epoch": 0.79, + "learning_rate": 4.145858413265504e-08, + "loss": 0.0004, + "step": 40876 + }, + { + "epoch": 0.79, + "learning_rate": 4.14547007883189e-08, + "loss": 0.0005, + "step": 40877 + }, + { + "epoch": 0.79, + "learning_rate": 4.145081744398276e-08, + "loss": 0.0003, + "step": 40878 + }, + { + "epoch": 0.79, + "learning_rate": 4.1446934099646616e-08, + "loss": 0.0338, + "step": 40879 + }, + { + "epoch": 0.79, + "learning_rate": 4.1443050755310474e-08, + "loss": 0.0003, + "step": 40880 + }, + { + "epoch": 0.79, + "learning_rate": 4.143916741097433e-08, + "loss": 0.0004, + "step": 40881 + }, + { + "epoch": 0.79, + "learning_rate": 4.1435284066638184e-08, + "loss": 0.0004, + "step": 40882 + }, + { + "epoch": 0.79, + "learning_rate": 4.143140072230204e-08, + "loss": 0.0004, + "step": 40883 + }, + { + "epoch": 0.79, + "learning_rate": 4.14275173779659e-08, + "loss": 0.0004, + "step": 40884 + }, + { + "epoch": 0.79, + "learning_rate": 4.142363403362976e-08, + "loss": 0.0153, + "step": 40885 + }, + { + "epoch": 0.79, + "learning_rate": 4.141975068929362e-08, + "loss": 0.0008, + "step": 40886 + }, + { + "epoch": 0.79, + "learning_rate": 4.1415867344957476e-08, + "loss": 0.0004, + "step": 40887 + }, + { + "epoch": 0.79, + "learning_rate": 4.1411984000621334e-08, + "loss": 0.0013, + "step": 40888 + }, + { + "epoch": 0.79, + "learning_rate": 4.1408100656285185e-08, + "loss": 0.0839, + "step": 40889 + }, + { + "epoch": 0.79, + "learning_rate": 4.1404217311949044e-08, + "loss": 0.0004, + "step": 40890 + }, + { + "epoch": 0.79, + "learning_rate": 4.14003339676129e-08, + "loss": 0.0003, + "step": 40891 + }, + { + "epoch": 0.79, + "learning_rate": 4.139645062327676e-08, + "loss": 0.0005, + "step": 40892 + }, + { + "epoch": 0.79, + "learning_rate": 4.139256727894062e-08, + "loss": 0.0004, + "step": 40893 + }, + { + "epoch": 0.79, + "learning_rate": 4.1388683934604477e-08, + "loss": 0.0006, + "step": 40894 + }, + { + "epoch": 0.79, + "learning_rate": 4.1384800590268335e-08, + "loss": 0.0546, + "step": 40895 + }, + { + "epoch": 0.79, + "learning_rate": 4.138091724593219e-08, + "loss": 0.0004, + "step": 40896 + }, + { + "epoch": 0.79, + "learning_rate": 4.137703390159605e-08, + "loss": 0.0009, + "step": 40897 + }, + { + "epoch": 0.79, + "learning_rate": 4.137315055725991e-08, + "loss": 0.0005, + "step": 40898 + }, + { + "epoch": 0.79, + "learning_rate": 4.136926721292377e-08, + "loss": 0.0509, + "step": 40899 + }, + { + "epoch": 0.79, + "learning_rate": 4.1365383868587626e-08, + "loss": 0.0005, + "step": 40900 + }, + { + "epoch": 0.79, + "learning_rate": 4.1361500524251484e-08, + "loss": 0.4785, + "step": 40901 + }, + { + "epoch": 0.79, + "learning_rate": 4.135761717991534e-08, + "loss": 0.0004, + "step": 40902 + }, + { + "epoch": 0.79, + "learning_rate": 4.1353733835579194e-08, + "loss": 0.0004, + "step": 40903 + }, + { + "epoch": 0.79, + "learning_rate": 4.134985049124305e-08, + "loss": 0.0005, + "step": 40904 + }, + { + "epoch": 0.79, + "learning_rate": 4.134596714690691e-08, + "loss": 0.0005, + "step": 40905 + }, + { + "epoch": 0.79, + "learning_rate": 4.134208380257077e-08, + "loss": 0.0003, + "step": 40906 + }, + { + "epoch": 0.79, + "learning_rate": 4.133820045823463e-08, + "loss": 0.0005, + "step": 40907 + }, + { + "epoch": 0.79, + "learning_rate": 4.1334317113898485e-08, + "loss": 0.1963, + "step": 40908 + }, + { + "epoch": 0.79, + "learning_rate": 4.1330433769562344e-08, + "loss": 0.0003, + "step": 40909 + }, + { + "epoch": 0.79, + "learning_rate": 4.13265504252262e-08, + "loss": 0.6477, + "step": 40910 + }, + { + "epoch": 0.79, + "learning_rate": 4.132266708089006e-08, + "loss": 0.053, + "step": 40911 + }, + { + "epoch": 0.79, + "learning_rate": 4.131878373655392e-08, + "loss": 0.001, + "step": 40912 + }, + { + "epoch": 0.79, + "learning_rate": 4.1314900392217777e-08, + "loss": 0.0004, + "step": 40913 + }, + { + "epoch": 0.79, + "learning_rate": 4.1311017047881635e-08, + "loss": 0.0005, + "step": 40914 + }, + { + "epoch": 0.79, + "learning_rate": 4.130713370354549e-08, + "loss": 0.0073, + "step": 40915 + }, + { + "epoch": 0.79, + "learning_rate": 4.130325035920935e-08, + "loss": 0.5908, + "step": 40916 + }, + { + "epoch": 0.79, + "learning_rate": 4.12993670148732e-08, + "loss": 0.0005, + "step": 40917 + }, + { + "epoch": 0.79, + "learning_rate": 4.129548367053706e-08, + "loss": 0.0004, + "step": 40918 + }, + { + "epoch": 0.79, + "learning_rate": 4.129160032620092e-08, + "loss": 0.0005, + "step": 40919 + }, + { + "epoch": 0.79, + "learning_rate": 4.128771698186478e-08, + "loss": 0.0005, + "step": 40920 + }, + { + "epoch": 0.79, + "learning_rate": 4.1283833637528636e-08, + "loss": 0.0004, + "step": 40921 + }, + { + "epoch": 0.79, + "learning_rate": 4.1279950293192494e-08, + "loss": 0.0033, + "step": 40922 + }, + { + "epoch": 0.79, + "learning_rate": 4.127606694885635e-08, + "loss": 0.0004, + "step": 40923 + }, + { + "epoch": 0.79, + "learning_rate": 4.127218360452021e-08, + "loss": 0.1865, + "step": 40924 + }, + { + "epoch": 0.79, + "learning_rate": 4.126830026018407e-08, + "loss": 0.0003, + "step": 40925 + }, + { + "epoch": 0.79, + "learning_rate": 4.126441691584793e-08, + "loss": 0.0004, + "step": 40926 + }, + { + "epoch": 0.79, + "learning_rate": 4.1260533571511785e-08, + "loss": 0.0004, + "step": 40927 + }, + { + "epoch": 0.79, + "learning_rate": 4.1256650227175644e-08, + "loss": 0.0004, + "step": 40928 + }, + { + "epoch": 0.79, + "learning_rate": 4.12527668828395e-08, + "loss": 0.0003, + "step": 40929 + }, + { + "epoch": 0.79, + "learning_rate": 4.124888353850336e-08, + "loss": 0.0004, + "step": 40930 + }, + { + "epoch": 0.79, + "learning_rate": 4.124500019416722e-08, + "loss": 0.0008, + "step": 40931 + }, + { + "epoch": 0.79, + "learning_rate": 4.124111684983107e-08, + "loss": 0.001, + "step": 40932 + }, + { + "epoch": 0.79, + "learning_rate": 4.123723350549493e-08, + "loss": 0.0004, + "step": 40933 + }, + { + "epoch": 0.79, + "learning_rate": 4.1233350161158787e-08, + "loss": 0.0003, + "step": 40934 + }, + { + "epoch": 0.79, + "learning_rate": 4.1229466816822645e-08, + "loss": 0.0005, + "step": 40935 + }, + { + "epoch": 0.79, + "learning_rate": 4.12255834724865e-08, + "loss": 0.0004, + "step": 40936 + }, + { + "epoch": 0.79, + "learning_rate": 4.122170012815036e-08, + "loss": 0.0003, + "step": 40937 + }, + { + "epoch": 0.79, + "learning_rate": 4.121781678381422e-08, + "loss": 0.0005, + "step": 40938 + }, + { + "epoch": 0.79, + "learning_rate": 4.121393343947808e-08, + "loss": 0.0008, + "step": 40939 + }, + { + "epoch": 0.79, + "learning_rate": 4.1210050095141936e-08, + "loss": 0.0004, + "step": 40940 + }, + { + "epoch": 0.79, + "learning_rate": 4.1206166750805794e-08, + "loss": 0.0003, + "step": 40941 + }, + { + "epoch": 0.79, + "learning_rate": 4.120228340646965e-08, + "loss": 0.0005, + "step": 40942 + }, + { + "epoch": 0.79, + "learning_rate": 4.119840006213351e-08, + "loss": 0.0005, + "step": 40943 + }, + { + "epoch": 0.79, + "learning_rate": 4.119451671779737e-08, + "loss": 0.0004, + "step": 40944 + }, + { + "epoch": 0.79, + "learning_rate": 4.119063337346123e-08, + "loss": 0.0005, + "step": 40945 + }, + { + "epoch": 0.79, + "learning_rate": 4.118675002912508e-08, + "loss": 0.0028, + "step": 40946 + }, + { + "epoch": 0.79, + "learning_rate": 4.118286668478894e-08, + "loss": 0.0006, + "step": 40947 + }, + { + "epoch": 0.79, + "learning_rate": 4.1178983340452795e-08, + "loss": 0.0004, + "step": 40948 + }, + { + "epoch": 0.79, + "learning_rate": 4.1175099996116654e-08, + "loss": 0.0008, + "step": 40949 + }, + { + "epoch": 0.79, + "learning_rate": 4.117121665178051e-08, + "loss": 0.0007, + "step": 40950 + }, + { + "epoch": 0.79, + "learning_rate": 4.116733330744437e-08, + "loss": 0.0004, + "step": 40951 + }, + { + "epoch": 0.79, + "learning_rate": 4.116344996310823e-08, + "loss": 0.001, + "step": 40952 + }, + { + "epoch": 0.79, + "learning_rate": 4.1159566618772087e-08, + "loss": 0.0006, + "step": 40953 + }, + { + "epoch": 0.79, + "learning_rate": 4.1155683274435945e-08, + "loss": 0.0004, + "step": 40954 + }, + { + "epoch": 0.79, + "learning_rate": 4.11517999300998e-08, + "loss": 0.0011, + "step": 40955 + }, + { + "epoch": 0.79, + "learning_rate": 4.114791658576366e-08, + "loss": 0.0005, + "step": 40956 + }, + { + "epoch": 0.79, + "learning_rate": 4.114403324142752e-08, + "loss": 0.0009, + "step": 40957 + }, + { + "epoch": 0.79, + "learning_rate": 4.114014989709138e-08, + "loss": 0.0007, + "step": 40958 + }, + { + "epoch": 0.79, + "learning_rate": 4.1136266552755236e-08, + "loss": 0.0004, + "step": 40959 + }, + { + "epoch": 0.79, + "learning_rate": 4.1132383208419094e-08, + "loss": 0.0008, + "step": 40960 + }, + { + "epoch": 0.79, + "learning_rate": 4.1128499864082946e-08, + "loss": 0.0004, + "step": 40961 + }, + { + "epoch": 0.79, + "learning_rate": 4.1124616519746804e-08, + "loss": 0.0003, + "step": 40962 + }, + { + "epoch": 0.79, + "learning_rate": 4.112073317541066e-08, + "loss": 0.0004, + "step": 40963 + }, + { + "epoch": 0.79, + "learning_rate": 4.111684983107452e-08, + "loss": 0.0005, + "step": 40964 + }, + { + "epoch": 0.79, + "learning_rate": 4.111296648673838e-08, + "loss": 0.0008, + "step": 40965 + }, + { + "epoch": 0.79, + "learning_rate": 4.110908314240224e-08, + "loss": 0.0004, + "step": 40966 + }, + { + "epoch": 0.79, + "learning_rate": 4.1105199798066095e-08, + "loss": 0.0002, + "step": 40967 + }, + { + "epoch": 0.79, + "learning_rate": 4.1101316453729954e-08, + "loss": 0.0004, + "step": 40968 + }, + { + "epoch": 0.79, + "learning_rate": 4.109743310939381e-08, + "loss": 0.0003, + "step": 40969 + }, + { + "epoch": 0.79, + "learning_rate": 4.1093549765057663e-08, + "loss": 0.0004, + "step": 40970 + }, + { + "epoch": 0.79, + "learning_rate": 4.108966642072152e-08, + "loss": 0.0004, + "step": 40971 + }, + { + "epoch": 0.79, + "learning_rate": 4.108578307638538e-08, + "loss": 0.0004, + "step": 40972 + }, + { + "epoch": 0.79, + "learning_rate": 4.108189973204924e-08, + "loss": 0.0005, + "step": 40973 + }, + { + "epoch": 0.79, + "learning_rate": 4.1078016387713096e-08, + "loss": 0.0004, + "step": 40974 + }, + { + "epoch": 0.79, + "learning_rate": 4.1074133043376955e-08, + "loss": 0.1304, + "step": 40975 + }, + { + "epoch": 0.79, + "learning_rate": 4.107024969904081e-08, + "loss": 0.0004, + "step": 40976 + }, + { + "epoch": 0.79, + "learning_rate": 4.106636635470467e-08, + "loss": 0.0003, + "step": 40977 + }, + { + "epoch": 0.79, + "learning_rate": 4.106248301036852e-08, + "loss": 0.0008, + "step": 40978 + }, + { + "epoch": 0.79, + "learning_rate": 4.105859966603238e-08, + "loss": 0.0005, + "step": 40979 + }, + { + "epoch": 0.79, + "learning_rate": 4.105471632169624e-08, + "loss": 0.0005, + "step": 40980 + }, + { + "epoch": 0.79, + "learning_rate": 4.10508329773601e-08, + "loss": 0.0004, + "step": 40981 + }, + { + "epoch": 0.79, + "learning_rate": 4.1046949633023956e-08, + "loss": 0.0004, + "step": 40982 + }, + { + "epoch": 0.79, + "learning_rate": 4.1043066288687814e-08, + "loss": 0.0005, + "step": 40983 + }, + { + "epoch": 0.8, + "learning_rate": 4.103918294435167e-08, + "loss": 0.0003, + "step": 40984 + }, + { + "epoch": 0.8, + "learning_rate": 4.103529960001553e-08, + "loss": 0.3293, + "step": 40985 + }, + { + "epoch": 0.8, + "learning_rate": 4.103141625567939e-08, + "loss": 0.0004, + "step": 40986 + }, + { + "epoch": 0.8, + "learning_rate": 4.102753291134325e-08, + "loss": 0.0004, + "step": 40987 + }, + { + "epoch": 0.8, + "learning_rate": 4.1023649567007105e-08, + "loss": 0.0003, + "step": 40988 + }, + { + "epoch": 0.8, + "learning_rate": 4.1019766222670964e-08, + "loss": 0.0004, + "step": 40989 + }, + { + "epoch": 0.8, + "learning_rate": 4.1015882878334815e-08, + "loss": 0.0003, + "step": 40990 + }, + { + "epoch": 0.8, + "learning_rate": 4.1011999533998673e-08, + "loss": 0.0004, + "step": 40991 + }, + { + "epoch": 0.8, + "learning_rate": 4.100811618966253e-08, + "loss": 0.0003, + "step": 40992 + }, + { + "epoch": 0.8, + "learning_rate": 4.100423284532639e-08, + "loss": 0.0003, + "step": 40993 + }, + { + "epoch": 0.8, + "learning_rate": 4.100034950099025e-08, + "loss": 0.0004, + "step": 40994 + }, + { + "epoch": 0.8, + "learning_rate": 4.0996466156654106e-08, + "loss": 0.0022, + "step": 40995 + }, + { + "epoch": 0.8, + "learning_rate": 4.0992582812317965e-08, + "loss": 0.0004, + "step": 40996 + }, + { + "epoch": 0.8, + "learning_rate": 4.098869946798182e-08, + "loss": 0.0005, + "step": 40997 + }, + { + "epoch": 0.8, + "learning_rate": 4.098481612364568e-08, + "loss": 0.0003, + "step": 40998 + }, + { + "epoch": 0.8, + "learning_rate": 4.098093277930954e-08, + "loss": 0.0004, + "step": 40999 + }, + { + "epoch": 0.8, + "learning_rate": 4.09770494349734e-08, + "loss": 0.0003, + "step": 41000 + }, + { + "epoch": 0.8, + "learning_rate": 4.0973166090637256e-08, + "loss": 0.0292, + "step": 41001 + }, + { + "epoch": 0.8, + "learning_rate": 4.0969282746301114e-08, + "loss": 0.2059, + "step": 41002 + }, + { + "epoch": 0.8, + "learning_rate": 4.096539940196497e-08, + "loss": 1.0095, + "step": 41003 + }, + { + "epoch": 0.8, + "learning_rate": 4.0961516057628824e-08, + "loss": 0.0002, + "step": 41004 + }, + { + "epoch": 0.8, + "learning_rate": 4.095763271329268e-08, + "loss": 0.3479, + "step": 41005 + }, + { + "epoch": 0.8, + "learning_rate": 4.095374936895654e-08, + "loss": 0.0005, + "step": 41006 + }, + { + "epoch": 0.8, + "learning_rate": 4.09498660246204e-08, + "loss": 0.0005, + "step": 41007 + }, + { + "epoch": 0.8, + "learning_rate": 4.094598268028426e-08, + "loss": 0.0003, + "step": 41008 + }, + { + "epoch": 0.8, + "learning_rate": 4.0942099335948115e-08, + "loss": 0.0004, + "step": 41009 + }, + { + "epoch": 0.8, + "learning_rate": 4.0938215991611973e-08, + "loss": 0.0003, + "step": 41010 + }, + { + "epoch": 0.8, + "learning_rate": 4.093433264727583e-08, + "loss": 0.0005, + "step": 41011 + }, + { + "epoch": 0.8, + "learning_rate": 4.093044930293969e-08, + "loss": 0.0002, + "step": 41012 + }, + { + "epoch": 0.8, + "learning_rate": 4.092656595860355e-08, + "loss": 0.0003, + "step": 41013 + }, + { + "epoch": 0.8, + "learning_rate": 4.0922682614267406e-08, + "loss": 0.0003, + "step": 41014 + }, + { + "epoch": 0.8, + "learning_rate": 4.0918799269931265e-08, + "loss": 0.0004, + "step": 41015 + }, + { + "epoch": 0.8, + "learning_rate": 4.091491592559512e-08, + "loss": 0.0006, + "step": 41016 + }, + { + "epoch": 0.8, + "learning_rate": 4.091103258125898e-08, + "loss": 0.0003, + "step": 41017 + }, + { + "epoch": 0.8, + "learning_rate": 4.090714923692284e-08, + "loss": 0.2291, + "step": 41018 + }, + { + "epoch": 0.8, + "learning_rate": 4.090326589258669e-08, + "loss": 0.0003, + "step": 41019 + }, + { + "epoch": 0.8, + "learning_rate": 4.089938254825055e-08, + "loss": 0.0006, + "step": 41020 + }, + { + "epoch": 0.8, + "learning_rate": 4.089549920391441e-08, + "loss": 0.0004, + "step": 41021 + }, + { + "epoch": 0.8, + "learning_rate": 4.0891615859578266e-08, + "loss": 0.0003, + "step": 41022 + }, + { + "epoch": 0.8, + "learning_rate": 4.0887732515242124e-08, + "loss": 0.0003, + "step": 41023 + }, + { + "epoch": 0.8, + "learning_rate": 4.088384917090598e-08, + "loss": 0.0018, + "step": 41024 + }, + { + "epoch": 0.8, + "learning_rate": 4.087996582656984e-08, + "loss": 0.0003, + "step": 41025 + }, + { + "epoch": 0.8, + "learning_rate": 4.08760824822337e-08, + "loss": 0.0004, + "step": 41026 + }, + { + "epoch": 0.8, + "learning_rate": 4.087219913789756e-08, + "loss": 0.4831, + "step": 41027 + }, + { + "epoch": 0.8, + "learning_rate": 4.0868315793561415e-08, + "loss": 0.0004, + "step": 41028 + }, + { + "epoch": 0.8, + "learning_rate": 4.0864432449225273e-08, + "loss": 0.4354, + "step": 41029 + }, + { + "epoch": 0.8, + "learning_rate": 4.086054910488913e-08, + "loss": 0.0004, + "step": 41030 + }, + { + "epoch": 0.8, + "learning_rate": 4.085666576055299e-08, + "loss": 0.0007, + "step": 41031 + }, + { + "epoch": 0.8, + "learning_rate": 4.085278241621685e-08, + "loss": 0.0004, + "step": 41032 + }, + { + "epoch": 0.8, + "learning_rate": 4.08488990718807e-08, + "loss": 0.0006, + "step": 41033 + }, + { + "epoch": 0.8, + "learning_rate": 4.084501572754456e-08, + "loss": 0.0004, + "step": 41034 + }, + { + "epoch": 0.8, + "learning_rate": 4.0841132383208416e-08, + "loss": 0.0003, + "step": 41035 + }, + { + "epoch": 0.8, + "learning_rate": 4.0837249038872275e-08, + "loss": 0.0004, + "step": 41036 + }, + { + "epoch": 0.8, + "learning_rate": 4.083336569453613e-08, + "loss": 0.0267, + "step": 41037 + }, + { + "epoch": 0.8, + "learning_rate": 4.082948235019999e-08, + "loss": 0.0004, + "step": 41038 + }, + { + "epoch": 0.8, + "learning_rate": 4.082559900586385e-08, + "loss": 0.0004, + "step": 41039 + }, + { + "epoch": 0.8, + "learning_rate": 4.082171566152771e-08, + "loss": 0.0004, + "step": 41040 + }, + { + "epoch": 0.8, + "learning_rate": 4.0817832317191566e-08, + "loss": 0.0004, + "step": 41041 + }, + { + "epoch": 0.8, + "learning_rate": 4.0813948972855424e-08, + "loss": 0.0004, + "step": 41042 + }, + { + "epoch": 0.8, + "learning_rate": 4.081006562851928e-08, + "loss": 0.0005, + "step": 41043 + }, + { + "epoch": 0.8, + "learning_rate": 4.080618228418314e-08, + "loss": 0.0005, + "step": 41044 + }, + { + "epoch": 0.8, + "learning_rate": 4.0802298939847e-08, + "loss": 0.0009, + "step": 41045 + }, + { + "epoch": 0.8, + "learning_rate": 4.079841559551086e-08, + "loss": 0.6739, + "step": 41046 + }, + { + "epoch": 0.8, + "learning_rate": 4.0794532251174715e-08, + "loss": 0.0003, + "step": 41047 + }, + { + "epoch": 0.8, + "learning_rate": 4.079064890683857e-08, + "loss": 0.0004, + "step": 41048 + }, + { + "epoch": 0.8, + "learning_rate": 4.0786765562502425e-08, + "loss": 0.0004, + "step": 41049 + }, + { + "epoch": 0.8, + "learning_rate": 4.0782882218166283e-08, + "loss": 0.0005, + "step": 41050 + }, + { + "epoch": 0.8, + "learning_rate": 4.077899887383014e-08, + "loss": 0.0005, + "step": 41051 + }, + { + "epoch": 0.8, + "learning_rate": 4.0775115529494e-08, + "loss": 0.0004, + "step": 41052 + }, + { + "epoch": 0.8, + "learning_rate": 4.077123218515786e-08, + "loss": 0.0005, + "step": 41053 + }, + { + "epoch": 0.8, + "learning_rate": 4.0767348840821716e-08, + "loss": 0.0003, + "step": 41054 + }, + { + "epoch": 0.8, + "learning_rate": 4.0763465496485575e-08, + "loss": 0.0004, + "step": 41055 + }, + { + "epoch": 0.8, + "learning_rate": 4.075958215214943e-08, + "loss": 0.0004, + "step": 41056 + }, + { + "epoch": 0.8, + "learning_rate": 4.075569880781329e-08, + "loss": 0.0186, + "step": 41057 + }, + { + "epoch": 0.8, + "learning_rate": 4.075181546347715e-08, + "loss": 0.0004, + "step": 41058 + }, + { + "epoch": 0.8, + "learning_rate": 4.0747932119141e-08, + "loss": 0.0004, + "step": 41059 + }, + { + "epoch": 0.8, + "learning_rate": 4.074404877480486e-08, + "loss": 0.0006, + "step": 41060 + }, + { + "epoch": 0.8, + "learning_rate": 4.074016543046872e-08, + "loss": 0.0003, + "step": 41061 + }, + { + "epoch": 0.8, + "learning_rate": 4.0736282086132576e-08, + "loss": 0.0004, + "step": 41062 + }, + { + "epoch": 0.8, + "learning_rate": 4.0732398741796434e-08, + "loss": 0.0006, + "step": 41063 + }, + { + "epoch": 0.8, + "learning_rate": 4.072851539746029e-08, + "loss": 0.0003, + "step": 41064 + }, + { + "epoch": 0.8, + "learning_rate": 4.072463205312415e-08, + "loss": 0.0013, + "step": 41065 + }, + { + "epoch": 0.8, + "learning_rate": 4.0720748708788e-08, + "loss": 0.4795, + "step": 41066 + }, + { + "epoch": 0.8, + "learning_rate": 4.071686536445186e-08, + "loss": 0.0004, + "step": 41067 + }, + { + "epoch": 0.8, + "learning_rate": 4.071298202011572e-08, + "loss": 0.0004, + "step": 41068 + }, + { + "epoch": 0.8, + "learning_rate": 4.070909867577958e-08, + "loss": 0.0014, + "step": 41069 + }, + { + "epoch": 0.8, + "learning_rate": 4.0705215331443435e-08, + "loss": 0.0004, + "step": 41070 + }, + { + "epoch": 0.8, + "learning_rate": 4.070133198710729e-08, + "loss": 0.0013, + "step": 41071 + }, + { + "epoch": 0.8, + "learning_rate": 4.069744864277115e-08, + "loss": 0.0004, + "step": 41072 + }, + { + "epoch": 0.8, + "learning_rate": 4.069356529843501e-08, + "loss": 0.0006, + "step": 41073 + }, + { + "epoch": 0.8, + "learning_rate": 4.068968195409887e-08, + "loss": 0.0003, + "step": 41074 + }, + { + "epoch": 0.8, + "learning_rate": 4.0685798609762726e-08, + "loss": 0.0005, + "step": 41075 + }, + { + "epoch": 0.8, + "learning_rate": 4.0681915265426584e-08, + "loss": 0.0033, + "step": 41076 + }, + { + "epoch": 0.8, + "learning_rate": 4.0678031921090436e-08, + "loss": 0.0004, + "step": 41077 + }, + { + "epoch": 0.8, + "learning_rate": 4.0674148576754294e-08, + "loss": 0.0008, + "step": 41078 + }, + { + "epoch": 0.8, + "learning_rate": 4.067026523241815e-08, + "loss": 0.0005, + "step": 41079 + }, + { + "epoch": 0.8, + "learning_rate": 4.066638188808201e-08, + "loss": 0.0004, + "step": 41080 + }, + { + "epoch": 0.8, + "learning_rate": 4.066249854374587e-08, + "loss": 0.0003, + "step": 41081 + }, + { + "epoch": 0.8, + "learning_rate": 4.065861519940973e-08, + "loss": 0.0004, + "step": 41082 + }, + { + "epoch": 0.8, + "learning_rate": 4.0654731855073586e-08, + "loss": 0.0004, + "step": 41083 + }, + { + "epoch": 0.8, + "learning_rate": 4.0650848510737444e-08, + "loss": 0.041, + "step": 41084 + }, + { + "epoch": 0.8, + "learning_rate": 4.06469651664013e-08, + "loss": 0.0003, + "step": 41085 + }, + { + "epoch": 0.8, + "learning_rate": 4.064308182206516e-08, + "loss": 0.0006, + "step": 41086 + }, + { + "epoch": 0.8, + "learning_rate": 4.063919847772902e-08, + "loss": 0.0006, + "step": 41087 + }, + { + "epoch": 0.8, + "learning_rate": 4.063531513339288e-08, + "loss": 0.0024, + "step": 41088 + }, + { + "epoch": 0.8, + "learning_rate": 4.0631431789056735e-08, + "loss": 0.0003, + "step": 41089 + }, + { + "epoch": 0.8, + "learning_rate": 4.062754844472059e-08, + "loss": 0.0005, + "step": 41090 + }, + { + "epoch": 0.8, + "learning_rate": 4.0623665100384445e-08, + "loss": 0.0004, + "step": 41091 + }, + { + "epoch": 0.8, + "learning_rate": 4.06197817560483e-08, + "loss": 0.0003, + "step": 41092 + }, + { + "epoch": 0.8, + "learning_rate": 4.061589841171216e-08, + "loss": 0.0004, + "step": 41093 + }, + { + "epoch": 0.8, + "learning_rate": 4.061201506737602e-08, + "loss": 0.0005, + "step": 41094 + }, + { + "epoch": 0.8, + "learning_rate": 4.060813172303988e-08, + "loss": 0.0005, + "step": 41095 + }, + { + "epoch": 0.8, + "learning_rate": 4.0604248378703736e-08, + "loss": 0.0003, + "step": 41096 + }, + { + "epoch": 0.8, + "learning_rate": 4.0600365034367594e-08, + "loss": 0.0391, + "step": 41097 + }, + { + "epoch": 0.8, + "learning_rate": 4.059648169003145e-08, + "loss": 0.0005, + "step": 41098 + }, + { + "epoch": 0.8, + "learning_rate": 4.059259834569531e-08, + "loss": 0.001, + "step": 41099 + }, + { + "epoch": 0.8, + "learning_rate": 4.058871500135917e-08, + "loss": 0.0007, + "step": 41100 + }, + { + "epoch": 0.8, + "learning_rate": 4.058483165702303e-08, + "loss": 0.0003, + "step": 41101 + }, + { + "epoch": 0.8, + "learning_rate": 4.0580948312686886e-08, + "loss": 1.1954, + "step": 41102 + }, + { + "epoch": 0.8, + "learning_rate": 4.0577064968350744e-08, + "loss": 0.0003, + "step": 41103 + }, + { + "epoch": 0.8, + "learning_rate": 4.05731816240146e-08, + "loss": 0.0004, + "step": 41104 + }, + { + "epoch": 0.8, + "learning_rate": 4.056929827967846e-08, + "loss": 0.0004, + "step": 41105 + }, + { + "epoch": 0.8, + "learning_rate": 4.056541493534231e-08, + "loss": 0.0003, + "step": 41106 + }, + { + "epoch": 0.8, + "learning_rate": 4.056153159100617e-08, + "loss": 0.0004, + "step": 41107 + }, + { + "epoch": 0.8, + "learning_rate": 4.055764824667003e-08, + "loss": 0.0007, + "step": 41108 + }, + { + "epoch": 0.8, + "learning_rate": 4.0553764902333887e-08, + "loss": 0.0003, + "step": 41109 + }, + { + "epoch": 0.8, + "learning_rate": 4.0549881557997745e-08, + "loss": 0.0004, + "step": 41110 + }, + { + "epoch": 0.8, + "learning_rate": 4.05459982136616e-08, + "loss": 0.0004, + "step": 41111 + }, + { + "epoch": 0.8, + "learning_rate": 4.054211486932546e-08, + "loss": 0.0004, + "step": 41112 + }, + { + "epoch": 0.8, + "learning_rate": 4.053823152498932e-08, + "loss": 0.0006, + "step": 41113 + }, + { + "epoch": 0.8, + "learning_rate": 4.053434818065318e-08, + "loss": 0.0003, + "step": 41114 + }, + { + "epoch": 0.8, + "learning_rate": 4.0530464836317036e-08, + "loss": 0.2423, + "step": 41115 + }, + { + "epoch": 0.8, + "learning_rate": 4.0526581491980894e-08, + "loss": 0.0004, + "step": 41116 + }, + { + "epoch": 0.8, + "learning_rate": 4.052269814764475e-08, + "loss": 0.0004, + "step": 41117 + }, + { + "epoch": 0.8, + "learning_rate": 4.051881480330861e-08, + "loss": 0.0004, + "step": 41118 + }, + { + "epoch": 0.8, + "learning_rate": 4.051493145897247e-08, + "loss": 0.0004, + "step": 41119 + }, + { + "epoch": 0.8, + "learning_rate": 4.051104811463632e-08, + "loss": 0.0003, + "step": 41120 + }, + { + "epoch": 0.8, + "learning_rate": 4.050716477030018e-08, + "loss": 0.1989, + "step": 41121 + }, + { + "epoch": 0.8, + "learning_rate": 4.050328142596404e-08, + "loss": 0.0003, + "step": 41122 + }, + { + "epoch": 0.8, + "learning_rate": 4.0499398081627895e-08, + "loss": 0.0005, + "step": 41123 + }, + { + "epoch": 0.8, + "learning_rate": 4.0495514737291754e-08, + "loss": 0.0008, + "step": 41124 + }, + { + "epoch": 0.8, + "learning_rate": 4.049163139295561e-08, + "loss": 0.2197, + "step": 41125 + }, + { + "epoch": 0.8, + "learning_rate": 4.048774804861947e-08, + "loss": 0.0004, + "step": 41126 + }, + { + "epoch": 0.8, + "learning_rate": 4.048386470428333e-08, + "loss": 0.0005, + "step": 41127 + }, + { + "epoch": 0.8, + "learning_rate": 4.0479981359947187e-08, + "loss": 0.0021, + "step": 41128 + }, + { + "epoch": 0.8, + "learning_rate": 4.0476098015611045e-08, + "loss": 0.0006, + "step": 41129 + }, + { + "epoch": 0.8, + "learning_rate": 4.04722146712749e-08, + "loss": 0.0005, + "step": 41130 + }, + { + "epoch": 0.8, + "learning_rate": 4.046833132693876e-08, + "loss": 0.0003, + "step": 41131 + }, + { + "epoch": 0.8, + "learning_rate": 4.046444798260262e-08, + "loss": 0.0004, + "step": 41132 + }, + { + "epoch": 0.8, + "learning_rate": 4.046056463826648e-08, + "loss": 0.0301, + "step": 41133 + }, + { + "epoch": 0.8, + "learning_rate": 4.0456681293930336e-08, + "loss": 0.0005, + "step": 41134 + }, + { + "epoch": 0.8, + "learning_rate": 4.045279794959419e-08, + "loss": 0.0004, + "step": 41135 + }, + { + "epoch": 0.8, + "learning_rate": 4.0448914605258046e-08, + "loss": 0.0003, + "step": 41136 + }, + { + "epoch": 0.8, + "learning_rate": 4.0445031260921904e-08, + "loss": 0.7943, + "step": 41137 + }, + { + "epoch": 0.8, + "learning_rate": 4.044114791658576e-08, + "loss": 0.0005, + "step": 41138 + }, + { + "epoch": 0.8, + "learning_rate": 4.043726457224962e-08, + "loss": 1.0275, + "step": 41139 + }, + { + "epoch": 0.8, + "learning_rate": 4.043338122791348e-08, + "loss": 0.0004, + "step": 41140 + }, + { + "epoch": 0.8, + "learning_rate": 4.042949788357734e-08, + "loss": 0.0005, + "step": 41141 + }, + { + "epoch": 0.8, + "learning_rate": 4.0425614539241195e-08, + "loss": 0.573, + "step": 41142 + }, + { + "epoch": 0.8, + "learning_rate": 4.0421731194905054e-08, + "loss": 0.0004, + "step": 41143 + }, + { + "epoch": 0.8, + "learning_rate": 4.041784785056891e-08, + "loss": 0.0008, + "step": 41144 + }, + { + "epoch": 0.8, + "learning_rate": 4.041396450623277e-08, + "loss": 0.0003, + "step": 41145 + }, + { + "epoch": 0.8, + "learning_rate": 4.041008116189663e-08, + "loss": 0.0004, + "step": 41146 + }, + { + "epoch": 0.8, + "learning_rate": 4.040619781756048e-08, + "loss": 0.0003, + "step": 41147 + }, + { + "epoch": 0.8, + "learning_rate": 4.040231447322434e-08, + "loss": 0.0003, + "step": 41148 + }, + { + "epoch": 0.8, + "learning_rate": 4.0398431128888197e-08, + "loss": 0.0003, + "step": 41149 + }, + { + "epoch": 0.8, + "learning_rate": 4.0394547784552055e-08, + "loss": 0.0004, + "step": 41150 + }, + { + "epoch": 0.8, + "learning_rate": 4.039066444021591e-08, + "loss": 0.0004, + "step": 41151 + }, + { + "epoch": 0.8, + "learning_rate": 4.038678109587977e-08, + "loss": 0.0003, + "step": 41152 + }, + { + "epoch": 0.8, + "learning_rate": 4.038289775154363e-08, + "loss": 0.0003, + "step": 41153 + }, + { + "epoch": 0.8, + "learning_rate": 4.037901440720749e-08, + "loss": 0.0003, + "step": 41154 + }, + { + "epoch": 0.8, + "learning_rate": 4.037513106287134e-08, + "loss": 0.0003, + "step": 41155 + }, + { + "epoch": 0.8, + "learning_rate": 4.03712477185352e-08, + "loss": 0.0007, + "step": 41156 + }, + { + "epoch": 0.8, + "learning_rate": 4.0367364374199056e-08, + "loss": 0.0005, + "step": 41157 + }, + { + "epoch": 0.8, + "learning_rate": 4.0363481029862914e-08, + "loss": 0.0004, + "step": 41158 + }, + { + "epoch": 0.8, + "learning_rate": 4.035959768552677e-08, + "loss": 0.0004, + "step": 41159 + }, + { + "epoch": 0.8, + "learning_rate": 4.035571434119063e-08, + "loss": 0.0004, + "step": 41160 + }, + { + "epoch": 0.8, + "learning_rate": 4.035183099685449e-08, + "loss": 0.0004, + "step": 41161 + }, + { + "epoch": 0.8, + "learning_rate": 4.034794765251835e-08, + "loss": 1.0955, + "step": 41162 + }, + { + "epoch": 0.8, + "learning_rate": 4.0344064308182205e-08, + "loss": 0.0004, + "step": 41163 + }, + { + "epoch": 0.8, + "learning_rate": 4.034018096384606e-08, + "loss": 0.0006, + "step": 41164 + }, + { + "epoch": 0.8, + "learning_rate": 4.0336297619509915e-08, + "loss": 0.0003, + "step": 41165 + }, + { + "epoch": 0.8, + "learning_rate": 4.0332414275173774e-08, + "loss": 0.0005, + "step": 41166 + }, + { + "epoch": 0.8, + "learning_rate": 4.032853093083763e-08, + "loss": 0.0006, + "step": 41167 + }, + { + "epoch": 0.8, + "learning_rate": 4.032464758650149e-08, + "loss": 0.0007, + "step": 41168 + }, + { + "epoch": 0.8, + "learning_rate": 4.032076424216535e-08, + "loss": 0.0004, + "step": 41169 + }, + { + "epoch": 0.8, + "learning_rate": 4.0316880897829206e-08, + "loss": 0.0004, + "step": 41170 + }, + { + "epoch": 0.8, + "learning_rate": 4.0312997553493065e-08, + "loss": 0.0036, + "step": 41171 + }, + { + "epoch": 0.8, + "learning_rate": 4.030911420915692e-08, + "loss": 0.0005, + "step": 41172 + }, + { + "epoch": 0.8, + "learning_rate": 4.030523086482078e-08, + "loss": 0.0004, + "step": 41173 + }, + { + "epoch": 0.8, + "learning_rate": 4.030134752048464e-08, + "loss": 0.0008, + "step": 41174 + }, + { + "epoch": 0.8, + "learning_rate": 4.02974641761485e-08, + "loss": 0.0004, + "step": 41175 + }, + { + "epoch": 0.8, + "learning_rate": 4.0293580831812356e-08, + "loss": 0.0005, + "step": 41176 + }, + { + "epoch": 0.8, + "learning_rate": 4.0289697487476214e-08, + "loss": 0.666, + "step": 41177 + }, + { + "epoch": 0.8, + "learning_rate": 4.0285814143140066e-08, + "loss": 0.0005, + "step": 41178 + }, + { + "epoch": 0.8, + "learning_rate": 4.0281930798803924e-08, + "loss": 0.0012, + "step": 41179 + }, + { + "epoch": 0.8, + "learning_rate": 4.027804745446778e-08, + "loss": 0.0005, + "step": 41180 + }, + { + "epoch": 0.8, + "learning_rate": 4.027416411013164e-08, + "loss": 0.0004, + "step": 41181 + }, + { + "epoch": 0.8, + "learning_rate": 4.02702807657955e-08, + "loss": 0.0006, + "step": 41182 + }, + { + "epoch": 0.8, + "learning_rate": 4.026639742145936e-08, + "loss": 0.001, + "step": 41183 + }, + { + "epoch": 0.8, + "learning_rate": 4.0262514077123215e-08, + "loss": 0.0007, + "step": 41184 + }, + { + "epoch": 0.8, + "learning_rate": 4.0258630732787074e-08, + "loss": 0.0011, + "step": 41185 + }, + { + "epoch": 0.8, + "learning_rate": 4.025474738845093e-08, + "loss": 0.0004, + "step": 41186 + }, + { + "epoch": 0.8, + "learning_rate": 4.025086404411479e-08, + "loss": 0.1037, + "step": 41187 + }, + { + "epoch": 0.8, + "learning_rate": 4.024698069977865e-08, + "loss": 0.0004, + "step": 41188 + }, + { + "epoch": 0.8, + "learning_rate": 4.0243097355442507e-08, + "loss": 0.0005, + "step": 41189 + }, + { + "epoch": 0.8, + "learning_rate": 4.0239214011106365e-08, + "loss": 0.0003, + "step": 41190 + }, + { + "epoch": 0.8, + "learning_rate": 4.023533066677022e-08, + "loss": 0.0005, + "step": 41191 + }, + { + "epoch": 0.8, + "learning_rate": 4.023144732243408e-08, + "loss": 0.7088, + "step": 41192 + }, + { + "epoch": 0.8, + "learning_rate": 4.022756397809793e-08, + "loss": 0.0015, + "step": 41193 + }, + { + "epoch": 0.8, + "learning_rate": 4.022368063376179e-08, + "loss": 0.0003, + "step": 41194 + }, + { + "epoch": 0.8, + "learning_rate": 4.021979728942565e-08, + "loss": 0.0003, + "step": 41195 + }, + { + "epoch": 0.8, + "learning_rate": 4.021591394508951e-08, + "loss": 0.0072, + "step": 41196 + }, + { + "epoch": 0.8, + "learning_rate": 4.0212030600753366e-08, + "loss": 0.0003, + "step": 41197 + }, + { + "epoch": 0.8, + "learning_rate": 4.0208147256417224e-08, + "loss": 0.0005, + "step": 41198 + }, + { + "epoch": 0.8, + "learning_rate": 4.020426391208108e-08, + "loss": 0.0097, + "step": 41199 + }, + { + "epoch": 0.8, + "learning_rate": 4.020038056774494e-08, + "loss": 0.0185, + "step": 41200 + }, + { + "epoch": 0.8, + "learning_rate": 4.01964972234088e-08, + "loss": 0.0004, + "step": 41201 + }, + { + "epoch": 0.8, + "learning_rate": 4.019261387907266e-08, + "loss": 0.0004, + "step": 41202 + }, + { + "epoch": 0.8, + "learning_rate": 4.0188730534736515e-08, + "loss": 0.0006, + "step": 41203 + }, + { + "epoch": 0.8, + "learning_rate": 4.0184847190400374e-08, + "loss": 0.0002, + "step": 41204 + }, + { + "epoch": 0.8, + "learning_rate": 4.018096384606423e-08, + "loss": 0.0005, + "step": 41205 + }, + { + "epoch": 0.8, + "learning_rate": 4.017708050172809e-08, + "loss": 0.0008, + "step": 41206 + }, + { + "epoch": 0.8, + "learning_rate": 4.017319715739194e-08, + "loss": 0.0004, + "step": 41207 + }, + { + "epoch": 0.8, + "learning_rate": 4.01693138130558e-08, + "loss": 0.0026, + "step": 41208 + }, + { + "epoch": 0.8, + "learning_rate": 4.016543046871966e-08, + "loss": 0.0004, + "step": 41209 + }, + { + "epoch": 0.8, + "learning_rate": 4.0161547124383516e-08, + "loss": 0.0004, + "step": 41210 + }, + { + "epoch": 0.8, + "learning_rate": 4.0157663780047375e-08, + "loss": 0.0006, + "step": 41211 + }, + { + "epoch": 0.8, + "learning_rate": 4.015378043571123e-08, + "loss": 0.0013, + "step": 41212 + }, + { + "epoch": 0.8, + "learning_rate": 4.014989709137509e-08, + "loss": 0.0004, + "step": 41213 + }, + { + "epoch": 0.8, + "learning_rate": 4.014601374703895e-08, + "loss": 0.0004, + "step": 41214 + }, + { + "epoch": 0.8, + "learning_rate": 4.014213040270281e-08, + "loss": 0.0004, + "step": 41215 + }, + { + "epoch": 0.8, + "learning_rate": 4.0138247058366666e-08, + "loss": 0.0004, + "step": 41216 + }, + { + "epoch": 0.8, + "learning_rate": 4.0134363714030524e-08, + "loss": 0.0055, + "step": 41217 + }, + { + "epoch": 0.8, + "learning_rate": 4.013048036969438e-08, + "loss": 0.0003, + "step": 41218 + }, + { + "epoch": 0.8, + "learning_rate": 4.012659702535824e-08, + "loss": 0.0004, + "step": 41219 + }, + { + "epoch": 0.8, + "learning_rate": 4.01227136810221e-08, + "loss": 0.0209, + "step": 41220 + }, + { + "epoch": 0.8, + "learning_rate": 4.011883033668596e-08, + "loss": 0.0004, + "step": 41221 + }, + { + "epoch": 0.8, + "learning_rate": 4.011494699234981e-08, + "loss": 0.0004, + "step": 41222 + }, + { + "epoch": 0.8, + "learning_rate": 4.011106364801367e-08, + "loss": 0.0006, + "step": 41223 + }, + { + "epoch": 0.8, + "learning_rate": 4.0107180303677525e-08, + "loss": 0.0011, + "step": 41224 + }, + { + "epoch": 0.8, + "learning_rate": 4.0103296959341383e-08, + "loss": 0.0006, + "step": 41225 + }, + { + "epoch": 0.8, + "learning_rate": 4.009941361500524e-08, + "loss": 0.0004, + "step": 41226 + }, + { + "epoch": 0.8, + "learning_rate": 4.00955302706691e-08, + "loss": 0.0003, + "step": 41227 + }, + { + "epoch": 0.8, + "learning_rate": 4.009164692633296e-08, + "loss": 0.0004, + "step": 41228 + }, + { + "epoch": 0.8, + "learning_rate": 4.0087763581996816e-08, + "loss": 0.0003, + "step": 41229 + }, + { + "epoch": 0.8, + "learning_rate": 4.0083880237660675e-08, + "loss": 0.0005, + "step": 41230 + }, + { + "epoch": 0.8, + "learning_rate": 4.007999689332453e-08, + "loss": 0.0005, + "step": 41231 + }, + { + "epoch": 0.8, + "learning_rate": 4.007611354898839e-08, + "loss": 0.0003, + "step": 41232 + }, + { + "epoch": 0.8, + "learning_rate": 4.007223020465225e-08, + "loss": 0.0865, + "step": 41233 + }, + { + "epoch": 0.8, + "learning_rate": 4.006834686031611e-08, + "loss": 0.0005, + "step": 41234 + }, + { + "epoch": 0.8, + "learning_rate": 4.0064463515979966e-08, + "loss": 0.0004, + "step": 41235 + }, + { + "epoch": 0.8, + "learning_rate": 4.006058017164382e-08, + "loss": 0.0003, + "step": 41236 + }, + { + "epoch": 0.8, + "learning_rate": 4.0056696827307676e-08, + "loss": 0.0004, + "step": 41237 + }, + { + "epoch": 0.8, + "learning_rate": 4.0052813482971534e-08, + "loss": 0.0004, + "step": 41238 + }, + { + "epoch": 0.8, + "learning_rate": 4.004893013863539e-08, + "loss": 0.0006, + "step": 41239 + }, + { + "epoch": 0.8, + "learning_rate": 4.004504679429925e-08, + "loss": 0.0004, + "step": 41240 + }, + { + "epoch": 0.8, + "learning_rate": 4.004116344996311e-08, + "loss": 0.0005, + "step": 41241 + }, + { + "epoch": 0.8, + "learning_rate": 4.003728010562697e-08, + "loss": 0.0005, + "step": 41242 + }, + { + "epoch": 0.8, + "learning_rate": 4.003339676129082e-08, + "loss": 0.9065, + "step": 41243 + }, + { + "epoch": 0.8, + "learning_rate": 4.002951341695468e-08, + "loss": 0.0005, + "step": 41244 + }, + { + "epoch": 0.8, + "learning_rate": 4.0025630072618535e-08, + "loss": 0.0009, + "step": 41245 + }, + { + "epoch": 0.8, + "learning_rate": 4.0021746728282393e-08, + "loss": 0.0009, + "step": 41246 + }, + { + "epoch": 0.8, + "learning_rate": 4.001786338394625e-08, + "loss": 0.3704, + "step": 41247 + }, + { + "epoch": 0.8, + "learning_rate": 4.001398003961011e-08, + "loss": 0.0007, + "step": 41248 + }, + { + "epoch": 0.8, + "learning_rate": 4.001009669527397e-08, + "loss": 0.0004, + "step": 41249 + }, + { + "epoch": 0.8, + "learning_rate": 4.0006213350937826e-08, + "loss": 0.0004, + "step": 41250 + }, + { + "epoch": 0.8, + "learning_rate": 4.000233000660168e-08, + "loss": 0.0006, + "step": 41251 + }, + { + "epoch": 0.8, + "learning_rate": 3.9998446662265536e-08, + "loss": 0.0003, + "step": 41252 + }, + { + "epoch": 0.8, + "learning_rate": 3.9994563317929394e-08, + "loss": 0.0004, + "step": 41253 + }, + { + "epoch": 0.8, + "learning_rate": 3.999067997359325e-08, + "loss": 0.0005, + "step": 41254 + }, + { + "epoch": 0.8, + "learning_rate": 3.998679662925711e-08, + "loss": 0.0006, + "step": 41255 + }, + { + "epoch": 0.8, + "learning_rate": 3.998291328492097e-08, + "loss": 0.0004, + "step": 41256 + }, + { + "epoch": 0.8, + "learning_rate": 3.997902994058483e-08, + "loss": 0.0003, + "step": 41257 + }, + { + "epoch": 0.8, + "learning_rate": 3.9975146596248686e-08, + "loss": 0.653, + "step": 41258 + }, + { + "epoch": 0.8, + "learning_rate": 3.9971263251912544e-08, + "loss": 0.001, + "step": 41259 + }, + { + "epoch": 0.8, + "learning_rate": 3.99673799075764e-08, + "loss": 0.0005, + "step": 41260 + }, + { + "epoch": 0.8, + "learning_rate": 3.996349656324026e-08, + "loss": 0.0003, + "step": 41261 + }, + { + "epoch": 0.8, + "learning_rate": 3.995961321890412e-08, + "loss": 0.0073, + "step": 41262 + }, + { + "epoch": 0.8, + "learning_rate": 3.995572987456798e-08, + "loss": 0.0009, + "step": 41263 + }, + { + "epoch": 0.8, + "learning_rate": 3.9951846530231835e-08, + "loss": 0.0011, + "step": 41264 + }, + { + "epoch": 0.8, + "learning_rate": 3.994796318589569e-08, + "loss": 0.1939, + "step": 41265 + }, + { + "epoch": 0.8, + "learning_rate": 3.9944079841559545e-08, + "loss": 0.0005, + "step": 41266 + }, + { + "epoch": 0.8, + "learning_rate": 3.99401964972234e-08, + "loss": 0.0005, + "step": 41267 + }, + { + "epoch": 0.8, + "learning_rate": 3.993631315288726e-08, + "loss": 0.0004, + "step": 41268 + }, + { + "epoch": 0.8, + "learning_rate": 3.993242980855112e-08, + "loss": 0.0004, + "step": 41269 + }, + { + "epoch": 0.8, + "learning_rate": 3.992854646421498e-08, + "loss": 0.5917, + "step": 41270 + }, + { + "epoch": 0.8, + "learning_rate": 3.9924663119878836e-08, + "loss": 0.0005, + "step": 41271 + }, + { + "epoch": 0.8, + "learning_rate": 3.9920779775542694e-08, + "loss": 0.0004, + "step": 41272 + }, + { + "epoch": 0.8, + "learning_rate": 3.991689643120655e-08, + "loss": 0.0005, + "step": 41273 + }, + { + "epoch": 0.8, + "learning_rate": 3.991301308687041e-08, + "loss": 0.0003, + "step": 41274 + }, + { + "epoch": 0.8, + "learning_rate": 3.990912974253427e-08, + "loss": 0.0004, + "step": 41275 + }, + { + "epoch": 0.8, + "learning_rate": 3.990524639819813e-08, + "loss": 0.0008, + "step": 41276 + }, + { + "epoch": 0.8, + "learning_rate": 3.9901363053861986e-08, + "loss": 0.0013, + "step": 41277 + }, + { + "epoch": 0.8, + "learning_rate": 3.9897479709525844e-08, + "loss": 0.0003, + "step": 41278 + }, + { + "epoch": 0.8, + "learning_rate": 3.98935963651897e-08, + "loss": 0.0004, + "step": 41279 + }, + { + "epoch": 0.8, + "learning_rate": 3.9889713020853554e-08, + "loss": 0.0005, + "step": 41280 + }, + { + "epoch": 0.8, + "learning_rate": 3.988582967651741e-08, + "loss": 0.0007, + "step": 41281 + }, + { + "epoch": 0.8, + "learning_rate": 3.988194633218127e-08, + "loss": 0.004, + "step": 41282 + }, + { + "epoch": 0.8, + "learning_rate": 3.987806298784513e-08, + "loss": 0.0004, + "step": 41283 + }, + { + "epoch": 0.8, + "learning_rate": 3.987417964350899e-08, + "loss": 0.0009, + "step": 41284 + }, + { + "epoch": 0.8, + "learning_rate": 3.9870296299172845e-08, + "loss": 0.0006, + "step": 41285 + }, + { + "epoch": 0.8, + "learning_rate": 3.98664129548367e-08, + "loss": 0.0005, + "step": 41286 + }, + { + "epoch": 0.8, + "learning_rate": 3.986252961050056e-08, + "loss": 0.0006, + "step": 41287 + }, + { + "epoch": 0.8, + "learning_rate": 3.985864626616442e-08, + "loss": 0.0003, + "step": 41288 + }, + { + "epoch": 0.8, + "learning_rate": 3.985476292182828e-08, + "loss": 0.0003, + "step": 41289 + }, + { + "epoch": 0.8, + "learning_rate": 3.9850879577492136e-08, + "loss": 0.0005, + "step": 41290 + }, + { + "epoch": 0.8, + "learning_rate": 3.9846996233155994e-08, + "loss": 0.0004, + "step": 41291 + }, + { + "epoch": 0.8, + "learning_rate": 3.984311288881985e-08, + "loss": 0.0006, + "step": 41292 + }, + { + "epoch": 0.8, + "learning_rate": 3.983922954448371e-08, + "loss": 0.0003, + "step": 41293 + }, + { + "epoch": 0.8, + "learning_rate": 3.983534620014756e-08, + "loss": 0.0004, + "step": 41294 + }, + { + "epoch": 0.8, + "learning_rate": 3.983146285581142e-08, + "loss": 0.0006, + "step": 41295 + }, + { + "epoch": 0.8, + "learning_rate": 3.982757951147528e-08, + "loss": 0.0003, + "step": 41296 + }, + { + "epoch": 0.8, + "learning_rate": 3.982369616713914e-08, + "loss": 0.0024, + "step": 41297 + }, + { + "epoch": 0.8, + "learning_rate": 3.9819812822802996e-08, + "loss": 0.0004, + "step": 41298 + }, + { + "epoch": 0.8, + "learning_rate": 3.9815929478466854e-08, + "loss": 0.0041, + "step": 41299 + }, + { + "epoch": 0.8, + "learning_rate": 3.981204613413071e-08, + "loss": 0.0005, + "step": 41300 + }, + { + "epoch": 0.8, + "learning_rate": 3.980816278979457e-08, + "loss": 0.0007, + "step": 41301 + }, + { + "epoch": 0.8, + "learning_rate": 3.980427944545843e-08, + "loss": 0.0004, + "step": 41302 + }, + { + "epoch": 0.8, + "learning_rate": 3.980039610112229e-08, + "loss": 0.0183, + "step": 41303 + }, + { + "epoch": 0.8, + "learning_rate": 3.9796512756786145e-08, + "loss": 0.0003, + "step": 41304 + }, + { + "epoch": 0.8, + "learning_rate": 3.979262941245e-08, + "loss": 0.0003, + "step": 41305 + }, + { + "epoch": 0.8, + "learning_rate": 3.978874606811386e-08, + "loss": 0.0481, + "step": 41306 + }, + { + "epoch": 0.8, + "learning_rate": 3.978486272377772e-08, + "loss": 0.0003, + "step": 41307 + }, + { + "epoch": 0.8, + "learning_rate": 3.978097937944158e-08, + "loss": 0.0005, + "step": 41308 + }, + { + "epoch": 0.8, + "learning_rate": 3.977709603510543e-08, + "loss": 0.0009, + "step": 41309 + }, + { + "epoch": 0.8, + "learning_rate": 3.977321269076929e-08, + "loss": 0.0005, + "step": 41310 + }, + { + "epoch": 0.8, + "learning_rate": 3.9769329346433146e-08, + "loss": 0.0004, + "step": 41311 + }, + { + "epoch": 0.8, + "learning_rate": 3.9765446002097004e-08, + "loss": 0.0004, + "step": 41312 + }, + { + "epoch": 0.8, + "learning_rate": 3.976156265776086e-08, + "loss": 0.0003, + "step": 41313 + }, + { + "epoch": 0.8, + "learning_rate": 3.975767931342472e-08, + "loss": 0.0008, + "step": 41314 + }, + { + "epoch": 0.8, + "learning_rate": 3.975379596908858e-08, + "loss": 0.0003, + "step": 41315 + }, + { + "epoch": 0.8, + "learning_rate": 3.974991262475244e-08, + "loss": 0.0004, + "step": 41316 + }, + { + "epoch": 0.8, + "learning_rate": 3.9746029280416296e-08, + "loss": 0.9034, + "step": 41317 + }, + { + "epoch": 0.8, + "learning_rate": 3.9742145936080154e-08, + "loss": 0.0003, + "step": 41318 + }, + { + "epoch": 0.8, + "learning_rate": 3.973826259174401e-08, + "loss": 0.7376, + "step": 41319 + }, + { + "epoch": 0.8, + "learning_rate": 3.973437924740787e-08, + "loss": 0.0005, + "step": 41320 + }, + { + "epoch": 0.8, + "learning_rate": 3.973049590307173e-08, + "loss": 0.0003, + "step": 41321 + }, + { + "epoch": 0.8, + "learning_rate": 3.972661255873559e-08, + "loss": 0.0004, + "step": 41322 + }, + { + "epoch": 0.8, + "learning_rate": 3.972272921439944e-08, + "loss": 0.0012, + "step": 41323 + }, + { + "epoch": 0.8, + "learning_rate": 3.97188458700633e-08, + "loss": 0.0005, + "step": 41324 + }, + { + "epoch": 0.8, + "learning_rate": 3.9714962525727155e-08, + "loss": 0.0004, + "step": 41325 + }, + { + "epoch": 0.8, + "learning_rate": 3.971107918139101e-08, + "loss": 0.0004, + "step": 41326 + }, + { + "epoch": 0.8, + "learning_rate": 3.970719583705487e-08, + "loss": 0.0004, + "step": 41327 + }, + { + "epoch": 0.8, + "learning_rate": 3.970331249271873e-08, + "loss": 0.0189, + "step": 41328 + }, + { + "epoch": 0.8, + "learning_rate": 3.969942914838259e-08, + "loss": 0.0004, + "step": 41329 + }, + { + "epoch": 0.8, + "learning_rate": 3.9695545804046446e-08, + "loss": 0.0003, + "step": 41330 + }, + { + "epoch": 0.8, + "learning_rate": 3.9691662459710304e-08, + "loss": 0.0005, + "step": 41331 + }, + { + "epoch": 0.8, + "learning_rate": 3.9687779115374156e-08, + "loss": 0.0006, + "step": 41332 + }, + { + "epoch": 0.8, + "learning_rate": 3.9683895771038014e-08, + "loss": 0.0003, + "step": 41333 + }, + { + "epoch": 0.8, + "learning_rate": 3.968001242670187e-08, + "loss": 0.0005, + "step": 41334 + }, + { + "epoch": 0.8, + "learning_rate": 3.967612908236573e-08, + "loss": 0.0013, + "step": 41335 + }, + { + "epoch": 0.8, + "learning_rate": 3.967224573802959e-08, + "loss": 1.0946, + "step": 41336 + }, + { + "epoch": 0.8, + "learning_rate": 3.966836239369345e-08, + "loss": 0.0005, + "step": 41337 + }, + { + "epoch": 0.8, + "learning_rate": 3.9664479049357306e-08, + "loss": 0.0005, + "step": 41338 + }, + { + "epoch": 0.8, + "learning_rate": 3.966059570502116e-08, + "loss": 0.0005, + "step": 41339 + }, + { + "epoch": 0.8, + "learning_rate": 3.9656712360685015e-08, + "loss": 0.0003, + "step": 41340 + }, + { + "epoch": 0.8, + "learning_rate": 3.9652829016348874e-08, + "loss": 0.0004, + "step": 41341 + }, + { + "epoch": 0.8, + "learning_rate": 3.964894567201273e-08, + "loss": 0.0005, + "step": 41342 + }, + { + "epoch": 0.8, + "learning_rate": 3.964506232767659e-08, + "loss": 0.0003, + "step": 41343 + }, + { + "epoch": 0.8, + "learning_rate": 3.964117898334045e-08, + "loss": 0.0311, + "step": 41344 + }, + { + "epoch": 0.8, + "learning_rate": 3.9637295639004307e-08, + "loss": 0.0008, + "step": 41345 + }, + { + "epoch": 0.8, + "learning_rate": 3.9633412294668165e-08, + "loss": 0.0005, + "step": 41346 + }, + { + "epoch": 0.8, + "learning_rate": 3.962952895033202e-08, + "loss": 0.0003, + "step": 41347 + }, + { + "epoch": 0.8, + "learning_rate": 3.962564560599588e-08, + "loss": 0.9199, + "step": 41348 + }, + { + "epoch": 0.8, + "learning_rate": 3.962176226165974e-08, + "loss": 0.0003, + "step": 41349 + }, + { + "epoch": 0.8, + "learning_rate": 3.96178789173236e-08, + "loss": 0.0004, + "step": 41350 + }, + { + "epoch": 0.8, + "learning_rate": 3.9613995572987456e-08, + "loss": 0.0005, + "step": 41351 + }, + { + "epoch": 0.8, + "learning_rate": 3.961011222865131e-08, + "loss": 0.0003, + "step": 41352 + }, + { + "epoch": 0.8, + "learning_rate": 3.9606228884315166e-08, + "loss": 0.0005, + "step": 41353 + }, + { + "epoch": 0.8, + "learning_rate": 3.9602345539979024e-08, + "loss": 0.0004, + "step": 41354 + }, + { + "epoch": 0.8, + "learning_rate": 3.959846219564288e-08, + "loss": 0.0004, + "step": 41355 + }, + { + "epoch": 0.8, + "learning_rate": 3.959457885130674e-08, + "loss": 0.0039, + "step": 41356 + }, + { + "epoch": 0.8, + "learning_rate": 3.95906955069706e-08, + "loss": 0.0003, + "step": 41357 + }, + { + "epoch": 0.8, + "learning_rate": 3.958681216263446e-08, + "loss": 0.0006, + "step": 41358 + }, + { + "epoch": 0.8, + "learning_rate": 3.9582928818298315e-08, + "loss": 0.0008, + "step": 41359 + }, + { + "epoch": 0.8, + "learning_rate": 3.9579045473962174e-08, + "loss": 0.0005, + "step": 41360 + }, + { + "epoch": 0.8, + "learning_rate": 3.957516212962603e-08, + "loss": 0.0005, + "step": 41361 + }, + { + "epoch": 0.8, + "learning_rate": 3.957127878528989e-08, + "loss": 0.0005, + "step": 41362 + }, + { + "epoch": 0.8, + "learning_rate": 3.956739544095375e-08, + "loss": 0.005, + "step": 41363 + }, + { + "epoch": 0.8, + "learning_rate": 3.9563512096617607e-08, + "loss": 0.0004, + "step": 41364 + }, + { + "epoch": 0.8, + "learning_rate": 3.9559628752281465e-08, + "loss": 0.0005, + "step": 41365 + }, + { + "epoch": 0.8, + "learning_rate": 3.955574540794532e-08, + "loss": 0.0003, + "step": 41366 + }, + { + "epoch": 0.8, + "learning_rate": 3.9551862063609175e-08, + "loss": 0.0003, + "step": 41367 + }, + { + "epoch": 0.8, + "learning_rate": 3.954797871927303e-08, + "loss": 0.0007, + "step": 41368 + }, + { + "epoch": 0.8, + "learning_rate": 3.954409537493689e-08, + "loss": 0.0017, + "step": 41369 + }, + { + "epoch": 0.8, + "learning_rate": 3.954021203060075e-08, + "loss": 0.0004, + "step": 41370 + }, + { + "epoch": 0.8, + "learning_rate": 3.953632868626461e-08, + "loss": 0.0182, + "step": 41371 + }, + { + "epoch": 0.8, + "learning_rate": 3.9532445341928466e-08, + "loss": 0.0005, + "step": 41372 + }, + { + "epoch": 0.8, + "learning_rate": 3.9528561997592324e-08, + "loss": 0.0005, + "step": 41373 + }, + { + "epoch": 0.8, + "learning_rate": 3.952467865325618e-08, + "loss": 0.0009, + "step": 41374 + }, + { + "epoch": 0.8, + "learning_rate": 3.952079530892004e-08, + "loss": 0.6075, + "step": 41375 + }, + { + "epoch": 0.8, + "learning_rate": 3.95169119645839e-08, + "loss": 1.1803, + "step": 41376 + }, + { + "epoch": 0.8, + "learning_rate": 3.951302862024776e-08, + "loss": 0.0004, + "step": 41377 + }, + { + "epoch": 0.8, + "learning_rate": 3.9509145275911615e-08, + "loss": 0.0005, + "step": 41378 + }, + { + "epoch": 0.8, + "learning_rate": 3.9505261931575474e-08, + "loss": 1.3902, + "step": 41379 + }, + { + "epoch": 0.8, + "learning_rate": 3.950137858723933e-08, + "loss": 0.0121, + "step": 41380 + }, + { + "epoch": 0.8, + "learning_rate": 3.9497495242903184e-08, + "loss": 0.0004, + "step": 41381 + }, + { + "epoch": 0.8, + "learning_rate": 3.949361189856704e-08, + "loss": 0.0005, + "step": 41382 + }, + { + "epoch": 0.8, + "learning_rate": 3.94897285542309e-08, + "loss": 0.0003, + "step": 41383 + }, + { + "epoch": 0.8, + "learning_rate": 3.948584520989476e-08, + "loss": 0.0074, + "step": 41384 + }, + { + "epoch": 0.8, + "learning_rate": 3.9481961865558617e-08, + "loss": 0.0007, + "step": 41385 + }, + { + "epoch": 0.8, + "learning_rate": 3.9478078521222475e-08, + "loss": 0.0004, + "step": 41386 + }, + { + "epoch": 0.8, + "learning_rate": 3.947419517688633e-08, + "loss": 0.0217, + "step": 41387 + }, + { + "epoch": 0.8, + "learning_rate": 3.947031183255019e-08, + "loss": 0.0004, + "step": 41388 + }, + { + "epoch": 0.8, + "learning_rate": 3.946642848821405e-08, + "loss": 0.0004, + "step": 41389 + }, + { + "epoch": 0.8, + "learning_rate": 3.946254514387791e-08, + "loss": 0.0691, + "step": 41390 + }, + { + "epoch": 0.8, + "learning_rate": 3.9458661799541766e-08, + "loss": 0.0005, + "step": 41391 + }, + { + "epoch": 0.8, + "learning_rate": 3.9454778455205624e-08, + "loss": 0.0003, + "step": 41392 + }, + { + "epoch": 0.8, + "learning_rate": 3.945089511086948e-08, + "loss": 0.0004, + "step": 41393 + }, + { + "epoch": 0.8, + "learning_rate": 3.944701176653334e-08, + "loss": 0.0002, + "step": 41394 + }, + { + "epoch": 0.8, + "learning_rate": 3.94431284221972e-08, + "loss": 0.0003, + "step": 41395 + }, + { + "epoch": 0.8, + "learning_rate": 3.943924507786105e-08, + "loss": 0.0004, + "step": 41396 + }, + { + "epoch": 0.8, + "learning_rate": 3.943536173352491e-08, + "loss": 0.0019, + "step": 41397 + }, + { + "epoch": 0.8, + "learning_rate": 3.943147838918877e-08, + "loss": 0.0004, + "step": 41398 + }, + { + "epoch": 0.8, + "learning_rate": 3.9427595044852625e-08, + "loss": 0.0004, + "step": 41399 + }, + { + "epoch": 0.8, + "learning_rate": 3.9423711700516484e-08, + "loss": 0.0004, + "step": 41400 + }, + { + "epoch": 0.8, + "learning_rate": 3.941982835618034e-08, + "loss": 0.0004, + "step": 41401 + }, + { + "epoch": 0.8, + "learning_rate": 3.94159450118442e-08, + "loss": 0.0143, + "step": 41402 + }, + { + "epoch": 0.8, + "learning_rate": 3.941206166750806e-08, + "loss": 0.0004, + "step": 41403 + }, + { + "epoch": 0.8, + "learning_rate": 3.9408178323171917e-08, + "loss": 0.009, + "step": 41404 + }, + { + "epoch": 0.8, + "learning_rate": 3.9404294978835775e-08, + "loss": 0.0005, + "step": 41405 + }, + { + "epoch": 0.8, + "learning_rate": 3.940041163449963e-08, + "loss": 0.0006, + "step": 41406 + }, + { + "epoch": 0.8, + "learning_rate": 3.939652829016349e-08, + "loss": 0.0004, + "step": 41407 + }, + { + "epoch": 0.8, + "learning_rate": 3.939264494582735e-08, + "loss": 0.0004, + "step": 41408 + }, + { + "epoch": 0.8, + "learning_rate": 3.938876160149121e-08, + "loss": 0.0005, + "step": 41409 + }, + { + "epoch": 0.8, + "learning_rate": 3.938487825715506e-08, + "loss": 0.0045, + "step": 41410 + }, + { + "epoch": 0.8, + "learning_rate": 3.938099491281892e-08, + "loss": 0.0004, + "step": 41411 + }, + { + "epoch": 0.8, + "learning_rate": 3.9377111568482776e-08, + "loss": 0.0003, + "step": 41412 + }, + { + "epoch": 0.8, + "learning_rate": 3.9373228224146634e-08, + "loss": 0.0004, + "step": 41413 + }, + { + "epoch": 0.8, + "learning_rate": 3.936934487981049e-08, + "loss": 0.071, + "step": 41414 + }, + { + "epoch": 0.8, + "learning_rate": 3.936546153547435e-08, + "loss": 0.0011, + "step": 41415 + }, + { + "epoch": 0.8, + "learning_rate": 3.936157819113821e-08, + "loss": 0.0006, + "step": 41416 + }, + { + "epoch": 0.8, + "learning_rate": 3.935769484680207e-08, + "loss": 0.0004, + "step": 41417 + }, + { + "epoch": 0.8, + "learning_rate": 3.9353811502465925e-08, + "loss": 0.0005, + "step": 41418 + }, + { + "epoch": 0.8, + "learning_rate": 3.9349928158129784e-08, + "loss": 0.0003, + "step": 41419 + }, + { + "epoch": 0.8, + "learning_rate": 3.9346044813793635e-08, + "loss": 0.0003, + "step": 41420 + }, + { + "epoch": 0.8, + "learning_rate": 3.9342161469457493e-08, + "loss": 0.0003, + "step": 41421 + }, + { + "epoch": 0.8, + "learning_rate": 3.933827812512135e-08, + "loss": 0.0027, + "step": 41422 + }, + { + "epoch": 0.8, + "learning_rate": 3.933439478078521e-08, + "loss": 0.0008, + "step": 41423 + }, + { + "epoch": 0.8, + "learning_rate": 3.933051143644907e-08, + "loss": 0.0003, + "step": 41424 + }, + { + "epoch": 0.8, + "learning_rate": 3.9326628092112926e-08, + "loss": 0.0003, + "step": 41425 + }, + { + "epoch": 0.8, + "learning_rate": 3.9322744747776785e-08, + "loss": 0.0006, + "step": 41426 + }, + { + "epoch": 0.8, + "learning_rate": 3.931886140344064e-08, + "loss": 0.0004, + "step": 41427 + }, + { + "epoch": 0.8, + "learning_rate": 3.9314978059104495e-08, + "loss": 0.0003, + "step": 41428 + }, + { + "epoch": 0.8, + "learning_rate": 3.931109471476835e-08, + "loss": 0.0004, + "step": 41429 + }, + { + "epoch": 0.8, + "learning_rate": 3.930721137043221e-08, + "loss": 0.0005, + "step": 41430 + }, + { + "epoch": 0.8, + "learning_rate": 3.930332802609607e-08, + "loss": 0.0004, + "step": 41431 + }, + { + "epoch": 0.8, + "learning_rate": 3.929944468175993e-08, + "loss": 0.3107, + "step": 41432 + }, + { + "epoch": 0.8, + "learning_rate": 3.9295561337423786e-08, + "loss": 0.0004, + "step": 41433 + }, + { + "epoch": 0.8, + "learning_rate": 3.9291677993087644e-08, + "loss": 0.0004, + "step": 41434 + }, + { + "epoch": 0.8, + "learning_rate": 3.92877946487515e-08, + "loss": 0.0005, + "step": 41435 + }, + { + "epoch": 0.8, + "learning_rate": 3.928391130441536e-08, + "loss": 0.0004, + "step": 41436 + }, + { + "epoch": 0.8, + "learning_rate": 3.928002796007922e-08, + "loss": 0.0305, + "step": 41437 + }, + { + "epoch": 0.8, + "learning_rate": 3.927614461574308e-08, + "loss": 0.0004, + "step": 41438 + }, + { + "epoch": 0.8, + "learning_rate": 3.927226127140693e-08, + "loss": 0.0004, + "step": 41439 + }, + { + "epoch": 0.8, + "learning_rate": 3.926837792707079e-08, + "loss": 0.0003, + "step": 41440 + }, + { + "epoch": 0.8, + "learning_rate": 3.9264494582734645e-08, + "loss": 0.0004, + "step": 41441 + }, + { + "epoch": 0.8, + "learning_rate": 3.9260611238398503e-08, + "loss": 0.0035, + "step": 41442 + }, + { + "epoch": 0.8, + "learning_rate": 3.925672789406236e-08, + "loss": 0.0003, + "step": 41443 + }, + { + "epoch": 0.8, + "learning_rate": 3.925284454972622e-08, + "loss": 0.0004, + "step": 41444 + }, + { + "epoch": 0.8, + "learning_rate": 3.924896120539008e-08, + "loss": 0.0004, + "step": 41445 + }, + { + "epoch": 0.8, + "learning_rate": 3.9245077861053936e-08, + "loss": 0.0004, + "step": 41446 + }, + { + "epoch": 0.8, + "learning_rate": 3.9241194516717795e-08, + "loss": 0.0005, + "step": 41447 + }, + { + "epoch": 0.8, + "learning_rate": 3.923731117238165e-08, + "loss": 0.0004, + "step": 41448 + }, + { + "epoch": 0.8, + "learning_rate": 3.923342782804551e-08, + "loss": 0.0168, + "step": 41449 + }, + { + "epoch": 0.8, + "learning_rate": 3.922954448370937e-08, + "loss": 0.0005, + "step": 41450 + }, + { + "epoch": 0.8, + "learning_rate": 3.922566113937323e-08, + "loss": 0.0005, + "step": 41451 + }, + { + "epoch": 0.8, + "learning_rate": 3.9221777795037086e-08, + "loss": 0.0003, + "step": 41452 + }, + { + "epoch": 0.8, + "learning_rate": 3.9217894450700944e-08, + "loss": 0.0005, + "step": 41453 + }, + { + "epoch": 0.8, + "learning_rate": 3.9214011106364796e-08, + "loss": 0.9685, + "step": 41454 + }, + { + "epoch": 0.8, + "learning_rate": 3.9210127762028654e-08, + "loss": 0.0006, + "step": 41455 + }, + { + "epoch": 0.8, + "learning_rate": 3.920624441769251e-08, + "loss": 0.0007, + "step": 41456 + }, + { + "epoch": 0.8, + "learning_rate": 3.920236107335637e-08, + "loss": 0.0003, + "step": 41457 + }, + { + "epoch": 0.8, + "learning_rate": 3.919847772902023e-08, + "loss": 0.0003, + "step": 41458 + }, + { + "epoch": 0.8, + "learning_rate": 3.919459438468409e-08, + "loss": 0.0005, + "step": 41459 + }, + { + "epoch": 0.8, + "learning_rate": 3.9190711040347945e-08, + "loss": 0.0126, + "step": 41460 + }, + { + "epoch": 0.8, + "learning_rate": 3.9186827696011803e-08, + "loss": 0.017, + "step": 41461 + }, + { + "epoch": 0.8, + "learning_rate": 3.918294435167566e-08, + "loss": 0.0072, + "step": 41462 + }, + { + "epoch": 0.8, + "learning_rate": 3.917906100733952e-08, + "loss": 0.001, + "step": 41463 + }, + { + "epoch": 0.8, + "learning_rate": 3.917517766300338e-08, + "loss": 0.0007, + "step": 41464 + }, + { + "epoch": 0.8, + "learning_rate": 3.9171294318667236e-08, + "loss": 0.0005, + "step": 41465 + }, + { + "epoch": 0.8, + "learning_rate": 3.9167410974331095e-08, + "loss": 0.9578, + "step": 41466 + }, + { + "epoch": 0.8, + "learning_rate": 3.916352762999495e-08, + "loss": 0.0025, + "step": 41467 + }, + { + "epoch": 0.8, + "learning_rate": 3.9159644285658804e-08, + "loss": 0.0005, + "step": 41468 + }, + { + "epoch": 0.8, + "learning_rate": 3.915576094132266e-08, + "loss": 0.2841, + "step": 41469 + }, + { + "epoch": 0.8, + "learning_rate": 3.915187759698652e-08, + "loss": 0.0003, + "step": 41470 + }, + { + "epoch": 0.8, + "learning_rate": 3.914799425265038e-08, + "loss": 0.0071, + "step": 41471 + }, + { + "epoch": 0.8, + "learning_rate": 3.914411090831424e-08, + "loss": 0.0004, + "step": 41472 + }, + { + "epoch": 0.8, + "learning_rate": 3.9140227563978096e-08, + "loss": 0.4986, + "step": 41473 + }, + { + "epoch": 0.8, + "learning_rate": 3.9136344219641954e-08, + "loss": 0.0003, + "step": 41474 + }, + { + "epoch": 0.8, + "learning_rate": 3.913246087530581e-08, + "loss": 0.0006, + "step": 41475 + }, + { + "epoch": 0.8, + "learning_rate": 3.912857753096967e-08, + "loss": 0.001, + "step": 41476 + }, + { + "epoch": 0.8, + "learning_rate": 3.912469418663353e-08, + "loss": 0.0003, + "step": 41477 + }, + { + "epoch": 0.8, + "learning_rate": 3.912081084229739e-08, + "loss": 0.0004, + "step": 41478 + }, + { + "epoch": 0.8, + "learning_rate": 3.9116927497961245e-08, + "loss": 0.0005, + "step": 41479 + }, + { + "epoch": 0.8, + "learning_rate": 3.9113044153625103e-08, + "loss": 0.0005, + "step": 41480 + }, + { + "epoch": 0.8, + "learning_rate": 3.910916080928896e-08, + "loss": 0.8469, + "step": 41481 + }, + { + "epoch": 0.8, + "learning_rate": 3.910527746495282e-08, + "loss": 0.0005, + "step": 41482 + }, + { + "epoch": 0.8, + "learning_rate": 3.910139412061667e-08, + "loss": 0.0004, + "step": 41483 + }, + { + "epoch": 0.8, + "learning_rate": 3.909751077628053e-08, + "loss": 0.0007, + "step": 41484 + }, + { + "epoch": 0.8, + "learning_rate": 3.909362743194439e-08, + "loss": 0.0019, + "step": 41485 + }, + { + "epoch": 0.8, + "learning_rate": 3.9089744087608246e-08, + "loss": 0.0004, + "step": 41486 + }, + { + "epoch": 0.8, + "learning_rate": 3.9085860743272104e-08, + "loss": 0.3618, + "step": 41487 + }, + { + "epoch": 0.8, + "learning_rate": 3.908197739893596e-08, + "loss": 0.0004, + "step": 41488 + }, + { + "epoch": 0.8, + "learning_rate": 3.907809405459982e-08, + "loss": 0.0005, + "step": 41489 + }, + { + "epoch": 0.8, + "learning_rate": 3.907421071026368e-08, + "loss": 0.0003, + "step": 41490 + }, + { + "epoch": 0.8, + "learning_rate": 3.907032736592754e-08, + "loss": 0.0002, + "step": 41491 + }, + { + "epoch": 0.8, + "learning_rate": 3.9066444021591396e-08, + "loss": 0.0005, + "step": 41492 + }, + { + "epoch": 0.8, + "learning_rate": 3.9062560677255254e-08, + "loss": 0.0005, + "step": 41493 + }, + { + "epoch": 0.8, + "learning_rate": 3.905867733291911e-08, + "loss": 0.003, + "step": 41494 + }, + { + "epoch": 0.8, + "learning_rate": 3.905479398858297e-08, + "loss": 0.0004, + "step": 41495 + }, + { + "epoch": 0.8, + "learning_rate": 3.905091064424683e-08, + "loss": 0.0006, + "step": 41496 + }, + { + "epoch": 0.8, + "learning_rate": 3.904702729991068e-08, + "loss": 0.0003, + "step": 41497 + }, + { + "epoch": 0.8, + "learning_rate": 3.904314395557454e-08, + "loss": 0.0004, + "step": 41498 + }, + { + "epoch": 0.8, + "learning_rate": 3.90392606112384e-08, + "loss": 0.0003, + "step": 41499 + }, + { + "epoch": 0.81, + "learning_rate": 3.9035377266902255e-08, + "loss": 0.0003, + "step": 41500 + }, + { + "epoch": 0.81, + "learning_rate": 3.903149392256611e-08, + "loss": 0.0006, + "step": 41501 + }, + { + "epoch": 0.81, + "learning_rate": 3.902761057822997e-08, + "loss": 0.0278, + "step": 41502 + }, + { + "epoch": 0.81, + "learning_rate": 3.902372723389383e-08, + "loss": 0.0025, + "step": 41503 + }, + { + "epoch": 0.81, + "learning_rate": 3.901984388955769e-08, + "loss": 0.0004, + "step": 41504 + }, + { + "epoch": 0.81, + "learning_rate": 3.9015960545221546e-08, + "loss": 0.0006, + "step": 41505 + }, + { + "epoch": 0.81, + "learning_rate": 3.9012077200885405e-08, + "loss": 0.0005, + "step": 41506 + }, + { + "epoch": 0.81, + "learning_rate": 3.900819385654926e-08, + "loss": 0.0004, + "step": 41507 + }, + { + "epoch": 0.81, + "learning_rate": 3.900431051221312e-08, + "loss": 0.1696, + "step": 41508 + }, + { + "epoch": 0.81, + "learning_rate": 3.900042716787697e-08, + "loss": 0.0006, + "step": 41509 + }, + { + "epoch": 0.81, + "learning_rate": 3.899654382354083e-08, + "loss": 0.0008, + "step": 41510 + }, + { + "epoch": 0.81, + "learning_rate": 3.899266047920469e-08, + "loss": 0.0014, + "step": 41511 + }, + { + "epoch": 0.81, + "learning_rate": 3.898877713486855e-08, + "loss": 0.0006, + "step": 41512 + }, + { + "epoch": 0.81, + "learning_rate": 3.8984893790532406e-08, + "loss": 0.0005, + "step": 41513 + }, + { + "epoch": 0.81, + "learning_rate": 3.8981010446196264e-08, + "loss": 0.0005, + "step": 41514 + }, + { + "epoch": 0.81, + "learning_rate": 3.897712710186012e-08, + "loss": 0.0004, + "step": 41515 + }, + { + "epoch": 0.81, + "learning_rate": 3.8973243757523974e-08, + "loss": 0.0003, + "step": 41516 + }, + { + "epoch": 0.81, + "learning_rate": 3.896936041318783e-08, + "loss": 0.0007, + "step": 41517 + }, + { + "epoch": 0.81, + "learning_rate": 3.896547706885169e-08, + "loss": 0.0002, + "step": 41518 + }, + { + "epoch": 0.81, + "learning_rate": 3.896159372451555e-08, + "loss": 0.0005, + "step": 41519 + }, + { + "epoch": 0.81, + "learning_rate": 3.895771038017941e-08, + "loss": 0.0003, + "step": 41520 + }, + { + "epoch": 0.81, + "learning_rate": 3.8953827035843265e-08, + "loss": 0.0003, + "step": 41521 + }, + { + "epoch": 0.81, + "learning_rate": 3.894994369150712e-08, + "loss": 0.327, + "step": 41522 + }, + { + "epoch": 0.81, + "learning_rate": 3.894606034717098e-08, + "loss": 0.0004, + "step": 41523 + }, + { + "epoch": 0.81, + "learning_rate": 3.894217700283484e-08, + "loss": 0.0004, + "step": 41524 + }, + { + "epoch": 0.81, + "learning_rate": 3.89382936584987e-08, + "loss": 0.0005, + "step": 41525 + }, + { + "epoch": 0.81, + "learning_rate": 3.893441031416255e-08, + "loss": 0.0005, + "step": 41526 + }, + { + "epoch": 0.81, + "learning_rate": 3.893052696982641e-08, + "loss": 0.0006, + "step": 41527 + }, + { + "epoch": 0.81, + "learning_rate": 3.8926643625490266e-08, + "loss": 0.0005, + "step": 41528 + }, + { + "epoch": 0.81, + "learning_rate": 3.8922760281154124e-08, + "loss": 0.0004, + "step": 41529 + }, + { + "epoch": 0.81, + "learning_rate": 3.891887693681798e-08, + "loss": 0.0004, + "step": 41530 + }, + { + "epoch": 0.81, + "learning_rate": 3.891499359248184e-08, + "loss": 0.0002, + "step": 41531 + }, + { + "epoch": 0.81, + "learning_rate": 3.89111102481457e-08, + "loss": 0.0004, + "step": 41532 + }, + { + "epoch": 0.81, + "learning_rate": 3.890722690380956e-08, + "loss": 0.0003, + "step": 41533 + }, + { + "epoch": 0.81, + "learning_rate": 3.8903343559473416e-08, + "loss": 0.0003, + "step": 41534 + }, + { + "epoch": 0.81, + "learning_rate": 3.8899460215137274e-08, + "loss": 0.0074, + "step": 41535 + }, + { + "epoch": 0.81, + "learning_rate": 3.889557687080113e-08, + "loss": 0.9206, + "step": 41536 + }, + { + "epoch": 0.81, + "learning_rate": 3.889169352646499e-08, + "loss": 0.0003, + "step": 41537 + }, + { + "epoch": 0.81, + "learning_rate": 3.888781018212885e-08, + "loss": 0.0031, + "step": 41538 + }, + { + "epoch": 0.81, + "learning_rate": 3.888392683779271e-08, + "loss": 0.0004, + "step": 41539 + }, + { + "epoch": 0.81, + "learning_rate": 3.8880043493456565e-08, + "loss": 0.0005, + "step": 41540 + }, + { + "epoch": 0.81, + "learning_rate": 3.8876160149120417e-08, + "loss": 0.0005, + "step": 41541 + }, + { + "epoch": 0.81, + "learning_rate": 3.8872276804784275e-08, + "loss": 0.0006, + "step": 41542 + }, + { + "epoch": 0.81, + "learning_rate": 3.886839346044813e-08, + "loss": 0.0004, + "step": 41543 + }, + { + "epoch": 0.81, + "learning_rate": 3.886451011611199e-08, + "loss": 0.0002, + "step": 41544 + }, + { + "epoch": 0.81, + "learning_rate": 3.886062677177585e-08, + "loss": 0.1624, + "step": 41545 + }, + { + "epoch": 0.81, + "learning_rate": 3.885674342743971e-08, + "loss": 1.0976, + "step": 41546 + }, + { + "epoch": 0.81, + "learning_rate": 3.8852860083103566e-08, + "loss": 0.0011, + "step": 41547 + }, + { + "epoch": 0.81, + "learning_rate": 3.8848976738767424e-08, + "loss": 0.0008, + "step": 41548 + }, + { + "epoch": 0.81, + "learning_rate": 3.884509339443128e-08, + "loss": 0.0004, + "step": 41549 + }, + { + "epoch": 0.81, + "learning_rate": 3.884121005009514e-08, + "loss": 0.0002, + "step": 41550 + }, + { + "epoch": 0.81, + "learning_rate": 3.8837326705759e-08, + "loss": 0.0007, + "step": 41551 + }, + { + "epoch": 0.81, + "learning_rate": 3.883344336142286e-08, + "loss": 0.0005, + "step": 41552 + }, + { + "epoch": 0.81, + "learning_rate": 3.8829560017086716e-08, + "loss": 0.0017, + "step": 41553 + }, + { + "epoch": 0.81, + "learning_rate": 3.8825676672750574e-08, + "loss": 0.0003, + "step": 41554 + }, + { + "epoch": 0.81, + "learning_rate": 3.8821793328414425e-08, + "loss": 0.0006, + "step": 41555 + }, + { + "epoch": 0.81, + "learning_rate": 3.8817909984078284e-08, + "loss": 0.0005, + "step": 41556 + }, + { + "epoch": 0.81, + "learning_rate": 3.881402663974214e-08, + "loss": 0.0004, + "step": 41557 + }, + { + "epoch": 0.81, + "learning_rate": 3.8810143295406e-08, + "loss": 0.0004, + "step": 41558 + }, + { + "epoch": 0.81, + "learning_rate": 3.880625995106986e-08, + "loss": 0.0004, + "step": 41559 + }, + { + "epoch": 0.81, + "learning_rate": 3.8802376606733717e-08, + "loss": 0.0004, + "step": 41560 + }, + { + "epoch": 0.81, + "learning_rate": 3.8798493262397575e-08, + "loss": 0.0003, + "step": 41561 + }, + { + "epoch": 0.81, + "learning_rate": 3.879460991806143e-08, + "loss": 0.0006, + "step": 41562 + }, + { + "epoch": 0.81, + "learning_rate": 3.879072657372529e-08, + "loss": 0.0004, + "step": 41563 + }, + { + "epoch": 0.81, + "learning_rate": 3.878684322938915e-08, + "loss": 0.0004, + "step": 41564 + }, + { + "epoch": 0.81, + "learning_rate": 3.878295988505301e-08, + "loss": 0.0004, + "step": 41565 + }, + { + "epoch": 0.81, + "learning_rate": 3.8779076540716866e-08, + "loss": 0.0003, + "step": 41566 + }, + { + "epoch": 0.81, + "learning_rate": 3.8775193196380724e-08, + "loss": 0.0005, + "step": 41567 + }, + { + "epoch": 0.81, + "learning_rate": 3.877130985204458e-08, + "loss": 0.0006, + "step": 41568 + }, + { + "epoch": 0.81, + "learning_rate": 3.876742650770844e-08, + "loss": 0.0142, + "step": 41569 + }, + { + "epoch": 0.81, + "learning_rate": 3.876354316337229e-08, + "loss": 0.0004, + "step": 41570 + }, + { + "epoch": 0.81, + "learning_rate": 3.875965981903615e-08, + "loss": 0.0005, + "step": 41571 + }, + { + "epoch": 0.81, + "learning_rate": 3.875577647470001e-08, + "loss": 0.0003, + "step": 41572 + }, + { + "epoch": 0.81, + "learning_rate": 3.875189313036387e-08, + "loss": 0.0004, + "step": 41573 + }, + { + "epoch": 0.81, + "learning_rate": 3.8748009786027725e-08, + "loss": 0.0698, + "step": 41574 + }, + { + "epoch": 0.81, + "learning_rate": 3.8744126441691584e-08, + "loss": 0.0047, + "step": 41575 + }, + { + "epoch": 0.81, + "learning_rate": 3.874024309735544e-08, + "loss": 0.0008, + "step": 41576 + }, + { + "epoch": 0.81, + "learning_rate": 3.87363597530193e-08, + "loss": 0.0004, + "step": 41577 + }, + { + "epoch": 0.81, + "learning_rate": 3.873247640868316e-08, + "loss": 0.0185, + "step": 41578 + }, + { + "epoch": 0.81, + "learning_rate": 3.8728593064347017e-08, + "loss": 0.0005, + "step": 41579 + }, + { + "epoch": 0.81, + "learning_rate": 3.8724709720010875e-08, + "loss": 0.0005, + "step": 41580 + }, + { + "epoch": 0.81, + "learning_rate": 3.872082637567473e-08, + "loss": 0.0003, + "step": 41581 + }, + { + "epoch": 0.81, + "learning_rate": 3.871694303133859e-08, + "loss": 0.0005, + "step": 41582 + }, + { + "epoch": 0.81, + "learning_rate": 3.871305968700245e-08, + "loss": 0.0003, + "step": 41583 + }, + { + "epoch": 0.81, + "learning_rate": 3.87091763426663e-08, + "loss": 0.0004, + "step": 41584 + }, + { + "epoch": 0.81, + "learning_rate": 3.870529299833016e-08, + "loss": 0.0014, + "step": 41585 + }, + { + "epoch": 0.81, + "learning_rate": 3.870140965399402e-08, + "loss": 1.3697, + "step": 41586 + }, + { + "epoch": 0.81, + "learning_rate": 3.8697526309657876e-08, + "loss": 0.0003, + "step": 41587 + }, + { + "epoch": 0.81, + "learning_rate": 3.8693642965321734e-08, + "loss": 0.0004, + "step": 41588 + }, + { + "epoch": 0.81, + "learning_rate": 3.868975962098559e-08, + "loss": 0.0005, + "step": 41589 + }, + { + "epoch": 0.81, + "learning_rate": 3.868587627664945e-08, + "loss": 0.0007, + "step": 41590 + }, + { + "epoch": 0.81, + "learning_rate": 3.868199293231331e-08, + "loss": 0.0008, + "step": 41591 + }, + { + "epoch": 0.81, + "learning_rate": 3.867810958797717e-08, + "loss": 0.0005, + "step": 41592 + }, + { + "epoch": 0.81, + "learning_rate": 3.8674226243641025e-08, + "loss": 0.0003, + "step": 41593 + }, + { + "epoch": 0.81, + "learning_rate": 3.8670342899304884e-08, + "loss": 0.0003, + "step": 41594 + }, + { + "epoch": 0.81, + "learning_rate": 3.866645955496874e-08, + "loss": 0.0006, + "step": 41595 + }, + { + "epoch": 0.81, + "learning_rate": 3.86625762106326e-08, + "loss": 1.3075, + "step": 41596 + }, + { + "epoch": 0.81, + "learning_rate": 3.865869286629645e-08, + "loss": 0.0003, + "step": 41597 + }, + { + "epoch": 0.81, + "learning_rate": 3.865480952196031e-08, + "loss": 0.0003, + "step": 41598 + }, + { + "epoch": 0.81, + "learning_rate": 3.865092617762417e-08, + "loss": 0.0005, + "step": 41599 + }, + { + "epoch": 0.81, + "learning_rate": 3.8647042833288027e-08, + "loss": 0.0004, + "step": 41600 + }, + { + "epoch": 0.81, + "learning_rate": 3.8643159488951885e-08, + "loss": 0.0004, + "step": 41601 + }, + { + "epoch": 0.81, + "learning_rate": 3.863927614461574e-08, + "loss": 0.0013, + "step": 41602 + }, + { + "epoch": 0.81, + "learning_rate": 3.86353928002796e-08, + "loss": 0.0006, + "step": 41603 + }, + { + "epoch": 0.81, + "learning_rate": 3.863150945594346e-08, + "loss": 0.0004, + "step": 41604 + }, + { + "epoch": 0.81, + "learning_rate": 3.862762611160731e-08, + "loss": 0.0004, + "step": 41605 + }, + { + "epoch": 0.81, + "learning_rate": 3.862374276727117e-08, + "loss": 0.0006, + "step": 41606 + }, + { + "epoch": 0.81, + "learning_rate": 3.861985942293503e-08, + "loss": 0.0003, + "step": 41607 + }, + { + "epoch": 0.81, + "learning_rate": 3.8615976078598886e-08, + "loss": 0.0006, + "step": 41608 + }, + { + "epoch": 0.81, + "learning_rate": 3.8612092734262744e-08, + "loss": 0.0003, + "step": 41609 + }, + { + "epoch": 0.81, + "learning_rate": 3.86082093899266e-08, + "loss": 0.2048, + "step": 41610 + }, + { + "epoch": 0.81, + "learning_rate": 3.860432604559046e-08, + "loss": 0.0369, + "step": 41611 + }, + { + "epoch": 0.81, + "learning_rate": 3.860044270125432e-08, + "loss": 0.0004, + "step": 41612 + }, + { + "epoch": 0.81, + "learning_rate": 3.859655935691817e-08, + "loss": 0.0003, + "step": 41613 + }, + { + "epoch": 0.81, + "learning_rate": 3.859267601258203e-08, + "loss": 0.0005, + "step": 41614 + }, + { + "epoch": 0.81, + "learning_rate": 3.858879266824589e-08, + "loss": 0.0003, + "step": 41615 + }, + { + "epoch": 0.81, + "learning_rate": 3.8584909323909745e-08, + "loss": 0.0005, + "step": 41616 + }, + { + "epoch": 0.81, + "learning_rate": 3.8581025979573603e-08, + "loss": 0.0009, + "step": 41617 + }, + { + "epoch": 0.81, + "learning_rate": 3.857714263523746e-08, + "loss": 0.0004, + "step": 41618 + }, + { + "epoch": 0.81, + "learning_rate": 3.857325929090132e-08, + "loss": 0.0004, + "step": 41619 + }, + { + "epoch": 0.81, + "learning_rate": 3.856937594656518e-08, + "loss": 0.0004, + "step": 41620 + }, + { + "epoch": 0.81, + "learning_rate": 3.8565492602229036e-08, + "loss": 0.0005, + "step": 41621 + }, + { + "epoch": 0.81, + "learning_rate": 3.8561609257892895e-08, + "loss": 0.0003, + "step": 41622 + }, + { + "epoch": 0.81, + "learning_rate": 3.855772591355675e-08, + "loss": 0.0003, + "step": 41623 + }, + { + "epoch": 0.81, + "learning_rate": 3.855384256922061e-08, + "loss": 0.4994, + "step": 41624 + }, + { + "epoch": 0.81, + "learning_rate": 3.854995922488447e-08, + "loss": 0.0003, + "step": 41625 + }, + { + "epoch": 0.81, + "learning_rate": 3.854607588054833e-08, + "loss": 0.0003, + "step": 41626 + }, + { + "epoch": 0.81, + "learning_rate": 3.8542192536212186e-08, + "loss": 0.0005, + "step": 41627 + }, + { + "epoch": 0.81, + "learning_rate": 3.853830919187604e-08, + "loss": 0.0003, + "step": 41628 + }, + { + "epoch": 0.81, + "learning_rate": 3.8534425847539896e-08, + "loss": 0.0004, + "step": 41629 + }, + { + "epoch": 0.81, + "learning_rate": 3.8530542503203754e-08, + "loss": 0.0005, + "step": 41630 + }, + { + "epoch": 0.81, + "learning_rate": 3.852665915886761e-08, + "loss": 0.8571, + "step": 41631 + }, + { + "epoch": 0.81, + "learning_rate": 3.852277581453147e-08, + "loss": 0.0004, + "step": 41632 + }, + { + "epoch": 0.81, + "learning_rate": 3.851889247019533e-08, + "loss": 0.0003, + "step": 41633 + }, + { + "epoch": 0.81, + "learning_rate": 3.851500912585919e-08, + "loss": 0.0003, + "step": 41634 + }, + { + "epoch": 0.81, + "learning_rate": 3.8511125781523045e-08, + "loss": 0.0005, + "step": 41635 + }, + { + "epoch": 0.81, + "learning_rate": 3.8507242437186903e-08, + "loss": 0.0005, + "step": 41636 + }, + { + "epoch": 0.81, + "learning_rate": 3.850335909285076e-08, + "loss": 0.0005, + "step": 41637 + }, + { + "epoch": 0.81, + "learning_rate": 3.849947574851462e-08, + "loss": 0.0004, + "step": 41638 + }, + { + "epoch": 0.81, + "learning_rate": 3.849559240417848e-08, + "loss": 0.0004, + "step": 41639 + }, + { + "epoch": 0.81, + "learning_rate": 3.8491709059842336e-08, + "loss": 0.0008, + "step": 41640 + }, + { + "epoch": 0.81, + "learning_rate": 3.8487825715506195e-08, + "loss": 0.0006, + "step": 41641 + }, + { + "epoch": 0.81, + "learning_rate": 3.8483942371170046e-08, + "loss": 0.0158, + "step": 41642 + }, + { + "epoch": 0.81, + "learning_rate": 3.8480059026833905e-08, + "loss": 0.0002, + "step": 41643 + }, + { + "epoch": 0.81, + "learning_rate": 3.847617568249776e-08, + "loss": 0.0003, + "step": 41644 + }, + { + "epoch": 0.81, + "learning_rate": 3.847229233816162e-08, + "loss": 0.0004, + "step": 41645 + }, + { + "epoch": 0.81, + "learning_rate": 3.846840899382548e-08, + "loss": 0.2855, + "step": 41646 + }, + { + "epoch": 0.81, + "learning_rate": 3.846452564948934e-08, + "loss": 0.0005, + "step": 41647 + }, + { + "epoch": 0.81, + "learning_rate": 3.8460642305153196e-08, + "loss": 0.002, + "step": 41648 + }, + { + "epoch": 0.81, + "learning_rate": 3.8456758960817054e-08, + "loss": 0.0005, + "step": 41649 + }, + { + "epoch": 0.81, + "learning_rate": 3.845287561648091e-08, + "loss": 0.0004, + "step": 41650 + }, + { + "epoch": 0.81, + "learning_rate": 3.844899227214477e-08, + "loss": 0.0003, + "step": 41651 + }, + { + "epoch": 0.81, + "learning_rate": 3.844510892780863e-08, + "loss": 0.0005, + "step": 41652 + }, + { + "epoch": 0.81, + "learning_rate": 3.844122558347249e-08, + "loss": 0.0004, + "step": 41653 + }, + { + "epoch": 0.81, + "learning_rate": 3.8437342239136345e-08, + "loss": 0.0004, + "step": 41654 + }, + { + "epoch": 0.81, + "learning_rate": 3.8433458894800204e-08, + "loss": 0.0003, + "step": 41655 + }, + { + "epoch": 0.81, + "learning_rate": 3.842957555046406e-08, + "loss": 0.0007, + "step": 41656 + }, + { + "epoch": 0.81, + "learning_rate": 3.8425692206127913e-08, + "loss": 0.0004, + "step": 41657 + }, + { + "epoch": 0.81, + "learning_rate": 3.842180886179177e-08, + "loss": 0.0009, + "step": 41658 + }, + { + "epoch": 0.81, + "learning_rate": 3.841792551745563e-08, + "loss": 0.0004, + "step": 41659 + }, + { + "epoch": 0.81, + "learning_rate": 3.841404217311949e-08, + "loss": 0.0005, + "step": 41660 + }, + { + "epoch": 0.81, + "learning_rate": 3.8410158828783346e-08, + "loss": 0.0004, + "step": 41661 + }, + { + "epoch": 0.81, + "learning_rate": 3.8406275484447205e-08, + "loss": 0.0007, + "step": 41662 + }, + { + "epoch": 0.81, + "learning_rate": 3.840239214011106e-08, + "loss": 0.0004, + "step": 41663 + }, + { + "epoch": 0.81, + "learning_rate": 3.839850879577492e-08, + "loss": 0.0004, + "step": 41664 + }, + { + "epoch": 0.81, + "learning_rate": 3.839462545143878e-08, + "loss": 0.0002, + "step": 41665 + }, + { + "epoch": 0.81, + "learning_rate": 3.839074210710264e-08, + "loss": 0.0004, + "step": 41666 + }, + { + "epoch": 0.81, + "learning_rate": 3.8386858762766496e-08, + "loss": 0.0004, + "step": 41667 + }, + { + "epoch": 0.81, + "learning_rate": 3.8382975418430354e-08, + "loss": 0.0011, + "step": 41668 + }, + { + "epoch": 0.81, + "learning_rate": 3.837909207409421e-08, + "loss": 1.1234, + "step": 41669 + }, + { + "epoch": 0.81, + "learning_rate": 3.837520872975807e-08, + "loss": 0.0006, + "step": 41670 + }, + { + "epoch": 0.81, + "learning_rate": 3.837132538542192e-08, + "loss": 0.0004, + "step": 41671 + }, + { + "epoch": 0.81, + "learning_rate": 3.836744204108578e-08, + "loss": 0.0003, + "step": 41672 + }, + { + "epoch": 0.81, + "learning_rate": 3.836355869674964e-08, + "loss": 0.0003, + "step": 41673 + }, + { + "epoch": 0.81, + "learning_rate": 3.83596753524135e-08, + "loss": 0.0004, + "step": 41674 + }, + { + "epoch": 0.81, + "learning_rate": 3.8355792008077355e-08, + "loss": 0.0004, + "step": 41675 + }, + { + "epoch": 0.81, + "learning_rate": 3.8351908663741213e-08, + "loss": 0.0065, + "step": 41676 + }, + { + "epoch": 0.81, + "learning_rate": 3.834802531940507e-08, + "loss": 0.0005, + "step": 41677 + }, + { + "epoch": 0.81, + "learning_rate": 3.834414197506893e-08, + "loss": 0.0003, + "step": 41678 + }, + { + "epoch": 0.81, + "learning_rate": 3.834025863073279e-08, + "loss": 0.0004, + "step": 41679 + }, + { + "epoch": 0.81, + "learning_rate": 3.8336375286396646e-08, + "loss": 0.0004, + "step": 41680 + }, + { + "epoch": 0.81, + "learning_rate": 3.8332491942060505e-08, + "loss": 0.0002, + "step": 41681 + }, + { + "epoch": 0.81, + "learning_rate": 3.832860859772436e-08, + "loss": 0.0011, + "step": 41682 + }, + { + "epoch": 0.81, + "learning_rate": 3.832472525338822e-08, + "loss": 0.0003, + "step": 41683 + }, + { + "epoch": 0.81, + "learning_rate": 3.832084190905208e-08, + "loss": 0.0004, + "step": 41684 + }, + { + "epoch": 0.81, + "learning_rate": 3.831695856471594e-08, + "loss": 0.0005, + "step": 41685 + }, + { + "epoch": 0.81, + "learning_rate": 3.831307522037979e-08, + "loss": 0.0004, + "step": 41686 + }, + { + "epoch": 0.81, + "learning_rate": 3.830919187604365e-08, + "loss": 0.0005, + "step": 41687 + }, + { + "epoch": 0.81, + "learning_rate": 3.8305308531707506e-08, + "loss": 0.3756, + "step": 41688 + }, + { + "epoch": 0.81, + "learning_rate": 3.8301425187371364e-08, + "loss": 0.0005, + "step": 41689 + }, + { + "epoch": 0.81, + "learning_rate": 3.829754184303522e-08, + "loss": 0.0003, + "step": 41690 + }, + { + "epoch": 0.81, + "learning_rate": 3.829365849869908e-08, + "loss": 0.0005, + "step": 41691 + }, + { + "epoch": 0.81, + "learning_rate": 3.828977515436294e-08, + "loss": 0.0004, + "step": 41692 + }, + { + "epoch": 0.81, + "learning_rate": 3.828589181002679e-08, + "loss": 0.0004, + "step": 41693 + }, + { + "epoch": 0.81, + "learning_rate": 3.828200846569065e-08, + "loss": 0.0006, + "step": 41694 + }, + { + "epoch": 0.81, + "learning_rate": 3.827812512135451e-08, + "loss": 0.0009, + "step": 41695 + }, + { + "epoch": 0.81, + "learning_rate": 3.8274241777018365e-08, + "loss": 0.0002, + "step": 41696 + }, + { + "epoch": 0.81, + "learning_rate": 3.8270358432682223e-08, + "loss": 0.0015, + "step": 41697 + }, + { + "epoch": 0.81, + "learning_rate": 3.826647508834608e-08, + "loss": 0.0003, + "step": 41698 + }, + { + "epoch": 0.81, + "learning_rate": 3.826259174400994e-08, + "loss": 0.0004, + "step": 41699 + }, + { + "epoch": 0.81, + "learning_rate": 3.825870839967379e-08, + "loss": 0.0003, + "step": 41700 + }, + { + "epoch": 0.81, + "learning_rate": 3.825482505533765e-08, + "loss": 0.0004, + "step": 41701 + }, + { + "epoch": 0.81, + "learning_rate": 3.825094171100151e-08, + "loss": 0.0004, + "step": 41702 + }, + { + "epoch": 0.81, + "learning_rate": 3.8247058366665366e-08, + "loss": 0.0003, + "step": 41703 + }, + { + "epoch": 0.81, + "learning_rate": 3.8243175022329224e-08, + "loss": 0.354, + "step": 41704 + }, + { + "epoch": 0.81, + "learning_rate": 3.823929167799308e-08, + "loss": 0.1305, + "step": 41705 + }, + { + "epoch": 0.81, + "learning_rate": 3.823540833365694e-08, + "loss": 0.0005, + "step": 41706 + }, + { + "epoch": 0.81, + "learning_rate": 3.82315249893208e-08, + "loss": 0.0005, + "step": 41707 + }, + { + "epoch": 0.81, + "learning_rate": 3.822764164498466e-08, + "loss": 0.0005, + "step": 41708 + }, + { + "epoch": 0.81, + "learning_rate": 3.8223758300648516e-08, + "loss": 0.0007, + "step": 41709 + }, + { + "epoch": 0.81, + "learning_rate": 3.8219874956312374e-08, + "loss": 0.0003, + "step": 41710 + }, + { + "epoch": 0.81, + "learning_rate": 3.821599161197623e-08, + "loss": 0.0003, + "step": 41711 + }, + { + "epoch": 0.81, + "learning_rate": 3.821210826764009e-08, + "loss": 0.0004, + "step": 41712 + }, + { + "epoch": 0.81, + "learning_rate": 3.820822492330395e-08, + "loss": 0.8918, + "step": 41713 + }, + { + "epoch": 0.81, + "learning_rate": 3.820434157896781e-08, + "loss": 0.0004, + "step": 41714 + }, + { + "epoch": 0.81, + "learning_rate": 3.820045823463166e-08, + "loss": 0.0003, + "step": 41715 + }, + { + "epoch": 0.81, + "learning_rate": 3.819657489029552e-08, + "loss": 0.0006, + "step": 41716 + }, + { + "epoch": 0.81, + "learning_rate": 3.8192691545959375e-08, + "loss": 0.0005, + "step": 41717 + }, + { + "epoch": 0.81, + "learning_rate": 3.818880820162323e-08, + "loss": 0.0005, + "step": 41718 + }, + { + "epoch": 0.81, + "learning_rate": 3.818492485728709e-08, + "loss": 0.0006, + "step": 41719 + }, + { + "epoch": 0.81, + "learning_rate": 3.818104151295095e-08, + "loss": 0.0003, + "step": 41720 + }, + { + "epoch": 0.81, + "learning_rate": 3.817715816861481e-08, + "loss": 0.0004, + "step": 41721 + }, + { + "epoch": 0.81, + "learning_rate": 3.8173274824278666e-08, + "loss": 0.0005, + "step": 41722 + }, + { + "epoch": 0.81, + "learning_rate": 3.8169391479942524e-08, + "loss": 0.0004, + "step": 41723 + }, + { + "epoch": 0.81, + "learning_rate": 3.816550813560638e-08, + "loss": 0.0004, + "step": 41724 + }, + { + "epoch": 0.81, + "learning_rate": 3.816162479127024e-08, + "loss": 0.0004, + "step": 41725 + }, + { + "epoch": 0.81, + "learning_rate": 3.81577414469341e-08, + "loss": 0.8186, + "step": 41726 + }, + { + "epoch": 0.81, + "learning_rate": 3.815385810259796e-08, + "loss": 0.0005, + "step": 41727 + }, + { + "epoch": 0.81, + "learning_rate": 3.8149974758261816e-08, + "loss": 0.0003, + "step": 41728 + }, + { + "epoch": 0.81, + "learning_rate": 3.814609141392567e-08, + "loss": 0.5656, + "step": 41729 + }, + { + "epoch": 0.81, + "learning_rate": 3.8142208069589526e-08, + "loss": 0.0005, + "step": 41730 + }, + { + "epoch": 0.81, + "learning_rate": 3.8138324725253384e-08, + "loss": 0.001, + "step": 41731 + }, + { + "epoch": 0.81, + "learning_rate": 3.813444138091724e-08, + "loss": 0.0006, + "step": 41732 + }, + { + "epoch": 0.81, + "learning_rate": 3.81305580365811e-08, + "loss": 0.7834, + "step": 41733 + }, + { + "epoch": 0.81, + "learning_rate": 3.812667469224496e-08, + "loss": 0.0004, + "step": 41734 + }, + { + "epoch": 0.81, + "learning_rate": 3.812279134790882e-08, + "loss": 0.0011, + "step": 41735 + }, + { + "epoch": 0.81, + "learning_rate": 3.8118908003572675e-08, + "loss": 0.0004, + "step": 41736 + }, + { + "epoch": 0.81, + "learning_rate": 3.811502465923653e-08, + "loss": 0.0006, + "step": 41737 + }, + { + "epoch": 0.81, + "learning_rate": 3.811114131490039e-08, + "loss": 0.0004, + "step": 41738 + }, + { + "epoch": 0.81, + "learning_rate": 3.810725797056425e-08, + "loss": 0.0003, + "step": 41739 + }, + { + "epoch": 0.81, + "learning_rate": 3.810337462622811e-08, + "loss": 0.0006, + "step": 41740 + }, + { + "epoch": 0.81, + "learning_rate": 3.8099491281891966e-08, + "loss": 0.0003, + "step": 41741 + }, + { + "epoch": 0.81, + "learning_rate": 3.8095607937555824e-08, + "loss": 0.0005, + "step": 41742 + }, + { + "epoch": 0.81, + "learning_rate": 3.809172459321968e-08, + "loss": 0.0003, + "step": 41743 + }, + { + "epoch": 0.81, + "learning_rate": 3.8087841248883534e-08, + "loss": 0.0004, + "step": 41744 + }, + { + "epoch": 0.81, + "learning_rate": 3.808395790454739e-08, + "loss": 0.0005, + "step": 41745 + }, + { + "epoch": 0.81, + "learning_rate": 3.808007456021125e-08, + "loss": 0.0004, + "step": 41746 + }, + { + "epoch": 0.81, + "learning_rate": 3.807619121587511e-08, + "loss": 0.0003, + "step": 41747 + }, + { + "epoch": 0.81, + "learning_rate": 3.807230787153897e-08, + "loss": 0.0005, + "step": 41748 + }, + { + "epoch": 0.81, + "learning_rate": 3.8068424527202826e-08, + "loss": 0.0004, + "step": 41749 + }, + { + "epoch": 0.81, + "learning_rate": 3.8064541182866684e-08, + "loss": 0.0005, + "step": 41750 + }, + { + "epoch": 0.81, + "learning_rate": 3.806065783853054e-08, + "loss": 0.8825, + "step": 41751 + }, + { + "epoch": 0.81, + "learning_rate": 3.80567744941944e-08, + "loss": 0.0004, + "step": 41752 + }, + { + "epoch": 0.81, + "learning_rate": 3.805289114985826e-08, + "loss": 0.0003, + "step": 41753 + }, + { + "epoch": 0.81, + "learning_rate": 3.804900780552212e-08, + "loss": 0.0004, + "step": 41754 + }, + { + "epoch": 0.81, + "learning_rate": 3.8045124461185975e-08, + "loss": 0.0004, + "step": 41755 + }, + { + "epoch": 0.81, + "learning_rate": 3.804124111684983e-08, + "loss": 0.0005, + "step": 41756 + }, + { + "epoch": 0.81, + "learning_rate": 3.803735777251369e-08, + "loss": 0.0005, + "step": 41757 + }, + { + "epoch": 0.81, + "learning_rate": 3.803347442817754e-08, + "loss": 0.0003, + "step": 41758 + }, + { + "epoch": 0.81, + "learning_rate": 3.80295910838414e-08, + "loss": 0.0231, + "step": 41759 + }, + { + "epoch": 0.81, + "learning_rate": 3.802570773950526e-08, + "loss": 0.0006, + "step": 41760 + }, + { + "epoch": 0.81, + "learning_rate": 3.802182439516912e-08, + "loss": 0.2862, + "step": 41761 + }, + { + "epoch": 0.81, + "learning_rate": 3.8017941050832976e-08, + "loss": 0.0004, + "step": 41762 + }, + { + "epoch": 0.81, + "learning_rate": 3.8014057706496834e-08, + "loss": 0.0003, + "step": 41763 + }, + { + "epoch": 0.81, + "learning_rate": 3.801017436216069e-08, + "loss": 0.0005, + "step": 41764 + }, + { + "epoch": 0.81, + "learning_rate": 3.800629101782455e-08, + "loss": 0.0003, + "step": 41765 + }, + { + "epoch": 0.81, + "learning_rate": 3.800240767348841e-08, + "loss": 0.4363, + "step": 41766 + }, + { + "epoch": 0.81, + "learning_rate": 3.799852432915227e-08, + "loss": 0.0004, + "step": 41767 + }, + { + "epoch": 0.81, + "learning_rate": 3.7994640984816126e-08, + "loss": 0.0006, + "step": 41768 + }, + { + "epoch": 0.81, + "learning_rate": 3.7990757640479984e-08, + "loss": 0.0004, + "step": 41769 + }, + { + "epoch": 0.81, + "learning_rate": 3.798687429614384e-08, + "loss": 0.0004, + "step": 41770 + }, + { + "epoch": 0.81, + "learning_rate": 3.79829909518077e-08, + "loss": 0.0005, + "step": 41771 + }, + { + "epoch": 0.81, + "learning_rate": 3.797910760747156e-08, + "loss": 0.0005, + "step": 41772 + }, + { + "epoch": 0.81, + "learning_rate": 3.797522426313541e-08, + "loss": 0.0005, + "step": 41773 + }, + { + "epoch": 0.81, + "learning_rate": 3.797134091879927e-08, + "loss": 0.0003, + "step": 41774 + }, + { + "epoch": 0.81, + "learning_rate": 3.7967457574463127e-08, + "loss": 0.0004, + "step": 41775 + }, + { + "epoch": 0.81, + "learning_rate": 3.7963574230126985e-08, + "loss": 0.0006, + "step": 41776 + }, + { + "epoch": 0.81, + "learning_rate": 3.795969088579084e-08, + "loss": 0.0006, + "step": 41777 + }, + { + "epoch": 0.81, + "learning_rate": 3.79558075414547e-08, + "loss": 0.0004, + "step": 41778 + }, + { + "epoch": 0.81, + "learning_rate": 3.795192419711856e-08, + "loss": 0.0004, + "step": 41779 + }, + { + "epoch": 0.81, + "learning_rate": 3.794804085278242e-08, + "loss": 0.0004, + "step": 41780 + }, + { + "epoch": 0.81, + "learning_rate": 3.7944157508446276e-08, + "loss": 0.0003, + "step": 41781 + }, + { + "epoch": 0.81, + "learning_rate": 3.794027416411013e-08, + "loss": 0.0003, + "step": 41782 + }, + { + "epoch": 0.81, + "learning_rate": 3.7936390819773986e-08, + "loss": 0.0004, + "step": 41783 + }, + { + "epoch": 0.81, + "learning_rate": 3.7932507475437844e-08, + "loss": 0.0005, + "step": 41784 + }, + { + "epoch": 0.81, + "learning_rate": 3.79286241311017e-08, + "loss": 0.0004, + "step": 41785 + }, + { + "epoch": 0.81, + "learning_rate": 3.792474078676556e-08, + "loss": 0.0003, + "step": 41786 + }, + { + "epoch": 0.81, + "learning_rate": 3.792085744242942e-08, + "loss": 0.0004, + "step": 41787 + }, + { + "epoch": 0.81, + "learning_rate": 3.791697409809328e-08, + "loss": 0.0004, + "step": 41788 + }, + { + "epoch": 0.81, + "learning_rate": 3.791309075375713e-08, + "loss": 0.0002, + "step": 41789 + }, + { + "epoch": 0.81, + "learning_rate": 3.790920740942099e-08, + "loss": 0.0003, + "step": 41790 + }, + { + "epoch": 0.81, + "learning_rate": 3.7905324065084845e-08, + "loss": 0.3116, + "step": 41791 + }, + { + "epoch": 0.81, + "learning_rate": 3.7901440720748704e-08, + "loss": 0.0006, + "step": 41792 + }, + { + "epoch": 0.81, + "learning_rate": 3.789755737641256e-08, + "loss": 0.0004, + "step": 41793 + }, + { + "epoch": 0.81, + "learning_rate": 3.789367403207642e-08, + "loss": 0.0003, + "step": 41794 + }, + { + "epoch": 0.81, + "learning_rate": 3.788979068774028e-08, + "loss": 0.0004, + "step": 41795 + }, + { + "epoch": 0.81, + "learning_rate": 3.7885907343404137e-08, + "loss": 0.0004, + "step": 41796 + }, + { + "epoch": 0.81, + "learning_rate": 3.7882023999067995e-08, + "loss": 0.0003, + "step": 41797 + }, + { + "epoch": 0.81, + "learning_rate": 3.787814065473185e-08, + "loss": 0.57, + "step": 41798 + }, + { + "epoch": 0.81, + "learning_rate": 3.787425731039571e-08, + "loss": 0.1687, + "step": 41799 + }, + { + "epoch": 0.81, + "learning_rate": 3.787037396605957e-08, + "loss": 0.0003, + "step": 41800 + }, + { + "epoch": 0.81, + "learning_rate": 3.786649062172343e-08, + "loss": 0.0005, + "step": 41801 + }, + { + "epoch": 0.81, + "learning_rate": 3.786260727738728e-08, + "loss": 0.0004, + "step": 41802 + }, + { + "epoch": 0.81, + "learning_rate": 3.785872393305114e-08, + "loss": 0.0005, + "step": 41803 + }, + { + "epoch": 0.81, + "learning_rate": 3.7854840588714996e-08, + "loss": 0.0006, + "step": 41804 + }, + { + "epoch": 0.81, + "learning_rate": 3.7850957244378854e-08, + "loss": 0.0004, + "step": 41805 + }, + { + "epoch": 0.81, + "learning_rate": 3.784707390004271e-08, + "loss": 0.0004, + "step": 41806 + }, + { + "epoch": 0.81, + "learning_rate": 3.784319055570657e-08, + "loss": 0.001, + "step": 41807 + }, + { + "epoch": 0.81, + "learning_rate": 3.783930721137043e-08, + "loss": 0.0006, + "step": 41808 + }, + { + "epoch": 0.81, + "learning_rate": 3.783542386703429e-08, + "loss": 1.2718, + "step": 41809 + }, + { + "epoch": 0.81, + "learning_rate": 3.7831540522698145e-08, + "loss": 0.0005, + "step": 41810 + }, + { + "epoch": 0.81, + "learning_rate": 3.7827657178362004e-08, + "loss": 0.0005, + "step": 41811 + }, + { + "epoch": 0.81, + "learning_rate": 3.782377383402586e-08, + "loss": 0.0007, + "step": 41812 + }, + { + "epoch": 0.81, + "learning_rate": 3.781989048968972e-08, + "loss": 0.0225, + "step": 41813 + }, + { + "epoch": 0.81, + "learning_rate": 3.781600714535358e-08, + "loss": 0.0004, + "step": 41814 + }, + { + "epoch": 0.81, + "learning_rate": 3.7812123801017437e-08, + "loss": 0.0012, + "step": 41815 + }, + { + "epoch": 0.81, + "learning_rate": 3.780824045668129e-08, + "loss": 0.0008, + "step": 41816 + }, + { + "epoch": 0.81, + "learning_rate": 3.7804357112345146e-08, + "loss": 0.0004, + "step": 41817 + }, + { + "epoch": 0.81, + "learning_rate": 3.7800473768009005e-08, + "loss": 0.0005, + "step": 41818 + }, + { + "epoch": 0.81, + "learning_rate": 3.779659042367286e-08, + "loss": 0.0004, + "step": 41819 + }, + { + "epoch": 0.81, + "learning_rate": 3.779270707933672e-08, + "loss": 0.0005, + "step": 41820 + }, + { + "epoch": 0.81, + "learning_rate": 3.778882373500058e-08, + "loss": 0.0004, + "step": 41821 + }, + { + "epoch": 0.81, + "learning_rate": 3.778494039066444e-08, + "loss": 0.0006, + "step": 41822 + }, + { + "epoch": 0.81, + "learning_rate": 3.7781057046328296e-08, + "loss": 0.0003, + "step": 41823 + }, + { + "epoch": 0.81, + "learning_rate": 3.7777173701992154e-08, + "loss": 0.0005, + "step": 41824 + }, + { + "epoch": 0.81, + "learning_rate": 3.777329035765601e-08, + "loss": 0.0004, + "step": 41825 + }, + { + "epoch": 0.81, + "learning_rate": 3.776940701331987e-08, + "loss": 0.0004, + "step": 41826 + }, + { + "epoch": 0.81, + "learning_rate": 3.776552366898373e-08, + "loss": 0.0706, + "step": 41827 + }, + { + "epoch": 0.81, + "learning_rate": 3.776164032464759e-08, + "loss": 0.1924, + "step": 41828 + }, + { + "epoch": 0.81, + "learning_rate": 3.7757756980311445e-08, + "loss": 0.0008, + "step": 41829 + }, + { + "epoch": 0.81, + "learning_rate": 3.7753873635975304e-08, + "loss": 0.7751, + "step": 41830 + }, + { + "epoch": 0.81, + "learning_rate": 3.7749990291639155e-08, + "loss": 0.0008, + "step": 41831 + }, + { + "epoch": 0.81, + "learning_rate": 3.7746106947303014e-08, + "loss": 0.0006, + "step": 41832 + }, + { + "epoch": 0.81, + "learning_rate": 3.774222360296687e-08, + "loss": 0.0003, + "step": 41833 + }, + { + "epoch": 0.81, + "learning_rate": 3.773834025863073e-08, + "loss": 0.0004, + "step": 41834 + }, + { + "epoch": 0.81, + "learning_rate": 3.773445691429459e-08, + "loss": 0.0005, + "step": 41835 + }, + { + "epoch": 0.81, + "learning_rate": 3.7730573569958446e-08, + "loss": 0.0003, + "step": 41836 + }, + { + "epoch": 0.81, + "learning_rate": 3.7726690225622305e-08, + "loss": 0.0003, + "step": 41837 + }, + { + "epoch": 0.81, + "learning_rate": 3.772280688128616e-08, + "loss": 0.0004, + "step": 41838 + }, + { + "epoch": 0.81, + "learning_rate": 3.771892353695002e-08, + "loss": 0.0003, + "step": 41839 + }, + { + "epoch": 0.81, + "learning_rate": 3.771504019261388e-08, + "loss": 0.0004, + "step": 41840 + }, + { + "epoch": 0.81, + "learning_rate": 3.771115684827774e-08, + "loss": 0.6711, + "step": 41841 + }, + { + "epoch": 0.81, + "learning_rate": 3.7707273503941596e-08, + "loss": 0.0005, + "step": 41842 + }, + { + "epoch": 0.81, + "learning_rate": 3.7703390159605454e-08, + "loss": 0.176, + "step": 41843 + }, + { + "epoch": 0.81, + "learning_rate": 3.769950681526931e-08, + "loss": 0.0003, + "step": 41844 + }, + { + "epoch": 0.81, + "learning_rate": 3.7695623470933164e-08, + "loss": 0.0004, + "step": 41845 + }, + { + "epoch": 0.81, + "learning_rate": 3.769174012659702e-08, + "loss": 0.0004, + "step": 41846 + }, + { + "epoch": 0.81, + "learning_rate": 3.768785678226088e-08, + "loss": 0.0006, + "step": 41847 + }, + { + "epoch": 0.81, + "learning_rate": 3.768397343792474e-08, + "loss": 0.0305, + "step": 41848 + }, + { + "epoch": 0.81, + "learning_rate": 3.76800900935886e-08, + "loss": 0.0006, + "step": 41849 + }, + { + "epoch": 0.81, + "learning_rate": 3.7676206749252455e-08, + "loss": 0.0003, + "step": 41850 + }, + { + "epoch": 0.81, + "learning_rate": 3.7672323404916314e-08, + "loss": 0.0003, + "step": 41851 + }, + { + "epoch": 0.81, + "learning_rate": 3.766844006058017e-08, + "loss": 0.0004, + "step": 41852 + }, + { + "epoch": 0.81, + "learning_rate": 3.766455671624403e-08, + "loss": 0.0003, + "step": 41853 + }, + { + "epoch": 0.81, + "learning_rate": 3.766067337190789e-08, + "loss": 0.1858, + "step": 41854 + }, + { + "epoch": 0.81, + "learning_rate": 3.7656790027571747e-08, + "loss": 0.4111, + "step": 41855 + }, + { + "epoch": 0.81, + "learning_rate": 3.7652906683235605e-08, + "loss": 0.0021, + "step": 41856 + }, + { + "epoch": 0.81, + "learning_rate": 3.764902333889946e-08, + "loss": 0.0005, + "step": 41857 + }, + { + "epoch": 0.81, + "learning_rate": 3.764513999456332e-08, + "loss": 0.0214, + "step": 41858 + }, + { + "epoch": 0.81, + "learning_rate": 3.764125665022718e-08, + "loss": 0.0003, + "step": 41859 + }, + { + "epoch": 0.81, + "learning_rate": 3.763737330589103e-08, + "loss": 0.0552, + "step": 41860 + }, + { + "epoch": 0.81, + "learning_rate": 3.763348996155489e-08, + "loss": 0.0003, + "step": 41861 + }, + { + "epoch": 0.81, + "learning_rate": 3.762960661721875e-08, + "loss": 0.0003, + "step": 41862 + }, + { + "epoch": 0.81, + "learning_rate": 3.7625723272882606e-08, + "loss": 0.0004, + "step": 41863 + }, + { + "epoch": 0.81, + "learning_rate": 3.7621839928546464e-08, + "loss": 0.0005, + "step": 41864 + }, + { + "epoch": 0.81, + "learning_rate": 3.761795658421032e-08, + "loss": 0.0003, + "step": 41865 + }, + { + "epoch": 0.81, + "learning_rate": 3.761407323987418e-08, + "loss": 0.0008, + "step": 41866 + }, + { + "epoch": 0.81, + "learning_rate": 3.761018989553804e-08, + "loss": 0.0004, + "step": 41867 + }, + { + "epoch": 0.81, + "learning_rate": 3.76063065512019e-08, + "loss": 0.0004, + "step": 41868 + }, + { + "epoch": 0.81, + "learning_rate": 3.7602423206865755e-08, + "loss": 0.1604, + "step": 41869 + }, + { + "epoch": 0.81, + "learning_rate": 3.759853986252961e-08, + "loss": 0.0004, + "step": 41870 + }, + { + "epoch": 0.81, + "learning_rate": 3.7594656518193465e-08, + "loss": 0.0004, + "step": 41871 + }, + { + "epoch": 0.81, + "learning_rate": 3.7590773173857323e-08, + "loss": 0.0004, + "step": 41872 + }, + { + "epoch": 0.81, + "learning_rate": 3.758688982952118e-08, + "loss": 0.0004, + "step": 41873 + }, + { + "epoch": 0.81, + "learning_rate": 3.758300648518504e-08, + "loss": 0.0003, + "step": 41874 + }, + { + "epoch": 0.81, + "learning_rate": 3.75791231408489e-08, + "loss": 0.001, + "step": 41875 + }, + { + "epoch": 0.81, + "learning_rate": 3.7575239796512756e-08, + "loss": 0.0004, + "step": 41876 + }, + { + "epoch": 0.81, + "learning_rate": 3.757135645217661e-08, + "loss": 0.0154, + "step": 41877 + }, + { + "epoch": 0.81, + "learning_rate": 3.7567473107840466e-08, + "loss": 0.0003, + "step": 41878 + }, + { + "epoch": 0.81, + "learning_rate": 3.7563589763504325e-08, + "loss": 0.0005, + "step": 41879 + }, + { + "epoch": 0.81, + "learning_rate": 3.755970641916818e-08, + "loss": 0.0003, + "step": 41880 + }, + { + "epoch": 0.81, + "learning_rate": 3.755582307483204e-08, + "loss": 0.0013, + "step": 41881 + }, + { + "epoch": 0.81, + "learning_rate": 3.75519397304959e-08, + "loss": 0.0005, + "step": 41882 + }, + { + "epoch": 0.81, + "learning_rate": 3.754805638615976e-08, + "loss": 0.0004, + "step": 41883 + }, + { + "epoch": 0.81, + "learning_rate": 3.7544173041823616e-08, + "loss": 0.0086, + "step": 41884 + }, + { + "epoch": 0.81, + "learning_rate": 3.7540289697487474e-08, + "loss": 0.0004, + "step": 41885 + }, + { + "epoch": 0.81, + "learning_rate": 3.753640635315133e-08, + "loss": 0.0009, + "step": 41886 + }, + { + "epoch": 0.81, + "learning_rate": 3.753252300881519e-08, + "loss": 0.0005, + "step": 41887 + }, + { + "epoch": 0.81, + "learning_rate": 3.752863966447905e-08, + "loss": 0.0003, + "step": 41888 + }, + { + "epoch": 0.81, + "learning_rate": 3.75247563201429e-08, + "loss": 0.0005, + "step": 41889 + }, + { + "epoch": 0.81, + "learning_rate": 3.752087297580676e-08, + "loss": 0.0005, + "step": 41890 + }, + { + "epoch": 0.81, + "learning_rate": 3.751698963147062e-08, + "loss": 0.0004, + "step": 41891 + }, + { + "epoch": 0.81, + "learning_rate": 3.7513106287134475e-08, + "loss": 0.7918, + "step": 41892 + }, + { + "epoch": 0.81, + "learning_rate": 3.7509222942798333e-08, + "loss": 0.0004, + "step": 41893 + }, + { + "epoch": 0.81, + "learning_rate": 3.750533959846219e-08, + "loss": 0.0003, + "step": 41894 + }, + { + "epoch": 0.81, + "learning_rate": 3.750145625412605e-08, + "loss": 0.0004, + "step": 41895 + }, + { + "epoch": 0.81, + "learning_rate": 3.749757290978991e-08, + "loss": 0.0016, + "step": 41896 + }, + { + "epoch": 0.81, + "learning_rate": 3.7493689565453766e-08, + "loss": 0.0004, + "step": 41897 + }, + { + "epoch": 0.81, + "learning_rate": 3.7489806221117625e-08, + "loss": 0.0003, + "step": 41898 + }, + { + "epoch": 0.81, + "learning_rate": 3.748592287678148e-08, + "loss": 0.0004, + "step": 41899 + }, + { + "epoch": 0.81, + "learning_rate": 3.748203953244534e-08, + "loss": 0.0003, + "step": 41900 + }, + { + "epoch": 0.81, + "learning_rate": 3.74781561881092e-08, + "loss": 0.0004, + "step": 41901 + }, + { + "epoch": 0.81, + "learning_rate": 3.747427284377306e-08, + "loss": 0.0004, + "step": 41902 + }, + { + "epoch": 0.81, + "learning_rate": 3.747038949943691e-08, + "loss": 0.0041, + "step": 41903 + }, + { + "epoch": 0.81, + "learning_rate": 3.746650615510077e-08, + "loss": 0.0003, + "step": 41904 + }, + { + "epoch": 0.81, + "learning_rate": 3.7462622810764626e-08, + "loss": 0.0004, + "step": 41905 + }, + { + "epoch": 0.81, + "learning_rate": 3.7458739466428484e-08, + "loss": 0.0007, + "step": 41906 + }, + { + "epoch": 0.81, + "learning_rate": 3.745485612209234e-08, + "loss": 0.0036, + "step": 41907 + }, + { + "epoch": 0.81, + "learning_rate": 3.74509727777562e-08, + "loss": 0.0004, + "step": 41908 + }, + { + "epoch": 0.81, + "learning_rate": 3.744708943342006e-08, + "loss": 0.0005, + "step": 41909 + }, + { + "epoch": 0.81, + "learning_rate": 3.744320608908392e-08, + "loss": 0.0004, + "step": 41910 + }, + { + "epoch": 0.81, + "learning_rate": 3.7439322744747775e-08, + "loss": 0.0003, + "step": 41911 + }, + { + "epoch": 0.81, + "learning_rate": 3.7435439400411633e-08, + "loss": 0.0003, + "step": 41912 + }, + { + "epoch": 0.81, + "learning_rate": 3.743155605607549e-08, + "loss": 0.0004, + "step": 41913 + }, + { + "epoch": 0.81, + "learning_rate": 3.742767271173935e-08, + "loss": 0.0004, + "step": 41914 + }, + { + "epoch": 0.81, + "learning_rate": 3.742378936740321e-08, + "loss": 0.0006, + "step": 41915 + }, + { + "epoch": 0.81, + "learning_rate": 3.7419906023067066e-08, + "loss": 0.0052, + "step": 41916 + }, + { + "epoch": 0.81, + "learning_rate": 3.7416022678730925e-08, + "loss": 0.0007, + "step": 41917 + }, + { + "epoch": 0.81, + "learning_rate": 3.7412139334394776e-08, + "loss": 0.525, + "step": 41918 + }, + { + "epoch": 0.81, + "learning_rate": 3.7408255990058634e-08, + "loss": 0.0006, + "step": 41919 + }, + { + "epoch": 0.81, + "learning_rate": 3.740437264572249e-08, + "loss": 0.0004, + "step": 41920 + }, + { + "epoch": 0.81, + "learning_rate": 3.740048930138635e-08, + "loss": 0.0003, + "step": 41921 + }, + { + "epoch": 0.81, + "learning_rate": 3.739660595705021e-08, + "loss": 0.0003, + "step": 41922 + }, + { + "epoch": 0.81, + "learning_rate": 3.739272261271407e-08, + "loss": 0.0005, + "step": 41923 + }, + { + "epoch": 0.81, + "learning_rate": 3.7388839268377926e-08, + "loss": 0.0008, + "step": 41924 + }, + { + "epoch": 0.81, + "learning_rate": 3.7384955924041784e-08, + "loss": 0.0007, + "step": 41925 + }, + { + "epoch": 0.81, + "learning_rate": 3.738107257970564e-08, + "loss": 0.0004, + "step": 41926 + }, + { + "epoch": 0.81, + "learning_rate": 3.73771892353695e-08, + "loss": 1.2764, + "step": 41927 + }, + { + "epoch": 0.81, + "learning_rate": 3.737330589103336e-08, + "loss": 0.0003, + "step": 41928 + }, + { + "epoch": 0.81, + "learning_rate": 3.736942254669722e-08, + "loss": 0.6716, + "step": 41929 + }, + { + "epoch": 0.81, + "learning_rate": 3.7365539202361075e-08, + "loss": 0.0003, + "step": 41930 + }, + { + "epoch": 0.81, + "learning_rate": 3.7361655858024933e-08, + "loss": 0.0011, + "step": 41931 + }, + { + "epoch": 0.81, + "learning_rate": 3.7357772513688785e-08, + "loss": 0.0004, + "step": 41932 + }, + { + "epoch": 0.81, + "learning_rate": 3.735388916935264e-08, + "loss": 0.0008, + "step": 41933 + }, + { + "epoch": 0.81, + "learning_rate": 3.73500058250165e-08, + "loss": 0.0006, + "step": 41934 + }, + { + "epoch": 0.81, + "learning_rate": 3.734612248068036e-08, + "loss": 0.0003, + "step": 41935 + }, + { + "epoch": 0.81, + "learning_rate": 3.734223913634422e-08, + "loss": 0.0003, + "step": 41936 + }, + { + "epoch": 0.81, + "learning_rate": 3.7338355792008076e-08, + "loss": 0.0076, + "step": 41937 + }, + { + "epoch": 0.81, + "learning_rate": 3.7334472447671934e-08, + "loss": 0.0004, + "step": 41938 + }, + { + "epoch": 0.81, + "learning_rate": 3.733058910333579e-08, + "loss": 0.0003, + "step": 41939 + }, + { + "epoch": 0.81, + "learning_rate": 3.732670575899965e-08, + "loss": 0.0738, + "step": 41940 + }, + { + "epoch": 0.81, + "learning_rate": 3.732282241466351e-08, + "loss": 0.3514, + "step": 41941 + }, + { + "epoch": 0.81, + "learning_rate": 3.731893907032737e-08, + "loss": 0.0005, + "step": 41942 + }, + { + "epoch": 0.81, + "learning_rate": 3.7315055725991226e-08, + "loss": 0.0003, + "step": 41943 + }, + { + "epoch": 0.81, + "learning_rate": 3.7311172381655084e-08, + "loss": 0.0004, + "step": 41944 + }, + { + "epoch": 0.81, + "learning_rate": 3.730728903731894e-08, + "loss": 0.0004, + "step": 41945 + }, + { + "epoch": 0.81, + "learning_rate": 3.73034056929828e-08, + "loss": 0.0004, + "step": 41946 + }, + { + "epoch": 0.81, + "learning_rate": 3.729952234864665e-08, + "loss": 0.0003, + "step": 41947 + }, + { + "epoch": 0.81, + "learning_rate": 3.729563900431051e-08, + "loss": 0.001, + "step": 41948 + }, + { + "epoch": 0.81, + "learning_rate": 3.729175565997437e-08, + "loss": 0.0004, + "step": 41949 + }, + { + "epoch": 0.81, + "learning_rate": 3.728787231563823e-08, + "loss": 0.0008, + "step": 41950 + }, + { + "epoch": 0.81, + "learning_rate": 3.7283988971302085e-08, + "loss": 0.0004, + "step": 41951 + }, + { + "epoch": 0.81, + "learning_rate": 3.728010562696594e-08, + "loss": 0.0004, + "step": 41952 + }, + { + "epoch": 0.81, + "learning_rate": 3.72762222826298e-08, + "loss": 0.0003, + "step": 41953 + }, + { + "epoch": 0.81, + "learning_rate": 3.727233893829366e-08, + "loss": 0.0003, + "step": 41954 + }, + { + "epoch": 0.81, + "learning_rate": 3.726845559395752e-08, + "loss": 0.0005, + "step": 41955 + }, + { + "epoch": 0.81, + "learning_rate": 3.7264572249621376e-08, + "loss": 0.0004, + "step": 41956 + }, + { + "epoch": 0.81, + "learning_rate": 3.7260688905285234e-08, + "loss": 0.0004, + "step": 41957 + }, + { + "epoch": 0.81, + "learning_rate": 3.725680556094909e-08, + "loss": 0.0003, + "step": 41958 + }, + { + "epoch": 0.81, + "learning_rate": 3.7252922216612944e-08, + "loss": 0.1004, + "step": 41959 + }, + { + "epoch": 0.81, + "learning_rate": 3.72490388722768e-08, + "loss": 0.0006, + "step": 41960 + }, + { + "epoch": 0.81, + "learning_rate": 3.724515552794066e-08, + "loss": 0.0005, + "step": 41961 + }, + { + "epoch": 0.81, + "learning_rate": 3.724127218360452e-08, + "loss": 0.0003, + "step": 41962 + }, + { + "epoch": 0.81, + "learning_rate": 3.723738883926838e-08, + "loss": 0.0004, + "step": 41963 + }, + { + "epoch": 0.81, + "learning_rate": 3.7233505494932236e-08, + "loss": 0.0004, + "step": 41964 + }, + { + "epoch": 0.81, + "learning_rate": 3.7229622150596094e-08, + "loss": 0.0003, + "step": 41965 + }, + { + "epoch": 0.81, + "learning_rate": 3.7225738806259945e-08, + "loss": 0.0004, + "step": 41966 + }, + { + "epoch": 0.81, + "learning_rate": 3.7221855461923804e-08, + "loss": 0.0011, + "step": 41967 + }, + { + "epoch": 0.81, + "learning_rate": 3.721797211758766e-08, + "loss": 0.0014, + "step": 41968 + }, + { + "epoch": 0.81, + "learning_rate": 3.721408877325152e-08, + "loss": 0.0005, + "step": 41969 + }, + { + "epoch": 0.81, + "learning_rate": 3.721020542891538e-08, + "loss": 0.0004, + "step": 41970 + }, + { + "epoch": 0.81, + "learning_rate": 3.7206322084579237e-08, + "loss": 0.0004, + "step": 41971 + }, + { + "epoch": 0.81, + "learning_rate": 3.7202438740243095e-08, + "loss": 0.0006, + "step": 41972 + }, + { + "epoch": 0.81, + "learning_rate": 3.719855539590695e-08, + "loss": 0.6257, + "step": 41973 + }, + { + "epoch": 0.81, + "learning_rate": 3.719467205157081e-08, + "loss": 0.0004, + "step": 41974 + }, + { + "epoch": 0.81, + "learning_rate": 3.719078870723467e-08, + "loss": 0.0004, + "step": 41975 + }, + { + "epoch": 0.81, + "learning_rate": 3.718690536289852e-08, + "loss": 0.0005, + "step": 41976 + }, + { + "epoch": 0.81, + "learning_rate": 3.718302201856238e-08, + "loss": 0.0006, + "step": 41977 + }, + { + "epoch": 0.81, + "learning_rate": 3.717913867422624e-08, + "loss": 0.0015, + "step": 41978 + }, + { + "epoch": 0.81, + "learning_rate": 3.7175255329890096e-08, + "loss": 0.0004, + "step": 41979 + }, + { + "epoch": 0.81, + "learning_rate": 3.7171371985553954e-08, + "loss": 0.0004, + "step": 41980 + }, + { + "epoch": 0.81, + "learning_rate": 3.716748864121781e-08, + "loss": 0.0004, + "step": 41981 + }, + { + "epoch": 0.81, + "learning_rate": 3.716360529688167e-08, + "loss": 0.0004, + "step": 41982 + }, + { + "epoch": 0.81, + "learning_rate": 3.715972195254553e-08, + "loss": 0.0003, + "step": 41983 + }, + { + "epoch": 0.81, + "learning_rate": 3.715583860820939e-08, + "loss": 0.0005, + "step": 41984 + }, + { + "epoch": 0.81, + "learning_rate": 3.7151955263873245e-08, + "loss": 0.0004, + "step": 41985 + }, + { + "epoch": 0.81, + "learning_rate": 3.7148071919537104e-08, + "loss": 0.1174, + "step": 41986 + }, + { + "epoch": 0.81, + "learning_rate": 3.714418857520096e-08, + "loss": 0.0003, + "step": 41987 + }, + { + "epoch": 0.81, + "learning_rate": 3.714030523086482e-08, + "loss": 0.0003, + "step": 41988 + }, + { + "epoch": 0.81, + "learning_rate": 3.713642188652868e-08, + "loss": 0.6824, + "step": 41989 + }, + { + "epoch": 0.81, + "learning_rate": 3.713253854219253e-08, + "loss": 0.4151, + "step": 41990 + }, + { + "epoch": 0.81, + "learning_rate": 3.712865519785639e-08, + "loss": 0.0004, + "step": 41991 + }, + { + "epoch": 0.81, + "learning_rate": 3.7124771853520247e-08, + "loss": 0.0004, + "step": 41992 + }, + { + "epoch": 0.81, + "learning_rate": 3.7120888509184105e-08, + "loss": 1.2648, + "step": 41993 + }, + { + "epoch": 0.81, + "learning_rate": 3.711700516484796e-08, + "loss": 0.0003, + "step": 41994 + }, + { + "epoch": 0.81, + "learning_rate": 3.711312182051182e-08, + "loss": 0.002, + "step": 41995 + }, + { + "epoch": 0.81, + "learning_rate": 3.710923847617568e-08, + "loss": 0.0005, + "step": 41996 + }, + { + "epoch": 0.81, + "learning_rate": 3.710535513183954e-08, + "loss": 0.0003, + "step": 41997 + }, + { + "epoch": 0.81, + "learning_rate": 3.7101471787503396e-08, + "loss": 0.0004, + "step": 41998 + }, + { + "epoch": 0.81, + "learning_rate": 3.7097588443167254e-08, + "loss": 0.0004, + "step": 41999 + }, + { + "epoch": 0.81, + "learning_rate": 3.709370509883111e-08, + "loss": 0.0004, + "step": 42000 + }, + { + "epoch": 0.81, + "learning_rate": 3.708982175449497e-08, + "loss": 0.0003, + "step": 42001 + }, + { + "epoch": 0.81, + "learning_rate": 3.708593841015883e-08, + "loss": 0.0005, + "step": 42002 + }, + { + "epoch": 0.81, + "learning_rate": 3.708205506582269e-08, + "loss": 0.0004, + "step": 42003 + }, + { + "epoch": 0.81, + "learning_rate": 3.7078171721486545e-08, + "loss": 0.0004, + "step": 42004 + }, + { + "epoch": 0.81, + "learning_rate": 3.70742883771504e-08, + "loss": 0.5057, + "step": 42005 + }, + { + "epoch": 0.81, + "learning_rate": 3.7070405032814255e-08, + "loss": 0.0004, + "step": 42006 + }, + { + "epoch": 0.81, + "learning_rate": 3.7066521688478114e-08, + "loss": 0.0003, + "step": 42007 + }, + { + "epoch": 0.81, + "learning_rate": 3.706263834414197e-08, + "loss": 0.0004, + "step": 42008 + }, + { + "epoch": 0.81, + "learning_rate": 3.705875499980583e-08, + "loss": 0.0004, + "step": 42009 + }, + { + "epoch": 0.81, + "learning_rate": 3.705487165546969e-08, + "loss": 0.0004, + "step": 42010 + }, + { + "epoch": 0.81, + "learning_rate": 3.7050988311133547e-08, + "loss": 1.1999, + "step": 42011 + }, + { + "epoch": 0.81, + "learning_rate": 3.7047104966797405e-08, + "loss": 0.0005, + "step": 42012 + }, + { + "epoch": 0.81, + "learning_rate": 3.704322162246126e-08, + "loss": 0.0004, + "step": 42013 + }, + { + "epoch": 0.81, + "learning_rate": 3.703933827812512e-08, + "loss": 0.6238, + "step": 42014 + }, + { + "epoch": 0.82, + "learning_rate": 3.703545493378898e-08, + "loss": 0.0003, + "step": 42015 + }, + { + "epoch": 0.82, + "learning_rate": 3.703157158945284e-08, + "loss": 0.0009, + "step": 42016 + }, + { + "epoch": 0.82, + "learning_rate": 3.7027688245116696e-08, + "loss": 0.0004, + "step": 42017 + }, + { + "epoch": 0.82, + "learning_rate": 3.7023804900780554e-08, + "loss": 0.0004, + "step": 42018 + }, + { + "epoch": 0.82, + "learning_rate": 3.7019921556444406e-08, + "loss": 0.0004, + "step": 42019 + }, + { + "epoch": 0.82, + "learning_rate": 3.7016038212108264e-08, + "loss": 0.0007, + "step": 42020 + }, + { + "epoch": 0.82, + "learning_rate": 3.701215486777212e-08, + "loss": 0.0029, + "step": 42021 + }, + { + "epoch": 0.82, + "learning_rate": 3.700827152343598e-08, + "loss": 0.0004, + "step": 42022 + }, + { + "epoch": 0.82, + "learning_rate": 3.700438817909984e-08, + "loss": 0.0003, + "step": 42023 + }, + { + "epoch": 0.82, + "learning_rate": 3.70005048347637e-08, + "loss": 0.0047, + "step": 42024 + }, + { + "epoch": 0.82, + "learning_rate": 3.6996621490427555e-08, + "loss": 0.0023, + "step": 42025 + }, + { + "epoch": 0.82, + "learning_rate": 3.6992738146091414e-08, + "loss": 0.0003, + "step": 42026 + }, + { + "epoch": 0.82, + "learning_rate": 3.698885480175527e-08, + "loss": 0.0004, + "step": 42027 + }, + { + "epoch": 0.82, + "learning_rate": 3.698497145741913e-08, + "loss": 0.2337, + "step": 42028 + }, + { + "epoch": 0.82, + "learning_rate": 3.698108811308299e-08, + "loss": 0.0005, + "step": 42029 + }, + { + "epoch": 0.82, + "learning_rate": 3.6977204768746847e-08, + "loss": 0.0004, + "step": 42030 + }, + { + "epoch": 0.82, + "learning_rate": 3.6973321424410705e-08, + "loss": 0.0005, + "step": 42031 + }, + { + "epoch": 0.82, + "learning_rate": 3.696943808007456e-08, + "loss": 0.0004, + "step": 42032 + }, + { + "epoch": 0.82, + "learning_rate": 3.696555473573842e-08, + "loss": 0.0004, + "step": 42033 + }, + { + "epoch": 0.82, + "learning_rate": 3.696167139140227e-08, + "loss": 0.9311, + "step": 42034 + }, + { + "epoch": 0.82, + "learning_rate": 3.695778804706613e-08, + "loss": 0.0005, + "step": 42035 + }, + { + "epoch": 0.82, + "learning_rate": 3.695390470272999e-08, + "loss": 0.0004, + "step": 42036 + }, + { + "epoch": 0.82, + "learning_rate": 3.695002135839385e-08, + "loss": 0.0004, + "step": 42037 + }, + { + "epoch": 0.82, + "learning_rate": 3.6946138014057706e-08, + "loss": 1.075, + "step": 42038 + }, + { + "epoch": 0.82, + "learning_rate": 3.6942254669721564e-08, + "loss": 0.0005, + "step": 42039 + }, + { + "epoch": 0.82, + "learning_rate": 3.693837132538542e-08, + "loss": 0.0003, + "step": 42040 + }, + { + "epoch": 0.82, + "learning_rate": 3.693448798104928e-08, + "loss": 0.0009, + "step": 42041 + }, + { + "epoch": 0.82, + "learning_rate": 3.693060463671314e-08, + "loss": 0.0004, + "step": 42042 + }, + { + "epoch": 0.82, + "learning_rate": 3.6926721292377e-08, + "loss": 0.0004, + "step": 42043 + }, + { + "epoch": 0.82, + "learning_rate": 3.6922837948040855e-08, + "loss": 0.0018, + "step": 42044 + }, + { + "epoch": 0.82, + "learning_rate": 3.6918954603704714e-08, + "loss": 0.0003, + "step": 42045 + }, + { + "epoch": 0.82, + "learning_rate": 3.691507125936857e-08, + "loss": 0.0008, + "step": 42046 + }, + { + "epoch": 0.82, + "learning_rate": 3.6911187915032424e-08, + "loss": 0.5566, + "step": 42047 + }, + { + "epoch": 0.82, + "learning_rate": 3.690730457069628e-08, + "loss": 0.0003, + "step": 42048 + }, + { + "epoch": 0.82, + "learning_rate": 3.690342122636014e-08, + "loss": 0.0007, + "step": 42049 + }, + { + "epoch": 0.82, + "learning_rate": 3.6899537882024e-08, + "loss": 0.8755, + "step": 42050 + }, + { + "epoch": 0.82, + "learning_rate": 3.6895654537687857e-08, + "loss": 0.0007, + "step": 42051 + }, + { + "epoch": 0.82, + "learning_rate": 3.6891771193351715e-08, + "loss": 0.0006, + "step": 42052 + }, + { + "epoch": 0.82, + "learning_rate": 3.688788784901557e-08, + "loss": 0.0004, + "step": 42053 + }, + { + "epoch": 0.82, + "learning_rate": 3.6884004504679425e-08, + "loss": 0.0004, + "step": 42054 + }, + { + "epoch": 0.82, + "learning_rate": 3.688012116034328e-08, + "loss": 0.0004, + "step": 42055 + }, + { + "epoch": 0.82, + "learning_rate": 3.687623781600714e-08, + "loss": 0.0005, + "step": 42056 + }, + { + "epoch": 0.82, + "learning_rate": 3.6872354471671e-08, + "loss": 0.0007, + "step": 42057 + }, + { + "epoch": 0.82, + "learning_rate": 3.686847112733486e-08, + "loss": 0.0006, + "step": 42058 + }, + { + "epoch": 0.82, + "learning_rate": 3.6864587782998716e-08, + "loss": 0.0005, + "step": 42059 + }, + { + "epoch": 0.82, + "learning_rate": 3.6860704438662574e-08, + "loss": 0.0004, + "step": 42060 + }, + { + "epoch": 0.82, + "learning_rate": 3.685682109432643e-08, + "loss": 1.051, + "step": 42061 + }, + { + "epoch": 0.82, + "learning_rate": 3.685293774999029e-08, + "loss": 0.0004, + "step": 42062 + }, + { + "epoch": 0.82, + "learning_rate": 3.684905440565414e-08, + "loss": 0.0006, + "step": 42063 + }, + { + "epoch": 0.82, + "learning_rate": 3.6845171061318e-08, + "loss": 1.388, + "step": 42064 + }, + { + "epoch": 0.82, + "learning_rate": 3.684128771698186e-08, + "loss": 0.0005, + "step": 42065 + }, + { + "epoch": 0.82, + "learning_rate": 3.683740437264572e-08, + "loss": 0.0004, + "step": 42066 + }, + { + "epoch": 0.82, + "learning_rate": 3.6833521028309575e-08, + "loss": 0.0009, + "step": 42067 + }, + { + "epoch": 0.82, + "learning_rate": 3.6829637683973433e-08, + "loss": 0.0003, + "step": 42068 + }, + { + "epoch": 0.82, + "learning_rate": 3.682575433963729e-08, + "loss": 0.0003, + "step": 42069 + }, + { + "epoch": 0.82, + "learning_rate": 3.682187099530115e-08, + "loss": 1.0367, + "step": 42070 + }, + { + "epoch": 0.82, + "learning_rate": 3.681798765096501e-08, + "loss": 0.0055, + "step": 42071 + }, + { + "epoch": 0.82, + "learning_rate": 3.6814104306628866e-08, + "loss": 0.0003, + "step": 42072 + }, + { + "epoch": 0.82, + "learning_rate": 3.6810220962292725e-08, + "loss": 0.0003, + "step": 42073 + }, + { + "epoch": 0.82, + "learning_rate": 3.680633761795658e-08, + "loss": 0.0034, + "step": 42074 + }, + { + "epoch": 0.82, + "learning_rate": 3.680245427362044e-08, + "loss": 0.0003, + "step": 42075 + }, + { + "epoch": 0.82, + "learning_rate": 3.67985709292843e-08, + "loss": 0.0004, + "step": 42076 + }, + { + "epoch": 0.82, + "learning_rate": 3.679468758494815e-08, + "loss": 0.001, + "step": 42077 + }, + { + "epoch": 0.82, + "learning_rate": 3.679080424061201e-08, + "loss": 0.0004, + "step": 42078 + }, + { + "epoch": 0.82, + "learning_rate": 3.678692089627587e-08, + "loss": 0.0005, + "step": 42079 + }, + { + "epoch": 0.82, + "learning_rate": 3.6783037551939726e-08, + "loss": 0.0282, + "step": 42080 + }, + { + "epoch": 0.82, + "learning_rate": 3.6779154207603584e-08, + "loss": 0.4441, + "step": 42081 + }, + { + "epoch": 0.82, + "learning_rate": 3.677527086326744e-08, + "loss": 0.0004, + "step": 42082 + }, + { + "epoch": 0.82, + "learning_rate": 3.67713875189313e-08, + "loss": 0.0406, + "step": 42083 + }, + { + "epoch": 0.82, + "learning_rate": 3.676750417459516e-08, + "loss": 0.0004, + "step": 42084 + }, + { + "epoch": 0.82, + "learning_rate": 3.676362083025902e-08, + "loss": 0.0004, + "step": 42085 + }, + { + "epoch": 0.82, + "learning_rate": 3.6759737485922875e-08, + "loss": 0.0006, + "step": 42086 + }, + { + "epoch": 0.82, + "learning_rate": 3.6755854141586733e-08, + "loss": 0.0004, + "step": 42087 + }, + { + "epoch": 0.82, + "learning_rate": 3.675197079725059e-08, + "loss": 0.0005, + "step": 42088 + }, + { + "epoch": 0.82, + "learning_rate": 3.674808745291445e-08, + "loss": 0.0005, + "step": 42089 + }, + { + "epoch": 0.82, + "learning_rate": 3.674420410857831e-08, + "loss": 0.0003, + "step": 42090 + }, + { + "epoch": 0.82, + "learning_rate": 3.6740320764242166e-08, + "loss": 0.0006, + "step": 42091 + }, + { + "epoch": 0.82, + "learning_rate": 3.673643741990602e-08, + "loss": 0.0006, + "step": 42092 + }, + { + "epoch": 0.82, + "learning_rate": 3.6732554075569876e-08, + "loss": 0.0005, + "step": 42093 + }, + { + "epoch": 0.82, + "learning_rate": 3.6728670731233735e-08, + "loss": 0.0004, + "step": 42094 + }, + { + "epoch": 0.82, + "learning_rate": 3.672478738689759e-08, + "loss": 0.0004, + "step": 42095 + }, + { + "epoch": 0.82, + "learning_rate": 3.672090404256145e-08, + "loss": 0.0003, + "step": 42096 + }, + { + "epoch": 0.82, + "learning_rate": 3.671702069822531e-08, + "loss": 0.0005, + "step": 42097 + }, + { + "epoch": 0.82, + "learning_rate": 3.671313735388917e-08, + "loss": 0.0003, + "step": 42098 + }, + { + "epoch": 0.82, + "learning_rate": 3.6709254009553026e-08, + "loss": 0.0004, + "step": 42099 + }, + { + "epoch": 0.82, + "learning_rate": 3.6705370665216884e-08, + "loss": 0.0003, + "step": 42100 + }, + { + "epoch": 0.82, + "learning_rate": 3.670148732088074e-08, + "loss": 0.01, + "step": 42101 + }, + { + "epoch": 0.82, + "learning_rate": 3.66976039765446e-08, + "loss": 0.0008, + "step": 42102 + }, + { + "epoch": 0.82, + "learning_rate": 3.669372063220846e-08, + "loss": 0.0004, + "step": 42103 + }, + { + "epoch": 0.82, + "learning_rate": 3.668983728787232e-08, + "loss": 0.0003, + "step": 42104 + }, + { + "epoch": 0.82, + "learning_rate": 3.6685953943536175e-08, + "loss": 0.0038, + "step": 42105 + }, + { + "epoch": 0.82, + "learning_rate": 3.668207059920003e-08, + "loss": 0.0009, + "step": 42106 + }, + { + "epoch": 0.82, + "learning_rate": 3.6678187254863885e-08, + "loss": 0.0007, + "step": 42107 + }, + { + "epoch": 0.82, + "learning_rate": 3.6674303910527743e-08, + "loss": 0.0003, + "step": 42108 + }, + { + "epoch": 0.82, + "learning_rate": 3.66704205661916e-08, + "loss": 0.0005, + "step": 42109 + }, + { + "epoch": 0.82, + "learning_rate": 3.666653722185546e-08, + "loss": 0.0006, + "step": 42110 + }, + { + "epoch": 0.82, + "learning_rate": 3.666265387751932e-08, + "loss": 0.0007, + "step": 42111 + }, + { + "epoch": 0.82, + "learning_rate": 3.6658770533183176e-08, + "loss": 0.0003, + "step": 42112 + }, + { + "epoch": 0.82, + "learning_rate": 3.6654887188847035e-08, + "loss": 0.0003, + "step": 42113 + }, + { + "epoch": 0.82, + "learning_rate": 3.665100384451089e-08, + "loss": 0.0003, + "step": 42114 + }, + { + "epoch": 0.82, + "learning_rate": 3.664712050017475e-08, + "loss": 1.2493, + "step": 42115 + }, + { + "epoch": 0.82, + "learning_rate": 3.664323715583861e-08, + "loss": 0.0007, + "step": 42116 + }, + { + "epoch": 0.82, + "learning_rate": 3.663935381150247e-08, + "loss": 1.222, + "step": 42117 + }, + { + "epoch": 0.82, + "learning_rate": 3.6635470467166326e-08, + "loss": 0.0003, + "step": 42118 + }, + { + "epoch": 0.82, + "learning_rate": 3.6631587122830184e-08, + "loss": 0.0003, + "step": 42119 + }, + { + "epoch": 0.82, + "learning_rate": 3.662770377849404e-08, + "loss": 0.0004, + "step": 42120 + }, + { + "epoch": 0.82, + "learning_rate": 3.6623820434157894e-08, + "loss": 0.4235, + "step": 42121 + }, + { + "epoch": 0.82, + "learning_rate": 3.661993708982175e-08, + "loss": 0.0008, + "step": 42122 + }, + { + "epoch": 0.82, + "learning_rate": 3.661605374548561e-08, + "loss": 0.0004, + "step": 42123 + }, + { + "epoch": 0.82, + "learning_rate": 3.661217040114947e-08, + "loss": 0.0005, + "step": 42124 + }, + { + "epoch": 0.82, + "learning_rate": 3.660828705681333e-08, + "loss": 0.0004, + "step": 42125 + }, + { + "epoch": 0.82, + "learning_rate": 3.6604403712477185e-08, + "loss": 0.0006, + "step": 42126 + }, + { + "epoch": 0.82, + "learning_rate": 3.6600520368141043e-08, + "loss": 0.0383, + "step": 42127 + }, + { + "epoch": 0.82, + "learning_rate": 3.65966370238049e-08, + "loss": 0.0005, + "step": 42128 + }, + { + "epoch": 0.82, + "learning_rate": 3.659275367946876e-08, + "loss": 0.0004, + "step": 42129 + }, + { + "epoch": 0.82, + "learning_rate": 3.658887033513262e-08, + "loss": 0.0003, + "step": 42130 + }, + { + "epoch": 0.82, + "learning_rate": 3.6584986990796476e-08, + "loss": 0.0006, + "step": 42131 + }, + { + "epoch": 0.82, + "learning_rate": 3.6581103646460335e-08, + "loss": 0.0006, + "step": 42132 + }, + { + "epoch": 0.82, + "learning_rate": 3.657722030212419e-08, + "loss": 0.0003, + "step": 42133 + }, + { + "epoch": 0.82, + "learning_rate": 3.657333695778805e-08, + "loss": 0.0017, + "step": 42134 + }, + { + "epoch": 0.82, + "learning_rate": 3.65694536134519e-08, + "loss": 0.0003, + "step": 42135 + }, + { + "epoch": 0.82, + "learning_rate": 3.656557026911576e-08, + "loss": 0.0005, + "step": 42136 + }, + { + "epoch": 0.82, + "learning_rate": 3.656168692477962e-08, + "loss": 0.0004, + "step": 42137 + }, + { + "epoch": 0.82, + "learning_rate": 3.655780358044348e-08, + "loss": 0.0065, + "step": 42138 + }, + { + "epoch": 0.82, + "learning_rate": 3.6553920236107336e-08, + "loss": 0.0004, + "step": 42139 + }, + { + "epoch": 0.82, + "learning_rate": 3.6550036891771194e-08, + "loss": 0.0003, + "step": 42140 + }, + { + "epoch": 0.82, + "learning_rate": 3.654615354743505e-08, + "loss": 0.0005, + "step": 42141 + }, + { + "epoch": 0.82, + "learning_rate": 3.654227020309891e-08, + "loss": 0.0004, + "step": 42142 + }, + { + "epoch": 0.82, + "learning_rate": 3.653838685876276e-08, + "loss": 0.0004, + "step": 42143 + }, + { + "epoch": 0.82, + "learning_rate": 3.653450351442662e-08, + "loss": 0.7449, + "step": 42144 + }, + { + "epoch": 0.82, + "learning_rate": 3.653062017009048e-08, + "loss": 0.0006, + "step": 42145 + }, + { + "epoch": 0.82, + "learning_rate": 3.652673682575434e-08, + "loss": 0.0004, + "step": 42146 + }, + { + "epoch": 0.82, + "learning_rate": 3.6522853481418195e-08, + "loss": 0.0004, + "step": 42147 + }, + { + "epoch": 0.82, + "learning_rate": 3.651897013708205e-08, + "loss": 0.0011, + "step": 42148 + }, + { + "epoch": 0.82, + "learning_rate": 3.651508679274591e-08, + "loss": 0.0004, + "step": 42149 + }, + { + "epoch": 0.82, + "learning_rate": 3.651120344840976e-08, + "loss": 0.0019, + "step": 42150 + }, + { + "epoch": 0.82, + "learning_rate": 3.650732010407362e-08, + "loss": 0.0006, + "step": 42151 + }, + { + "epoch": 0.82, + "learning_rate": 3.650343675973748e-08, + "loss": 0.0003, + "step": 42152 + }, + { + "epoch": 0.82, + "learning_rate": 3.649955341540134e-08, + "loss": 0.0005, + "step": 42153 + }, + { + "epoch": 0.82, + "learning_rate": 3.6495670071065196e-08, + "loss": 0.0004, + "step": 42154 + }, + { + "epoch": 0.82, + "learning_rate": 3.6491786726729054e-08, + "loss": 0.0003, + "step": 42155 + }, + { + "epoch": 0.82, + "learning_rate": 3.648790338239291e-08, + "loss": 0.0007, + "step": 42156 + }, + { + "epoch": 0.82, + "learning_rate": 3.648402003805677e-08, + "loss": 0.0005, + "step": 42157 + }, + { + "epoch": 0.82, + "learning_rate": 3.648013669372063e-08, + "loss": 0.0005, + "step": 42158 + }, + { + "epoch": 0.82, + "learning_rate": 3.647625334938449e-08, + "loss": 0.0006, + "step": 42159 + }, + { + "epoch": 0.82, + "learning_rate": 3.6472370005048346e-08, + "loss": 0.0005, + "step": 42160 + }, + { + "epoch": 0.82, + "learning_rate": 3.6468486660712204e-08, + "loss": 0.0004, + "step": 42161 + }, + { + "epoch": 0.82, + "learning_rate": 3.646460331637606e-08, + "loss": 0.7031, + "step": 42162 + }, + { + "epoch": 0.82, + "learning_rate": 3.646071997203992e-08, + "loss": 0.0004, + "step": 42163 + }, + { + "epoch": 0.82, + "learning_rate": 3.645683662770377e-08, + "loss": 0.0004, + "step": 42164 + }, + { + "epoch": 0.82, + "learning_rate": 3.645295328336763e-08, + "loss": 0.0004, + "step": 42165 + }, + { + "epoch": 0.82, + "learning_rate": 3.644906993903149e-08, + "loss": 0.0003, + "step": 42166 + }, + { + "epoch": 0.82, + "learning_rate": 3.6445186594695347e-08, + "loss": 0.5447, + "step": 42167 + }, + { + "epoch": 0.82, + "learning_rate": 3.6441303250359205e-08, + "loss": 0.0007, + "step": 42168 + }, + { + "epoch": 0.82, + "learning_rate": 3.643741990602306e-08, + "loss": 0.0003, + "step": 42169 + }, + { + "epoch": 0.82, + "learning_rate": 3.643353656168692e-08, + "loss": 0.0004, + "step": 42170 + }, + { + "epoch": 0.82, + "learning_rate": 3.642965321735078e-08, + "loss": 0.0003, + "step": 42171 + }, + { + "epoch": 0.82, + "learning_rate": 3.642576987301464e-08, + "loss": 0.0005, + "step": 42172 + }, + { + "epoch": 0.82, + "learning_rate": 3.6421886528678496e-08, + "loss": 0.0005, + "step": 42173 + }, + { + "epoch": 0.82, + "learning_rate": 3.6418003184342354e-08, + "loss": 0.0005, + "step": 42174 + }, + { + "epoch": 0.82, + "learning_rate": 3.641411984000621e-08, + "loss": 0.0004, + "step": 42175 + }, + { + "epoch": 0.82, + "learning_rate": 3.641023649567007e-08, + "loss": 0.0419, + "step": 42176 + }, + { + "epoch": 0.82, + "learning_rate": 3.640635315133393e-08, + "loss": 0.0004, + "step": 42177 + }, + { + "epoch": 0.82, + "learning_rate": 3.640246980699779e-08, + "loss": 0.0006, + "step": 42178 + }, + { + "epoch": 0.82, + "learning_rate": 3.639858646266164e-08, + "loss": 0.0005, + "step": 42179 + }, + { + "epoch": 0.82, + "learning_rate": 3.63947031183255e-08, + "loss": 0.0004, + "step": 42180 + }, + { + "epoch": 0.82, + "learning_rate": 3.6390819773989355e-08, + "loss": 0.0006, + "step": 42181 + }, + { + "epoch": 0.82, + "learning_rate": 3.6386936429653214e-08, + "loss": 0.0004, + "step": 42182 + }, + { + "epoch": 0.82, + "learning_rate": 3.638305308531707e-08, + "loss": 0.0004, + "step": 42183 + }, + { + "epoch": 0.82, + "learning_rate": 3.637916974098093e-08, + "loss": 0.0003, + "step": 42184 + }, + { + "epoch": 0.82, + "learning_rate": 3.637528639664479e-08, + "loss": 0.0003, + "step": 42185 + }, + { + "epoch": 0.82, + "learning_rate": 3.637140305230865e-08, + "loss": 0.0005, + "step": 42186 + }, + { + "epoch": 0.82, + "learning_rate": 3.6367519707972505e-08, + "loss": 0.0004, + "step": 42187 + }, + { + "epoch": 0.82, + "learning_rate": 3.636363636363636e-08, + "loss": 0.0005, + "step": 42188 + }, + { + "epoch": 0.82, + "learning_rate": 3.635975301930022e-08, + "loss": 0.0003, + "step": 42189 + }, + { + "epoch": 0.82, + "learning_rate": 3.635586967496408e-08, + "loss": 0.0103, + "step": 42190 + }, + { + "epoch": 0.82, + "learning_rate": 3.635198633062794e-08, + "loss": 0.0003, + "step": 42191 + }, + { + "epoch": 0.82, + "learning_rate": 3.6348102986291796e-08, + "loss": 0.0005, + "step": 42192 + }, + { + "epoch": 0.82, + "learning_rate": 3.634421964195565e-08, + "loss": 0.0004, + "step": 42193 + }, + { + "epoch": 0.82, + "learning_rate": 3.6340336297619506e-08, + "loss": 0.0003, + "step": 42194 + }, + { + "epoch": 0.82, + "learning_rate": 3.6336452953283364e-08, + "loss": 0.0004, + "step": 42195 + }, + { + "epoch": 0.82, + "learning_rate": 3.633256960894722e-08, + "loss": 0.0007, + "step": 42196 + }, + { + "epoch": 0.82, + "learning_rate": 3.632868626461108e-08, + "loss": 0.0033, + "step": 42197 + }, + { + "epoch": 0.82, + "learning_rate": 3.632480292027494e-08, + "loss": 0.0003, + "step": 42198 + }, + { + "epoch": 0.82, + "learning_rate": 3.63209195759388e-08, + "loss": 0.0005, + "step": 42199 + }, + { + "epoch": 0.82, + "learning_rate": 3.6317036231602656e-08, + "loss": 0.0003, + "step": 42200 + }, + { + "epoch": 0.82, + "learning_rate": 3.6313152887266514e-08, + "loss": 0.0005, + "step": 42201 + }, + { + "epoch": 0.82, + "learning_rate": 3.630926954293037e-08, + "loss": 1.0918, + "step": 42202 + }, + { + "epoch": 0.82, + "learning_rate": 3.630538619859423e-08, + "loss": 0.0002, + "step": 42203 + }, + { + "epoch": 0.82, + "learning_rate": 3.630150285425809e-08, + "loss": 0.0006, + "step": 42204 + }, + { + "epoch": 0.82, + "learning_rate": 3.629761950992195e-08, + "loss": 0.0007, + "step": 42205 + }, + { + "epoch": 0.82, + "learning_rate": 3.6293736165585805e-08, + "loss": 0.0005, + "step": 42206 + }, + { + "epoch": 0.82, + "learning_rate": 3.628985282124966e-08, + "loss": 0.0006, + "step": 42207 + }, + { + "epoch": 0.82, + "learning_rate": 3.6285969476913515e-08, + "loss": 0.0004, + "step": 42208 + }, + { + "epoch": 0.82, + "learning_rate": 3.628208613257737e-08, + "loss": 0.0005, + "step": 42209 + }, + { + "epoch": 0.82, + "learning_rate": 3.627820278824123e-08, + "loss": 0.0007, + "step": 42210 + }, + { + "epoch": 0.82, + "learning_rate": 3.627431944390509e-08, + "loss": 0.0004, + "step": 42211 + }, + { + "epoch": 0.82, + "learning_rate": 3.627043609956895e-08, + "loss": 0.0004, + "step": 42212 + }, + { + "epoch": 0.82, + "learning_rate": 3.6266552755232806e-08, + "loss": 0.0004, + "step": 42213 + }, + { + "epoch": 0.82, + "learning_rate": 3.6262669410896664e-08, + "loss": 0.0004, + "step": 42214 + }, + { + "epoch": 0.82, + "learning_rate": 3.625878606656052e-08, + "loss": 0.0005, + "step": 42215 + }, + { + "epoch": 0.82, + "learning_rate": 3.625490272222438e-08, + "loss": 1.0498, + "step": 42216 + }, + { + "epoch": 0.82, + "learning_rate": 3.625101937788824e-08, + "loss": 0.0004, + "step": 42217 + }, + { + "epoch": 0.82, + "learning_rate": 3.62471360335521e-08, + "loss": 0.0008, + "step": 42218 + }, + { + "epoch": 0.82, + "learning_rate": 3.6243252689215956e-08, + "loss": 0.0006, + "step": 42219 + }, + { + "epoch": 0.82, + "learning_rate": 3.6239369344879814e-08, + "loss": 0.0004, + "step": 42220 + }, + { + "epoch": 0.82, + "learning_rate": 3.623548600054367e-08, + "loss": 0.0004, + "step": 42221 + }, + { + "epoch": 0.82, + "learning_rate": 3.6231602656207524e-08, + "loss": 0.0003, + "step": 42222 + }, + { + "epoch": 0.82, + "learning_rate": 3.622771931187138e-08, + "loss": 0.0005, + "step": 42223 + }, + { + "epoch": 0.82, + "learning_rate": 3.622383596753524e-08, + "loss": 0.0004, + "step": 42224 + }, + { + "epoch": 0.82, + "learning_rate": 3.62199526231991e-08, + "loss": 0.0003, + "step": 42225 + }, + { + "epoch": 0.82, + "learning_rate": 3.6216069278862957e-08, + "loss": 0.0004, + "step": 42226 + }, + { + "epoch": 0.82, + "learning_rate": 3.6212185934526815e-08, + "loss": 0.0378, + "step": 42227 + }, + { + "epoch": 0.82, + "learning_rate": 3.620830259019067e-08, + "loss": 0.0004, + "step": 42228 + }, + { + "epoch": 0.82, + "learning_rate": 3.620441924585453e-08, + "loss": 0.0003, + "step": 42229 + }, + { + "epoch": 0.82, + "learning_rate": 3.620053590151839e-08, + "loss": 0.0005, + "step": 42230 + }, + { + "epoch": 0.82, + "learning_rate": 3.619665255718224e-08, + "loss": 0.0006, + "step": 42231 + }, + { + "epoch": 0.82, + "learning_rate": 3.61927692128461e-08, + "loss": 0.0003, + "step": 42232 + }, + { + "epoch": 0.82, + "learning_rate": 3.618888586850996e-08, + "loss": 0.0004, + "step": 42233 + }, + { + "epoch": 0.82, + "learning_rate": 3.6185002524173816e-08, + "loss": 0.0005, + "step": 42234 + }, + { + "epoch": 0.82, + "learning_rate": 3.6181119179837674e-08, + "loss": 0.0003, + "step": 42235 + }, + { + "epoch": 0.82, + "learning_rate": 3.617723583550153e-08, + "loss": 0.0005, + "step": 42236 + }, + { + "epoch": 0.82, + "learning_rate": 3.617335249116539e-08, + "loss": 0.0004, + "step": 42237 + }, + { + "epoch": 0.82, + "learning_rate": 3.616946914682925e-08, + "loss": 0.4249, + "step": 42238 + }, + { + "epoch": 0.82, + "learning_rate": 3.61655858024931e-08, + "loss": 0.0004, + "step": 42239 + }, + { + "epoch": 0.82, + "learning_rate": 3.616170245815696e-08, + "loss": 0.0043, + "step": 42240 + }, + { + "epoch": 0.82, + "learning_rate": 3.615781911382082e-08, + "loss": 0.0002, + "step": 42241 + }, + { + "epoch": 0.82, + "learning_rate": 3.6153935769484675e-08, + "loss": 0.0004, + "step": 42242 + }, + { + "epoch": 0.82, + "learning_rate": 3.6150052425148534e-08, + "loss": 0.0004, + "step": 42243 + }, + { + "epoch": 0.82, + "learning_rate": 3.614616908081239e-08, + "loss": 0.0009, + "step": 42244 + }, + { + "epoch": 0.82, + "learning_rate": 3.614228573647625e-08, + "loss": 0.0004, + "step": 42245 + }, + { + "epoch": 0.82, + "learning_rate": 3.613840239214011e-08, + "loss": 0.0004, + "step": 42246 + }, + { + "epoch": 0.82, + "learning_rate": 3.6134519047803967e-08, + "loss": 0.0006, + "step": 42247 + }, + { + "epoch": 0.82, + "learning_rate": 3.6130635703467825e-08, + "loss": 0.0167, + "step": 42248 + }, + { + "epoch": 0.82, + "learning_rate": 3.612675235913168e-08, + "loss": 0.0006, + "step": 42249 + }, + { + "epoch": 0.82, + "learning_rate": 3.612286901479554e-08, + "loss": 0.0004, + "step": 42250 + }, + { + "epoch": 0.82, + "learning_rate": 3.611898567045939e-08, + "loss": 0.0004, + "step": 42251 + }, + { + "epoch": 0.82, + "learning_rate": 3.611510232612325e-08, + "loss": 0.0007, + "step": 42252 + }, + { + "epoch": 0.82, + "learning_rate": 3.611121898178711e-08, + "loss": 0.0004, + "step": 42253 + }, + { + "epoch": 0.82, + "learning_rate": 3.610733563745097e-08, + "loss": 0.0003, + "step": 42254 + }, + { + "epoch": 0.82, + "learning_rate": 3.6103452293114826e-08, + "loss": 0.0004, + "step": 42255 + }, + { + "epoch": 0.82, + "learning_rate": 3.6099568948778684e-08, + "loss": 0.0003, + "step": 42256 + }, + { + "epoch": 0.82, + "learning_rate": 3.609568560444254e-08, + "loss": 0.0004, + "step": 42257 + }, + { + "epoch": 0.82, + "learning_rate": 3.60918022601064e-08, + "loss": 0.0006, + "step": 42258 + }, + { + "epoch": 0.82, + "learning_rate": 3.608791891577026e-08, + "loss": 0.0004, + "step": 42259 + }, + { + "epoch": 0.82, + "learning_rate": 3.608403557143412e-08, + "loss": 0.0003, + "step": 42260 + }, + { + "epoch": 0.82, + "learning_rate": 3.6080152227097975e-08, + "loss": 0.001, + "step": 42261 + }, + { + "epoch": 0.82, + "learning_rate": 3.6076268882761834e-08, + "loss": 0.0004, + "step": 42262 + }, + { + "epoch": 0.82, + "learning_rate": 3.607238553842569e-08, + "loss": 0.005, + "step": 42263 + }, + { + "epoch": 0.82, + "learning_rate": 3.606850219408955e-08, + "loss": 0.0004, + "step": 42264 + }, + { + "epoch": 0.82, + "learning_rate": 3.606461884975341e-08, + "loss": 0.0003, + "step": 42265 + }, + { + "epoch": 0.82, + "learning_rate": 3.606073550541726e-08, + "loss": 0.0012, + "step": 42266 + }, + { + "epoch": 0.82, + "learning_rate": 3.605685216108112e-08, + "loss": 0.001, + "step": 42267 + }, + { + "epoch": 0.82, + "learning_rate": 3.6052968816744976e-08, + "loss": 0.0005, + "step": 42268 + }, + { + "epoch": 0.82, + "learning_rate": 3.6049085472408835e-08, + "loss": 0.0004, + "step": 42269 + }, + { + "epoch": 0.82, + "learning_rate": 3.604520212807269e-08, + "loss": 0.0005, + "step": 42270 + }, + { + "epoch": 0.82, + "learning_rate": 3.604131878373655e-08, + "loss": 0.0005, + "step": 42271 + }, + { + "epoch": 0.82, + "learning_rate": 3.603743543940041e-08, + "loss": 0.4951, + "step": 42272 + }, + { + "epoch": 0.82, + "learning_rate": 3.603355209506427e-08, + "loss": 0.0008, + "step": 42273 + }, + { + "epoch": 0.82, + "learning_rate": 3.6029668750728126e-08, + "loss": 0.0003, + "step": 42274 + }, + { + "epoch": 0.82, + "learning_rate": 3.6025785406391984e-08, + "loss": 0.0003, + "step": 42275 + }, + { + "epoch": 0.82, + "learning_rate": 3.602190206205584e-08, + "loss": 0.0004, + "step": 42276 + }, + { + "epoch": 0.82, + "learning_rate": 3.60180187177197e-08, + "loss": 0.0003, + "step": 42277 + }, + { + "epoch": 0.82, + "learning_rate": 3.601413537338356e-08, + "loss": 0.0004, + "step": 42278 + }, + { + "epoch": 0.82, + "learning_rate": 3.601025202904742e-08, + "loss": 0.0004, + "step": 42279 + }, + { + "epoch": 0.82, + "learning_rate": 3.600636868471127e-08, + "loss": 0.0007, + "step": 42280 + }, + { + "epoch": 0.82, + "learning_rate": 3.600248534037513e-08, + "loss": 0.0004, + "step": 42281 + }, + { + "epoch": 0.82, + "learning_rate": 3.5998601996038985e-08, + "loss": 0.0006, + "step": 42282 + }, + { + "epoch": 0.82, + "learning_rate": 3.5994718651702843e-08, + "loss": 0.2954, + "step": 42283 + }, + { + "epoch": 0.82, + "learning_rate": 3.59908353073667e-08, + "loss": 0.0007, + "step": 42284 + }, + { + "epoch": 0.82, + "learning_rate": 3.598695196303056e-08, + "loss": 0.0006, + "step": 42285 + }, + { + "epoch": 0.82, + "learning_rate": 3.598306861869442e-08, + "loss": 0.0004, + "step": 42286 + }, + { + "epoch": 0.82, + "learning_rate": 3.5979185274358276e-08, + "loss": 0.0173, + "step": 42287 + }, + { + "epoch": 0.82, + "learning_rate": 3.5975301930022135e-08, + "loss": 0.0005, + "step": 42288 + }, + { + "epoch": 0.82, + "learning_rate": 3.597141858568599e-08, + "loss": 0.0008, + "step": 42289 + }, + { + "epoch": 0.82, + "learning_rate": 3.596753524134985e-08, + "loss": 0.0004, + "step": 42290 + }, + { + "epoch": 0.82, + "learning_rate": 3.596365189701371e-08, + "loss": 0.0004, + "step": 42291 + }, + { + "epoch": 0.82, + "learning_rate": 3.595976855267757e-08, + "loss": 0.0005, + "step": 42292 + }, + { + "epoch": 0.82, + "learning_rate": 3.5955885208341426e-08, + "loss": 0.0018, + "step": 42293 + }, + { + "epoch": 0.82, + "learning_rate": 3.5952001864005284e-08, + "loss": 0.0004, + "step": 42294 + }, + { + "epoch": 0.82, + "learning_rate": 3.5948118519669136e-08, + "loss": 0.0005, + "step": 42295 + }, + { + "epoch": 0.82, + "learning_rate": 3.5944235175332994e-08, + "loss": 0.0003, + "step": 42296 + }, + { + "epoch": 0.82, + "learning_rate": 3.594035183099685e-08, + "loss": 0.6072, + "step": 42297 + }, + { + "epoch": 0.82, + "learning_rate": 3.593646848666071e-08, + "loss": 0.0003, + "step": 42298 + }, + { + "epoch": 0.82, + "learning_rate": 3.593258514232457e-08, + "loss": 0.0003, + "step": 42299 + }, + { + "epoch": 0.82, + "learning_rate": 3.592870179798843e-08, + "loss": 0.0005, + "step": 42300 + }, + { + "epoch": 0.82, + "learning_rate": 3.5924818453652285e-08, + "loss": 0.0006, + "step": 42301 + }, + { + "epoch": 0.82, + "learning_rate": 3.5920935109316143e-08, + "loss": 0.0004, + "step": 42302 + }, + { + "epoch": 0.82, + "learning_rate": 3.591705176498e-08, + "loss": 0.0004, + "step": 42303 + }, + { + "epoch": 0.82, + "learning_rate": 3.591316842064386e-08, + "loss": 0.0003, + "step": 42304 + }, + { + "epoch": 0.82, + "learning_rate": 3.590928507630772e-08, + "loss": 0.0004, + "step": 42305 + }, + { + "epoch": 0.82, + "learning_rate": 3.5905401731971576e-08, + "loss": 0.0004, + "step": 42306 + }, + { + "epoch": 0.82, + "learning_rate": 3.5901518387635435e-08, + "loss": 0.0007, + "step": 42307 + }, + { + "epoch": 0.82, + "learning_rate": 3.589763504329929e-08, + "loss": 0.0004, + "step": 42308 + }, + { + "epoch": 0.82, + "learning_rate": 3.5893751698963145e-08, + "loss": 0.0011, + "step": 42309 + }, + { + "epoch": 0.82, + "learning_rate": 3.5889868354627e-08, + "loss": 0.5313, + "step": 42310 + }, + { + "epoch": 0.82, + "learning_rate": 3.588598501029086e-08, + "loss": 0.0004, + "step": 42311 + }, + { + "epoch": 0.82, + "learning_rate": 3.588210166595472e-08, + "loss": 0.0008, + "step": 42312 + }, + { + "epoch": 0.82, + "learning_rate": 3.587821832161858e-08, + "loss": 0.0005, + "step": 42313 + }, + { + "epoch": 0.82, + "learning_rate": 3.5874334977282436e-08, + "loss": 0.0006, + "step": 42314 + }, + { + "epoch": 0.82, + "learning_rate": 3.5870451632946294e-08, + "loss": 0.0008, + "step": 42315 + }, + { + "epoch": 0.82, + "learning_rate": 3.586656828861015e-08, + "loss": 0.1194, + "step": 42316 + }, + { + "epoch": 0.82, + "learning_rate": 3.586268494427401e-08, + "loss": 0.0005, + "step": 42317 + }, + { + "epoch": 0.82, + "learning_rate": 3.585880159993787e-08, + "loss": 0.001, + "step": 42318 + }, + { + "epoch": 0.82, + "learning_rate": 3.585491825560173e-08, + "loss": 0.0005, + "step": 42319 + }, + { + "epoch": 0.82, + "learning_rate": 3.585103491126558e-08, + "loss": 0.0004, + "step": 42320 + }, + { + "epoch": 0.82, + "learning_rate": 3.584715156692944e-08, + "loss": 0.0009, + "step": 42321 + }, + { + "epoch": 0.82, + "learning_rate": 3.5843268222593295e-08, + "loss": 0.0005, + "step": 42322 + }, + { + "epoch": 0.82, + "learning_rate": 3.5839384878257153e-08, + "loss": 0.0003, + "step": 42323 + }, + { + "epoch": 0.82, + "learning_rate": 3.583550153392101e-08, + "loss": 0.1998, + "step": 42324 + }, + { + "epoch": 0.82, + "learning_rate": 3.583161818958487e-08, + "loss": 0.0004, + "step": 42325 + }, + { + "epoch": 0.82, + "learning_rate": 3.582773484524873e-08, + "loss": 0.0005, + "step": 42326 + }, + { + "epoch": 0.82, + "learning_rate": 3.582385150091258e-08, + "loss": 0.0005, + "step": 42327 + }, + { + "epoch": 0.82, + "learning_rate": 3.581996815657644e-08, + "loss": 0.0204, + "step": 42328 + }, + { + "epoch": 0.82, + "learning_rate": 3.5816084812240296e-08, + "loss": 0.527, + "step": 42329 + }, + { + "epoch": 0.82, + "learning_rate": 3.5812201467904154e-08, + "loss": 0.0004, + "step": 42330 + }, + { + "epoch": 0.82, + "learning_rate": 3.580831812356801e-08, + "loss": 0.0003, + "step": 42331 + }, + { + "epoch": 0.82, + "learning_rate": 3.580443477923187e-08, + "loss": 0.0004, + "step": 42332 + }, + { + "epoch": 0.82, + "learning_rate": 3.580055143489573e-08, + "loss": 0.0006, + "step": 42333 + }, + { + "epoch": 0.82, + "learning_rate": 3.579666809055959e-08, + "loss": 0.0004, + "step": 42334 + }, + { + "epoch": 0.82, + "learning_rate": 3.5792784746223446e-08, + "loss": 0.0005, + "step": 42335 + }, + { + "epoch": 0.82, + "learning_rate": 3.5788901401887304e-08, + "loss": 0.0005, + "step": 42336 + }, + { + "epoch": 0.82, + "learning_rate": 3.578501805755116e-08, + "loss": 0.0004, + "step": 42337 + }, + { + "epoch": 0.82, + "learning_rate": 3.5781134713215014e-08, + "loss": 0.0004, + "step": 42338 + }, + { + "epoch": 0.82, + "learning_rate": 3.577725136887887e-08, + "loss": 0.0004, + "step": 42339 + }, + { + "epoch": 0.82, + "learning_rate": 3.577336802454273e-08, + "loss": 0.0005, + "step": 42340 + }, + { + "epoch": 0.82, + "learning_rate": 3.576948468020659e-08, + "loss": 0.0006, + "step": 42341 + }, + { + "epoch": 0.82, + "learning_rate": 3.576560133587045e-08, + "loss": 0.6412, + "step": 42342 + }, + { + "epoch": 0.82, + "learning_rate": 3.5761717991534305e-08, + "loss": 0.0004, + "step": 42343 + }, + { + "epoch": 0.82, + "learning_rate": 3.575783464719816e-08, + "loss": 0.0004, + "step": 42344 + }, + { + "epoch": 0.82, + "learning_rate": 3.575395130286202e-08, + "loss": 0.0006, + "step": 42345 + }, + { + "epoch": 0.82, + "learning_rate": 3.575006795852588e-08, + "loss": 0.0004, + "step": 42346 + }, + { + "epoch": 0.82, + "learning_rate": 3.574618461418974e-08, + "loss": 0.0004, + "step": 42347 + }, + { + "epoch": 0.82, + "learning_rate": 3.5742301269853596e-08, + "loss": 0.0004, + "step": 42348 + }, + { + "epoch": 0.82, + "learning_rate": 3.5738417925517455e-08, + "loss": 0.0002, + "step": 42349 + }, + { + "epoch": 0.82, + "learning_rate": 3.573453458118131e-08, + "loss": 0.0004, + "step": 42350 + }, + { + "epoch": 0.82, + "learning_rate": 3.573065123684517e-08, + "loss": 0.0003, + "step": 42351 + }, + { + "epoch": 0.82, + "learning_rate": 3.572676789250903e-08, + "loss": 0.0004, + "step": 42352 + }, + { + "epoch": 0.82, + "learning_rate": 3.572288454817288e-08, + "loss": 0.0004, + "step": 42353 + }, + { + "epoch": 0.82, + "learning_rate": 3.571900120383674e-08, + "loss": 0.0003, + "step": 42354 + }, + { + "epoch": 0.82, + "learning_rate": 3.57151178595006e-08, + "loss": 0.0005, + "step": 42355 + }, + { + "epoch": 0.82, + "learning_rate": 3.5711234515164456e-08, + "loss": 0.0004, + "step": 42356 + }, + { + "epoch": 0.82, + "learning_rate": 3.5707351170828314e-08, + "loss": 0.5064, + "step": 42357 + }, + { + "epoch": 0.82, + "learning_rate": 3.570346782649217e-08, + "loss": 0.0197, + "step": 42358 + }, + { + "epoch": 0.82, + "learning_rate": 3.569958448215603e-08, + "loss": 0.0048, + "step": 42359 + }, + { + "epoch": 0.82, + "learning_rate": 3.569570113781989e-08, + "loss": 0.0004, + "step": 42360 + }, + { + "epoch": 0.82, + "learning_rate": 3.569181779348375e-08, + "loss": 0.0029, + "step": 42361 + }, + { + "epoch": 0.82, + "learning_rate": 3.5687934449147605e-08, + "loss": 0.4476, + "step": 42362 + }, + { + "epoch": 0.82, + "learning_rate": 3.568405110481146e-08, + "loss": 0.0004, + "step": 42363 + }, + { + "epoch": 0.82, + "learning_rate": 3.568016776047532e-08, + "loss": 0.0003, + "step": 42364 + }, + { + "epoch": 0.82, + "learning_rate": 3.567628441613918e-08, + "loss": 0.0007, + "step": 42365 + }, + { + "epoch": 0.82, + "learning_rate": 3.567240107180304e-08, + "loss": 0.0004, + "step": 42366 + }, + { + "epoch": 0.82, + "learning_rate": 3.566851772746689e-08, + "loss": 0.0005, + "step": 42367 + }, + { + "epoch": 0.82, + "learning_rate": 3.566463438313075e-08, + "loss": 0.0006, + "step": 42368 + }, + { + "epoch": 0.82, + "learning_rate": 3.5660751038794606e-08, + "loss": 0.0004, + "step": 42369 + }, + { + "epoch": 0.82, + "learning_rate": 3.5656867694458464e-08, + "loss": 0.0005, + "step": 42370 + }, + { + "epoch": 0.82, + "learning_rate": 3.565298435012232e-08, + "loss": 0.0005, + "step": 42371 + }, + { + "epoch": 0.82, + "learning_rate": 3.564910100578618e-08, + "loss": 0.0005, + "step": 42372 + }, + { + "epoch": 0.82, + "learning_rate": 3.564521766145004e-08, + "loss": 0.0004, + "step": 42373 + }, + { + "epoch": 0.82, + "learning_rate": 3.56413343171139e-08, + "loss": 0.0005, + "step": 42374 + }, + { + "epoch": 0.82, + "learning_rate": 3.5637450972777756e-08, + "loss": 0.0006, + "step": 42375 + }, + { + "epoch": 0.82, + "learning_rate": 3.5633567628441614e-08, + "loss": 0.0005, + "step": 42376 + }, + { + "epoch": 0.82, + "learning_rate": 3.562968428410547e-08, + "loss": 0.0003, + "step": 42377 + }, + { + "epoch": 0.82, + "learning_rate": 3.562580093976933e-08, + "loss": 0.0005, + "step": 42378 + }, + { + "epoch": 0.82, + "learning_rate": 3.562191759543319e-08, + "loss": 0.0004, + "step": 42379 + }, + { + "epoch": 0.82, + "learning_rate": 3.561803425109705e-08, + "loss": 0.0004, + "step": 42380 + }, + { + "epoch": 0.82, + "learning_rate": 3.5614150906760905e-08, + "loss": 0.0004, + "step": 42381 + }, + { + "epoch": 0.82, + "learning_rate": 3.561026756242476e-08, + "loss": 0.0004, + "step": 42382 + }, + { + "epoch": 0.82, + "learning_rate": 3.5606384218088615e-08, + "loss": 0.0015, + "step": 42383 + }, + { + "epoch": 0.82, + "learning_rate": 3.560250087375247e-08, + "loss": 0.0116, + "step": 42384 + }, + { + "epoch": 0.82, + "learning_rate": 3.559861752941633e-08, + "loss": 0.0003, + "step": 42385 + }, + { + "epoch": 0.82, + "learning_rate": 3.559473418508019e-08, + "loss": 0.672, + "step": 42386 + }, + { + "epoch": 0.82, + "learning_rate": 3.559085084074405e-08, + "loss": 0.0003, + "step": 42387 + }, + { + "epoch": 0.82, + "learning_rate": 3.5586967496407906e-08, + "loss": 0.0003, + "step": 42388 + }, + { + "epoch": 0.82, + "learning_rate": 3.5583084152071764e-08, + "loss": 0.0004, + "step": 42389 + }, + { + "epoch": 0.82, + "learning_rate": 3.557920080773562e-08, + "loss": 0.0004, + "step": 42390 + }, + { + "epoch": 0.82, + "learning_rate": 3.557531746339948e-08, + "loss": 0.0004, + "step": 42391 + }, + { + "epoch": 0.82, + "learning_rate": 3.557143411906334e-08, + "loss": 0.0002, + "step": 42392 + }, + { + "epoch": 0.82, + "learning_rate": 3.55675507747272e-08, + "loss": 0.0003, + "step": 42393 + }, + { + "epoch": 0.82, + "learning_rate": 3.5563667430391056e-08, + "loss": 0.0004, + "step": 42394 + }, + { + "epoch": 0.82, + "learning_rate": 3.5559784086054914e-08, + "loss": 0.0004, + "step": 42395 + }, + { + "epoch": 0.82, + "learning_rate": 3.5555900741718766e-08, + "loss": 0.0003, + "step": 42396 + }, + { + "epoch": 0.82, + "learning_rate": 3.5552017397382624e-08, + "loss": 0.0004, + "step": 42397 + }, + { + "epoch": 0.82, + "learning_rate": 3.554813405304648e-08, + "loss": 0.0759, + "step": 42398 + }, + { + "epoch": 0.82, + "learning_rate": 3.554425070871034e-08, + "loss": 0.0007, + "step": 42399 + }, + { + "epoch": 0.82, + "learning_rate": 3.55403673643742e-08, + "loss": 0.0053, + "step": 42400 + }, + { + "epoch": 0.82, + "learning_rate": 3.553648402003806e-08, + "loss": 0.0003, + "step": 42401 + }, + { + "epoch": 0.82, + "learning_rate": 3.5532600675701915e-08, + "loss": 0.0004, + "step": 42402 + }, + { + "epoch": 0.82, + "learning_rate": 3.552871733136577e-08, + "loss": 0.0004, + "step": 42403 + }, + { + "epoch": 0.82, + "learning_rate": 3.552483398702963e-08, + "loss": 0.0004, + "step": 42404 + }, + { + "epoch": 0.82, + "learning_rate": 3.552095064269349e-08, + "loss": 0.0004, + "step": 42405 + }, + { + "epoch": 0.82, + "learning_rate": 3.551706729835735e-08, + "loss": 0.0005, + "step": 42406 + }, + { + "epoch": 0.82, + "learning_rate": 3.5513183954021206e-08, + "loss": 0.0004, + "step": 42407 + }, + { + "epoch": 0.82, + "learning_rate": 3.550930060968506e-08, + "loss": 0.0004, + "step": 42408 + }, + { + "epoch": 0.82, + "learning_rate": 3.5505417265348916e-08, + "loss": 0.0004, + "step": 42409 + }, + { + "epoch": 0.82, + "learning_rate": 3.5501533921012774e-08, + "loss": 0.0004, + "step": 42410 + }, + { + "epoch": 0.82, + "learning_rate": 3.549765057667663e-08, + "loss": 0.0018, + "step": 42411 + }, + { + "epoch": 0.82, + "learning_rate": 3.549376723234049e-08, + "loss": 0.0003, + "step": 42412 + }, + { + "epoch": 0.82, + "learning_rate": 3.548988388800435e-08, + "loss": 0.0003, + "step": 42413 + }, + { + "epoch": 0.82, + "learning_rate": 3.548600054366821e-08, + "loss": 0.0005, + "step": 42414 + }, + { + "epoch": 0.82, + "learning_rate": 3.5482117199332066e-08, + "loss": 0.9294, + "step": 42415 + }, + { + "epoch": 0.82, + "learning_rate": 3.547823385499592e-08, + "loss": 0.0004, + "step": 42416 + }, + { + "epoch": 0.82, + "learning_rate": 3.5474350510659775e-08, + "loss": 0.0004, + "step": 42417 + }, + { + "epoch": 0.82, + "learning_rate": 3.5470467166323634e-08, + "loss": 0.0006, + "step": 42418 + }, + { + "epoch": 0.82, + "learning_rate": 3.546658382198749e-08, + "loss": 0.003, + "step": 42419 + }, + { + "epoch": 0.82, + "learning_rate": 3.546270047765135e-08, + "loss": 0.0003, + "step": 42420 + }, + { + "epoch": 0.82, + "learning_rate": 3.545881713331521e-08, + "loss": 0.0004, + "step": 42421 + }, + { + "epoch": 0.82, + "learning_rate": 3.5454933788979067e-08, + "loss": 0.0003, + "step": 42422 + }, + { + "epoch": 0.82, + "learning_rate": 3.5451050444642925e-08, + "loss": 0.0004, + "step": 42423 + }, + { + "epoch": 0.82, + "learning_rate": 3.544716710030678e-08, + "loss": 0.0139, + "step": 42424 + }, + { + "epoch": 0.82, + "learning_rate": 3.5443283755970635e-08, + "loss": 0.0009, + "step": 42425 + }, + { + "epoch": 0.82, + "learning_rate": 3.543940041163449e-08, + "loss": 0.0004, + "step": 42426 + }, + { + "epoch": 0.82, + "learning_rate": 3.543551706729835e-08, + "loss": 0.0003, + "step": 42427 + }, + { + "epoch": 0.82, + "learning_rate": 3.543163372296221e-08, + "loss": 0.0008, + "step": 42428 + }, + { + "epoch": 0.82, + "learning_rate": 3.542775037862607e-08, + "loss": 0.0004, + "step": 42429 + }, + { + "epoch": 0.82, + "learning_rate": 3.5423867034289926e-08, + "loss": 0.4394, + "step": 42430 + }, + { + "epoch": 0.82, + "learning_rate": 3.5419983689953784e-08, + "loss": 0.0015, + "step": 42431 + }, + { + "epoch": 0.82, + "learning_rate": 3.541610034561764e-08, + "loss": 0.0006, + "step": 42432 + }, + { + "epoch": 0.82, + "learning_rate": 3.54122170012815e-08, + "loss": 0.0005, + "step": 42433 + }, + { + "epoch": 0.82, + "learning_rate": 3.540833365694536e-08, + "loss": 0.0006, + "step": 42434 + }, + { + "epoch": 0.82, + "learning_rate": 3.540445031260922e-08, + "loss": 0.0004, + "step": 42435 + }, + { + "epoch": 0.82, + "learning_rate": 3.5400566968273075e-08, + "loss": 0.0004, + "step": 42436 + }, + { + "epoch": 0.82, + "learning_rate": 3.5396683623936934e-08, + "loss": 0.006, + "step": 42437 + }, + { + "epoch": 0.82, + "learning_rate": 3.539280027960079e-08, + "loss": 0.0004, + "step": 42438 + }, + { + "epoch": 0.82, + "learning_rate": 3.538891693526465e-08, + "loss": 0.0004, + "step": 42439 + }, + { + "epoch": 0.82, + "learning_rate": 3.53850335909285e-08, + "loss": 0.0004, + "step": 42440 + }, + { + "epoch": 0.82, + "learning_rate": 3.538115024659236e-08, + "loss": 0.7721, + "step": 42441 + }, + { + "epoch": 0.82, + "learning_rate": 3.537726690225622e-08, + "loss": 0.0003, + "step": 42442 + }, + { + "epoch": 0.82, + "learning_rate": 3.5373383557920077e-08, + "loss": 0.0004, + "step": 42443 + }, + { + "epoch": 0.82, + "learning_rate": 3.5369500213583935e-08, + "loss": 1.1455, + "step": 42444 + }, + { + "epoch": 0.82, + "learning_rate": 3.536561686924779e-08, + "loss": 0.0003, + "step": 42445 + }, + { + "epoch": 0.82, + "learning_rate": 3.536173352491165e-08, + "loss": 0.0004, + "step": 42446 + }, + { + "epoch": 0.82, + "learning_rate": 3.535785018057551e-08, + "loss": 0.0004, + "step": 42447 + }, + { + "epoch": 0.82, + "learning_rate": 3.535396683623937e-08, + "loss": 0.0003, + "step": 42448 + }, + { + "epoch": 0.82, + "learning_rate": 3.5350083491903226e-08, + "loss": 0.0004, + "step": 42449 + }, + { + "epoch": 0.82, + "learning_rate": 3.5346200147567084e-08, + "loss": 0.0003, + "step": 42450 + }, + { + "epoch": 0.82, + "learning_rate": 3.534231680323094e-08, + "loss": 0.0003, + "step": 42451 + }, + { + "epoch": 0.82, + "learning_rate": 3.53384334588948e-08, + "loss": 0.0005, + "step": 42452 + }, + { + "epoch": 0.82, + "learning_rate": 3.533455011455866e-08, + "loss": 0.0004, + "step": 42453 + }, + { + "epoch": 0.82, + "learning_rate": 3.533066677022251e-08, + "loss": 0.0022, + "step": 42454 + }, + { + "epoch": 0.82, + "learning_rate": 3.532678342588637e-08, + "loss": 0.0004, + "step": 42455 + }, + { + "epoch": 0.82, + "learning_rate": 3.532290008155023e-08, + "loss": 0.0004, + "step": 42456 + }, + { + "epoch": 0.82, + "learning_rate": 3.5319016737214085e-08, + "loss": 0.1592, + "step": 42457 + }, + { + "epoch": 0.82, + "learning_rate": 3.5315133392877944e-08, + "loss": 0.0011, + "step": 42458 + }, + { + "epoch": 0.82, + "learning_rate": 3.53112500485418e-08, + "loss": 0.0389, + "step": 42459 + }, + { + "epoch": 0.82, + "learning_rate": 3.530736670420566e-08, + "loss": 0.2621, + "step": 42460 + }, + { + "epoch": 0.82, + "learning_rate": 3.530348335986952e-08, + "loss": 0.0004, + "step": 42461 + }, + { + "epoch": 0.82, + "learning_rate": 3.5299600015533377e-08, + "loss": 0.0004, + "step": 42462 + }, + { + "epoch": 0.82, + "learning_rate": 3.5295716671197235e-08, + "loss": 1.0239, + "step": 42463 + }, + { + "epoch": 0.82, + "learning_rate": 3.529183332686109e-08, + "loss": 0.0003, + "step": 42464 + }, + { + "epoch": 0.82, + "learning_rate": 3.528794998252495e-08, + "loss": 0.0021, + "step": 42465 + }, + { + "epoch": 0.82, + "learning_rate": 3.528406663818881e-08, + "loss": 0.0004, + "step": 42466 + }, + { + "epoch": 0.82, + "learning_rate": 3.528018329385267e-08, + "loss": 0.0005, + "step": 42467 + }, + { + "epoch": 0.82, + "learning_rate": 3.5276299949516526e-08, + "loss": 0.7409, + "step": 42468 + }, + { + "epoch": 0.82, + "learning_rate": 3.527241660518038e-08, + "loss": 0.0003, + "step": 42469 + }, + { + "epoch": 0.82, + "learning_rate": 3.5268533260844236e-08, + "loss": 0.5205, + "step": 42470 + }, + { + "epoch": 0.82, + "learning_rate": 3.5264649916508094e-08, + "loss": 0.0005, + "step": 42471 + }, + { + "epoch": 0.82, + "learning_rate": 3.526076657217195e-08, + "loss": 0.0003, + "step": 42472 + }, + { + "epoch": 0.82, + "learning_rate": 3.525688322783581e-08, + "loss": 0.0004, + "step": 42473 + }, + { + "epoch": 0.82, + "learning_rate": 3.525299988349967e-08, + "loss": 0.0004, + "step": 42474 + }, + { + "epoch": 0.82, + "learning_rate": 3.524911653916353e-08, + "loss": 0.0005, + "step": 42475 + }, + { + "epoch": 0.82, + "learning_rate": 3.5245233194827385e-08, + "loss": 0.0004, + "step": 42476 + }, + { + "epoch": 0.82, + "learning_rate": 3.5241349850491244e-08, + "loss": 0.0004, + "step": 42477 + }, + { + "epoch": 0.82, + "learning_rate": 3.52374665061551e-08, + "loss": 0.0005, + "step": 42478 + }, + { + "epoch": 0.82, + "learning_rate": 3.523358316181896e-08, + "loss": 0.0004, + "step": 42479 + }, + { + "epoch": 0.82, + "learning_rate": 3.522969981748282e-08, + "loss": 0.002, + "step": 42480 + }, + { + "epoch": 0.82, + "learning_rate": 3.5225816473146677e-08, + "loss": 0.0003, + "step": 42481 + }, + { + "epoch": 0.82, + "learning_rate": 3.5221933128810535e-08, + "loss": 0.0004, + "step": 42482 + }, + { + "epoch": 0.82, + "learning_rate": 3.5218049784474386e-08, + "loss": 0.2031, + "step": 42483 + }, + { + "epoch": 0.82, + "learning_rate": 3.5214166440138245e-08, + "loss": 0.0003, + "step": 42484 + }, + { + "epoch": 0.82, + "learning_rate": 3.52102830958021e-08, + "loss": 0.0004, + "step": 42485 + }, + { + "epoch": 0.82, + "learning_rate": 3.520639975146596e-08, + "loss": 0.0117, + "step": 42486 + }, + { + "epoch": 0.82, + "learning_rate": 3.520251640712982e-08, + "loss": 0.0004, + "step": 42487 + }, + { + "epoch": 0.82, + "learning_rate": 3.519863306279368e-08, + "loss": 0.0004, + "step": 42488 + }, + { + "epoch": 0.82, + "learning_rate": 3.5194749718457536e-08, + "loss": 0.0005, + "step": 42489 + }, + { + "epoch": 0.82, + "learning_rate": 3.5190866374121394e-08, + "loss": 0.0005, + "step": 42490 + }, + { + "epoch": 0.82, + "learning_rate": 3.518698302978525e-08, + "loss": 0.0004, + "step": 42491 + }, + { + "epoch": 0.82, + "learning_rate": 3.518309968544911e-08, + "loss": 0.0005, + "step": 42492 + }, + { + "epoch": 0.82, + "learning_rate": 3.517921634111297e-08, + "loss": 0.0017, + "step": 42493 + }, + { + "epoch": 0.82, + "learning_rate": 3.517533299677683e-08, + "loss": 0.0005, + "step": 42494 + }, + { + "epoch": 0.82, + "learning_rate": 3.5171449652440685e-08, + "loss": 1.2928, + "step": 42495 + }, + { + "epoch": 0.82, + "learning_rate": 3.5167566308104544e-08, + "loss": 0.0006, + "step": 42496 + }, + { + "epoch": 0.82, + "learning_rate": 3.5163682963768395e-08, + "loss": 0.0003, + "step": 42497 + }, + { + "epoch": 0.82, + "learning_rate": 3.5159799619432253e-08, + "loss": 0.0003, + "step": 42498 + }, + { + "epoch": 0.82, + "learning_rate": 3.515591627509611e-08, + "loss": 0.0003, + "step": 42499 + }, + { + "epoch": 0.82, + "learning_rate": 3.515203293075997e-08, + "loss": 0.0005, + "step": 42500 + }, + { + "epoch": 0.82, + "learning_rate": 3.514814958642383e-08, + "loss": 0.0006, + "step": 42501 + }, + { + "epoch": 0.82, + "learning_rate": 3.5144266242087686e-08, + "loss": 0.0003, + "step": 42502 + }, + { + "epoch": 0.82, + "learning_rate": 3.5140382897751545e-08, + "loss": 0.0003, + "step": 42503 + }, + { + "epoch": 0.82, + "learning_rate": 3.5136499553415396e-08, + "loss": 0.0003, + "step": 42504 + }, + { + "epoch": 0.82, + "learning_rate": 3.5132616209079255e-08, + "loss": 0.0003, + "step": 42505 + }, + { + "epoch": 0.82, + "learning_rate": 3.512873286474311e-08, + "loss": 0.0007, + "step": 42506 + }, + { + "epoch": 0.82, + "learning_rate": 3.512484952040697e-08, + "loss": 0.0004, + "step": 42507 + }, + { + "epoch": 0.82, + "learning_rate": 3.512096617607083e-08, + "loss": 0.0004, + "step": 42508 + }, + { + "epoch": 0.82, + "learning_rate": 3.511708283173469e-08, + "loss": 0.0009, + "step": 42509 + }, + { + "epoch": 0.82, + "learning_rate": 3.5113199487398546e-08, + "loss": 0.0004, + "step": 42510 + }, + { + "epoch": 0.82, + "learning_rate": 3.5109316143062404e-08, + "loss": 0.0004, + "step": 42511 + }, + { + "epoch": 0.82, + "learning_rate": 3.5105432798726256e-08, + "loss": 0.0004, + "step": 42512 + }, + { + "epoch": 0.82, + "learning_rate": 3.5101549454390114e-08, + "loss": 0.0004, + "step": 42513 + }, + { + "epoch": 0.82, + "learning_rate": 3.509766611005397e-08, + "loss": 0.0004, + "step": 42514 + }, + { + "epoch": 0.82, + "learning_rate": 3.509378276571783e-08, + "loss": 0.0003, + "step": 42515 + }, + { + "epoch": 0.82, + "learning_rate": 3.508989942138169e-08, + "loss": 0.0003, + "step": 42516 + }, + { + "epoch": 0.82, + "learning_rate": 3.508601607704555e-08, + "loss": 0.0003, + "step": 42517 + }, + { + "epoch": 0.82, + "learning_rate": 3.5082132732709405e-08, + "loss": 0.0008, + "step": 42518 + }, + { + "epoch": 0.82, + "learning_rate": 3.5078249388373263e-08, + "loss": 0.0003, + "step": 42519 + }, + { + "epoch": 0.82, + "learning_rate": 3.507436604403712e-08, + "loss": 0.0005, + "step": 42520 + }, + { + "epoch": 0.82, + "learning_rate": 3.507048269970098e-08, + "loss": 0.0004, + "step": 42521 + }, + { + "epoch": 0.82, + "learning_rate": 3.506659935536484e-08, + "loss": 0.0005, + "step": 42522 + }, + { + "epoch": 0.82, + "learning_rate": 3.5062716011028696e-08, + "loss": 0.0947, + "step": 42523 + }, + { + "epoch": 0.82, + "learning_rate": 3.5058832666692555e-08, + "loss": 0.0003, + "step": 42524 + }, + { + "epoch": 0.82, + "learning_rate": 3.505494932235641e-08, + "loss": 0.0004, + "step": 42525 + }, + { + "epoch": 0.82, + "learning_rate": 3.505106597802027e-08, + "loss": 0.0004, + "step": 42526 + }, + { + "epoch": 0.82, + "learning_rate": 3.504718263368412e-08, + "loss": 0.0003, + "step": 42527 + }, + { + "epoch": 0.82, + "learning_rate": 3.504329928934798e-08, + "loss": 0.0005, + "step": 42528 + }, + { + "epoch": 0.82, + "learning_rate": 3.503941594501184e-08, + "loss": 1.1119, + "step": 42529 + }, + { + "epoch": 0.82, + "learning_rate": 3.50355326006757e-08, + "loss": 0.0005, + "step": 42530 + }, + { + "epoch": 0.83, + "learning_rate": 3.5031649256339556e-08, + "loss": 0.0003, + "step": 42531 + }, + { + "epoch": 0.83, + "learning_rate": 3.5027765912003414e-08, + "loss": 0.4649, + "step": 42532 + }, + { + "epoch": 0.83, + "learning_rate": 3.502388256766727e-08, + "loss": 0.0005, + "step": 42533 + }, + { + "epoch": 0.83, + "learning_rate": 3.501999922333113e-08, + "loss": 0.0005, + "step": 42534 + }, + { + "epoch": 0.83, + "learning_rate": 3.501611587899499e-08, + "loss": 0.0004, + "step": 42535 + }, + { + "epoch": 0.83, + "learning_rate": 3.501223253465885e-08, + "loss": 0.0003, + "step": 42536 + }, + { + "epoch": 0.83, + "learning_rate": 3.5008349190322705e-08, + "loss": 0.0003, + "step": 42537 + }, + { + "epoch": 0.83, + "learning_rate": 3.5004465845986563e-08, + "loss": 0.0004, + "step": 42538 + }, + { + "epoch": 0.83, + "learning_rate": 3.500058250165042e-08, + "loss": 0.0338, + "step": 42539 + }, + { + "epoch": 0.83, + "learning_rate": 3.499669915731428e-08, + "loss": 0.0004, + "step": 42540 + }, + { + "epoch": 0.83, + "learning_rate": 3.499281581297813e-08, + "loss": 0.0004, + "step": 42541 + }, + { + "epoch": 0.83, + "learning_rate": 3.498893246864199e-08, + "loss": 0.0006, + "step": 42542 + }, + { + "epoch": 0.83, + "learning_rate": 3.498504912430585e-08, + "loss": 0.0003, + "step": 42543 + }, + { + "epoch": 0.83, + "learning_rate": 3.4981165779969706e-08, + "loss": 0.0003, + "step": 42544 + }, + { + "epoch": 0.83, + "learning_rate": 3.4977282435633565e-08, + "loss": 0.8545, + "step": 42545 + }, + { + "epoch": 0.83, + "learning_rate": 3.497339909129742e-08, + "loss": 0.0003, + "step": 42546 + }, + { + "epoch": 0.83, + "learning_rate": 3.496951574696128e-08, + "loss": 0.0004, + "step": 42547 + }, + { + "epoch": 0.83, + "learning_rate": 3.496563240262514e-08, + "loss": 0.0003, + "step": 42548 + }, + { + "epoch": 0.83, + "learning_rate": 3.4961749058289e-08, + "loss": 0.0004, + "step": 42549 + }, + { + "epoch": 0.83, + "learning_rate": 3.4957865713952856e-08, + "loss": 0.0004, + "step": 42550 + }, + { + "epoch": 0.83, + "learning_rate": 3.4953982369616714e-08, + "loss": 0.0004, + "step": 42551 + }, + { + "epoch": 0.83, + "learning_rate": 3.495009902528057e-08, + "loss": 0.0004, + "step": 42552 + }, + { + "epoch": 0.83, + "learning_rate": 3.494621568094443e-08, + "loss": 0.0006, + "step": 42553 + }, + { + "epoch": 0.83, + "learning_rate": 3.494233233660829e-08, + "loss": 0.0003, + "step": 42554 + }, + { + "epoch": 0.83, + "learning_rate": 3.493844899227215e-08, + "loss": 0.0004, + "step": 42555 + }, + { + "epoch": 0.83, + "learning_rate": 3.4934565647936e-08, + "loss": 0.0024, + "step": 42556 + }, + { + "epoch": 0.83, + "learning_rate": 3.493068230359986e-08, + "loss": 0.0005, + "step": 42557 + }, + { + "epoch": 0.83, + "learning_rate": 3.4926798959263715e-08, + "loss": 0.0004, + "step": 42558 + }, + { + "epoch": 0.83, + "learning_rate": 3.4922915614927573e-08, + "loss": 0.0004, + "step": 42559 + }, + { + "epoch": 0.83, + "learning_rate": 3.491903227059143e-08, + "loss": 0.0005, + "step": 42560 + }, + { + "epoch": 0.83, + "learning_rate": 3.491514892625529e-08, + "loss": 0.0008, + "step": 42561 + }, + { + "epoch": 0.83, + "learning_rate": 3.491126558191915e-08, + "loss": 0.0004, + "step": 42562 + }, + { + "epoch": 0.83, + "learning_rate": 3.4907382237583006e-08, + "loss": 0.0006, + "step": 42563 + }, + { + "epoch": 0.83, + "learning_rate": 3.4903498893246865e-08, + "loss": 0.0775, + "step": 42564 + }, + { + "epoch": 0.83, + "learning_rate": 3.489961554891072e-08, + "loss": 0.0004, + "step": 42565 + }, + { + "epoch": 0.83, + "learning_rate": 3.489573220457458e-08, + "loss": 0.0003, + "step": 42566 + }, + { + "epoch": 0.83, + "learning_rate": 3.489184886023844e-08, + "loss": 0.0003, + "step": 42567 + }, + { + "epoch": 0.83, + "learning_rate": 3.48879655159023e-08, + "loss": 0.0004, + "step": 42568 + }, + { + "epoch": 0.83, + "learning_rate": 3.4884082171566156e-08, + "loss": 0.1657, + "step": 42569 + }, + { + "epoch": 0.83, + "learning_rate": 3.488019882723001e-08, + "loss": 0.0003, + "step": 42570 + }, + { + "epoch": 0.83, + "learning_rate": 3.4876315482893866e-08, + "loss": 0.0003, + "step": 42571 + }, + { + "epoch": 0.83, + "learning_rate": 3.4872432138557724e-08, + "loss": 0.0007, + "step": 42572 + }, + { + "epoch": 0.83, + "learning_rate": 3.486854879422158e-08, + "loss": 0.8536, + "step": 42573 + }, + { + "epoch": 0.83, + "learning_rate": 3.486466544988544e-08, + "loss": 0.0004, + "step": 42574 + }, + { + "epoch": 0.83, + "learning_rate": 3.48607821055493e-08, + "loss": 0.0005, + "step": 42575 + }, + { + "epoch": 0.83, + "learning_rate": 3.485689876121316e-08, + "loss": 0.0004, + "step": 42576 + }, + { + "epoch": 0.83, + "learning_rate": 3.4853015416877015e-08, + "loss": 0.204, + "step": 42577 + }, + { + "epoch": 0.83, + "learning_rate": 3.4849132072540873e-08, + "loss": 0.0002, + "step": 42578 + }, + { + "epoch": 0.83, + "learning_rate": 3.484524872820473e-08, + "loss": 0.0003, + "step": 42579 + }, + { + "epoch": 0.83, + "learning_rate": 3.484136538386859e-08, + "loss": 0.0003, + "step": 42580 + }, + { + "epoch": 0.83, + "learning_rate": 3.483748203953245e-08, + "loss": 0.0004, + "step": 42581 + }, + { + "epoch": 0.83, + "learning_rate": 3.4833598695196306e-08, + "loss": 0.0004, + "step": 42582 + }, + { + "epoch": 0.83, + "learning_rate": 3.4829715350860165e-08, + "loss": 0.0006, + "step": 42583 + }, + { + "epoch": 0.83, + "learning_rate": 3.482583200652402e-08, + "loss": 0.0003, + "step": 42584 + }, + { + "epoch": 0.83, + "learning_rate": 3.4821948662187874e-08, + "loss": 0.0003, + "step": 42585 + }, + { + "epoch": 0.83, + "learning_rate": 3.481806531785173e-08, + "loss": 0.0176, + "step": 42586 + }, + { + "epoch": 0.83, + "learning_rate": 3.481418197351559e-08, + "loss": 0.8656, + "step": 42587 + }, + { + "epoch": 0.83, + "learning_rate": 3.481029862917945e-08, + "loss": 0.0004, + "step": 42588 + }, + { + "epoch": 0.83, + "learning_rate": 3.480641528484331e-08, + "loss": 0.0004, + "step": 42589 + }, + { + "epoch": 0.83, + "learning_rate": 3.4802531940507166e-08, + "loss": 0.0003, + "step": 42590 + }, + { + "epoch": 0.83, + "learning_rate": 3.4798648596171024e-08, + "loss": 0.0068, + "step": 42591 + }, + { + "epoch": 0.83, + "learning_rate": 3.479476525183488e-08, + "loss": 0.0003, + "step": 42592 + }, + { + "epoch": 0.83, + "learning_rate": 3.4790881907498734e-08, + "loss": 0.0004, + "step": 42593 + }, + { + "epoch": 0.83, + "learning_rate": 3.478699856316259e-08, + "loss": 0.0004, + "step": 42594 + }, + { + "epoch": 0.83, + "learning_rate": 3.478311521882645e-08, + "loss": 0.0004, + "step": 42595 + }, + { + "epoch": 0.83, + "learning_rate": 3.477923187449031e-08, + "loss": 0.0004, + "step": 42596 + }, + { + "epoch": 0.83, + "learning_rate": 3.477534853015417e-08, + "loss": 0.0003, + "step": 42597 + }, + { + "epoch": 0.83, + "learning_rate": 3.4771465185818025e-08, + "loss": 0.0003, + "step": 42598 + }, + { + "epoch": 0.83, + "learning_rate": 3.476758184148188e-08, + "loss": 0.0007, + "step": 42599 + }, + { + "epoch": 0.83, + "learning_rate": 3.4763698497145735e-08, + "loss": 0.0004, + "step": 42600 + }, + { + "epoch": 0.83, + "learning_rate": 3.475981515280959e-08, + "loss": 0.0003, + "step": 42601 + }, + { + "epoch": 0.83, + "learning_rate": 3.475593180847345e-08, + "loss": 0.0003, + "step": 42602 + }, + { + "epoch": 0.83, + "learning_rate": 3.475204846413731e-08, + "loss": 0.0011, + "step": 42603 + }, + { + "epoch": 0.83, + "learning_rate": 3.474816511980117e-08, + "loss": 0.0004, + "step": 42604 + }, + { + "epoch": 0.83, + "learning_rate": 3.4744281775465026e-08, + "loss": 0.0006, + "step": 42605 + }, + { + "epoch": 0.83, + "learning_rate": 3.4740398431128884e-08, + "loss": 0.0003, + "step": 42606 + }, + { + "epoch": 0.83, + "learning_rate": 3.473651508679274e-08, + "loss": 0.0004, + "step": 42607 + }, + { + "epoch": 0.83, + "learning_rate": 3.47326317424566e-08, + "loss": 0.0003, + "step": 42608 + }, + { + "epoch": 0.83, + "learning_rate": 3.472874839812046e-08, + "loss": 0.016, + "step": 42609 + }, + { + "epoch": 0.83, + "learning_rate": 3.472486505378432e-08, + "loss": 0.3854, + "step": 42610 + }, + { + "epoch": 0.83, + "learning_rate": 3.4720981709448176e-08, + "loss": 0.0002, + "step": 42611 + }, + { + "epoch": 0.83, + "learning_rate": 3.4717098365112034e-08, + "loss": 0.8741, + "step": 42612 + }, + { + "epoch": 0.83, + "learning_rate": 3.471321502077589e-08, + "loss": 0.0004, + "step": 42613 + }, + { + "epoch": 0.83, + "learning_rate": 3.4709331676439744e-08, + "loss": 0.9723, + "step": 42614 + }, + { + "epoch": 0.83, + "learning_rate": 3.47054483321036e-08, + "loss": 0.0004, + "step": 42615 + }, + { + "epoch": 0.83, + "learning_rate": 3.470156498776746e-08, + "loss": 0.0003, + "step": 42616 + }, + { + "epoch": 0.83, + "learning_rate": 3.469768164343132e-08, + "loss": 1.5167, + "step": 42617 + }, + { + "epoch": 0.83, + "learning_rate": 3.4693798299095177e-08, + "loss": 0.8454, + "step": 42618 + }, + { + "epoch": 0.83, + "learning_rate": 3.4689914954759035e-08, + "loss": 0.0017, + "step": 42619 + }, + { + "epoch": 0.83, + "learning_rate": 3.468603161042289e-08, + "loss": 0.0003, + "step": 42620 + }, + { + "epoch": 0.83, + "learning_rate": 3.468214826608675e-08, + "loss": 0.0011, + "step": 42621 + }, + { + "epoch": 0.83, + "learning_rate": 3.467826492175061e-08, + "loss": 0.2888, + "step": 42622 + }, + { + "epoch": 0.83, + "learning_rate": 3.467438157741447e-08, + "loss": 0.0007, + "step": 42623 + }, + { + "epoch": 0.83, + "learning_rate": 3.4670498233078326e-08, + "loss": 0.0004, + "step": 42624 + }, + { + "epoch": 0.83, + "learning_rate": 3.4666614888742184e-08, + "loss": 0.0003, + "step": 42625 + }, + { + "epoch": 0.83, + "learning_rate": 3.466273154440604e-08, + "loss": 0.0003, + "step": 42626 + }, + { + "epoch": 0.83, + "learning_rate": 3.46588482000699e-08, + "loss": 0.0006, + "step": 42627 + }, + { + "epoch": 0.83, + "learning_rate": 3.465496485573375e-08, + "loss": 0.0004, + "step": 42628 + }, + { + "epoch": 0.83, + "learning_rate": 3.465108151139761e-08, + "loss": 0.0005, + "step": 42629 + }, + { + "epoch": 0.83, + "learning_rate": 3.464719816706147e-08, + "loss": 0.0006, + "step": 42630 + }, + { + "epoch": 0.83, + "learning_rate": 3.464331482272533e-08, + "loss": 0.0003, + "step": 42631 + }, + { + "epoch": 0.83, + "learning_rate": 3.4639431478389185e-08, + "loss": 0.0041, + "step": 42632 + }, + { + "epoch": 0.83, + "learning_rate": 3.4635548134053044e-08, + "loss": 0.0003, + "step": 42633 + }, + { + "epoch": 0.83, + "learning_rate": 3.46316647897169e-08, + "loss": 0.0005, + "step": 42634 + }, + { + "epoch": 0.83, + "learning_rate": 3.462778144538076e-08, + "loss": 0.0005, + "step": 42635 + }, + { + "epoch": 0.83, + "learning_rate": 3.462389810104462e-08, + "loss": 0.0004, + "step": 42636 + }, + { + "epoch": 0.83, + "learning_rate": 3.4620014756708477e-08, + "loss": 0.0005, + "step": 42637 + }, + { + "epoch": 0.83, + "learning_rate": 3.4616131412372335e-08, + "loss": 0.0003, + "step": 42638 + }, + { + "epoch": 0.83, + "learning_rate": 3.461224806803619e-08, + "loss": 0.0004, + "step": 42639 + }, + { + "epoch": 0.83, + "learning_rate": 3.460836472370005e-08, + "loss": 0.0004, + "step": 42640 + }, + { + "epoch": 0.83, + "learning_rate": 3.460448137936391e-08, + "loss": 0.0005, + "step": 42641 + }, + { + "epoch": 0.83, + "learning_rate": 3.460059803502777e-08, + "loss": 0.0005, + "step": 42642 + }, + { + "epoch": 0.83, + "learning_rate": 3.459671469069162e-08, + "loss": 0.001, + "step": 42643 + }, + { + "epoch": 0.83, + "learning_rate": 3.459283134635548e-08, + "loss": 0.0004, + "step": 42644 + }, + { + "epoch": 0.83, + "learning_rate": 3.4588948002019336e-08, + "loss": 0.0006, + "step": 42645 + }, + { + "epoch": 0.83, + "learning_rate": 3.4585064657683194e-08, + "loss": 0.0004, + "step": 42646 + }, + { + "epoch": 0.83, + "learning_rate": 3.458118131334705e-08, + "loss": 0.0004, + "step": 42647 + }, + { + "epoch": 0.83, + "learning_rate": 3.457729796901091e-08, + "loss": 0.0006, + "step": 42648 + }, + { + "epoch": 0.83, + "learning_rate": 3.457341462467477e-08, + "loss": 0.0004, + "step": 42649 + }, + { + "epoch": 0.83, + "learning_rate": 3.456953128033863e-08, + "loss": 0.0004, + "step": 42650 + }, + { + "epoch": 0.83, + "learning_rate": 3.4565647936002485e-08, + "loss": 0.084, + "step": 42651 + }, + { + "epoch": 0.83, + "learning_rate": 3.4561764591666344e-08, + "loss": 0.0068, + "step": 42652 + }, + { + "epoch": 0.83, + "learning_rate": 3.45578812473302e-08, + "loss": 0.0004, + "step": 42653 + }, + { + "epoch": 0.83, + "learning_rate": 3.455399790299406e-08, + "loss": 0.0006, + "step": 42654 + }, + { + "epoch": 0.83, + "learning_rate": 3.455011455865792e-08, + "loss": 0.0003, + "step": 42655 + }, + { + "epoch": 0.83, + "learning_rate": 3.454623121432178e-08, + "loss": 0.0003, + "step": 42656 + }, + { + "epoch": 0.83, + "learning_rate": 3.454234786998563e-08, + "loss": 0.0004, + "step": 42657 + }, + { + "epoch": 0.83, + "learning_rate": 3.4538464525649487e-08, + "loss": 0.0004, + "step": 42658 + }, + { + "epoch": 0.83, + "learning_rate": 3.4534581181313345e-08, + "loss": 0.0005, + "step": 42659 + }, + { + "epoch": 0.83, + "learning_rate": 3.45306978369772e-08, + "loss": 0.0003, + "step": 42660 + }, + { + "epoch": 0.83, + "learning_rate": 3.452681449264106e-08, + "loss": 0.0043, + "step": 42661 + }, + { + "epoch": 0.83, + "learning_rate": 3.452293114830492e-08, + "loss": 0.0004, + "step": 42662 + }, + { + "epoch": 0.83, + "learning_rate": 3.451904780396878e-08, + "loss": 0.0005, + "step": 42663 + }, + { + "epoch": 0.83, + "learning_rate": 3.4515164459632636e-08, + "loss": 0.0005, + "step": 42664 + }, + { + "epoch": 0.83, + "learning_rate": 3.4511281115296494e-08, + "loss": 0.0004, + "step": 42665 + }, + { + "epoch": 0.83, + "learning_rate": 3.450739777096035e-08, + "loss": 0.0006, + "step": 42666 + }, + { + "epoch": 0.83, + "learning_rate": 3.450351442662421e-08, + "loss": 0.0004, + "step": 42667 + }, + { + "epoch": 0.83, + "learning_rate": 3.449963108228807e-08, + "loss": 0.0003, + "step": 42668 + }, + { + "epoch": 0.83, + "learning_rate": 3.449574773795193e-08, + "loss": 0.0003, + "step": 42669 + }, + { + "epoch": 0.83, + "learning_rate": 3.4491864393615785e-08, + "loss": 0.0008, + "step": 42670 + }, + { + "epoch": 0.83, + "learning_rate": 3.4487981049279644e-08, + "loss": 0.002, + "step": 42671 + }, + { + "epoch": 0.83, + "learning_rate": 3.4484097704943495e-08, + "loss": 0.0053, + "step": 42672 + }, + { + "epoch": 0.83, + "learning_rate": 3.4480214360607354e-08, + "loss": 0.0005, + "step": 42673 + }, + { + "epoch": 0.83, + "learning_rate": 3.447633101627121e-08, + "loss": 0.0008, + "step": 42674 + }, + { + "epoch": 0.83, + "learning_rate": 3.447244767193507e-08, + "loss": 0.0003, + "step": 42675 + }, + { + "epoch": 0.83, + "learning_rate": 3.446856432759893e-08, + "loss": 0.0005, + "step": 42676 + }, + { + "epoch": 0.83, + "learning_rate": 3.4464680983262787e-08, + "loss": 0.0003, + "step": 42677 + }, + { + "epoch": 0.83, + "learning_rate": 3.4460797638926645e-08, + "loss": 0.0004, + "step": 42678 + }, + { + "epoch": 0.83, + "learning_rate": 3.44569142945905e-08, + "loss": 0.218, + "step": 42679 + }, + { + "epoch": 0.83, + "learning_rate": 3.445303095025436e-08, + "loss": 0.0006, + "step": 42680 + }, + { + "epoch": 0.83, + "learning_rate": 3.444914760591821e-08, + "loss": 0.0004, + "step": 42681 + }, + { + "epoch": 0.83, + "learning_rate": 3.444526426158207e-08, + "loss": 0.0003, + "step": 42682 + }, + { + "epoch": 0.83, + "learning_rate": 3.444138091724593e-08, + "loss": 0.0004, + "step": 42683 + }, + { + "epoch": 0.83, + "learning_rate": 3.443749757290979e-08, + "loss": 0.0005, + "step": 42684 + }, + { + "epoch": 0.83, + "learning_rate": 3.4433614228573646e-08, + "loss": 0.0003, + "step": 42685 + }, + { + "epoch": 0.83, + "learning_rate": 3.4429730884237504e-08, + "loss": 0.0005, + "step": 42686 + }, + { + "epoch": 0.83, + "learning_rate": 3.442584753990136e-08, + "loss": 0.0003, + "step": 42687 + }, + { + "epoch": 0.83, + "learning_rate": 3.442196419556522e-08, + "loss": 0.0009, + "step": 42688 + }, + { + "epoch": 0.83, + "learning_rate": 3.441808085122907e-08, + "loss": 0.0005, + "step": 42689 + }, + { + "epoch": 0.83, + "learning_rate": 3.441419750689293e-08, + "loss": 0.0003, + "step": 42690 + }, + { + "epoch": 0.83, + "learning_rate": 3.441031416255679e-08, + "loss": 0.0008, + "step": 42691 + }, + { + "epoch": 0.83, + "learning_rate": 3.440643081822065e-08, + "loss": 0.0004, + "step": 42692 + }, + { + "epoch": 0.83, + "learning_rate": 3.4402547473884505e-08, + "loss": 0.0004, + "step": 42693 + }, + { + "epoch": 0.83, + "learning_rate": 3.4398664129548364e-08, + "loss": 0.0004, + "step": 42694 + }, + { + "epoch": 0.83, + "learning_rate": 3.439478078521222e-08, + "loss": 0.0004, + "step": 42695 + }, + { + "epoch": 0.83, + "learning_rate": 3.439089744087608e-08, + "loss": 0.0003, + "step": 42696 + }, + { + "epoch": 0.83, + "learning_rate": 3.438701409653994e-08, + "loss": 0.0205, + "step": 42697 + }, + { + "epoch": 0.83, + "learning_rate": 3.4383130752203796e-08, + "loss": 0.0009, + "step": 42698 + }, + { + "epoch": 0.83, + "learning_rate": 3.4379247407867655e-08, + "loss": 0.0011, + "step": 42699 + }, + { + "epoch": 0.83, + "learning_rate": 3.437536406353151e-08, + "loss": 0.0005, + "step": 42700 + }, + { + "epoch": 0.83, + "learning_rate": 3.4371480719195365e-08, + "loss": 0.0003, + "step": 42701 + }, + { + "epoch": 0.83, + "learning_rate": 3.436759737485922e-08, + "loss": 1.1102, + "step": 42702 + }, + { + "epoch": 0.83, + "learning_rate": 3.436371403052308e-08, + "loss": 0.0004, + "step": 42703 + }, + { + "epoch": 0.83, + "learning_rate": 3.435983068618694e-08, + "loss": 1.1299, + "step": 42704 + }, + { + "epoch": 0.83, + "learning_rate": 3.43559473418508e-08, + "loss": 0.0003, + "step": 42705 + }, + { + "epoch": 0.83, + "learning_rate": 3.4352063997514656e-08, + "loss": 1.2255, + "step": 42706 + }, + { + "epoch": 0.83, + "learning_rate": 3.4348180653178514e-08, + "loss": 0.0006, + "step": 42707 + }, + { + "epoch": 0.83, + "learning_rate": 3.434429730884237e-08, + "loss": 0.0004, + "step": 42708 + }, + { + "epoch": 0.83, + "learning_rate": 3.434041396450623e-08, + "loss": 0.0004, + "step": 42709 + }, + { + "epoch": 0.83, + "learning_rate": 3.433653062017009e-08, + "loss": 0.0004, + "step": 42710 + }, + { + "epoch": 0.83, + "learning_rate": 3.433264727583395e-08, + "loss": 1.0163, + "step": 42711 + }, + { + "epoch": 0.83, + "learning_rate": 3.4328763931497805e-08, + "loss": 0.0005, + "step": 42712 + }, + { + "epoch": 0.83, + "learning_rate": 3.4324880587161664e-08, + "loss": 0.0005, + "step": 42713 + }, + { + "epoch": 0.83, + "learning_rate": 3.432099724282552e-08, + "loss": 0.0005, + "step": 42714 + }, + { + "epoch": 0.83, + "learning_rate": 3.4317113898489373e-08, + "loss": 0.0003, + "step": 42715 + }, + { + "epoch": 0.83, + "learning_rate": 3.431323055415323e-08, + "loss": 0.0005, + "step": 42716 + }, + { + "epoch": 0.83, + "learning_rate": 3.430934720981709e-08, + "loss": 0.0003, + "step": 42717 + }, + { + "epoch": 0.83, + "learning_rate": 3.430546386548095e-08, + "loss": 0.0247, + "step": 42718 + }, + { + "epoch": 0.83, + "learning_rate": 3.4301580521144806e-08, + "loss": 0.0026, + "step": 42719 + }, + { + "epoch": 0.83, + "learning_rate": 3.4297697176808665e-08, + "loss": 0.0003, + "step": 42720 + }, + { + "epoch": 0.83, + "learning_rate": 3.429381383247252e-08, + "loss": 0.0004, + "step": 42721 + }, + { + "epoch": 0.83, + "learning_rate": 3.428993048813638e-08, + "loss": 0.0004, + "step": 42722 + }, + { + "epoch": 0.83, + "learning_rate": 3.428604714380024e-08, + "loss": 0.0005, + "step": 42723 + }, + { + "epoch": 0.83, + "learning_rate": 3.42821637994641e-08, + "loss": 0.0003, + "step": 42724 + }, + { + "epoch": 0.83, + "learning_rate": 3.4278280455127956e-08, + "loss": 0.0003, + "step": 42725 + }, + { + "epoch": 0.83, + "learning_rate": 3.4274397110791814e-08, + "loss": 0.0004, + "step": 42726 + }, + { + "epoch": 0.83, + "learning_rate": 3.427051376645567e-08, + "loss": 0.0004, + "step": 42727 + }, + { + "epoch": 0.83, + "learning_rate": 3.426663042211953e-08, + "loss": 0.0003, + "step": 42728 + }, + { + "epoch": 0.83, + "learning_rate": 3.426274707778339e-08, + "loss": 0.0003, + "step": 42729 + }, + { + "epoch": 0.83, + "learning_rate": 3.425886373344724e-08, + "loss": 0.7128, + "step": 42730 + }, + { + "epoch": 0.83, + "learning_rate": 3.42549803891111e-08, + "loss": 0.0011, + "step": 42731 + }, + { + "epoch": 0.83, + "learning_rate": 3.425109704477496e-08, + "loss": 0.0842, + "step": 42732 + }, + { + "epoch": 0.83, + "learning_rate": 3.4247213700438815e-08, + "loss": 0.0004, + "step": 42733 + }, + { + "epoch": 0.83, + "learning_rate": 3.4243330356102673e-08, + "loss": 0.0016, + "step": 42734 + }, + { + "epoch": 0.83, + "learning_rate": 3.423944701176653e-08, + "loss": 0.0025, + "step": 42735 + }, + { + "epoch": 0.83, + "learning_rate": 3.423556366743039e-08, + "loss": 0.0004, + "step": 42736 + }, + { + "epoch": 0.83, + "learning_rate": 3.423168032309425e-08, + "loss": 0.0061, + "step": 42737 + }, + { + "epoch": 0.83, + "learning_rate": 3.4227796978758106e-08, + "loss": 0.0008, + "step": 42738 + }, + { + "epoch": 0.83, + "learning_rate": 3.4223913634421965e-08, + "loss": 0.0003, + "step": 42739 + }, + { + "epoch": 0.83, + "learning_rate": 3.422003029008582e-08, + "loss": 0.0007, + "step": 42740 + }, + { + "epoch": 0.83, + "learning_rate": 3.421614694574968e-08, + "loss": 0.0003, + "step": 42741 + }, + { + "epoch": 0.83, + "learning_rate": 3.421226360141354e-08, + "loss": 0.0037, + "step": 42742 + }, + { + "epoch": 0.83, + "learning_rate": 3.42083802570774e-08, + "loss": 0.0003, + "step": 42743 + }, + { + "epoch": 0.83, + "learning_rate": 3.420449691274125e-08, + "loss": 0.0004, + "step": 42744 + }, + { + "epoch": 0.83, + "learning_rate": 3.420061356840511e-08, + "loss": 0.0004, + "step": 42745 + }, + { + "epoch": 0.83, + "learning_rate": 3.4196730224068966e-08, + "loss": 0.0084, + "step": 42746 + }, + { + "epoch": 0.83, + "learning_rate": 3.4192846879732824e-08, + "loss": 0.0015, + "step": 42747 + }, + { + "epoch": 0.83, + "learning_rate": 3.418896353539668e-08, + "loss": 0.0005, + "step": 42748 + }, + { + "epoch": 0.83, + "learning_rate": 3.418508019106054e-08, + "loss": 0.0003, + "step": 42749 + }, + { + "epoch": 0.83, + "learning_rate": 3.41811968467244e-08, + "loss": 0.2699, + "step": 42750 + }, + { + "epoch": 0.83, + "learning_rate": 3.417731350238826e-08, + "loss": 0.0004, + "step": 42751 + }, + { + "epoch": 0.83, + "learning_rate": 3.4173430158052115e-08, + "loss": 0.0007, + "step": 42752 + }, + { + "epoch": 0.83, + "learning_rate": 3.4169546813715973e-08, + "loss": 0.0004, + "step": 42753 + }, + { + "epoch": 0.83, + "learning_rate": 3.416566346937983e-08, + "loss": 0.0033, + "step": 42754 + }, + { + "epoch": 0.83, + "learning_rate": 3.416178012504369e-08, + "loss": 0.0004, + "step": 42755 + }, + { + "epoch": 0.83, + "learning_rate": 3.415789678070755e-08, + "loss": 0.0003, + "step": 42756 + }, + { + "epoch": 0.83, + "learning_rate": 3.4154013436371406e-08, + "loss": 0.0004, + "step": 42757 + }, + { + "epoch": 0.83, + "learning_rate": 3.4150130092035265e-08, + "loss": 0.0005, + "step": 42758 + }, + { + "epoch": 0.83, + "learning_rate": 3.4146246747699116e-08, + "loss": 0.0015, + "step": 42759 + }, + { + "epoch": 0.83, + "learning_rate": 3.4142363403362975e-08, + "loss": 0.0004, + "step": 42760 + }, + { + "epoch": 0.83, + "learning_rate": 3.413848005902683e-08, + "loss": 0.0017, + "step": 42761 + }, + { + "epoch": 0.83, + "learning_rate": 3.413459671469069e-08, + "loss": 0.0003, + "step": 42762 + }, + { + "epoch": 0.83, + "learning_rate": 3.413071337035455e-08, + "loss": 0.0025, + "step": 42763 + }, + { + "epoch": 0.83, + "learning_rate": 3.412683002601841e-08, + "loss": 0.0004, + "step": 42764 + }, + { + "epoch": 0.83, + "learning_rate": 3.4122946681682266e-08, + "loss": 0.0005, + "step": 42765 + }, + { + "epoch": 0.83, + "learning_rate": 3.4119063337346124e-08, + "loss": 0.0006, + "step": 42766 + }, + { + "epoch": 0.83, + "learning_rate": 3.411517999300998e-08, + "loss": 0.0005, + "step": 42767 + }, + { + "epoch": 0.83, + "learning_rate": 3.411129664867384e-08, + "loss": 0.0022, + "step": 42768 + }, + { + "epoch": 0.83, + "learning_rate": 3.41074133043377e-08, + "loss": 0.0004, + "step": 42769 + }, + { + "epoch": 0.83, + "learning_rate": 3.410352996000155e-08, + "loss": 0.0004, + "step": 42770 + }, + { + "epoch": 0.83, + "learning_rate": 3.409964661566541e-08, + "loss": 0.0004, + "step": 42771 + }, + { + "epoch": 0.83, + "learning_rate": 3.409576327132927e-08, + "loss": 0.0005, + "step": 42772 + }, + { + "epoch": 0.83, + "learning_rate": 3.4091879926993125e-08, + "loss": 0.0002, + "step": 42773 + }, + { + "epoch": 0.83, + "learning_rate": 3.4087996582656983e-08, + "loss": 0.0007, + "step": 42774 + }, + { + "epoch": 0.83, + "learning_rate": 3.408411323832084e-08, + "loss": 0.0004, + "step": 42775 + }, + { + "epoch": 0.83, + "learning_rate": 3.40802298939847e-08, + "loss": 0.0003, + "step": 42776 + }, + { + "epoch": 0.83, + "learning_rate": 3.407634654964855e-08, + "loss": 0.0012, + "step": 42777 + }, + { + "epoch": 0.83, + "learning_rate": 3.407246320531241e-08, + "loss": 0.0584, + "step": 42778 + }, + { + "epoch": 0.83, + "learning_rate": 3.406857986097627e-08, + "loss": 0.0005, + "step": 42779 + }, + { + "epoch": 0.83, + "learning_rate": 3.4064696516640126e-08, + "loss": 0.0005, + "step": 42780 + }, + { + "epoch": 0.83, + "learning_rate": 3.4060813172303984e-08, + "loss": 0.0004, + "step": 42781 + }, + { + "epoch": 0.83, + "learning_rate": 3.405692982796784e-08, + "loss": 0.0003, + "step": 42782 + }, + { + "epoch": 0.83, + "learning_rate": 3.40530464836317e-08, + "loss": 0.0074, + "step": 42783 + }, + { + "epoch": 0.83, + "learning_rate": 3.404916313929556e-08, + "loss": 0.0005, + "step": 42784 + }, + { + "epoch": 0.83, + "learning_rate": 3.404527979495942e-08, + "loss": 0.0007, + "step": 42785 + }, + { + "epoch": 0.83, + "learning_rate": 3.4041396450623276e-08, + "loss": 0.0005, + "step": 42786 + }, + { + "epoch": 0.83, + "learning_rate": 3.4037513106287134e-08, + "loss": 0.0004, + "step": 42787 + }, + { + "epoch": 0.83, + "learning_rate": 3.4033629761950986e-08, + "loss": 0.0005, + "step": 42788 + }, + { + "epoch": 0.83, + "learning_rate": 3.4029746417614844e-08, + "loss": 0.0004, + "step": 42789 + }, + { + "epoch": 0.83, + "learning_rate": 3.40258630732787e-08, + "loss": 0.0035, + "step": 42790 + }, + { + "epoch": 0.83, + "learning_rate": 3.402197972894256e-08, + "loss": 0.0005, + "step": 42791 + }, + { + "epoch": 0.83, + "learning_rate": 3.401809638460642e-08, + "loss": 0.0009, + "step": 42792 + }, + { + "epoch": 0.83, + "learning_rate": 3.401421304027028e-08, + "loss": 0.0003, + "step": 42793 + }, + { + "epoch": 0.83, + "learning_rate": 3.4010329695934135e-08, + "loss": 0.0004, + "step": 42794 + }, + { + "epoch": 0.83, + "learning_rate": 3.400644635159799e-08, + "loss": 0.0004, + "step": 42795 + }, + { + "epoch": 0.83, + "learning_rate": 3.400256300726185e-08, + "loss": 0.0003, + "step": 42796 + }, + { + "epoch": 0.83, + "learning_rate": 3.399867966292571e-08, + "loss": 0.0004, + "step": 42797 + }, + { + "epoch": 0.83, + "learning_rate": 3.399479631858957e-08, + "loss": 0.0007, + "step": 42798 + }, + { + "epoch": 0.83, + "learning_rate": 3.3990912974253426e-08, + "loss": 0.0004, + "step": 42799 + }, + { + "epoch": 0.83, + "learning_rate": 3.3987029629917284e-08, + "loss": 0.0004, + "step": 42800 + }, + { + "epoch": 0.83, + "learning_rate": 3.398314628558114e-08, + "loss": 0.0006, + "step": 42801 + }, + { + "epoch": 0.83, + "learning_rate": 3.3979262941244994e-08, + "loss": 0.0005, + "step": 42802 + }, + { + "epoch": 0.83, + "learning_rate": 3.397537959690885e-08, + "loss": 0.0455, + "step": 42803 + }, + { + "epoch": 0.83, + "learning_rate": 3.397149625257271e-08, + "loss": 0.0006, + "step": 42804 + }, + { + "epoch": 0.83, + "learning_rate": 3.396761290823657e-08, + "loss": 0.0005, + "step": 42805 + }, + { + "epoch": 0.83, + "learning_rate": 3.396372956390043e-08, + "loss": 0.0003, + "step": 42806 + }, + { + "epoch": 0.83, + "learning_rate": 3.3959846219564286e-08, + "loss": 0.0003, + "step": 42807 + }, + { + "epoch": 0.83, + "learning_rate": 3.3955962875228144e-08, + "loss": 0.0005, + "step": 42808 + }, + { + "epoch": 0.83, + "learning_rate": 3.3952079530892e-08, + "loss": 0.0003, + "step": 42809 + }, + { + "epoch": 0.83, + "learning_rate": 3.394819618655586e-08, + "loss": 0.0022, + "step": 42810 + }, + { + "epoch": 0.83, + "learning_rate": 3.394431284221972e-08, + "loss": 0.0003, + "step": 42811 + }, + { + "epoch": 0.83, + "learning_rate": 3.394042949788358e-08, + "loss": 0.0046, + "step": 42812 + }, + { + "epoch": 0.83, + "learning_rate": 3.3936546153547435e-08, + "loss": 0.0004, + "step": 42813 + }, + { + "epoch": 0.83, + "learning_rate": 3.393266280921129e-08, + "loss": 0.0003, + "step": 42814 + }, + { + "epoch": 0.83, + "learning_rate": 3.392877946487515e-08, + "loss": 0.0003, + "step": 42815 + }, + { + "epoch": 0.83, + "learning_rate": 3.392489612053901e-08, + "loss": 0.0003, + "step": 42816 + }, + { + "epoch": 0.83, + "learning_rate": 3.392101277620286e-08, + "loss": 0.0003, + "step": 42817 + }, + { + "epoch": 0.83, + "learning_rate": 3.391712943186672e-08, + "loss": 0.0004, + "step": 42818 + }, + { + "epoch": 0.83, + "learning_rate": 3.391324608753058e-08, + "loss": 0.0004, + "step": 42819 + }, + { + "epoch": 0.83, + "learning_rate": 3.3909362743194436e-08, + "loss": 0.0003, + "step": 42820 + }, + { + "epoch": 0.83, + "learning_rate": 3.3905479398858294e-08, + "loss": 0.0005, + "step": 42821 + }, + { + "epoch": 0.83, + "learning_rate": 3.390159605452215e-08, + "loss": 0.0004, + "step": 42822 + }, + { + "epoch": 0.83, + "learning_rate": 3.389771271018601e-08, + "loss": 0.0204, + "step": 42823 + }, + { + "epoch": 0.83, + "learning_rate": 3.389382936584987e-08, + "loss": 0.0003, + "step": 42824 + }, + { + "epoch": 0.83, + "learning_rate": 3.388994602151373e-08, + "loss": 0.0032, + "step": 42825 + }, + { + "epoch": 0.83, + "learning_rate": 3.3886062677177586e-08, + "loss": 0.0003, + "step": 42826 + }, + { + "epoch": 0.83, + "learning_rate": 3.3882179332841444e-08, + "loss": 0.0003, + "step": 42827 + }, + { + "epoch": 0.83, + "learning_rate": 3.38782959885053e-08, + "loss": 0.0006, + "step": 42828 + }, + { + "epoch": 0.83, + "learning_rate": 3.387441264416916e-08, + "loss": 0.0014, + "step": 42829 + }, + { + "epoch": 0.83, + "learning_rate": 3.387052929983302e-08, + "loss": 0.0008, + "step": 42830 + }, + { + "epoch": 0.83, + "learning_rate": 3.386664595549687e-08, + "loss": 0.0003, + "step": 42831 + }, + { + "epoch": 0.83, + "learning_rate": 3.386276261116073e-08, + "loss": 0.0013, + "step": 42832 + }, + { + "epoch": 0.83, + "learning_rate": 3.3858879266824587e-08, + "loss": 0.0004, + "step": 42833 + }, + { + "epoch": 0.83, + "learning_rate": 3.3854995922488445e-08, + "loss": 0.0004, + "step": 42834 + }, + { + "epoch": 0.83, + "learning_rate": 3.38511125781523e-08, + "loss": 0.0004, + "step": 42835 + }, + { + "epoch": 0.83, + "learning_rate": 3.384722923381616e-08, + "loss": 0.0004, + "step": 42836 + }, + { + "epoch": 0.83, + "learning_rate": 3.384334588948002e-08, + "loss": 0.0004, + "step": 42837 + }, + { + "epoch": 0.83, + "learning_rate": 3.383946254514388e-08, + "loss": 0.0004, + "step": 42838 + }, + { + "epoch": 0.83, + "learning_rate": 3.3835579200807736e-08, + "loss": 0.0002, + "step": 42839 + }, + { + "epoch": 0.83, + "learning_rate": 3.3831695856471594e-08, + "loss": 0.0005, + "step": 42840 + }, + { + "epoch": 0.83, + "learning_rate": 3.382781251213545e-08, + "loss": 0.0007, + "step": 42841 + }, + { + "epoch": 0.83, + "learning_rate": 3.382392916779931e-08, + "loss": 0.0003, + "step": 42842 + }, + { + "epoch": 0.83, + "learning_rate": 3.382004582346317e-08, + "loss": 0.0004, + "step": 42843 + }, + { + "epoch": 0.83, + "learning_rate": 3.381616247912703e-08, + "loss": 0.0008, + "step": 42844 + }, + { + "epoch": 0.83, + "learning_rate": 3.3812279134790886e-08, + "loss": 0.0004, + "step": 42845 + }, + { + "epoch": 0.83, + "learning_rate": 3.380839579045474e-08, + "loss": 0.0005, + "step": 42846 + }, + { + "epoch": 0.83, + "learning_rate": 3.3804512446118595e-08, + "loss": 0.6688, + "step": 42847 + }, + { + "epoch": 0.83, + "learning_rate": 3.3800629101782454e-08, + "loss": 0.0007, + "step": 42848 + }, + { + "epoch": 0.83, + "learning_rate": 3.379674575744631e-08, + "loss": 0.0003, + "step": 42849 + }, + { + "epoch": 0.83, + "learning_rate": 3.379286241311017e-08, + "loss": 0.0008, + "step": 42850 + }, + { + "epoch": 0.83, + "learning_rate": 3.378897906877403e-08, + "loss": 0.0003, + "step": 42851 + }, + { + "epoch": 0.83, + "learning_rate": 3.378509572443789e-08, + "loss": 0.0402, + "step": 42852 + }, + { + "epoch": 0.83, + "learning_rate": 3.3781212380101745e-08, + "loss": 0.0004, + "step": 42853 + }, + { + "epoch": 0.83, + "learning_rate": 3.37773290357656e-08, + "loss": 0.0004, + "step": 42854 + }, + { + "epoch": 0.83, + "learning_rate": 3.377344569142946e-08, + "loss": 0.0004, + "step": 42855 + }, + { + "epoch": 0.83, + "learning_rate": 3.376956234709332e-08, + "loss": 0.0004, + "step": 42856 + }, + { + "epoch": 0.83, + "learning_rate": 3.376567900275718e-08, + "loss": 0.0004, + "step": 42857 + }, + { + "epoch": 0.83, + "learning_rate": 3.376179565842103e-08, + "loss": 0.0007, + "step": 42858 + }, + { + "epoch": 0.83, + "learning_rate": 3.375791231408489e-08, + "loss": 0.0005, + "step": 42859 + }, + { + "epoch": 0.83, + "learning_rate": 3.3754028969748746e-08, + "loss": 0.1891, + "step": 42860 + }, + { + "epoch": 0.83, + "learning_rate": 3.3750145625412604e-08, + "loss": 0.0003, + "step": 42861 + }, + { + "epoch": 0.83, + "learning_rate": 3.374626228107646e-08, + "loss": 0.0004, + "step": 42862 + }, + { + "epoch": 0.83, + "learning_rate": 3.374237893674032e-08, + "loss": 0.0003, + "step": 42863 + }, + { + "epoch": 0.83, + "learning_rate": 3.373849559240418e-08, + "loss": 0.0003, + "step": 42864 + }, + { + "epoch": 0.83, + "learning_rate": 3.373461224806804e-08, + "loss": 0.0003, + "step": 42865 + }, + { + "epoch": 0.83, + "learning_rate": 3.373072890373189e-08, + "loss": 0.0005, + "step": 42866 + }, + { + "epoch": 0.83, + "learning_rate": 3.372684555939575e-08, + "loss": 0.0004, + "step": 42867 + }, + { + "epoch": 0.83, + "learning_rate": 3.3722962215059605e-08, + "loss": 0.0003, + "step": 42868 + }, + { + "epoch": 0.83, + "learning_rate": 3.3719078870723464e-08, + "loss": 0.0257, + "step": 42869 + }, + { + "epoch": 0.83, + "learning_rate": 3.371519552638732e-08, + "loss": 0.0004, + "step": 42870 + }, + { + "epoch": 0.83, + "learning_rate": 3.371131218205118e-08, + "loss": 0.0005, + "step": 42871 + }, + { + "epoch": 0.83, + "learning_rate": 3.370742883771504e-08, + "loss": 0.0004, + "step": 42872 + }, + { + "epoch": 0.83, + "learning_rate": 3.3703545493378897e-08, + "loss": 0.0005, + "step": 42873 + }, + { + "epoch": 0.83, + "learning_rate": 3.3699662149042755e-08, + "loss": 0.0006, + "step": 42874 + }, + { + "epoch": 0.83, + "learning_rate": 3.3695778804706606e-08, + "loss": 0.0002, + "step": 42875 + }, + { + "epoch": 0.83, + "learning_rate": 3.3691895460370465e-08, + "loss": 0.0027, + "step": 42876 + }, + { + "epoch": 0.83, + "learning_rate": 3.368801211603432e-08, + "loss": 0.0003, + "step": 42877 + }, + { + "epoch": 0.83, + "learning_rate": 3.368412877169818e-08, + "loss": 0.0004, + "step": 42878 + }, + { + "epoch": 0.83, + "learning_rate": 3.368024542736204e-08, + "loss": 0.0004, + "step": 42879 + }, + { + "epoch": 0.83, + "learning_rate": 3.36763620830259e-08, + "loss": 0.0006, + "step": 42880 + }, + { + "epoch": 0.83, + "learning_rate": 3.3672478738689756e-08, + "loss": 0.0003, + "step": 42881 + }, + { + "epoch": 0.83, + "learning_rate": 3.3668595394353614e-08, + "loss": 0.0005, + "step": 42882 + }, + { + "epoch": 0.83, + "learning_rate": 3.366471205001747e-08, + "loss": 0.0006, + "step": 42883 + }, + { + "epoch": 0.83, + "learning_rate": 3.366082870568133e-08, + "loss": 0.0003, + "step": 42884 + }, + { + "epoch": 0.83, + "learning_rate": 3.365694536134519e-08, + "loss": 0.0014, + "step": 42885 + }, + { + "epoch": 0.83, + "learning_rate": 3.365306201700905e-08, + "loss": 0.0008, + "step": 42886 + }, + { + "epoch": 0.83, + "learning_rate": 3.3649178672672905e-08, + "loss": 0.0003, + "step": 42887 + }, + { + "epoch": 0.83, + "learning_rate": 3.3645295328336764e-08, + "loss": 0.0003, + "step": 42888 + }, + { + "epoch": 0.83, + "learning_rate": 3.3641411984000615e-08, + "loss": 0.0005, + "step": 42889 + }, + { + "epoch": 0.83, + "learning_rate": 3.3637528639664474e-08, + "loss": 0.0007, + "step": 42890 + }, + { + "epoch": 0.83, + "learning_rate": 3.363364529532833e-08, + "loss": 0.0042, + "step": 42891 + }, + { + "epoch": 0.83, + "learning_rate": 3.362976195099219e-08, + "loss": 0.5696, + "step": 42892 + }, + { + "epoch": 0.83, + "learning_rate": 3.362587860665605e-08, + "loss": 0.0004, + "step": 42893 + }, + { + "epoch": 0.83, + "learning_rate": 3.3621995262319906e-08, + "loss": 0.1387, + "step": 42894 + }, + { + "epoch": 0.83, + "learning_rate": 3.3618111917983765e-08, + "loss": 0.0007, + "step": 42895 + }, + { + "epoch": 0.83, + "learning_rate": 3.361422857364762e-08, + "loss": 0.0004, + "step": 42896 + }, + { + "epoch": 0.83, + "learning_rate": 3.361034522931148e-08, + "loss": 0.0003, + "step": 42897 + }, + { + "epoch": 0.83, + "learning_rate": 3.360646188497534e-08, + "loss": 1.242, + "step": 42898 + }, + { + "epoch": 0.83, + "learning_rate": 3.36025785406392e-08, + "loss": 0.0003, + "step": 42899 + }, + { + "epoch": 0.83, + "learning_rate": 3.3598695196303056e-08, + "loss": 0.0004, + "step": 42900 + }, + { + "epoch": 0.83, + "learning_rate": 3.3594811851966914e-08, + "loss": 0.0004, + "step": 42901 + }, + { + "epoch": 0.83, + "learning_rate": 3.359092850763077e-08, + "loss": 0.0005, + "step": 42902 + }, + { + "epoch": 0.83, + "learning_rate": 3.358704516329463e-08, + "loss": 0.0005, + "step": 42903 + }, + { + "epoch": 0.83, + "learning_rate": 3.358316181895848e-08, + "loss": 0.0003, + "step": 42904 + }, + { + "epoch": 0.83, + "learning_rate": 3.357927847462234e-08, + "loss": 0.0005, + "step": 42905 + }, + { + "epoch": 0.83, + "learning_rate": 3.35753951302862e-08, + "loss": 0.0004, + "step": 42906 + }, + { + "epoch": 0.83, + "learning_rate": 3.357151178595006e-08, + "loss": 0.0003, + "step": 42907 + }, + { + "epoch": 0.83, + "learning_rate": 3.3567628441613915e-08, + "loss": 0.0005, + "step": 42908 + }, + { + "epoch": 0.83, + "learning_rate": 3.3563745097277774e-08, + "loss": 0.0003, + "step": 42909 + }, + { + "epoch": 0.83, + "learning_rate": 3.355986175294163e-08, + "loss": 0.0005, + "step": 42910 + }, + { + "epoch": 0.83, + "learning_rate": 3.355597840860549e-08, + "loss": 0.0004, + "step": 42911 + }, + { + "epoch": 0.83, + "learning_rate": 3.355209506426935e-08, + "loss": 0.718, + "step": 42912 + }, + { + "epoch": 0.83, + "learning_rate": 3.3548211719933207e-08, + "loss": 0.0003, + "step": 42913 + }, + { + "epoch": 0.83, + "learning_rate": 3.3544328375597065e-08, + "loss": 0.0013, + "step": 42914 + }, + { + "epoch": 0.83, + "learning_rate": 3.354044503126092e-08, + "loss": 0.0006, + "step": 42915 + }, + { + "epoch": 0.83, + "learning_rate": 3.353656168692478e-08, + "loss": 0.0004, + "step": 42916 + }, + { + "epoch": 0.83, + "learning_rate": 3.353267834258864e-08, + "loss": 0.0047, + "step": 42917 + }, + { + "epoch": 0.83, + "learning_rate": 3.352879499825249e-08, + "loss": 0.0005, + "step": 42918 + }, + { + "epoch": 0.83, + "learning_rate": 3.352491165391635e-08, + "loss": 0.0006, + "step": 42919 + }, + { + "epoch": 0.83, + "learning_rate": 3.352102830958021e-08, + "loss": 0.0003, + "step": 42920 + }, + { + "epoch": 0.83, + "learning_rate": 3.3517144965244066e-08, + "loss": 0.0005, + "step": 42921 + }, + { + "epoch": 0.83, + "learning_rate": 3.3513261620907924e-08, + "loss": 0.0004, + "step": 42922 + }, + { + "epoch": 0.83, + "learning_rate": 3.350937827657178e-08, + "loss": 0.0004, + "step": 42923 + }, + { + "epoch": 0.83, + "learning_rate": 3.350549493223564e-08, + "loss": 0.0005, + "step": 42924 + }, + { + "epoch": 0.83, + "learning_rate": 3.35016115878995e-08, + "loss": 0.0005, + "step": 42925 + }, + { + "epoch": 0.83, + "learning_rate": 3.349772824356336e-08, + "loss": 0.0003, + "step": 42926 + }, + { + "epoch": 0.83, + "learning_rate": 3.3493844899227215e-08, + "loss": 0.0005, + "step": 42927 + }, + { + "epoch": 0.83, + "learning_rate": 3.3489961554891074e-08, + "loss": 0.0003, + "step": 42928 + }, + { + "epoch": 0.83, + "learning_rate": 3.348607821055493e-08, + "loss": 0.0004, + "step": 42929 + }, + { + "epoch": 0.83, + "learning_rate": 3.348219486621879e-08, + "loss": 0.0022, + "step": 42930 + }, + { + "epoch": 0.83, + "learning_rate": 3.347831152188265e-08, + "loss": 0.0004, + "step": 42931 + }, + { + "epoch": 0.83, + "learning_rate": 3.3474428177546507e-08, + "loss": 0.001, + "step": 42932 + }, + { + "epoch": 0.83, + "learning_rate": 3.347054483321036e-08, + "loss": 0.0003, + "step": 42933 + }, + { + "epoch": 0.83, + "learning_rate": 3.3466661488874216e-08, + "loss": 0.0003, + "step": 42934 + }, + { + "epoch": 0.83, + "learning_rate": 3.3462778144538075e-08, + "loss": 0.0005, + "step": 42935 + }, + { + "epoch": 0.83, + "learning_rate": 3.345889480020193e-08, + "loss": 0.0003, + "step": 42936 + }, + { + "epoch": 0.83, + "learning_rate": 3.345501145586579e-08, + "loss": 0.0004, + "step": 42937 + }, + { + "epoch": 0.83, + "learning_rate": 3.345112811152965e-08, + "loss": 0.0006, + "step": 42938 + }, + { + "epoch": 0.83, + "learning_rate": 3.344724476719351e-08, + "loss": 0.0004, + "step": 42939 + }, + { + "epoch": 0.83, + "learning_rate": 3.3443361422857366e-08, + "loss": 0.0003, + "step": 42940 + }, + { + "epoch": 0.83, + "learning_rate": 3.3439478078521224e-08, + "loss": 0.0004, + "step": 42941 + }, + { + "epoch": 0.83, + "learning_rate": 3.343559473418508e-08, + "loss": 0.0319, + "step": 42942 + }, + { + "epoch": 0.83, + "learning_rate": 3.343171138984894e-08, + "loss": 0.0004, + "step": 42943 + }, + { + "epoch": 0.83, + "learning_rate": 3.34278280455128e-08, + "loss": 0.0004, + "step": 42944 + }, + { + "epoch": 0.83, + "learning_rate": 3.342394470117666e-08, + "loss": 0.0006, + "step": 42945 + }, + { + "epoch": 0.83, + "learning_rate": 3.3420061356840515e-08, + "loss": 0.0004, + "step": 42946 + }, + { + "epoch": 0.83, + "learning_rate": 3.341617801250437e-08, + "loss": 0.0003, + "step": 42947 + }, + { + "epoch": 0.83, + "learning_rate": 3.3412294668168225e-08, + "loss": 0.0003, + "step": 42948 + }, + { + "epoch": 0.83, + "learning_rate": 3.3408411323832083e-08, + "loss": 0.0005, + "step": 42949 + }, + { + "epoch": 0.83, + "learning_rate": 3.340452797949594e-08, + "loss": 0.0005, + "step": 42950 + }, + { + "epoch": 0.83, + "learning_rate": 3.34006446351598e-08, + "loss": 0.0005, + "step": 42951 + }, + { + "epoch": 0.83, + "learning_rate": 3.339676129082366e-08, + "loss": 0.0003, + "step": 42952 + }, + { + "epoch": 0.83, + "learning_rate": 3.3392877946487516e-08, + "loss": 0.0004, + "step": 42953 + }, + { + "epoch": 0.83, + "learning_rate": 3.338899460215137e-08, + "loss": 0.0003, + "step": 42954 + }, + { + "epoch": 0.83, + "learning_rate": 3.3385111257815226e-08, + "loss": 0.7564, + "step": 42955 + }, + { + "epoch": 0.83, + "learning_rate": 3.3381227913479085e-08, + "loss": 0.5171, + "step": 42956 + }, + { + "epoch": 0.83, + "learning_rate": 3.337734456914294e-08, + "loss": 0.0003, + "step": 42957 + }, + { + "epoch": 0.83, + "learning_rate": 3.33734612248068e-08, + "loss": 0.1717, + "step": 42958 + }, + { + "epoch": 0.83, + "learning_rate": 3.336957788047066e-08, + "loss": 0.0004, + "step": 42959 + }, + { + "epoch": 0.83, + "learning_rate": 3.336569453613452e-08, + "loss": 0.0002, + "step": 42960 + }, + { + "epoch": 0.83, + "learning_rate": 3.3361811191798376e-08, + "loss": 0.308, + "step": 42961 + }, + { + "epoch": 0.83, + "learning_rate": 3.335792784746223e-08, + "loss": 0.0006, + "step": 42962 + }, + { + "epoch": 0.83, + "learning_rate": 3.3354044503126086e-08, + "loss": 0.0003, + "step": 42963 + }, + { + "epoch": 0.83, + "learning_rate": 3.3350161158789944e-08, + "loss": 0.001, + "step": 42964 + }, + { + "epoch": 0.83, + "learning_rate": 3.33462778144538e-08, + "loss": 0.0004, + "step": 42965 + }, + { + "epoch": 0.83, + "learning_rate": 3.334239447011766e-08, + "loss": 0.0005, + "step": 42966 + }, + { + "epoch": 0.83, + "learning_rate": 3.333851112578152e-08, + "loss": 0.0002, + "step": 42967 + }, + { + "epoch": 0.83, + "learning_rate": 3.333462778144538e-08, + "loss": 0.5721, + "step": 42968 + }, + { + "epoch": 0.83, + "learning_rate": 3.3330744437109235e-08, + "loss": 0.0004, + "step": 42969 + }, + { + "epoch": 0.83, + "learning_rate": 3.3326861092773093e-08, + "loss": 0.0004, + "step": 42970 + }, + { + "epoch": 0.83, + "learning_rate": 3.332297774843695e-08, + "loss": 0.0007, + "step": 42971 + }, + { + "epoch": 0.83, + "learning_rate": 3.331909440410081e-08, + "loss": 0.0004, + "step": 42972 + }, + { + "epoch": 0.83, + "learning_rate": 3.331521105976467e-08, + "loss": 0.0005, + "step": 42973 + }, + { + "epoch": 0.83, + "learning_rate": 3.3311327715428526e-08, + "loss": 0.0006, + "step": 42974 + }, + { + "epoch": 0.83, + "learning_rate": 3.3307444371092385e-08, + "loss": 0.0003, + "step": 42975 + }, + { + "epoch": 0.83, + "learning_rate": 3.3303561026756236e-08, + "loss": 0.0003, + "step": 42976 + }, + { + "epoch": 0.83, + "learning_rate": 3.3299677682420094e-08, + "loss": 0.0004, + "step": 42977 + }, + { + "epoch": 0.83, + "learning_rate": 3.329579433808395e-08, + "loss": 0.0006, + "step": 42978 + }, + { + "epoch": 0.83, + "learning_rate": 3.329191099374781e-08, + "loss": 0.0024, + "step": 42979 + }, + { + "epoch": 0.83, + "learning_rate": 3.328802764941167e-08, + "loss": 0.0003, + "step": 42980 + }, + { + "epoch": 0.83, + "learning_rate": 3.328414430507553e-08, + "loss": 0.0008, + "step": 42981 + }, + { + "epoch": 0.83, + "learning_rate": 3.3280260960739386e-08, + "loss": 0.0015, + "step": 42982 + }, + { + "epoch": 0.83, + "learning_rate": 3.3276377616403244e-08, + "loss": 0.0005, + "step": 42983 + }, + { + "epoch": 0.83, + "learning_rate": 3.32724942720671e-08, + "loss": 0.0004, + "step": 42984 + }, + { + "epoch": 0.83, + "learning_rate": 3.326861092773096e-08, + "loss": 0.0006, + "step": 42985 + }, + { + "epoch": 0.83, + "learning_rate": 3.326472758339482e-08, + "loss": 0.0005, + "step": 42986 + }, + { + "epoch": 0.83, + "learning_rate": 3.326084423905868e-08, + "loss": 0.0004, + "step": 42987 + }, + { + "epoch": 0.83, + "learning_rate": 3.3256960894722535e-08, + "loss": 0.0005, + "step": 42988 + }, + { + "epoch": 0.83, + "learning_rate": 3.3253077550386393e-08, + "loss": 0.0004, + "step": 42989 + }, + { + "epoch": 0.83, + "learning_rate": 3.324919420605025e-08, + "loss": 0.0424, + "step": 42990 + }, + { + "epoch": 0.83, + "learning_rate": 3.32453108617141e-08, + "loss": 0.0006, + "step": 42991 + }, + { + "epoch": 0.83, + "learning_rate": 3.324142751737796e-08, + "loss": 0.4361, + "step": 42992 + }, + { + "epoch": 0.83, + "learning_rate": 3.323754417304182e-08, + "loss": 0.0003, + "step": 42993 + }, + { + "epoch": 0.83, + "learning_rate": 3.323366082870568e-08, + "loss": 0.0004, + "step": 42994 + }, + { + "epoch": 0.83, + "learning_rate": 3.3229777484369536e-08, + "loss": 0.0004, + "step": 42995 + }, + { + "epoch": 0.83, + "learning_rate": 3.3225894140033394e-08, + "loss": 0.0005, + "step": 42996 + }, + { + "epoch": 0.83, + "learning_rate": 3.322201079569725e-08, + "loss": 0.0004, + "step": 42997 + }, + { + "epoch": 0.83, + "learning_rate": 3.321812745136111e-08, + "loss": 0.8528, + "step": 42998 + }, + { + "epoch": 0.83, + "learning_rate": 3.321424410702497e-08, + "loss": 0.0004, + "step": 42999 + }, + { + "epoch": 0.83, + "learning_rate": 3.321036076268883e-08, + "loss": 0.0004, + "step": 43000 + }, + { + "epoch": 0.83, + "learning_rate": 3.3206477418352686e-08, + "loss": 0.0003, + "step": 43001 + }, + { + "epoch": 0.83, + "learning_rate": 3.3202594074016544e-08, + "loss": 0.0011, + "step": 43002 + }, + { + "epoch": 0.83, + "learning_rate": 3.31987107296804e-08, + "loss": 0.0005, + "step": 43003 + }, + { + "epoch": 0.83, + "learning_rate": 3.319482738534426e-08, + "loss": 0.0004, + "step": 43004 + }, + { + "epoch": 0.83, + "learning_rate": 3.319094404100811e-08, + "loss": 0.0004, + "step": 43005 + }, + { + "epoch": 0.83, + "learning_rate": 3.318706069667197e-08, + "loss": 1.2063, + "step": 43006 + }, + { + "epoch": 0.83, + "learning_rate": 3.318317735233583e-08, + "loss": 0.0006, + "step": 43007 + }, + { + "epoch": 0.83, + "learning_rate": 3.317929400799969e-08, + "loss": 0.0004, + "step": 43008 + }, + { + "epoch": 0.83, + "learning_rate": 3.3175410663663545e-08, + "loss": 0.0003, + "step": 43009 + }, + { + "epoch": 0.83, + "learning_rate": 3.31715273193274e-08, + "loss": 0.8063, + "step": 43010 + }, + { + "epoch": 0.83, + "learning_rate": 3.316764397499126e-08, + "loss": 0.0005, + "step": 43011 + }, + { + "epoch": 0.83, + "learning_rate": 3.316376063065512e-08, + "loss": 0.0004, + "step": 43012 + }, + { + "epoch": 0.83, + "learning_rate": 3.315987728631898e-08, + "loss": 0.0006, + "step": 43013 + }, + { + "epoch": 0.83, + "learning_rate": 3.3155993941982836e-08, + "loss": 0.0017, + "step": 43014 + }, + { + "epoch": 0.83, + "learning_rate": 3.3152110597646695e-08, + "loss": 0.0004, + "step": 43015 + }, + { + "epoch": 0.83, + "learning_rate": 3.314822725331055e-08, + "loss": 0.0003, + "step": 43016 + }, + { + "epoch": 0.83, + "learning_rate": 3.314434390897441e-08, + "loss": 0.0003, + "step": 43017 + }, + { + "epoch": 0.83, + "learning_rate": 3.314046056463827e-08, + "loss": 0.0004, + "step": 43018 + }, + { + "epoch": 0.83, + "learning_rate": 3.313657722030213e-08, + "loss": 0.0004, + "step": 43019 + }, + { + "epoch": 0.83, + "learning_rate": 3.313269387596598e-08, + "loss": 0.0003, + "step": 43020 + }, + { + "epoch": 0.83, + "learning_rate": 3.312881053162984e-08, + "loss": 0.0006, + "step": 43021 + }, + { + "epoch": 0.83, + "learning_rate": 3.3124927187293696e-08, + "loss": 0.0003, + "step": 43022 + }, + { + "epoch": 0.83, + "learning_rate": 3.3121043842957554e-08, + "loss": 0.0004, + "step": 43023 + }, + { + "epoch": 0.83, + "learning_rate": 3.311716049862141e-08, + "loss": 0.0003, + "step": 43024 + }, + { + "epoch": 0.83, + "learning_rate": 3.311327715428527e-08, + "loss": 0.0003, + "step": 43025 + }, + { + "epoch": 0.83, + "learning_rate": 3.310939380994913e-08, + "loss": 0.0003, + "step": 43026 + }, + { + "epoch": 0.83, + "learning_rate": 3.310551046561299e-08, + "loss": 0.0004, + "step": 43027 + }, + { + "epoch": 0.83, + "learning_rate": 3.3101627121276845e-08, + "loss": 0.0007, + "step": 43028 + }, + { + "epoch": 0.83, + "learning_rate": 3.30977437769407e-08, + "loss": 0.0005, + "step": 43029 + }, + { + "epoch": 0.83, + "learning_rate": 3.309386043260456e-08, + "loss": 0.0004, + "step": 43030 + }, + { + "epoch": 0.83, + "learning_rate": 3.308997708826842e-08, + "loss": 0.0008, + "step": 43031 + }, + { + "epoch": 0.83, + "learning_rate": 3.308609374393228e-08, + "loss": 0.0004, + "step": 43032 + }, + { + "epoch": 0.83, + "learning_rate": 3.3082210399596136e-08, + "loss": 0.0003, + "step": 43033 + }, + { + "epoch": 0.83, + "learning_rate": 3.307832705525999e-08, + "loss": 0.0004, + "step": 43034 + }, + { + "epoch": 0.83, + "learning_rate": 3.3074443710923846e-08, + "loss": 0.0003, + "step": 43035 + }, + { + "epoch": 0.83, + "learning_rate": 3.3070560366587704e-08, + "loss": 0.0003, + "step": 43036 + }, + { + "epoch": 0.83, + "learning_rate": 3.306667702225156e-08, + "loss": 0.0011, + "step": 43037 + }, + { + "epoch": 0.83, + "learning_rate": 3.306279367791542e-08, + "loss": 0.0004, + "step": 43038 + }, + { + "epoch": 0.83, + "learning_rate": 3.305891033357928e-08, + "loss": 0.0004, + "step": 43039 + }, + { + "epoch": 0.83, + "learning_rate": 3.305502698924314e-08, + "loss": 0.0004, + "step": 43040 + }, + { + "epoch": 0.83, + "learning_rate": 3.3051143644906996e-08, + "loss": 0.0006, + "step": 43041 + }, + { + "epoch": 0.83, + "learning_rate": 3.3047260300570854e-08, + "loss": 0.0004, + "step": 43042 + }, + { + "epoch": 0.83, + "learning_rate": 3.3043376956234705e-08, + "loss": 0.0003, + "step": 43043 + }, + { + "epoch": 0.83, + "learning_rate": 3.3039493611898564e-08, + "loss": 0.0006, + "step": 43044 + }, + { + "epoch": 0.83, + "learning_rate": 3.303561026756242e-08, + "loss": 0.0005, + "step": 43045 + }, + { + "epoch": 0.84, + "learning_rate": 3.303172692322628e-08, + "loss": 0.0004, + "step": 43046 + }, + { + "epoch": 0.84, + "learning_rate": 3.302784357889014e-08, + "loss": 0.0003, + "step": 43047 + }, + { + "epoch": 0.84, + "learning_rate": 3.3023960234554e-08, + "loss": 0.0006, + "step": 43048 + }, + { + "epoch": 0.84, + "learning_rate": 3.3020076890217855e-08, + "loss": 0.0004, + "step": 43049 + }, + { + "epoch": 0.84, + "learning_rate": 3.3016193545881707e-08, + "loss": 0.0007, + "step": 43050 + }, + { + "epoch": 0.84, + "learning_rate": 3.3012310201545565e-08, + "loss": 0.0004, + "step": 43051 + }, + { + "epoch": 0.84, + "learning_rate": 3.300842685720942e-08, + "loss": 0.0004, + "step": 43052 + }, + { + "epoch": 0.84, + "learning_rate": 3.300454351287328e-08, + "loss": 0.0004, + "step": 43053 + }, + { + "epoch": 0.84, + "learning_rate": 3.300066016853714e-08, + "loss": 0.0005, + "step": 43054 + }, + { + "epoch": 0.84, + "learning_rate": 3.2996776824201e-08, + "loss": 0.0004, + "step": 43055 + }, + { + "epoch": 0.84, + "learning_rate": 3.2992893479864856e-08, + "loss": 0.0004, + "step": 43056 + }, + { + "epoch": 0.84, + "learning_rate": 3.2989010135528714e-08, + "loss": 0.0004, + "step": 43057 + }, + { + "epoch": 0.84, + "learning_rate": 3.298512679119257e-08, + "loss": 0.0004, + "step": 43058 + }, + { + "epoch": 0.84, + "learning_rate": 3.298124344685643e-08, + "loss": 0.0016, + "step": 43059 + }, + { + "epoch": 0.84, + "learning_rate": 3.297736010252029e-08, + "loss": 0.0004, + "step": 43060 + }, + { + "epoch": 0.84, + "learning_rate": 3.297347675818415e-08, + "loss": 0.0006, + "step": 43061 + }, + { + "epoch": 0.84, + "learning_rate": 3.2969593413848006e-08, + "loss": 0.0004, + "step": 43062 + }, + { + "epoch": 0.84, + "learning_rate": 3.296571006951186e-08, + "loss": 0.0006, + "step": 43063 + }, + { + "epoch": 0.84, + "learning_rate": 3.2961826725175715e-08, + "loss": 0.0098, + "step": 43064 + }, + { + "epoch": 0.84, + "learning_rate": 3.2957943380839574e-08, + "loss": 0.0004, + "step": 43065 + }, + { + "epoch": 0.84, + "learning_rate": 3.295406003650343e-08, + "loss": 0.0004, + "step": 43066 + }, + { + "epoch": 0.84, + "learning_rate": 3.295017669216729e-08, + "loss": 0.0006, + "step": 43067 + }, + { + "epoch": 0.84, + "learning_rate": 3.294629334783115e-08, + "loss": 1.0942, + "step": 43068 + }, + { + "epoch": 0.84, + "learning_rate": 3.2942410003495007e-08, + "loss": 0.0004, + "step": 43069 + }, + { + "epoch": 0.84, + "learning_rate": 3.2938526659158865e-08, + "loss": 0.0084, + "step": 43070 + }, + { + "epoch": 0.84, + "learning_rate": 3.293464331482272e-08, + "loss": 0.0008, + "step": 43071 + }, + { + "epoch": 0.84, + "learning_rate": 3.293075997048658e-08, + "loss": 0.0005, + "step": 43072 + }, + { + "epoch": 0.84, + "learning_rate": 3.292687662615044e-08, + "loss": 0.0005, + "step": 43073 + }, + { + "epoch": 0.84, + "learning_rate": 3.29229932818143e-08, + "loss": 0.0191, + "step": 43074 + }, + { + "epoch": 0.84, + "learning_rate": 3.2919109937478156e-08, + "loss": 0.0004, + "step": 43075 + }, + { + "epoch": 0.84, + "learning_rate": 3.2915226593142014e-08, + "loss": 0.0004, + "step": 43076 + }, + { + "epoch": 0.84, + "learning_rate": 3.291134324880587e-08, + "loss": 0.0226, + "step": 43077 + }, + { + "epoch": 0.84, + "learning_rate": 3.2907459904469724e-08, + "loss": 0.0003, + "step": 43078 + }, + { + "epoch": 0.84, + "learning_rate": 3.290357656013358e-08, + "loss": 0.0006, + "step": 43079 + }, + { + "epoch": 0.84, + "learning_rate": 3.289969321579744e-08, + "loss": 0.0002, + "step": 43080 + }, + { + "epoch": 0.84, + "learning_rate": 3.28958098714613e-08, + "loss": 0.0007, + "step": 43081 + }, + { + "epoch": 0.84, + "learning_rate": 3.289192652712516e-08, + "loss": 0.0004, + "step": 43082 + }, + { + "epoch": 0.84, + "learning_rate": 3.2888043182789015e-08, + "loss": 0.0006, + "step": 43083 + }, + { + "epoch": 0.84, + "learning_rate": 3.2884159838452874e-08, + "loss": 0.0004, + "step": 43084 + }, + { + "epoch": 0.84, + "learning_rate": 3.288027649411673e-08, + "loss": 0.0003, + "step": 43085 + }, + { + "epoch": 0.84, + "learning_rate": 3.287639314978059e-08, + "loss": 0.0004, + "step": 43086 + }, + { + "epoch": 0.84, + "learning_rate": 3.287250980544445e-08, + "loss": 0.0005, + "step": 43087 + }, + { + "epoch": 0.84, + "learning_rate": 3.2868626461108307e-08, + "loss": 0.0004, + "step": 43088 + }, + { + "epoch": 0.84, + "learning_rate": 3.2864743116772165e-08, + "loss": 0.0003, + "step": 43089 + }, + { + "epoch": 0.84, + "learning_rate": 3.286085977243602e-08, + "loss": 0.0004, + "step": 43090 + }, + { + "epoch": 0.84, + "learning_rate": 3.285697642809988e-08, + "loss": 0.0003, + "step": 43091 + }, + { + "epoch": 0.84, + "learning_rate": 3.285309308376373e-08, + "loss": 0.0005, + "step": 43092 + }, + { + "epoch": 0.84, + "learning_rate": 3.284920973942759e-08, + "loss": 0.0177, + "step": 43093 + }, + { + "epoch": 0.84, + "learning_rate": 3.284532639509145e-08, + "loss": 0.0004, + "step": 43094 + }, + { + "epoch": 0.84, + "learning_rate": 3.284144305075531e-08, + "loss": 0.0004, + "step": 43095 + }, + { + "epoch": 0.84, + "learning_rate": 3.2837559706419166e-08, + "loss": 0.0007, + "step": 43096 + }, + { + "epoch": 0.84, + "learning_rate": 3.2833676362083024e-08, + "loss": 0.0004, + "step": 43097 + }, + { + "epoch": 0.84, + "learning_rate": 3.282979301774688e-08, + "loss": 0.0004, + "step": 43098 + }, + { + "epoch": 0.84, + "learning_rate": 3.282590967341074e-08, + "loss": 0.0028, + "step": 43099 + }, + { + "epoch": 0.84, + "learning_rate": 3.28220263290746e-08, + "loss": 0.0004, + "step": 43100 + }, + { + "epoch": 0.84, + "learning_rate": 3.281814298473846e-08, + "loss": 0.8398, + "step": 43101 + }, + { + "epoch": 0.84, + "learning_rate": 3.2814259640402315e-08, + "loss": 0.0005, + "step": 43102 + }, + { + "epoch": 0.84, + "learning_rate": 3.2810376296066174e-08, + "loss": 0.0005, + "step": 43103 + }, + { + "epoch": 0.84, + "learning_rate": 3.280649295173003e-08, + "loss": 0.0003, + "step": 43104 + }, + { + "epoch": 0.84, + "learning_rate": 3.280260960739389e-08, + "loss": 0.0005, + "step": 43105 + }, + { + "epoch": 0.84, + "learning_rate": 3.279872626305775e-08, + "loss": 0.0003, + "step": 43106 + }, + { + "epoch": 0.84, + "learning_rate": 3.27948429187216e-08, + "loss": 0.0005, + "step": 43107 + }, + { + "epoch": 0.84, + "learning_rate": 3.279095957438546e-08, + "loss": 0.0002, + "step": 43108 + }, + { + "epoch": 0.84, + "learning_rate": 3.2787076230049317e-08, + "loss": 0.0004, + "step": 43109 + }, + { + "epoch": 0.84, + "learning_rate": 3.2783192885713175e-08, + "loss": 0.0004, + "step": 43110 + }, + { + "epoch": 0.84, + "learning_rate": 3.277930954137703e-08, + "loss": 0.0088, + "step": 43111 + }, + { + "epoch": 0.84, + "learning_rate": 3.277542619704089e-08, + "loss": 0.0006, + "step": 43112 + }, + { + "epoch": 0.84, + "learning_rate": 3.277154285270475e-08, + "loss": 0.0003, + "step": 43113 + }, + { + "epoch": 0.84, + "learning_rate": 3.276765950836861e-08, + "loss": 0.0004, + "step": 43114 + }, + { + "epoch": 0.84, + "learning_rate": 3.2763776164032466e-08, + "loss": 0.0006, + "step": 43115 + }, + { + "epoch": 0.84, + "learning_rate": 3.2759892819696324e-08, + "loss": 0.0913, + "step": 43116 + }, + { + "epoch": 0.84, + "learning_rate": 3.275600947536018e-08, + "loss": 0.0004, + "step": 43117 + }, + { + "epoch": 0.84, + "learning_rate": 3.275212613102404e-08, + "loss": 0.0005, + "step": 43118 + }, + { + "epoch": 0.84, + "learning_rate": 3.27482427866879e-08, + "loss": 0.0004, + "step": 43119 + }, + { + "epoch": 0.84, + "learning_rate": 3.274435944235176e-08, + "loss": 0.0009, + "step": 43120 + }, + { + "epoch": 0.84, + "learning_rate": 3.274047609801561e-08, + "loss": 0.0006, + "step": 43121 + }, + { + "epoch": 0.84, + "learning_rate": 3.273659275367947e-08, + "loss": 0.0003, + "step": 43122 + }, + { + "epoch": 0.84, + "learning_rate": 3.2732709409343325e-08, + "loss": 0.0003, + "step": 43123 + }, + { + "epoch": 0.84, + "learning_rate": 3.2728826065007184e-08, + "loss": 0.2291, + "step": 43124 + }, + { + "epoch": 0.84, + "learning_rate": 3.272494272067104e-08, + "loss": 0.11, + "step": 43125 + }, + { + "epoch": 0.84, + "learning_rate": 3.27210593763349e-08, + "loss": 0.0004, + "step": 43126 + }, + { + "epoch": 0.84, + "learning_rate": 3.271717603199876e-08, + "loss": 0.0025, + "step": 43127 + }, + { + "epoch": 0.84, + "learning_rate": 3.2713292687662617e-08, + "loss": 0.0003, + "step": 43128 + }, + { + "epoch": 0.84, + "learning_rate": 3.2709409343326475e-08, + "loss": 0.0004, + "step": 43129 + }, + { + "epoch": 0.84, + "learning_rate": 3.270552599899033e-08, + "loss": 0.0003, + "step": 43130 + }, + { + "epoch": 0.84, + "learning_rate": 3.2701642654654185e-08, + "loss": 0.0004, + "step": 43131 + }, + { + "epoch": 0.84, + "learning_rate": 3.269775931031804e-08, + "loss": 0.0005, + "step": 43132 + }, + { + "epoch": 0.84, + "learning_rate": 3.26938759659819e-08, + "loss": 0.0007, + "step": 43133 + }, + { + "epoch": 0.84, + "learning_rate": 3.268999262164576e-08, + "loss": 0.0004, + "step": 43134 + }, + { + "epoch": 0.84, + "learning_rate": 3.268610927730962e-08, + "loss": 0.0004, + "step": 43135 + }, + { + "epoch": 0.84, + "learning_rate": 3.2682225932973476e-08, + "loss": 0.0005, + "step": 43136 + }, + { + "epoch": 0.84, + "learning_rate": 3.2678342588637334e-08, + "loss": 0.0004, + "step": 43137 + }, + { + "epoch": 0.84, + "learning_rate": 3.2674459244301186e-08, + "loss": 0.0009, + "step": 43138 + }, + { + "epoch": 0.84, + "learning_rate": 3.2670575899965044e-08, + "loss": 0.0003, + "step": 43139 + }, + { + "epoch": 0.84, + "learning_rate": 3.26666925556289e-08, + "loss": 0.0004, + "step": 43140 + }, + { + "epoch": 0.84, + "learning_rate": 3.266280921129276e-08, + "loss": 0.0003, + "step": 43141 + }, + { + "epoch": 0.84, + "learning_rate": 3.265892586695662e-08, + "loss": 0.0004, + "step": 43142 + }, + { + "epoch": 0.84, + "learning_rate": 3.265504252262048e-08, + "loss": 0.0006, + "step": 43143 + }, + { + "epoch": 0.84, + "learning_rate": 3.2651159178284335e-08, + "loss": 0.0005, + "step": 43144 + }, + { + "epoch": 0.84, + "learning_rate": 3.2647275833948193e-08, + "loss": 0.0004, + "step": 43145 + }, + { + "epoch": 0.84, + "learning_rate": 3.264339248961205e-08, + "loss": 0.0003, + "step": 43146 + }, + { + "epoch": 0.84, + "learning_rate": 3.263950914527591e-08, + "loss": 0.0008, + "step": 43147 + }, + { + "epoch": 0.84, + "learning_rate": 3.263562580093977e-08, + "loss": 0.0002, + "step": 43148 + }, + { + "epoch": 0.84, + "learning_rate": 3.2631742456603626e-08, + "loss": 0.0004, + "step": 43149 + }, + { + "epoch": 0.84, + "learning_rate": 3.262785911226748e-08, + "loss": 0.0004, + "step": 43150 + }, + { + "epoch": 0.84, + "learning_rate": 3.2623975767931336e-08, + "loss": 0.0003, + "step": 43151 + }, + { + "epoch": 0.84, + "learning_rate": 3.2620092423595195e-08, + "loss": 0.0005, + "step": 43152 + }, + { + "epoch": 0.84, + "learning_rate": 3.261620907925905e-08, + "loss": 0.0009, + "step": 43153 + }, + { + "epoch": 0.84, + "learning_rate": 3.261232573492291e-08, + "loss": 0.0004, + "step": 43154 + }, + { + "epoch": 0.84, + "learning_rate": 3.260844239058677e-08, + "loss": 0.0005, + "step": 43155 + }, + { + "epoch": 0.84, + "learning_rate": 3.260455904625063e-08, + "loss": 0.0006, + "step": 43156 + }, + { + "epoch": 0.84, + "learning_rate": 3.2600675701914486e-08, + "loss": 0.0004, + "step": 43157 + }, + { + "epoch": 0.84, + "learning_rate": 3.2596792357578344e-08, + "loss": 0.0006, + "step": 43158 + }, + { + "epoch": 0.84, + "learning_rate": 3.25929090132422e-08, + "loss": 0.6168, + "step": 43159 + }, + { + "epoch": 0.84, + "learning_rate": 3.258902566890606e-08, + "loss": 0.0006, + "step": 43160 + }, + { + "epoch": 0.84, + "learning_rate": 3.258514232456992e-08, + "loss": 0.0004, + "step": 43161 + }, + { + "epoch": 0.84, + "learning_rate": 3.258125898023378e-08, + "loss": 1.0448, + "step": 43162 + }, + { + "epoch": 0.84, + "learning_rate": 3.2577375635897635e-08, + "loss": 0.0005, + "step": 43163 + }, + { + "epoch": 0.84, + "learning_rate": 3.2573492291561493e-08, + "loss": 0.0004, + "step": 43164 + }, + { + "epoch": 0.84, + "learning_rate": 3.2569608947225345e-08, + "loss": 0.0005, + "step": 43165 + }, + { + "epoch": 0.84, + "learning_rate": 3.2565725602889203e-08, + "loss": 0.0003, + "step": 43166 + }, + { + "epoch": 0.84, + "learning_rate": 3.256184225855306e-08, + "loss": 0.0005, + "step": 43167 + }, + { + "epoch": 0.84, + "learning_rate": 3.255795891421692e-08, + "loss": 0.0003, + "step": 43168 + }, + { + "epoch": 0.84, + "learning_rate": 3.255407556988078e-08, + "loss": 0.0004, + "step": 43169 + }, + { + "epoch": 0.84, + "learning_rate": 3.2550192225544636e-08, + "loss": 0.0015, + "step": 43170 + }, + { + "epoch": 0.84, + "learning_rate": 3.2546308881208495e-08, + "loss": 0.0003, + "step": 43171 + }, + { + "epoch": 0.84, + "learning_rate": 3.254242553687235e-08, + "loss": 0.0003, + "step": 43172 + }, + { + "epoch": 0.84, + "learning_rate": 3.253854219253621e-08, + "loss": 0.0003, + "step": 43173 + }, + { + "epoch": 0.84, + "learning_rate": 3.253465884820007e-08, + "loss": 0.0004, + "step": 43174 + }, + { + "epoch": 0.84, + "learning_rate": 3.253077550386393e-08, + "loss": 0.0004, + "step": 43175 + }, + { + "epoch": 0.84, + "learning_rate": 3.2526892159527786e-08, + "loss": 0.0004, + "step": 43176 + }, + { + "epoch": 0.84, + "learning_rate": 3.2523008815191644e-08, + "loss": 0.0004, + "step": 43177 + }, + { + "epoch": 0.84, + "learning_rate": 3.25191254708555e-08, + "loss": 0.0003, + "step": 43178 + }, + { + "epoch": 0.84, + "learning_rate": 3.2515242126519354e-08, + "loss": 0.0005, + "step": 43179 + }, + { + "epoch": 0.84, + "learning_rate": 3.251135878218321e-08, + "loss": 0.0341, + "step": 43180 + }, + { + "epoch": 0.84, + "learning_rate": 3.250747543784707e-08, + "loss": 0.0006, + "step": 43181 + }, + { + "epoch": 0.84, + "learning_rate": 3.250359209351093e-08, + "loss": 0.0003, + "step": 43182 + }, + { + "epoch": 0.84, + "learning_rate": 3.249970874917479e-08, + "loss": 0.0004, + "step": 43183 + }, + { + "epoch": 0.84, + "learning_rate": 3.2495825404838645e-08, + "loss": 0.0005, + "step": 43184 + }, + { + "epoch": 0.84, + "learning_rate": 3.2491942060502503e-08, + "loss": 0.0581, + "step": 43185 + }, + { + "epoch": 0.84, + "learning_rate": 3.248805871616636e-08, + "loss": 0.0005, + "step": 43186 + }, + { + "epoch": 0.84, + "learning_rate": 3.248417537183022e-08, + "loss": 0.0003, + "step": 43187 + }, + { + "epoch": 0.84, + "learning_rate": 3.248029202749408e-08, + "loss": 0.0004, + "step": 43188 + }, + { + "epoch": 0.84, + "learning_rate": 3.2476408683157936e-08, + "loss": 0.0004, + "step": 43189 + }, + { + "epoch": 0.84, + "learning_rate": 3.2472525338821795e-08, + "loss": 0.1712, + "step": 43190 + }, + { + "epoch": 0.84, + "learning_rate": 3.246864199448565e-08, + "loss": 0.0004, + "step": 43191 + }, + { + "epoch": 0.84, + "learning_rate": 3.246475865014951e-08, + "loss": 0.002, + "step": 43192 + }, + { + "epoch": 0.84, + "learning_rate": 3.246087530581337e-08, + "loss": 0.0004, + "step": 43193 + }, + { + "epoch": 0.84, + "learning_rate": 3.245699196147722e-08, + "loss": 0.0003, + "step": 43194 + }, + { + "epoch": 0.84, + "learning_rate": 3.245310861714108e-08, + "loss": 0.0005, + "step": 43195 + }, + { + "epoch": 0.84, + "learning_rate": 3.244922527280494e-08, + "loss": 0.0321, + "step": 43196 + }, + { + "epoch": 0.84, + "learning_rate": 3.2445341928468796e-08, + "loss": 0.9552, + "step": 43197 + }, + { + "epoch": 0.84, + "learning_rate": 3.2441458584132654e-08, + "loss": 0.0005, + "step": 43198 + }, + { + "epoch": 0.84, + "learning_rate": 3.243757523979651e-08, + "loss": 0.0006, + "step": 43199 + }, + { + "epoch": 0.84, + "learning_rate": 3.243369189546037e-08, + "loss": 0.0007, + "step": 43200 + }, + { + "epoch": 0.84, + "learning_rate": 3.242980855112423e-08, + "loss": 0.0991, + "step": 43201 + }, + { + "epoch": 0.84, + "learning_rate": 3.242592520678809e-08, + "loss": 0.0005, + "step": 43202 + }, + { + "epoch": 0.84, + "learning_rate": 3.2422041862451945e-08, + "loss": 0.0114, + "step": 43203 + }, + { + "epoch": 0.84, + "learning_rate": 3.2418158518115803e-08, + "loss": 0.0015, + "step": 43204 + }, + { + "epoch": 0.84, + "learning_rate": 3.241427517377966e-08, + "loss": 0.0004, + "step": 43205 + }, + { + "epoch": 0.84, + "learning_rate": 3.241039182944352e-08, + "loss": 0.0004, + "step": 43206 + }, + { + "epoch": 0.84, + "learning_rate": 3.240650848510738e-08, + "loss": 0.0004, + "step": 43207 + }, + { + "epoch": 0.84, + "learning_rate": 3.240262514077123e-08, + "loss": 0.0004, + "step": 43208 + }, + { + "epoch": 0.84, + "learning_rate": 3.239874179643509e-08, + "loss": 0.0067, + "step": 43209 + }, + { + "epoch": 0.84, + "learning_rate": 3.2394858452098946e-08, + "loss": 0.0538, + "step": 43210 + }, + { + "epoch": 0.84, + "learning_rate": 3.2390975107762805e-08, + "loss": 0.0003, + "step": 43211 + }, + { + "epoch": 0.84, + "learning_rate": 3.238709176342666e-08, + "loss": 1.2021, + "step": 43212 + }, + { + "epoch": 0.84, + "learning_rate": 3.238320841909052e-08, + "loss": 0.0005, + "step": 43213 + }, + { + "epoch": 0.84, + "learning_rate": 3.237932507475438e-08, + "loss": 0.0004, + "step": 43214 + }, + { + "epoch": 0.84, + "learning_rate": 3.237544173041824e-08, + "loss": 1.3156, + "step": 43215 + }, + { + "epoch": 0.84, + "learning_rate": 3.2371558386082096e-08, + "loss": 0.0004, + "step": 43216 + }, + { + "epoch": 0.84, + "learning_rate": 3.2367675041745954e-08, + "loss": 0.6464, + "step": 43217 + }, + { + "epoch": 0.84, + "learning_rate": 3.236379169740981e-08, + "loss": 0.0003, + "step": 43218 + }, + { + "epoch": 0.84, + "learning_rate": 3.235990835307367e-08, + "loss": 0.0004, + "step": 43219 + }, + { + "epoch": 0.84, + "learning_rate": 3.235602500873752e-08, + "loss": 0.0004, + "step": 43220 + }, + { + "epoch": 0.84, + "learning_rate": 3.235214166440138e-08, + "loss": 0.2078, + "step": 43221 + }, + { + "epoch": 0.84, + "learning_rate": 3.234825832006524e-08, + "loss": 0.0004, + "step": 43222 + }, + { + "epoch": 0.84, + "learning_rate": 3.23443749757291e-08, + "loss": 0.0003, + "step": 43223 + }, + { + "epoch": 0.84, + "learning_rate": 3.2340491631392955e-08, + "loss": 0.0002, + "step": 43224 + }, + { + "epoch": 0.84, + "learning_rate": 3.2336608287056813e-08, + "loss": 0.0007, + "step": 43225 + }, + { + "epoch": 0.84, + "learning_rate": 3.233272494272067e-08, + "loss": 0.0005, + "step": 43226 + }, + { + "epoch": 0.84, + "learning_rate": 3.232884159838452e-08, + "loss": 0.0003, + "step": 43227 + }, + { + "epoch": 0.84, + "learning_rate": 3.232495825404838e-08, + "loss": 0.0004, + "step": 43228 + }, + { + "epoch": 0.84, + "learning_rate": 3.232107490971224e-08, + "loss": 0.0059, + "step": 43229 + }, + { + "epoch": 0.84, + "learning_rate": 3.23171915653761e-08, + "loss": 0.0004, + "step": 43230 + }, + { + "epoch": 0.84, + "learning_rate": 3.2313308221039956e-08, + "loss": 0.0054, + "step": 43231 + }, + { + "epoch": 0.84, + "learning_rate": 3.2309424876703814e-08, + "loss": 0.0003, + "step": 43232 + }, + { + "epoch": 0.84, + "learning_rate": 3.230554153236767e-08, + "loss": 0.0036, + "step": 43233 + }, + { + "epoch": 0.84, + "learning_rate": 3.230165818803153e-08, + "loss": 1.2456, + "step": 43234 + }, + { + "epoch": 0.84, + "learning_rate": 3.229777484369539e-08, + "loss": 0.0004, + "step": 43235 + }, + { + "epoch": 0.84, + "learning_rate": 3.229389149935925e-08, + "loss": 0.0002, + "step": 43236 + }, + { + "epoch": 0.84, + "learning_rate": 3.22900081550231e-08, + "loss": 0.0185, + "step": 43237 + }, + { + "epoch": 0.84, + "learning_rate": 3.228612481068696e-08, + "loss": 0.0003, + "step": 43238 + }, + { + "epoch": 0.84, + "learning_rate": 3.2282241466350816e-08, + "loss": 0.0008, + "step": 43239 + }, + { + "epoch": 0.84, + "learning_rate": 3.2278358122014674e-08, + "loss": 0.0005, + "step": 43240 + }, + { + "epoch": 0.84, + "learning_rate": 3.227447477767853e-08, + "loss": 0.0005, + "step": 43241 + }, + { + "epoch": 0.84, + "learning_rate": 3.227059143334239e-08, + "loss": 0.0003, + "step": 43242 + }, + { + "epoch": 0.84, + "learning_rate": 3.226670808900625e-08, + "loss": 0.0003, + "step": 43243 + }, + { + "epoch": 0.84, + "learning_rate": 3.226282474467011e-08, + "loss": 0.0003, + "step": 43244 + }, + { + "epoch": 0.84, + "learning_rate": 3.2258941400333965e-08, + "loss": 0.0004, + "step": 43245 + }, + { + "epoch": 0.84, + "learning_rate": 3.225505805599782e-08, + "loss": 0.0003, + "step": 43246 + }, + { + "epoch": 0.84, + "learning_rate": 3.225117471166168e-08, + "loss": 0.0004, + "step": 43247 + }, + { + "epoch": 0.84, + "learning_rate": 3.224729136732554e-08, + "loss": 0.0004, + "step": 43248 + }, + { + "epoch": 0.84, + "learning_rate": 3.22434080229894e-08, + "loss": 0.0011, + "step": 43249 + }, + { + "epoch": 0.84, + "learning_rate": 3.2239524678653256e-08, + "loss": 0.0003, + "step": 43250 + }, + { + "epoch": 0.84, + "learning_rate": 3.2235641334317114e-08, + "loss": 0.0004, + "step": 43251 + }, + { + "epoch": 0.84, + "learning_rate": 3.2231757989980966e-08, + "loss": 0.0011, + "step": 43252 + }, + { + "epoch": 0.84, + "learning_rate": 3.2227874645644824e-08, + "loss": 1.2289, + "step": 43253 + }, + { + "epoch": 0.84, + "learning_rate": 3.222399130130868e-08, + "loss": 0.0763, + "step": 43254 + }, + { + "epoch": 0.84, + "learning_rate": 3.222010795697254e-08, + "loss": 0.0006, + "step": 43255 + }, + { + "epoch": 0.84, + "learning_rate": 3.22162246126364e-08, + "loss": 0.0222, + "step": 43256 + }, + { + "epoch": 0.84, + "learning_rate": 3.221234126830026e-08, + "loss": 0.0005, + "step": 43257 + }, + { + "epoch": 0.84, + "learning_rate": 3.2208457923964116e-08, + "loss": 0.0004, + "step": 43258 + }, + { + "epoch": 0.84, + "learning_rate": 3.2204574579627974e-08, + "loss": 0.0004, + "step": 43259 + }, + { + "epoch": 0.84, + "learning_rate": 3.220069123529183e-08, + "loss": 0.685, + "step": 43260 + }, + { + "epoch": 0.84, + "learning_rate": 3.219680789095569e-08, + "loss": 0.0003, + "step": 43261 + }, + { + "epoch": 0.84, + "learning_rate": 3.219292454661955e-08, + "loss": 0.0005, + "step": 43262 + }, + { + "epoch": 0.84, + "learning_rate": 3.218904120228341e-08, + "loss": 0.0004, + "step": 43263 + }, + { + "epoch": 0.84, + "learning_rate": 3.2185157857947265e-08, + "loss": 0.0006, + "step": 43264 + }, + { + "epoch": 0.84, + "learning_rate": 3.218127451361112e-08, + "loss": 0.0005, + "step": 43265 + }, + { + "epoch": 0.84, + "learning_rate": 3.2177391169274975e-08, + "loss": 0.6587, + "step": 43266 + }, + { + "epoch": 0.84, + "learning_rate": 3.217350782493883e-08, + "loss": 0.0003, + "step": 43267 + }, + { + "epoch": 0.84, + "learning_rate": 3.216962448060269e-08, + "loss": 0.0002, + "step": 43268 + }, + { + "epoch": 0.84, + "learning_rate": 3.216574113626655e-08, + "loss": 0.0025, + "step": 43269 + }, + { + "epoch": 0.84, + "learning_rate": 3.216185779193041e-08, + "loss": 0.0003, + "step": 43270 + }, + { + "epoch": 0.84, + "learning_rate": 3.2157974447594266e-08, + "loss": 0.0022, + "step": 43271 + }, + { + "epoch": 0.84, + "learning_rate": 3.2154091103258124e-08, + "loss": 0.0005, + "step": 43272 + }, + { + "epoch": 0.84, + "learning_rate": 3.215020775892198e-08, + "loss": 0.0007, + "step": 43273 + }, + { + "epoch": 0.84, + "learning_rate": 3.214632441458584e-08, + "loss": 0.0003, + "step": 43274 + }, + { + "epoch": 0.84, + "learning_rate": 3.21424410702497e-08, + "loss": 0.0005, + "step": 43275 + }, + { + "epoch": 0.84, + "learning_rate": 3.213855772591356e-08, + "loss": 0.0003, + "step": 43276 + }, + { + "epoch": 0.84, + "learning_rate": 3.2134674381577416e-08, + "loss": 0.0003, + "step": 43277 + }, + { + "epoch": 0.84, + "learning_rate": 3.2130791037241274e-08, + "loss": 0.0005, + "step": 43278 + }, + { + "epoch": 0.84, + "learning_rate": 3.212690769290513e-08, + "loss": 0.0005, + "step": 43279 + }, + { + "epoch": 0.84, + "learning_rate": 3.212302434856899e-08, + "loss": 0.0003, + "step": 43280 + }, + { + "epoch": 0.84, + "learning_rate": 3.211914100423284e-08, + "loss": 0.0004, + "step": 43281 + }, + { + "epoch": 0.84, + "learning_rate": 3.21152576598967e-08, + "loss": 0.0004, + "step": 43282 + }, + { + "epoch": 0.84, + "learning_rate": 3.211137431556056e-08, + "loss": 0.0004, + "step": 43283 + }, + { + "epoch": 0.84, + "learning_rate": 3.2107490971224417e-08, + "loss": 0.0004, + "step": 43284 + }, + { + "epoch": 0.84, + "learning_rate": 3.2103607626888275e-08, + "loss": 0.0014, + "step": 43285 + }, + { + "epoch": 0.84, + "learning_rate": 3.209972428255213e-08, + "loss": 0.0003, + "step": 43286 + }, + { + "epoch": 0.84, + "learning_rate": 3.209584093821599e-08, + "loss": 0.0005, + "step": 43287 + }, + { + "epoch": 0.84, + "learning_rate": 3.209195759387985e-08, + "loss": 1.2133, + "step": 43288 + }, + { + "epoch": 0.84, + "learning_rate": 3.208807424954371e-08, + "loss": 0.0003, + "step": 43289 + }, + { + "epoch": 0.84, + "learning_rate": 3.2084190905207566e-08, + "loss": 0.0003, + "step": 43290 + }, + { + "epoch": 0.84, + "learning_rate": 3.2080307560871424e-08, + "loss": 0.0003, + "step": 43291 + }, + { + "epoch": 0.84, + "learning_rate": 3.207642421653528e-08, + "loss": 0.001, + "step": 43292 + }, + { + "epoch": 0.84, + "learning_rate": 3.207254087219914e-08, + "loss": 0.0003, + "step": 43293 + }, + { + "epoch": 0.84, + "learning_rate": 3.2068657527863e-08, + "loss": 0.0003, + "step": 43294 + }, + { + "epoch": 0.84, + "learning_rate": 3.206477418352685e-08, + "loss": 0.0043, + "step": 43295 + }, + { + "epoch": 0.84, + "learning_rate": 3.206089083919071e-08, + "loss": 0.0004, + "step": 43296 + }, + { + "epoch": 0.84, + "learning_rate": 3.205700749485457e-08, + "loss": 0.0003, + "step": 43297 + }, + { + "epoch": 0.84, + "learning_rate": 3.2053124150518425e-08, + "loss": 0.0004, + "step": 43298 + }, + { + "epoch": 0.84, + "learning_rate": 3.2049240806182284e-08, + "loss": 0.0005, + "step": 43299 + }, + { + "epoch": 0.84, + "learning_rate": 3.204535746184614e-08, + "loss": 0.0473, + "step": 43300 + }, + { + "epoch": 0.84, + "learning_rate": 3.204147411751e-08, + "loss": 0.0004, + "step": 43301 + }, + { + "epoch": 0.84, + "learning_rate": 3.203759077317386e-08, + "loss": 0.0004, + "step": 43302 + }, + { + "epoch": 0.84, + "learning_rate": 3.2033707428837717e-08, + "loss": 0.0005, + "step": 43303 + }, + { + "epoch": 0.84, + "learning_rate": 3.2029824084501575e-08, + "loss": 0.0004, + "step": 43304 + }, + { + "epoch": 0.84, + "learning_rate": 3.202594074016543e-08, + "loss": 0.0003, + "step": 43305 + }, + { + "epoch": 0.84, + "learning_rate": 3.202205739582929e-08, + "loss": 0.0004, + "step": 43306 + }, + { + "epoch": 0.84, + "learning_rate": 3.201817405149315e-08, + "loss": 0.0006, + "step": 43307 + }, + { + "epoch": 0.84, + "learning_rate": 3.2014290707157e-08, + "loss": 0.0015, + "step": 43308 + }, + { + "epoch": 0.84, + "learning_rate": 3.201040736282086e-08, + "loss": 0.0004, + "step": 43309 + }, + { + "epoch": 0.84, + "learning_rate": 3.200652401848472e-08, + "loss": 0.0016, + "step": 43310 + }, + { + "epoch": 0.84, + "learning_rate": 3.2002640674148576e-08, + "loss": 0.0003, + "step": 43311 + }, + { + "epoch": 0.84, + "learning_rate": 3.1998757329812434e-08, + "loss": 0.0003, + "step": 43312 + }, + { + "epoch": 0.84, + "learning_rate": 3.199487398547629e-08, + "loss": 0.0005, + "step": 43313 + }, + { + "epoch": 0.84, + "learning_rate": 3.199099064114015e-08, + "loss": 0.0004, + "step": 43314 + }, + { + "epoch": 0.84, + "learning_rate": 3.1987107296804e-08, + "loss": 0.0005, + "step": 43315 + }, + { + "epoch": 0.84, + "learning_rate": 3.198322395246786e-08, + "loss": 0.0239, + "step": 43316 + }, + { + "epoch": 0.84, + "learning_rate": 3.197934060813172e-08, + "loss": 0.0005, + "step": 43317 + }, + { + "epoch": 0.84, + "learning_rate": 3.197545726379558e-08, + "loss": 0.0004, + "step": 43318 + }, + { + "epoch": 0.84, + "learning_rate": 3.1971573919459435e-08, + "loss": 0.0005, + "step": 43319 + }, + { + "epoch": 0.84, + "learning_rate": 3.1967690575123294e-08, + "loss": 0.0004, + "step": 43320 + }, + { + "epoch": 0.84, + "learning_rate": 3.196380723078715e-08, + "loss": 0.0004, + "step": 43321 + }, + { + "epoch": 0.84, + "learning_rate": 3.195992388645101e-08, + "loss": 0.0006, + "step": 43322 + }, + { + "epoch": 0.84, + "learning_rate": 3.195604054211487e-08, + "loss": 0.0007, + "step": 43323 + }, + { + "epoch": 0.84, + "learning_rate": 3.195215719777872e-08, + "loss": 0.0007, + "step": 43324 + }, + { + "epoch": 0.84, + "learning_rate": 3.194827385344258e-08, + "loss": 0.0007, + "step": 43325 + }, + { + "epoch": 0.84, + "learning_rate": 3.1944390509106436e-08, + "loss": 0.0005, + "step": 43326 + }, + { + "epoch": 0.84, + "learning_rate": 3.1940507164770295e-08, + "loss": 0.653, + "step": 43327 + }, + { + "epoch": 0.84, + "learning_rate": 3.193662382043415e-08, + "loss": 0.0004, + "step": 43328 + }, + { + "epoch": 0.84, + "learning_rate": 3.193274047609801e-08, + "loss": 0.0003, + "step": 43329 + }, + { + "epoch": 0.84, + "learning_rate": 3.192885713176187e-08, + "loss": 0.0027, + "step": 43330 + }, + { + "epoch": 0.84, + "learning_rate": 3.192497378742573e-08, + "loss": 0.0004, + "step": 43331 + }, + { + "epoch": 0.84, + "learning_rate": 3.1921090443089586e-08, + "loss": 0.0037, + "step": 43332 + }, + { + "epoch": 0.84, + "learning_rate": 3.1917207098753444e-08, + "loss": 0.0005, + "step": 43333 + }, + { + "epoch": 0.84, + "learning_rate": 3.19133237544173e-08, + "loss": 0.0003, + "step": 43334 + }, + { + "epoch": 0.84, + "learning_rate": 3.190944041008116e-08, + "loss": 0.0004, + "step": 43335 + }, + { + "epoch": 0.84, + "learning_rate": 3.190555706574502e-08, + "loss": 0.0004, + "step": 43336 + }, + { + "epoch": 0.84, + "learning_rate": 3.190167372140888e-08, + "loss": 0.0004, + "step": 43337 + }, + { + "epoch": 0.84, + "learning_rate": 3.1897790377072735e-08, + "loss": 0.0003, + "step": 43338 + }, + { + "epoch": 0.84, + "learning_rate": 3.189390703273659e-08, + "loss": 0.0003, + "step": 43339 + }, + { + "epoch": 0.84, + "learning_rate": 3.1890023688400445e-08, + "loss": 0.0005, + "step": 43340 + }, + { + "epoch": 0.84, + "learning_rate": 3.1886140344064303e-08, + "loss": 0.0005, + "step": 43341 + }, + { + "epoch": 0.84, + "learning_rate": 3.188225699972816e-08, + "loss": 0.0004, + "step": 43342 + }, + { + "epoch": 0.84, + "learning_rate": 3.187837365539202e-08, + "loss": 0.0005, + "step": 43343 + }, + { + "epoch": 0.84, + "learning_rate": 3.187449031105588e-08, + "loss": 0.0003, + "step": 43344 + }, + { + "epoch": 0.84, + "learning_rate": 3.1870606966719736e-08, + "loss": 0.0019, + "step": 43345 + }, + { + "epoch": 0.84, + "learning_rate": 3.1866723622383595e-08, + "loss": 0.0004, + "step": 43346 + }, + { + "epoch": 0.84, + "learning_rate": 3.186284027804745e-08, + "loss": 0.0004, + "step": 43347 + }, + { + "epoch": 0.84, + "learning_rate": 3.185895693371131e-08, + "loss": 0.0006, + "step": 43348 + }, + { + "epoch": 0.84, + "learning_rate": 3.185507358937517e-08, + "loss": 0.0005, + "step": 43349 + }, + { + "epoch": 0.84, + "learning_rate": 3.185119024503903e-08, + "loss": 0.0004, + "step": 43350 + }, + { + "epoch": 0.84, + "learning_rate": 3.1847306900702886e-08, + "loss": 0.0005, + "step": 43351 + }, + { + "epoch": 0.84, + "learning_rate": 3.1843423556366744e-08, + "loss": 0.0005, + "step": 43352 + }, + { + "epoch": 0.84, + "learning_rate": 3.1839540212030596e-08, + "loss": 0.0005, + "step": 43353 + }, + { + "epoch": 0.84, + "learning_rate": 3.1835656867694454e-08, + "loss": 0.0003, + "step": 43354 + }, + { + "epoch": 0.84, + "learning_rate": 3.183177352335831e-08, + "loss": 0.0004, + "step": 43355 + }, + { + "epoch": 0.84, + "learning_rate": 3.182789017902217e-08, + "loss": 0.0004, + "step": 43356 + }, + { + "epoch": 0.84, + "learning_rate": 3.182400683468603e-08, + "loss": 1.2858, + "step": 43357 + }, + { + "epoch": 0.84, + "learning_rate": 3.182012349034989e-08, + "loss": 0.0004, + "step": 43358 + }, + { + "epoch": 0.84, + "learning_rate": 3.1816240146013745e-08, + "loss": 0.0005, + "step": 43359 + }, + { + "epoch": 0.84, + "learning_rate": 3.1812356801677604e-08, + "loss": 0.571, + "step": 43360 + }, + { + "epoch": 0.84, + "learning_rate": 3.180847345734146e-08, + "loss": 0.0088, + "step": 43361 + }, + { + "epoch": 0.84, + "learning_rate": 3.180459011300532e-08, + "loss": 0.005, + "step": 43362 + }, + { + "epoch": 0.84, + "learning_rate": 3.180070676866918e-08, + "loss": 0.0005, + "step": 43363 + }, + { + "epoch": 0.84, + "learning_rate": 3.1796823424333036e-08, + "loss": 0.0006, + "step": 43364 + }, + { + "epoch": 0.84, + "learning_rate": 3.1792940079996895e-08, + "loss": 0.0005, + "step": 43365 + }, + { + "epoch": 0.84, + "learning_rate": 3.178905673566075e-08, + "loss": 0.0004, + "step": 43366 + }, + { + "epoch": 0.84, + "learning_rate": 3.178517339132461e-08, + "loss": 0.0003, + "step": 43367 + }, + { + "epoch": 0.84, + "learning_rate": 3.178129004698846e-08, + "loss": 0.0004, + "step": 43368 + }, + { + "epoch": 0.84, + "learning_rate": 3.177740670265232e-08, + "loss": 0.0005, + "step": 43369 + }, + { + "epoch": 0.84, + "learning_rate": 3.177352335831618e-08, + "loss": 0.0003, + "step": 43370 + }, + { + "epoch": 0.84, + "learning_rate": 3.176964001398004e-08, + "loss": 0.0003, + "step": 43371 + }, + { + "epoch": 0.84, + "learning_rate": 3.1765756669643896e-08, + "loss": 0.0004, + "step": 43372 + }, + { + "epoch": 0.84, + "learning_rate": 3.1761873325307754e-08, + "loss": 0.0587, + "step": 43373 + }, + { + "epoch": 0.84, + "learning_rate": 3.175798998097161e-08, + "loss": 0.0005, + "step": 43374 + }, + { + "epoch": 0.84, + "learning_rate": 3.175410663663547e-08, + "loss": 0.0011, + "step": 43375 + }, + { + "epoch": 0.84, + "learning_rate": 3.175022329229933e-08, + "loss": 0.0004, + "step": 43376 + }, + { + "epoch": 0.84, + "learning_rate": 3.174633994796319e-08, + "loss": 0.0506, + "step": 43377 + }, + { + "epoch": 0.84, + "learning_rate": 3.1742456603627045e-08, + "loss": 0.0003, + "step": 43378 + }, + { + "epoch": 0.84, + "learning_rate": 3.1738573259290904e-08, + "loss": 0.0228, + "step": 43379 + }, + { + "epoch": 0.84, + "learning_rate": 3.173468991495476e-08, + "loss": 0.0003, + "step": 43380 + }, + { + "epoch": 0.84, + "learning_rate": 3.173080657061862e-08, + "loss": 0.0005, + "step": 43381 + }, + { + "epoch": 0.84, + "learning_rate": 3.172692322628247e-08, + "loss": 0.0008, + "step": 43382 + }, + { + "epoch": 0.84, + "learning_rate": 3.172303988194633e-08, + "loss": 0.0003, + "step": 43383 + }, + { + "epoch": 0.84, + "learning_rate": 3.171915653761019e-08, + "loss": 0.0005, + "step": 43384 + }, + { + "epoch": 0.84, + "learning_rate": 3.1715273193274046e-08, + "loss": 0.0005, + "step": 43385 + }, + { + "epoch": 0.84, + "learning_rate": 3.1711389848937905e-08, + "loss": 0.0003, + "step": 43386 + }, + { + "epoch": 0.84, + "learning_rate": 3.170750650460176e-08, + "loss": 0.0004, + "step": 43387 + }, + { + "epoch": 0.84, + "learning_rate": 3.170362316026562e-08, + "loss": 0.0005, + "step": 43388 + }, + { + "epoch": 0.84, + "learning_rate": 3.169973981592948e-08, + "loss": 0.0003, + "step": 43389 + }, + { + "epoch": 0.84, + "learning_rate": 3.169585647159334e-08, + "loss": 0.0005, + "step": 43390 + }, + { + "epoch": 0.84, + "learning_rate": 3.1691973127257196e-08, + "loss": 0.0003, + "step": 43391 + }, + { + "epoch": 0.84, + "learning_rate": 3.1688089782921054e-08, + "loss": 0.0003, + "step": 43392 + }, + { + "epoch": 0.84, + "learning_rate": 3.168420643858491e-08, + "loss": 0.0004, + "step": 43393 + }, + { + "epoch": 0.84, + "learning_rate": 3.168032309424877e-08, + "loss": 0.0003, + "step": 43394 + }, + { + "epoch": 0.84, + "learning_rate": 3.167643974991263e-08, + "loss": 0.001, + "step": 43395 + }, + { + "epoch": 0.84, + "learning_rate": 3.167255640557649e-08, + "loss": 0.0004, + "step": 43396 + }, + { + "epoch": 0.84, + "learning_rate": 3.166867306124034e-08, + "loss": 0.0006, + "step": 43397 + }, + { + "epoch": 0.84, + "learning_rate": 3.16647897169042e-08, + "loss": 0.001, + "step": 43398 + }, + { + "epoch": 0.84, + "learning_rate": 3.1660906372568055e-08, + "loss": 0.0299, + "step": 43399 + }, + { + "epoch": 0.84, + "learning_rate": 3.1657023028231913e-08, + "loss": 0.3727, + "step": 43400 + }, + { + "epoch": 0.84, + "learning_rate": 3.165313968389577e-08, + "loss": 0.0004, + "step": 43401 + }, + { + "epoch": 0.84, + "learning_rate": 3.164925633955963e-08, + "loss": 0.0004, + "step": 43402 + }, + { + "epoch": 0.84, + "learning_rate": 3.164537299522349e-08, + "loss": 0.0003, + "step": 43403 + }, + { + "epoch": 0.84, + "learning_rate": 3.164148965088734e-08, + "loss": 0.0004, + "step": 43404 + }, + { + "epoch": 0.84, + "learning_rate": 3.16376063065512e-08, + "loss": 0.0003, + "step": 43405 + }, + { + "epoch": 0.84, + "learning_rate": 3.1633722962215056e-08, + "loss": 0.2778, + "step": 43406 + }, + { + "epoch": 0.84, + "learning_rate": 3.1629839617878915e-08, + "loss": 0.0004, + "step": 43407 + }, + { + "epoch": 0.84, + "learning_rate": 3.162595627354277e-08, + "loss": 0.0013, + "step": 43408 + }, + { + "epoch": 0.84, + "learning_rate": 3.162207292920663e-08, + "loss": 0.0003, + "step": 43409 + }, + { + "epoch": 0.84, + "learning_rate": 3.161818958487049e-08, + "loss": 0.0004, + "step": 43410 + }, + { + "epoch": 0.84, + "learning_rate": 3.161430624053434e-08, + "loss": 0.0004, + "step": 43411 + }, + { + "epoch": 0.84, + "learning_rate": 3.16104228961982e-08, + "loss": 0.0007, + "step": 43412 + }, + { + "epoch": 0.84, + "learning_rate": 3.160653955186206e-08, + "loss": 0.0007, + "step": 43413 + }, + { + "epoch": 0.84, + "learning_rate": 3.1602656207525916e-08, + "loss": 0.0004, + "step": 43414 + }, + { + "epoch": 0.84, + "learning_rate": 3.1598772863189774e-08, + "loss": 0.0004, + "step": 43415 + }, + { + "epoch": 0.84, + "learning_rate": 3.159488951885363e-08, + "loss": 0.0005, + "step": 43416 + }, + { + "epoch": 0.84, + "learning_rate": 3.159100617451749e-08, + "loss": 0.8401, + "step": 43417 + }, + { + "epoch": 0.84, + "learning_rate": 3.158712283018135e-08, + "loss": 0.0005, + "step": 43418 + }, + { + "epoch": 0.84, + "learning_rate": 3.158323948584521e-08, + "loss": 0.0004, + "step": 43419 + }, + { + "epoch": 0.84, + "learning_rate": 3.1579356141509065e-08, + "loss": 0.0005, + "step": 43420 + }, + { + "epoch": 0.84, + "learning_rate": 3.1575472797172923e-08, + "loss": 0.0002, + "step": 43421 + }, + { + "epoch": 0.84, + "learning_rate": 3.157158945283678e-08, + "loss": 0.0005, + "step": 43422 + }, + { + "epoch": 0.84, + "learning_rate": 3.156770610850064e-08, + "loss": 0.0003, + "step": 43423 + }, + { + "epoch": 0.84, + "learning_rate": 3.15638227641645e-08, + "loss": 0.0249, + "step": 43424 + }, + { + "epoch": 0.84, + "learning_rate": 3.1559939419828356e-08, + "loss": 0.0143, + "step": 43425 + }, + { + "epoch": 0.84, + "learning_rate": 3.155605607549221e-08, + "loss": 0.0314, + "step": 43426 + }, + { + "epoch": 0.84, + "learning_rate": 3.1552172731156066e-08, + "loss": 0.0003, + "step": 43427 + }, + { + "epoch": 0.84, + "learning_rate": 3.1548289386819924e-08, + "loss": 0.0004, + "step": 43428 + }, + { + "epoch": 0.84, + "learning_rate": 3.154440604248378e-08, + "loss": 0.0004, + "step": 43429 + }, + { + "epoch": 0.84, + "learning_rate": 3.154052269814764e-08, + "loss": 0.0003, + "step": 43430 + }, + { + "epoch": 0.84, + "learning_rate": 3.15366393538115e-08, + "loss": 0.0004, + "step": 43431 + }, + { + "epoch": 0.84, + "learning_rate": 3.153275600947536e-08, + "loss": 0.0005, + "step": 43432 + }, + { + "epoch": 0.84, + "learning_rate": 3.1528872665139216e-08, + "loss": 0.0006, + "step": 43433 + }, + { + "epoch": 0.84, + "learning_rate": 3.1524989320803074e-08, + "loss": 0.0004, + "step": 43434 + }, + { + "epoch": 0.84, + "learning_rate": 3.152110597646693e-08, + "loss": 0.0004, + "step": 43435 + }, + { + "epoch": 0.84, + "learning_rate": 3.151722263213079e-08, + "loss": 0.0004, + "step": 43436 + }, + { + "epoch": 0.84, + "learning_rate": 3.151333928779465e-08, + "loss": 0.0004, + "step": 43437 + }, + { + "epoch": 0.84, + "learning_rate": 3.150945594345851e-08, + "loss": 0.1462, + "step": 43438 + }, + { + "epoch": 0.84, + "learning_rate": 3.1505572599122365e-08, + "loss": 0.0004, + "step": 43439 + }, + { + "epoch": 0.84, + "learning_rate": 3.150168925478622e-08, + "loss": 0.0003, + "step": 43440 + }, + { + "epoch": 0.84, + "learning_rate": 3.1497805910450075e-08, + "loss": 0.0004, + "step": 43441 + }, + { + "epoch": 0.84, + "learning_rate": 3.149392256611393e-08, + "loss": 0.804, + "step": 43442 + }, + { + "epoch": 0.84, + "learning_rate": 3.149003922177779e-08, + "loss": 0.0007, + "step": 43443 + }, + { + "epoch": 0.84, + "learning_rate": 3.148615587744165e-08, + "loss": 0.0003, + "step": 43444 + }, + { + "epoch": 0.84, + "learning_rate": 3.148227253310551e-08, + "loss": 0.0004, + "step": 43445 + }, + { + "epoch": 0.84, + "learning_rate": 3.1478389188769366e-08, + "loss": 0.0005, + "step": 43446 + }, + { + "epoch": 0.84, + "learning_rate": 3.1474505844433224e-08, + "loss": 0.0006, + "step": 43447 + }, + { + "epoch": 0.84, + "learning_rate": 3.147062250009708e-08, + "loss": 0.0003, + "step": 43448 + }, + { + "epoch": 0.84, + "learning_rate": 3.146673915576094e-08, + "loss": 0.0003, + "step": 43449 + }, + { + "epoch": 0.84, + "learning_rate": 3.14628558114248e-08, + "loss": 0.0003, + "step": 43450 + }, + { + "epoch": 0.84, + "learning_rate": 3.145897246708866e-08, + "loss": 0.0003, + "step": 43451 + }, + { + "epoch": 0.84, + "learning_rate": 3.1455089122752516e-08, + "loss": 0.0101, + "step": 43452 + }, + { + "epoch": 0.84, + "learning_rate": 3.1451205778416374e-08, + "loss": 0.0004, + "step": 43453 + }, + { + "epoch": 0.84, + "learning_rate": 3.144732243408023e-08, + "loss": 1.1509, + "step": 43454 + }, + { + "epoch": 0.84, + "learning_rate": 3.1443439089744084e-08, + "loss": 0.0003, + "step": 43455 + }, + { + "epoch": 0.84, + "learning_rate": 3.143955574540794e-08, + "loss": 0.0004, + "step": 43456 + }, + { + "epoch": 0.84, + "learning_rate": 3.14356724010718e-08, + "loss": 0.0005, + "step": 43457 + }, + { + "epoch": 0.84, + "learning_rate": 3.143178905673566e-08, + "loss": 0.0006, + "step": 43458 + }, + { + "epoch": 0.84, + "learning_rate": 3.142790571239952e-08, + "loss": 0.5114, + "step": 43459 + }, + { + "epoch": 0.84, + "learning_rate": 3.1424022368063375e-08, + "loss": 0.114, + "step": 43460 + }, + { + "epoch": 0.84, + "learning_rate": 3.142013902372723e-08, + "loss": 0.0084, + "step": 43461 + }, + { + "epoch": 0.84, + "learning_rate": 3.141625567939109e-08, + "loss": 0.0003, + "step": 43462 + }, + { + "epoch": 0.84, + "learning_rate": 3.141237233505495e-08, + "loss": 0.0003, + "step": 43463 + }, + { + "epoch": 0.84, + "learning_rate": 3.140848899071881e-08, + "loss": 0.0003, + "step": 43464 + }, + { + "epoch": 0.84, + "learning_rate": 3.1404605646382666e-08, + "loss": 0.3899, + "step": 43465 + }, + { + "epoch": 0.84, + "learning_rate": 3.1400722302046524e-08, + "loss": 0.0005, + "step": 43466 + }, + { + "epoch": 0.84, + "learning_rate": 3.139683895771038e-08, + "loss": 0.0004, + "step": 43467 + }, + { + "epoch": 0.84, + "learning_rate": 3.139295561337424e-08, + "loss": 0.0007, + "step": 43468 + }, + { + "epoch": 0.84, + "learning_rate": 3.138907226903809e-08, + "loss": 0.0007, + "step": 43469 + }, + { + "epoch": 0.84, + "learning_rate": 3.138518892470195e-08, + "loss": 0.1479, + "step": 43470 + }, + { + "epoch": 0.84, + "learning_rate": 3.138130558036581e-08, + "loss": 0.0005, + "step": 43471 + }, + { + "epoch": 0.84, + "learning_rate": 3.137742223602967e-08, + "loss": 0.0049, + "step": 43472 + }, + { + "epoch": 0.84, + "learning_rate": 3.1373538891693526e-08, + "loss": 0.0053, + "step": 43473 + }, + { + "epoch": 0.84, + "learning_rate": 3.1369655547357384e-08, + "loss": 0.0003, + "step": 43474 + }, + { + "epoch": 0.84, + "learning_rate": 3.136577220302124e-08, + "loss": 0.0007, + "step": 43475 + }, + { + "epoch": 0.84, + "learning_rate": 3.13618888586851e-08, + "loss": 0.0004, + "step": 43476 + }, + { + "epoch": 0.84, + "learning_rate": 3.135800551434896e-08, + "loss": 0.0005, + "step": 43477 + }, + { + "epoch": 0.84, + "learning_rate": 3.135412217001282e-08, + "loss": 0.0003, + "step": 43478 + }, + { + "epoch": 0.84, + "learning_rate": 3.1350238825676675e-08, + "loss": 0.0006, + "step": 43479 + }, + { + "epoch": 0.84, + "learning_rate": 3.134635548134053e-08, + "loss": 0.0004, + "step": 43480 + }, + { + "epoch": 0.84, + "learning_rate": 3.134247213700439e-08, + "loss": 0.0025, + "step": 43481 + }, + { + "epoch": 0.84, + "learning_rate": 3.133858879266825e-08, + "loss": 0.0004, + "step": 43482 + }, + { + "epoch": 0.84, + "learning_rate": 3.133470544833211e-08, + "loss": 0.0003, + "step": 43483 + }, + { + "epoch": 0.84, + "learning_rate": 3.133082210399596e-08, + "loss": 0.0007, + "step": 43484 + }, + { + "epoch": 0.84, + "learning_rate": 3.132693875965982e-08, + "loss": 0.0003, + "step": 43485 + }, + { + "epoch": 0.84, + "learning_rate": 3.1323055415323676e-08, + "loss": 0.0003, + "step": 43486 + }, + { + "epoch": 0.84, + "learning_rate": 3.1319172070987534e-08, + "loss": 0.0004, + "step": 43487 + }, + { + "epoch": 0.84, + "learning_rate": 3.131528872665139e-08, + "loss": 0.0004, + "step": 43488 + }, + { + "epoch": 0.84, + "learning_rate": 3.131140538231525e-08, + "loss": 0.2161, + "step": 43489 + }, + { + "epoch": 0.84, + "learning_rate": 3.130752203797911e-08, + "loss": 0.0003, + "step": 43490 + }, + { + "epoch": 0.84, + "learning_rate": 3.130363869364297e-08, + "loss": 0.0004, + "step": 43491 + }, + { + "epoch": 0.84, + "learning_rate": 3.129975534930682e-08, + "loss": 0.0404, + "step": 43492 + }, + { + "epoch": 0.84, + "learning_rate": 3.129587200497068e-08, + "loss": 0.0006, + "step": 43493 + }, + { + "epoch": 0.84, + "learning_rate": 3.1291988660634535e-08, + "loss": 0.0011, + "step": 43494 + }, + { + "epoch": 0.84, + "learning_rate": 3.1288105316298394e-08, + "loss": 0.002, + "step": 43495 + }, + { + "epoch": 0.84, + "learning_rate": 3.128422197196225e-08, + "loss": 0.0004, + "step": 43496 + }, + { + "epoch": 0.84, + "learning_rate": 3.128033862762611e-08, + "loss": 0.0002, + "step": 43497 + }, + { + "epoch": 0.84, + "learning_rate": 3.127645528328997e-08, + "loss": 0.0003, + "step": 43498 + }, + { + "epoch": 0.84, + "learning_rate": 3.1272571938953827e-08, + "loss": 0.0007, + "step": 43499 + }, + { + "epoch": 0.84, + "learning_rate": 3.126868859461768e-08, + "loss": 0.0004, + "step": 43500 + }, + { + "epoch": 0.84, + "learning_rate": 3.1264805250281537e-08, + "loss": 0.0006, + "step": 43501 + }, + { + "epoch": 0.84, + "learning_rate": 3.1260921905945395e-08, + "loss": 0.0004, + "step": 43502 + }, + { + "epoch": 0.84, + "learning_rate": 3.125703856160925e-08, + "loss": 0.0004, + "step": 43503 + }, + { + "epoch": 0.84, + "learning_rate": 3.125315521727311e-08, + "loss": 0.0004, + "step": 43504 + }, + { + "epoch": 0.84, + "learning_rate": 3.124927187293697e-08, + "loss": 0.0006, + "step": 43505 + }, + { + "epoch": 0.84, + "learning_rate": 3.124538852860083e-08, + "loss": 0.0005, + "step": 43506 + }, + { + "epoch": 0.84, + "learning_rate": 3.1241505184264686e-08, + "loss": 0.0006, + "step": 43507 + }, + { + "epoch": 0.84, + "learning_rate": 3.1237621839928544e-08, + "loss": 0.0003, + "step": 43508 + }, + { + "epoch": 0.84, + "learning_rate": 3.12337384955924e-08, + "loss": 1.1588, + "step": 43509 + }, + { + "epoch": 0.84, + "learning_rate": 3.122985515125626e-08, + "loss": 0.0005, + "step": 43510 + }, + { + "epoch": 0.84, + "learning_rate": 3.122597180692012e-08, + "loss": 0.0003, + "step": 43511 + }, + { + "epoch": 0.84, + "learning_rate": 3.122208846258398e-08, + "loss": 0.0004, + "step": 43512 + }, + { + "epoch": 0.84, + "learning_rate": 3.121820511824783e-08, + "loss": 0.0003, + "step": 43513 + }, + { + "epoch": 0.84, + "learning_rate": 3.121432177391169e-08, + "loss": 0.0004, + "step": 43514 + }, + { + "epoch": 0.84, + "learning_rate": 3.1210438429575545e-08, + "loss": 0.0004, + "step": 43515 + }, + { + "epoch": 0.84, + "learning_rate": 3.1206555085239404e-08, + "loss": 0.0008, + "step": 43516 + }, + { + "epoch": 0.84, + "learning_rate": 3.120267174090326e-08, + "loss": 0.0003, + "step": 43517 + }, + { + "epoch": 0.84, + "learning_rate": 3.119878839656712e-08, + "loss": 0.0004, + "step": 43518 + }, + { + "epoch": 0.84, + "learning_rate": 3.119490505223098e-08, + "loss": 0.0004, + "step": 43519 + }, + { + "epoch": 0.84, + "learning_rate": 3.1191021707894837e-08, + "loss": 0.0004, + "step": 43520 + }, + { + "epoch": 0.84, + "learning_rate": 3.1187138363558695e-08, + "loss": 0.0005, + "step": 43521 + }, + { + "epoch": 0.84, + "learning_rate": 3.118325501922255e-08, + "loss": 0.8635, + "step": 43522 + }, + { + "epoch": 0.84, + "learning_rate": 3.117937167488641e-08, + "loss": 0.0004, + "step": 43523 + }, + { + "epoch": 0.84, + "learning_rate": 3.117548833055027e-08, + "loss": 0.0004, + "step": 43524 + }, + { + "epoch": 0.84, + "learning_rate": 3.117160498621413e-08, + "loss": 0.0003, + "step": 43525 + }, + { + "epoch": 0.84, + "learning_rate": 3.1167721641877986e-08, + "loss": 0.0005, + "step": 43526 + }, + { + "epoch": 0.84, + "learning_rate": 3.116383829754184e-08, + "loss": 0.0003, + "step": 43527 + }, + { + "epoch": 0.84, + "learning_rate": 3.1159954953205696e-08, + "loss": 0.0003, + "step": 43528 + }, + { + "epoch": 0.84, + "learning_rate": 3.1156071608869554e-08, + "loss": 0.0003, + "step": 43529 + }, + { + "epoch": 0.84, + "learning_rate": 3.115218826453341e-08, + "loss": 0.0002, + "step": 43530 + }, + { + "epoch": 0.84, + "learning_rate": 3.114830492019727e-08, + "loss": 0.0004, + "step": 43531 + }, + { + "epoch": 0.84, + "learning_rate": 3.114442157586113e-08, + "loss": 0.0006, + "step": 43532 + }, + { + "epoch": 0.84, + "learning_rate": 3.114053823152499e-08, + "loss": 0.0042, + "step": 43533 + }, + { + "epoch": 0.84, + "learning_rate": 3.1136654887188845e-08, + "loss": 0.0029, + "step": 43534 + }, + { + "epoch": 0.84, + "learning_rate": 3.1132771542852704e-08, + "loss": 0.0003, + "step": 43535 + }, + { + "epoch": 0.84, + "learning_rate": 3.112888819851656e-08, + "loss": 0.0003, + "step": 43536 + }, + { + "epoch": 0.84, + "learning_rate": 3.112500485418042e-08, + "loss": 0.0003, + "step": 43537 + }, + { + "epoch": 0.84, + "learning_rate": 3.112112150984428e-08, + "loss": 0.0003, + "step": 43538 + }, + { + "epoch": 0.84, + "learning_rate": 3.1117238165508137e-08, + "loss": 0.0005, + "step": 43539 + }, + { + "epoch": 0.84, + "learning_rate": 3.1113354821171995e-08, + "loss": 0.0005, + "step": 43540 + }, + { + "epoch": 0.84, + "learning_rate": 3.110947147683585e-08, + "loss": 0.0004, + "step": 43541 + }, + { + "epoch": 0.84, + "learning_rate": 3.1105588132499705e-08, + "loss": 0.1593, + "step": 43542 + }, + { + "epoch": 0.84, + "learning_rate": 3.110170478816356e-08, + "loss": 0.0004, + "step": 43543 + }, + { + "epoch": 0.84, + "learning_rate": 3.109782144382742e-08, + "loss": 0.0004, + "step": 43544 + }, + { + "epoch": 0.84, + "learning_rate": 3.109393809949128e-08, + "loss": 0.0003, + "step": 43545 + }, + { + "epoch": 0.84, + "learning_rate": 3.109005475515514e-08, + "loss": 0.0017, + "step": 43546 + }, + { + "epoch": 0.84, + "learning_rate": 3.1086171410818996e-08, + "loss": 0.0161, + "step": 43547 + }, + { + "epoch": 0.84, + "learning_rate": 3.1082288066482854e-08, + "loss": 0.0002, + "step": 43548 + }, + { + "epoch": 0.84, + "learning_rate": 3.107840472214671e-08, + "loss": 0.0004, + "step": 43549 + }, + { + "epoch": 0.84, + "learning_rate": 3.107452137781057e-08, + "loss": 0.0003, + "step": 43550 + }, + { + "epoch": 0.84, + "learning_rate": 3.107063803347443e-08, + "loss": 0.0004, + "step": 43551 + }, + { + "epoch": 0.84, + "learning_rate": 3.106675468913829e-08, + "loss": 0.6034, + "step": 43552 + }, + { + "epoch": 0.84, + "learning_rate": 3.1062871344802145e-08, + "loss": 0.0004, + "step": 43553 + }, + { + "epoch": 0.84, + "learning_rate": 3.1058988000466004e-08, + "loss": 0.6089, + "step": 43554 + }, + { + "epoch": 0.84, + "learning_rate": 3.105510465612986e-08, + "loss": 0.0004, + "step": 43555 + }, + { + "epoch": 0.84, + "learning_rate": 3.1051221311793714e-08, + "loss": 0.0003, + "step": 43556 + }, + { + "epoch": 0.84, + "learning_rate": 3.104733796745757e-08, + "loss": 0.0004, + "step": 43557 + }, + { + "epoch": 0.84, + "learning_rate": 3.104345462312143e-08, + "loss": 0.7589, + "step": 43558 + }, + { + "epoch": 0.84, + "learning_rate": 3.103957127878529e-08, + "loss": 0.0004, + "step": 43559 + }, + { + "epoch": 0.84, + "learning_rate": 3.1035687934449146e-08, + "loss": 0.0003, + "step": 43560 + }, + { + "epoch": 0.84, + "learning_rate": 3.1031804590113005e-08, + "loss": 0.0005, + "step": 43561 + }, + { + "epoch": 0.85, + "learning_rate": 3.102792124577686e-08, + "loss": 0.0004, + "step": 43562 + }, + { + "epoch": 0.85, + "learning_rate": 3.102403790144072e-08, + "loss": 0.0026, + "step": 43563 + }, + { + "epoch": 0.85, + "learning_rate": 3.102015455710458e-08, + "loss": 0.0009, + "step": 43564 + }, + { + "epoch": 0.85, + "learning_rate": 3.101627121276844e-08, + "loss": 0.0006, + "step": 43565 + }, + { + "epoch": 0.85, + "learning_rate": 3.1012387868432296e-08, + "loss": 0.0005, + "step": 43566 + }, + { + "epoch": 0.85, + "learning_rate": 3.1008504524096154e-08, + "loss": 0.0055, + "step": 43567 + }, + { + "epoch": 0.85, + "learning_rate": 3.100462117976001e-08, + "loss": 0.0005, + "step": 43568 + }, + { + "epoch": 0.85, + "learning_rate": 3.100073783542387e-08, + "loss": 0.0003, + "step": 43569 + }, + { + "epoch": 0.85, + "learning_rate": 3.099685449108773e-08, + "loss": 0.0004, + "step": 43570 + }, + { + "epoch": 0.85, + "learning_rate": 3.099297114675158e-08, + "loss": 0.0304, + "step": 43571 + }, + { + "epoch": 0.85, + "learning_rate": 3.098908780241544e-08, + "loss": 0.0004, + "step": 43572 + }, + { + "epoch": 0.85, + "learning_rate": 3.09852044580793e-08, + "loss": 0.2897, + "step": 43573 + }, + { + "epoch": 0.85, + "learning_rate": 3.0981321113743155e-08, + "loss": 0.0004, + "step": 43574 + }, + { + "epoch": 0.85, + "learning_rate": 3.0977437769407014e-08, + "loss": 0.0004, + "step": 43575 + }, + { + "epoch": 0.85, + "learning_rate": 3.097355442507087e-08, + "loss": 0.0004, + "step": 43576 + }, + { + "epoch": 0.85, + "learning_rate": 3.096967108073473e-08, + "loss": 0.0028, + "step": 43577 + }, + { + "epoch": 0.85, + "learning_rate": 3.096578773639859e-08, + "loss": 0.0005, + "step": 43578 + }, + { + "epoch": 0.85, + "learning_rate": 3.0961904392062447e-08, + "loss": 0.0004, + "step": 43579 + }, + { + "epoch": 0.85, + "learning_rate": 3.0958021047726305e-08, + "loss": 0.0003, + "step": 43580 + }, + { + "epoch": 0.85, + "learning_rate": 3.0954137703390156e-08, + "loss": 0.0024, + "step": 43581 + }, + { + "epoch": 0.85, + "learning_rate": 3.0950254359054015e-08, + "loss": 0.0006, + "step": 43582 + }, + { + "epoch": 0.85, + "learning_rate": 3.094637101471787e-08, + "loss": 0.0018, + "step": 43583 + }, + { + "epoch": 0.85, + "learning_rate": 3.094248767038173e-08, + "loss": 0.0004, + "step": 43584 + }, + { + "epoch": 0.85, + "learning_rate": 3.093860432604559e-08, + "loss": 0.2355, + "step": 43585 + }, + { + "epoch": 0.85, + "learning_rate": 3.093472098170945e-08, + "loss": 0.0333, + "step": 43586 + }, + { + "epoch": 0.85, + "learning_rate": 3.0930837637373306e-08, + "loss": 0.0006, + "step": 43587 + }, + { + "epoch": 0.85, + "learning_rate": 3.092695429303716e-08, + "loss": 0.0004, + "step": 43588 + }, + { + "epoch": 0.85, + "learning_rate": 3.0923070948701016e-08, + "loss": 0.0004, + "step": 43589 + }, + { + "epoch": 0.85, + "learning_rate": 3.0919187604364874e-08, + "loss": 0.0004, + "step": 43590 + }, + { + "epoch": 0.85, + "learning_rate": 3.091530426002873e-08, + "loss": 0.0007, + "step": 43591 + }, + { + "epoch": 0.85, + "learning_rate": 3.091142091569259e-08, + "loss": 0.0004, + "step": 43592 + }, + { + "epoch": 0.85, + "learning_rate": 3.090753757135645e-08, + "loss": 0.0004, + "step": 43593 + }, + { + "epoch": 0.85, + "learning_rate": 3.090365422702031e-08, + "loss": 0.0004, + "step": 43594 + }, + { + "epoch": 0.85, + "learning_rate": 3.0899770882684165e-08, + "loss": 0.4432, + "step": 43595 + }, + { + "epoch": 0.85, + "learning_rate": 3.0895887538348023e-08, + "loss": 0.0003, + "step": 43596 + }, + { + "epoch": 0.85, + "learning_rate": 3.089200419401188e-08, + "loss": 0.0003, + "step": 43597 + }, + { + "epoch": 0.85, + "learning_rate": 3.088812084967574e-08, + "loss": 0.2808, + "step": 43598 + }, + { + "epoch": 0.85, + "learning_rate": 3.08842375053396e-08, + "loss": 0.0004, + "step": 43599 + }, + { + "epoch": 0.85, + "learning_rate": 3.088035416100345e-08, + "loss": 0.0002, + "step": 43600 + }, + { + "epoch": 0.85, + "learning_rate": 3.087647081666731e-08, + "loss": 0.0005, + "step": 43601 + }, + { + "epoch": 0.85, + "learning_rate": 3.0872587472331166e-08, + "loss": 0.0007, + "step": 43602 + }, + { + "epoch": 0.85, + "learning_rate": 3.0868704127995025e-08, + "loss": 0.0004, + "step": 43603 + }, + { + "epoch": 0.85, + "learning_rate": 3.086482078365888e-08, + "loss": 0.0003, + "step": 43604 + }, + { + "epoch": 0.85, + "learning_rate": 3.086093743932274e-08, + "loss": 0.0019, + "step": 43605 + }, + { + "epoch": 0.85, + "learning_rate": 3.08570540949866e-08, + "loss": 0.0004, + "step": 43606 + }, + { + "epoch": 0.85, + "learning_rate": 3.085317075065046e-08, + "loss": 0.0005, + "step": 43607 + }, + { + "epoch": 0.85, + "learning_rate": 3.0849287406314316e-08, + "loss": 0.0004, + "step": 43608 + }, + { + "epoch": 0.85, + "learning_rate": 3.0845404061978174e-08, + "loss": 0.0006, + "step": 43609 + }, + { + "epoch": 0.85, + "learning_rate": 3.084152071764203e-08, + "loss": 0.0005, + "step": 43610 + }, + { + "epoch": 0.85, + "learning_rate": 3.083763737330589e-08, + "loss": 0.0005, + "step": 43611 + }, + { + "epoch": 0.85, + "learning_rate": 3.083375402896975e-08, + "loss": 0.0003, + "step": 43612 + }, + { + "epoch": 0.85, + "learning_rate": 3.082987068463361e-08, + "loss": 0.0005, + "step": 43613 + }, + { + "epoch": 0.85, + "learning_rate": 3.082598734029746e-08, + "loss": 0.0003, + "step": 43614 + }, + { + "epoch": 0.85, + "learning_rate": 3.082210399596132e-08, + "loss": 0.0004, + "step": 43615 + }, + { + "epoch": 0.85, + "learning_rate": 3.0818220651625175e-08, + "loss": 0.0139, + "step": 43616 + }, + { + "epoch": 0.85, + "learning_rate": 3.0814337307289033e-08, + "loss": 0.0002, + "step": 43617 + }, + { + "epoch": 0.85, + "learning_rate": 3.081045396295289e-08, + "loss": 0.0006, + "step": 43618 + }, + { + "epoch": 0.85, + "learning_rate": 3.080657061861675e-08, + "loss": 0.3483, + "step": 43619 + }, + { + "epoch": 0.85, + "learning_rate": 3.080268727428061e-08, + "loss": 0.0003, + "step": 43620 + }, + { + "epoch": 0.85, + "learning_rate": 3.0798803929944466e-08, + "loss": 0.0005, + "step": 43621 + }, + { + "epoch": 0.85, + "learning_rate": 3.0794920585608325e-08, + "loss": 0.0005, + "step": 43622 + }, + { + "epoch": 0.85, + "learning_rate": 3.079103724127218e-08, + "loss": 0.0008, + "step": 43623 + }, + { + "epoch": 0.85, + "learning_rate": 3.078715389693604e-08, + "loss": 0.0004, + "step": 43624 + }, + { + "epoch": 0.85, + "learning_rate": 3.07832705525999e-08, + "loss": 0.0004, + "step": 43625 + }, + { + "epoch": 0.85, + "learning_rate": 3.077938720826376e-08, + "loss": 0.0005, + "step": 43626 + }, + { + "epoch": 0.85, + "learning_rate": 3.0775503863927616e-08, + "loss": 0.0004, + "step": 43627 + }, + { + "epoch": 0.85, + "learning_rate": 3.0771620519591474e-08, + "loss": 0.0006, + "step": 43628 + }, + { + "epoch": 0.85, + "learning_rate": 3.0767737175255326e-08, + "loss": 0.0005, + "step": 43629 + }, + { + "epoch": 0.85, + "learning_rate": 3.0763853830919184e-08, + "loss": 0.0005, + "step": 43630 + }, + { + "epoch": 0.85, + "learning_rate": 3.075997048658304e-08, + "loss": 0.0004, + "step": 43631 + }, + { + "epoch": 0.85, + "learning_rate": 3.07560871422469e-08, + "loss": 0.0003, + "step": 43632 + }, + { + "epoch": 0.85, + "learning_rate": 3.075220379791076e-08, + "loss": 0.0004, + "step": 43633 + }, + { + "epoch": 0.85, + "learning_rate": 3.074832045357462e-08, + "loss": 0.0422, + "step": 43634 + }, + { + "epoch": 0.85, + "learning_rate": 3.0744437109238475e-08, + "loss": 0.0004, + "step": 43635 + }, + { + "epoch": 0.85, + "learning_rate": 3.0740553764902333e-08, + "loss": 0.0045, + "step": 43636 + }, + { + "epoch": 0.85, + "learning_rate": 3.073667042056619e-08, + "loss": 0.0004, + "step": 43637 + }, + { + "epoch": 0.85, + "learning_rate": 3.073278707623005e-08, + "loss": 0.0004, + "step": 43638 + }, + { + "epoch": 0.85, + "learning_rate": 3.072890373189391e-08, + "loss": 0.8687, + "step": 43639 + }, + { + "epoch": 0.85, + "learning_rate": 3.0725020387557766e-08, + "loss": 0.0005, + "step": 43640 + }, + { + "epoch": 0.85, + "learning_rate": 3.0721137043221625e-08, + "loss": 0.0003, + "step": 43641 + }, + { + "epoch": 0.85, + "learning_rate": 3.071725369888548e-08, + "loss": 0.0003, + "step": 43642 + }, + { + "epoch": 0.85, + "learning_rate": 3.0713370354549334e-08, + "loss": 0.7444, + "step": 43643 + }, + { + "epoch": 0.85, + "learning_rate": 3.070948701021319e-08, + "loss": 0.4568, + "step": 43644 + }, + { + "epoch": 0.85, + "learning_rate": 3.070560366587705e-08, + "loss": 0.0004, + "step": 43645 + }, + { + "epoch": 0.85, + "learning_rate": 3.070172032154091e-08, + "loss": 0.0005, + "step": 43646 + }, + { + "epoch": 0.85, + "learning_rate": 3.069783697720477e-08, + "loss": 0.0004, + "step": 43647 + }, + { + "epoch": 0.85, + "learning_rate": 3.0693953632868626e-08, + "loss": 0.0005, + "step": 43648 + }, + { + "epoch": 0.85, + "learning_rate": 3.0690070288532484e-08, + "loss": 0.0004, + "step": 43649 + }, + { + "epoch": 0.85, + "learning_rate": 3.068618694419634e-08, + "loss": 0.0007, + "step": 43650 + }, + { + "epoch": 0.85, + "learning_rate": 3.06823035998602e-08, + "loss": 0.0004, + "step": 43651 + }, + { + "epoch": 0.85, + "learning_rate": 3.067842025552406e-08, + "loss": 0.0003, + "step": 43652 + }, + { + "epoch": 0.85, + "learning_rate": 3.067453691118792e-08, + "loss": 0.2036, + "step": 43653 + }, + { + "epoch": 0.85, + "learning_rate": 3.0670653566851775e-08, + "loss": 0.0005, + "step": 43654 + }, + { + "epoch": 0.85, + "learning_rate": 3.0666770222515633e-08, + "loss": 0.0006, + "step": 43655 + }, + { + "epoch": 0.85, + "learning_rate": 3.066288687817949e-08, + "loss": 0.0005, + "step": 43656 + }, + { + "epoch": 0.85, + "learning_rate": 3.065900353384335e-08, + "loss": 0.0016, + "step": 43657 + }, + { + "epoch": 0.85, + "learning_rate": 3.06551201895072e-08, + "loss": 0.0004, + "step": 43658 + }, + { + "epoch": 0.85, + "learning_rate": 3.065123684517106e-08, + "loss": 0.0005, + "step": 43659 + }, + { + "epoch": 0.85, + "learning_rate": 3.064735350083492e-08, + "loss": 0.0003, + "step": 43660 + }, + { + "epoch": 0.85, + "learning_rate": 3.0643470156498776e-08, + "loss": 0.0004, + "step": 43661 + }, + { + "epoch": 0.85, + "learning_rate": 3.0639586812162634e-08, + "loss": 0.0004, + "step": 43662 + }, + { + "epoch": 0.85, + "learning_rate": 3.063570346782649e-08, + "loss": 0.0004, + "step": 43663 + }, + { + "epoch": 0.85, + "learning_rate": 3.063182012349035e-08, + "loss": 0.0004, + "step": 43664 + }, + { + "epoch": 0.85, + "learning_rate": 3.062793677915421e-08, + "loss": 0.0004, + "step": 43665 + }, + { + "epoch": 0.85, + "learning_rate": 3.062405343481807e-08, + "loss": 0.0008, + "step": 43666 + }, + { + "epoch": 0.85, + "learning_rate": 3.0620170090481926e-08, + "loss": 0.0003, + "step": 43667 + }, + { + "epoch": 0.85, + "learning_rate": 3.0616286746145784e-08, + "loss": 0.0007, + "step": 43668 + }, + { + "epoch": 0.85, + "learning_rate": 3.0612403401809636e-08, + "loss": 0.0011, + "step": 43669 + }, + { + "epoch": 0.85, + "learning_rate": 3.0608520057473494e-08, + "loss": 0.0005, + "step": 43670 + }, + { + "epoch": 0.85, + "learning_rate": 3.060463671313735e-08, + "loss": 0.0009, + "step": 43671 + }, + { + "epoch": 0.85, + "learning_rate": 3.060075336880121e-08, + "loss": 0.555, + "step": 43672 + }, + { + "epoch": 0.85, + "learning_rate": 3.059687002446507e-08, + "loss": 0.0002, + "step": 43673 + }, + { + "epoch": 0.85, + "learning_rate": 3.059298668012893e-08, + "loss": 0.0003, + "step": 43674 + }, + { + "epoch": 0.85, + "learning_rate": 3.0589103335792785e-08, + "loss": 0.0003, + "step": 43675 + }, + { + "epoch": 0.85, + "learning_rate": 3.058521999145664e-08, + "loss": 0.0006, + "step": 43676 + }, + { + "epoch": 0.85, + "learning_rate": 3.0581336647120495e-08, + "loss": 0.0004, + "step": 43677 + }, + { + "epoch": 0.85, + "learning_rate": 3.057745330278435e-08, + "loss": 0.0003, + "step": 43678 + }, + { + "epoch": 0.85, + "learning_rate": 3.057356995844821e-08, + "loss": 0.0004, + "step": 43679 + }, + { + "epoch": 0.85, + "learning_rate": 3.056968661411207e-08, + "loss": 0.0004, + "step": 43680 + }, + { + "epoch": 0.85, + "learning_rate": 3.056580326977593e-08, + "loss": 0.0006, + "step": 43681 + }, + { + "epoch": 0.85, + "learning_rate": 3.0561919925439786e-08, + "loss": 0.0004, + "step": 43682 + }, + { + "epoch": 0.85, + "learning_rate": 3.0558036581103644e-08, + "loss": 0.0003, + "step": 43683 + }, + { + "epoch": 0.85, + "learning_rate": 3.05541532367675e-08, + "loss": 0.0003, + "step": 43684 + }, + { + "epoch": 0.85, + "learning_rate": 3.055026989243136e-08, + "loss": 0.0555, + "step": 43685 + }, + { + "epoch": 0.85, + "learning_rate": 3.054638654809522e-08, + "loss": 0.0006, + "step": 43686 + }, + { + "epoch": 0.85, + "learning_rate": 3.054250320375907e-08, + "loss": 0.0003, + "step": 43687 + }, + { + "epoch": 0.85, + "learning_rate": 3.053861985942293e-08, + "loss": 0.0004, + "step": 43688 + }, + { + "epoch": 0.85, + "learning_rate": 3.053473651508679e-08, + "loss": 0.0004, + "step": 43689 + }, + { + "epoch": 0.85, + "learning_rate": 3.0530853170750645e-08, + "loss": 0.0005, + "step": 43690 + }, + { + "epoch": 0.85, + "learning_rate": 3.0526969826414504e-08, + "loss": 0.0004, + "step": 43691 + }, + { + "epoch": 0.85, + "learning_rate": 3.052308648207836e-08, + "loss": 0.0005, + "step": 43692 + }, + { + "epoch": 0.85, + "learning_rate": 3.051920313774222e-08, + "loss": 0.0009, + "step": 43693 + }, + { + "epoch": 0.85, + "learning_rate": 3.051531979340608e-08, + "loss": 0.0008, + "step": 43694 + }, + { + "epoch": 0.85, + "learning_rate": 3.0511436449069937e-08, + "loss": 0.0004, + "step": 43695 + }, + { + "epoch": 0.85, + "learning_rate": 3.0507553104733795e-08, + "loss": 0.0004, + "step": 43696 + }, + { + "epoch": 0.85, + "learning_rate": 3.050366976039765e-08, + "loss": 0.0004, + "step": 43697 + }, + { + "epoch": 0.85, + "learning_rate": 3.049978641606151e-08, + "loss": 0.001, + "step": 43698 + }, + { + "epoch": 0.85, + "learning_rate": 3.049590307172537e-08, + "loss": 0.0016, + "step": 43699 + }, + { + "epoch": 0.85, + "learning_rate": 3.049201972738923e-08, + "loss": 0.0004, + "step": 43700 + }, + { + "epoch": 0.85, + "learning_rate": 3.048813638305308e-08, + "loss": 0.0005, + "step": 43701 + }, + { + "epoch": 0.85, + "learning_rate": 3.048425303871694e-08, + "loss": 0.0004, + "step": 43702 + }, + { + "epoch": 0.85, + "learning_rate": 3.0480369694380796e-08, + "loss": 0.0003, + "step": 43703 + }, + { + "epoch": 0.85, + "learning_rate": 3.0476486350044654e-08, + "loss": 0.0004, + "step": 43704 + }, + { + "epoch": 0.85, + "learning_rate": 3.047260300570851e-08, + "loss": 0.0004, + "step": 43705 + }, + { + "epoch": 0.85, + "learning_rate": 3.046871966137237e-08, + "loss": 0.0003, + "step": 43706 + }, + { + "epoch": 0.85, + "learning_rate": 3.046483631703623e-08, + "loss": 0.0006, + "step": 43707 + }, + { + "epoch": 0.85, + "learning_rate": 3.046095297270009e-08, + "loss": 0.0004, + "step": 43708 + }, + { + "epoch": 0.85, + "learning_rate": 3.0457069628363945e-08, + "loss": 0.0003, + "step": 43709 + }, + { + "epoch": 0.85, + "learning_rate": 3.0453186284027804e-08, + "loss": 0.0004, + "step": 43710 + }, + { + "epoch": 0.85, + "learning_rate": 3.044930293969166e-08, + "loss": 0.0002, + "step": 43711 + }, + { + "epoch": 0.85, + "learning_rate": 3.044541959535552e-08, + "loss": 0.0004, + "step": 43712 + }, + { + "epoch": 0.85, + "learning_rate": 3.044153625101938e-08, + "loss": 0.3649, + "step": 43713 + }, + { + "epoch": 0.85, + "learning_rate": 3.043765290668324e-08, + "loss": 0.0003, + "step": 43714 + }, + { + "epoch": 0.85, + "learning_rate": 3.0433769562347095e-08, + "loss": 0.0005, + "step": 43715 + }, + { + "epoch": 0.85, + "learning_rate": 3.0429886218010947e-08, + "loss": 0.2222, + "step": 43716 + }, + { + "epoch": 0.85, + "learning_rate": 3.0426002873674805e-08, + "loss": 0.0003, + "step": 43717 + }, + { + "epoch": 0.85, + "learning_rate": 3.042211952933866e-08, + "loss": 0.0002, + "step": 43718 + }, + { + "epoch": 0.85, + "learning_rate": 3.041823618500252e-08, + "loss": 0.0003, + "step": 43719 + }, + { + "epoch": 0.85, + "learning_rate": 3.041435284066638e-08, + "loss": 0.0005, + "step": 43720 + }, + { + "epoch": 0.85, + "learning_rate": 3.041046949633024e-08, + "loss": 0.295, + "step": 43721 + }, + { + "epoch": 0.85, + "learning_rate": 3.0406586151994096e-08, + "loss": 0.0003, + "step": 43722 + }, + { + "epoch": 0.85, + "learning_rate": 3.0402702807657954e-08, + "loss": 0.0002, + "step": 43723 + }, + { + "epoch": 0.85, + "learning_rate": 3.039881946332181e-08, + "loss": 0.001, + "step": 43724 + }, + { + "epoch": 0.85, + "learning_rate": 3.039493611898567e-08, + "loss": 0.0006, + "step": 43725 + }, + { + "epoch": 0.85, + "learning_rate": 3.039105277464953e-08, + "loss": 0.0007, + "step": 43726 + }, + { + "epoch": 0.85, + "learning_rate": 3.038716943031339e-08, + "loss": 0.0633, + "step": 43727 + }, + { + "epoch": 0.85, + "learning_rate": 3.0383286085977246e-08, + "loss": 0.0004, + "step": 43728 + }, + { + "epoch": 0.85, + "learning_rate": 3.0379402741641104e-08, + "loss": 0.0005, + "step": 43729 + }, + { + "epoch": 0.85, + "learning_rate": 3.0375519397304955e-08, + "loss": 0.0004, + "step": 43730 + }, + { + "epoch": 0.85, + "learning_rate": 3.0371636052968814e-08, + "loss": 0.0006, + "step": 43731 + }, + { + "epoch": 0.85, + "learning_rate": 3.036775270863267e-08, + "loss": 0.7208, + "step": 43732 + }, + { + "epoch": 0.85, + "learning_rate": 3.036386936429653e-08, + "loss": 0.0003, + "step": 43733 + }, + { + "epoch": 0.85, + "learning_rate": 3.035998601996039e-08, + "loss": 0.0003, + "step": 43734 + }, + { + "epoch": 0.85, + "learning_rate": 3.0356102675624247e-08, + "loss": 0.7676, + "step": 43735 + }, + { + "epoch": 0.85, + "learning_rate": 3.0352219331288105e-08, + "loss": 0.0006, + "step": 43736 + }, + { + "epoch": 0.85, + "learning_rate": 3.034833598695196e-08, + "loss": 0.0004, + "step": 43737 + }, + { + "epoch": 0.85, + "learning_rate": 3.034445264261582e-08, + "loss": 0.0003, + "step": 43738 + }, + { + "epoch": 0.85, + "learning_rate": 3.034056929827968e-08, + "loss": 0.0004, + "step": 43739 + }, + { + "epoch": 0.85, + "learning_rate": 3.033668595394354e-08, + "loss": 0.7754, + "step": 43740 + }, + { + "epoch": 0.85, + "learning_rate": 3.0332802609607396e-08, + "loss": 0.0004, + "step": 43741 + }, + { + "epoch": 0.85, + "learning_rate": 3.0328919265271254e-08, + "loss": 0.0003, + "step": 43742 + }, + { + "epoch": 0.85, + "learning_rate": 3.032503592093511e-08, + "loss": 0.0003, + "step": 43743 + }, + { + "epoch": 0.85, + "learning_rate": 3.032115257659897e-08, + "loss": 0.0004, + "step": 43744 + }, + { + "epoch": 0.85, + "learning_rate": 3.031726923226282e-08, + "loss": 0.0004, + "step": 43745 + }, + { + "epoch": 0.85, + "learning_rate": 3.031338588792668e-08, + "loss": 0.0005, + "step": 43746 + }, + { + "epoch": 0.85, + "learning_rate": 3.030950254359054e-08, + "loss": 0.0005, + "step": 43747 + }, + { + "epoch": 0.85, + "learning_rate": 3.03056191992544e-08, + "loss": 0.0002, + "step": 43748 + }, + { + "epoch": 0.85, + "learning_rate": 3.0301735854918255e-08, + "loss": 0.0003, + "step": 43749 + }, + { + "epoch": 0.85, + "learning_rate": 3.0297852510582114e-08, + "loss": 0.0005, + "step": 43750 + }, + { + "epoch": 0.85, + "learning_rate": 3.029396916624597e-08, + "loss": 0.0012, + "step": 43751 + }, + { + "epoch": 0.85, + "learning_rate": 3.029008582190983e-08, + "loss": 0.0022, + "step": 43752 + }, + { + "epoch": 0.85, + "learning_rate": 3.028620247757369e-08, + "loss": 0.0012, + "step": 43753 + }, + { + "epoch": 0.85, + "learning_rate": 3.0282319133237547e-08, + "loss": 0.0003, + "step": 43754 + }, + { + "epoch": 0.85, + "learning_rate": 3.0278435788901405e-08, + "loss": 0.0005, + "step": 43755 + }, + { + "epoch": 0.85, + "learning_rate": 3.027455244456526e-08, + "loss": 0.0003, + "step": 43756 + }, + { + "epoch": 0.85, + "learning_rate": 3.027066910022912e-08, + "loss": 0.0005, + "step": 43757 + }, + { + "epoch": 0.85, + "learning_rate": 3.026678575589297e-08, + "loss": 0.0004, + "step": 43758 + }, + { + "epoch": 0.85, + "learning_rate": 3.026290241155683e-08, + "loss": 0.0005, + "step": 43759 + }, + { + "epoch": 0.85, + "learning_rate": 3.025901906722069e-08, + "loss": 0.0004, + "step": 43760 + }, + { + "epoch": 0.85, + "learning_rate": 3.025513572288455e-08, + "loss": 0.0004, + "step": 43761 + }, + { + "epoch": 0.85, + "learning_rate": 3.0251252378548406e-08, + "loss": 0.0004, + "step": 43762 + }, + { + "epoch": 0.85, + "learning_rate": 3.0247369034212264e-08, + "loss": 0.0003, + "step": 43763 + }, + { + "epoch": 0.85, + "learning_rate": 3.024348568987612e-08, + "loss": 0.0004, + "step": 43764 + }, + { + "epoch": 0.85, + "learning_rate": 3.0239602345539974e-08, + "loss": 0.0004, + "step": 43765 + }, + { + "epoch": 0.85, + "learning_rate": 3.023571900120383e-08, + "loss": 0.0003, + "step": 43766 + }, + { + "epoch": 0.85, + "learning_rate": 3.023183565686769e-08, + "loss": 0.0003, + "step": 43767 + }, + { + "epoch": 0.85, + "learning_rate": 3.022795231253155e-08, + "loss": 0.0003, + "step": 43768 + }, + { + "epoch": 0.85, + "learning_rate": 3.022406896819541e-08, + "loss": 0.0005, + "step": 43769 + }, + { + "epoch": 0.85, + "learning_rate": 3.0220185623859265e-08, + "loss": 0.0035, + "step": 43770 + }, + { + "epoch": 0.85, + "learning_rate": 3.0216302279523124e-08, + "loss": 0.6838, + "step": 43771 + }, + { + "epoch": 0.85, + "learning_rate": 3.021241893518698e-08, + "loss": 0.0003, + "step": 43772 + }, + { + "epoch": 0.85, + "learning_rate": 3.020853559085084e-08, + "loss": 0.0004, + "step": 43773 + }, + { + "epoch": 0.85, + "learning_rate": 3.020465224651469e-08, + "loss": 0.2016, + "step": 43774 + }, + { + "epoch": 0.85, + "learning_rate": 3.020076890217855e-08, + "loss": 0.0023, + "step": 43775 + }, + { + "epoch": 0.85, + "learning_rate": 3.019688555784241e-08, + "loss": 0.0004, + "step": 43776 + }, + { + "epoch": 0.85, + "learning_rate": 3.0193002213506266e-08, + "loss": 0.0003, + "step": 43777 + }, + { + "epoch": 0.85, + "learning_rate": 3.0189118869170125e-08, + "loss": 0.0004, + "step": 43778 + }, + { + "epoch": 0.85, + "learning_rate": 3.018523552483398e-08, + "loss": 0.0009, + "step": 43779 + }, + { + "epoch": 0.85, + "learning_rate": 3.018135218049784e-08, + "loss": 0.0006, + "step": 43780 + }, + { + "epoch": 0.85, + "learning_rate": 3.01774688361617e-08, + "loss": 0.0011, + "step": 43781 + }, + { + "epoch": 0.85, + "learning_rate": 3.017358549182556e-08, + "loss": 0.0003, + "step": 43782 + }, + { + "epoch": 0.85, + "learning_rate": 3.0169702147489416e-08, + "loss": 0.0004, + "step": 43783 + }, + { + "epoch": 0.85, + "learning_rate": 3.0165818803153274e-08, + "loss": 0.0002, + "step": 43784 + }, + { + "epoch": 0.85, + "learning_rate": 3.016193545881713e-08, + "loss": 0.0004, + "step": 43785 + }, + { + "epoch": 0.85, + "learning_rate": 3.015805211448099e-08, + "loss": 0.0005, + "step": 43786 + }, + { + "epoch": 0.85, + "learning_rate": 3.015416877014485e-08, + "loss": 0.0004, + "step": 43787 + }, + { + "epoch": 0.85, + "learning_rate": 3.01502854258087e-08, + "loss": 0.0003, + "step": 43788 + }, + { + "epoch": 0.85, + "learning_rate": 3.014640208147256e-08, + "loss": 0.0006, + "step": 43789 + }, + { + "epoch": 0.85, + "learning_rate": 3.014251873713642e-08, + "loss": 0.0004, + "step": 43790 + }, + { + "epoch": 0.85, + "learning_rate": 3.0138635392800275e-08, + "loss": 0.0006, + "step": 43791 + }, + { + "epoch": 0.85, + "learning_rate": 3.0134752048464133e-08, + "loss": 0.0006, + "step": 43792 + }, + { + "epoch": 0.85, + "learning_rate": 3.013086870412799e-08, + "loss": 0.0004, + "step": 43793 + }, + { + "epoch": 0.85, + "learning_rate": 3.012698535979185e-08, + "loss": 0.0077, + "step": 43794 + }, + { + "epoch": 0.85, + "learning_rate": 3.012310201545571e-08, + "loss": 0.0004, + "step": 43795 + }, + { + "epoch": 0.85, + "learning_rate": 3.0119218671119566e-08, + "loss": 0.0005, + "step": 43796 + }, + { + "epoch": 0.85, + "learning_rate": 3.0115335326783425e-08, + "loss": 0.0005, + "step": 43797 + }, + { + "epoch": 0.85, + "learning_rate": 3.011145198244728e-08, + "loss": 0.0007, + "step": 43798 + }, + { + "epoch": 0.85, + "learning_rate": 3.010756863811114e-08, + "loss": 0.0092, + "step": 43799 + }, + { + "epoch": 0.85, + "learning_rate": 3.0103685293775e-08, + "loss": 0.9439, + "step": 43800 + }, + { + "epoch": 0.85, + "learning_rate": 3.009980194943886e-08, + "loss": 0.0003, + "step": 43801 + }, + { + "epoch": 0.85, + "learning_rate": 3.0095918605102716e-08, + "loss": 0.0004, + "step": 43802 + }, + { + "epoch": 0.85, + "learning_rate": 3.009203526076657e-08, + "loss": 0.0003, + "step": 43803 + }, + { + "epoch": 0.85, + "learning_rate": 3.0088151916430426e-08, + "loss": 0.0005, + "step": 43804 + }, + { + "epoch": 0.85, + "learning_rate": 3.0084268572094284e-08, + "loss": 0.0004, + "step": 43805 + }, + { + "epoch": 0.85, + "learning_rate": 3.008038522775814e-08, + "loss": 0.0005, + "step": 43806 + }, + { + "epoch": 0.85, + "learning_rate": 3.0076501883422e-08, + "loss": 0.0763, + "step": 43807 + }, + { + "epoch": 0.85, + "learning_rate": 3.007261853908586e-08, + "loss": 0.0004, + "step": 43808 + }, + { + "epoch": 0.85, + "learning_rate": 3.006873519474972e-08, + "loss": 0.0005, + "step": 43809 + }, + { + "epoch": 0.85, + "learning_rate": 3.0064851850413575e-08, + "loss": 0.0004, + "step": 43810 + }, + { + "epoch": 0.85, + "learning_rate": 3.0060968506077433e-08, + "loss": 0.0005, + "step": 43811 + }, + { + "epoch": 0.85, + "learning_rate": 3.005708516174129e-08, + "loss": 0.0002, + "step": 43812 + }, + { + "epoch": 0.85, + "learning_rate": 3.005320181740515e-08, + "loss": 0.0532, + "step": 43813 + }, + { + "epoch": 0.85, + "learning_rate": 3.004931847306901e-08, + "loss": 0.0005, + "step": 43814 + }, + { + "epoch": 0.85, + "learning_rate": 3.0045435128732866e-08, + "loss": 0.0003, + "step": 43815 + }, + { + "epoch": 0.85, + "learning_rate": 3.0041551784396725e-08, + "loss": 0.0003, + "step": 43816 + }, + { + "epoch": 0.85, + "learning_rate": 3.0037668440060576e-08, + "loss": 0.0003, + "step": 43817 + }, + { + "epoch": 0.85, + "learning_rate": 3.0033785095724435e-08, + "loss": 0.0003, + "step": 43818 + }, + { + "epoch": 0.85, + "learning_rate": 3.002990175138829e-08, + "loss": 0.0003, + "step": 43819 + }, + { + "epoch": 0.85, + "learning_rate": 3.002601840705215e-08, + "loss": 0.6538, + "step": 43820 + }, + { + "epoch": 0.85, + "learning_rate": 3.002213506271601e-08, + "loss": 0.0003, + "step": 43821 + }, + { + "epoch": 0.85, + "learning_rate": 3.001825171837987e-08, + "loss": 0.0005, + "step": 43822 + }, + { + "epoch": 0.85, + "learning_rate": 3.0014368374043726e-08, + "loss": 0.0005, + "step": 43823 + }, + { + "epoch": 0.85, + "learning_rate": 3.0010485029707584e-08, + "loss": 0.0005, + "step": 43824 + }, + { + "epoch": 0.85, + "learning_rate": 3.000660168537144e-08, + "loss": 0.0003, + "step": 43825 + }, + { + "epoch": 0.85, + "learning_rate": 3.00027183410353e-08, + "loss": 0.0004, + "step": 43826 + }, + { + "epoch": 0.85, + "learning_rate": 2.999883499669916e-08, + "loss": 0.0006, + "step": 43827 + }, + { + "epoch": 0.85, + "learning_rate": 2.999495165236302e-08, + "loss": 0.1126, + "step": 43828 + }, + { + "epoch": 0.85, + "learning_rate": 2.9991068308026875e-08, + "loss": 0.0004, + "step": 43829 + }, + { + "epoch": 0.85, + "learning_rate": 2.9987184963690733e-08, + "loss": 0.0007, + "step": 43830 + }, + { + "epoch": 0.85, + "learning_rate": 2.998330161935459e-08, + "loss": 0.0003, + "step": 43831 + }, + { + "epoch": 0.85, + "learning_rate": 2.9979418275018443e-08, + "loss": 0.0004, + "step": 43832 + }, + { + "epoch": 0.85, + "learning_rate": 2.99755349306823e-08, + "loss": 0.0005, + "step": 43833 + }, + { + "epoch": 0.85, + "learning_rate": 2.997165158634616e-08, + "loss": 0.0004, + "step": 43834 + }, + { + "epoch": 0.85, + "learning_rate": 2.996776824201002e-08, + "loss": 0.0005, + "step": 43835 + }, + { + "epoch": 0.85, + "learning_rate": 2.9963884897673876e-08, + "loss": 0.0004, + "step": 43836 + }, + { + "epoch": 0.85, + "learning_rate": 2.9960001553337735e-08, + "loss": 0.0005, + "step": 43837 + }, + { + "epoch": 0.85, + "learning_rate": 2.995611820900159e-08, + "loss": 0.0004, + "step": 43838 + }, + { + "epoch": 0.85, + "learning_rate": 2.995223486466545e-08, + "loss": 0.0017, + "step": 43839 + }, + { + "epoch": 0.85, + "learning_rate": 2.994835152032931e-08, + "loss": 0.0004, + "step": 43840 + }, + { + "epoch": 0.85, + "learning_rate": 2.994446817599317e-08, + "loss": 0.0004, + "step": 43841 + }, + { + "epoch": 0.85, + "learning_rate": 2.9940584831657026e-08, + "loss": 0.0005, + "step": 43842 + }, + { + "epoch": 0.85, + "learning_rate": 2.9936701487320884e-08, + "loss": 0.0003, + "step": 43843 + }, + { + "epoch": 0.85, + "learning_rate": 2.993281814298474e-08, + "loss": 0.5669, + "step": 43844 + }, + { + "epoch": 0.85, + "learning_rate": 2.99289347986486e-08, + "loss": 0.0004, + "step": 43845 + }, + { + "epoch": 0.85, + "learning_rate": 2.992505145431245e-08, + "loss": 0.0002, + "step": 43846 + }, + { + "epoch": 0.85, + "learning_rate": 2.992116810997631e-08, + "loss": 0.0003, + "step": 43847 + }, + { + "epoch": 0.85, + "learning_rate": 2.991728476564017e-08, + "loss": 0.0003, + "step": 43848 + }, + { + "epoch": 0.85, + "learning_rate": 2.991340142130403e-08, + "loss": 0.0003, + "step": 43849 + }, + { + "epoch": 0.85, + "learning_rate": 2.9909518076967885e-08, + "loss": 0.0004, + "step": 43850 + }, + { + "epoch": 0.85, + "learning_rate": 2.9905634732631743e-08, + "loss": 0.0003, + "step": 43851 + }, + { + "epoch": 0.85, + "learning_rate": 2.99017513882956e-08, + "loss": 0.0686, + "step": 43852 + }, + { + "epoch": 0.85, + "learning_rate": 2.989786804395946e-08, + "loss": 0.0006, + "step": 43853 + }, + { + "epoch": 0.85, + "learning_rate": 2.989398469962331e-08, + "loss": 0.0005, + "step": 43854 + }, + { + "epoch": 0.85, + "learning_rate": 2.989010135528717e-08, + "loss": 0.1079, + "step": 43855 + }, + { + "epoch": 0.85, + "learning_rate": 2.988621801095103e-08, + "loss": 0.0009, + "step": 43856 + }, + { + "epoch": 0.85, + "learning_rate": 2.9882334666614886e-08, + "loss": 0.0004, + "step": 43857 + }, + { + "epoch": 0.85, + "learning_rate": 2.9878451322278744e-08, + "loss": 0.0003, + "step": 43858 + }, + { + "epoch": 0.85, + "learning_rate": 2.98745679779426e-08, + "loss": 0.0004, + "step": 43859 + }, + { + "epoch": 0.85, + "learning_rate": 2.987068463360646e-08, + "loss": 0.0005, + "step": 43860 + }, + { + "epoch": 0.85, + "learning_rate": 2.986680128927031e-08, + "loss": 0.0003, + "step": 43861 + }, + { + "epoch": 0.85, + "learning_rate": 2.986291794493417e-08, + "loss": 0.0003, + "step": 43862 + }, + { + "epoch": 0.85, + "learning_rate": 2.985903460059803e-08, + "loss": 0.3078, + "step": 43863 + }, + { + "epoch": 0.85, + "learning_rate": 2.985515125626189e-08, + "loss": 0.0003, + "step": 43864 + }, + { + "epoch": 0.85, + "learning_rate": 2.9851267911925746e-08, + "loss": 0.0004, + "step": 43865 + }, + { + "epoch": 0.85, + "learning_rate": 2.9847384567589604e-08, + "loss": 0.0006, + "step": 43866 + }, + { + "epoch": 0.85, + "learning_rate": 2.984350122325346e-08, + "loss": 0.0004, + "step": 43867 + }, + { + "epoch": 0.85, + "learning_rate": 2.983961787891732e-08, + "loss": 0.0004, + "step": 43868 + }, + { + "epoch": 0.85, + "learning_rate": 2.983573453458118e-08, + "loss": 0.0008, + "step": 43869 + }, + { + "epoch": 0.85, + "learning_rate": 2.983185119024504e-08, + "loss": 0.0003, + "step": 43870 + }, + { + "epoch": 0.85, + "learning_rate": 2.9827967845908895e-08, + "loss": 0.0004, + "step": 43871 + }, + { + "epoch": 0.85, + "learning_rate": 2.982408450157275e-08, + "loss": 0.0004, + "step": 43872 + }, + { + "epoch": 0.85, + "learning_rate": 2.982020115723661e-08, + "loss": 0.0011, + "step": 43873 + }, + { + "epoch": 0.85, + "learning_rate": 2.981631781290047e-08, + "loss": 0.0132, + "step": 43874 + }, + { + "epoch": 0.85, + "learning_rate": 2.981243446856432e-08, + "loss": 0.0003, + "step": 43875 + }, + { + "epoch": 0.85, + "learning_rate": 2.980855112422818e-08, + "loss": 0.0004, + "step": 43876 + }, + { + "epoch": 0.85, + "learning_rate": 2.980466777989204e-08, + "loss": 0.0005, + "step": 43877 + }, + { + "epoch": 0.85, + "learning_rate": 2.98007844355559e-08, + "loss": 0.229, + "step": 43878 + }, + { + "epoch": 0.85, + "learning_rate": 2.9796901091219758e-08, + "loss": 0.0003, + "step": 43879 + }, + { + "epoch": 0.85, + "learning_rate": 2.9793017746883613e-08, + "loss": 0.0005, + "step": 43880 + }, + { + "epoch": 0.85, + "learning_rate": 2.978913440254747e-08, + "loss": 0.0004, + "step": 43881 + }, + { + "epoch": 0.85, + "learning_rate": 2.978525105821133e-08, + "loss": 0.0004, + "step": 43882 + }, + { + "epoch": 0.85, + "learning_rate": 2.9781367713875187e-08, + "loss": 0.0003, + "step": 43883 + }, + { + "epoch": 0.85, + "learning_rate": 2.9777484369539046e-08, + "loss": 0.0003, + "step": 43884 + }, + { + "epoch": 0.85, + "learning_rate": 2.9773601025202904e-08, + "loss": 0.0005, + "step": 43885 + }, + { + "epoch": 0.85, + "learning_rate": 2.9769717680866762e-08, + "loss": 1.2298, + "step": 43886 + }, + { + "epoch": 0.85, + "learning_rate": 2.976583433653062e-08, + "loss": 0.0003, + "step": 43887 + }, + { + "epoch": 0.85, + "learning_rate": 2.976195099219448e-08, + "loss": 0.0003, + "step": 43888 + }, + { + "epoch": 0.85, + "learning_rate": 2.9758067647858337e-08, + "loss": 0.18, + "step": 43889 + }, + { + "epoch": 0.85, + "learning_rate": 2.975418430352219e-08, + "loss": 0.5603, + "step": 43890 + }, + { + "epoch": 0.85, + "learning_rate": 2.9750300959186047e-08, + "loss": 0.0004, + "step": 43891 + }, + { + "epoch": 0.85, + "learning_rate": 2.9746417614849905e-08, + "loss": 0.0005, + "step": 43892 + }, + { + "epoch": 0.85, + "learning_rate": 2.9742534270513763e-08, + "loss": 0.0016, + "step": 43893 + }, + { + "epoch": 0.85, + "learning_rate": 2.973865092617762e-08, + "loss": 0.0004, + "step": 43894 + }, + { + "epoch": 0.85, + "learning_rate": 2.973476758184148e-08, + "loss": 0.0004, + "step": 43895 + }, + { + "epoch": 0.85, + "learning_rate": 2.9730884237505338e-08, + "loss": 0.0005, + "step": 43896 + }, + { + "epoch": 0.85, + "learning_rate": 2.9727000893169196e-08, + "loss": 0.0146, + "step": 43897 + }, + { + "epoch": 0.85, + "learning_rate": 2.9723117548833054e-08, + "loss": 0.0003, + "step": 43898 + }, + { + "epoch": 0.85, + "learning_rate": 2.9719234204496913e-08, + "loss": 0.0002, + "step": 43899 + }, + { + "epoch": 0.85, + "learning_rate": 2.971535086016077e-08, + "loss": 0.0028, + "step": 43900 + }, + { + "epoch": 0.85, + "learning_rate": 2.971146751582463e-08, + "loss": 0.0004, + "step": 43901 + }, + { + "epoch": 0.85, + "learning_rate": 2.9707584171488487e-08, + "loss": 0.0003, + "step": 43902 + }, + { + "epoch": 0.85, + "learning_rate": 2.9703700827152346e-08, + "loss": 0.0003, + "step": 43903 + }, + { + "epoch": 0.85, + "learning_rate": 2.9699817482816197e-08, + "loss": 0.0004, + "step": 43904 + }, + { + "epoch": 0.85, + "learning_rate": 2.9695934138480055e-08, + "loss": 1.2207, + "step": 43905 + }, + { + "epoch": 0.85, + "learning_rate": 2.9692050794143914e-08, + "loss": 0.0006, + "step": 43906 + }, + { + "epoch": 0.85, + "learning_rate": 2.9688167449807772e-08, + "loss": 0.0005, + "step": 43907 + }, + { + "epoch": 0.85, + "learning_rate": 2.968428410547163e-08, + "loss": 0.0004, + "step": 43908 + }, + { + "epoch": 0.85, + "learning_rate": 2.968040076113549e-08, + "loss": 0.0003, + "step": 43909 + }, + { + "epoch": 0.85, + "learning_rate": 2.9676517416799347e-08, + "loss": 0.0564, + "step": 43910 + }, + { + "epoch": 0.85, + "learning_rate": 2.9672634072463205e-08, + "loss": 0.0005, + "step": 43911 + }, + { + "epoch": 0.85, + "learning_rate": 2.9668750728127063e-08, + "loss": 0.0004, + "step": 43912 + }, + { + "epoch": 0.85, + "learning_rate": 2.966486738379092e-08, + "loss": 0.0021, + "step": 43913 + }, + { + "epoch": 0.85, + "learning_rate": 2.966098403945478e-08, + "loss": 0.0003, + "step": 43914 + }, + { + "epoch": 0.85, + "learning_rate": 2.9657100695118638e-08, + "loss": 0.0004, + "step": 43915 + }, + { + "epoch": 0.85, + "learning_rate": 2.9653217350782496e-08, + "loss": 0.7532, + "step": 43916 + }, + { + "epoch": 0.85, + "learning_rate": 2.964933400644635e-08, + "loss": 0.004, + "step": 43917 + }, + { + "epoch": 0.85, + "learning_rate": 2.964545066211021e-08, + "loss": 0.0007, + "step": 43918 + }, + { + "epoch": 0.85, + "learning_rate": 2.9641567317774064e-08, + "loss": 0.0005, + "step": 43919 + }, + { + "epoch": 0.85, + "learning_rate": 2.9637683973437923e-08, + "loss": 0.0035, + "step": 43920 + }, + { + "epoch": 0.85, + "learning_rate": 2.963380062910178e-08, + "loss": 0.9138, + "step": 43921 + }, + { + "epoch": 0.85, + "learning_rate": 2.962991728476564e-08, + "loss": 0.0004, + "step": 43922 + }, + { + "epoch": 0.85, + "learning_rate": 2.9626033940429497e-08, + "loss": 0.0004, + "step": 43923 + }, + { + "epoch": 0.85, + "learning_rate": 2.9622150596093352e-08, + "loss": 0.0003, + "step": 43924 + }, + { + "epoch": 0.85, + "learning_rate": 2.961826725175721e-08, + "loss": 0.0004, + "step": 43925 + }, + { + "epoch": 0.85, + "learning_rate": 2.961438390742107e-08, + "loss": 0.0004, + "step": 43926 + }, + { + "epoch": 0.85, + "learning_rate": 2.9610500563084927e-08, + "loss": 0.2731, + "step": 43927 + }, + { + "epoch": 0.85, + "learning_rate": 2.9606617218748785e-08, + "loss": 1.1223, + "step": 43928 + }, + { + "epoch": 0.85, + "learning_rate": 2.9602733874412643e-08, + "loss": 0.0004, + "step": 43929 + }, + { + "epoch": 0.85, + "learning_rate": 2.9598850530076502e-08, + "loss": 0.8499, + "step": 43930 + }, + { + "epoch": 0.85, + "learning_rate": 2.959496718574036e-08, + "loss": 0.0004, + "step": 43931 + }, + { + "epoch": 0.85, + "learning_rate": 2.9591083841404218e-08, + "loss": 0.0004, + "step": 43932 + }, + { + "epoch": 0.85, + "learning_rate": 2.958720049706807e-08, + "loss": 0.0003, + "step": 43933 + }, + { + "epoch": 0.85, + "learning_rate": 2.9583317152731928e-08, + "loss": 0.0003, + "step": 43934 + }, + { + "epoch": 0.85, + "learning_rate": 2.9579433808395786e-08, + "loss": 0.0004, + "step": 43935 + }, + { + "epoch": 0.85, + "learning_rate": 2.9575550464059645e-08, + "loss": 0.0002, + "step": 43936 + }, + { + "epoch": 0.85, + "learning_rate": 2.9571667119723503e-08, + "loss": 0.0007, + "step": 43937 + }, + { + "epoch": 0.85, + "learning_rate": 2.956778377538736e-08, + "loss": 0.0004, + "step": 43938 + }, + { + "epoch": 0.85, + "learning_rate": 2.956390043105122e-08, + "loss": 0.0003, + "step": 43939 + }, + { + "epoch": 0.85, + "learning_rate": 2.9560017086715078e-08, + "loss": 0.0003, + "step": 43940 + }, + { + "epoch": 0.85, + "learning_rate": 2.9556133742378936e-08, + "loss": 0.0004, + "step": 43941 + }, + { + "epoch": 0.85, + "learning_rate": 2.9552250398042794e-08, + "loss": 0.0004, + "step": 43942 + }, + { + "epoch": 0.85, + "learning_rate": 2.9548367053706652e-08, + "loss": 0.3919, + "step": 43943 + }, + { + "epoch": 0.85, + "learning_rate": 2.954448370937051e-08, + "loss": 0.0003, + "step": 43944 + }, + { + "epoch": 0.85, + "learning_rate": 2.954060036503437e-08, + "loss": 0.0003, + "step": 43945 + }, + { + "epoch": 0.85, + "learning_rate": 2.9536717020698227e-08, + "loss": 0.0003, + "step": 43946 + }, + { + "epoch": 0.85, + "learning_rate": 2.9532833676362085e-08, + "loss": 0.0005, + "step": 43947 + }, + { + "epoch": 0.85, + "learning_rate": 2.9528950332025937e-08, + "loss": 0.0027, + "step": 43948 + }, + { + "epoch": 0.85, + "learning_rate": 2.9525066987689795e-08, + "loss": 0.0004, + "step": 43949 + }, + { + "epoch": 0.85, + "learning_rate": 2.9521183643353653e-08, + "loss": 0.0004, + "step": 43950 + }, + { + "epoch": 0.85, + "learning_rate": 2.951730029901751e-08, + "loss": 1.1579, + "step": 43951 + }, + { + "epoch": 0.85, + "learning_rate": 2.951341695468137e-08, + "loss": 0.0003, + "step": 43952 + }, + { + "epoch": 0.85, + "learning_rate": 2.9509533610345228e-08, + "loss": 0.0004, + "step": 43953 + }, + { + "epoch": 0.85, + "learning_rate": 2.9505650266009086e-08, + "loss": 0.0277, + "step": 43954 + }, + { + "epoch": 0.85, + "learning_rate": 2.9501766921672945e-08, + "loss": 0.0004, + "step": 43955 + }, + { + "epoch": 0.85, + "learning_rate": 2.9497883577336803e-08, + "loss": 0.0004, + "step": 43956 + }, + { + "epoch": 0.85, + "learning_rate": 2.949400023300066e-08, + "loss": 0.0004, + "step": 43957 + }, + { + "epoch": 0.85, + "learning_rate": 2.949011688866452e-08, + "loss": 0.0004, + "step": 43958 + }, + { + "epoch": 0.85, + "learning_rate": 2.9486233544328378e-08, + "loss": 0.0004, + "step": 43959 + }, + { + "epoch": 0.85, + "learning_rate": 2.9482350199992236e-08, + "loss": 0.0004, + "step": 43960 + }, + { + "epoch": 0.85, + "learning_rate": 2.947846685565609e-08, + "loss": 0.0005, + "step": 43961 + }, + { + "epoch": 0.85, + "learning_rate": 2.9474583511319946e-08, + "loss": 0.0004, + "step": 43962 + }, + { + "epoch": 0.85, + "learning_rate": 2.9470700166983804e-08, + "loss": 0.0003, + "step": 43963 + }, + { + "epoch": 0.85, + "learning_rate": 2.9466816822647662e-08, + "loss": 0.0003, + "step": 43964 + }, + { + "epoch": 0.85, + "learning_rate": 2.946293347831152e-08, + "loss": 0.7795, + "step": 43965 + }, + { + "epoch": 0.85, + "learning_rate": 2.945905013397538e-08, + "loss": 1.1929, + "step": 43966 + }, + { + "epoch": 0.85, + "learning_rate": 2.9455166789639237e-08, + "loss": 0.0003, + "step": 43967 + }, + { + "epoch": 0.85, + "learning_rate": 2.9451283445303092e-08, + "loss": 0.0004, + "step": 43968 + }, + { + "epoch": 0.85, + "learning_rate": 2.944740010096695e-08, + "loss": 0.0002, + "step": 43969 + }, + { + "epoch": 0.85, + "learning_rate": 2.9443516756630808e-08, + "loss": 0.7978, + "step": 43970 + }, + { + "epoch": 0.85, + "learning_rate": 2.9439633412294667e-08, + "loss": 0.0003, + "step": 43971 + }, + { + "epoch": 0.85, + "learning_rate": 2.9435750067958525e-08, + "loss": 0.0005, + "step": 43972 + }, + { + "epoch": 0.85, + "learning_rate": 2.9431866723622383e-08, + "loss": 0.0004, + "step": 43973 + }, + { + "epoch": 0.85, + "learning_rate": 2.942798337928624e-08, + "loss": 0.0004, + "step": 43974 + }, + { + "epoch": 0.85, + "learning_rate": 2.94241000349501e-08, + "loss": 0.0004, + "step": 43975 + }, + { + "epoch": 0.85, + "learning_rate": 2.9420216690613958e-08, + "loss": 0.0004, + "step": 43976 + }, + { + "epoch": 0.85, + "learning_rate": 2.941633334627781e-08, + "loss": 0.0004, + "step": 43977 + }, + { + "epoch": 0.85, + "learning_rate": 2.9412450001941668e-08, + "loss": 0.0004, + "step": 43978 + }, + { + "epoch": 0.85, + "learning_rate": 2.9408566657605526e-08, + "loss": 0.0005, + "step": 43979 + }, + { + "epoch": 0.85, + "learning_rate": 2.9404683313269384e-08, + "loss": 0.0005, + "step": 43980 + }, + { + "epoch": 0.85, + "learning_rate": 2.9400799968933242e-08, + "loss": 0.0004, + "step": 43981 + }, + { + "epoch": 0.85, + "learning_rate": 2.93969166245971e-08, + "loss": 0.961, + "step": 43982 + }, + { + "epoch": 0.85, + "learning_rate": 2.939303328026096e-08, + "loss": 0.0003, + "step": 43983 + }, + { + "epoch": 0.85, + "learning_rate": 2.9389149935924817e-08, + "loss": 0.0004, + "step": 43984 + }, + { + "epoch": 0.85, + "learning_rate": 2.9385266591588675e-08, + "loss": 0.0003, + "step": 43985 + }, + { + "epoch": 0.85, + "learning_rate": 2.9381383247252534e-08, + "loss": 0.0004, + "step": 43986 + }, + { + "epoch": 0.85, + "learning_rate": 2.9377499902916392e-08, + "loss": 0.0003, + "step": 43987 + }, + { + "epoch": 0.85, + "learning_rate": 2.937361655858025e-08, + "loss": 0.0005, + "step": 43988 + }, + { + "epoch": 0.85, + "learning_rate": 2.9369733214244108e-08, + "loss": 0.0004, + "step": 43989 + }, + { + "epoch": 0.85, + "learning_rate": 2.9365849869907967e-08, + "loss": 0.9722, + "step": 43990 + }, + { + "epoch": 0.85, + "learning_rate": 2.9361966525571818e-08, + "loss": 0.0004, + "step": 43991 + }, + { + "epoch": 0.85, + "learning_rate": 2.9358083181235676e-08, + "loss": 0.0004, + "step": 43992 + }, + { + "epoch": 0.85, + "learning_rate": 2.9354199836899535e-08, + "loss": 0.0004, + "step": 43993 + }, + { + "epoch": 0.85, + "learning_rate": 2.9350316492563393e-08, + "loss": 0.0006, + "step": 43994 + }, + { + "epoch": 0.85, + "learning_rate": 2.934643314822725e-08, + "loss": 0.0067, + "step": 43995 + }, + { + "epoch": 0.85, + "learning_rate": 2.934254980389111e-08, + "loss": 0.0005, + "step": 43996 + }, + { + "epoch": 0.85, + "learning_rate": 2.9338666459554968e-08, + "loss": 0.0004, + "step": 43997 + }, + { + "epoch": 0.85, + "learning_rate": 2.9334783115218826e-08, + "loss": 0.0003, + "step": 43998 + }, + { + "epoch": 0.85, + "learning_rate": 2.9330899770882684e-08, + "loss": 0.0004, + "step": 43999 + }, + { + "epoch": 0.85, + "learning_rate": 2.9327016426546542e-08, + "loss": 0.003, + "step": 44000 + }, + { + "epoch": 0.85, + "learning_rate": 2.93231330822104e-08, + "loss": 0.0003, + "step": 44001 + }, + { + "epoch": 0.85, + "learning_rate": 2.931924973787426e-08, + "loss": 0.0004, + "step": 44002 + }, + { + "epoch": 0.85, + "learning_rate": 2.9315366393538117e-08, + "loss": 0.0003, + "step": 44003 + }, + { + "epoch": 0.85, + "learning_rate": 2.9311483049201975e-08, + "loss": 0.7922, + "step": 44004 + }, + { + "epoch": 0.85, + "learning_rate": 2.930759970486583e-08, + "loss": 0.0008, + "step": 44005 + }, + { + "epoch": 0.85, + "learning_rate": 2.9303716360529685e-08, + "loss": 0.0005, + "step": 44006 + }, + { + "epoch": 0.85, + "learning_rate": 2.9299833016193543e-08, + "loss": 0.0006, + "step": 44007 + }, + { + "epoch": 0.85, + "learning_rate": 2.9295949671857402e-08, + "loss": 0.0007, + "step": 44008 + }, + { + "epoch": 0.85, + "learning_rate": 2.929206632752126e-08, + "loss": 0.0003, + "step": 44009 + }, + { + "epoch": 0.85, + "learning_rate": 2.9288182983185118e-08, + "loss": 0.0003, + "step": 44010 + }, + { + "epoch": 0.85, + "learning_rate": 2.9284299638848976e-08, + "loss": 0.8947, + "step": 44011 + }, + { + "epoch": 0.85, + "learning_rate": 2.928041629451283e-08, + "loss": 0.0004, + "step": 44012 + }, + { + "epoch": 0.85, + "learning_rate": 2.927653295017669e-08, + "loss": 0.0004, + "step": 44013 + }, + { + "epoch": 0.85, + "learning_rate": 2.9272649605840548e-08, + "loss": 0.0133, + "step": 44014 + }, + { + "epoch": 0.85, + "learning_rate": 2.9268766261504406e-08, + "loss": 0.0007, + "step": 44015 + }, + { + "epoch": 0.85, + "learning_rate": 2.9264882917168264e-08, + "loss": 0.0004, + "step": 44016 + }, + { + "epoch": 0.85, + "learning_rate": 2.9260999572832123e-08, + "loss": 0.0007, + "step": 44017 + }, + { + "epoch": 0.85, + "learning_rate": 2.925711622849598e-08, + "loss": 0.0003, + "step": 44018 + }, + { + "epoch": 0.85, + "learning_rate": 2.925323288415984e-08, + "loss": 0.0005, + "step": 44019 + }, + { + "epoch": 0.85, + "learning_rate": 2.924934953982369e-08, + "loss": 0.0004, + "step": 44020 + }, + { + "epoch": 0.85, + "learning_rate": 2.924546619548755e-08, + "loss": 0.0004, + "step": 44021 + }, + { + "epoch": 0.85, + "learning_rate": 2.9241582851151407e-08, + "loss": 0.0074, + "step": 44022 + }, + { + "epoch": 0.85, + "learning_rate": 2.9237699506815265e-08, + "loss": 0.0004, + "step": 44023 + }, + { + "epoch": 0.85, + "learning_rate": 2.9233816162479124e-08, + "loss": 0.0004, + "step": 44024 + }, + { + "epoch": 0.85, + "learning_rate": 2.9229932818142982e-08, + "loss": 0.0005, + "step": 44025 + }, + { + "epoch": 0.85, + "learning_rate": 2.922604947380684e-08, + "loss": 0.0004, + "step": 44026 + }, + { + "epoch": 0.85, + "learning_rate": 2.92221661294707e-08, + "loss": 0.0006, + "step": 44027 + }, + { + "epoch": 0.85, + "learning_rate": 2.9218282785134557e-08, + "loss": 0.0004, + "step": 44028 + }, + { + "epoch": 0.85, + "learning_rate": 2.9214399440798415e-08, + "loss": 0.8954, + "step": 44029 + }, + { + "epoch": 0.85, + "learning_rate": 2.9210516096462273e-08, + "loss": 0.0003, + "step": 44030 + }, + { + "epoch": 0.85, + "learning_rate": 2.920663275212613e-08, + "loss": 0.0003, + "step": 44031 + }, + { + "epoch": 0.85, + "learning_rate": 2.920274940778999e-08, + "loss": 0.0005, + "step": 44032 + }, + { + "epoch": 0.85, + "learning_rate": 2.9198866063453848e-08, + "loss": 0.0004, + "step": 44033 + }, + { + "epoch": 0.85, + "learning_rate": 2.9194982719117706e-08, + "loss": 0.0004, + "step": 44034 + }, + { + "epoch": 0.85, + "learning_rate": 2.9191099374781558e-08, + "loss": 0.0005, + "step": 44035 + }, + { + "epoch": 0.85, + "learning_rate": 2.9187216030445416e-08, + "loss": 0.0004, + "step": 44036 + }, + { + "epoch": 0.85, + "learning_rate": 2.9183332686109274e-08, + "loss": 0.0009, + "step": 44037 + }, + { + "epoch": 0.85, + "learning_rate": 2.9179449341773133e-08, + "loss": 0.0081, + "step": 44038 + }, + { + "epoch": 0.85, + "learning_rate": 2.917556599743699e-08, + "loss": 0.0004, + "step": 44039 + }, + { + "epoch": 0.85, + "learning_rate": 2.917168265310085e-08, + "loss": 0.0003, + "step": 44040 + }, + { + "epoch": 0.85, + "learning_rate": 2.9167799308764707e-08, + "loss": 0.0004, + "step": 44041 + }, + { + "epoch": 0.85, + "learning_rate": 2.9163915964428565e-08, + "loss": 0.0002, + "step": 44042 + }, + { + "epoch": 0.85, + "learning_rate": 2.9160032620092424e-08, + "loss": 0.0005, + "step": 44043 + }, + { + "epoch": 0.85, + "learning_rate": 2.9156149275756282e-08, + "loss": 0.0003, + "step": 44044 + }, + { + "epoch": 0.85, + "learning_rate": 2.915226593142014e-08, + "loss": 0.0005, + "step": 44045 + }, + { + "epoch": 0.85, + "learning_rate": 2.9148382587084e-08, + "loss": 0.0003, + "step": 44046 + }, + { + "epoch": 0.85, + "learning_rate": 2.9144499242747857e-08, + "loss": 0.0002, + "step": 44047 + }, + { + "epoch": 0.85, + "learning_rate": 2.9140615898411715e-08, + "loss": 0.0006, + "step": 44048 + }, + { + "epoch": 0.85, + "learning_rate": 2.9136732554075567e-08, + "loss": 0.0005, + "step": 44049 + }, + { + "epoch": 0.85, + "learning_rate": 2.9132849209739425e-08, + "loss": 0.0114, + "step": 44050 + }, + { + "epoch": 0.85, + "learning_rate": 2.9128965865403283e-08, + "loss": 0.0003, + "step": 44051 + }, + { + "epoch": 0.85, + "learning_rate": 2.912508252106714e-08, + "loss": 0.0003, + "step": 44052 + }, + { + "epoch": 0.85, + "learning_rate": 2.9121199176731e-08, + "loss": 0.0004, + "step": 44053 + }, + { + "epoch": 0.85, + "learning_rate": 2.9117315832394858e-08, + "loss": 0.001, + "step": 44054 + }, + { + "epoch": 0.85, + "learning_rate": 2.9113432488058716e-08, + "loss": 0.086, + "step": 44055 + }, + { + "epoch": 0.85, + "learning_rate": 2.9109549143722574e-08, + "loss": 0.0004, + "step": 44056 + }, + { + "epoch": 0.85, + "learning_rate": 2.910566579938643e-08, + "loss": 0.0003, + "step": 44057 + }, + { + "epoch": 0.85, + "learning_rate": 2.9101782455050287e-08, + "loss": 0.0004, + "step": 44058 + }, + { + "epoch": 0.85, + "learning_rate": 2.9097899110714146e-08, + "loss": 0.0004, + "step": 44059 + }, + { + "epoch": 0.85, + "learning_rate": 2.9094015766378004e-08, + "loss": 0.0004, + "step": 44060 + }, + { + "epoch": 0.85, + "learning_rate": 2.9090132422041862e-08, + "loss": 0.0003, + "step": 44061 + }, + { + "epoch": 0.85, + "learning_rate": 2.908624907770572e-08, + "loss": 0.0005, + "step": 44062 + }, + { + "epoch": 0.85, + "learning_rate": 2.908236573336958e-08, + "loss": 0.0004, + "step": 44063 + }, + { + "epoch": 0.85, + "learning_rate": 2.907848238903343e-08, + "loss": 0.0004, + "step": 44064 + }, + { + "epoch": 0.85, + "learning_rate": 2.907459904469729e-08, + "loss": 0.0004, + "step": 44065 + }, + { + "epoch": 0.85, + "learning_rate": 2.9070715700361147e-08, + "loss": 0.0004, + "step": 44066 + }, + { + "epoch": 0.85, + "learning_rate": 2.9066832356025005e-08, + "loss": 0.0003, + "step": 44067 + }, + { + "epoch": 0.85, + "learning_rate": 2.9062949011688863e-08, + "loss": 0.0005, + "step": 44068 + }, + { + "epoch": 0.85, + "learning_rate": 2.905906566735272e-08, + "loss": 0.0003, + "step": 44069 + }, + { + "epoch": 0.85, + "learning_rate": 2.905518232301658e-08, + "loss": 0.4983, + "step": 44070 + }, + { + "epoch": 0.85, + "learning_rate": 2.9051298978680438e-08, + "loss": 0.0004, + "step": 44071 + }, + { + "epoch": 0.85, + "learning_rate": 2.9047415634344296e-08, + "loss": 0.0005, + "step": 44072 + }, + { + "epoch": 0.85, + "learning_rate": 2.9043532290008155e-08, + "loss": 0.0005, + "step": 44073 + }, + { + "epoch": 0.85, + "learning_rate": 2.9039648945672013e-08, + "loss": 0.0003, + "step": 44074 + }, + { + "epoch": 0.85, + "learning_rate": 2.903576560133587e-08, + "loss": 0.6087, + "step": 44075 + }, + { + "epoch": 0.85, + "learning_rate": 2.903188225699973e-08, + "loss": 0.0003, + "step": 44076 + }, + { + "epoch": 0.86, + "learning_rate": 2.9027998912663587e-08, + "loss": 0.0003, + "step": 44077 + }, + { + "epoch": 0.86, + "learning_rate": 2.902411556832744e-08, + "loss": 0.0004, + "step": 44078 + }, + { + "epoch": 0.86, + "learning_rate": 2.9020232223991297e-08, + "loss": 0.0003, + "step": 44079 + }, + { + "epoch": 0.86, + "learning_rate": 2.9016348879655156e-08, + "loss": 0.0005, + "step": 44080 + }, + { + "epoch": 0.86, + "learning_rate": 2.9012465535319014e-08, + "loss": 0.0004, + "step": 44081 + }, + { + "epoch": 0.86, + "learning_rate": 2.9008582190982872e-08, + "loss": 0.0006, + "step": 44082 + }, + { + "epoch": 0.86, + "learning_rate": 2.900469884664673e-08, + "loss": 0.0003, + "step": 44083 + }, + { + "epoch": 0.86, + "learning_rate": 2.900081550231059e-08, + "loss": 0.447, + "step": 44084 + }, + { + "epoch": 0.86, + "learning_rate": 2.8996932157974447e-08, + "loss": 0.0004, + "step": 44085 + }, + { + "epoch": 0.86, + "learning_rate": 2.8993048813638305e-08, + "loss": 0.1903, + "step": 44086 + }, + { + "epoch": 0.86, + "learning_rate": 2.8989165469302163e-08, + "loss": 0.8557, + "step": 44087 + }, + { + "epoch": 0.86, + "learning_rate": 2.898528212496602e-08, + "loss": 0.2032, + "step": 44088 + }, + { + "epoch": 0.86, + "learning_rate": 2.898139878062988e-08, + "loss": 0.0004, + "step": 44089 + }, + { + "epoch": 0.86, + "learning_rate": 2.8977515436293738e-08, + "loss": 0.0006, + "step": 44090 + }, + { + "epoch": 0.86, + "learning_rate": 2.8973632091957596e-08, + "loss": 0.0005, + "step": 44091 + }, + { + "epoch": 0.86, + "learning_rate": 2.8969748747621455e-08, + "loss": 0.0026, + "step": 44092 + }, + { + "epoch": 0.86, + "learning_rate": 2.8965865403285306e-08, + "loss": 0.0004, + "step": 44093 + }, + { + "epoch": 0.86, + "learning_rate": 2.8961982058949164e-08, + "loss": 0.0004, + "step": 44094 + }, + { + "epoch": 0.86, + "learning_rate": 2.8958098714613023e-08, + "loss": 0.0005, + "step": 44095 + }, + { + "epoch": 0.86, + "learning_rate": 2.895421537027688e-08, + "loss": 0.0005, + "step": 44096 + }, + { + "epoch": 0.86, + "learning_rate": 2.895033202594074e-08, + "loss": 0.0004, + "step": 44097 + }, + { + "epoch": 0.86, + "learning_rate": 2.8946448681604597e-08, + "loss": 0.0013, + "step": 44098 + }, + { + "epoch": 0.86, + "learning_rate": 2.8942565337268456e-08, + "loss": 0.0005, + "step": 44099 + }, + { + "epoch": 0.86, + "learning_rate": 2.8938681992932314e-08, + "loss": 0.0004, + "step": 44100 + }, + { + "epoch": 0.86, + "learning_rate": 2.893479864859617e-08, + "loss": 0.0003, + "step": 44101 + }, + { + "epoch": 0.86, + "learning_rate": 2.8930915304260027e-08, + "loss": 0.0003, + "step": 44102 + }, + { + "epoch": 0.86, + "learning_rate": 2.8927031959923885e-08, + "loss": 0.0007, + "step": 44103 + }, + { + "epoch": 0.86, + "learning_rate": 2.8923148615587744e-08, + "loss": 0.0003, + "step": 44104 + }, + { + "epoch": 0.86, + "learning_rate": 2.8919265271251602e-08, + "loss": 0.0003, + "step": 44105 + }, + { + "epoch": 0.86, + "learning_rate": 2.891538192691546e-08, + "loss": 0.0006, + "step": 44106 + }, + { + "epoch": 0.86, + "learning_rate": 2.8911498582579315e-08, + "loss": 0.0004, + "step": 44107 + }, + { + "epoch": 0.86, + "learning_rate": 2.890761523824317e-08, + "loss": 0.0004, + "step": 44108 + }, + { + "epoch": 0.86, + "learning_rate": 2.8903731893907028e-08, + "loss": 0.0005, + "step": 44109 + }, + { + "epoch": 0.86, + "learning_rate": 2.8899848549570886e-08, + "loss": 0.0005, + "step": 44110 + }, + { + "epoch": 0.86, + "learning_rate": 2.8895965205234745e-08, + "loss": 0.001, + "step": 44111 + }, + { + "epoch": 0.86, + "learning_rate": 2.8892081860898603e-08, + "loss": 0.0444, + "step": 44112 + }, + { + "epoch": 0.86, + "learning_rate": 2.888819851656246e-08, + "loss": 0.0005, + "step": 44113 + }, + { + "epoch": 0.86, + "learning_rate": 2.888431517222632e-08, + "loss": 0.0003, + "step": 44114 + }, + { + "epoch": 0.86, + "learning_rate": 2.8880431827890178e-08, + "loss": 0.0004, + "step": 44115 + }, + { + "epoch": 0.86, + "learning_rate": 2.8876548483554036e-08, + "loss": 0.0005, + "step": 44116 + }, + { + "epoch": 0.86, + "learning_rate": 2.8872665139217894e-08, + "loss": 0.0005, + "step": 44117 + }, + { + "epoch": 0.86, + "learning_rate": 2.8868781794881752e-08, + "loss": 0.0003, + "step": 44118 + }, + { + "epoch": 0.86, + "learning_rate": 2.886489845054561e-08, + "loss": 0.0003, + "step": 44119 + }, + { + "epoch": 0.86, + "learning_rate": 2.886101510620947e-08, + "loss": 1.0363, + "step": 44120 + }, + { + "epoch": 0.86, + "learning_rate": 2.8857131761873327e-08, + "loss": 0.0005, + "step": 44121 + }, + { + "epoch": 0.86, + "learning_rate": 2.885324841753718e-08, + "loss": 0.0005, + "step": 44122 + }, + { + "epoch": 0.86, + "learning_rate": 2.8849365073201037e-08, + "loss": 0.0003, + "step": 44123 + }, + { + "epoch": 0.86, + "learning_rate": 2.8845481728864895e-08, + "loss": 0.0003, + "step": 44124 + }, + { + "epoch": 0.86, + "learning_rate": 2.8841598384528753e-08, + "loss": 0.0005, + "step": 44125 + }, + { + "epoch": 0.86, + "learning_rate": 2.8837715040192612e-08, + "loss": 0.0003, + "step": 44126 + }, + { + "epoch": 0.86, + "learning_rate": 2.883383169585647e-08, + "loss": 0.0004, + "step": 44127 + }, + { + "epoch": 0.86, + "learning_rate": 2.8829948351520328e-08, + "loss": 0.0004, + "step": 44128 + }, + { + "epoch": 0.86, + "learning_rate": 2.8826065007184186e-08, + "loss": 0.0003, + "step": 44129 + }, + { + "epoch": 0.86, + "learning_rate": 2.8822181662848045e-08, + "loss": 0.0003, + "step": 44130 + }, + { + "epoch": 0.86, + "learning_rate": 2.8818298318511903e-08, + "loss": 0.0009, + "step": 44131 + }, + { + "epoch": 0.86, + "learning_rate": 2.881441497417576e-08, + "loss": 0.1705, + "step": 44132 + }, + { + "epoch": 0.86, + "learning_rate": 2.881053162983962e-08, + "loss": 0.0009, + "step": 44133 + }, + { + "epoch": 0.86, + "learning_rate": 2.8806648285503478e-08, + "loss": 0.0005, + "step": 44134 + }, + { + "epoch": 0.86, + "learning_rate": 2.8802764941167336e-08, + "loss": 1.0514, + "step": 44135 + }, + { + "epoch": 0.86, + "learning_rate": 2.8798881596831188e-08, + "loss": 0.0004, + "step": 44136 + }, + { + "epoch": 0.86, + "learning_rate": 2.8794998252495046e-08, + "loss": 0.3804, + "step": 44137 + }, + { + "epoch": 0.86, + "learning_rate": 2.8791114908158904e-08, + "loss": 0.0005, + "step": 44138 + }, + { + "epoch": 0.86, + "learning_rate": 2.8787231563822762e-08, + "loss": 0.0003, + "step": 44139 + }, + { + "epoch": 0.86, + "learning_rate": 2.878334821948662e-08, + "loss": 0.0005, + "step": 44140 + }, + { + "epoch": 0.86, + "learning_rate": 2.877946487515048e-08, + "loss": 0.0002, + "step": 44141 + }, + { + "epoch": 0.86, + "learning_rate": 2.8775581530814337e-08, + "loss": 0.0005, + "step": 44142 + }, + { + "epoch": 0.86, + "learning_rate": 2.8771698186478195e-08, + "loss": 0.0005, + "step": 44143 + }, + { + "epoch": 0.86, + "learning_rate": 2.8767814842142053e-08, + "loss": 0.0005, + "step": 44144 + }, + { + "epoch": 0.86, + "learning_rate": 2.876393149780591e-08, + "loss": 0.0004, + "step": 44145 + }, + { + "epoch": 0.86, + "learning_rate": 2.8760048153469767e-08, + "loss": 0.0003, + "step": 44146 + }, + { + "epoch": 0.86, + "learning_rate": 2.8756164809133625e-08, + "loss": 0.0004, + "step": 44147 + }, + { + "epoch": 0.86, + "learning_rate": 2.8752281464797483e-08, + "loss": 0.0004, + "step": 44148 + }, + { + "epoch": 0.86, + "learning_rate": 2.874839812046134e-08, + "loss": 0.0004, + "step": 44149 + }, + { + "epoch": 0.86, + "learning_rate": 2.87445147761252e-08, + "loss": 0.0004, + "step": 44150 + }, + { + "epoch": 0.86, + "learning_rate": 2.8740631431789055e-08, + "loss": 0.0004, + "step": 44151 + }, + { + "epoch": 0.86, + "learning_rate": 2.873674808745291e-08, + "loss": 0.0003, + "step": 44152 + }, + { + "epoch": 0.86, + "learning_rate": 2.8732864743116768e-08, + "loss": 0.0003, + "step": 44153 + }, + { + "epoch": 0.86, + "learning_rate": 2.8728981398780626e-08, + "loss": 0.0005, + "step": 44154 + }, + { + "epoch": 0.86, + "learning_rate": 2.8725098054444484e-08, + "loss": 0.0006, + "step": 44155 + }, + { + "epoch": 0.86, + "learning_rate": 2.8721214710108342e-08, + "loss": 0.0005, + "step": 44156 + }, + { + "epoch": 0.86, + "learning_rate": 2.87173313657722e-08, + "loss": 0.0006, + "step": 44157 + }, + { + "epoch": 0.86, + "learning_rate": 2.871344802143606e-08, + "loss": 0.0004, + "step": 44158 + }, + { + "epoch": 0.86, + "learning_rate": 2.8709564677099917e-08, + "loss": 0.1137, + "step": 44159 + }, + { + "epoch": 0.86, + "learning_rate": 2.8705681332763775e-08, + "loss": 0.0003, + "step": 44160 + }, + { + "epoch": 0.86, + "learning_rate": 2.8701797988427634e-08, + "loss": 0.0004, + "step": 44161 + }, + { + "epoch": 0.86, + "learning_rate": 2.8697914644091492e-08, + "loss": 0.0005, + "step": 44162 + }, + { + "epoch": 0.86, + "learning_rate": 2.869403129975535e-08, + "loss": 0.0003, + "step": 44163 + }, + { + "epoch": 0.86, + "learning_rate": 2.869014795541921e-08, + "loss": 0.0009, + "step": 44164 + }, + { + "epoch": 0.86, + "learning_rate": 2.868626461108306e-08, + "loss": 0.0003, + "step": 44165 + }, + { + "epoch": 0.86, + "learning_rate": 2.8682381266746918e-08, + "loss": 0.0122, + "step": 44166 + }, + { + "epoch": 0.86, + "learning_rate": 2.8678497922410777e-08, + "loss": 0.0005, + "step": 44167 + }, + { + "epoch": 0.86, + "learning_rate": 2.8674614578074635e-08, + "loss": 0.0006, + "step": 44168 + }, + { + "epoch": 0.86, + "learning_rate": 2.8670731233738493e-08, + "loss": 0.0007, + "step": 44169 + }, + { + "epoch": 0.86, + "learning_rate": 2.866684788940235e-08, + "loss": 0.0004, + "step": 44170 + }, + { + "epoch": 0.86, + "learning_rate": 2.866296454506621e-08, + "loss": 0.0011, + "step": 44171 + }, + { + "epoch": 0.86, + "learning_rate": 2.8659081200730068e-08, + "loss": 0.0007, + "step": 44172 + }, + { + "epoch": 0.86, + "learning_rate": 2.8655197856393926e-08, + "loss": 0.0148, + "step": 44173 + }, + { + "epoch": 0.86, + "learning_rate": 2.8651314512057784e-08, + "loss": 0.3886, + "step": 44174 + }, + { + "epoch": 0.86, + "learning_rate": 2.8647431167721643e-08, + "loss": 0.0016, + "step": 44175 + }, + { + "epoch": 0.86, + "learning_rate": 2.86435478233855e-08, + "loss": 0.0005, + "step": 44176 + }, + { + "epoch": 0.86, + "learning_rate": 2.863966447904936e-08, + "loss": 0.0004, + "step": 44177 + }, + { + "epoch": 0.86, + "learning_rate": 2.8635781134713217e-08, + "loss": 0.0003, + "step": 44178 + }, + { + "epoch": 0.86, + "learning_rate": 2.8631897790377075e-08, + "loss": 0.0003, + "step": 44179 + }, + { + "epoch": 0.86, + "learning_rate": 2.8628014446040927e-08, + "loss": 0.1999, + "step": 44180 + }, + { + "epoch": 0.86, + "learning_rate": 2.8624131101704785e-08, + "loss": 0.0005, + "step": 44181 + }, + { + "epoch": 0.86, + "learning_rate": 2.8620247757368644e-08, + "loss": 0.0006, + "step": 44182 + }, + { + "epoch": 0.86, + "learning_rate": 2.8616364413032502e-08, + "loss": 0.0005, + "step": 44183 + }, + { + "epoch": 0.86, + "learning_rate": 2.861248106869636e-08, + "loss": 0.0003, + "step": 44184 + }, + { + "epoch": 0.86, + "learning_rate": 2.8608597724360218e-08, + "loss": 0.8528, + "step": 44185 + }, + { + "epoch": 0.86, + "learning_rate": 2.8604714380024077e-08, + "loss": 0.0003, + "step": 44186 + }, + { + "epoch": 0.86, + "learning_rate": 2.8600831035687935e-08, + "loss": 0.1999, + "step": 44187 + }, + { + "epoch": 0.86, + "learning_rate": 2.8596947691351793e-08, + "loss": 0.0004, + "step": 44188 + }, + { + "epoch": 0.86, + "learning_rate": 2.8593064347015648e-08, + "loss": 0.0003, + "step": 44189 + }, + { + "epoch": 0.86, + "learning_rate": 2.8589181002679506e-08, + "loss": 0.0006, + "step": 44190 + }, + { + "epoch": 0.86, + "learning_rate": 2.8585297658343364e-08, + "loss": 0.0004, + "step": 44191 + }, + { + "epoch": 0.86, + "learning_rate": 2.8581414314007223e-08, + "loss": 0.0624, + "step": 44192 + }, + { + "epoch": 0.86, + "learning_rate": 2.857753096967108e-08, + "loss": 0.0259, + "step": 44193 + }, + { + "epoch": 0.86, + "learning_rate": 2.8573647625334936e-08, + "loss": 0.0004, + "step": 44194 + }, + { + "epoch": 0.86, + "learning_rate": 2.8569764280998794e-08, + "loss": 0.0003, + "step": 44195 + }, + { + "epoch": 0.86, + "learning_rate": 2.8565880936662652e-08, + "loss": 0.0003, + "step": 44196 + }, + { + "epoch": 0.86, + "learning_rate": 2.8561997592326507e-08, + "loss": 0.0003, + "step": 44197 + }, + { + "epoch": 0.86, + "learning_rate": 2.8558114247990366e-08, + "loss": 0.0004, + "step": 44198 + }, + { + "epoch": 0.86, + "learning_rate": 2.8554230903654224e-08, + "loss": 0.0005, + "step": 44199 + }, + { + "epoch": 0.86, + "learning_rate": 2.8550347559318082e-08, + "loss": 0.3872, + "step": 44200 + }, + { + "epoch": 0.86, + "learning_rate": 2.854646421498194e-08, + "loss": 0.0005, + "step": 44201 + }, + { + "epoch": 0.86, + "learning_rate": 2.85425808706458e-08, + "loss": 0.0004, + "step": 44202 + }, + { + "epoch": 0.86, + "learning_rate": 2.8538697526309657e-08, + "loss": 0.0005, + "step": 44203 + }, + { + "epoch": 0.86, + "learning_rate": 2.8534814181973515e-08, + "loss": 0.0004, + "step": 44204 + }, + { + "epoch": 0.86, + "learning_rate": 2.8530930837637373e-08, + "loss": 0.0004, + "step": 44205 + }, + { + "epoch": 0.86, + "learning_rate": 2.852704749330123e-08, + "loss": 0.0005, + "step": 44206 + }, + { + "epoch": 0.86, + "learning_rate": 2.852316414896509e-08, + "loss": 0.0007, + "step": 44207 + }, + { + "epoch": 0.86, + "learning_rate": 2.8519280804628948e-08, + "loss": 0.0004, + "step": 44208 + }, + { + "epoch": 0.86, + "learning_rate": 2.85153974602928e-08, + "loss": 0.0005, + "step": 44209 + }, + { + "epoch": 0.86, + "learning_rate": 2.8511514115956658e-08, + "loss": 0.0004, + "step": 44210 + }, + { + "epoch": 0.86, + "learning_rate": 2.8507630771620516e-08, + "loss": 0.0005, + "step": 44211 + }, + { + "epoch": 0.86, + "learning_rate": 2.8503747427284374e-08, + "loss": 0.0005, + "step": 44212 + }, + { + "epoch": 0.86, + "learning_rate": 2.8499864082948233e-08, + "loss": 0.0005, + "step": 44213 + }, + { + "epoch": 0.86, + "learning_rate": 2.849598073861209e-08, + "loss": 0.0004, + "step": 44214 + }, + { + "epoch": 0.86, + "learning_rate": 2.849209739427595e-08, + "loss": 0.0004, + "step": 44215 + }, + { + "epoch": 0.86, + "learning_rate": 2.8488214049939807e-08, + "loss": 0.0003, + "step": 44216 + }, + { + "epoch": 0.86, + "learning_rate": 2.8484330705603666e-08, + "loss": 0.0003, + "step": 44217 + }, + { + "epoch": 0.86, + "learning_rate": 2.8480447361267524e-08, + "loss": 0.0006, + "step": 44218 + }, + { + "epoch": 0.86, + "learning_rate": 2.8476564016931382e-08, + "loss": 0.0003, + "step": 44219 + }, + { + "epoch": 0.86, + "learning_rate": 2.847268067259524e-08, + "loss": 0.0003, + "step": 44220 + }, + { + "epoch": 0.86, + "learning_rate": 2.84687973282591e-08, + "loss": 0.0002, + "step": 44221 + }, + { + "epoch": 0.86, + "learning_rate": 2.8464913983922957e-08, + "loss": 0.0003, + "step": 44222 + }, + { + "epoch": 0.86, + "learning_rate": 2.846103063958681e-08, + "loss": 0.0004, + "step": 44223 + }, + { + "epoch": 0.86, + "learning_rate": 2.8457147295250667e-08, + "loss": 0.0004, + "step": 44224 + }, + { + "epoch": 0.86, + "learning_rate": 2.8453263950914525e-08, + "loss": 0.0003, + "step": 44225 + }, + { + "epoch": 0.86, + "learning_rate": 2.8449380606578383e-08, + "loss": 0.0004, + "step": 44226 + }, + { + "epoch": 0.86, + "learning_rate": 2.844549726224224e-08, + "loss": 0.0008, + "step": 44227 + }, + { + "epoch": 0.86, + "learning_rate": 2.84416139179061e-08, + "loss": 0.0004, + "step": 44228 + }, + { + "epoch": 0.86, + "learning_rate": 2.8437730573569958e-08, + "loss": 0.0003, + "step": 44229 + }, + { + "epoch": 0.86, + "learning_rate": 2.8433847229233816e-08, + "loss": 0.0004, + "step": 44230 + }, + { + "epoch": 0.86, + "learning_rate": 2.8429963884897674e-08, + "loss": 0.0005, + "step": 44231 + }, + { + "epoch": 0.86, + "learning_rate": 2.8426080540561533e-08, + "loss": 0.0003, + "step": 44232 + }, + { + "epoch": 0.86, + "learning_rate": 2.842219719622539e-08, + "loss": 0.0003, + "step": 44233 + }, + { + "epoch": 0.86, + "learning_rate": 2.8418313851889246e-08, + "loss": 0.0007, + "step": 44234 + }, + { + "epoch": 0.86, + "learning_rate": 2.8414430507553104e-08, + "loss": 0.0004, + "step": 44235 + }, + { + "epoch": 0.86, + "learning_rate": 2.8410547163216962e-08, + "loss": 0.0003, + "step": 44236 + }, + { + "epoch": 0.86, + "learning_rate": 2.840666381888082e-08, + "loss": 0.6383, + "step": 44237 + }, + { + "epoch": 0.86, + "learning_rate": 2.8402780474544675e-08, + "loss": 0.0004, + "step": 44238 + }, + { + "epoch": 0.86, + "learning_rate": 2.8398897130208534e-08, + "loss": 0.0005, + "step": 44239 + }, + { + "epoch": 0.86, + "learning_rate": 2.8395013785872392e-08, + "loss": 0.0076, + "step": 44240 + }, + { + "epoch": 0.86, + "learning_rate": 2.8391130441536247e-08, + "loss": 0.0008, + "step": 44241 + }, + { + "epoch": 0.86, + "learning_rate": 2.8387247097200105e-08, + "loss": 0.0007, + "step": 44242 + }, + { + "epoch": 0.86, + "learning_rate": 2.8383363752863963e-08, + "loss": 0.0491, + "step": 44243 + }, + { + "epoch": 0.86, + "learning_rate": 2.8379480408527822e-08, + "loss": 0.0003, + "step": 44244 + }, + { + "epoch": 0.86, + "learning_rate": 2.837559706419168e-08, + "loss": 0.0005, + "step": 44245 + }, + { + "epoch": 0.86, + "learning_rate": 2.8371713719855538e-08, + "loss": 0.3472, + "step": 44246 + }, + { + "epoch": 0.86, + "learning_rate": 2.8367830375519396e-08, + "loss": 0.0004, + "step": 44247 + }, + { + "epoch": 0.86, + "learning_rate": 2.8363947031183255e-08, + "loss": 0.0003, + "step": 44248 + }, + { + "epoch": 0.86, + "learning_rate": 2.8360063686847113e-08, + "loss": 0.0004, + "step": 44249 + }, + { + "epoch": 0.86, + "learning_rate": 2.835618034251097e-08, + "loss": 0.0004, + "step": 44250 + }, + { + "epoch": 0.86, + "learning_rate": 2.835229699817483e-08, + "loss": 0.0004, + "step": 44251 + }, + { + "epoch": 0.86, + "learning_rate": 2.834841365383868e-08, + "loss": 0.0006, + "step": 44252 + }, + { + "epoch": 0.86, + "learning_rate": 2.834453030950254e-08, + "loss": 0.7303, + "step": 44253 + }, + { + "epoch": 0.86, + "learning_rate": 2.8340646965166397e-08, + "loss": 0.0003, + "step": 44254 + }, + { + "epoch": 0.86, + "learning_rate": 2.8336763620830256e-08, + "loss": 0.0005, + "step": 44255 + }, + { + "epoch": 0.86, + "learning_rate": 2.8332880276494114e-08, + "loss": 0.0004, + "step": 44256 + }, + { + "epoch": 0.86, + "learning_rate": 2.8328996932157972e-08, + "loss": 1.1063, + "step": 44257 + }, + { + "epoch": 0.86, + "learning_rate": 2.832511358782183e-08, + "loss": 0.0003, + "step": 44258 + }, + { + "epoch": 0.86, + "learning_rate": 2.832123024348569e-08, + "loss": 0.0004, + "step": 44259 + }, + { + "epoch": 0.86, + "learning_rate": 2.8317346899149547e-08, + "loss": 0.0003, + "step": 44260 + }, + { + "epoch": 0.86, + "learning_rate": 2.8313463554813405e-08, + "loss": 0.0003, + "step": 44261 + }, + { + "epoch": 0.86, + "learning_rate": 2.8309580210477263e-08, + "loss": 0.0003, + "step": 44262 + }, + { + "epoch": 0.86, + "learning_rate": 2.8305696866141122e-08, + "loss": 0.0005, + "step": 44263 + }, + { + "epoch": 0.86, + "learning_rate": 2.830181352180498e-08, + "loss": 0.0009, + "step": 44264 + }, + { + "epoch": 0.86, + "learning_rate": 2.8297930177468838e-08, + "loss": 0.0004, + "step": 44265 + }, + { + "epoch": 0.86, + "learning_rate": 2.8294046833132696e-08, + "loss": 0.7454, + "step": 44266 + }, + { + "epoch": 0.86, + "learning_rate": 2.8290163488796548e-08, + "loss": 0.0014, + "step": 44267 + }, + { + "epoch": 0.86, + "learning_rate": 2.8286280144460406e-08, + "loss": 0.0003, + "step": 44268 + }, + { + "epoch": 0.86, + "learning_rate": 2.8282396800124265e-08, + "loss": 0.0006, + "step": 44269 + }, + { + "epoch": 0.86, + "learning_rate": 2.8278513455788123e-08, + "loss": 0.0005, + "step": 44270 + }, + { + "epoch": 0.86, + "learning_rate": 2.827463011145198e-08, + "loss": 0.0004, + "step": 44271 + }, + { + "epoch": 0.86, + "learning_rate": 2.827074676711584e-08, + "loss": 0.0003, + "step": 44272 + }, + { + "epoch": 0.86, + "learning_rate": 2.8266863422779698e-08, + "loss": 0.0003, + "step": 44273 + }, + { + "epoch": 0.86, + "learning_rate": 2.8262980078443556e-08, + "loss": 0.0004, + "step": 44274 + }, + { + "epoch": 0.86, + "learning_rate": 2.8259096734107414e-08, + "loss": 0.0004, + "step": 44275 + }, + { + "epoch": 0.86, + "learning_rate": 2.8255213389771272e-08, + "loss": 0.0015, + "step": 44276 + }, + { + "epoch": 0.86, + "learning_rate": 2.825133004543513e-08, + "loss": 0.0003, + "step": 44277 + }, + { + "epoch": 0.86, + "learning_rate": 2.8247446701098985e-08, + "loss": 0.0143, + "step": 44278 + }, + { + "epoch": 0.86, + "learning_rate": 2.8243563356762844e-08, + "loss": 0.0004, + "step": 44279 + }, + { + "epoch": 0.86, + "learning_rate": 2.8239680012426702e-08, + "loss": 0.0003, + "step": 44280 + }, + { + "epoch": 0.86, + "learning_rate": 2.8235796668090557e-08, + "loss": 0.0004, + "step": 44281 + }, + { + "epoch": 0.86, + "learning_rate": 2.8231913323754415e-08, + "loss": 0.0004, + "step": 44282 + }, + { + "epoch": 0.86, + "learning_rate": 2.8228029979418273e-08, + "loss": 0.0005, + "step": 44283 + }, + { + "epoch": 0.86, + "learning_rate": 2.822414663508213e-08, + "loss": 0.0004, + "step": 44284 + }, + { + "epoch": 0.86, + "learning_rate": 2.8220263290745987e-08, + "loss": 0.0004, + "step": 44285 + }, + { + "epoch": 0.86, + "learning_rate": 2.8216379946409845e-08, + "loss": 0.0003, + "step": 44286 + }, + { + "epoch": 0.86, + "learning_rate": 2.8212496602073703e-08, + "loss": 0.0007, + "step": 44287 + }, + { + "epoch": 0.86, + "learning_rate": 2.820861325773756e-08, + "loss": 0.0003, + "step": 44288 + }, + { + "epoch": 0.86, + "learning_rate": 2.820472991340142e-08, + "loss": 0.2224, + "step": 44289 + }, + { + "epoch": 0.86, + "learning_rate": 2.8200846569065278e-08, + "loss": 0.0006, + "step": 44290 + }, + { + "epoch": 0.86, + "learning_rate": 2.8196963224729136e-08, + "loss": 0.0007, + "step": 44291 + }, + { + "epoch": 0.86, + "learning_rate": 2.8193079880392994e-08, + "loss": 0.0003, + "step": 44292 + }, + { + "epoch": 0.86, + "learning_rate": 2.8189196536056852e-08, + "loss": 0.0003, + "step": 44293 + }, + { + "epoch": 0.86, + "learning_rate": 2.818531319172071e-08, + "loss": 0.0076, + "step": 44294 + }, + { + "epoch": 0.86, + "learning_rate": 2.818142984738457e-08, + "loss": 0.0005, + "step": 44295 + }, + { + "epoch": 0.86, + "learning_rate": 2.817754650304842e-08, + "loss": 0.0004, + "step": 44296 + }, + { + "epoch": 0.86, + "learning_rate": 2.817366315871228e-08, + "loss": 0.0003, + "step": 44297 + }, + { + "epoch": 0.86, + "learning_rate": 2.8169779814376137e-08, + "loss": 0.0004, + "step": 44298 + }, + { + "epoch": 0.86, + "learning_rate": 2.8165896470039995e-08, + "loss": 0.0003, + "step": 44299 + }, + { + "epoch": 0.86, + "learning_rate": 2.8162013125703854e-08, + "loss": 0.0012, + "step": 44300 + }, + { + "epoch": 0.86, + "learning_rate": 2.8158129781367712e-08, + "loss": 0.0004, + "step": 44301 + }, + { + "epoch": 0.86, + "learning_rate": 2.815424643703157e-08, + "loss": 0.0004, + "step": 44302 + }, + { + "epoch": 0.86, + "learning_rate": 2.8150363092695428e-08, + "loss": 0.0003, + "step": 44303 + }, + { + "epoch": 0.86, + "learning_rate": 2.8146479748359287e-08, + "loss": 0.001, + "step": 44304 + }, + { + "epoch": 0.86, + "learning_rate": 2.8142596404023145e-08, + "loss": 0.0003, + "step": 44305 + }, + { + "epoch": 0.86, + "learning_rate": 2.8138713059687003e-08, + "loss": 0.0004, + "step": 44306 + }, + { + "epoch": 0.86, + "learning_rate": 2.813482971535086e-08, + "loss": 0.0004, + "step": 44307 + }, + { + "epoch": 0.86, + "learning_rate": 2.813094637101472e-08, + "loss": 0.0003, + "step": 44308 + }, + { + "epoch": 0.86, + "learning_rate": 2.8127063026678578e-08, + "loss": 0.0003, + "step": 44309 + }, + { + "epoch": 0.86, + "learning_rate": 2.812317968234243e-08, + "loss": 0.0003, + "step": 44310 + }, + { + "epoch": 0.86, + "learning_rate": 2.8119296338006288e-08, + "loss": 0.0004, + "step": 44311 + }, + { + "epoch": 0.86, + "learning_rate": 2.8115412993670146e-08, + "loss": 0.0004, + "step": 44312 + }, + { + "epoch": 0.86, + "learning_rate": 2.8111529649334004e-08, + "loss": 0.0005, + "step": 44313 + }, + { + "epoch": 0.86, + "learning_rate": 2.8107646304997862e-08, + "loss": 0.0005, + "step": 44314 + }, + { + "epoch": 0.86, + "learning_rate": 2.810376296066172e-08, + "loss": 0.0004, + "step": 44315 + }, + { + "epoch": 0.86, + "learning_rate": 2.809987961632558e-08, + "loss": 0.0003, + "step": 44316 + }, + { + "epoch": 0.86, + "learning_rate": 2.8095996271989437e-08, + "loss": 0.0003, + "step": 44317 + }, + { + "epoch": 0.86, + "learning_rate": 2.8092112927653295e-08, + "loss": 0.0004, + "step": 44318 + }, + { + "epoch": 0.86, + "learning_rate": 2.8088229583317154e-08, + "loss": 0.0004, + "step": 44319 + }, + { + "epoch": 0.86, + "learning_rate": 2.8084346238981012e-08, + "loss": 0.0003, + "step": 44320 + }, + { + "epoch": 0.86, + "learning_rate": 2.808046289464487e-08, + "loss": 0.0004, + "step": 44321 + }, + { + "epoch": 0.86, + "learning_rate": 2.8076579550308725e-08, + "loss": 0.0004, + "step": 44322 + }, + { + "epoch": 0.86, + "learning_rate": 2.8072696205972583e-08, + "loss": 0.0004, + "step": 44323 + }, + { + "epoch": 0.86, + "learning_rate": 2.806881286163644e-08, + "loss": 0.0003, + "step": 44324 + }, + { + "epoch": 0.86, + "learning_rate": 2.8064929517300296e-08, + "loss": 0.0003, + "step": 44325 + }, + { + "epoch": 0.86, + "learning_rate": 2.8061046172964155e-08, + "loss": 0.0005, + "step": 44326 + }, + { + "epoch": 0.86, + "learning_rate": 2.8057162828628013e-08, + "loss": 0.0006, + "step": 44327 + }, + { + "epoch": 0.86, + "learning_rate": 2.805327948429187e-08, + "loss": 0.0003, + "step": 44328 + }, + { + "epoch": 0.86, + "learning_rate": 2.8049396139955726e-08, + "loss": 0.0004, + "step": 44329 + }, + { + "epoch": 0.86, + "learning_rate": 2.8045512795619584e-08, + "loss": 0.0003, + "step": 44330 + }, + { + "epoch": 0.86, + "learning_rate": 2.8041629451283443e-08, + "loss": 0.0005, + "step": 44331 + }, + { + "epoch": 0.86, + "learning_rate": 2.80377461069473e-08, + "loss": 0.0004, + "step": 44332 + }, + { + "epoch": 0.86, + "learning_rate": 2.803386276261116e-08, + "loss": 0.0004, + "step": 44333 + }, + { + "epoch": 0.86, + "learning_rate": 2.8029979418275017e-08, + "loss": 0.0005, + "step": 44334 + }, + { + "epoch": 0.86, + "learning_rate": 2.8026096073938876e-08, + "loss": 0.0003, + "step": 44335 + }, + { + "epoch": 0.86, + "learning_rate": 2.8022212729602734e-08, + "loss": 0.0009, + "step": 44336 + }, + { + "epoch": 0.86, + "learning_rate": 2.8018329385266592e-08, + "loss": 0.0079, + "step": 44337 + }, + { + "epoch": 0.86, + "learning_rate": 2.801444604093045e-08, + "loss": 0.028, + "step": 44338 + }, + { + "epoch": 0.86, + "learning_rate": 2.8010562696594302e-08, + "loss": 0.0014, + "step": 44339 + }, + { + "epoch": 0.86, + "learning_rate": 2.800667935225816e-08, + "loss": 0.0004, + "step": 44340 + }, + { + "epoch": 0.86, + "learning_rate": 2.800279600792202e-08, + "loss": 0.0005, + "step": 44341 + }, + { + "epoch": 0.86, + "learning_rate": 2.7998912663585877e-08, + "loss": 1.0642, + "step": 44342 + }, + { + "epoch": 0.86, + "learning_rate": 2.7995029319249735e-08, + "loss": 0.0011, + "step": 44343 + }, + { + "epoch": 0.86, + "learning_rate": 2.7991145974913593e-08, + "loss": 0.0005, + "step": 44344 + }, + { + "epoch": 0.86, + "learning_rate": 2.798726263057745e-08, + "loss": 0.0002, + "step": 44345 + }, + { + "epoch": 0.86, + "learning_rate": 2.798337928624131e-08, + "loss": 0.0003, + "step": 44346 + }, + { + "epoch": 0.86, + "learning_rate": 2.7979495941905168e-08, + "loss": 0.0006, + "step": 44347 + }, + { + "epoch": 0.86, + "learning_rate": 2.7975612597569026e-08, + "loss": 0.0004, + "step": 44348 + }, + { + "epoch": 0.86, + "learning_rate": 2.7971729253232884e-08, + "loss": 0.0002, + "step": 44349 + }, + { + "epoch": 0.86, + "learning_rate": 2.7967845908896743e-08, + "loss": 0.0004, + "step": 44350 + }, + { + "epoch": 0.86, + "learning_rate": 2.79639625645606e-08, + "loss": 0.0006, + "step": 44351 + }, + { + "epoch": 0.86, + "learning_rate": 2.796007922022446e-08, + "loss": 0.4183, + "step": 44352 + }, + { + "epoch": 0.86, + "learning_rate": 2.7956195875888317e-08, + "loss": 0.0394, + "step": 44353 + }, + { + "epoch": 0.86, + "learning_rate": 2.795231253155217e-08, + "loss": 0.0006, + "step": 44354 + }, + { + "epoch": 0.86, + "learning_rate": 2.7948429187216027e-08, + "loss": 0.0003, + "step": 44355 + }, + { + "epoch": 0.86, + "learning_rate": 2.7944545842879885e-08, + "loss": 0.0004, + "step": 44356 + }, + { + "epoch": 0.86, + "learning_rate": 2.7940662498543744e-08, + "loss": 0.0005, + "step": 44357 + }, + { + "epoch": 0.86, + "learning_rate": 2.7936779154207602e-08, + "loss": 0.0006, + "step": 44358 + }, + { + "epoch": 0.86, + "learning_rate": 2.793289580987146e-08, + "loss": 0.0003, + "step": 44359 + }, + { + "epoch": 0.86, + "learning_rate": 2.792901246553532e-08, + "loss": 0.0005, + "step": 44360 + }, + { + "epoch": 0.86, + "learning_rate": 2.7925129121199177e-08, + "loss": 0.0004, + "step": 44361 + }, + { + "epoch": 0.86, + "learning_rate": 2.7921245776863035e-08, + "loss": 0.2376, + "step": 44362 + }, + { + "epoch": 0.86, + "learning_rate": 2.7917362432526893e-08, + "loss": 0.0004, + "step": 44363 + }, + { + "epoch": 0.86, + "learning_rate": 2.791347908819075e-08, + "loss": 0.0005, + "step": 44364 + }, + { + "epoch": 0.86, + "learning_rate": 2.790959574385461e-08, + "loss": 0.0006, + "step": 44365 + }, + { + "epoch": 0.86, + "learning_rate": 2.7905712399518465e-08, + "loss": 0.0004, + "step": 44366 + }, + { + "epoch": 0.86, + "learning_rate": 2.7901829055182323e-08, + "loss": 0.0003, + "step": 44367 + }, + { + "epoch": 0.86, + "learning_rate": 2.7897945710846178e-08, + "loss": 0.0005, + "step": 44368 + }, + { + "epoch": 0.86, + "learning_rate": 2.7894062366510036e-08, + "loss": 0.0011, + "step": 44369 + }, + { + "epoch": 0.86, + "learning_rate": 2.7890179022173894e-08, + "loss": 0.0002, + "step": 44370 + }, + { + "epoch": 0.86, + "learning_rate": 2.7886295677837753e-08, + "loss": 0.0005, + "step": 44371 + }, + { + "epoch": 0.86, + "learning_rate": 2.788241233350161e-08, + "loss": 0.0004, + "step": 44372 + }, + { + "epoch": 0.86, + "learning_rate": 2.787852898916547e-08, + "loss": 0.0002, + "step": 44373 + }, + { + "epoch": 0.86, + "learning_rate": 2.7874645644829324e-08, + "loss": 0.0004, + "step": 44374 + }, + { + "epoch": 0.86, + "learning_rate": 2.7870762300493182e-08, + "loss": 0.0004, + "step": 44375 + }, + { + "epoch": 0.86, + "learning_rate": 2.786687895615704e-08, + "loss": 0.0003, + "step": 44376 + }, + { + "epoch": 0.86, + "learning_rate": 2.78629956118209e-08, + "loss": 0.0004, + "step": 44377 + }, + { + "epoch": 0.86, + "learning_rate": 2.7859112267484757e-08, + "loss": 0.0004, + "step": 44378 + }, + { + "epoch": 0.86, + "learning_rate": 2.7855228923148615e-08, + "loss": 1.2066, + "step": 44379 + }, + { + "epoch": 0.86, + "learning_rate": 2.7851345578812473e-08, + "loss": 0.0138, + "step": 44380 + }, + { + "epoch": 0.86, + "learning_rate": 2.784746223447633e-08, + "loss": 0.0005, + "step": 44381 + }, + { + "epoch": 0.86, + "learning_rate": 2.784357889014019e-08, + "loss": 0.0004, + "step": 44382 + }, + { + "epoch": 0.86, + "learning_rate": 2.783969554580404e-08, + "loss": 0.0008, + "step": 44383 + }, + { + "epoch": 0.86, + "learning_rate": 2.78358122014679e-08, + "loss": 0.0005, + "step": 44384 + }, + { + "epoch": 0.86, + "learning_rate": 2.7831928857131758e-08, + "loss": 0.0007, + "step": 44385 + }, + { + "epoch": 0.86, + "learning_rate": 2.7828045512795616e-08, + "loss": 0.0003, + "step": 44386 + }, + { + "epoch": 0.86, + "learning_rate": 2.7824162168459474e-08, + "loss": 0.0004, + "step": 44387 + }, + { + "epoch": 0.86, + "learning_rate": 2.7820278824123333e-08, + "loss": 0.0003, + "step": 44388 + }, + { + "epoch": 0.86, + "learning_rate": 2.781639547978719e-08, + "loss": 0.0004, + "step": 44389 + }, + { + "epoch": 0.86, + "learning_rate": 2.781251213545105e-08, + "loss": 0.0005, + "step": 44390 + }, + { + "epoch": 0.86, + "learning_rate": 2.7808628791114907e-08, + "loss": 0.0004, + "step": 44391 + }, + { + "epoch": 0.86, + "learning_rate": 2.7804745446778766e-08, + "loss": 1.3032, + "step": 44392 + }, + { + "epoch": 0.86, + "learning_rate": 2.7800862102442624e-08, + "loss": 0.0003, + "step": 44393 + }, + { + "epoch": 0.86, + "learning_rate": 2.7796978758106482e-08, + "loss": 0.0004, + "step": 44394 + }, + { + "epoch": 0.86, + "learning_rate": 2.779309541377034e-08, + "loss": 0.0004, + "step": 44395 + }, + { + "epoch": 0.86, + "learning_rate": 2.77892120694342e-08, + "loss": 0.001, + "step": 44396 + }, + { + "epoch": 0.86, + "learning_rate": 2.778532872509805e-08, + "loss": 0.0004, + "step": 44397 + }, + { + "epoch": 0.86, + "learning_rate": 2.778144538076191e-08, + "loss": 0.0004, + "step": 44398 + }, + { + "epoch": 0.86, + "learning_rate": 2.7777562036425767e-08, + "loss": 0.0004, + "step": 44399 + }, + { + "epoch": 0.86, + "learning_rate": 2.7773678692089625e-08, + "loss": 0.0003, + "step": 44400 + }, + { + "epoch": 0.86, + "learning_rate": 2.7769795347753483e-08, + "loss": 0.0003, + "step": 44401 + }, + { + "epoch": 0.86, + "learning_rate": 2.776591200341734e-08, + "loss": 0.0005, + "step": 44402 + }, + { + "epoch": 0.86, + "learning_rate": 2.77620286590812e-08, + "loss": 0.0004, + "step": 44403 + }, + { + "epoch": 0.86, + "learning_rate": 2.7758145314745058e-08, + "loss": 0.0004, + "step": 44404 + }, + { + "epoch": 0.86, + "learning_rate": 2.7754261970408916e-08, + "loss": 0.0004, + "step": 44405 + }, + { + "epoch": 0.86, + "learning_rate": 2.7750378626072775e-08, + "loss": 0.0004, + "step": 44406 + }, + { + "epoch": 0.86, + "learning_rate": 2.7746495281736633e-08, + "loss": 0.0005, + "step": 44407 + }, + { + "epoch": 0.86, + "learning_rate": 2.774261193740049e-08, + "loss": 0.0004, + "step": 44408 + }, + { + "epoch": 0.86, + "learning_rate": 2.773872859306435e-08, + "loss": 0.0006, + "step": 44409 + }, + { + "epoch": 0.86, + "learning_rate": 2.7734845248728207e-08, + "loss": 0.0004, + "step": 44410 + }, + { + "epoch": 0.86, + "learning_rate": 2.7730961904392062e-08, + "loss": 0.0004, + "step": 44411 + }, + { + "epoch": 0.86, + "learning_rate": 2.7727078560055917e-08, + "loss": 0.0004, + "step": 44412 + }, + { + "epoch": 0.86, + "learning_rate": 2.7723195215719776e-08, + "loss": 0.0004, + "step": 44413 + }, + { + "epoch": 0.86, + "learning_rate": 2.7719311871383634e-08, + "loss": 0.0004, + "step": 44414 + }, + { + "epoch": 0.86, + "learning_rate": 2.7715428527047492e-08, + "loss": 0.0021, + "step": 44415 + }, + { + "epoch": 0.86, + "learning_rate": 2.771154518271135e-08, + "loss": 0.0005, + "step": 44416 + }, + { + "epoch": 0.86, + "learning_rate": 2.770766183837521e-08, + "loss": 0.0005, + "step": 44417 + }, + { + "epoch": 0.86, + "learning_rate": 2.7703778494039064e-08, + "loss": 0.0005, + "step": 44418 + }, + { + "epoch": 0.86, + "learning_rate": 2.7699895149702922e-08, + "loss": 0.1896, + "step": 44419 + }, + { + "epoch": 0.86, + "learning_rate": 2.769601180536678e-08, + "loss": 0.0003, + "step": 44420 + }, + { + "epoch": 0.86, + "learning_rate": 2.7692128461030638e-08, + "loss": 0.0005, + "step": 44421 + }, + { + "epoch": 0.86, + "learning_rate": 2.7688245116694497e-08, + "loss": 0.0003, + "step": 44422 + }, + { + "epoch": 0.86, + "learning_rate": 2.7684361772358355e-08, + "loss": 0.0003, + "step": 44423 + }, + { + "epoch": 0.86, + "learning_rate": 2.7680478428022213e-08, + "loss": 1.12, + "step": 44424 + }, + { + "epoch": 0.86, + "learning_rate": 2.767659508368607e-08, + "loss": 0.0003, + "step": 44425 + }, + { + "epoch": 0.86, + "learning_rate": 2.7672711739349923e-08, + "loss": 0.0005, + "step": 44426 + }, + { + "epoch": 0.86, + "learning_rate": 2.766882839501378e-08, + "loss": 0.0084, + "step": 44427 + }, + { + "epoch": 0.86, + "learning_rate": 2.766494505067764e-08, + "loss": 0.0018, + "step": 44428 + }, + { + "epoch": 0.86, + "learning_rate": 2.7661061706341498e-08, + "loss": 0.0003, + "step": 44429 + }, + { + "epoch": 0.86, + "learning_rate": 2.7657178362005356e-08, + "loss": 0.0006, + "step": 44430 + }, + { + "epoch": 0.86, + "learning_rate": 2.7653295017669214e-08, + "loss": 0.001, + "step": 44431 + }, + { + "epoch": 0.86, + "learning_rate": 2.7649411673333072e-08, + "loss": 0.0004, + "step": 44432 + }, + { + "epoch": 0.86, + "learning_rate": 2.764552832899693e-08, + "loss": 0.001, + "step": 44433 + }, + { + "epoch": 0.86, + "learning_rate": 2.764164498466079e-08, + "loss": 0.0004, + "step": 44434 + }, + { + "epoch": 0.86, + "learning_rate": 2.7637761640324647e-08, + "loss": 0.0004, + "step": 44435 + }, + { + "epoch": 0.86, + "learning_rate": 2.7633878295988505e-08, + "loss": 0.1251, + "step": 44436 + }, + { + "epoch": 0.86, + "learning_rate": 2.7629994951652364e-08, + "loss": 0.0003, + "step": 44437 + }, + { + "epoch": 0.86, + "learning_rate": 2.7626111607316222e-08, + "loss": 0.043, + "step": 44438 + }, + { + "epoch": 0.86, + "learning_rate": 2.762222826298008e-08, + "loss": 0.201, + "step": 44439 + }, + { + "epoch": 0.86, + "learning_rate": 2.7618344918643938e-08, + "loss": 0.0004, + "step": 44440 + }, + { + "epoch": 0.86, + "learning_rate": 2.761446157430779e-08, + "loss": 0.0005, + "step": 44441 + }, + { + "epoch": 0.86, + "learning_rate": 2.7610578229971648e-08, + "loss": 0.9983, + "step": 44442 + }, + { + "epoch": 0.86, + "learning_rate": 2.7606694885635506e-08, + "loss": 0.0009, + "step": 44443 + }, + { + "epoch": 0.86, + "learning_rate": 2.7602811541299365e-08, + "loss": 0.8704, + "step": 44444 + }, + { + "epoch": 0.86, + "learning_rate": 2.7598928196963223e-08, + "loss": 0.0005, + "step": 44445 + }, + { + "epoch": 0.86, + "learning_rate": 2.759504485262708e-08, + "loss": 0.0003, + "step": 44446 + }, + { + "epoch": 0.86, + "learning_rate": 2.759116150829094e-08, + "loss": 0.8526, + "step": 44447 + }, + { + "epoch": 0.86, + "learning_rate": 2.7587278163954798e-08, + "loss": 0.0003, + "step": 44448 + }, + { + "epoch": 0.86, + "learning_rate": 2.7583394819618656e-08, + "loss": 0.0004, + "step": 44449 + }, + { + "epoch": 0.86, + "learning_rate": 2.7579511475282514e-08, + "loss": 0.0004, + "step": 44450 + }, + { + "epoch": 0.86, + "learning_rate": 2.7575628130946372e-08, + "loss": 0.0005, + "step": 44451 + }, + { + "epoch": 0.86, + "learning_rate": 2.757174478661023e-08, + "loss": 0.0004, + "step": 44452 + }, + { + "epoch": 0.86, + "learning_rate": 2.756786144227409e-08, + "loss": 0.0004, + "step": 44453 + }, + { + "epoch": 0.86, + "learning_rate": 2.7563978097937947e-08, + "loss": 0.662, + "step": 44454 + }, + { + "epoch": 0.86, + "learning_rate": 2.75600947536018e-08, + "loss": 0.0018, + "step": 44455 + }, + { + "epoch": 0.86, + "learning_rate": 2.7556211409265657e-08, + "loss": 0.0004, + "step": 44456 + }, + { + "epoch": 0.86, + "learning_rate": 2.7552328064929515e-08, + "loss": 0.0005, + "step": 44457 + }, + { + "epoch": 0.86, + "learning_rate": 2.7548444720593373e-08, + "loss": 0.008, + "step": 44458 + }, + { + "epoch": 0.86, + "learning_rate": 2.7544561376257232e-08, + "loss": 0.0005, + "step": 44459 + }, + { + "epoch": 0.86, + "learning_rate": 2.754067803192109e-08, + "loss": 0.0013, + "step": 44460 + }, + { + "epoch": 0.86, + "learning_rate": 2.7536794687584948e-08, + "loss": 0.0004, + "step": 44461 + }, + { + "epoch": 0.86, + "learning_rate": 2.7532911343248803e-08, + "loss": 0.0029, + "step": 44462 + }, + { + "epoch": 0.86, + "learning_rate": 2.752902799891266e-08, + "loss": 0.0003, + "step": 44463 + }, + { + "epoch": 0.86, + "learning_rate": 2.752514465457652e-08, + "loss": 0.0002, + "step": 44464 + }, + { + "epoch": 0.86, + "learning_rate": 2.7521261310240378e-08, + "loss": 0.0003, + "step": 44465 + }, + { + "epoch": 0.86, + "learning_rate": 2.7517377965904236e-08, + "loss": 0.0006, + "step": 44466 + }, + { + "epoch": 0.86, + "learning_rate": 2.7513494621568094e-08, + "loss": 0.0006, + "step": 44467 + }, + { + "epoch": 0.86, + "learning_rate": 2.7509611277231953e-08, + "loss": 0.0003, + "step": 44468 + }, + { + "epoch": 0.86, + "learning_rate": 2.750572793289581e-08, + "loss": 0.0004, + "step": 44469 + }, + { + "epoch": 0.86, + "learning_rate": 2.7501844588559662e-08, + "loss": 0.0003, + "step": 44470 + }, + { + "epoch": 0.86, + "learning_rate": 2.749796124422352e-08, + "loss": 0.0004, + "step": 44471 + }, + { + "epoch": 0.86, + "learning_rate": 2.749407789988738e-08, + "loss": 0.0971, + "step": 44472 + }, + { + "epoch": 0.86, + "learning_rate": 2.7490194555551237e-08, + "loss": 0.0002, + "step": 44473 + }, + { + "epoch": 0.86, + "learning_rate": 2.7486311211215095e-08, + "loss": 0.0003, + "step": 44474 + }, + { + "epoch": 0.86, + "learning_rate": 2.7482427866878954e-08, + "loss": 0.0005, + "step": 44475 + }, + { + "epoch": 0.86, + "learning_rate": 2.7478544522542812e-08, + "loss": 0.0003, + "step": 44476 + }, + { + "epoch": 0.86, + "learning_rate": 2.747466117820667e-08, + "loss": 0.0006, + "step": 44477 + }, + { + "epoch": 0.86, + "learning_rate": 2.747077783387053e-08, + "loss": 0.0003, + "step": 44478 + }, + { + "epoch": 0.86, + "learning_rate": 2.7466894489534387e-08, + "loss": 0.0005, + "step": 44479 + }, + { + "epoch": 0.86, + "learning_rate": 2.7463011145198245e-08, + "loss": 0.0005, + "step": 44480 + }, + { + "epoch": 0.86, + "learning_rate": 2.7459127800862103e-08, + "loss": 0.0003, + "step": 44481 + }, + { + "epoch": 0.86, + "learning_rate": 2.745524445652596e-08, + "loss": 0.0899, + "step": 44482 + }, + { + "epoch": 0.86, + "learning_rate": 2.745136111218982e-08, + "loss": 0.0006, + "step": 44483 + }, + { + "epoch": 0.86, + "learning_rate": 2.744747776785367e-08, + "loss": 0.0068, + "step": 44484 + }, + { + "epoch": 0.86, + "learning_rate": 2.744359442351753e-08, + "loss": 0.0003, + "step": 44485 + }, + { + "epoch": 0.86, + "learning_rate": 2.7439711079181388e-08, + "loss": 0.0002, + "step": 44486 + }, + { + "epoch": 0.86, + "learning_rate": 2.7435827734845246e-08, + "loss": 0.0008, + "step": 44487 + }, + { + "epoch": 0.86, + "learning_rate": 2.7431944390509104e-08, + "loss": 0.0004, + "step": 44488 + }, + { + "epoch": 0.86, + "learning_rate": 2.7428061046172962e-08, + "loss": 0.0004, + "step": 44489 + }, + { + "epoch": 0.86, + "learning_rate": 2.742417770183682e-08, + "loss": 0.0006, + "step": 44490 + }, + { + "epoch": 0.86, + "learning_rate": 2.742029435750068e-08, + "loss": 0.0003, + "step": 44491 + }, + { + "epoch": 0.86, + "learning_rate": 2.7416411013164537e-08, + "loss": 0.0004, + "step": 44492 + }, + { + "epoch": 0.86, + "learning_rate": 2.7412527668828395e-08, + "loss": 0.0005, + "step": 44493 + }, + { + "epoch": 0.86, + "learning_rate": 2.7408644324492254e-08, + "loss": 0.0005, + "step": 44494 + }, + { + "epoch": 0.86, + "learning_rate": 2.7404760980156112e-08, + "loss": 0.0006, + "step": 44495 + }, + { + "epoch": 0.86, + "learning_rate": 2.740087763581997e-08, + "loss": 0.0004, + "step": 44496 + }, + { + "epoch": 0.86, + "learning_rate": 2.739699429148383e-08, + "loss": 0.0003, + "step": 44497 + }, + { + "epoch": 0.86, + "learning_rate": 2.7393110947147687e-08, + "loss": 1.253, + "step": 44498 + }, + { + "epoch": 0.86, + "learning_rate": 2.7389227602811538e-08, + "loss": 0.0005, + "step": 44499 + }, + { + "epoch": 0.86, + "learning_rate": 2.7385344258475397e-08, + "loss": 0.009, + "step": 44500 + }, + { + "epoch": 0.86, + "learning_rate": 2.7381460914139255e-08, + "loss": 0.0003, + "step": 44501 + }, + { + "epoch": 0.86, + "learning_rate": 2.7377577569803113e-08, + "loss": 0.0002, + "step": 44502 + }, + { + "epoch": 0.86, + "learning_rate": 2.737369422546697e-08, + "loss": 0.0002, + "step": 44503 + }, + { + "epoch": 0.86, + "learning_rate": 2.736981088113083e-08, + "loss": 0.0006, + "step": 44504 + }, + { + "epoch": 0.86, + "learning_rate": 2.7365927536794688e-08, + "loss": 0.0005, + "step": 44505 + }, + { + "epoch": 0.86, + "learning_rate": 2.7362044192458543e-08, + "loss": 0.0003, + "step": 44506 + }, + { + "epoch": 0.86, + "learning_rate": 2.73581608481224e-08, + "loss": 0.0004, + "step": 44507 + }, + { + "epoch": 0.86, + "learning_rate": 2.735427750378626e-08, + "loss": 0.0058, + "step": 44508 + }, + { + "epoch": 0.86, + "learning_rate": 2.7350394159450117e-08, + "loss": 0.0004, + "step": 44509 + }, + { + "epoch": 0.86, + "learning_rate": 2.7346510815113976e-08, + "loss": 0.0003, + "step": 44510 + }, + { + "epoch": 0.86, + "learning_rate": 2.7342627470777834e-08, + "loss": 0.001, + "step": 44511 + }, + { + "epoch": 0.86, + "learning_rate": 2.7338744126441692e-08, + "loss": 0.0004, + "step": 44512 + }, + { + "epoch": 0.86, + "learning_rate": 2.7334860782105547e-08, + "loss": 0.0011, + "step": 44513 + }, + { + "epoch": 0.86, + "learning_rate": 2.7330977437769402e-08, + "loss": 0.0004, + "step": 44514 + }, + { + "epoch": 0.86, + "learning_rate": 2.732709409343326e-08, + "loss": 0.0003, + "step": 44515 + }, + { + "epoch": 0.86, + "learning_rate": 2.732321074909712e-08, + "loss": 0.0009, + "step": 44516 + }, + { + "epoch": 0.86, + "learning_rate": 2.7319327404760977e-08, + "loss": 0.0007, + "step": 44517 + }, + { + "epoch": 0.86, + "learning_rate": 2.7315444060424835e-08, + "loss": 0.6154, + "step": 44518 + }, + { + "epoch": 0.86, + "learning_rate": 2.7311560716088693e-08, + "loss": 0.0005, + "step": 44519 + }, + { + "epoch": 0.86, + "learning_rate": 2.730767737175255e-08, + "loss": 0.0005, + "step": 44520 + }, + { + "epoch": 0.86, + "learning_rate": 2.730379402741641e-08, + "loss": 0.0061, + "step": 44521 + }, + { + "epoch": 0.86, + "learning_rate": 2.7299910683080268e-08, + "loss": 0.0009, + "step": 44522 + }, + { + "epoch": 0.86, + "learning_rate": 2.7296027338744126e-08, + "loss": 0.0033, + "step": 44523 + }, + { + "epoch": 0.86, + "learning_rate": 2.7292143994407984e-08, + "loss": 0.0005, + "step": 44524 + }, + { + "epoch": 0.86, + "learning_rate": 2.7288260650071843e-08, + "loss": 0.0008, + "step": 44525 + }, + { + "epoch": 0.86, + "learning_rate": 2.72843773057357e-08, + "loss": 0.0004, + "step": 44526 + }, + { + "epoch": 0.86, + "learning_rate": 2.728049396139956e-08, + "loss": 0.0005, + "step": 44527 + }, + { + "epoch": 0.86, + "learning_rate": 2.727661061706341e-08, + "loss": 0.0004, + "step": 44528 + }, + { + "epoch": 0.86, + "learning_rate": 2.727272727272727e-08, + "loss": 0.0006, + "step": 44529 + }, + { + "epoch": 0.86, + "learning_rate": 2.7268843928391127e-08, + "loss": 0.0025, + "step": 44530 + }, + { + "epoch": 0.86, + "learning_rate": 2.7264960584054986e-08, + "loss": 0.0004, + "step": 44531 + }, + { + "epoch": 0.86, + "learning_rate": 2.7261077239718844e-08, + "loss": 0.0005, + "step": 44532 + }, + { + "epoch": 0.86, + "learning_rate": 2.7257193895382702e-08, + "loss": 0.3136, + "step": 44533 + }, + { + "epoch": 0.86, + "learning_rate": 2.725331055104656e-08, + "loss": 0.0004, + "step": 44534 + }, + { + "epoch": 0.86, + "learning_rate": 2.724942720671042e-08, + "loss": 0.0004, + "step": 44535 + }, + { + "epoch": 0.86, + "learning_rate": 2.7245543862374277e-08, + "loss": 0.0006, + "step": 44536 + }, + { + "epoch": 0.86, + "learning_rate": 2.7241660518038135e-08, + "loss": 0.0005, + "step": 44537 + }, + { + "epoch": 0.86, + "learning_rate": 2.7237777173701993e-08, + "loss": 0.0004, + "step": 44538 + }, + { + "epoch": 0.86, + "learning_rate": 2.723389382936585e-08, + "loss": 0.0002, + "step": 44539 + }, + { + "epoch": 0.86, + "learning_rate": 2.723001048502971e-08, + "loss": 0.7352, + "step": 44540 + }, + { + "epoch": 0.86, + "learning_rate": 2.7226127140693568e-08, + "loss": 0.0004, + "step": 44541 + }, + { + "epoch": 0.86, + "learning_rate": 2.722224379635742e-08, + "loss": 0.0003, + "step": 44542 + }, + { + "epoch": 0.86, + "learning_rate": 2.7218360452021278e-08, + "loss": 1.0637, + "step": 44543 + }, + { + "epoch": 0.86, + "learning_rate": 2.7214477107685136e-08, + "loss": 0.0003, + "step": 44544 + }, + { + "epoch": 0.86, + "learning_rate": 2.7210593763348994e-08, + "loss": 0.0003, + "step": 44545 + }, + { + "epoch": 0.86, + "learning_rate": 2.7206710419012853e-08, + "loss": 0.0004, + "step": 44546 + }, + { + "epoch": 0.86, + "learning_rate": 2.720282707467671e-08, + "loss": 0.0007, + "step": 44547 + }, + { + "epoch": 0.86, + "learning_rate": 2.719894373034057e-08, + "loss": 0.0003, + "step": 44548 + }, + { + "epoch": 0.86, + "learning_rate": 2.7195060386004427e-08, + "loss": 0.0004, + "step": 44549 + }, + { + "epoch": 0.86, + "learning_rate": 2.7191177041668286e-08, + "loss": 0.0004, + "step": 44550 + }, + { + "epoch": 0.86, + "learning_rate": 2.718729369733214e-08, + "loss": 0.0013, + "step": 44551 + }, + { + "epoch": 0.86, + "learning_rate": 2.7183410352996e-08, + "loss": 0.0005, + "step": 44552 + }, + { + "epoch": 0.86, + "learning_rate": 2.7179527008659857e-08, + "loss": 0.0003, + "step": 44553 + }, + { + "epoch": 0.86, + "learning_rate": 2.7175643664323715e-08, + "loss": 0.0004, + "step": 44554 + }, + { + "epoch": 0.86, + "learning_rate": 2.7171760319987574e-08, + "loss": 0.0005, + "step": 44555 + }, + { + "epoch": 0.86, + "learning_rate": 2.7167876975651432e-08, + "loss": 0.0002, + "step": 44556 + }, + { + "epoch": 0.86, + "learning_rate": 2.7163993631315287e-08, + "loss": 0.0002, + "step": 44557 + }, + { + "epoch": 0.86, + "learning_rate": 2.716011028697914e-08, + "loss": 0.0005, + "step": 44558 + }, + { + "epoch": 0.86, + "learning_rate": 2.7156226942643e-08, + "loss": 0.0007, + "step": 44559 + }, + { + "epoch": 0.86, + "learning_rate": 2.7152343598306858e-08, + "loss": 0.0003, + "step": 44560 + }, + { + "epoch": 0.86, + "learning_rate": 2.7148460253970716e-08, + "loss": 0.0004, + "step": 44561 + }, + { + "epoch": 0.86, + "learning_rate": 2.7144576909634575e-08, + "loss": 0.0004, + "step": 44562 + }, + { + "epoch": 0.86, + "learning_rate": 2.7140693565298433e-08, + "loss": 0.0004, + "step": 44563 + }, + { + "epoch": 0.86, + "learning_rate": 2.713681022096229e-08, + "loss": 0.0003, + "step": 44564 + }, + { + "epoch": 0.86, + "learning_rate": 2.713292687662615e-08, + "loss": 0.0003, + "step": 44565 + }, + { + "epoch": 0.86, + "learning_rate": 2.7129043532290008e-08, + "loss": 0.0003, + "step": 44566 + }, + { + "epoch": 0.86, + "learning_rate": 2.7125160187953866e-08, + "loss": 0.0005, + "step": 44567 + }, + { + "epoch": 0.86, + "learning_rate": 2.7121276843617724e-08, + "loss": 0.0004, + "step": 44568 + }, + { + "epoch": 0.86, + "learning_rate": 2.7117393499281582e-08, + "loss": 0.0006, + "step": 44569 + }, + { + "epoch": 0.86, + "learning_rate": 2.711351015494544e-08, + "loss": 0.0009, + "step": 44570 + }, + { + "epoch": 0.86, + "learning_rate": 2.7109626810609292e-08, + "loss": 0.0051, + "step": 44571 + }, + { + "epoch": 0.86, + "learning_rate": 2.710574346627315e-08, + "loss": 0.0004, + "step": 44572 + }, + { + "epoch": 0.86, + "learning_rate": 2.710186012193701e-08, + "loss": 0.0028, + "step": 44573 + }, + { + "epoch": 0.86, + "learning_rate": 2.7097976777600867e-08, + "loss": 0.0003, + "step": 44574 + }, + { + "epoch": 0.86, + "learning_rate": 2.7094093433264725e-08, + "loss": 0.0004, + "step": 44575 + }, + { + "epoch": 0.86, + "learning_rate": 2.7090210088928583e-08, + "loss": 0.0004, + "step": 44576 + }, + { + "epoch": 0.86, + "learning_rate": 2.708632674459244e-08, + "loss": 0.0004, + "step": 44577 + }, + { + "epoch": 0.86, + "learning_rate": 2.70824434002563e-08, + "loss": 0.0007, + "step": 44578 + }, + { + "epoch": 0.86, + "learning_rate": 2.7078560055920158e-08, + "loss": 0.0002, + "step": 44579 + }, + { + "epoch": 0.86, + "learning_rate": 2.7074676711584016e-08, + "loss": 0.0004, + "step": 44580 + }, + { + "epoch": 0.86, + "learning_rate": 2.7070793367247875e-08, + "loss": 0.0004, + "step": 44581 + }, + { + "epoch": 0.86, + "learning_rate": 2.7066910022911733e-08, + "loss": 0.4125, + "step": 44582 + }, + { + "epoch": 0.86, + "learning_rate": 2.706302667857559e-08, + "loss": 0.0048, + "step": 44583 + }, + { + "epoch": 0.86, + "learning_rate": 2.705914333423945e-08, + "loss": 0.0003, + "step": 44584 + }, + { + "epoch": 0.86, + "learning_rate": 2.7055259989903308e-08, + "loss": 0.0005, + "step": 44585 + }, + { + "epoch": 0.86, + "learning_rate": 2.705137664556716e-08, + "loss": 0.0004, + "step": 44586 + }, + { + "epoch": 0.86, + "learning_rate": 2.7047493301231017e-08, + "loss": 0.0004, + "step": 44587 + }, + { + "epoch": 0.86, + "learning_rate": 2.7043609956894876e-08, + "loss": 0.0003, + "step": 44588 + }, + { + "epoch": 0.86, + "learning_rate": 2.7039726612558734e-08, + "loss": 0.0004, + "step": 44589 + }, + { + "epoch": 0.86, + "learning_rate": 2.7035843268222592e-08, + "loss": 0.0002, + "step": 44590 + }, + { + "epoch": 0.86, + "learning_rate": 2.703195992388645e-08, + "loss": 0.0004, + "step": 44591 + }, + { + "epoch": 0.86, + "learning_rate": 2.702807657955031e-08, + "loss": 0.0004, + "step": 44592 + }, + { + "epoch": 0.87, + "learning_rate": 2.7024193235214167e-08, + "loss": 0.0006, + "step": 44593 + }, + { + "epoch": 0.87, + "learning_rate": 2.7020309890878025e-08, + "loss": 0.001, + "step": 44594 + }, + { + "epoch": 0.87, + "learning_rate": 2.701642654654188e-08, + "loss": 0.0018, + "step": 44595 + }, + { + "epoch": 0.87, + "learning_rate": 2.701254320220574e-08, + "loss": 0.0003, + "step": 44596 + }, + { + "epoch": 0.87, + "learning_rate": 2.7008659857869597e-08, + "loss": 0.0006, + "step": 44597 + }, + { + "epoch": 0.87, + "learning_rate": 2.7004776513533455e-08, + "loss": 0.0004, + "step": 44598 + }, + { + "epoch": 0.87, + "learning_rate": 2.7000893169197313e-08, + "loss": 0.1114, + "step": 44599 + }, + { + "epoch": 0.87, + "learning_rate": 2.6997009824861168e-08, + "loss": 0.0003, + "step": 44600 + }, + { + "epoch": 0.87, + "learning_rate": 2.6993126480525026e-08, + "loss": 0.0005, + "step": 44601 + }, + { + "epoch": 0.87, + "learning_rate": 2.698924313618888e-08, + "loss": 0.0005, + "step": 44602 + }, + { + "epoch": 0.87, + "learning_rate": 2.698535979185274e-08, + "loss": 0.0005, + "step": 44603 + }, + { + "epoch": 0.87, + "learning_rate": 2.6981476447516598e-08, + "loss": 0.0004, + "step": 44604 + }, + { + "epoch": 0.87, + "learning_rate": 2.6977593103180456e-08, + "loss": 0.0005, + "step": 44605 + }, + { + "epoch": 0.87, + "learning_rate": 2.6973709758844314e-08, + "loss": 0.0005, + "step": 44606 + }, + { + "epoch": 0.87, + "learning_rate": 2.6969826414508172e-08, + "loss": 0.5259, + "step": 44607 + }, + { + "epoch": 0.87, + "learning_rate": 2.696594307017203e-08, + "loss": 0.0004, + "step": 44608 + }, + { + "epoch": 0.87, + "learning_rate": 2.696205972583589e-08, + "loss": 0.0004, + "step": 44609 + }, + { + "epoch": 0.87, + "learning_rate": 2.6958176381499747e-08, + "loss": 0.0004, + "step": 44610 + }, + { + "epoch": 0.87, + "learning_rate": 2.6954293037163605e-08, + "loss": 0.0004, + "step": 44611 + }, + { + "epoch": 0.87, + "learning_rate": 2.6950409692827464e-08, + "loss": 0.0002, + "step": 44612 + }, + { + "epoch": 0.87, + "learning_rate": 2.6946526348491322e-08, + "loss": 0.0004, + "step": 44613 + }, + { + "epoch": 0.87, + "learning_rate": 2.694264300415518e-08, + "loss": 0.0003, + "step": 44614 + }, + { + "epoch": 0.87, + "learning_rate": 2.6938759659819032e-08, + "loss": 0.0004, + "step": 44615 + }, + { + "epoch": 0.87, + "learning_rate": 2.693487631548289e-08, + "loss": 0.0003, + "step": 44616 + }, + { + "epoch": 0.87, + "learning_rate": 2.6930992971146748e-08, + "loss": 0.0002, + "step": 44617 + }, + { + "epoch": 0.87, + "learning_rate": 2.6927109626810607e-08, + "loss": 0.0005, + "step": 44618 + }, + { + "epoch": 0.87, + "learning_rate": 2.6923226282474465e-08, + "loss": 0.0003, + "step": 44619 + }, + { + "epoch": 0.87, + "learning_rate": 2.6919342938138323e-08, + "loss": 0.0005, + "step": 44620 + }, + { + "epoch": 0.87, + "learning_rate": 2.691545959380218e-08, + "loss": 0.0004, + "step": 44621 + }, + { + "epoch": 0.87, + "learning_rate": 2.691157624946604e-08, + "loss": 0.0004, + "step": 44622 + }, + { + "epoch": 0.87, + "learning_rate": 2.6907692905129898e-08, + "loss": 0.0004, + "step": 44623 + }, + { + "epoch": 0.87, + "learning_rate": 2.6903809560793756e-08, + "loss": 0.0004, + "step": 44624 + }, + { + "epoch": 0.87, + "learning_rate": 2.6899926216457614e-08, + "loss": 0.0003, + "step": 44625 + }, + { + "epoch": 0.87, + "learning_rate": 2.6896042872121472e-08, + "loss": 0.0004, + "step": 44626 + }, + { + "epoch": 0.87, + "learning_rate": 2.689215952778533e-08, + "loss": 0.0005, + "step": 44627 + }, + { + "epoch": 0.87, + "learning_rate": 2.688827618344919e-08, + "loss": 0.0003, + "step": 44628 + }, + { + "epoch": 0.87, + "learning_rate": 2.688439283911304e-08, + "loss": 0.9639, + "step": 44629 + }, + { + "epoch": 0.87, + "learning_rate": 2.68805094947769e-08, + "loss": 0.0004, + "step": 44630 + }, + { + "epoch": 0.87, + "learning_rate": 2.6876626150440757e-08, + "loss": 0.5386, + "step": 44631 + }, + { + "epoch": 0.87, + "learning_rate": 2.6872742806104615e-08, + "loss": 0.0005, + "step": 44632 + }, + { + "epoch": 0.87, + "learning_rate": 2.6868859461768474e-08, + "loss": 0.0056, + "step": 44633 + }, + { + "epoch": 0.87, + "learning_rate": 2.6864976117432332e-08, + "loss": 0.0004, + "step": 44634 + }, + { + "epoch": 0.87, + "learning_rate": 2.686109277309619e-08, + "loss": 0.0528, + "step": 44635 + }, + { + "epoch": 0.87, + "learning_rate": 2.6857209428760048e-08, + "loss": 0.0005, + "step": 44636 + }, + { + "epoch": 0.87, + "learning_rate": 2.6853326084423907e-08, + "loss": 0.0003, + "step": 44637 + }, + { + "epoch": 0.87, + "learning_rate": 2.6849442740087765e-08, + "loss": 0.6946, + "step": 44638 + }, + { + "epoch": 0.87, + "learning_rate": 2.684555939575162e-08, + "loss": 0.0004, + "step": 44639 + }, + { + "epoch": 0.87, + "learning_rate": 2.6841676051415478e-08, + "loss": 0.0003, + "step": 44640 + }, + { + "epoch": 0.87, + "learning_rate": 2.6837792707079336e-08, + "loss": 0.0007, + "step": 44641 + }, + { + "epoch": 0.87, + "learning_rate": 2.6833909362743194e-08, + "loss": 0.0013, + "step": 44642 + }, + { + "epoch": 0.87, + "learning_rate": 2.6830026018407053e-08, + "loss": 0.0029, + "step": 44643 + }, + { + "epoch": 0.87, + "learning_rate": 2.6826142674070908e-08, + "loss": 0.0004, + "step": 44644 + }, + { + "epoch": 0.87, + "learning_rate": 2.6822259329734766e-08, + "loss": 0.0004, + "step": 44645 + }, + { + "epoch": 0.87, + "learning_rate": 2.681837598539862e-08, + "loss": 0.0011, + "step": 44646 + }, + { + "epoch": 0.87, + "learning_rate": 2.681449264106248e-08, + "loss": 0.0005, + "step": 44647 + }, + { + "epoch": 0.87, + "learning_rate": 2.6810609296726337e-08, + "loss": 0.0002, + "step": 44648 + }, + { + "epoch": 0.87, + "learning_rate": 2.6806725952390196e-08, + "loss": 0.0005, + "step": 44649 + }, + { + "epoch": 0.87, + "learning_rate": 2.6802842608054054e-08, + "loss": 0.001, + "step": 44650 + }, + { + "epoch": 0.87, + "learning_rate": 2.6798959263717912e-08, + "loss": 0.0002, + "step": 44651 + }, + { + "epoch": 0.87, + "learning_rate": 2.679507591938177e-08, + "loss": 0.7608, + "step": 44652 + }, + { + "epoch": 0.87, + "learning_rate": 2.679119257504563e-08, + "loss": 0.0007, + "step": 44653 + }, + { + "epoch": 0.87, + "learning_rate": 2.6787309230709487e-08, + "loss": 0.0004, + "step": 44654 + }, + { + "epoch": 0.87, + "learning_rate": 2.6783425886373345e-08, + "loss": 0.0007, + "step": 44655 + }, + { + "epoch": 0.87, + "learning_rate": 2.6779542542037203e-08, + "loss": 0.0003, + "step": 44656 + }, + { + "epoch": 0.87, + "learning_rate": 2.677565919770106e-08, + "loss": 0.0002, + "step": 44657 + }, + { + "epoch": 0.87, + "learning_rate": 2.6771775853364913e-08, + "loss": 0.0003, + "step": 44658 + }, + { + "epoch": 0.87, + "learning_rate": 2.676789250902877e-08, + "loss": 0.1781, + "step": 44659 + }, + { + "epoch": 0.87, + "learning_rate": 2.676400916469263e-08, + "loss": 0.0013, + "step": 44660 + }, + { + "epoch": 0.87, + "learning_rate": 2.6760125820356488e-08, + "loss": 0.0003, + "step": 44661 + }, + { + "epoch": 0.87, + "learning_rate": 2.6756242476020346e-08, + "loss": 0.0003, + "step": 44662 + }, + { + "epoch": 0.87, + "learning_rate": 2.6752359131684204e-08, + "loss": 0.0004, + "step": 44663 + }, + { + "epoch": 0.87, + "learning_rate": 2.6748475787348063e-08, + "loss": 0.0003, + "step": 44664 + }, + { + "epoch": 0.87, + "learning_rate": 2.674459244301192e-08, + "loss": 0.0005, + "step": 44665 + }, + { + "epoch": 0.87, + "learning_rate": 2.674070909867578e-08, + "loss": 0.0005, + "step": 44666 + }, + { + "epoch": 0.87, + "learning_rate": 2.6736825754339637e-08, + "loss": 0.0003, + "step": 44667 + }, + { + "epoch": 0.87, + "learning_rate": 2.6732942410003496e-08, + "loss": 0.0003, + "step": 44668 + }, + { + "epoch": 0.87, + "learning_rate": 2.6729059065667354e-08, + "loss": 0.001, + "step": 44669 + }, + { + "epoch": 0.87, + "learning_rate": 2.6725175721331212e-08, + "loss": 0.0006, + "step": 44670 + }, + { + "epoch": 0.87, + "learning_rate": 2.672129237699507e-08, + "loss": 0.004, + "step": 44671 + }, + { + "epoch": 0.87, + "learning_rate": 2.671740903265893e-08, + "loss": 0.0004, + "step": 44672 + }, + { + "epoch": 0.87, + "learning_rate": 2.671352568832278e-08, + "loss": 0.0003, + "step": 44673 + }, + { + "epoch": 0.87, + "learning_rate": 2.670964234398664e-08, + "loss": 0.0005, + "step": 44674 + }, + { + "epoch": 0.87, + "learning_rate": 2.6705758999650497e-08, + "loss": 0.0005, + "step": 44675 + }, + { + "epoch": 0.87, + "learning_rate": 2.6701875655314355e-08, + "loss": 0.0002, + "step": 44676 + }, + { + "epoch": 0.87, + "learning_rate": 2.6697992310978213e-08, + "loss": 0.0009, + "step": 44677 + }, + { + "epoch": 0.87, + "learning_rate": 2.669410896664207e-08, + "loss": 0.0003, + "step": 44678 + }, + { + "epoch": 0.87, + "learning_rate": 2.669022562230593e-08, + "loss": 0.0002, + "step": 44679 + }, + { + "epoch": 0.87, + "learning_rate": 2.6686342277969788e-08, + "loss": 0.0004, + "step": 44680 + }, + { + "epoch": 0.87, + "learning_rate": 2.6682458933633646e-08, + "loss": 0.0004, + "step": 44681 + }, + { + "epoch": 0.87, + "learning_rate": 2.6678575589297504e-08, + "loss": 0.0004, + "step": 44682 + }, + { + "epoch": 0.87, + "learning_rate": 2.667469224496136e-08, + "loss": 0.0003, + "step": 44683 + }, + { + "epoch": 0.87, + "learning_rate": 2.6670808900625218e-08, + "loss": 0.0012, + "step": 44684 + }, + { + "epoch": 0.87, + "learning_rate": 2.6666925556289076e-08, + "loss": 0.0005, + "step": 44685 + }, + { + "epoch": 0.87, + "learning_rate": 2.6663042211952934e-08, + "loss": 0.0003, + "step": 44686 + }, + { + "epoch": 0.87, + "learning_rate": 2.665915886761679e-08, + "loss": 0.0006, + "step": 44687 + }, + { + "epoch": 0.87, + "learning_rate": 2.6655275523280647e-08, + "loss": 0.0003, + "step": 44688 + }, + { + "epoch": 0.87, + "learning_rate": 2.6651392178944505e-08, + "loss": 0.0003, + "step": 44689 + }, + { + "epoch": 0.87, + "learning_rate": 2.6647508834608364e-08, + "loss": 0.1099, + "step": 44690 + }, + { + "epoch": 0.87, + "learning_rate": 2.664362549027222e-08, + "loss": 0.0003, + "step": 44691 + }, + { + "epoch": 0.87, + "learning_rate": 2.6639742145936077e-08, + "loss": 0.0004, + "step": 44692 + }, + { + "epoch": 0.87, + "learning_rate": 2.6635858801599935e-08, + "loss": 0.0013, + "step": 44693 + }, + { + "epoch": 0.87, + "learning_rate": 2.6631975457263793e-08, + "loss": 0.0024, + "step": 44694 + }, + { + "epoch": 0.87, + "learning_rate": 2.662809211292765e-08, + "loss": 0.0004, + "step": 44695 + }, + { + "epoch": 0.87, + "learning_rate": 2.662420876859151e-08, + "loss": 0.0004, + "step": 44696 + }, + { + "epoch": 0.87, + "learning_rate": 2.6620325424255368e-08, + "loss": 0.0003, + "step": 44697 + }, + { + "epoch": 0.87, + "learning_rate": 2.6616442079919226e-08, + "loss": 0.0296, + "step": 44698 + }, + { + "epoch": 0.87, + "learning_rate": 2.6612558735583085e-08, + "loss": 0.8545, + "step": 44699 + }, + { + "epoch": 0.87, + "learning_rate": 2.6608675391246943e-08, + "loss": 0.0004, + "step": 44700 + }, + { + "epoch": 0.87, + "learning_rate": 2.66047920469108e-08, + "loss": 0.0007, + "step": 44701 + }, + { + "epoch": 0.87, + "learning_rate": 2.6600908702574653e-08, + "loss": 0.0003, + "step": 44702 + }, + { + "epoch": 0.87, + "learning_rate": 2.659702535823851e-08, + "loss": 0.0004, + "step": 44703 + }, + { + "epoch": 0.87, + "learning_rate": 2.659314201390237e-08, + "loss": 0.0003, + "step": 44704 + }, + { + "epoch": 0.87, + "learning_rate": 2.6589258669566227e-08, + "loss": 0.0004, + "step": 44705 + }, + { + "epoch": 0.87, + "learning_rate": 2.6585375325230086e-08, + "loss": 0.0006, + "step": 44706 + }, + { + "epoch": 0.87, + "learning_rate": 2.6581491980893944e-08, + "loss": 0.0005, + "step": 44707 + }, + { + "epoch": 0.87, + "learning_rate": 2.6577608636557802e-08, + "loss": 0.0004, + "step": 44708 + }, + { + "epoch": 0.87, + "learning_rate": 2.657372529222166e-08, + "loss": 0.0016, + "step": 44709 + }, + { + "epoch": 0.87, + "learning_rate": 2.656984194788552e-08, + "loss": 0.0003, + "step": 44710 + }, + { + "epoch": 0.87, + "learning_rate": 2.6565958603549377e-08, + "loss": 0.0033, + "step": 44711 + }, + { + "epoch": 0.87, + "learning_rate": 2.6562075259213235e-08, + "loss": 0.0004, + "step": 44712 + }, + { + "epoch": 0.87, + "learning_rate": 2.6558191914877093e-08, + "loss": 0.0014, + "step": 44713 + }, + { + "epoch": 0.87, + "learning_rate": 2.655430857054095e-08, + "loss": 0.2563, + "step": 44714 + }, + { + "epoch": 0.87, + "learning_rate": 2.655042522620481e-08, + "loss": 0.0003, + "step": 44715 + }, + { + "epoch": 0.87, + "learning_rate": 2.654654188186866e-08, + "loss": 0.0003, + "step": 44716 + }, + { + "epoch": 0.87, + "learning_rate": 2.654265853753252e-08, + "loss": 0.0005, + "step": 44717 + }, + { + "epoch": 0.87, + "learning_rate": 2.6538775193196378e-08, + "loss": 0.0004, + "step": 44718 + }, + { + "epoch": 0.87, + "learning_rate": 2.6534891848860236e-08, + "loss": 0.0003, + "step": 44719 + }, + { + "epoch": 0.87, + "learning_rate": 2.6531008504524094e-08, + "loss": 0.0031, + "step": 44720 + }, + { + "epoch": 0.87, + "learning_rate": 2.6527125160187953e-08, + "loss": 0.0005, + "step": 44721 + }, + { + "epoch": 0.87, + "learning_rate": 2.652324181585181e-08, + "loss": 0.0004, + "step": 44722 + }, + { + "epoch": 0.87, + "learning_rate": 2.651935847151567e-08, + "loss": 0.0012, + "step": 44723 + }, + { + "epoch": 0.87, + "learning_rate": 2.6515475127179527e-08, + "loss": 0.8143, + "step": 44724 + }, + { + "epoch": 0.87, + "learning_rate": 2.6511591782843386e-08, + "loss": 0.0009, + "step": 44725 + }, + { + "epoch": 0.87, + "learning_rate": 2.6507708438507244e-08, + "loss": 0.0012, + "step": 44726 + }, + { + "epoch": 0.87, + "learning_rate": 2.6503825094171102e-08, + "loss": 0.0004, + "step": 44727 + }, + { + "epoch": 0.87, + "learning_rate": 2.6499941749834957e-08, + "loss": 0.0004, + "step": 44728 + }, + { + "epoch": 0.87, + "learning_rate": 2.6496058405498815e-08, + "loss": 0.0003, + "step": 44729 + }, + { + "epoch": 0.87, + "learning_rate": 2.6492175061162674e-08, + "loss": 0.0128, + "step": 44730 + }, + { + "epoch": 0.87, + "learning_rate": 2.648829171682653e-08, + "loss": 0.0005, + "step": 44731 + }, + { + "epoch": 0.87, + "learning_rate": 2.6484408372490387e-08, + "loss": 0.0004, + "step": 44732 + }, + { + "epoch": 0.87, + "learning_rate": 2.6480525028154245e-08, + "loss": 0.0564, + "step": 44733 + }, + { + "epoch": 0.87, + "learning_rate": 2.6476641683818103e-08, + "loss": 0.01, + "step": 44734 + }, + { + "epoch": 0.87, + "learning_rate": 2.6472758339481958e-08, + "loss": 0.0003, + "step": 44735 + }, + { + "epoch": 0.87, + "learning_rate": 2.6468874995145816e-08, + "loss": 0.0002, + "step": 44736 + }, + { + "epoch": 0.87, + "learning_rate": 2.6464991650809675e-08, + "loss": 0.0005, + "step": 44737 + }, + { + "epoch": 0.87, + "learning_rate": 2.6461108306473533e-08, + "loss": 0.0639, + "step": 44738 + }, + { + "epoch": 0.87, + "learning_rate": 2.645722496213739e-08, + "loss": 0.0005, + "step": 44739 + }, + { + "epoch": 0.87, + "learning_rate": 2.645334161780125e-08, + "loss": 0.0003, + "step": 44740 + }, + { + "epoch": 0.87, + "learning_rate": 2.6449458273465108e-08, + "loss": 0.7364, + "step": 44741 + }, + { + "epoch": 0.87, + "learning_rate": 2.6445574929128966e-08, + "loss": 0.0005, + "step": 44742 + }, + { + "epoch": 0.87, + "learning_rate": 2.6441691584792824e-08, + "loss": 0.0003, + "step": 44743 + }, + { + "epoch": 0.87, + "learning_rate": 2.6437808240456682e-08, + "loss": 0.0003, + "step": 44744 + }, + { + "epoch": 0.87, + "learning_rate": 2.6433924896120534e-08, + "loss": 0.0005, + "step": 44745 + }, + { + "epoch": 0.87, + "learning_rate": 2.6430041551784392e-08, + "loss": 0.0005, + "step": 44746 + }, + { + "epoch": 0.87, + "learning_rate": 2.642615820744825e-08, + "loss": 0.0003, + "step": 44747 + }, + { + "epoch": 0.87, + "learning_rate": 2.642227486311211e-08, + "loss": 0.0011, + "step": 44748 + }, + { + "epoch": 0.87, + "learning_rate": 2.6418391518775967e-08, + "loss": 0.0004, + "step": 44749 + }, + { + "epoch": 0.87, + "learning_rate": 2.6414508174439825e-08, + "loss": 0.0003, + "step": 44750 + }, + { + "epoch": 0.87, + "learning_rate": 2.6410624830103684e-08, + "loss": 0.0004, + "step": 44751 + }, + { + "epoch": 0.87, + "learning_rate": 2.6406741485767542e-08, + "loss": 0.0004, + "step": 44752 + }, + { + "epoch": 0.87, + "learning_rate": 2.64028581414314e-08, + "loss": 0.0005, + "step": 44753 + }, + { + "epoch": 0.87, + "learning_rate": 2.6398974797095258e-08, + "loss": 0.0003, + "step": 44754 + }, + { + "epoch": 0.87, + "learning_rate": 2.6395091452759116e-08, + "loss": 0.0004, + "step": 44755 + }, + { + "epoch": 0.87, + "learning_rate": 2.6391208108422975e-08, + "loss": 0.0005, + "step": 44756 + }, + { + "epoch": 0.87, + "learning_rate": 2.6387324764086833e-08, + "loss": 0.0003, + "step": 44757 + }, + { + "epoch": 0.87, + "learning_rate": 2.638344141975069e-08, + "loss": 0.0003, + "step": 44758 + }, + { + "epoch": 0.87, + "learning_rate": 2.637955807541455e-08, + "loss": 0.0004, + "step": 44759 + }, + { + "epoch": 0.87, + "learning_rate": 2.63756747310784e-08, + "loss": 0.0004, + "step": 44760 + }, + { + "epoch": 0.87, + "learning_rate": 2.637179138674226e-08, + "loss": 0.0005, + "step": 44761 + }, + { + "epoch": 0.87, + "learning_rate": 2.6367908042406118e-08, + "loss": 0.0006, + "step": 44762 + }, + { + "epoch": 0.87, + "learning_rate": 2.6364024698069976e-08, + "loss": 0.0004, + "step": 44763 + }, + { + "epoch": 0.87, + "learning_rate": 2.6360141353733834e-08, + "loss": 0.0004, + "step": 44764 + }, + { + "epoch": 0.87, + "learning_rate": 2.6356258009397692e-08, + "loss": 0.0003, + "step": 44765 + }, + { + "epoch": 0.87, + "learning_rate": 2.635237466506155e-08, + "loss": 0.0004, + "step": 44766 + }, + { + "epoch": 0.87, + "learning_rate": 2.634849132072541e-08, + "loss": 0.5611, + "step": 44767 + }, + { + "epoch": 0.87, + "learning_rate": 2.6344607976389267e-08, + "loss": 0.1834, + "step": 44768 + }, + { + "epoch": 0.87, + "learning_rate": 2.6340724632053125e-08, + "loss": 0.0004, + "step": 44769 + }, + { + "epoch": 0.87, + "learning_rate": 2.6336841287716984e-08, + "loss": 0.0004, + "step": 44770 + }, + { + "epoch": 0.87, + "learning_rate": 2.6332957943380842e-08, + "loss": 0.0003, + "step": 44771 + }, + { + "epoch": 0.87, + "learning_rate": 2.6329074599044697e-08, + "loss": 0.0005, + "step": 44772 + }, + { + "epoch": 0.87, + "learning_rate": 2.6325191254708555e-08, + "loss": 0.0005, + "step": 44773 + }, + { + "epoch": 0.87, + "learning_rate": 2.632130791037241e-08, + "loss": 0.0003, + "step": 44774 + }, + { + "epoch": 0.87, + "learning_rate": 2.6317424566036268e-08, + "loss": 0.0004, + "step": 44775 + }, + { + "epoch": 0.87, + "learning_rate": 2.6313541221700126e-08, + "loss": 0.0005, + "step": 44776 + }, + { + "epoch": 0.87, + "learning_rate": 2.6309657877363985e-08, + "loss": 0.0005, + "step": 44777 + }, + { + "epoch": 0.87, + "learning_rate": 2.6305774533027843e-08, + "loss": 0.0003, + "step": 44778 + }, + { + "epoch": 0.87, + "learning_rate": 2.6301891188691698e-08, + "loss": 0.0003, + "step": 44779 + }, + { + "epoch": 0.87, + "learning_rate": 2.6298007844355556e-08, + "loss": 0.0003, + "step": 44780 + }, + { + "epoch": 0.87, + "learning_rate": 2.6294124500019414e-08, + "loss": 0.0003, + "step": 44781 + }, + { + "epoch": 0.87, + "learning_rate": 2.6290241155683273e-08, + "loss": 0.0003, + "step": 44782 + }, + { + "epoch": 0.87, + "learning_rate": 2.628635781134713e-08, + "loss": 0.0004, + "step": 44783 + }, + { + "epoch": 0.87, + "learning_rate": 2.628247446701099e-08, + "loss": 0.8259, + "step": 44784 + }, + { + "epoch": 0.87, + "learning_rate": 2.6278591122674847e-08, + "loss": 0.0005, + "step": 44785 + }, + { + "epoch": 0.87, + "learning_rate": 2.6274707778338706e-08, + "loss": 0.0003, + "step": 44786 + }, + { + "epoch": 0.87, + "learning_rate": 2.6270824434002564e-08, + "loss": 0.0004, + "step": 44787 + }, + { + "epoch": 0.87, + "learning_rate": 2.6266941089666422e-08, + "loss": 0.001, + "step": 44788 + }, + { + "epoch": 0.87, + "learning_rate": 2.6263057745330274e-08, + "loss": 1.0165, + "step": 44789 + }, + { + "epoch": 0.87, + "learning_rate": 2.6259174400994132e-08, + "loss": 0.0004, + "step": 44790 + }, + { + "epoch": 0.87, + "learning_rate": 2.625529105665799e-08, + "loss": 0.0003, + "step": 44791 + }, + { + "epoch": 0.87, + "learning_rate": 2.625140771232185e-08, + "loss": 0.0004, + "step": 44792 + }, + { + "epoch": 0.87, + "learning_rate": 2.6247524367985707e-08, + "loss": 0.0004, + "step": 44793 + }, + { + "epoch": 0.87, + "learning_rate": 2.6243641023649565e-08, + "loss": 0.5656, + "step": 44794 + }, + { + "epoch": 0.87, + "learning_rate": 2.6239757679313423e-08, + "loss": 0.0004, + "step": 44795 + }, + { + "epoch": 0.87, + "learning_rate": 2.623587433497728e-08, + "loss": 0.0003, + "step": 44796 + }, + { + "epoch": 0.87, + "learning_rate": 2.623199099064114e-08, + "loss": 0.0004, + "step": 44797 + }, + { + "epoch": 0.87, + "learning_rate": 2.6228107646304998e-08, + "loss": 0.0138, + "step": 44798 + }, + { + "epoch": 0.87, + "learning_rate": 2.6224224301968856e-08, + "loss": 0.0006, + "step": 44799 + }, + { + "epoch": 0.87, + "learning_rate": 2.6220340957632714e-08, + "loss": 0.0003, + "step": 44800 + }, + { + "epoch": 0.87, + "learning_rate": 2.6216457613296573e-08, + "loss": 0.0003, + "step": 44801 + }, + { + "epoch": 0.87, + "learning_rate": 2.621257426896043e-08, + "loss": 0.0007, + "step": 44802 + }, + { + "epoch": 0.87, + "learning_rate": 2.6208690924624282e-08, + "loss": 0.0004, + "step": 44803 + }, + { + "epoch": 0.87, + "learning_rate": 2.620480758028814e-08, + "loss": 0.0005, + "step": 44804 + }, + { + "epoch": 0.87, + "learning_rate": 2.6200924235952e-08, + "loss": 0.0004, + "step": 44805 + }, + { + "epoch": 0.87, + "learning_rate": 2.6197040891615857e-08, + "loss": 0.0005, + "step": 44806 + }, + { + "epoch": 0.87, + "learning_rate": 2.6193157547279715e-08, + "loss": 0.0003, + "step": 44807 + }, + { + "epoch": 0.87, + "learning_rate": 2.6189274202943574e-08, + "loss": 0.0004, + "step": 44808 + }, + { + "epoch": 0.87, + "learning_rate": 2.6185390858607432e-08, + "loss": 0.0004, + "step": 44809 + }, + { + "epoch": 0.87, + "learning_rate": 2.618150751427129e-08, + "loss": 0.0004, + "step": 44810 + }, + { + "epoch": 0.87, + "learning_rate": 2.617762416993515e-08, + "loss": 0.0004, + "step": 44811 + }, + { + "epoch": 0.87, + "learning_rate": 2.6173740825599007e-08, + "loss": 0.0003, + "step": 44812 + }, + { + "epoch": 0.87, + "learning_rate": 2.6169857481262865e-08, + "loss": 1.1529, + "step": 44813 + }, + { + "epoch": 0.87, + "learning_rate": 2.6165974136926723e-08, + "loss": 0.0003, + "step": 44814 + }, + { + "epoch": 0.87, + "learning_rate": 2.616209079259058e-08, + "loss": 0.0004, + "step": 44815 + }, + { + "epoch": 0.87, + "learning_rate": 2.6158207448254436e-08, + "loss": 0.0004, + "step": 44816 + }, + { + "epoch": 0.87, + "learning_rate": 2.6154324103918295e-08, + "loss": 0.0006, + "step": 44817 + }, + { + "epoch": 0.87, + "learning_rate": 2.615044075958215e-08, + "loss": 1.1167, + "step": 44818 + }, + { + "epoch": 0.87, + "learning_rate": 2.6146557415246008e-08, + "loss": 0.7289, + "step": 44819 + }, + { + "epoch": 0.87, + "learning_rate": 2.6142674070909866e-08, + "loss": 0.0027, + "step": 44820 + }, + { + "epoch": 0.87, + "learning_rate": 2.6138790726573724e-08, + "loss": 0.0012, + "step": 44821 + }, + { + "epoch": 0.87, + "learning_rate": 2.6134907382237582e-08, + "loss": 0.0007, + "step": 44822 + }, + { + "epoch": 0.87, + "learning_rate": 2.6131024037901437e-08, + "loss": 0.0004, + "step": 44823 + }, + { + "epoch": 0.87, + "learning_rate": 2.6127140693565296e-08, + "loss": 0.0005, + "step": 44824 + }, + { + "epoch": 0.87, + "learning_rate": 2.6123257349229154e-08, + "loss": 0.0007, + "step": 44825 + }, + { + "epoch": 0.87, + "learning_rate": 2.6119374004893012e-08, + "loss": 0.0005, + "step": 44826 + }, + { + "epoch": 0.87, + "learning_rate": 2.611549066055687e-08, + "loss": 0.1213, + "step": 44827 + }, + { + "epoch": 0.87, + "learning_rate": 2.611160731622073e-08, + "loss": 0.1782, + "step": 44828 + }, + { + "epoch": 0.87, + "learning_rate": 2.6107723971884587e-08, + "loss": 0.0004, + "step": 44829 + }, + { + "epoch": 0.87, + "learning_rate": 2.6103840627548445e-08, + "loss": 0.0004, + "step": 44830 + }, + { + "epoch": 0.87, + "learning_rate": 2.6099957283212303e-08, + "loss": 0.0003, + "step": 44831 + }, + { + "epoch": 0.87, + "learning_rate": 2.6096073938876155e-08, + "loss": 0.0004, + "step": 44832 + }, + { + "epoch": 0.87, + "learning_rate": 2.6092190594540013e-08, + "loss": 0.0341, + "step": 44833 + }, + { + "epoch": 0.87, + "learning_rate": 2.608830725020387e-08, + "loss": 0.0004, + "step": 44834 + }, + { + "epoch": 0.87, + "learning_rate": 2.608442390586773e-08, + "loss": 0.0005, + "step": 44835 + }, + { + "epoch": 0.87, + "learning_rate": 2.6080540561531588e-08, + "loss": 0.0005, + "step": 44836 + }, + { + "epoch": 0.87, + "learning_rate": 2.6076657217195446e-08, + "loss": 0.0005, + "step": 44837 + }, + { + "epoch": 0.87, + "learning_rate": 2.6072773872859304e-08, + "loss": 0.0003, + "step": 44838 + }, + { + "epoch": 0.87, + "learning_rate": 2.6068890528523163e-08, + "loss": 0.0004, + "step": 44839 + }, + { + "epoch": 0.87, + "learning_rate": 2.606500718418702e-08, + "loss": 0.0003, + "step": 44840 + }, + { + "epoch": 0.87, + "learning_rate": 2.606112383985088e-08, + "loss": 0.0421, + "step": 44841 + }, + { + "epoch": 0.87, + "learning_rate": 2.6057240495514737e-08, + "loss": 0.0004, + "step": 44842 + }, + { + "epoch": 0.87, + "learning_rate": 2.6053357151178596e-08, + "loss": 0.0003, + "step": 44843 + }, + { + "epoch": 0.87, + "learning_rate": 2.6049473806842454e-08, + "loss": 0.0003, + "step": 44844 + }, + { + "epoch": 0.87, + "learning_rate": 2.6045590462506312e-08, + "loss": 0.0006, + "step": 44845 + }, + { + "epoch": 0.87, + "learning_rate": 2.604170711817017e-08, + "loss": 0.0004, + "step": 44846 + }, + { + "epoch": 0.87, + "learning_rate": 2.6037823773834022e-08, + "loss": 0.0003, + "step": 44847 + }, + { + "epoch": 0.87, + "learning_rate": 2.603394042949788e-08, + "loss": 0.0004, + "step": 44848 + }, + { + "epoch": 0.87, + "learning_rate": 2.603005708516174e-08, + "loss": 1.0363, + "step": 44849 + }, + { + "epoch": 0.87, + "learning_rate": 2.6026173740825597e-08, + "loss": 0.0004, + "step": 44850 + }, + { + "epoch": 0.87, + "learning_rate": 2.6022290396489455e-08, + "loss": 0.0005, + "step": 44851 + }, + { + "epoch": 0.87, + "learning_rate": 2.6018407052153313e-08, + "loss": 0.0003, + "step": 44852 + }, + { + "epoch": 0.87, + "learning_rate": 2.601452370781717e-08, + "loss": 1.2438, + "step": 44853 + }, + { + "epoch": 0.87, + "learning_rate": 2.601064036348103e-08, + "loss": 0.0008, + "step": 44854 + }, + { + "epoch": 0.87, + "learning_rate": 2.6006757019144888e-08, + "loss": 0.0012, + "step": 44855 + }, + { + "epoch": 0.87, + "learning_rate": 2.6002873674808746e-08, + "loss": 0.0006, + "step": 44856 + }, + { + "epoch": 0.87, + "learning_rate": 2.5998990330472604e-08, + "loss": 0.0004, + "step": 44857 + }, + { + "epoch": 0.87, + "learning_rate": 2.5995106986136463e-08, + "loss": 0.0012, + "step": 44858 + }, + { + "epoch": 0.87, + "learning_rate": 2.599122364180032e-08, + "loss": 0.0004, + "step": 44859 + }, + { + "epoch": 0.87, + "learning_rate": 2.5987340297464176e-08, + "loss": 0.0003, + "step": 44860 + }, + { + "epoch": 0.87, + "learning_rate": 2.598345695312803e-08, + "loss": 0.0003, + "step": 44861 + }, + { + "epoch": 0.87, + "learning_rate": 2.597957360879189e-08, + "loss": 0.0004, + "step": 44862 + }, + { + "epoch": 0.87, + "learning_rate": 2.5975690264455747e-08, + "loss": 0.0006, + "step": 44863 + }, + { + "epoch": 0.87, + "learning_rate": 2.5971806920119606e-08, + "loss": 0.0003, + "step": 44864 + }, + { + "epoch": 0.87, + "learning_rate": 2.5967923575783464e-08, + "loss": 0.0004, + "step": 44865 + }, + { + "epoch": 0.87, + "learning_rate": 2.5964040231447322e-08, + "loss": 0.0003, + "step": 44866 + }, + { + "epoch": 0.87, + "learning_rate": 2.596015688711118e-08, + "loss": 0.0004, + "step": 44867 + }, + { + "epoch": 0.87, + "learning_rate": 2.5956273542775035e-08, + "loss": 0.0006, + "step": 44868 + }, + { + "epoch": 0.87, + "learning_rate": 2.5952390198438893e-08, + "loss": 0.2993, + "step": 44869 + }, + { + "epoch": 0.87, + "learning_rate": 2.5948506854102752e-08, + "loss": 0.0013, + "step": 44870 + }, + { + "epoch": 0.87, + "learning_rate": 2.594462350976661e-08, + "loss": 0.0006, + "step": 44871 + }, + { + "epoch": 0.87, + "learning_rate": 2.5940740165430468e-08, + "loss": 0.0003, + "step": 44872 + }, + { + "epoch": 0.87, + "learning_rate": 2.5936856821094326e-08, + "loss": 0.0006, + "step": 44873 + }, + { + "epoch": 0.87, + "learning_rate": 2.5932973476758185e-08, + "loss": 0.0003, + "step": 44874 + }, + { + "epoch": 0.87, + "learning_rate": 2.5929090132422043e-08, + "loss": 0.0005, + "step": 44875 + }, + { + "epoch": 0.87, + "learning_rate": 2.5925206788085895e-08, + "loss": 0.0004, + "step": 44876 + }, + { + "epoch": 0.87, + "learning_rate": 2.5921323443749753e-08, + "loss": 0.0007, + "step": 44877 + }, + { + "epoch": 0.87, + "learning_rate": 2.591744009941361e-08, + "loss": 0.0012, + "step": 44878 + }, + { + "epoch": 0.87, + "learning_rate": 2.591355675507747e-08, + "loss": 0.9563, + "step": 44879 + }, + { + "epoch": 0.87, + "learning_rate": 2.5909673410741328e-08, + "loss": 0.0004, + "step": 44880 + }, + { + "epoch": 0.87, + "learning_rate": 2.5905790066405186e-08, + "loss": 0.0004, + "step": 44881 + }, + { + "epoch": 0.87, + "learning_rate": 2.5901906722069044e-08, + "loss": 0.0003, + "step": 44882 + }, + { + "epoch": 0.87, + "learning_rate": 2.5898023377732902e-08, + "loss": 0.0003, + "step": 44883 + }, + { + "epoch": 0.87, + "learning_rate": 2.589414003339676e-08, + "loss": 0.0004, + "step": 44884 + }, + { + "epoch": 0.87, + "learning_rate": 2.589025668906062e-08, + "loss": 0.0004, + "step": 44885 + }, + { + "epoch": 0.87, + "learning_rate": 2.5886373344724477e-08, + "loss": 0.0004, + "step": 44886 + }, + { + "epoch": 0.87, + "learning_rate": 2.5882490000388335e-08, + "loss": 0.0004, + "step": 44887 + }, + { + "epoch": 0.87, + "learning_rate": 2.5878606656052194e-08, + "loss": 0.0007, + "step": 44888 + }, + { + "epoch": 0.87, + "learning_rate": 2.5874723311716052e-08, + "loss": 0.0019, + "step": 44889 + }, + { + "epoch": 0.87, + "learning_rate": 2.5870839967379903e-08, + "loss": 0.0004, + "step": 44890 + }, + { + "epoch": 0.87, + "learning_rate": 2.586695662304376e-08, + "loss": 0.0003, + "step": 44891 + }, + { + "epoch": 0.87, + "learning_rate": 2.586307327870762e-08, + "loss": 0.0005, + "step": 44892 + }, + { + "epoch": 0.87, + "learning_rate": 2.5859189934371478e-08, + "loss": 0.0003, + "step": 44893 + }, + { + "epoch": 0.87, + "learning_rate": 2.5855306590035336e-08, + "loss": 0.0025, + "step": 44894 + }, + { + "epoch": 0.87, + "learning_rate": 2.5851423245699195e-08, + "loss": 0.0003, + "step": 44895 + }, + { + "epoch": 0.87, + "learning_rate": 2.5847539901363053e-08, + "loss": 0.2338, + "step": 44896 + }, + { + "epoch": 0.87, + "learning_rate": 2.584365655702691e-08, + "loss": 0.0004, + "step": 44897 + }, + { + "epoch": 0.87, + "learning_rate": 2.583977321269077e-08, + "loss": 0.0003, + "step": 44898 + }, + { + "epoch": 0.87, + "learning_rate": 2.5835889868354628e-08, + "loss": 0.0003, + "step": 44899 + }, + { + "epoch": 0.87, + "learning_rate": 2.5832006524018486e-08, + "loss": 0.0004, + "step": 44900 + }, + { + "epoch": 0.87, + "learning_rate": 2.5828123179682344e-08, + "loss": 0.0004, + "step": 44901 + }, + { + "epoch": 0.87, + "learning_rate": 2.5824239835346202e-08, + "loss": 0.0003, + "step": 44902 + }, + { + "epoch": 0.87, + "learning_rate": 2.582035649101006e-08, + "loss": 0.0005, + "step": 44903 + }, + { + "epoch": 0.87, + "learning_rate": 2.581647314667392e-08, + "loss": 0.0006, + "step": 44904 + }, + { + "epoch": 0.87, + "learning_rate": 2.581258980233777e-08, + "loss": 0.0004, + "step": 44905 + }, + { + "epoch": 0.87, + "learning_rate": 2.580870645800163e-08, + "loss": 0.0006, + "step": 44906 + }, + { + "epoch": 0.87, + "learning_rate": 2.5804823113665487e-08, + "loss": 0.0003, + "step": 44907 + }, + { + "epoch": 0.87, + "learning_rate": 2.5800939769329345e-08, + "loss": 0.0004, + "step": 44908 + }, + { + "epoch": 0.87, + "learning_rate": 2.5797056424993203e-08, + "loss": 0.0003, + "step": 44909 + }, + { + "epoch": 0.87, + "learning_rate": 2.579317308065706e-08, + "loss": 0.0004, + "step": 44910 + }, + { + "epoch": 0.87, + "learning_rate": 2.578928973632092e-08, + "loss": 0.0003, + "step": 44911 + }, + { + "epoch": 0.87, + "learning_rate": 2.5785406391984775e-08, + "loss": 0.0003, + "step": 44912 + }, + { + "epoch": 0.87, + "learning_rate": 2.5781523047648633e-08, + "loss": 0.0027, + "step": 44913 + }, + { + "epoch": 0.87, + "learning_rate": 2.577763970331249e-08, + "loss": 0.0004, + "step": 44914 + }, + { + "epoch": 0.87, + "learning_rate": 2.577375635897635e-08, + "loss": 0.0004, + "step": 44915 + }, + { + "epoch": 0.87, + "learning_rate": 2.5769873014640208e-08, + "loss": 0.0011, + "step": 44916 + }, + { + "epoch": 0.87, + "learning_rate": 2.5765989670304066e-08, + "loss": 0.0004, + "step": 44917 + }, + { + "epoch": 0.87, + "learning_rate": 2.5762106325967924e-08, + "loss": 0.0005, + "step": 44918 + }, + { + "epoch": 0.87, + "learning_rate": 2.5758222981631776e-08, + "loss": 0.0004, + "step": 44919 + }, + { + "epoch": 0.87, + "learning_rate": 2.5754339637295634e-08, + "loss": 0.0004, + "step": 44920 + }, + { + "epoch": 0.87, + "learning_rate": 2.5750456292959492e-08, + "loss": 0.0003, + "step": 44921 + }, + { + "epoch": 0.87, + "learning_rate": 2.574657294862335e-08, + "loss": 0.0006, + "step": 44922 + }, + { + "epoch": 0.87, + "learning_rate": 2.574268960428721e-08, + "loss": 0.0004, + "step": 44923 + }, + { + "epoch": 0.87, + "learning_rate": 2.5738806259951067e-08, + "loss": 0.0003, + "step": 44924 + }, + { + "epoch": 0.87, + "learning_rate": 2.5734922915614925e-08, + "loss": 0.0004, + "step": 44925 + }, + { + "epoch": 0.87, + "learning_rate": 2.5731039571278784e-08, + "loss": 0.0004, + "step": 44926 + }, + { + "epoch": 0.87, + "learning_rate": 2.5727156226942642e-08, + "loss": 0.0004, + "step": 44927 + }, + { + "epoch": 0.87, + "learning_rate": 2.57232728826065e-08, + "loss": 0.0006, + "step": 44928 + }, + { + "epoch": 0.87, + "learning_rate": 2.571938953827036e-08, + "loss": 0.0004, + "step": 44929 + }, + { + "epoch": 0.87, + "learning_rate": 2.5715506193934217e-08, + "loss": 0.0005, + "step": 44930 + }, + { + "epoch": 0.87, + "learning_rate": 2.5711622849598075e-08, + "loss": 1.1452, + "step": 44931 + }, + { + "epoch": 0.87, + "learning_rate": 2.5707739505261933e-08, + "loss": 0.7232, + "step": 44932 + }, + { + "epoch": 0.87, + "learning_rate": 2.570385616092579e-08, + "loss": 0.0003, + "step": 44933 + }, + { + "epoch": 0.87, + "learning_rate": 2.5699972816589643e-08, + "loss": 0.0003, + "step": 44934 + }, + { + "epoch": 0.87, + "learning_rate": 2.56960894722535e-08, + "loss": 0.0004, + "step": 44935 + }, + { + "epoch": 0.87, + "learning_rate": 2.569220612791736e-08, + "loss": 0.0003, + "step": 44936 + }, + { + "epoch": 0.87, + "learning_rate": 2.5688322783581218e-08, + "loss": 0.0004, + "step": 44937 + }, + { + "epoch": 0.87, + "learning_rate": 2.5684439439245076e-08, + "loss": 0.0003, + "step": 44938 + }, + { + "epoch": 0.87, + "learning_rate": 2.5680556094908934e-08, + "loss": 0.0005, + "step": 44939 + }, + { + "epoch": 0.87, + "learning_rate": 2.5676672750572792e-08, + "loss": 0.0004, + "step": 44940 + }, + { + "epoch": 0.87, + "learning_rate": 2.567278940623665e-08, + "loss": 0.0004, + "step": 44941 + }, + { + "epoch": 0.87, + "learning_rate": 2.566890606190051e-08, + "loss": 0.0003, + "step": 44942 + }, + { + "epoch": 0.87, + "learning_rate": 2.5665022717564367e-08, + "loss": 0.0015, + "step": 44943 + }, + { + "epoch": 0.87, + "learning_rate": 2.5661139373228225e-08, + "loss": 0.0003, + "step": 44944 + }, + { + "epoch": 0.87, + "learning_rate": 2.5657256028892084e-08, + "loss": 1.2523, + "step": 44945 + }, + { + "epoch": 0.87, + "learning_rate": 2.5653372684555942e-08, + "loss": 0.0003, + "step": 44946 + }, + { + "epoch": 0.87, + "learning_rate": 2.56494893402198e-08, + "loss": 0.0628, + "step": 44947 + }, + { + "epoch": 0.87, + "learning_rate": 2.5645605995883652e-08, + "loss": 0.0005, + "step": 44948 + }, + { + "epoch": 0.87, + "learning_rate": 2.564172265154751e-08, + "loss": 0.0003, + "step": 44949 + }, + { + "epoch": 0.87, + "learning_rate": 2.5637839307211368e-08, + "loss": 0.0004, + "step": 44950 + }, + { + "epoch": 0.87, + "learning_rate": 2.5633955962875227e-08, + "loss": 0.0004, + "step": 44951 + }, + { + "epoch": 0.87, + "learning_rate": 2.5630072618539085e-08, + "loss": 0.0005, + "step": 44952 + }, + { + "epoch": 0.87, + "learning_rate": 2.5626189274202943e-08, + "loss": 0.0004, + "step": 44953 + }, + { + "epoch": 0.87, + "learning_rate": 2.56223059298668e-08, + "loss": 0.0004, + "step": 44954 + }, + { + "epoch": 0.87, + "learning_rate": 2.561842258553066e-08, + "loss": 0.0005, + "step": 44955 + }, + { + "epoch": 0.87, + "learning_rate": 2.5614539241194514e-08, + "loss": 0.0005, + "step": 44956 + }, + { + "epoch": 0.87, + "learning_rate": 2.5610655896858373e-08, + "loss": 0.0004, + "step": 44957 + }, + { + "epoch": 0.87, + "learning_rate": 2.560677255252223e-08, + "loss": 0.0004, + "step": 44958 + }, + { + "epoch": 0.87, + "learning_rate": 2.560288920818609e-08, + "loss": 0.0005, + "step": 44959 + }, + { + "epoch": 0.87, + "learning_rate": 2.5599005863849947e-08, + "loss": 0.0105, + "step": 44960 + }, + { + "epoch": 0.87, + "learning_rate": 2.5595122519513806e-08, + "loss": 0.0005, + "step": 44961 + }, + { + "epoch": 0.87, + "learning_rate": 2.5591239175177664e-08, + "loss": 0.0003, + "step": 44962 + }, + { + "epoch": 0.87, + "learning_rate": 2.5587355830841516e-08, + "loss": 0.0003, + "step": 44963 + }, + { + "epoch": 0.87, + "learning_rate": 2.5583472486505374e-08, + "loss": 0.0003, + "step": 44964 + }, + { + "epoch": 0.87, + "learning_rate": 2.5579589142169232e-08, + "loss": 0.0003, + "step": 44965 + }, + { + "epoch": 0.87, + "learning_rate": 2.557570579783309e-08, + "loss": 0.0976, + "step": 44966 + }, + { + "epoch": 0.87, + "learning_rate": 2.557182245349695e-08, + "loss": 0.0694, + "step": 44967 + }, + { + "epoch": 0.87, + "learning_rate": 2.5567939109160807e-08, + "loss": 0.0004, + "step": 44968 + }, + { + "epoch": 0.87, + "learning_rate": 2.5564055764824665e-08, + "loss": 0.0004, + "step": 44969 + }, + { + "epoch": 0.87, + "learning_rate": 2.5560172420488523e-08, + "loss": 0.0003, + "step": 44970 + }, + { + "epoch": 0.87, + "learning_rate": 2.555628907615238e-08, + "loss": 0.0004, + "step": 44971 + }, + { + "epoch": 0.87, + "learning_rate": 2.555240573181624e-08, + "loss": 0.0003, + "step": 44972 + }, + { + "epoch": 0.87, + "learning_rate": 2.5548522387480098e-08, + "loss": 0.0004, + "step": 44973 + }, + { + "epoch": 0.87, + "learning_rate": 2.5544639043143956e-08, + "loss": 0.0003, + "step": 44974 + }, + { + "epoch": 0.87, + "learning_rate": 2.5540755698807814e-08, + "loss": 0.0005, + "step": 44975 + }, + { + "epoch": 0.87, + "learning_rate": 2.5536872354471673e-08, + "loss": 0.0004, + "step": 44976 + }, + { + "epoch": 0.87, + "learning_rate": 2.5532989010135524e-08, + "loss": 0.0008, + "step": 44977 + }, + { + "epoch": 0.87, + "learning_rate": 2.5529105665799383e-08, + "loss": 0.0005, + "step": 44978 + }, + { + "epoch": 0.87, + "learning_rate": 2.552522232146324e-08, + "loss": 0.0003, + "step": 44979 + }, + { + "epoch": 0.87, + "learning_rate": 2.55213389771271e-08, + "loss": 0.0003, + "step": 44980 + }, + { + "epoch": 0.87, + "learning_rate": 2.5517455632790957e-08, + "loss": 0.0004, + "step": 44981 + }, + { + "epoch": 0.87, + "learning_rate": 2.5513572288454816e-08, + "loss": 0.0003, + "step": 44982 + }, + { + "epoch": 0.87, + "learning_rate": 2.5509688944118674e-08, + "loss": 0.0004, + "step": 44983 + }, + { + "epoch": 0.87, + "learning_rate": 2.5505805599782532e-08, + "loss": 0.0006, + "step": 44984 + }, + { + "epoch": 0.87, + "learning_rate": 2.550192225544639e-08, + "loss": 0.0003, + "step": 44985 + }, + { + "epoch": 0.87, + "learning_rate": 2.549803891111025e-08, + "loss": 0.0003, + "step": 44986 + }, + { + "epoch": 0.87, + "learning_rate": 2.5494155566774107e-08, + "loss": 0.0005, + "step": 44987 + }, + { + "epoch": 0.87, + "learning_rate": 2.5490272222437965e-08, + "loss": 0.0004, + "step": 44988 + }, + { + "epoch": 0.87, + "learning_rate": 2.5486388878101823e-08, + "loss": 0.0003, + "step": 44989 + }, + { + "epoch": 0.87, + "learning_rate": 2.548250553376568e-08, + "loss": 0.0003, + "step": 44990 + }, + { + "epoch": 0.87, + "learning_rate": 2.547862218942954e-08, + "loss": 0.0021, + "step": 44991 + }, + { + "epoch": 0.87, + "learning_rate": 2.547473884509339e-08, + "loss": 0.0004, + "step": 44992 + }, + { + "epoch": 0.87, + "learning_rate": 2.547085550075725e-08, + "loss": 0.0005, + "step": 44993 + }, + { + "epoch": 0.87, + "learning_rate": 2.5466972156421108e-08, + "loss": 0.0004, + "step": 44994 + }, + { + "epoch": 0.87, + "learning_rate": 2.5463088812084966e-08, + "loss": 0.0003, + "step": 44995 + }, + { + "epoch": 0.87, + "learning_rate": 2.5459205467748824e-08, + "loss": 0.0033, + "step": 44996 + }, + { + "epoch": 0.87, + "learning_rate": 2.5455322123412683e-08, + "loss": 0.8279, + "step": 44997 + }, + { + "epoch": 0.87, + "learning_rate": 2.545143877907654e-08, + "loss": 0.0004, + "step": 44998 + }, + { + "epoch": 0.87, + "learning_rate": 2.54475554347404e-08, + "loss": 0.0004, + "step": 44999 + }, + { + "epoch": 0.87, + "learning_rate": 2.5443672090404254e-08, + "loss": 0.0408, + "step": 45000 + }, + { + "epoch": 0.87, + "learning_rate": 2.5439788746068112e-08, + "loss": 0.0003, + "step": 45001 + }, + { + "epoch": 0.87, + "learning_rate": 2.543590540173197e-08, + "loss": 0.0003, + "step": 45002 + }, + { + "epoch": 0.87, + "learning_rate": 2.543202205739583e-08, + "loss": 0.0006, + "step": 45003 + }, + { + "epoch": 0.87, + "learning_rate": 2.5428138713059687e-08, + "loss": 1.3835, + "step": 45004 + }, + { + "epoch": 0.87, + "learning_rate": 2.5424255368723545e-08, + "loss": 0.0003, + "step": 45005 + }, + { + "epoch": 0.87, + "learning_rate": 2.54203720243874e-08, + "loss": 0.6469, + "step": 45006 + }, + { + "epoch": 0.87, + "learning_rate": 2.541648868005126e-08, + "loss": 0.0005, + "step": 45007 + }, + { + "epoch": 0.87, + "learning_rate": 2.5412605335715113e-08, + "loss": 0.0003, + "step": 45008 + }, + { + "epoch": 0.87, + "learning_rate": 2.540872199137897e-08, + "loss": 0.0003, + "step": 45009 + }, + { + "epoch": 0.87, + "learning_rate": 2.540483864704283e-08, + "loss": 0.0004, + "step": 45010 + }, + { + "epoch": 0.87, + "learning_rate": 2.5400955302706688e-08, + "loss": 0.0003, + "step": 45011 + }, + { + "epoch": 0.87, + "learning_rate": 2.5397071958370546e-08, + "loss": 0.0003, + "step": 45012 + }, + { + "epoch": 0.87, + "learning_rate": 2.5393188614034405e-08, + "loss": 0.0004, + "step": 45013 + }, + { + "epoch": 0.87, + "learning_rate": 2.5389305269698263e-08, + "loss": 0.0004, + "step": 45014 + }, + { + "epoch": 0.87, + "learning_rate": 2.538542192536212e-08, + "loss": 0.0004, + "step": 45015 + }, + { + "epoch": 0.87, + "learning_rate": 2.538153858102598e-08, + "loss": 0.0006, + "step": 45016 + }, + { + "epoch": 0.87, + "learning_rate": 2.5377655236689838e-08, + "loss": 0.0004, + "step": 45017 + }, + { + "epoch": 0.87, + "learning_rate": 2.5373771892353696e-08, + "loss": 0.0003, + "step": 45018 + }, + { + "epoch": 0.87, + "learning_rate": 2.5369888548017554e-08, + "loss": 0.0005, + "step": 45019 + }, + { + "epoch": 0.87, + "learning_rate": 2.5366005203681412e-08, + "loss": 0.0004, + "step": 45020 + }, + { + "epoch": 0.87, + "learning_rate": 2.5362121859345264e-08, + "loss": 0.621, + "step": 45021 + }, + { + "epoch": 0.87, + "learning_rate": 2.5358238515009122e-08, + "loss": 0.5877, + "step": 45022 + }, + { + "epoch": 0.87, + "learning_rate": 2.535435517067298e-08, + "loss": 0.0004, + "step": 45023 + }, + { + "epoch": 0.87, + "learning_rate": 2.535047182633684e-08, + "loss": 0.0093, + "step": 45024 + }, + { + "epoch": 0.87, + "learning_rate": 2.5346588482000697e-08, + "loss": 0.0022, + "step": 45025 + }, + { + "epoch": 0.87, + "learning_rate": 2.5342705137664555e-08, + "loss": 0.0005, + "step": 45026 + }, + { + "epoch": 0.87, + "learning_rate": 2.5338821793328413e-08, + "loss": 0.0003, + "step": 45027 + }, + { + "epoch": 0.87, + "learning_rate": 2.533493844899227e-08, + "loss": 0.3818, + "step": 45028 + }, + { + "epoch": 0.87, + "learning_rate": 2.533105510465613e-08, + "loss": 0.0224, + "step": 45029 + }, + { + "epoch": 0.87, + "learning_rate": 2.5327171760319988e-08, + "loss": 0.0003, + "step": 45030 + }, + { + "epoch": 0.87, + "learning_rate": 2.5323288415983846e-08, + "loss": 0.004, + "step": 45031 + }, + { + "epoch": 0.87, + "learning_rate": 2.5319405071647705e-08, + "loss": 0.0005, + "step": 45032 + }, + { + "epoch": 0.87, + "learning_rate": 2.5315521727311563e-08, + "loss": 0.0003, + "step": 45033 + }, + { + "epoch": 0.87, + "learning_rate": 2.531163838297542e-08, + "loss": 0.8087, + "step": 45034 + }, + { + "epoch": 0.87, + "learning_rate": 2.5307755038639273e-08, + "loss": 0.2219, + "step": 45035 + }, + { + "epoch": 0.87, + "learning_rate": 2.530387169430313e-08, + "loss": 0.0004, + "step": 45036 + }, + { + "epoch": 0.87, + "learning_rate": 2.529998834996699e-08, + "loss": 0.0004, + "step": 45037 + }, + { + "epoch": 0.87, + "learning_rate": 2.5296105005630847e-08, + "loss": 0.0005, + "step": 45038 + }, + { + "epoch": 0.87, + "learning_rate": 2.5292221661294706e-08, + "loss": 0.0003, + "step": 45039 + }, + { + "epoch": 0.87, + "learning_rate": 2.5288338316958564e-08, + "loss": 1.2183, + "step": 45040 + }, + { + "epoch": 0.87, + "learning_rate": 2.5284454972622422e-08, + "loss": 0.0007, + "step": 45041 + }, + { + "epoch": 0.87, + "learning_rate": 2.528057162828628e-08, + "loss": 0.0004, + "step": 45042 + }, + { + "epoch": 0.87, + "learning_rate": 2.527668828395014e-08, + "loss": 0.0003, + "step": 45043 + }, + { + "epoch": 0.87, + "learning_rate": 2.5272804939613997e-08, + "loss": 0.0006, + "step": 45044 + }, + { + "epoch": 0.87, + "learning_rate": 2.5268921595277852e-08, + "loss": 0.0004, + "step": 45045 + }, + { + "epoch": 0.87, + "learning_rate": 2.526503825094171e-08, + "loss": 0.0003, + "step": 45046 + }, + { + "epoch": 0.87, + "learning_rate": 2.5261154906605568e-08, + "loss": 1.1758, + "step": 45047 + }, + { + "epoch": 0.87, + "learning_rate": 2.5257271562269427e-08, + "loss": 0.0003, + "step": 45048 + }, + { + "epoch": 0.87, + "learning_rate": 2.5253388217933285e-08, + "loss": 0.0005, + "step": 45049 + }, + { + "epoch": 0.87, + "learning_rate": 2.524950487359714e-08, + "loss": 0.0003, + "step": 45050 + }, + { + "epoch": 0.87, + "learning_rate": 2.5245621529260998e-08, + "loss": 0.0267, + "step": 45051 + }, + { + "epoch": 0.87, + "learning_rate": 2.5241738184924853e-08, + "loss": 0.0003, + "step": 45052 + }, + { + "epoch": 0.87, + "learning_rate": 2.523785484058871e-08, + "loss": 0.0007, + "step": 45053 + }, + { + "epoch": 0.87, + "learning_rate": 2.523397149625257e-08, + "loss": 0.0005, + "step": 45054 + }, + { + "epoch": 0.87, + "learning_rate": 2.5230088151916428e-08, + "loss": 0.0004, + "step": 45055 + }, + { + "epoch": 0.87, + "learning_rate": 2.5226204807580286e-08, + "loss": 0.0004, + "step": 45056 + }, + { + "epoch": 0.87, + "learning_rate": 2.5222321463244144e-08, + "loss": 0.0003, + "step": 45057 + }, + { + "epoch": 0.87, + "learning_rate": 2.5218438118908002e-08, + "loss": 0.0004, + "step": 45058 + }, + { + "epoch": 0.87, + "learning_rate": 2.521455477457186e-08, + "loss": 0.0007, + "step": 45059 + }, + { + "epoch": 0.87, + "learning_rate": 2.521067143023572e-08, + "loss": 0.0002, + "step": 45060 + }, + { + "epoch": 0.87, + "learning_rate": 2.5206788085899577e-08, + "loss": 0.0466, + "step": 45061 + }, + { + "epoch": 0.87, + "learning_rate": 2.5202904741563435e-08, + "loss": 0.0004, + "step": 45062 + }, + { + "epoch": 0.87, + "learning_rate": 2.5199021397227294e-08, + "loss": 0.0003, + "step": 45063 + }, + { + "epoch": 0.87, + "learning_rate": 2.5195138052891145e-08, + "loss": 0.0005, + "step": 45064 + }, + { + "epoch": 0.87, + "learning_rate": 2.5191254708555003e-08, + "loss": 0.0002, + "step": 45065 + }, + { + "epoch": 0.87, + "learning_rate": 2.5187371364218862e-08, + "loss": 0.0003, + "step": 45066 + }, + { + "epoch": 0.87, + "learning_rate": 2.518348801988272e-08, + "loss": 0.0003, + "step": 45067 + }, + { + "epoch": 0.87, + "learning_rate": 2.5179604675546578e-08, + "loss": 0.0005, + "step": 45068 + }, + { + "epoch": 0.87, + "learning_rate": 2.5175721331210436e-08, + "loss": 0.0004, + "step": 45069 + }, + { + "epoch": 0.87, + "learning_rate": 2.5171837986874295e-08, + "loss": 0.0003, + "step": 45070 + }, + { + "epoch": 0.87, + "learning_rate": 2.5167954642538153e-08, + "loss": 0.0004, + "step": 45071 + }, + { + "epoch": 0.87, + "learning_rate": 2.516407129820201e-08, + "loss": 0.0004, + "step": 45072 + }, + { + "epoch": 0.87, + "learning_rate": 2.516018795386587e-08, + "loss": 0.1699, + "step": 45073 + }, + { + "epoch": 0.87, + "learning_rate": 2.5156304609529728e-08, + "loss": 0.0025, + "step": 45074 + }, + { + "epoch": 0.87, + "learning_rate": 2.5152421265193586e-08, + "loss": 0.0004, + "step": 45075 + }, + { + "epoch": 0.87, + "learning_rate": 2.5148537920857444e-08, + "loss": 0.0005, + "step": 45076 + }, + { + "epoch": 0.87, + "learning_rate": 2.5144654576521302e-08, + "loss": 0.0003, + "step": 45077 + }, + { + "epoch": 0.87, + "learning_rate": 2.514077123218516e-08, + "loss": 0.0004, + "step": 45078 + }, + { + "epoch": 0.87, + "learning_rate": 2.5136887887849012e-08, + "loss": 0.0003, + "step": 45079 + }, + { + "epoch": 0.87, + "learning_rate": 2.513300454351287e-08, + "loss": 0.0352, + "step": 45080 + }, + { + "epoch": 0.87, + "learning_rate": 2.512912119917673e-08, + "loss": 0.0003, + "step": 45081 + }, + { + "epoch": 0.87, + "learning_rate": 2.5125237854840587e-08, + "loss": 0.0215, + "step": 45082 + }, + { + "epoch": 0.87, + "learning_rate": 2.5121354510504445e-08, + "loss": 0.0005, + "step": 45083 + }, + { + "epoch": 0.87, + "learning_rate": 2.5117471166168304e-08, + "loss": 0.0004, + "step": 45084 + }, + { + "epoch": 0.87, + "learning_rate": 2.5113587821832162e-08, + "loss": 0.0003, + "step": 45085 + }, + { + "epoch": 0.87, + "learning_rate": 2.510970447749602e-08, + "loss": 0.0018, + "step": 45086 + }, + { + "epoch": 0.87, + "learning_rate": 2.5105821133159878e-08, + "loss": 0.0022, + "step": 45087 + }, + { + "epoch": 0.87, + "learning_rate": 2.5101937788823736e-08, + "loss": 0.0005, + "step": 45088 + }, + { + "epoch": 0.87, + "learning_rate": 2.509805444448759e-08, + "loss": 0.0004, + "step": 45089 + }, + { + "epoch": 0.87, + "learning_rate": 2.509417110015145e-08, + "loss": 0.0003, + "step": 45090 + }, + { + "epoch": 0.87, + "learning_rate": 2.5090287755815308e-08, + "loss": 0.0005, + "step": 45091 + }, + { + "epoch": 0.87, + "learning_rate": 2.5086404411479166e-08, + "loss": 0.7766, + "step": 45092 + }, + { + "epoch": 0.87, + "learning_rate": 2.508252106714302e-08, + "loss": 0.0003, + "step": 45093 + }, + { + "epoch": 0.87, + "learning_rate": 2.507863772280688e-08, + "loss": 0.0004, + "step": 45094 + }, + { + "epoch": 0.87, + "learning_rate": 2.5074754378470738e-08, + "loss": 0.0005, + "step": 45095 + }, + { + "epoch": 0.87, + "learning_rate": 2.5070871034134593e-08, + "loss": 0.0003, + "step": 45096 + }, + { + "epoch": 0.87, + "learning_rate": 2.506698768979845e-08, + "loss": 0.0003, + "step": 45097 + }, + { + "epoch": 0.87, + "learning_rate": 2.506310434546231e-08, + "loss": 0.0005, + "step": 45098 + }, + { + "epoch": 0.87, + "learning_rate": 2.5059221001126167e-08, + "loss": 0.0003, + "step": 45099 + }, + { + "epoch": 0.87, + "learning_rate": 2.5055337656790026e-08, + "loss": 0.0003, + "step": 45100 + }, + { + "epoch": 0.87, + "learning_rate": 2.5051454312453884e-08, + "loss": 0.0003, + "step": 45101 + }, + { + "epoch": 0.87, + "learning_rate": 2.5047570968117742e-08, + "loss": 0.001, + "step": 45102 + }, + { + "epoch": 0.87, + "learning_rate": 2.50436876237816e-08, + "loss": 0.0005, + "step": 45103 + }, + { + "epoch": 0.87, + "learning_rate": 2.503980427944546e-08, + "loss": 0.0002, + "step": 45104 + }, + { + "epoch": 0.87, + "learning_rate": 2.5035920935109317e-08, + "loss": 0.0004, + "step": 45105 + }, + { + "epoch": 0.87, + "learning_rate": 2.5032037590773175e-08, + "loss": 0.0003, + "step": 45106 + }, + { + "epoch": 0.87, + "learning_rate": 2.5028154246437033e-08, + "loss": 0.0005, + "step": 45107 + }, + { + "epoch": 0.88, + "learning_rate": 2.5024270902100885e-08, + "loss": 0.0002, + "step": 45108 + }, + { + "epoch": 0.88, + "learning_rate": 2.5020387557764743e-08, + "loss": 0.0003, + "step": 45109 + }, + { + "epoch": 0.88, + "learning_rate": 2.50165042134286e-08, + "loss": 0.0006, + "step": 45110 + }, + { + "epoch": 0.88, + "learning_rate": 2.501262086909246e-08, + "loss": 0.0004, + "step": 45111 + }, + { + "epoch": 0.88, + "learning_rate": 2.5008737524756318e-08, + "loss": 0.0004, + "step": 45112 + }, + { + "epoch": 0.88, + "learning_rate": 2.5004854180420176e-08, + "loss": 0.0004, + "step": 45113 + }, + { + "epoch": 0.88, + "learning_rate": 2.5000970836084034e-08, + "loss": 0.0005, + "step": 45114 + }, + { + "epoch": 0.88, + "learning_rate": 2.4997087491747893e-08, + "loss": 0.0003, + "step": 45115 + }, + { + "epoch": 0.88, + "learning_rate": 2.499320414741175e-08, + "loss": 0.0005, + "step": 45116 + }, + { + "epoch": 0.88, + "learning_rate": 2.498932080307561e-08, + "loss": 1.0526, + "step": 45117 + }, + { + "epoch": 0.88, + "learning_rate": 2.4985437458739464e-08, + "loss": 0.0004, + "step": 45118 + }, + { + "epoch": 0.88, + "learning_rate": 2.4981554114403322e-08, + "loss": 0.0072, + "step": 45119 + }, + { + "epoch": 0.88, + "learning_rate": 2.497767077006718e-08, + "loss": 0.0003, + "step": 45120 + }, + { + "epoch": 0.88, + "learning_rate": 2.497378742573104e-08, + "loss": 0.0004, + "step": 45121 + }, + { + "epoch": 0.88, + "learning_rate": 2.4969904081394897e-08, + "loss": 0.0003, + "step": 45122 + }, + { + "epoch": 0.88, + "learning_rate": 2.4966020737058755e-08, + "loss": 0.0005, + "step": 45123 + }, + { + "epoch": 0.88, + "learning_rate": 2.4962137392722613e-08, + "loss": 0.0003, + "step": 45124 + }, + { + "epoch": 0.88, + "learning_rate": 2.4958254048386472e-08, + "loss": 0.0004, + "step": 45125 + }, + { + "epoch": 0.88, + "learning_rate": 2.4954370704050327e-08, + "loss": 0.0003, + "step": 45126 + }, + { + "epoch": 0.88, + "learning_rate": 2.4950487359714185e-08, + "loss": 0.0004, + "step": 45127 + }, + { + "epoch": 0.88, + "learning_rate": 2.4946604015378043e-08, + "loss": 0.0005, + "step": 45128 + }, + { + "epoch": 0.88, + "learning_rate": 2.49427206710419e-08, + "loss": 0.0003, + "step": 45129 + }, + { + "epoch": 0.88, + "learning_rate": 2.493883732670576e-08, + "loss": 0.001, + "step": 45130 + }, + { + "epoch": 0.88, + "learning_rate": 2.4934953982369618e-08, + "loss": 0.0004, + "step": 45131 + }, + { + "epoch": 0.88, + "learning_rate": 2.4931070638033476e-08, + "loss": 0.0003, + "step": 45132 + }, + { + "epoch": 0.88, + "learning_rate": 2.492718729369733e-08, + "loss": 0.0004, + "step": 45133 + }, + { + "epoch": 0.88, + "learning_rate": 2.492330394936119e-08, + "loss": 0.0004, + "step": 45134 + }, + { + "epoch": 0.88, + "learning_rate": 2.4919420605025048e-08, + "loss": 0.004, + "step": 45135 + }, + { + "epoch": 0.88, + "learning_rate": 2.4915537260688906e-08, + "loss": 0.0005, + "step": 45136 + }, + { + "epoch": 0.88, + "learning_rate": 2.491165391635276e-08, + "loss": 0.0004, + "step": 45137 + }, + { + "epoch": 0.88, + "learning_rate": 2.490777057201662e-08, + "loss": 0.4523, + "step": 45138 + }, + { + "epoch": 0.88, + "learning_rate": 2.4903887227680477e-08, + "loss": 0.0006, + "step": 45139 + }, + { + "epoch": 0.88, + "learning_rate": 2.4900003883344335e-08, + "loss": 0.0005, + "step": 45140 + }, + { + "epoch": 0.88, + "learning_rate": 2.489612053900819e-08, + "loss": 0.0004, + "step": 45141 + }, + { + "epoch": 0.88, + "learning_rate": 2.489223719467205e-08, + "loss": 0.0004, + "step": 45142 + }, + { + "epoch": 0.88, + "learning_rate": 2.4888353850335907e-08, + "loss": 0.0003, + "step": 45143 + }, + { + "epoch": 0.88, + "learning_rate": 2.4884470505999765e-08, + "loss": 0.6037, + "step": 45144 + }, + { + "epoch": 0.88, + "learning_rate": 2.4880587161663623e-08, + "loss": 0.0004, + "step": 45145 + }, + { + "epoch": 0.88, + "learning_rate": 2.487670381732748e-08, + "loss": 0.0004, + "step": 45146 + }, + { + "epoch": 0.88, + "learning_rate": 2.4872820472991337e-08, + "loss": 0.0003, + "step": 45147 + }, + { + "epoch": 0.88, + "learning_rate": 2.4868937128655195e-08, + "loss": 0.7337, + "step": 45148 + }, + { + "epoch": 0.88, + "learning_rate": 2.4865053784319053e-08, + "loss": 0.0004, + "step": 45149 + }, + { + "epoch": 0.88, + "learning_rate": 2.486117043998291e-08, + "loss": 0.0068, + "step": 45150 + }, + { + "epoch": 0.88, + "learning_rate": 2.485728709564677e-08, + "loss": 0.0108, + "step": 45151 + }, + { + "epoch": 0.88, + "learning_rate": 2.4853403751310628e-08, + "loss": 0.0004, + "step": 45152 + }, + { + "epoch": 0.88, + "learning_rate": 2.4849520406974486e-08, + "loss": 0.0003, + "step": 45153 + }, + { + "epoch": 0.88, + "learning_rate": 2.4845637062638344e-08, + "loss": 0.0253, + "step": 45154 + }, + { + "epoch": 0.88, + "learning_rate": 2.48417537183022e-08, + "loss": 0.0003, + "step": 45155 + }, + { + "epoch": 0.88, + "learning_rate": 2.4837870373966057e-08, + "loss": 0.0005, + "step": 45156 + }, + { + "epoch": 0.88, + "learning_rate": 2.4833987029629916e-08, + "loss": 0.0003, + "step": 45157 + }, + { + "epoch": 0.88, + "learning_rate": 2.4830103685293774e-08, + "loss": 0.0004, + "step": 45158 + }, + { + "epoch": 0.88, + "learning_rate": 2.4826220340957632e-08, + "loss": 0.0121, + "step": 45159 + }, + { + "epoch": 0.88, + "learning_rate": 2.482233699662149e-08, + "loss": 0.0005, + "step": 45160 + }, + { + "epoch": 0.88, + "learning_rate": 2.481845365228535e-08, + "loss": 0.9037, + "step": 45161 + }, + { + "epoch": 0.88, + "learning_rate": 2.4814570307949204e-08, + "loss": 0.0003, + "step": 45162 + }, + { + "epoch": 0.88, + "learning_rate": 2.4810686963613062e-08, + "loss": 0.0012, + "step": 45163 + }, + { + "epoch": 0.88, + "learning_rate": 2.480680361927692e-08, + "loss": 0.0005, + "step": 45164 + }, + { + "epoch": 0.88, + "learning_rate": 2.4802920274940778e-08, + "loss": 0.0005, + "step": 45165 + }, + { + "epoch": 0.88, + "learning_rate": 2.4799036930604637e-08, + "loss": 0.0008, + "step": 45166 + }, + { + "epoch": 0.88, + "learning_rate": 2.4795153586268495e-08, + "loss": 0.0004, + "step": 45167 + }, + { + "epoch": 0.88, + "learning_rate": 2.4791270241932353e-08, + "loss": 0.0009, + "step": 45168 + }, + { + "epoch": 0.88, + "learning_rate": 2.4787386897596208e-08, + "loss": 0.0004, + "step": 45169 + }, + { + "epoch": 0.88, + "learning_rate": 2.4783503553260066e-08, + "loss": 0.0005, + "step": 45170 + }, + { + "epoch": 0.88, + "learning_rate": 2.4779620208923924e-08, + "loss": 0.0007, + "step": 45171 + }, + { + "epoch": 0.88, + "learning_rate": 2.4775736864587783e-08, + "loss": 0.0003, + "step": 45172 + }, + { + "epoch": 0.88, + "learning_rate": 2.477185352025164e-08, + "loss": 0.0004, + "step": 45173 + }, + { + "epoch": 0.88, + "learning_rate": 2.47679701759155e-08, + "loss": 0.0003, + "step": 45174 + }, + { + "epoch": 0.88, + "learning_rate": 2.4764086831579357e-08, + "loss": 0.0004, + "step": 45175 + }, + { + "epoch": 0.88, + "learning_rate": 2.4760203487243212e-08, + "loss": 0.0004, + "step": 45176 + }, + { + "epoch": 0.88, + "learning_rate": 2.475632014290707e-08, + "loss": 0.0006, + "step": 45177 + }, + { + "epoch": 0.88, + "learning_rate": 2.475243679857093e-08, + "loss": 0.0006, + "step": 45178 + }, + { + "epoch": 0.88, + "learning_rate": 2.4748553454234787e-08, + "loss": 0.0004, + "step": 45179 + }, + { + "epoch": 0.88, + "learning_rate": 2.4744670109898645e-08, + "loss": 0.0004, + "step": 45180 + }, + { + "epoch": 0.88, + "learning_rate": 2.47407867655625e-08, + "loss": 0.0003, + "step": 45181 + }, + { + "epoch": 0.88, + "learning_rate": 2.473690342122636e-08, + "loss": 0.0055, + "step": 45182 + }, + { + "epoch": 0.88, + "learning_rate": 2.4733020076890217e-08, + "loss": 0.0011, + "step": 45183 + }, + { + "epoch": 0.88, + "learning_rate": 2.4729136732554075e-08, + "loss": 0.0003, + "step": 45184 + }, + { + "epoch": 0.88, + "learning_rate": 2.472525338821793e-08, + "loss": 0.0004, + "step": 45185 + }, + { + "epoch": 0.88, + "learning_rate": 2.4721370043881788e-08, + "loss": 0.0003, + "step": 45186 + }, + { + "epoch": 0.88, + "learning_rate": 2.4717486699545646e-08, + "loss": 0.0004, + "step": 45187 + }, + { + "epoch": 0.88, + "learning_rate": 2.4713603355209505e-08, + "loss": 0.0004, + "step": 45188 + }, + { + "epoch": 0.88, + "learning_rate": 2.4709720010873363e-08, + "loss": 0.3276, + "step": 45189 + }, + { + "epoch": 0.88, + "learning_rate": 2.470583666653722e-08, + "loss": 0.0003, + "step": 45190 + }, + { + "epoch": 0.88, + "learning_rate": 2.4701953322201076e-08, + "loss": 0.0003, + "step": 45191 + }, + { + "epoch": 0.88, + "learning_rate": 2.4698069977864934e-08, + "loss": 0.0003, + "step": 45192 + }, + { + "epoch": 0.88, + "learning_rate": 2.4694186633528793e-08, + "loss": 1.0998, + "step": 45193 + }, + { + "epoch": 0.88, + "learning_rate": 2.469030328919265e-08, + "loss": 0.0004, + "step": 45194 + }, + { + "epoch": 0.88, + "learning_rate": 2.468641994485651e-08, + "loss": 0.0004, + "step": 45195 + }, + { + "epoch": 0.88, + "learning_rate": 2.4682536600520367e-08, + "loss": 0.0003, + "step": 45196 + }, + { + "epoch": 0.88, + "learning_rate": 2.4678653256184226e-08, + "loss": 0.0003, + "step": 45197 + }, + { + "epoch": 0.88, + "learning_rate": 2.467476991184808e-08, + "loss": 0.0208, + "step": 45198 + }, + { + "epoch": 0.88, + "learning_rate": 2.467088656751194e-08, + "loss": 0.0004, + "step": 45199 + }, + { + "epoch": 0.88, + "learning_rate": 2.4667003223175797e-08, + "loss": 0.0007, + "step": 45200 + }, + { + "epoch": 0.88, + "learning_rate": 2.4663119878839655e-08, + "loss": 0.0038, + "step": 45201 + }, + { + "epoch": 0.88, + "learning_rate": 2.4659236534503513e-08, + "loss": 0.3048, + "step": 45202 + }, + { + "epoch": 0.88, + "learning_rate": 2.4655353190167372e-08, + "loss": 0.0003, + "step": 45203 + }, + { + "epoch": 0.88, + "learning_rate": 2.465146984583123e-08, + "loss": 0.0005, + "step": 45204 + }, + { + "epoch": 0.88, + "learning_rate": 2.4647586501495085e-08, + "loss": 0.7707, + "step": 45205 + }, + { + "epoch": 0.88, + "learning_rate": 2.4643703157158943e-08, + "loss": 0.0095, + "step": 45206 + }, + { + "epoch": 0.88, + "learning_rate": 2.46398198128228e-08, + "loss": 0.0004, + "step": 45207 + }, + { + "epoch": 0.88, + "learning_rate": 2.463593646848666e-08, + "loss": 0.0013, + "step": 45208 + }, + { + "epoch": 0.88, + "learning_rate": 2.4632053124150518e-08, + "loss": 0.0004, + "step": 45209 + }, + { + "epoch": 0.88, + "learning_rate": 2.4628169779814376e-08, + "loss": 0.4947, + "step": 45210 + }, + { + "epoch": 0.88, + "learning_rate": 2.4624286435478234e-08, + "loss": 0.0003, + "step": 45211 + }, + { + "epoch": 0.88, + "learning_rate": 2.4620403091142093e-08, + "loss": 0.0006, + "step": 45212 + }, + { + "epoch": 0.88, + "learning_rate": 2.4616519746805948e-08, + "loss": 0.0003, + "step": 45213 + }, + { + "epoch": 0.88, + "learning_rate": 2.4612636402469806e-08, + "loss": 0.0041, + "step": 45214 + }, + { + "epoch": 0.88, + "learning_rate": 2.4608753058133664e-08, + "loss": 0.0068, + "step": 45215 + }, + { + "epoch": 0.88, + "learning_rate": 2.4604869713797522e-08, + "loss": 0.0004, + "step": 45216 + }, + { + "epoch": 0.88, + "learning_rate": 2.460098636946138e-08, + "loss": 0.0004, + "step": 45217 + }, + { + "epoch": 0.88, + "learning_rate": 2.459710302512524e-08, + "loss": 0.0005, + "step": 45218 + }, + { + "epoch": 0.88, + "learning_rate": 2.4593219680789097e-08, + "loss": 0.0004, + "step": 45219 + }, + { + "epoch": 0.88, + "learning_rate": 2.4589336336452952e-08, + "loss": 0.0003, + "step": 45220 + }, + { + "epoch": 0.88, + "learning_rate": 2.458545299211681e-08, + "loss": 0.0004, + "step": 45221 + }, + { + "epoch": 0.88, + "learning_rate": 2.458156964778067e-08, + "loss": 0.0002, + "step": 45222 + }, + { + "epoch": 0.88, + "learning_rate": 2.4577686303444527e-08, + "loss": 0.0003, + "step": 45223 + }, + { + "epoch": 0.88, + "learning_rate": 2.4573802959108385e-08, + "loss": 0.0004, + "step": 45224 + }, + { + "epoch": 0.88, + "learning_rate": 2.456991961477224e-08, + "loss": 0.0003, + "step": 45225 + }, + { + "epoch": 0.88, + "learning_rate": 2.4566036270436098e-08, + "loss": 0.0004, + "step": 45226 + }, + { + "epoch": 0.88, + "learning_rate": 2.4562152926099956e-08, + "loss": 0.0004, + "step": 45227 + }, + { + "epoch": 0.88, + "learning_rate": 2.4558269581763815e-08, + "loss": 0.0008, + "step": 45228 + }, + { + "epoch": 0.88, + "learning_rate": 2.455438623742767e-08, + "loss": 0.0005, + "step": 45229 + }, + { + "epoch": 0.88, + "learning_rate": 2.4550502893091528e-08, + "loss": 0.0003, + "step": 45230 + }, + { + "epoch": 0.88, + "learning_rate": 2.4546619548755386e-08, + "loss": 0.0003, + "step": 45231 + }, + { + "epoch": 0.88, + "learning_rate": 2.4542736204419244e-08, + "loss": 0.0004, + "step": 45232 + }, + { + "epoch": 0.88, + "learning_rate": 2.4538852860083103e-08, + "loss": 0.7551, + "step": 45233 + }, + { + "epoch": 0.88, + "learning_rate": 2.4534969515746957e-08, + "loss": 0.0003, + "step": 45234 + }, + { + "epoch": 0.88, + "learning_rate": 2.4531086171410816e-08, + "loss": 0.0004, + "step": 45235 + }, + { + "epoch": 0.88, + "learning_rate": 2.4527202827074674e-08, + "loss": 0.0003, + "step": 45236 + }, + { + "epoch": 0.88, + "learning_rate": 2.4523319482738532e-08, + "loss": 1.3842, + "step": 45237 + }, + { + "epoch": 0.88, + "learning_rate": 2.451943613840239e-08, + "loss": 0.0096, + "step": 45238 + }, + { + "epoch": 0.88, + "learning_rate": 2.451555279406625e-08, + "loss": 0.0003, + "step": 45239 + }, + { + "epoch": 0.88, + "learning_rate": 2.4511669449730107e-08, + "loss": 0.0003, + "step": 45240 + }, + { + "epoch": 0.88, + "learning_rate": 2.4507786105393965e-08, + "loss": 0.0004, + "step": 45241 + }, + { + "epoch": 0.88, + "learning_rate": 2.450390276105782e-08, + "loss": 0.0006, + "step": 45242 + }, + { + "epoch": 0.88, + "learning_rate": 2.4500019416721678e-08, + "loss": 0.0004, + "step": 45243 + }, + { + "epoch": 0.88, + "learning_rate": 2.4496136072385537e-08, + "loss": 0.0002, + "step": 45244 + }, + { + "epoch": 0.88, + "learning_rate": 2.4492252728049395e-08, + "loss": 0.0005, + "step": 45245 + }, + { + "epoch": 0.88, + "learning_rate": 2.4488369383713253e-08, + "loss": 0.0145, + "step": 45246 + }, + { + "epoch": 0.88, + "learning_rate": 2.448448603937711e-08, + "loss": 0.0004, + "step": 45247 + }, + { + "epoch": 0.88, + "learning_rate": 2.448060269504097e-08, + "loss": 0.0006, + "step": 45248 + }, + { + "epoch": 0.88, + "learning_rate": 2.4476719350704825e-08, + "loss": 0.0006, + "step": 45249 + }, + { + "epoch": 0.88, + "learning_rate": 2.4472836006368683e-08, + "loss": 0.0006, + "step": 45250 + }, + { + "epoch": 0.88, + "learning_rate": 2.446895266203254e-08, + "loss": 0.0012, + "step": 45251 + }, + { + "epoch": 0.88, + "learning_rate": 2.44650693176964e-08, + "loss": 0.0005, + "step": 45252 + }, + { + "epoch": 0.88, + "learning_rate": 2.4461185973360257e-08, + "loss": 0.0018, + "step": 45253 + }, + { + "epoch": 0.88, + "learning_rate": 2.4457302629024116e-08, + "loss": 0.0003, + "step": 45254 + }, + { + "epoch": 0.88, + "learning_rate": 2.4453419284687974e-08, + "loss": 0.0005, + "step": 45255 + }, + { + "epoch": 0.88, + "learning_rate": 2.444953594035183e-08, + "loss": 0.0004, + "step": 45256 + }, + { + "epoch": 0.88, + "learning_rate": 2.4445652596015687e-08, + "loss": 0.0004, + "step": 45257 + }, + { + "epoch": 0.88, + "learning_rate": 2.4441769251679545e-08, + "loss": 0.0026, + "step": 45258 + }, + { + "epoch": 0.88, + "learning_rate": 2.4437885907343404e-08, + "loss": 0.1716, + "step": 45259 + }, + { + "epoch": 0.88, + "learning_rate": 2.4434002563007262e-08, + "loss": 0.0004, + "step": 45260 + }, + { + "epoch": 0.88, + "learning_rate": 2.443011921867112e-08, + "loss": 0.0004, + "step": 45261 + }, + { + "epoch": 0.88, + "learning_rate": 2.442623587433498e-08, + "loss": 0.0003, + "step": 45262 + }, + { + "epoch": 0.88, + "learning_rate": 2.4422352529998833e-08, + "loss": 0.0003, + "step": 45263 + }, + { + "epoch": 0.88, + "learning_rate": 2.441846918566269e-08, + "loss": 0.0005, + "step": 45264 + }, + { + "epoch": 0.88, + "learning_rate": 2.441458584132655e-08, + "loss": 0.0004, + "step": 45265 + }, + { + "epoch": 0.88, + "learning_rate": 2.4410702496990408e-08, + "loss": 0.0003, + "step": 45266 + }, + { + "epoch": 0.88, + "learning_rate": 2.4406819152654266e-08, + "loss": 0.0005, + "step": 45267 + }, + { + "epoch": 0.88, + "learning_rate": 2.4402935808318125e-08, + "loss": 0.0003, + "step": 45268 + }, + { + "epoch": 0.88, + "learning_rate": 2.4399052463981983e-08, + "loss": 0.0004, + "step": 45269 + }, + { + "epoch": 0.88, + "learning_rate": 2.4395169119645838e-08, + "loss": 0.0005, + "step": 45270 + }, + { + "epoch": 0.88, + "learning_rate": 2.4391285775309696e-08, + "loss": 0.0005, + "step": 45271 + }, + { + "epoch": 0.88, + "learning_rate": 2.4387402430973554e-08, + "loss": 0.0008, + "step": 45272 + }, + { + "epoch": 0.88, + "learning_rate": 2.438351908663741e-08, + "loss": 0.0005, + "step": 45273 + }, + { + "epoch": 0.88, + "learning_rate": 2.4379635742301267e-08, + "loss": 0.0005, + "step": 45274 + }, + { + "epoch": 0.88, + "learning_rate": 2.4375752397965126e-08, + "loss": 0.0002, + "step": 45275 + }, + { + "epoch": 0.88, + "learning_rate": 2.4371869053628984e-08, + "loss": 0.0004, + "step": 45276 + }, + { + "epoch": 0.88, + "learning_rate": 2.4367985709292842e-08, + "loss": 0.0004, + "step": 45277 + }, + { + "epoch": 0.88, + "learning_rate": 2.4364102364956697e-08, + "loss": 0.0005, + "step": 45278 + }, + { + "epoch": 0.88, + "learning_rate": 2.4360219020620555e-08, + "loss": 0.0005, + "step": 45279 + }, + { + "epoch": 0.88, + "learning_rate": 2.4356335676284414e-08, + "loss": 0.0004, + "step": 45280 + }, + { + "epoch": 0.88, + "learning_rate": 2.4352452331948272e-08, + "loss": 0.0008, + "step": 45281 + }, + { + "epoch": 0.88, + "learning_rate": 2.434856898761213e-08, + "loss": 0.0003, + "step": 45282 + }, + { + "epoch": 0.88, + "learning_rate": 2.4344685643275988e-08, + "loss": 0.0004, + "step": 45283 + }, + { + "epoch": 0.88, + "learning_rate": 2.4340802298939847e-08, + "loss": 0.0005, + "step": 45284 + }, + { + "epoch": 0.88, + "learning_rate": 2.43369189546037e-08, + "loss": 0.0005, + "step": 45285 + }, + { + "epoch": 0.88, + "learning_rate": 2.433303561026756e-08, + "loss": 1.3621, + "step": 45286 + }, + { + "epoch": 0.88, + "learning_rate": 2.4329152265931418e-08, + "loss": 0.0003, + "step": 45287 + }, + { + "epoch": 0.88, + "learning_rate": 2.4325268921595276e-08, + "loss": 0.0005, + "step": 45288 + }, + { + "epoch": 0.88, + "learning_rate": 2.4321385577259134e-08, + "loss": 0.108, + "step": 45289 + }, + { + "epoch": 0.88, + "learning_rate": 2.4317502232922993e-08, + "loss": 0.0003, + "step": 45290 + }, + { + "epoch": 0.88, + "learning_rate": 2.431361888858685e-08, + "loss": 0.0003, + "step": 45291 + }, + { + "epoch": 0.88, + "learning_rate": 2.4309735544250706e-08, + "loss": 0.0008, + "step": 45292 + }, + { + "epoch": 0.88, + "learning_rate": 2.4305852199914564e-08, + "loss": 0.0005, + "step": 45293 + }, + { + "epoch": 0.88, + "learning_rate": 2.4301968855578422e-08, + "loss": 0.0003, + "step": 45294 + }, + { + "epoch": 0.88, + "learning_rate": 2.429808551124228e-08, + "loss": 0.0004, + "step": 45295 + }, + { + "epoch": 0.88, + "learning_rate": 2.429420216690614e-08, + "loss": 0.0003, + "step": 45296 + }, + { + "epoch": 0.88, + "learning_rate": 2.4290318822569997e-08, + "loss": 0.0004, + "step": 45297 + }, + { + "epoch": 0.88, + "learning_rate": 2.4286435478233855e-08, + "loss": 0.0004, + "step": 45298 + }, + { + "epoch": 0.88, + "learning_rate": 2.4282552133897714e-08, + "loss": 0.0003, + "step": 45299 + }, + { + "epoch": 0.88, + "learning_rate": 2.427866878956157e-08, + "loss": 0.0309, + "step": 45300 + }, + { + "epoch": 0.88, + "learning_rate": 2.4274785445225427e-08, + "loss": 0.0004, + "step": 45301 + }, + { + "epoch": 0.88, + "learning_rate": 2.4270902100889285e-08, + "loss": 0.0004, + "step": 45302 + }, + { + "epoch": 0.88, + "learning_rate": 2.4267018756553143e-08, + "loss": 0.0005, + "step": 45303 + }, + { + "epoch": 0.88, + "learning_rate": 2.4263135412217e-08, + "loss": 0.0005, + "step": 45304 + }, + { + "epoch": 0.88, + "learning_rate": 2.425925206788086e-08, + "loss": 0.0004, + "step": 45305 + }, + { + "epoch": 0.88, + "learning_rate": 2.4255368723544718e-08, + "loss": 0.9576, + "step": 45306 + }, + { + "epoch": 0.88, + "learning_rate": 2.4251485379208573e-08, + "loss": 0.0005, + "step": 45307 + }, + { + "epoch": 0.88, + "learning_rate": 2.424760203487243e-08, + "loss": 0.0007, + "step": 45308 + }, + { + "epoch": 0.88, + "learning_rate": 2.424371869053629e-08, + "loss": 0.0004, + "step": 45309 + }, + { + "epoch": 0.88, + "learning_rate": 2.4239835346200148e-08, + "loss": 0.0003, + "step": 45310 + }, + { + "epoch": 0.88, + "learning_rate": 2.4235952001864006e-08, + "loss": 0.0003, + "step": 45311 + }, + { + "epoch": 0.88, + "learning_rate": 2.4232068657527864e-08, + "loss": 0.0007, + "step": 45312 + }, + { + "epoch": 0.88, + "learning_rate": 2.4228185313191722e-08, + "loss": 0.0004, + "step": 45313 + }, + { + "epoch": 0.88, + "learning_rate": 2.4224301968855577e-08, + "loss": 0.046, + "step": 45314 + }, + { + "epoch": 0.88, + "learning_rate": 2.4220418624519436e-08, + "loss": 0.0008, + "step": 45315 + }, + { + "epoch": 0.88, + "learning_rate": 2.4216535280183294e-08, + "loss": 0.0003, + "step": 45316 + }, + { + "epoch": 0.88, + "learning_rate": 2.4212651935847152e-08, + "loss": 0.0004, + "step": 45317 + }, + { + "epoch": 0.88, + "learning_rate": 2.4208768591511007e-08, + "loss": 0.0005, + "step": 45318 + }, + { + "epoch": 0.88, + "learning_rate": 2.4204885247174865e-08, + "loss": 0.0004, + "step": 45319 + }, + { + "epoch": 0.88, + "learning_rate": 2.4201001902838723e-08, + "loss": 0.0004, + "step": 45320 + }, + { + "epoch": 0.88, + "learning_rate": 2.419711855850258e-08, + "loss": 0.0014, + "step": 45321 + }, + { + "epoch": 0.88, + "learning_rate": 2.4193235214166437e-08, + "loss": 1.0777, + "step": 45322 + }, + { + "epoch": 0.88, + "learning_rate": 2.4189351869830295e-08, + "loss": 0.0185, + "step": 45323 + }, + { + "epoch": 0.88, + "learning_rate": 2.4185468525494153e-08, + "loss": 0.0004, + "step": 45324 + }, + { + "epoch": 0.88, + "learning_rate": 2.418158518115801e-08, + "loss": 0.0004, + "step": 45325 + }, + { + "epoch": 0.88, + "learning_rate": 2.417770183682187e-08, + "loss": 0.0006, + "step": 45326 + }, + { + "epoch": 0.88, + "learning_rate": 2.4173818492485728e-08, + "loss": 0.6991, + "step": 45327 + }, + { + "epoch": 0.88, + "learning_rate": 2.4169935148149586e-08, + "loss": 0.0005, + "step": 45328 + }, + { + "epoch": 0.88, + "learning_rate": 2.416605180381344e-08, + "loss": 0.0006, + "step": 45329 + }, + { + "epoch": 0.88, + "learning_rate": 2.41621684594773e-08, + "loss": 0.0006, + "step": 45330 + }, + { + "epoch": 0.88, + "learning_rate": 2.4158285115141158e-08, + "loss": 0.0003, + "step": 45331 + }, + { + "epoch": 0.88, + "learning_rate": 2.4154401770805016e-08, + "loss": 0.0003, + "step": 45332 + }, + { + "epoch": 0.88, + "learning_rate": 2.4150518426468874e-08, + "loss": 0.0006, + "step": 45333 + }, + { + "epoch": 0.88, + "learning_rate": 2.4146635082132732e-08, + "loss": 0.0004, + "step": 45334 + }, + { + "epoch": 0.88, + "learning_rate": 2.414275173779659e-08, + "loss": 0.0004, + "step": 45335 + }, + { + "epoch": 0.88, + "learning_rate": 2.4138868393460445e-08, + "loss": 0.0003, + "step": 45336 + }, + { + "epoch": 0.88, + "learning_rate": 2.4134985049124304e-08, + "loss": 0.0003, + "step": 45337 + }, + { + "epoch": 0.88, + "learning_rate": 2.4131101704788162e-08, + "loss": 0.1256, + "step": 45338 + }, + { + "epoch": 0.88, + "learning_rate": 2.412721836045202e-08, + "loss": 0.389, + "step": 45339 + }, + { + "epoch": 0.88, + "learning_rate": 2.412333501611588e-08, + "loss": 0.0004, + "step": 45340 + }, + { + "epoch": 0.88, + "learning_rate": 2.4119451671779737e-08, + "loss": 0.0018, + "step": 45341 + }, + { + "epoch": 0.88, + "learning_rate": 2.4115568327443595e-08, + "loss": 0.0004, + "step": 45342 + }, + { + "epoch": 0.88, + "learning_rate": 2.411168498310745e-08, + "loss": 0.0003, + "step": 45343 + }, + { + "epoch": 0.88, + "learning_rate": 2.4107801638771308e-08, + "loss": 0.0078, + "step": 45344 + }, + { + "epoch": 0.88, + "learning_rate": 2.4103918294435166e-08, + "loss": 0.0006, + "step": 45345 + }, + { + "epoch": 0.88, + "learning_rate": 2.4100034950099025e-08, + "loss": 0.0005, + "step": 45346 + }, + { + "epoch": 0.88, + "learning_rate": 2.4096151605762883e-08, + "loss": 0.0002, + "step": 45347 + }, + { + "epoch": 0.88, + "learning_rate": 2.409226826142674e-08, + "loss": 0.0004, + "step": 45348 + }, + { + "epoch": 0.88, + "learning_rate": 2.40883849170906e-08, + "loss": 0.0003, + "step": 45349 + }, + { + "epoch": 0.88, + "learning_rate": 2.4084501572754454e-08, + "loss": 0.0007, + "step": 45350 + }, + { + "epoch": 0.88, + "learning_rate": 2.4080618228418312e-08, + "loss": 0.0003, + "step": 45351 + }, + { + "epoch": 0.88, + "learning_rate": 2.407673488408217e-08, + "loss": 0.1882, + "step": 45352 + }, + { + "epoch": 0.88, + "learning_rate": 2.407285153974603e-08, + "loss": 0.0054, + "step": 45353 + }, + { + "epoch": 0.88, + "learning_rate": 2.4068968195409887e-08, + "loss": 0.0004, + "step": 45354 + }, + { + "epoch": 0.88, + "learning_rate": 2.4065084851073745e-08, + "loss": 0.0004, + "step": 45355 + }, + { + "epoch": 0.88, + "learning_rate": 2.4061201506737604e-08, + "loss": 0.0005, + "step": 45356 + }, + { + "epoch": 0.88, + "learning_rate": 2.4057318162401462e-08, + "loss": 0.0003, + "step": 45357 + }, + { + "epoch": 0.88, + "learning_rate": 2.4053434818065317e-08, + "loss": 0.0003, + "step": 45358 + }, + { + "epoch": 0.88, + "learning_rate": 2.4049551473729175e-08, + "loss": 0.0638, + "step": 45359 + }, + { + "epoch": 0.88, + "learning_rate": 2.4045668129393033e-08, + "loss": 0.0004, + "step": 45360 + }, + { + "epoch": 0.88, + "learning_rate": 2.404178478505689e-08, + "loss": 0.0096, + "step": 45361 + }, + { + "epoch": 0.88, + "learning_rate": 2.4037901440720747e-08, + "loss": 0.0002, + "step": 45362 + }, + { + "epoch": 0.88, + "learning_rate": 2.4034018096384605e-08, + "loss": 0.0004, + "step": 45363 + }, + { + "epoch": 0.88, + "learning_rate": 2.4030134752048463e-08, + "loss": 0.0003, + "step": 45364 + }, + { + "epoch": 0.88, + "learning_rate": 2.4026251407712318e-08, + "loss": 0.0189, + "step": 45365 + }, + { + "epoch": 0.88, + "learning_rate": 2.4022368063376176e-08, + "loss": 0.0004, + "step": 45366 + }, + { + "epoch": 0.88, + "learning_rate": 2.4018484719040034e-08, + "loss": 0.0006, + "step": 45367 + }, + { + "epoch": 0.88, + "learning_rate": 2.4014601374703893e-08, + "loss": 0.0004, + "step": 45368 + }, + { + "epoch": 0.88, + "learning_rate": 2.401071803036775e-08, + "loss": 1.1339, + "step": 45369 + }, + { + "epoch": 0.88, + "learning_rate": 2.400683468603161e-08, + "loss": 0.0005, + "step": 45370 + }, + { + "epoch": 0.88, + "learning_rate": 2.4002951341695467e-08, + "loss": 0.0003, + "step": 45371 + }, + { + "epoch": 0.88, + "learning_rate": 2.3999067997359322e-08, + "loss": 0.0009, + "step": 45372 + }, + { + "epoch": 0.88, + "learning_rate": 2.399518465302318e-08, + "loss": 0.0004, + "step": 45373 + }, + { + "epoch": 0.88, + "learning_rate": 2.399130130868704e-08, + "loss": 0.0004, + "step": 45374 + }, + { + "epoch": 0.88, + "learning_rate": 2.3987417964350897e-08, + "loss": 0.0003, + "step": 45375 + }, + { + "epoch": 0.88, + "learning_rate": 2.3983534620014755e-08, + "loss": 0.0003, + "step": 45376 + }, + { + "epoch": 0.88, + "learning_rate": 2.3979651275678614e-08, + "loss": 0.0004, + "step": 45377 + }, + { + "epoch": 0.88, + "learning_rate": 2.3975767931342472e-08, + "loss": 0.0004, + "step": 45378 + }, + { + "epoch": 0.88, + "learning_rate": 2.3971884587006327e-08, + "loss": 0.2675, + "step": 45379 + }, + { + "epoch": 0.88, + "learning_rate": 2.3968001242670185e-08, + "loss": 0.3313, + "step": 45380 + }, + { + "epoch": 0.88, + "learning_rate": 2.3964117898334043e-08, + "loss": 0.4464, + "step": 45381 + }, + { + "epoch": 0.88, + "learning_rate": 2.39602345539979e-08, + "loss": 0.0003, + "step": 45382 + }, + { + "epoch": 0.88, + "learning_rate": 2.395635120966176e-08, + "loss": 0.0006, + "step": 45383 + }, + { + "epoch": 0.88, + "learning_rate": 2.3952467865325618e-08, + "loss": 0.0006, + "step": 45384 + }, + { + "epoch": 0.88, + "learning_rate": 2.3948584520989476e-08, + "loss": 0.0002, + "step": 45385 + }, + { + "epoch": 0.88, + "learning_rate": 2.3944701176653334e-08, + "loss": 0.0003, + "step": 45386 + }, + { + "epoch": 0.88, + "learning_rate": 2.394081783231719e-08, + "loss": 0.0005, + "step": 45387 + }, + { + "epoch": 0.88, + "learning_rate": 2.3936934487981048e-08, + "loss": 0.0006, + "step": 45388 + }, + { + "epoch": 0.88, + "learning_rate": 2.3933051143644906e-08, + "loss": 0.0004, + "step": 45389 + }, + { + "epoch": 0.88, + "learning_rate": 2.3929167799308764e-08, + "loss": 0.0004, + "step": 45390 + }, + { + "epoch": 0.88, + "learning_rate": 2.3925284454972622e-08, + "loss": 0.0004, + "step": 45391 + }, + { + "epoch": 0.88, + "learning_rate": 2.392140111063648e-08, + "loss": 0.0004, + "step": 45392 + }, + { + "epoch": 0.88, + "learning_rate": 2.391751776630034e-08, + "loss": 0.1435, + "step": 45393 + }, + { + "epoch": 0.88, + "learning_rate": 2.3913634421964194e-08, + "loss": 0.0004, + "step": 45394 + }, + { + "epoch": 0.88, + "learning_rate": 2.3909751077628052e-08, + "loss": 0.0003, + "step": 45395 + }, + { + "epoch": 0.88, + "learning_rate": 2.390586773329191e-08, + "loss": 0.0007, + "step": 45396 + }, + { + "epoch": 0.88, + "learning_rate": 2.390198438895577e-08, + "loss": 0.0005, + "step": 45397 + }, + { + "epoch": 0.88, + "learning_rate": 2.3898101044619627e-08, + "loss": 0.0005, + "step": 45398 + }, + { + "epoch": 0.88, + "learning_rate": 2.3894217700283485e-08, + "loss": 0.001, + "step": 45399 + }, + { + "epoch": 0.88, + "learning_rate": 2.3890334355947343e-08, + "loss": 0.0005, + "step": 45400 + }, + { + "epoch": 0.88, + "learning_rate": 2.3886451011611198e-08, + "loss": 0.0005, + "step": 45401 + }, + { + "epoch": 0.88, + "learning_rate": 2.3882567667275056e-08, + "loss": 0.0005, + "step": 45402 + }, + { + "epoch": 0.88, + "learning_rate": 2.3878684322938915e-08, + "loss": 0.0005, + "step": 45403 + }, + { + "epoch": 0.88, + "learning_rate": 2.3874800978602773e-08, + "loss": 0.0004, + "step": 45404 + }, + { + "epoch": 0.88, + "learning_rate": 2.387091763426663e-08, + "loss": 0.4269, + "step": 45405 + }, + { + "epoch": 0.88, + "learning_rate": 2.3867034289930486e-08, + "loss": 0.0005, + "step": 45406 + }, + { + "epoch": 0.88, + "learning_rate": 2.3863150945594344e-08, + "loss": 0.0006, + "step": 45407 + }, + { + "epoch": 0.88, + "learning_rate": 2.3859267601258203e-08, + "loss": 0.0003, + "step": 45408 + }, + { + "epoch": 0.88, + "learning_rate": 2.385538425692206e-08, + "loss": 0.0004, + "step": 45409 + }, + { + "epoch": 0.88, + "learning_rate": 2.3851500912585916e-08, + "loss": 0.8115, + "step": 45410 + }, + { + "epoch": 0.88, + "learning_rate": 2.3847617568249774e-08, + "loss": 0.0028, + "step": 45411 + }, + { + "epoch": 0.88, + "learning_rate": 2.3843734223913632e-08, + "loss": 0.0043, + "step": 45412 + }, + { + "epoch": 0.88, + "learning_rate": 2.383985087957749e-08, + "loss": 0.0003, + "step": 45413 + }, + { + "epoch": 0.88, + "learning_rate": 2.383596753524135e-08, + "loss": 0.0135, + "step": 45414 + }, + { + "epoch": 0.88, + "learning_rate": 2.3832084190905207e-08, + "loss": 0.0008, + "step": 45415 + }, + { + "epoch": 0.88, + "learning_rate": 2.3828200846569062e-08, + "loss": 1.0746, + "step": 45416 + }, + { + "epoch": 0.88, + "learning_rate": 2.382431750223292e-08, + "loss": 0.0004, + "step": 45417 + }, + { + "epoch": 0.88, + "learning_rate": 2.382043415789678e-08, + "loss": 0.0004, + "step": 45418 + }, + { + "epoch": 0.88, + "learning_rate": 2.3816550813560637e-08, + "loss": 0.0004, + "step": 45419 + }, + { + "epoch": 0.88, + "learning_rate": 2.3812667469224495e-08, + "loss": 0.0004, + "step": 45420 + }, + { + "epoch": 0.88, + "learning_rate": 2.3808784124888353e-08, + "loss": 0.0007, + "step": 45421 + }, + { + "epoch": 0.88, + "learning_rate": 2.380490078055221e-08, + "loss": 0.0004, + "step": 45422 + }, + { + "epoch": 0.88, + "learning_rate": 2.3801017436216066e-08, + "loss": 0.0004, + "step": 45423 + }, + { + "epoch": 0.88, + "learning_rate": 2.3797134091879925e-08, + "loss": 0.0004, + "step": 45424 + }, + { + "epoch": 0.88, + "learning_rate": 2.3793250747543783e-08, + "loss": 0.0006, + "step": 45425 + }, + { + "epoch": 0.88, + "learning_rate": 2.378936740320764e-08, + "loss": 0.0003, + "step": 45426 + }, + { + "epoch": 0.88, + "learning_rate": 2.37854840588715e-08, + "loss": 0.272, + "step": 45427 + }, + { + "epoch": 0.88, + "learning_rate": 2.3781600714535358e-08, + "loss": 0.0004, + "step": 45428 + }, + { + "epoch": 0.88, + "learning_rate": 2.3777717370199216e-08, + "loss": 0.0003, + "step": 45429 + }, + { + "epoch": 0.88, + "learning_rate": 2.377383402586307e-08, + "loss": 0.0004, + "step": 45430 + }, + { + "epoch": 0.88, + "learning_rate": 2.376995068152693e-08, + "loss": 0.0005, + "step": 45431 + }, + { + "epoch": 0.88, + "learning_rate": 2.3766067337190787e-08, + "loss": 0.0005, + "step": 45432 + }, + { + "epoch": 0.88, + "learning_rate": 2.3762183992854646e-08, + "loss": 0.0013, + "step": 45433 + }, + { + "epoch": 0.88, + "learning_rate": 2.3758300648518504e-08, + "loss": 0.0006, + "step": 45434 + }, + { + "epoch": 0.88, + "learning_rate": 2.3754417304182362e-08, + "loss": 0.0007, + "step": 45435 + }, + { + "epoch": 0.88, + "learning_rate": 2.375053395984622e-08, + "loss": 0.0015, + "step": 45436 + }, + { + "epoch": 0.88, + "learning_rate": 2.3746650615510075e-08, + "loss": 0.0005, + "step": 45437 + }, + { + "epoch": 0.88, + "learning_rate": 2.3742767271173933e-08, + "loss": 0.9496, + "step": 45438 + }, + { + "epoch": 0.88, + "learning_rate": 2.3738883926837792e-08, + "loss": 0.0005, + "step": 45439 + }, + { + "epoch": 0.88, + "learning_rate": 2.373500058250165e-08, + "loss": 0.0004, + "step": 45440 + }, + { + "epoch": 0.88, + "learning_rate": 2.3731117238165508e-08, + "loss": 0.0007, + "step": 45441 + }, + { + "epoch": 0.88, + "learning_rate": 2.3727233893829366e-08, + "loss": 0.0003, + "step": 45442 + }, + { + "epoch": 0.88, + "learning_rate": 2.3723350549493225e-08, + "loss": 0.0003, + "step": 45443 + }, + { + "epoch": 0.88, + "learning_rate": 2.3719467205157083e-08, + "loss": 0.0004, + "step": 45444 + }, + { + "epoch": 0.88, + "learning_rate": 2.3715583860820938e-08, + "loss": 0.0004, + "step": 45445 + }, + { + "epoch": 0.88, + "learning_rate": 2.3711700516484796e-08, + "loss": 0.0003, + "step": 45446 + }, + { + "epoch": 0.88, + "learning_rate": 2.3707817172148654e-08, + "loss": 0.0005, + "step": 45447 + }, + { + "epoch": 0.88, + "learning_rate": 2.3703933827812513e-08, + "loss": 0.0004, + "step": 45448 + }, + { + "epoch": 0.88, + "learning_rate": 2.370005048347637e-08, + "loss": 0.0003, + "step": 45449 + }, + { + "epoch": 0.88, + "learning_rate": 2.3696167139140226e-08, + "loss": 0.8812, + "step": 45450 + }, + { + "epoch": 0.88, + "learning_rate": 2.3692283794804084e-08, + "loss": 0.0004, + "step": 45451 + }, + { + "epoch": 0.88, + "learning_rate": 2.3688400450467942e-08, + "loss": 0.0004, + "step": 45452 + }, + { + "epoch": 0.88, + "learning_rate": 2.36845171061318e-08, + "loss": 0.0007, + "step": 45453 + }, + { + "epoch": 0.88, + "learning_rate": 2.3680633761795655e-08, + "loss": 0.0003, + "step": 45454 + }, + { + "epoch": 0.88, + "learning_rate": 2.3676750417459514e-08, + "loss": 0.0006, + "step": 45455 + }, + { + "epoch": 0.88, + "learning_rate": 2.3672867073123372e-08, + "loss": 0.0003, + "step": 45456 + }, + { + "epoch": 0.88, + "learning_rate": 2.366898372878723e-08, + "loss": 0.0028, + "step": 45457 + }, + { + "epoch": 0.88, + "learning_rate": 2.366510038445109e-08, + "loss": 0.0006, + "step": 45458 + }, + { + "epoch": 0.88, + "learning_rate": 2.3661217040114943e-08, + "loss": 0.0003, + "step": 45459 + }, + { + "epoch": 0.88, + "learning_rate": 2.36573336957788e-08, + "loss": 0.0004, + "step": 45460 + }, + { + "epoch": 0.88, + "learning_rate": 2.365345035144266e-08, + "loss": 0.0006, + "step": 45461 + }, + { + "epoch": 0.88, + "learning_rate": 2.3649567007106518e-08, + "loss": 0.0004, + "step": 45462 + }, + { + "epoch": 0.88, + "learning_rate": 2.3645683662770376e-08, + "loss": 0.0005, + "step": 45463 + }, + { + "epoch": 0.88, + "learning_rate": 2.3641800318434235e-08, + "loss": 0.0006, + "step": 45464 + }, + { + "epoch": 0.88, + "learning_rate": 2.3637916974098093e-08, + "loss": 0.2042, + "step": 45465 + }, + { + "epoch": 0.88, + "learning_rate": 2.3634033629761948e-08, + "loss": 0.0005, + "step": 45466 + }, + { + "epoch": 0.88, + "learning_rate": 2.3630150285425806e-08, + "loss": 0.0004, + "step": 45467 + }, + { + "epoch": 0.88, + "learning_rate": 2.3626266941089664e-08, + "loss": 0.0004, + "step": 45468 + }, + { + "epoch": 0.88, + "learning_rate": 2.3622383596753522e-08, + "loss": 0.366, + "step": 45469 + }, + { + "epoch": 0.88, + "learning_rate": 2.361850025241738e-08, + "loss": 0.0339, + "step": 45470 + }, + { + "epoch": 0.88, + "learning_rate": 2.361461690808124e-08, + "loss": 0.0004, + "step": 45471 + }, + { + "epoch": 0.88, + "learning_rate": 2.3610733563745097e-08, + "loss": 0.0004, + "step": 45472 + }, + { + "epoch": 0.88, + "learning_rate": 2.3606850219408955e-08, + "loss": 0.0004, + "step": 45473 + }, + { + "epoch": 0.88, + "learning_rate": 2.360296687507281e-08, + "loss": 0.0003, + "step": 45474 + }, + { + "epoch": 0.88, + "learning_rate": 2.359908353073667e-08, + "loss": 0.0002, + "step": 45475 + }, + { + "epoch": 0.88, + "learning_rate": 2.3595200186400527e-08, + "loss": 0.1408, + "step": 45476 + }, + { + "epoch": 0.88, + "learning_rate": 2.3591316842064385e-08, + "loss": 0.0004, + "step": 45477 + }, + { + "epoch": 0.88, + "learning_rate": 2.3587433497728243e-08, + "loss": 0.0036, + "step": 45478 + }, + { + "epoch": 0.88, + "learning_rate": 2.35835501533921e-08, + "loss": 0.0033, + "step": 45479 + }, + { + "epoch": 0.88, + "learning_rate": 2.357966680905596e-08, + "loss": 0.0023, + "step": 45480 + }, + { + "epoch": 0.88, + "learning_rate": 2.3575783464719815e-08, + "loss": 0.6536, + "step": 45481 + }, + { + "epoch": 0.88, + "learning_rate": 2.3571900120383673e-08, + "loss": 0.0004, + "step": 45482 + }, + { + "epoch": 0.88, + "learning_rate": 2.356801677604753e-08, + "loss": 0.0005, + "step": 45483 + }, + { + "epoch": 0.88, + "learning_rate": 2.356413343171139e-08, + "loss": 0.0003, + "step": 45484 + }, + { + "epoch": 0.88, + "learning_rate": 2.3560250087375248e-08, + "loss": 0.0004, + "step": 45485 + }, + { + "epoch": 0.88, + "learning_rate": 2.3556366743039106e-08, + "loss": 0.0005, + "step": 45486 + }, + { + "epoch": 0.88, + "learning_rate": 2.3552483398702964e-08, + "loss": 0.0005, + "step": 45487 + }, + { + "epoch": 0.88, + "learning_rate": 2.354860005436682e-08, + "loss": 0.0004, + "step": 45488 + }, + { + "epoch": 0.88, + "learning_rate": 2.3544716710030677e-08, + "loss": 0.002, + "step": 45489 + }, + { + "epoch": 0.88, + "learning_rate": 2.3540833365694536e-08, + "loss": 1.2765, + "step": 45490 + }, + { + "epoch": 0.88, + "learning_rate": 2.3536950021358394e-08, + "loss": 0.0005, + "step": 45491 + }, + { + "epoch": 0.88, + "learning_rate": 2.3533066677022252e-08, + "loss": 0.0003, + "step": 45492 + }, + { + "epoch": 0.88, + "learning_rate": 2.352918333268611e-08, + "loss": 0.0003, + "step": 45493 + }, + { + "epoch": 0.88, + "learning_rate": 2.352529998834997e-08, + "loss": 0.1617, + "step": 45494 + }, + { + "epoch": 0.88, + "learning_rate": 2.3521416644013824e-08, + "loss": 0.4954, + "step": 45495 + }, + { + "epoch": 0.88, + "learning_rate": 2.3517533299677682e-08, + "loss": 0.5357, + "step": 45496 + }, + { + "epoch": 0.88, + "learning_rate": 2.351364995534154e-08, + "loss": 0.0005, + "step": 45497 + }, + { + "epoch": 0.88, + "learning_rate": 2.3509766611005395e-08, + "loss": 0.0004, + "step": 45498 + }, + { + "epoch": 0.88, + "learning_rate": 2.3505883266669253e-08, + "loss": 0.0002, + "step": 45499 + }, + { + "epoch": 0.88, + "learning_rate": 2.350199992233311e-08, + "loss": 0.0003, + "step": 45500 + }, + { + "epoch": 0.88, + "learning_rate": 2.349811657799697e-08, + "loss": 0.0007, + "step": 45501 + }, + { + "epoch": 0.88, + "learning_rate": 2.3494233233660828e-08, + "loss": 0.0003, + "step": 45502 + }, + { + "epoch": 0.88, + "learning_rate": 2.3490349889324683e-08, + "loss": 0.0005, + "step": 45503 + }, + { + "epoch": 0.88, + "learning_rate": 2.348646654498854e-08, + "loss": 0.0003, + "step": 45504 + }, + { + "epoch": 0.88, + "learning_rate": 2.34825832006524e-08, + "loss": 0.0003, + "step": 45505 + }, + { + "epoch": 0.88, + "learning_rate": 2.3478699856316258e-08, + "loss": 0.0004, + "step": 45506 + }, + { + "epoch": 0.88, + "learning_rate": 2.3474816511980116e-08, + "loss": 0.0006, + "step": 45507 + }, + { + "epoch": 0.88, + "learning_rate": 2.3470933167643974e-08, + "loss": 0.0003, + "step": 45508 + }, + { + "epoch": 0.88, + "learning_rate": 2.3467049823307832e-08, + "loss": 0.0004, + "step": 45509 + }, + { + "epoch": 0.88, + "learning_rate": 2.3463166478971687e-08, + "loss": 0.0003, + "step": 45510 + }, + { + "epoch": 0.88, + "learning_rate": 2.3459283134635546e-08, + "loss": 0.0003, + "step": 45511 + }, + { + "epoch": 0.88, + "learning_rate": 2.3455399790299404e-08, + "loss": 0.0004, + "step": 45512 + }, + { + "epoch": 0.88, + "learning_rate": 2.3451516445963262e-08, + "loss": 0.0004, + "step": 45513 + }, + { + "epoch": 0.88, + "learning_rate": 2.344763310162712e-08, + "loss": 0.0003, + "step": 45514 + }, + { + "epoch": 0.88, + "learning_rate": 2.344374975729098e-08, + "loss": 0.0004, + "step": 45515 + }, + { + "epoch": 0.88, + "learning_rate": 2.3439866412954837e-08, + "loss": 0.0004, + "step": 45516 + }, + { + "epoch": 0.88, + "learning_rate": 2.3435983068618692e-08, + "loss": 0.0002, + "step": 45517 + }, + { + "epoch": 0.88, + "learning_rate": 2.343209972428255e-08, + "loss": 1.3266, + "step": 45518 + }, + { + "epoch": 0.88, + "learning_rate": 2.3428216379946408e-08, + "loss": 0.0004, + "step": 45519 + }, + { + "epoch": 0.88, + "learning_rate": 2.3424333035610266e-08, + "loss": 0.0004, + "step": 45520 + }, + { + "epoch": 0.88, + "learning_rate": 2.3420449691274125e-08, + "loss": 0.0003, + "step": 45521 + }, + { + "epoch": 0.88, + "learning_rate": 2.3416566346937983e-08, + "loss": 0.0009, + "step": 45522 + }, + { + "epoch": 0.88, + "learning_rate": 2.341268300260184e-08, + "loss": 0.0005, + "step": 45523 + }, + { + "epoch": 0.88, + "learning_rate": 2.3408799658265696e-08, + "loss": 0.041, + "step": 45524 + }, + { + "epoch": 0.88, + "learning_rate": 2.3404916313929554e-08, + "loss": 0.0003, + "step": 45525 + }, + { + "epoch": 0.88, + "learning_rate": 2.3401032969593413e-08, + "loss": 0.0004, + "step": 45526 + }, + { + "epoch": 0.88, + "learning_rate": 2.339714962525727e-08, + "loss": 0.0003, + "step": 45527 + }, + { + "epoch": 0.88, + "learning_rate": 2.339326628092113e-08, + "loss": 0.7172, + "step": 45528 + }, + { + "epoch": 0.88, + "learning_rate": 2.3389382936584987e-08, + "loss": 0.0003, + "step": 45529 + }, + { + "epoch": 0.88, + "learning_rate": 2.3385499592248846e-08, + "loss": 0.0012, + "step": 45530 + }, + { + "epoch": 0.88, + "learning_rate": 2.3381616247912704e-08, + "loss": 0.0004, + "step": 45531 + }, + { + "epoch": 0.88, + "learning_rate": 2.337773290357656e-08, + "loss": 0.0003, + "step": 45532 + }, + { + "epoch": 0.88, + "learning_rate": 2.3373849559240417e-08, + "loss": 0.0003, + "step": 45533 + }, + { + "epoch": 0.88, + "learning_rate": 2.3369966214904275e-08, + "loss": 0.0005, + "step": 45534 + }, + { + "epoch": 0.88, + "learning_rate": 2.3366082870568133e-08, + "loss": 0.0087, + "step": 45535 + }, + { + "epoch": 0.88, + "learning_rate": 2.3362199526231992e-08, + "loss": 0.0003, + "step": 45536 + }, + { + "epoch": 0.88, + "learning_rate": 2.335831618189585e-08, + "loss": 0.0003, + "step": 45537 + }, + { + "epoch": 0.88, + "learning_rate": 2.3354432837559708e-08, + "loss": 0.0008, + "step": 45538 + }, + { + "epoch": 0.88, + "learning_rate": 2.3350549493223563e-08, + "loss": 0.0005, + "step": 45539 + }, + { + "epoch": 0.88, + "learning_rate": 2.334666614888742e-08, + "loss": 0.0002, + "step": 45540 + }, + { + "epoch": 0.88, + "learning_rate": 2.334278280455128e-08, + "loss": 0.0003, + "step": 45541 + }, + { + "epoch": 0.88, + "learning_rate": 2.3338899460215135e-08, + "loss": 0.3572, + "step": 45542 + }, + { + "epoch": 0.88, + "learning_rate": 2.3335016115878993e-08, + "loss": 0.0003, + "step": 45543 + }, + { + "epoch": 0.88, + "learning_rate": 2.333113277154285e-08, + "loss": 0.0004, + "step": 45544 + }, + { + "epoch": 0.88, + "learning_rate": 2.332724942720671e-08, + "loss": 0.0007, + "step": 45545 + }, + { + "epoch": 0.88, + "learning_rate": 2.3323366082870564e-08, + "loss": 0.0003, + "step": 45546 + }, + { + "epoch": 0.88, + "learning_rate": 2.3319482738534422e-08, + "loss": 0.0004, + "step": 45547 + }, + { + "epoch": 0.88, + "learning_rate": 2.331559939419828e-08, + "loss": 0.1781, + "step": 45548 + }, + { + "epoch": 0.88, + "learning_rate": 2.331171604986214e-08, + "loss": 0.0004, + "step": 45549 + }, + { + "epoch": 0.88, + "learning_rate": 2.3307832705525997e-08, + "loss": 0.0005, + "step": 45550 + }, + { + "epoch": 0.88, + "learning_rate": 2.3303949361189855e-08, + "loss": 1.0632, + "step": 45551 + }, + { + "epoch": 0.88, + "learning_rate": 2.3300066016853714e-08, + "loss": 0.0003, + "step": 45552 + }, + { + "epoch": 0.88, + "learning_rate": 2.329618267251757e-08, + "loss": 0.0003, + "step": 45553 + }, + { + "epoch": 0.88, + "learning_rate": 2.3292299328181427e-08, + "loss": 0.0003, + "step": 45554 + }, + { + "epoch": 0.88, + "learning_rate": 2.3288415983845285e-08, + "loss": 0.0005, + "step": 45555 + }, + { + "epoch": 0.88, + "learning_rate": 2.3284532639509143e-08, + "loss": 1.2664, + "step": 45556 + }, + { + "epoch": 0.88, + "learning_rate": 2.3280649295173e-08, + "loss": 0.0004, + "step": 45557 + }, + { + "epoch": 0.88, + "learning_rate": 2.327676595083686e-08, + "loss": 1.4567, + "step": 45558 + }, + { + "epoch": 0.88, + "learning_rate": 2.3272882606500718e-08, + "loss": 0.0005, + "step": 45559 + }, + { + "epoch": 0.88, + "learning_rate": 2.3268999262164576e-08, + "loss": 0.0004, + "step": 45560 + }, + { + "epoch": 0.88, + "learning_rate": 2.326511591782843e-08, + "loss": 0.0003, + "step": 45561 + }, + { + "epoch": 0.88, + "learning_rate": 2.326123257349229e-08, + "loss": 0.0006, + "step": 45562 + }, + { + "epoch": 0.88, + "learning_rate": 2.3257349229156148e-08, + "loss": 0.0004, + "step": 45563 + }, + { + "epoch": 0.88, + "learning_rate": 2.3253465884820006e-08, + "loss": 0.0073, + "step": 45564 + }, + { + "epoch": 0.88, + "learning_rate": 2.3249582540483864e-08, + "loss": 0.0004, + "step": 45565 + }, + { + "epoch": 0.88, + "learning_rate": 2.3245699196147723e-08, + "loss": 0.0006, + "step": 45566 + }, + { + "epoch": 0.88, + "learning_rate": 2.324181585181158e-08, + "loss": 0.8092, + "step": 45567 + }, + { + "epoch": 0.88, + "learning_rate": 2.3237932507475436e-08, + "loss": 0.0004, + "step": 45568 + }, + { + "epoch": 0.88, + "learning_rate": 2.3234049163139294e-08, + "loss": 0.0004, + "step": 45569 + }, + { + "epoch": 0.88, + "learning_rate": 2.3230165818803152e-08, + "loss": 0.0004, + "step": 45570 + }, + { + "epoch": 0.88, + "learning_rate": 2.322628247446701e-08, + "loss": 0.0015, + "step": 45571 + }, + { + "epoch": 0.88, + "learning_rate": 2.322239913013087e-08, + "loss": 0.0004, + "step": 45572 + }, + { + "epoch": 0.88, + "learning_rate": 2.3218515785794727e-08, + "loss": 0.0003, + "step": 45573 + }, + { + "epoch": 0.88, + "learning_rate": 2.3214632441458585e-08, + "loss": 0.0002, + "step": 45574 + }, + { + "epoch": 0.88, + "learning_rate": 2.321074909712244e-08, + "loss": 0.0305, + "step": 45575 + }, + { + "epoch": 0.88, + "learning_rate": 2.3206865752786298e-08, + "loss": 0.0009, + "step": 45576 + }, + { + "epoch": 0.88, + "learning_rate": 2.3202982408450157e-08, + "loss": 0.0105, + "step": 45577 + }, + { + "epoch": 0.88, + "learning_rate": 2.3199099064114015e-08, + "loss": 0.0003, + "step": 45578 + }, + { + "epoch": 0.88, + "learning_rate": 2.3195215719777873e-08, + "loss": 0.0004, + "step": 45579 + }, + { + "epoch": 0.88, + "learning_rate": 2.319133237544173e-08, + "loss": 0.0003, + "step": 45580 + }, + { + "epoch": 0.88, + "learning_rate": 2.318744903110559e-08, + "loss": 0.0003, + "step": 45581 + }, + { + "epoch": 0.88, + "learning_rate": 2.3183565686769444e-08, + "loss": 0.1893, + "step": 45582 + }, + { + "epoch": 0.88, + "learning_rate": 2.3179682342433303e-08, + "loss": 0.0003, + "step": 45583 + }, + { + "epoch": 0.88, + "learning_rate": 2.317579899809716e-08, + "loss": 0.0122, + "step": 45584 + }, + { + "epoch": 0.88, + "learning_rate": 2.317191565376102e-08, + "loss": 0.0004, + "step": 45585 + }, + { + "epoch": 0.88, + "learning_rate": 2.3168032309424877e-08, + "loss": 0.0004, + "step": 45586 + }, + { + "epoch": 0.88, + "learning_rate": 2.3164148965088732e-08, + "loss": 0.0004, + "step": 45587 + }, + { + "epoch": 0.88, + "learning_rate": 2.316026562075259e-08, + "loss": 0.0013, + "step": 45588 + }, + { + "epoch": 0.88, + "learning_rate": 2.315638227641645e-08, + "loss": 0.0005, + "step": 45589 + }, + { + "epoch": 0.88, + "learning_rate": 2.3152498932080304e-08, + "loss": 0.0004, + "step": 45590 + }, + { + "epoch": 0.88, + "learning_rate": 2.3148615587744162e-08, + "loss": 0.0006, + "step": 45591 + }, + { + "epoch": 0.88, + "learning_rate": 2.314473224340802e-08, + "loss": 0.0006, + "step": 45592 + }, + { + "epoch": 0.88, + "learning_rate": 2.314084889907188e-08, + "loss": 0.0005, + "step": 45593 + }, + { + "epoch": 0.88, + "learning_rate": 2.3136965554735737e-08, + "loss": 0.001, + "step": 45594 + }, + { + "epoch": 0.88, + "learning_rate": 2.3133082210399595e-08, + "loss": 0.0003, + "step": 45595 + }, + { + "epoch": 0.88, + "learning_rate": 2.3129198866063453e-08, + "loss": 0.1358, + "step": 45596 + }, + { + "epoch": 0.88, + "learning_rate": 2.3125315521727308e-08, + "loss": 0.63, + "step": 45597 + }, + { + "epoch": 0.88, + "learning_rate": 2.3121432177391166e-08, + "loss": 0.0004, + "step": 45598 + }, + { + "epoch": 0.88, + "learning_rate": 2.3117548833055025e-08, + "loss": 0.0003, + "step": 45599 + }, + { + "epoch": 0.88, + "learning_rate": 2.3113665488718883e-08, + "loss": 0.0005, + "step": 45600 + }, + { + "epoch": 0.88, + "learning_rate": 2.310978214438274e-08, + "loss": 0.0003, + "step": 45601 + }, + { + "epoch": 0.88, + "learning_rate": 2.31058988000466e-08, + "loss": 0.0004, + "step": 45602 + }, + { + "epoch": 0.88, + "learning_rate": 2.3102015455710458e-08, + "loss": 0.0004, + "step": 45603 + }, + { + "epoch": 0.88, + "learning_rate": 2.3098132111374313e-08, + "loss": 0.0003, + "step": 45604 + }, + { + "epoch": 0.88, + "learning_rate": 2.309424876703817e-08, + "loss": 0.0004, + "step": 45605 + }, + { + "epoch": 0.88, + "learning_rate": 2.309036542270203e-08, + "loss": 0.0005, + "step": 45606 + }, + { + "epoch": 0.88, + "learning_rate": 2.3086482078365887e-08, + "loss": 0.5609, + "step": 45607 + }, + { + "epoch": 0.88, + "learning_rate": 2.3082598734029746e-08, + "loss": 0.8348, + "step": 45608 + }, + { + "epoch": 0.88, + "learning_rate": 2.3078715389693604e-08, + "loss": 0.0007, + "step": 45609 + }, + { + "epoch": 0.88, + "learning_rate": 2.3074832045357462e-08, + "loss": 0.0532, + "step": 45610 + }, + { + "epoch": 0.88, + "learning_rate": 2.3070948701021317e-08, + "loss": 0.0005, + "step": 45611 + }, + { + "epoch": 0.88, + "learning_rate": 2.3067065356685175e-08, + "loss": 0.0004, + "step": 45612 + }, + { + "epoch": 0.88, + "learning_rate": 2.3063182012349034e-08, + "loss": 0.0003, + "step": 45613 + }, + { + "epoch": 0.88, + "learning_rate": 2.3059298668012892e-08, + "loss": 0.0004, + "step": 45614 + }, + { + "epoch": 0.88, + "learning_rate": 2.305541532367675e-08, + "loss": 0.0004, + "step": 45615 + }, + { + "epoch": 0.88, + "learning_rate": 2.3051531979340608e-08, + "loss": 0.0004, + "step": 45616 + }, + { + "epoch": 0.88, + "learning_rate": 2.3047648635004467e-08, + "loss": 0.0003, + "step": 45617 + }, + { + "epoch": 0.88, + "learning_rate": 2.3043765290668325e-08, + "loss": 0.0004, + "step": 45618 + }, + { + "epoch": 0.88, + "learning_rate": 2.303988194633218e-08, + "loss": 0.0005, + "step": 45619 + }, + { + "epoch": 0.88, + "learning_rate": 2.3035998601996038e-08, + "loss": 0.0004, + "step": 45620 + }, + { + "epoch": 0.88, + "learning_rate": 2.3032115257659896e-08, + "loss": 0.001, + "step": 45621 + }, + { + "epoch": 0.88, + "learning_rate": 2.3028231913323754e-08, + "loss": 0.004, + "step": 45622 + }, + { + "epoch": 0.88, + "learning_rate": 2.3024348568987613e-08, + "loss": 0.0006, + "step": 45623 + }, + { + "epoch": 0.89, + "learning_rate": 2.302046522465147e-08, + "loss": 0.0005, + "step": 45624 + }, + { + "epoch": 0.89, + "learning_rate": 2.301658188031533e-08, + "loss": 0.0004, + "step": 45625 + }, + { + "epoch": 0.89, + "learning_rate": 2.3012698535979184e-08, + "loss": 0.0003, + "step": 45626 + }, + { + "epoch": 0.89, + "learning_rate": 2.3008815191643042e-08, + "loss": 0.0003, + "step": 45627 + }, + { + "epoch": 0.89, + "learning_rate": 2.30049318473069e-08, + "loss": 0.0004, + "step": 45628 + }, + { + "epoch": 0.89, + "learning_rate": 2.300104850297076e-08, + "loss": 0.0003, + "step": 45629 + }, + { + "epoch": 0.89, + "learning_rate": 2.2997165158634617e-08, + "loss": 0.0003, + "step": 45630 + }, + { + "epoch": 0.89, + "learning_rate": 2.2993281814298472e-08, + "loss": 0.0006, + "step": 45631 + }, + { + "epoch": 0.89, + "learning_rate": 2.298939846996233e-08, + "loss": 0.0005, + "step": 45632 + }, + { + "epoch": 0.89, + "learning_rate": 2.298551512562619e-08, + "loss": 1.2749, + "step": 45633 + }, + { + "epoch": 0.89, + "learning_rate": 2.2981631781290047e-08, + "loss": 0.0005, + "step": 45634 + }, + { + "epoch": 0.89, + "learning_rate": 2.2977748436953902e-08, + "loss": 0.0286, + "step": 45635 + }, + { + "epoch": 0.89, + "learning_rate": 2.297386509261776e-08, + "loss": 0.0139, + "step": 45636 + }, + { + "epoch": 0.89, + "learning_rate": 2.2969981748281618e-08, + "loss": 0.0003, + "step": 45637 + }, + { + "epoch": 0.89, + "learning_rate": 2.2966098403945476e-08, + "loss": 0.0003, + "step": 45638 + }, + { + "epoch": 0.89, + "learning_rate": 2.2962215059609335e-08, + "loss": 0.0004, + "step": 45639 + }, + { + "epoch": 0.89, + "learning_rate": 2.295833171527319e-08, + "loss": 0.0004, + "step": 45640 + }, + { + "epoch": 0.89, + "learning_rate": 2.2954448370937048e-08, + "loss": 0.0004, + "step": 45641 + }, + { + "epoch": 0.89, + "learning_rate": 2.2950565026600906e-08, + "loss": 0.0003, + "step": 45642 + }, + { + "epoch": 0.89, + "learning_rate": 2.2946681682264764e-08, + "loss": 0.0004, + "step": 45643 + }, + { + "epoch": 0.89, + "learning_rate": 2.2942798337928623e-08, + "loss": 0.0004, + "step": 45644 + }, + { + "epoch": 0.89, + "learning_rate": 2.293891499359248e-08, + "loss": 0.0018, + "step": 45645 + }, + { + "epoch": 0.89, + "learning_rate": 2.293503164925634e-08, + "loss": 0.0004, + "step": 45646 + }, + { + "epoch": 0.89, + "learning_rate": 2.2931148304920197e-08, + "loss": 0.0003, + "step": 45647 + }, + { + "epoch": 0.89, + "learning_rate": 2.2927264960584052e-08, + "loss": 0.0007, + "step": 45648 + }, + { + "epoch": 0.89, + "learning_rate": 2.292338161624791e-08, + "loss": 0.0003, + "step": 45649 + }, + { + "epoch": 0.89, + "learning_rate": 2.291949827191177e-08, + "loss": 0.0003, + "step": 45650 + }, + { + "epoch": 0.89, + "learning_rate": 2.2915614927575627e-08, + "loss": 0.0006, + "step": 45651 + }, + { + "epoch": 0.89, + "learning_rate": 2.2911731583239485e-08, + "loss": 0.0004, + "step": 45652 + }, + { + "epoch": 0.89, + "learning_rate": 2.2907848238903343e-08, + "loss": 0.0003, + "step": 45653 + }, + { + "epoch": 0.89, + "learning_rate": 2.2903964894567202e-08, + "loss": 0.0005, + "step": 45654 + }, + { + "epoch": 0.89, + "learning_rate": 2.2900081550231057e-08, + "loss": 0.0004, + "step": 45655 + }, + { + "epoch": 0.89, + "learning_rate": 2.2896198205894915e-08, + "loss": 0.0004, + "step": 45656 + }, + { + "epoch": 0.89, + "learning_rate": 2.2892314861558773e-08, + "loss": 0.0004, + "step": 45657 + }, + { + "epoch": 0.89, + "learning_rate": 2.288843151722263e-08, + "loss": 0.0003, + "step": 45658 + }, + { + "epoch": 0.89, + "learning_rate": 2.288454817288649e-08, + "loss": 0.0003, + "step": 45659 + }, + { + "epoch": 0.89, + "learning_rate": 2.2880664828550348e-08, + "loss": 0.9923, + "step": 45660 + }, + { + "epoch": 0.89, + "learning_rate": 2.2876781484214206e-08, + "loss": 0.0014, + "step": 45661 + }, + { + "epoch": 0.89, + "learning_rate": 2.287289813987806e-08, + "loss": 1.2073, + "step": 45662 + }, + { + "epoch": 0.89, + "learning_rate": 2.286901479554192e-08, + "loss": 0.0003, + "step": 45663 + }, + { + "epoch": 0.89, + "learning_rate": 2.2865131451205778e-08, + "loss": 0.0353, + "step": 45664 + }, + { + "epoch": 0.89, + "learning_rate": 2.2861248106869636e-08, + "loss": 0.0003, + "step": 45665 + }, + { + "epoch": 0.89, + "learning_rate": 2.2857364762533494e-08, + "loss": 0.0005, + "step": 45666 + }, + { + "epoch": 0.89, + "learning_rate": 2.2853481418197352e-08, + "loss": 0.0011, + "step": 45667 + }, + { + "epoch": 0.89, + "learning_rate": 2.284959807386121e-08, + "loss": 0.0003, + "step": 45668 + }, + { + "epoch": 0.89, + "learning_rate": 2.2845714729525065e-08, + "loss": 0.0004, + "step": 45669 + }, + { + "epoch": 0.89, + "learning_rate": 2.2841831385188924e-08, + "loss": 0.0103, + "step": 45670 + }, + { + "epoch": 0.89, + "learning_rate": 2.2837948040852782e-08, + "loss": 0.0003, + "step": 45671 + }, + { + "epoch": 0.89, + "learning_rate": 2.283406469651664e-08, + "loss": 0.0004, + "step": 45672 + }, + { + "epoch": 0.89, + "learning_rate": 2.28301813521805e-08, + "loss": 0.0003, + "step": 45673 + }, + { + "epoch": 0.89, + "learning_rate": 2.2826298007844357e-08, + "loss": 0.0004, + "step": 45674 + }, + { + "epoch": 0.89, + "learning_rate": 2.282241466350821e-08, + "loss": 0.0006, + "step": 45675 + }, + { + "epoch": 0.89, + "learning_rate": 2.281853131917207e-08, + "loss": 0.0006, + "step": 45676 + }, + { + "epoch": 0.89, + "learning_rate": 2.2814647974835928e-08, + "loss": 0.0002, + "step": 45677 + }, + { + "epoch": 0.89, + "learning_rate": 2.2810764630499786e-08, + "loss": 1.1797, + "step": 45678 + }, + { + "epoch": 0.89, + "learning_rate": 2.280688128616364e-08, + "loss": 0.1421, + "step": 45679 + }, + { + "epoch": 0.89, + "learning_rate": 2.28029979418275e-08, + "loss": 0.0008, + "step": 45680 + }, + { + "epoch": 0.89, + "learning_rate": 2.2799114597491358e-08, + "loss": 0.0003, + "step": 45681 + }, + { + "epoch": 0.89, + "learning_rate": 2.2795231253155216e-08, + "loss": 0.0004, + "step": 45682 + }, + { + "epoch": 0.89, + "learning_rate": 2.2791347908819074e-08, + "loss": 0.0003, + "step": 45683 + }, + { + "epoch": 0.89, + "learning_rate": 2.278746456448293e-08, + "loss": 0.0004, + "step": 45684 + }, + { + "epoch": 0.89, + "learning_rate": 2.2783581220146787e-08, + "loss": 0.0003, + "step": 45685 + }, + { + "epoch": 0.89, + "learning_rate": 2.2779697875810646e-08, + "loss": 0.0589, + "step": 45686 + }, + { + "epoch": 0.89, + "learning_rate": 2.2775814531474504e-08, + "loss": 0.0005, + "step": 45687 + }, + { + "epoch": 0.89, + "learning_rate": 2.2771931187138362e-08, + "loss": 0.0003, + "step": 45688 + }, + { + "epoch": 0.89, + "learning_rate": 2.276804784280222e-08, + "loss": 0.0003, + "step": 45689 + }, + { + "epoch": 0.89, + "learning_rate": 2.276416449846608e-08, + "loss": 0.0078, + "step": 45690 + }, + { + "epoch": 0.89, + "learning_rate": 2.2760281154129934e-08, + "loss": 0.0005, + "step": 45691 + }, + { + "epoch": 0.89, + "learning_rate": 2.2756397809793792e-08, + "loss": 0.0003, + "step": 45692 + }, + { + "epoch": 0.89, + "learning_rate": 2.275251446545765e-08, + "loss": 0.0653, + "step": 45693 + }, + { + "epoch": 0.89, + "learning_rate": 2.2748631121121508e-08, + "loss": 0.0003, + "step": 45694 + }, + { + "epoch": 0.89, + "learning_rate": 2.2744747776785367e-08, + "loss": 0.0004, + "step": 45695 + }, + { + "epoch": 0.89, + "learning_rate": 2.2740864432449225e-08, + "loss": 0.1811, + "step": 45696 + }, + { + "epoch": 0.89, + "learning_rate": 2.2736981088113083e-08, + "loss": 1.0248, + "step": 45697 + }, + { + "epoch": 0.89, + "learning_rate": 2.2733097743776938e-08, + "loss": 0.0007, + "step": 45698 + }, + { + "epoch": 0.89, + "learning_rate": 2.2729214399440796e-08, + "loss": 0.0012, + "step": 45699 + }, + { + "epoch": 0.89, + "learning_rate": 2.2725331055104654e-08, + "loss": 0.0004, + "step": 45700 + }, + { + "epoch": 0.89, + "learning_rate": 2.2721447710768513e-08, + "loss": 0.0004, + "step": 45701 + }, + { + "epoch": 0.89, + "learning_rate": 2.271756436643237e-08, + "loss": 0.0005, + "step": 45702 + }, + { + "epoch": 0.89, + "learning_rate": 2.271368102209623e-08, + "loss": 0.0003, + "step": 45703 + }, + { + "epoch": 0.89, + "learning_rate": 2.2709797677760087e-08, + "loss": 0.0004, + "step": 45704 + }, + { + "epoch": 0.89, + "learning_rate": 2.2705914333423946e-08, + "loss": 0.0005, + "step": 45705 + }, + { + "epoch": 0.89, + "learning_rate": 2.27020309890878e-08, + "loss": 0.0004, + "step": 45706 + }, + { + "epoch": 0.89, + "learning_rate": 2.269814764475166e-08, + "loss": 0.0005, + "step": 45707 + }, + { + "epoch": 0.89, + "learning_rate": 2.2694264300415517e-08, + "loss": 0.3774, + "step": 45708 + }, + { + "epoch": 0.89, + "learning_rate": 2.2690380956079375e-08, + "loss": 0.0005, + "step": 45709 + }, + { + "epoch": 0.89, + "learning_rate": 2.2686497611743234e-08, + "loss": 0.0003, + "step": 45710 + }, + { + "epoch": 0.89, + "learning_rate": 2.2682614267407092e-08, + "loss": 0.0003, + "step": 45711 + }, + { + "epoch": 0.89, + "learning_rate": 2.267873092307095e-08, + "loss": 0.0003, + "step": 45712 + }, + { + "epoch": 0.89, + "learning_rate": 2.2674847578734805e-08, + "loss": 0.0003, + "step": 45713 + }, + { + "epoch": 0.89, + "learning_rate": 2.2670964234398663e-08, + "loss": 0.0004, + "step": 45714 + }, + { + "epoch": 0.89, + "learning_rate": 2.266708089006252e-08, + "loss": 0.0005, + "step": 45715 + }, + { + "epoch": 0.89, + "learning_rate": 2.266319754572638e-08, + "loss": 0.0004, + "step": 45716 + }, + { + "epoch": 0.89, + "learning_rate": 2.2659314201390238e-08, + "loss": 0.0017, + "step": 45717 + }, + { + "epoch": 0.89, + "learning_rate": 2.2655430857054096e-08, + "loss": 0.0042, + "step": 45718 + }, + { + "epoch": 0.89, + "learning_rate": 2.265154751271795e-08, + "loss": 0.0011, + "step": 45719 + }, + { + "epoch": 0.89, + "learning_rate": 2.264766416838181e-08, + "loss": 0.0006, + "step": 45720 + }, + { + "epoch": 0.89, + "learning_rate": 2.2643780824045668e-08, + "loss": 0.0177, + "step": 45721 + }, + { + "epoch": 0.89, + "learning_rate": 2.2639897479709526e-08, + "loss": 0.0003, + "step": 45722 + }, + { + "epoch": 0.89, + "learning_rate": 2.263601413537338e-08, + "loss": 0.3272, + "step": 45723 + }, + { + "epoch": 0.89, + "learning_rate": 2.263213079103724e-08, + "loss": 0.0011, + "step": 45724 + }, + { + "epoch": 0.89, + "learning_rate": 2.2628247446701097e-08, + "loss": 0.0005, + "step": 45725 + }, + { + "epoch": 0.89, + "learning_rate": 2.2624364102364956e-08, + "loss": 0.0231, + "step": 45726 + }, + { + "epoch": 0.89, + "learning_rate": 2.262048075802881e-08, + "loss": 0.0005, + "step": 45727 + }, + { + "epoch": 0.89, + "learning_rate": 2.261659741369267e-08, + "loss": 0.0004, + "step": 45728 + }, + { + "epoch": 0.89, + "learning_rate": 2.2612714069356527e-08, + "loss": 0.0005, + "step": 45729 + }, + { + "epoch": 0.89, + "learning_rate": 2.2608830725020385e-08, + "loss": 0.0003, + "step": 45730 + }, + { + "epoch": 0.89, + "learning_rate": 2.2604947380684243e-08, + "loss": 0.0005, + "step": 45731 + }, + { + "epoch": 0.89, + "learning_rate": 2.2601064036348102e-08, + "loss": 0.0005, + "step": 45732 + }, + { + "epoch": 0.89, + "learning_rate": 2.259718069201196e-08, + "loss": 0.0144, + "step": 45733 + }, + { + "epoch": 0.89, + "learning_rate": 2.2593297347675818e-08, + "loss": 0.0005, + "step": 45734 + }, + { + "epoch": 0.89, + "learning_rate": 2.2589414003339673e-08, + "loss": 0.0005, + "step": 45735 + }, + { + "epoch": 0.89, + "learning_rate": 2.258553065900353e-08, + "loss": 0.0004, + "step": 45736 + }, + { + "epoch": 0.89, + "learning_rate": 2.258164731466739e-08, + "loss": 0.0005, + "step": 45737 + }, + { + "epoch": 0.89, + "learning_rate": 2.2577763970331248e-08, + "loss": 0.0068, + "step": 45738 + }, + { + "epoch": 0.89, + "learning_rate": 2.2573880625995106e-08, + "loss": 0.0039, + "step": 45739 + }, + { + "epoch": 0.89, + "learning_rate": 2.2569997281658964e-08, + "loss": 0.0003, + "step": 45740 + }, + { + "epoch": 0.89, + "learning_rate": 2.2566113937322823e-08, + "loss": 0.0006, + "step": 45741 + }, + { + "epoch": 0.89, + "learning_rate": 2.2562230592986678e-08, + "loss": 0.0003, + "step": 45742 + }, + { + "epoch": 0.89, + "learning_rate": 2.2558347248650536e-08, + "loss": 0.0004, + "step": 45743 + }, + { + "epoch": 0.89, + "learning_rate": 2.2554463904314394e-08, + "loss": 0.0004, + "step": 45744 + }, + { + "epoch": 0.89, + "learning_rate": 2.2550580559978252e-08, + "loss": 0.0006, + "step": 45745 + }, + { + "epoch": 0.89, + "learning_rate": 2.254669721564211e-08, + "loss": 0.0004, + "step": 45746 + }, + { + "epoch": 0.89, + "learning_rate": 2.254281387130597e-08, + "loss": 0.558, + "step": 45747 + }, + { + "epoch": 0.89, + "learning_rate": 2.2538930526969827e-08, + "loss": 0.0004, + "step": 45748 + }, + { + "epoch": 0.89, + "learning_rate": 2.2535047182633682e-08, + "loss": 0.0008, + "step": 45749 + }, + { + "epoch": 0.89, + "learning_rate": 2.253116383829754e-08, + "loss": 0.0006, + "step": 45750 + }, + { + "epoch": 0.89, + "learning_rate": 2.25272804939614e-08, + "loss": 0.0003, + "step": 45751 + }, + { + "epoch": 0.89, + "learning_rate": 2.2523397149625257e-08, + "loss": 0.0004, + "step": 45752 + }, + { + "epoch": 0.89, + "learning_rate": 2.2519513805289115e-08, + "loss": 0.0004, + "step": 45753 + }, + { + "epoch": 0.89, + "learning_rate": 2.2515630460952973e-08, + "loss": 0.0006, + "step": 45754 + }, + { + "epoch": 0.89, + "learning_rate": 2.251174711661683e-08, + "loss": 0.0003, + "step": 45755 + }, + { + "epoch": 0.89, + "learning_rate": 2.2507863772280686e-08, + "loss": 0.0004, + "step": 45756 + }, + { + "epoch": 0.89, + "learning_rate": 2.2503980427944545e-08, + "loss": 0.0003, + "step": 45757 + }, + { + "epoch": 0.89, + "learning_rate": 2.2500097083608403e-08, + "loss": 0.0005, + "step": 45758 + }, + { + "epoch": 0.89, + "learning_rate": 2.249621373927226e-08, + "loss": 0.0013, + "step": 45759 + }, + { + "epoch": 0.89, + "learning_rate": 2.249233039493612e-08, + "loss": 0.0003, + "step": 45760 + }, + { + "epoch": 0.89, + "learning_rate": 2.2488447050599978e-08, + "loss": 0.0005, + "step": 45761 + }, + { + "epoch": 0.89, + "learning_rate": 2.2484563706263836e-08, + "loss": 0.0007, + "step": 45762 + }, + { + "epoch": 0.89, + "learning_rate": 2.2480680361927694e-08, + "loss": 0.0002, + "step": 45763 + }, + { + "epoch": 0.89, + "learning_rate": 2.247679701759155e-08, + "loss": 0.0004, + "step": 45764 + }, + { + "epoch": 0.89, + "learning_rate": 2.2472913673255407e-08, + "loss": 0.0004, + "step": 45765 + }, + { + "epoch": 0.89, + "learning_rate": 2.2469030328919266e-08, + "loss": 0.0004, + "step": 45766 + }, + { + "epoch": 0.89, + "learning_rate": 2.246514698458312e-08, + "loss": 0.0006, + "step": 45767 + }, + { + "epoch": 0.89, + "learning_rate": 2.246126364024698e-08, + "loss": 0.0003, + "step": 45768 + }, + { + "epoch": 0.89, + "learning_rate": 2.2457380295910837e-08, + "loss": 0.0003, + "step": 45769 + }, + { + "epoch": 0.89, + "learning_rate": 2.2453496951574695e-08, + "loss": 0.0003, + "step": 45770 + }, + { + "epoch": 0.89, + "learning_rate": 2.244961360723855e-08, + "loss": 0.0004, + "step": 45771 + }, + { + "epoch": 0.89, + "learning_rate": 2.244573026290241e-08, + "loss": 0.0004, + "step": 45772 + }, + { + "epoch": 0.89, + "learning_rate": 2.2441846918566267e-08, + "loss": 0.0004, + "step": 45773 + }, + { + "epoch": 0.89, + "learning_rate": 2.2437963574230125e-08, + "loss": 0.0008, + "step": 45774 + }, + { + "epoch": 0.89, + "learning_rate": 2.2434080229893983e-08, + "loss": 0.0005, + "step": 45775 + }, + { + "epoch": 0.89, + "learning_rate": 2.243019688555784e-08, + "loss": 0.0002, + "step": 45776 + }, + { + "epoch": 0.89, + "learning_rate": 2.24263135412217e-08, + "loss": 0.0004, + "step": 45777 + }, + { + "epoch": 0.89, + "learning_rate": 2.2422430196885555e-08, + "loss": 0.0004, + "step": 45778 + }, + { + "epoch": 0.89, + "learning_rate": 2.2418546852549413e-08, + "loss": 0.0005, + "step": 45779 + }, + { + "epoch": 0.89, + "learning_rate": 2.241466350821327e-08, + "loss": 0.0005, + "step": 45780 + }, + { + "epoch": 0.89, + "learning_rate": 2.241078016387713e-08, + "loss": 0.0004, + "step": 45781 + }, + { + "epoch": 0.89, + "learning_rate": 2.2406896819540987e-08, + "loss": 0.0002, + "step": 45782 + }, + { + "epoch": 0.89, + "learning_rate": 2.2403013475204846e-08, + "loss": 0.0006, + "step": 45783 + }, + { + "epoch": 0.89, + "learning_rate": 2.2399130130868704e-08, + "loss": 0.0005, + "step": 45784 + }, + { + "epoch": 0.89, + "learning_rate": 2.239524678653256e-08, + "loss": 0.0012, + "step": 45785 + }, + { + "epoch": 0.89, + "learning_rate": 2.2391363442196417e-08, + "loss": 0.0003, + "step": 45786 + }, + { + "epoch": 0.89, + "learning_rate": 2.2387480097860275e-08, + "loss": 0.0004, + "step": 45787 + }, + { + "epoch": 0.89, + "learning_rate": 2.2383596753524134e-08, + "loss": 0.0004, + "step": 45788 + }, + { + "epoch": 0.89, + "learning_rate": 2.2379713409187992e-08, + "loss": 0.0008, + "step": 45789 + }, + { + "epoch": 0.89, + "learning_rate": 2.237583006485185e-08, + "loss": 0.0004, + "step": 45790 + }, + { + "epoch": 0.89, + "learning_rate": 2.237194672051571e-08, + "loss": 0.0004, + "step": 45791 + }, + { + "epoch": 0.89, + "learning_rate": 2.2368063376179567e-08, + "loss": 0.0004, + "step": 45792 + }, + { + "epoch": 0.89, + "learning_rate": 2.236418003184342e-08, + "loss": 0.0004, + "step": 45793 + }, + { + "epoch": 0.89, + "learning_rate": 2.236029668750728e-08, + "loss": 0.0251, + "step": 45794 + }, + { + "epoch": 0.89, + "learning_rate": 2.2356413343171138e-08, + "loss": 0.0004, + "step": 45795 + }, + { + "epoch": 0.89, + "learning_rate": 2.2352529998834996e-08, + "loss": 0.0004, + "step": 45796 + }, + { + "epoch": 0.89, + "learning_rate": 2.2348646654498855e-08, + "loss": 0.0003, + "step": 45797 + }, + { + "epoch": 0.89, + "learning_rate": 2.2344763310162713e-08, + "loss": 0.0003, + "step": 45798 + }, + { + "epoch": 0.89, + "learning_rate": 2.234087996582657e-08, + "loss": 0.0005, + "step": 45799 + }, + { + "epoch": 0.89, + "learning_rate": 2.2336996621490426e-08, + "loss": 0.0003, + "step": 45800 + }, + { + "epoch": 0.89, + "learning_rate": 2.2333113277154284e-08, + "loss": 0.0004, + "step": 45801 + }, + { + "epoch": 0.89, + "learning_rate": 2.2329229932818142e-08, + "loss": 0.0007, + "step": 45802 + }, + { + "epoch": 0.89, + "learning_rate": 2.2325346588482e-08, + "loss": 0.0005, + "step": 45803 + }, + { + "epoch": 0.89, + "learning_rate": 2.232146324414586e-08, + "loss": 0.0003, + "step": 45804 + }, + { + "epoch": 0.89, + "learning_rate": 2.2317579899809717e-08, + "loss": 0.0004, + "step": 45805 + }, + { + "epoch": 0.89, + "learning_rate": 2.2313696555473575e-08, + "loss": 0.0003, + "step": 45806 + }, + { + "epoch": 0.89, + "learning_rate": 2.230981321113743e-08, + "loss": 0.0004, + "step": 45807 + }, + { + "epoch": 0.89, + "learning_rate": 2.230592986680129e-08, + "loss": 0.0002, + "step": 45808 + }, + { + "epoch": 0.89, + "learning_rate": 2.2302046522465147e-08, + "loss": 0.0005, + "step": 45809 + }, + { + "epoch": 0.89, + "learning_rate": 2.2298163178129005e-08, + "loss": 0.0002, + "step": 45810 + }, + { + "epoch": 0.89, + "learning_rate": 2.2294279833792863e-08, + "loss": 0.0003, + "step": 45811 + }, + { + "epoch": 0.89, + "learning_rate": 2.2290396489456718e-08, + "loss": 0.0005, + "step": 45812 + }, + { + "epoch": 0.89, + "learning_rate": 2.2286513145120577e-08, + "loss": 0.2196, + "step": 45813 + }, + { + "epoch": 0.89, + "learning_rate": 2.2282629800784435e-08, + "loss": 0.0003, + "step": 45814 + }, + { + "epoch": 0.89, + "learning_rate": 2.227874645644829e-08, + "loss": 0.0004, + "step": 45815 + }, + { + "epoch": 0.89, + "learning_rate": 2.2274863112112148e-08, + "loss": 0.467, + "step": 45816 + }, + { + "epoch": 0.89, + "learning_rate": 2.2270979767776006e-08, + "loss": 0.0003, + "step": 45817 + }, + { + "epoch": 0.89, + "learning_rate": 2.2267096423439864e-08, + "loss": 0.0005, + "step": 45818 + }, + { + "epoch": 0.89, + "learning_rate": 2.2263213079103723e-08, + "loss": 0.0003, + "step": 45819 + }, + { + "epoch": 0.89, + "learning_rate": 2.225932973476758e-08, + "loss": 0.0003, + "step": 45820 + }, + { + "epoch": 0.89, + "learning_rate": 2.225544639043144e-08, + "loss": 0.0003, + "step": 45821 + }, + { + "epoch": 0.89, + "learning_rate": 2.2251563046095294e-08, + "loss": 0.0003, + "step": 45822 + }, + { + "epoch": 0.89, + "learning_rate": 2.2247679701759152e-08, + "loss": 0.0005, + "step": 45823 + }, + { + "epoch": 0.89, + "learning_rate": 2.224379635742301e-08, + "loss": 0.0005, + "step": 45824 + }, + { + "epoch": 0.89, + "learning_rate": 2.223991301308687e-08, + "loss": 0.0003, + "step": 45825 + }, + { + "epoch": 0.89, + "learning_rate": 2.2236029668750727e-08, + "loss": 0.0006, + "step": 45826 + }, + { + "epoch": 0.89, + "learning_rate": 2.2232146324414585e-08, + "loss": 1.3062, + "step": 45827 + }, + { + "epoch": 0.89, + "learning_rate": 2.2228262980078444e-08, + "loss": 0.0006, + "step": 45828 + }, + { + "epoch": 0.89, + "learning_rate": 2.22243796357423e-08, + "loss": 0.4293, + "step": 45829 + }, + { + "epoch": 0.89, + "learning_rate": 2.2220496291406157e-08, + "loss": 0.0004, + "step": 45830 + }, + { + "epoch": 0.89, + "learning_rate": 2.2216612947070015e-08, + "loss": 0.0034, + "step": 45831 + }, + { + "epoch": 0.89, + "learning_rate": 2.2212729602733873e-08, + "loss": 0.0003, + "step": 45832 + }, + { + "epoch": 0.89, + "learning_rate": 2.220884625839773e-08, + "loss": 0.0004, + "step": 45833 + }, + { + "epoch": 0.89, + "learning_rate": 2.220496291406159e-08, + "loss": 0.0002, + "step": 45834 + }, + { + "epoch": 0.89, + "learning_rate": 2.2201079569725448e-08, + "loss": 0.0004, + "step": 45835 + }, + { + "epoch": 0.89, + "learning_rate": 2.2197196225389303e-08, + "loss": 0.0013, + "step": 45836 + }, + { + "epoch": 0.89, + "learning_rate": 2.219331288105316e-08, + "loss": 0.0005, + "step": 45837 + }, + { + "epoch": 0.89, + "learning_rate": 2.218942953671702e-08, + "loss": 0.0003, + "step": 45838 + }, + { + "epoch": 0.89, + "learning_rate": 2.2185546192380878e-08, + "loss": 0.0009, + "step": 45839 + }, + { + "epoch": 0.89, + "learning_rate": 2.2181662848044736e-08, + "loss": 0.0005, + "step": 45840 + }, + { + "epoch": 0.89, + "learning_rate": 2.2177779503708594e-08, + "loss": 0.0003, + "step": 45841 + }, + { + "epoch": 0.89, + "learning_rate": 2.2173896159372452e-08, + "loss": 0.0003, + "step": 45842 + }, + { + "epoch": 0.89, + "learning_rate": 2.2170012815036307e-08, + "loss": 0.0005, + "step": 45843 + }, + { + "epoch": 0.89, + "learning_rate": 2.2166129470700166e-08, + "loss": 0.0005, + "step": 45844 + }, + { + "epoch": 0.89, + "learning_rate": 2.2162246126364024e-08, + "loss": 0.0004, + "step": 45845 + }, + { + "epoch": 0.89, + "learning_rate": 2.2158362782027882e-08, + "loss": 0.001, + "step": 45846 + }, + { + "epoch": 0.89, + "learning_rate": 2.215447943769174e-08, + "loss": 0.0061, + "step": 45847 + }, + { + "epoch": 0.89, + "learning_rate": 2.21505960933556e-08, + "loss": 0.0003, + "step": 45848 + }, + { + "epoch": 0.89, + "learning_rate": 2.2146712749019457e-08, + "loss": 0.0004, + "step": 45849 + }, + { + "epoch": 0.89, + "learning_rate": 2.2142829404683315e-08, + "loss": 0.0003, + "step": 45850 + }, + { + "epoch": 0.89, + "learning_rate": 2.213894606034717e-08, + "loss": 0.0611, + "step": 45851 + }, + { + "epoch": 0.89, + "learning_rate": 2.2135062716011028e-08, + "loss": 0.0006, + "step": 45852 + }, + { + "epoch": 0.89, + "learning_rate": 2.2131179371674886e-08, + "loss": 0.1142, + "step": 45853 + }, + { + "epoch": 0.89, + "learning_rate": 2.2127296027338745e-08, + "loss": 0.0005, + "step": 45854 + }, + { + "epoch": 0.89, + "learning_rate": 2.2123412683002603e-08, + "loss": 0.0004, + "step": 45855 + }, + { + "epoch": 0.89, + "learning_rate": 2.2119529338666458e-08, + "loss": 0.0002, + "step": 45856 + }, + { + "epoch": 0.89, + "learning_rate": 2.2115645994330316e-08, + "loss": 0.0004, + "step": 45857 + }, + { + "epoch": 0.89, + "learning_rate": 2.2111762649994174e-08, + "loss": 0.025, + "step": 45858 + }, + { + "epoch": 0.89, + "learning_rate": 2.2107879305658033e-08, + "loss": 0.0004, + "step": 45859 + }, + { + "epoch": 0.89, + "learning_rate": 2.2103995961321888e-08, + "loss": 0.0004, + "step": 45860 + }, + { + "epoch": 0.89, + "learning_rate": 2.2100112616985746e-08, + "loss": 0.0005, + "step": 45861 + }, + { + "epoch": 0.89, + "learning_rate": 2.2096229272649604e-08, + "loss": 0.0003, + "step": 45862 + }, + { + "epoch": 0.89, + "learning_rate": 2.2092345928313462e-08, + "loss": 0.0005, + "step": 45863 + }, + { + "epoch": 0.89, + "learning_rate": 2.208846258397732e-08, + "loss": 0.0017, + "step": 45864 + }, + { + "epoch": 0.89, + "learning_rate": 2.2084579239641175e-08, + "loss": 0.7151, + "step": 45865 + }, + { + "epoch": 0.89, + "learning_rate": 2.2080695895305034e-08, + "loss": 1.1871, + "step": 45866 + }, + { + "epoch": 0.89, + "learning_rate": 2.2076812550968892e-08, + "loss": 0.0004, + "step": 45867 + }, + { + "epoch": 0.89, + "learning_rate": 2.207292920663275e-08, + "loss": 0.367, + "step": 45868 + }, + { + "epoch": 0.89, + "learning_rate": 2.206904586229661e-08, + "loss": 0.0018, + "step": 45869 + }, + { + "epoch": 0.89, + "learning_rate": 2.2065162517960467e-08, + "loss": 0.0004, + "step": 45870 + }, + { + "epoch": 0.89, + "learning_rate": 2.2061279173624325e-08, + "loss": 0.851, + "step": 45871 + }, + { + "epoch": 0.89, + "learning_rate": 2.205739582928818e-08, + "loss": 0.0005, + "step": 45872 + }, + { + "epoch": 0.89, + "learning_rate": 2.2053512484952038e-08, + "loss": 0.0004, + "step": 45873 + }, + { + "epoch": 0.89, + "learning_rate": 2.2049629140615896e-08, + "loss": 0.0003, + "step": 45874 + }, + { + "epoch": 0.89, + "learning_rate": 2.2045745796279755e-08, + "loss": 0.0003, + "step": 45875 + }, + { + "epoch": 0.89, + "learning_rate": 2.2041862451943613e-08, + "loss": 0.9003, + "step": 45876 + }, + { + "epoch": 0.89, + "learning_rate": 2.203797910760747e-08, + "loss": 0.0003, + "step": 45877 + }, + { + "epoch": 0.89, + "learning_rate": 2.203409576327133e-08, + "loss": 1.0656, + "step": 45878 + }, + { + "epoch": 0.89, + "learning_rate": 2.2030212418935188e-08, + "loss": 0.0005, + "step": 45879 + }, + { + "epoch": 0.89, + "learning_rate": 2.2026329074599042e-08, + "loss": 0.0004, + "step": 45880 + }, + { + "epoch": 0.89, + "learning_rate": 2.20224457302629e-08, + "loss": 0.0008, + "step": 45881 + }, + { + "epoch": 0.89, + "learning_rate": 2.201856238592676e-08, + "loss": 0.0007, + "step": 45882 + }, + { + "epoch": 0.89, + "learning_rate": 2.2014679041590617e-08, + "loss": 0.0004, + "step": 45883 + }, + { + "epoch": 0.89, + "learning_rate": 2.2010795697254475e-08, + "loss": 0.0087, + "step": 45884 + }, + { + "epoch": 0.89, + "learning_rate": 2.2006912352918334e-08, + "loss": 0.0003, + "step": 45885 + }, + { + "epoch": 0.89, + "learning_rate": 2.2003029008582192e-08, + "loss": 0.7489, + "step": 45886 + }, + { + "epoch": 0.89, + "learning_rate": 2.1999145664246047e-08, + "loss": 0.0004, + "step": 45887 + }, + { + "epoch": 0.89, + "learning_rate": 2.1995262319909905e-08, + "loss": 0.0005, + "step": 45888 + }, + { + "epoch": 0.89, + "learning_rate": 2.1991378975573763e-08, + "loss": 0.3124, + "step": 45889 + }, + { + "epoch": 0.89, + "learning_rate": 2.198749563123762e-08, + "loss": 0.0044, + "step": 45890 + }, + { + "epoch": 0.89, + "learning_rate": 2.198361228690148e-08, + "loss": 0.0006, + "step": 45891 + }, + { + "epoch": 0.89, + "learning_rate": 2.1979728942565338e-08, + "loss": 0.0003, + "step": 45892 + }, + { + "epoch": 0.89, + "learning_rate": 2.1975845598229196e-08, + "loss": 0.0008, + "step": 45893 + }, + { + "epoch": 0.89, + "learning_rate": 2.197196225389305e-08, + "loss": 0.0003, + "step": 45894 + }, + { + "epoch": 0.89, + "learning_rate": 2.196807890955691e-08, + "loss": 0.0003, + "step": 45895 + }, + { + "epoch": 0.89, + "learning_rate": 2.1964195565220768e-08, + "loss": 0.0004, + "step": 45896 + }, + { + "epoch": 0.89, + "learning_rate": 2.1960312220884626e-08, + "loss": 1.0769, + "step": 45897 + }, + { + "epoch": 0.89, + "learning_rate": 2.1956428876548484e-08, + "loss": 0.0003, + "step": 45898 + }, + { + "epoch": 0.89, + "learning_rate": 2.1952545532212343e-08, + "loss": 0.0004, + "step": 45899 + }, + { + "epoch": 0.89, + "learning_rate": 2.1948662187876197e-08, + "loss": 0.0014, + "step": 45900 + }, + { + "epoch": 0.89, + "learning_rate": 2.1944778843540056e-08, + "loss": 0.0006, + "step": 45901 + }, + { + "epoch": 0.89, + "learning_rate": 2.1940895499203914e-08, + "loss": 0.0007, + "step": 45902 + }, + { + "epoch": 0.89, + "learning_rate": 2.1937012154867772e-08, + "loss": 0.0003, + "step": 45903 + }, + { + "epoch": 0.89, + "learning_rate": 2.1933128810531627e-08, + "loss": 0.0005, + "step": 45904 + }, + { + "epoch": 0.89, + "learning_rate": 2.1929245466195485e-08, + "loss": 0.0007, + "step": 45905 + }, + { + "epoch": 0.89, + "learning_rate": 2.1925362121859344e-08, + "loss": 0.0012, + "step": 45906 + }, + { + "epoch": 0.89, + "learning_rate": 2.1921478777523202e-08, + "loss": 0.0007, + "step": 45907 + }, + { + "epoch": 0.89, + "learning_rate": 2.191759543318706e-08, + "loss": 0.0003, + "step": 45908 + }, + { + "epoch": 0.89, + "learning_rate": 2.1913712088850915e-08, + "loss": 0.0004, + "step": 45909 + }, + { + "epoch": 0.89, + "learning_rate": 2.1909828744514773e-08, + "loss": 0.0005, + "step": 45910 + }, + { + "epoch": 0.89, + "learning_rate": 2.190594540017863e-08, + "loss": 0.0003, + "step": 45911 + }, + { + "epoch": 0.89, + "learning_rate": 2.190206205584249e-08, + "loss": 0.0005, + "step": 45912 + }, + { + "epoch": 0.89, + "learning_rate": 2.1898178711506348e-08, + "loss": 0.0004, + "step": 45913 + }, + { + "epoch": 0.89, + "learning_rate": 2.1894295367170206e-08, + "loss": 0.0004, + "step": 45914 + }, + { + "epoch": 0.89, + "learning_rate": 2.1890412022834064e-08, + "loss": 0.0003, + "step": 45915 + }, + { + "epoch": 0.89, + "learning_rate": 2.188652867849792e-08, + "loss": 0.0005, + "step": 45916 + }, + { + "epoch": 0.89, + "learning_rate": 2.1882645334161778e-08, + "loss": 0.0004, + "step": 45917 + }, + { + "epoch": 0.89, + "learning_rate": 2.1878761989825636e-08, + "loss": 0.0004, + "step": 45918 + }, + { + "epoch": 0.89, + "learning_rate": 2.1874878645489494e-08, + "loss": 0.0005, + "step": 45919 + }, + { + "epoch": 0.89, + "learning_rate": 2.1870995301153352e-08, + "loss": 0.0003, + "step": 45920 + }, + { + "epoch": 0.89, + "learning_rate": 2.186711195681721e-08, + "loss": 0.0003, + "step": 45921 + }, + { + "epoch": 0.89, + "learning_rate": 2.186322861248107e-08, + "loss": 1.0533, + "step": 45922 + }, + { + "epoch": 0.89, + "learning_rate": 2.1859345268144924e-08, + "loss": 0.0004, + "step": 45923 + }, + { + "epoch": 0.89, + "learning_rate": 2.1855461923808782e-08, + "loss": 0.0003, + "step": 45924 + }, + { + "epoch": 0.89, + "learning_rate": 2.185157857947264e-08, + "loss": 0.0005, + "step": 45925 + }, + { + "epoch": 0.89, + "learning_rate": 2.18476952351365e-08, + "loss": 0.0033, + "step": 45926 + }, + { + "epoch": 0.89, + "learning_rate": 2.1843811890800357e-08, + "loss": 0.0005, + "step": 45927 + }, + { + "epoch": 0.89, + "learning_rate": 2.1839928546464215e-08, + "loss": 1.422, + "step": 45928 + }, + { + "epoch": 0.89, + "learning_rate": 2.1836045202128073e-08, + "loss": 0.0003, + "step": 45929 + }, + { + "epoch": 0.89, + "learning_rate": 2.1832161857791928e-08, + "loss": 0.0005, + "step": 45930 + }, + { + "epoch": 0.89, + "learning_rate": 2.1828278513455786e-08, + "loss": 0.0007, + "step": 45931 + }, + { + "epoch": 0.89, + "learning_rate": 2.1824395169119645e-08, + "loss": 0.0005, + "step": 45932 + }, + { + "epoch": 0.89, + "learning_rate": 2.1820511824783503e-08, + "loss": 0.0003, + "step": 45933 + }, + { + "epoch": 0.89, + "learning_rate": 2.181662848044736e-08, + "loss": 0.0003, + "step": 45934 + }, + { + "epoch": 0.89, + "learning_rate": 2.181274513611122e-08, + "loss": 0.0006, + "step": 45935 + }, + { + "epoch": 0.89, + "learning_rate": 2.1808861791775078e-08, + "loss": 0.0003, + "step": 45936 + }, + { + "epoch": 0.89, + "learning_rate": 2.1804978447438936e-08, + "loss": 0.0004, + "step": 45937 + }, + { + "epoch": 0.89, + "learning_rate": 2.180109510310279e-08, + "loss": 0.0003, + "step": 45938 + }, + { + "epoch": 0.89, + "learning_rate": 2.179721175876665e-08, + "loss": 0.2733, + "step": 45939 + }, + { + "epoch": 0.89, + "learning_rate": 2.1793328414430507e-08, + "loss": 0.0005, + "step": 45940 + }, + { + "epoch": 0.89, + "learning_rate": 2.1789445070094366e-08, + "loss": 0.0002, + "step": 45941 + }, + { + "epoch": 0.89, + "learning_rate": 2.1785561725758224e-08, + "loss": 0.0004, + "step": 45942 + }, + { + "epoch": 0.89, + "learning_rate": 2.1781678381422082e-08, + "loss": 0.0003, + "step": 45943 + }, + { + "epoch": 0.89, + "learning_rate": 2.1777795037085937e-08, + "loss": 0.0004, + "step": 45944 + }, + { + "epoch": 0.89, + "learning_rate": 2.1773911692749795e-08, + "loss": 0.0003, + "step": 45945 + }, + { + "epoch": 0.89, + "learning_rate": 2.1770028348413654e-08, + "loss": 0.6335, + "step": 45946 + }, + { + "epoch": 0.89, + "learning_rate": 2.1766145004077512e-08, + "loss": 0.5948, + "step": 45947 + }, + { + "epoch": 0.89, + "learning_rate": 2.1762261659741367e-08, + "loss": 0.0004, + "step": 45948 + }, + { + "epoch": 0.89, + "learning_rate": 2.1758378315405225e-08, + "loss": 0.0004, + "step": 45949 + }, + { + "epoch": 0.89, + "learning_rate": 2.1754494971069083e-08, + "loss": 0.0005, + "step": 45950 + }, + { + "epoch": 0.89, + "learning_rate": 2.175061162673294e-08, + "loss": 0.0004, + "step": 45951 + }, + { + "epoch": 0.89, + "learning_rate": 2.1746728282396796e-08, + "loss": 0.0004, + "step": 45952 + }, + { + "epoch": 0.89, + "learning_rate": 2.1742844938060655e-08, + "loss": 0.0024, + "step": 45953 + }, + { + "epoch": 0.89, + "learning_rate": 2.1738961593724513e-08, + "loss": 0.0003, + "step": 45954 + }, + { + "epoch": 0.89, + "learning_rate": 2.173507824938837e-08, + "loss": 0.0003, + "step": 45955 + }, + { + "epoch": 0.89, + "learning_rate": 2.173119490505223e-08, + "loss": 0.0003, + "step": 45956 + }, + { + "epoch": 0.89, + "learning_rate": 2.1727311560716088e-08, + "loss": 0.0005, + "step": 45957 + }, + { + "epoch": 0.89, + "learning_rate": 2.1723428216379946e-08, + "loss": 0.0005, + "step": 45958 + }, + { + "epoch": 0.89, + "learning_rate": 2.17195448720438e-08, + "loss": 0.0006, + "step": 45959 + }, + { + "epoch": 0.89, + "learning_rate": 2.171566152770766e-08, + "loss": 0.0004, + "step": 45960 + }, + { + "epoch": 0.89, + "learning_rate": 2.1711778183371517e-08, + "loss": 0.1102, + "step": 45961 + }, + { + "epoch": 0.89, + "learning_rate": 2.1707894839035376e-08, + "loss": 0.0288, + "step": 45962 + }, + { + "epoch": 0.89, + "learning_rate": 2.1704011494699234e-08, + "loss": 0.0003, + "step": 45963 + }, + { + "epoch": 0.89, + "learning_rate": 2.1700128150363092e-08, + "loss": 0.0004, + "step": 45964 + }, + { + "epoch": 0.89, + "learning_rate": 2.169624480602695e-08, + "loss": 0.0006, + "step": 45965 + }, + { + "epoch": 0.89, + "learning_rate": 2.169236146169081e-08, + "loss": 0.0004, + "step": 45966 + }, + { + "epoch": 0.89, + "learning_rate": 2.1688478117354663e-08, + "loss": 0.0003, + "step": 45967 + }, + { + "epoch": 0.89, + "learning_rate": 2.1684594773018522e-08, + "loss": 0.0023, + "step": 45968 + }, + { + "epoch": 0.89, + "learning_rate": 2.168071142868238e-08, + "loss": 0.0003, + "step": 45969 + }, + { + "epoch": 0.89, + "learning_rate": 2.1676828084346238e-08, + "loss": 0.0005, + "step": 45970 + }, + { + "epoch": 0.89, + "learning_rate": 2.1672944740010096e-08, + "loss": 0.0003, + "step": 45971 + }, + { + "epoch": 0.89, + "learning_rate": 2.1669061395673955e-08, + "loss": 0.0005, + "step": 45972 + }, + { + "epoch": 0.89, + "learning_rate": 2.1665178051337813e-08, + "loss": 0.6989, + "step": 45973 + }, + { + "epoch": 0.89, + "learning_rate": 2.1661294707001668e-08, + "loss": 0.0004, + "step": 45974 + }, + { + "epoch": 0.89, + "learning_rate": 2.1657411362665526e-08, + "loss": 0.0003, + "step": 45975 + }, + { + "epoch": 0.89, + "learning_rate": 2.1653528018329384e-08, + "loss": 0.0003, + "step": 45976 + }, + { + "epoch": 0.89, + "learning_rate": 2.1649644673993243e-08, + "loss": 0.0002, + "step": 45977 + }, + { + "epoch": 0.89, + "learning_rate": 2.16457613296571e-08, + "loss": 0.0004, + "step": 45978 + }, + { + "epoch": 0.89, + "learning_rate": 2.164187798532096e-08, + "loss": 0.0003, + "step": 45979 + }, + { + "epoch": 0.89, + "learning_rate": 2.1637994640984817e-08, + "loss": 0.0004, + "step": 45980 + }, + { + "epoch": 0.89, + "learning_rate": 2.1634111296648672e-08, + "loss": 0.0009, + "step": 45981 + }, + { + "epoch": 0.89, + "learning_rate": 2.163022795231253e-08, + "loss": 0.0005, + "step": 45982 + }, + { + "epoch": 0.89, + "learning_rate": 2.162634460797639e-08, + "loss": 0.0003, + "step": 45983 + }, + { + "epoch": 0.89, + "learning_rate": 2.1622461263640247e-08, + "loss": 0.6595, + "step": 45984 + }, + { + "epoch": 0.89, + "learning_rate": 2.1618577919304105e-08, + "loss": 0.0003, + "step": 45985 + }, + { + "epoch": 0.89, + "learning_rate": 2.1614694574967963e-08, + "loss": 0.0004, + "step": 45986 + }, + { + "epoch": 0.89, + "learning_rate": 2.1610811230631822e-08, + "loss": 0.0004, + "step": 45987 + }, + { + "epoch": 0.89, + "learning_rate": 2.1606927886295677e-08, + "loss": 0.0048, + "step": 45988 + }, + { + "epoch": 0.89, + "learning_rate": 2.1603044541959535e-08, + "loss": 0.0004, + "step": 45989 + }, + { + "epoch": 0.89, + "learning_rate": 2.1599161197623393e-08, + "loss": 0.0004, + "step": 45990 + }, + { + "epoch": 0.89, + "learning_rate": 2.159527785328725e-08, + "loss": 0.0003, + "step": 45991 + }, + { + "epoch": 0.89, + "learning_rate": 2.1591394508951106e-08, + "loss": 0.483, + "step": 45992 + }, + { + "epoch": 0.89, + "learning_rate": 2.1587511164614965e-08, + "loss": 0.6395, + "step": 45993 + }, + { + "epoch": 0.89, + "learning_rate": 2.1583627820278823e-08, + "loss": 1.0211, + "step": 45994 + }, + { + "epoch": 0.89, + "learning_rate": 2.157974447594268e-08, + "loss": 0.0003, + "step": 45995 + }, + { + "epoch": 0.89, + "learning_rate": 2.1575861131606536e-08, + "loss": 0.0005, + "step": 45996 + }, + { + "epoch": 0.89, + "learning_rate": 2.1571977787270394e-08, + "loss": 0.7298, + "step": 45997 + }, + { + "epoch": 0.89, + "learning_rate": 2.1568094442934252e-08, + "loss": 0.0004, + "step": 45998 + }, + { + "epoch": 0.89, + "learning_rate": 2.156421109859811e-08, + "loss": 0.0004, + "step": 45999 + }, + { + "epoch": 0.89, + "learning_rate": 2.156032775426197e-08, + "loss": 0.0003, + "step": 46000 + }, + { + "epoch": 0.89, + "learning_rate": 2.1556444409925827e-08, + "loss": 0.0338, + "step": 46001 + }, + { + "epoch": 0.89, + "learning_rate": 2.1552561065589685e-08, + "loss": 0.0004, + "step": 46002 + }, + { + "epoch": 0.89, + "learning_rate": 2.154867772125354e-08, + "loss": 0.0003, + "step": 46003 + }, + { + "epoch": 0.89, + "learning_rate": 2.15447943769174e-08, + "loss": 0.0005, + "step": 46004 + }, + { + "epoch": 0.89, + "learning_rate": 2.1540911032581257e-08, + "loss": 0.0005, + "step": 46005 + }, + { + "epoch": 0.89, + "learning_rate": 2.1537027688245115e-08, + "loss": 0.0003, + "step": 46006 + }, + { + "epoch": 0.89, + "learning_rate": 2.1533144343908973e-08, + "loss": 0.0005, + "step": 46007 + }, + { + "epoch": 0.89, + "learning_rate": 2.152926099957283e-08, + "loss": 0.0003, + "step": 46008 + }, + { + "epoch": 0.89, + "learning_rate": 2.152537765523669e-08, + "loss": 0.0003, + "step": 46009 + }, + { + "epoch": 0.89, + "learning_rate": 2.1521494310900545e-08, + "loss": 0.763, + "step": 46010 + }, + { + "epoch": 0.89, + "learning_rate": 2.1517610966564403e-08, + "loss": 0.0004, + "step": 46011 + }, + { + "epoch": 0.89, + "learning_rate": 2.151372762222826e-08, + "loss": 0.0004, + "step": 46012 + }, + { + "epoch": 0.89, + "learning_rate": 2.150984427789212e-08, + "loss": 0.0004, + "step": 46013 + }, + { + "epoch": 0.89, + "learning_rate": 2.1505960933555978e-08, + "loss": 0.0007, + "step": 46014 + }, + { + "epoch": 0.89, + "learning_rate": 2.1502077589219836e-08, + "loss": 0.0008, + "step": 46015 + }, + { + "epoch": 0.89, + "learning_rate": 2.1498194244883694e-08, + "loss": 1.4629, + "step": 46016 + }, + { + "epoch": 0.89, + "learning_rate": 2.149431090054755e-08, + "loss": 0.0004, + "step": 46017 + }, + { + "epoch": 0.89, + "learning_rate": 2.1490427556211407e-08, + "loss": 0.8598, + "step": 46018 + }, + { + "epoch": 0.89, + "learning_rate": 2.1486544211875266e-08, + "loss": 0.0003, + "step": 46019 + }, + { + "epoch": 0.89, + "learning_rate": 2.1482660867539124e-08, + "loss": 0.0004, + "step": 46020 + }, + { + "epoch": 0.89, + "learning_rate": 2.1478777523202982e-08, + "loss": 0.0005, + "step": 46021 + }, + { + "epoch": 0.89, + "learning_rate": 2.147489417886684e-08, + "loss": 0.0004, + "step": 46022 + }, + { + "epoch": 0.89, + "learning_rate": 2.14710108345307e-08, + "loss": 0.0003, + "step": 46023 + }, + { + "epoch": 0.89, + "learning_rate": 2.1467127490194557e-08, + "loss": 0.0004, + "step": 46024 + }, + { + "epoch": 0.89, + "learning_rate": 2.1463244145858412e-08, + "loss": 0.0007, + "step": 46025 + }, + { + "epoch": 0.89, + "learning_rate": 2.145936080152227e-08, + "loss": 0.0004, + "step": 46026 + }, + { + "epoch": 0.89, + "learning_rate": 2.1455477457186128e-08, + "loss": 0.0004, + "step": 46027 + }, + { + "epoch": 0.89, + "learning_rate": 2.1451594112849987e-08, + "loss": 0.0004, + "step": 46028 + }, + { + "epoch": 0.89, + "learning_rate": 2.1447710768513845e-08, + "loss": 0.0015, + "step": 46029 + }, + { + "epoch": 0.89, + "learning_rate": 2.1443827424177703e-08, + "loss": 0.002, + "step": 46030 + }, + { + "epoch": 0.89, + "learning_rate": 2.143994407984156e-08, + "loss": 0.0005, + "step": 46031 + }, + { + "epoch": 0.89, + "learning_rate": 2.1436060735505416e-08, + "loss": 0.0792, + "step": 46032 + }, + { + "epoch": 0.89, + "learning_rate": 2.1432177391169274e-08, + "loss": 0.0004, + "step": 46033 + }, + { + "epoch": 0.89, + "learning_rate": 2.1428294046833133e-08, + "loss": 0.0004, + "step": 46034 + }, + { + "epoch": 0.89, + "learning_rate": 2.142441070249699e-08, + "loss": 0.0004, + "step": 46035 + }, + { + "epoch": 0.89, + "learning_rate": 2.142052735816085e-08, + "loss": 0.0004, + "step": 46036 + }, + { + "epoch": 0.89, + "learning_rate": 2.1416644013824704e-08, + "loss": 0.0004, + "step": 46037 + }, + { + "epoch": 0.89, + "learning_rate": 2.1412760669488562e-08, + "loss": 0.0003, + "step": 46038 + }, + { + "epoch": 0.89, + "learning_rate": 2.140887732515242e-08, + "loss": 0.0003, + "step": 46039 + }, + { + "epoch": 0.89, + "learning_rate": 2.1404993980816276e-08, + "loss": 0.0003, + "step": 46040 + }, + { + "epoch": 0.89, + "learning_rate": 2.1401110636480134e-08, + "loss": 0.0005, + "step": 46041 + }, + { + "epoch": 0.89, + "learning_rate": 2.1397227292143992e-08, + "loss": 0.0005, + "step": 46042 + }, + { + "epoch": 0.89, + "learning_rate": 2.139334394780785e-08, + "loss": 0.0004, + "step": 46043 + }, + { + "epoch": 0.89, + "learning_rate": 2.138946060347171e-08, + "loss": 0.0027, + "step": 46044 + }, + { + "epoch": 0.89, + "learning_rate": 2.1385577259135567e-08, + "loss": 0.0004, + "step": 46045 + }, + { + "epoch": 0.89, + "learning_rate": 2.1381693914799422e-08, + "loss": 0.001, + "step": 46046 + }, + { + "epoch": 0.89, + "learning_rate": 2.137781057046328e-08, + "loss": 0.0003, + "step": 46047 + }, + { + "epoch": 0.89, + "learning_rate": 2.1373927226127138e-08, + "loss": 0.0003, + "step": 46048 + }, + { + "epoch": 0.89, + "learning_rate": 2.1370043881790996e-08, + "loss": 0.0003, + "step": 46049 + }, + { + "epoch": 0.89, + "learning_rate": 2.1366160537454855e-08, + "loss": 1.1033, + "step": 46050 + }, + { + "epoch": 0.89, + "learning_rate": 2.1362277193118713e-08, + "loss": 0.0004, + "step": 46051 + }, + { + "epoch": 0.89, + "learning_rate": 2.135839384878257e-08, + "loss": 0.6433, + "step": 46052 + }, + { + "epoch": 0.89, + "learning_rate": 2.135451050444643e-08, + "loss": 0.0003, + "step": 46053 + }, + { + "epoch": 0.89, + "learning_rate": 2.1350627160110284e-08, + "loss": 0.6654, + "step": 46054 + }, + { + "epoch": 0.89, + "learning_rate": 2.1346743815774143e-08, + "loss": 0.0007, + "step": 46055 + }, + { + "epoch": 0.89, + "learning_rate": 2.1342860471438e-08, + "loss": 0.0002, + "step": 46056 + }, + { + "epoch": 0.89, + "learning_rate": 2.133897712710186e-08, + "loss": 0.0004, + "step": 46057 + }, + { + "epoch": 0.89, + "learning_rate": 2.1335093782765717e-08, + "loss": 0.0005, + "step": 46058 + }, + { + "epoch": 0.89, + "learning_rate": 2.1331210438429576e-08, + "loss": 0.7451, + "step": 46059 + }, + { + "epoch": 0.89, + "learning_rate": 2.1327327094093434e-08, + "loss": 0.0005, + "step": 46060 + }, + { + "epoch": 0.89, + "learning_rate": 2.132344374975729e-08, + "loss": 0.0009, + "step": 46061 + }, + { + "epoch": 0.89, + "learning_rate": 2.1319560405421147e-08, + "loss": 0.0427, + "step": 46062 + }, + { + "epoch": 0.89, + "learning_rate": 2.1315677061085005e-08, + "loss": 0.4557, + "step": 46063 + }, + { + "epoch": 0.89, + "learning_rate": 2.1311793716748863e-08, + "loss": 0.0004, + "step": 46064 + }, + { + "epoch": 0.89, + "learning_rate": 2.1307910372412722e-08, + "loss": 0.0003, + "step": 46065 + }, + { + "epoch": 0.89, + "learning_rate": 2.130402702807658e-08, + "loss": 0.0005, + "step": 46066 + }, + { + "epoch": 0.89, + "learning_rate": 2.1300143683740438e-08, + "loss": 0.0004, + "step": 46067 + }, + { + "epoch": 0.89, + "learning_rate": 2.1296260339404293e-08, + "loss": 0.1352, + "step": 46068 + }, + { + "epoch": 0.89, + "learning_rate": 2.129237699506815e-08, + "loss": 0.0003, + "step": 46069 + }, + { + "epoch": 0.89, + "learning_rate": 2.128849365073201e-08, + "loss": 0.0003, + "step": 46070 + }, + { + "epoch": 0.89, + "learning_rate": 2.1284610306395868e-08, + "loss": 0.0004, + "step": 46071 + }, + { + "epoch": 0.89, + "learning_rate": 2.1280726962059726e-08, + "loss": 0.0004, + "step": 46072 + }, + { + "epoch": 0.89, + "learning_rate": 2.1276843617723584e-08, + "loss": 0.0006, + "step": 46073 + }, + { + "epoch": 0.89, + "learning_rate": 2.1272960273387443e-08, + "loss": 0.4687, + "step": 46074 + }, + { + "epoch": 0.89, + "learning_rate": 2.1269076929051298e-08, + "loss": 0.0003, + "step": 46075 + }, + { + "epoch": 0.89, + "learning_rate": 2.1265193584715156e-08, + "loss": 0.0005, + "step": 46076 + }, + { + "epoch": 0.89, + "learning_rate": 2.1261310240379014e-08, + "loss": 0.0008, + "step": 46077 + }, + { + "epoch": 0.89, + "learning_rate": 2.1257426896042872e-08, + "loss": 0.0005, + "step": 46078 + }, + { + "epoch": 0.89, + "learning_rate": 2.125354355170673e-08, + "loss": 0.0006, + "step": 46079 + }, + { + "epoch": 0.89, + "learning_rate": 2.124966020737059e-08, + "loss": 0.0003, + "step": 46080 + }, + { + "epoch": 0.89, + "learning_rate": 2.1245776863034444e-08, + "loss": 0.0004, + "step": 46081 + }, + { + "epoch": 0.89, + "learning_rate": 2.1241893518698302e-08, + "loss": 0.0018, + "step": 46082 + }, + { + "epoch": 0.89, + "learning_rate": 2.123801017436216e-08, + "loss": 0.9662, + "step": 46083 + }, + { + "epoch": 0.89, + "learning_rate": 2.1234126830026015e-08, + "loss": 0.0004, + "step": 46084 + }, + { + "epoch": 0.89, + "learning_rate": 2.1230243485689873e-08, + "loss": 0.3149, + "step": 46085 + }, + { + "epoch": 0.89, + "learning_rate": 2.122636014135373e-08, + "loss": 0.8202, + "step": 46086 + }, + { + "epoch": 0.89, + "learning_rate": 2.122247679701759e-08, + "loss": 0.0003, + "step": 46087 + }, + { + "epoch": 0.89, + "learning_rate": 2.1218593452681448e-08, + "loss": 0.0005, + "step": 46088 + }, + { + "epoch": 0.89, + "learning_rate": 2.1214710108345306e-08, + "loss": 0.0006, + "step": 46089 + }, + { + "epoch": 0.89, + "learning_rate": 2.121082676400916e-08, + "loss": 0.0005, + "step": 46090 + }, + { + "epoch": 0.89, + "learning_rate": 2.120694341967302e-08, + "loss": 0.0301, + "step": 46091 + }, + { + "epoch": 0.89, + "learning_rate": 2.1203060075336878e-08, + "loss": 0.8509, + "step": 46092 + }, + { + "epoch": 0.89, + "learning_rate": 2.1199176731000736e-08, + "loss": 0.0005, + "step": 46093 + }, + { + "epoch": 0.89, + "learning_rate": 2.1195293386664594e-08, + "loss": 0.0004, + "step": 46094 + }, + { + "epoch": 0.89, + "learning_rate": 2.1191410042328453e-08, + "loss": 0.0045, + "step": 46095 + }, + { + "epoch": 0.89, + "learning_rate": 2.118752669799231e-08, + "loss": 0.0004, + "step": 46096 + }, + { + "epoch": 0.89, + "learning_rate": 2.1183643353656166e-08, + "loss": 0.0004, + "step": 46097 + }, + { + "epoch": 0.89, + "learning_rate": 2.1179760009320024e-08, + "loss": 0.0004, + "step": 46098 + }, + { + "epoch": 0.89, + "learning_rate": 2.1175876664983882e-08, + "loss": 0.0005, + "step": 46099 + }, + { + "epoch": 0.89, + "learning_rate": 2.117199332064774e-08, + "loss": 0.0006, + "step": 46100 + }, + { + "epoch": 0.89, + "learning_rate": 2.11681099763116e-08, + "loss": 0.0003, + "step": 46101 + }, + { + "epoch": 0.89, + "learning_rate": 2.1164226631975457e-08, + "loss": 0.0003, + "step": 46102 + }, + { + "epoch": 0.89, + "learning_rate": 2.1160343287639315e-08, + "loss": 0.0003, + "step": 46103 + }, + { + "epoch": 0.89, + "learning_rate": 2.115645994330317e-08, + "loss": 0.0005, + "step": 46104 + }, + { + "epoch": 0.89, + "learning_rate": 2.115257659896703e-08, + "loss": 0.0054, + "step": 46105 + }, + { + "epoch": 0.89, + "learning_rate": 2.1148693254630887e-08, + "loss": 0.0003, + "step": 46106 + }, + { + "epoch": 0.89, + "learning_rate": 2.1144809910294745e-08, + "loss": 0.0004, + "step": 46107 + }, + { + "epoch": 0.89, + "learning_rate": 2.1140926565958603e-08, + "loss": 0.0004, + "step": 46108 + }, + { + "epoch": 0.89, + "learning_rate": 2.113704322162246e-08, + "loss": 0.0003, + "step": 46109 + }, + { + "epoch": 0.89, + "learning_rate": 2.113315987728632e-08, + "loss": 0.0004, + "step": 46110 + }, + { + "epoch": 0.89, + "learning_rate": 2.1129276532950178e-08, + "loss": 0.0002, + "step": 46111 + }, + { + "epoch": 0.89, + "learning_rate": 2.1125393188614033e-08, + "loss": 0.0004, + "step": 46112 + }, + { + "epoch": 0.89, + "learning_rate": 2.112150984427789e-08, + "loss": 0.0004, + "step": 46113 + }, + { + "epoch": 0.89, + "learning_rate": 2.111762649994175e-08, + "loss": 0.0004, + "step": 46114 + }, + { + "epoch": 0.89, + "learning_rate": 2.1113743155605607e-08, + "loss": 0.0003, + "step": 46115 + }, + { + "epoch": 0.89, + "learning_rate": 2.1109859811269466e-08, + "loss": 0.0003, + "step": 46116 + }, + { + "epoch": 0.89, + "learning_rate": 2.1105976466933324e-08, + "loss": 0.0005, + "step": 46117 + }, + { + "epoch": 0.89, + "learning_rate": 2.1102093122597182e-08, + "loss": 0.0004, + "step": 46118 + }, + { + "epoch": 0.89, + "learning_rate": 2.1098209778261037e-08, + "loss": 0.0004, + "step": 46119 + }, + { + "epoch": 0.89, + "learning_rate": 2.1094326433924895e-08, + "loss": 0.0004, + "step": 46120 + }, + { + "epoch": 0.89, + "learning_rate": 2.1090443089588754e-08, + "loss": 0.0018, + "step": 46121 + }, + { + "epoch": 0.89, + "learning_rate": 2.1086559745252612e-08, + "loss": 0.0004, + "step": 46122 + }, + { + "epoch": 0.89, + "learning_rate": 2.108267640091647e-08, + "loss": 0.0005, + "step": 46123 + }, + { + "epoch": 0.89, + "learning_rate": 2.107879305658033e-08, + "loss": 0.0003, + "step": 46124 + }, + { + "epoch": 0.89, + "learning_rate": 2.1074909712244183e-08, + "loss": 0.0004, + "step": 46125 + }, + { + "epoch": 0.89, + "learning_rate": 2.107102636790804e-08, + "loss": 0.0003, + "step": 46126 + }, + { + "epoch": 0.89, + "learning_rate": 2.10671430235719e-08, + "loss": 0.0004, + "step": 46127 + }, + { + "epoch": 0.89, + "learning_rate": 2.1063259679235758e-08, + "loss": 0.0006, + "step": 46128 + }, + { + "epoch": 0.89, + "learning_rate": 2.1059376334899613e-08, + "loss": 0.0005, + "step": 46129 + }, + { + "epoch": 0.89, + "learning_rate": 2.105549299056347e-08, + "loss": 0.0004, + "step": 46130 + }, + { + "epoch": 0.89, + "learning_rate": 2.105160964622733e-08, + "loss": 0.0004, + "step": 46131 + }, + { + "epoch": 0.89, + "learning_rate": 2.1047726301891188e-08, + "loss": 0.0005, + "step": 46132 + }, + { + "epoch": 0.89, + "learning_rate": 2.1043842957555043e-08, + "loss": 0.689, + "step": 46133 + }, + { + "epoch": 0.89, + "learning_rate": 2.10399596132189e-08, + "loss": 0.0004, + "step": 46134 + }, + { + "epoch": 0.89, + "learning_rate": 2.103607626888276e-08, + "loss": 0.0005, + "step": 46135 + }, + { + "epoch": 0.89, + "learning_rate": 2.1032192924546617e-08, + "loss": 0.0006, + "step": 46136 + }, + { + "epoch": 0.89, + "learning_rate": 2.1028309580210476e-08, + "loss": 0.0004, + "step": 46137 + }, + { + "epoch": 0.89, + "learning_rate": 2.1024426235874334e-08, + "loss": 0.0023, + "step": 46138 + }, + { + "epoch": 0.89, + "learning_rate": 2.1020542891538192e-08, + "loss": 0.0003, + "step": 46139 + }, + { + "epoch": 0.9, + "learning_rate": 2.101665954720205e-08, + "loss": 0.0003, + "step": 46140 + }, + { + "epoch": 0.9, + "learning_rate": 2.1012776202865905e-08, + "loss": 0.0003, + "step": 46141 + }, + { + "epoch": 0.9, + "learning_rate": 2.1008892858529764e-08, + "loss": 0.0003, + "step": 46142 + }, + { + "epoch": 0.9, + "learning_rate": 2.1005009514193622e-08, + "loss": 0.0004, + "step": 46143 + }, + { + "epoch": 0.9, + "learning_rate": 2.100112616985748e-08, + "loss": 0.0005, + "step": 46144 + }, + { + "epoch": 0.9, + "learning_rate": 2.0997242825521338e-08, + "loss": 0.0003, + "step": 46145 + }, + { + "epoch": 0.9, + "learning_rate": 2.0993359481185197e-08, + "loss": 0.0005, + "step": 46146 + }, + { + "epoch": 0.9, + "learning_rate": 2.0989476136849055e-08, + "loss": 0.0003, + "step": 46147 + }, + { + "epoch": 0.9, + "learning_rate": 2.098559279251291e-08, + "loss": 0.0003, + "step": 46148 + }, + { + "epoch": 0.9, + "learning_rate": 2.0981709448176768e-08, + "loss": 0.0003, + "step": 46149 + }, + { + "epoch": 0.9, + "learning_rate": 2.0977826103840626e-08, + "loss": 0.0004, + "step": 46150 + }, + { + "epoch": 0.9, + "learning_rate": 2.0973942759504484e-08, + "loss": 0.0004, + "step": 46151 + }, + { + "epoch": 0.9, + "learning_rate": 2.0970059415168343e-08, + "loss": 0.0003, + "step": 46152 + }, + { + "epoch": 0.9, + "learning_rate": 2.09661760708322e-08, + "loss": 0.0004, + "step": 46153 + }, + { + "epoch": 0.9, + "learning_rate": 2.096229272649606e-08, + "loss": 0.0002, + "step": 46154 + }, + { + "epoch": 0.9, + "learning_rate": 2.0958409382159914e-08, + "loss": 0.0003, + "step": 46155 + }, + { + "epoch": 0.9, + "learning_rate": 2.0954526037823772e-08, + "loss": 0.001, + "step": 46156 + }, + { + "epoch": 0.9, + "learning_rate": 2.095064269348763e-08, + "loss": 0.0004, + "step": 46157 + }, + { + "epoch": 0.9, + "learning_rate": 2.094675934915149e-08, + "loss": 0.7786, + "step": 46158 + }, + { + "epoch": 0.9, + "learning_rate": 2.0942876004815347e-08, + "loss": 0.0003, + "step": 46159 + }, + { + "epoch": 0.9, + "learning_rate": 2.0938992660479205e-08, + "loss": 0.0491, + "step": 46160 + }, + { + "epoch": 0.9, + "learning_rate": 2.0935109316143064e-08, + "loss": 0.0004, + "step": 46161 + }, + { + "epoch": 0.9, + "learning_rate": 2.093122597180692e-08, + "loss": 0.0003, + "step": 46162 + }, + { + "epoch": 0.9, + "learning_rate": 2.0927342627470777e-08, + "loss": 0.0004, + "step": 46163 + }, + { + "epoch": 0.9, + "learning_rate": 2.0923459283134635e-08, + "loss": 0.6598, + "step": 46164 + }, + { + "epoch": 0.9, + "learning_rate": 2.0919575938798493e-08, + "loss": 0.0005, + "step": 46165 + }, + { + "epoch": 0.9, + "learning_rate": 2.091569259446235e-08, + "loss": 0.0003, + "step": 46166 + }, + { + "epoch": 0.9, + "learning_rate": 2.091180925012621e-08, + "loss": 0.0005, + "step": 46167 + }, + { + "epoch": 0.9, + "learning_rate": 2.0907925905790068e-08, + "loss": 0.0005, + "step": 46168 + }, + { + "epoch": 0.9, + "learning_rate": 2.0904042561453923e-08, + "loss": 0.0003, + "step": 46169 + }, + { + "epoch": 0.9, + "learning_rate": 2.090015921711778e-08, + "loss": 0.4691, + "step": 46170 + }, + { + "epoch": 0.9, + "learning_rate": 2.089627587278164e-08, + "loss": 0.0004, + "step": 46171 + }, + { + "epoch": 0.9, + "learning_rate": 2.0892392528445498e-08, + "loss": 0.1517, + "step": 46172 + }, + { + "epoch": 0.9, + "learning_rate": 2.0888509184109353e-08, + "loss": 0.0005, + "step": 46173 + }, + { + "epoch": 0.9, + "learning_rate": 2.088462583977321e-08, + "loss": 0.0005, + "step": 46174 + }, + { + "epoch": 0.9, + "learning_rate": 2.088074249543707e-08, + "loss": 0.0004, + "step": 46175 + }, + { + "epoch": 0.9, + "learning_rate": 2.0876859151100927e-08, + "loss": 0.1024, + "step": 46176 + }, + { + "epoch": 0.9, + "learning_rate": 2.0872975806764782e-08, + "loss": 0.0003, + "step": 46177 + }, + { + "epoch": 0.9, + "learning_rate": 2.086909246242864e-08, + "loss": 0.4956, + "step": 46178 + }, + { + "epoch": 0.9, + "learning_rate": 2.08652091180925e-08, + "loss": 0.405, + "step": 46179 + }, + { + "epoch": 0.9, + "learning_rate": 2.0861325773756357e-08, + "loss": 0.0005, + "step": 46180 + }, + { + "epoch": 0.9, + "learning_rate": 2.0857442429420215e-08, + "loss": 0.0004, + "step": 46181 + }, + { + "epoch": 0.9, + "learning_rate": 2.0853559085084073e-08, + "loss": 0.0004, + "step": 46182 + }, + { + "epoch": 0.9, + "learning_rate": 2.0849675740747932e-08, + "loss": 0.0004, + "step": 46183 + }, + { + "epoch": 0.9, + "learning_rate": 2.0845792396411787e-08, + "loss": 0.0004, + "step": 46184 + }, + { + "epoch": 0.9, + "learning_rate": 2.0841909052075645e-08, + "loss": 0.0005, + "step": 46185 + }, + { + "epoch": 0.9, + "learning_rate": 2.0838025707739503e-08, + "loss": 0.0007, + "step": 46186 + }, + { + "epoch": 0.9, + "learning_rate": 2.083414236340336e-08, + "loss": 0.0005, + "step": 46187 + }, + { + "epoch": 0.9, + "learning_rate": 2.083025901906722e-08, + "loss": 0.0003, + "step": 46188 + }, + { + "epoch": 0.9, + "learning_rate": 2.0826375674731078e-08, + "loss": 0.0004, + "step": 46189 + }, + { + "epoch": 0.9, + "learning_rate": 2.0822492330394936e-08, + "loss": 0.0003, + "step": 46190 + }, + { + "epoch": 0.9, + "learning_rate": 2.081860898605879e-08, + "loss": 0.0003, + "step": 46191 + }, + { + "epoch": 0.9, + "learning_rate": 2.081472564172265e-08, + "loss": 0.0004, + "step": 46192 + }, + { + "epoch": 0.9, + "learning_rate": 2.0810842297386508e-08, + "loss": 0.0004, + "step": 46193 + }, + { + "epoch": 0.9, + "learning_rate": 2.0806958953050366e-08, + "loss": 0.0004, + "step": 46194 + }, + { + "epoch": 0.9, + "learning_rate": 2.0803075608714224e-08, + "loss": 0.0003, + "step": 46195 + }, + { + "epoch": 0.9, + "learning_rate": 2.0799192264378082e-08, + "loss": 0.0003, + "step": 46196 + }, + { + "epoch": 0.9, + "learning_rate": 2.079530892004194e-08, + "loss": 0.0003, + "step": 46197 + }, + { + "epoch": 0.9, + "learning_rate": 2.07914255757058e-08, + "loss": 0.0004, + "step": 46198 + }, + { + "epoch": 0.9, + "learning_rate": 2.0787542231369654e-08, + "loss": 0.0004, + "step": 46199 + }, + { + "epoch": 0.9, + "learning_rate": 2.0783658887033512e-08, + "loss": 0.0005, + "step": 46200 + }, + { + "epoch": 0.9, + "learning_rate": 2.077977554269737e-08, + "loss": 0.4045, + "step": 46201 + }, + { + "epoch": 0.9, + "learning_rate": 2.077589219836123e-08, + "loss": 0.0003, + "step": 46202 + }, + { + "epoch": 0.9, + "learning_rate": 2.0772008854025087e-08, + "loss": 0.0004, + "step": 46203 + }, + { + "epoch": 0.9, + "learning_rate": 2.0768125509688945e-08, + "loss": 0.0004, + "step": 46204 + }, + { + "epoch": 0.9, + "learning_rate": 2.0764242165352803e-08, + "loss": 0.0003, + "step": 46205 + }, + { + "epoch": 0.9, + "learning_rate": 2.0760358821016658e-08, + "loss": 0.0004, + "step": 46206 + }, + { + "epoch": 0.9, + "learning_rate": 2.0756475476680516e-08, + "loss": 0.0047, + "step": 46207 + }, + { + "epoch": 0.9, + "learning_rate": 2.0752592132344375e-08, + "loss": 0.0003, + "step": 46208 + }, + { + "epoch": 0.9, + "learning_rate": 2.0748708788008233e-08, + "loss": 0.0004, + "step": 46209 + }, + { + "epoch": 0.9, + "learning_rate": 2.074482544367209e-08, + "loss": 0.7949, + "step": 46210 + }, + { + "epoch": 0.9, + "learning_rate": 2.074094209933595e-08, + "loss": 0.0003, + "step": 46211 + }, + { + "epoch": 0.9, + "learning_rate": 2.0737058754999808e-08, + "loss": 0.0007, + "step": 46212 + }, + { + "epoch": 0.9, + "learning_rate": 2.0733175410663662e-08, + "loss": 0.0005, + "step": 46213 + }, + { + "epoch": 0.9, + "learning_rate": 2.072929206632752e-08, + "loss": 0.7941, + "step": 46214 + }, + { + "epoch": 0.9, + "learning_rate": 2.072540872199138e-08, + "loss": 0.0006, + "step": 46215 + }, + { + "epoch": 0.9, + "learning_rate": 2.0721525377655237e-08, + "loss": 0.0003, + "step": 46216 + }, + { + "epoch": 0.9, + "learning_rate": 2.0717642033319092e-08, + "loss": 0.0003, + "step": 46217 + }, + { + "epoch": 0.9, + "learning_rate": 2.071375868898295e-08, + "loss": 0.0005, + "step": 46218 + }, + { + "epoch": 0.9, + "learning_rate": 2.070987534464681e-08, + "loss": 0.0004, + "step": 46219 + }, + { + "epoch": 0.9, + "learning_rate": 2.0705992000310667e-08, + "loss": 0.0004, + "step": 46220 + }, + { + "epoch": 0.9, + "learning_rate": 2.0702108655974522e-08, + "loss": 1.1762, + "step": 46221 + }, + { + "epoch": 0.9, + "learning_rate": 2.069822531163838e-08, + "loss": 0.0005, + "step": 46222 + }, + { + "epoch": 0.9, + "learning_rate": 2.0694341967302238e-08, + "loss": 0.0017, + "step": 46223 + }, + { + "epoch": 0.9, + "learning_rate": 2.0690458622966097e-08, + "loss": 0.0003, + "step": 46224 + }, + { + "epoch": 0.9, + "learning_rate": 2.0686575278629955e-08, + "loss": 0.0004, + "step": 46225 + }, + { + "epoch": 0.9, + "learning_rate": 2.0682691934293813e-08, + "loss": 0.0022, + "step": 46226 + }, + { + "epoch": 0.9, + "learning_rate": 2.067880858995767e-08, + "loss": 0.0004, + "step": 46227 + }, + { + "epoch": 0.9, + "learning_rate": 2.0674925245621526e-08, + "loss": 0.0004, + "step": 46228 + }, + { + "epoch": 0.9, + "learning_rate": 2.0671041901285384e-08, + "loss": 1.0337, + "step": 46229 + }, + { + "epoch": 0.9, + "learning_rate": 2.0667158556949243e-08, + "loss": 0.0003, + "step": 46230 + }, + { + "epoch": 0.9, + "learning_rate": 2.06632752126131e-08, + "loss": 0.0004, + "step": 46231 + }, + { + "epoch": 0.9, + "learning_rate": 2.065939186827696e-08, + "loss": 0.0005, + "step": 46232 + }, + { + "epoch": 0.9, + "learning_rate": 2.0655508523940817e-08, + "loss": 0.0004, + "step": 46233 + }, + { + "epoch": 0.9, + "learning_rate": 2.0651625179604676e-08, + "loss": 0.0005, + "step": 46234 + }, + { + "epoch": 0.9, + "learning_rate": 2.064774183526853e-08, + "loss": 0.0003, + "step": 46235 + }, + { + "epoch": 0.9, + "learning_rate": 2.064385849093239e-08, + "loss": 0.0004, + "step": 46236 + }, + { + "epoch": 0.9, + "learning_rate": 2.0639975146596247e-08, + "loss": 0.0003, + "step": 46237 + }, + { + "epoch": 0.9, + "learning_rate": 2.0636091802260105e-08, + "loss": 0.0003, + "step": 46238 + }, + { + "epoch": 0.9, + "learning_rate": 2.0632208457923964e-08, + "loss": 0.0005, + "step": 46239 + }, + { + "epoch": 0.9, + "learning_rate": 2.0628325113587822e-08, + "loss": 0.0003, + "step": 46240 + }, + { + "epoch": 0.9, + "learning_rate": 2.062444176925168e-08, + "loss": 0.0005, + "step": 46241 + }, + { + "epoch": 0.9, + "learning_rate": 2.0620558424915535e-08, + "loss": 0.0005, + "step": 46242 + }, + { + "epoch": 0.9, + "learning_rate": 2.0616675080579393e-08, + "loss": 0.0003, + "step": 46243 + }, + { + "epoch": 0.9, + "learning_rate": 2.061279173624325e-08, + "loss": 0.0003, + "step": 46244 + }, + { + "epoch": 0.9, + "learning_rate": 2.060890839190711e-08, + "loss": 0.0004, + "step": 46245 + }, + { + "epoch": 0.9, + "learning_rate": 2.0605025047570968e-08, + "loss": 0.0021, + "step": 46246 + }, + { + "epoch": 0.9, + "learning_rate": 2.0601141703234826e-08, + "loss": 0.0004, + "step": 46247 + }, + { + "epoch": 0.9, + "learning_rate": 2.0597258358898684e-08, + "loss": 0.0003, + "step": 46248 + }, + { + "epoch": 0.9, + "learning_rate": 2.059337501456254e-08, + "loss": 0.0003, + "step": 46249 + }, + { + "epoch": 0.9, + "learning_rate": 2.0589491670226398e-08, + "loss": 0.0003, + "step": 46250 + }, + { + "epoch": 0.9, + "learning_rate": 2.0585608325890256e-08, + "loss": 0.0003, + "step": 46251 + }, + { + "epoch": 0.9, + "learning_rate": 2.0581724981554114e-08, + "loss": 0.0004, + "step": 46252 + }, + { + "epoch": 0.9, + "learning_rate": 2.0577841637217972e-08, + "loss": 0.0004, + "step": 46253 + }, + { + "epoch": 0.9, + "learning_rate": 2.057395829288183e-08, + "loss": 0.0004, + "step": 46254 + }, + { + "epoch": 0.9, + "learning_rate": 2.057007494854569e-08, + "loss": 0.0005, + "step": 46255 + }, + { + "epoch": 0.9, + "learning_rate": 2.0566191604209547e-08, + "loss": 0.0005, + "step": 46256 + }, + { + "epoch": 0.9, + "learning_rate": 2.0562308259873402e-08, + "loss": 0.0763, + "step": 46257 + }, + { + "epoch": 0.9, + "learning_rate": 2.055842491553726e-08, + "loss": 0.0306, + "step": 46258 + }, + { + "epoch": 0.9, + "learning_rate": 2.055454157120112e-08, + "loss": 0.0002, + "step": 46259 + }, + { + "epoch": 0.9, + "learning_rate": 2.0550658226864977e-08, + "loss": 0.0003, + "step": 46260 + }, + { + "epoch": 0.9, + "learning_rate": 2.0546774882528832e-08, + "loss": 0.0003, + "step": 46261 + }, + { + "epoch": 0.9, + "learning_rate": 2.054289153819269e-08, + "loss": 0.0007, + "step": 46262 + }, + { + "epoch": 0.9, + "learning_rate": 2.0539008193856548e-08, + "loss": 0.0003, + "step": 46263 + }, + { + "epoch": 0.9, + "learning_rate": 2.0535124849520406e-08, + "loss": 0.0002, + "step": 46264 + }, + { + "epoch": 0.9, + "learning_rate": 2.053124150518426e-08, + "loss": 0.0003, + "step": 46265 + }, + { + "epoch": 0.9, + "learning_rate": 2.052735816084812e-08, + "loss": 0.0005, + "step": 46266 + }, + { + "epoch": 0.9, + "learning_rate": 2.0523474816511978e-08, + "loss": 0.0009, + "step": 46267 + }, + { + "epoch": 0.9, + "learning_rate": 2.0519591472175836e-08, + "loss": 0.0769, + "step": 46268 + }, + { + "epoch": 0.9, + "learning_rate": 2.0515708127839694e-08, + "loss": 0.0246, + "step": 46269 + }, + { + "epoch": 0.9, + "learning_rate": 2.0511824783503553e-08, + "loss": 0.8077, + "step": 46270 + }, + { + "epoch": 0.9, + "learning_rate": 2.0507941439167408e-08, + "loss": 0.0006, + "step": 46271 + }, + { + "epoch": 0.9, + "learning_rate": 2.0504058094831266e-08, + "loss": 0.0006, + "step": 46272 + }, + { + "epoch": 0.9, + "learning_rate": 2.0500174750495124e-08, + "loss": 0.0004, + "step": 46273 + }, + { + "epoch": 0.9, + "learning_rate": 2.0496291406158982e-08, + "loss": 1.3262, + "step": 46274 + }, + { + "epoch": 0.9, + "learning_rate": 2.049240806182284e-08, + "loss": 0.0004, + "step": 46275 + }, + { + "epoch": 0.9, + "learning_rate": 2.04885247174867e-08, + "loss": 0.0004, + "step": 46276 + }, + { + "epoch": 0.9, + "learning_rate": 2.0484641373150557e-08, + "loss": 0.0057, + "step": 46277 + }, + { + "epoch": 0.9, + "learning_rate": 2.0480758028814412e-08, + "loss": 0.0006, + "step": 46278 + }, + { + "epoch": 0.9, + "learning_rate": 2.047687468447827e-08, + "loss": 0.0003, + "step": 46279 + }, + { + "epoch": 0.9, + "learning_rate": 2.047299134014213e-08, + "loss": 0.0004, + "step": 46280 + }, + { + "epoch": 0.9, + "learning_rate": 2.0469107995805987e-08, + "loss": 0.0004, + "step": 46281 + }, + { + "epoch": 0.9, + "learning_rate": 2.0465224651469845e-08, + "loss": 0.0023, + "step": 46282 + }, + { + "epoch": 0.9, + "learning_rate": 2.0461341307133703e-08, + "loss": 0.0004, + "step": 46283 + }, + { + "epoch": 0.9, + "learning_rate": 2.045745796279756e-08, + "loss": 0.0033, + "step": 46284 + }, + { + "epoch": 0.9, + "learning_rate": 2.045357461846142e-08, + "loss": 0.0005, + "step": 46285 + }, + { + "epoch": 0.9, + "learning_rate": 2.0449691274125275e-08, + "loss": 0.0003, + "step": 46286 + }, + { + "epoch": 0.9, + "learning_rate": 2.0445807929789133e-08, + "loss": 0.0005, + "step": 46287 + }, + { + "epoch": 0.9, + "learning_rate": 2.044192458545299e-08, + "loss": 0.0004, + "step": 46288 + }, + { + "epoch": 0.9, + "learning_rate": 2.043804124111685e-08, + "loss": 0.0003, + "step": 46289 + }, + { + "epoch": 0.9, + "learning_rate": 2.0434157896780708e-08, + "loss": 0.0005, + "step": 46290 + }, + { + "epoch": 0.9, + "learning_rate": 2.0430274552444566e-08, + "loss": 0.0005, + "step": 46291 + }, + { + "epoch": 0.9, + "learning_rate": 2.0426391208108424e-08, + "loss": 0.0004, + "step": 46292 + }, + { + "epoch": 0.9, + "learning_rate": 2.042250786377228e-08, + "loss": 0.0003, + "step": 46293 + }, + { + "epoch": 0.9, + "learning_rate": 2.0418624519436137e-08, + "loss": 0.0004, + "step": 46294 + }, + { + "epoch": 0.9, + "learning_rate": 2.0414741175099996e-08, + "loss": 0.0006, + "step": 46295 + }, + { + "epoch": 0.9, + "learning_rate": 2.0410857830763854e-08, + "loss": 0.4244, + "step": 46296 + }, + { + "epoch": 0.9, + "learning_rate": 2.0406974486427712e-08, + "loss": 0.0133, + "step": 46297 + }, + { + "epoch": 0.9, + "learning_rate": 2.040309114209157e-08, + "loss": 0.0003, + "step": 46298 + }, + { + "epoch": 0.9, + "learning_rate": 2.039920779775543e-08, + "loss": 0.0019, + "step": 46299 + }, + { + "epoch": 0.9, + "learning_rate": 2.0395324453419283e-08, + "loss": 0.0003, + "step": 46300 + }, + { + "epoch": 0.9, + "learning_rate": 2.0391441109083142e-08, + "loss": 0.0035, + "step": 46301 + }, + { + "epoch": 0.9, + "learning_rate": 2.0387557764747e-08, + "loss": 0.0004, + "step": 46302 + }, + { + "epoch": 0.9, + "learning_rate": 2.0383674420410858e-08, + "loss": 0.0004, + "step": 46303 + }, + { + "epoch": 0.9, + "learning_rate": 2.0379791076074716e-08, + "loss": 0.0004, + "step": 46304 + }, + { + "epoch": 0.9, + "learning_rate": 2.0375907731738575e-08, + "loss": 0.0009, + "step": 46305 + }, + { + "epoch": 0.9, + "learning_rate": 2.037202438740243e-08, + "loss": 0.0003, + "step": 46306 + }, + { + "epoch": 0.9, + "learning_rate": 2.0368141043066288e-08, + "loss": 0.0005, + "step": 46307 + }, + { + "epoch": 0.9, + "learning_rate": 2.0364257698730146e-08, + "loss": 0.0007, + "step": 46308 + }, + { + "epoch": 0.9, + "learning_rate": 2.0360374354394e-08, + "loss": 0.0004, + "step": 46309 + }, + { + "epoch": 0.9, + "learning_rate": 2.035649101005786e-08, + "loss": 0.0003, + "step": 46310 + }, + { + "epoch": 0.9, + "learning_rate": 2.0352607665721717e-08, + "loss": 0.006, + "step": 46311 + }, + { + "epoch": 0.9, + "learning_rate": 2.0348724321385576e-08, + "loss": 0.0012, + "step": 46312 + }, + { + "epoch": 0.9, + "learning_rate": 2.0344840977049434e-08, + "loss": 0.0006, + "step": 46313 + }, + { + "epoch": 0.9, + "learning_rate": 2.0340957632713292e-08, + "loss": 0.0005, + "step": 46314 + }, + { + "epoch": 0.9, + "learning_rate": 2.0337074288377147e-08, + "loss": 0.0003, + "step": 46315 + }, + { + "epoch": 0.9, + "learning_rate": 2.0333190944041005e-08, + "loss": 0.0003, + "step": 46316 + }, + { + "epoch": 0.9, + "learning_rate": 2.0329307599704864e-08, + "loss": 0.0006, + "step": 46317 + }, + { + "epoch": 0.9, + "learning_rate": 2.0325424255368722e-08, + "loss": 0.0003, + "step": 46318 + }, + { + "epoch": 0.9, + "learning_rate": 2.032154091103258e-08, + "loss": 0.0004, + "step": 46319 + }, + { + "epoch": 0.9, + "learning_rate": 2.031765756669644e-08, + "loss": 0.0004, + "step": 46320 + }, + { + "epoch": 0.9, + "learning_rate": 2.0313774222360297e-08, + "loss": 0.0005, + "step": 46321 + }, + { + "epoch": 0.9, + "learning_rate": 2.030989087802415e-08, + "loss": 0.0004, + "step": 46322 + }, + { + "epoch": 0.9, + "learning_rate": 2.030600753368801e-08, + "loss": 0.0003, + "step": 46323 + }, + { + "epoch": 0.9, + "learning_rate": 2.0302124189351868e-08, + "loss": 0.0013, + "step": 46324 + }, + { + "epoch": 0.9, + "learning_rate": 2.0298240845015726e-08, + "loss": 0.0007, + "step": 46325 + }, + { + "epoch": 0.9, + "learning_rate": 2.0294357500679585e-08, + "loss": 0.0003, + "step": 46326 + }, + { + "epoch": 0.9, + "learning_rate": 2.0290474156343443e-08, + "loss": 0.0003, + "step": 46327 + }, + { + "epoch": 0.9, + "learning_rate": 2.02865908120073e-08, + "loss": 0.0005, + "step": 46328 + }, + { + "epoch": 0.9, + "learning_rate": 2.0282707467671156e-08, + "loss": 0.0003, + "step": 46329 + }, + { + "epoch": 0.9, + "learning_rate": 2.0278824123335014e-08, + "loss": 0.0021, + "step": 46330 + }, + { + "epoch": 0.9, + "learning_rate": 2.0274940778998872e-08, + "loss": 0.0003, + "step": 46331 + }, + { + "epoch": 0.9, + "learning_rate": 2.027105743466273e-08, + "loss": 0.0004, + "step": 46332 + }, + { + "epoch": 0.9, + "learning_rate": 2.026717409032659e-08, + "loss": 0.0109, + "step": 46333 + }, + { + "epoch": 0.9, + "learning_rate": 2.0263290745990447e-08, + "loss": 0.696, + "step": 46334 + }, + { + "epoch": 0.9, + "learning_rate": 2.0259407401654305e-08, + "loss": 0.0003, + "step": 46335 + }, + { + "epoch": 0.9, + "learning_rate": 2.025552405731816e-08, + "loss": 0.0004, + "step": 46336 + }, + { + "epoch": 0.9, + "learning_rate": 2.025164071298202e-08, + "loss": 0.0004, + "step": 46337 + }, + { + "epoch": 0.9, + "learning_rate": 2.0247757368645877e-08, + "loss": 0.0005, + "step": 46338 + }, + { + "epoch": 0.9, + "learning_rate": 2.0243874024309735e-08, + "loss": 0.0004, + "step": 46339 + }, + { + "epoch": 0.9, + "learning_rate": 2.0239990679973593e-08, + "loss": 0.0004, + "step": 46340 + }, + { + "epoch": 0.9, + "learning_rate": 2.023610733563745e-08, + "loss": 0.0004, + "step": 46341 + }, + { + "epoch": 0.9, + "learning_rate": 2.023222399130131e-08, + "loss": 0.0283, + "step": 46342 + }, + { + "epoch": 0.9, + "learning_rate": 2.0228340646965168e-08, + "loss": 0.0008, + "step": 46343 + }, + { + "epoch": 0.9, + "learning_rate": 2.0224457302629023e-08, + "loss": 0.0006, + "step": 46344 + }, + { + "epoch": 0.9, + "learning_rate": 2.022057395829288e-08, + "loss": 0.0005, + "step": 46345 + }, + { + "epoch": 0.9, + "learning_rate": 2.021669061395674e-08, + "loss": 0.0003, + "step": 46346 + }, + { + "epoch": 0.9, + "learning_rate": 2.0212807269620598e-08, + "loss": 0.0004, + "step": 46347 + }, + { + "epoch": 0.9, + "learning_rate": 2.0208923925284456e-08, + "loss": 0.0005, + "step": 46348 + }, + { + "epoch": 0.9, + "learning_rate": 2.0205040580948314e-08, + "loss": 0.6483, + "step": 46349 + }, + { + "epoch": 0.9, + "learning_rate": 2.020115723661217e-08, + "loss": 0.0003, + "step": 46350 + }, + { + "epoch": 0.9, + "learning_rate": 2.0197273892276027e-08, + "loss": 0.0003, + "step": 46351 + }, + { + "epoch": 0.9, + "learning_rate": 2.0193390547939886e-08, + "loss": 0.0004, + "step": 46352 + }, + { + "epoch": 0.9, + "learning_rate": 2.0189507203603744e-08, + "loss": 0.0004, + "step": 46353 + }, + { + "epoch": 0.9, + "learning_rate": 2.01856238592676e-08, + "loss": 0.0004, + "step": 46354 + }, + { + "epoch": 0.9, + "learning_rate": 2.0181740514931457e-08, + "loss": 0.0003, + "step": 46355 + }, + { + "epoch": 0.9, + "learning_rate": 2.0177857170595315e-08, + "loss": 0.001, + "step": 46356 + }, + { + "epoch": 0.9, + "learning_rate": 2.0173973826259174e-08, + "loss": 1.1739, + "step": 46357 + }, + { + "epoch": 0.9, + "learning_rate": 2.017009048192303e-08, + "loss": 0.2226, + "step": 46358 + }, + { + "epoch": 0.9, + "learning_rate": 2.0166207137586887e-08, + "loss": 0.0003, + "step": 46359 + }, + { + "epoch": 0.9, + "learning_rate": 2.0162323793250745e-08, + "loss": 0.0005, + "step": 46360 + }, + { + "epoch": 0.9, + "learning_rate": 2.0158440448914603e-08, + "loss": 0.0004, + "step": 46361 + }, + { + "epoch": 0.9, + "learning_rate": 2.015455710457846e-08, + "loss": 0.0002, + "step": 46362 + }, + { + "epoch": 0.9, + "learning_rate": 2.015067376024232e-08, + "loss": 0.0004, + "step": 46363 + }, + { + "epoch": 0.9, + "learning_rate": 2.0146790415906178e-08, + "loss": 0.0003, + "step": 46364 + }, + { + "epoch": 0.9, + "learning_rate": 2.0142907071570033e-08, + "loss": 0.0003, + "step": 46365 + }, + { + "epoch": 0.9, + "learning_rate": 2.013902372723389e-08, + "loss": 0.0003, + "step": 46366 + }, + { + "epoch": 0.9, + "learning_rate": 2.013514038289775e-08, + "loss": 0.0003, + "step": 46367 + }, + { + "epoch": 0.9, + "learning_rate": 2.0131257038561608e-08, + "loss": 0.0004, + "step": 46368 + }, + { + "epoch": 0.9, + "learning_rate": 2.0127373694225466e-08, + "loss": 0.0003, + "step": 46369 + }, + { + "epoch": 0.9, + "learning_rate": 2.0123490349889324e-08, + "loss": 0.0005, + "step": 46370 + }, + { + "epoch": 0.9, + "learning_rate": 2.0119607005553182e-08, + "loss": 0.0005, + "step": 46371 + }, + { + "epoch": 0.9, + "learning_rate": 2.011572366121704e-08, + "loss": 0.0003, + "step": 46372 + }, + { + "epoch": 0.9, + "learning_rate": 2.0111840316880896e-08, + "loss": 0.0005, + "step": 46373 + }, + { + "epoch": 0.9, + "learning_rate": 2.0107956972544754e-08, + "loss": 0.0003, + "step": 46374 + }, + { + "epoch": 0.9, + "learning_rate": 2.0104073628208612e-08, + "loss": 0.0004, + "step": 46375 + }, + { + "epoch": 0.9, + "learning_rate": 2.010019028387247e-08, + "loss": 0.0003, + "step": 46376 + }, + { + "epoch": 0.9, + "learning_rate": 2.009630693953633e-08, + "loss": 0.0004, + "step": 46377 + }, + { + "epoch": 0.9, + "learning_rate": 2.0092423595200187e-08, + "loss": 0.0003, + "step": 46378 + }, + { + "epoch": 0.9, + "learning_rate": 2.0088540250864045e-08, + "loss": 0.9031, + "step": 46379 + }, + { + "epoch": 0.9, + "learning_rate": 2.00846569065279e-08, + "loss": 0.0003, + "step": 46380 + }, + { + "epoch": 0.9, + "learning_rate": 2.0080773562191758e-08, + "loss": 0.0005, + "step": 46381 + }, + { + "epoch": 0.9, + "learning_rate": 2.0076890217855616e-08, + "loss": 0.0004, + "step": 46382 + }, + { + "epoch": 0.9, + "learning_rate": 2.0073006873519475e-08, + "loss": 0.0005, + "step": 46383 + }, + { + "epoch": 0.9, + "learning_rate": 2.0069123529183333e-08, + "loss": 0.0034, + "step": 46384 + }, + { + "epoch": 0.9, + "learning_rate": 2.006524018484719e-08, + "loss": 0.0004, + "step": 46385 + }, + { + "epoch": 0.9, + "learning_rate": 2.006135684051105e-08, + "loss": 0.0003, + "step": 46386 + }, + { + "epoch": 0.9, + "learning_rate": 2.0057473496174904e-08, + "loss": 0.2317, + "step": 46387 + }, + { + "epoch": 0.9, + "learning_rate": 2.0053590151838763e-08, + "loss": 0.4453, + "step": 46388 + }, + { + "epoch": 0.9, + "learning_rate": 2.004970680750262e-08, + "loss": 0.0004, + "step": 46389 + }, + { + "epoch": 0.9, + "learning_rate": 2.004582346316648e-08, + "loss": 0.0004, + "step": 46390 + }, + { + "epoch": 0.9, + "learning_rate": 2.0041940118830337e-08, + "loss": 0.0004, + "step": 46391 + }, + { + "epoch": 0.9, + "learning_rate": 2.0038056774494196e-08, + "loss": 0.0004, + "step": 46392 + }, + { + "epoch": 0.9, + "learning_rate": 2.0034173430158054e-08, + "loss": 0.0003, + "step": 46393 + }, + { + "epoch": 0.9, + "learning_rate": 2.003029008582191e-08, + "loss": 0.9732, + "step": 46394 + }, + { + "epoch": 0.9, + "learning_rate": 2.0026406741485767e-08, + "loss": 0.0005, + "step": 46395 + }, + { + "epoch": 0.9, + "learning_rate": 2.0022523397149625e-08, + "loss": 0.0003, + "step": 46396 + }, + { + "epoch": 0.9, + "learning_rate": 2.0018640052813483e-08, + "loss": 0.0004, + "step": 46397 + }, + { + "epoch": 0.9, + "learning_rate": 2.001475670847734e-08, + "loss": 0.0004, + "step": 46398 + }, + { + "epoch": 0.9, + "learning_rate": 2.0010873364141197e-08, + "loss": 0.0006, + "step": 46399 + }, + { + "epoch": 0.9, + "learning_rate": 2.0006990019805055e-08, + "loss": 0.0027, + "step": 46400 + }, + { + "epoch": 0.9, + "learning_rate": 2.0003106675468913e-08, + "loss": 0.0003, + "step": 46401 + }, + { + "epoch": 0.9, + "learning_rate": 1.9999223331132768e-08, + "loss": 0.0004, + "step": 46402 + }, + { + "epoch": 0.9, + "learning_rate": 1.9995339986796626e-08, + "loss": 0.0045, + "step": 46403 + }, + { + "epoch": 0.9, + "learning_rate": 1.9991456642460485e-08, + "loss": 0.0004, + "step": 46404 + }, + { + "epoch": 0.9, + "learning_rate": 1.9987573298124343e-08, + "loss": 0.0004, + "step": 46405 + }, + { + "epoch": 0.9, + "learning_rate": 1.99836899537882e-08, + "loss": 0.0004, + "step": 46406 + }, + { + "epoch": 0.9, + "learning_rate": 1.997980660945206e-08, + "loss": 0.9731, + "step": 46407 + }, + { + "epoch": 0.9, + "learning_rate": 1.9975923265115918e-08, + "loss": 0.484, + "step": 46408 + }, + { + "epoch": 0.9, + "learning_rate": 1.9972039920779772e-08, + "loss": 0.0003, + "step": 46409 + }, + { + "epoch": 0.9, + "learning_rate": 1.996815657644363e-08, + "loss": 0.0008, + "step": 46410 + }, + { + "epoch": 0.9, + "learning_rate": 1.996427323210749e-08, + "loss": 0.0004, + "step": 46411 + }, + { + "epoch": 0.9, + "learning_rate": 1.9960389887771347e-08, + "loss": 0.0003, + "step": 46412 + }, + { + "epoch": 0.9, + "learning_rate": 1.9956506543435205e-08, + "loss": 0.0003, + "step": 46413 + }, + { + "epoch": 0.9, + "learning_rate": 1.9952623199099064e-08, + "loss": 0.0003, + "step": 46414 + }, + { + "epoch": 0.9, + "learning_rate": 1.9948739854762922e-08, + "loss": 0.0003, + "step": 46415 + }, + { + "epoch": 0.9, + "learning_rate": 1.9944856510426777e-08, + "loss": 0.0003, + "step": 46416 + }, + { + "epoch": 0.9, + "learning_rate": 1.9940973166090635e-08, + "loss": 0.0003, + "step": 46417 + }, + { + "epoch": 0.9, + "learning_rate": 1.9937089821754493e-08, + "loss": 0.0005, + "step": 46418 + }, + { + "epoch": 0.9, + "learning_rate": 1.993320647741835e-08, + "loss": 0.0005, + "step": 46419 + }, + { + "epoch": 0.9, + "learning_rate": 1.992932313308221e-08, + "loss": 0.0004, + "step": 46420 + }, + { + "epoch": 0.9, + "learning_rate": 1.9925439788746068e-08, + "loss": 0.435, + "step": 46421 + }, + { + "epoch": 0.9, + "learning_rate": 1.9921556444409926e-08, + "loss": 0.0005, + "step": 46422 + }, + { + "epoch": 0.9, + "learning_rate": 1.991767310007378e-08, + "loss": 0.0006, + "step": 46423 + }, + { + "epoch": 0.9, + "learning_rate": 1.991378975573764e-08, + "loss": 0.0006, + "step": 46424 + }, + { + "epoch": 0.9, + "learning_rate": 1.9909906411401498e-08, + "loss": 1.0728, + "step": 46425 + }, + { + "epoch": 0.9, + "learning_rate": 1.9906023067065356e-08, + "loss": 0.0004, + "step": 46426 + }, + { + "epoch": 0.9, + "learning_rate": 1.9902139722729214e-08, + "loss": 0.0004, + "step": 46427 + }, + { + "epoch": 0.9, + "learning_rate": 1.9898256378393073e-08, + "loss": 0.0003, + "step": 46428 + }, + { + "epoch": 0.9, + "learning_rate": 1.989437303405693e-08, + "loss": 0.0004, + "step": 46429 + }, + { + "epoch": 0.9, + "learning_rate": 1.989048968972079e-08, + "loss": 0.0006, + "step": 46430 + }, + { + "epoch": 0.9, + "learning_rate": 1.9886606345384644e-08, + "loss": 0.0005, + "step": 46431 + }, + { + "epoch": 0.9, + "learning_rate": 1.9882723001048502e-08, + "loss": 0.7022, + "step": 46432 + }, + { + "epoch": 0.9, + "learning_rate": 1.987883965671236e-08, + "loss": 0.0066, + "step": 46433 + }, + { + "epoch": 0.9, + "learning_rate": 1.987495631237622e-08, + "loss": 0.0005, + "step": 46434 + }, + { + "epoch": 0.9, + "learning_rate": 1.9871072968040077e-08, + "loss": 0.0008, + "step": 46435 + }, + { + "epoch": 0.9, + "learning_rate": 1.9867189623703935e-08, + "loss": 0.002, + "step": 46436 + }, + { + "epoch": 0.9, + "learning_rate": 1.9863306279367793e-08, + "loss": 0.5644, + "step": 46437 + }, + { + "epoch": 0.9, + "learning_rate": 1.985942293503165e-08, + "loss": 0.2977, + "step": 46438 + }, + { + "epoch": 0.9, + "learning_rate": 1.9855539590695507e-08, + "loss": 0.0151, + "step": 46439 + }, + { + "epoch": 0.9, + "learning_rate": 1.9851656246359365e-08, + "loss": 0.2364, + "step": 46440 + }, + { + "epoch": 0.9, + "learning_rate": 1.9847772902023223e-08, + "loss": 0.0003, + "step": 46441 + }, + { + "epoch": 0.9, + "learning_rate": 1.9843889557687078e-08, + "loss": 0.0005, + "step": 46442 + }, + { + "epoch": 0.9, + "learning_rate": 1.9840006213350936e-08, + "loss": 0.0004, + "step": 46443 + }, + { + "epoch": 0.9, + "learning_rate": 1.9836122869014795e-08, + "loss": 0.1982, + "step": 46444 + }, + { + "epoch": 0.9, + "learning_rate": 1.9832239524678653e-08, + "loss": 0.0004, + "step": 46445 + }, + { + "epoch": 0.9, + "learning_rate": 1.9828356180342508e-08, + "loss": 0.0007, + "step": 46446 + }, + { + "epoch": 0.9, + "learning_rate": 1.9824472836006366e-08, + "loss": 0.0005, + "step": 46447 + }, + { + "epoch": 0.9, + "learning_rate": 1.9820589491670224e-08, + "loss": 0.0004, + "step": 46448 + }, + { + "epoch": 0.9, + "learning_rate": 1.9816706147334082e-08, + "loss": 0.0004, + "step": 46449 + }, + { + "epoch": 0.9, + "learning_rate": 1.981282280299794e-08, + "loss": 0.7327, + "step": 46450 + }, + { + "epoch": 0.9, + "learning_rate": 1.98089394586618e-08, + "loss": 0.1807, + "step": 46451 + }, + { + "epoch": 0.9, + "learning_rate": 1.9805056114325654e-08, + "loss": 0.0004, + "step": 46452 + }, + { + "epoch": 0.9, + "learning_rate": 1.9801172769989512e-08, + "loss": 0.0004, + "step": 46453 + }, + { + "epoch": 0.9, + "learning_rate": 1.979728942565337e-08, + "loss": 0.0004, + "step": 46454 + }, + { + "epoch": 0.9, + "learning_rate": 1.979340608131723e-08, + "loss": 0.0004, + "step": 46455 + }, + { + "epoch": 0.9, + "learning_rate": 1.9789522736981087e-08, + "loss": 0.0005, + "step": 46456 + }, + { + "epoch": 0.9, + "learning_rate": 1.9785639392644945e-08, + "loss": 0.0003, + "step": 46457 + }, + { + "epoch": 0.9, + "learning_rate": 1.9781756048308803e-08, + "loss": 0.0005, + "step": 46458 + }, + { + "epoch": 0.9, + "learning_rate": 1.977787270397266e-08, + "loss": 0.0003, + "step": 46459 + }, + { + "epoch": 0.9, + "learning_rate": 1.9773989359636516e-08, + "loss": 0.0004, + "step": 46460 + }, + { + "epoch": 0.9, + "learning_rate": 1.9770106015300375e-08, + "loss": 0.0011, + "step": 46461 + }, + { + "epoch": 0.9, + "learning_rate": 1.9766222670964233e-08, + "loss": 1.2094, + "step": 46462 + }, + { + "epoch": 0.9, + "learning_rate": 1.976233932662809e-08, + "loss": 0.0004, + "step": 46463 + }, + { + "epoch": 0.9, + "learning_rate": 1.975845598229195e-08, + "loss": 0.0003, + "step": 46464 + }, + { + "epoch": 0.9, + "learning_rate": 1.9754572637955808e-08, + "loss": 0.0004, + "step": 46465 + }, + { + "epoch": 0.9, + "learning_rate": 1.9750689293619666e-08, + "loss": 0.0005, + "step": 46466 + }, + { + "epoch": 0.9, + "learning_rate": 1.974680594928352e-08, + "loss": 0.0025, + "step": 46467 + }, + { + "epoch": 0.9, + "learning_rate": 1.974292260494738e-08, + "loss": 0.3113, + "step": 46468 + }, + { + "epoch": 0.9, + "learning_rate": 1.9739039260611237e-08, + "loss": 0.0075, + "step": 46469 + }, + { + "epoch": 0.9, + "learning_rate": 1.9735155916275096e-08, + "loss": 0.0004, + "step": 46470 + }, + { + "epoch": 0.9, + "learning_rate": 1.9731272571938954e-08, + "loss": 0.0005, + "step": 46471 + }, + { + "epoch": 0.9, + "learning_rate": 1.9727389227602812e-08, + "loss": 0.0004, + "step": 46472 + }, + { + "epoch": 0.9, + "learning_rate": 1.972350588326667e-08, + "loss": 0.001, + "step": 46473 + }, + { + "epoch": 0.9, + "learning_rate": 1.9719622538930525e-08, + "loss": 0.0004, + "step": 46474 + }, + { + "epoch": 0.9, + "learning_rate": 1.9715739194594384e-08, + "loss": 0.0003, + "step": 46475 + }, + { + "epoch": 0.9, + "learning_rate": 1.9711855850258242e-08, + "loss": 0.0144, + "step": 46476 + }, + { + "epoch": 0.9, + "learning_rate": 1.97079725059221e-08, + "loss": 0.0006, + "step": 46477 + }, + { + "epoch": 0.9, + "learning_rate": 1.9704089161585958e-08, + "loss": 0.0003, + "step": 46478 + }, + { + "epoch": 0.9, + "learning_rate": 1.9700205817249817e-08, + "loss": 0.0005, + "step": 46479 + }, + { + "epoch": 0.9, + "learning_rate": 1.9696322472913675e-08, + "loss": 0.0006, + "step": 46480 + }, + { + "epoch": 0.9, + "learning_rate": 1.969243912857753e-08, + "loss": 0.0005, + "step": 46481 + }, + { + "epoch": 0.9, + "learning_rate": 1.9688555784241388e-08, + "loss": 0.0003, + "step": 46482 + }, + { + "epoch": 0.9, + "learning_rate": 1.9684672439905246e-08, + "loss": 0.0022, + "step": 46483 + }, + { + "epoch": 0.9, + "learning_rate": 1.9680789095569104e-08, + "loss": 0.0003, + "step": 46484 + }, + { + "epoch": 0.9, + "learning_rate": 1.9676905751232963e-08, + "loss": 0.8425, + "step": 46485 + }, + { + "epoch": 0.9, + "learning_rate": 1.9673022406896818e-08, + "loss": 0.0004, + "step": 46486 + }, + { + "epoch": 0.9, + "learning_rate": 1.9669139062560676e-08, + "loss": 0.0054, + "step": 46487 + }, + { + "epoch": 0.9, + "learning_rate": 1.9665255718224534e-08, + "loss": 0.0003, + "step": 46488 + }, + { + "epoch": 0.9, + "learning_rate": 1.9661372373888392e-08, + "loss": 0.0003, + "step": 46489 + }, + { + "epoch": 0.9, + "learning_rate": 1.9657489029552247e-08, + "loss": 0.0096, + "step": 46490 + }, + { + "epoch": 0.9, + "learning_rate": 1.9653605685216106e-08, + "loss": 0.0004, + "step": 46491 + }, + { + "epoch": 0.9, + "learning_rate": 1.9649722340879964e-08, + "loss": 0.0007, + "step": 46492 + }, + { + "epoch": 0.9, + "learning_rate": 1.9645838996543822e-08, + "loss": 0.0003, + "step": 46493 + }, + { + "epoch": 0.9, + "learning_rate": 1.964195565220768e-08, + "loss": 0.0005, + "step": 46494 + }, + { + "epoch": 0.9, + "learning_rate": 1.963807230787154e-08, + "loss": 0.0006, + "step": 46495 + }, + { + "epoch": 0.9, + "learning_rate": 1.9634188963535393e-08, + "loss": 0.0004, + "step": 46496 + }, + { + "epoch": 0.9, + "learning_rate": 1.9630305619199252e-08, + "loss": 0.0005, + "step": 46497 + }, + { + "epoch": 0.9, + "learning_rate": 1.962642227486311e-08, + "loss": 0.0004, + "step": 46498 + }, + { + "epoch": 0.9, + "learning_rate": 1.9622538930526968e-08, + "loss": 0.0004, + "step": 46499 + }, + { + "epoch": 0.9, + "learning_rate": 1.9618655586190826e-08, + "loss": 0.0004, + "step": 46500 + }, + { + "epoch": 0.9, + "learning_rate": 1.9614772241854685e-08, + "loss": 0.0004, + "step": 46501 + }, + { + "epoch": 0.9, + "learning_rate": 1.9610888897518543e-08, + "loss": 0.0004, + "step": 46502 + }, + { + "epoch": 0.9, + "learning_rate": 1.9607005553182398e-08, + "loss": 0.0007, + "step": 46503 + }, + { + "epoch": 0.9, + "learning_rate": 1.9603122208846256e-08, + "loss": 0.0004, + "step": 46504 + }, + { + "epoch": 0.9, + "learning_rate": 1.9599238864510114e-08, + "loss": 0.0427, + "step": 46505 + }, + { + "epoch": 0.9, + "learning_rate": 1.9595355520173973e-08, + "loss": 0.0003, + "step": 46506 + }, + { + "epoch": 0.9, + "learning_rate": 1.959147217583783e-08, + "loss": 0.0004, + "step": 46507 + }, + { + "epoch": 0.9, + "learning_rate": 1.958758883150169e-08, + "loss": 0.0003, + "step": 46508 + }, + { + "epoch": 0.9, + "learning_rate": 1.9583705487165547e-08, + "loss": 0.0004, + "step": 46509 + }, + { + "epoch": 0.9, + "learning_rate": 1.9579822142829402e-08, + "loss": 0.0004, + "step": 46510 + }, + { + "epoch": 0.9, + "learning_rate": 1.957593879849326e-08, + "loss": 0.0004, + "step": 46511 + }, + { + "epoch": 0.9, + "learning_rate": 1.957205545415712e-08, + "loss": 0.0004, + "step": 46512 + }, + { + "epoch": 0.9, + "learning_rate": 1.9568172109820977e-08, + "loss": 0.0005, + "step": 46513 + }, + { + "epoch": 0.9, + "learning_rate": 1.9564288765484835e-08, + "loss": 1.0923, + "step": 46514 + }, + { + "epoch": 0.9, + "learning_rate": 1.9560405421148693e-08, + "loss": 0.0007, + "step": 46515 + }, + { + "epoch": 0.9, + "learning_rate": 1.9556522076812552e-08, + "loss": 0.0005, + "step": 46516 + }, + { + "epoch": 0.9, + "learning_rate": 1.955263873247641e-08, + "loss": 0.0004, + "step": 46517 + }, + { + "epoch": 0.9, + "learning_rate": 1.9548755388140265e-08, + "loss": 0.0003, + "step": 46518 + }, + { + "epoch": 0.9, + "learning_rate": 1.9544872043804123e-08, + "loss": 0.0005, + "step": 46519 + }, + { + "epoch": 0.9, + "learning_rate": 1.954098869946798e-08, + "loss": 0.0006, + "step": 46520 + }, + { + "epoch": 0.9, + "learning_rate": 1.953710535513184e-08, + "loss": 0.0004, + "step": 46521 + }, + { + "epoch": 0.9, + "learning_rate": 1.9533222010795698e-08, + "loss": 0.0002, + "step": 46522 + }, + { + "epoch": 0.9, + "learning_rate": 1.9529338666459556e-08, + "loss": 0.0005, + "step": 46523 + }, + { + "epoch": 0.9, + "learning_rate": 1.9525455322123414e-08, + "loss": 0.0004, + "step": 46524 + }, + { + "epoch": 0.9, + "learning_rate": 1.952157197778727e-08, + "loss": 0.0002, + "step": 46525 + }, + { + "epoch": 0.9, + "learning_rate": 1.9517688633451128e-08, + "loss": 0.0008, + "step": 46526 + }, + { + "epoch": 0.9, + "learning_rate": 1.9513805289114986e-08, + "loss": 0.0004, + "step": 46527 + }, + { + "epoch": 0.9, + "learning_rate": 1.9509921944778844e-08, + "loss": 0.0003, + "step": 46528 + }, + { + "epoch": 0.9, + "learning_rate": 1.9506038600442702e-08, + "loss": 0.0004, + "step": 46529 + }, + { + "epoch": 0.9, + "learning_rate": 1.950215525610656e-08, + "loss": 0.0006, + "step": 46530 + }, + { + "epoch": 0.9, + "learning_rate": 1.9498271911770415e-08, + "loss": 0.0005, + "step": 46531 + }, + { + "epoch": 0.9, + "learning_rate": 1.9494388567434274e-08, + "loss": 0.0006, + "step": 46532 + }, + { + "epoch": 0.9, + "learning_rate": 1.9490505223098132e-08, + "loss": 0.0003, + "step": 46533 + }, + { + "epoch": 0.9, + "learning_rate": 1.9486621878761987e-08, + "loss": 0.0003, + "step": 46534 + }, + { + "epoch": 0.9, + "learning_rate": 1.9482738534425845e-08, + "loss": 0.0005, + "step": 46535 + }, + { + "epoch": 0.9, + "learning_rate": 1.9478855190089703e-08, + "loss": 0.0003, + "step": 46536 + }, + { + "epoch": 0.9, + "learning_rate": 1.947497184575356e-08, + "loss": 0.0004, + "step": 46537 + }, + { + "epoch": 0.9, + "learning_rate": 1.947108850141742e-08, + "loss": 0.0006, + "step": 46538 + }, + { + "epoch": 0.9, + "learning_rate": 1.9467205157081275e-08, + "loss": 0.0004, + "step": 46539 + }, + { + "epoch": 0.9, + "learning_rate": 1.9463321812745133e-08, + "loss": 1.324, + "step": 46540 + }, + { + "epoch": 0.9, + "learning_rate": 1.945943846840899e-08, + "loss": 0.0003, + "step": 46541 + }, + { + "epoch": 0.9, + "learning_rate": 1.945555512407285e-08, + "loss": 0.0004, + "step": 46542 + }, + { + "epoch": 0.9, + "learning_rate": 1.9451671779736708e-08, + "loss": 0.0003, + "step": 46543 + }, + { + "epoch": 0.9, + "learning_rate": 1.9447788435400566e-08, + "loss": 0.0003, + "step": 46544 + }, + { + "epoch": 0.9, + "learning_rate": 1.9443905091064424e-08, + "loss": 0.0005, + "step": 46545 + }, + { + "epoch": 0.9, + "learning_rate": 1.9440021746728282e-08, + "loss": 1.6038, + "step": 46546 + }, + { + "epoch": 0.9, + "learning_rate": 1.9436138402392137e-08, + "loss": 0.0005, + "step": 46547 + }, + { + "epoch": 0.9, + "learning_rate": 1.9432255058055996e-08, + "loss": 0.1187, + "step": 46548 + }, + { + "epoch": 0.9, + "learning_rate": 1.9428371713719854e-08, + "loss": 0.0004, + "step": 46549 + }, + { + "epoch": 0.9, + "learning_rate": 1.9424488369383712e-08, + "loss": 0.0005, + "step": 46550 + }, + { + "epoch": 0.9, + "learning_rate": 1.942060502504757e-08, + "loss": 0.0003, + "step": 46551 + }, + { + "epoch": 0.9, + "learning_rate": 1.941672168071143e-08, + "loss": 0.8034, + "step": 46552 + }, + { + "epoch": 0.9, + "learning_rate": 1.9412838336375287e-08, + "loss": 0.0003, + "step": 46553 + }, + { + "epoch": 0.9, + "learning_rate": 1.9408954992039142e-08, + "loss": 0.0005, + "step": 46554 + }, + { + "epoch": 0.9, + "learning_rate": 1.9405071647703e-08, + "loss": 0.0004, + "step": 46555 + }, + { + "epoch": 0.9, + "learning_rate": 1.9401188303366858e-08, + "loss": 0.0004, + "step": 46556 + }, + { + "epoch": 0.9, + "learning_rate": 1.9397304959030717e-08, + "loss": 0.0005, + "step": 46557 + }, + { + "epoch": 0.9, + "learning_rate": 1.9393421614694575e-08, + "loss": 0.0004, + "step": 46558 + }, + { + "epoch": 0.9, + "learning_rate": 1.9389538270358433e-08, + "loss": 0.0006, + "step": 46559 + }, + { + "epoch": 0.9, + "learning_rate": 1.938565492602229e-08, + "loss": 0.0003, + "step": 46560 + }, + { + "epoch": 0.9, + "learning_rate": 1.9381771581686146e-08, + "loss": 0.0002, + "step": 46561 + }, + { + "epoch": 0.9, + "learning_rate": 1.9377888237350004e-08, + "loss": 0.0004, + "step": 46562 + }, + { + "epoch": 0.9, + "learning_rate": 1.9374004893013863e-08, + "loss": 0.0009, + "step": 46563 + }, + { + "epoch": 0.9, + "learning_rate": 1.937012154867772e-08, + "loss": 0.0004, + "step": 46564 + }, + { + "epoch": 0.9, + "learning_rate": 1.936623820434158e-08, + "loss": 0.0004, + "step": 46565 + }, + { + "epoch": 0.9, + "learning_rate": 1.9362354860005437e-08, + "loss": 0.0004, + "step": 46566 + }, + { + "epoch": 0.9, + "learning_rate": 1.9358471515669296e-08, + "loss": 0.0008, + "step": 46567 + }, + { + "epoch": 0.9, + "learning_rate": 1.935458817133315e-08, + "loss": 0.4507, + "step": 46568 + }, + { + "epoch": 0.9, + "learning_rate": 1.935070482699701e-08, + "loss": 0.0005, + "step": 46569 + }, + { + "epoch": 0.9, + "learning_rate": 1.9346821482660867e-08, + "loss": 0.0005, + "step": 46570 + }, + { + "epoch": 0.9, + "learning_rate": 1.9342938138324725e-08, + "loss": 0.0004, + "step": 46571 + }, + { + "epoch": 0.9, + "learning_rate": 1.9339054793988584e-08, + "loss": 0.0006, + "step": 46572 + }, + { + "epoch": 0.9, + "learning_rate": 1.9335171449652442e-08, + "loss": 0.0139, + "step": 46573 + }, + { + "epoch": 0.9, + "learning_rate": 1.93312881053163e-08, + "loss": 0.0003, + "step": 46574 + }, + { + "epoch": 0.9, + "learning_rate": 1.9327404760980155e-08, + "loss": 0.0006, + "step": 46575 + }, + { + "epoch": 0.9, + "learning_rate": 1.9323521416644013e-08, + "loss": 0.0004, + "step": 46576 + }, + { + "epoch": 0.9, + "learning_rate": 1.931963807230787e-08, + "loss": 0.0003, + "step": 46577 + }, + { + "epoch": 0.9, + "learning_rate": 1.931575472797173e-08, + "loss": 0.0004, + "step": 46578 + }, + { + "epoch": 0.9, + "learning_rate": 1.9311871383635585e-08, + "loss": 0.0005, + "step": 46579 + }, + { + "epoch": 0.9, + "learning_rate": 1.9307988039299443e-08, + "loss": 0.0004, + "step": 46580 + }, + { + "epoch": 0.9, + "learning_rate": 1.93041046949633e-08, + "loss": 0.0005, + "step": 46581 + }, + { + "epoch": 0.9, + "learning_rate": 1.930022135062716e-08, + "loss": 0.0004, + "step": 46582 + }, + { + "epoch": 0.9, + "learning_rate": 1.9296338006291014e-08, + "loss": 0.0003, + "step": 46583 + }, + { + "epoch": 0.9, + "learning_rate": 1.9292454661954873e-08, + "loss": 0.0003, + "step": 46584 + }, + { + "epoch": 0.9, + "learning_rate": 1.928857131761873e-08, + "loss": 0.0006, + "step": 46585 + }, + { + "epoch": 0.9, + "learning_rate": 1.928468797328259e-08, + "loss": 0.0004, + "step": 46586 + }, + { + "epoch": 0.9, + "learning_rate": 1.9280804628946447e-08, + "loss": 0.0003, + "step": 46587 + }, + { + "epoch": 0.9, + "learning_rate": 1.9276921284610306e-08, + "loss": 0.0002, + "step": 46588 + }, + { + "epoch": 0.9, + "learning_rate": 1.9273037940274164e-08, + "loss": 0.0004, + "step": 46589 + }, + { + "epoch": 0.9, + "learning_rate": 1.926915459593802e-08, + "loss": 0.0004, + "step": 46590 + }, + { + "epoch": 0.9, + "learning_rate": 1.9265271251601877e-08, + "loss": 0.0004, + "step": 46591 + }, + { + "epoch": 0.9, + "learning_rate": 1.9261387907265735e-08, + "loss": 0.0441, + "step": 46592 + }, + { + "epoch": 0.9, + "learning_rate": 1.9257504562929594e-08, + "loss": 0.0006, + "step": 46593 + }, + { + "epoch": 0.9, + "learning_rate": 1.9253621218593452e-08, + "loss": 0.0003, + "step": 46594 + }, + { + "epoch": 0.9, + "learning_rate": 1.924973787425731e-08, + "loss": 0.0004, + "step": 46595 + }, + { + "epoch": 0.9, + "learning_rate": 1.9245854529921168e-08, + "loss": 0.0134, + "step": 46596 + }, + { + "epoch": 0.9, + "learning_rate": 1.9241971185585023e-08, + "loss": 0.0053, + "step": 46597 + }, + { + "epoch": 0.9, + "learning_rate": 1.923808784124888e-08, + "loss": 0.0003, + "step": 46598 + }, + { + "epoch": 0.9, + "learning_rate": 1.923420449691274e-08, + "loss": 0.0004, + "step": 46599 + }, + { + "epoch": 0.9, + "learning_rate": 1.9230321152576598e-08, + "loss": 0.0004, + "step": 46600 + }, + { + "epoch": 0.9, + "learning_rate": 1.9226437808240456e-08, + "loss": 0.3212, + "step": 46601 + }, + { + "epoch": 0.9, + "learning_rate": 1.9222554463904314e-08, + "loss": 0.0003, + "step": 46602 + }, + { + "epoch": 0.9, + "learning_rate": 1.9218671119568173e-08, + "loss": 0.0004, + "step": 46603 + }, + { + "epoch": 0.9, + "learning_rate": 1.921478777523203e-08, + "loss": 0.0003, + "step": 46604 + }, + { + "epoch": 0.9, + "learning_rate": 1.9210904430895886e-08, + "loss": 0.0006, + "step": 46605 + }, + { + "epoch": 0.9, + "learning_rate": 1.9207021086559744e-08, + "loss": 0.0004, + "step": 46606 + }, + { + "epoch": 0.9, + "learning_rate": 1.9203137742223602e-08, + "loss": 0.0313, + "step": 46607 + }, + { + "epoch": 0.9, + "learning_rate": 1.919925439788746e-08, + "loss": 0.91, + "step": 46608 + }, + { + "epoch": 0.9, + "learning_rate": 1.919537105355132e-08, + "loss": 0.0007, + "step": 46609 + }, + { + "epoch": 0.9, + "learning_rate": 1.9191487709215177e-08, + "loss": 0.0005, + "step": 46610 + }, + { + "epoch": 0.9, + "learning_rate": 1.9187604364879035e-08, + "loss": 0.0003, + "step": 46611 + }, + { + "epoch": 0.9, + "learning_rate": 1.918372102054289e-08, + "loss": 0.2727, + "step": 46612 + }, + { + "epoch": 0.9, + "learning_rate": 1.917983767620675e-08, + "loss": 0.0004, + "step": 46613 + }, + { + "epoch": 0.9, + "learning_rate": 1.9175954331870607e-08, + "loss": 0.0002, + "step": 46614 + }, + { + "epoch": 0.9, + "learning_rate": 1.9172070987534465e-08, + "loss": 0.0004, + "step": 46615 + }, + { + "epoch": 0.9, + "learning_rate": 1.9168187643198323e-08, + "loss": 0.0012, + "step": 46616 + }, + { + "epoch": 0.9, + "learning_rate": 1.916430429886218e-08, + "loss": 0.0059, + "step": 46617 + }, + { + "epoch": 0.9, + "learning_rate": 1.916042095452604e-08, + "loss": 0.0011, + "step": 46618 + }, + { + "epoch": 0.9, + "learning_rate": 1.9156537610189895e-08, + "loss": 0.0003, + "step": 46619 + }, + { + "epoch": 0.9, + "learning_rate": 1.9152654265853753e-08, + "loss": 0.0011, + "step": 46620 + }, + { + "epoch": 0.9, + "learning_rate": 1.914877092151761e-08, + "loss": 0.0004, + "step": 46621 + }, + { + "epoch": 0.9, + "learning_rate": 1.914488757718147e-08, + "loss": 0.0023, + "step": 46622 + }, + { + "epoch": 0.9, + "learning_rate": 1.9141004232845324e-08, + "loss": 0.0008, + "step": 46623 + }, + { + "epoch": 0.9, + "learning_rate": 1.9137120888509183e-08, + "loss": 0.0004, + "step": 46624 + }, + { + "epoch": 0.9, + "learning_rate": 1.913323754417304e-08, + "loss": 0.0004, + "step": 46625 + }, + { + "epoch": 0.9, + "learning_rate": 1.9129354199836896e-08, + "loss": 0.0003, + "step": 46626 + }, + { + "epoch": 0.9, + "learning_rate": 1.9125470855500754e-08, + "loss": 0.0005, + "step": 46627 + }, + { + "epoch": 0.9, + "learning_rate": 1.9121587511164612e-08, + "loss": 0.0004, + "step": 46628 + }, + { + "epoch": 0.9, + "learning_rate": 1.911770416682847e-08, + "loss": 0.0003, + "step": 46629 + }, + { + "epoch": 0.9, + "learning_rate": 1.911382082249233e-08, + "loss": 0.0004, + "step": 46630 + }, + { + "epoch": 0.9, + "learning_rate": 1.9109937478156187e-08, + "loss": 0.0003, + "step": 46631 + }, + { + "epoch": 0.9, + "learning_rate": 1.9106054133820045e-08, + "loss": 0.0054, + "step": 46632 + }, + { + "epoch": 0.9, + "learning_rate": 1.9102170789483903e-08, + "loss": 0.0005, + "step": 46633 + }, + { + "epoch": 0.9, + "learning_rate": 1.909828744514776e-08, + "loss": 0.0004, + "step": 46634 + }, + { + "epoch": 0.9, + "learning_rate": 1.9094404100811617e-08, + "loss": 0.0006, + "step": 46635 + }, + { + "epoch": 0.9, + "learning_rate": 1.9090520756475475e-08, + "loss": 0.0005, + "step": 46636 + }, + { + "epoch": 0.9, + "learning_rate": 1.9086637412139333e-08, + "loss": 0.0004, + "step": 46637 + }, + { + "epoch": 0.9, + "learning_rate": 1.908275406780319e-08, + "loss": 0.0004, + "step": 46638 + }, + { + "epoch": 0.9, + "learning_rate": 1.907887072346705e-08, + "loss": 0.0003, + "step": 46639 + }, + { + "epoch": 0.9, + "learning_rate": 1.9074987379130908e-08, + "loss": 0.0004, + "step": 46640 + }, + { + "epoch": 0.9, + "learning_rate": 1.9071104034794763e-08, + "loss": 0.2547, + "step": 46641 + }, + { + "epoch": 0.9, + "learning_rate": 1.906722069045862e-08, + "loss": 0.0003, + "step": 46642 + }, + { + "epoch": 0.9, + "learning_rate": 1.906333734612248e-08, + "loss": 0.0003, + "step": 46643 + }, + { + "epoch": 0.9, + "learning_rate": 1.9059454001786337e-08, + "loss": 0.0005, + "step": 46644 + }, + { + "epoch": 0.9, + "learning_rate": 1.9055570657450196e-08, + "loss": 0.0163, + "step": 46645 + }, + { + "epoch": 0.9, + "learning_rate": 1.9051687313114054e-08, + "loss": 0.0004, + "step": 46646 + }, + { + "epoch": 0.9, + "learning_rate": 1.9047803968777912e-08, + "loss": 0.0003, + "step": 46647 + }, + { + "epoch": 0.9, + "learning_rate": 1.9043920624441767e-08, + "loss": 0.0004, + "step": 46648 + }, + { + "epoch": 0.9, + "learning_rate": 1.9040037280105625e-08, + "loss": 0.0005, + "step": 46649 + }, + { + "epoch": 0.9, + "learning_rate": 1.9036153935769484e-08, + "loss": 0.0004, + "step": 46650 + }, + { + "epoch": 0.9, + "learning_rate": 1.9032270591433342e-08, + "loss": 0.0003, + "step": 46651 + }, + { + "epoch": 0.9, + "learning_rate": 1.90283872470972e-08, + "loss": 0.0005, + "step": 46652 + }, + { + "epoch": 0.9, + "learning_rate": 1.902450390276106e-08, + "loss": 0.0004, + "step": 46653 + }, + { + "epoch": 0.9, + "learning_rate": 1.9020620558424917e-08, + "loss": 0.0003, + "step": 46654 + }, + { + "epoch": 0.91, + "learning_rate": 1.901673721408877e-08, + "loss": 0.0005, + "step": 46655 + }, + { + "epoch": 0.91, + "learning_rate": 1.901285386975263e-08, + "loss": 0.0003, + "step": 46656 + }, + { + "epoch": 0.91, + "learning_rate": 1.9008970525416488e-08, + "loss": 0.0008, + "step": 46657 + }, + { + "epoch": 0.91, + "learning_rate": 1.9005087181080346e-08, + "loss": 0.0005, + "step": 46658 + }, + { + "epoch": 0.91, + "learning_rate": 1.9001203836744205e-08, + "loss": 0.0005, + "step": 46659 + }, + { + "epoch": 0.91, + "learning_rate": 1.8997320492408063e-08, + "loss": 0.0005, + "step": 46660 + }, + { + "epoch": 0.91, + "learning_rate": 1.899343714807192e-08, + "loss": 0.0005, + "step": 46661 + }, + { + "epoch": 0.91, + "learning_rate": 1.898955380373578e-08, + "loss": 0.0006, + "step": 46662 + }, + { + "epoch": 0.91, + "learning_rate": 1.8985670459399634e-08, + "loss": 0.0824, + "step": 46663 + }, + { + "epoch": 0.91, + "learning_rate": 1.8981787115063492e-08, + "loss": 0.0003, + "step": 46664 + }, + { + "epoch": 0.91, + "learning_rate": 1.897790377072735e-08, + "loss": 0.0005, + "step": 46665 + }, + { + "epoch": 0.91, + "learning_rate": 1.897402042639121e-08, + "loss": 0.0004, + "step": 46666 + }, + { + "epoch": 0.91, + "learning_rate": 1.8970137082055064e-08, + "loss": 0.0004, + "step": 46667 + }, + { + "epoch": 0.91, + "learning_rate": 1.8966253737718922e-08, + "loss": 0.004, + "step": 46668 + }, + { + "epoch": 0.91, + "learning_rate": 1.896237039338278e-08, + "loss": 0.0006, + "step": 46669 + }, + { + "epoch": 0.91, + "learning_rate": 1.895848704904664e-08, + "loss": 0.0003, + "step": 46670 + }, + { + "epoch": 0.91, + "learning_rate": 1.8954603704710494e-08, + "loss": 0.0003, + "step": 46671 + }, + { + "epoch": 0.91, + "learning_rate": 1.8950720360374352e-08, + "loss": 0.0005, + "step": 46672 + }, + { + "epoch": 0.91, + "learning_rate": 1.894683701603821e-08, + "loss": 0.0004, + "step": 46673 + }, + { + "epoch": 0.91, + "learning_rate": 1.8942953671702068e-08, + "loss": 0.0005, + "step": 46674 + }, + { + "epoch": 0.91, + "learning_rate": 1.8939070327365927e-08, + "loss": 0.0004, + "step": 46675 + }, + { + "epoch": 0.91, + "learning_rate": 1.8935186983029785e-08, + "loss": 0.001, + "step": 46676 + }, + { + "epoch": 0.91, + "learning_rate": 1.893130363869364e-08, + "loss": 0.0002, + "step": 46677 + }, + { + "epoch": 0.91, + "learning_rate": 1.8927420294357498e-08, + "loss": 0.0003, + "step": 46678 + }, + { + "epoch": 0.91, + "learning_rate": 1.8923536950021356e-08, + "loss": 0.0082, + "step": 46679 + }, + { + "epoch": 0.91, + "learning_rate": 1.8919653605685214e-08, + "loss": 0.0004, + "step": 46680 + }, + { + "epoch": 0.91, + "learning_rate": 1.8915770261349073e-08, + "loss": 0.0004, + "step": 46681 + }, + { + "epoch": 0.91, + "learning_rate": 1.891188691701293e-08, + "loss": 0.0003, + "step": 46682 + }, + { + "epoch": 0.91, + "learning_rate": 1.890800357267679e-08, + "loss": 0.0004, + "step": 46683 + }, + { + "epoch": 0.91, + "learning_rate": 1.8904120228340644e-08, + "loss": 0.0004, + "step": 46684 + }, + { + "epoch": 0.91, + "learning_rate": 1.8900236884004502e-08, + "loss": 0.01, + "step": 46685 + }, + { + "epoch": 0.91, + "learning_rate": 1.889635353966836e-08, + "loss": 0.0003, + "step": 46686 + }, + { + "epoch": 0.91, + "learning_rate": 1.889247019533222e-08, + "loss": 0.5332, + "step": 46687 + }, + { + "epoch": 0.91, + "learning_rate": 1.8888586850996077e-08, + "loss": 0.0445, + "step": 46688 + }, + { + "epoch": 0.91, + "learning_rate": 1.8884703506659935e-08, + "loss": 0.0004, + "step": 46689 + }, + { + "epoch": 0.91, + "learning_rate": 1.8880820162323794e-08, + "loss": 0.0004, + "step": 46690 + }, + { + "epoch": 0.91, + "learning_rate": 1.8876936817987652e-08, + "loss": 0.0003, + "step": 46691 + }, + { + "epoch": 0.91, + "learning_rate": 1.8873053473651507e-08, + "loss": 0.0006, + "step": 46692 + }, + { + "epoch": 0.91, + "learning_rate": 1.8869170129315365e-08, + "loss": 0.0003, + "step": 46693 + }, + { + "epoch": 0.91, + "learning_rate": 1.8865286784979223e-08, + "loss": 0.0003, + "step": 46694 + }, + { + "epoch": 0.91, + "learning_rate": 1.886140344064308e-08, + "loss": 1.0423, + "step": 46695 + }, + { + "epoch": 0.91, + "learning_rate": 1.885752009630694e-08, + "loss": 0.0003, + "step": 46696 + }, + { + "epoch": 0.91, + "learning_rate": 1.8853636751970798e-08, + "loss": 0.0004, + "step": 46697 + }, + { + "epoch": 0.91, + "learning_rate": 1.8849753407634656e-08, + "loss": 0.0008, + "step": 46698 + }, + { + "epoch": 0.91, + "learning_rate": 1.884587006329851e-08, + "loss": 0.0004, + "step": 46699 + }, + { + "epoch": 0.91, + "learning_rate": 1.884198671896237e-08, + "loss": 0.0005, + "step": 46700 + }, + { + "epoch": 0.91, + "learning_rate": 1.8838103374626228e-08, + "loss": 0.0004, + "step": 46701 + }, + { + "epoch": 0.91, + "learning_rate": 1.8834220030290086e-08, + "loss": 0.0005, + "step": 46702 + }, + { + "epoch": 0.91, + "learning_rate": 1.8830336685953944e-08, + "loss": 0.0004, + "step": 46703 + }, + { + "epoch": 0.91, + "learning_rate": 1.8826453341617802e-08, + "loss": 0.0533, + "step": 46704 + }, + { + "epoch": 0.91, + "learning_rate": 1.882256999728166e-08, + "loss": 0.0005, + "step": 46705 + }, + { + "epoch": 0.91, + "learning_rate": 1.8818686652945516e-08, + "loss": 0.7571, + "step": 46706 + }, + { + "epoch": 0.91, + "learning_rate": 1.8814803308609374e-08, + "loss": 0.5275, + "step": 46707 + }, + { + "epoch": 0.91, + "learning_rate": 1.8810919964273232e-08, + "loss": 0.001, + "step": 46708 + }, + { + "epoch": 0.91, + "learning_rate": 1.880703661993709e-08, + "loss": 0.0003, + "step": 46709 + }, + { + "epoch": 0.91, + "learning_rate": 1.880315327560095e-08, + "loss": 0.0005, + "step": 46710 + }, + { + "epoch": 0.91, + "learning_rate": 1.8799269931264803e-08, + "loss": 0.9564, + "step": 46711 + }, + { + "epoch": 0.91, + "learning_rate": 1.8795386586928662e-08, + "loss": 0.0008, + "step": 46712 + }, + { + "epoch": 0.91, + "learning_rate": 1.879150324259252e-08, + "loss": 0.0003, + "step": 46713 + }, + { + "epoch": 0.91, + "learning_rate": 1.8787619898256378e-08, + "loss": 0.0004, + "step": 46714 + }, + { + "epoch": 0.91, + "learning_rate": 1.8783736553920233e-08, + "loss": 1.9886, + "step": 46715 + }, + { + "epoch": 0.91, + "learning_rate": 1.877985320958409e-08, + "loss": 0.0004, + "step": 46716 + }, + { + "epoch": 0.91, + "learning_rate": 1.877596986524795e-08, + "loss": 0.0004, + "step": 46717 + }, + { + "epoch": 0.91, + "learning_rate": 1.8772086520911808e-08, + "loss": 0.0003, + "step": 46718 + }, + { + "epoch": 0.91, + "learning_rate": 1.8768203176575666e-08, + "loss": 0.0004, + "step": 46719 + }, + { + "epoch": 0.91, + "learning_rate": 1.8764319832239524e-08, + "loss": 0.0004, + "step": 46720 + }, + { + "epoch": 0.91, + "learning_rate": 1.876043648790338e-08, + "loss": 0.0527, + "step": 46721 + }, + { + "epoch": 0.91, + "learning_rate": 1.8756553143567238e-08, + "loss": 0.0005, + "step": 46722 + }, + { + "epoch": 0.91, + "learning_rate": 1.8752669799231096e-08, + "loss": 0.0005, + "step": 46723 + }, + { + "epoch": 0.91, + "learning_rate": 1.8748786454894954e-08, + "loss": 0.0197, + "step": 46724 + }, + { + "epoch": 0.91, + "learning_rate": 1.8744903110558812e-08, + "loss": 0.0012, + "step": 46725 + }, + { + "epoch": 0.91, + "learning_rate": 1.874101976622267e-08, + "loss": 0.0003, + "step": 46726 + }, + { + "epoch": 0.91, + "learning_rate": 1.873713642188653e-08, + "loss": 0.0004, + "step": 46727 + }, + { + "epoch": 0.91, + "learning_rate": 1.8733253077550384e-08, + "loss": 0.0006, + "step": 46728 + }, + { + "epoch": 0.91, + "learning_rate": 1.8729369733214242e-08, + "loss": 0.0299, + "step": 46729 + }, + { + "epoch": 0.91, + "learning_rate": 1.87254863888781e-08, + "loss": 0.0006, + "step": 46730 + }, + { + "epoch": 0.91, + "learning_rate": 1.872160304454196e-08, + "loss": 0.0004, + "step": 46731 + }, + { + "epoch": 0.91, + "learning_rate": 1.8717719700205817e-08, + "loss": 0.0019, + "step": 46732 + }, + { + "epoch": 0.91, + "learning_rate": 1.8713836355869675e-08, + "loss": 0.0005, + "step": 46733 + }, + { + "epoch": 0.91, + "learning_rate": 1.8709953011533533e-08, + "loss": 0.0005, + "step": 46734 + }, + { + "epoch": 0.91, + "learning_rate": 1.8706069667197388e-08, + "loss": 0.0004, + "step": 46735 + }, + { + "epoch": 0.91, + "learning_rate": 1.8702186322861246e-08, + "loss": 0.0003, + "step": 46736 + }, + { + "epoch": 0.91, + "learning_rate": 1.8698302978525105e-08, + "loss": 0.0003, + "step": 46737 + }, + { + "epoch": 0.91, + "learning_rate": 1.8694419634188963e-08, + "loss": 0.0004, + "step": 46738 + }, + { + "epoch": 0.91, + "learning_rate": 1.869053628985282e-08, + "loss": 0.0009, + "step": 46739 + }, + { + "epoch": 0.91, + "learning_rate": 1.868665294551668e-08, + "loss": 0.0007, + "step": 46740 + }, + { + "epoch": 0.91, + "learning_rate": 1.8682769601180538e-08, + "loss": 0.0066, + "step": 46741 + }, + { + "epoch": 0.91, + "learning_rate": 1.8678886256844392e-08, + "loss": 0.0004, + "step": 46742 + }, + { + "epoch": 0.91, + "learning_rate": 1.867500291250825e-08, + "loss": 0.0004, + "step": 46743 + }, + { + "epoch": 0.91, + "learning_rate": 1.867111956817211e-08, + "loss": 0.0664, + "step": 46744 + }, + { + "epoch": 0.91, + "learning_rate": 1.8667236223835967e-08, + "loss": 0.0005, + "step": 46745 + }, + { + "epoch": 0.91, + "learning_rate": 1.8663352879499825e-08, + "loss": 0.0006, + "step": 46746 + }, + { + "epoch": 0.91, + "learning_rate": 1.8659469535163684e-08, + "loss": 0.0006, + "step": 46747 + }, + { + "epoch": 0.91, + "learning_rate": 1.8655586190827542e-08, + "loss": 0.0006, + "step": 46748 + }, + { + "epoch": 0.91, + "learning_rate": 1.86517028464914e-08, + "loss": 0.0004, + "step": 46749 + }, + { + "epoch": 0.91, + "learning_rate": 1.8647819502155255e-08, + "loss": 0.2057, + "step": 46750 + }, + { + "epoch": 0.91, + "learning_rate": 1.8643936157819113e-08, + "loss": 0.002, + "step": 46751 + }, + { + "epoch": 0.91, + "learning_rate": 1.864005281348297e-08, + "loss": 0.0004, + "step": 46752 + }, + { + "epoch": 0.91, + "learning_rate": 1.863616946914683e-08, + "loss": 0.0003, + "step": 46753 + }, + { + "epoch": 0.91, + "learning_rate": 1.8632286124810688e-08, + "loss": 0.0247, + "step": 46754 + }, + { + "epoch": 0.91, + "learning_rate": 1.8628402780474546e-08, + "loss": 0.0004, + "step": 46755 + }, + { + "epoch": 0.91, + "learning_rate": 1.86245194361384e-08, + "loss": 0.0006, + "step": 46756 + }, + { + "epoch": 0.91, + "learning_rate": 1.862063609180226e-08, + "loss": 0.0004, + "step": 46757 + }, + { + "epoch": 0.91, + "learning_rate": 1.8616752747466118e-08, + "loss": 0.0003, + "step": 46758 + }, + { + "epoch": 0.91, + "learning_rate": 1.8612869403129973e-08, + "loss": 1.2988, + "step": 46759 + }, + { + "epoch": 0.91, + "learning_rate": 1.860898605879383e-08, + "loss": 0.0007, + "step": 46760 + }, + { + "epoch": 0.91, + "learning_rate": 1.860510271445769e-08, + "loss": 1.0483, + "step": 46761 + }, + { + "epoch": 0.91, + "learning_rate": 1.8601219370121547e-08, + "loss": 0.0005, + "step": 46762 + }, + { + "epoch": 0.91, + "learning_rate": 1.8597336025785406e-08, + "loss": 0.0003, + "step": 46763 + }, + { + "epoch": 0.91, + "learning_rate": 1.859345268144926e-08, + "loss": 0.0003, + "step": 46764 + }, + { + "epoch": 0.91, + "learning_rate": 1.858956933711312e-08, + "loss": 0.0004, + "step": 46765 + }, + { + "epoch": 0.91, + "learning_rate": 1.8585685992776977e-08, + "loss": 0.0004, + "step": 46766 + }, + { + "epoch": 0.91, + "learning_rate": 1.8581802648440835e-08, + "loss": 0.0004, + "step": 46767 + }, + { + "epoch": 0.91, + "learning_rate": 1.8577919304104694e-08, + "loss": 0.0004, + "step": 46768 + }, + { + "epoch": 0.91, + "learning_rate": 1.8574035959768552e-08, + "loss": 0.0003, + "step": 46769 + }, + { + "epoch": 0.91, + "learning_rate": 1.857015261543241e-08, + "loss": 0.0004, + "step": 46770 + }, + { + "epoch": 0.91, + "learning_rate": 1.8566269271096265e-08, + "loss": 0.0005, + "step": 46771 + }, + { + "epoch": 0.91, + "learning_rate": 1.8562385926760123e-08, + "loss": 0.0003, + "step": 46772 + }, + { + "epoch": 0.91, + "learning_rate": 1.855850258242398e-08, + "loss": 0.0007, + "step": 46773 + }, + { + "epoch": 0.91, + "learning_rate": 1.855461923808784e-08, + "loss": 0.0012, + "step": 46774 + }, + { + "epoch": 0.91, + "learning_rate": 1.8550735893751698e-08, + "loss": 0.002, + "step": 46775 + }, + { + "epoch": 0.91, + "learning_rate": 1.8546852549415556e-08, + "loss": 0.9642, + "step": 46776 + }, + { + "epoch": 0.91, + "learning_rate": 1.8542969205079415e-08, + "loss": 0.0004, + "step": 46777 + }, + { + "epoch": 0.91, + "learning_rate": 1.8539085860743273e-08, + "loss": 0.0004, + "step": 46778 + }, + { + "epoch": 0.91, + "learning_rate": 1.8535202516407128e-08, + "loss": 0.0006, + "step": 46779 + }, + { + "epoch": 0.91, + "learning_rate": 1.8531319172070986e-08, + "loss": 0.0004, + "step": 46780 + }, + { + "epoch": 0.91, + "learning_rate": 1.8527435827734844e-08, + "loss": 0.0003, + "step": 46781 + }, + { + "epoch": 0.91, + "learning_rate": 1.8523552483398702e-08, + "loss": 0.0003, + "step": 46782 + }, + { + "epoch": 0.91, + "learning_rate": 1.851966913906256e-08, + "loss": 0.0003, + "step": 46783 + }, + { + "epoch": 0.91, + "learning_rate": 1.851578579472642e-08, + "loss": 0.0004, + "step": 46784 + }, + { + "epoch": 0.91, + "learning_rate": 1.8511902450390277e-08, + "loss": 0.0003, + "step": 46785 + }, + { + "epoch": 0.91, + "learning_rate": 1.8508019106054132e-08, + "loss": 0.0004, + "step": 46786 + }, + { + "epoch": 0.91, + "learning_rate": 1.850413576171799e-08, + "loss": 0.4951, + "step": 46787 + }, + { + "epoch": 0.91, + "learning_rate": 1.850025241738185e-08, + "loss": 0.0004, + "step": 46788 + }, + { + "epoch": 0.91, + "learning_rate": 1.8496369073045707e-08, + "loss": 0.0004, + "step": 46789 + }, + { + "epoch": 0.91, + "learning_rate": 1.8492485728709565e-08, + "loss": 0.0004, + "step": 46790 + }, + { + "epoch": 0.91, + "learning_rate": 1.8488602384373423e-08, + "loss": 0.0003, + "step": 46791 + }, + { + "epoch": 0.91, + "learning_rate": 1.848471904003728e-08, + "loss": 0.0006, + "step": 46792 + }, + { + "epoch": 0.91, + "learning_rate": 1.8480835695701136e-08, + "loss": 0.0019, + "step": 46793 + }, + { + "epoch": 0.91, + "learning_rate": 1.8476952351364995e-08, + "loss": 0.0003, + "step": 46794 + }, + { + "epoch": 0.91, + "learning_rate": 1.8473069007028853e-08, + "loss": 0.0329, + "step": 46795 + }, + { + "epoch": 0.91, + "learning_rate": 1.846918566269271e-08, + "loss": 0.0004, + "step": 46796 + }, + { + "epoch": 0.91, + "learning_rate": 1.846530231835657e-08, + "loss": 0.0004, + "step": 46797 + }, + { + "epoch": 0.91, + "learning_rate": 1.8461418974020428e-08, + "loss": 0.0003, + "step": 46798 + }, + { + "epoch": 0.91, + "learning_rate": 1.8457535629684286e-08, + "loss": 0.0005, + "step": 46799 + }, + { + "epoch": 0.91, + "learning_rate": 1.845365228534814e-08, + "loss": 0.0004, + "step": 46800 + }, + { + "epoch": 0.91, + "learning_rate": 1.8449768941012e-08, + "loss": 0.0005, + "step": 46801 + }, + { + "epoch": 0.91, + "learning_rate": 1.8445885596675857e-08, + "loss": 0.7148, + "step": 46802 + }, + { + "epoch": 0.91, + "learning_rate": 1.8442002252339712e-08, + "loss": 0.0005, + "step": 46803 + }, + { + "epoch": 0.91, + "learning_rate": 1.843811890800357e-08, + "loss": 0.0003, + "step": 46804 + }, + { + "epoch": 0.91, + "learning_rate": 1.843423556366743e-08, + "loss": 0.0003, + "step": 46805 + }, + { + "epoch": 0.91, + "learning_rate": 1.8430352219331287e-08, + "loss": 0.0003, + "step": 46806 + }, + { + "epoch": 0.91, + "learning_rate": 1.8426468874995145e-08, + "loss": 0.0004, + "step": 46807 + }, + { + "epoch": 0.91, + "learning_rate": 1.8422585530659e-08, + "loss": 0.0275, + "step": 46808 + }, + { + "epoch": 0.91, + "learning_rate": 1.841870218632286e-08, + "loss": 0.0003, + "step": 46809 + }, + { + "epoch": 0.91, + "learning_rate": 1.8414818841986717e-08, + "loss": 0.0003, + "step": 46810 + }, + { + "epoch": 0.91, + "learning_rate": 1.8410935497650575e-08, + "loss": 0.0003, + "step": 46811 + }, + { + "epoch": 0.91, + "learning_rate": 1.8407052153314433e-08, + "loss": 0.0004, + "step": 46812 + }, + { + "epoch": 0.91, + "learning_rate": 1.840316880897829e-08, + "loss": 0.0004, + "step": 46813 + }, + { + "epoch": 0.91, + "learning_rate": 1.839928546464215e-08, + "loss": 0.0004, + "step": 46814 + }, + { + "epoch": 0.91, + "learning_rate": 1.8395402120306005e-08, + "loss": 0.0004, + "step": 46815 + }, + { + "epoch": 0.91, + "learning_rate": 1.8391518775969863e-08, + "loss": 0.0004, + "step": 46816 + }, + { + "epoch": 0.91, + "learning_rate": 1.838763543163372e-08, + "loss": 0.0007, + "step": 46817 + }, + { + "epoch": 0.91, + "learning_rate": 1.838375208729758e-08, + "loss": 0.0201, + "step": 46818 + }, + { + "epoch": 0.91, + "learning_rate": 1.8379868742961438e-08, + "loss": 0.0003, + "step": 46819 + }, + { + "epoch": 0.91, + "learning_rate": 1.8375985398625296e-08, + "loss": 0.0004, + "step": 46820 + }, + { + "epoch": 0.91, + "learning_rate": 1.8372102054289154e-08, + "loss": 0.0005, + "step": 46821 + }, + { + "epoch": 0.91, + "learning_rate": 1.836821870995301e-08, + "loss": 0.0004, + "step": 46822 + }, + { + "epoch": 0.91, + "learning_rate": 1.8364335365616867e-08, + "loss": 0.0004, + "step": 46823 + }, + { + "epoch": 0.91, + "learning_rate": 1.8360452021280726e-08, + "loss": 0.0003, + "step": 46824 + }, + { + "epoch": 0.91, + "learning_rate": 1.8356568676944584e-08, + "loss": 0.0004, + "step": 46825 + }, + { + "epoch": 0.91, + "learning_rate": 1.8352685332608442e-08, + "loss": 0.0004, + "step": 46826 + }, + { + "epoch": 0.91, + "learning_rate": 1.83488019882723e-08, + "loss": 0.0006, + "step": 46827 + }, + { + "epoch": 0.91, + "learning_rate": 1.834491864393616e-08, + "loss": 0.0004, + "step": 46828 + }, + { + "epoch": 0.91, + "learning_rate": 1.8341035299600013e-08, + "loss": 0.0003, + "step": 46829 + }, + { + "epoch": 0.91, + "learning_rate": 1.8337151955263872e-08, + "loss": 0.0005, + "step": 46830 + }, + { + "epoch": 0.91, + "learning_rate": 1.833326861092773e-08, + "loss": 0.0005, + "step": 46831 + }, + { + "epoch": 0.91, + "learning_rate": 1.8329385266591588e-08, + "loss": 0.0004, + "step": 46832 + }, + { + "epoch": 0.91, + "learning_rate": 1.8325501922255446e-08, + "loss": 0.0004, + "step": 46833 + }, + { + "epoch": 0.91, + "learning_rate": 1.8321618577919305e-08, + "loss": 0.0006, + "step": 46834 + }, + { + "epoch": 0.91, + "learning_rate": 1.8317735233583163e-08, + "loss": 0.0003, + "step": 46835 + }, + { + "epoch": 0.91, + "learning_rate": 1.831385188924702e-08, + "loss": 0.0003, + "step": 46836 + }, + { + "epoch": 0.91, + "learning_rate": 1.8309968544910876e-08, + "loss": 0.0004, + "step": 46837 + }, + { + "epoch": 0.91, + "learning_rate": 1.8306085200574734e-08, + "loss": 0.0003, + "step": 46838 + }, + { + "epoch": 0.91, + "learning_rate": 1.8302201856238593e-08, + "loss": 0.0013, + "step": 46839 + }, + { + "epoch": 0.91, + "learning_rate": 1.829831851190245e-08, + "loss": 0.0007, + "step": 46840 + }, + { + "epoch": 0.91, + "learning_rate": 1.829443516756631e-08, + "loss": 0.0005, + "step": 46841 + }, + { + "epoch": 0.91, + "learning_rate": 1.8290551823230167e-08, + "loss": 0.0003, + "step": 46842 + }, + { + "epoch": 0.91, + "learning_rate": 1.8286668478894026e-08, + "loss": 0.0003, + "step": 46843 + }, + { + "epoch": 0.91, + "learning_rate": 1.828278513455788e-08, + "loss": 0.0004, + "step": 46844 + }, + { + "epoch": 0.91, + "learning_rate": 1.827890179022174e-08, + "loss": 0.0168, + "step": 46845 + }, + { + "epoch": 0.91, + "learning_rate": 1.8275018445885597e-08, + "loss": 0.0412, + "step": 46846 + }, + { + "epoch": 0.91, + "learning_rate": 1.8271135101549455e-08, + "loss": 0.0041, + "step": 46847 + }, + { + "epoch": 0.91, + "learning_rate": 1.826725175721331e-08, + "loss": 0.0004, + "step": 46848 + }, + { + "epoch": 0.91, + "learning_rate": 1.826336841287717e-08, + "loss": 0.0004, + "step": 46849 + }, + { + "epoch": 0.91, + "learning_rate": 1.8259485068541027e-08, + "loss": 0.0108, + "step": 46850 + }, + { + "epoch": 0.91, + "learning_rate": 1.825560172420488e-08, + "loss": 0.0029, + "step": 46851 + }, + { + "epoch": 0.91, + "learning_rate": 1.825171837986874e-08, + "loss": 0.0003, + "step": 46852 + }, + { + "epoch": 0.91, + "learning_rate": 1.8247835035532598e-08, + "loss": 0.0005, + "step": 46853 + }, + { + "epoch": 0.91, + "learning_rate": 1.8243951691196456e-08, + "loss": 0.0007, + "step": 46854 + }, + { + "epoch": 0.91, + "learning_rate": 1.8240068346860315e-08, + "loss": 0.0005, + "step": 46855 + }, + { + "epoch": 0.91, + "learning_rate": 1.8236185002524173e-08, + "loss": 0.0006, + "step": 46856 + }, + { + "epoch": 0.91, + "learning_rate": 1.823230165818803e-08, + "loss": 0.0003, + "step": 46857 + }, + { + "epoch": 0.91, + "learning_rate": 1.8228418313851886e-08, + "loss": 0.0016, + "step": 46858 + }, + { + "epoch": 0.91, + "learning_rate": 1.8224534969515744e-08, + "loss": 0.0002, + "step": 46859 + }, + { + "epoch": 0.91, + "learning_rate": 1.8220651625179602e-08, + "loss": 0.0004, + "step": 46860 + }, + { + "epoch": 0.91, + "learning_rate": 1.821676828084346e-08, + "loss": 0.1196, + "step": 46861 + }, + { + "epoch": 0.91, + "learning_rate": 1.821288493650732e-08, + "loss": 0.0005, + "step": 46862 + }, + { + "epoch": 0.91, + "learning_rate": 1.8209001592171177e-08, + "loss": 0.0004, + "step": 46863 + }, + { + "epoch": 0.91, + "learning_rate": 1.8205118247835035e-08, + "loss": 0.0004, + "step": 46864 + }, + { + "epoch": 0.91, + "learning_rate": 1.8201234903498894e-08, + "loss": 0.0025, + "step": 46865 + }, + { + "epoch": 0.91, + "learning_rate": 1.819735155916275e-08, + "loss": 0.0006, + "step": 46866 + }, + { + "epoch": 0.91, + "learning_rate": 1.8193468214826607e-08, + "loss": 0.6643, + "step": 46867 + }, + { + "epoch": 0.91, + "learning_rate": 1.8189584870490465e-08, + "loss": 0.0004, + "step": 46868 + }, + { + "epoch": 0.91, + "learning_rate": 1.8185701526154323e-08, + "loss": 0.0002, + "step": 46869 + }, + { + "epoch": 0.91, + "learning_rate": 1.818181818181818e-08, + "loss": 0.0022, + "step": 46870 + }, + { + "epoch": 0.91, + "learning_rate": 1.817793483748204e-08, + "loss": 0.0005, + "step": 46871 + }, + { + "epoch": 0.91, + "learning_rate": 1.8174051493145898e-08, + "loss": 0.0004, + "step": 46872 + }, + { + "epoch": 0.91, + "learning_rate": 1.8170168148809753e-08, + "loss": 0.0005, + "step": 46873 + }, + { + "epoch": 0.91, + "learning_rate": 1.816628480447361e-08, + "loss": 0.0005, + "step": 46874 + }, + { + "epoch": 0.91, + "learning_rate": 1.816240146013747e-08, + "loss": 0.0003, + "step": 46875 + }, + { + "epoch": 0.91, + "learning_rate": 1.8158518115801328e-08, + "loss": 0.0004, + "step": 46876 + }, + { + "epoch": 0.91, + "learning_rate": 1.8154634771465186e-08, + "loss": 0.7184, + "step": 46877 + }, + { + "epoch": 0.91, + "learning_rate": 1.8150751427129044e-08, + "loss": 0.0003, + "step": 46878 + }, + { + "epoch": 0.91, + "learning_rate": 1.8146868082792902e-08, + "loss": 0.0003, + "step": 46879 + }, + { + "epoch": 0.91, + "learning_rate": 1.8142984738456757e-08, + "loss": 0.0003, + "step": 46880 + }, + { + "epoch": 0.91, + "learning_rate": 1.8139101394120616e-08, + "loss": 0.0003, + "step": 46881 + }, + { + "epoch": 0.91, + "learning_rate": 1.8135218049784474e-08, + "loss": 0.001, + "step": 46882 + }, + { + "epoch": 0.91, + "learning_rate": 1.8131334705448332e-08, + "loss": 0.0004, + "step": 46883 + }, + { + "epoch": 0.91, + "learning_rate": 1.812745136111219e-08, + "loss": 0.0005, + "step": 46884 + }, + { + "epoch": 0.91, + "learning_rate": 1.812356801677605e-08, + "loss": 0.0004, + "step": 46885 + }, + { + "epoch": 0.91, + "learning_rate": 1.8119684672439907e-08, + "loss": 0.0004, + "step": 46886 + }, + { + "epoch": 0.91, + "learning_rate": 1.8115801328103762e-08, + "loss": 0.0005, + "step": 46887 + }, + { + "epoch": 0.91, + "learning_rate": 1.811191798376762e-08, + "loss": 0.0003, + "step": 46888 + }, + { + "epoch": 0.91, + "learning_rate": 1.8108034639431478e-08, + "loss": 0.0004, + "step": 46889 + }, + { + "epoch": 0.91, + "learning_rate": 1.8104151295095337e-08, + "loss": 0.0005, + "step": 46890 + }, + { + "epoch": 0.91, + "learning_rate": 1.8100267950759195e-08, + "loss": 0.0013, + "step": 46891 + }, + { + "epoch": 0.91, + "learning_rate": 1.809638460642305e-08, + "loss": 0.0003, + "step": 46892 + }, + { + "epoch": 0.91, + "learning_rate": 1.8092501262086908e-08, + "loss": 0.02, + "step": 46893 + }, + { + "epoch": 0.91, + "learning_rate": 1.8088617917750766e-08, + "loss": 0.0003, + "step": 46894 + }, + { + "epoch": 0.91, + "learning_rate": 1.8084734573414624e-08, + "loss": 0.0004, + "step": 46895 + }, + { + "epoch": 0.91, + "learning_rate": 1.808085122907848e-08, + "loss": 0.0003, + "step": 46896 + }, + { + "epoch": 0.91, + "learning_rate": 1.8076967884742338e-08, + "loss": 0.0005, + "step": 46897 + }, + { + "epoch": 0.91, + "learning_rate": 1.8073084540406196e-08, + "loss": 0.0004, + "step": 46898 + }, + { + "epoch": 0.91, + "learning_rate": 1.8069201196070054e-08, + "loss": 0.0002, + "step": 46899 + }, + { + "epoch": 0.91, + "learning_rate": 1.8065317851733912e-08, + "loss": 0.0003, + "step": 46900 + }, + { + "epoch": 0.91, + "learning_rate": 1.806143450739777e-08, + "loss": 0.0003, + "step": 46901 + }, + { + "epoch": 0.91, + "learning_rate": 1.8057551163061626e-08, + "loss": 1.1184, + "step": 46902 + }, + { + "epoch": 0.91, + "learning_rate": 1.8053667818725484e-08, + "loss": 0.0003, + "step": 46903 + }, + { + "epoch": 0.91, + "learning_rate": 1.8049784474389342e-08, + "loss": 1.0283, + "step": 46904 + }, + { + "epoch": 0.91, + "learning_rate": 1.80459011300532e-08, + "loss": 0.0028, + "step": 46905 + }, + { + "epoch": 0.91, + "learning_rate": 1.804201778571706e-08, + "loss": 0.0002, + "step": 46906 + }, + { + "epoch": 0.91, + "learning_rate": 1.8038134441380917e-08, + "loss": 0.0005, + "step": 46907 + }, + { + "epoch": 0.91, + "learning_rate": 1.8034251097044775e-08, + "loss": 0.0005, + "step": 46908 + }, + { + "epoch": 0.91, + "learning_rate": 1.803036775270863e-08, + "loss": 0.0003, + "step": 46909 + }, + { + "epoch": 0.91, + "learning_rate": 1.8026484408372488e-08, + "loss": 0.0003, + "step": 46910 + }, + { + "epoch": 0.91, + "learning_rate": 1.8022601064036346e-08, + "loss": 0.0004, + "step": 46911 + }, + { + "epoch": 0.91, + "learning_rate": 1.8018717719700205e-08, + "loss": 0.0009, + "step": 46912 + }, + { + "epoch": 0.91, + "learning_rate": 1.8014834375364063e-08, + "loss": 0.0004, + "step": 46913 + }, + { + "epoch": 0.91, + "learning_rate": 1.801095103102792e-08, + "loss": 0.0005, + "step": 46914 + }, + { + "epoch": 0.91, + "learning_rate": 1.800706768669178e-08, + "loss": 0.0003, + "step": 46915 + }, + { + "epoch": 0.91, + "learning_rate": 1.8003184342355634e-08, + "loss": 0.0005, + "step": 46916 + }, + { + "epoch": 0.91, + "learning_rate": 1.7999300998019493e-08, + "loss": 0.0004, + "step": 46917 + }, + { + "epoch": 0.91, + "learning_rate": 1.799541765368335e-08, + "loss": 0.0004, + "step": 46918 + }, + { + "epoch": 0.91, + "learning_rate": 1.799153430934721e-08, + "loss": 0.0003, + "step": 46919 + }, + { + "epoch": 0.91, + "learning_rate": 1.7987650965011067e-08, + "loss": 0.0006, + "step": 46920 + }, + { + "epoch": 0.91, + "learning_rate": 1.7983767620674926e-08, + "loss": 0.0005, + "step": 46921 + }, + { + "epoch": 0.91, + "learning_rate": 1.7979884276338784e-08, + "loss": 0.0003, + "step": 46922 + }, + { + "epoch": 0.91, + "learning_rate": 1.7976000932002642e-08, + "loss": 0.0004, + "step": 46923 + }, + { + "epoch": 0.91, + "learning_rate": 1.7972117587666497e-08, + "loss": 0.0003, + "step": 46924 + }, + { + "epoch": 0.91, + "learning_rate": 1.7968234243330355e-08, + "loss": 0.0009, + "step": 46925 + }, + { + "epoch": 0.91, + "learning_rate": 1.7964350898994214e-08, + "loss": 0.0003, + "step": 46926 + }, + { + "epoch": 0.91, + "learning_rate": 1.7960467554658072e-08, + "loss": 0.0006, + "step": 46927 + }, + { + "epoch": 0.91, + "learning_rate": 1.795658421032193e-08, + "loss": 0.6634, + "step": 46928 + }, + { + "epoch": 0.91, + "learning_rate": 1.7952700865985788e-08, + "loss": 0.0037, + "step": 46929 + }, + { + "epoch": 0.91, + "learning_rate": 1.7948817521649646e-08, + "loss": 0.0003, + "step": 46930 + }, + { + "epoch": 0.91, + "learning_rate": 1.79449341773135e-08, + "loss": 0.0005, + "step": 46931 + }, + { + "epoch": 0.91, + "learning_rate": 1.794105083297736e-08, + "loss": 0.0003, + "step": 46932 + }, + { + "epoch": 0.91, + "learning_rate": 1.7937167488641218e-08, + "loss": 0.0004, + "step": 46933 + }, + { + "epoch": 0.91, + "learning_rate": 1.7933284144305076e-08, + "loss": 0.0005, + "step": 46934 + }, + { + "epoch": 0.91, + "learning_rate": 1.7929400799968934e-08, + "loss": 0.0004, + "step": 46935 + }, + { + "epoch": 0.91, + "learning_rate": 1.792551745563279e-08, + "loss": 0.0005, + "step": 46936 + }, + { + "epoch": 0.91, + "learning_rate": 1.7921634111296648e-08, + "loss": 0.0003, + "step": 46937 + }, + { + "epoch": 0.91, + "learning_rate": 1.7917750766960506e-08, + "loss": 0.0006, + "step": 46938 + }, + { + "epoch": 0.91, + "learning_rate": 1.7913867422624364e-08, + "loss": 0.0005, + "step": 46939 + }, + { + "epoch": 0.91, + "learning_rate": 1.790998407828822e-08, + "loss": 0.1861, + "step": 46940 + }, + { + "epoch": 0.91, + "learning_rate": 1.7906100733952077e-08, + "loss": 0.0005, + "step": 46941 + }, + { + "epoch": 0.91, + "learning_rate": 1.7902217389615935e-08, + "loss": 0.0005, + "step": 46942 + }, + { + "epoch": 0.91, + "learning_rate": 1.7898334045279794e-08, + "loss": 0.0006, + "step": 46943 + }, + { + "epoch": 0.91, + "learning_rate": 1.7894450700943652e-08, + "loss": 0.0007, + "step": 46944 + }, + { + "epoch": 0.91, + "learning_rate": 1.7890567356607507e-08, + "loss": 0.0007, + "step": 46945 + }, + { + "epoch": 0.91, + "learning_rate": 1.7886684012271365e-08, + "loss": 0.3124, + "step": 46946 + }, + { + "epoch": 0.91, + "learning_rate": 1.7882800667935223e-08, + "loss": 0.0006, + "step": 46947 + }, + { + "epoch": 0.91, + "learning_rate": 1.787891732359908e-08, + "loss": 0.0004, + "step": 46948 + }, + { + "epoch": 0.91, + "learning_rate": 1.787503397926294e-08, + "loss": 0.0003, + "step": 46949 + }, + { + "epoch": 0.91, + "learning_rate": 1.7871150634926798e-08, + "loss": 0.0003, + "step": 46950 + }, + { + "epoch": 0.91, + "learning_rate": 1.7867267290590656e-08, + "loss": 0.0003, + "step": 46951 + }, + { + "epoch": 0.91, + "learning_rate": 1.7863383946254515e-08, + "loss": 0.0006, + "step": 46952 + }, + { + "epoch": 0.91, + "learning_rate": 1.785950060191837e-08, + "loss": 0.0003, + "step": 46953 + }, + { + "epoch": 0.91, + "learning_rate": 1.7855617257582228e-08, + "loss": 0.0003, + "step": 46954 + }, + { + "epoch": 0.91, + "learning_rate": 1.7851733913246086e-08, + "loss": 0.0003, + "step": 46955 + }, + { + "epoch": 0.91, + "learning_rate": 1.7847850568909944e-08, + "loss": 0.0005, + "step": 46956 + }, + { + "epoch": 0.91, + "learning_rate": 1.7843967224573803e-08, + "loss": 0.0006, + "step": 46957 + }, + { + "epoch": 0.91, + "learning_rate": 1.784008388023766e-08, + "loss": 0.0003, + "step": 46958 + }, + { + "epoch": 0.91, + "learning_rate": 1.783620053590152e-08, + "loss": 0.0004, + "step": 46959 + }, + { + "epoch": 0.91, + "learning_rate": 1.7832317191565374e-08, + "loss": 0.0005, + "step": 46960 + }, + { + "epoch": 0.91, + "learning_rate": 1.7828433847229232e-08, + "loss": 0.0005, + "step": 46961 + }, + { + "epoch": 0.91, + "learning_rate": 1.782455050289309e-08, + "loss": 0.0003, + "step": 46962 + }, + { + "epoch": 0.91, + "learning_rate": 1.782066715855695e-08, + "loss": 0.0598, + "step": 46963 + }, + { + "epoch": 0.91, + "learning_rate": 1.7816783814220807e-08, + "loss": 0.3556, + "step": 46964 + }, + { + "epoch": 0.91, + "learning_rate": 1.7812900469884665e-08, + "loss": 0.1765, + "step": 46965 + }, + { + "epoch": 0.91, + "learning_rate": 1.7809017125548523e-08, + "loss": 1.212, + "step": 46966 + }, + { + "epoch": 0.91, + "learning_rate": 1.780513378121238e-08, + "loss": 1.3153, + "step": 46967 + }, + { + "epoch": 0.91, + "learning_rate": 1.7801250436876237e-08, + "loss": 0.0003, + "step": 46968 + }, + { + "epoch": 0.91, + "learning_rate": 1.7797367092540095e-08, + "loss": 0.0328, + "step": 46969 + }, + { + "epoch": 0.91, + "learning_rate": 1.7793483748203953e-08, + "loss": 1.0016, + "step": 46970 + }, + { + "epoch": 0.91, + "learning_rate": 1.778960040386781e-08, + "loss": 0.0003, + "step": 46971 + }, + { + "epoch": 0.91, + "learning_rate": 1.778571705953167e-08, + "loss": 0.0043, + "step": 46972 + }, + { + "epoch": 0.91, + "learning_rate": 1.7781833715195528e-08, + "loss": 0.0004, + "step": 46973 + }, + { + "epoch": 0.91, + "learning_rate": 1.7777950370859383e-08, + "loss": 0.0003, + "step": 46974 + }, + { + "epoch": 0.91, + "learning_rate": 1.777406702652324e-08, + "loss": 0.0004, + "step": 46975 + }, + { + "epoch": 0.91, + "learning_rate": 1.77701836821871e-08, + "loss": 0.0009, + "step": 46976 + }, + { + "epoch": 0.91, + "learning_rate": 1.7766300337850957e-08, + "loss": 0.0004, + "step": 46977 + }, + { + "epoch": 0.91, + "learning_rate": 1.7762416993514816e-08, + "loss": 0.0009, + "step": 46978 + }, + { + "epoch": 0.91, + "learning_rate": 1.7758533649178674e-08, + "loss": 0.0004, + "step": 46979 + }, + { + "epoch": 0.91, + "learning_rate": 1.775465030484253e-08, + "loss": 0.0004, + "step": 46980 + }, + { + "epoch": 0.91, + "learning_rate": 1.7750766960506387e-08, + "loss": 0.0004, + "step": 46981 + }, + { + "epoch": 0.91, + "learning_rate": 1.7746883616170245e-08, + "loss": 0.0004, + "step": 46982 + }, + { + "epoch": 0.91, + "learning_rate": 1.7743000271834104e-08, + "loss": 0.2297, + "step": 46983 + }, + { + "epoch": 0.91, + "learning_rate": 1.773911692749796e-08, + "loss": 0.0005, + "step": 46984 + }, + { + "epoch": 0.91, + "learning_rate": 1.7735233583161817e-08, + "loss": 0.0006, + "step": 46985 + }, + { + "epoch": 0.91, + "learning_rate": 1.7731350238825675e-08, + "loss": 0.0005, + "step": 46986 + }, + { + "epoch": 0.91, + "learning_rate": 1.7727466894489533e-08, + "loss": 0.0004, + "step": 46987 + }, + { + "epoch": 0.91, + "learning_rate": 1.772358355015339e-08, + "loss": 0.0004, + "step": 46988 + }, + { + "epoch": 0.91, + "learning_rate": 1.7719700205817246e-08, + "loss": 0.0002, + "step": 46989 + }, + { + "epoch": 0.91, + "learning_rate": 1.7715816861481105e-08, + "loss": 0.9776, + "step": 46990 + }, + { + "epoch": 0.91, + "learning_rate": 1.7711933517144963e-08, + "loss": 0.0004, + "step": 46991 + }, + { + "epoch": 0.91, + "learning_rate": 1.770805017280882e-08, + "loss": 0.0003, + "step": 46992 + }, + { + "epoch": 0.91, + "learning_rate": 1.770416682847268e-08, + "loss": 0.0003, + "step": 46993 + }, + { + "epoch": 0.91, + "learning_rate": 1.7700283484136538e-08, + "loss": 0.0015, + "step": 46994 + }, + { + "epoch": 0.91, + "learning_rate": 1.7696400139800396e-08, + "loss": 0.0027, + "step": 46995 + }, + { + "epoch": 0.91, + "learning_rate": 1.769251679546425e-08, + "loss": 0.0004, + "step": 46996 + }, + { + "epoch": 0.91, + "learning_rate": 1.768863345112811e-08, + "loss": 0.0004, + "step": 46997 + }, + { + "epoch": 0.91, + "learning_rate": 1.7684750106791967e-08, + "loss": 0.0003, + "step": 46998 + }, + { + "epoch": 0.91, + "learning_rate": 1.7680866762455826e-08, + "loss": 0.0004, + "step": 46999 + }, + { + "epoch": 0.91, + "learning_rate": 1.7676983418119684e-08, + "loss": 0.0003, + "step": 47000 + }, + { + "epoch": 0.91, + "learning_rate": 1.7673100073783542e-08, + "loss": 0.0021, + "step": 47001 + }, + { + "epoch": 0.91, + "learning_rate": 1.76692167294474e-08, + "loss": 0.0004, + "step": 47002 + }, + { + "epoch": 0.91, + "learning_rate": 1.7665333385111255e-08, + "loss": 0.0007, + "step": 47003 + }, + { + "epoch": 0.91, + "learning_rate": 1.7661450040775114e-08, + "loss": 0.0003, + "step": 47004 + }, + { + "epoch": 0.91, + "learning_rate": 1.7657566696438972e-08, + "loss": 0.0004, + "step": 47005 + }, + { + "epoch": 0.91, + "learning_rate": 1.765368335210283e-08, + "loss": 0.0004, + "step": 47006 + }, + { + "epoch": 0.91, + "learning_rate": 1.7649800007766688e-08, + "loss": 0.0003, + "step": 47007 + }, + { + "epoch": 0.91, + "learning_rate": 1.7645916663430547e-08, + "loss": 0.0003, + "step": 47008 + }, + { + "epoch": 0.91, + "learning_rate": 1.7642033319094405e-08, + "loss": 0.0002, + "step": 47009 + }, + { + "epoch": 0.91, + "learning_rate": 1.7638149974758263e-08, + "loss": 0.0003, + "step": 47010 + }, + { + "epoch": 0.91, + "learning_rate": 1.7634266630422118e-08, + "loss": 0.0003, + "step": 47011 + }, + { + "epoch": 0.91, + "learning_rate": 1.7630383286085976e-08, + "loss": 0.0003, + "step": 47012 + }, + { + "epoch": 0.91, + "learning_rate": 1.7626499941749834e-08, + "loss": 0.0004, + "step": 47013 + }, + { + "epoch": 0.91, + "learning_rate": 1.7622616597413693e-08, + "loss": 0.0003, + "step": 47014 + }, + { + "epoch": 0.91, + "learning_rate": 1.761873325307755e-08, + "loss": 0.0004, + "step": 47015 + }, + { + "epoch": 0.91, + "learning_rate": 1.761484990874141e-08, + "loss": 0.0005, + "step": 47016 + }, + { + "epoch": 0.91, + "learning_rate": 1.7610966564405267e-08, + "loss": 0.0004, + "step": 47017 + }, + { + "epoch": 0.91, + "learning_rate": 1.7607083220069122e-08, + "loss": 0.0003, + "step": 47018 + }, + { + "epoch": 0.91, + "learning_rate": 1.760319987573298e-08, + "loss": 0.0007, + "step": 47019 + }, + { + "epoch": 0.91, + "learning_rate": 1.759931653139684e-08, + "loss": 0.0024, + "step": 47020 + }, + { + "epoch": 0.91, + "learning_rate": 1.7595433187060697e-08, + "loss": 0.0003, + "step": 47021 + }, + { + "epoch": 0.91, + "learning_rate": 1.7591549842724555e-08, + "loss": 0.0005, + "step": 47022 + }, + { + "epoch": 0.91, + "learning_rate": 1.7587666498388414e-08, + "loss": 0.0002, + "step": 47023 + }, + { + "epoch": 0.91, + "learning_rate": 1.7583783154052272e-08, + "loss": 0.0005, + "step": 47024 + }, + { + "epoch": 0.91, + "learning_rate": 1.7579899809716127e-08, + "loss": 0.0004, + "step": 47025 + }, + { + "epoch": 0.91, + "learning_rate": 1.7576016465379985e-08, + "loss": 0.0004, + "step": 47026 + }, + { + "epoch": 0.91, + "learning_rate": 1.7572133121043843e-08, + "loss": 0.0009, + "step": 47027 + }, + { + "epoch": 0.91, + "learning_rate": 1.7568249776707698e-08, + "loss": 0.0004, + "step": 47028 + }, + { + "epoch": 0.91, + "learning_rate": 1.7564366432371556e-08, + "loss": 0.0003, + "step": 47029 + }, + { + "epoch": 0.91, + "learning_rate": 1.7560483088035415e-08, + "loss": 0.0003, + "step": 47030 + }, + { + "epoch": 0.91, + "learning_rate": 1.7556599743699273e-08, + "loss": 0.0024, + "step": 47031 + }, + { + "epoch": 0.91, + "learning_rate": 1.7552716399363128e-08, + "loss": 0.0005, + "step": 47032 + }, + { + "epoch": 0.91, + "learning_rate": 1.7548833055026986e-08, + "loss": 0.0005, + "step": 47033 + }, + { + "epoch": 0.91, + "learning_rate": 1.7544949710690844e-08, + "loss": 0.0006, + "step": 47034 + }, + { + "epoch": 0.91, + "learning_rate": 1.7541066366354703e-08, + "loss": 0.0004, + "step": 47035 + }, + { + "epoch": 0.91, + "learning_rate": 1.753718302201856e-08, + "loss": 0.0003, + "step": 47036 + }, + { + "epoch": 0.91, + "learning_rate": 1.753329967768242e-08, + "loss": 1.228, + "step": 47037 + }, + { + "epoch": 0.91, + "learning_rate": 1.7529416333346277e-08, + "loss": 0.0004, + "step": 47038 + }, + { + "epoch": 0.91, + "learning_rate": 1.7525532989010136e-08, + "loss": 0.0004, + "step": 47039 + }, + { + "epoch": 0.91, + "learning_rate": 1.752164964467399e-08, + "loss": 0.0005, + "step": 47040 + }, + { + "epoch": 0.91, + "learning_rate": 1.751776630033785e-08, + "loss": 0.0011, + "step": 47041 + }, + { + "epoch": 0.91, + "learning_rate": 1.7513882956001707e-08, + "loss": 0.0003, + "step": 47042 + }, + { + "epoch": 0.91, + "learning_rate": 1.7509999611665565e-08, + "loss": 0.0173, + "step": 47043 + }, + { + "epoch": 0.91, + "learning_rate": 1.7506116267329423e-08, + "loss": 0.0004, + "step": 47044 + }, + { + "epoch": 0.91, + "learning_rate": 1.7502232922993282e-08, + "loss": 0.0005, + "step": 47045 + }, + { + "epoch": 0.91, + "learning_rate": 1.749834957865714e-08, + "loss": 0.0004, + "step": 47046 + }, + { + "epoch": 0.91, + "learning_rate": 1.7494466234320995e-08, + "loss": 0.0006, + "step": 47047 + }, + { + "epoch": 0.91, + "learning_rate": 1.7490582889984853e-08, + "loss": 0.0004, + "step": 47048 + }, + { + "epoch": 0.91, + "learning_rate": 1.748669954564871e-08, + "loss": 1.3084, + "step": 47049 + }, + { + "epoch": 0.91, + "learning_rate": 1.748281620131257e-08, + "loss": 0.0005, + "step": 47050 + }, + { + "epoch": 0.91, + "learning_rate": 1.7478932856976428e-08, + "loss": 0.0005, + "step": 47051 + }, + { + "epoch": 0.91, + "learning_rate": 1.7475049512640286e-08, + "loss": 1.8492, + "step": 47052 + }, + { + "epoch": 0.91, + "learning_rate": 1.7471166168304144e-08, + "loss": 0.0276, + "step": 47053 + }, + { + "epoch": 0.91, + "learning_rate": 1.7467282823968e-08, + "loss": 0.0008, + "step": 47054 + }, + { + "epoch": 0.91, + "learning_rate": 1.7463399479631858e-08, + "loss": 0.0004, + "step": 47055 + }, + { + "epoch": 0.91, + "learning_rate": 1.7459516135295716e-08, + "loss": 0.0004, + "step": 47056 + }, + { + "epoch": 0.91, + "learning_rate": 1.7455632790959574e-08, + "loss": 0.0004, + "step": 47057 + }, + { + "epoch": 0.91, + "learning_rate": 1.7451749446623432e-08, + "loss": 0.0003, + "step": 47058 + }, + { + "epoch": 0.91, + "learning_rate": 1.744786610228729e-08, + "loss": 0.8138, + "step": 47059 + }, + { + "epoch": 0.91, + "learning_rate": 1.744398275795115e-08, + "loss": 0.0008, + "step": 47060 + }, + { + "epoch": 0.91, + "learning_rate": 1.7440099413615004e-08, + "loss": 0.0004, + "step": 47061 + }, + { + "epoch": 0.91, + "learning_rate": 1.7436216069278862e-08, + "loss": 0.0004, + "step": 47062 + }, + { + "epoch": 0.91, + "learning_rate": 1.743233272494272e-08, + "loss": 0.0004, + "step": 47063 + }, + { + "epoch": 0.91, + "learning_rate": 1.742844938060658e-08, + "loss": 0.2274, + "step": 47064 + }, + { + "epoch": 0.91, + "learning_rate": 1.7424566036270437e-08, + "loss": 0.0005, + "step": 47065 + }, + { + "epoch": 0.91, + "learning_rate": 1.7420682691934295e-08, + "loss": 0.5798, + "step": 47066 + }, + { + "epoch": 0.91, + "learning_rate": 1.7416799347598153e-08, + "loss": 0.0004, + "step": 47067 + }, + { + "epoch": 0.91, + "learning_rate": 1.741291600326201e-08, + "loss": 0.0002, + "step": 47068 + }, + { + "epoch": 0.91, + "learning_rate": 1.7409032658925866e-08, + "loss": 0.0017, + "step": 47069 + }, + { + "epoch": 0.91, + "learning_rate": 1.7405149314589725e-08, + "loss": 0.0003, + "step": 47070 + }, + { + "epoch": 0.91, + "learning_rate": 1.7401265970253583e-08, + "loss": 0.0004, + "step": 47071 + }, + { + "epoch": 0.91, + "learning_rate": 1.739738262591744e-08, + "loss": 0.0021, + "step": 47072 + }, + { + "epoch": 0.91, + "learning_rate": 1.7393499281581296e-08, + "loss": 0.127, + "step": 47073 + }, + { + "epoch": 0.91, + "learning_rate": 1.7389615937245154e-08, + "loss": 0.0004, + "step": 47074 + }, + { + "epoch": 0.91, + "learning_rate": 1.7385732592909012e-08, + "loss": 0.0006, + "step": 47075 + }, + { + "epoch": 0.91, + "learning_rate": 1.7381849248572867e-08, + "loss": 0.0003, + "step": 47076 + }, + { + "epoch": 0.91, + "learning_rate": 1.7377965904236726e-08, + "loss": 0.6612, + "step": 47077 + }, + { + "epoch": 0.91, + "learning_rate": 1.7374082559900584e-08, + "loss": 0.0005, + "step": 47078 + }, + { + "epoch": 0.91, + "learning_rate": 1.7370199215564442e-08, + "loss": 0.0007, + "step": 47079 + }, + { + "epoch": 0.91, + "learning_rate": 1.73663158712283e-08, + "loss": 0.0006, + "step": 47080 + }, + { + "epoch": 0.91, + "learning_rate": 1.736243252689216e-08, + "loss": 0.0003, + "step": 47081 + }, + { + "epoch": 0.91, + "learning_rate": 1.7358549182556017e-08, + "loss": 0.0004, + "step": 47082 + }, + { + "epoch": 0.91, + "learning_rate": 1.7354665838219872e-08, + "loss": 0.0003, + "step": 47083 + }, + { + "epoch": 0.91, + "learning_rate": 1.735078249388373e-08, + "loss": 0.0004, + "step": 47084 + }, + { + "epoch": 0.91, + "learning_rate": 1.7346899149547588e-08, + "loss": 0.7636, + "step": 47085 + }, + { + "epoch": 0.91, + "learning_rate": 1.7343015805211447e-08, + "loss": 0.0004, + "step": 47086 + }, + { + "epoch": 0.91, + "learning_rate": 1.7339132460875305e-08, + "loss": 0.1096, + "step": 47087 + }, + { + "epoch": 0.91, + "learning_rate": 1.7335249116539163e-08, + "loss": 0.0007, + "step": 47088 + }, + { + "epoch": 0.91, + "learning_rate": 1.733136577220302e-08, + "loss": 0.0004, + "step": 47089 + }, + { + "epoch": 0.91, + "learning_rate": 1.7327482427866876e-08, + "loss": 0.0003, + "step": 47090 + }, + { + "epoch": 0.91, + "learning_rate": 1.7323599083530734e-08, + "loss": 0.0003, + "step": 47091 + }, + { + "epoch": 0.91, + "learning_rate": 1.7319715739194593e-08, + "loss": 0.0003, + "step": 47092 + }, + { + "epoch": 0.91, + "learning_rate": 1.731583239485845e-08, + "loss": 0.0004, + "step": 47093 + }, + { + "epoch": 0.91, + "learning_rate": 1.731194905052231e-08, + "loss": 0.9045, + "step": 47094 + }, + { + "epoch": 0.91, + "learning_rate": 1.7308065706186167e-08, + "loss": 0.0004, + "step": 47095 + }, + { + "epoch": 0.91, + "learning_rate": 1.7304182361850026e-08, + "loss": 0.0004, + "step": 47096 + }, + { + "epoch": 0.91, + "learning_rate": 1.7300299017513884e-08, + "loss": 0.0007, + "step": 47097 + }, + { + "epoch": 0.91, + "learning_rate": 1.729641567317774e-08, + "loss": 0.0393, + "step": 47098 + }, + { + "epoch": 0.91, + "learning_rate": 1.7292532328841597e-08, + "loss": 0.0005, + "step": 47099 + }, + { + "epoch": 0.91, + "learning_rate": 1.7288648984505455e-08, + "loss": 0.0004, + "step": 47100 + }, + { + "epoch": 0.91, + "learning_rate": 1.7284765640169314e-08, + "loss": 0.0003, + "step": 47101 + }, + { + "epoch": 0.91, + "learning_rate": 1.7280882295833172e-08, + "loss": 0.0003, + "step": 47102 + }, + { + "epoch": 0.91, + "learning_rate": 1.727699895149703e-08, + "loss": 0.0007, + "step": 47103 + }, + { + "epoch": 0.91, + "learning_rate": 1.727311560716089e-08, + "loss": 0.0003, + "step": 47104 + }, + { + "epoch": 0.91, + "learning_rate": 1.7269232262824743e-08, + "loss": 0.0005, + "step": 47105 + }, + { + "epoch": 0.91, + "learning_rate": 1.72653489184886e-08, + "loss": 0.0076, + "step": 47106 + }, + { + "epoch": 0.91, + "learning_rate": 1.726146557415246e-08, + "loss": 0.0005, + "step": 47107 + }, + { + "epoch": 0.91, + "learning_rate": 1.7257582229816318e-08, + "loss": 0.0003, + "step": 47108 + }, + { + "epoch": 0.91, + "learning_rate": 1.7253698885480176e-08, + "loss": 0.0314, + "step": 47109 + }, + { + "epoch": 0.91, + "learning_rate": 1.7249815541144035e-08, + "loss": 0.0004, + "step": 47110 + }, + { + "epoch": 0.91, + "learning_rate": 1.7245932196807893e-08, + "loss": 0.0003, + "step": 47111 + }, + { + "epoch": 0.91, + "learning_rate": 1.7242048852471748e-08, + "loss": 0.0003, + "step": 47112 + }, + { + "epoch": 0.91, + "learning_rate": 1.7238165508135606e-08, + "loss": 0.0004, + "step": 47113 + }, + { + "epoch": 0.91, + "learning_rate": 1.7234282163799464e-08, + "loss": 0.003, + "step": 47114 + }, + { + "epoch": 0.91, + "learning_rate": 1.7230398819463322e-08, + "loss": 1.2238, + "step": 47115 + }, + { + "epoch": 0.91, + "learning_rate": 1.722651547512718e-08, + "loss": 0.0004, + "step": 47116 + }, + { + "epoch": 0.91, + "learning_rate": 1.7222632130791036e-08, + "loss": 0.0004, + "step": 47117 + }, + { + "epoch": 0.91, + "learning_rate": 1.7218748786454894e-08, + "loss": 0.0005, + "step": 47118 + }, + { + "epoch": 0.91, + "learning_rate": 1.7214865442118752e-08, + "loss": 0.5175, + "step": 47119 + }, + { + "epoch": 0.91, + "learning_rate": 1.721098209778261e-08, + "loss": 0.0005, + "step": 47120 + }, + { + "epoch": 0.91, + "learning_rate": 1.7207098753446465e-08, + "loss": 0.0009, + "step": 47121 + }, + { + "epoch": 0.91, + "learning_rate": 1.7203215409110324e-08, + "loss": 0.0004, + "step": 47122 + }, + { + "epoch": 0.91, + "learning_rate": 1.7199332064774182e-08, + "loss": 0.0005, + "step": 47123 + }, + { + "epoch": 0.91, + "learning_rate": 1.719544872043804e-08, + "loss": 0.0005, + "step": 47124 + }, + { + "epoch": 0.91, + "learning_rate": 1.7191565376101898e-08, + "loss": 0.0009, + "step": 47125 + }, + { + "epoch": 0.91, + "learning_rate": 1.7187682031765756e-08, + "loss": 0.5801, + "step": 47126 + }, + { + "epoch": 0.91, + "learning_rate": 1.718379868742961e-08, + "loss": 0.0004, + "step": 47127 + }, + { + "epoch": 0.91, + "learning_rate": 1.717991534309347e-08, + "loss": 0.0005, + "step": 47128 + }, + { + "epoch": 0.91, + "learning_rate": 1.7176031998757328e-08, + "loss": 0.0009, + "step": 47129 + }, + { + "epoch": 0.91, + "learning_rate": 1.7172148654421186e-08, + "loss": 0.0003, + "step": 47130 + }, + { + "epoch": 0.91, + "learning_rate": 1.7168265310085044e-08, + "loss": 0.0004, + "step": 47131 + }, + { + "epoch": 0.91, + "learning_rate": 1.7164381965748903e-08, + "loss": 0.0004, + "step": 47132 + }, + { + "epoch": 0.91, + "learning_rate": 1.716049862141276e-08, + "loss": 0.0005, + "step": 47133 + }, + { + "epoch": 0.91, + "learning_rate": 1.7156615277076616e-08, + "loss": 0.0004, + "step": 47134 + }, + { + "epoch": 0.91, + "learning_rate": 1.7152731932740474e-08, + "loss": 0.0004, + "step": 47135 + }, + { + "epoch": 0.91, + "learning_rate": 1.7148848588404332e-08, + "loss": 0.0004, + "step": 47136 + }, + { + "epoch": 0.91, + "learning_rate": 1.714496524406819e-08, + "loss": 0.0006, + "step": 47137 + }, + { + "epoch": 0.91, + "learning_rate": 1.714108189973205e-08, + "loss": 0.0005, + "step": 47138 + }, + { + "epoch": 0.91, + "learning_rate": 1.7137198555395907e-08, + "loss": 0.0004, + "step": 47139 + }, + { + "epoch": 0.91, + "learning_rate": 1.7133315211059765e-08, + "loss": 0.0004, + "step": 47140 + }, + { + "epoch": 0.91, + "learning_rate": 1.712943186672362e-08, + "loss": 0.0005, + "step": 47141 + }, + { + "epoch": 0.91, + "learning_rate": 1.712554852238748e-08, + "loss": 1.1494, + "step": 47142 + }, + { + "epoch": 0.91, + "learning_rate": 1.7121665178051337e-08, + "loss": 0.2443, + "step": 47143 + }, + { + "epoch": 0.91, + "learning_rate": 1.7117781833715195e-08, + "loss": 1.1547, + "step": 47144 + }, + { + "epoch": 0.91, + "learning_rate": 1.7113898489379053e-08, + "loss": 0.0008, + "step": 47145 + }, + { + "epoch": 0.91, + "learning_rate": 1.711001514504291e-08, + "loss": 0.0003, + "step": 47146 + }, + { + "epoch": 0.91, + "learning_rate": 1.710613180070677e-08, + "loss": 0.0003, + "step": 47147 + }, + { + "epoch": 0.91, + "learning_rate": 1.7102248456370625e-08, + "loss": 0.0003, + "step": 47148 + }, + { + "epoch": 0.91, + "learning_rate": 1.7098365112034483e-08, + "loss": 0.0006, + "step": 47149 + }, + { + "epoch": 0.91, + "learning_rate": 1.709448176769834e-08, + "loss": 0.0003, + "step": 47150 + }, + { + "epoch": 0.91, + "learning_rate": 1.70905984233622e-08, + "loss": 0.0004, + "step": 47151 + }, + { + "epoch": 0.91, + "learning_rate": 1.7086715079026058e-08, + "loss": 0.0003, + "step": 47152 + }, + { + "epoch": 0.91, + "learning_rate": 1.7082831734689916e-08, + "loss": 0.0004, + "step": 47153 + }, + { + "epoch": 0.91, + "learning_rate": 1.7078948390353774e-08, + "loss": 0.4236, + "step": 47154 + }, + { + "epoch": 0.91, + "learning_rate": 1.7075065046017632e-08, + "loss": 0.0002, + "step": 47155 + }, + { + "epoch": 0.91, + "learning_rate": 1.7071181701681487e-08, + "loss": 0.1044, + "step": 47156 + }, + { + "epoch": 0.91, + "learning_rate": 1.7067298357345346e-08, + "loss": 0.0004, + "step": 47157 + }, + { + "epoch": 0.91, + "learning_rate": 1.7063415013009204e-08, + "loss": 0.0005, + "step": 47158 + }, + { + "epoch": 0.91, + "learning_rate": 1.7059531668673062e-08, + "loss": 0.0003, + "step": 47159 + }, + { + "epoch": 0.91, + "learning_rate": 1.705564832433692e-08, + "loss": 0.0003, + "step": 47160 + }, + { + "epoch": 0.91, + "learning_rate": 1.7051764980000775e-08, + "loss": 0.0006, + "step": 47161 + }, + { + "epoch": 0.91, + "learning_rate": 1.7047881635664633e-08, + "loss": 0.0004, + "step": 47162 + }, + { + "epoch": 0.91, + "learning_rate": 1.7043998291328492e-08, + "loss": 0.172, + "step": 47163 + }, + { + "epoch": 0.91, + "learning_rate": 1.704011494699235e-08, + "loss": 0.0005, + "step": 47164 + }, + { + "epoch": 0.91, + "learning_rate": 1.7036231602656205e-08, + "loss": 0.7883, + "step": 47165 + }, + { + "epoch": 0.91, + "learning_rate": 1.7032348258320063e-08, + "loss": 0.7641, + "step": 47166 + }, + { + "epoch": 0.91, + "learning_rate": 1.702846491398392e-08, + "loss": 0.0003, + "step": 47167 + }, + { + "epoch": 0.91, + "learning_rate": 1.702458156964778e-08, + "loss": 0.0003, + "step": 47168 + }, + { + "epoch": 0.91, + "learning_rate": 1.7020698225311638e-08, + "loss": 0.0083, + "step": 47169 + }, + { + "epoch": 0.91, + "learning_rate": 1.7016814880975493e-08, + "loss": 0.0005, + "step": 47170 + }, + { + "epoch": 0.92, + "learning_rate": 1.701293153663935e-08, + "loss": 0.0004, + "step": 47171 + }, + { + "epoch": 0.92, + "learning_rate": 1.700904819230321e-08, + "loss": 1.1918, + "step": 47172 + }, + { + "epoch": 0.92, + "learning_rate": 1.7005164847967068e-08, + "loss": 0.0004, + "step": 47173 + }, + { + "epoch": 0.92, + "learning_rate": 1.7001281503630926e-08, + "loss": 0.0086, + "step": 47174 + }, + { + "epoch": 0.92, + "learning_rate": 1.6997398159294784e-08, + "loss": 0.0004, + "step": 47175 + }, + { + "epoch": 0.92, + "learning_rate": 1.6993514814958642e-08, + "loss": 0.0007, + "step": 47176 + }, + { + "epoch": 0.92, + "learning_rate": 1.6989631470622497e-08, + "loss": 0.0003, + "step": 47177 + }, + { + "epoch": 0.92, + "learning_rate": 1.6985748126286355e-08, + "loss": 0.0003, + "step": 47178 + }, + { + "epoch": 0.92, + "learning_rate": 1.6981864781950214e-08, + "loss": 1.066, + "step": 47179 + }, + { + "epoch": 0.92, + "learning_rate": 1.6977981437614072e-08, + "loss": 0.0003, + "step": 47180 + }, + { + "epoch": 0.92, + "learning_rate": 1.697409809327793e-08, + "loss": 0.5824, + "step": 47181 + }, + { + "epoch": 0.92, + "learning_rate": 1.697021474894179e-08, + "loss": 0.0004, + "step": 47182 + }, + { + "epoch": 0.92, + "learning_rate": 1.6966331404605647e-08, + "loss": 0.0004, + "step": 47183 + }, + { + "epoch": 0.92, + "learning_rate": 1.6962448060269505e-08, + "loss": 0.0005, + "step": 47184 + }, + { + "epoch": 0.92, + "learning_rate": 1.695856471593336e-08, + "loss": 0.0007, + "step": 47185 + }, + { + "epoch": 0.92, + "learning_rate": 1.6954681371597218e-08, + "loss": 0.0003, + "step": 47186 + }, + { + "epoch": 0.92, + "learning_rate": 1.6950798027261076e-08, + "loss": 0.0005, + "step": 47187 + }, + { + "epoch": 0.92, + "learning_rate": 1.6946914682924935e-08, + "loss": 0.0004, + "step": 47188 + }, + { + "epoch": 0.92, + "learning_rate": 1.6943031338588793e-08, + "loss": 0.0003, + "step": 47189 + }, + { + "epoch": 0.92, + "learning_rate": 1.693914799425265e-08, + "loss": 0.0005, + "step": 47190 + }, + { + "epoch": 0.92, + "learning_rate": 1.693526464991651e-08, + "loss": 0.0062, + "step": 47191 + }, + { + "epoch": 0.92, + "learning_rate": 1.6931381305580364e-08, + "loss": 0.0003, + "step": 47192 + }, + { + "epoch": 0.92, + "learning_rate": 1.6927497961244222e-08, + "loss": 0.0003, + "step": 47193 + }, + { + "epoch": 0.92, + "learning_rate": 1.692361461690808e-08, + "loss": 0.0005, + "step": 47194 + }, + { + "epoch": 0.92, + "learning_rate": 1.691973127257194e-08, + "loss": 0.0003, + "step": 47195 + }, + { + "epoch": 0.92, + "learning_rate": 1.6915847928235797e-08, + "loss": 0.0008, + "step": 47196 + }, + { + "epoch": 0.92, + "learning_rate": 1.6911964583899655e-08, + "loss": 0.0007, + "step": 47197 + }, + { + "epoch": 0.92, + "learning_rate": 1.6908081239563514e-08, + "loss": 0.5113, + "step": 47198 + }, + { + "epoch": 0.92, + "learning_rate": 1.690419789522737e-08, + "loss": 0.0021, + "step": 47199 + }, + { + "epoch": 0.92, + "learning_rate": 1.6900314550891227e-08, + "loss": 0.506, + "step": 47200 + }, + { + "epoch": 0.92, + "learning_rate": 1.6896431206555085e-08, + "loss": 0.0004, + "step": 47201 + }, + { + "epoch": 0.92, + "learning_rate": 1.6892547862218943e-08, + "loss": 0.0004, + "step": 47202 + }, + { + "epoch": 0.92, + "learning_rate": 1.68886645178828e-08, + "loss": 0.0033, + "step": 47203 + }, + { + "epoch": 0.92, + "learning_rate": 1.688478117354666e-08, + "loss": 0.0004, + "step": 47204 + }, + { + "epoch": 0.92, + "learning_rate": 1.6880897829210515e-08, + "loss": 0.0003, + "step": 47205 + }, + { + "epoch": 0.92, + "learning_rate": 1.6877014484874373e-08, + "loss": 0.0024, + "step": 47206 + }, + { + "epoch": 0.92, + "learning_rate": 1.687313114053823e-08, + "loss": 0.0004, + "step": 47207 + }, + { + "epoch": 0.92, + "learning_rate": 1.686924779620209e-08, + "loss": 0.0003, + "step": 47208 + }, + { + "epoch": 0.92, + "learning_rate": 1.6865364451865944e-08, + "loss": 0.0004, + "step": 47209 + }, + { + "epoch": 0.92, + "learning_rate": 1.6861481107529803e-08, + "loss": 0.0005, + "step": 47210 + }, + { + "epoch": 0.92, + "learning_rate": 1.685759776319366e-08, + "loss": 0.0003, + "step": 47211 + }, + { + "epoch": 0.92, + "learning_rate": 1.685371441885752e-08, + "loss": 0.0004, + "step": 47212 + }, + { + "epoch": 0.92, + "learning_rate": 1.6849831074521377e-08, + "loss": 0.0003, + "step": 47213 + }, + { + "epoch": 0.92, + "learning_rate": 1.6845947730185232e-08, + "loss": 0.0021, + "step": 47214 + }, + { + "epoch": 0.92, + "learning_rate": 1.684206438584909e-08, + "loss": 0.0003, + "step": 47215 + }, + { + "epoch": 0.92, + "learning_rate": 1.683818104151295e-08, + "loss": 0.0004, + "step": 47216 + }, + { + "epoch": 0.92, + "learning_rate": 1.6834297697176807e-08, + "loss": 0.3606, + "step": 47217 + }, + { + "epoch": 0.92, + "learning_rate": 1.6830414352840665e-08, + "loss": 0.0005, + "step": 47218 + }, + { + "epoch": 0.92, + "learning_rate": 1.6826531008504524e-08, + "loss": 0.2851, + "step": 47219 + }, + { + "epoch": 0.92, + "learning_rate": 1.6822647664168382e-08, + "loss": 0.0004, + "step": 47220 + }, + { + "epoch": 0.92, + "learning_rate": 1.6818764319832237e-08, + "loss": 0.0013, + "step": 47221 + }, + { + "epoch": 0.92, + "learning_rate": 1.6814880975496095e-08, + "loss": 0.0003, + "step": 47222 + }, + { + "epoch": 0.92, + "learning_rate": 1.6810997631159953e-08, + "loss": 0.0004, + "step": 47223 + }, + { + "epoch": 0.92, + "learning_rate": 1.680711428682381e-08, + "loss": 0.0003, + "step": 47224 + }, + { + "epoch": 0.92, + "learning_rate": 1.680323094248767e-08, + "loss": 0.0004, + "step": 47225 + }, + { + "epoch": 0.92, + "learning_rate": 1.6799347598151528e-08, + "loss": 0.0015, + "step": 47226 + }, + { + "epoch": 0.92, + "learning_rate": 1.6795464253815386e-08, + "loss": 0.3178, + "step": 47227 + }, + { + "epoch": 0.92, + "learning_rate": 1.679158090947924e-08, + "loss": 0.0003, + "step": 47228 + }, + { + "epoch": 0.92, + "learning_rate": 1.67876975651431e-08, + "loss": 0.0002, + "step": 47229 + }, + { + "epoch": 0.92, + "learning_rate": 1.6783814220806958e-08, + "loss": 0.0003, + "step": 47230 + }, + { + "epoch": 0.92, + "learning_rate": 1.6779930876470816e-08, + "loss": 1.2658, + "step": 47231 + }, + { + "epoch": 0.92, + "learning_rate": 1.6776047532134674e-08, + "loss": 0.0004, + "step": 47232 + }, + { + "epoch": 0.92, + "learning_rate": 1.6772164187798532e-08, + "loss": 0.0005, + "step": 47233 + }, + { + "epoch": 0.92, + "learning_rate": 1.676828084346239e-08, + "loss": 0.0005, + "step": 47234 + }, + { + "epoch": 0.92, + "learning_rate": 1.6764397499126246e-08, + "loss": 0.0007, + "step": 47235 + }, + { + "epoch": 0.92, + "learning_rate": 1.6760514154790104e-08, + "loss": 0.0003, + "step": 47236 + }, + { + "epoch": 0.92, + "learning_rate": 1.6756630810453962e-08, + "loss": 0.0005, + "step": 47237 + }, + { + "epoch": 0.92, + "learning_rate": 1.675274746611782e-08, + "loss": 0.0005, + "step": 47238 + }, + { + "epoch": 0.92, + "learning_rate": 1.674886412178168e-08, + "loss": 0.0005, + "step": 47239 + }, + { + "epoch": 0.92, + "learning_rate": 1.6744980777445537e-08, + "loss": 0.0004, + "step": 47240 + }, + { + "epoch": 0.92, + "learning_rate": 1.6741097433109395e-08, + "loss": 0.7884, + "step": 47241 + }, + { + "epoch": 0.92, + "learning_rate": 1.6737214088773253e-08, + "loss": 0.0003, + "step": 47242 + }, + { + "epoch": 0.92, + "learning_rate": 1.6733330744437108e-08, + "loss": 0.0005, + "step": 47243 + }, + { + "epoch": 0.92, + "learning_rate": 1.6729447400100966e-08, + "loss": 0.8033, + "step": 47244 + }, + { + "epoch": 0.92, + "learning_rate": 1.6725564055764825e-08, + "loss": 0.0006, + "step": 47245 + }, + { + "epoch": 0.92, + "learning_rate": 1.6721680711428683e-08, + "loss": 0.0004, + "step": 47246 + }, + { + "epoch": 0.92, + "learning_rate": 1.671779736709254e-08, + "loss": 0.0003, + "step": 47247 + }, + { + "epoch": 0.92, + "learning_rate": 1.67139140227564e-08, + "loss": 0.0005, + "step": 47248 + }, + { + "epoch": 0.92, + "learning_rate": 1.6710030678420258e-08, + "loss": 0.0006, + "step": 47249 + }, + { + "epoch": 0.92, + "learning_rate": 1.6706147334084113e-08, + "loss": 0.0003, + "step": 47250 + }, + { + "epoch": 0.92, + "learning_rate": 1.670226398974797e-08, + "loss": 1.5114, + "step": 47251 + }, + { + "epoch": 0.92, + "learning_rate": 1.669838064541183e-08, + "loss": 1.0365, + "step": 47252 + }, + { + "epoch": 0.92, + "learning_rate": 1.6694497301075684e-08, + "loss": 0.0015, + "step": 47253 + }, + { + "epoch": 0.92, + "learning_rate": 1.6690613956739542e-08, + "loss": 0.0004, + "step": 47254 + }, + { + "epoch": 0.92, + "learning_rate": 1.66867306124034e-08, + "loss": 0.0007, + "step": 47255 + }, + { + "epoch": 0.92, + "learning_rate": 1.668284726806726e-08, + "loss": 0.0003, + "step": 47256 + }, + { + "epoch": 0.92, + "learning_rate": 1.6678963923731114e-08, + "loss": 0.0006, + "step": 47257 + }, + { + "epoch": 0.92, + "learning_rate": 1.6675080579394972e-08, + "loss": 0.0003, + "step": 47258 + }, + { + "epoch": 0.92, + "learning_rate": 1.667119723505883e-08, + "loss": 0.0005, + "step": 47259 + }, + { + "epoch": 0.92, + "learning_rate": 1.666731389072269e-08, + "loss": 0.0005, + "step": 47260 + }, + { + "epoch": 0.92, + "learning_rate": 1.6663430546386547e-08, + "loss": 0.0003, + "step": 47261 + }, + { + "epoch": 0.92, + "learning_rate": 1.6659547202050405e-08, + "loss": 0.0077, + "step": 47262 + }, + { + "epoch": 0.92, + "learning_rate": 1.6655663857714263e-08, + "loss": 0.0005, + "step": 47263 + }, + { + "epoch": 0.92, + "learning_rate": 1.6651780513378118e-08, + "loss": 0.0004, + "step": 47264 + }, + { + "epoch": 0.92, + "learning_rate": 1.6647897169041976e-08, + "loss": 0.0004, + "step": 47265 + }, + { + "epoch": 0.92, + "learning_rate": 1.6644013824705835e-08, + "loss": 0.0022, + "step": 47266 + }, + { + "epoch": 0.92, + "learning_rate": 1.6640130480369693e-08, + "loss": 0.0013, + "step": 47267 + }, + { + "epoch": 0.92, + "learning_rate": 1.663624713603355e-08, + "loss": 0.4441, + "step": 47268 + }, + { + "epoch": 0.92, + "learning_rate": 1.663236379169741e-08, + "loss": 0.0002, + "step": 47269 + }, + { + "epoch": 0.92, + "learning_rate": 1.6628480447361268e-08, + "loss": 0.0004, + "step": 47270 + }, + { + "epoch": 0.92, + "learning_rate": 1.6624597103025126e-08, + "loss": 0.0004, + "step": 47271 + }, + { + "epoch": 0.92, + "learning_rate": 1.662071375868898e-08, + "loss": 0.0004, + "step": 47272 + }, + { + "epoch": 0.92, + "learning_rate": 1.661683041435284e-08, + "loss": 0.0005, + "step": 47273 + }, + { + "epoch": 0.92, + "learning_rate": 1.6612947070016697e-08, + "loss": 0.0004, + "step": 47274 + }, + { + "epoch": 0.92, + "learning_rate": 1.6609063725680555e-08, + "loss": 0.0009, + "step": 47275 + }, + { + "epoch": 0.92, + "learning_rate": 1.6605180381344414e-08, + "loss": 0.0004, + "step": 47276 + }, + { + "epoch": 0.92, + "learning_rate": 1.6601297037008272e-08, + "loss": 0.0003, + "step": 47277 + }, + { + "epoch": 0.92, + "learning_rate": 1.659741369267213e-08, + "loss": 0.0004, + "step": 47278 + }, + { + "epoch": 0.92, + "learning_rate": 1.6593530348335985e-08, + "loss": 0.0003, + "step": 47279 + }, + { + "epoch": 0.92, + "learning_rate": 1.6589647003999843e-08, + "loss": 0.0004, + "step": 47280 + }, + { + "epoch": 0.92, + "learning_rate": 1.65857636596637e-08, + "loss": 0.0009, + "step": 47281 + }, + { + "epoch": 0.92, + "learning_rate": 1.658188031532756e-08, + "loss": 0.001, + "step": 47282 + }, + { + "epoch": 0.92, + "learning_rate": 1.6577996970991418e-08, + "loss": 0.0004, + "step": 47283 + }, + { + "epoch": 0.92, + "learning_rate": 1.6574113626655276e-08, + "loss": 0.0003, + "step": 47284 + }, + { + "epoch": 0.92, + "learning_rate": 1.6570230282319135e-08, + "loss": 0.0007, + "step": 47285 + }, + { + "epoch": 0.92, + "learning_rate": 1.656634693798299e-08, + "loss": 0.2677, + "step": 47286 + }, + { + "epoch": 0.92, + "learning_rate": 1.6562463593646848e-08, + "loss": 0.0007, + "step": 47287 + }, + { + "epoch": 0.92, + "learning_rate": 1.6558580249310706e-08, + "loss": 0.0004, + "step": 47288 + }, + { + "epoch": 0.92, + "learning_rate": 1.6554696904974564e-08, + "loss": 0.0004, + "step": 47289 + }, + { + "epoch": 0.92, + "learning_rate": 1.6550813560638423e-08, + "loss": 0.0004, + "step": 47290 + }, + { + "epoch": 0.92, + "learning_rate": 1.654693021630228e-08, + "loss": 0.0005, + "step": 47291 + }, + { + "epoch": 0.92, + "learning_rate": 1.654304687196614e-08, + "loss": 0.0005, + "step": 47292 + }, + { + "epoch": 0.92, + "learning_rate": 1.6539163527629994e-08, + "loss": 0.0005, + "step": 47293 + }, + { + "epoch": 0.92, + "learning_rate": 1.6535280183293852e-08, + "loss": 0.0002, + "step": 47294 + }, + { + "epoch": 0.92, + "learning_rate": 1.653139683895771e-08, + "loss": 0.0006, + "step": 47295 + }, + { + "epoch": 0.92, + "learning_rate": 1.652751349462157e-08, + "loss": 0.001, + "step": 47296 + }, + { + "epoch": 0.92, + "learning_rate": 1.6523630150285427e-08, + "loss": 0.0007, + "step": 47297 + }, + { + "epoch": 0.92, + "learning_rate": 1.6519746805949282e-08, + "loss": 0.0004, + "step": 47298 + }, + { + "epoch": 0.92, + "learning_rate": 1.651586346161314e-08, + "loss": 0.0004, + "step": 47299 + }, + { + "epoch": 0.92, + "learning_rate": 1.6511980117277e-08, + "loss": 0.0003, + "step": 47300 + }, + { + "epoch": 0.92, + "learning_rate": 1.6508096772940853e-08, + "loss": 0.0003, + "step": 47301 + }, + { + "epoch": 0.92, + "learning_rate": 1.650421342860471e-08, + "loss": 0.0003, + "step": 47302 + }, + { + "epoch": 0.92, + "learning_rate": 1.650033008426857e-08, + "loss": 0.0003, + "step": 47303 + }, + { + "epoch": 0.92, + "learning_rate": 1.6496446739932428e-08, + "loss": 0.0004, + "step": 47304 + }, + { + "epoch": 0.92, + "learning_rate": 1.6492563395596286e-08, + "loss": 1.1073, + "step": 47305 + }, + { + "epoch": 0.92, + "learning_rate": 1.6488680051260145e-08, + "loss": 0.0005, + "step": 47306 + }, + { + "epoch": 0.92, + "learning_rate": 1.6484796706924003e-08, + "loss": 0.0006, + "step": 47307 + }, + { + "epoch": 0.92, + "learning_rate": 1.6480913362587858e-08, + "loss": 0.0003, + "step": 47308 + }, + { + "epoch": 0.92, + "learning_rate": 1.6477030018251716e-08, + "loss": 0.0007, + "step": 47309 + }, + { + "epoch": 0.92, + "learning_rate": 1.6473146673915574e-08, + "loss": 0.0004, + "step": 47310 + }, + { + "epoch": 0.92, + "learning_rate": 1.6469263329579432e-08, + "loss": 0.0003, + "step": 47311 + }, + { + "epoch": 0.92, + "learning_rate": 1.646537998524329e-08, + "loss": 0.0003, + "step": 47312 + }, + { + "epoch": 0.92, + "learning_rate": 1.646149664090715e-08, + "loss": 0.004, + "step": 47313 + }, + { + "epoch": 0.92, + "learning_rate": 1.6457613296571007e-08, + "loss": 0.0005, + "step": 47314 + }, + { + "epoch": 0.92, + "learning_rate": 1.6453729952234862e-08, + "loss": 0.0042, + "step": 47315 + }, + { + "epoch": 0.92, + "learning_rate": 1.644984660789872e-08, + "loss": 0.0035, + "step": 47316 + }, + { + "epoch": 0.92, + "learning_rate": 1.644596326356258e-08, + "loss": 0.0004, + "step": 47317 + }, + { + "epoch": 0.92, + "learning_rate": 1.6442079919226437e-08, + "loss": 0.4924, + "step": 47318 + }, + { + "epoch": 0.92, + "learning_rate": 1.6438196574890295e-08, + "loss": 0.0003, + "step": 47319 + }, + { + "epoch": 0.92, + "learning_rate": 1.6434313230554153e-08, + "loss": 0.0003, + "step": 47320 + }, + { + "epoch": 0.92, + "learning_rate": 1.643042988621801e-08, + "loss": 0.0003, + "step": 47321 + }, + { + "epoch": 0.92, + "learning_rate": 1.6426546541881866e-08, + "loss": 0.0002, + "step": 47322 + }, + { + "epoch": 0.92, + "learning_rate": 1.6422663197545725e-08, + "loss": 0.0005, + "step": 47323 + }, + { + "epoch": 0.92, + "learning_rate": 1.6418779853209583e-08, + "loss": 0.0005, + "step": 47324 + }, + { + "epoch": 0.92, + "learning_rate": 1.641489650887344e-08, + "loss": 0.0058, + "step": 47325 + }, + { + "epoch": 0.92, + "learning_rate": 1.64110131645373e-08, + "loss": 0.9473, + "step": 47326 + }, + { + "epoch": 0.92, + "learning_rate": 1.6407129820201158e-08, + "loss": 0.4421, + "step": 47327 + }, + { + "epoch": 0.92, + "learning_rate": 1.6403246475865016e-08, + "loss": 0.0006, + "step": 47328 + }, + { + "epoch": 0.92, + "learning_rate": 1.6399363131528874e-08, + "loss": 0.0006, + "step": 47329 + }, + { + "epoch": 0.92, + "learning_rate": 1.639547978719273e-08, + "loss": 0.0004, + "step": 47330 + }, + { + "epoch": 0.92, + "learning_rate": 1.6391596442856587e-08, + "loss": 0.0003, + "step": 47331 + }, + { + "epoch": 0.92, + "learning_rate": 1.6387713098520446e-08, + "loss": 0.0004, + "step": 47332 + }, + { + "epoch": 0.92, + "learning_rate": 1.6383829754184304e-08, + "loss": 0.0006, + "step": 47333 + }, + { + "epoch": 0.92, + "learning_rate": 1.6379946409848162e-08, + "loss": 0.1968, + "step": 47334 + }, + { + "epoch": 0.92, + "learning_rate": 1.637606306551202e-08, + "loss": 0.001, + "step": 47335 + }, + { + "epoch": 0.92, + "learning_rate": 1.637217972117588e-08, + "loss": 0.0003, + "step": 47336 + }, + { + "epoch": 0.92, + "learning_rate": 1.6368296376839734e-08, + "loss": 0.0004, + "step": 47337 + }, + { + "epoch": 0.92, + "learning_rate": 1.6364413032503592e-08, + "loss": 0.0004, + "step": 47338 + }, + { + "epoch": 0.92, + "learning_rate": 1.636052968816745e-08, + "loss": 0.0004, + "step": 47339 + }, + { + "epoch": 0.92, + "learning_rate": 1.6356646343831308e-08, + "loss": 0.0006, + "step": 47340 + }, + { + "epoch": 0.92, + "learning_rate": 1.6352762999495167e-08, + "loss": 0.0018, + "step": 47341 + }, + { + "epoch": 0.92, + "learning_rate": 1.634887965515902e-08, + "loss": 0.0005, + "step": 47342 + }, + { + "epoch": 0.92, + "learning_rate": 1.634499631082288e-08, + "loss": 0.0005, + "step": 47343 + }, + { + "epoch": 0.92, + "learning_rate": 1.6341112966486738e-08, + "loss": 0.0004, + "step": 47344 + }, + { + "epoch": 0.92, + "learning_rate": 1.6337229622150593e-08, + "loss": 0.0225, + "step": 47345 + }, + { + "epoch": 0.92, + "learning_rate": 1.633334627781445e-08, + "loss": 0.0002, + "step": 47346 + }, + { + "epoch": 0.92, + "learning_rate": 1.632946293347831e-08, + "loss": 0.0004, + "step": 47347 + }, + { + "epoch": 0.92, + "learning_rate": 1.6325579589142168e-08, + "loss": 0.0003, + "step": 47348 + }, + { + "epoch": 0.92, + "learning_rate": 1.6321696244806026e-08, + "loss": 0.0003, + "step": 47349 + }, + { + "epoch": 0.92, + "learning_rate": 1.6317812900469884e-08, + "loss": 0.0003, + "step": 47350 + }, + { + "epoch": 0.92, + "learning_rate": 1.631392955613374e-08, + "loss": 0.0004, + "step": 47351 + }, + { + "epoch": 0.92, + "learning_rate": 1.6310046211797597e-08, + "loss": 0.0003, + "step": 47352 + }, + { + "epoch": 0.92, + "learning_rate": 1.6306162867461456e-08, + "loss": 1.069, + "step": 47353 + }, + { + "epoch": 0.92, + "learning_rate": 1.6302279523125314e-08, + "loss": 0.0006, + "step": 47354 + }, + { + "epoch": 0.92, + "learning_rate": 1.6298396178789172e-08, + "loss": 0.0003, + "step": 47355 + }, + { + "epoch": 0.92, + "learning_rate": 1.629451283445303e-08, + "loss": 0.0004, + "step": 47356 + }, + { + "epoch": 0.92, + "learning_rate": 1.629062949011689e-08, + "loss": 0.0004, + "step": 47357 + }, + { + "epoch": 0.92, + "learning_rate": 1.6286746145780747e-08, + "loss": 0.0004, + "step": 47358 + }, + { + "epoch": 0.92, + "learning_rate": 1.6282862801444602e-08, + "loss": 0.0006, + "step": 47359 + }, + { + "epoch": 0.92, + "learning_rate": 1.627897945710846e-08, + "loss": 0.0003, + "step": 47360 + }, + { + "epoch": 0.92, + "learning_rate": 1.6275096112772318e-08, + "loss": 0.1439, + "step": 47361 + }, + { + "epoch": 0.92, + "learning_rate": 1.6271212768436176e-08, + "loss": 0.0004, + "step": 47362 + }, + { + "epoch": 0.92, + "learning_rate": 1.6267329424100035e-08, + "loss": 0.0003, + "step": 47363 + }, + { + "epoch": 0.92, + "learning_rate": 1.6263446079763893e-08, + "loss": 0.0003, + "step": 47364 + }, + { + "epoch": 0.92, + "learning_rate": 1.625956273542775e-08, + "loss": 0.0003, + "step": 47365 + }, + { + "epoch": 0.92, + "learning_rate": 1.6255679391091606e-08, + "loss": 0.0006, + "step": 47366 + }, + { + "epoch": 0.92, + "learning_rate": 1.6251796046755464e-08, + "loss": 0.0003, + "step": 47367 + }, + { + "epoch": 0.92, + "learning_rate": 1.6247912702419323e-08, + "loss": 0.0005, + "step": 47368 + }, + { + "epoch": 0.92, + "learning_rate": 1.624402935808318e-08, + "loss": 0.0003, + "step": 47369 + }, + { + "epoch": 0.92, + "learning_rate": 1.624014601374704e-08, + "loss": 0.0005, + "step": 47370 + }, + { + "epoch": 0.92, + "learning_rate": 1.6236262669410897e-08, + "loss": 0.0003, + "step": 47371 + }, + { + "epoch": 0.92, + "learning_rate": 1.6232379325074756e-08, + "loss": 0.0007, + "step": 47372 + }, + { + "epoch": 0.92, + "learning_rate": 1.622849598073861e-08, + "loss": 0.0003, + "step": 47373 + }, + { + "epoch": 0.92, + "learning_rate": 1.622461263640247e-08, + "loss": 0.861, + "step": 47374 + }, + { + "epoch": 0.92, + "learning_rate": 1.6220729292066327e-08, + "loss": 0.001, + "step": 47375 + }, + { + "epoch": 0.92, + "learning_rate": 1.6216845947730185e-08, + "loss": 0.0012, + "step": 47376 + }, + { + "epoch": 0.92, + "learning_rate": 1.6212962603394043e-08, + "loss": 0.0007, + "step": 47377 + }, + { + "epoch": 0.92, + "learning_rate": 1.6209079259057902e-08, + "loss": 0.0003, + "step": 47378 + }, + { + "epoch": 0.92, + "learning_rate": 1.620519591472176e-08, + "loss": 0.0003, + "step": 47379 + }, + { + "epoch": 0.92, + "learning_rate": 1.6201312570385615e-08, + "loss": 0.0614, + "step": 47380 + }, + { + "epoch": 0.92, + "learning_rate": 1.6197429226049473e-08, + "loss": 0.0007, + "step": 47381 + }, + { + "epoch": 0.92, + "learning_rate": 1.619354588171333e-08, + "loss": 0.0007, + "step": 47382 + }, + { + "epoch": 0.92, + "learning_rate": 1.618966253737719e-08, + "loss": 0.0003, + "step": 47383 + }, + { + "epoch": 0.92, + "learning_rate": 1.6185779193041048e-08, + "loss": 0.0011, + "step": 47384 + }, + { + "epoch": 0.92, + "learning_rate": 1.6181895848704906e-08, + "loss": 0.0007, + "step": 47385 + }, + { + "epoch": 0.92, + "learning_rate": 1.617801250436876e-08, + "loss": 0.0004, + "step": 47386 + }, + { + "epoch": 0.92, + "learning_rate": 1.617412916003262e-08, + "loss": 0.0004, + "step": 47387 + }, + { + "epoch": 0.92, + "learning_rate": 1.6170245815696478e-08, + "loss": 1.1499, + "step": 47388 + }, + { + "epoch": 0.92, + "learning_rate": 1.6166362471360336e-08, + "loss": 0.0004, + "step": 47389 + }, + { + "epoch": 0.92, + "learning_rate": 1.616247912702419e-08, + "loss": 0.0005, + "step": 47390 + }, + { + "epoch": 0.92, + "learning_rate": 1.615859578268805e-08, + "loss": 0.0024, + "step": 47391 + }, + { + "epoch": 0.92, + "learning_rate": 1.6154712438351907e-08, + "loss": 0.0021, + "step": 47392 + }, + { + "epoch": 0.92, + "learning_rate": 1.6150829094015765e-08, + "loss": 0.0097, + "step": 47393 + }, + { + "epoch": 0.92, + "learning_rate": 1.6146945749679624e-08, + "loss": 0.0004, + "step": 47394 + }, + { + "epoch": 0.92, + "learning_rate": 1.614306240534348e-08, + "loss": 0.0003, + "step": 47395 + }, + { + "epoch": 0.92, + "learning_rate": 1.6139179061007337e-08, + "loss": 0.0004, + "step": 47396 + }, + { + "epoch": 0.92, + "learning_rate": 1.6135295716671195e-08, + "loss": 0.0005, + "step": 47397 + }, + { + "epoch": 0.92, + "learning_rate": 1.6131412372335053e-08, + "loss": 0.0004, + "step": 47398 + }, + { + "epoch": 0.92, + "learning_rate": 1.612752902799891e-08, + "loss": 0.0004, + "step": 47399 + }, + { + "epoch": 0.92, + "learning_rate": 1.612364568366277e-08, + "loss": 0.0004, + "step": 47400 + }, + { + "epoch": 0.92, + "learning_rate": 1.6119762339326628e-08, + "loss": 0.0034, + "step": 47401 + }, + { + "epoch": 0.92, + "learning_rate": 1.6115878994990483e-08, + "loss": 0.0008, + "step": 47402 + }, + { + "epoch": 0.92, + "learning_rate": 1.611199565065434e-08, + "loss": 0.0003, + "step": 47403 + }, + { + "epoch": 0.92, + "learning_rate": 1.61081123063182e-08, + "loss": 0.0116, + "step": 47404 + }, + { + "epoch": 0.92, + "learning_rate": 1.6104228961982058e-08, + "loss": 1.7217, + "step": 47405 + }, + { + "epoch": 0.92, + "learning_rate": 1.6100345617645916e-08, + "loss": 0.0005, + "step": 47406 + }, + { + "epoch": 0.92, + "learning_rate": 1.6096462273309774e-08, + "loss": 0.0004, + "step": 47407 + }, + { + "epoch": 0.92, + "learning_rate": 1.6092578928973632e-08, + "loss": 0.0164, + "step": 47408 + }, + { + "epoch": 0.92, + "learning_rate": 1.6088695584637487e-08, + "loss": 0.0003, + "step": 47409 + }, + { + "epoch": 0.92, + "learning_rate": 1.6084812240301346e-08, + "loss": 0.0004, + "step": 47410 + }, + { + "epoch": 0.92, + "learning_rate": 1.6080928895965204e-08, + "loss": 0.0006, + "step": 47411 + }, + { + "epoch": 0.92, + "learning_rate": 1.6077045551629062e-08, + "loss": 0.0003, + "step": 47412 + }, + { + "epoch": 0.92, + "learning_rate": 1.607316220729292e-08, + "loss": 0.0899, + "step": 47413 + }, + { + "epoch": 0.92, + "learning_rate": 1.606927886295678e-08, + "loss": 0.0224, + "step": 47414 + }, + { + "epoch": 0.92, + "learning_rate": 1.6065395518620637e-08, + "loss": 0.0005, + "step": 47415 + }, + { + "epoch": 0.92, + "learning_rate": 1.6061512174284495e-08, + "loss": 0.8956, + "step": 47416 + }, + { + "epoch": 0.92, + "learning_rate": 1.605762882994835e-08, + "loss": 0.0211, + "step": 47417 + }, + { + "epoch": 0.92, + "learning_rate": 1.6053745485612208e-08, + "loss": 0.0004, + "step": 47418 + }, + { + "epoch": 0.92, + "learning_rate": 1.6049862141276067e-08, + "loss": 0.0003, + "step": 47419 + }, + { + "epoch": 0.92, + "learning_rate": 1.6045978796939925e-08, + "loss": 0.0003, + "step": 47420 + }, + { + "epoch": 0.92, + "learning_rate": 1.6042095452603783e-08, + "loss": 0.0004, + "step": 47421 + }, + { + "epoch": 0.92, + "learning_rate": 1.603821210826764e-08, + "loss": 0.0004, + "step": 47422 + }, + { + "epoch": 0.92, + "learning_rate": 1.60343287639315e-08, + "loss": 0.0003, + "step": 47423 + }, + { + "epoch": 0.92, + "learning_rate": 1.6030445419595354e-08, + "loss": 0.3258, + "step": 47424 + }, + { + "epoch": 0.92, + "learning_rate": 1.6026562075259213e-08, + "loss": 0.0029, + "step": 47425 + }, + { + "epoch": 0.92, + "learning_rate": 1.602267873092307e-08, + "loss": 0.001, + "step": 47426 + }, + { + "epoch": 0.92, + "learning_rate": 1.601879538658693e-08, + "loss": 0.1188, + "step": 47427 + }, + { + "epoch": 0.92, + "learning_rate": 1.6014912042250787e-08, + "loss": 0.0238, + "step": 47428 + }, + { + "epoch": 0.92, + "learning_rate": 1.6011028697914646e-08, + "loss": 0.0004, + "step": 47429 + }, + { + "epoch": 0.92, + "learning_rate": 1.60071453535785e-08, + "loss": 0.3158, + "step": 47430 + }, + { + "epoch": 0.92, + "learning_rate": 1.600326200924236e-08, + "loss": 0.0015, + "step": 47431 + }, + { + "epoch": 0.92, + "learning_rate": 1.5999378664906217e-08, + "loss": 0.0003, + "step": 47432 + }, + { + "epoch": 0.92, + "learning_rate": 1.5995495320570075e-08, + "loss": 0.0018, + "step": 47433 + }, + { + "epoch": 0.92, + "learning_rate": 1.599161197623393e-08, + "loss": 0.0004, + "step": 47434 + }, + { + "epoch": 0.92, + "learning_rate": 1.598772863189779e-08, + "loss": 0.0003, + "step": 47435 + }, + { + "epoch": 0.92, + "learning_rate": 1.5983845287561647e-08, + "loss": 0.0004, + "step": 47436 + }, + { + "epoch": 0.92, + "learning_rate": 1.5979961943225505e-08, + "loss": 0.0006, + "step": 47437 + }, + { + "epoch": 0.92, + "learning_rate": 1.597607859888936e-08, + "loss": 0.0004, + "step": 47438 + }, + { + "epoch": 0.92, + "learning_rate": 1.5972195254553218e-08, + "loss": 0.0003, + "step": 47439 + }, + { + "epoch": 0.92, + "learning_rate": 1.5968311910217076e-08, + "loss": 1.4981, + "step": 47440 + }, + { + "epoch": 0.92, + "learning_rate": 1.5964428565880935e-08, + "loss": 0.0003, + "step": 47441 + }, + { + "epoch": 0.92, + "learning_rate": 1.5960545221544793e-08, + "loss": 0.0004, + "step": 47442 + }, + { + "epoch": 0.92, + "learning_rate": 1.595666187720865e-08, + "loss": 0.0003, + "step": 47443 + }, + { + "epoch": 0.92, + "learning_rate": 1.595277853287251e-08, + "loss": 0.0003, + "step": 47444 + }, + { + "epoch": 0.92, + "learning_rate": 1.5948895188536368e-08, + "loss": 0.0003, + "step": 47445 + }, + { + "epoch": 0.92, + "learning_rate": 1.5945011844200223e-08, + "loss": 0.0008, + "step": 47446 + }, + { + "epoch": 0.92, + "learning_rate": 1.594112849986408e-08, + "loss": 0.0003, + "step": 47447 + }, + { + "epoch": 0.92, + "learning_rate": 1.593724515552794e-08, + "loss": 0.0004, + "step": 47448 + }, + { + "epoch": 0.92, + "learning_rate": 1.5933361811191797e-08, + "loss": 0.0004, + "step": 47449 + }, + { + "epoch": 0.92, + "learning_rate": 1.5929478466855656e-08, + "loss": 0.0004, + "step": 47450 + }, + { + "epoch": 0.92, + "learning_rate": 1.5925595122519514e-08, + "loss": 0.0004, + "step": 47451 + }, + { + "epoch": 0.92, + "learning_rate": 1.5921711778183372e-08, + "loss": 0.0003, + "step": 47452 + }, + { + "epoch": 0.92, + "learning_rate": 1.5917828433847227e-08, + "loss": 0.0003, + "step": 47453 + }, + { + "epoch": 0.92, + "learning_rate": 1.5913945089511085e-08, + "loss": 0.0004, + "step": 47454 + }, + { + "epoch": 0.92, + "learning_rate": 1.5910061745174944e-08, + "loss": 0.0007, + "step": 47455 + }, + { + "epoch": 0.92, + "learning_rate": 1.5906178400838802e-08, + "loss": 0.0006, + "step": 47456 + }, + { + "epoch": 0.92, + "learning_rate": 1.590229505650266e-08, + "loss": 1.5234, + "step": 47457 + }, + { + "epoch": 0.92, + "learning_rate": 1.5898411712166518e-08, + "loss": 0.0023, + "step": 47458 + }, + { + "epoch": 0.92, + "learning_rate": 1.5894528367830376e-08, + "loss": 0.0003, + "step": 47459 + }, + { + "epoch": 0.92, + "learning_rate": 1.589064502349423e-08, + "loss": 0.0015, + "step": 47460 + }, + { + "epoch": 0.92, + "learning_rate": 1.588676167915809e-08, + "loss": 0.0003, + "step": 47461 + }, + { + "epoch": 0.92, + "learning_rate": 1.5882878334821948e-08, + "loss": 0.0003, + "step": 47462 + }, + { + "epoch": 0.92, + "learning_rate": 1.5878994990485806e-08, + "loss": 0.0004, + "step": 47463 + }, + { + "epoch": 0.92, + "learning_rate": 1.5875111646149664e-08, + "loss": 0.0004, + "step": 47464 + }, + { + "epoch": 0.92, + "learning_rate": 1.5871228301813523e-08, + "loss": 0.0004, + "step": 47465 + }, + { + "epoch": 0.92, + "learning_rate": 1.586734495747738e-08, + "loss": 1.6863, + "step": 47466 + }, + { + "epoch": 0.92, + "learning_rate": 1.5863461613141236e-08, + "loss": 0.0003, + "step": 47467 + }, + { + "epoch": 0.92, + "learning_rate": 1.5859578268805094e-08, + "loss": 0.0076, + "step": 47468 + }, + { + "epoch": 0.92, + "learning_rate": 1.5855694924468952e-08, + "loss": 0.0003, + "step": 47469 + }, + { + "epoch": 0.92, + "learning_rate": 1.585181158013281e-08, + "loss": 0.0003, + "step": 47470 + }, + { + "epoch": 0.92, + "learning_rate": 1.584792823579667e-08, + "loss": 0.0019, + "step": 47471 + }, + { + "epoch": 0.92, + "learning_rate": 1.5844044891460527e-08, + "loss": 0.0004, + "step": 47472 + }, + { + "epoch": 0.92, + "learning_rate": 1.5840161547124385e-08, + "loss": 0.0004, + "step": 47473 + }, + { + "epoch": 0.92, + "learning_rate": 1.5836278202788244e-08, + "loss": 0.0007, + "step": 47474 + }, + { + "epoch": 0.92, + "learning_rate": 1.58323948584521e-08, + "loss": 0.0005, + "step": 47475 + }, + { + "epoch": 0.92, + "learning_rate": 1.5828511514115957e-08, + "loss": 0.0003, + "step": 47476 + }, + { + "epoch": 0.92, + "learning_rate": 1.5824628169779815e-08, + "loss": 0.0003, + "step": 47477 + }, + { + "epoch": 0.92, + "learning_rate": 1.582074482544367e-08, + "loss": 0.1817, + "step": 47478 + }, + { + "epoch": 0.92, + "learning_rate": 1.5816861481107528e-08, + "loss": 0.0008, + "step": 47479 + }, + { + "epoch": 0.92, + "learning_rate": 1.5812978136771386e-08, + "loss": 0.0005, + "step": 47480 + }, + { + "epoch": 0.92, + "learning_rate": 1.5809094792435245e-08, + "loss": 0.0004, + "step": 47481 + }, + { + "epoch": 0.92, + "learning_rate": 1.58052114480991e-08, + "loss": 0.0105, + "step": 47482 + }, + { + "epoch": 0.92, + "learning_rate": 1.5801328103762958e-08, + "loss": 0.0004, + "step": 47483 + }, + { + "epoch": 0.92, + "learning_rate": 1.5797444759426816e-08, + "loss": 0.0015, + "step": 47484 + }, + { + "epoch": 0.92, + "learning_rate": 1.5793561415090674e-08, + "loss": 0.0003, + "step": 47485 + }, + { + "epoch": 0.92, + "learning_rate": 1.5789678070754533e-08, + "loss": 0.0004, + "step": 47486 + }, + { + "epoch": 0.92, + "learning_rate": 1.578579472641839e-08, + "loss": 0.004, + "step": 47487 + }, + { + "epoch": 0.92, + "learning_rate": 1.578191138208225e-08, + "loss": 0.0068, + "step": 47488 + }, + { + "epoch": 0.92, + "learning_rate": 1.5778028037746104e-08, + "loss": 0.8417, + "step": 47489 + }, + { + "epoch": 0.92, + "learning_rate": 1.5774144693409962e-08, + "loss": 0.0034, + "step": 47490 + }, + { + "epoch": 0.92, + "learning_rate": 1.577026134907382e-08, + "loss": 0.0004, + "step": 47491 + }, + { + "epoch": 0.92, + "learning_rate": 1.576637800473768e-08, + "loss": 0.0005, + "step": 47492 + }, + { + "epoch": 0.92, + "learning_rate": 1.5762494660401537e-08, + "loss": 0.0004, + "step": 47493 + }, + { + "epoch": 0.92, + "learning_rate": 1.5758611316065395e-08, + "loss": 1.0652, + "step": 47494 + }, + { + "epoch": 0.92, + "learning_rate": 1.5754727971729253e-08, + "loss": 0.0003, + "step": 47495 + }, + { + "epoch": 0.92, + "learning_rate": 1.575084462739311e-08, + "loss": 0.0003, + "step": 47496 + }, + { + "epoch": 0.92, + "learning_rate": 1.5746961283056967e-08, + "loss": 0.0003, + "step": 47497 + }, + { + "epoch": 0.92, + "learning_rate": 1.5743077938720825e-08, + "loss": 0.005, + "step": 47498 + }, + { + "epoch": 0.92, + "learning_rate": 1.5739194594384683e-08, + "loss": 0.0031, + "step": 47499 + }, + { + "epoch": 0.92, + "learning_rate": 1.573531125004854e-08, + "loss": 0.0004, + "step": 47500 + }, + { + "epoch": 0.92, + "learning_rate": 1.57314279057124e-08, + "loss": 0.0004, + "step": 47501 + }, + { + "epoch": 0.92, + "learning_rate": 1.5727544561376258e-08, + "loss": 0.0004, + "step": 47502 + }, + { + "epoch": 0.92, + "learning_rate": 1.5723661217040116e-08, + "loss": 0.0005, + "step": 47503 + }, + { + "epoch": 0.92, + "learning_rate": 1.571977787270397e-08, + "loss": 1.0168, + "step": 47504 + }, + { + "epoch": 0.92, + "learning_rate": 1.571589452836783e-08, + "loss": 0.001, + "step": 47505 + }, + { + "epoch": 0.92, + "learning_rate": 1.5712011184031688e-08, + "loss": 0.0006, + "step": 47506 + }, + { + "epoch": 0.92, + "learning_rate": 1.5708127839695546e-08, + "loss": 0.0003, + "step": 47507 + }, + { + "epoch": 0.92, + "learning_rate": 1.5704244495359404e-08, + "loss": 0.0003, + "step": 47508 + }, + { + "epoch": 0.92, + "learning_rate": 1.5700361151023262e-08, + "loss": 0.032, + "step": 47509 + }, + { + "epoch": 0.92, + "learning_rate": 1.569647780668712e-08, + "loss": 0.0005, + "step": 47510 + }, + { + "epoch": 0.92, + "learning_rate": 1.5692594462350975e-08, + "loss": 0.0003, + "step": 47511 + }, + { + "epoch": 0.92, + "learning_rate": 1.5688711118014834e-08, + "loss": 0.0005, + "step": 47512 + }, + { + "epoch": 0.92, + "learning_rate": 1.5684827773678692e-08, + "loss": 0.0004, + "step": 47513 + }, + { + "epoch": 0.92, + "learning_rate": 1.568094442934255e-08, + "loss": 0.8818, + "step": 47514 + }, + { + "epoch": 0.92, + "learning_rate": 1.567706108500641e-08, + "loss": 0.0004, + "step": 47515 + }, + { + "epoch": 0.92, + "learning_rate": 1.5673177740670267e-08, + "loss": 0.0003, + "step": 47516 + }, + { + "epoch": 0.92, + "learning_rate": 1.5669294396334125e-08, + "loss": 0.0003, + "step": 47517 + }, + { + "epoch": 0.92, + "learning_rate": 1.566541105199798e-08, + "loss": 0.0002, + "step": 47518 + }, + { + "epoch": 0.92, + "learning_rate": 1.5661527707661838e-08, + "loss": 0.0006, + "step": 47519 + }, + { + "epoch": 0.92, + "learning_rate": 1.5657644363325696e-08, + "loss": 0.0003, + "step": 47520 + }, + { + "epoch": 0.92, + "learning_rate": 1.5653761018989555e-08, + "loss": 0.0005, + "step": 47521 + }, + { + "epoch": 0.92, + "learning_rate": 1.564987767465341e-08, + "loss": 0.0004, + "step": 47522 + }, + { + "epoch": 0.92, + "learning_rate": 1.5645994330317268e-08, + "loss": 0.0003, + "step": 47523 + }, + { + "epoch": 0.92, + "learning_rate": 1.5642110985981126e-08, + "loss": 0.0004, + "step": 47524 + }, + { + "epoch": 0.92, + "learning_rate": 1.5638227641644984e-08, + "loss": 0.0002, + "step": 47525 + }, + { + "epoch": 0.92, + "learning_rate": 1.563434429730884e-08, + "loss": 0.0003, + "step": 47526 + }, + { + "epoch": 0.92, + "learning_rate": 1.5630460952972697e-08, + "loss": 0.0003, + "step": 47527 + }, + { + "epoch": 0.92, + "learning_rate": 1.5626577608636556e-08, + "loss": 0.0003, + "step": 47528 + }, + { + "epoch": 0.92, + "learning_rate": 1.5622694264300414e-08, + "loss": 0.0003, + "step": 47529 + }, + { + "epoch": 0.92, + "learning_rate": 1.5618810919964272e-08, + "loss": 0.0006, + "step": 47530 + }, + { + "epoch": 0.92, + "learning_rate": 1.561492757562813e-08, + "loss": 0.0004, + "step": 47531 + }, + { + "epoch": 0.92, + "learning_rate": 1.561104423129199e-08, + "loss": 0.0004, + "step": 47532 + }, + { + "epoch": 0.92, + "learning_rate": 1.5607160886955844e-08, + "loss": 0.0003, + "step": 47533 + }, + { + "epoch": 0.92, + "learning_rate": 1.5603277542619702e-08, + "loss": 0.0003, + "step": 47534 + }, + { + "epoch": 0.92, + "learning_rate": 1.559939419828356e-08, + "loss": 0.0004, + "step": 47535 + }, + { + "epoch": 0.92, + "learning_rate": 1.5595510853947418e-08, + "loss": 0.0003, + "step": 47536 + }, + { + "epoch": 0.92, + "learning_rate": 1.5591627509611277e-08, + "loss": 0.0004, + "step": 47537 + }, + { + "epoch": 0.92, + "learning_rate": 1.5587744165275135e-08, + "loss": 0.0007, + "step": 47538 + }, + { + "epoch": 0.92, + "learning_rate": 1.5583860820938993e-08, + "loss": 0.3229, + "step": 47539 + }, + { + "epoch": 0.92, + "learning_rate": 1.5579977476602848e-08, + "loss": 0.0004, + "step": 47540 + }, + { + "epoch": 0.92, + "learning_rate": 1.5576094132266706e-08, + "loss": 0.0003, + "step": 47541 + }, + { + "epoch": 0.92, + "learning_rate": 1.5572210787930564e-08, + "loss": 0.0004, + "step": 47542 + }, + { + "epoch": 0.92, + "learning_rate": 1.5568327443594423e-08, + "loss": 0.0003, + "step": 47543 + }, + { + "epoch": 0.92, + "learning_rate": 1.556444409925828e-08, + "loss": 0.0005, + "step": 47544 + }, + { + "epoch": 0.92, + "learning_rate": 1.556056075492214e-08, + "loss": 0.0004, + "step": 47545 + }, + { + "epoch": 0.92, + "learning_rate": 1.5556677410585997e-08, + "loss": 0.0004, + "step": 47546 + }, + { + "epoch": 0.92, + "learning_rate": 1.5552794066249852e-08, + "loss": 0.0038, + "step": 47547 + }, + { + "epoch": 0.92, + "learning_rate": 1.554891072191371e-08, + "loss": 0.0005, + "step": 47548 + }, + { + "epoch": 0.92, + "learning_rate": 1.554502737757757e-08, + "loss": 0.0005, + "step": 47549 + }, + { + "epoch": 0.92, + "learning_rate": 1.5541144033241427e-08, + "loss": 0.0003, + "step": 47550 + }, + { + "epoch": 0.92, + "learning_rate": 1.5537260688905285e-08, + "loss": 0.0004, + "step": 47551 + }, + { + "epoch": 0.92, + "learning_rate": 1.5533377344569144e-08, + "loss": 0.0008, + "step": 47552 + }, + { + "epoch": 0.92, + "learning_rate": 1.5529494000233002e-08, + "loss": 0.0004, + "step": 47553 + }, + { + "epoch": 0.92, + "learning_rate": 1.5525610655896857e-08, + "loss": 0.0005, + "step": 47554 + }, + { + "epoch": 0.92, + "learning_rate": 1.5521727311560715e-08, + "loss": 0.0007, + "step": 47555 + }, + { + "epoch": 0.92, + "learning_rate": 1.5517843967224573e-08, + "loss": 0.0003, + "step": 47556 + }, + { + "epoch": 0.92, + "learning_rate": 1.551396062288843e-08, + "loss": 0.0003, + "step": 47557 + }, + { + "epoch": 0.92, + "learning_rate": 1.551007727855229e-08, + "loss": 0.0004, + "step": 47558 + }, + { + "epoch": 0.92, + "learning_rate": 1.5506193934216148e-08, + "loss": 0.0004, + "step": 47559 + }, + { + "epoch": 0.92, + "learning_rate": 1.5502310589880006e-08, + "loss": 0.0004, + "step": 47560 + }, + { + "epoch": 0.92, + "learning_rate": 1.5498427245543864e-08, + "loss": 0.0016, + "step": 47561 + }, + { + "epoch": 0.92, + "learning_rate": 1.549454390120772e-08, + "loss": 0.0004, + "step": 47562 + }, + { + "epoch": 0.92, + "learning_rate": 1.5490660556871578e-08, + "loss": 0.0003, + "step": 47563 + }, + { + "epoch": 0.92, + "learning_rate": 1.5486777212535436e-08, + "loss": 0.0005, + "step": 47564 + }, + { + "epoch": 0.92, + "learning_rate": 1.5482893868199294e-08, + "loss": 0.0068, + "step": 47565 + }, + { + "epoch": 0.92, + "learning_rate": 1.5479010523863152e-08, + "loss": 0.0003, + "step": 47566 + }, + { + "epoch": 0.92, + "learning_rate": 1.5475127179527007e-08, + "loss": 0.0141, + "step": 47567 + }, + { + "epoch": 0.92, + "learning_rate": 1.5471243835190866e-08, + "loss": 0.0004, + "step": 47568 + }, + { + "epoch": 0.92, + "learning_rate": 1.5467360490854724e-08, + "loss": 0.0027, + "step": 47569 + }, + { + "epoch": 0.92, + "learning_rate": 1.546347714651858e-08, + "loss": 0.0004, + "step": 47570 + }, + { + "epoch": 0.92, + "learning_rate": 1.5459593802182437e-08, + "loss": 0.0003, + "step": 47571 + }, + { + "epoch": 0.92, + "learning_rate": 1.5455710457846295e-08, + "loss": 0.0039, + "step": 47572 + }, + { + "epoch": 0.92, + "learning_rate": 1.5451827113510153e-08, + "loss": 0.0004, + "step": 47573 + }, + { + "epoch": 0.92, + "learning_rate": 1.5447943769174012e-08, + "loss": 0.0003, + "step": 47574 + }, + { + "epoch": 0.92, + "learning_rate": 1.544406042483787e-08, + "loss": 0.0003, + "step": 47575 + }, + { + "epoch": 0.92, + "learning_rate": 1.5440177080501725e-08, + "loss": 0.0003, + "step": 47576 + }, + { + "epoch": 0.92, + "learning_rate": 1.5436293736165583e-08, + "loss": 0.0004, + "step": 47577 + }, + { + "epoch": 0.92, + "learning_rate": 1.543241039182944e-08, + "loss": 0.0002, + "step": 47578 + }, + { + "epoch": 0.92, + "learning_rate": 1.54285270474933e-08, + "loss": 0.3579, + "step": 47579 + }, + { + "epoch": 0.92, + "learning_rate": 1.5424643703157158e-08, + "loss": 0.0003, + "step": 47580 + }, + { + "epoch": 0.92, + "learning_rate": 1.5420760358821016e-08, + "loss": 0.0002, + "step": 47581 + }, + { + "epoch": 0.92, + "learning_rate": 1.5416877014484874e-08, + "loss": 0.0004, + "step": 47582 + }, + { + "epoch": 0.92, + "learning_rate": 1.541299367014873e-08, + "loss": 0.0004, + "step": 47583 + }, + { + "epoch": 0.92, + "learning_rate": 1.5409110325812588e-08, + "loss": 0.0003, + "step": 47584 + }, + { + "epoch": 0.92, + "learning_rate": 1.5405226981476446e-08, + "loss": 0.0003, + "step": 47585 + }, + { + "epoch": 0.92, + "learning_rate": 1.5401343637140304e-08, + "loss": 0.0003, + "step": 47586 + }, + { + "epoch": 0.92, + "learning_rate": 1.5397460292804162e-08, + "loss": 0.0008, + "step": 47587 + }, + { + "epoch": 0.92, + "learning_rate": 1.539357694846802e-08, + "loss": 0.0003, + "step": 47588 + }, + { + "epoch": 0.92, + "learning_rate": 1.538969360413188e-08, + "loss": 0.0004, + "step": 47589 + }, + { + "epoch": 0.92, + "learning_rate": 1.5385810259795737e-08, + "loss": 0.0003, + "step": 47590 + }, + { + "epoch": 0.92, + "learning_rate": 1.5381926915459592e-08, + "loss": 0.0004, + "step": 47591 + }, + { + "epoch": 0.92, + "learning_rate": 1.537804357112345e-08, + "loss": 0.7591, + "step": 47592 + }, + { + "epoch": 0.92, + "learning_rate": 1.537416022678731e-08, + "loss": 0.0003, + "step": 47593 + }, + { + "epoch": 0.92, + "learning_rate": 1.5370276882451167e-08, + "loss": 0.0003, + "step": 47594 + }, + { + "epoch": 0.92, + "learning_rate": 1.5366393538115025e-08, + "loss": 0.0027, + "step": 47595 + }, + { + "epoch": 0.92, + "learning_rate": 1.5362510193778883e-08, + "loss": 0.0003, + "step": 47596 + }, + { + "epoch": 0.92, + "learning_rate": 1.535862684944274e-08, + "loss": 0.0003, + "step": 47597 + }, + { + "epoch": 0.92, + "learning_rate": 1.5354743505106596e-08, + "loss": 0.0009, + "step": 47598 + }, + { + "epoch": 0.92, + "learning_rate": 1.5350860160770455e-08, + "loss": 0.0039, + "step": 47599 + }, + { + "epoch": 0.92, + "learning_rate": 1.5346976816434313e-08, + "loss": 0.0003, + "step": 47600 + }, + { + "epoch": 0.92, + "learning_rate": 1.534309347209817e-08, + "loss": 0.0112, + "step": 47601 + }, + { + "epoch": 0.92, + "learning_rate": 1.533921012776203e-08, + "loss": 0.0004, + "step": 47602 + }, + { + "epoch": 0.92, + "learning_rate": 1.5335326783425888e-08, + "loss": 0.001, + "step": 47603 + }, + { + "epoch": 0.92, + "learning_rate": 1.5331443439089746e-08, + "loss": 0.0003, + "step": 47604 + }, + { + "epoch": 0.92, + "learning_rate": 1.53275600947536e-08, + "loss": 0.0005, + "step": 47605 + }, + { + "epoch": 0.92, + "learning_rate": 1.532367675041746e-08, + "loss": 0.0004, + "step": 47606 + }, + { + "epoch": 0.92, + "learning_rate": 1.5319793406081317e-08, + "loss": 0.0003, + "step": 47607 + }, + { + "epoch": 0.92, + "learning_rate": 1.5315910061745175e-08, + "loss": 0.0006, + "step": 47608 + }, + { + "epoch": 0.92, + "learning_rate": 1.5312026717409034e-08, + "loss": 0.0006, + "step": 47609 + }, + { + "epoch": 0.92, + "learning_rate": 1.5308143373072892e-08, + "loss": 0.0006, + "step": 47610 + }, + { + "epoch": 0.92, + "learning_rate": 1.5304260028736747e-08, + "loss": 0.0004, + "step": 47611 + }, + { + "epoch": 0.92, + "learning_rate": 1.5300376684400605e-08, + "loss": 0.0005, + "step": 47612 + }, + { + "epoch": 0.92, + "learning_rate": 1.5296493340064463e-08, + "loss": 0.0003, + "step": 47613 + }, + { + "epoch": 0.92, + "learning_rate": 1.529260999572832e-08, + "loss": 0.0003, + "step": 47614 + }, + { + "epoch": 0.92, + "learning_rate": 1.5288726651392177e-08, + "loss": 0.1888, + "step": 47615 + }, + { + "epoch": 0.92, + "learning_rate": 1.5284843307056035e-08, + "loss": 0.0003, + "step": 47616 + }, + { + "epoch": 0.92, + "learning_rate": 1.5280959962719893e-08, + "loss": 0.0056, + "step": 47617 + }, + { + "epoch": 0.92, + "learning_rate": 1.527707661838375e-08, + "loss": 0.0005, + "step": 47618 + }, + { + "epoch": 0.92, + "learning_rate": 1.527319327404761e-08, + "loss": 0.0004, + "step": 47619 + }, + { + "epoch": 0.92, + "learning_rate": 1.5269309929711464e-08, + "loss": 0.0358, + "step": 47620 + }, + { + "epoch": 0.92, + "learning_rate": 1.5265426585375323e-08, + "loss": 0.0003, + "step": 47621 + }, + { + "epoch": 0.92, + "learning_rate": 1.526154324103918e-08, + "loss": 0.0008, + "step": 47622 + }, + { + "epoch": 0.92, + "learning_rate": 1.525765989670304e-08, + "loss": 0.0003, + "step": 47623 + }, + { + "epoch": 0.92, + "learning_rate": 1.5253776552366897e-08, + "loss": 0.0684, + "step": 47624 + }, + { + "epoch": 0.92, + "learning_rate": 1.5249893208030756e-08, + "loss": 0.0005, + "step": 47625 + }, + { + "epoch": 0.92, + "learning_rate": 1.5246009863694614e-08, + "loss": 0.0776, + "step": 47626 + }, + { + "epoch": 0.92, + "learning_rate": 1.524212651935847e-08, + "loss": 0.0024, + "step": 47627 + }, + { + "epoch": 0.92, + "learning_rate": 1.5238243175022327e-08, + "loss": 0.0003, + "step": 47628 + }, + { + "epoch": 0.92, + "learning_rate": 1.5234359830686185e-08, + "loss": 0.0004, + "step": 47629 + }, + { + "epoch": 0.92, + "learning_rate": 1.5230476486350044e-08, + "loss": 0.0003, + "step": 47630 + }, + { + "epoch": 0.92, + "learning_rate": 1.5226593142013902e-08, + "loss": 0.0005, + "step": 47631 + }, + { + "epoch": 0.92, + "learning_rate": 1.522270979767776e-08, + "loss": 0.0004, + "step": 47632 + }, + { + "epoch": 0.92, + "learning_rate": 1.521882645334162e-08, + "loss": 0.0004, + "step": 47633 + }, + { + "epoch": 0.92, + "learning_rate": 1.5214943109005473e-08, + "loss": 0.0004, + "step": 47634 + }, + { + "epoch": 0.92, + "learning_rate": 1.521105976466933e-08, + "loss": 0.0006, + "step": 47635 + }, + { + "epoch": 0.92, + "learning_rate": 1.520717642033319e-08, + "loss": 1.0358, + "step": 47636 + }, + { + "epoch": 0.92, + "learning_rate": 1.5203293075997048e-08, + "loss": 0.7017, + "step": 47637 + }, + { + "epoch": 0.92, + "learning_rate": 1.5199409731660906e-08, + "loss": 0.0003, + "step": 47638 + }, + { + "epoch": 0.92, + "learning_rate": 1.5195526387324765e-08, + "loss": 0.0005, + "step": 47639 + }, + { + "epoch": 0.92, + "learning_rate": 1.5191643042988623e-08, + "loss": 0.0004, + "step": 47640 + }, + { + "epoch": 0.92, + "learning_rate": 1.5187759698652478e-08, + "loss": 0.0372, + "step": 47641 + }, + { + "epoch": 0.92, + "learning_rate": 1.5183876354316336e-08, + "loss": 0.7054, + "step": 47642 + }, + { + "epoch": 0.92, + "learning_rate": 1.5179993009980194e-08, + "loss": 0.0003, + "step": 47643 + }, + { + "epoch": 0.92, + "learning_rate": 1.5176109665644052e-08, + "loss": 0.0004, + "step": 47644 + }, + { + "epoch": 0.92, + "learning_rate": 1.517222632130791e-08, + "loss": 0.0004, + "step": 47645 + }, + { + "epoch": 0.92, + "learning_rate": 1.516834297697177e-08, + "loss": 0.0003, + "step": 47646 + }, + { + "epoch": 0.92, + "learning_rate": 1.5164459632635627e-08, + "loss": 0.0005, + "step": 47647 + }, + { + "epoch": 0.92, + "learning_rate": 1.5160576288299485e-08, + "loss": 0.0003, + "step": 47648 + }, + { + "epoch": 0.92, + "learning_rate": 1.515669294396334e-08, + "loss": 0.0004, + "step": 47649 + }, + { + "epoch": 0.92, + "learning_rate": 1.51528095996272e-08, + "loss": 0.0219, + "step": 47650 + }, + { + "epoch": 0.92, + "learning_rate": 1.5148926255291057e-08, + "loss": 0.0003, + "step": 47651 + }, + { + "epoch": 0.92, + "learning_rate": 1.5145042910954915e-08, + "loss": 0.0005, + "step": 47652 + }, + { + "epoch": 0.92, + "learning_rate": 1.5141159566618773e-08, + "loss": 0.0003, + "step": 47653 + }, + { + "epoch": 0.92, + "learning_rate": 1.513727622228263e-08, + "loss": 0.0004, + "step": 47654 + }, + { + "epoch": 0.92, + "learning_rate": 1.5133392877946486e-08, + "loss": 0.0003, + "step": 47655 + }, + { + "epoch": 0.92, + "learning_rate": 1.5129509533610345e-08, + "loss": 0.0006, + "step": 47656 + }, + { + "epoch": 0.92, + "learning_rate": 1.5125626189274203e-08, + "loss": 0.0004, + "step": 47657 + }, + { + "epoch": 0.92, + "learning_rate": 1.512174284493806e-08, + "loss": 0.0004, + "step": 47658 + }, + { + "epoch": 0.92, + "learning_rate": 1.5117859500601916e-08, + "loss": 0.0004, + "step": 47659 + }, + { + "epoch": 0.92, + "learning_rate": 1.5113976156265774e-08, + "loss": 0.0019, + "step": 47660 + }, + { + "epoch": 0.92, + "learning_rate": 1.5110092811929633e-08, + "loss": 0.0004, + "step": 47661 + }, + { + "epoch": 0.92, + "learning_rate": 1.510620946759349e-08, + "loss": 0.0025, + "step": 47662 + }, + { + "epoch": 0.92, + "learning_rate": 1.5102326123257346e-08, + "loss": 0.0124, + "step": 47663 + }, + { + "epoch": 0.92, + "learning_rate": 1.5098442778921204e-08, + "loss": 0.0004, + "step": 47664 + }, + { + "epoch": 0.92, + "learning_rate": 1.5094559434585062e-08, + "loss": 0.0004, + "step": 47665 + }, + { + "epoch": 0.92, + "learning_rate": 1.509067609024892e-08, + "loss": 0.0006, + "step": 47666 + }, + { + "epoch": 0.92, + "learning_rate": 1.508679274591278e-08, + "loss": 0.0003, + "step": 47667 + }, + { + "epoch": 0.92, + "learning_rate": 1.5082909401576637e-08, + "loss": 0.0003, + "step": 47668 + }, + { + "epoch": 0.92, + "learning_rate": 1.5079026057240495e-08, + "loss": 0.7738, + "step": 47669 + }, + { + "epoch": 0.92, + "learning_rate": 1.507514271290435e-08, + "loss": 0.0294, + "step": 47670 + }, + { + "epoch": 0.92, + "learning_rate": 1.507125936856821e-08, + "loss": 0.0005, + "step": 47671 + }, + { + "epoch": 0.92, + "learning_rate": 1.5067376024232067e-08, + "loss": 0.0003, + "step": 47672 + }, + { + "epoch": 0.92, + "learning_rate": 1.5063492679895925e-08, + "loss": 0.2055, + "step": 47673 + }, + { + "epoch": 0.92, + "learning_rate": 1.5059609335559783e-08, + "loss": 0.0006, + "step": 47674 + }, + { + "epoch": 0.92, + "learning_rate": 1.505572599122364e-08, + "loss": 0.0006, + "step": 47675 + }, + { + "epoch": 0.92, + "learning_rate": 1.50518426468875e-08, + "loss": 0.0416, + "step": 47676 + }, + { + "epoch": 0.92, + "learning_rate": 1.5047959302551358e-08, + "loss": 0.0003, + "step": 47677 + }, + { + "epoch": 0.92, + "learning_rate": 1.5044075958215213e-08, + "loss": 0.0003, + "step": 47678 + }, + { + "epoch": 0.92, + "learning_rate": 1.504019261387907e-08, + "loss": 0.0003, + "step": 47679 + }, + { + "epoch": 0.92, + "learning_rate": 1.503630926954293e-08, + "loss": 0.0008, + "step": 47680 + }, + { + "epoch": 0.92, + "learning_rate": 1.5032425925206788e-08, + "loss": 0.0004, + "step": 47681 + }, + { + "epoch": 0.92, + "learning_rate": 1.5028542580870646e-08, + "loss": 0.0003, + "step": 47682 + }, + { + "epoch": 0.92, + "learning_rate": 1.5024659236534504e-08, + "loss": 0.001, + "step": 47683 + }, + { + "epoch": 0.92, + "learning_rate": 1.5020775892198362e-08, + "loss": 0.0004, + "step": 47684 + }, + { + "epoch": 0.92, + "learning_rate": 1.5016892547862217e-08, + "loss": 0.6913, + "step": 47685 + }, + { + "epoch": 0.93, + "learning_rate": 1.5013009203526076e-08, + "loss": 0.0058, + "step": 47686 + }, + { + "epoch": 0.93, + "learning_rate": 1.5009125859189934e-08, + "loss": 0.0003, + "step": 47687 + }, + { + "epoch": 0.93, + "learning_rate": 1.5005242514853792e-08, + "loss": 0.0004, + "step": 47688 + }, + { + "epoch": 0.93, + "learning_rate": 1.500135917051765e-08, + "loss": 0.0004, + "step": 47689 + }, + { + "epoch": 0.93, + "learning_rate": 1.499747582618151e-08, + "loss": 0.0004, + "step": 47690 + }, + { + "epoch": 0.93, + "learning_rate": 1.4993592481845367e-08, + "loss": 0.0004, + "step": 47691 + }, + { + "epoch": 0.93, + "learning_rate": 1.4989709137509222e-08, + "loss": 0.0004, + "step": 47692 + }, + { + "epoch": 0.93, + "learning_rate": 1.498582579317308e-08, + "loss": 0.0005, + "step": 47693 + }, + { + "epoch": 0.93, + "learning_rate": 1.4981942448836938e-08, + "loss": 0.0003, + "step": 47694 + }, + { + "epoch": 0.93, + "learning_rate": 1.4978059104500796e-08, + "loss": 0.0148, + "step": 47695 + }, + { + "epoch": 0.93, + "learning_rate": 1.4974175760164655e-08, + "loss": 0.0003, + "step": 47696 + }, + { + "epoch": 0.93, + "learning_rate": 1.4970292415828513e-08, + "loss": 0.0004, + "step": 47697 + }, + { + "epoch": 0.93, + "learning_rate": 1.496640907149237e-08, + "loss": 0.0064, + "step": 47698 + }, + { + "epoch": 0.93, + "learning_rate": 1.4962525727156226e-08, + "loss": 0.1397, + "step": 47699 + }, + { + "epoch": 0.93, + "learning_rate": 1.4958642382820084e-08, + "loss": 0.0003, + "step": 47700 + }, + { + "epoch": 0.93, + "learning_rate": 1.4954759038483943e-08, + "loss": 0.0005, + "step": 47701 + }, + { + "epoch": 0.93, + "learning_rate": 1.49508756941478e-08, + "loss": 0.0004, + "step": 47702 + }, + { + "epoch": 0.93, + "learning_rate": 1.4946992349811656e-08, + "loss": 0.0005, + "step": 47703 + }, + { + "epoch": 0.93, + "learning_rate": 1.4943109005475514e-08, + "loss": 0.0028, + "step": 47704 + }, + { + "epoch": 0.93, + "learning_rate": 1.4939225661139372e-08, + "loss": 0.2073, + "step": 47705 + }, + { + "epoch": 0.93, + "learning_rate": 1.493534231680323e-08, + "loss": 0.0003, + "step": 47706 + }, + { + "epoch": 0.93, + "learning_rate": 1.4931458972467085e-08, + "loss": 0.0007, + "step": 47707 + }, + { + "epoch": 0.93, + "learning_rate": 1.4927575628130944e-08, + "loss": 0.0003, + "step": 47708 + }, + { + "epoch": 0.93, + "learning_rate": 1.4923692283794802e-08, + "loss": 0.7003, + "step": 47709 + }, + { + "epoch": 0.93, + "learning_rate": 1.491980893945866e-08, + "loss": 0.0005, + "step": 47710 + }, + { + "epoch": 0.93, + "learning_rate": 1.491592559512252e-08, + "loss": 0.0003, + "step": 47711 + }, + { + "epoch": 0.93, + "learning_rate": 1.4912042250786377e-08, + "loss": 0.0002, + "step": 47712 + }, + { + "epoch": 0.93, + "learning_rate": 1.4908158906450235e-08, + "loss": 0.0003, + "step": 47713 + }, + { + "epoch": 0.93, + "learning_rate": 1.490427556211409e-08, + "loss": 0.0004, + "step": 47714 + }, + { + "epoch": 0.93, + "learning_rate": 1.490039221777795e-08, + "loss": 0.0003, + "step": 47715 + }, + { + "epoch": 0.93, + "learning_rate": 1.4896508873441806e-08, + "loss": 0.0003, + "step": 47716 + }, + { + "epoch": 0.93, + "learning_rate": 1.4892625529105665e-08, + "loss": 0.0004, + "step": 47717 + }, + { + "epoch": 0.93, + "learning_rate": 1.4888742184769523e-08, + "loss": 0.0005, + "step": 47718 + }, + { + "epoch": 0.93, + "learning_rate": 1.4884858840433381e-08, + "loss": 1.279, + "step": 47719 + }, + { + "epoch": 0.93, + "learning_rate": 1.488097549609724e-08, + "loss": 0.0005, + "step": 47720 + }, + { + "epoch": 0.93, + "learning_rate": 1.4877092151761094e-08, + "loss": 0.0005, + "step": 47721 + }, + { + "epoch": 0.93, + "learning_rate": 1.4873208807424952e-08, + "loss": 0.0009, + "step": 47722 + }, + { + "epoch": 0.93, + "learning_rate": 1.486932546308881e-08, + "loss": 0.0003, + "step": 47723 + }, + { + "epoch": 0.93, + "learning_rate": 1.4865442118752669e-08, + "loss": 0.0012, + "step": 47724 + }, + { + "epoch": 0.93, + "learning_rate": 1.4861558774416527e-08, + "loss": 0.0004, + "step": 47725 + }, + { + "epoch": 0.93, + "learning_rate": 1.4857675430080385e-08, + "loss": 0.0006, + "step": 47726 + }, + { + "epoch": 0.93, + "learning_rate": 1.4853792085744244e-08, + "loss": 0.0023, + "step": 47727 + }, + { + "epoch": 0.93, + "learning_rate": 1.4849908741408099e-08, + "loss": 0.0003, + "step": 47728 + }, + { + "epoch": 0.93, + "learning_rate": 1.4846025397071957e-08, + "loss": 0.0004, + "step": 47729 + }, + { + "epoch": 0.93, + "learning_rate": 1.4842142052735815e-08, + "loss": 0.0003, + "step": 47730 + }, + { + "epoch": 0.93, + "learning_rate": 1.4838258708399673e-08, + "loss": 0.001, + "step": 47731 + }, + { + "epoch": 0.93, + "learning_rate": 1.4834375364063532e-08, + "loss": 0.5211, + "step": 47732 + }, + { + "epoch": 0.93, + "learning_rate": 1.483049201972739e-08, + "loss": 0.0004, + "step": 47733 + }, + { + "epoch": 0.93, + "learning_rate": 1.4826608675391248e-08, + "loss": 0.0012, + "step": 47734 + }, + { + "epoch": 0.93, + "learning_rate": 1.4822725331055105e-08, + "loss": 0.0004, + "step": 47735 + }, + { + "epoch": 0.93, + "learning_rate": 1.4818841986718961e-08, + "loss": 0.0003, + "step": 47736 + }, + { + "epoch": 0.93, + "learning_rate": 1.481495864238282e-08, + "loss": 0.071, + "step": 47737 + }, + { + "epoch": 0.93, + "learning_rate": 1.4811075298046676e-08, + "loss": 0.455, + "step": 47738 + }, + { + "epoch": 0.93, + "learning_rate": 1.4807191953710534e-08, + "loss": 0.0006, + "step": 47739 + }, + { + "epoch": 0.93, + "learning_rate": 1.4803308609374393e-08, + "loss": 0.0005, + "step": 47740 + }, + { + "epoch": 0.93, + "learning_rate": 1.4799425265038251e-08, + "loss": 0.0002, + "step": 47741 + }, + { + "epoch": 0.93, + "learning_rate": 1.4795541920702109e-08, + "loss": 0.0004, + "step": 47742 + }, + { + "epoch": 0.93, + "learning_rate": 1.4791658576365964e-08, + "loss": 0.001, + "step": 47743 + }, + { + "epoch": 0.93, + "learning_rate": 1.4787775232029822e-08, + "loss": 0.0005, + "step": 47744 + }, + { + "epoch": 0.93, + "learning_rate": 1.478389188769368e-08, + "loss": 0.6908, + "step": 47745 + }, + { + "epoch": 0.93, + "learning_rate": 1.4780008543357539e-08, + "loss": 0.0004, + "step": 47746 + }, + { + "epoch": 0.93, + "learning_rate": 1.4776125199021397e-08, + "loss": 0.0003, + "step": 47747 + }, + { + "epoch": 0.93, + "learning_rate": 1.4772241854685255e-08, + "loss": 0.0004, + "step": 47748 + }, + { + "epoch": 0.93, + "learning_rate": 1.4768358510349113e-08, + "loss": 0.0005, + "step": 47749 + }, + { + "epoch": 0.93, + "learning_rate": 1.4764475166012968e-08, + "loss": 0.0006, + "step": 47750 + }, + { + "epoch": 0.93, + "learning_rate": 1.4760591821676827e-08, + "loss": 0.0004, + "step": 47751 + }, + { + "epoch": 0.93, + "learning_rate": 1.4756708477340685e-08, + "loss": 0.0004, + "step": 47752 + }, + { + "epoch": 0.93, + "learning_rate": 1.4752825133004543e-08, + "loss": 0.0004, + "step": 47753 + }, + { + "epoch": 0.93, + "learning_rate": 1.4748941788668401e-08, + "loss": 0.0005, + "step": 47754 + }, + { + "epoch": 0.93, + "learning_rate": 1.474505844433226e-08, + "loss": 0.0005, + "step": 47755 + }, + { + "epoch": 0.93, + "learning_rate": 1.4741175099996118e-08, + "loss": 0.0004, + "step": 47756 + }, + { + "epoch": 0.93, + "learning_rate": 1.4737291755659973e-08, + "loss": 0.0003, + "step": 47757 + }, + { + "epoch": 0.93, + "learning_rate": 1.4733408411323831e-08, + "loss": 0.0002, + "step": 47758 + }, + { + "epoch": 0.93, + "learning_rate": 1.472952506698769e-08, + "loss": 0.0013, + "step": 47759 + }, + { + "epoch": 0.93, + "learning_rate": 1.4725641722651546e-08, + "loss": 0.0004, + "step": 47760 + }, + { + "epoch": 0.93, + "learning_rate": 1.4721758378315404e-08, + "loss": 0.0003, + "step": 47761 + }, + { + "epoch": 0.93, + "learning_rate": 1.4717875033979262e-08, + "loss": 0.0004, + "step": 47762 + }, + { + "epoch": 0.93, + "learning_rate": 1.471399168964312e-08, + "loss": 0.0004, + "step": 47763 + }, + { + "epoch": 0.93, + "learning_rate": 1.4710108345306979e-08, + "loss": 0.0003, + "step": 47764 + }, + { + "epoch": 0.93, + "learning_rate": 1.4706225000970834e-08, + "loss": 0.0004, + "step": 47765 + }, + { + "epoch": 0.93, + "learning_rate": 1.4702341656634692e-08, + "loss": 0.0002, + "step": 47766 + }, + { + "epoch": 0.93, + "learning_rate": 1.469845831229855e-08, + "loss": 0.0008, + "step": 47767 + }, + { + "epoch": 0.93, + "learning_rate": 1.4694574967962409e-08, + "loss": 0.0003, + "step": 47768 + }, + { + "epoch": 0.93, + "learning_rate": 1.4690691623626267e-08, + "loss": 0.0005, + "step": 47769 + }, + { + "epoch": 0.93, + "learning_rate": 1.4686808279290125e-08, + "loss": 0.0003, + "step": 47770 + }, + { + "epoch": 0.93, + "learning_rate": 1.4682924934953983e-08, + "loss": 0.0003, + "step": 47771 + }, + { + "epoch": 0.93, + "learning_rate": 1.4679041590617838e-08, + "loss": 0.0004, + "step": 47772 + }, + { + "epoch": 0.93, + "learning_rate": 1.4675158246281696e-08, + "loss": 0.0005, + "step": 47773 + }, + { + "epoch": 0.93, + "learning_rate": 1.4671274901945555e-08, + "loss": 0.0003, + "step": 47774 + }, + { + "epoch": 0.93, + "learning_rate": 1.4667391557609413e-08, + "loss": 0.0007, + "step": 47775 + }, + { + "epoch": 0.93, + "learning_rate": 1.4663508213273271e-08, + "loss": 0.0005, + "step": 47776 + }, + { + "epoch": 0.93, + "learning_rate": 1.465962486893713e-08, + "loss": 0.0003, + "step": 47777 + }, + { + "epoch": 0.93, + "learning_rate": 1.4655741524600988e-08, + "loss": 0.0327, + "step": 47778 + }, + { + "epoch": 0.93, + "learning_rate": 1.4651858180264843e-08, + "loss": 0.0003, + "step": 47779 + }, + { + "epoch": 0.93, + "learning_rate": 1.4647974835928701e-08, + "loss": 0.0004, + "step": 47780 + }, + { + "epoch": 0.93, + "learning_rate": 1.4644091491592559e-08, + "loss": 0.0004, + "step": 47781 + }, + { + "epoch": 0.93, + "learning_rate": 1.4640208147256416e-08, + "loss": 0.0004, + "step": 47782 + }, + { + "epoch": 0.93, + "learning_rate": 1.4636324802920274e-08, + "loss": 0.0003, + "step": 47783 + }, + { + "epoch": 0.93, + "learning_rate": 1.4632441458584132e-08, + "loss": 0.0004, + "step": 47784 + }, + { + "epoch": 0.93, + "learning_rate": 1.462855811424799e-08, + "loss": 0.001, + "step": 47785 + }, + { + "epoch": 0.93, + "learning_rate": 1.4624674769911845e-08, + "loss": 0.0002, + "step": 47786 + }, + { + "epoch": 0.93, + "learning_rate": 1.4620791425575704e-08, + "loss": 0.0004, + "step": 47787 + }, + { + "epoch": 0.93, + "learning_rate": 1.4616908081239562e-08, + "loss": 0.0005, + "step": 47788 + }, + { + "epoch": 0.93, + "learning_rate": 1.461302473690342e-08, + "loss": 0.0004, + "step": 47789 + }, + { + "epoch": 0.93, + "learning_rate": 1.4609141392567278e-08, + "loss": 0.0005, + "step": 47790 + }, + { + "epoch": 0.93, + "learning_rate": 1.4605258048231137e-08, + "loss": 0.0003, + "step": 47791 + }, + { + "epoch": 0.93, + "learning_rate": 1.4601374703894995e-08, + "loss": 0.5222, + "step": 47792 + }, + { + "epoch": 0.93, + "learning_rate": 1.4597491359558853e-08, + "loss": 0.0004, + "step": 47793 + }, + { + "epoch": 0.93, + "learning_rate": 1.4593608015222708e-08, + "loss": 0.0003, + "step": 47794 + }, + { + "epoch": 0.93, + "learning_rate": 1.4589724670886566e-08, + "loss": 0.0004, + "step": 47795 + }, + { + "epoch": 0.93, + "learning_rate": 1.4585841326550424e-08, + "loss": 0.0496, + "step": 47796 + }, + { + "epoch": 0.93, + "learning_rate": 1.4581957982214283e-08, + "loss": 0.0004, + "step": 47797 + }, + { + "epoch": 0.93, + "learning_rate": 1.4578074637878141e-08, + "loss": 0.0004, + "step": 47798 + }, + { + "epoch": 0.93, + "learning_rate": 1.4574191293542e-08, + "loss": 0.0004, + "step": 47799 + }, + { + "epoch": 0.93, + "learning_rate": 1.4570307949205857e-08, + "loss": 0.0005, + "step": 47800 + }, + { + "epoch": 0.93, + "learning_rate": 1.4566424604869712e-08, + "loss": 0.0002, + "step": 47801 + }, + { + "epoch": 0.93, + "learning_rate": 1.456254126053357e-08, + "loss": 0.0004, + "step": 47802 + }, + { + "epoch": 0.93, + "learning_rate": 1.4558657916197429e-08, + "loss": 0.1886, + "step": 47803 + }, + { + "epoch": 0.93, + "learning_rate": 1.4554774571861287e-08, + "loss": 0.0003, + "step": 47804 + }, + { + "epoch": 0.93, + "learning_rate": 1.4550891227525144e-08, + "loss": 0.0004, + "step": 47805 + }, + { + "epoch": 0.93, + "learning_rate": 1.4547007883189002e-08, + "loss": 0.0003, + "step": 47806 + }, + { + "epoch": 0.93, + "learning_rate": 1.454312453885286e-08, + "loss": 0.0018, + "step": 47807 + }, + { + "epoch": 0.93, + "learning_rate": 1.4539241194516715e-08, + "loss": 0.0004, + "step": 47808 + }, + { + "epoch": 0.93, + "learning_rate": 1.4535357850180573e-08, + "loss": 0.0003, + "step": 47809 + }, + { + "epoch": 0.93, + "learning_rate": 1.4531474505844432e-08, + "loss": 0.0003, + "step": 47810 + }, + { + "epoch": 0.93, + "learning_rate": 1.452759116150829e-08, + "loss": 0.0003, + "step": 47811 + }, + { + "epoch": 0.93, + "learning_rate": 1.4523707817172148e-08, + "loss": 0.0003, + "step": 47812 + }, + { + "epoch": 0.93, + "learning_rate": 1.4519824472836006e-08, + "loss": 0.0004, + "step": 47813 + }, + { + "epoch": 0.93, + "learning_rate": 1.4515941128499865e-08, + "loss": 0.0004, + "step": 47814 + }, + { + "epoch": 0.93, + "learning_rate": 1.451205778416372e-08, + "loss": 0.0005, + "step": 47815 + }, + { + "epoch": 0.93, + "learning_rate": 1.4508174439827578e-08, + "loss": 0.0003, + "step": 47816 + }, + { + "epoch": 0.93, + "learning_rate": 1.4504291095491436e-08, + "loss": 0.0005, + "step": 47817 + }, + { + "epoch": 0.93, + "learning_rate": 1.4500407751155294e-08, + "loss": 0.0006, + "step": 47818 + }, + { + "epoch": 0.93, + "learning_rate": 1.4496524406819153e-08, + "loss": 0.0003, + "step": 47819 + }, + { + "epoch": 0.93, + "learning_rate": 1.449264106248301e-08, + "loss": 0.0004, + "step": 47820 + }, + { + "epoch": 0.93, + "learning_rate": 1.4488757718146869e-08, + "loss": 0.0004, + "step": 47821 + }, + { + "epoch": 0.93, + "learning_rate": 1.4484874373810727e-08, + "loss": 0.0004, + "step": 47822 + }, + { + "epoch": 0.93, + "learning_rate": 1.4480991029474582e-08, + "loss": 0.0374, + "step": 47823 + }, + { + "epoch": 0.93, + "learning_rate": 1.447710768513844e-08, + "loss": 0.0026, + "step": 47824 + }, + { + "epoch": 0.93, + "learning_rate": 1.4473224340802299e-08, + "loss": 0.0005, + "step": 47825 + }, + { + "epoch": 0.93, + "learning_rate": 1.4469340996466157e-08, + "loss": 0.0005, + "step": 47826 + }, + { + "epoch": 0.93, + "learning_rate": 1.4465457652130014e-08, + "loss": 0.0004, + "step": 47827 + }, + { + "epoch": 0.93, + "learning_rate": 1.4461574307793872e-08, + "loss": 0.0003, + "step": 47828 + }, + { + "epoch": 0.93, + "learning_rate": 1.445769096345773e-08, + "loss": 0.0008, + "step": 47829 + }, + { + "epoch": 0.93, + "learning_rate": 1.4453807619121585e-08, + "loss": 0.0003, + "step": 47830 + }, + { + "epoch": 0.93, + "learning_rate": 1.4449924274785443e-08, + "loss": 0.0003, + "step": 47831 + }, + { + "epoch": 0.93, + "learning_rate": 1.4446040930449301e-08, + "loss": 0.0004, + "step": 47832 + }, + { + "epoch": 0.93, + "learning_rate": 1.444215758611316e-08, + "loss": 0.0004, + "step": 47833 + }, + { + "epoch": 0.93, + "learning_rate": 1.4438274241777018e-08, + "loss": 0.0003, + "step": 47834 + }, + { + "epoch": 0.93, + "learning_rate": 1.4434390897440876e-08, + "loss": 0.0003, + "step": 47835 + }, + { + "epoch": 0.93, + "learning_rate": 1.4430507553104734e-08, + "loss": 0.0006, + "step": 47836 + }, + { + "epoch": 0.93, + "learning_rate": 1.442662420876859e-08, + "loss": 0.0004, + "step": 47837 + }, + { + "epoch": 0.93, + "learning_rate": 1.4422740864432448e-08, + "loss": 0.0004, + "step": 47838 + }, + { + "epoch": 0.93, + "learning_rate": 1.4418857520096306e-08, + "loss": 0.0004, + "step": 47839 + }, + { + "epoch": 0.93, + "learning_rate": 1.4414974175760164e-08, + "loss": 0.0014, + "step": 47840 + }, + { + "epoch": 0.93, + "learning_rate": 1.4411090831424022e-08, + "loss": 0.0004, + "step": 47841 + }, + { + "epoch": 0.93, + "learning_rate": 1.440720748708788e-08, + "loss": 0.0374, + "step": 47842 + }, + { + "epoch": 0.93, + "learning_rate": 1.4403324142751739e-08, + "loss": 0.0004, + "step": 47843 + }, + { + "epoch": 0.93, + "learning_rate": 1.4399440798415594e-08, + "loss": 0.0006, + "step": 47844 + }, + { + "epoch": 0.93, + "learning_rate": 1.4395557454079452e-08, + "loss": 0.0008, + "step": 47845 + }, + { + "epoch": 0.93, + "learning_rate": 1.439167410974331e-08, + "loss": 0.0006, + "step": 47846 + }, + { + "epoch": 0.93, + "learning_rate": 1.4387790765407168e-08, + "loss": 0.0005, + "step": 47847 + }, + { + "epoch": 0.93, + "learning_rate": 1.4383907421071027e-08, + "loss": 0.0053, + "step": 47848 + }, + { + "epoch": 0.93, + "learning_rate": 1.4380024076734883e-08, + "loss": 0.0004, + "step": 47849 + }, + { + "epoch": 0.93, + "learning_rate": 1.4376140732398742e-08, + "loss": 0.0004, + "step": 47850 + }, + { + "epoch": 0.93, + "learning_rate": 1.43722573880626e-08, + "loss": 0.0004, + "step": 47851 + }, + { + "epoch": 0.93, + "learning_rate": 1.4368374043726455e-08, + "loss": 0.0004, + "step": 47852 + }, + { + "epoch": 0.93, + "learning_rate": 1.4364490699390313e-08, + "loss": 0.0004, + "step": 47853 + }, + { + "epoch": 0.93, + "learning_rate": 1.4360607355054171e-08, + "loss": 0.0016, + "step": 47854 + }, + { + "epoch": 0.93, + "learning_rate": 1.435672401071803e-08, + "loss": 0.0007, + "step": 47855 + }, + { + "epoch": 0.93, + "learning_rate": 1.4352840666381888e-08, + "loss": 0.0003, + "step": 47856 + }, + { + "epoch": 0.93, + "learning_rate": 1.4348957322045746e-08, + "loss": 0.6219, + "step": 47857 + }, + { + "epoch": 0.93, + "learning_rate": 1.4345073977709604e-08, + "loss": 0.0004, + "step": 47858 + }, + { + "epoch": 0.93, + "learning_rate": 1.4341190633373459e-08, + "loss": 0.9487, + "step": 47859 + }, + { + "epoch": 0.93, + "learning_rate": 1.4337307289037317e-08, + "loss": 0.0005, + "step": 47860 + }, + { + "epoch": 0.93, + "learning_rate": 1.4333423944701176e-08, + "loss": 0.0005, + "step": 47861 + }, + { + "epoch": 0.93, + "learning_rate": 1.4329540600365034e-08, + "loss": 0.0019, + "step": 47862 + }, + { + "epoch": 0.93, + "learning_rate": 1.4325657256028892e-08, + "loss": 0.0004, + "step": 47863 + }, + { + "epoch": 0.93, + "learning_rate": 1.432177391169275e-08, + "loss": 0.0026, + "step": 47864 + }, + { + "epoch": 0.93, + "learning_rate": 1.4317890567356609e-08, + "loss": 0.0004, + "step": 47865 + }, + { + "epoch": 0.93, + "learning_rate": 1.4314007223020464e-08, + "loss": 0.0008, + "step": 47866 + }, + { + "epoch": 0.93, + "learning_rate": 1.4310123878684322e-08, + "loss": 0.0011, + "step": 47867 + }, + { + "epoch": 0.93, + "learning_rate": 1.430624053434818e-08, + "loss": 0.0664, + "step": 47868 + }, + { + "epoch": 0.93, + "learning_rate": 1.4302357190012038e-08, + "loss": 0.0003, + "step": 47869 + }, + { + "epoch": 0.93, + "learning_rate": 1.4298473845675897e-08, + "loss": 0.0003, + "step": 47870 + }, + { + "epoch": 0.93, + "learning_rate": 1.4294590501339753e-08, + "loss": 0.0003, + "step": 47871 + }, + { + "epoch": 0.93, + "learning_rate": 1.4290707157003611e-08, + "loss": 0.0004, + "step": 47872 + }, + { + "epoch": 0.93, + "learning_rate": 1.4286823812667468e-08, + "loss": 0.0006, + "step": 47873 + }, + { + "epoch": 0.93, + "learning_rate": 1.4282940468331326e-08, + "loss": 0.0006, + "step": 47874 + }, + { + "epoch": 0.93, + "learning_rate": 1.4279057123995183e-08, + "loss": 0.0004, + "step": 47875 + }, + { + "epoch": 0.93, + "learning_rate": 1.4275173779659041e-08, + "loss": 0.0003, + "step": 47876 + }, + { + "epoch": 0.93, + "learning_rate": 1.42712904353229e-08, + "loss": 0.0004, + "step": 47877 + }, + { + "epoch": 0.93, + "learning_rate": 1.4267407090986758e-08, + "loss": 0.0007, + "step": 47878 + }, + { + "epoch": 0.93, + "learning_rate": 1.4263523746650616e-08, + "loss": 0.0003, + "step": 47879 + }, + { + "epoch": 0.93, + "learning_rate": 1.4259640402314474e-08, + "loss": 0.0004, + "step": 47880 + }, + { + "epoch": 0.93, + "learning_rate": 1.4255757057978329e-08, + "loss": 0.0006, + "step": 47881 + }, + { + "epoch": 0.93, + "learning_rate": 1.4251873713642187e-08, + "loss": 0.0004, + "step": 47882 + }, + { + "epoch": 0.93, + "learning_rate": 1.4247990369306045e-08, + "loss": 1.3108, + "step": 47883 + }, + { + "epoch": 0.93, + "learning_rate": 1.4244107024969904e-08, + "loss": 0.0004, + "step": 47884 + }, + { + "epoch": 0.93, + "learning_rate": 1.4240223680633762e-08, + "loss": 0.6267, + "step": 47885 + }, + { + "epoch": 0.93, + "learning_rate": 1.423634033629762e-08, + "loss": 0.0003, + "step": 47886 + }, + { + "epoch": 0.93, + "learning_rate": 1.4232456991961478e-08, + "loss": 0.0004, + "step": 47887 + }, + { + "epoch": 0.93, + "learning_rate": 1.4228573647625333e-08, + "loss": 0.0004, + "step": 47888 + }, + { + "epoch": 0.93, + "learning_rate": 1.4224690303289192e-08, + "loss": 0.0006, + "step": 47889 + }, + { + "epoch": 0.93, + "learning_rate": 1.422080695895305e-08, + "loss": 0.0005, + "step": 47890 + }, + { + "epoch": 0.93, + "learning_rate": 1.4216923614616908e-08, + "loss": 0.0073, + "step": 47891 + }, + { + "epoch": 0.93, + "learning_rate": 1.4213040270280766e-08, + "loss": 0.0003, + "step": 47892 + }, + { + "epoch": 0.93, + "learning_rate": 1.4209156925944623e-08, + "loss": 0.0004, + "step": 47893 + }, + { + "epoch": 0.93, + "learning_rate": 1.4205273581608481e-08, + "loss": 0.0004, + "step": 47894 + }, + { + "epoch": 0.93, + "learning_rate": 1.4201390237272338e-08, + "loss": 0.0003, + "step": 47895 + }, + { + "epoch": 0.93, + "learning_rate": 1.4197506892936196e-08, + "loss": 0.0003, + "step": 47896 + }, + { + "epoch": 0.93, + "learning_rate": 1.4193623548600053e-08, + "loss": 0.0003, + "step": 47897 + }, + { + "epoch": 0.93, + "learning_rate": 1.4189740204263911e-08, + "loss": 0.0003, + "step": 47898 + }, + { + "epoch": 0.93, + "learning_rate": 1.4185856859927769e-08, + "loss": 0.0004, + "step": 47899 + }, + { + "epoch": 0.93, + "learning_rate": 1.4181973515591627e-08, + "loss": 0.0006, + "step": 47900 + }, + { + "epoch": 0.93, + "learning_rate": 1.4178090171255486e-08, + "loss": 0.0003, + "step": 47901 + }, + { + "epoch": 0.93, + "learning_rate": 1.417420682691934e-08, + "loss": 0.0003, + "step": 47902 + }, + { + "epoch": 0.93, + "learning_rate": 1.4170323482583199e-08, + "loss": 0.0005, + "step": 47903 + }, + { + "epoch": 0.93, + "learning_rate": 1.4166440138247057e-08, + "loss": 0.0005, + "step": 47904 + }, + { + "epoch": 0.93, + "learning_rate": 1.4162556793910915e-08, + "loss": 0.0006, + "step": 47905 + }, + { + "epoch": 0.93, + "learning_rate": 1.4158673449574773e-08, + "loss": 0.0005, + "step": 47906 + }, + { + "epoch": 0.93, + "learning_rate": 1.4154790105238632e-08, + "loss": 0.0003, + "step": 47907 + }, + { + "epoch": 0.93, + "learning_rate": 1.415090676090249e-08, + "loss": 0.0073, + "step": 47908 + }, + { + "epoch": 0.93, + "learning_rate": 1.4147023416566348e-08, + "loss": 0.0004, + "step": 47909 + }, + { + "epoch": 0.93, + "learning_rate": 1.4143140072230203e-08, + "loss": 0.0003, + "step": 47910 + }, + { + "epoch": 0.93, + "learning_rate": 1.4139256727894061e-08, + "loss": 0.0003, + "step": 47911 + }, + { + "epoch": 0.93, + "learning_rate": 1.413537338355792e-08, + "loss": 1.1212, + "step": 47912 + }, + { + "epoch": 0.93, + "learning_rate": 1.4131490039221778e-08, + "loss": 0.0011, + "step": 47913 + }, + { + "epoch": 0.93, + "learning_rate": 1.4127606694885636e-08, + "loss": 0.0003, + "step": 47914 + }, + { + "epoch": 0.93, + "learning_rate": 1.4123723350549493e-08, + "loss": 0.0004, + "step": 47915 + }, + { + "epoch": 0.93, + "learning_rate": 1.4119840006213351e-08, + "loss": 0.4511, + "step": 47916 + }, + { + "epoch": 0.93, + "learning_rate": 1.4115956661877208e-08, + "loss": 0.0004, + "step": 47917 + }, + { + "epoch": 0.93, + "learning_rate": 1.4112073317541066e-08, + "loss": 0.0032, + "step": 47918 + }, + { + "epoch": 0.93, + "learning_rate": 1.4108189973204922e-08, + "loss": 0.0003, + "step": 47919 + }, + { + "epoch": 0.93, + "learning_rate": 1.410430662886878e-08, + "loss": 0.0035, + "step": 47920 + }, + { + "epoch": 0.93, + "learning_rate": 1.4100423284532639e-08, + "loss": 0.0004, + "step": 47921 + }, + { + "epoch": 0.93, + "learning_rate": 1.4096539940196497e-08, + "loss": 0.0005, + "step": 47922 + }, + { + "epoch": 0.93, + "learning_rate": 1.4092656595860355e-08, + "loss": 0.0003, + "step": 47923 + }, + { + "epoch": 0.93, + "learning_rate": 1.408877325152421e-08, + "loss": 0.0003, + "step": 47924 + }, + { + "epoch": 0.93, + "learning_rate": 1.4084889907188069e-08, + "loss": 0.0005, + "step": 47925 + }, + { + "epoch": 0.93, + "learning_rate": 1.4081006562851927e-08, + "loss": 0.0003, + "step": 47926 + }, + { + "epoch": 0.93, + "learning_rate": 1.4077123218515785e-08, + "loss": 0.8837, + "step": 47927 + }, + { + "epoch": 0.93, + "learning_rate": 1.4073239874179643e-08, + "loss": 0.0004, + "step": 47928 + }, + { + "epoch": 0.93, + "learning_rate": 1.4069356529843502e-08, + "loss": 0.9061, + "step": 47929 + }, + { + "epoch": 0.93, + "learning_rate": 1.406547318550736e-08, + "loss": 0.0004, + "step": 47930 + }, + { + "epoch": 0.93, + "learning_rate": 1.4061589841171215e-08, + "loss": 0.0005, + "step": 47931 + }, + { + "epoch": 0.93, + "learning_rate": 1.4057706496835073e-08, + "loss": 0.0146, + "step": 47932 + }, + { + "epoch": 0.93, + "learning_rate": 1.4053823152498931e-08, + "loss": 0.0004, + "step": 47933 + }, + { + "epoch": 0.93, + "learning_rate": 1.404993980816279e-08, + "loss": 0.0003, + "step": 47934 + }, + { + "epoch": 0.93, + "learning_rate": 1.4046056463826648e-08, + "loss": 0.0003, + "step": 47935 + }, + { + "epoch": 0.93, + "learning_rate": 1.4042173119490506e-08, + "loss": 0.0002, + "step": 47936 + }, + { + "epoch": 0.93, + "learning_rate": 1.4038289775154363e-08, + "loss": 0.0003, + "step": 47937 + }, + { + "epoch": 0.93, + "learning_rate": 1.403440643081822e-08, + "loss": 0.6752, + "step": 47938 + }, + { + "epoch": 0.93, + "learning_rate": 1.4030523086482077e-08, + "loss": 0.0004, + "step": 47939 + }, + { + "epoch": 0.93, + "learning_rate": 1.4026639742145936e-08, + "loss": 0.0003, + "step": 47940 + }, + { + "epoch": 0.93, + "learning_rate": 1.4022756397809792e-08, + "loss": 0.0025, + "step": 47941 + }, + { + "epoch": 0.93, + "learning_rate": 1.401887305347365e-08, + "loss": 0.0007, + "step": 47942 + }, + { + "epoch": 0.93, + "learning_rate": 1.4014989709137509e-08, + "loss": 0.0002, + "step": 47943 + }, + { + "epoch": 0.93, + "learning_rate": 1.4011106364801367e-08, + "loss": 0.0003, + "step": 47944 + }, + { + "epoch": 0.93, + "learning_rate": 1.4007223020465225e-08, + "loss": 0.0005, + "step": 47945 + }, + { + "epoch": 0.93, + "learning_rate": 1.400333967612908e-08, + "loss": 0.0002, + "step": 47946 + }, + { + "epoch": 0.93, + "learning_rate": 1.3999456331792938e-08, + "loss": 0.0004, + "step": 47947 + }, + { + "epoch": 0.93, + "learning_rate": 1.3995572987456797e-08, + "loss": 0.1317, + "step": 47948 + }, + { + "epoch": 0.93, + "learning_rate": 1.3991689643120655e-08, + "loss": 0.0002, + "step": 47949 + }, + { + "epoch": 0.93, + "learning_rate": 1.3987806298784513e-08, + "loss": 0.0004, + "step": 47950 + }, + { + "epoch": 0.93, + "learning_rate": 1.3983922954448371e-08, + "loss": 0.0005, + "step": 47951 + }, + { + "epoch": 0.93, + "learning_rate": 1.398003961011223e-08, + "loss": 0.0003, + "step": 47952 + }, + { + "epoch": 0.93, + "learning_rate": 1.3976156265776084e-08, + "loss": 0.0005, + "step": 47953 + }, + { + "epoch": 0.93, + "learning_rate": 1.3972272921439943e-08, + "loss": 0.0004, + "step": 47954 + }, + { + "epoch": 0.93, + "learning_rate": 1.3968389577103801e-08, + "loss": 0.0011, + "step": 47955 + }, + { + "epoch": 0.93, + "learning_rate": 1.396450623276766e-08, + "loss": 0.0006, + "step": 47956 + }, + { + "epoch": 0.93, + "learning_rate": 1.3960622888431517e-08, + "loss": 0.0008, + "step": 47957 + }, + { + "epoch": 0.93, + "learning_rate": 1.3956739544095376e-08, + "loss": 0.0007, + "step": 47958 + }, + { + "epoch": 0.93, + "learning_rate": 1.3952856199759232e-08, + "loss": 0.9407, + "step": 47959 + }, + { + "epoch": 0.93, + "learning_rate": 1.3948972855423089e-08, + "loss": 0.0003, + "step": 47960 + }, + { + "epoch": 0.93, + "learning_rate": 1.3945089511086947e-08, + "loss": 0.1286, + "step": 47961 + }, + { + "epoch": 0.93, + "learning_rate": 1.3941206166750805e-08, + "loss": 0.0004, + "step": 47962 + }, + { + "epoch": 0.93, + "learning_rate": 1.3937322822414662e-08, + "loss": 0.0004, + "step": 47963 + }, + { + "epoch": 0.93, + "learning_rate": 1.393343947807852e-08, + "loss": 0.0012, + "step": 47964 + }, + { + "epoch": 0.93, + "learning_rate": 1.3929556133742378e-08, + "loss": 0.0007, + "step": 47965 + }, + { + "epoch": 0.93, + "learning_rate": 1.3925672789406237e-08, + "loss": 0.0004, + "step": 47966 + }, + { + "epoch": 0.93, + "learning_rate": 1.3921789445070095e-08, + "loss": 1.2575, + "step": 47967 + }, + { + "epoch": 0.93, + "learning_rate": 1.391790610073395e-08, + "loss": 0.0007, + "step": 47968 + }, + { + "epoch": 0.93, + "learning_rate": 1.3914022756397808e-08, + "loss": 0.0003, + "step": 47969 + }, + { + "epoch": 0.93, + "learning_rate": 1.3910139412061666e-08, + "loss": 0.0004, + "step": 47970 + }, + { + "epoch": 0.93, + "learning_rate": 1.3906256067725525e-08, + "loss": 0.0005, + "step": 47971 + }, + { + "epoch": 0.93, + "learning_rate": 1.3902372723389383e-08, + "loss": 0.0004, + "step": 47972 + }, + { + "epoch": 0.93, + "learning_rate": 1.3898489379053241e-08, + "loss": 0.0005, + "step": 47973 + }, + { + "epoch": 0.93, + "learning_rate": 1.38946060347171e-08, + "loss": 0.0004, + "step": 47974 + }, + { + "epoch": 0.93, + "learning_rate": 1.3890722690380954e-08, + "loss": 0.0004, + "step": 47975 + }, + { + "epoch": 0.93, + "learning_rate": 1.3886839346044813e-08, + "loss": 0.001, + "step": 47976 + }, + { + "epoch": 0.93, + "learning_rate": 1.388295600170867e-08, + "loss": 0.0094, + "step": 47977 + }, + { + "epoch": 0.93, + "learning_rate": 1.3879072657372529e-08, + "loss": 0.0003, + "step": 47978 + }, + { + "epoch": 0.93, + "learning_rate": 1.3875189313036387e-08, + "loss": 0.0004, + "step": 47979 + }, + { + "epoch": 0.93, + "learning_rate": 1.3871305968700246e-08, + "loss": 0.0003, + "step": 47980 + }, + { + "epoch": 0.93, + "learning_rate": 1.3867422624364104e-08, + "loss": 0.0004, + "step": 47981 + }, + { + "epoch": 0.93, + "learning_rate": 1.3863539280027959e-08, + "loss": 0.0005, + "step": 47982 + }, + { + "epoch": 0.93, + "learning_rate": 1.3859655935691817e-08, + "loss": 0.0003, + "step": 47983 + }, + { + "epoch": 0.93, + "learning_rate": 1.3855772591355675e-08, + "loss": 0.0005, + "step": 47984 + }, + { + "epoch": 0.93, + "learning_rate": 1.3851889247019532e-08, + "loss": 0.001, + "step": 47985 + }, + { + "epoch": 0.93, + "learning_rate": 1.384800590268339e-08, + "loss": 0.0005, + "step": 47986 + }, + { + "epoch": 0.93, + "learning_rate": 1.3844122558347248e-08, + "loss": 0.0003, + "step": 47987 + }, + { + "epoch": 0.93, + "learning_rate": 1.3840239214011106e-08, + "loss": 0.0003, + "step": 47988 + }, + { + "epoch": 0.93, + "learning_rate": 1.3836355869674961e-08, + "loss": 0.0003, + "step": 47989 + }, + { + "epoch": 0.93, + "learning_rate": 1.383247252533882e-08, + "loss": 0.0137, + "step": 47990 + }, + { + "epoch": 0.93, + "learning_rate": 1.3828589181002678e-08, + "loss": 0.0037, + "step": 47991 + }, + { + "epoch": 0.93, + "learning_rate": 1.3824705836666536e-08, + "loss": 0.0005, + "step": 47992 + }, + { + "epoch": 0.93, + "learning_rate": 1.3820822492330394e-08, + "loss": 0.0003, + "step": 47993 + }, + { + "epoch": 0.93, + "learning_rate": 1.3816939147994253e-08, + "loss": 0.0003, + "step": 47994 + }, + { + "epoch": 0.93, + "learning_rate": 1.3813055803658111e-08, + "loss": 0.1094, + "step": 47995 + }, + { + "epoch": 0.93, + "learning_rate": 1.3809172459321969e-08, + "loss": 0.0004, + "step": 47996 + }, + { + "epoch": 0.93, + "learning_rate": 1.3805289114985824e-08, + "loss": 0.0006, + "step": 47997 + }, + { + "epoch": 0.93, + "learning_rate": 1.3801405770649682e-08, + "loss": 0.0006, + "step": 47998 + }, + { + "epoch": 0.93, + "learning_rate": 1.379752242631354e-08, + "loss": 0.0004, + "step": 47999 + }, + { + "epoch": 0.93, + "learning_rate": 1.3793639081977399e-08, + "loss": 0.0004, + "step": 48000 + }, + { + "epoch": 0.93, + "learning_rate": 1.3789755737641257e-08, + "loss": 0.001, + "step": 48001 + }, + { + "epoch": 0.93, + "learning_rate": 1.3785872393305115e-08, + "loss": 0.0003, + "step": 48002 + }, + { + "epoch": 0.93, + "learning_rate": 1.3781989048968974e-08, + "loss": 0.0003, + "step": 48003 + }, + { + "epoch": 0.93, + "learning_rate": 1.3778105704632828e-08, + "loss": 0.001, + "step": 48004 + }, + { + "epoch": 0.93, + "learning_rate": 1.3774222360296687e-08, + "loss": 0.0003, + "step": 48005 + }, + { + "epoch": 0.93, + "learning_rate": 1.3770339015960545e-08, + "loss": 0.0005, + "step": 48006 + }, + { + "epoch": 0.93, + "learning_rate": 1.3766455671624402e-08, + "loss": 0.0004, + "step": 48007 + }, + { + "epoch": 0.93, + "learning_rate": 1.376257232728826e-08, + "loss": 0.0004, + "step": 48008 + }, + { + "epoch": 0.93, + "learning_rate": 1.3758688982952118e-08, + "loss": 0.0003, + "step": 48009 + }, + { + "epoch": 0.93, + "learning_rate": 1.3754805638615976e-08, + "loss": 0.0005, + "step": 48010 + }, + { + "epoch": 0.93, + "learning_rate": 1.3750922294279831e-08, + "loss": 0.0003, + "step": 48011 + }, + { + "epoch": 0.93, + "learning_rate": 1.374703894994369e-08, + "loss": 0.0003, + "step": 48012 + }, + { + "epoch": 0.93, + "learning_rate": 1.3743155605607548e-08, + "loss": 0.0251, + "step": 48013 + }, + { + "epoch": 0.93, + "learning_rate": 1.3739272261271406e-08, + "loss": 0.2281, + "step": 48014 + }, + { + "epoch": 0.93, + "learning_rate": 1.3735388916935264e-08, + "loss": 1.2342, + "step": 48015 + }, + { + "epoch": 0.93, + "learning_rate": 1.3731505572599122e-08, + "loss": 0.0004, + "step": 48016 + }, + { + "epoch": 0.93, + "learning_rate": 1.372762222826298e-08, + "loss": 0.0004, + "step": 48017 + }, + { + "epoch": 0.93, + "learning_rate": 1.3723738883926836e-08, + "loss": 0.0005, + "step": 48018 + }, + { + "epoch": 0.93, + "learning_rate": 1.3719855539590694e-08, + "loss": 0.0003, + "step": 48019 + }, + { + "epoch": 0.93, + "learning_rate": 1.3715972195254552e-08, + "loss": 0.0004, + "step": 48020 + }, + { + "epoch": 0.93, + "learning_rate": 1.371208885091841e-08, + "loss": 0.0004, + "step": 48021 + }, + { + "epoch": 0.93, + "learning_rate": 1.3708205506582269e-08, + "loss": 0.0004, + "step": 48022 + }, + { + "epoch": 0.93, + "learning_rate": 1.3704322162246127e-08, + "loss": 0.0004, + "step": 48023 + }, + { + "epoch": 0.93, + "learning_rate": 1.3700438817909985e-08, + "loss": 0.0005, + "step": 48024 + }, + { + "epoch": 0.93, + "learning_rate": 1.3696555473573843e-08, + "loss": 0.0003, + "step": 48025 + }, + { + "epoch": 0.93, + "learning_rate": 1.3692672129237698e-08, + "loss": 0.0003, + "step": 48026 + }, + { + "epoch": 0.93, + "learning_rate": 1.3688788784901557e-08, + "loss": 0.0004, + "step": 48027 + }, + { + "epoch": 0.93, + "learning_rate": 1.3684905440565415e-08, + "loss": 0.0004, + "step": 48028 + }, + { + "epoch": 0.93, + "learning_rate": 1.3681022096229271e-08, + "loss": 0.0003, + "step": 48029 + }, + { + "epoch": 0.93, + "learning_rate": 1.367713875189313e-08, + "loss": 0.0005, + "step": 48030 + }, + { + "epoch": 0.93, + "learning_rate": 1.3673255407556988e-08, + "loss": 0.0004, + "step": 48031 + }, + { + "epoch": 0.93, + "learning_rate": 1.3669372063220846e-08, + "loss": 0.0411, + "step": 48032 + }, + { + "epoch": 0.93, + "learning_rate": 1.3665488718884701e-08, + "loss": 0.0012, + "step": 48033 + }, + { + "epoch": 0.93, + "learning_rate": 1.366160537454856e-08, + "loss": 0.0004, + "step": 48034 + }, + { + "epoch": 0.93, + "learning_rate": 1.3657722030212418e-08, + "loss": 0.0004, + "step": 48035 + }, + { + "epoch": 0.93, + "learning_rate": 1.3653838685876276e-08, + "loss": 0.5215, + "step": 48036 + }, + { + "epoch": 0.93, + "learning_rate": 1.3649955341540134e-08, + "loss": 0.0003, + "step": 48037 + }, + { + "epoch": 0.93, + "learning_rate": 1.3646071997203992e-08, + "loss": 0.0004, + "step": 48038 + }, + { + "epoch": 0.93, + "learning_rate": 1.364218865286785e-08, + "loss": 0.0003, + "step": 48039 + }, + { + "epoch": 0.93, + "learning_rate": 1.3638305308531705e-08, + "loss": 0.0002, + "step": 48040 + }, + { + "epoch": 0.93, + "learning_rate": 1.3634421964195564e-08, + "loss": 0.0007, + "step": 48041 + }, + { + "epoch": 0.93, + "learning_rate": 1.3630538619859422e-08, + "loss": 0.0008, + "step": 48042 + }, + { + "epoch": 0.93, + "learning_rate": 1.362665527552328e-08, + "loss": 0.0004, + "step": 48043 + }, + { + "epoch": 0.93, + "learning_rate": 1.3622771931187138e-08, + "loss": 0.0011, + "step": 48044 + }, + { + "epoch": 0.93, + "learning_rate": 1.3618888586850997e-08, + "loss": 0.0005, + "step": 48045 + }, + { + "epoch": 0.93, + "learning_rate": 1.3615005242514855e-08, + "loss": 0.0003, + "step": 48046 + }, + { + "epoch": 0.93, + "learning_rate": 1.361112189817871e-08, + "loss": 0.0342, + "step": 48047 + }, + { + "epoch": 0.93, + "learning_rate": 1.3607238553842568e-08, + "loss": 0.0003, + "step": 48048 + }, + { + "epoch": 0.93, + "learning_rate": 1.3603355209506426e-08, + "loss": 0.0004, + "step": 48049 + }, + { + "epoch": 0.93, + "learning_rate": 1.3599471865170285e-08, + "loss": 0.3266, + "step": 48050 + }, + { + "epoch": 0.93, + "learning_rate": 1.3595588520834143e-08, + "loss": 0.0004, + "step": 48051 + }, + { + "epoch": 0.93, + "learning_rate": 1.3591705176498e-08, + "loss": 0.0004, + "step": 48052 + }, + { + "epoch": 0.93, + "learning_rate": 1.3587821832161858e-08, + "loss": 0.0003, + "step": 48053 + }, + { + "epoch": 0.93, + "learning_rate": 1.3583938487825716e-08, + "loss": 0.0002, + "step": 48054 + }, + { + "epoch": 0.93, + "learning_rate": 1.358005514348957e-08, + "loss": 0.0003, + "step": 48055 + }, + { + "epoch": 0.93, + "learning_rate": 1.3576171799153429e-08, + "loss": 0.0003, + "step": 48056 + }, + { + "epoch": 0.93, + "learning_rate": 1.3572288454817287e-08, + "loss": 0.0003, + "step": 48057 + }, + { + "epoch": 0.93, + "learning_rate": 1.3568405110481146e-08, + "loss": 1.2975, + "step": 48058 + }, + { + "epoch": 0.93, + "learning_rate": 1.3564521766145004e-08, + "loss": 0.0003, + "step": 48059 + }, + { + "epoch": 0.93, + "learning_rate": 1.3560638421808862e-08, + "loss": 0.0004, + "step": 48060 + }, + { + "epoch": 0.93, + "learning_rate": 1.355675507747272e-08, + "loss": 0.0004, + "step": 48061 + }, + { + "epoch": 0.93, + "learning_rate": 1.3552871733136575e-08, + "loss": 0.0004, + "step": 48062 + }, + { + "epoch": 0.93, + "learning_rate": 1.3548988388800433e-08, + "loss": 0.0004, + "step": 48063 + }, + { + "epoch": 0.93, + "learning_rate": 1.3545105044464292e-08, + "loss": 0.0004, + "step": 48064 + }, + { + "epoch": 0.93, + "learning_rate": 1.354122170012815e-08, + "loss": 0.0004, + "step": 48065 + }, + { + "epoch": 0.93, + "learning_rate": 1.3537338355792008e-08, + "loss": 0.0004, + "step": 48066 + }, + { + "epoch": 0.93, + "learning_rate": 1.3533455011455866e-08, + "loss": 0.0004, + "step": 48067 + }, + { + "epoch": 0.93, + "learning_rate": 1.3529571667119725e-08, + "loss": 0.0004, + "step": 48068 + }, + { + "epoch": 0.93, + "learning_rate": 1.352568832278358e-08, + "loss": 1.1234, + "step": 48069 + }, + { + "epoch": 0.93, + "learning_rate": 1.3521804978447438e-08, + "loss": 0.3484, + "step": 48070 + }, + { + "epoch": 0.93, + "learning_rate": 1.3517921634111296e-08, + "loss": 0.0004, + "step": 48071 + }, + { + "epoch": 0.93, + "learning_rate": 1.3514038289775154e-08, + "loss": 0.0003, + "step": 48072 + }, + { + "epoch": 0.93, + "learning_rate": 1.3510154945439013e-08, + "loss": 0.0005, + "step": 48073 + }, + { + "epoch": 0.93, + "learning_rate": 1.350627160110287e-08, + "loss": 0.0004, + "step": 48074 + }, + { + "epoch": 0.93, + "learning_rate": 1.3502388256766727e-08, + "loss": 0.0004, + "step": 48075 + }, + { + "epoch": 0.93, + "learning_rate": 1.3498504912430584e-08, + "loss": 0.4236, + "step": 48076 + }, + { + "epoch": 0.93, + "learning_rate": 1.349462156809444e-08, + "loss": 0.0003, + "step": 48077 + }, + { + "epoch": 0.93, + "learning_rate": 1.3490738223758299e-08, + "loss": 0.0004, + "step": 48078 + }, + { + "epoch": 0.93, + "learning_rate": 1.3486854879422157e-08, + "loss": 0.0003, + "step": 48079 + }, + { + "epoch": 0.93, + "learning_rate": 1.3482971535086015e-08, + "loss": 0.0002, + "step": 48080 + }, + { + "epoch": 0.93, + "learning_rate": 1.3479088190749874e-08, + "loss": 0.0005, + "step": 48081 + }, + { + "epoch": 0.93, + "learning_rate": 1.3475204846413732e-08, + "loss": 0.0003, + "step": 48082 + }, + { + "epoch": 0.93, + "learning_rate": 1.347132150207759e-08, + "loss": 0.0003, + "step": 48083 + }, + { + "epoch": 0.93, + "learning_rate": 1.3467438157741445e-08, + "loss": 0.0005, + "step": 48084 + }, + { + "epoch": 0.93, + "learning_rate": 1.3463554813405303e-08, + "loss": 0.0005, + "step": 48085 + }, + { + "epoch": 0.93, + "learning_rate": 1.3459671469069161e-08, + "loss": 0.0003, + "step": 48086 + }, + { + "epoch": 0.93, + "learning_rate": 1.345578812473302e-08, + "loss": 0.1704, + "step": 48087 + }, + { + "epoch": 0.93, + "learning_rate": 1.3451904780396878e-08, + "loss": 0.0004, + "step": 48088 + }, + { + "epoch": 0.93, + "learning_rate": 1.3448021436060736e-08, + "loss": 0.0005, + "step": 48089 + }, + { + "epoch": 0.93, + "learning_rate": 1.3444138091724594e-08, + "loss": 0.0005, + "step": 48090 + }, + { + "epoch": 0.93, + "learning_rate": 1.344025474738845e-08, + "loss": 0.0003, + "step": 48091 + }, + { + "epoch": 0.93, + "learning_rate": 1.3436371403052308e-08, + "loss": 0.0003, + "step": 48092 + }, + { + "epoch": 0.93, + "learning_rate": 1.3432488058716166e-08, + "loss": 0.0005, + "step": 48093 + }, + { + "epoch": 0.93, + "learning_rate": 1.3428604714380024e-08, + "loss": 0.0005, + "step": 48094 + }, + { + "epoch": 0.93, + "learning_rate": 1.3424721370043882e-08, + "loss": 0.0004, + "step": 48095 + }, + { + "epoch": 0.93, + "learning_rate": 1.3420838025707739e-08, + "loss": 0.0004, + "step": 48096 + }, + { + "epoch": 0.93, + "learning_rate": 1.3416954681371597e-08, + "loss": 0.0003, + "step": 48097 + }, + { + "epoch": 0.93, + "learning_rate": 1.3413071337035454e-08, + "loss": 0.0005, + "step": 48098 + }, + { + "epoch": 0.93, + "learning_rate": 1.340918799269931e-08, + "loss": 0.0005, + "step": 48099 + }, + { + "epoch": 0.93, + "learning_rate": 1.3405304648363169e-08, + "loss": 0.0003, + "step": 48100 + }, + { + "epoch": 0.93, + "learning_rate": 1.3401421304027027e-08, + "loss": 0.0003, + "step": 48101 + }, + { + "epoch": 0.93, + "learning_rate": 1.3397537959690885e-08, + "loss": 0.0004, + "step": 48102 + }, + { + "epoch": 0.93, + "learning_rate": 1.3393654615354743e-08, + "loss": 0.0004, + "step": 48103 + }, + { + "epoch": 0.93, + "learning_rate": 1.3389771271018602e-08, + "loss": 0.0002, + "step": 48104 + }, + { + "epoch": 0.93, + "learning_rate": 1.3385887926682457e-08, + "loss": 0.0003, + "step": 48105 + }, + { + "epoch": 0.93, + "learning_rate": 1.3382004582346315e-08, + "loss": 0.0005, + "step": 48106 + }, + { + "epoch": 0.93, + "learning_rate": 1.3378121238010173e-08, + "loss": 0.0003, + "step": 48107 + }, + { + "epoch": 0.93, + "learning_rate": 1.3374237893674031e-08, + "loss": 0.0005, + "step": 48108 + }, + { + "epoch": 0.93, + "learning_rate": 1.337035454933789e-08, + "loss": 0.006, + "step": 48109 + }, + { + "epoch": 0.93, + "learning_rate": 1.3366471205001748e-08, + "loss": 0.0006, + "step": 48110 + }, + { + "epoch": 0.93, + "learning_rate": 1.3362587860665606e-08, + "loss": 0.5509, + "step": 48111 + }, + { + "epoch": 0.93, + "learning_rate": 1.3358704516329464e-08, + "loss": 0.0007, + "step": 48112 + }, + { + "epoch": 0.93, + "learning_rate": 1.335482117199332e-08, + "loss": 1.3271, + "step": 48113 + }, + { + "epoch": 0.93, + "learning_rate": 1.3350937827657177e-08, + "loss": 0.0003, + "step": 48114 + }, + { + "epoch": 0.93, + "learning_rate": 1.3347054483321036e-08, + "loss": 0.0004, + "step": 48115 + }, + { + "epoch": 0.93, + "learning_rate": 1.3343171138984894e-08, + "loss": 0.0003, + "step": 48116 + }, + { + "epoch": 0.93, + "learning_rate": 1.3339287794648752e-08, + "loss": 0.0123, + "step": 48117 + }, + { + "epoch": 0.93, + "learning_rate": 1.3335404450312609e-08, + "loss": 0.0309, + "step": 48118 + }, + { + "epoch": 0.93, + "learning_rate": 1.3331521105976467e-08, + "loss": 0.0003, + "step": 48119 + }, + { + "epoch": 0.93, + "learning_rate": 1.3327637761640324e-08, + "loss": 0.6117, + "step": 48120 + }, + { + "epoch": 0.93, + "learning_rate": 1.3323754417304182e-08, + "loss": 0.0005, + "step": 48121 + }, + { + "epoch": 0.93, + "learning_rate": 1.3319871072968038e-08, + "loss": 0.0005, + "step": 48122 + }, + { + "epoch": 0.93, + "learning_rate": 1.3315987728631897e-08, + "loss": 0.0003, + "step": 48123 + }, + { + "epoch": 0.93, + "learning_rate": 1.3312104384295755e-08, + "loss": 0.0003, + "step": 48124 + }, + { + "epoch": 0.93, + "learning_rate": 1.3308221039959613e-08, + "loss": 0.0951, + "step": 48125 + }, + { + "epoch": 0.93, + "learning_rate": 1.3304337695623471e-08, + "loss": 0.0005, + "step": 48126 + }, + { + "epoch": 0.93, + "learning_rate": 1.3300454351287326e-08, + "loss": 0.0119, + "step": 48127 + }, + { + "epoch": 0.93, + "learning_rate": 1.3296571006951185e-08, + "loss": 0.0006, + "step": 48128 + }, + { + "epoch": 0.93, + "learning_rate": 1.3292687662615043e-08, + "loss": 0.0003, + "step": 48129 + }, + { + "epoch": 0.93, + "learning_rate": 1.3288804318278901e-08, + "loss": 0.0003, + "step": 48130 + }, + { + "epoch": 0.93, + "learning_rate": 1.328492097394276e-08, + "loss": 0.0004, + "step": 48131 + }, + { + "epoch": 0.93, + "learning_rate": 1.3281037629606618e-08, + "loss": 0.0003, + "step": 48132 + }, + { + "epoch": 0.93, + "learning_rate": 1.3277154285270476e-08, + "loss": 0.0006, + "step": 48133 + }, + { + "epoch": 0.93, + "learning_rate": 1.327327094093433e-08, + "loss": 0.0005, + "step": 48134 + }, + { + "epoch": 0.93, + "learning_rate": 1.3269387596598189e-08, + "loss": 0.0004, + "step": 48135 + }, + { + "epoch": 0.93, + "learning_rate": 1.3265504252262047e-08, + "loss": 0.0005, + "step": 48136 + }, + { + "epoch": 0.93, + "learning_rate": 1.3261620907925905e-08, + "loss": 0.0914, + "step": 48137 + }, + { + "epoch": 0.93, + "learning_rate": 1.3257737563589764e-08, + "loss": 0.0004, + "step": 48138 + }, + { + "epoch": 0.93, + "learning_rate": 1.3253854219253622e-08, + "loss": 0.0005, + "step": 48139 + }, + { + "epoch": 0.93, + "learning_rate": 1.3249970874917479e-08, + "loss": 0.0004, + "step": 48140 + }, + { + "epoch": 0.93, + "learning_rate": 1.3246087530581337e-08, + "loss": 0.0138, + "step": 48141 + }, + { + "epoch": 0.93, + "learning_rate": 1.3242204186245193e-08, + "loss": 0.0003, + "step": 48142 + }, + { + "epoch": 0.93, + "learning_rate": 1.3238320841909052e-08, + "loss": 0.2398, + "step": 48143 + }, + { + "epoch": 0.93, + "learning_rate": 1.3234437497572908e-08, + "loss": 0.0099, + "step": 48144 + }, + { + "epoch": 0.93, + "learning_rate": 1.3230554153236766e-08, + "loss": 0.0012, + "step": 48145 + }, + { + "epoch": 0.93, + "learning_rate": 1.3226670808900625e-08, + "loss": 0.0005, + "step": 48146 + }, + { + "epoch": 0.93, + "learning_rate": 1.3222787464564483e-08, + "loss": 0.0005, + "step": 48147 + }, + { + "epoch": 0.93, + "learning_rate": 1.3218904120228341e-08, + "loss": 0.0004, + "step": 48148 + }, + { + "epoch": 0.93, + "learning_rate": 1.3215020775892196e-08, + "loss": 0.0004, + "step": 48149 + }, + { + "epoch": 0.93, + "learning_rate": 1.3211137431556054e-08, + "loss": 0.004, + "step": 48150 + }, + { + "epoch": 0.93, + "learning_rate": 1.3207254087219913e-08, + "loss": 0.0015, + "step": 48151 + }, + { + "epoch": 0.93, + "learning_rate": 1.3203370742883771e-08, + "loss": 0.0003, + "step": 48152 + }, + { + "epoch": 0.93, + "learning_rate": 1.3199487398547629e-08, + "loss": 0.0003, + "step": 48153 + }, + { + "epoch": 0.93, + "learning_rate": 1.3195604054211487e-08, + "loss": 0.0787, + "step": 48154 + }, + { + "epoch": 0.93, + "learning_rate": 1.3191720709875346e-08, + "loss": 0.0003, + "step": 48155 + }, + { + "epoch": 0.93, + "learning_rate": 1.31878373655392e-08, + "loss": 0.389, + "step": 48156 + }, + { + "epoch": 0.93, + "learning_rate": 1.3183954021203059e-08, + "loss": 0.0004, + "step": 48157 + }, + { + "epoch": 0.93, + "learning_rate": 1.3180070676866917e-08, + "loss": 0.0003, + "step": 48158 + }, + { + "epoch": 0.93, + "learning_rate": 1.3176187332530775e-08, + "loss": 0.0005, + "step": 48159 + }, + { + "epoch": 0.93, + "learning_rate": 1.3172303988194634e-08, + "loss": 0.0004, + "step": 48160 + }, + { + "epoch": 0.93, + "learning_rate": 1.3168420643858492e-08, + "loss": 0.0004, + "step": 48161 + }, + { + "epoch": 0.93, + "learning_rate": 1.3164537299522348e-08, + "loss": 0.0003, + "step": 48162 + }, + { + "epoch": 0.93, + "learning_rate": 1.3160653955186205e-08, + "loss": 0.0005, + "step": 48163 + }, + { + "epoch": 0.93, + "learning_rate": 1.3156770610850063e-08, + "loss": 0.0006, + "step": 48164 + }, + { + "epoch": 0.93, + "learning_rate": 1.3152887266513921e-08, + "loss": 0.0003, + "step": 48165 + }, + { + "epoch": 0.93, + "learning_rate": 1.3149003922177778e-08, + "loss": 0.0006, + "step": 48166 + }, + { + "epoch": 0.93, + "learning_rate": 1.3145120577841636e-08, + "loss": 0.0083, + "step": 48167 + }, + { + "epoch": 0.93, + "learning_rate": 1.3141237233505495e-08, + "loss": 0.0003, + "step": 48168 + }, + { + "epoch": 0.93, + "learning_rate": 1.3137353889169353e-08, + "loss": 0.0006, + "step": 48169 + }, + { + "epoch": 0.93, + "learning_rate": 1.3133470544833211e-08, + "loss": 0.0545, + "step": 48170 + }, + { + "epoch": 0.93, + "learning_rate": 1.3129587200497066e-08, + "loss": 0.0003, + "step": 48171 + }, + { + "epoch": 0.93, + "learning_rate": 1.3125703856160924e-08, + "loss": 0.0003, + "step": 48172 + }, + { + "epoch": 0.93, + "learning_rate": 1.3121820511824782e-08, + "loss": 0.0004, + "step": 48173 + }, + { + "epoch": 0.93, + "learning_rate": 1.311793716748864e-08, + "loss": 0.0006, + "step": 48174 + }, + { + "epoch": 0.93, + "learning_rate": 1.3114053823152499e-08, + "loss": 0.0244, + "step": 48175 + }, + { + "epoch": 0.93, + "learning_rate": 1.3110170478816357e-08, + "loss": 0.0002, + "step": 48176 + }, + { + "epoch": 0.93, + "learning_rate": 1.3106287134480215e-08, + "loss": 0.0038, + "step": 48177 + }, + { + "epoch": 0.93, + "learning_rate": 1.310240379014407e-08, + "loss": 0.3602, + "step": 48178 + }, + { + "epoch": 0.93, + "learning_rate": 1.3098520445807929e-08, + "loss": 0.0004, + "step": 48179 + }, + { + "epoch": 0.93, + "learning_rate": 1.3094637101471787e-08, + "loss": 0.0002, + "step": 48180 + }, + { + "epoch": 0.93, + "learning_rate": 1.3090753757135645e-08, + "loss": 0.0003, + "step": 48181 + }, + { + "epoch": 0.93, + "learning_rate": 1.3086870412799503e-08, + "loss": 0.0006, + "step": 48182 + }, + { + "epoch": 0.93, + "learning_rate": 1.3082987068463362e-08, + "loss": 0.0003, + "step": 48183 + }, + { + "epoch": 0.93, + "learning_rate": 1.3079103724127218e-08, + "loss": 0.1432, + "step": 48184 + }, + { + "epoch": 0.93, + "learning_rate": 1.3075220379791075e-08, + "loss": 0.0004, + "step": 48185 + }, + { + "epoch": 0.93, + "learning_rate": 1.3071337035454933e-08, + "loss": 0.0015, + "step": 48186 + }, + { + "epoch": 0.93, + "learning_rate": 1.3067453691118791e-08, + "loss": 0.0003, + "step": 48187 + }, + { + "epoch": 0.93, + "learning_rate": 1.3063570346782648e-08, + "loss": 0.0005, + "step": 48188 + }, + { + "epoch": 0.93, + "learning_rate": 1.3059687002446506e-08, + "loss": 0.0004, + "step": 48189 + }, + { + "epoch": 0.93, + "learning_rate": 1.3055803658110364e-08, + "loss": 0.0007, + "step": 48190 + }, + { + "epoch": 0.93, + "learning_rate": 1.3051920313774223e-08, + "loss": 0.0004, + "step": 48191 + }, + { + "epoch": 0.93, + "learning_rate": 1.3048036969438077e-08, + "loss": 0.8867, + "step": 48192 + }, + { + "epoch": 0.93, + "learning_rate": 1.3044153625101936e-08, + "loss": 0.0003, + "step": 48193 + }, + { + "epoch": 0.93, + "learning_rate": 1.3040270280765794e-08, + "loss": 0.0003, + "step": 48194 + }, + { + "epoch": 0.93, + "learning_rate": 1.3036386936429652e-08, + "loss": 0.0332, + "step": 48195 + }, + { + "epoch": 0.93, + "learning_rate": 1.303250359209351e-08, + "loss": 0.0004, + "step": 48196 + }, + { + "epoch": 0.93, + "learning_rate": 1.3028620247757369e-08, + "loss": 0.0004, + "step": 48197 + }, + { + "epoch": 0.93, + "learning_rate": 1.3024736903421227e-08, + "loss": 0.0003, + "step": 48198 + }, + { + "epoch": 0.93, + "learning_rate": 1.3020853559085085e-08, + "loss": 0.0004, + "step": 48199 + }, + { + "epoch": 0.93, + "learning_rate": 1.301697021474894e-08, + "loss": 0.0004, + "step": 48200 + }, + { + "epoch": 0.93, + "learning_rate": 1.3013086870412798e-08, + "loss": 0.0007, + "step": 48201 + }, + { + "epoch": 0.94, + "learning_rate": 1.3009203526076657e-08, + "loss": 0.0004, + "step": 48202 + }, + { + "epoch": 0.94, + "learning_rate": 1.3005320181740515e-08, + "loss": 0.0006, + "step": 48203 + }, + { + "epoch": 0.94, + "learning_rate": 1.3001436837404373e-08, + "loss": 0.0005, + "step": 48204 + }, + { + "epoch": 0.94, + "learning_rate": 1.2997553493068231e-08, + "loss": 0.0005, + "step": 48205 + }, + { + "epoch": 0.94, + "learning_rate": 1.2993670148732088e-08, + "loss": 0.0006, + "step": 48206 + }, + { + "epoch": 0.94, + "learning_rate": 1.2989786804395945e-08, + "loss": 0.0016, + "step": 48207 + }, + { + "epoch": 0.94, + "learning_rate": 1.2985903460059803e-08, + "loss": 0.0004, + "step": 48208 + }, + { + "epoch": 0.94, + "learning_rate": 1.2982020115723661e-08, + "loss": 0.0003, + "step": 48209 + }, + { + "epoch": 0.94, + "learning_rate": 1.2978136771387518e-08, + "loss": 0.0003, + "step": 48210 + }, + { + "epoch": 0.94, + "learning_rate": 1.2974253427051376e-08, + "loss": 0.0004, + "step": 48211 + }, + { + "epoch": 0.94, + "learning_rate": 1.2970370082715234e-08, + "loss": 0.0395, + "step": 48212 + }, + { + "epoch": 0.94, + "learning_rate": 1.2966486738379092e-08, + "loss": 0.0004, + "step": 48213 + }, + { + "epoch": 0.94, + "learning_rate": 1.2962603394042947e-08, + "loss": 0.0002, + "step": 48214 + }, + { + "epoch": 0.94, + "learning_rate": 1.2958720049706806e-08, + "loss": 0.0004, + "step": 48215 + }, + { + "epoch": 0.94, + "learning_rate": 1.2954836705370664e-08, + "loss": 0.0003, + "step": 48216 + }, + { + "epoch": 0.94, + "learning_rate": 1.2950953361034522e-08, + "loss": 0.0003, + "step": 48217 + }, + { + "epoch": 0.94, + "learning_rate": 1.294707001669838e-08, + "loss": 0.0004, + "step": 48218 + }, + { + "epoch": 0.94, + "learning_rate": 1.2943186672362239e-08, + "loss": 0.0003, + "step": 48219 + }, + { + "epoch": 0.94, + "learning_rate": 1.2939303328026097e-08, + "loss": 0.0004, + "step": 48220 + }, + { + "epoch": 0.94, + "learning_rate": 1.2935419983689952e-08, + "loss": 0.0004, + "step": 48221 + }, + { + "epoch": 0.94, + "learning_rate": 1.293153663935381e-08, + "loss": 0.0003, + "step": 48222 + }, + { + "epoch": 0.94, + "learning_rate": 1.2927653295017668e-08, + "loss": 0.0004, + "step": 48223 + }, + { + "epoch": 0.94, + "learning_rate": 1.2923769950681526e-08, + "loss": 0.0005, + "step": 48224 + }, + { + "epoch": 0.94, + "learning_rate": 1.2919886606345385e-08, + "loss": 0.0003, + "step": 48225 + }, + { + "epoch": 0.94, + "learning_rate": 1.2916003262009243e-08, + "loss": 0.9344, + "step": 48226 + }, + { + "epoch": 0.94, + "learning_rate": 1.2912119917673101e-08, + "loss": 0.0004, + "step": 48227 + }, + { + "epoch": 0.94, + "learning_rate": 1.290823657333696e-08, + "loss": 0.0007, + "step": 48228 + }, + { + "epoch": 0.94, + "learning_rate": 1.2904353229000814e-08, + "loss": 0.0005, + "step": 48229 + }, + { + "epoch": 0.94, + "learning_rate": 1.2900469884664673e-08, + "loss": 0.001, + "step": 48230 + }, + { + "epoch": 0.94, + "learning_rate": 1.289658654032853e-08, + "loss": 0.0006, + "step": 48231 + }, + { + "epoch": 0.94, + "learning_rate": 1.2892703195992387e-08, + "loss": 0.8032, + "step": 48232 + }, + { + "epoch": 0.94, + "learning_rate": 1.2888819851656246e-08, + "loss": 0.0003, + "step": 48233 + }, + { + "epoch": 0.94, + "learning_rate": 1.2884936507320104e-08, + "loss": 0.0003, + "step": 48234 + }, + { + "epoch": 0.94, + "learning_rate": 1.2881053162983962e-08, + "loss": 0.0004, + "step": 48235 + }, + { + "epoch": 0.94, + "learning_rate": 1.2877169818647817e-08, + "loss": 0.0004, + "step": 48236 + }, + { + "epoch": 0.94, + "learning_rate": 1.2873286474311675e-08, + "loss": 0.0003, + "step": 48237 + }, + { + "epoch": 0.94, + "learning_rate": 1.2869403129975534e-08, + "loss": 0.509, + "step": 48238 + }, + { + "epoch": 0.94, + "learning_rate": 1.2865519785639392e-08, + "loss": 0.0004, + "step": 48239 + }, + { + "epoch": 0.94, + "learning_rate": 1.286163644130325e-08, + "loss": 0.0004, + "step": 48240 + }, + { + "epoch": 0.94, + "learning_rate": 1.2857753096967108e-08, + "loss": 0.0007, + "step": 48241 + }, + { + "epoch": 0.94, + "learning_rate": 1.2853869752630967e-08, + "loss": 0.0003, + "step": 48242 + }, + { + "epoch": 0.94, + "learning_rate": 1.2849986408294821e-08, + "loss": 0.0005, + "step": 48243 + }, + { + "epoch": 0.94, + "learning_rate": 1.284610306395868e-08, + "loss": 0.0004, + "step": 48244 + }, + { + "epoch": 0.94, + "learning_rate": 1.2842219719622538e-08, + "loss": 0.0004, + "step": 48245 + }, + { + "epoch": 0.94, + "learning_rate": 1.2838336375286396e-08, + "loss": 0.0005, + "step": 48246 + }, + { + "epoch": 0.94, + "learning_rate": 1.2834453030950254e-08, + "loss": 0.0004, + "step": 48247 + }, + { + "epoch": 0.94, + "learning_rate": 1.2830569686614113e-08, + "loss": 0.0003, + "step": 48248 + }, + { + "epoch": 0.94, + "learning_rate": 1.2826686342277971e-08, + "loss": 0.0004, + "step": 48249 + }, + { + "epoch": 0.94, + "learning_rate": 1.2822802997941826e-08, + "loss": 0.0004, + "step": 48250 + }, + { + "epoch": 0.94, + "learning_rate": 1.2818919653605684e-08, + "loss": 0.002, + "step": 48251 + }, + { + "epoch": 0.94, + "learning_rate": 1.2815036309269542e-08, + "loss": 0.0004, + "step": 48252 + }, + { + "epoch": 0.94, + "learning_rate": 1.28111529649334e-08, + "loss": 0.0007, + "step": 48253 + }, + { + "epoch": 0.94, + "learning_rate": 1.2807269620597257e-08, + "loss": 0.0009, + "step": 48254 + }, + { + "epoch": 0.94, + "learning_rate": 1.2803386276261115e-08, + "loss": 0.008, + "step": 48255 + }, + { + "epoch": 0.94, + "learning_rate": 1.2799502931924974e-08, + "loss": 0.0007, + "step": 48256 + }, + { + "epoch": 0.94, + "learning_rate": 1.2795619587588832e-08, + "loss": 0.0004, + "step": 48257 + }, + { + "epoch": 0.94, + "learning_rate": 1.2791736243252687e-08, + "loss": 0.0003, + "step": 48258 + }, + { + "epoch": 0.94, + "learning_rate": 1.2787852898916545e-08, + "loss": 0.0004, + "step": 48259 + }, + { + "epoch": 0.94, + "learning_rate": 1.2783969554580403e-08, + "loss": 0.0008, + "step": 48260 + }, + { + "epoch": 0.94, + "learning_rate": 1.2780086210244262e-08, + "loss": 0.0005, + "step": 48261 + }, + { + "epoch": 0.94, + "learning_rate": 1.277620286590812e-08, + "loss": 0.0561, + "step": 48262 + }, + { + "epoch": 0.94, + "learning_rate": 1.2772319521571978e-08, + "loss": 0.0005, + "step": 48263 + }, + { + "epoch": 0.94, + "learning_rate": 1.2768436177235836e-08, + "loss": 0.0004, + "step": 48264 + }, + { + "epoch": 0.94, + "learning_rate": 1.2764552832899691e-08, + "loss": 0.0003, + "step": 48265 + }, + { + "epoch": 0.94, + "learning_rate": 1.276066948856355e-08, + "loss": 0.0004, + "step": 48266 + }, + { + "epoch": 0.94, + "learning_rate": 1.2756786144227408e-08, + "loss": 0.006, + "step": 48267 + }, + { + "epoch": 0.94, + "learning_rate": 1.2752902799891266e-08, + "loss": 0.0004, + "step": 48268 + }, + { + "epoch": 0.94, + "learning_rate": 1.2749019455555124e-08, + "loss": 0.0003, + "step": 48269 + }, + { + "epoch": 0.94, + "learning_rate": 1.2745136111218983e-08, + "loss": 0.0005, + "step": 48270 + }, + { + "epoch": 0.94, + "learning_rate": 1.274125276688284e-08, + "loss": 0.0003, + "step": 48271 + }, + { + "epoch": 0.94, + "learning_rate": 1.2737369422546696e-08, + "loss": 0.0005, + "step": 48272 + }, + { + "epoch": 0.94, + "learning_rate": 1.2733486078210554e-08, + "loss": 0.0003, + "step": 48273 + }, + { + "epoch": 0.94, + "learning_rate": 1.2729602733874412e-08, + "loss": 0.0004, + "step": 48274 + }, + { + "epoch": 0.94, + "learning_rate": 1.272571938953827e-08, + "loss": 0.0004, + "step": 48275 + }, + { + "epoch": 0.94, + "learning_rate": 1.2721836045202127e-08, + "loss": 2.0929, + "step": 48276 + }, + { + "epoch": 0.94, + "learning_rate": 1.2717952700865985e-08, + "loss": 0.2598, + "step": 48277 + }, + { + "epoch": 0.94, + "learning_rate": 1.2714069356529843e-08, + "loss": 1.1384, + "step": 48278 + }, + { + "epoch": 0.94, + "learning_rate": 1.27101860121937e-08, + "loss": 0.0003, + "step": 48279 + }, + { + "epoch": 0.94, + "learning_rate": 1.2706302667857557e-08, + "loss": 0.7397, + "step": 48280 + }, + { + "epoch": 0.94, + "learning_rate": 1.2702419323521415e-08, + "loss": 0.0017, + "step": 48281 + }, + { + "epoch": 0.94, + "learning_rate": 1.2698535979185273e-08, + "loss": 0.0298, + "step": 48282 + }, + { + "epoch": 0.94, + "learning_rate": 1.2694652634849131e-08, + "loss": 0.0003, + "step": 48283 + }, + { + "epoch": 0.94, + "learning_rate": 1.269076929051299e-08, + "loss": 0.0003, + "step": 48284 + }, + { + "epoch": 0.94, + "learning_rate": 1.2686885946176848e-08, + "loss": 0.0003, + "step": 48285 + }, + { + "epoch": 0.94, + "learning_rate": 1.2683002601840706e-08, + "loss": 0.0004, + "step": 48286 + }, + { + "epoch": 0.94, + "learning_rate": 1.2679119257504561e-08, + "loss": 0.0005, + "step": 48287 + }, + { + "epoch": 0.94, + "learning_rate": 1.267523591316842e-08, + "loss": 0.0016, + "step": 48288 + }, + { + "epoch": 0.94, + "learning_rate": 1.2671352568832278e-08, + "loss": 0.0014, + "step": 48289 + }, + { + "epoch": 0.94, + "learning_rate": 1.2667469224496136e-08, + "loss": 0.6529, + "step": 48290 + }, + { + "epoch": 0.94, + "learning_rate": 1.2663585880159994e-08, + "loss": 0.0003, + "step": 48291 + }, + { + "epoch": 0.94, + "learning_rate": 1.2659702535823852e-08, + "loss": 0.0004, + "step": 48292 + }, + { + "epoch": 0.94, + "learning_rate": 1.265581919148771e-08, + "loss": 0.0042, + "step": 48293 + }, + { + "epoch": 0.94, + "learning_rate": 1.2651935847151565e-08, + "loss": 0.0005, + "step": 48294 + }, + { + "epoch": 0.94, + "learning_rate": 1.2648052502815424e-08, + "loss": 0.0003, + "step": 48295 + }, + { + "epoch": 0.94, + "learning_rate": 1.2644169158479282e-08, + "loss": 0.0005, + "step": 48296 + }, + { + "epoch": 0.94, + "learning_rate": 1.264028581414314e-08, + "loss": 0.0003, + "step": 48297 + }, + { + "epoch": 0.94, + "learning_rate": 1.2636402469806998e-08, + "loss": 0.0003, + "step": 48298 + }, + { + "epoch": 0.94, + "learning_rate": 1.2632519125470855e-08, + "loss": 0.0002, + "step": 48299 + }, + { + "epoch": 0.94, + "learning_rate": 1.2628635781134713e-08, + "loss": 0.0003, + "step": 48300 + }, + { + "epoch": 0.94, + "learning_rate": 1.262475243679857e-08, + "loss": 0.0003, + "step": 48301 + }, + { + "epoch": 0.94, + "learning_rate": 1.2620869092462426e-08, + "loss": 1.0387, + "step": 48302 + }, + { + "epoch": 0.94, + "learning_rate": 1.2616985748126285e-08, + "loss": 0.0003, + "step": 48303 + }, + { + "epoch": 0.94, + "learning_rate": 1.2613102403790143e-08, + "loss": 0.0003, + "step": 48304 + }, + { + "epoch": 0.94, + "learning_rate": 1.2609219059454001e-08, + "loss": 0.0003, + "step": 48305 + }, + { + "epoch": 0.94, + "learning_rate": 1.260533571511786e-08, + "loss": 0.0004, + "step": 48306 + }, + { + "epoch": 0.94, + "learning_rate": 1.2601452370781718e-08, + "loss": 0.0003, + "step": 48307 + }, + { + "epoch": 0.94, + "learning_rate": 1.2597569026445573e-08, + "loss": 0.0003, + "step": 48308 + }, + { + "epoch": 0.94, + "learning_rate": 1.2593685682109431e-08, + "loss": 0.0003, + "step": 48309 + }, + { + "epoch": 0.94, + "learning_rate": 1.2589802337773289e-08, + "loss": 0.0003, + "step": 48310 + }, + { + "epoch": 0.94, + "learning_rate": 1.2585918993437147e-08, + "loss": 0.0004, + "step": 48311 + }, + { + "epoch": 0.94, + "learning_rate": 1.2582035649101006e-08, + "loss": 0.8693, + "step": 48312 + }, + { + "epoch": 0.94, + "learning_rate": 1.2578152304764864e-08, + "loss": 0.0003, + "step": 48313 + }, + { + "epoch": 0.94, + "learning_rate": 1.2574268960428722e-08, + "loss": 0.0004, + "step": 48314 + }, + { + "epoch": 0.94, + "learning_rate": 1.257038561609258e-08, + "loss": 0.0004, + "step": 48315 + }, + { + "epoch": 0.94, + "learning_rate": 1.2566502271756435e-08, + "loss": 0.0004, + "step": 48316 + }, + { + "epoch": 0.94, + "learning_rate": 1.2562618927420294e-08, + "loss": 0.0106, + "step": 48317 + }, + { + "epoch": 0.94, + "learning_rate": 1.2558735583084152e-08, + "loss": 0.0004, + "step": 48318 + }, + { + "epoch": 0.94, + "learning_rate": 1.255485223874801e-08, + "loss": 0.001, + "step": 48319 + }, + { + "epoch": 0.94, + "learning_rate": 1.2550968894411868e-08, + "loss": 0.025, + "step": 48320 + }, + { + "epoch": 0.94, + "learning_rate": 1.2547085550075725e-08, + "loss": 0.0012, + "step": 48321 + }, + { + "epoch": 0.94, + "learning_rate": 1.2543202205739583e-08, + "loss": 0.0004, + "step": 48322 + }, + { + "epoch": 0.94, + "learning_rate": 1.253931886140344e-08, + "loss": 1.4064, + "step": 48323 + }, + { + "epoch": 0.94, + "learning_rate": 1.2535435517067296e-08, + "loss": 0.0004, + "step": 48324 + }, + { + "epoch": 0.94, + "learning_rate": 1.2531552172731155e-08, + "loss": 0.0003, + "step": 48325 + }, + { + "epoch": 0.94, + "learning_rate": 1.2527668828395013e-08, + "loss": 0.0004, + "step": 48326 + }, + { + "epoch": 0.94, + "learning_rate": 1.2523785484058871e-08, + "loss": 0.0007, + "step": 48327 + }, + { + "epoch": 0.94, + "learning_rate": 1.251990213972273e-08, + "loss": 1.0441, + "step": 48328 + }, + { + "epoch": 0.94, + "learning_rate": 1.2516018795386587e-08, + "loss": 0.0005, + "step": 48329 + }, + { + "epoch": 0.94, + "learning_rate": 1.2512135451050442e-08, + "loss": 0.0005, + "step": 48330 + }, + { + "epoch": 0.94, + "learning_rate": 1.25082521067143e-08, + "loss": 0.0004, + "step": 48331 + }, + { + "epoch": 0.94, + "learning_rate": 1.2504368762378159e-08, + "loss": 0.0106, + "step": 48332 + }, + { + "epoch": 0.94, + "learning_rate": 1.2500485418042017e-08, + "loss": 0.0005, + "step": 48333 + }, + { + "epoch": 0.94, + "learning_rate": 1.2496602073705875e-08, + "loss": 0.0003, + "step": 48334 + }, + { + "epoch": 0.94, + "learning_rate": 1.2492718729369732e-08, + "loss": 0.0004, + "step": 48335 + }, + { + "epoch": 0.94, + "learning_rate": 1.248883538503359e-08, + "loss": 0.0005, + "step": 48336 + }, + { + "epoch": 0.94, + "learning_rate": 1.2484952040697448e-08, + "loss": 0.0003, + "step": 48337 + }, + { + "epoch": 0.94, + "learning_rate": 1.2481068696361307e-08, + "loss": 1.4954, + "step": 48338 + }, + { + "epoch": 0.94, + "learning_rate": 1.2477185352025163e-08, + "loss": 0.0004, + "step": 48339 + }, + { + "epoch": 0.94, + "learning_rate": 1.2473302007689022e-08, + "loss": 0.0006, + "step": 48340 + }, + { + "epoch": 0.94, + "learning_rate": 1.246941866335288e-08, + "loss": 0.0006, + "step": 48341 + }, + { + "epoch": 0.94, + "learning_rate": 1.2465535319016738e-08, + "loss": 0.0004, + "step": 48342 + }, + { + "epoch": 0.94, + "learning_rate": 1.2461651974680595e-08, + "loss": 0.0008, + "step": 48343 + }, + { + "epoch": 0.94, + "learning_rate": 1.2457768630344453e-08, + "loss": 0.0008, + "step": 48344 + }, + { + "epoch": 0.94, + "learning_rate": 1.245388528600831e-08, + "loss": 0.0004, + "step": 48345 + }, + { + "epoch": 0.94, + "learning_rate": 1.2450001941672168e-08, + "loss": 0.0005, + "step": 48346 + }, + { + "epoch": 0.94, + "learning_rate": 1.2446118597336024e-08, + "loss": 0.0004, + "step": 48347 + }, + { + "epoch": 0.94, + "learning_rate": 1.2442235252999883e-08, + "loss": 0.0005, + "step": 48348 + }, + { + "epoch": 0.94, + "learning_rate": 1.243835190866374e-08, + "loss": 0.0004, + "step": 48349 + }, + { + "epoch": 0.94, + "learning_rate": 1.2434468564327597e-08, + "loss": 0.0003, + "step": 48350 + }, + { + "epoch": 0.94, + "learning_rate": 1.2430585219991456e-08, + "loss": 0.0057, + "step": 48351 + }, + { + "epoch": 0.94, + "learning_rate": 1.2426701875655314e-08, + "loss": 0.0005, + "step": 48352 + }, + { + "epoch": 0.94, + "learning_rate": 1.2422818531319172e-08, + "loss": 0.0004, + "step": 48353 + }, + { + "epoch": 0.94, + "learning_rate": 1.2418935186983029e-08, + "loss": 0.0005, + "step": 48354 + }, + { + "epoch": 0.94, + "learning_rate": 1.2415051842646887e-08, + "loss": 0.0005, + "step": 48355 + }, + { + "epoch": 0.94, + "learning_rate": 1.2411168498310745e-08, + "loss": 0.0034, + "step": 48356 + }, + { + "epoch": 0.94, + "learning_rate": 1.2407285153974602e-08, + "loss": 0.0009, + "step": 48357 + }, + { + "epoch": 0.94, + "learning_rate": 1.240340180963846e-08, + "loss": 0.0009, + "step": 48358 + }, + { + "epoch": 0.94, + "learning_rate": 1.2399518465302318e-08, + "loss": 0.0029, + "step": 48359 + }, + { + "epoch": 0.94, + "learning_rate": 1.2395635120966177e-08, + "loss": 0.0002, + "step": 48360 + }, + { + "epoch": 0.94, + "learning_rate": 1.2391751776630033e-08, + "loss": 0.0063, + "step": 48361 + }, + { + "epoch": 0.94, + "learning_rate": 1.2387868432293891e-08, + "loss": 0.0026, + "step": 48362 + }, + { + "epoch": 0.94, + "learning_rate": 1.238398508795775e-08, + "loss": 0.0004, + "step": 48363 + }, + { + "epoch": 0.94, + "learning_rate": 1.2380101743621606e-08, + "loss": 0.0005, + "step": 48364 + }, + { + "epoch": 0.94, + "learning_rate": 1.2376218399285464e-08, + "loss": 0.0003, + "step": 48365 + }, + { + "epoch": 0.94, + "learning_rate": 1.2372335054949323e-08, + "loss": 0.0003, + "step": 48366 + }, + { + "epoch": 0.94, + "learning_rate": 1.236845171061318e-08, + "loss": 0.0004, + "step": 48367 + }, + { + "epoch": 0.94, + "learning_rate": 1.2364568366277038e-08, + "loss": 0.0004, + "step": 48368 + }, + { + "epoch": 0.94, + "learning_rate": 1.2360685021940894e-08, + "loss": 0.0003, + "step": 48369 + }, + { + "epoch": 0.94, + "learning_rate": 1.2356801677604752e-08, + "loss": 0.0003, + "step": 48370 + }, + { + "epoch": 0.94, + "learning_rate": 1.235291833326861e-08, + "loss": 0.0004, + "step": 48371 + }, + { + "epoch": 0.94, + "learning_rate": 1.2349034988932467e-08, + "loss": 0.001, + "step": 48372 + }, + { + "epoch": 0.94, + "learning_rate": 1.2345151644596325e-08, + "loss": 0.0003, + "step": 48373 + }, + { + "epoch": 0.94, + "learning_rate": 1.2341268300260184e-08, + "loss": 0.0266, + "step": 48374 + }, + { + "epoch": 0.94, + "learning_rate": 1.233738495592404e-08, + "loss": 0.0004, + "step": 48375 + }, + { + "epoch": 0.94, + "learning_rate": 1.2333501611587898e-08, + "loss": 0.0003, + "step": 48376 + }, + { + "epoch": 0.94, + "learning_rate": 1.2329618267251757e-08, + "loss": 0.0003, + "step": 48377 + }, + { + "epoch": 0.94, + "learning_rate": 1.2325734922915615e-08, + "loss": 0.0003, + "step": 48378 + }, + { + "epoch": 0.94, + "learning_rate": 1.2321851578579472e-08, + "loss": 0.0005, + "step": 48379 + }, + { + "epoch": 0.94, + "learning_rate": 1.231796823424333e-08, + "loss": 0.0003, + "step": 48380 + }, + { + "epoch": 0.94, + "learning_rate": 1.2314084889907188e-08, + "loss": 0.0004, + "step": 48381 + }, + { + "epoch": 0.94, + "learning_rate": 1.2310201545571046e-08, + "loss": 0.0003, + "step": 48382 + }, + { + "epoch": 0.94, + "learning_rate": 1.2306318201234903e-08, + "loss": 0.0003, + "step": 48383 + }, + { + "epoch": 0.94, + "learning_rate": 1.2302434856898761e-08, + "loss": 0.8494, + "step": 48384 + }, + { + "epoch": 0.94, + "learning_rate": 1.229855151256262e-08, + "loss": 0.0004, + "step": 48385 + }, + { + "epoch": 0.94, + "learning_rate": 1.2294668168226476e-08, + "loss": 0.0003, + "step": 48386 + }, + { + "epoch": 0.94, + "learning_rate": 1.2290784823890334e-08, + "loss": 0.0003, + "step": 48387 + }, + { + "epoch": 0.94, + "learning_rate": 1.2286901479554192e-08, + "loss": 0.0003, + "step": 48388 + }, + { + "epoch": 0.94, + "learning_rate": 1.2283018135218049e-08, + "loss": 0.6798, + "step": 48389 + }, + { + "epoch": 0.94, + "learning_rate": 1.2279134790881907e-08, + "loss": 0.0003, + "step": 48390 + }, + { + "epoch": 0.94, + "learning_rate": 1.2275251446545764e-08, + "loss": 0.0005, + "step": 48391 + }, + { + "epoch": 0.94, + "learning_rate": 1.2271368102209622e-08, + "loss": 0.0006, + "step": 48392 + }, + { + "epoch": 0.94, + "learning_rate": 1.2267484757873479e-08, + "loss": 0.0004, + "step": 48393 + }, + { + "epoch": 0.94, + "learning_rate": 1.2263601413537337e-08, + "loss": 0.0004, + "step": 48394 + }, + { + "epoch": 0.94, + "learning_rate": 1.2259718069201195e-08, + "loss": 0.0003, + "step": 48395 + }, + { + "epoch": 0.94, + "learning_rate": 1.2255834724865053e-08, + "loss": 0.3657, + "step": 48396 + }, + { + "epoch": 0.94, + "learning_rate": 1.225195138052891e-08, + "loss": 0.0098, + "step": 48397 + }, + { + "epoch": 0.94, + "learning_rate": 1.2248068036192768e-08, + "loss": 0.0003, + "step": 48398 + }, + { + "epoch": 0.94, + "learning_rate": 1.2244184691856627e-08, + "loss": 0.0005, + "step": 48399 + }, + { + "epoch": 0.94, + "learning_rate": 1.2240301347520485e-08, + "loss": 0.0003, + "step": 48400 + }, + { + "epoch": 0.94, + "learning_rate": 1.2236418003184341e-08, + "loss": 0.6418, + "step": 48401 + }, + { + "epoch": 0.94, + "learning_rate": 1.22325346588482e-08, + "loss": 0.0004, + "step": 48402 + }, + { + "epoch": 0.94, + "learning_rate": 1.2228651314512058e-08, + "loss": 0.0006, + "step": 48403 + }, + { + "epoch": 0.94, + "learning_rate": 1.2224767970175914e-08, + "loss": 0.0003, + "step": 48404 + }, + { + "epoch": 0.94, + "learning_rate": 1.2220884625839773e-08, + "loss": 0.0005, + "step": 48405 + }, + { + "epoch": 0.94, + "learning_rate": 1.2217001281503631e-08, + "loss": 0.0004, + "step": 48406 + }, + { + "epoch": 0.94, + "learning_rate": 1.221311793716749e-08, + "loss": 0.0004, + "step": 48407 + }, + { + "epoch": 0.94, + "learning_rate": 1.2209234592831346e-08, + "loss": 0.2787, + "step": 48408 + }, + { + "epoch": 0.94, + "learning_rate": 1.2205351248495204e-08, + "loss": 0.0006, + "step": 48409 + }, + { + "epoch": 0.94, + "learning_rate": 1.2201467904159062e-08, + "loss": 0.0003, + "step": 48410 + }, + { + "epoch": 0.94, + "learning_rate": 1.2197584559822919e-08, + "loss": 0.0003, + "step": 48411 + }, + { + "epoch": 0.94, + "learning_rate": 1.2193701215486777e-08, + "loss": 0.0003, + "step": 48412 + }, + { + "epoch": 0.94, + "learning_rate": 1.2189817871150634e-08, + "loss": 0.0004, + "step": 48413 + }, + { + "epoch": 0.94, + "learning_rate": 1.2185934526814492e-08, + "loss": 0.0005, + "step": 48414 + }, + { + "epoch": 0.94, + "learning_rate": 1.2182051182478349e-08, + "loss": 0.0011, + "step": 48415 + }, + { + "epoch": 0.94, + "learning_rate": 1.2178167838142207e-08, + "loss": 0.0009, + "step": 48416 + }, + { + "epoch": 0.94, + "learning_rate": 1.2174284493806065e-08, + "loss": 0.0005, + "step": 48417 + }, + { + "epoch": 0.94, + "learning_rate": 1.2170401149469923e-08, + "loss": 0.0004, + "step": 48418 + }, + { + "epoch": 0.94, + "learning_rate": 1.216651780513378e-08, + "loss": 0.0003, + "step": 48419 + }, + { + "epoch": 0.94, + "learning_rate": 1.2162634460797638e-08, + "loss": 0.0004, + "step": 48420 + }, + { + "epoch": 0.94, + "learning_rate": 1.2158751116461496e-08, + "loss": 0.0011, + "step": 48421 + }, + { + "epoch": 0.94, + "learning_rate": 1.2154867772125353e-08, + "loss": 0.0004, + "step": 48422 + }, + { + "epoch": 0.94, + "learning_rate": 1.2150984427789211e-08, + "loss": 0.0002, + "step": 48423 + }, + { + "epoch": 0.94, + "learning_rate": 1.214710108345307e-08, + "loss": 0.0005, + "step": 48424 + }, + { + "epoch": 0.94, + "learning_rate": 1.2143217739116928e-08, + "loss": 0.0002, + "step": 48425 + }, + { + "epoch": 0.94, + "learning_rate": 1.2139334394780784e-08, + "loss": 0.0002, + "step": 48426 + }, + { + "epoch": 0.94, + "learning_rate": 1.2135451050444642e-08, + "loss": 0.0005, + "step": 48427 + }, + { + "epoch": 0.94, + "learning_rate": 1.21315677061085e-08, + "loss": 0.0005, + "step": 48428 + }, + { + "epoch": 0.94, + "learning_rate": 1.2127684361772359e-08, + "loss": 0.0005, + "step": 48429 + }, + { + "epoch": 0.94, + "learning_rate": 1.2123801017436216e-08, + "loss": 0.0004, + "step": 48430 + }, + { + "epoch": 0.94, + "learning_rate": 1.2119917673100074e-08, + "loss": 0.0004, + "step": 48431 + }, + { + "epoch": 0.94, + "learning_rate": 1.2116034328763932e-08, + "loss": 0.0003, + "step": 48432 + }, + { + "epoch": 0.94, + "learning_rate": 1.2112150984427789e-08, + "loss": 0.0004, + "step": 48433 + }, + { + "epoch": 0.94, + "learning_rate": 1.2108267640091647e-08, + "loss": 0.1088, + "step": 48434 + }, + { + "epoch": 0.94, + "learning_rate": 1.2104384295755503e-08, + "loss": 0.0004, + "step": 48435 + }, + { + "epoch": 0.94, + "learning_rate": 1.2100500951419362e-08, + "loss": 0.0003, + "step": 48436 + }, + { + "epoch": 0.94, + "learning_rate": 1.2096617607083218e-08, + "loss": 0.0004, + "step": 48437 + }, + { + "epoch": 0.94, + "learning_rate": 1.2092734262747077e-08, + "loss": 0.0005, + "step": 48438 + }, + { + "epoch": 0.94, + "learning_rate": 1.2088850918410935e-08, + "loss": 0.0002, + "step": 48439 + }, + { + "epoch": 0.94, + "learning_rate": 1.2084967574074793e-08, + "loss": 0.0004, + "step": 48440 + }, + { + "epoch": 0.94, + "learning_rate": 1.208108422973865e-08, + "loss": 0.0005, + "step": 48441 + }, + { + "epoch": 0.94, + "learning_rate": 1.2077200885402508e-08, + "loss": 0.0004, + "step": 48442 + }, + { + "epoch": 0.94, + "learning_rate": 1.2073317541066366e-08, + "loss": 0.0003, + "step": 48443 + }, + { + "epoch": 0.94, + "learning_rate": 1.2069434196730223e-08, + "loss": 0.0004, + "step": 48444 + }, + { + "epoch": 0.94, + "learning_rate": 1.2065550852394081e-08, + "loss": 0.0003, + "step": 48445 + }, + { + "epoch": 0.94, + "learning_rate": 1.206166750805794e-08, + "loss": 0.0005, + "step": 48446 + }, + { + "epoch": 0.94, + "learning_rate": 1.2057784163721797e-08, + "loss": 0.0003, + "step": 48447 + }, + { + "epoch": 0.94, + "learning_rate": 1.2053900819385654e-08, + "loss": 0.0006, + "step": 48448 + }, + { + "epoch": 0.94, + "learning_rate": 1.2050017475049512e-08, + "loss": 0.0004, + "step": 48449 + }, + { + "epoch": 0.94, + "learning_rate": 1.204613413071337e-08, + "loss": 0.0004, + "step": 48450 + }, + { + "epoch": 0.94, + "learning_rate": 1.2042250786377227e-08, + "loss": 0.0004, + "step": 48451 + }, + { + "epoch": 0.94, + "learning_rate": 1.2038367442041085e-08, + "loss": 0.0003, + "step": 48452 + }, + { + "epoch": 0.94, + "learning_rate": 1.2034484097704944e-08, + "loss": 0.0007, + "step": 48453 + }, + { + "epoch": 0.94, + "learning_rate": 1.2030600753368802e-08, + "loss": 0.0005, + "step": 48454 + }, + { + "epoch": 0.94, + "learning_rate": 1.2026717409032658e-08, + "loss": 0.0005, + "step": 48455 + }, + { + "epoch": 0.94, + "learning_rate": 1.2022834064696517e-08, + "loss": 0.0003, + "step": 48456 + }, + { + "epoch": 0.94, + "learning_rate": 1.2018950720360373e-08, + "loss": 0.5179, + "step": 48457 + }, + { + "epoch": 0.94, + "learning_rate": 1.2015067376024232e-08, + "loss": 0.0003, + "step": 48458 + }, + { + "epoch": 0.94, + "learning_rate": 1.2011184031688088e-08, + "loss": 0.0005, + "step": 48459 + }, + { + "epoch": 0.94, + "learning_rate": 1.2007300687351946e-08, + "loss": 0.001, + "step": 48460 + }, + { + "epoch": 0.94, + "learning_rate": 1.2003417343015805e-08, + "loss": 1.1546, + "step": 48461 + }, + { + "epoch": 0.94, + "learning_rate": 1.1999533998679661e-08, + "loss": 0.0004, + "step": 48462 + }, + { + "epoch": 0.94, + "learning_rate": 1.199565065434352e-08, + "loss": 0.0053, + "step": 48463 + }, + { + "epoch": 0.94, + "learning_rate": 1.1991767310007378e-08, + "loss": 0.0004, + "step": 48464 + }, + { + "epoch": 0.94, + "learning_rate": 1.1987883965671236e-08, + "loss": 0.0023, + "step": 48465 + }, + { + "epoch": 0.94, + "learning_rate": 1.1984000621335093e-08, + "loss": 0.009, + "step": 48466 + }, + { + "epoch": 0.94, + "learning_rate": 1.198011727699895e-08, + "loss": 0.0003, + "step": 48467 + }, + { + "epoch": 0.94, + "learning_rate": 1.1976233932662809e-08, + "loss": 0.0009, + "step": 48468 + }, + { + "epoch": 0.94, + "learning_rate": 1.1972350588326667e-08, + "loss": 0.1967, + "step": 48469 + }, + { + "epoch": 0.94, + "learning_rate": 1.1968467243990524e-08, + "loss": 0.0004, + "step": 48470 + }, + { + "epoch": 0.94, + "learning_rate": 1.1964583899654382e-08, + "loss": 0.0004, + "step": 48471 + }, + { + "epoch": 0.94, + "learning_rate": 1.196070055531824e-08, + "loss": 0.0005, + "step": 48472 + }, + { + "epoch": 0.94, + "learning_rate": 1.1956817210982097e-08, + "loss": 0.0003, + "step": 48473 + }, + { + "epoch": 0.94, + "learning_rate": 1.1952933866645955e-08, + "loss": 0.0006, + "step": 48474 + }, + { + "epoch": 0.94, + "learning_rate": 1.1949050522309813e-08, + "loss": 0.0003, + "step": 48475 + }, + { + "epoch": 0.94, + "learning_rate": 1.1945167177973672e-08, + "loss": 0.0005, + "step": 48476 + }, + { + "epoch": 0.94, + "learning_rate": 1.1941283833637528e-08, + "loss": 0.0008, + "step": 48477 + }, + { + "epoch": 0.94, + "learning_rate": 1.1937400489301386e-08, + "loss": 0.0004, + "step": 48478 + }, + { + "epoch": 0.94, + "learning_rate": 1.1933517144965243e-08, + "loss": 0.0003, + "step": 48479 + }, + { + "epoch": 0.94, + "learning_rate": 1.1929633800629101e-08, + "loss": 0.0003, + "step": 48480 + }, + { + "epoch": 0.94, + "learning_rate": 1.1925750456292958e-08, + "loss": 0.0003, + "step": 48481 + }, + { + "epoch": 0.94, + "learning_rate": 1.1921867111956816e-08, + "loss": 0.0003, + "step": 48482 + }, + { + "epoch": 0.94, + "learning_rate": 1.1917983767620674e-08, + "loss": 0.0002, + "step": 48483 + }, + { + "epoch": 0.94, + "learning_rate": 1.1914100423284531e-08, + "loss": 0.0002, + "step": 48484 + }, + { + "epoch": 0.94, + "learning_rate": 1.191021707894839e-08, + "loss": 0.0004, + "step": 48485 + }, + { + "epoch": 0.94, + "learning_rate": 1.1906333734612247e-08, + "loss": 0.3695, + "step": 48486 + }, + { + "epoch": 0.94, + "learning_rate": 1.1902450390276106e-08, + "loss": 0.0004, + "step": 48487 + }, + { + "epoch": 0.94, + "learning_rate": 1.1898567045939962e-08, + "loss": 0.0004, + "step": 48488 + }, + { + "epoch": 0.94, + "learning_rate": 1.189468370160382e-08, + "loss": 0.0012, + "step": 48489 + }, + { + "epoch": 0.94, + "learning_rate": 1.1890800357267679e-08, + "loss": 0.0007, + "step": 48490 + }, + { + "epoch": 0.94, + "learning_rate": 1.1886917012931535e-08, + "loss": 0.0004, + "step": 48491 + }, + { + "epoch": 0.94, + "learning_rate": 1.1883033668595394e-08, + "loss": 0.0004, + "step": 48492 + }, + { + "epoch": 0.94, + "learning_rate": 1.1879150324259252e-08, + "loss": 0.0037, + "step": 48493 + }, + { + "epoch": 0.94, + "learning_rate": 1.187526697992311e-08, + "loss": 0.0004, + "step": 48494 + }, + { + "epoch": 0.94, + "learning_rate": 1.1871383635586967e-08, + "loss": 0.0006, + "step": 48495 + }, + { + "epoch": 0.94, + "learning_rate": 1.1867500291250825e-08, + "loss": 0.0004, + "step": 48496 + }, + { + "epoch": 0.94, + "learning_rate": 1.1863616946914683e-08, + "loss": 0.0007, + "step": 48497 + }, + { + "epoch": 0.94, + "learning_rate": 1.1859733602578541e-08, + "loss": 0.0004, + "step": 48498 + }, + { + "epoch": 0.94, + "learning_rate": 1.1855850258242398e-08, + "loss": 0.0006, + "step": 48499 + }, + { + "epoch": 0.94, + "learning_rate": 1.1851966913906256e-08, + "loss": 0.0004, + "step": 48500 + }, + { + "epoch": 0.94, + "learning_rate": 1.1848083569570113e-08, + "loss": 0.0002, + "step": 48501 + }, + { + "epoch": 0.94, + "learning_rate": 1.1844200225233971e-08, + "loss": 0.0004, + "step": 48502 + }, + { + "epoch": 0.94, + "learning_rate": 1.1840316880897828e-08, + "loss": 0.0003, + "step": 48503 + }, + { + "epoch": 0.94, + "learning_rate": 1.1836433536561686e-08, + "loss": 0.0004, + "step": 48504 + }, + { + "epoch": 0.94, + "learning_rate": 1.1832550192225544e-08, + "loss": 0.0003, + "step": 48505 + }, + { + "epoch": 0.94, + "learning_rate": 1.18286668478894e-08, + "loss": 0.0003, + "step": 48506 + }, + { + "epoch": 0.94, + "learning_rate": 1.1824783503553259e-08, + "loss": 1.1609, + "step": 48507 + }, + { + "epoch": 0.94, + "learning_rate": 1.1820900159217117e-08, + "loss": 0.1165, + "step": 48508 + }, + { + "epoch": 0.94, + "learning_rate": 1.1817016814880974e-08, + "loss": 0.0003, + "step": 48509 + }, + { + "epoch": 0.94, + "learning_rate": 1.1813133470544832e-08, + "loss": 1.0683, + "step": 48510 + }, + { + "epoch": 0.94, + "learning_rate": 1.180925012620869e-08, + "loss": 1.2423, + "step": 48511 + }, + { + "epoch": 0.94, + "learning_rate": 1.1805366781872549e-08, + "loss": 0.0004, + "step": 48512 + }, + { + "epoch": 0.94, + "learning_rate": 1.1801483437536405e-08, + "loss": 0.0003, + "step": 48513 + }, + { + "epoch": 0.94, + "learning_rate": 1.1797600093200263e-08, + "loss": 0.0003, + "step": 48514 + }, + { + "epoch": 0.94, + "learning_rate": 1.1793716748864122e-08, + "loss": 0.0011, + "step": 48515 + }, + { + "epoch": 0.94, + "learning_rate": 1.178983340452798e-08, + "loss": 0.0004, + "step": 48516 + }, + { + "epoch": 0.94, + "learning_rate": 1.1785950060191837e-08, + "loss": 0.0003, + "step": 48517 + }, + { + "epoch": 0.94, + "learning_rate": 1.1782066715855695e-08, + "loss": 0.0004, + "step": 48518 + }, + { + "epoch": 0.94, + "learning_rate": 1.1778183371519553e-08, + "loss": 0.0009, + "step": 48519 + }, + { + "epoch": 0.94, + "learning_rate": 1.177430002718341e-08, + "loss": 0.0003, + "step": 48520 + }, + { + "epoch": 0.94, + "learning_rate": 1.1770416682847268e-08, + "loss": 0.0005, + "step": 48521 + }, + { + "epoch": 0.94, + "learning_rate": 1.1766533338511126e-08, + "loss": 0.0005, + "step": 48522 + }, + { + "epoch": 0.94, + "learning_rate": 1.1762649994174984e-08, + "loss": 0.0005, + "step": 48523 + }, + { + "epoch": 0.94, + "learning_rate": 1.1758766649838841e-08, + "loss": 0.0003, + "step": 48524 + }, + { + "epoch": 0.94, + "learning_rate": 1.1754883305502697e-08, + "loss": 0.0005, + "step": 48525 + }, + { + "epoch": 0.94, + "learning_rate": 1.1750999961166556e-08, + "loss": 0.0004, + "step": 48526 + }, + { + "epoch": 0.94, + "learning_rate": 1.1747116616830414e-08, + "loss": 0.7355, + "step": 48527 + }, + { + "epoch": 0.94, + "learning_rate": 1.174323327249427e-08, + "loss": 0.0005, + "step": 48528 + }, + { + "epoch": 0.94, + "learning_rate": 1.1739349928158129e-08, + "loss": 0.5975, + "step": 48529 + }, + { + "epoch": 0.94, + "learning_rate": 1.1735466583821987e-08, + "loss": 0.0005, + "step": 48530 + }, + { + "epoch": 0.94, + "learning_rate": 1.1731583239485844e-08, + "loss": 0.0004, + "step": 48531 + }, + { + "epoch": 0.94, + "learning_rate": 1.1727699895149702e-08, + "loss": 0.0004, + "step": 48532 + }, + { + "epoch": 0.94, + "learning_rate": 1.172381655081356e-08, + "loss": 0.0004, + "step": 48533 + }, + { + "epoch": 0.94, + "learning_rate": 1.1719933206477418e-08, + "loss": 0.0071, + "step": 48534 + }, + { + "epoch": 0.94, + "learning_rate": 1.1716049862141275e-08, + "loss": 0.0004, + "step": 48535 + }, + { + "epoch": 0.94, + "learning_rate": 1.1712166517805133e-08, + "loss": 0.5071, + "step": 48536 + }, + { + "epoch": 0.94, + "learning_rate": 1.1708283173468991e-08, + "loss": 0.0045, + "step": 48537 + }, + { + "epoch": 0.94, + "learning_rate": 1.1704399829132848e-08, + "loss": 0.0004, + "step": 48538 + }, + { + "epoch": 0.94, + "learning_rate": 1.1700516484796706e-08, + "loss": 0.0004, + "step": 48539 + }, + { + "epoch": 0.94, + "learning_rate": 1.1696633140460565e-08, + "loss": 0.1172, + "step": 48540 + }, + { + "epoch": 0.94, + "learning_rate": 1.1692749796124423e-08, + "loss": 0.0004, + "step": 48541 + }, + { + "epoch": 0.94, + "learning_rate": 1.168886645178828e-08, + "loss": 0.0006, + "step": 48542 + }, + { + "epoch": 0.94, + "learning_rate": 1.1684983107452138e-08, + "loss": 0.0003, + "step": 48543 + }, + { + "epoch": 0.94, + "learning_rate": 1.1681099763115996e-08, + "loss": 0.0509, + "step": 48544 + }, + { + "epoch": 0.94, + "learning_rate": 1.1677216418779854e-08, + "loss": 0.0005, + "step": 48545 + }, + { + "epoch": 0.94, + "learning_rate": 1.167333307444371e-08, + "loss": 0.0006, + "step": 48546 + }, + { + "epoch": 0.94, + "learning_rate": 1.1669449730107567e-08, + "loss": 0.0006, + "step": 48547 + }, + { + "epoch": 0.94, + "learning_rate": 1.1665566385771426e-08, + "loss": 0.0004, + "step": 48548 + }, + { + "epoch": 0.94, + "learning_rate": 1.1661683041435282e-08, + "loss": 0.0004, + "step": 48549 + }, + { + "epoch": 0.94, + "learning_rate": 1.165779969709914e-08, + "loss": 0.0004, + "step": 48550 + }, + { + "epoch": 0.94, + "learning_rate": 1.1653916352762999e-08, + "loss": 0.0005, + "step": 48551 + }, + { + "epoch": 0.94, + "learning_rate": 1.1650033008426857e-08, + "loss": 0.0003, + "step": 48552 + }, + { + "epoch": 0.94, + "learning_rate": 1.1646149664090713e-08, + "loss": 0.0021, + "step": 48553 + }, + { + "epoch": 0.94, + "learning_rate": 1.1642266319754572e-08, + "loss": 0.2462, + "step": 48554 + }, + { + "epoch": 0.94, + "learning_rate": 1.163838297541843e-08, + "loss": 1.4068, + "step": 48555 + }, + { + "epoch": 0.94, + "learning_rate": 1.1634499631082288e-08, + "loss": 0.0004, + "step": 48556 + }, + { + "epoch": 0.94, + "learning_rate": 1.1630616286746145e-08, + "loss": 0.0005, + "step": 48557 + }, + { + "epoch": 0.94, + "learning_rate": 1.1626732942410003e-08, + "loss": 0.0003, + "step": 48558 + }, + { + "epoch": 0.94, + "learning_rate": 1.1622849598073861e-08, + "loss": 0.9356, + "step": 48559 + }, + { + "epoch": 0.94, + "learning_rate": 1.1618966253737718e-08, + "loss": 0.0003, + "step": 48560 + }, + { + "epoch": 0.94, + "learning_rate": 1.1615082909401576e-08, + "loss": 0.0004, + "step": 48561 + }, + { + "epoch": 0.94, + "learning_rate": 1.1611199565065434e-08, + "loss": 0.0003, + "step": 48562 + }, + { + "epoch": 0.94, + "learning_rate": 1.1607316220729293e-08, + "loss": 0.0003, + "step": 48563 + }, + { + "epoch": 0.94, + "learning_rate": 1.1603432876393149e-08, + "loss": 0.0027, + "step": 48564 + }, + { + "epoch": 0.94, + "learning_rate": 1.1599549532057007e-08, + "loss": 0.0003, + "step": 48565 + }, + { + "epoch": 0.94, + "learning_rate": 1.1595666187720866e-08, + "loss": 0.0006, + "step": 48566 + }, + { + "epoch": 0.94, + "learning_rate": 1.1591782843384722e-08, + "loss": 0.0005, + "step": 48567 + }, + { + "epoch": 0.94, + "learning_rate": 1.158789949904858e-08, + "loss": 0.0004, + "step": 48568 + }, + { + "epoch": 0.94, + "learning_rate": 1.1584016154712439e-08, + "loss": 0.0004, + "step": 48569 + }, + { + "epoch": 0.94, + "learning_rate": 1.1580132810376295e-08, + "loss": 0.0004, + "step": 48570 + }, + { + "epoch": 0.94, + "learning_rate": 1.1576249466040152e-08, + "loss": 0.0005, + "step": 48571 + }, + { + "epoch": 0.94, + "learning_rate": 1.157236612170401e-08, + "loss": 0.0004, + "step": 48572 + }, + { + "epoch": 0.94, + "learning_rate": 1.1568482777367868e-08, + "loss": 0.1338, + "step": 48573 + }, + { + "epoch": 0.94, + "learning_rate": 1.1564599433031727e-08, + "loss": 0.0004, + "step": 48574 + }, + { + "epoch": 0.94, + "learning_rate": 1.1560716088695583e-08, + "loss": 0.0005, + "step": 48575 + }, + { + "epoch": 0.94, + "learning_rate": 1.1556832744359441e-08, + "loss": 0.0005, + "step": 48576 + }, + { + "epoch": 0.94, + "learning_rate": 1.15529494000233e-08, + "loss": 0.0002, + "step": 48577 + }, + { + "epoch": 0.94, + "learning_rate": 1.1549066055687156e-08, + "loss": 0.0003, + "step": 48578 + }, + { + "epoch": 0.94, + "learning_rate": 1.1545182711351015e-08, + "loss": 0.0003, + "step": 48579 + }, + { + "epoch": 0.94, + "learning_rate": 1.1541299367014873e-08, + "loss": 0.0004, + "step": 48580 + }, + { + "epoch": 0.94, + "learning_rate": 1.1537416022678731e-08, + "loss": 0.0004, + "step": 48581 + }, + { + "epoch": 0.94, + "learning_rate": 1.1533532678342588e-08, + "loss": 0.0004, + "step": 48582 + }, + { + "epoch": 0.94, + "learning_rate": 1.1529649334006446e-08, + "loss": 0.0004, + "step": 48583 + }, + { + "epoch": 0.94, + "learning_rate": 1.1525765989670304e-08, + "loss": 0.0004, + "step": 48584 + }, + { + "epoch": 0.94, + "learning_rate": 1.1521882645334162e-08, + "loss": 0.0004, + "step": 48585 + }, + { + "epoch": 0.94, + "learning_rate": 1.1517999300998019e-08, + "loss": 0.6654, + "step": 48586 + }, + { + "epoch": 0.94, + "learning_rate": 1.1514115956661877e-08, + "loss": 0.0013, + "step": 48587 + }, + { + "epoch": 0.94, + "learning_rate": 1.1510232612325735e-08, + "loss": 0.0004, + "step": 48588 + }, + { + "epoch": 0.94, + "learning_rate": 1.1506349267989592e-08, + "loss": 0.0004, + "step": 48589 + }, + { + "epoch": 0.94, + "learning_rate": 1.150246592365345e-08, + "loss": 0.0014, + "step": 48590 + }, + { + "epoch": 0.94, + "learning_rate": 1.1498582579317309e-08, + "loss": 0.0004, + "step": 48591 + }, + { + "epoch": 0.94, + "learning_rate": 1.1494699234981165e-08, + "loss": 0.0009, + "step": 48592 + }, + { + "epoch": 0.94, + "learning_rate": 1.1490815890645023e-08, + "loss": 0.0004, + "step": 48593 + }, + { + "epoch": 0.94, + "learning_rate": 1.148693254630888e-08, + "loss": 0.0006, + "step": 48594 + }, + { + "epoch": 0.94, + "learning_rate": 1.1483049201972738e-08, + "loss": 0.0005, + "step": 48595 + }, + { + "epoch": 0.94, + "learning_rate": 1.1479165857636595e-08, + "loss": 0.0006, + "step": 48596 + }, + { + "epoch": 0.94, + "learning_rate": 1.1475282513300453e-08, + "loss": 0.0004, + "step": 48597 + }, + { + "epoch": 0.94, + "learning_rate": 1.1471399168964311e-08, + "loss": 0.0004, + "step": 48598 + }, + { + "epoch": 0.94, + "learning_rate": 1.146751582462817e-08, + "loss": 0.0004, + "step": 48599 + }, + { + "epoch": 0.94, + "learning_rate": 1.1463632480292026e-08, + "loss": 0.0004, + "step": 48600 + }, + { + "epoch": 0.94, + "learning_rate": 1.1459749135955884e-08, + "loss": 0.0003, + "step": 48601 + }, + { + "epoch": 0.94, + "learning_rate": 1.1455865791619743e-08, + "loss": 0.0003, + "step": 48602 + }, + { + "epoch": 0.94, + "learning_rate": 1.1451982447283601e-08, + "loss": 0.0004, + "step": 48603 + }, + { + "epoch": 0.94, + "learning_rate": 1.1448099102947457e-08, + "loss": 0.0005, + "step": 48604 + }, + { + "epoch": 0.94, + "learning_rate": 1.1444215758611316e-08, + "loss": 0.0003, + "step": 48605 + }, + { + "epoch": 0.94, + "learning_rate": 1.1440332414275174e-08, + "loss": 0.0003, + "step": 48606 + }, + { + "epoch": 0.94, + "learning_rate": 1.143644906993903e-08, + "loss": 0.6574, + "step": 48607 + }, + { + "epoch": 0.94, + "learning_rate": 1.1432565725602889e-08, + "loss": 0.0003, + "step": 48608 + }, + { + "epoch": 0.94, + "learning_rate": 1.1428682381266747e-08, + "loss": 0.0003, + "step": 48609 + }, + { + "epoch": 0.94, + "learning_rate": 1.1424799036930605e-08, + "loss": 0.0003, + "step": 48610 + }, + { + "epoch": 0.94, + "learning_rate": 1.1420915692594462e-08, + "loss": 0.0003, + "step": 48611 + }, + { + "epoch": 0.94, + "learning_rate": 1.141703234825832e-08, + "loss": 0.0004, + "step": 48612 + }, + { + "epoch": 0.94, + "learning_rate": 1.1413149003922178e-08, + "loss": 0.0003, + "step": 48613 + }, + { + "epoch": 0.94, + "learning_rate": 1.1409265659586035e-08, + "loss": 0.0003, + "step": 48614 + }, + { + "epoch": 0.94, + "learning_rate": 1.1405382315249893e-08, + "loss": 0.0003, + "step": 48615 + }, + { + "epoch": 0.94, + "learning_rate": 1.140149897091375e-08, + "loss": 0.0003, + "step": 48616 + }, + { + "epoch": 0.94, + "learning_rate": 1.1397615626577608e-08, + "loss": 0.0003, + "step": 48617 + }, + { + "epoch": 0.94, + "learning_rate": 1.1393732282241465e-08, + "loss": 0.0004, + "step": 48618 + }, + { + "epoch": 0.94, + "learning_rate": 1.1389848937905323e-08, + "loss": 0.0003, + "step": 48619 + }, + { + "epoch": 0.94, + "learning_rate": 1.1385965593569181e-08, + "loss": 0.0009, + "step": 48620 + }, + { + "epoch": 0.94, + "learning_rate": 1.138208224923304e-08, + "loss": 0.0004, + "step": 48621 + }, + { + "epoch": 0.94, + "learning_rate": 1.1378198904896896e-08, + "loss": 0.0003, + "step": 48622 + }, + { + "epoch": 0.94, + "learning_rate": 1.1374315560560754e-08, + "loss": 0.0004, + "step": 48623 + }, + { + "epoch": 0.94, + "learning_rate": 1.1370432216224612e-08, + "loss": 0.0006, + "step": 48624 + }, + { + "epoch": 0.94, + "learning_rate": 1.1366548871888469e-08, + "loss": 0.0005, + "step": 48625 + }, + { + "epoch": 0.94, + "learning_rate": 1.1362665527552327e-08, + "loss": 0.0003, + "step": 48626 + }, + { + "epoch": 0.94, + "learning_rate": 1.1358782183216185e-08, + "loss": 0.0005, + "step": 48627 + }, + { + "epoch": 0.94, + "learning_rate": 1.1354898838880044e-08, + "loss": 0.7581, + "step": 48628 + }, + { + "epoch": 0.94, + "learning_rate": 1.13510154945439e-08, + "loss": 0.0004, + "step": 48629 + }, + { + "epoch": 0.94, + "learning_rate": 1.1347132150207759e-08, + "loss": 0.0005, + "step": 48630 + }, + { + "epoch": 0.94, + "learning_rate": 1.1343248805871617e-08, + "loss": 0.0003, + "step": 48631 + }, + { + "epoch": 0.94, + "learning_rate": 1.1339365461535475e-08, + "loss": 0.0018, + "step": 48632 + }, + { + "epoch": 0.94, + "learning_rate": 1.1335482117199332e-08, + "loss": 0.0005, + "step": 48633 + }, + { + "epoch": 0.94, + "learning_rate": 1.133159877286319e-08, + "loss": 0.0003, + "step": 48634 + }, + { + "epoch": 0.94, + "learning_rate": 1.1327715428527048e-08, + "loss": 0.0004, + "step": 48635 + }, + { + "epoch": 0.94, + "learning_rate": 1.1323832084190905e-08, + "loss": 0.0004, + "step": 48636 + }, + { + "epoch": 0.94, + "learning_rate": 1.1319948739854763e-08, + "loss": 0.0006, + "step": 48637 + }, + { + "epoch": 0.94, + "learning_rate": 1.131606539551862e-08, + "loss": 0.0004, + "step": 48638 + }, + { + "epoch": 0.94, + "learning_rate": 1.1312182051182478e-08, + "loss": 0.0608, + "step": 48639 + }, + { + "epoch": 0.94, + "learning_rate": 1.1308298706846334e-08, + "loss": 0.0004, + "step": 48640 + }, + { + "epoch": 0.94, + "learning_rate": 1.1304415362510193e-08, + "loss": 0.0004, + "step": 48641 + }, + { + "epoch": 0.94, + "learning_rate": 1.1300532018174051e-08, + "loss": 0.0007, + "step": 48642 + }, + { + "epoch": 0.94, + "learning_rate": 1.1296648673837909e-08, + "loss": 0.0004, + "step": 48643 + }, + { + "epoch": 0.94, + "learning_rate": 1.1292765329501766e-08, + "loss": 0.0003, + "step": 48644 + }, + { + "epoch": 0.94, + "learning_rate": 1.1288881985165624e-08, + "loss": 0.0042, + "step": 48645 + }, + { + "epoch": 0.94, + "learning_rate": 1.1284998640829482e-08, + "loss": 0.0003, + "step": 48646 + }, + { + "epoch": 0.94, + "learning_rate": 1.1281115296493339e-08, + "loss": 0.0004, + "step": 48647 + }, + { + "epoch": 0.94, + "learning_rate": 1.1277231952157197e-08, + "loss": 0.0004, + "step": 48648 + }, + { + "epoch": 0.94, + "learning_rate": 1.1273348607821055e-08, + "loss": 0.0003, + "step": 48649 + }, + { + "epoch": 0.94, + "learning_rate": 1.1269465263484914e-08, + "loss": 0.0003, + "step": 48650 + }, + { + "epoch": 0.94, + "learning_rate": 1.126558191914877e-08, + "loss": 0.0004, + "step": 48651 + }, + { + "epoch": 0.94, + "learning_rate": 1.1261698574812628e-08, + "loss": 0.0003, + "step": 48652 + }, + { + "epoch": 0.94, + "learning_rate": 1.1257815230476487e-08, + "loss": 0.0006, + "step": 48653 + }, + { + "epoch": 0.94, + "learning_rate": 1.1253931886140343e-08, + "loss": 0.0003, + "step": 48654 + }, + { + "epoch": 0.94, + "learning_rate": 1.1250048541804201e-08, + "loss": 0.0003, + "step": 48655 + }, + { + "epoch": 0.94, + "learning_rate": 1.124616519746806e-08, + "loss": 0.0003, + "step": 48656 + }, + { + "epoch": 0.94, + "learning_rate": 1.1242281853131918e-08, + "loss": 0.0003, + "step": 48657 + }, + { + "epoch": 0.94, + "learning_rate": 1.1238398508795775e-08, + "loss": 0.3383, + "step": 48658 + }, + { + "epoch": 0.94, + "learning_rate": 1.1234515164459633e-08, + "loss": 0.0003, + "step": 48659 + }, + { + "epoch": 0.94, + "learning_rate": 1.123063182012349e-08, + "loss": 0.0005, + "step": 48660 + }, + { + "epoch": 0.94, + "learning_rate": 1.1226748475787348e-08, + "loss": 0.0004, + "step": 48661 + }, + { + "epoch": 0.94, + "learning_rate": 1.1222865131451204e-08, + "loss": 0.0005, + "step": 48662 + }, + { + "epoch": 0.94, + "learning_rate": 1.1218981787115062e-08, + "loss": 0.0003, + "step": 48663 + }, + { + "epoch": 0.94, + "learning_rate": 1.121509844277892e-08, + "loss": 0.0006, + "step": 48664 + }, + { + "epoch": 0.94, + "learning_rate": 1.1211215098442777e-08, + "loss": 0.0003, + "step": 48665 + }, + { + "epoch": 0.94, + "learning_rate": 1.1207331754106635e-08, + "loss": 0.0004, + "step": 48666 + }, + { + "epoch": 0.94, + "learning_rate": 1.1203448409770494e-08, + "loss": 0.0007, + "step": 48667 + }, + { + "epoch": 0.94, + "learning_rate": 1.1199565065434352e-08, + "loss": 0.0005, + "step": 48668 + }, + { + "epoch": 0.94, + "learning_rate": 1.1195681721098209e-08, + "loss": 0.0003, + "step": 48669 + }, + { + "epoch": 0.94, + "learning_rate": 1.1191798376762067e-08, + "loss": 0.0004, + "step": 48670 + }, + { + "epoch": 0.94, + "learning_rate": 1.1187915032425925e-08, + "loss": 0.0003, + "step": 48671 + }, + { + "epoch": 0.94, + "learning_rate": 1.1184031688089783e-08, + "loss": 0.001, + "step": 48672 + }, + { + "epoch": 0.94, + "learning_rate": 1.118014834375364e-08, + "loss": 0.0004, + "step": 48673 + }, + { + "epoch": 0.94, + "learning_rate": 1.1176264999417498e-08, + "loss": 0.0004, + "step": 48674 + }, + { + "epoch": 0.94, + "learning_rate": 1.1172381655081356e-08, + "loss": 0.0003, + "step": 48675 + }, + { + "epoch": 0.94, + "learning_rate": 1.1168498310745213e-08, + "loss": 0.0007, + "step": 48676 + }, + { + "epoch": 0.94, + "learning_rate": 1.1164614966409071e-08, + "loss": 0.0003, + "step": 48677 + }, + { + "epoch": 0.94, + "learning_rate": 1.116073162207293e-08, + "loss": 0.0004, + "step": 48678 + }, + { + "epoch": 0.94, + "learning_rate": 1.1156848277736788e-08, + "loss": 0.023, + "step": 48679 + }, + { + "epoch": 0.94, + "learning_rate": 1.1152964933400644e-08, + "loss": 0.0004, + "step": 48680 + }, + { + "epoch": 0.94, + "learning_rate": 1.1149081589064503e-08, + "loss": 0.1001, + "step": 48681 + }, + { + "epoch": 0.94, + "learning_rate": 1.1145198244728359e-08, + "loss": 0.0004, + "step": 48682 + }, + { + "epoch": 0.94, + "learning_rate": 1.1141314900392217e-08, + "loss": 0.0005, + "step": 48683 + }, + { + "epoch": 0.94, + "learning_rate": 1.1137431556056074e-08, + "loss": 0.4804, + "step": 48684 + }, + { + "epoch": 0.94, + "learning_rate": 1.1133548211719932e-08, + "loss": 0.0413, + "step": 48685 + }, + { + "epoch": 0.94, + "learning_rate": 1.112966486738379e-08, + "loss": 0.0006, + "step": 48686 + }, + { + "epoch": 0.94, + "learning_rate": 1.1125781523047647e-08, + "loss": 0.0002, + "step": 48687 + }, + { + "epoch": 0.94, + "learning_rate": 1.1121898178711505e-08, + "loss": 0.0004, + "step": 48688 + }, + { + "epoch": 0.94, + "learning_rate": 1.1118014834375364e-08, + "loss": 0.0051, + "step": 48689 + }, + { + "epoch": 0.94, + "learning_rate": 1.1114131490039222e-08, + "loss": 0.6226, + "step": 48690 + }, + { + "epoch": 0.94, + "learning_rate": 1.1110248145703078e-08, + "loss": 0.0004, + "step": 48691 + }, + { + "epoch": 0.94, + "learning_rate": 1.1106364801366937e-08, + "loss": 0.0011, + "step": 48692 + }, + { + "epoch": 0.94, + "learning_rate": 1.1102481457030795e-08, + "loss": 0.0004, + "step": 48693 + }, + { + "epoch": 0.94, + "learning_rate": 1.1098598112694651e-08, + "loss": 0.0005, + "step": 48694 + }, + { + "epoch": 0.94, + "learning_rate": 1.109471476835851e-08, + "loss": 0.0003, + "step": 48695 + }, + { + "epoch": 0.94, + "learning_rate": 1.1090831424022368e-08, + "loss": 0.0075, + "step": 48696 + }, + { + "epoch": 0.94, + "learning_rate": 1.1086948079686226e-08, + "loss": 0.0003, + "step": 48697 + }, + { + "epoch": 0.94, + "learning_rate": 1.1083064735350083e-08, + "loss": 0.0009, + "step": 48698 + }, + { + "epoch": 0.94, + "learning_rate": 1.1079181391013941e-08, + "loss": 0.0004, + "step": 48699 + }, + { + "epoch": 0.94, + "learning_rate": 1.10752980466778e-08, + "loss": 0.0003, + "step": 48700 + }, + { + "epoch": 0.94, + "learning_rate": 1.1071414702341658e-08, + "loss": 0.0044, + "step": 48701 + }, + { + "epoch": 0.94, + "learning_rate": 1.1067531358005514e-08, + "loss": 0.0003, + "step": 48702 + }, + { + "epoch": 0.94, + "learning_rate": 1.1063648013669372e-08, + "loss": 0.0003, + "step": 48703 + }, + { + "epoch": 0.94, + "learning_rate": 1.1059764669333229e-08, + "loss": 0.0004, + "step": 48704 + }, + { + "epoch": 0.94, + "learning_rate": 1.1055881324997087e-08, + "loss": 0.0029, + "step": 48705 + }, + { + "epoch": 0.94, + "learning_rate": 1.1051997980660944e-08, + "loss": 0.0004, + "step": 48706 + }, + { + "epoch": 0.94, + "learning_rate": 1.1048114636324802e-08, + "loss": 0.0006, + "step": 48707 + }, + { + "epoch": 0.94, + "learning_rate": 1.104423129198866e-08, + "loss": 0.0008, + "step": 48708 + }, + { + "epoch": 0.94, + "learning_rate": 1.1040347947652517e-08, + "loss": 0.0003, + "step": 48709 + }, + { + "epoch": 0.94, + "learning_rate": 1.1036464603316375e-08, + "loss": 0.2866, + "step": 48710 + }, + { + "epoch": 0.94, + "learning_rate": 1.1032581258980233e-08, + "loss": 0.0004, + "step": 48711 + }, + { + "epoch": 0.94, + "learning_rate": 1.102869791464409e-08, + "loss": 0.0003, + "step": 48712 + }, + { + "epoch": 0.94, + "learning_rate": 1.1024814570307948e-08, + "loss": 0.0004, + "step": 48713 + }, + { + "epoch": 0.94, + "learning_rate": 1.1020931225971806e-08, + "loss": 0.0003, + "step": 48714 + }, + { + "epoch": 0.94, + "learning_rate": 1.1017047881635665e-08, + "loss": 0.0008, + "step": 48715 + }, + { + "epoch": 0.94, + "learning_rate": 1.1013164537299521e-08, + "loss": 0.0009, + "step": 48716 + }, + { + "epoch": 0.95, + "learning_rate": 1.100928119296338e-08, + "loss": 0.0002, + "step": 48717 + }, + { + "epoch": 0.95, + "learning_rate": 1.1005397848627238e-08, + "loss": 0.0004, + "step": 48718 + }, + { + "epoch": 0.95, + "learning_rate": 1.1001514504291096e-08, + "loss": 0.0006, + "step": 48719 + }, + { + "epoch": 0.95, + "learning_rate": 1.0997631159954953e-08, + "loss": 0.0009, + "step": 48720 + }, + { + "epoch": 0.95, + "learning_rate": 1.099374781561881e-08, + "loss": 0.0003, + "step": 48721 + }, + { + "epoch": 0.95, + "learning_rate": 1.0989864471282669e-08, + "loss": 0.0005, + "step": 48722 + }, + { + "epoch": 0.95, + "learning_rate": 1.0985981126946526e-08, + "loss": 0.0076, + "step": 48723 + }, + { + "epoch": 0.95, + "learning_rate": 1.0982097782610384e-08, + "loss": 0.4093, + "step": 48724 + }, + { + "epoch": 0.95, + "learning_rate": 1.0978214438274242e-08, + "loss": 0.0012, + "step": 48725 + }, + { + "epoch": 0.95, + "learning_rate": 1.0974331093938099e-08, + "loss": 0.0004, + "step": 48726 + }, + { + "epoch": 0.95, + "learning_rate": 1.0970447749601957e-08, + "loss": 0.0004, + "step": 48727 + }, + { + "epoch": 0.95, + "learning_rate": 1.0966564405265814e-08, + "loss": 0.0003, + "step": 48728 + }, + { + "epoch": 0.95, + "learning_rate": 1.0962681060929672e-08, + "loss": 0.0004, + "step": 48729 + }, + { + "epoch": 0.95, + "learning_rate": 1.095879771659353e-08, + "loss": 0.0003, + "step": 48730 + }, + { + "epoch": 0.95, + "learning_rate": 1.0954914372257387e-08, + "loss": 0.0002, + "step": 48731 + }, + { + "epoch": 0.95, + "learning_rate": 1.0951031027921245e-08, + "loss": 0.0006, + "step": 48732 + }, + { + "epoch": 0.95, + "learning_rate": 1.0947147683585103e-08, + "loss": 0.0008, + "step": 48733 + }, + { + "epoch": 0.95, + "learning_rate": 1.094326433924896e-08, + "loss": 0.0005, + "step": 48734 + }, + { + "epoch": 0.95, + "learning_rate": 1.0939380994912818e-08, + "loss": 0.0004, + "step": 48735 + }, + { + "epoch": 0.95, + "learning_rate": 1.0935497650576676e-08, + "loss": 0.0045, + "step": 48736 + }, + { + "epoch": 0.95, + "learning_rate": 1.0931614306240534e-08, + "loss": 0.0372, + "step": 48737 + }, + { + "epoch": 0.95, + "learning_rate": 1.0927730961904391e-08, + "loss": 0.0004, + "step": 48738 + }, + { + "epoch": 0.95, + "learning_rate": 1.092384761756825e-08, + "loss": 0.0006, + "step": 48739 + }, + { + "epoch": 0.95, + "learning_rate": 1.0919964273232108e-08, + "loss": 0.0003, + "step": 48740 + }, + { + "epoch": 0.95, + "learning_rate": 1.0916080928895964e-08, + "loss": 0.0004, + "step": 48741 + }, + { + "epoch": 0.95, + "learning_rate": 1.0912197584559822e-08, + "loss": 1.1418, + "step": 48742 + }, + { + "epoch": 0.95, + "learning_rate": 1.090831424022368e-08, + "loss": 0.0004, + "step": 48743 + }, + { + "epoch": 0.95, + "learning_rate": 1.0904430895887539e-08, + "loss": 0.0004, + "step": 48744 + }, + { + "epoch": 0.95, + "learning_rate": 1.0900547551551395e-08, + "loss": 1.1059, + "step": 48745 + }, + { + "epoch": 0.95, + "learning_rate": 1.0896664207215254e-08, + "loss": 0.0005, + "step": 48746 + }, + { + "epoch": 0.95, + "learning_rate": 1.0892780862879112e-08, + "loss": 0.0005, + "step": 48747 + }, + { + "epoch": 0.95, + "learning_rate": 1.0888897518542969e-08, + "loss": 0.0004, + "step": 48748 + }, + { + "epoch": 0.95, + "learning_rate": 1.0885014174206827e-08, + "loss": 0.0024, + "step": 48749 + }, + { + "epoch": 0.95, + "learning_rate": 1.0881130829870683e-08, + "loss": 0.0004, + "step": 48750 + }, + { + "epoch": 0.95, + "learning_rate": 1.0877247485534542e-08, + "loss": 0.0005, + "step": 48751 + }, + { + "epoch": 0.95, + "learning_rate": 1.0873364141198398e-08, + "loss": 0.0002, + "step": 48752 + }, + { + "epoch": 0.95, + "learning_rate": 1.0869480796862256e-08, + "loss": 0.0003, + "step": 48753 + }, + { + "epoch": 0.95, + "learning_rate": 1.0865597452526115e-08, + "loss": 0.0004, + "step": 48754 + }, + { + "epoch": 0.95, + "learning_rate": 1.0861714108189973e-08, + "loss": 0.0004, + "step": 48755 + }, + { + "epoch": 0.95, + "learning_rate": 1.085783076385383e-08, + "loss": 0.0005, + "step": 48756 + }, + { + "epoch": 0.95, + "learning_rate": 1.0853947419517688e-08, + "loss": 0.0002, + "step": 48757 + }, + { + "epoch": 0.95, + "learning_rate": 1.0850064075181546e-08, + "loss": 0.0003, + "step": 48758 + }, + { + "epoch": 0.95, + "learning_rate": 1.0846180730845404e-08, + "loss": 0.7421, + "step": 48759 + }, + { + "epoch": 0.95, + "learning_rate": 1.0842297386509261e-08, + "loss": 0.6437, + "step": 48760 + }, + { + "epoch": 0.95, + "learning_rate": 1.0838414042173119e-08, + "loss": 0.0021, + "step": 48761 + }, + { + "epoch": 0.95, + "learning_rate": 1.0834530697836977e-08, + "loss": 0.0004, + "step": 48762 + }, + { + "epoch": 0.95, + "learning_rate": 1.0830647353500834e-08, + "loss": 0.0006, + "step": 48763 + }, + { + "epoch": 0.95, + "learning_rate": 1.0826764009164692e-08, + "loss": 0.0002, + "step": 48764 + }, + { + "epoch": 0.95, + "learning_rate": 1.082288066482855e-08, + "loss": 0.0004, + "step": 48765 + }, + { + "epoch": 0.95, + "learning_rate": 1.0818997320492409e-08, + "loss": 0.0017, + "step": 48766 + }, + { + "epoch": 0.95, + "learning_rate": 1.0815113976156265e-08, + "loss": 0.6742, + "step": 48767 + }, + { + "epoch": 0.95, + "learning_rate": 1.0811230631820123e-08, + "loss": 0.002, + "step": 48768 + }, + { + "epoch": 0.95, + "learning_rate": 1.0807347287483982e-08, + "loss": 0.1203, + "step": 48769 + }, + { + "epoch": 0.95, + "learning_rate": 1.0803463943147838e-08, + "loss": 0.0003, + "step": 48770 + }, + { + "epoch": 0.95, + "learning_rate": 1.0799580598811697e-08, + "loss": 0.5947, + "step": 48771 + }, + { + "epoch": 0.95, + "learning_rate": 1.0795697254475553e-08, + "loss": 0.0005, + "step": 48772 + }, + { + "epoch": 0.95, + "learning_rate": 1.0791813910139411e-08, + "loss": 0.0004, + "step": 48773 + }, + { + "epoch": 0.95, + "learning_rate": 1.0787930565803268e-08, + "loss": 0.0003, + "step": 48774 + }, + { + "epoch": 0.95, + "learning_rate": 1.0784047221467126e-08, + "loss": 0.0003, + "step": 48775 + }, + { + "epoch": 0.95, + "learning_rate": 1.0780163877130984e-08, + "loss": 1.1029, + "step": 48776 + }, + { + "epoch": 0.95, + "learning_rate": 1.0776280532794843e-08, + "loss": 0.0004, + "step": 48777 + }, + { + "epoch": 0.95, + "learning_rate": 1.07723971884587e-08, + "loss": 0.0012, + "step": 48778 + }, + { + "epoch": 0.95, + "learning_rate": 1.0768513844122558e-08, + "loss": 0.0003, + "step": 48779 + }, + { + "epoch": 0.95, + "learning_rate": 1.0764630499786416e-08, + "loss": 0.0003, + "step": 48780 + }, + { + "epoch": 0.95, + "learning_rate": 1.0760747155450272e-08, + "loss": 0.0003, + "step": 48781 + }, + { + "epoch": 0.95, + "learning_rate": 1.075686381111413e-08, + "loss": 0.0003, + "step": 48782 + }, + { + "epoch": 0.95, + "learning_rate": 1.0752980466777989e-08, + "loss": 0.0004, + "step": 48783 + }, + { + "epoch": 0.95, + "learning_rate": 1.0749097122441847e-08, + "loss": 0.0004, + "step": 48784 + }, + { + "epoch": 0.95, + "learning_rate": 1.0745213778105704e-08, + "loss": 0.0004, + "step": 48785 + }, + { + "epoch": 0.95, + "learning_rate": 1.0741330433769562e-08, + "loss": 0.0014, + "step": 48786 + }, + { + "epoch": 0.95, + "learning_rate": 1.073744708943342e-08, + "loss": 0.0002, + "step": 48787 + }, + { + "epoch": 0.95, + "learning_rate": 1.0733563745097278e-08, + "loss": 0.0005, + "step": 48788 + }, + { + "epoch": 0.95, + "learning_rate": 1.0729680400761135e-08, + "loss": 0.0003, + "step": 48789 + }, + { + "epoch": 0.95, + "learning_rate": 1.0725797056424993e-08, + "loss": 0.0003, + "step": 48790 + }, + { + "epoch": 0.95, + "learning_rate": 1.0721913712088852e-08, + "loss": 0.0031, + "step": 48791 + }, + { + "epoch": 0.95, + "learning_rate": 1.0718030367752708e-08, + "loss": 0.0004, + "step": 48792 + }, + { + "epoch": 0.95, + "learning_rate": 1.0714147023416566e-08, + "loss": 0.0003, + "step": 48793 + }, + { + "epoch": 0.95, + "learning_rate": 1.0710263679080425e-08, + "loss": 0.0004, + "step": 48794 + }, + { + "epoch": 0.95, + "learning_rate": 1.0706380334744281e-08, + "loss": 0.0003, + "step": 48795 + }, + { + "epoch": 0.95, + "learning_rate": 1.0702496990408138e-08, + "loss": 0.0004, + "step": 48796 + }, + { + "epoch": 0.95, + "learning_rate": 1.0698613646071996e-08, + "loss": 0.0003, + "step": 48797 + }, + { + "epoch": 0.95, + "learning_rate": 1.0694730301735854e-08, + "loss": 0.0004, + "step": 48798 + }, + { + "epoch": 0.95, + "learning_rate": 1.0690846957399711e-08, + "loss": 0.0004, + "step": 48799 + }, + { + "epoch": 0.95, + "learning_rate": 1.0686963613063569e-08, + "loss": 0.0004, + "step": 48800 + }, + { + "epoch": 0.95, + "learning_rate": 1.0683080268727427e-08, + "loss": 0.0003, + "step": 48801 + }, + { + "epoch": 0.95, + "learning_rate": 1.0679196924391286e-08, + "loss": 0.0032, + "step": 48802 + }, + { + "epoch": 0.95, + "learning_rate": 1.0675313580055142e-08, + "loss": 0.0004, + "step": 48803 + }, + { + "epoch": 0.95, + "learning_rate": 1.0671430235719e-08, + "loss": 0.0003, + "step": 48804 + }, + { + "epoch": 0.95, + "learning_rate": 1.0667546891382859e-08, + "loss": 0.6698, + "step": 48805 + }, + { + "epoch": 0.95, + "learning_rate": 1.0663663547046717e-08, + "loss": 0.0005, + "step": 48806 + }, + { + "epoch": 0.95, + "learning_rate": 1.0659780202710574e-08, + "loss": 0.0004, + "step": 48807 + }, + { + "epoch": 0.95, + "learning_rate": 1.0655896858374432e-08, + "loss": 0.0007, + "step": 48808 + }, + { + "epoch": 0.95, + "learning_rate": 1.065201351403829e-08, + "loss": 0.0003, + "step": 48809 + }, + { + "epoch": 0.95, + "learning_rate": 1.0648130169702147e-08, + "loss": 0.0002, + "step": 48810 + }, + { + "epoch": 0.95, + "learning_rate": 1.0644246825366005e-08, + "loss": 0.0003, + "step": 48811 + }, + { + "epoch": 0.95, + "learning_rate": 1.0640363481029863e-08, + "loss": 0.0003, + "step": 48812 + }, + { + "epoch": 0.95, + "learning_rate": 1.0636480136693721e-08, + "loss": 0.0003, + "step": 48813 + }, + { + "epoch": 0.95, + "learning_rate": 1.0632596792357578e-08, + "loss": 0.0004, + "step": 48814 + }, + { + "epoch": 0.95, + "learning_rate": 1.0628713448021436e-08, + "loss": 0.0004, + "step": 48815 + }, + { + "epoch": 0.95, + "learning_rate": 1.0624830103685294e-08, + "loss": 0.0012, + "step": 48816 + }, + { + "epoch": 0.95, + "learning_rate": 1.0620946759349151e-08, + "loss": 0.0057, + "step": 48817 + }, + { + "epoch": 0.95, + "learning_rate": 1.0617063415013008e-08, + "loss": 0.0022, + "step": 48818 + }, + { + "epoch": 0.95, + "learning_rate": 1.0613180070676866e-08, + "loss": 0.0004, + "step": 48819 + }, + { + "epoch": 0.95, + "learning_rate": 1.0609296726340724e-08, + "loss": 0.0011, + "step": 48820 + }, + { + "epoch": 0.95, + "learning_rate": 1.060541338200458e-08, + "loss": 0.001, + "step": 48821 + }, + { + "epoch": 0.95, + "learning_rate": 1.0601530037668439e-08, + "loss": 0.0012, + "step": 48822 + }, + { + "epoch": 0.95, + "learning_rate": 1.0597646693332297e-08, + "loss": 0.7202, + "step": 48823 + }, + { + "epoch": 0.95, + "learning_rate": 1.0593763348996155e-08, + "loss": 0.0005, + "step": 48824 + }, + { + "epoch": 0.95, + "learning_rate": 1.0589880004660012e-08, + "loss": 0.0003, + "step": 48825 + }, + { + "epoch": 0.95, + "learning_rate": 1.058599666032387e-08, + "loss": 0.0004, + "step": 48826 + }, + { + "epoch": 0.95, + "learning_rate": 1.0582113315987728e-08, + "loss": 0.0004, + "step": 48827 + }, + { + "epoch": 0.95, + "learning_rate": 1.0578229971651585e-08, + "loss": 0.0007, + "step": 48828 + }, + { + "epoch": 0.95, + "learning_rate": 1.0574346627315443e-08, + "loss": 0.0003, + "step": 48829 + }, + { + "epoch": 0.95, + "learning_rate": 1.0570463282979302e-08, + "loss": 0.0003, + "step": 48830 + }, + { + "epoch": 0.95, + "learning_rate": 1.056657993864316e-08, + "loss": 0.0003, + "step": 48831 + }, + { + "epoch": 0.95, + "learning_rate": 1.0562696594307016e-08, + "loss": 0.0004, + "step": 48832 + }, + { + "epoch": 0.95, + "learning_rate": 1.0558813249970875e-08, + "loss": 0.0027, + "step": 48833 + }, + { + "epoch": 0.95, + "learning_rate": 1.0554929905634733e-08, + "loss": 0.0004, + "step": 48834 + }, + { + "epoch": 0.95, + "learning_rate": 1.0551046561298591e-08, + "loss": 0.0003, + "step": 48835 + }, + { + "epoch": 0.95, + "learning_rate": 1.0547163216962448e-08, + "loss": 0.0004, + "step": 48836 + }, + { + "epoch": 0.95, + "learning_rate": 1.0543279872626306e-08, + "loss": 0.0004, + "step": 48837 + }, + { + "epoch": 0.95, + "learning_rate": 1.0539396528290164e-08, + "loss": 0.0003, + "step": 48838 + }, + { + "epoch": 0.95, + "learning_rate": 1.053551318395402e-08, + "loss": 0.0004, + "step": 48839 + }, + { + "epoch": 0.95, + "learning_rate": 1.0531629839617879e-08, + "loss": 0.4699, + "step": 48840 + }, + { + "epoch": 0.95, + "learning_rate": 1.0527746495281736e-08, + "loss": 0.0004, + "step": 48841 + }, + { + "epoch": 0.95, + "learning_rate": 1.0523863150945594e-08, + "loss": 0.0003, + "step": 48842 + }, + { + "epoch": 0.95, + "learning_rate": 1.051997980660945e-08, + "loss": 0.0007, + "step": 48843 + }, + { + "epoch": 0.95, + "learning_rate": 1.0516096462273309e-08, + "loss": 0.0002, + "step": 48844 + }, + { + "epoch": 0.95, + "learning_rate": 1.0512213117937167e-08, + "loss": 0.0003, + "step": 48845 + }, + { + "epoch": 0.95, + "learning_rate": 1.0508329773601025e-08, + "loss": 0.0003, + "step": 48846 + }, + { + "epoch": 0.95, + "learning_rate": 1.0504446429264882e-08, + "loss": 0.0006, + "step": 48847 + }, + { + "epoch": 0.95, + "learning_rate": 1.050056308492874e-08, + "loss": 0.0003, + "step": 48848 + }, + { + "epoch": 0.95, + "learning_rate": 1.0496679740592598e-08, + "loss": 0.0013, + "step": 48849 + }, + { + "epoch": 0.95, + "learning_rate": 1.0492796396256455e-08, + "loss": 0.0007, + "step": 48850 + }, + { + "epoch": 0.95, + "learning_rate": 1.0488913051920313e-08, + "loss": 1.1719, + "step": 48851 + }, + { + "epoch": 0.95, + "learning_rate": 1.0485029707584171e-08, + "loss": 0.0003, + "step": 48852 + }, + { + "epoch": 0.95, + "learning_rate": 1.048114636324803e-08, + "loss": 0.0003, + "step": 48853 + }, + { + "epoch": 0.95, + "learning_rate": 1.0477263018911886e-08, + "loss": 0.0004, + "step": 48854 + }, + { + "epoch": 0.95, + "learning_rate": 1.0473379674575744e-08, + "loss": 0.0003, + "step": 48855 + }, + { + "epoch": 0.95, + "learning_rate": 1.0469496330239603e-08, + "loss": 0.0004, + "step": 48856 + }, + { + "epoch": 0.95, + "learning_rate": 1.046561298590346e-08, + "loss": 0.0004, + "step": 48857 + }, + { + "epoch": 0.95, + "learning_rate": 1.0461729641567317e-08, + "loss": 0.0003, + "step": 48858 + }, + { + "epoch": 0.95, + "learning_rate": 1.0457846297231176e-08, + "loss": 0.0003, + "step": 48859 + }, + { + "epoch": 0.95, + "learning_rate": 1.0453962952895034e-08, + "loss": 0.0006, + "step": 48860 + }, + { + "epoch": 0.95, + "learning_rate": 1.045007960855889e-08, + "loss": 0.0003, + "step": 48861 + }, + { + "epoch": 0.95, + "learning_rate": 1.0446196264222749e-08, + "loss": 0.0004, + "step": 48862 + }, + { + "epoch": 0.95, + "learning_rate": 1.0442312919886605e-08, + "loss": 0.0106, + "step": 48863 + }, + { + "epoch": 0.95, + "learning_rate": 1.0438429575550464e-08, + "loss": 0.0008, + "step": 48864 + }, + { + "epoch": 0.95, + "learning_rate": 1.043454623121432e-08, + "loss": 1.0296, + "step": 48865 + }, + { + "epoch": 0.95, + "learning_rate": 1.0430662886878178e-08, + "loss": 0.0004, + "step": 48866 + }, + { + "epoch": 0.95, + "learning_rate": 1.0426779542542037e-08, + "loss": 0.0004, + "step": 48867 + }, + { + "epoch": 0.95, + "learning_rate": 1.0422896198205893e-08, + "loss": 0.0007, + "step": 48868 + }, + { + "epoch": 0.95, + "learning_rate": 1.0419012853869752e-08, + "loss": 0.0005, + "step": 48869 + }, + { + "epoch": 0.95, + "learning_rate": 1.041512950953361e-08, + "loss": 0.6961, + "step": 48870 + }, + { + "epoch": 0.95, + "learning_rate": 1.0411246165197468e-08, + "loss": 0.0004, + "step": 48871 + }, + { + "epoch": 0.95, + "learning_rate": 1.0407362820861325e-08, + "loss": 0.0004, + "step": 48872 + }, + { + "epoch": 0.95, + "learning_rate": 1.0403479476525183e-08, + "loss": 1.1124, + "step": 48873 + }, + { + "epoch": 0.95, + "learning_rate": 1.0399596132189041e-08, + "loss": 0.0004, + "step": 48874 + }, + { + "epoch": 0.95, + "learning_rate": 1.03957127878529e-08, + "loss": 0.0004, + "step": 48875 + }, + { + "epoch": 0.95, + "learning_rate": 1.0391829443516756e-08, + "loss": 0.0004, + "step": 48876 + }, + { + "epoch": 0.95, + "learning_rate": 1.0387946099180614e-08, + "loss": 0.0032, + "step": 48877 + }, + { + "epoch": 0.95, + "learning_rate": 1.0384062754844472e-08, + "loss": 0.0003, + "step": 48878 + }, + { + "epoch": 0.95, + "learning_rate": 1.0380179410508329e-08, + "loss": 0.0004, + "step": 48879 + }, + { + "epoch": 0.95, + "learning_rate": 1.0376296066172187e-08, + "loss": 0.0002, + "step": 48880 + }, + { + "epoch": 0.95, + "learning_rate": 1.0372412721836046e-08, + "loss": 0.0007, + "step": 48881 + }, + { + "epoch": 0.95, + "learning_rate": 1.0368529377499904e-08, + "loss": 0.0004, + "step": 48882 + }, + { + "epoch": 0.95, + "learning_rate": 1.036464603316376e-08, + "loss": 0.0004, + "step": 48883 + }, + { + "epoch": 0.95, + "learning_rate": 1.0360762688827619e-08, + "loss": 0.0004, + "step": 48884 + }, + { + "epoch": 0.95, + "learning_rate": 1.0356879344491475e-08, + "loss": 0.0008, + "step": 48885 + }, + { + "epoch": 0.95, + "learning_rate": 1.0352996000155333e-08, + "loss": 0.0005, + "step": 48886 + }, + { + "epoch": 0.95, + "learning_rate": 1.034911265581919e-08, + "loss": 0.785, + "step": 48887 + }, + { + "epoch": 0.95, + "learning_rate": 1.0345229311483048e-08, + "loss": 0.0003, + "step": 48888 + }, + { + "epoch": 0.95, + "learning_rate": 1.0341345967146907e-08, + "loss": 0.0002, + "step": 48889 + }, + { + "epoch": 0.95, + "learning_rate": 1.0337462622810763e-08, + "loss": 0.0054, + "step": 48890 + }, + { + "epoch": 0.95, + "learning_rate": 1.0333579278474621e-08, + "loss": 0.0004, + "step": 48891 + }, + { + "epoch": 0.95, + "learning_rate": 1.032969593413848e-08, + "loss": 0.0003, + "step": 48892 + }, + { + "epoch": 0.95, + "learning_rate": 1.0325812589802338e-08, + "loss": 0.0005, + "step": 48893 + }, + { + "epoch": 0.95, + "learning_rate": 1.0321929245466194e-08, + "loss": 0.0004, + "step": 48894 + }, + { + "epoch": 0.95, + "learning_rate": 1.0318045901130053e-08, + "loss": 0.0004, + "step": 48895 + }, + { + "epoch": 0.95, + "learning_rate": 1.0314162556793911e-08, + "loss": 0.0005, + "step": 48896 + }, + { + "epoch": 0.95, + "learning_rate": 1.0310279212457768e-08, + "loss": 0.0004, + "step": 48897 + }, + { + "epoch": 0.95, + "learning_rate": 1.0306395868121626e-08, + "loss": 0.0003, + "step": 48898 + }, + { + "epoch": 0.95, + "learning_rate": 1.0302512523785484e-08, + "loss": 0.0003, + "step": 48899 + }, + { + "epoch": 0.95, + "learning_rate": 1.0298629179449342e-08, + "loss": 0.0003, + "step": 48900 + }, + { + "epoch": 0.95, + "learning_rate": 1.0294745835113199e-08, + "loss": 0.3008, + "step": 48901 + }, + { + "epoch": 0.95, + "learning_rate": 1.0290862490777057e-08, + "loss": 0.0003, + "step": 48902 + }, + { + "epoch": 0.95, + "learning_rate": 1.0286979146440915e-08, + "loss": 0.0003, + "step": 48903 + }, + { + "epoch": 0.95, + "learning_rate": 1.0283095802104774e-08, + "loss": 0.0004, + "step": 48904 + }, + { + "epoch": 0.95, + "learning_rate": 1.027921245776863e-08, + "loss": 0.0005, + "step": 48905 + }, + { + "epoch": 0.95, + "learning_rate": 1.0275329113432488e-08, + "loss": 0.8283, + "step": 48906 + }, + { + "epoch": 0.95, + "learning_rate": 1.0271445769096345e-08, + "loss": 0.0003, + "step": 48907 + }, + { + "epoch": 0.95, + "learning_rate": 1.0267562424760203e-08, + "loss": 0.0004, + "step": 48908 + }, + { + "epoch": 0.95, + "learning_rate": 1.026367908042406e-08, + "loss": 0.1458, + "step": 48909 + }, + { + "epoch": 0.95, + "learning_rate": 1.0259795736087918e-08, + "loss": 0.0003, + "step": 48910 + }, + { + "epoch": 0.95, + "learning_rate": 1.0255912391751776e-08, + "loss": 0.0004, + "step": 48911 + }, + { + "epoch": 0.95, + "learning_rate": 1.0252029047415633e-08, + "loss": 0.0011, + "step": 48912 + }, + { + "epoch": 0.95, + "learning_rate": 1.0248145703079491e-08, + "loss": 0.0003, + "step": 48913 + }, + { + "epoch": 0.95, + "learning_rate": 1.024426235874335e-08, + "loss": 0.0004, + "step": 48914 + }, + { + "epoch": 0.95, + "learning_rate": 1.0240379014407206e-08, + "loss": 0.0013, + "step": 48915 + }, + { + "epoch": 0.95, + "learning_rate": 1.0236495670071064e-08, + "loss": 0.0003, + "step": 48916 + }, + { + "epoch": 0.95, + "learning_rate": 1.0232612325734922e-08, + "loss": 0.0004, + "step": 48917 + }, + { + "epoch": 0.95, + "learning_rate": 1.022872898139878e-08, + "loss": 0.0008, + "step": 48918 + }, + { + "epoch": 0.95, + "learning_rate": 1.0224845637062637e-08, + "loss": 0.0005, + "step": 48919 + }, + { + "epoch": 0.95, + "learning_rate": 1.0220962292726496e-08, + "loss": 0.0005, + "step": 48920 + }, + { + "epoch": 0.95, + "learning_rate": 1.0217078948390354e-08, + "loss": 0.0005, + "step": 48921 + }, + { + "epoch": 0.95, + "learning_rate": 1.0213195604054212e-08, + "loss": 0.0004, + "step": 48922 + }, + { + "epoch": 0.95, + "learning_rate": 1.0209312259718069e-08, + "loss": 0.0004, + "step": 48923 + }, + { + "epoch": 0.95, + "learning_rate": 1.0205428915381927e-08, + "loss": 0.0004, + "step": 48924 + }, + { + "epoch": 0.95, + "learning_rate": 1.0201545571045785e-08, + "loss": 0.0003, + "step": 48925 + }, + { + "epoch": 0.95, + "learning_rate": 1.0197662226709642e-08, + "loss": 0.0003, + "step": 48926 + }, + { + "epoch": 0.95, + "learning_rate": 1.01937788823735e-08, + "loss": 0.0003, + "step": 48927 + }, + { + "epoch": 0.95, + "learning_rate": 1.0189895538037358e-08, + "loss": 0.6658, + "step": 48928 + }, + { + "epoch": 0.95, + "learning_rate": 1.0186012193701215e-08, + "loss": 0.0007, + "step": 48929 + }, + { + "epoch": 0.95, + "learning_rate": 1.0182128849365073e-08, + "loss": 0.0003, + "step": 48930 + }, + { + "epoch": 0.95, + "learning_rate": 1.017824550502893e-08, + "loss": 0.0004, + "step": 48931 + }, + { + "epoch": 0.95, + "learning_rate": 1.0174362160692788e-08, + "loss": 0.0005, + "step": 48932 + }, + { + "epoch": 0.95, + "learning_rate": 1.0170478816356646e-08, + "loss": 0.0005, + "step": 48933 + }, + { + "epoch": 0.95, + "learning_rate": 1.0166595472020503e-08, + "loss": 0.0003, + "step": 48934 + }, + { + "epoch": 0.95, + "learning_rate": 1.0162712127684361e-08, + "loss": 0.0004, + "step": 48935 + }, + { + "epoch": 0.95, + "learning_rate": 1.015882878334822e-08, + "loss": 0.0023, + "step": 48936 + }, + { + "epoch": 0.95, + "learning_rate": 1.0154945439012076e-08, + "loss": 0.8858, + "step": 48937 + }, + { + "epoch": 0.95, + "learning_rate": 1.0151062094675934e-08, + "loss": 0.0041, + "step": 48938 + }, + { + "epoch": 0.95, + "learning_rate": 1.0147178750339792e-08, + "loss": 0.001, + "step": 48939 + }, + { + "epoch": 0.95, + "learning_rate": 1.014329540600365e-08, + "loss": 0.5225, + "step": 48940 + }, + { + "epoch": 0.95, + "learning_rate": 1.0139412061667507e-08, + "loss": 0.0016, + "step": 48941 + }, + { + "epoch": 0.95, + "learning_rate": 1.0135528717331365e-08, + "loss": 0.2875, + "step": 48942 + }, + { + "epoch": 0.95, + "learning_rate": 1.0131645372995224e-08, + "loss": 0.7029, + "step": 48943 + }, + { + "epoch": 0.95, + "learning_rate": 1.012776202865908e-08, + "loss": 0.0003, + "step": 48944 + }, + { + "epoch": 0.95, + "learning_rate": 1.0123878684322938e-08, + "loss": 0.0018, + "step": 48945 + }, + { + "epoch": 0.95, + "learning_rate": 1.0119995339986797e-08, + "loss": 0.0005, + "step": 48946 + }, + { + "epoch": 0.95, + "learning_rate": 1.0116111995650655e-08, + "loss": 0.0003, + "step": 48947 + }, + { + "epoch": 0.95, + "learning_rate": 1.0112228651314512e-08, + "loss": 0.0033, + "step": 48948 + }, + { + "epoch": 0.95, + "learning_rate": 1.010834530697837e-08, + "loss": 0.0004, + "step": 48949 + }, + { + "epoch": 0.95, + "learning_rate": 1.0104461962642228e-08, + "loss": 0.0083, + "step": 48950 + }, + { + "epoch": 0.95, + "learning_rate": 1.0100578618306085e-08, + "loss": 0.0003, + "step": 48951 + }, + { + "epoch": 0.95, + "learning_rate": 1.0096695273969943e-08, + "loss": 0.0006, + "step": 48952 + }, + { + "epoch": 0.95, + "learning_rate": 1.00928119296338e-08, + "loss": 0.8714, + "step": 48953 + }, + { + "epoch": 0.95, + "learning_rate": 1.0088928585297658e-08, + "loss": 0.0004, + "step": 48954 + }, + { + "epoch": 0.95, + "learning_rate": 1.0085045240961514e-08, + "loss": 0.0003, + "step": 48955 + }, + { + "epoch": 0.95, + "learning_rate": 1.0081161896625372e-08, + "loss": 0.0003, + "step": 48956 + }, + { + "epoch": 0.95, + "learning_rate": 1.007727855228923e-08, + "loss": 0.0003, + "step": 48957 + }, + { + "epoch": 0.95, + "learning_rate": 1.0073395207953089e-08, + "loss": 0.0007, + "step": 48958 + }, + { + "epoch": 0.95, + "learning_rate": 1.0069511863616946e-08, + "loss": 0.0004, + "step": 48959 + }, + { + "epoch": 0.95, + "learning_rate": 1.0065628519280804e-08, + "loss": 0.0003, + "step": 48960 + }, + { + "epoch": 0.95, + "learning_rate": 1.0061745174944662e-08, + "loss": 0.0004, + "step": 48961 + }, + { + "epoch": 0.95, + "learning_rate": 1.005786183060852e-08, + "loss": 0.0005, + "step": 48962 + }, + { + "epoch": 0.95, + "learning_rate": 1.0053978486272377e-08, + "loss": 0.0003, + "step": 48963 + }, + { + "epoch": 0.95, + "learning_rate": 1.0050095141936235e-08, + "loss": 0.0004, + "step": 48964 + }, + { + "epoch": 0.95, + "learning_rate": 1.0046211797600093e-08, + "loss": 0.0005, + "step": 48965 + }, + { + "epoch": 0.95, + "learning_rate": 1.004232845326395e-08, + "loss": 0.0007, + "step": 48966 + }, + { + "epoch": 0.95, + "learning_rate": 1.0038445108927808e-08, + "loss": 0.0003, + "step": 48967 + }, + { + "epoch": 0.95, + "learning_rate": 1.0034561764591666e-08, + "loss": 0.0016, + "step": 48968 + }, + { + "epoch": 0.95, + "learning_rate": 1.0030678420255525e-08, + "loss": 0.0003, + "step": 48969 + }, + { + "epoch": 0.95, + "learning_rate": 1.0026795075919381e-08, + "loss": 0.07, + "step": 48970 + }, + { + "epoch": 0.95, + "learning_rate": 1.002291173158324e-08, + "loss": 0.0003, + "step": 48971 + }, + { + "epoch": 0.95, + "learning_rate": 1.0019028387247098e-08, + "loss": 0.0005, + "step": 48972 + }, + { + "epoch": 0.95, + "learning_rate": 1.0015145042910954e-08, + "loss": 0.0004, + "step": 48973 + }, + { + "epoch": 0.95, + "learning_rate": 1.0011261698574813e-08, + "loss": 0.0004, + "step": 48974 + }, + { + "epoch": 0.95, + "learning_rate": 1.000737835423867e-08, + "loss": 0.0004, + "step": 48975 + }, + { + "epoch": 0.95, + "learning_rate": 1.0003495009902527e-08, + "loss": 0.0004, + "step": 48976 + }, + { + "epoch": 0.95, + "learning_rate": 9.999611665566384e-09, + "loss": 0.0003, + "step": 48977 + }, + { + "epoch": 0.95, + "learning_rate": 9.995728321230242e-09, + "loss": 0.0004, + "step": 48978 + }, + { + "epoch": 0.95, + "learning_rate": 9.9918449768941e-09, + "loss": 0.6796, + "step": 48979 + }, + { + "epoch": 0.95, + "learning_rate": 9.987961632557959e-09, + "loss": 0.0002, + "step": 48980 + }, + { + "epoch": 0.95, + "learning_rate": 9.984078288221815e-09, + "loss": 0.0005, + "step": 48981 + }, + { + "epoch": 0.95, + "learning_rate": 9.980194943885674e-09, + "loss": 0.0006, + "step": 48982 + }, + { + "epoch": 0.95, + "learning_rate": 9.976311599549532e-09, + "loss": 0.0004, + "step": 48983 + }, + { + "epoch": 0.95, + "learning_rate": 9.972428255213388e-09, + "loss": 0.0004, + "step": 48984 + }, + { + "epoch": 0.95, + "learning_rate": 9.968544910877247e-09, + "loss": 0.0004, + "step": 48985 + }, + { + "epoch": 0.95, + "learning_rate": 9.964661566541105e-09, + "loss": 0.0006, + "step": 48986 + }, + { + "epoch": 0.95, + "learning_rate": 9.960778222204963e-09, + "loss": 0.0005, + "step": 48987 + }, + { + "epoch": 0.95, + "learning_rate": 9.95689487786882e-09, + "loss": 0.4482, + "step": 48988 + }, + { + "epoch": 0.95, + "learning_rate": 9.953011533532678e-09, + "loss": 0.0009, + "step": 48989 + }, + { + "epoch": 0.95, + "learning_rate": 9.949128189196536e-09, + "loss": 0.0006, + "step": 48990 + }, + { + "epoch": 0.95, + "learning_rate": 9.945244844860395e-09, + "loss": 0.0005, + "step": 48991 + }, + { + "epoch": 0.95, + "learning_rate": 9.941361500524251e-09, + "loss": 0.0004, + "step": 48992 + }, + { + "epoch": 0.95, + "learning_rate": 9.93747815618811e-09, + "loss": 0.0004, + "step": 48993 + }, + { + "epoch": 0.95, + "learning_rate": 9.933594811851968e-09, + "loss": 0.0003, + "step": 48994 + }, + { + "epoch": 0.95, + "learning_rate": 9.929711467515824e-09, + "loss": 0.0003, + "step": 48995 + }, + { + "epoch": 0.95, + "learning_rate": 9.925828123179682e-09, + "loss": 0.0003, + "step": 48996 + }, + { + "epoch": 0.95, + "learning_rate": 9.921944778843539e-09, + "loss": 0.0006, + "step": 48997 + }, + { + "epoch": 0.95, + "learning_rate": 9.918061434507397e-09, + "loss": 0.0057, + "step": 48998 + }, + { + "epoch": 0.95, + "learning_rate": 9.914178090171254e-09, + "loss": 0.0004, + "step": 48999 + }, + { + "epoch": 0.95, + "learning_rate": 9.910294745835112e-09, + "loss": 0.0003, + "step": 49000 + }, + { + "epoch": 0.95, + "learning_rate": 9.90641140149897e-09, + "loss": 0.7784, + "step": 49001 + }, + { + "epoch": 0.95, + "learning_rate": 9.902528057162827e-09, + "loss": 0.0003, + "step": 49002 + }, + { + "epoch": 0.95, + "learning_rate": 9.898644712826685e-09, + "loss": 0.0003, + "step": 49003 + }, + { + "epoch": 0.95, + "learning_rate": 9.894761368490543e-09, + "loss": 0.0006, + "step": 49004 + }, + { + "epoch": 0.95, + "learning_rate": 9.890878024154402e-09, + "loss": 0.0004, + "step": 49005 + }, + { + "epoch": 0.95, + "learning_rate": 9.886994679818258e-09, + "loss": 0.0003, + "step": 49006 + }, + { + "epoch": 0.95, + "learning_rate": 9.883111335482116e-09, + "loss": 0.0003, + "step": 49007 + }, + { + "epoch": 0.95, + "learning_rate": 9.879227991145975e-09, + "loss": 0.0005, + "step": 49008 + }, + { + "epoch": 0.95, + "learning_rate": 9.875344646809833e-09, + "loss": 0.0004, + "step": 49009 + }, + { + "epoch": 0.95, + "learning_rate": 9.87146130247369e-09, + "loss": 0.0004, + "step": 49010 + }, + { + "epoch": 0.95, + "learning_rate": 9.867577958137548e-09, + "loss": 0.0004, + "step": 49011 + }, + { + "epoch": 0.95, + "learning_rate": 9.863694613801406e-09, + "loss": 0.0002, + "step": 49012 + }, + { + "epoch": 0.95, + "learning_rate": 9.859811269465263e-09, + "loss": 0.0004, + "step": 49013 + }, + { + "epoch": 0.95, + "learning_rate": 9.855927925129121e-09, + "loss": 0.0228, + "step": 49014 + }, + { + "epoch": 0.95, + "learning_rate": 9.852044580792979e-09, + "loss": 0.0005, + "step": 49015 + }, + { + "epoch": 0.95, + "learning_rate": 9.848161236456837e-09, + "loss": 0.02, + "step": 49016 + }, + { + "epoch": 0.95, + "learning_rate": 9.844277892120694e-09, + "loss": 0.0005, + "step": 49017 + }, + { + "epoch": 0.95, + "learning_rate": 9.840394547784552e-09, + "loss": 0.0003, + "step": 49018 + }, + { + "epoch": 0.95, + "learning_rate": 9.836511203448409e-09, + "loss": 0.0004, + "step": 49019 + }, + { + "epoch": 0.95, + "learning_rate": 9.832627859112267e-09, + "loss": 0.0003, + "step": 49020 + }, + { + "epoch": 0.95, + "learning_rate": 9.828744514776124e-09, + "loss": 0.0003, + "step": 49021 + }, + { + "epoch": 0.95, + "learning_rate": 9.824861170439982e-09, + "loss": 0.0003, + "step": 49022 + }, + { + "epoch": 0.95, + "learning_rate": 9.82097782610384e-09, + "loss": 0.0013, + "step": 49023 + }, + { + "epoch": 0.95, + "learning_rate": 9.817094481767697e-09, + "loss": 0.0003, + "step": 49024 + }, + { + "epoch": 0.95, + "learning_rate": 9.813211137431555e-09, + "loss": 0.0007, + "step": 49025 + }, + { + "epoch": 0.95, + "learning_rate": 9.809327793095413e-09, + "loss": 0.0004, + "step": 49026 + }, + { + "epoch": 0.95, + "learning_rate": 9.805444448759271e-09, + "loss": 0.7782, + "step": 49027 + }, + { + "epoch": 0.95, + "learning_rate": 9.801561104423128e-09, + "loss": 0.0009, + "step": 49028 + }, + { + "epoch": 0.95, + "learning_rate": 9.797677760086986e-09, + "loss": 0.0004, + "step": 49029 + }, + { + "epoch": 0.95, + "learning_rate": 9.793794415750845e-09, + "loss": 0.0009, + "step": 49030 + }, + { + "epoch": 0.95, + "learning_rate": 9.789911071414701e-09, + "loss": 0.0005, + "step": 49031 + }, + { + "epoch": 0.95, + "learning_rate": 9.78602772707856e-09, + "loss": 0.0004, + "step": 49032 + }, + { + "epoch": 0.95, + "learning_rate": 9.782144382742418e-09, + "loss": 0.0004, + "step": 49033 + }, + { + "epoch": 0.95, + "learning_rate": 9.778261038406276e-09, + "loss": 0.966, + "step": 49034 + }, + { + "epoch": 0.95, + "learning_rate": 9.774377694070132e-09, + "loss": 0.0003, + "step": 49035 + }, + { + "epoch": 0.95, + "learning_rate": 9.77049434973399e-09, + "loss": 0.0003, + "step": 49036 + }, + { + "epoch": 0.95, + "learning_rate": 9.766611005397849e-09, + "loss": 0.0004, + "step": 49037 + }, + { + "epoch": 0.95, + "learning_rate": 9.762727661061707e-09, + "loss": 0.0003, + "step": 49038 + }, + { + "epoch": 0.95, + "learning_rate": 9.758844316725564e-09, + "loss": 0.581, + "step": 49039 + }, + { + "epoch": 0.95, + "learning_rate": 9.754960972389422e-09, + "loss": 0.0005, + "step": 49040 + }, + { + "epoch": 0.95, + "learning_rate": 9.75107762805328e-09, + "loss": 0.0005, + "step": 49041 + }, + { + "epoch": 0.95, + "learning_rate": 9.747194283717137e-09, + "loss": 0.0008, + "step": 49042 + }, + { + "epoch": 0.95, + "learning_rate": 9.743310939380993e-09, + "loss": 0.0005, + "step": 49043 + }, + { + "epoch": 0.95, + "learning_rate": 9.739427595044852e-09, + "loss": 0.0004, + "step": 49044 + }, + { + "epoch": 0.95, + "learning_rate": 9.73554425070871e-09, + "loss": 0.0004, + "step": 49045 + }, + { + "epoch": 0.95, + "learning_rate": 9.731660906372567e-09, + "loss": 0.0005, + "step": 49046 + }, + { + "epoch": 0.95, + "learning_rate": 9.727777562036425e-09, + "loss": 0.0004, + "step": 49047 + }, + { + "epoch": 0.95, + "learning_rate": 9.723894217700283e-09, + "loss": 0.0004, + "step": 49048 + }, + { + "epoch": 0.95, + "learning_rate": 9.720010873364141e-09, + "loss": 0.0004, + "step": 49049 + }, + { + "epoch": 0.95, + "learning_rate": 9.716127529027998e-09, + "loss": 0.0004, + "step": 49050 + }, + { + "epoch": 0.95, + "learning_rate": 9.712244184691856e-09, + "loss": 0.0003, + "step": 49051 + }, + { + "epoch": 0.95, + "learning_rate": 9.708360840355714e-09, + "loss": 0.0006, + "step": 49052 + }, + { + "epoch": 0.95, + "learning_rate": 9.704477496019571e-09, + "loss": 0.0006, + "step": 49053 + }, + { + "epoch": 0.95, + "learning_rate": 9.700594151683429e-09, + "loss": 0.0003, + "step": 49054 + }, + { + "epoch": 0.95, + "learning_rate": 9.696710807347287e-09, + "loss": 0.0004, + "step": 49055 + }, + { + "epoch": 0.95, + "learning_rate": 9.692827463011146e-09, + "loss": 0.0005, + "step": 49056 + }, + { + "epoch": 0.95, + "learning_rate": 9.688944118675002e-09, + "loss": 0.0004, + "step": 49057 + }, + { + "epoch": 0.95, + "learning_rate": 9.68506077433886e-09, + "loss": 0.0004, + "step": 49058 + }, + { + "epoch": 0.95, + "learning_rate": 9.681177430002719e-09, + "loss": 0.0009, + "step": 49059 + }, + { + "epoch": 0.95, + "learning_rate": 9.677294085666575e-09, + "loss": 0.0003, + "step": 49060 + }, + { + "epoch": 0.95, + "learning_rate": 9.673410741330434e-09, + "loss": 0.0003, + "step": 49061 + }, + { + "epoch": 0.95, + "learning_rate": 9.669527396994292e-09, + "loss": 0.0011, + "step": 49062 + }, + { + "epoch": 0.95, + "learning_rate": 9.66564405265815e-09, + "loss": 0.0003, + "step": 49063 + }, + { + "epoch": 0.95, + "learning_rate": 9.661760708322007e-09, + "loss": 0.0004, + "step": 49064 + }, + { + "epoch": 0.95, + "learning_rate": 9.657877363985865e-09, + "loss": 0.0005, + "step": 49065 + }, + { + "epoch": 0.95, + "learning_rate": 9.653994019649721e-09, + "loss": 0.0003, + "step": 49066 + }, + { + "epoch": 0.95, + "learning_rate": 9.65011067531358e-09, + "loss": 0.0003, + "step": 49067 + }, + { + "epoch": 0.95, + "learning_rate": 9.646227330977436e-09, + "loss": 0.0004, + "step": 49068 + }, + { + "epoch": 0.95, + "learning_rate": 9.642343986641295e-09, + "loss": 0.0004, + "step": 49069 + }, + { + "epoch": 0.95, + "learning_rate": 9.638460642305153e-09, + "loss": 0.0005, + "step": 49070 + }, + { + "epoch": 0.95, + "learning_rate": 9.63457729796901e-09, + "loss": 0.0178, + "step": 49071 + }, + { + "epoch": 0.95, + "learning_rate": 9.630693953632868e-09, + "loss": 0.0004, + "step": 49072 + }, + { + "epoch": 0.95, + "learning_rate": 9.626810609296726e-09, + "loss": 0.0003, + "step": 49073 + }, + { + "epoch": 0.95, + "learning_rate": 9.622927264960584e-09, + "loss": 0.158, + "step": 49074 + }, + { + "epoch": 0.95, + "learning_rate": 9.61904392062444e-09, + "loss": 0.0003, + "step": 49075 + }, + { + "epoch": 0.95, + "learning_rate": 9.615160576288299e-09, + "loss": 0.0004, + "step": 49076 + }, + { + "epoch": 0.95, + "learning_rate": 9.611277231952157e-09, + "loss": 0.0004, + "step": 49077 + }, + { + "epoch": 0.95, + "learning_rate": 9.607393887616015e-09, + "loss": 0.0003, + "step": 49078 + }, + { + "epoch": 0.95, + "learning_rate": 9.603510543279872e-09, + "loss": 0.0003, + "step": 49079 + }, + { + "epoch": 0.95, + "learning_rate": 9.59962719894373e-09, + "loss": 0.0004, + "step": 49080 + }, + { + "epoch": 0.95, + "learning_rate": 9.595743854607589e-09, + "loss": 0.0004, + "step": 49081 + }, + { + "epoch": 0.95, + "learning_rate": 9.591860510271445e-09, + "loss": 0.0003, + "step": 49082 + }, + { + "epoch": 0.95, + "learning_rate": 9.587977165935303e-09, + "loss": 0.0012, + "step": 49083 + }, + { + "epoch": 0.95, + "learning_rate": 9.584093821599162e-09, + "loss": 0.0003, + "step": 49084 + }, + { + "epoch": 0.95, + "learning_rate": 9.58021047726302e-09, + "loss": 1.121, + "step": 49085 + }, + { + "epoch": 0.95, + "learning_rate": 9.576327132926876e-09, + "loss": 0.0003, + "step": 49086 + }, + { + "epoch": 0.95, + "learning_rate": 9.572443788590735e-09, + "loss": 0.0003, + "step": 49087 + }, + { + "epoch": 0.95, + "learning_rate": 9.568560444254591e-09, + "loss": 0.0003, + "step": 49088 + }, + { + "epoch": 0.95, + "learning_rate": 9.564677099918448e-09, + "loss": 0.0003, + "step": 49089 + }, + { + "epoch": 0.95, + "learning_rate": 9.560793755582306e-09, + "loss": 0.0004, + "step": 49090 + }, + { + "epoch": 0.95, + "learning_rate": 9.556910411246164e-09, + "loss": 0.0004, + "step": 49091 + }, + { + "epoch": 0.95, + "learning_rate": 9.553027066910023e-09, + "loss": 0.0004, + "step": 49092 + }, + { + "epoch": 0.95, + "learning_rate": 9.54914372257388e-09, + "loss": 0.0002, + "step": 49093 + }, + { + "epoch": 0.95, + "learning_rate": 9.545260378237737e-09, + "loss": 0.0009, + "step": 49094 + }, + { + "epoch": 0.95, + "learning_rate": 9.541377033901596e-09, + "loss": 0.0162, + "step": 49095 + }, + { + "epoch": 0.95, + "learning_rate": 9.537493689565454e-09, + "loss": 0.0004, + "step": 49096 + }, + { + "epoch": 0.95, + "learning_rate": 9.53361034522931e-09, + "loss": 0.0007, + "step": 49097 + }, + { + "epoch": 0.95, + "learning_rate": 9.529727000893169e-09, + "loss": 0.0004, + "step": 49098 + }, + { + "epoch": 0.95, + "learning_rate": 9.525843656557027e-09, + "loss": 0.0005, + "step": 49099 + }, + { + "epoch": 0.95, + "learning_rate": 9.521960312220884e-09, + "loss": 0.3682, + "step": 49100 + }, + { + "epoch": 0.95, + "learning_rate": 9.518076967884742e-09, + "loss": 0.0004, + "step": 49101 + }, + { + "epoch": 0.95, + "learning_rate": 9.5141936235486e-09, + "loss": 0.0004, + "step": 49102 + }, + { + "epoch": 0.95, + "learning_rate": 9.510310279212458e-09, + "loss": 0.0006, + "step": 49103 + }, + { + "epoch": 0.95, + "learning_rate": 9.506426934876315e-09, + "loss": 0.0023, + "step": 49104 + }, + { + "epoch": 0.95, + "learning_rate": 9.502543590540173e-09, + "loss": 0.0009, + "step": 49105 + }, + { + "epoch": 0.95, + "learning_rate": 9.498660246204031e-09, + "loss": 0.0772, + "step": 49106 + }, + { + "epoch": 0.95, + "learning_rate": 9.49477690186789e-09, + "loss": 0.5244, + "step": 49107 + }, + { + "epoch": 0.95, + "learning_rate": 9.490893557531746e-09, + "loss": 0.0005, + "step": 49108 + }, + { + "epoch": 0.95, + "learning_rate": 9.487010213195604e-09, + "loss": 0.0006, + "step": 49109 + }, + { + "epoch": 0.95, + "learning_rate": 9.483126868859461e-09, + "loss": 0.0008, + "step": 49110 + }, + { + "epoch": 0.95, + "learning_rate": 9.47924352452332e-09, + "loss": 0.0005, + "step": 49111 + }, + { + "epoch": 0.95, + "learning_rate": 9.475360180187176e-09, + "loss": 0.0007, + "step": 49112 + }, + { + "epoch": 0.95, + "learning_rate": 9.471476835851034e-09, + "loss": 0.0008, + "step": 49113 + }, + { + "epoch": 0.95, + "learning_rate": 9.467593491514892e-09, + "loss": 0.0079, + "step": 49114 + }, + { + "epoch": 0.95, + "learning_rate": 9.463710147178749e-09, + "loss": 0.0003, + "step": 49115 + }, + { + "epoch": 0.95, + "learning_rate": 9.459826802842607e-09, + "loss": 0.0003, + "step": 49116 + }, + { + "epoch": 0.95, + "learning_rate": 9.455943458506465e-09, + "loss": 0.0004, + "step": 49117 + }, + { + "epoch": 0.95, + "learning_rate": 9.452060114170322e-09, + "loss": 0.0006, + "step": 49118 + }, + { + "epoch": 0.95, + "learning_rate": 9.44817676983418e-09, + "loss": 0.0004, + "step": 49119 + }, + { + "epoch": 0.95, + "learning_rate": 9.444293425498039e-09, + "loss": 0.0665, + "step": 49120 + }, + { + "epoch": 0.95, + "learning_rate": 9.440410081161897e-09, + "loss": 0.0003, + "step": 49121 + }, + { + "epoch": 0.95, + "learning_rate": 9.436526736825753e-09, + "loss": 0.0004, + "step": 49122 + }, + { + "epoch": 0.95, + "learning_rate": 9.432643392489612e-09, + "loss": 0.0009, + "step": 49123 + }, + { + "epoch": 0.95, + "learning_rate": 9.42876004815347e-09, + "loss": 0.0003, + "step": 49124 + }, + { + "epoch": 0.95, + "learning_rate": 9.424876703817328e-09, + "loss": 0.0003, + "step": 49125 + }, + { + "epoch": 0.95, + "learning_rate": 9.420993359481185e-09, + "loss": 0.0003, + "step": 49126 + }, + { + "epoch": 0.95, + "learning_rate": 9.417110015145043e-09, + "loss": 0.0003, + "step": 49127 + }, + { + "epoch": 0.95, + "learning_rate": 9.413226670808901e-09, + "loss": 0.0003, + "step": 49128 + }, + { + "epoch": 0.95, + "learning_rate": 9.409343326472758e-09, + "loss": 1.5213, + "step": 49129 + }, + { + "epoch": 0.95, + "learning_rate": 9.405459982136616e-09, + "loss": 0.0009, + "step": 49130 + }, + { + "epoch": 0.95, + "learning_rate": 9.401576637800474e-09, + "loss": 0.0002, + "step": 49131 + }, + { + "epoch": 0.95, + "learning_rate": 9.397693293464331e-09, + "loss": 0.0004, + "step": 49132 + }, + { + "epoch": 0.95, + "learning_rate": 9.393809949128189e-09, + "loss": 0.0005, + "step": 49133 + }, + { + "epoch": 0.95, + "learning_rate": 9.389926604792046e-09, + "loss": 0.0003, + "step": 49134 + }, + { + "epoch": 0.95, + "learning_rate": 9.386043260455904e-09, + "loss": 0.0003, + "step": 49135 + }, + { + "epoch": 0.95, + "learning_rate": 9.382159916119762e-09, + "loss": 0.0004, + "step": 49136 + }, + { + "epoch": 0.95, + "learning_rate": 9.378276571783619e-09, + "loss": 0.0005, + "step": 49137 + }, + { + "epoch": 0.95, + "learning_rate": 9.374393227447477e-09, + "loss": 0.0005, + "step": 49138 + }, + { + "epoch": 0.95, + "learning_rate": 9.370509883111335e-09, + "loss": 0.0003, + "step": 49139 + }, + { + "epoch": 0.95, + "learning_rate": 9.366626538775192e-09, + "loss": 0.0005, + "step": 49140 + }, + { + "epoch": 0.95, + "learning_rate": 9.36274319443905e-09, + "loss": 0.0004, + "step": 49141 + }, + { + "epoch": 0.95, + "learning_rate": 9.358859850102908e-09, + "loss": 0.0003, + "step": 49142 + }, + { + "epoch": 0.95, + "learning_rate": 9.354976505766767e-09, + "loss": 0.0004, + "step": 49143 + }, + { + "epoch": 0.95, + "learning_rate": 9.351093161430623e-09, + "loss": 0.001, + "step": 49144 + }, + { + "epoch": 0.95, + "learning_rate": 9.347209817094481e-09, + "loss": 0.0032, + "step": 49145 + }, + { + "epoch": 0.95, + "learning_rate": 9.34332647275834e-09, + "loss": 0.0004, + "step": 49146 + }, + { + "epoch": 0.95, + "learning_rate": 9.339443128422196e-09, + "loss": 0.0003, + "step": 49147 + }, + { + "epoch": 0.95, + "learning_rate": 9.335559784086054e-09, + "loss": 0.0007, + "step": 49148 + }, + { + "epoch": 0.95, + "learning_rate": 9.331676439749913e-09, + "loss": 0.0006, + "step": 49149 + }, + { + "epoch": 0.95, + "learning_rate": 9.327793095413771e-09, + "loss": 0.0004, + "step": 49150 + }, + { + "epoch": 0.95, + "learning_rate": 9.323909751077628e-09, + "loss": 1.1716, + "step": 49151 + }, + { + "epoch": 0.95, + "learning_rate": 9.320026406741486e-09, + "loss": 0.0004, + "step": 49152 + }, + { + "epoch": 0.95, + "learning_rate": 9.316143062405344e-09, + "loss": 0.0003, + "step": 49153 + }, + { + "epoch": 0.95, + "learning_rate": 9.3122597180692e-09, + "loss": 0.0368, + "step": 49154 + }, + { + "epoch": 0.95, + "learning_rate": 9.308376373733059e-09, + "loss": 0.0008, + "step": 49155 + }, + { + "epoch": 0.95, + "learning_rate": 9.304493029396915e-09, + "loss": 0.0003, + "step": 49156 + }, + { + "epoch": 0.95, + "learning_rate": 9.300609685060774e-09, + "loss": 0.0003, + "step": 49157 + }, + { + "epoch": 0.95, + "learning_rate": 9.29672634072463e-09, + "loss": 0.0003, + "step": 49158 + }, + { + "epoch": 0.95, + "learning_rate": 9.292842996388489e-09, + "loss": 0.0004, + "step": 49159 + }, + { + "epoch": 0.95, + "learning_rate": 9.288959652052347e-09, + "loss": 0.0003, + "step": 49160 + }, + { + "epoch": 0.95, + "learning_rate": 9.285076307716205e-09, + "loss": 0.0003, + "step": 49161 + }, + { + "epoch": 0.95, + "learning_rate": 9.281192963380062e-09, + "loss": 0.0985, + "step": 49162 + }, + { + "epoch": 0.95, + "learning_rate": 9.27730961904392e-09, + "loss": 0.0004, + "step": 49163 + }, + { + "epoch": 0.95, + "learning_rate": 9.273426274707778e-09, + "loss": 0.0003, + "step": 49164 + }, + { + "epoch": 0.95, + "learning_rate": 9.269542930371636e-09, + "loss": 0.0014, + "step": 49165 + }, + { + "epoch": 0.95, + "learning_rate": 9.265659586035493e-09, + "loss": 0.0017, + "step": 49166 + }, + { + "epoch": 0.95, + "learning_rate": 9.261776241699351e-09, + "loss": 0.0011, + "step": 49167 + }, + { + "epoch": 0.95, + "learning_rate": 9.25789289736321e-09, + "loss": 0.0039, + "step": 49168 + }, + { + "epoch": 0.95, + "learning_rate": 9.254009553027066e-09, + "loss": 0.0007, + "step": 49169 + }, + { + "epoch": 0.95, + "learning_rate": 9.250126208690924e-09, + "loss": 0.0004, + "step": 49170 + }, + { + "epoch": 0.95, + "learning_rate": 9.246242864354783e-09, + "loss": 0.0004, + "step": 49171 + }, + { + "epoch": 0.95, + "learning_rate": 9.24235952001864e-09, + "loss": 0.0003, + "step": 49172 + }, + { + "epoch": 0.95, + "learning_rate": 9.238476175682497e-09, + "loss": 0.0004, + "step": 49173 + }, + { + "epoch": 0.95, + "learning_rate": 9.234592831346356e-09, + "loss": 0.0004, + "step": 49174 + }, + { + "epoch": 0.95, + "learning_rate": 9.230709487010214e-09, + "loss": 0.0003, + "step": 49175 + }, + { + "epoch": 0.95, + "learning_rate": 9.22682614267407e-09, + "loss": 0.0004, + "step": 49176 + }, + { + "epoch": 0.95, + "learning_rate": 9.222942798337929e-09, + "loss": 0.0044, + "step": 49177 + }, + { + "epoch": 0.95, + "learning_rate": 9.219059454001785e-09, + "loss": 1.3555, + "step": 49178 + }, + { + "epoch": 0.95, + "learning_rate": 9.215176109665644e-09, + "loss": 0.0004, + "step": 49179 + }, + { + "epoch": 0.95, + "learning_rate": 9.2112927653295e-09, + "loss": 0.0004, + "step": 49180 + }, + { + "epoch": 0.95, + "learning_rate": 9.207409420993358e-09, + "loss": 0.0003, + "step": 49181 + }, + { + "epoch": 0.95, + "learning_rate": 9.203526076657217e-09, + "loss": 0.0003, + "step": 49182 + }, + { + "epoch": 0.95, + "learning_rate": 9.199642732321075e-09, + "loss": 1.4297, + "step": 49183 + }, + { + "epoch": 0.95, + "learning_rate": 9.195759387984931e-09, + "loss": 0.0483, + "step": 49184 + }, + { + "epoch": 0.95, + "learning_rate": 9.19187604364879e-09, + "loss": 0.0004, + "step": 49185 + }, + { + "epoch": 0.95, + "learning_rate": 9.187992699312648e-09, + "loss": 0.0004, + "step": 49186 + }, + { + "epoch": 0.95, + "learning_rate": 9.184109354976505e-09, + "loss": 0.0005, + "step": 49187 + }, + { + "epoch": 0.95, + "learning_rate": 9.180226010640363e-09, + "loss": 0.0002, + "step": 49188 + }, + { + "epoch": 0.95, + "learning_rate": 9.176342666304221e-09, + "loss": 0.0017, + "step": 49189 + }, + { + "epoch": 0.95, + "learning_rate": 9.17245932196808e-09, + "loss": 0.0005, + "step": 49190 + }, + { + "epoch": 0.95, + "learning_rate": 9.168575977631936e-09, + "loss": 0.0004, + "step": 49191 + }, + { + "epoch": 0.95, + "learning_rate": 9.164692633295794e-09, + "loss": 0.0006, + "step": 49192 + }, + { + "epoch": 0.95, + "learning_rate": 9.160809288959652e-09, + "loss": 0.0003, + "step": 49193 + }, + { + "epoch": 0.95, + "learning_rate": 9.15692594462351e-09, + "loss": 0.0003, + "step": 49194 + }, + { + "epoch": 0.95, + "learning_rate": 9.153042600287367e-09, + "loss": 0.0006, + "step": 49195 + }, + { + "epoch": 0.95, + "learning_rate": 9.149159255951225e-09, + "loss": 0.0005, + "step": 49196 + }, + { + "epoch": 0.95, + "learning_rate": 9.145275911615084e-09, + "loss": 0.0003, + "step": 49197 + }, + { + "epoch": 0.95, + "learning_rate": 9.14139256727894e-09, + "loss": 0.0004, + "step": 49198 + }, + { + "epoch": 0.95, + "learning_rate": 9.137509222942798e-09, + "loss": 0.0006, + "step": 49199 + }, + { + "epoch": 0.95, + "learning_rate": 9.133625878606655e-09, + "loss": 0.0003, + "step": 49200 + }, + { + "epoch": 0.95, + "learning_rate": 9.129742534270513e-09, + "loss": 0.0004, + "step": 49201 + }, + { + "epoch": 0.95, + "learning_rate": 9.12585918993437e-09, + "loss": 0.0004, + "step": 49202 + }, + { + "epoch": 0.95, + "learning_rate": 9.121975845598228e-09, + "loss": 0.0004, + "step": 49203 + }, + { + "epoch": 0.95, + "learning_rate": 9.118092501262086e-09, + "loss": 0.0003, + "step": 49204 + }, + { + "epoch": 0.95, + "learning_rate": 9.114209156925943e-09, + "loss": 0.0003, + "step": 49205 + }, + { + "epoch": 0.95, + "learning_rate": 9.110325812589801e-09, + "loss": 0.0004, + "step": 49206 + }, + { + "epoch": 0.95, + "learning_rate": 9.10644246825366e-09, + "loss": 0.0003, + "step": 49207 + }, + { + "epoch": 0.95, + "learning_rate": 9.102559123917518e-09, + "loss": 0.0018, + "step": 49208 + }, + { + "epoch": 0.95, + "learning_rate": 9.098675779581374e-09, + "loss": 0.0009, + "step": 49209 + }, + { + "epoch": 0.95, + "learning_rate": 9.094792435245233e-09, + "loss": 0.0005, + "step": 49210 + }, + { + "epoch": 0.95, + "learning_rate": 9.09090909090909e-09, + "loss": 0.0004, + "step": 49211 + }, + { + "epoch": 0.95, + "learning_rate": 9.087025746572949e-09, + "loss": 0.0005, + "step": 49212 + }, + { + "epoch": 0.95, + "learning_rate": 9.083142402236806e-09, + "loss": 0.0004, + "step": 49213 + }, + { + "epoch": 0.95, + "learning_rate": 9.079259057900664e-09, + "loss": 0.0004, + "step": 49214 + }, + { + "epoch": 0.95, + "learning_rate": 9.075375713564522e-09, + "loss": 0.0282, + "step": 49215 + }, + { + "epoch": 0.95, + "learning_rate": 9.071492369228379e-09, + "loss": 0.0003, + "step": 49216 + }, + { + "epoch": 0.95, + "learning_rate": 9.067609024892237e-09, + "loss": 0.0024, + "step": 49217 + }, + { + "epoch": 0.95, + "learning_rate": 9.063725680556095e-09, + "loss": 0.0007, + "step": 49218 + }, + { + "epoch": 0.95, + "learning_rate": 9.059842336219953e-09, + "loss": 0.0003, + "step": 49219 + }, + { + "epoch": 0.95, + "learning_rate": 9.05595899188381e-09, + "loss": 0.0003, + "step": 49220 + }, + { + "epoch": 0.95, + "learning_rate": 9.052075647547668e-09, + "loss": 0.0004, + "step": 49221 + }, + { + "epoch": 0.95, + "learning_rate": 9.048192303211525e-09, + "loss": 0.0004, + "step": 49222 + }, + { + "epoch": 0.95, + "learning_rate": 9.044308958875383e-09, + "loss": 0.0004, + "step": 49223 + }, + { + "epoch": 0.95, + "learning_rate": 9.04042561453924e-09, + "loss": 0.0003, + "step": 49224 + }, + { + "epoch": 0.95, + "learning_rate": 9.036542270203098e-09, + "loss": 0.0003, + "step": 49225 + }, + { + "epoch": 0.95, + "learning_rate": 9.032658925866956e-09, + "loss": 0.0004, + "step": 49226 + }, + { + "epoch": 0.95, + "learning_rate": 9.028775581530813e-09, + "loss": 0.0004, + "step": 49227 + }, + { + "epoch": 0.95, + "learning_rate": 9.024892237194671e-09, + "loss": 0.0006, + "step": 49228 + }, + { + "epoch": 0.95, + "learning_rate": 9.02100889285853e-09, + "loss": 0.0002, + "step": 49229 + }, + { + "epoch": 0.95, + "learning_rate": 9.017125548522388e-09, + "loss": 0.0005, + "step": 49230 + }, + { + "epoch": 0.95, + "learning_rate": 9.013242204186244e-09, + "loss": 0.0003, + "step": 49231 + }, + { + "epoch": 0.95, + "learning_rate": 9.009358859850102e-09, + "loss": 0.0003, + "step": 49232 + }, + { + "epoch": 0.96, + "learning_rate": 9.00547551551396e-09, + "loss": 0.0005, + "step": 49233 + }, + { + "epoch": 0.96, + "learning_rate": 9.001592171177817e-09, + "loss": 0.0005, + "step": 49234 + }, + { + "epoch": 0.96, + "learning_rate": 8.997708826841675e-09, + "loss": 0.0004, + "step": 49235 + }, + { + "epoch": 0.96, + "learning_rate": 8.993825482505534e-09, + "loss": 0.0005, + "step": 49236 + }, + { + "epoch": 0.96, + "learning_rate": 8.989942138169392e-09, + "loss": 0.0004, + "step": 49237 + }, + { + "epoch": 0.96, + "learning_rate": 8.986058793833249e-09, + "loss": 0.0005, + "step": 49238 + }, + { + "epoch": 0.96, + "learning_rate": 8.982175449497107e-09, + "loss": 0.0006, + "step": 49239 + }, + { + "epoch": 0.96, + "learning_rate": 8.978292105160965e-09, + "loss": 0.0004, + "step": 49240 + }, + { + "epoch": 0.96, + "learning_rate": 8.974408760824823e-09, + "loss": 0.3128, + "step": 49241 + }, + { + "epoch": 0.96, + "learning_rate": 8.97052541648868e-09, + "loss": 0.0004, + "step": 49242 + }, + { + "epoch": 0.96, + "learning_rate": 8.966642072152538e-09, + "loss": 0.0004, + "step": 49243 + }, + { + "epoch": 0.96, + "learning_rate": 8.962758727816395e-09, + "loss": 0.376, + "step": 49244 + }, + { + "epoch": 0.96, + "learning_rate": 8.958875383480253e-09, + "loss": 0.0003, + "step": 49245 + }, + { + "epoch": 0.96, + "learning_rate": 8.95499203914411e-09, + "loss": 0.0003, + "step": 49246 + }, + { + "epoch": 0.96, + "learning_rate": 8.951108694807968e-09, + "loss": 0.0003, + "step": 49247 + }, + { + "epoch": 0.96, + "learning_rate": 8.947225350471826e-09, + "loss": 0.0004, + "step": 49248 + }, + { + "epoch": 0.96, + "learning_rate": 8.943342006135683e-09, + "loss": 0.0005, + "step": 49249 + }, + { + "epoch": 0.96, + "learning_rate": 8.93945866179954e-09, + "loss": 0.447, + "step": 49250 + }, + { + "epoch": 0.96, + "learning_rate": 8.935575317463399e-09, + "loss": 0.4649, + "step": 49251 + }, + { + "epoch": 0.96, + "learning_rate": 8.931691973127257e-09, + "loss": 0.0008, + "step": 49252 + }, + { + "epoch": 0.96, + "learning_rate": 8.927808628791114e-09, + "loss": 0.0003, + "step": 49253 + }, + { + "epoch": 0.96, + "learning_rate": 8.923925284454972e-09, + "loss": 0.0006, + "step": 49254 + }, + { + "epoch": 0.96, + "learning_rate": 8.92004194011883e-09, + "loss": 0.0004, + "step": 49255 + }, + { + "epoch": 0.96, + "learning_rate": 8.916158595782687e-09, + "loss": 0.0004, + "step": 49256 + }, + { + "epoch": 0.96, + "learning_rate": 8.912275251446545e-09, + "loss": 0.0004, + "step": 49257 + }, + { + "epoch": 0.96, + "learning_rate": 8.908391907110403e-09, + "loss": 0.0003, + "step": 49258 + }, + { + "epoch": 0.96, + "learning_rate": 8.904508562774262e-09, + "loss": 0.0003, + "step": 49259 + }, + { + "epoch": 0.96, + "learning_rate": 8.900625218438118e-09, + "loss": 0.0004, + "step": 49260 + }, + { + "epoch": 0.96, + "learning_rate": 8.896741874101977e-09, + "loss": 0.0005, + "step": 49261 + }, + { + "epoch": 0.96, + "learning_rate": 8.892858529765835e-09, + "loss": 0.0005, + "step": 49262 + }, + { + "epoch": 0.96, + "learning_rate": 8.888975185429691e-09, + "loss": 0.0014, + "step": 49263 + }, + { + "epoch": 0.96, + "learning_rate": 8.88509184109355e-09, + "loss": 0.0004, + "step": 49264 + }, + { + "epoch": 0.96, + "learning_rate": 8.881208496757408e-09, + "loss": 0.0004, + "step": 49265 + }, + { + "epoch": 0.96, + "learning_rate": 8.877325152421264e-09, + "loss": 0.0005, + "step": 49266 + }, + { + "epoch": 0.96, + "learning_rate": 8.873441808085123e-09, + "loss": 0.0003, + "step": 49267 + }, + { + "epoch": 0.96, + "learning_rate": 8.86955846374898e-09, + "loss": 0.0008, + "step": 49268 + }, + { + "epoch": 0.96, + "learning_rate": 8.865675119412838e-09, + "loss": 0.0003, + "step": 49269 + }, + { + "epoch": 0.96, + "learning_rate": 8.861791775076696e-09, + "loss": 1.1807, + "step": 49270 + }, + { + "epoch": 0.96, + "learning_rate": 8.857908430740552e-09, + "loss": 0.0003, + "step": 49271 + }, + { + "epoch": 0.96, + "learning_rate": 8.85402508640441e-09, + "loss": 0.0003, + "step": 49272 + }, + { + "epoch": 0.96, + "learning_rate": 8.850141742068269e-09, + "loss": 0.0005, + "step": 49273 + }, + { + "epoch": 0.96, + "learning_rate": 8.846258397732125e-09, + "loss": 0.0004, + "step": 49274 + }, + { + "epoch": 0.96, + "learning_rate": 8.842375053395984e-09, + "loss": 0.0005, + "step": 49275 + }, + { + "epoch": 0.96, + "learning_rate": 8.838491709059842e-09, + "loss": 0.9699, + "step": 49276 + }, + { + "epoch": 0.96, + "learning_rate": 8.8346083647237e-09, + "loss": 0.0005, + "step": 49277 + }, + { + "epoch": 0.96, + "learning_rate": 8.830725020387557e-09, + "loss": 0.0003, + "step": 49278 + }, + { + "epoch": 0.96, + "learning_rate": 8.826841676051415e-09, + "loss": 0.0004, + "step": 49279 + }, + { + "epoch": 0.96, + "learning_rate": 8.822958331715273e-09, + "loss": 0.0003, + "step": 49280 + }, + { + "epoch": 0.96, + "learning_rate": 8.819074987379132e-09, + "loss": 0.0004, + "step": 49281 + }, + { + "epoch": 0.96, + "learning_rate": 8.815191643042988e-09, + "loss": 0.0004, + "step": 49282 + }, + { + "epoch": 0.96, + "learning_rate": 8.811308298706846e-09, + "loss": 0.0004, + "step": 49283 + }, + { + "epoch": 0.96, + "learning_rate": 8.807424954370705e-09, + "loss": 0.0003, + "step": 49284 + }, + { + "epoch": 0.96, + "learning_rate": 8.803541610034561e-09, + "loss": 0.0005, + "step": 49285 + }, + { + "epoch": 0.96, + "learning_rate": 8.79965826569842e-09, + "loss": 0.0003, + "step": 49286 + }, + { + "epoch": 0.96, + "learning_rate": 8.795774921362278e-09, + "loss": 1.121, + "step": 49287 + }, + { + "epoch": 0.96, + "learning_rate": 8.791891577026136e-09, + "loss": 0.0007, + "step": 49288 + }, + { + "epoch": 0.96, + "learning_rate": 8.788008232689992e-09, + "loss": 0.0006, + "step": 49289 + }, + { + "epoch": 0.96, + "learning_rate": 8.784124888353849e-09, + "loss": 0.0006, + "step": 49290 + }, + { + "epoch": 0.96, + "learning_rate": 8.780241544017707e-09, + "loss": 0.1924, + "step": 49291 + }, + { + "epoch": 0.96, + "learning_rate": 8.776358199681564e-09, + "loss": 0.0004, + "step": 49292 + }, + { + "epoch": 0.96, + "learning_rate": 8.772474855345422e-09, + "loss": 0.0003, + "step": 49293 + }, + { + "epoch": 0.96, + "learning_rate": 8.76859151100928e-09, + "loss": 0.0004, + "step": 49294 + }, + { + "epoch": 0.96, + "learning_rate": 8.764708166673139e-09, + "loss": 0.8538, + "step": 49295 + }, + { + "epoch": 0.96, + "learning_rate": 8.760824822336995e-09, + "loss": 0.0004, + "step": 49296 + }, + { + "epoch": 0.96, + "learning_rate": 8.756941478000853e-09, + "loss": 0.0006, + "step": 49297 + }, + { + "epoch": 0.96, + "learning_rate": 8.753058133664712e-09, + "loss": 0.0004, + "step": 49298 + }, + { + "epoch": 0.96, + "learning_rate": 8.74917478932857e-09, + "loss": 0.0005, + "step": 49299 + }, + { + "epoch": 0.96, + "learning_rate": 8.745291444992427e-09, + "loss": 0.0695, + "step": 49300 + }, + { + "epoch": 0.96, + "learning_rate": 8.741408100656285e-09, + "loss": 0.0004, + "step": 49301 + }, + { + "epoch": 0.96, + "learning_rate": 8.737524756320143e-09, + "loss": 0.0005, + "step": 49302 + }, + { + "epoch": 0.96, + "learning_rate": 8.733641411984e-09, + "loss": 0.0007, + "step": 49303 + }, + { + "epoch": 0.96, + "learning_rate": 8.729758067647858e-09, + "loss": 1.1991, + "step": 49304 + }, + { + "epoch": 0.96, + "learning_rate": 8.725874723311716e-09, + "loss": 0.0003, + "step": 49305 + }, + { + "epoch": 0.96, + "learning_rate": 8.721991378975574e-09, + "loss": 0.0007, + "step": 49306 + }, + { + "epoch": 0.96, + "learning_rate": 8.718108034639431e-09, + "loss": 0.0006, + "step": 49307 + }, + { + "epoch": 0.96, + "learning_rate": 8.71422469030329e-09, + "loss": 0.0003, + "step": 49308 + }, + { + "epoch": 0.96, + "learning_rate": 8.710341345967147e-09, + "loss": 0.0003, + "step": 49309 + }, + { + "epoch": 0.96, + "learning_rate": 8.706458001631006e-09, + "loss": 0.0003, + "step": 49310 + }, + { + "epoch": 0.96, + "learning_rate": 8.702574657294862e-09, + "loss": 0.0003, + "step": 49311 + }, + { + "epoch": 0.96, + "learning_rate": 8.69869131295872e-09, + "loss": 0.0003, + "step": 49312 + }, + { + "epoch": 0.96, + "learning_rate": 8.694807968622577e-09, + "loss": 0.0004, + "step": 49313 + }, + { + "epoch": 0.96, + "learning_rate": 8.690924624286434e-09, + "loss": 0.0003, + "step": 49314 + }, + { + "epoch": 0.96, + "learning_rate": 8.687041279950292e-09, + "loss": 1.2689, + "step": 49315 + }, + { + "epoch": 0.96, + "learning_rate": 8.68315793561415e-09, + "loss": 0.0003, + "step": 49316 + }, + { + "epoch": 0.96, + "learning_rate": 8.679274591278008e-09, + "loss": 0.0004, + "step": 49317 + }, + { + "epoch": 0.96, + "learning_rate": 8.675391246941865e-09, + "loss": 0.5895, + "step": 49318 + }, + { + "epoch": 0.96, + "learning_rate": 8.671507902605723e-09, + "loss": 0.0067, + "step": 49319 + }, + { + "epoch": 0.96, + "learning_rate": 8.667624558269582e-09, + "loss": 0.0004, + "step": 49320 + }, + { + "epoch": 0.96, + "learning_rate": 8.663741213933438e-09, + "loss": 0.0004, + "step": 49321 + }, + { + "epoch": 0.96, + "learning_rate": 8.659857869597296e-09, + "loss": 0.0004, + "step": 49322 + }, + { + "epoch": 0.96, + "learning_rate": 8.655974525261155e-09, + "loss": 0.0004, + "step": 49323 + }, + { + "epoch": 0.96, + "learning_rate": 8.652091180925013e-09, + "loss": 0.0002, + "step": 49324 + }, + { + "epoch": 0.96, + "learning_rate": 8.64820783658887e-09, + "loss": 0.0005, + "step": 49325 + }, + { + "epoch": 0.96, + "learning_rate": 8.644324492252728e-09, + "loss": 0.0004, + "step": 49326 + }, + { + "epoch": 0.96, + "learning_rate": 8.640441147916586e-09, + "loss": 0.0003, + "step": 49327 + }, + { + "epoch": 0.96, + "learning_rate": 8.636557803580444e-09, + "loss": 0.0004, + "step": 49328 + }, + { + "epoch": 0.96, + "learning_rate": 8.6326744592443e-09, + "loss": 0.0005, + "step": 49329 + }, + { + "epoch": 0.96, + "learning_rate": 8.628791114908159e-09, + "loss": 0.0002, + "step": 49330 + }, + { + "epoch": 0.96, + "learning_rate": 8.624907770572017e-09, + "loss": 0.0003, + "step": 49331 + }, + { + "epoch": 0.96, + "learning_rate": 8.621024426235874e-09, + "loss": 0.0005, + "step": 49332 + }, + { + "epoch": 0.96, + "learning_rate": 8.617141081899732e-09, + "loss": 0.0006, + "step": 49333 + }, + { + "epoch": 0.96, + "learning_rate": 8.61325773756359e-09, + "loss": 0.0005, + "step": 49334 + }, + { + "epoch": 0.96, + "learning_rate": 8.609374393227447e-09, + "loss": 0.0004, + "step": 49335 + }, + { + "epoch": 0.96, + "learning_rate": 8.605491048891305e-09, + "loss": 0.0004, + "step": 49336 + }, + { + "epoch": 0.96, + "learning_rate": 8.601607704555162e-09, + "loss": 0.0004, + "step": 49337 + }, + { + "epoch": 0.96, + "learning_rate": 8.59772436021902e-09, + "loss": 0.0004, + "step": 49338 + }, + { + "epoch": 0.96, + "learning_rate": 8.593841015882878e-09, + "loss": 0.0004, + "step": 49339 + }, + { + "epoch": 0.96, + "learning_rate": 8.589957671546735e-09, + "loss": 0.0005, + "step": 49340 + }, + { + "epoch": 0.96, + "learning_rate": 8.586074327210593e-09, + "loss": 0.0008, + "step": 49341 + }, + { + "epoch": 0.96, + "learning_rate": 8.582190982874451e-09, + "loss": 0.0003, + "step": 49342 + }, + { + "epoch": 0.96, + "learning_rate": 8.578307638538308e-09, + "loss": 0.0003, + "step": 49343 + }, + { + "epoch": 0.96, + "learning_rate": 8.574424294202166e-09, + "loss": 0.0003, + "step": 49344 + }, + { + "epoch": 0.96, + "learning_rate": 8.570540949866024e-09, + "loss": 0.0004, + "step": 49345 + }, + { + "epoch": 0.96, + "learning_rate": 8.566657605529883e-09, + "loss": 0.0003, + "step": 49346 + }, + { + "epoch": 0.96, + "learning_rate": 8.56277426119374e-09, + "loss": 0.0004, + "step": 49347 + }, + { + "epoch": 0.96, + "learning_rate": 8.558890916857597e-09, + "loss": 0.0006, + "step": 49348 + }, + { + "epoch": 0.96, + "learning_rate": 8.555007572521456e-09, + "loss": 0.0003, + "step": 49349 + }, + { + "epoch": 0.96, + "learning_rate": 8.551124228185312e-09, + "loss": 0.0003, + "step": 49350 + }, + { + "epoch": 0.96, + "learning_rate": 8.54724088384917e-09, + "loss": 0.0002, + "step": 49351 + }, + { + "epoch": 0.96, + "learning_rate": 8.543357539513029e-09, + "loss": 0.0003, + "step": 49352 + }, + { + "epoch": 0.96, + "learning_rate": 8.539474195176887e-09, + "loss": 0.0006, + "step": 49353 + }, + { + "epoch": 0.96, + "learning_rate": 8.535590850840744e-09, + "loss": 0.0004, + "step": 49354 + }, + { + "epoch": 0.96, + "learning_rate": 8.531707506504602e-09, + "loss": 0.0004, + "step": 49355 + }, + { + "epoch": 0.96, + "learning_rate": 8.52782416216846e-09, + "loss": 0.0005, + "step": 49356 + }, + { + "epoch": 0.96, + "learning_rate": 8.523940817832317e-09, + "loss": 0.0006, + "step": 49357 + }, + { + "epoch": 0.96, + "learning_rate": 8.520057473496175e-09, + "loss": 0.0004, + "step": 49358 + }, + { + "epoch": 0.96, + "learning_rate": 8.516174129160032e-09, + "loss": 0.0005, + "step": 49359 + }, + { + "epoch": 0.96, + "learning_rate": 8.51229078482389e-09, + "loss": 0.0004, + "step": 49360 + }, + { + "epoch": 0.96, + "learning_rate": 8.508407440487746e-09, + "loss": 0.0004, + "step": 49361 + }, + { + "epoch": 0.96, + "learning_rate": 8.504524096151605e-09, + "loss": 0.0004, + "step": 49362 + }, + { + "epoch": 0.96, + "learning_rate": 8.500640751815463e-09, + "loss": 0.0004, + "step": 49363 + }, + { + "epoch": 0.96, + "learning_rate": 8.496757407479321e-09, + "loss": 0.0003, + "step": 49364 + }, + { + "epoch": 0.96, + "learning_rate": 8.492874063143178e-09, + "loss": 0.0007, + "step": 49365 + }, + { + "epoch": 0.96, + "learning_rate": 8.488990718807036e-09, + "loss": 0.0003, + "step": 49366 + }, + { + "epoch": 0.96, + "learning_rate": 8.485107374470894e-09, + "loss": 0.0003, + "step": 49367 + }, + { + "epoch": 0.96, + "learning_rate": 8.481224030134752e-09, + "loss": 0.0003, + "step": 49368 + }, + { + "epoch": 0.96, + "learning_rate": 8.477340685798609e-09, + "loss": 0.0004, + "step": 49369 + }, + { + "epoch": 0.96, + "learning_rate": 8.473457341462467e-09, + "loss": 0.0003, + "step": 49370 + }, + { + "epoch": 0.96, + "learning_rate": 8.469573997126326e-09, + "loss": 0.0508, + "step": 49371 + }, + { + "epoch": 0.96, + "learning_rate": 8.465690652790182e-09, + "loss": 0.0005, + "step": 49372 + }, + { + "epoch": 0.96, + "learning_rate": 8.46180730845404e-09, + "loss": 0.0004, + "step": 49373 + }, + { + "epoch": 0.96, + "learning_rate": 8.457923964117899e-09, + "loss": 0.0005, + "step": 49374 + }, + { + "epoch": 0.96, + "learning_rate": 8.454040619781757e-09, + "loss": 0.0002, + "step": 49375 + }, + { + "epoch": 0.96, + "learning_rate": 8.450157275445613e-09, + "loss": 0.0003, + "step": 49376 + }, + { + "epoch": 0.96, + "learning_rate": 8.446273931109472e-09, + "loss": 0.0003, + "step": 49377 + }, + { + "epoch": 0.96, + "learning_rate": 8.44239058677333e-09, + "loss": 0.0005, + "step": 49378 + }, + { + "epoch": 0.96, + "learning_rate": 8.438507242437187e-09, + "loss": 0.0004, + "step": 49379 + }, + { + "epoch": 0.96, + "learning_rate": 8.434623898101045e-09, + "loss": 0.0019, + "step": 49380 + }, + { + "epoch": 0.96, + "learning_rate": 8.430740553764901e-09, + "loss": 0.0004, + "step": 49381 + }, + { + "epoch": 0.96, + "learning_rate": 8.42685720942876e-09, + "loss": 0.0003, + "step": 49382 + }, + { + "epoch": 0.96, + "learning_rate": 8.422973865092616e-09, + "loss": 0.0004, + "step": 49383 + }, + { + "epoch": 0.96, + "learning_rate": 8.419090520756474e-09, + "loss": 0.0005, + "step": 49384 + }, + { + "epoch": 0.96, + "learning_rate": 8.415207176420333e-09, + "loss": 0.0005, + "step": 49385 + }, + { + "epoch": 0.96, + "learning_rate": 8.411323832084191e-09, + "loss": 0.0003, + "step": 49386 + }, + { + "epoch": 0.96, + "learning_rate": 8.407440487748048e-09, + "loss": 0.0004, + "step": 49387 + }, + { + "epoch": 0.96, + "learning_rate": 8.403557143411906e-09, + "loss": 0.0004, + "step": 49388 + }, + { + "epoch": 0.96, + "learning_rate": 8.399673799075764e-09, + "loss": 0.0004, + "step": 49389 + }, + { + "epoch": 0.96, + "learning_rate": 8.39579045473962e-09, + "loss": 0.0018, + "step": 49390 + }, + { + "epoch": 0.96, + "learning_rate": 8.391907110403479e-09, + "loss": 0.0613, + "step": 49391 + }, + { + "epoch": 0.96, + "learning_rate": 8.388023766067337e-09, + "loss": 0.0003, + "step": 49392 + }, + { + "epoch": 0.96, + "learning_rate": 8.384140421731195e-09, + "loss": 0.0004, + "step": 49393 + }, + { + "epoch": 0.96, + "learning_rate": 8.380257077395052e-09, + "loss": 0.0003, + "step": 49394 + }, + { + "epoch": 0.96, + "learning_rate": 8.37637373305891e-09, + "loss": 0.0003, + "step": 49395 + }, + { + "epoch": 0.96, + "learning_rate": 8.372490388722768e-09, + "loss": 0.8516, + "step": 49396 + }, + { + "epoch": 0.96, + "learning_rate": 8.368607044386627e-09, + "loss": 0.0003, + "step": 49397 + }, + { + "epoch": 0.96, + "learning_rate": 8.364723700050483e-09, + "loss": 0.0323, + "step": 49398 + }, + { + "epoch": 0.96, + "learning_rate": 8.360840355714341e-09, + "loss": 0.0004, + "step": 49399 + }, + { + "epoch": 0.96, + "learning_rate": 8.3569570113782e-09, + "loss": 0.0004, + "step": 49400 + }, + { + "epoch": 0.96, + "learning_rate": 8.353073667042056e-09, + "loss": 0.0004, + "step": 49401 + }, + { + "epoch": 0.96, + "learning_rate": 8.349190322705915e-09, + "loss": 0.0003, + "step": 49402 + }, + { + "epoch": 0.96, + "learning_rate": 8.345306978369771e-09, + "loss": 0.0003, + "step": 49403 + }, + { + "epoch": 0.96, + "learning_rate": 8.34142363403363e-09, + "loss": 0.0003, + "step": 49404 + }, + { + "epoch": 0.96, + "learning_rate": 8.337540289697486e-09, + "loss": 0.0008, + "step": 49405 + }, + { + "epoch": 0.96, + "learning_rate": 8.333656945361344e-09, + "loss": 0.0003, + "step": 49406 + }, + { + "epoch": 0.96, + "learning_rate": 8.329773601025202e-09, + "loss": 0.0003, + "step": 49407 + }, + { + "epoch": 0.96, + "learning_rate": 8.325890256689059e-09, + "loss": 0.0004, + "step": 49408 + }, + { + "epoch": 0.96, + "learning_rate": 8.322006912352917e-09, + "loss": 0.0202, + "step": 49409 + }, + { + "epoch": 0.96, + "learning_rate": 8.318123568016776e-09, + "loss": 0.0003, + "step": 49410 + }, + { + "epoch": 0.96, + "learning_rate": 8.314240223680634e-09, + "loss": 0.0005, + "step": 49411 + }, + { + "epoch": 0.96, + "learning_rate": 8.31035687934449e-09, + "loss": 0.0003, + "step": 49412 + }, + { + "epoch": 0.96, + "learning_rate": 8.306473535008349e-09, + "loss": 0.0029, + "step": 49413 + }, + { + "epoch": 0.96, + "learning_rate": 8.302590190672207e-09, + "loss": 0.0003, + "step": 49414 + }, + { + "epoch": 0.96, + "learning_rate": 8.298706846336065e-09, + "loss": 0.0006, + "step": 49415 + }, + { + "epoch": 0.96, + "learning_rate": 8.294823501999922e-09, + "loss": 0.0138, + "step": 49416 + }, + { + "epoch": 0.96, + "learning_rate": 8.29094015766378e-09, + "loss": 0.0003, + "step": 49417 + }, + { + "epoch": 0.96, + "learning_rate": 8.287056813327638e-09, + "loss": 0.0004, + "step": 49418 + }, + { + "epoch": 0.96, + "learning_rate": 8.283173468991495e-09, + "loss": 0.0003, + "step": 49419 + }, + { + "epoch": 0.96, + "learning_rate": 8.279290124655353e-09, + "loss": 0.0005, + "step": 49420 + }, + { + "epoch": 0.96, + "learning_rate": 8.275406780319211e-09, + "loss": 0.0003, + "step": 49421 + }, + { + "epoch": 0.96, + "learning_rate": 8.27152343598307e-09, + "loss": 0.1361, + "step": 49422 + }, + { + "epoch": 0.96, + "learning_rate": 8.267640091646926e-09, + "loss": 0.0004, + "step": 49423 + }, + { + "epoch": 0.96, + "learning_rate": 8.263756747310784e-09, + "loss": 0.0004, + "step": 49424 + }, + { + "epoch": 0.96, + "learning_rate": 8.259873402974641e-09, + "loss": 0.0003, + "step": 49425 + }, + { + "epoch": 0.96, + "learning_rate": 8.2559900586385e-09, + "loss": 0.0389, + "step": 49426 + }, + { + "epoch": 0.96, + "learning_rate": 8.252106714302356e-09, + "loss": 0.0004, + "step": 49427 + }, + { + "epoch": 0.96, + "learning_rate": 8.248223369966214e-09, + "loss": 0.0005, + "step": 49428 + }, + { + "epoch": 0.96, + "learning_rate": 8.244340025630072e-09, + "loss": 0.0017, + "step": 49429 + }, + { + "epoch": 0.96, + "learning_rate": 8.240456681293929e-09, + "loss": 0.0004, + "step": 49430 + }, + { + "epoch": 0.96, + "learning_rate": 8.236573336957787e-09, + "loss": 0.0008, + "step": 49431 + }, + { + "epoch": 0.96, + "learning_rate": 8.232689992621645e-09, + "loss": 0.6241, + "step": 49432 + }, + { + "epoch": 0.96, + "learning_rate": 8.228806648285504e-09, + "loss": 0.0003, + "step": 49433 + }, + { + "epoch": 0.96, + "learning_rate": 8.22492330394936e-09, + "loss": 1.2863, + "step": 49434 + }, + { + "epoch": 0.96, + "learning_rate": 8.221039959613218e-09, + "loss": 0.0004, + "step": 49435 + }, + { + "epoch": 0.96, + "learning_rate": 8.217156615277077e-09, + "loss": 0.0004, + "step": 49436 + }, + { + "epoch": 0.96, + "learning_rate": 8.213273270940933e-09, + "loss": 0.0601, + "step": 49437 + }, + { + "epoch": 0.96, + "learning_rate": 8.209389926604791e-09, + "loss": 0.0004, + "step": 49438 + }, + { + "epoch": 0.96, + "learning_rate": 8.20550658226865e-09, + "loss": 0.0005, + "step": 49439 + }, + { + "epoch": 0.96, + "learning_rate": 8.201623237932508e-09, + "loss": 0.8451, + "step": 49440 + }, + { + "epoch": 0.96, + "learning_rate": 8.197739893596365e-09, + "loss": 0.0003, + "step": 49441 + }, + { + "epoch": 0.96, + "learning_rate": 8.193856549260223e-09, + "loss": 0.0003, + "step": 49442 + }, + { + "epoch": 0.96, + "learning_rate": 8.189973204924081e-09, + "loss": 0.0004, + "step": 49443 + }, + { + "epoch": 0.96, + "learning_rate": 8.18608986058794e-09, + "loss": 0.0004, + "step": 49444 + }, + { + "epoch": 0.96, + "learning_rate": 8.182206516251796e-09, + "loss": 0.0004, + "step": 49445 + }, + { + "epoch": 0.96, + "learning_rate": 8.178323171915654e-09, + "loss": 0.0003, + "step": 49446 + }, + { + "epoch": 0.96, + "learning_rate": 8.17443982757951e-09, + "loss": 0.0004, + "step": 49447 + }, + { + "epoch": 0.96, + "learning_rate": 8.170556483243369e-09, + "loss": 0.0004, + "step": 49448 + }, + { + "epoch": 0.96, + "learning_rate": 8.166673138907226e-09, + "loss": 0.0004, + "step": 49449 + }, + { + "epoch": 0.96, + "learning_rate": 8.162789794571084e-09, + "loss": 0.024, + "step": 49450 + }, + { + "epoch": 0.96, + "learning_rate": 8.158906450234942e-09, + "loss": 0.5327, + "step": 49451 + }, + { + "epoch": 0.96, + "learning_rate": 8.155023105898799e-09, + "loss": 1.199, + "step": 49452 + }, + { + "epoch": 0.96, + "learning_rate": 8.151139761562657e-09, + "loss": 0.588, + "step": 49453 + }, + { + "epoch": 0.96, + "learning_rate": 8.147256417226515e-09, + "loss": 0.0003, + "step": 49454 + }, + { + "epoch": 0.96, + "learning_rate": 8.143373072890373e-09, + "loss": 0.0005, + "step": 49455 + }, + { + "epoch": 0.96, + "learning_rate": 8.13948972855423e-09, + "loss": 0.0003, + "step": 49456 + }, + { + "epoch": 0.96, + "learning_rate": 8.135606384218088e-09, + "loss": 0.0005, + "step": 49457 + }, + { + "epoch": 0.96, + "learning_rate": 8.131723039881946e-09, + "loss": 0.0011, + "step": 49458 + }, + { + "epoch": 0.96, + "learning_rate": 8.127839695545803e-09, + "loss": 0.0003, + "step": 49459 + }, + { + "epoch": 0.96, + "learning_rate": 8.123956351209661e-09, + "loss": 0.0024, + "step": 49460 + }, + { + "epoch": 0.96, + "learning_rate": 8.12007300687352e-09, + "loss": 0.0003, + "step": 49461 + }, + { + "epoch": 0.96, + "learning_rate": 8.116189662537378e-09, + "loss": 0.0004, + "step": 49462 + }, + { + "epoch": 0.96, + "learning_rate": 8.112306318201234e-09, + "loss": 0.0003, + "step": 49463 + }, + { + "epoch": 0.96, + "learning_rate": 8.108422973865093e-09, + "loss": 0.0005, + "step": 49464 + }, + { + "epoch": 0.96, + "learning_rate": 8.104539629528951e-09, + "loss": 0.0003, + "step": 49465 + }, + { + "epoch": 0.96, + "learning_rate": 8.100656285192807e-09, + "loss": 0.0006, + "step": 49466 + }, + { + "epoch": 0.96, + "learning_rate": 8.096772940856666e-09, + "loss": 0.0005, + "step": 49467 + }, + { + "epoch": 0.96, + "learning_rate": 8.092889596520524e-09, + "loss": 0.0003, + "step": 49468 + }, + { + "epoch": 0.96, + "learning_rate": 8.08900625218438e-09, + "loss": 0.0003, + "step": 49469 + }, + { + "epoch": 0.96, + "learning_rate": 8.085122907848239e-09, + "loss": 0.0005, + "step": 49470 + }, + { + "epoch": 0.96, + "learning_rate": 8.081239563512095e-09, + "loss": 0.0007, + "step": 49471 + }, + { + "epoch": 0.96, + "learning_rate": 8.077356219175954e-09, + "loss": 0.0004, + "step": 49472 + }, + { + "epoch": 0.96, + "learning_rate": 8.073472874839812e-09, + "loss": 0.0005, + "step": 49473 + }, + { + "epoch": 0.96, + "learning_rate": 8.069589530503668e-09, + "loss": 0.0003, + "step": 49474 + }, + { + "epoch": 0.96, + "learning_rate": 8.065706186167527e-09, + "loss": 0.0017, + "step": 49475 + }, + { + "epoch": 0.96, + "learning_rate": 8.061822841831385e-09, + "loss": 0.0005, + "step": 49476 + }, + { + "epoch": 0.96, + "learning_rate": 8.057939497495242e-09, + "loss": 0.0004, + "step": 49477 + }, + { + "epoch": 0.96, + "learning_rate": 8.0540561531591e-09, + "loss": 0.0004, + "step": 49478 + }, + { + "epoch": 0.96, + "learning_rate": 8.050172808822958e-09, + "loss": 0.0004, + "step": 49479 + }, + { + "epoch": 0.96, + "learning_rate": 8.046289464486816e-09, + "loss": 0.0003, + "step": 49480 + }, + { + "epoch": 0.96, + "learning_rate": 8.042406120150673e-09, + "loss": 0.0004, + "step": 49481 + }, + { + "epoch": 0.96, + "learning_rate": 8.038522775814531e-09, + "loss": 0.0004, + "step": 49482 + }, + { + "epoch": 0.96, + "learning_rate": 8.03463943147839e-09, + "loss": 0.0003, + "step": 49483 + }, + { + "epoch": 0.96, + "learning_rate": 8.030756087142248e-09, + "loss": 0.6633, + "step": 49484 + }, + { + "epoch": 0.96, + "learning_rate": 8.026872742806104e-09, + "loss": 0.001, + "step": 49485 + }, + { + "epoch": 0.96, + "learning_rate": 8.022989398469962e-09, + "loss": 0.0003, + "step": 49486 + }, + { + "epoch": 0.96, + "learning_rate": 8.01910605413382e-09, + "loss": 0.0005, + "step": 49487 + }, + { + "epoch": 0.96, + "learning_rate": 8.015222709797677e-09, + "loss": 0.0003, + "step": 49488 + }, + { + "epoch": 0.96, + "learning_rate": 8.011339365461535e-09, + "loss": 0.0005, + "step": 49489 + }, + { + "epoch": 0.96, + "learning_rate": 8.007456021125394e-09, + "loss": 0.6967, + "step": 49490 + }, + { + "epoch": 0.96, + "learning_rate": 8.00357267678925e-09, + "loss": 0.0004, + "step": 49491 + }, + { + "epoch": 0.96, + "learning_rate": 7.999689332453109e-09, + "loss": 0.6021, + "step": 49492 + }, + { + "epoch": 0.96, + "learning_rate": 7.995805988116965e-09, + "loss": 0.0005, + "step": 49493 + }, + { + "epoch": 0.96, + "learning_rate": 7.991922643780823e-09, + "loss": 0.0008, + "step": 49494 + }, + { + "epoch": 0.96, + "learning_rate": 7.98803929944468e-09, + "loss": 0.0003, + "step": 49495 + }, + { + "epoch": 0.96, + "learning_rate": 7.984155955108538e-09, + "loss": 0.3248, + "step": 49496 + }, + { + "epoch": 0.96, + "learning_rate": 7.980272610772396e-09, + "loss": 0.0009, + "step": 49497 + }, + { + "epoch": 0.96, + "learning_rate": 7.976389266436255e-09, + "loss": 0.0005, + "step": 49498 + }, + { + "epoch": 0.96, + "learning_rate": 7.972505922100111e-09, + "loss": 0.0005, + "step": 49499 + }, + { + "epoch": 0.96, + "learning_rate": 7.96862257776397e-09, + "loss": 0.0003, + "step": 49500 + }, + { + "epoch": 0.96, + "learning_rate": 7.964739233427828e-09, + "loss": 0.0004, + "step": 49501 + }, + { + "epoch": 0.96, + "learning_rate": 7.960855889091686e-09, + "loss": 0.0005, + "step": 49502 + }, + { + "epoch": 0.96, + "learning_rate": 7.956972544755543e-09, + "loss": 0.0004, + "step": 49503 + }, + { + "epoch": 0.96, + "learning_rate": 7.953089200419401e-09, + "loss": 0.0078, + "step": 49504 + }, + { + "epoch": 0.96, + "learning_rate": 7.949205856083259e-09, + "loss": 0.0007, + "step": 49505 + }, + { + "epoch": 0.96, + "learning_rate": 7.945322511747116e-09, + "loss": 0.0003, + "step": 49506 + }, + { + "epoch": 0.96, + "learning_rate": 7.941439167410974e-09, + "loss": 0.0007, + "step": 49507 + }, + { + "epoch": 0.96, + "learning_rate": 7.937555823074832e-09, + "loss": 0.0004, + "step": 49508 + }, + { + "epoch": 0.96, + "learning_rate": 7.93367247873869e-09, + "loss": 0.0024, + "step": 49509 + }, + { + "epoch": 0.96, + "learning_rate": 7.929789134402547e-09, + "loss": 0.0004, + "step": 49510 + }, + { + "epoch": 0.96, + "learning_rate": 7.925905790066405e-09, + "loss": 0.0005, + "step": 49511 + }, + { + "epoch": 0.96, + "learning_rate": 7.922022445730264e-09, + "loss": 0.0004, + "step": 49512 + }, + { + "epoch": 0.96, + "learning_rate": 7.918139101394122e-09, + "loss": 0.0004, + "step": 49513 + }, + { + "epoch": 0.96, + "learning_rate": 7.914255757057978e-09, + "loss": 0.0004, + "step": 49514 + }, + { + "epoch": 0.96, + "learning_rate": 7.910372412721835e-09, + "loss": 0.0007, + "step": 49515 + }, + { + "epoch": 0.96, + "learning_rate": 7.906489068385693e-09, + "loss": 0.0004, + "step": 49516 + }, + { + "epoch": 0.96, + "learning_rate": 7.90260572404955e-09, + "loss": 0.6, + "step": 49517 + }, + { + "epoch": 0.96, + "learning_rate": 7.898722379713408e-09, + "loss": 0.0003, + "step": 49518 + }, + { + "epoch": 0.96, + "learning_rate": 7.894839035377266e-09, + "loss": 0.0004, + "step": 49519 + }, + { + "epoch": 0.96, + "learning_rate": 7.890955691041125e-09, + "loss": 0.0006, + "step": 49520 + }, + { + "epoch": 0.96, + "learning_rate": 7.887072346704981e-09, + "loss": 0.0004, + "step": 49521 + }, + { + "epoch": 0.96, + "learning_rate": 7.88318900236884e-09, + "loss": 0.0004, + "step": 49522 + }, + { + "epoch": 0.96, + "learning_rate": 7.879305658032698e-09, + "loss": 0.0006, + "step": 49523 + }, + { + "epoch": 0.96, + "learning_rate": 7.875422313696554e-09, + "loss": 0.0003, + "step": 49524 + }, + { + "epoch": 0.96, + "learning_rate": 7.871538969360412e-09, + "loss": 0.0004, + "step": 49525 + }, + { + "epoch": 0.96, + "learning_rate": 7.86765562502427e-09, + "loss": 0.0008, + "step": 49526 + }, + { + "epoch": 0.96, + "learning_rate": 7.863772280688129e-09, + "loss": 0.0006, + "step": 49527 + }, + { + "epoch": 0.96, + "learning_rate": 7.859888936351986e-09, + "loss": 0.0005, + "step": 49528 + }, + { + "epoch": 0.96, + "learning_rate": 7.856005592015844e-09, + "loss": 0.0012, + "step": 49529 + }, + { + "epoch": 0.96, + "learning_rate": 7.852122247679702e-09, + "loss": 0.0015, + "step": 49530 + }, + { + "epoch": 0.96, + "learning_rate": 7.84823890334356e-09, + "loss": 0.0037, + "step": 49531 + }, + { + "epoch": 0.96, + "learning_rate": 7.844355559007417e-09, + "loss": 0.0005, + "step": 49532 + }, + { + "epoch": 0.96, + "learning_rate": 7.840472214671275e-09, + "loss": 0.0007, + "step": 49533 + }, + { + "epoch": 0.96, + "learning_rate": 7.836588870335133e-09, + "loss": 0.0004, + "step": 49534 + }, + { + "epoch": 0.96, + "learning_rate": 7.83270552599899e-09, + "loss": 0.0008, + "step": 49535 + }, + { + "epoch": 0.96, + "learning_rate": 7.828822181662848e-09, + "loss": 0.0003, + "step": 49536 + }, + { + "epoch": 0.96, + "learning_rate": 7.824938837326705e-09, + "loss": 0.0005, + "step": 49537 + }, + { + "epoch": 0.96, + "learning_rate": 7.821055492990563e-09, + "loss": 0.0004, + "step": 49538 + }, + { + "epoch": 0.96, + "learning_rate": 7.81717214865442e-09, + "loss": 0.0003, + "step": 49539 + }, + { + "epoch": 0.96, + "learning_rate": 7.813288804318278e-09, + "loss": 0.0003, + "step": 49540 + }, + { + "epoch": 0.96, + "learning_rate": 7.809405459982136e-09, + "loss": 0.0005, + "step": 49541 + }, + { + "epoch": 0.96, + "learning_rate": 7.805522115645994e-09, + "loss": 0.0067, + "step": 49542 + }, + { + "epoch": 0.96, + "learning_rate": 7.801638771309851e-09, + "loss": 0.0003, + "step": 49543 + }, + { + "epoch": 0.96, + "learning_rate": 7.797755426973709e-09, + "loss": 0.069, + "step": 49544 + }, + { + "epoch": 0.96, + "learning_rate": 7.793872082637567e-09, + "loss": 0.0004, + "step": 49545 + }, + { + "epoch": 0.96, + "learning_rate": 7.789988738301424e-09, + "loss": 0.0004, + "step": 49546 + }, + { + "epoch": 0.96, + "learning_rate": 7.786105393965282e-09, + "loss": 0.0004, + "step": 49547 + }, + { + "epoch": 0.96, + "learning_rate": 7.78222204962914e-09, + "loss": 1.3246, + "step": 49548 + }, + { + "epoch": 0.96, + "learning_rate": 7.778338705292999e-09, + "loss": 0.0003, + "step": 49549 + }, + { + "epoch": 0.96, + "learning_rate": 7.774455360956855e-09, + "loss": 0.0005, + "step": 49550 + }, + { + "epoch": 0.96, + "learning_rate": 7.770572016620714e-09, + "loss": 0.0002, + "step": 49551 + }, + { + "epoch": 0.96, + "learning_rate": 7.766688672284572e-09, + "loss": 0.1403, + "step": 49552 + }, + { + "epoch": 0.96, + "learning_rate": 7.762805327948428e-09, + "loss": 0.0003, + "step": 49553 + }, + { + "epoch": 0.96, + "learning_rate": 7.758921983612287e-09, + "loss": 0.0003, + "step": 49554 + }, + { + "epoch": 0.96, + "learning_rate": 7.755038639276145e-09, + "loss": 0.0002, + "step": 49555 + }, + { + "epoch": 0.96, + "learning_rate": 7.751155294940003e-09, + "loss": 0.0003, + "step": 49556 + }, + { + "epoch": 0.96, + "learning_rate": 7.74727195060386e-09, + "loss": 0.0067, + "step": 49557 + }, + { + "epoch": 0.96, + "learning_rate": 7.743388606267718e-09, + "loss": 0.0004, + "step": 49558 + }, + { + "epoch": 0.96, + "learning_rate": 7.739505261931576e-09, + "loss": 0.0003, + "step": 49559 + }, + { + "epoch": 0.96, + "learning_rate": 7.735621917595433e-09, + "loss": 0.0004, + "step": 49560 + }, + { + "epoch": 0.96, + "learning_rate": 7.73173857325929e-09, + "loss": 0.0003, + "step": 49561 + }, + { + "epoch": 0.96, + "learning_rate": 7.727855228923148e-09, + "loss": 0.0005, + "step": 49562 + }, + { + "epoch": 0.96, + "learning_rate": 7.723971884587006e-09, + "loss": 0.0004, + "step": 49563 + }, + { + "epoch": 0.96, + "learning_rate": 7.720088540250862e-09, + "loss": 0.0004, + "step": 49564 + }, + { + "epoch": 0.96, + "learning_rate": 7.71620519591472e-09, + "loss": 0.0005, + "step": 49565 + }, + { + "epoch": 0.96, + "learning_rate": 7.712321851578579e-09, + "loss": 0.0005, + "step": 49566 + }, + { + "epoch": 0.96, + "learning_rate": 7.708438507242437e-09, + "loss": 0.0004, + "step": 49567 + }, + { + "epoch": 0.96, + "learning_rate": 7.704555162906294e-09, + "loss": 0.0003, + "step": 49568 + }, + { + "epoch": 0.96, + "learning_rate": 7.700671818570152e-09, + "loss": 0.0003, + "step": 49569 + }, + { + "epoch": 0.96, + "learning_rate": 7.69678847423401e-09, + "loss": 0.0004, + "step": 49570 + }, + { + "epoch": 0.96, + "learning_rate": 7.692905129897869e-09, + "loss": 0.0005, + "step": 49571 + }, + { + "epoch": 0.96, + "learning_rate": 7.689021785561725e-09, + "loss": 0.0004, + "step": 49572 + }, + { + "epoch": 0.96, + "learning_rate": 7.685138441225583e-09, + "loss": 0.0002, + "step": 49573 + }, + { + "epoch": 0.96, + "learning_rate": 7.681255096889442e-09, + "loss": 0.0003, + "step": 49574 + }, + { + "epoch": 0.96, + "learning_rate": 7.677371752553298e-09, + "loss": 0.0003, + "step": 49575 + }, + { + "epoch": 0.96, + "learning_rate": 7.673488408217156e-09, + "loss": 0.0005, + "step": 49576 + }, + { + "epoch": 0.96, + "learning_rate": 7.669605063881015e-09, + "loss": 0.0003, + "step": 49577 + }, + { + "epoch": 0.96, + "learning_rate": 7.665721719544873e-09, + "loss": 0.0004, + "step": 49578 + }, + { + "epoch": 0.96, + "learning_rate": 7.66183837520873e-09, + "loss": 0.0005, + "step": 49579 + }, + { + "epoch": 0.96, + "learning_rate": 7.657955030872588e-09, + "loss": 0.0004, + "step": 49580 + }, + { + "epoch": 0.96, + "learning_rate": 7.654071686536446e-09, + "loss": 0.0004, + "step": 49581 + }, + { + "epoch": 0.96, + "learning_rate": 7.650188342200303e-09, + "loss": 0.0003, + "step": 49582 + }, + { + "epoch": 0.96, + "learning_rate": 7.64630499786416e-09, + "loss": 0.0002, + "step": 49583 + }, + { + "epoch": 0.96, + "learning_rate": 7.642421653528017e-09, + "loss": 0.0005, + "step": 49584 + }, + { + "epoch": 0.96, + "learning_rate": 7.638538309191876e-09, + "loss": 0.0003, + "step": 49585 + }, + { + "epoch": 0.96, + "learning_rate": 7.634654964855732e-09, + "loss": 0.0003, + "step": 49586 + }, + { + "epoch": 0.96, + "learning_rate": 7.63077162051959e-09, + "loss": 0.0003, + "step": 49587 + }, + { + "epoch": 0.96, + "learning_rate": 7.626888276183449e-09, + "loss": 0.0006, + "step": 49588 + }, + { + "epoch": 0.96, + "learning_rate": 7.623004931847307e-09, + "loss": 0.006, + "step": 49589 + }, + { + "epoch": 0.96, + "learning_rate": 7.619121587511164e-09, + "loss": 0.0004, + "step": 49590 + }, + { + "epoch": 0.96, + "learning_rate": 7.615238243175022e-09, + "loss": 0.0003, + "step": 49591 + }, + { + "epoch": 0.96, + "learning_rate": 7.61135489883888e-09, + "loss": 0.0347, + "step": 49592 + }, + { + "epoch": 0.96, + "learning_rate": 7.607471554502737e-09, + "loss": 0.001, + "step": 49593 + }, + { + "epoch": 0.96, + "learning_rate": 7.603588210166595e-09, + "loss": 0.1108, + "step": 49594 + }, + { + "epoch": 0.96, + "learning_rate": 7.599704865830453e-09, + "loss": 0.0004, + "step": 49595 + }, + { + "epoch": 0.96, + "learning_rate": 7.595821521494311e-09, + "loss": 0.0004, + "step": 49596 + }, + { + "epoch": 0.96, + "learning_rate": 7.591938177158168e-09, + "loss": 0.0004, + "step": 49597 + }, + { + "epoch": 0.96, + "learning_rate": 7.588054832822026e-09, + "loss": 0.0006, + "step": 49598 + }, + { + "epoch": 0.96, + "learning_rate": 7.584171488485884e-09, + "loss": 0.0003, + "step": 49599 + }, + { + "epoch": 0.96, + "learning_rate": 7.580288144149743e-09, + "loss": 0.0006, + "step": 49600 + }, + { + "epoch": 0.96, + "learning_rate": 7.5764047998136e-09, + "loss": 0.0003, + "step": 49601 + }, + { + "epoch": 0.96, + "learning_rate": 7.572521455477458e-09, + "loss": 0.0002, + "step": 49602 + }, + { + "epoch": 0.96, + "learning_rate": 7.568638111141316e-09, + "loss": 0.0057, + "step": 49603 + }, + { + "epoch": 0.96, + "learning_rate": 7.564754766805172e-09, + "loss": 0.0004, + "step": 49604 + }, + { + "epoch": 0.96, + "learning_rate": 7.56087142246903e-09, + "loss": 0.0005, + "step": 49605 + }, + { + "epoch": 0.96, + "learning_rate": 7.556988078132887e-09, + "loss": 0.0004, + "step": 49606 + }, + { + "epoch": 0.96, + "learning_rate": 7.553104733796745e-09, + "loss": 0.0006, + "step": 49607 + }, + { + "epoch": 0.96, + "learning_rate": 7.549221389460602e-09, + "loss": 0.0003, + "step": 49608 + }, + { + "epoch": 0.96, + "learning_rate": 7.54533804512446e-09, + "loss": 0.2703, + "step": 49609 + }, + { + "epoch": 0.96, + "learning_rate": 7.541454700788319e-09, + "loss": 0.0003, + "step": 49610 + }, + { + "epoch": 0.96, + "learning_rate": 7.537571356452175e-09, + "loss": 0.0005, + "step": 49611 + }, + { + "epoch": 0.96, + "learning_rate": 7.533688012116033e-09, + "loss": 0.0004, + "step": 49612 + }, + { + "epoch": 0.96, + "learning_rate": 7.529804667779892e-09, + "loss": 0.0003, + "step": 49613 + }, + { + "epoch": 0.96, + "learning_rate": 7.52592132344375e-09, + "loss": 0.0006, + "step": 49614 + }, + { + "epoch": 0.96, + "learning_rate": 7.522037979107606e-09, + "loss": 0.0004, + "step": 49615 + }, + { + "epoch": 0.96, + "learning_rate": 7.518154634771465e-09, + "loss": 0.0004, + "step": 49616 + }, + { + "epoch": 0.96, + "learning_rate": 7.514271290435323e-09, + "loss": 0.0004, + "step": 49617 + }, + { + "epoch": 0.96, + "learning_rate": 7.510387946099181e-09, + "loss": 0.8572, + "step": 49618 + }, + { + "epoch": 0.96, + "learning_rate": 7.506504601763038e-09, + "loss": 0.8683, + "step": 49619 + }, + { + "epoch": 0.96, + "learning_rate": 7.502621257426896e-09, + "loss": 0.0003, + "step": 49620 + }, + { + "epoch": 0.96, + "learning_rate": 7.498737913090754e-09, + "loss": 0.0004, + "step": 49621 + }, + { + "epoch": 0.96, + "learning_rate": 7.494854568754611e-09, + "loss": 0.0003, + "step": 49622 + }, + { + "epoch": 0.96, + "learning_rate": 7.490971224418469e-09, + "loss": 0.0003, + "step": 49623 + }, + { + "epoch": 0.96, + "learning_rate": 7.487087880082327e-09, + "loss": 0.0003, + "step": 49624 + }, + { + "epoch": 0.96, + "learning_rate": 7.483204535746186e-09, + "loss": 0.0003, + "step": 49625 + }, + { + "epoch": 0.96, + "learning_rate": 7.479321191410042e-09, + "loss": 0.0004, + "step": 49626 + }, + { + "epoch": 0.96, + "learning_rate": 7.4754378470739e-09, + "loss": 0.0004, + "step": 49627 + }, + { + "epoch": 0.96, + "learning_rate": 7.471554502737757e-09, + "loss": 0.0006, + "step": 49628 + }, + { + "epoch": 0.96, + "learning_rate": 7.467671158401615e-09, + "loss": 0.0004, + "step": 49629 + }, + { + "epoch": 0.96, + "learning_rate": 7.463787814065472e-09, + "loss": 0.0313, + "step": 49630 + }, + { + "epoch": 0.96, + "learning_rate": 7.45990446972933e-09, + "loss": 0.0003, + "step": 49631 + }, + { + "epoch": 0.96, + "learning_rate": 7.456021125393188e-09, + "loss": 0.0007, + "step": 49632 + }, + { + "epoch": 0.96, + "learning_rate": 7.452137781057045e-09, + "loss": 0.0003, + "step": 49633 + }, + { + "epoch": 0.96, + "learning_rate": 7.448254436720903e-09, + "loss": 0.0004, + "step": 49634 + }, + { + "epoch": 0.96, + "learning_rate": 7.444371092384761e-09, + "loss": 0.029, + "step": 49635 + }, + { + "epoch": 0.96, + "learning_rate": 7.44048774804862e-09, + "loss": 0.0005, + "step": 49636 + }, + { + "epoch": 0.96, + "learning_rate": 7.436604403712476e-09, + "loss": 0.0004, + "step": 49637 + }, + { + "epoch": 0.96, + "learning_rate": 7.4327210593763345e-09, + "loss": 0.0004, + "step": 49638 + }, + { + "epoch": 0.96, + "learning_rate": 7.428837715040193e-09, + "loss": 0.011, + "step": 49639 + }, + { + "epoch": 0.96, + "learning_rate": 7.424954370704049e-09, + "loss": 0.0004, + "step": 49640 + }, + { + "epoch": 0.96, + "learning_rate": 7.4210710263679076e-09, + "loss": 1.2485, + "step": 49641 + }, + { + "epoch": 0.96, + "learning_rate": 7.417187682031766e-09, + "loss": 0.0006, + "step": 49642 + }, + { + "epoch": 0.96, + "learning_rate": 7.413304337695624e-09, + "loss": 0.0003, + "step": 49643 + }, + { + "epoch": 0.96, + "learning_rate": 7.409420993359481e-09, + "loss": 0.0004, + "step": 49644 + }, + { + "epoch": 0.96, + "learning_rate": 7.405537649023338e-09, + "loss": 0.0004, + "step": 49645 + }, + { + "epoch": 0.96, + "learning_rate": 7.401654304687196e-09, + "loss": 0.0004, + "step": 49646 + }, + { + "epoch": 0.96, + "learning_rate": 7.3977709603510545e-09, + "loss": 0.0514, + "step": 49647 + }, + { + "epoch": 0.96, + "learning_rate": 7.393887616014911e-09, + "loss": 0.0011, + "step": 49648 + }, + { + "epoch": 0.96, + "learning_rate": 7.390004271678769e-09, + "loss": 0.0009, + "step": 49649 + }, + { + "epoch": 0.96, + "learning_rate": 7.386120927342628e-09, + "loss": 0.0004, + "step": 49650 + }, + { + "epoch": 0.96, + "learning_rate": 7.382237583006484e-09, + "loss": 0.0003, + "step": 49651 + }, + { + "epoch": 0.96, + "learning_rate": 7.3783542386703425e-09, + "loss": 0.0014, + "step": 49652 + }, + { + "epoch": 0.96, + "learning_rate": 7.374470894334201e-09, + "loss": 0.0003, + "step": 49653 + }, + { + "epoch": 0.96, + "learning_rate": 7.370587549998059e-09, + "loss": 0.5682, + "step": 49654 + }, + { + "epoch": 0.96, + "learning_rate": 7.3667042056619155e-09, + "loss": 0.0005, + "step": 49655 + }, + { + "epoch": 0.96, + "learning_rate": 7.362820861325773e-09, + "loss": 0.0004, + "step": 49656 + }, + { + "epoch": 0.96, + "learning_rate": 7.358937516989631e-09, + "loss": 0.0003, + "step": 49657 + }, + { + "epoch": 0.96, + "learning_rate": 7.3550541726534894e-09, + "loss": 0.0003, + "step": 49658 + }, + { + "epoch": 0.96, + "learning_rate": 7.351170828317346e-09, + "loss": 0.0074, + "step": 49659 + }, + { + "epoch": 0.96, + "learning_rate": 7.347287483981204e-09, + "loss": 0.201, + "step": 49660 + }, + { + "epoch": 0.96, + "learning_rate": 7.3434041396450625e-09, + "loss": 0.0005, + "step": 49661 + }, + { + "epoch": 0.96, + "learning_rate": 7.339520795308919e-09, + "loss": 0.0003, + "step": 49662 + }, + { + "epoch": 0.96, + "learning_rate": 7.335637450972777e-09, + "loss": 0.0005, + "step": 49663 + }, + { + "epoch": 0.96, + "learning_rate": 7.331754106636636e-09, + "loss": 0.0002, + "step": 49664 + }, + { + "epoch": 0.96, + "learning_rate": 7.327870762300494e-09, + "loss": 0.0004, + "step": 49665 + }, + { + "epoch": 0.96, + "learning_rate": 7.3239874179643504e-09, + "loss": 0.0003, + "step": 49666 + }, + { + "epoch": 0.96, + "learning_rate": 7.320104073628208e-09, + "loss": 0.0036, + "step": 49667 + }, + { + "epoch": 0.96, + "learning_rate": 7.316220729292066e-09, + "loss": 0.0003, + "step": 49668 + }, + { + "epoch": 0.96, + "learning_rate": 7.312337384955923e-09, + "loss": 0.0004, + "step": 49669 + }, + { + "epoch": 0.96, + "learning_rate": 7.308454040619781e-09, + "loss": 0.0003, + "step": 49670 + }, + { + "epoch": 0.96, + "learning_rate": 7.304570696283639e-09, + "loss": 0.0003, + "step": 49671 + }, + { + "epoch": 0.96, + "learning_rate": 7.3006873519474974e-09, + "loss": 0.0007, + "step": 49672 + }, + { + "epoch": 0.96, + "learning_rate": 7.296804007611354e-09, + "loss": 0.0008, + "step": 49673 + }, + { + "epoch": 0.96, + "learning_rate": 7.292920663275212e-09, + "loss": 0.0004, + "step": 49674 + }, + { + "epoch": 0.96, + "learning_rate": 7.2890373189390705e-09, + "loss": 0.0003, + "step": 49675 + }, + { + "epoch": 0.96, + "learning_rate": 7.285153974602929e-09, + "loss": 0.0004, + "step": 49676 + }, + { + "epoch": 0.96, + "learning_rate": 7.281270630266785e-09, + "loss": 0.0005, + "step": 49677 + }, + { + "epoch": 0.96, + "learning_rate": 7.2773872859306436e-09, + "loss": 0.0004, + "step": 49678 + }, + { + "epoch": 0.96, + "learning_rate": 7.273503941594501e-09, + "loss": 0.0002, + "step": 49679 + }, + { + "epoch": 0.96, + "learning_rate": 7.2696205972583576e-09, + "loss": 0.0003, + "step": 49680 + }, + { + "epoch": 0.96, + "learning_rate": 7.265737252922216e-09, + "loss": 0.0004, + "step": 49681 + }, + { + "epoch": 0.96, + "learning_rate": 7.261853908586074e-09, + "loss": 0.0011, + "step": 49682 + }, + { + "epoch": 0.96, + "learning_rate": 7.257970564249932e-09, + "loss": 0.0004, + "step": 49683 + }, + { + "epoch": 0.96, + "learning_rate": 7.254087219913789e-09, + "loss": 0.234, + "step": 49684 + }, + { + "epoch": 0.96, + "learning_rate": 7.250203875577647e-09, + "loss": 0.0005, + "step": 49685 + }, + { + "epoch": 0.96, + "learning_rate": 7.246320531241505e-09, + "loss": 0.6414, + "step": 49686 + }, + { + "epoch": 0.96, + "learning_rate": 7.242437186905364e-09, + "loss": 0.0004, + "step": 49687 + }, + { + "epoch": 0.96, + "learning_rate": 7.23855384256922e-09, + "loss": 0.0007, + "step": 49688 + }, + { + "epoch": 0.96, + "learning_rate": 7.2346704982330785e-09, + "loss": 0.0004, + "step": 49689 + }, + { + "epoch": 0.96, + "learning_rate": 7.230787153896936e-09, + "loss": 0.0004, + "step": 49690 + }, + { + "epoch": 0.96, + "learning_rate": 7.2269038095607925e-09, + "loss": 0.0064, + "step": 49691 + }, + { + "epoch": 0.96, + "learning_rate": 7.223020465224651e-09, + "loss": 0.0003, + "step": 49692 + }, + { + "epoch": 0.96, + "learning_rate": 7.219137120888509e-09, + "loss": 0.0004, + "step": 49693 + }, + { + "epoch": 0.96, + "learning_rate": 7.215253776552367e-09, + "loss": 0.0004, + "step": 49694 + }, + { + "epoch": 0.96, + "learning_rate": 7.211370432216224e-09, + "loss": 0.0004, + "step": 49695 + }, + { + "epoch": 0.96, + "learning_rate": 7.207487087880082e-09, + "loss": 0.055, + "step": 49696 + }, + { + "epoch": 0.96, + "learning_rate": 7.20360374354394e-09, + "loss": 0.0004, + "step": 49697 + }, + { + "epoch": 0.96, + "learning_rate": 7.199720399207797e-09, + "loss": 0.0005, + "step": 49698 + }, + { + "epoch": 0.96, + "learning_rate": 7.195837054871655e-09, + "loss": 0.0003, + "step": 49699 + }, + { + "epoch": 0.96, + "learning_rate": 7.191953710535513e-09, + "loss": 0.0005, + "step": 49700 + }, + { + "epoch": 0.96, + "learning_rate": 7.188070366199371e-09, + "loss": 1.0422, + "step": 49701 + }, + { + "epoch": 0.96, + "learning_rate": 7.184187021863227e-09, + "loss": 0.0004, + "step": 49702 + }, + { + "epoch": 0.96, + "learning_rate": 7.180303677527086e-09, + "loss": 0.0003, + "step": 49703 + }, + { + "epoch": 0.96, + "learning_rate": 7.176420333190944e-09, + "loss": 0.0004, + "step": 49704 + }, + { + "epoch": 0.96, + "learning_rate": 7.172536988854802e-09, + "loss": 0.0007, + "step": 49705 + }, + { + "epoch": 0.96, + "learning_rate": 7.168653644518659e-09, + "loss": 0.0005, + "step": 49706 + }, + { + "epoch": 0.96, + "learning_rate": 7.164770300182517e-09, + "loss": 0.0004, + "step": 49707 + }, + { + "epoch": 0.96, + "learning_rate": 7.160886955846375e-09, + "loss": 0.0004, + "step": 49708 + }, + { + "epoch": 0.96, + "learning_rate": 7.157003611510232e-09, + "loss": 0.0009, + "step": 49709 + }, + { + "epoch": 0.96, + "learning_rate": 7.15312026717409e-09, + "loss": 0.0006, + "step": 49710 + }, + { + "epoch": 0.96, + "learning_rate": 7.149236922837948e-09, + "loss": 0.0004, + "step": 49711 + }, + { + "epoch": 0.96, + "learning_rate": 7.145353578501806e-09, + "loss": 0.0004, + "step": 49712 + }, + { + "epoch": 0.96, + "learning_rate": 7.141470234165663e-09, + "loss": 0.0492, + "step": 49713 + }, + { + "epoch": 0.96, + "learning_rate": 7.1375868898295205e-09, + "loss": 0.0003, + "step": 49714 + }, + { + "epoch": 0.96, + "learning_rate": 7.133703545493379e-09, + "loss": 0.0096, + "step": 49715 + }, + { + "epoch": 0.96, + "learning_rate": 7.129820201157237e-09, + "loss": 0.0004, + "step": 49716 + }, + { + "epoch": 0.96, + "learning_rate": 7.125936856821094e-09, + "loss": 0.0004, + "step": 49717 + }, + { + "epoch": 0.96, + "learning_rate": 7.122053512484952e-09, + "loss": 0.0004, + "step": 49718 + }, + { + "epoch": 0.96, + "learning_rate": 7.11817016814881e-09, + "loss": 0.0004, + "step": 49719 + }, + { + "epoch": 0.96, + "learning_rate": 7.114286823812667e-09, + "loss": 0.0003, + "step": 49720 + }, + { + "epoch": 0.96, + "learning_rate": 7.110403479476525e-09, + "loss": 0.0013, + "step": 49721 + }, + { + "epoch": 0.96, + "learning_rate": 7.106520135140383e-09, + "loss": 0.0003, + "step": 49722 + }, + { + "epoch": 0.96, + "learning_rate": 7.1026367908042406e-09, + "loss": 0.0004, + "step": 49723 + }, + { + "epoch": 0.96, + "learning_rate": 7.098753446468098e-09, + "loss": 0.0003, + "step": 49724 + }, + { + "epoch": 0.96, + "learning_rate": 7.0948701021319554e-09, + "loss": 0.011, + "step": 49725 + }, + { + "epoch": 0.96, + "learning_rate": 7.090986757795814e-09, + "loss": 0.0004, + "step": 49726 + }, + { + "epoch": 0.96, + "learning_rate": 7.08710341345967e-09, + "loss": 0.0004, + "step": 49727 + }, + { + "epoch": 0.96, + "learning_rate": 7.0832200691235285e-09, + "loss": 0.0004, + "step": 49728 + }, + { + "epoch": 0.96, + "learning_rate": 7.079336724787387e-09, + "loss": 0.0006, + "step": 49729 + }, + { + "epoch": 0.96, + "learning_rate": 7.075453380451245e-09, + "loss": 0.0004, + "step": 49730 + }, + { + "epoch": 0.96, + "learning_rate": 7.0715700361151016e-09, + "loss": 0.0033, + "step": 49731 + }, + { + "epoch": 0.96, + "learning_rate": 7.06768669177896e-09, + "loss": 0.0003, + "step": 49732 + }, + { + "epoch": 0.96, + "learning_rate": 7.063803347442818e-09, + "loss": 0.0005, + "step": 49733 + }, + { + "epoch": 0.96, + "learning_rate": 7.0599200031066755e-09, + "loss": 0.0003, + "step": 49734 + }, + { + "epoch": 0.96, + "learning_rate": 7.056036658770533e-09, + "loss": 0.0003, + "step": 49735 + }, + { + "epoch": 0.96, + "learning_rate": 7.05215331443439e-09, + "loss": 0.0005, + "step": 49736 + }, + { + "epoch": 0.96, + "learning_rate": 7.0482699700982486e-09, + "loss": 0.9185, + "step": 49737 + }, + { + "epoch": 0.96, + "learning_rate": 7.044386625762105e-09, + "loss": 0.0003, + "step": 49738 + }, + { + "epoch": 0.96, + "learning_rate": 7.040503281425963e-09, + "loss": 0.0006, + "step": 49739 + }, + { + "epoch": 0.96, + "learning_rate": 7.036619937089822e-09, + "loss": 1.1088, + "step": 49740 + }, + { + "epoch": 0.96, + "learning_rate": 7.03273659275368e-09, + "loss": 0.0003, + "step": 49741 + }, + { + "epoch": 0.96, + "learning_rate": 7.0288532484175365e-09, + "loss": 0.0003, + "step": 49742 + }, + { + "epoch": 0.96, + "learning_rate": 7.024969904081395e-09, + "loss": 0.4479, + "step": 49743 + }, + { + "epoch": 0.96, + "learning_rate": 7.021086559745253e-09, + "loss": 0.0004, + "step": 49744 + }, + { + "epoch": 0.96, + "learning_rate": 7.01720321540911e-09, + "loss": 1.0599, + "step": 49745 + }, + { + "epoch": 0.96, + "learning_rate": 7.013319871072968e-09, + "loss": 0.0004, + "step": 49746 + }, + { + "epoch": 0.96, + "learning_rate": 7.009436526736825e-09, + "loss": 0.0027, + "step": 49747 + }, + { + "epoch": 0.97, + "learning_rate": 7.0055531824006835e-09, + "loss": 0.0003, + "step": 49748 + }, + { + "epoch": 0.97, + "learning_rate": 7.00166983806454e-09, + "loss": 0.0004, + "step": 49749 + }, + { + "epoch": 0.97, + "learning_rate": 6.997786493728398e-09, + "loss": 0.0004, + "step": 49750 + }, + { + "epoch": 0.97, + "learning_rate": 6.9939031493922565e-09, + "loss": 0.0004, + "step": 49751 + }, + { + "epoch": 0.97, + "learning_rate": 6.990019805056115e-09, + "loss": 0.0006, + "step": 49752 + }, + { + "epoch": 0.97, + "learning_rate": 6.986136460719971e-09, + "loss": 0.0005, + "step": 49753 + }, + { + "epoch": 0.97, + "learning_rate": 6.98225311638383e-09, + "loss": 0.0003, + "step": 49754 + }, + { + "epoch": 0.97, + "learning_rate": 6.978369772047688e-09, + "loss": 0.0005, + "step": 49755 + }, + { + "epoch": 0.97, + "learning_rate": 6.9744864277115444e-09, + "loss": 0.0735, + "step": 49756 + }, + { + "epoch": 0.97, + "learning_rate": 6.970603083375403e-09, + "loss": 0.0004, + "step": 49757 + }, + { + "epoch": 0.97, + "learning_rate": 6.96671973903926e-09, + "loss": 0.0005, + "step": 49758 + }, + { + "epoch": 0.97, + "learning_rate": 6.962836394703118e-09, + "loss": 0.0008, + "step": 49759 + }, + { + "epoch": 0.97, + "learning_rate": 6.958953050366975e-09, + "loss": 0.0008, + "step": 49760 + }, + { + "epoch": 0.97, + "learning_rate": 6.955069706030833e-09, + "loss": 0.0005, + "step": 49761 + }, + { + "epoch": 0.97, + "learning_rate": 6.9511863616946914e-09, + "loss": 0.0007, + "step": 49762 + }, + { + "epoch": 0.97, + "learning_rate": 6.94730301735855e-09, + "loss": 0.0004, + "step": 49763 + }, + { + "epoch": 0.97, + "learning_rate": 6.943419673022406e-09, + "loss": 0.0005, + "step": 49764 + }, + { + "epoch": 0.97, + "learning_rate": 6.9395363286862645e-09, + "loss": 0.2635, + "step": 49765 + }, + { + "epoch": 0.97, + "learning_rate": 6.935652984350123e-09, + "loss": 0.0003, + "step": 49766 + }, + { + "epoch": 0.97, + "learning_rate": 6.931769640013979e-09, + "loss": 0.0267, + "step": 49767 + }, + { + "epoch": 0.97, + "learning_rate": 6.9278862956778376e-09, + "loss": 0.0003, + "step": 49768 + }, + { + "epoch": 0.97, + "learning_rate": 6.924002951341695e-09, + "loss": 0.8063, + "step": 49769 + }, + { + "epoch": 0.97, + "learning_rate": 6.920119607005553e-09, + "loss": 0.0572, + "step": 49770 + }, + { + "epoch": 0.97, + "learning_rate": 6.91623626266941e-09, + "loss": 0.0004, + "step": 49771 + }, + { + "epoch": 0.97, + "learning_rate": 6.912352918333268e-09, + "loss": 0.0003, + "step": 49772 + }, + { + "epoch": 0.97, + "learning_rate": 6.908469573997126e-09, + "loss": 0.0006, + "step": 49773 + }, + { + "epoch": 0.97, + "learning_rate": 6.9045862296609846e-09, + "loss": 0.0003, + "step": 49774 + }, + { + "epoch": 0.97, + "learning_rate": 6.900702885324841e-09, + "loss": 0.0458, + "step": 49775 + }, + { + "epoch": 0.97, + "learning_rate": 6.896819540988699e-09, + "loss": 0.0007, + "step": 49776 + }, + { + "epoch": 0.97, + "learning_rate": 6.892936196652558e-09, + "loss": 0.0005, + "step": 49777 + }, + { + "epoch": 0.97, + "learning_rate": 6.889052852316414e-09, + "loss": 0.0005, + "step": 49778 + }, + { + "epoch": 0.97, + "learning_rate": 6.8851695079802725e-09, + "loss": 0.0003, + "step": 49779 + }, + { + "epoch": 0.97, + "learning_rate": 6.88128616364413e-09, + "loss": 0.0034, + "step": 49780 + }, + { + "epoch": 0.97, + "learning_rate": 6.877402819307988e-09, + "loss": 0.0005, + "step": 49781 + }, + { + "epoch": 0.97, + "learning_rate": 6.873519474971845e-09, + "loss": 0.0189, + "step": 49782 + }, + { + "epoch": 0.97, + "learning_rate": 6.869636130635703e-09, + "loss": 0.0005, + "step": 49783 + }, + { + "epoch": 0.97, + "learning_rate": 6.865752786299561e-09, + "loss": 0.0006, + "step": 49784 + }, + { + "epoch": 0.97, + "learning_rate": 6.861869441963418e-09, + "loss": 0.0004, + "step": 49785 + }, + { + "epoch": 0.97, + "learning_rate": 6.857986097627276e-09, + "loss": 0.0004, + "step": 49786 + }, + { + "epoch": 0.97, + "learning_rate": 6.854102753291134e-09, + "loss": 0.0004, + "step": 49787 + }, + { + "epoch": 0.97, + "learning_rate": 6.8502194089549925e-09, + "loss": 0.0005, + "step": 49788 + }, + { + "epoch": 0.97, + "learning_rate": 6.846336064618849e-09, + "loss": 0.0005, + "step": 49789 + }, + { + "epoch": 0.97, + "learning_rate": 6.842452720282707e-09, + "loss": 0.0005, + "step": 49790 + }, + { + "epoch": 0.97, + "learning_rate": 6.838569375946565e-09, + "loss": 0.0026, + "step": 49791 + }, + { + "epoch": 0.97, + "learning_rate": 6.834686031610423e-09, + "loss": 0.0004, + "step": 49792 + }, + { + "epoch": 0.97, + "learning_rate": 6.83080268727428e-09, + "loss": 0.0005, + "step": 49793 + }, + { + "epoch": 0.97, + "learning_rate": 6.826919342938138e-09, + "loss": 0.0004, + "step": 49794 + }, + { + "epoch": 0.97, + "learning_rate": 6.823035998601996e-09, + "loss": 0.0002, + "step": 49795 + }, + { + "epoch": 0.97, + "learning_rate": 6.819152654265853e-09, + "loss": 0.0004, + "step": 49796 + }, + { + "epoch": 0.97, + "learning_rate": 6.815269309929711e-09, + "loss": 0.0004, + "step": 49797 + }, + { + "epoch": 0.97, + "learning_rate": 6.811385965593569e-09, + "loss": 0.0004, + "step": 49798 + }, + { + "epoch": 0.97, + "learning_rate": 6.8075026212574274e-09, + "loss": 0.0003, + "step": 49799 + }, + { + "epoch": 0.97, + "learning_rate": 6.803619276921284e-09, + "loss": 0.001, + "step": 49800 + }, + { + "epoch": 0.97, + "learning_rate": 6.799735932585142e-09, + "loss": 0.0011, + "step": 49801 + }, + { + "epoch": 0.97, + "learning_rate": 6.795852588249e-09, + "loss": 0.0004, + "step": 49802 + }, + { + "epoch": 0.97, + "learning_rate": 6.791969243912858e-09, + "loss": 0.0005, + "step": 49803 + }, + { + "epoch": 0.97, + "learning_rate": 6.7880858995767145e-09, + "loss": 0.0004, + "step": 49804 + }, + { + "epoch": 0.97, + "learning_rate": 6.784202555240573e-09, + "loss": 1.0129, + "step": 49805 + }, + { + "epoch": 0.97, + "learning_rate": 6.780319210904431e-09, + "loss": 0.0254, + "step": 49806 + }, + { + "epoch": 0.97, + "learning_rate": 6.776435866568288e-09, + "loss": 0.0361, + "step": 49807 + }, + { + "epoch": 0.97, + "learning_rate": 6.772552522232146e-09, + "loss": 0.0003, + "step": 49808 + }, + { + "epoch": 0.97, + "learning_rate": 6.768669177896004e-09, + "loss": 0.0004, + "step": 49809 + }, + { + "epoch": 0.97, + "learning_rate": 6.764785833559862e-09, + "loss": 0.001, + "step": 49810 + }, + { + "epoch": 0.97, + "learning_rate": 6.760902489223719e-09, + "loss": 0.2222, + "step": 49811 + }, + { + "epoch": 0.97, + "learning_rate": 6.757019144887577e-09, + "loss": 0.8493, + "step": 49812 + }, + { + "epoch": 0.97, + "learning_rate": 6.753135800551435e-09, + "loss": 0.0004, + "step": 49813 + }, + { + "epoch": 0.97, + "learning_rate": 6.749252456215292e-09, + "loss": 0.0004, + "step": 49814 + }, + { + "epoch": 0.97, + "learning_rate": 6.7453691118791494e-09, + "loss": 0.0004, + "step": 49815 + }, + { + "epoch": 0.97, + "learning_rate": 6.741485767543008e-09, + "loss": 0.0003, + "step": 49816 + }, + { + "epoch": 0.97, + "learning_rate": 6.737602423206866e-09, + "loss": 0.0003, + "step": 49817 + }, + { + "epoch": 0.97, + "learning_rate": 6.7337190788707225e-09, + "loss": 0.0003, + "step": 49818 + }, + { + "epoch": 0.97, + "learning_rate": 6.729835734534581e-09, + "loss": 0.0004, + "step": 49819 + }, + { + "epoch": 0.97, + "learning_rate": 6.725952390198439e-09, + "loss": 0.0005, + "step": 49820 + }, + { + "epoch": 0.97, + "learning_rate": 6.722069045862297e-09, + "loss": 0.0003, + "step": 49821 + }, + { + "epoch": 0.97, + "learning_rate": 6.718185701526154e-09, + "loss": 0.0003, + "step": 49822 + }, + { + "epoch": 0.97, + "learning_rate": 6.714302357190012e-09, + "loss": 0.0004, + "step": 49823 + }, + { + "epoch": 0.97, + "learning_rate": 6.7104190128538695e-09, + "loss": 0.0005, + "step": 49824 + }, + { + "epoch": 0.97, + "learning_rate": 6.706535668517727e-09, + "loss": 0.0003, + "step": 49825 + }, + { + "epoch": 0.97, + "learning_rate": 6.702652324181584e-09, + "loss": 0.0003, + "step": 49826 + }, + { + "epoch": 0.97, + "learning_rate": 6.6987689798454426e-09, + "loss": 0.0006, + "step": 49827 + }, + { + "epoch": 0.97, + "learning_rate": 6.694885635509301e-09, + "loss": 0.0485, + "step": 49828 + }, + { + "epoch": 0.97, + "learning_rate": 6.691002291173157e-09, + "loss": 0.0003, + "step": 49829 + }, + { + "epoch": 0.97, + "learning_rate": 6.687118946837016e-09, + "loss": 0.0004, + "step": 49830 + }, + { + "epoch": 0.97, + "learning_rate": 6.683235602500874e-09, + "loss": 0.0004, + "step": 49831 + }, + { + "epoch": 0.97, + "learning_rate": 6.679352258164732e-09, + "loss": 0.0016, + "step": 49832 + }, + { + "epoch": 0.97, + "learning_rate": 6.675468913828589e-09, + "loss": 0.0003, + "step": 49833 + }, + { + "epoch": 0.97, + "learning_rate": 6.671585569492447e-09, + "loss": 0.0004, + "step": 49834 + }, + { + "epoch": 0.97, + "learning_rate": 6.667702225156304e-09, + "loss": 0.0006, + "step": 49835 + }, + { + "epoch": 0.97, + "learning_rate": 6.663818880820162e-09, + "loss": 0.0004, + "step": 49836 + }, + { + "epoch": 0.97, + "learning_rate": 6.659935536484019e-09, + "loss": 0.3147, + "step": 49837 + }, + { + "epoch": 0.97, + "learning_rate": 6.6560521921478775e-09, + "loss": 0.0004, + "step": 49838 + }, + { + "epoch": 0.97, + "learning_rate": 6.652168847811736e-09, + "loss": 0.0004, + "step": 49839 + }, + { + "epoch": 0.97, + "learning_rate": 6.648285503475592e-09, + "loss": 0.0004, + "step": 49840 + }, + { + "epoch": 0.97, + "learning_rate": 6.6444021591394505e-09, + "loss": 0.0003, + "step": 49841 + }, + { + "epoch": 0.97, + "learning_rate": 6.640518814803309e-09, + "loss": 0.0003, + "step": 49842 + }, + { + "epoch": 0.97, + "learning_rate": 6.636635470467165e-09, + "loss": 0.0003, + "step": 49843 + }, + { + "epoch": 0.97, + "learning_rate": 6.632752126131024e-09, + "loss": 0.0003, + "step": 49844 + }, + { + "epoch": 0.97, + "learning_rate": 6.628868781794882e-09, + "loss": 0.0002, + "step": 49845 + }, + { + "epoch": 0.97, + "learning_rate": 6.624985437458739e-09, + "loss": 0.0004, + "step": 49846 + }, + { + "epoch": 0.97, + "learning_rate": 6.621102093122597e-09, + "loss": 0.0127, + "step": 49847 + }, + { + "epoch": 0.97, + "learning_rate": 6.617218748786454e-09, + "loss": 0.0003, + "step": 49848 + }, + { + "epoch": 0.97, + "learning_rate": 6.613335404450312e-09, + "loss": 0.0004, + "step": 49849 + }, + { + "epoch": 0.97, + "learning_rate": 6.609452060114171e-09, + "loss": 0.0009, + "step": 49850 + }, + { + "epoch": 0.97, + "learning_rate": 6.605568715778027e-09, + "loss": 0.0004, + "step": 49851 + }, + { + "epoch": 0.97, + "learning_rate": 6.6016853714418854e-09, + "loss": 0.0004, + "step": 49852 + }, + { + "epoch": 0.97, + "learning_rate": 6.597802027105744e-09, + "loss": 0.0004, + "step": 49853 + }, + { + "epoch": 0.97, + "learning_rate": 6.5939186827696e-09, + "loss": 0.0004, + "step": 49854 + }, + { + "epoch": 0.97, + "learning_rate": 6.5900353384334585e-09, + "loss": 0.0005, + "step": 49855 + }, + { + "epoch": 0.97, + "learning_rate": 6.586151994097317e-09, + "loss": 0.0395, + "step": 49856 + }, + { + "epoch": 0.97, + "learning_rate": 6.582268649761174e-09, + "loss": 0.0003, + "step": 49857 + }, + { + "epoch": 0.97, + "learning_rate": 6.578385305425032e-09, + "loss": 0.7672, + "step": 49858 + }, + { + "epoch": 0.97, + "learning_rate": 6.574501961088889e-09, + "loss": 0.0004, + "step": 49859 + }, + { + "epoch": 0.97, + "learning_rate": 6.570618616752747e-09, + "loss": 0.0003, + "step": 49860 + }, + { + "epoch": 0.97, + "learning_rate": 6.5667352724166055e-09, + "loss": 0.0003, + "step": 49861 + }, + { + "epoch": 0.97, + "learning_rate": 6.562851928080462e-09, + "loss": 0.0044, + "step": 49862 + }, + { + "epoch": 0.97, + "learning_rate": 6.55896858374432e-09, + "loss": 0.0005, + "step": 49863 + }, + { + "epoch": 0.97, + "learning_rate": 6.5550852394081786e-09, + "loss": 0.0006, + "step": 49864 + }, + { + "epoch": 0.97, + "learning_rate": 6.551201895072035e-09, + "loss": 0.0004, + "step": 49865 + }, + { + "epoch": 0.97, + "learning_rate": 6.5473185507358934e-09, + "loss": 0.0007, + "step": 49866 + }, + { + "epoch": 0.97, + "learning_rate": 6.543435206399752e-09, + "loss": 0.0003, + "step": 49867 + }, + { + "epoch": 0.97, + "learning_rate": 6.539551862063609e-09, + "loss": 0.0011, + "step": 49868 + }, + { + "epoch": 0.97, + "learning_rate": 6.5356685177274665e-09, + "loss": 0.0003, + "step": 49869 + }, + { + "epoch": 0.97, + "learning_rate": 6.531785173391324e-09, + "loss": 0.0004, + "step": 49870 + }, + { + "epoch": 0.97, + "learning_rate": 6.527901829055182e-09, + "loss": 0.0004, + "step": 49871 + }, + { + "epoch": 0.97, + "learning_rate": 6.524018484719039e-09, + "loss": 0.0004, + "step": 49872 + }, + { + "epoch": 0.97, + "learning_rate": 6.520135140382897e-09, + "loss": 0.0004, + "step": 49873 + }, + { + "epoch": 0.97, + "learning_rate": 6.516251796046755e-09, + "loss": 0.0006, + "step": 49874 + }, + { + "epoch": 0.97, + "learning_rate": 6.5123684517106135e-09, + "loss": 0.0004, + "step": 49875 + }, + { + "epoch": 0.97, + "learning_rate": 6.50848510737447e-09, + "loss": 0.0003, + "step": 49876 + }, + { + "epoch": 0.97, + "learning_rate": 6.504601763038328e-09, + "loss": 0.0024, + "step": 49877 + }, + { + "epoch": 0.97, + "learning_rate": 6.5007184187021866e-09, + "loss": 0.0006, + "step": 49878 + }, + { + "epoch": 0.97, + "learning_rate": 6.496835074366044e-09, + "loss": 0.0004, + "step": 49879 + }, + { + "epoch": 0.97, + "learning_rate": 6.492951730029901e-09, + "loss": 0.0004, + "step": 49880 + }, + { + "epoch": 0.97, + "learning_rate": 6.489068385693759e-09, + "loss": 0.0002, + "step": 49881 + }, + { + "epoch": 0.97, + "learning_rate": 6.485185041357617e-09, + "loss": 0.001, + "step": 49882 + }, + { + "epoch": 0.97, + "learning_rate": 6.481301697021474e-09, + "loss": 0.0004, + "step": 49883 + }, + { + "epoch": 0.97, + "learning_rate": 6.477418352685332e-09, + "loss": 0.0005, + "step": 49884 + }, + { + "epoch": 0.97, + "learning_rate": 6.47353500834919e-09, + "loss": 0.0022, + "step": 49885 + }, + { + "epoch": 0.97, + "learning_rate": 6.469651664013048e-09, + "loss": 0.0003, + "step": 49886 + }, + { + "epoch": 0.97, + "learning_rate": 6.465768319676905e-09, + "loss": 0.0003, + "step": 49887 + }, + { + "epoch": 0.97, + "learning_rate": 6.461884975340763e-09, + "loss": 0.0004, + "step": 49888 + }, + { + "epoch": 0.97, + "learning_rate": 6.4580016310046215e-09, + "loss": 0.0004, + "step": 49889 + }, + { + "epoch": 0.97, + "learning_rate": 6.45411828666848e-09, + "loss": 0.0003, + "step": 49890 + }, + { + "epoch": 0.97, + "learning_rate": 6.450234942332336e-09, + "loss": 0.0003, + "step": 49891 + }, + { + "epoch": 0.97, + "learning_rate": 6.446351597996194e-09, + "loss": 0.0002, + "step": 49892 + }, + { + "epoch": 0.97, + "learning_rate": 6.442468253660052e-09, + "loss": 0.0019, + "step": 49893 + }, + { + "epoch": 0.97, + "learning_rate": 6.4385849093239085e-09, + "loss": 0.0004, + "step": 49894 + }, + { + "epoch": 0.97, + "learning_rate": 6.434701564987767e-09, + "loss": 0.0004, + "step": 49895 + }, + { + "epoch": 0.97, + "learning_rate": 6.430818220651625e-09, + "loss": 0.0004, + "step": 49896 + }, + { + "epoch": 0.97, + "learning_rate": 6.426934876315483e-09, + "loss": 0.0005, + "step": 49897 + }, + { + "epoch": 0.97, + "learning_rate": 6.42305153197934e-09, + "loss": 0.6831, + "step": 49898 + }, + { + "epoch": 0.97, + "learning_rate": 6.419168187643198e-09, + "loss": 0.0005, + "step": 49899 + }, + { + "epoch": 0.97, + "learning_rate": 6.415284843307056e-09, + "loss": 1.4497, + "step": 49900 + }, + { + "epoch": 0.97, + "learning_rate": 6.411401498970913e-09, + "loss": 0.0008, + "step": 49901 + }, + { + "epoch": 0.97, + "learning_rate": 6.407518154634771e-09, + "loss": 0.0005, + "step": 49902 + }, + { + "epoch": 0.97, + "learning_rate": 6.403634810298629e-09, + "loss": 0.0004, + "step": 49903 + }, + { + "epoch": 0.97, + "learning_rate": 6.399751465962487e-09, + "loss": 0.0004, + "step": 49904 + }, + { + "epoch": 0.97, + "learning_rate": 6.3958681216263434e-09, + "loss": 0.0891, + "step": 49905 + }, + { + "epoch": 0.97, + "learning_rate": 6.391984777290202e-09, + "loss": 0.0012, + "step": 49906 + }, + { + "epoch": 0.97, + "learning_rate": 6.38810143295406e-09, + "loss": 0.0002, + "step": 49907 + }, + { + "epoch": 0.97, + "learning_rate": 6.384218088617918e-09, + "loss": 0.0005, + "step": 49908 + }, + { + "epoch": 0.97, + "learning_rate": 6.380334744281775e-09, + "loss": 0.055, + "step": 49909 + }, + { + "epoch": 0.97, + "learning_rate": 6.376451399945633e-09, + "loss": 0.0005, + "step": 49910 + }, + { + "epoch": 0.97, + "learning_rate": 6.372568055609491e-09, + "loss": 0.0004, + "step": 49911 + }, + { + "epoch": 0.97, + "learning_rate": 6.368684711273348e-09, + "loss": 0.3502, + "step": 49912 + }, + { + "epoch": 0.97, + "learning_rate": 6.364801366937206e-09, + "loss": 0.0004, + "step": 49913 + }, + { + "epoch": 0.97, + "learning_rate": 6.3609180226010635e-09, + "loss": 0.0003, + "step": 49914 + }, + { + "epoch": 0.97, + "learning_rate": 6.357034678264922e-09, + "loss": 0.0003, + "step": 49915 + }, + { + "epoch": 0.97, + "learning_rate": 6.353151333928778e-09, + "loss": 0.0003, + "step": 49916 + }, + { + "epoch": 0.97, + "learning_rate": 6.3492679895926366e-09, + "loss": 0.0006, + "step": 49917 + }, + { + "epoch": 0.97, + "learning_rate": 6.345384645256495e-09, + "loss": 0.0004, + "step": 49918 + }, + { + "epoch": 0.97, + "learning_rate": 6.341501300920353e-09, + "loss": 0.0004, + "step": 49919 + }, + { + "epoch": 0.97, + "learning_rate": 6.33761795658421e-09, + "loss": 0.0003, + "step": 49920 + }, + { + "epoch": 0.97, + "learning_rate": 6.333734612248068e-09, + "loss": 0.0004, + "step": 49921 + }, + { + "epoch": 0.97, + "learning_rate": 6.329851267911926e-09, + "loss": 0.0003, + "step": 49922 + }, + { + "epoch": 0.97, + "learning_rate": 6.325967923575783e-09, + "loss": 0.0002, + "step": 49923 + }, + { + "epoch": 0.97, + "learning_rate": 6.322084579239641e-09, + "loss": 0.0005, + "step": 49924 + }, + { + "epoch": 0.97, + "learning_rate": 6.318201234903499e-09, + "loss": 0.0006, + "step": 49925 + }, + { + "epoch": 0.97, + "learning_rate": 6.314317890567357e-09, + "loss": 0.0005, + "step": 49926 + }, + { + "epoch": 0.97, + "learning_rate": 6.310434546231213e-09, + "loss": 0.0004, + "step": 49927 + }, + { + "epoch": 0.97, + "learning_rate": 6.3065512018950715e-09, + "loss": 0.0003, + "step": 49928 + }, + { + "epoch": 0.97, + "learning_rate": 6.30266785755893e-09, + "loss": 0.0005, + "step": 49929 + }, + { + "epoch": 0.97, + "learning_rate": 6.298784513222786e-09, + "loss": 0.0004, + "step": 49930 + }, + { + "epoch": 0.97, + "learning_rate": 6.2949011688866446e-09, + "loss": 0.0003, + "step": 49931 + }, + { + "epoch": 0.97, + "learning_rate": 6.291017824550503e-09, + "loss": 0.0004, + "step": 49932 + }, + { + "epoch": 0.97, + "learning_rate": 6.287134480214361e-09, + "loss": 0.3838, + "step": 49933 + }, + { + "epoch": 0.97, + "learning_rate": 6.283251135878218e-09, + "loss": 0.0003, + "step": 49934 + }, + { + "epoch": 0.97, + "learning_rate": 6.279367791542076e-09, + "loss": 0.0004, + "step": 49935 + }, + { + "epoch": 0.97, + "learning_rate": 6.275484447205934e-09, + "loss": 0.0003, + "step": 49936 + }, + { + "epoch": 0.97, + "learning_rate": 6.2716011028697915e-09, + "loss": 0.0006, + "step": 49937 + }, + { + "epoch": 0.97, + "learning_rate": 6.267717758533648e-09, + "loss": 0.0004, + "step": 49938 + }, + { + "epoch": 0.97, + "learning_rate": 6.263834414197506e-09, + "loss": 0.0003, + "step": 49939 + }, + { + "epoch": 0.97, + "learning_rate": 6.259951069861365e-09, + "loss": 0.0002, + "step": 49940 + }, + { + "epoch": 0.97, + "learning_rate": 6.256067725525221e-09, + "loss": 0.0006, + "step": 49941 + }, + { + "epoch": 0.97, + "learning_rate": 6.2521843811890795e-09, + "loss": 0.0004, + "step": 49942 + }, + { + "epoch": 0.97, + "learning_rate": 6.248301036852938e-09, + "loss": 0.0003, + "step": 49943 + }, + { + "epoch": 0.97, + "learning_rate": 6.244417692516795e-09, + "loss": 0.0005, + "step": 49944 + }, + { + "epoch": 0.97, + "learning_rate": 6.240534348180653e-09, + "loss": 0.001, + "step": 49945 + }, + { + "epoch": 0.97, + "learning_rate": 6.236651003844511e-09, + "loss": 0.0002, + "step": 49946 + }, + { + "epoch": 0.97, + "learning_rate": 6.232767659508369e-09, + "loss": 0.773, + "step": 49947 + }, + { + "epoch": 0.97, + "learning_rate": 6.2288843151722264e-09, + "loss": 0.0008, + "step": 49948 + }, + { + "epoch": 0.97, + "learning_rate": 6.225000970836084e-09, + "loss": 0.0003, + "step": 49949 + }, + { + "epoch": 0.97, + "learning_rate": 6.221117626499941e-09, + "loss": 0.0005, + "step": 49950 + }, + { + "epoch": 0.97, + "learning_rate": 6.217234282163799e-09, + "loss": 0.0005, + "step": 49951 + }, + { + "epoch": 0.97, + "learning_rate": 6.213350937827657e-09, + "loss": 0.0005, + "step": 49952 + }, + { + "epoch": 0.97, + "learning_rate": 6.209467593491514e-09, + "loss": 0.0005, + "step": 49953 + }, + { + "epoch": 0.97, + "learning_rate": 6.205584249155373e-09, + "loss": 0.0009, + "step": 49954 + }, + { + "epoch": 0.97, + "learning_rate": 6.20170090481923e-09, + "loss": 0.0005, + "step": 49955 + }, + { + "epoch": 0.97, + "learning_rate": 6.197817560483088e-09, + "loss": 0.0004, + "step": 49956 + }, + { + "epoch": 0.97, + "learning_rate": 6.193934216146946e-09, + "loss": 0.0002, + "step": 49957 + }, + { + "epoch": 0.97, + "learning_rate": 6.190050871810803e-09, + "loss": 0.0004, + "step": 49958 + }, + { + "epoch": 0.97, + "learning_rate": 6.186167527474661e-09, + "loss": 0.0514, + "step": 49959 + }, + { + "epoch": 0.97, + "learning_rate": 6.182284183138519e-09, + "loss": 0.0003, + "step": 49960 + }, + { + "epoch": 0.97, + "learning_rate": 6.178400838802376e-09, + "loss": 0.0003, + "step": 49961 + }, + { + "epoch": 0.97, + "learning_rate": 6.174517494466234e-09, + "loss": 0.0004, + "step": 49962 + }, + { + "epoch": 0.97, + "learning_rate": 6.170634150130092e-09, + "loss": 0.0008, + "step": 49963 + }, + { + "epoch": 0.97, + "learning_rate": 6.166750805793949e-09, + "loss": 0.0007, + "step": 49964 + }, + { + "epoch": 0.97, + "learning_rate": 6.1628674614578075e-09, + "loss": 0.0003, + "step": 49965 + }, + { + "epoch": 0.97, + "learning_rate": 6.158984117121665e-09, + "loss": 1.4143, + "step": 49966 + }, + { + "epoch": 0.97, + "learning_rate": 6.155100772785523e-09, + "loss": 0.0013, + "step": 49967 + }, + { + "epoch": 0.97, + "learning_rate": 6.1512174284493806e-09, + "loss": 0.8331, + "step": 49968 + }, + { + "epoch": 0.97, + "learning_rate": 6.147334084113238e-09, + "loss": 0.0112, + "step": 49969 + }, + { + "epoch": 0.97, + "learning_rate": 6.143450739777096e-09, + "loss": 0.0004, + "step": 49970 + }, + { + "epoch": 0.97, + "learning_rate": 6.139567395440954e-09, + "loss": 0.0004, + "step": 49971 + }, + { + "epoch": 0.97, + "learning_rate": 6.135684051104811e-09, + "loss": 0.0003, + "step": 49972 + }, + { + "epoch": 0.97, + "learning_rate": 6.1318007067686685e-09, + "loss": 0.6413, + "step": 49973 + }, + { + "epoch": 0.97, + "learning_rate": 6.127917362432527e-09, + "loss": 0.005, + "step": 49974 + }, + { + "epoch": 0.97, + "learning_rate": 6.124034018096384e-09, + "loss": 0.0003, + "step": 49975 + }, + { + "epoch": 0.97, + "learning_rate": 6.120150673760242e-09, + "loss": 0.0004, + "step": 49976 + }, + { + "epoch": 0.97, + "learning_rate": 6.1162673294241e-09, + "loss": 0.0004, + "step": 49977 + }, + { + "epoch": 0.97, + "learning_rate": 6.112383985087957e-09, + "loss": 0.0006, + "step": 49978 + }, + { + "epoch": 0.97, + "learning_rate": 6.1085006407518155e-09, + "loss": 0.0005, + "step": 49979 + }, + { + "epoch": 0.97, + "learning_rate": 6.104617296415673e-09, + "loss": 0.0003, + "step": 49980 + }, + { + "epoch": 0.97, + "learning_rate": 6.100733952079531e-09, + "loss": 0.0004, + "step": 49981 + }, + { + "epoch": 0.97, + "learning_rate": 6.0968506077433885e-09, + "loss": 0.0004, + "step": 49982 + }, + { + "epoch": 0.97, + "learning_rate": 6.092967263407246e-09, + "loss": 0.0004, + "step": 49983 + }, + { + "epoch": 0.97, + "learning_rate": 6.089083919071103e-09, + "loss": 0.0003, + "step": 49984 + }, + { + "epoch": 0.97, + "learning_rate": 6.085200574734962e-09, + "loss": 0.0003, + "step": 49985 + }, + { + "epoch": 0.97, + "learning_rate": 6.081317230398819e-09, + "loss": 0.0006, + "step": 49986 + }, + { + "epoch": 0.97, + "learning_rate": 6.0774338860626765e-09, + "loss": 0.0004, + "step": 49987 + }, + { + "epoch": 0.97, + "learning_rate": 6.073550541726535e-09, + "loss": 0.0002, + "step": 49988 + }, + { + "epoch": 0.97, + "learning_rate": 6.069667197390392e-09, + "loss": 0.0003, + "step": 49989 + }, + { + "epoch": 0.97, + "learning_rate": 6.06578385305425e-09, + "loss": 0.0003, + "step": 49990 + }, + { + "epoch": 0.97, + "learning_rate": 6.061900508718108e-09, + "loss": 0.0004, + "step": 49991 + }, + { + "epoch": 0.97, + "learning_rate": 6.058017164381966e-09, + "loss": 0.0006, + "step": 49992 + }, + { + "epoch": 0.97, + "learning_rate": 6.0541338200458234e-09, + "loss": 0.0003, + "step": 49993 + }, + { + "epoch": 0.97, + "learning_rate": 6.050250475709681e-09, + "loss": 0.0004, + "step": 49994 + }, + { + "epoch": 0.97, + "learning_rate": 6.046367131373538e-09, + "loss": 0.0004, + "step": 49995 + }, + { + "epoch": 0.97, + "learning_rate": 6.0424837870373965e-09, + "loss": 0.0025, + "step": 49996 + }, + { + "epoch": 0.97, + "learning_rate": 6.038600442701254e-09, + "loss": 0.0005, + "step": 49997 + }, + { + "epoch": 0.97, + "learning_rate": 6.034717098365111e-09, + "loss": 1.212, + "step": 49998 + }, + { + "epoch": 0.97, + "learning_rate": 6.03083375402897e-09, + "loss": 0.0005, + "step": 49999 + }, + { + "epoch": 0.97, + "learning_rate": 6.026950409692827e-09, + "loss": 0.1233, + "step": 50000 + }, + { + "epoch": 0.97, + "learning_rate": 6.023067065356685e-09, + "loss": 0.0003, + "step": 50001 + }, + { + "epoch": 0.97, + "learning_rate": 6.019183721020543e-09, + "loss": 1.2617, + "step": 50002 + }, + { + "epoch": 0.97, + "learning_rate": 6.015300376684401e-09, + "loss": 0.0023, + "step": 50003 + }, + { + "epoch": 0.97, + "learning_rate": 6.011417032348258e-09, + "loss": 0.0005, + "step": 50004 + }, + { + "epoch": 0.97, + "learning_rate": 6.007533688012116e-09, + "loss": 0.3085, + "step": 50005 + }, + { + "epoch": 0.97, + "learning_rate": 6.003650343675973e-09, + "loss": 0.0004, + "step": 50006 + }, + { + "epoch": 0.97, + "learning_rate": 5.999766999339831e-09, + "loss": 0.0004, + "step": 50007 + }, + { + "epoch": 0.97, + "learning_rate": 5.995883655003689e-09, + "loss": 0.0006, + "step": 50008 + }, + { + "epoch": 0.97, + "learning_rate": 5.992000310667546e-09, + "loss": 0.0003, + "step": 50009 + }, + { + "epoch": 0.97, + "learning_rate": 5.9881169663314045e-09, + "loss": 0.051, + "step": 50010 + }, + { + "epoch": 0.97, + "learning_rate": 5.984233621995262e-09, + "loss": 0.0004, + "step": 50011 + }, + { + "epoch": 0.97, + "learning_rate": 5.98035027765912e-09, + "loss": 0.0005, + "step": 50012 + }, + { + "epoch": 0.97, + "learning_rate": 5.9764669333229776e-09, + "loss": 0.9068, + "step": 50013 + }, + { + "epoch": 0.97, + "learning_rate": 5.972583588986836e-09, + "loss": 0.0004, + "step": 50014 + }, + { + "epoch": 0.97, + "learning_rate": 5.968700244650693e-09, + "loss": 0.0003, + "step": 50015 + }, + { + "epoch": 0.97, + "learning_rate": 5.964816900314551e-09, + "loss": 0.0003, + "step": 50016 + }, + { + "epoch": 0.97, + "learning_rate": 5.960933555978408e-09, + "loss": 0.0009, + "step": 50017 + }, + { + "epoch": 0.97, + "learning_rate": 5.9570502116422655e-09, + "loss": 0.0003, + "step": 50018 + }, + { + "epoch": 0.97, + "learning_rate": 5.953166867306124e-09, + "loss": 0.0005, + "step": 50019 + }, + { + "epoch": 0.97, + "learning_rate": 5.949283522969981e-09, + "loss": 0.0003, + "step": 50020 + }, + { + "epoch": 0.97, + "learning_rate": 5.945400178633839e-09, + "loss": 0.0004, + "step": 50021 + }, + { + "epoch": 0.97, + "learning_rate": 5.941516834297697e-09, + "loss": 0.0092, + "step": 50022 + }, + { + "epoch": 0.97, + "learning_rate": 5.937633489961555e-09, + "loss": 0.0003, + "step": 50023 + }, + { + "epoch": 0.97, + "learning_rate": 5.9337501456254125e-09, + "loss": 0.1269, + "step": 50024 + }, + { + "epoch": 0.97, + "learning_rate": 5.929866801289271e-09, + "loss": 0.0004, + "step": 50025 + }, + { + "epoch": 0.97, + "learning_rate": 5.925983456953128e-09, + "loss": 0.0003, + "step": 50026 + }, + { + "epoch": 0.97, + "learning_rate": 5.9221001126169856e-09, + "loss": 0.0004, + "step": 50027 + }, + { + "epoch": 0.97, + "learning_rate": 5.918216768280843e-09, + "loss": 0.0004, + "step": 50028 + }, + { + "epoch": 0.97, + "learning_rate": 5.9143334239447e-09, + "loss": 0.9351, + "step": 50029 + }, + { + "epoch": 0.97, + "learning_rate": 5.910450079608559e-09, + "loss": 0.0014, + "step": 50030 + }, + { + "epoch": 0.97, + "learning_rate": 5.906566735272416e-09, + "loss": 0.1091, + "step": 50031 + }, + { + "epoch": 0.97, + "learning_rate": 5.902683390936274e-09, + "loss": 0.0003, + "step": 50032 + }, + { + "epoch": 0.97, + "learning_rate": 5.898800046600132e-09, + "loss": 0.0004, + "step": 50033 + }, + { + "epoch": 0.97, + "learning_rate": 5.89491670226399e-09, + "loss": 0.0005, + "step": 50034 + }, + { + "epoch": 0.97, + "learning_rate": 5.891033357927847e-09, + "loss": 0.0004, + "step": 50035 + }, + { + "epoch": 0.97, + "learning_rate": 5.887150013591705e-09, + "loss": 0.0004, + "step": 50036 + }, + { + "epoch": 0.97, + "learning_rate": 5.883266669255563e-09, + "loss": 0.0008, + "step": 50037 + }, + { + "epoch": 0.97, + "learning_rate": 5.8793833249194205e-09, + "loss": 0.0006, + "step": 50038 + }, + { + "epoch": 0.97, + "learning_rate": 5.875499980583278e-09, + "loss": 0.5029, + "step": 50039 + }, + { + "epoch": 0.97, + "learning_rate": 5.871616636247135e-09, + "loss": 0.0004, + "step": 50040 + }, + { + "epoch": 0.97, + "learning_rate": 5.8677332919109935e-09, + "loss": 0.0002, + "step": 50041 + }, + { + "epoch": 0.97, + "learning_rate": 5.863849947574851e-09, + "loss": 0.4924, + "step": 50042 + }, + { + "epoch": 0.97, + "learning_rate": 5.859966603238709e-09, + "loss": 0.0004, + "step": 50043 + }, + { + "epoch": 0.97, + "learning_rate": 5.856083258902567e-09, + "loss": 0.0003, + "step": 50044 + }, + { + "epoch": 0.97, + "learning_rate": 5.852199914566424e-09, + "loss": 0.0596, + "step": 50045 + }, + { + "epoch": 0.97, + "learning_rate": 5.848316570230282e-09, + "loss": 0.2667, + "step": 50046 + }, + { + "epoch": 0.97, + "learning_rate": 5.84443322589414e-09, + "loss": 0.0017, + "step": 50047 + }, + { + "epoch": 0.97, + "learning_rate": 5.840549881557998e-09, + "loss": 0.0002, + "step": 50048 + }, + { + "epoch": 0.97, + "learning_rate": 5.836666537221855e-09, + "loss": 0.0004, + "step": 50049 + }, + { + "epoch": 0.97, + "learning_rate": 5.832783192885713e-09, + "loss": 0.0004, + "step": 50050 + }, + { + "epoch": 0.97, + "learning_rate": 5.82889984854957e-09, + "loss": 0.0215, + "step": 50051 + }, + { + "epoch": 0.97, + "learning_rate": 5.8250165042134284e-09, + "loss": 0.0005, + "step": 50052 + }, + { + "epoch": 0.97, + "learning_rate": 5.821133159877286e-09, + "loss": 0.0004, + "step": 50053 + }, + { + "epoch": 0.97, + "learning_rate": 5.817249815541144e-09, + "loss": 0.0002, + "step": 50054 + }, + { + "epoch": 0.97, + "learning_rate": 5.8133664712050015e-09, + "loss": 0.0003, + "step": 50055 + }, + { + "epoch": 0.97, + "learning_rate": 5.809483126868859e-09, + "loss": 0.0003, + "step": 50056 + }, + { + "epoch": 0.97, + "learning_rate": 5.805599782532717e-09, + "loss": 0.0003, + "step": 50057 + }, + { + "epoch": 0.97, + "learning_rate": 5.8017164381965746e-09, + "loss": 0.0006, + "step": 50058 + }, + { + "epoch": 0.97, + "learning_rate": 5.797833093860433e-09, + "loss": 0.0043, + "step": 50059 + }, + { + "epoch": 0.97, + "learning_rate": 5.79394974952429e-09, + "loss": 0.0004, + "step": 50060 + }, + { + "epoch": 0.97, + "learning_rate": 5.790066405188148e-09, + "loss": 0.0003, + "step": 50061 + }, + { + "epoch": 0.97, + "learning_rate": 5.786183060852005e-09, + "loss": 0.0005, + "step": 50062 + }, + { + "epoch": 0.97, + "learning_rate": 5.782299716515863e-09, + "loss": 0.0005, + "step": 50063 + }, + { + "epoch": 0.97, + "learning_rate": 5.778416372179721e-09, + "loss": 0.0011, + "step": 50064 + }, + { + "epoch": 0.97, + "learning_rate": 5.774533027843578e-09, + "loss": 0.7644, + "step": 50065 + }, + { + "epoch": 0.97, + "learning_rate": 5.770649683507436e-09, + "loss": 0.0023, + "step": 50066 + }, + { + "epoch": 0.97, + "learning_rate": 5.766766339171294e-09, + "loss": 0.0005, + "step": 50067 + }, + { + "epoch": 0.97, + "learning_rate": 5.762882994835152e-09, + "loss": 0.0003, + "step": 50068 + }, + { + "epoch": 0.97, + "learning_rate": 5.7589996504990095e-09, + "loss": 0.0016, + "step": 50069 + }, + { + "epoch": 0.97, + "learning_rate": 5.755116306162868e-09, + "loss": 0.0003, + "step": 50070 + }, + { + "epoch": 0.97, + "learning_rate": 5.751232961826725e-09, + "loss": 0.0004, + "step": 50071 + }, + { + "epoch": 0.97, + "learning_rate": 5.7473496174905826e-09, + "loss": 0.0003, + "step": 50072 + }, + { + "epoch": 0.97, + "learning_rate": 5.74346627315444e-09, + "loss": 0.0006, + "step": 50073 + }, + { + "epoch": 0.97, + "learning_rate": 5.739582928818297e-09, + "loss": 0.0003, + "step": 50074 + }, + { + "epoch": 0.97, + "learning_rate": 5.735699584482156e-09, + "loss": 0.0211, + "step": 50075 + }, + { + "epoch": 0.97, + "learning_rate": 5.731816240146013e-09, + "loss": 0.0002, + "step": 50076 + }, + { + "epoch": 0.97, + "learning_rate": 5.727932895809871e-09, + "loss": 0.0003, + "step": 50077 + }, + { + "epoch": 0.97, + "learning_rate": 5.724049551473729e-09, + "loss": 0.0004, + "step": 50078 + }, + { + "epoch": 0.97, + "learning_rate": 5.720166207137587e-09, + "loss": 0.2536, + "step": 50079 + }, + { + "epoch": 0.97, + "learning_rate": 5.716282862801444e-09, + "loss": 0.0004, + "step": 50080 + }, + { + "epoch": 0.97, + "learning_rate": 5.712399518465303e-09, + "loss": 0.0003, + "step": 50081 + }, + { + "epoch": 0.97, + "learning_rate": 5.70851617412916e-09, + "loss": 0.0006, + "step": 50082 + }, + { + "epoch": 0.97, + "learning_rate": 5.7046328297930175e-09, + "loss": 0.0003, + "step": 50083 + }, + { + "epoch": 0.97, + "learning_rate": 5.700749485456875e-09, + "loss": 0.0003, + "step": 50084 + }, + { + "epoch": 0.97, + "learning_rate": 5.696866141120732e-09, + "loss": 0.0002, + "step": 50085 + }, + { + "epoch": 0.97, + "learning_rate": 5.6929827967845905e-09, + "loss": 0.0003, + "step": 50086 + }, + { + "epoch": 0.97, + "learning_rate": 5.689099452448448e-09, + "loss": 0.0004, + "step": 50087 + }, + { + "epoch": 0.97, + "learning_rate": 5.685216108112306e-09, + "loss": 0.0003, + "step": 50088 + }, + { + "epoch": 0.97, + "learning_rate": 5.681332763776164e-09, + "loss": 0.0003, + "step": 50089 + }, + { + "epoch": 0.97, + "learning_rate": 5.677449419440022e-09, + "loss": 0.0004, + "step": 50090 + }, + { + "epoch": 0.97, + "learning_rate": 5.673566075103879e-09, + "loss": 0.0003, + "step": 50091 + }, + { + "epoch": 0.97, + "learning_rate": 5.6696827307677375e-09, + "loss": 1.0516, + "step": 50092 + }, + { + "epoch": 0.97, + "learning_rate": 5.665799386431595e-09, + "loss": 0.0004, + "step": 50093 + }, + { + "epoch": 0.97, + "learning_rate": 5.661916042095452e-09, + "loss": 0.0004, + "step": 50094 + }, + { + "epoch": 0.97, + "learning_rate": 5.65803269775931e-09, + "loss": 0.0003, + "step": 50095 + }, + { + "epoch": 0.97, + "learning_rate": 5.654149353423167e-09, + "loss": 0.0005, + "step": 50096 + }, + { + "epoch": 0.97, + "learning_rate": 5.6502660090870254e-09, + "loss": 0.0007, + "step": 50097 + }, + { + "epoch": 0.97, + "learning_rate": 5.646382664750883e-09, + "loss": 0.0006, + "step": 50098 + }, + { + "epoch": 0.97, + "learning_rate": 5.642499320414741e-09, + "loss": 0.8194, + "step": 50099 + }, + { + "epoch": 0.97, + "learning_rate": 5.6386159760785985e-09, + "loss": 1.0789, + "step": 50100 + }, + { + "epoch": 0.97, + "learning_rate": 5.634732631742457e-09, + "loss": 0.003, + "step": 50101 + }, + { + "epoch": 0.97, + "learning_rate": 5.630849287406314e-09, + "loss": 0.4397, + "step": 50102 + }, + { + "epoch": 0.97, + "learning_rate": 5.626965943070172e-09, + "loss": 0.3196, + "step": 50103 + }, + { + "epoch": 0.97, + "learning_rate": 5.62308259873403e-09, + "loss": 0.0006, + "step": 50104 + }, + { + "epoch": 0.97, + "learning_rate": 5.619199254397887e-09, + "loss": 0.0003, + "step": 50105 + }, + { + "epoch": 0.97, + "learning_rate": 5.615315910061745e-09, + "loss": 0.0004, + "step": 50106 + }, + { + "epoch": 0.97, + "learning_rate": 5.611432565725602e-09, + "loss": 0.0055, + "step": 50107 + }, + { + "epoch": 0.97, + "learning_rate": 5.60754922138946e-09, + "loss": 0.0003, + "step": 50108 + }, + { + "epoch": 0.97, + "learning_rate": 5.603665877053318e-09, + "loss": 0.017, + "step": 50109 + }, + { + "epoch": 0.97, + "learning_rate": 5.599782532717176e-09, + "loss": 0.0586, + "step": 50110 + }, + { + "epoch": 0.97, + "learning_rate": 5.595899188381033e-09, + "loss": 0.0004, + "step": 50111 + }, + { + "epoch": 0.97, + "learning_rate": 5.592015844044892e-09, + "loss": 0.0004, + "step": 50112 + }, + { + "epoch": 0.97, + "learning_rate": 5.588132499708749e-09, + "loss": 0.0271, + "step": 50113 + }, + { + "epoch": 0.97, + "learning_rate": 5.5842491553726065e-09, + "loss": 0.0003, + "step": 50114 + }, + { + "epoch": 0.97, + "learning_rate": 5.580365811036465e-09, + "loss": 0.0845, + "step": 50115 + }, + { + "epoch": 0.97, + "learning_rate": 5.576482466700322e-09, + "loss": 0.0003, + "step": 50116 + }, + { + "epoch": 0.97, + "learning_rate": 5.5725991223641796e-09, + "loss": 0.0319, + "step": 50117 + }, + { + "epoch": 0.97, + "learning_rate": 5.568715778028037e-09, + "loss": 0.0004, + "step": 50118 + }, + { + "epoch": 0.97, + "learning_rate": 5.564832433691895e-09, + "loss": 0.0013, + "step": 50119 + }, + { + "epoch": 0.97, + "learning_rate": 5.560949089355753e-09, + "loss": 0.3473, + "step": 50120 + }, + { + "epoch": 0.97, + "learning_rate": 5.557065745019611e-09, + "loss": 0.0004, + "step": 50121 + }, + { + "epoch": 0.97, + "learning_rate": 5.553182400683468e-09, + "loss": 0.9099, + "step": 50122 + }, + { + "epoch": 0.97, + "learning_rate": 5.549299056347326e-09, + "loss": 0.0004, + "step": 50123 + }, + { + "epoch": 0.97, + "learning_rate": 5.545415712011184e-09, + "loss": 0.0002, + "step": 50124 + }, + { + "epoch": 0.97, + "learning_rate": 5.541532367675041e-09, + "loss": 0.0005, + "step": 50125 + }, + { + "epoch": 0.97, + "learning_rate": 5.5376490233389e-09, + "loss": 0.0003, + "step": 50126 + }, + { + "epoch": 0.97, + "learning_rate": 5.533765679002757e-09, + "loss": 0.0011, + "step": 50127 + }, + { + "epoch": 0.97, + "learning_rate": 5.5298823346666145e-09, + "loss": 0.0004, + "step": 50128 + }, + { + "epoch": 0.97, + "learning_rate": 5.525998990330472e-09, + "loss": 0.0002, + "step": 50129 + }, + { + "epoch": 0.97, + "learning_rate": 5.52211564599433e-09, + "loss": 0.4169, + "step": 50130 + }, + { + "epoch": 0.97, + "learning_rate": 5.5182323016581875e-09, + "loss": 0.0011, + "step": 50131 + }, + { + "epoch": 0.97, + "learning_rate": 5.514348957322045e-09, + "loss": 0.0004, + "step": 50132 + }, + { + "epoch": 0.97, + "learning_rate": 5.510465612985903e-09, + "loss": 0.0003, + "step": 50133 + }, + { + "epoch": 0.97, + "learning_rate": 5.506582268649761e-09, + "loss": 0.0003, + "step": 50134 + }, + { + "epoch": 0.97, + "learning_rate": 5.502698924313619e-09, + "loss": 0.0015, + "step": 50135 + }, + { + "epoch": 0.97, + "learning_rate": 5.498815579977476e-09, + "loss": 0.0003, + "step": 50136 + }, + { + "epoch": 0.97, + "learning_rate": 5.4949322356413345e-09, + "loss": 0.3094, + "step": 50137 + }, + { + "epoch": 0.97, + "learning_rate": 5.491048891305192e-09, + "loss": 0.0006, + "step": 50138 + }, + { + "epoch": 0.97, + "learning_rate": 5.487165546969049e-09, + "loss": 0.0003, + "step": 50139 + }, + { + "epoch": 0.97, + "learning_rate": 5.483282202632907e-09, + "loss": 0.0003, + "step": 50140 + }, + { + "epoch": 0.97, + "learning_rate": 5.479398858296765e-09, + "loss": 0.0006, + "step": 50141 + }, + { + "epoch": 0.97, + "learning_rate": 5.4755155139606224e-09, + "loss": 0.4544, + "step": 50142 + }, + { + "epoch": 0.97, + "learning_rate": 5.47163216962448e-09, + "loss": 0.0005, + "step": 50143 + }, + { + "epoch": 0.97, + "learning_rate": 5.467748825288338e-09, + "loss": 0.0004, + "step": 50144 + }, + { + "epoch": 0.97, + "learning_rate": 5.4638654809521955e-09, + "loss": 0.6044, + "step": 50145 + }, + { + "epoch": 0.97, + "learning_rate": 5.459982136616054e-09, + "loss": 0.0004, + "step": 50146 + }, + { + "epoch": 0.97, + "learning_rate": 5.456098792279911e-09, + "loss": 0.0004, + "step": 50147 + }, + { + "epoch": 0.97, + "learning_rate": 5.4522154479437694e-09, + "loss": 0.0004, + "step": 50148 + }, + { + "epoch": 0.97, + "learning_rate": 5.448332103607627e-09, + "loss": 0.0003, + "step": 50149 + }, + { + "epoch": 0.97, + "learning_rate": 5.444448759271484e-09, + "loss": 0.0005, + "step": 50150 + }, + { + "epoch": 0.97, + "learning_rate": 5.440565414935342e-09, + "loss": 0.0051, + "step": 50151 + }, + { + "epoch": 0.97, + "learning_rate": 5.436682070599199e-09, + "loss": 0.0004, + "step": 50152 + }, + { + "epoch": 0.97, + "learning_rate": 5.432798726263057e-09, + "loss": 0.3103, + "step": 50153 + }, + { + "epoch": 0.97, + "learning_rate": 5.428915381926915e-09, + "loss": 0.1622, + "step": 50154 + }, + { + "epoch": 0.97, + "learning_rate": 5.425032037590773e-09, + "loss": 0.6609, + "step": 50155 + }, + { + "epoch": 0.97, + "learning_rate": 5.4211486932546304e-09, + "loss": 0.0003, + "step": 50156 + }, + { + "epoch": 0.97, + "learning_rate": 5.417265348918489e-09, + "loss": 0.0006, + "step": 50157 + }, + { + "epoch": 0.97, + "learning_rate": 5.413382004582346e-09, + "loss": 0.0004, + "step": 50158 + }, + { + "epoch": 0.97, + "learning_rate": 5.409498660246204e-09, + "loss": 0.0003, + "step": 50159 + }, + { + "epoch": 0.97, + "learning_rate": 5.405615315910062e-09, + "loss": 0.0005, + "step": 50160 + }, + { + "epoch": 0.97, + "learning_rate": 5.401731971573919e-09, + "loss": 0.0004, + "step": 50161 + }, + { + "epoch": 0.97, + "learning_rate": 5.3978486272377766e-09, + "loss": 0.0004, + "step": 50162 + }, + { + "epoch": 0.97, + "learning_rate": 5.393965282901634e-09, + "loss": 0.0003, + "step": 50163 + }, + { + "epoch": 0.97, + "learning_rate": 5.390081938565492e-09, + "loss": 0.0003, + "step": 50164 + }, + { + "epoch": 0.97, + "learning_rate": 5.38619859422935e-09, + "loss": 0.0007, + "step": 50165 + }, + { + "epoch": 0.97, + "learning_rate": 5.382315249893208e-09, + "loss": 0.0003, + "step": 50166 + }, + { + "epoch": 0.97, + "learning_rate": 5.378431905557065e-09, + "loss": 0.0004, + "step": 50167 + }, + { + "epoch": 0.97, + "learning_rate": 5.3745485612209236e-09, + "loss": 0.0003, + "step": 50168 + }, + { + "epoch": 0.97, + "learning_rate": 5.370665216884781e-09, + "loss": 0.7484, + "step": 50169 + }, + { + "epoch": 0.97, + "learning_rate": 5.366781872548639e-09, + "loss": 0.0004, + "step": 50170 + }, + { + "epoch": 0.97, + "learning_rate": 5.362898528212497e-09, + "loss": 0.0004, + "step": 50171 + }, + { + "epoch": 0.97, + "learning_rate": 5.359015183876354e-09, + "loss": 0.0003, + "step": 50172 + }, + { + "epoch": 0.97, + "learning_rate": 5.355131839540212e-09, + "loss": 0.0003, + "step": 50173 + }, + { + "epoch": 0.97, + "learning_rate": 5.351248495204069e-09, + "loss": 0.0004, + "step": 50174 + }, + { + "epoch": 0.97, + "learning_rate": 5.347365150867927e-09, + "loss": 0.0003, + "step": 50175 + }, + { + "epoch": 0.97, + "learning_rate": 5.3434818065317846e-09, + "loss": 0.0006, + "step": 50176 + }, + { + "epoch": 0.97, + "learning_rate": 5.339598462195643e-09, + "loss": 0.0005, + "step": 50177 + }, + { + "epoch": 0.97, + "learning_rate": 5.3357151178595e-09, + "loss": 0.0006, + "step": 50178 + }, + { + "epoch": 0.97, + "learning_rate": 5.3318317735233585e-09, + "loss": 0.0002, + "step": 50179 + }, + { + "epoch": 0.97, + "learning_rate": 5.327948429187216e-09, + "loss": 0.0004, + "step": 50180 + }, + { + "epoch": 0.97, + "learning_rate": 5.324065084851073e-09, + "loss": 0.0004, + "step": 50181 + }, + { + "epoch": 0.97, + "learning_rate": 5.3201817405149315e-09, + "loss": 0.0004, + "step": 50182 + }, + { + "epoch": 0.97, + "learning_rate": 5.316298396178789e-09, + "loss": 0.2409, + "step": 50183 + }, + { + "epoch": 0.97, + "learning_rate": 5.312415051842647e-09, + "loss": 0.264, + "step": 50184 + }, + { + "epoch": 0.97, + "learning_rate": 5.308531707506504e-09, + "loss": 0.0003, + "step": 50185 + }, + { + "epoch": 0.97, + "learning_rate": 5.304648363170362e-09, + "loss": 0.0003, + "step": 50186 + }, + { + "epoch": 0.97, + "learning_rate": 5.3007650188342194e-09, + "loss": 0.0004, + "step": 50187 + }, + { + "epoch": 0.97, + "learning_rate": 5.296881674498078e-09, + "loss": 0.4283, + "step": 50188 + }, + { + "epoch": 0.97, + "learning_rate": 5.292998330161935e-09, + "loss": 0.0005, + "step": 50189 + }, + { + "epoch": 0.97, + "learning_rate": 5.2891149858257925e-09, + "loss": 0.0003, + "step": 50190 + }, + { + "epoch": 0.97, + "learning_rate": 5.285231641489651e-09, + "loss": 0.0004, + "step": 50191 + }, + { + "epoch": 0.97, + "learning_rate": 5.281348297153508e-09, + "loss": 0.0014, + "step": 50192 + }, + { + "epoch": 0.97, + "learning_rate": 5.2774649528173664e-09, + "loss": 0.0004, + "step": 50193 + }, + { + "epoch": 0.97, + "learning_rate": 5.273581608481224e-09, + "loss": 0.0009, + "step": 50194 + }, + { + "epoch": 0.97, + "learning_rate": 5.269698264145082e-09, + "loss": 0.0004, + "step": 50195 + }, + { + "epoch": 0.97, + "learning_rate": 5.2658149198089395e-09, + "loss": 0.5101, + "step": 50196 + }, + { + "epoch": 0.97, + "learning_rate": 5.261931575472797e-09, + "loss": 0.0003, + "step": 50197 + }, + { + "epoch": 0.97, + "learning_rate": 5.258048231136654e-09, + "loss": 0.0005, + "step": 50198 + }, + { + "epoch": 0.97, + "learning_rate": 5.254164886800513e-09, + "loss": 0.0004, + "step": 50199 + }, + { + "epoch": 0.97, + "learning_rate": 5.25028154246437e-09, + "loss": 0.0004, + "step": 50200 + }, + { + "epoch": 0.97, + "learning_rate": 5.2463981981282274e-09, + "loss": 0.0004, + "step": 50201 + }, + { + "epoch": 0.97, + "learning_rate": 5.242514853792086e-09, + "loss": 0.0011, + "step": 50202 + }, + { + "epoch": 0.97, + "learning_rate": 5.238631509455943e-09, + "loss": 0.0003, + "step": 50203 + }, + { + "epoch": 0.97, + "learning_rate": 5.234748165119801e-09, + "loss": 0.235, + "step": 50204 + }, + { + "epoch": 0.97, + "learning_rate": 5.230864820783659e-09, + "loss": 0.6751, + "step": 50205 + }, + { + "epoch": 0.97, + "learning_rate": 5.226981476447517e-09, + "loss": 0.0004, + "step": 50206 + }, + { + "epoch": 0.97, + "learning_rate": 5.223098132111374e-09, + "loss": 0.0003, + "step": 50207 + }, + { + "epoch": 0.97, + "learning_rate": 5.219214787775232e-09, + "loss": 0.7352, + "step": 50208 + }, + { + "epoch": 0.97, + "learning_rate": 5.215331443439089e-09, + "loss": 0.0003, + "step": 50209 + }, + { + "epoch": 0.97, + "learning_rate": 5.211448099102947e-09, + "loss": 0.0003, + "step": 50210 + }, + { + "epoch": 0.97, + "learning_rate": 5.207564754766805e-09, + "loss": 0.149, + "step": 50211 + }, + { + "epoch": 0.97, + "learning_rate": 5.203681410430662e-09, + "loss": 0.0003, + "step": 50212 + }, + { + "epoch": 0.97, + "learning_rate": 5.1997980660945206e-09, + "loss": 0.0006, + "step": 50213 + }, + { + "epoch": 0.97, + "learning_rate": 5.195914721758378e-09, + "loss": 0.0006, + "step": 50214 + }, + { + "epoch": 0.97, + "learning_rate": 5.192031377422236e-09, + "loss": 0.0004, + "step": 50215 + }, + { + "epoch": 0.97, + "learning_rate": 5.188148033086094e-09, + "loss": 0.0003, + "step": 50216 + }, + { + "epoch": 0.97, + "learning_rate": 5.184264688749952e-09, + "loss": 0.0004, + "step": 50217 + }, + { + "epoch": 0.97, + "learning_rate": 5.180381344413809e-09, + "loss": 0.0006, + "step": 50218 + }, + { + "epoch": 0.97, + "learning_rate": 5.176498000077667e-09, + "loss": 0.0003, + "step": 50219 + }, + { + "epoch": 0.97, + "learning_rate": 5.172614655741524e-09, + "loss": 0.0005, + "step": 50220 + }, + { + "epoch": 0.97, + "learning_rate": 5.1687313114053816e-09, + "loss": 0.0586, + "step": 50221 + }, + { + "epoch": 0.97, + "learning_rate": 5.16484796706924e-09, + "loss": 0.0003, + "step": 50222 + }, + { + "epoch": 0.97, + "learning_rate": 5.160964622733097e-09, + "loss": 0.0003, + "step": 50223 + }, + { + "epoch": 0.97, + "learning_rate": 5.1570812783969555e-09, + "loss": 0.0005, + "step": 50224 + }, + { + "epoch": 0.97, + "learning_rate": 5.153197934060813e-09, + "loss": 0.002, + "step": 50225 + }, + { + "epoch": 0.97, + "learning_rate": 5.149314589724671e-09, + "loss": 0.0004, + "step": 50226 + }, + { + "epoch": 0.97, + "learning_rate": 5.1454312453885285e-09, + "loss": 0.0004, + "step": 50227 + }, + { + "epoch": 0.97, + "learning_rate": 5.141547901052387e-09, + "loss": 0.0003, + "step": 50228 + }, + { + "epoch": 0.97, + "learning_rate": 5.137664556716244e-09, + "loss": 0.0005, + "step": 50229 + }, + { + "epoch": 0.97, + "learning_rate": 5.133781212380102e-09, + "loss": 0.0004, + "step": 50230 + }, + { + "epoch": 0.97, + "learning_rate": 5.129897868043959e-09, + "loss": 0.0004, + "step": 50231 + }, + { + "epoch": 0.97, + "learning_rate": 5.1260145237078165e-09, + "loss": 0.7995, + "step": 50232 + }, + { + "epoch": 0.97, + "learning_rate": 5.122131179371675e-09, + "loss": 0.8347, + "step": 50233 + }, + { + "epoch": 0.97, + "learning_rate": 5.118247835035532e-09, + "loss": 0.0003, + "step": 50234 + }, + { + "epoch": 0.97, + "learning_rate": 5.11436449069939e-09, + "loss": 0.0003, + "step": 50235 + }, + { + "epoch": 0.97, + "learning_rate": 5.110481146363248e-09, + "loss": 0.0004, + "step": 50236 + }, + { + "epoch": 0.97, + "learning_rate": 5.106597802027106e-09, + "loss": 0.0003, + "step": 50237 + }, + { + "epoch": 0.97, + "learning_rate": 5.1027144576909634e-09, + "loss": 0.0012, + "step": 50238 + }, + { + "epoch": 0.97, + "learning_rate": 5.098831113354821e-09, + "loss": 1.2205, + "step": 50239 + }, + { + "epoch": 0.97, + "learning_rate": 5.094947769018679e-09, + "loss": 0.0003, + "step": 50240 + }, + { + "epoch": 0.97, + "learning_rate": 5.0910644246825365e-09, + "loss": 0.0003, + "step": 50241 + }, + { + "epoch": 0.97, + "learning_rate": 5.087181080346394e-09, + "loss": 0.0004, + "step": 50242 + }, + { + "epoch": 0.97, + "learning_rate": 5.083297736010251e-09, + "loss": 0.0003, + "step": 50243 + }, + { + "epoch": 0.97, + "learning_rate": 5.07941439167411e-09, + "loss": 0.0003, + "step": 50244 + }, + { + "epoch": 0.97, + "learning_rate": 5.075531047337967e-09, + "loss": 0.0007, + "step": 50245 + }, + { + "epoch": 0.97, + "learning_rate": 5.071647703001825e-09, + "loss": 0.0005, + "step": 50246 + }, + { + "epoch": 0.97, + "learning_rate": 5.067764358665683e-09, + "loss": 0.0149, + "step": 50247 + }, + { + "epoch": 0.97, + "learning_rate": 5.06388101432954e-09, + "loss": 0.0004, + "step": 50248 + }, + { + "epoch": 0.97, + "learning_rate": 5.059997669993398e-09, + "loss": 0.0006, + "step": 50249 + }, + { + "epoch": 0.97, + "learning_rate": 5.056114325657256e-09, + "loss": 1.1, + "step": 50250 + }, + { + "epoch": 0.97, + "learning_rate": 5.052230981321114e-09, + "loss": 0.0004, + "step": 50251 + }, + { + "epoch": 0.97, + "learning_rate": 5.0483476369849714e-09, + "loss": 0.0004, + "step": 50252 + }, + { + "epoch": 0.97, + "learning_rate": 5.044464292648829e-09, + "loss": 0.0003, + "step": 50253 + }, + { + "epoch": 0.97, + "learning_rate": 5.040580948312686e-09, + "loss": 0.0003, + "step": 50254 + }, + { + "epoch": 0.97, + "learning_rate": 5.0366976039765445e-09, + "loss": 0.0004, + "step": 50255 + }, + { + "epoch": 0.97, + "learning_rate": 5.032814259640402e-09, + "loss": 0.0004, + "step": 50256 + }, + { + "epoch": 0.97, + "learning_rate": 5.02893091530426e-09, + "loss": 0.0002, + "step": 50257 + }, + { + "epoch": 0.97, + "learning_rate": 5.0250475709681176e-09, + "loss": 0.0003, + "step": 50258 + }, + { + "epoch": 0.97, + "learning_rate": 5.021164226631975e-09, + "loss": 0.0003, + "step": 50259 + }, + { + "epoch": 0.97, + "learning_rate": 5.017280882295833e-09, + "loss": 0.0003, + "step": 50260 + }, + { + "epoch": 0.97, + "learning_rate": 5.013397537959691e-09, + "loss": 0.0006, + "step": 50261 + }, + { + "epoch": 0.97, + "learning_rate": 5.009514193623549e-09, + "loss": 0.0004, + "step": 50262 + }, + { + "epoch": 0.97, + "learning_rate": 5.005630849287406e-09, + "loss": 0.2832, + "step": 50263 + }, + { + "epoch": 0.98, + "learning_rate": 5.001747504951264e-09, + "loss": 0.0004, + "step": 50264 + }, + { + "epoch": 0.98, + "learning_rate": 4.997864160615121e-09, + "loss": 0.0003, + "step": 50265 + }, + { + "epoch": 0.98, + "learning_rate": 4.993980816278979e-09, + "loss": 0.0004, + "step": 50266 + }, + { + "epoch": 0.98, + "learning_rate": 4.990097471942837e-09, + "loss": 0.0007, + "step": 50267 + }, + { + "epoch": 0.98, + "learning_rate": 4.986214127606694e-09, + "loss": 0.0004, + "step": 50268 + }, + { + "epoch": 0.98, + "learning_rate": 4.9823307832705525e-09, + "loss": 0.0004, + "step": 50269 + }, + { + "epoch": 0.98, + "learning_rate": 4.97844743893441e-09, + "loss": 0.7039, + "step": 50270 + }, + { + "epoch": 0.98, + "learning_rate": 4.974564094598268e-09, + "loss": 0.0005, + "step": 50271 + }, + { + "epoch": 0.98, + "learning_rate": 4.9706807502621255e-09, + "loss": 0.2086, + "step": 50272 + }, + { + "epoch": 0.98, + "learning_rate": 4.966797405925984e-09, + "loss": 0.1047, + "step": 50273 + }, + { + "epoch": 0.98, + "learning_rate": 4.962914061589841e-09, + "loss": 0.0003, + "step": 50274 + }, + { + "epoch": 0.98, + "learning_rate": 4.959030717253699e-09, + "loss": 0.0003, + "step": 50275 + }, + { + "epoch": 0.98, + "learning_rate": 4.955147372917556e-09, + "loss": 0.0004, + "step": 50276 + }, + { + "epoch": 0.98, + "learning_rate": 4.9512640285814135e-09, + "loss": 0.3456, + "step": 50277 + }, + { + "epoch": 0.98, + "learning_rate": 4.947380684245272e-09, + "loss": 0.0004, + "step": 50278 + }, + { + "epoch": 0.98, + "learning_rate": 4.943497339909129e-09, + "loss": 0.0003, + "step": 50279 + }, + { + "epoch": 0.98, + "learning_rate": 4.939613995572987e-09, + "loss": 0.0004, + "step": 50280 + }, + { + "epoch": 0.98, + "learning_rate": 4.935730651236845e-09, + "loss": 0.0003, + "step": 50281 + }, + { + "epoch": 0.98, + "learning_rate": 4.931847306900703e-09, + "loss": 0.0004, + "step": 50282 + }, + { + "epoch": 0.98, + "learning_rate": 4.9279639625645604e-09, + "loss": 0.0748, + "step": 50283 + }, + { + "epoch": 0.98, + "learning_rate": 4.924080618228419e-09, + "loss": 0.0004, + "step": 50284 + }, + { + "epoch": 0.98, + "learning_rate": 4.920197273892276e-09, + "loss": 0.8221, + "step": 50285 + }, + { + "epoch": 0.98, + "learning_rate": 4.9163139295561335e-09, + "loss": 0.0004, + "step": 50286 + }, + { + "epoch": 0.98, + "learning_rate": 4.912430585219991e-09, + "loss": 0.0003, + "step": 50287 + }, + { + "epoch": 0.98, + "learning_rate": 4.908547240883848e-09, + "loss": 0.0004, + "step": 50288 + }, + { + "epoch": 0.98, + "learning_rate": 4.904663896547707e-09, + "loss": 0.0004, + "step": 50289 + }, + { + "epoch": 0.98, + "learning_rate": 4.900780552211564e-09, + "loss": 0.0004, + "step": 50290 + }, + { + "epoch": 0.98, + "learning_rate": 4.896897207875422e-09, + "loss": 0.0009, + "step": 50291 + }, + { + "epoch": 0.98, + "learning_rate": 4.89301386353928e-09, + "loss": 0.0002, + "step": 50292 + }, + { + "epoch": 0.98, + "learning_rate": 4.889130519203138e-09, + "loss": 0.0004, + "step": 50293 + }, + { + "epoch": 0.98, + "learning_rate": 4.885247174866995e-09, + "loss": 0.0002, + "step": 50294 + }, + { + "epoch": 0.98, + "learning_rate": 4.881363830530854e-09, + "loss": 0.2921, + "step": 50295 + }, + { + "epoch": 0.98, + "learning_rate": 4.877480486194711e-09, + "loss": 1.2388, + "step": 50296 + }, + { + "epoch": 0.98, + "learning_rate": 4.8735971418585684e-09, + "loss": 0.0004, + "step": 50297 + }, + { + "epoch": 0.98, + "learning_rate": 4.869713797522426e-09, + "loss": 0.0003, + "step": 50298 + }, + { + "epoch": 0.98, + "learning_rate": 4.865830453186283e-09, + "loss": 0.0003, + "step": 50299 + }, + { + "epoch": 0.98, + "learning_rate": 4.8619471088501415e-09, + "loss": 0.0012, + "step": 50300 + }, + { + "epoch": 0.98, + "learning_rate": 4.858063764513999e-09, + "loss": 0.0003, + "step": 50301 + }, + { + "epoch": 0.98, + "learning_rate": 4.854180420177857e-09, + "loss": 0.0004, + "step": 50302 + }, + { + "epoch": 0.98, + "learning_rate": 4.8502970758417146e-09, + "loss": 0.0003, + "step": 50303 + }, + { + "epoch": 0.98, + "learning_rate": 4.846413731505573e-09, + "loss": 0.7123, + "step": 50304 + }, + { + "epoch": 0.98, + "learning_rate": 4.84253038716943e-09, + "loss": 0.0013, + "step": 50305 + }, + { + "epoch": 0.98, + "learning_rate": 4.838647042833288e-09, + "loss": 0.0004, + "step": 50306 + }, + { + "epoch": 0.98, + "learning_rate": 4.834763698497146e-09, + "loss": 0.0004, + "step": 50307 + }, + { + "epoch": 0.98, + "learning_rate": 4.830880354161003e-09, + "loss": 0.0004, + "step": 50308 + }, + { + "epoch": 0.98, + "learning_rate": 4.826997009824861e-09, + "loss": 0.6467, + "step": 50309 + }, + { + "epoch": 0.98, + "learning_rate": 4.823113665488718e-09, + "loss": 0.6981, + "step": 50310 + }, + { + "epoch": 0.98, + "learning_rate": 4.819230321152576e-09, + "loss": 0.0003, + "step": 50311 + }, + { + "epoch": 0.98, + "learning_rate": 4.815346976816434e-09, + "loss": 0.0003, + "step": 50312 + }, + { + "epoch": 0.98, + "learning_rate": 4.811463632480292e-09, + "loss": 0.0003, + "step": 50313 + }, + { + "epoch": 0.98, + "learning_rate": 4.8075802881441495e-09, + "loss": 0.0003, + "step": 50314 + }, + { + "epoch": 0.98, + "learning_rate": 4.803696943808008e-09, + "loss": 0.0068, + "step": 50315 + }, + { + "epoch": 0.98, + "learning_rate": 4.799813599471865e-09, + "loss": 0.5712, + "step": 50316 + }, + { + "epoch": 0.98, + "learning_rate": 4.7959302551357226e-09, + "loss": 0.0003, + "step": 50317 + }, + { + "epoch": 0.98, + "learning_rate": 4.792046910799581e-09, + "loss": 0.0003, + "step": 50318 + }, + { + "epoch": 0.98, + "learning_rate": 4.788163566463438e-09, + "loss": 1.0283, + "step": 50319 + }, + { + "epoch": 0.98, + "learning_rate": 4.784280222127296e-09, + "loss": 0.0005, + "step": 50320 + }, + { + "epoch": 0.98, + "learning_rate": 4.780396877791153e-09, + "loss": 0.0004, + "step": 50321 + }, + { + "epoch": 0.98, + "learning_rate": 4.776513533455011e-09, + "loss": 0.0005, + "step": 50322 + }, + { + "epoch": 0.98, + "learning_rate": 4.772630189118869e-09, + "loss": 0.0003, + "step": 50323 + }, + { + "epoch": 0.98, + "learning_rate": 4.768746844782727e-09, + "loss": 0.0003, + "step": 50324 + }, + { + "epoch": 0.98, + "learning_rate": 4.764863500446584e-09, + "loss": 0.0005, + "step": 50325 + }, + { + "epoch": 0.98, + "learning_rate": 4.760980156110442e-09, + "loss": 0.1142, + "step": 50326 + }, + { + "epoch": 0.98, + "learning_rate": 4.7570968117743e-09, + "loss": 0.0004, + "step": 50327 + }, + { + "epoch": 0.98, + "learning_rate": 4.7532134674381575e-09, + "loss": 0.3262, + "step": 50328 + }, + { + "epoch": 0.98, + "learning_rate": 4.749330123102016e-09, + "loss": 0.0003, + "step": 50329 + }, + { + "epoch": 0.98, + "learning_rate": 4.745446778765873e-09, + "loss": 0.0006, + "step": 50330 + }, + { + "epoch": 0.98, + "learning_rate": 4.7415634344297305e-09, + "loss": 0.0004, + "step": 50331 + }, + { + "epoch": 0.98, + "learning_rate": 4.737680090093588e-09, + "loss": 0.0004, + "step": 50332 + }, + { + "epoch": 0.98, + "learning_rate": 4.733796745757446e-09, + "loss": 0.0395, + "step": 50333 + }, + { + "epoch": 0.98, + "learning_rate": 4.729913401421304e-09, + "loss": 0.0004, + "step": 50334 + }, + { + "epoch": 0.98, + "learning_rate": 4.726030057085161e-09, + "loss": 0.0003, + "step": 50335 + }, + { + "epoch": 0.98, + "learning_rate": 4.722146712749019e-09, + "loss": 0.0003, + "step": 50336 + }, + { + "epoch": 0.98, + "learning_rate": 4.718263368412877e-09, + "loss": 0.0003, + "step": 50337 + }, + { + "epoch": 0.98, + "learning_rate": 4.714380024076735e-09, + "loss": 0.0008, + "step": 50338 + }, + { + "epoch": 0.98, + "learning_rate": 4.710496679740592e-09, + "loss": 0.0005, + "step": 50339 + }, + { + "epoch": 0.98, + "learning_rate": 4.706613335404451e-09, + "loss": 0.0005, + "step": 50340 + }, + { + "epoch": 0.98, + "learning_rate": 4.702729991068308e-09, + "loss": 0.0005, + "step": 50341 + }, + { + "epoch": 0.98, + "learning_rate": 4.6988466467321654e-09, + "loss": 0.0004, + "step": 50342 + }, + { + "epoch": 0.98, + "learning_rate": 4.694963302396023e-09, + "loss": 0.0172, + "step": 50343 + }, + { + "epoch": 0.98, + "learning_rate": 4.691079958059881e-09, + "loss": 0.1673, + "step": 50344 + }, + { + "epoch": 0.98, + "learning_rate": 4.6871966137237385e-09, + "loss": 0.1425, + "step": 50345 + }, + { + "epoch": 0.98, + "learning_rate": 4.683313269387596e-09, + "loss": 0.0777, + "step": 50346 + }, + { + "epoch": 0.98, + "learning_rate": 4.679429925051454e-09, + "loss": 0.0004, + "step": 50347 + }, + { + "epoch": 0.98, + "learning_rate": 4.6755465807153116e-09, + "loss": 0.0006, + "step": 50348 + }, + { + "epoch": 0.98, + "learning_rate": 4.67166323637917e-09, + "loss": 0.0005, + "step": 50349 + }, + { + "epoch": 0.98, + "learning_rate": 4.667779892043027e-09, + "loss": 0.0039, + "step": 50350 + }, + { + "epoch": 0.98, + "learning_rate": 4.6638965477068855e-09, + "loss": 0.0005, + "step": 50351 + }, + { + "epoch": 0.98, + "learning_rate": 4.660013203370743e-09, + "loss": 0.0004, + "step": 50352 + }, + { + "epoch": 0.98, + "learning_rate": 4.6561298590346e-09, + "loss": 0.6053, + "step": 50353 + }, + { + "epoch": 0.98, + "learning_rate": 4.652246514698458e-09, + "loss": 0.0004, + "step": 50354 + }, + { + "epoch": 0.98, + "learning_rate": 4.648363170362315e-09, + "loss": 0.8508, + "step": 50355 + }, + { + "epoch": 0.98, + "learning_rate": 4.644479826026173e-09, + "loss": 0.0008, + "step": 50356 + }, + { + "epoch": 0.98, + "learning_rate": 4.640596481690031e-09, + "loss": 0.0003, + "step": 50357 + }, + { + "epoch": 0.98, + "learning_rate": 4.636713137353889e-09, + "loss": 0.0011, + "step": 50358 + }, + { + "epoch": 0.98, + "learning_rate": 4.6328297930177465e-09, + "loss": 0.0003, + "step": 50359 + }, + { + "epoch": 0.98, + "learning_rate": 4.628946448681605e-09, + "loss": 0.0002, + "step": 50360 + }, + { + "epoch": 0.98, + "learning_rate": 4.625063104345462e-09, + "loss": 0.0003, + "step": 50361 + }, + { + "epoch": 0.98, + "learning_rate": 4.62117976000932e-09, + "loss": 0.0004, + "step": 50362 + }, + { + "epoch": 0.98, + "learning_rate": 4.617296415673178e-09, + "loss": 0.0003, + "step": 50363 + }, + { + "epoch": 0.98, + "learning_rate": 4.613413071337035e-09, + "loss": 0.0962, + "step": 50364 + }, + { + "epoch": 0.98, + "learning_rate": 4.609529727000893e-09, + "loss": 0.0002, + "step": 50365 + }, + { + "epoch": 0.98, + "learning_rate": 4.60564638266475e-09, + "loss": 0.0004, + "step": 50366 + }, + { + "epoch": 0.98, + "learning_rate": 4.601763038328608e-09, + "loss": 0.3864, + "step": 50367 + }, + { + "epoch": 0.98, + "learning_rate": 4.597879693992466e-09, + "loss": 0.0005, + "step": 50368 + }, + { + "epoch": 0.98, + "learning_rate": 4.593996349656324e-09, + "loss": 0.0028, + "step": 50369 + }, + { + "epoch": 0.98, + "learning_rate": 4.590113005320181e-09, + "loss": 0.0004, + "step": 50370 + }, + { + "epoch": 0.98, + "learning_rate": 4.58622966098404e-09, + "loss": 0.0002, + "step": 50371 + }, + { + "epoch": 0.98, + "learning_rate": 4.582346316647897e-09, + "loss": 0.0005, + "step": 50372 + }, + { + "epoch": 0.98, + "learning_rate": 4.578462972311755e-09, + "loss": 0.0005, + "step": 50373 + }, + { + "epoch": 0.98, + "learning_rate": 4.574579627975613e-09, + "loss": 0.0006, + "step": 50374 + }, + { + "epoch": 0.98, + "learning_rate": 4.57069628363947e-09, + "loss": 0.0004, + "step": 50375 + }, + { + "epoch": 0.98, + "learning_rate": 4.5668129393033275e-09, + "loss": 0.0013, + "step": 50376 + }, + { + "epoch": 0.98, + "learning_rate": 4.562929594967185e-09, + "loss": 0.0012, + "step": 50377 + }, + { + "epoch": 0.98, + "learning_rate": 4.559046250631043e-09, + "loss": 0.0004, + "step": 50378 + }, + { + "epoch": 0.98, + "learning_rate": 4.555162906294901e-09, + "loss": 0.0003, + "step": 50379 + }, + { + "epoch": 0.98, + "learning_rate": 4.551279561958759e-09, + "loss": 0.0004, + "step": 50380 + }, + { + "epoch": 0.98, + "learning_rate": 4.547396217622616e-09, + "loss": 0.0004, + "step": 50381 + }, + { + "epoch": 0.98, + "learning_rate": 4.5435128732864745e-09, + "loss": 1.0803, + "step": 50382 + }, + { + "epoch": 0.98, + "learning_rate": 4.539629528950332e-09, + "loss": 0.0009, + "step": 50383 + }, + { + "epoch": 0.98, + "learning_rate": 4.535746184614189e-09, + "loss": 0.0007, + "step": 50384 + }, + { + "epoch": 0.98, + "learning_rate": 4.531862840278048e-09, + "loss": 0.0005, + "step": 50385 + }, + { + "epoch": 0.98, + "learning_rate": 4.527979495941905e-09, + "loss": 0.0004, + "step": 50386 + }, + { + "epoch": 0.98, + "learning_rate": 4.5240961516057624e-09, + "loss": 0.0004, + "step": 50387 + }, + { + "epoch": 0.98, + "learning_rate": 4.52021280726962e-09, + "loss": 0.0004, + "step": 50388 + }, + { + "epoch": 0.98, + "learning_rate": 4.516329462933478e-09, + "loss": 0.0004, + "step": 50389 + }, + { + "epoch": 0.98, + "learning_rate": 4.5124461185973355e-09, + "loss": 0.0005, + "step": 50390 + }, + { + "epoch": 0.98, + "learning_rate": 4.508562774261194e-09, + "loss": 0.0003, + "step": 50391 + }, + { + "epoch": 0.98, + "learning_rate": 4.504679429925051e-09, + "loss": 0.0005, + "step": 50392 + }, + { + "epoch": 0.98, + "learning_rate": 4.500796085588909e-09, + "loss": 0.0004, + "step": 50393 + }, + { + "epoch": 0.98, + "learning_rate": 4.496912741252767e-09, + "loss": 0.0007, + "step": 50394 + }, + { + "epoch": 0.98, + "learning_rate": 4.493029396916624e-09, + "loss": 0.0006, + "step": 50395 + }, + { + "epoch": 0.98, + "learning_rate": 4.4891460525804825e-09, + "loss": 0.0002, + "step": 50396 + }, + { + "epoch": 0.98, + "learning_rate": 4.48526270824434e-09, + "loss": 0.194, + "step": 50397 + }, + { + "epoch": 0.98, + "learning_rate": 4.481379363908197e-09, + "loss": 0.0004, + "step": 50398 + }, + { + "epoch": 0.98, + "learning_rate": 4.477496019572055e-09, + "loss": 0.0004, + "step": 50399 + }, + { + "epoch": 0.98, + "learning_rate": 4.473612675235913e-09, + "loss": 0.0003, + "step": 50400 + }, + { + "epoch": 0.98, + "learning_rate": 4.46972933089977e-09, + "loss": 0.0023, + "step": 50401 + }, + { + "epoch": 0.98, + "learning_rate": 4.465845986563629e-09, + "loss": 1.0995, + "step": 50402 + }, + { + "epoch": 0.98, + "learning_rate": 4.461962642227486e-09, + "loss": 0.0003, + "step": 50403 + }, + { + "epoch": 0.98, + "learning_rate": 4.4580792978913435e-09, + "loss": 0.0005, + "step": 50404 + }, + { + "epoch": 0.98, + "learning_rate": 4.454195953555202e-09, + "loss": 0.0004, + "step": 50405 + }, + { + "epoch": 0.98, + "learning_rate": 4.450312609219059e-09, + "loss": 0.0004, + "step": 50406 + }, + { + "epoch": 0.98, + "learning_rate": 4.446429264882917e-09, + "loss": 0.0004, + "step": 50407 + }, + { + "epoch": 0.98, + "learning_rate": 4.442545920546775e-09, + "loss": 0.0003, + "step": 50408 + }, + { + "epoch": 0.98, + "learning_rate": 4.438662576210632e-09, + "loss": 0.0003, + "step": 50409 + }, + { + "epoch": 0.98, + "learning_rate": 4.43477923187449e-09, + "loss": 0.0004, + "step": 50410 + }, + { + "epoch": 0.98, + "learning_rate": 4.430895887538348e-09, + "loss": 0.0003, + "step": 50411 + }, + { + "epoch": 0.98, + "learning_rate": 4.427012543202205e-09, + "loss": 1.355, + "step": 50412 + }, + { + "epoch": 0.98, + "learning_rate": 4.423129198866063e-09, + "loss": 0.0005, + "step": 50413 + }, + { + "epoch": 0.98, + "learning_rate": 4.419245854529921e-09, + "loss": 0.0007, + "step": 50414 + }, + { + "epoch": 0.98, + "learning_rate": 4.415362510193778e-09, + "loss": 0.0054, + "step": 50415 + }, + { + "epoch": 0.98, + "learning_rate": 4.411479165857637e-09, + "loss": 0.0003, + "step": 50416 + }, + { + "epoch": 0.98, + "learning_rate": 4.407595821521494e-09, + "loss": 0.0004, + "step": 50417 + }, + { + "epoch": 0.98, + "learning_rate": 4.403712477185352e-09, + "loss": 0.0002, + "step": 50418 + }, + { + "epoch": 0.98, + "learning_rate": 4.39982913284921e-09, + "loss": 0.0004, + "step": 50419 + }, + { + "epoch": 0.98, + "learning_rate": 4.395945788513068e-09, + "loss": 0.0005, + "step": 50420 + }, + { + "epoch": 0.98, + "learning_rate": 4.3920624441769245e-09, + "loss": 1.2446, + "step": 50421 + }, + { + "epoch": 0.98, + "learning_rate": 4.388179099840782e-09, + "loss": 0.0004, + "step": 50422 + }, + { + "epoch": 0.98, + "learning_rate": 4.38429575550464e-09, + "loss": 0.9132, + "step": 50423 + }, + { + "epoch": 0.98, + "learning_rate": 4.380412411168498e-09, + "loss": 0.0004, + "step": 50424 + }, + { + "epoch": 0.98, + "learning_rate": 4.376529066832356e-09, + "loss": 0.0004, + "step": 50425 + }, + { + "epoch": 0.98, + "learning_rate": 4.372645722496213e-09, + "loss": 0.0002, + "step": 50426 + }, + { + "epoch": 0.98, + "learning_rate": 4.3687623781600715e-09, + "loss": 0.8718, + "step": 50427 + }, + { + "epoch": 0.98, + "learning_rate": 4.364879033823929e-09, + "loss": 0.0004, + "step": 50428 + }, + { + "epoch": 0.98, + "learning_rate": 4.360995689487787e-09, + "loss": 0.0003, + "step": 50429 + }, + { + "epoch": 0.98, + "learning_rate": 4.357112345151645e-09, + "loss": 0.0004, + "step": 50430 + }, + { + "epoch": 0.98, + "learning_rate": 4.353229000815503e-09, + "loss": 0.0005, + "step": 50431 + }, + { + "epoch": 0.98, + "learning_rate": 4.34934565647936e-09, + "loss": 0.0004, + "step": 50432 + }, + { + "epoch": 0.98, + "learning_rate": 4.345462312143217e-09, + "loss": 0.0005, + "step": 50433 + }, + { + "epoch": 0.98, + "learning_rate": 4.341578967807075e-09, + "loss": 0.0004, + "step": 50434 + }, + { + "epoch": 0.98, + "learning_rate": 4.3376956234709325e-09, + "loss": 0.0003, + "step": 50435 + }, + { + "epoch": 0.98, + "learning_rate": 4.333812279134791e-09, + "loss": 0.0003, + "step": 50436 + }, + { + "epoch": 0.98, + "learning_rate": 4.329928934798648e-09, + "loss": 0.0003, + "step": 50437 + }, + { + "epoch": 0.98, + "learning_rate": 4.3260455904625064e-09, + "loss": 0.0004, + "step": 50438 + }, + { + "epoch": 0.98, + "learning_rate": 4.322162246126364e-09, + "loss": 0.0003, + "step": 50439 + }, + { + "epoch": 0.98, + "learning_rate": 4.318278901790222e-09, + "loss": 0.0003, + "step": 50440 + }, + { + "epoch": 0.98, + "learning_rate": 4.3143955574540795e-09, + "loss": 0.0004, + "step": 50441 + }, + { + "epoch": 0.98, + "learning_rate": 4.310512213117937e-09, + "loss": 1.0039, + "step": 50442 + }, + { + "epoch": 0.98, + "learning_rate": 4.306628868781795e-09, + "loss": 0.0003, + "step": 50443 + }, + { + "epoch": 0.98, + "learning_rate": 4.3027455244456526e-09, + "loss": 0.0004, + "step": 50444 + }, + { + "epoch": 0.98, + "learning_rate": 4.29886218010951e-09, + "loss": 0.0005, + "step": 50445 + }, + { + "epoch": 0.98, + "learning_rate": 4.2949788357733674e-09, + "loss": 0.0004, + "step": 50446 + }, + { + "epoch": 0.98, + "learning_rate": 4.291095491437226e-09, + "loss": 0.0004, + "step": 50447 + }, + { + "epoch": 0.98, + "learning_rate": 4.287212147101083e-09, + "loss": 0.0003, + "step": 50448 + }, + { + "epoch": 0.98, + "learning_rate": 4.283328802764941e-09, + "loss": 1.0646, + "step": 50449 + }, + { + "epoch": 0.98, + "learning_rate": 4.279445458428799e-09, + "loss": 0.0005, + "step": 50450 + }, + { + "epoch": 0.98, + "learning_rate": 4.275562114092656e-09, + "loss": 0.0007, + "step": 50451 + }, + { + "epoch": 0.98, + "learning_rate": 4.271678769756514e-09, + "loss": 1.1817, + "step": 50452 + }, + { + "epoch": 0.98, + "learning_rate": 4.267795425420372e-09, + "loss": 0.0004, + "step": 50453 + }, + { + "epoch": 0.98, + "learning_rate": 4.26391208108423e-09, + "loss": 0.0004, + "step": 50454 + }, + { + "epoch": 0.98, + "learning_rate": 4.2600287367480875e-09, + "loss": 0.0029, + "step": 50455 + }, + { + "epoch": 0.98, + "learning_rate": 4.256145392411945e-09, + "loss": 0.0003, + "step": 50456 + }, + { + "epoch": 0.98, + "learning_rate": 4.252262048075802e-09, + "loss": 1.3535, + "step": 50457 + }, + { + "epoch": 0.98, + "learning_rate": 4.2483787037396606e-09, + "loss": 0.0003, + "step": 50458 + }, + { + "epoch": 0.98, + "learning_rate": 4.244495359403518e-09, + "loss": 0.0004, + "step": 50459 + }, + { + "epoch": 0.98, + "learning_rate": 4.240612015067376e-09, + "loss": 0.0003, + "step": 50460 + }, + { + "epoch": 0.98, + "learning_rate": 4.236728670731234e-09, + "loss": 0.0004, + "step": 50461 + }, + { + "epoch": 0.98, + "learning_rate": 4.232845326395091e-09, + "loss": 0.0005, + "step": 50462 + }, + { + "epoch": 0.98, + "learning_rate": 4.228961982058949e-09, + "loss": 0.0004, + "step": 50463 + }, + { + "epoch": 0.98, + "learning_rate": 4.225078637722807e-09, + "loss": 0.0002, + "step": 50464 + }, + { + "epoch": 0.98, + "learning_rate": 4.221195293386665e-09, + "loss": 0.0005, + "step": 50465 + }, + { + "epoch": 0.98, + "learning_rate": 4.217311949050522e-09, + "loss": 0.0003, + "step": 50466 + }, + { + "epoch": 0.98, + "learning_rate": 4.21342860471438e-09, + "loss": 0.0005, + "step": 50467 + }, + { + "epoch": 0.98, + "learning_rate": 4.209545260378237e-09, + "loss": 0.9068, + "step": 50468 + }, + { + "epoch": 0.98, + "learning_rate": 4.2056619160420955e-09, + "loss": 0.0003, + "step": 50469 + }, + { + "epoch": 0.98, + "learning_rate": 4.201778571705953e-09, + "loss": 0.0003, + "step": 50470 + }, + { + "epoch": 0.98, + "learning_rate": 4.19789522736981e-09, + "loss": 0.0993, + "step": 50471 + }, + { + "epoch": 0.98, + "learning_rate": 4.1940118830336685e-09, + "loss": 0.0005, + "step": 50472 + }, + { + "epoch": 0.98, + "learning_rate": 4.190128538697526e-09, + "loss": 0.0004, + "step": 50473 + }, + { + "epoch": 0.98, + "learning_rate": 4.186245194361384e-09, + "loss": 0.0003, + "step": 50474 + }, + { + "epoch": 0.98, + "learning_rate": 4.182361850025242e-09, + "loss": 0.272, + "step": 50475 + }, + { + "epoch": 0.98, + "learning_rate": 4.1784785056891e-09, + "loss": 0.0006, + "step": 50476 + }, + { + "epoch": 0.98, + "learning_rate": 4.174595161352957e-09, + "loss": 0.0004, + "step": 50477 + }, + { + "epoch": 0.98, + "learning_rate": 4.170711817016815e-09, + "loss": 0.0002, + "step": 50478 + }, + { + "epoch": 0.98, + "learning_rate": 4.166828472680672e-09, + "loss": 0.0003, + "step": 50479 + }, + { + "epoch": 0.98, + "learning_rate": 4.1629451283445295e-09, + "loss": 0.0003, + "step": 50480 + }, + { + "epoch": 0.98, + "learning_rate": 4.159061784008388e-09, + "loss": 0.0004, + "step": 50481 + }, + { + "epoch": 0.98, + "learning_rate": 4.155178439672245e-09, + "loss": 0.0019, + "step": 50482 + }, + { + "epoch": 0.98, + "learning_rate": 4.1512950953361034e-09, + "loss": 0.0005, + "step": 50483 + }, + { + "epoch": 0.98, + "learning_rate": 4.147411750999961e-09, + "loss": 0.0095, + "step": 50484 + }, + { + "epoch": 0.98, + "learning_rate": 4.143528406663819e-09, + "loss": 0.0003, + "step": 50485 + }, + { + "epoch": 0.98, + "learning_rate": 4.1396450623276765e-09, + "loss": 0.0009, + "step": 50486 + }, + { + "epoch": 0.98, + "learning_rate": 4.135761717991535e-09, + "loss": 0.0004, + "step": 50487 + }, + { + "epoch": 0.98, + "learning_rate": 4.131878373655392e-09, + "loss": 0.0045, + "step": 50488 + }, + { + "epoch": 0.98, + "learning_rate": 4.12799502931925e-09, + "loss": 0.0009, + "step": 50489 + }, + { + "epoch": 0.98, + "learning_rate": 4.124111684983107e-09, + "loss": 0.0004, + "step": 50490 + }, + { + "epoch": 0.98, + "learning_rate": 4.1202283406469644e-09, + "loss": 0.0003, + "step": 50491 + }, + { + "epoch": 0.98, + "learning_rate": 4.116344996310823e-09, + "loss": 0.0003, + "step": 50492 + }, + { + "epoch": 0.98, + "learning_rate": 4.11246165197468e-09, + "loss": 0.0003, + "step": 50493 + }, + { + "epoch": 0.98, + "learning_rate": 4.108578307638538e-09, + "loss": 0.0003, + "step": 50494 + }, + { + "epoch": 0.98, + "learning_rate": 4.104694963302396e-09, + "loss": 0.0005, + "step": 50495 + }, + { + "epoch": 0.98, + "learning_rate": 4.100811618966254e-09, + "loss": 0.0004, + "step": 50496 + }, + { + "epoch": 0.98, + "learning_rate": 4.096928274630111e-09, + "loss": 0.0005, + "step": 50497 + }, + { + "epoch": 0.98, + "learning_rate": 4.09304493029397e-09, + "loss": 0.0005, + "step": 50498 + }, + { + "epoch": 0.98, + "learning_rate": 4.089161585957827e-09, + "loss": 0.0003, + "step": 50499 + }, + { + "epoch": 0.98, + "learning_rate": 4.0852782416216845e-09, + "loss": 0.8353, + "step": 50500 + }, + { + "epoch": 0.98, + "learning_rate": 4.081394897285542e-09, + "loss": 0.0005, + "step": 50501 + }, + { + "epoch": 0.98, + "learning_rate": 4.077511552949399e-09, + "loss": 0.0002, + "step": 50502 + }, + { + "epoch": 0.98, + "learning_rate": 4.0736282086132576e-09, + "loss": 0.0004, + "step": 50503 + }, + { + "epoch": 0.98, + "learning_rate": 4.069744864277115e-09, + "loss": 0.9478, + "step": 50504 + }, + { + "epoch": 0.98, + "learning_rate": 4.065861519940973e-09, + "loss": 0.0003, + "step": 50505 + }, + { + "epoch": 0.98, + "learning_rate": 4.061978175604831e-09, + "loss": 0.0003, + "step": 50506 + }, + { + "epoch": 0.98, + "learning_rate": 4.058094831268689e-09, + "loss": 0.0005, + "step": 50507 + }, + { + "epoch": 0.98, + "learning_rate": 4.054211486932546e-09, + "loss": 0.0003, + "step": 50508 + }, + { + "epoch": 0.98, + "learning_rate": 4.050328142596404e-09, + "loss": 0.0004, + "step": 50509 + }, + { + "epoch": 0.98, + "learning_rate": 4.046444798260262e-09, + "loss": 0.0005, + "step": 50510 + }, + { + "epoch": 0.98, + "learning_rate": 4.042561453924119e-09, + "loss": 0.0005, + "step": 50511 + }, + { + "epoch": 0.98, + "learning_rate": 4.038678109587977e-09, + "loss": 0.0005, + "step": 50512 + }, + { + "epoch": 0.98, + "learning_rate": 4.034794765251834e-09, + "loss": 0.0004, + "step": 50513 + }, + { + "epoch": 0.98, + "learning_rate": 4.0309114209156925e-09, + "loss": 0.159, + "step": 50514 + }, + { + "epoch": 0.98, + "learning_rate": 4.02702807657955e-09, + "loss": 0.0005, + "step": 50515 + }, + { + "epoch": 0.98, + "learning_rate": 4.023144732243408e-09, + "loss": 0.002, + "step": 50516 + }, + { + "epoch": 0.98, + "learning_rate": 4.0192613879072655e-09, + "loss": 0.0003, + "step": 50517 + }, + { + "epoch": 0.98, + "learning_rate": 4.015378043571124e-09, + "loss": 0.0004, + "step": 50518 + }, + { + "epoch": 0.98, + "learning_rate": 4.011494699234981e-09, + "loss": 0.0004, + "step": 50519 + }, + { + "epoch": 0.98, + "learning_rate": 4.007611354898839e-09, + "loss": 0.0003, + "step": 50520 + }, + { + "epoch": 0.98, + "learning_rate": 4.003728010562697e-09, + "loss": 0.0003, + "step": 50521 + }, + { + "epoch": 0.98, + "learning_rate": 3.999844666226554e-09, + "loss": 0.0003, + "step": 50522 + }, + { + "epoch": 0.98, + "learning_rate": 3.995961321890412e-09, + "loss": 0.0006, + "step": 50523 + }, + { + "epoch": 0.98, + "learning_rate": 3.992077977554269e-09, + "loss": 0.0003, + "step": 50524 + }, + { + "epoch": 0.98, + "learning_rate": 3.988194633218127e-09, + "loss": 0.0005, + "step": 50525 + }, + { + "epoch": 0.98, + "learning_rate": 3.984311288881985e-09, + "loss": 0.0004, + "step": 50526 + }, + { + "epoch": 0.98, + "learning_rate": 3.980427944545843e-09, + "loss": 0.0004, + "step": 50527 + }, + { + "epoch": 0.98, + "learning_rate": 3.9765446002097004e-09, + "loss": 0.0003, + "step": 50528 + }, + { + "epoch": 0.98, + "learning_rate": 3.972661255873558e-09, + "loss": 0.0003, + "step": 50529 + }, + { + "epoch": 0.98, + "learning_rate": 3.968777911537416e-09, + "loss": 0.0004, + "step": 50530 + }, + { + "epoch": 0.98, + "learning_rate": 3.9648945672012735e-09, + "loss": 0.2483, + "step": 50531 + }, + { + "epoch": 0.98, + "learning_rate": 3.961011222865132e-09, + "loss": 0.0004, + "step": 50532 + }, + { + "epoch": 0.98, + "learning_rate": 3.957127878528989e-09, + "loss": 0.0004, + "step": 50533 + }, + { + "epoch": 0.98, + "learning_rate": 3.953244534192847e-09, + "loss": 0.0002, + "step": 50534 + }, + { + "epoch": 0.98, + "learning_rate": 3.949361189856704e-09, + "loss": 0.0004, + "step": 50535 + }, + { + "epoch": 0.98, + "learning_rate": 3.945477845520562e-09, + "loss": 0.0153, + "step": 50536 + }, + { + "epoch": 0.98, + "learning_rate": 3.94159450118442e-09, + "loss": 0.0004, + "step": 50537 + }, + { + "epoch": 0.98, + "learning_rate": 3.937711156848277e-09, + "loss": 0.0004, + "step": 50538 + }, + { + "epoch": 0.98, + "learning_rate": 3.933827812512135e-09, + "loss": 0.0003, + "step": 50539 + }, + { + "epoch": 0.98, + "learning_rate": 3.929944468175993e-09, + "loss": 0.7029, + "step": 50540 + }, + { + "epoch": 0.98, + "learning_rate": 3.926061123839851e-09, + "loss": 0.0005, + "step": 50541 + }, + { + "epoch": 0.98, + "learning_rate": 3.9221777795037084e-09, + "loss": 0.0004, + "step": 50542 + }, + { + "epoch": 0.98, + "learning_rate": 3.918294435167567e-09, + "loss": 0.0003, + "step": 50543 + }, + { + "epoch": 0.98, + "learning_rate": 3.914411090831424e-09, + "loss": 0.0003, + "step": 50544 + }, + { + "epoch": 0.98, + "learning_rate": 3.9105277464952815e-09, + "loss": 0.0004, + "step": 50545 + }, + { + "epoch": 0.98, + "learning_rate": 3.906644402159139e-09, + "loss": 0.0003, + "step": 50546 + }, + { + "epoch": 0.98, + "learning_rate": 3.902761057822997e-09, + "loss": 0.7686, + "step": 50547 + }, + { + "epoch": 0.98, + "learning_rate": 3.8988777134868546e-09, + "loss": 0.0002, + "step": 50548 + }, + { + "epoch": 0.98, + "learning_rate": 3.894994369150712e-09, + "loss": 0.0007, + "step": 50549 + }, + { + "epoch": 0.98, + "learning_rate": 3.89111102481457e-09, + "loss": 0.0003, + "step": 50550 + }, + { + "epoch": 0.98, + "learning_rate": 3.887227680478428e-09, + "loss": 0.6551, + "step": 50551 + }, + { + "epoch": 0.98, + "learning_rate": 3.883344336142286e-09, + "loss": 0.0005, + "step": 50552 + }, + { + "epoch": 0.98, + "learning_rate": 3.879460991806143e-09, + "loss": 0.0004, + "step": 50553 + }, + { + "epoch": 0.98, + "learning_rate": 3.8755776474700016e-09, + "loss": 0.0005, + "step": 50554 + }, + { + "epoch": 0.98, + "learning_rate": 3.871694303133859e-09, + "loss": 0.0003, + "step": 50555 + }, + { + "epoch": 0.98, + "learning_rate": 3.867810958797716e-09, + "loss": 0.0003, + "step": 50556 + }, + { + "epoch": 0.98, + "learning_rate": 3.863927614461574e-09, + "loss": 0.0005, + "step": 50557 + }, + { + "epoch": 0.98, + "learning_rate": 3.860044270125431e-09, + "loss": 0.0004, + "step": 50558 + }, + { + "epoch": 0.98, + "learning_rate": 3.8561609257892895e-09, + "loss": 0.0011, + "step": 50559 + }, + { + "epoch": 0.98, + "learning_rate": 3.852277581453147e-09, + "loss": 0.0002, + "step": 50560 + }, + { + "epoch": 0.98, + "learning_rate": 3.848394237117005e-09, + "loss": 0.0003, + "step": 50561 + }, + { + "epoch": 0.98, + "learning_rate": 3.8445108927808625e-09, + "loss": 0.0005, + "step": 50562 + }, + { + "epoch": 0.98, + "learning_rate": 3.840627548444721e-09, + "loss": 0.0004, + "step": 50563 + }, + { + "epoch": 0.98, + "learning_rate": 3.836744204108578e-09, + "loss": 0.001, + "step": 50564 + }, + { + "epoch": 0.98, + "learning_rate": 3.8328608597724365e-09, + "loss": 0.0006, + "step": 50565 + }, + { + "epoch": 0.98, + "learning_rate": 3.828977515436294e-09, + "loss": 0.0004, + "step": 50566 + }, + { + "epoch": 0.98, + "learning_rate": 3.825094171100151e-09, + "loss": 0.3955, + "step": 50567 + }, + { + "epoch": 0.98, + "learning_rate": 3.821210826764009e-09, + "loss": 0.0005, + "step": 50568 + }, + { + "epoch": 0.98, + "learning_rate": 3.817327482427866e-09, + "loss": 0.0003, + "step": 50569 + }, + { + "epoch": 0.98, + "learning_rate": 3.813444138091724e-09, + "loss": 0.0005, + "step": 50570 + }, + { + "epoch": 0.98, + "learning_rate": 3.809560793755582e-09, + "loss": 1.242, + "step": 50571 + }, + { + "epoch": 0.98, + "learning_rate": 3.80567744941944e-09, + "loss": 0.0006, + "step": 50572 + }, + { + "epoch": 0.98, + "learning_rate": 3.8017941050832974e-09, + "loss": 0.0004, + "step": 50573 + }, + { + "epoch": 0.98, + "learning_rate": 3.797910760747156e-09, + "loss": 0.0005, + "step": 50574 + }, + { + "epoch": 0.98, + "learning_rate": 3.794027416411013e-09, + "loss": 0.0004, + "step": 50575 + }, + { + "epoch": 0.98, + "learning_rate": 3.790144072074871e-09, + "loss": 0.0004, + "step": 50576 + }, + { + "epoch": 0.98, + "learning_rate": 3.786260727738729e-09, + "loss": 0.0003, + "step": 50577 + }, + { + "epoch": 0.98, + "learning_rate": 3.782377383402586e-09, + "loss": 0.7923, + "step": 50578 + }, + { + "epoch": 0.98, + "learning_rate": 3.778494039066444e-09, + "loss": 0.0014, + "step": 50579 + }, + { + "epoch": 0.98, + "learning_rate": 3.774610694730301e-09, + "loss": 0.0003, + "step": 50580 + }, + { + "epoch": 0.98, + "learning_rate": 3.770727350394159e-09, + "loss": 0.0004, + "step": 50581 + }, + { + "epoch": 0.98, + "learning_rate": 3.766844006058017e-09, + "loss": 0.0003, + "step": 50582 + }, + { + "epoch": 0.98, + "learning_rate": 3.762960661721875e-09, + "loss": 0.0003, + "step": 50583 + }, + { + "epoch": 0.98, + "learning_rate": 3.759077317385732e-09, + "loss": 0.0004, + "step": 50584 + }, + { + "epoch": 0.98, + "learning_rate": 3.755193973049591e-09, + "loss": 0.0005, + "step": 50585 + }, + { + "epoch": 0.98, + "learning_rate": 3.751310628713448e-09, + "loss": 0.0004, + "step": 50586 + }, + { + "epoch": 0.98, + "learning_rate": 3.7474272843773054e-09, + "loss": 0.0291, + "step": 50587 + }, + { + "epoch": 0.98, + "learning_rate": 3.743543940041164e-09, + "loss": 0.0004, + "step": 50588 + }, + { + "epoch": 0.98, + "learning_rate": 3.739660595705021e-09, + "loss": 0.0474, + "step": 50589 + }, + { + "epoch": 0.98, + "learning_rate": 3.7357772513688785e-09, + "loss": 0.0354, + "step": 50590 + }, + { + "epoch": 0.98, + "learning_rate": 3.731893907032736e-09, + "loss": 0.0003, + "step": 50591 + }, + { + "epoch": 0.98, + "learning_rate": 3.728010562696594e-09, + "loss": 0.0004, + "step": 50592 + }, + { + "epoch": 0.98, + "learning_rate": 3.7241272183604516e-09, + "loss": 0.0004, + "step": 50593 + }, + { + "epoch": 0.98, + "learning_rate": 3.72024387402431e-09, + "loss": 0.0004, + "step": 50594 + }, + { + "epoch": 0.98, + "learning_rate": 3.7163605296881672e-09, + "loss": 0.2984, + "step": 50595 + }, + { + "epoch": 0.98, + "learning_rate": 3.7124771853520247e-09, + "loss": 0.0011, + "step": 50596 + }, + { + "epoch": 0.98, + "learning_rate": 3.708593841015883e-09, + "loss": 0.0003, + "step": 50597 + }, + { + "epoch": 0.98, + "learning_rate": 3.7047104966797403e-09, + "loss": 0.0004, + "step": 50598 + }, + { + "epoch": 0.98, + "learning_rate": 3.700827152343598e-09, + "loss": 0.0002, + "step": 50599 + }, + { + "epoch": 0.98, + "learning_rate": 3.6969438080074556e-09, + "loss": 0.0004, + "step": 50600 + }, + { + "epoch": 0.98, + "learning_rate": 3.693060463671314e-09, + "loss": 0.0003, + "step": 50601 + }, + { + "epoch": 0.98, + "learning_rate": 3.6891771193351712e-09, + "loss": 0.0003, + "step": 50602 + }, + { + "epoch": 0.98, + "learning_rate": 3.6852937749990295e-09, + "loss": 0.0021, + "step": 50603 + }, + { + "epoch": 0.98, + "learning_rate": 3.6814104306628865e-09, + "loss": 0.9701, + "step": 50604 + }, + { + "epoch": 0.98, + "learning_rate": 3.6775270863267447e-09, + "loss": 0.0005, + "step": 50605 + }, + { + "epoch": 0.98, + "learning_rate": 3.673643741990602e-09, + "loss": 1.059, + "step": 50606 + }, + { + "epoch": 0.98, + "learning_rate": 3.6697603976544596e-09, + "loss": 0.0018, + "step": 50607 + }, + { + "epoch": 0.98, + "learning_rate": 3.665877053318318e-09, + "loss": 0.01, + "step": 50608 + }, + { + "epoch": 0.98, + "learning_rate": 3.6619937089821752e-09, + "loss": 0.0004, + "step": 50609 + }, + { + "epoch": 0.98, + "learning_rate": 3.658110364646033e-09, + "loss": 0.0005, + "step": 50610 + }, + { + "epoch": 0.98, + "learning_rate": 3.6542270203098905e-09, + "loss": 0.0003, + "step": 50611 + }, + { + "epoch": 0.98, + "learning_rate": 3.6503436759737487e-09, + "loss": 0.0004, + "step": 50612 + }, + { + "epoch": 0.98, + "learning_rate": 3.646460331637606e-09, + "loss": 0.0009, + "step": 50613 + }, + { + "epoch": 0.98, + "learning_rate": 3.6425769873014644e-09, + "loss": 0.0004, + "step": 50614 + }, + { + "epoch": 0.98, + "learning_rate": 3.6386936429653218e-09, + "loss": 0.0003, + "step": 50615 + }, + { + "epoch": 0.98, + "learning_rate": 3.6348102986291788e-09, + "loss": 0.0003, + "step": 50616 + }, + { + "epoch": 0.98, + "learning_rate": 3.630926954293037e-09, + "loss": 0.0007, + "step": 50617 + }, + { + "epoch": 0.98, + "learning_rate": 3.6270436099568945e-09, + "loss": 0.0002, + "step": 50618 + }, + { + "epoch": 0.98, + "learning_rate": 3.6231602656207527e-09, + "loss": 0.0035, + "step": 50619 + }, + { + "epoch": 0.98, + "learning_rate": 3.61927692128461e-09, + "loss": 0.0005, + "step": 50620 + }, + { + "epoch": 0.98, + "learning_rate": 3.615393576948468e-09, + "loss": 0.0114, + "step": 50621 + }, + { + "epoch": 0.98, + "learning_rate": 3.6115102326123254e-09, + "loss": 0.0004, + "step": 50622 + }, + { + "epoch": 0.98, + "learning_rate": 3.6076268882761836e-09, + "loss": 0.0003, + "step": 50623 + }, + { + "epoch": 0.98, + "learning_rate": 3.603743543940041e-09, + "loss": 0.0004, + "step": 50624 + }, + { + "epoch": 0.98, + "learning_rate": 3.5998601996038984e-09, + "loss": 0.0004, + "step": 50625 + }, + { + "epoch": 0.98, + "learning_rate": 3.5959768552677567e-09, + "loss": 0.0002, + "step": 50626 + }, + { + "epoch": 0.98, + "learning_rate": 3.5920935109316137e-09, + "loss": 0.0004, + "step": 50627 + }, + { + "epoch": 0.98, + "learning_rate": 3.588210166595472e-09, + "loss": 0.0003, + "step": 50628 + }, + { + "epoch": 0.98, + "learning_rate": 3.5843268222593293e-09, + "loss": 0.0003, + "step": 50629 + }, + { + "epoch": 0.98, + "learning_rate": 3.5804434779231876e-09, + "loss": 0.0005, + "step": 50630 + }, + { + "epoch": 0.98, + "learning_rate": 3.576560133587045e-09, + "loss": 0.0003, + "step": 50631 + }, + { + "epoch": 0.98, + "learning_rate": 3.572676789250903e-09, + "loss": 0.0004, + "step": 50632 + }, + { + "epoch": 0.98, + "learning_rate": 3.5687934449147603e-09, + "loss": 0.0004, + "step": 50633 + }, + { + "epoch": 0.98, + "learning_rate": 3.5649101005786185e-09, + "loss": 0.0002, + "step": 50634 + }, + { + "epoch": 0.98, + "learning_rate": 3.561026756242476e-09, + "loss": 0.0005, + "step": 50635 + }, + { + "epoch": 0.98, + "learning_rate": 3.5571434119063333e-09, + "loss": 0.0004, + "step": 50636 + }, + { + "epoch": 0.98, + "learning_rate": 3.5532600675701916e-09, + "loss": 0.0003, + "step": 50637 + }, + { + "epoch": 0.98, + "learning_rate": 3.549376723234049e-09, + "loss": 0.0003, + "step": 50638 + }, + { + "epoch": 0.98, + "learning_rate": 3.545493378897907e-09, + "loss": 0.0003, + "step": 50639 + }, + { + "epoch": 0.98, + "learning_rate": 3.5416100345617642e-09, + "loss": 0.0007, + "step": 50640 + }, + { + "epoch": 0.98, + "learning_rate": 3.5377266902256225e-09, + "loss": 0.0005, + "step": 50641 + }, + { + "epoch": 0.98, + "learning_rate": 3.53384334588948e-09, + "loss": 0.0006, + "step": 50642 + }, + { + "epoch": 0.98, + "learning_rate": 3.5299600015533377e-09, + "loss": 0.0003, + "step": 50643 + }, + { + "epoch": 0.98, + "learning_rate": 3.526076657217195e-09, + "loss": 0.0003, + "step": 50644 + }, + { + "epoch": 0.98, + "learning_rate": 3.5221933128810526e-09, + "loss": 0.813, + "step": 50645 + }, + { + "epoch": 0.98, + "learning_rate": 3.518309968544911e-09, + "loss": 0.0005, + "step": 50646 + }, + { + "epoch": 0.98, + "learning_rate": 3.5144266242087682e-09, + "loss": 0.0003, + "step": 50647 + }, + { + "epoch": 0.98, + "learning_rate": 3.5105432798726265e-09, + "loss": 0.0006, + "step": 50648 + }, + { + "epoch": 0.98, + "learning_rate": 3.506659935536484e-09, + "loss": 0.0004, + "step": 50649 + }, + { + "epoch": 0.98, + "learning_rate": 3.5027765912003417e-09, + "loss": 0.0003, + "step": 50650 + }, + { + "epoch": 0.98, + "learning_rate": 3.498893246864199e-09, + "loss": 0.0004, + "step": 50651 + }, + { + "epoch": 0.98, + "learning_rate": 3.4950099025280574e-09, + "loss": 0.0006, + "step": 50652 + }, + { + "epoch": 0.98, + "learning_rate": 3.491126558191915e-09, + "loss": 0.0006, + "step": 50653 + }, + { + "epoch": 0.98, + "learning_rate": 3.4872432138557722e-09, + "loss": 0.0005, + "step": 50654 + }, + { + "epoch": 0.98, + "learning_rate": 3.48335986951963e-09, + "loss": 0.0003, + "step": 50655 + }, + { + "epoch": 0.98, + "learning_rate": 3.4794765251834875e-09, + "loss": 0.2441, + "step": 50656 + }, + { + "epoch": 0.98, + "learning_rate": 3.4755931808473457e-09, + "loss": 0.0011, + "step": 50657 + }, + { + "epoch": 0.98, + "learning_rate": 3.471709836511203e-09, + "loss": 0.1457, + "step": 50658 + }, + { + "epoch": 0.98, + "learning_rate": 3.4678264921750614e-09, + "loss": 0.2057, + "step": 50659 + }, + { + "epoch": 0.98, + "learning_rate": 3.4639431478389188e-09, + "loss": 0.0003, + "step": 50660 + }, + { + "epoch": 0.98, + "learning_rate": 3.4600598035027766e-09, + "loss": 0.0004, + "step": 50661 + }, + { + "epoch": 0.98, + "learning_rate": 3.456176459166634e-09, + "loss": 0.0004, + "step": 50662 + }, + { + "epoch": 0.98, + "learning_rate": 3.4522931148304923e-09, + "loss": 0.0004, + "step": 50663 + }, + { + "epoch": 0.98, + "learning_rate": 3.4484097704943497e-09, + "loss": 0.0003, + "step": 50664 + }, + { + "epoch": 0.98, + "learning_rate": 3.444526426158207e-09, + "loss": 0.0005, + "step": 50665 + }, + { + "epoch": 0.98, + "learning_rate": 3.440643081822065e-09, + "loss": 0.0039, + "step": 50666 + }, + { + "epoch": 0.98, + "learning_rate": 3.4367597374859224e-09, + "loss": 0.0004, + "step": 50667 + }, + { + "epoch": 0.98, + "learning_rate": 3.4328763931497806e-09, + "loss": 0.0004, + "step": 50668 + }, + { + "epoch": 0.98, + "learning_rate": 3.428993048813638e-09, + "loss": 0.0003, + "step": 50669 + }, + { + "epoch": 0.98, + "learning_rate": 3.4251097044774963e-09, + "loss": 0.0003, + "step": 50670 + }, + { + "epoch": 0.98, + "learning_rate": 3.4212263601413537e-09, + "loss": 0.0004, + "step": 50671 + }, + { + "epoch": 0.98, + "learning_rate": 3.4173430158052115e-09, + "loss": 0.0003, + "step": 50672 + }, + { + "epoch": 0.98, + "learning_rate": 3.413459671469069e-09, + "loss": 0.0005, + "step": 50673 + }, + { + "epoch": 0.98, + "learning_rate": 3.4095763271329264e-09, + "loss": 0.0005, + "step": 50674 + }, + { + "epoch": 0.98, + "learning_rate": 3.4056929827967846e-09, + "loss": 0.0396, + "step": 50675 + }, + { + "epoch": 0.98, + "learning_rate": 3.401809638460642e-09, + "loss": 0.0004, + "step": 50676 + }, + { + "epoch": 0.98, + "learning_rate": 3.3979262941245e-09, + "loss": 0.0003, + "step": 50677 + }, + { + "epoch": 0.98, + "learning_rate": 3.3940429497883573e-09, + "loss": 0.0006, + "step": 50678 + }, + { + "epoch": 0.98, + "learning_rate": 3.3901596054522155e-09, + "loss": 0.0005, + "step": 50679 + }, + { + "epoch": 0.98, + "learning_rate": 3.386276261116073e-09, + "loss": 0.0003, + "step": 50680 + }, + { + "epoch": 0.98, + "learning_rate": 3.382392916779931e-09, + "loss": 0.0005, + "step": 50681 + }, + { + "epoch": 0.98, + "learning_rate": 3.3785095724437886e-09, + "loss": 0.7331, + "step": 50682 + }, + { + "epoch": 0.98, + "learning_rate": 3.374626228107646e-09, + "loss": 0.0007, + "step": 50683 + }, + { + "epoch": 0.98, + "learning_rate": 3.370742883771504e-09, + "loss": 0.0004, + "step": 50684 + }, + { + "epoch": 0.98, + "learning_rate": 3.3668595394353613e-09, + "loss": 0.0004, + "step": 50685 + }, + { + "epoch": 0.98, + "learning_rate": 3.3629761950992195e-09, + "loss": 0.0009, + "step": 50686 + }, + { + "epoch": 0.98, + "learning_rate": 3.359092850763077e-09, + "loss": 0.0008, + "step": 50687 + }, + { + "epoch": 0.98, + "learning_rate": 3.3552095064269347e-09, + "loss": 0.0007, + "step": 50688 + }, + { + "epoch": 0.98, + "learning_rate": 3.351326162090792e-09, + "loss": 0.0003, + "step": 50689 + }, + { + "epoch": 0.98, + "learning_rate": 3.3474428177546504e-09, + "loss": 0.0003, + "step": 50690 + }, + { + "epoch": 0.98, + "learning_rate": 3.343559473418508e-09, + "loss": 0.0006, + "step": 50691 + }, + { + "epoch": 0.98, + "learning_rate": 3.339676129082366e-09, + "loss": 0.0003, + "step": 50692 + }, + { + "epoch": 0.98, + "learning_rate": 3.3357927847462235e-09, + "loss": 0.0777, + "step": 50693 + }, + { + "epoch": 0.98, + "learning_rate": 3.331909440410081e-09, + "loss": 0.0003, + "step": 50694 + }, + { + "epoch": 0.98, + "learning_rate": 3.3280260960739387e-09, + "loss": 0.0004, + "step": 50695 + }, + { + "epoch": 0.98, + "learning_rate": 3.324142751737796e-09, + "loss": 0.0005, + "step": 50696 + }, + { + "epoch": 0.98, + "learning_rate": 3.3202594074016544e-09, + "loss": 0.0004, + "step": 50697 + }, + { + "epoch": 0.98, + "learning_rate": 3.316376063065512e-09, + "loss": 0.0003, + "step": 50698 + }, + { + "epoch": 0.98, + "learning_rate": 3.3124927187293696e-09, + "loss": 0.0004, + "step": 50699 + }, + { + "epoch": 0.98, + "learning_rate": 3.308609374393227e-09, + "loss": 0.0306, + "step": 50700 + }, + { + "epoch": 0.98, + "learning_rate": 3.3047260300570853e-09, + "loss": 0.0007, + "step": 50701 + }, + { + "epoch": 0.98, + "learning_rate": 3.3008426857209427e-09, + "loss": 0.1906, + "step": 50702 + }, + { + "epoch": 0.98, + "learning_rate": 3.2969593413848e-09, + "loss": 0.0005, + "step": 50703 + }, + { + "epoch": 0.98, + "learning_rate": 3.2930759970486584e-09, + "loss": 0.0003, + "step": 50704 + }, + { + "epoch": 0.98, + "learning_rate": 3.289192652712516e-09, + "loss": 0.0023, + "step": 50705 + }, + { + "epoch": 0.98, + "learning_rate": 3.2853093083763736e-09, + "loss": 0.0003, + "step": 50706 + }, + { + "epoch": 0.98, + "learning_rate": 3.281425964040231e-09, + "loss": 0.0005, + "step": 50707 + }, + { + "epoch": 0.98, + "learning_rate": 3.2775426197040893e-09, + "loss": 0.0441, + "step": 50708 + }, + { + "epoch": 0.98, + "learning_rate": 3.2736592753679467e-09, + "loss": 0.8185, + "step": 50709 + }, + { + "epoch": 0.98, + "learning_rate": 3.2697759310318045e-09, + "loss": 0.0511, + "step": 50710 + }, + { + "epoch": 0.98, + "learning_rate": 3.265892586695662e-09, + "loss": 0.0004, + "step": 50711 + }, + { + "epoch": 0.98, + "learning_rate": 3.2620092423595194e-09, + "loss": 0.0002, + "step": 50712 + }, + { + "epoch": 0.98, + "learning_rate": 3.2581258980233776e-09, + "loss": 0.0007, + "step": 50713 + }, + { + "epoch": 0.98, + "learning_rate": 3.254242553687235e-09, + "loss": 0.0005, + "step": 50714 + }, + { + "epoch": 0.98, + "learning_rate": 3.2503592093510933e-09, + "loss": 0.4386, + "step": 50715 + }, + { + "epoch": 0.98, + "learning_rate": 3.2464758650149507e-09, + "loss": 0.0003, + "step": 50716 + }, + { + "epoch": 0.98, + "learning_rate": 3.2425925206788085e-09, + "loss": 0.0005, + "step": 50717 + }, + { + "epoch": 0.98, + "learning_rate": 3.238709176342666e-09, + "loss": 0.0004, + "step": 50718 + }, + { + "epoch": 0.98, + "learning_rate": 3.234825832006524e-09, + "loss": 0.0004, + "step": 50719 + }, + { + "epoch": 0.98, + "learning_rate": 3.2309424876703816e-09, + "loss": 0.0006, + "step": 50720 + }, + { + "epoch": 0.98, + "learning_rate": 3.22705914333424e-09, + "loss": 0.0006, + "step": 50721 + }, + { + "epoch": 0.98, + "learning_rate": 3.223175798998097e-09, + "loss": 0.7293, + "step": 50722 + }, + { + "epoch": 0.98, + "learning_rate": 3.2192924546619543e-09, + "loss": 0.0008, + "step": 50723 + }, + { + "epoch": 0.98, + "learning_rate": 3.2154091103258125e-09, + "loss": 0.1266, + "step": 50724 + }, + { + "epoch": 0.98, + "learning_rate": 3.21152576598967e-09, + "loss": 0.0004, + "step": 50725 + }, + { + "epoch": 0.98, + "learning_rate": 3.207642421653528e-09, + "loss": 0.0002, + "step": 50726 + }, + { + "epoch": 0.98, + "learning_rate": 3.2037590773173856e-09, + "loss": 0.0005, + "step": 50727 + }, + { + "epoch": 0.98, + "learning_rate": 3.1998757329812434e-09, + "loss": 0.0004, + "step": 50728 + }, + { + "epoch": 0.98, + "learning_rate": 3.195992388645101e-09, + "loss": 0.0003, + "step": 50729 + }, + { + "epoch": 0.98, + "learning_rate": 3.192109044308959e-09, + "loss": 0.7422, + "step": 50730 + }, + { + "epoch": 0.98, + "learning_rate": 3.1882256999728165e-09, + "loss": 0.0006, + "step": 50731 + }, + { + "epoch": 0.98, + "learning_rate": 3.184342355636674e-09, + "loss": 0.0086, + "step": 50732 + }, + { + "epoch": 0.98, + "learning_rate": 3.1804590113005318e-09, + "loss": 1.3378, + "step": 50733 + }, + { + "epoch": 0.98, + "learning_rate": 3.176575666964389e-09, + "loss": 0.0004, + "step": 50734 + }, + { + "epoch": 0.98, + "learning_rate": 3.1726923226282474e-09, + "loss": 0.0006, + "step": 50735 + }, + { + "epoch": 0.98, + "learning_rate": 3.168808978292105e-09, + "loss": 0.0005, + "step": 50736 + }, + { + "epoch": 0.98, + "learning_rate": 3.164925633955963e-09, + "loss": 0.0004, + "step": 50737 + }, + { + "epoch": 0.98, + "learning_rate": 3.1610422896198205e-09, + "loss": 0.0006, + "step": 50738 + }, + { + "epoch": 0.98, + "learning_rate": 3.1571589452836783e-09, + "loss": 0.0005, + "step": 50739 + }, + { + "epoch": 0.98, + "learning_rate": 3.1532756009475357e-09, + "loss": 0.1542, + "step": 50740 + }, + { + "epoch": 0.98, + "learning_rate": 3.149392256611393e-09, + "loss": 0.0007, + "step": 50741 + }, + { + "epoch": 0.98, + "learning_rate": 3.1455089122752514e-09, + "loss": 0.0003, + "step": 50742 + }, + { + "epoch": 0.98, + "learning_rate": 3.141625567939109e-09, + "loss": 0.0004, + "step": 50743 + }, + { + "epoch": 0.98, + "learning_rate": 3.137742223602967e-09, + "loss": 0.0004, + "step": 50744 + }, + { + "epoch": 0.98, + "learning_rate": 3.133858879266824e-09, + "loss": 0.049, + "step": 50745 + }, + { + "epoch": 0.98, + "learning_rate": 3.1299755349306823e-09, + "loss": 0.0004, + "step": 50746 + }, + { + "epoch": 0.98, + "learning_rate": 3.1260921905945397e-09, + "loss": 0.2643, + "step": 50747 + }, + { + "epoch": 0.98, + "learning_rate": 3.1222088462583976e-09, + "loss": 0.0003, + "step": 50748 + }, + { + "epoch": 0.98, + "learning_rate": 3.1183255019222554e-09, + "loss": 0.0004, + "step": 50749 + }, + { + "epoch": 0.98, + "learning_rate": 3.1144421575861132e-09, + "loss": 0.0008, + "step": 50750 + }, + { + "epoch": 0.98, + "learning_rate": 3.1105588132499706e-09, + "loss": 0.0002, + "step": 50751 + }, + { + "epoch": 0.98, + "learning_rate": 3.1066754689138285e-09, + "loss": 0.0009, + "step": 50752 + }, + { + "epoch": 0.98, + "learning_rate": 3.1027921245776863e-09, + "loss": 0.0003, + "step": 50753 + }, + { + "epoch": 0.98, + "learning_rate": 3.098908780241544e-09, + "loss": 0.0003, + "step": 50754 + }, + { + "epoch": 0.98, + "learning_rate": 3.0950254359054015e-09, + "loss": 0.0002, + "step": 50755 + }, + { + "epoch": 0.98, + "learning_rate": 3.0911420915692594e-09, + "loss": 0.0003, + "step": 50756 + }, + { + "epoch": 0.98, + "learning_rate": 3.087258747233117e-09, + "loss": 0.0005, + "step": 50757 + }, + { + "epoch": 0.98, + "learning_rate": 3.0833754028969746e-09, + "loss": 0.0003, + "step": 50758 + }, + { + "epoch": 0.98, + "learning_rate": 3.0794920585608325e-09, + "loss": 0.0004, + "step": 50759 + }, + { + "epoch": 0.98, + "learning_rate": 3.0756087142246903e-09, + "loss": 0.0003, + "step": 50760 + }, + { + "epoch": 0.98, + "learning_rate": 3.071725369888548e-09, + "loss": 0.0003, + "step": 50761 + }, + { + "epoch": 0.98, + "learning_rate": 3.0678420255524055e-09, + "loss": 0.0004, + "step": 50762 + }, + { + "epoch": 0.98, + "learning_rate": 3.0639586812162634e-09, + "loss": 0.0003, + "step": 50763 + }, + { + "epoch": 0.98, + "learning_rate": 3.060075336880121e-09, + "loss": 0.0006, + "step": 50764 + }, + { + "epoch": 0.98, + "learning_rate": 3.0561919925439786e-09, + "loss": 0.0015, + "step": 50765 + }, + { + "epoch": 0.98, + "learning_rate": 3.0523086482078364e-09, + "loss": 0.0008, + "step": 50766 + }, + { + "epoch": 0.98, + "learning_rate": 3.0484253038716943e-09, + "loss": 0.0004, + "step": 50767 + }, + { + "epoch": 0.98, + "learning_rate": 3.0445419595355517e-09, + "loss": 0.0002, + "step": 50768 + }, + { + "epoch": 0.98, + "learning_rate": 3.0406586151994095e-09, + "loss": 0.0005, + "step": 50769 + }, + { + "epoch": 0.98, + "learning_rate": 3.0367752708632674e-09, + "loss": 0.0004, + "step": 50770 + }, + { + "epoch": 0.98, + "learning_rate": 3.032891926527125e-09, + "loss": 0.0003, + "step": 50771 + }, + { + "epoch": 0.98, + "learning_rate": 3.029008582190983e-09, + "loss": 0.0004, + "step": 50772 + }, + { + "epoch": 0.98, + "learning_rate": 3.0251252378548404e-09, + "loss": 0.0003, + "step": 50773 + }, + { + "epoch": 0.98, + "learning_rate": 3.0212418935186983e-09, + "loss": 0.0004, + "step": 50774 + }, + { + "epoch": 0.98, + "learning_rate": 3.0173585491825557e-09, + "loss": 0.0005, + "step": 50775 + }, + { + "epoch": 0.98, + "learning_rate": 3.0134752048464135e-09, + "loss": 0.0003, + "step": 50776 + }, + { + "epoch": 0.98, + "learning_rate": 3.0095918605102713e-09, + "loss": 0.0004, + "step": 50777 + }, + { + "epoch": 0.98, + "learning_rate": 3.005708516174129e-09, + "loss": 0.0004, + "step": 50778 + }, + { + "epoch": 0.99, + "learning_rate": 3.0018251718379866e-09, + "loss": 0.0007, + "step": 50779 + }, + { + "epoch": 0.99, + "learning_rate": 2.9979418275018444e-09, + "loss": 0.4957, + "step": 50780 + }, + { + "epoch": 0.99, + "learning_rate": 2.9940584831657023e-09, + "loss": 0.0006, + "step": 50781 + }, + { + "epoch": 0.99, + "learning_rate": 2.99017513882956e-09, + "loss": 0.0011, + "step": 50782 + }, + { + "epoch": 0.99, + "learning_rate": 2.986291794493418e-09, + "loss": 0.0008, + "step": 50783 + }, + { + "epoch": 0.99, + "learning_rate": 2.9824084501572753e-09, + "loss": 0.0005, + "step": 50784 + }, + { + "epoch": 0.99, + "learning_rate": 2.9785251058211327e-09, + "loss": 0.0004, + "step": 50785 + }, + { + "epoch": 0.99, + "learning_rate": 2.9746417614849906e-09, + "loss": 0.0002, + "step": 50786 + }, + { + "epoch": 0.99, + "learning_rate": 2.9707584171488484e-09, + "loss": 0.0002, + "step": 50787 + }, + { + "epoch": 0.99, + "learning_rate": 2.9668750728127062e-09, + "loss": 0.1227, + "step": 50788 + }, + { + "epoch": 0.99, + "learning_rate": 2.962991728476564e-09, + "loss": 0.0003, + "step": 50789 + }, + { + "epoch": 0.99, + "learning_rate": 2.9591083841404215e-09, + "loss": 0.0003, + "step": 50790 + }, + { + "epoch": 0.99, + "learning_rate": 2.9552250398042793e-09, + "loss": 0.0008, + "step": 50791 + }, + { + "epoch": 0.99, + "learning_rate": 2.951341695468137e-09, + "loss": 0.0003, + "step": 50792 + }, + { + "epoch": 0.99, + "learning_rate": 2.947458351131995e-09, + "loss": 0.0005, + "step": 50793 + }, + { + "epoch": 0.99, + "learning_rate": 2.9435750067958524e-09, + "loss": 0.0003, + "step": 50794 + }, + { + "epoch": 0.99, + "learning_rate": 2.9396916624597102e-09, + "loss": 0.0005, + "step": 50795 + }, + { + "epoch": 0.99, + "learning_rate": 2.9358083181235676e-09, + "loss": 0.0004, + "step": 50796 + }, + { + "epoch": 0.99, + "learning_rate": 2.9319249737874255e-09, + "loss": 0.0004, + "step": 50797 + }, + { + "epoch": 0.99, + "learning_rate": 2.9280416294512833e-09, + "loss": 0.3925, + "step": 50798 + }, + { + "epoch": 0.99, + "learning_rate": 2.924158285115141e-09, + "loss": 0.0004, + "step": 50799 + }, + { + "epoch": 0.99, + "learning_rate": 2.920274940778999e-09, + "loss": 0.0007, + "step": 50800 + }, + { + "epoch": 0.99, + "learning_rate": 2.9163915964428564e-09, + "loss": 0.0004, + "step": 50801 + }, + { + "epoch": 0.99, + "learning_rate": 2.9125082521067142e-09, + "loss": 0.0004, + "step": 50802 + }, + { + "epoch": 0.99, + "learning_rate": 2.908624907770572e-09, + "loss": 0.0004, + "step": 50803 + }, + { + "epoch": 0.99, + "learning_rate": 2.9047415634344295e-09, + "loss": 0.0006, + "step": 50804 + }, + { + "epoch": 0.99, + "learning_rate": 2.9008582190982873e-09, + "loss": 0.0006, + "step": 50805 + }, + { + "epoch": 0.99, + "learning_rate": 2.896974874762145e-09, + "loss": 0.0004, + "step": 50806 + }, + { + "epoch": 0.99, + "learning_rate": 2.8930915304260025e-09, + "loss": 0.0003, + "step": 50807 + }, + { + "epoch": 0.99, + "learning_rate": 2.8892081860898604e-09, + "loss": 0.0005, + "step": 50808 + }, + { + "epoch": 0.99, + "learning_rate": 2.885324841753718e-09, + "loss": 0.0003, + "step": 50809 + }, + { + "epoch": 0.99, + "learning_rate": 2.881441497417576e-09, + "loss": 0.0004, + "step": 50810 + }, + { + "epoch": 0.99, + "learning_rate": 2.877558153081434e-09, + "loss": 0.0005, + "step": 50811 + }, + { + "epoch": 0.99, + "learning_rate": 2.8736748087452913e-09, + "loss": 0.0005, + "step": 50812 + }, + { + "epoch": 0.99, + "learning_rate": 2.8697914644091487e-09, + "loss": 0.0016, + "step": 50813 + }, + { + "epoch": 0.99, + "learning_rate": 2.8659081200730065e-09, + "loss": 0.0003, + "step": 50814 + }, + { + "epoch": 0.99, + "learning_rate": 2.8620247757368644e-09, + "loss": 0.0005, + "step": 50815 + }, + { + "epoch": 0.99, + "learning_rate": 2.858141431400722e-09, + "loss": 0.0005, + "step": 50816 + }, + { + "epoch": 0.99, + "learning_rate": 2.85425808706458e-09, + "loss": 0.0003, + "step": 50817 + }, + { + "epoch": 0.99, + "learning_rate": 2.8503747427284374e-09, + "loss": 0.0003, + "step": 50818 + }, + { + "epoch": 0.99, + "learning_rate": 2.8464913983922953e-09, + "loss": 0.0007, + "step": 50819 + }, + { + "epoch": 0.99, + "learning_rate": 2.842608054056153e-09, + "loss": 0.0003, + "step": 50820 + }, + { + "epoch": 0.99, + "learning_rate": 2.838724709720011e-09, + "loss": 0.0003, + "step": 50821 + }, + { + "epoch": 0.99, + "learning_rate": 2.8348413653838688e-09, + "loss": 0.0008, + "step": 50822 + }, + { + "epoch": 0.99, + "learning_rate": 2.830958021047726e-09, + "loss": 0.0004, + "step": 50823 + }, + { + "epoch": 0.99, + "learning_rate": 2.8270746767115836e-09, + "loss": 0.0006, + "step": 50824 + }, + { + "epoch": 0.99, + "learning_rate": 2.8231913323754414e-09, + "loss": 0.4187, + "step": 50825 + }, + { + "epoch": 0.99, + "learning_rate": 2.8193079880392993e-09, + "loss": 0.0004, + "step": 50826 + }, + { + "epoch": 0.99, + "learning_rate": 2.815424643703157e-09, + "loss": 0.0003, + "step": 50827 + }, + { + "epoch": 0.99, + "learning_rate": 2.811541299367015e-09, + "loss": 0.0004, + "step": 50828 + }, + { + "epoch": 0.99, + "learning_rate": 2.8076579550308723e-09, + "loss": 0.0005, + "step": 50829 + }, + { + "epoch": 0.99, + "learning_rate": 2.80377461069473e-09, + "loss": 0.0004, + "step": 50830 + }, + { + "epoch": 0.99, + "learning_rate": 2.799891266358588e-09, + "loss": 0.0003, + "step": 50831 + }, + { + "epoch": 0.99, + "learning_rate": 2.796007922022446e-09, + "loss": 0.0004, + "step": 50832 + }, + { + "epoch": 0.99, + "learning_rate": 2.7921245776863032e-09, + "loss": 0.0003, + "step": 50833 + }, + { + "epoch": 0.99, + "learning_rate": 2.788241233350161e-09, + "loss": 0.0004, + "step": 50834 + }, + { + "epoch": 0.99, + "learning_rate": 2.7843578890140185e-09, + "loss": 0.0006, + "step": 50835 + }, + { + "epoch": 0.99, + "learning_rate": 2.7804745446778763e-09, + "loss": 0.0008, + "step": 50836 + }, + { + "epoch": 0.99, + "learning_rate": 2.776591200341734e-09, + "loss": 0.0004, + "step": 50837 + }, + { + "epoch": 0.99, + "learning_rate": 2.772707856005592e-09, + "loss": 0.0003, + "step": 50838 + }, + { + "epoch": 0.99, + "learning_rate": 2.76882451166945e-09, + "loss": 0.0004, + "step": 50839 + }, + { + "epoch": 0.99, + "learning_rate": 2.7649411673333072e-09, + "loss": 0.0004, + "step": 50840 + }, + { + "epoch": 0.99, + "learning_rate": 2.761057822997165e-09, + "loss": 0.0004, + "step": 50841 + }, + { + "epoch": 0.99, + "learning_rate": 2.7571744786610225e-09, + "loss": 0.0019, + "step": 50842 + }, + { + "epoch": 0.99, + "learning_rate": 2.7532911343248803e-09, + "loss": 0.0003, + "step": 50843 + }, + { + "epoch": 0.99, + "learning_rate": 2.749407789988738e-09, + "loss": 0.0002, + "step": 50844 + }, + { + "epoch": 0.99, + "learning_rate": 2.745524445652596e-09, + "loss": 0.0004, + "step": 50845 + }, + { + "epoch": 0.99, + "learning_rate": 2.7416411013164534e-09, + "loss": 0.0051, + "step": 50846 + }, + { + "epoch": 0.99, + "learning_rate": 2.7377577569803112e-09, + "loss": 0.0004, + "step": 50847 + }, + { + "epoch": 0.99, + "learning_rate": 2.733874412644169e-09, + "loss": 0.0003, + "step": 50848 + }, + { + "epoch": 0.99, + "learning_rate": 2.729991068308027e-09, + "loss": 0.0006, + "step": 50849 + }, + { + "epoch": 0.99, + "learning_rate": 2.7261077239718847e-09, + "loss": 0.0003, + "step": 50850 + }, + { + "epoch": 0.99, + "learning_rate": 2.722224379635742e-09, + "loss": 0.0004, + "step": 50851 + }, + { + "epoch": 0.99, + "learning_rate": 2.7183410352995995e-09, + "loss": 0.0003, + "step": 50852 + }, + { + "epoch": 0.99, + "learning_rate": 2.7144576909634574e-09, + "loss": 0.0025, + "step": 50853 + }, + { + "epoch": 0.99, + "learning_rate": 2.7105743466273152e-09, + "loss": 0.0003, + "step": 50854 + }, + { + "epoch": 0.99, + "learning_rate": 2.706691002291173e-09, + "loss": 0.0007, + "step": 50855 + }, + { + "epoch": 0.99, + "learning_rate": 2.702807657955031e-09, + "loss": 0.0006, + "step": 50856 + }, + { + "epoch": 0.99, + "learning_rate": 2.6989243136188883e-09, + "loss": 0.0003, + "step": 50857 + }, + { + "epoch": 0.99, + "learning_rate": 2.695040969282746e-09, + "loss": 0.0003, + "step": 50858 + }, + { + "epoch": 0.99, + "learning_rate": 2.691157624946604e-09, + "loss": 0.0017, + "step": 50859 + }, + { + "epoch": 0.99, + "learning_rate": 2.6872742806104618e-09, + "loss": 0.0004, + "step": 50860 + }, + { + "epoch": 0.99, + "learning_rate": 2.6833909362743196e-09, + "loss": 0.0595, + "step": 50861 + }, + { + "epoch": 0.99, + "learning_rate": 2.679507591938177e-09, + "loss": 0.0004, + "step": 50862 + }, + { + "epoch": 0.99, + "learning_rate": 2.6756242476020344e-09, + "loss": 0.0006, + "step": 50863 + }, + { + "epoch": 0.99, + "learning_rate": 2.6717409032658923e-09, + "loss": 0.0004, + "step": 50864 + }, + { + "epoch": 0.99, + "learning_rate": 2.66785755892975e-09, + "loss": 0.0003, + "step": 50865 + }, + { + "epoch": 0.99, + "learning_rate": 2.663974214593608e-09, + "loss": 0.0003, + "step": 50866 + }, + { + "epoch": 0.99, + "learning_rate": 2.6600908702574658e-09, + "loss": 0.0012, + "step": 50867 + }, + { + "epoch": 0.99, + "learning_rate": 2.6562075259213236e-09, + "loss": 0.0003, + "step": 50868 + }, + { + "epoch": 0.99, + "learning_rate": 2.652324181585181e-09, + "loss": 0.0003, + "step": 50869 + }, + { + "epoch": 0.99, + "learning_rate": 2.648440837249039e-09, + "loss": 0.0003, + "step": 50870 + }, + { + "epoch": 0.99, + "learning_rate": 2.6445574929128963e-09, + "loss": 0.0071, + "step": 50871 + }, + { + "epoch": 0.99, + "learning_rate": 2.640674148576754e-09, + "loss": 0.0004, + "step": 50872 + }, + { + "epoch": 0.99, + "learning_rate": 2.636790804240612e-09, + "loss": 0.0003, + "step": 50873 + }, + { + "epoch": 0.99, + "learning_rate": 2.6329074599044698e-09, + "loss": 1.2677, + "step": 50874 + }, + { + "epoch": 0.99, + "learning_rate": 2.629024115568327e-09, + "loss": 0.0005, + "step": 50875 + }, + { + "epoch": 0.99, + "learning_rate": 2.625140771232185e-09, + "loss": 0.0004, + "step": 50876 + }, + { + "epoch": 0.99, + "learning_rate": 2.621257426896043e-09, + "loss": 0.0006, + "step": 50877 + }, + { + "epoch": 0.99, + "learning_rate": 2.6173740825599007e-09, + "loss": 0.4242, + "step": 50878 + }, + { + "epoch": 0.99, + "learning_rate": 2.6134907382237585e-09, + "loss": 0.0004, + "step": 50879 + }, + { + "epoch": 0.99, + "learning_rate": 2.609607393887616e-09, + "loss": 0.0004, + "step": 50880 + }, + { + "epoch": 0.99, + "learning_rate": 2.6057240495514733e-09, + "loss": 0.0006, + "step": 50881 + }, + { + "epoch": 0.99, + "learning_rate": 2.601840705215331e-09, + "loss": 0.0004, + "step": 50882 + }, + { + "epoch": 0.99, + "learning_rate": 2.597957360879189e-09, + "loss": 0.0009, + "step": 50883 + }, + { + "epoch": 0.99, + "learning_rate": 2.594074016543047e-09, + "loss": 0.0006, + "step": 50884 + }, + { + "epoch": 0.99, + "learning_rate": 2.5901906722069047e-09, + "loss": 0.0004, + "step": 50885 + }, + { + "epoch": 0.99, + "learning_rate": 2.586307327870762e-09, + "loss": 0.0003, + "step": 50886 + }, + { + "epoch": 0.99, + "learning_rate": 2.58242398353462e-09, + "loss": 0.0005, + "step": 50887 + }, + { + "epoch": 0.99, + "learning_rate": 2.5785406391984777e-09, + "loss": 0.0003, + "step": 50888 + }, + { + "epoch": 0.99, + "learning_rate": 2.5746572948623356e-09, + "loss": 0.0006, + "step": 50889 + }, + { + "epoch": 0.99, + "learning_rate": 2.5707739505261934e-09, + "loss": 0.0004, + "step": 50890 + }, + { + "epoch": 0.99, + "learning_rate": 2.566890606190051e-09, + "loss": 0.0002, + "step": 50891 + }, + { + "epoch": 0.99, + "learning_rate": 2.5630072618539082e-09, + "loss": 0.0007, + "step": 50892 + }, + { + "epoch": 0.99, + "learning_rate": 2.559123917517766e-09, + "loss": 0.0004, + "step": 50893 + }, + { + "epoch": 0.99, + "learning_rate": 2.555240573181624e-09, + "loss": 0.0003, + "step": 50894 + }, + { + "epoch": 0.99, + "learning_rate": 2.5513572288454817e-09, + "loss": 0.0003, + "step": 50895 + }, + { + "epoch": 0.99, + "learning_rate": 2.5474738845093396e-09, + "loss": 0.0005, + "step": 50896 + }, + { + "epoch": 0.99, + "learning_rate": 2.543590540173197e-09, + "loss": 0.0857, + "step": 50897 + }, + { + "epoch": 0.99, + "learning_rate": 2.539707195837055e-09, + "loss": 0.0004, + "step": 50898 + }, + { + "epoch": 0.99, + "learning_rate": 2.5358238515009126e-09, + "loss": 0.0007, + "step": 50899 + }, + { + "epoch": 0.99, + "learning_rate": 2.53194050716477e-09, + "loss": 0.0003, + "step": 50900 + }, + { + "epoch": 0.99, + "learning_rate": 2.528057162828628e-09, + "loss": 0.0004, + "step": 50901 + }, + { + "epoch": 0.99, + "learning_rate": 2.5241738184924857e-09, + "loss": 0.0003, + "step": 50902 + }, + { + "epoch": 0.99, + "learning_rate": 2.520290474156343e-09, + "loss": 0.0004, + "step": 50903 + }, + { + "epoch": 0.99, + "learning_rate": 2.516407129820201e-09, + "loss": 0.0003, + "step": 50904 + }, + { + "epoch": 0.99, + "learning_rate": 2.5125237854840588e-09, + "loss": 0.9431, + "step": 50905 + }, + { + "epoch": 0.99, + "learning_rate": 2.5086404411479166e-09, + "loss": 0.9023, + "step": 50906 + }, + { + "epoch": 0.99, + "learning_rate": 2.5047570968117744e-09, + "loss": 0.0004, + "step": 50907 + }, + { + "epoch": 0.99, + "learning_rate": 2.500873752475632e-09, + "loss": 0.0004, + "step": 50908 + }, + { + "epoch": 0.99, + "learning_rate": 2.4969904081394897e-09, + "loss": 0.0006, + "step": 50909 + }, + { + "epoch": 0.99, + "learning_rate": 2.493107063803347e-09, + "loss": 0.0007, + "step": 50910 + }, + { + "epoch": 0.99, + "learning_rate": 2.489223719467205e-09, + "loss": 0.0004, + "step": 50911 + }, + { + "epoch": 0.99, + "learning_rate": 2.4853403751310628e-09, + "loss": 0.0003, + "step": 50912 + }, + { + "epoch": 0.99, + "learning_rate": 2.4814570307949206e-09, + "loss": 0.0002, + "step": 50913 + }, + { + "epoch": 0.99, + "learning_rate": 2.477573686458778e-09, + "loss": 0.0002, + "step": 50914 + }, + { + "epoch": 0.99, + "learning_rate": 2.473690342122636e-09, + "loss": 0.0004, + "step": 50915 + }, + { + "epoch": 0.99, + "learning_rate": 2.4698069977864937e-09, + "loss": 0.0006, + "step": 50916 + }, + { + "epoch": 0.99, + "learning_rate": 2.4659236534503515e-09, + "loss": 0.0004, + "step": 50917 + }, + { + "epoch": 0.99, + "learning_rate": 2.4620403091142093e-09, + "loss": 0.0004, + "step": 50918 + }, + { + "epoch": 0.99, + "learning_rate": 2.4581569647780668e-09, + "loss": 0.0003, + "step": 50919 + }, + { + "epoch": 0.99, + "learning_rate": 2.454273620441924e-09, + "loss": 0.0028, + "step": 50920 + }, + { + "epoch": 0.99, + "learning_rate": 2.450390276105782e-09, + "loss": 0.0004, + "step": 50921 + }, + { + "epoch": 0.99, + "learning_rate": 2.44650693176964e-09, + "loss": 0.0003, + "step": 50922 + }, + { + "epoch": 0.99, + "learning_rate": 2.4426235874334977e-09, + "loss": 0.0005, + "step": 50923 + }, + { + "epoch": 0.99, + "learning_rate": 2.4387402430973555e-09, + "loss": 0.0048, + "step": 50924 + }, + { + "epoch": 0.99, + "learning_rate": 2.434856898761213e-09, + "loss": 0.0004, + "step": 50925 + }, + { + "epoch": 0.99, + "learning_rate": 2.4309735544250707e-09, + "loss": 0.0004, + "step": 50926 + }, + { + "epoch": 0.99, + "learning_rate": 2.4270902100889286e-09, + "loss": 0.4464, + "step": 50927 + }, + { + "epoch": 0.99, + "learning_rate": 2.4232068657527864e-09, + "loss": 1.1349, + "step": 50928 + }, + { + "epoch": 0.99, + "learning_rate": 2.419323521416644e-09, + "loss": 0.0003, + "step": 50929 + }, + { + "epoch": 0.99, + "learning_rate": 2.4154401770805017e-09, + "loss": 0.0005, + "step": 50930 + }, + { + "epoch": 0.99, + "learning_rate": 2.411556832744359e-09, + "loss": 0.0004, + "step": 50931 + }, + { + "epoch": 0.99, + "learning_rate": 2.407673488408217e-09, + "loss": 0.0006, + "step": 50932 + }, + { + "epoch": 0.99, + "learning_rate": 2.4037901440720747e-09, + "loss": 0.0007, + "step": 50933 + }, + { + "epoch": 0.99, + "learning_rate": 2.3999067997359326e-09, + "loss": 0.0003, + "step": 50934 + }, + { + "epoch": 0.99, + "learning_rate": 2.3960234553997904e-09, + "loss": 0.0005, + "step": 50935 + }, + { + "epoch": 0.99, + "learning_rate": 2.392140111063648e-09, + "loss": 0.0003, + "step": 50936 + }, + { + "epoch": 0.99, + "learning_rate": 2.3882567667275056e-09, + "loss": 0.0004, + "step": 50937 + }, + { + "epoch": 0.99, + "learning_rate": 2.3843734223913635e-09, + "loss": 0.0004, + "step": 50938 + }, + { + "epoch": 0.99, + "learning_rate": 2.380490078055221e-09, + "loss": 0.0017, + "step": 50939 + }, + { + "epoch": 0.99, + "learning_rate": 2.3766067337190787e-09, + "loss": 0.0003, + "step": 50940 + }, + { + "epoch": 0.99, + "learning_rate": 2.3727233893829366e-09, + "loss": 0.0005, + "step": 50941 + }, + { + "epoch": 0.99, + "learning_rate": 2.368840045046794e-09, + "loss": 0.0005, + "step": 50942 + }, + { + "epoch": 0.99, + "learning_rate": 2.364956700710652e-09, + "loss": 0.0003, + "step": 50943 + }, + { + "epoch": 0.99, + "learning_rate": 2.3610733563745096e-09, + "loss": 0.0003, + "step": 50944 + }, + { + "epoch": 0.99, + "learning_rate": 2.3571900120383675e-09, + "loss": 0.0005, + "step": 50945 + }, + { + "epoch": 0.99, + "learning_rate": 2.3533066677022253e-09, + "loss": 0.0003, + "step": 50946 + }, + { + "epoch": 0.99, + "learning_rate": 2.3494233233660827e-09, + "loss": 0.0004, + "step": 50947 + }, + { + "epoch": 0.99, + "learning_rate": 2.3455399790299405e-09, + "loss": 0.0004, + "step": 50948 + }, + { + "epoch": 0.99, + "learning_rate": 2.341656634693798e-09, + "loss": 0.0004, + "step": 50949 + }, + { + "epoch": 0.99, + "learning_rate": 2.3377732903576558e-09, + "loss": 0.2859, + "step": 50950 + }, + { + "epoch": 0.99, + "learning_rate": 2.3338899460215136e-09, + "loss": 0.0005, + "step": 50951 + }, + { + "epoch": 0.99, + "learning_rate": 2.3300066016853715e-09, + "loss": 0.0004, + "step": 50952 + }, + { + "epoch": 0.99, + "learning_rate": 2.326123257349229e-09, + "loss": 0.0004, + "step": 50953 + }, + { + "epoch": 0.99, + "learning_rate": 2.3222399130130867e-09, + "loss": 0.0004, + "step": 50954 + }, + { + "epoch": 0.99, + "learning_rate": 2.3183565686769445e-09, + "loss": 0.0003, + "step": 50955 + }, + { + "epoch": 0.99, + "learning_rate": 2.3144732243408024e-09, + "loss": 0.0004, + "step": 50956 + }, + { + "epoch": 0.99, + "learning_rate": 2.31058988000466e-09, + "loss": 0.0004, + "step": 50957 + }, + { + "epoch": 0.99, + "learning_rate": 2.3067065356685176e-09, + "loss": 0.0197, + "step": 50958 + }, + { + "epoch": 0.99, + "learning_rate": 2.302823191332375e-09, + "loss": 0.0003, + "step": 50959 + }, + { + "epoch": 0.99, + "learning_rate": 2.298939846996233e-09, + "loss": 0.0004, + "step": 50960 + }, + { + "epoch": 0.99, + "learning_rate": 2.2950565026600907e-09, + "loss": 0.0005, + "step": 50961 + }, + { + "epoch": 0.99, + "learning_rate": 2.2911731583239485e-09, + "loss": 0.0004, + "step": 50962 + }, + { + "epoch": 0.99, + "learning_rate": 2.2872898139878064e-09, + "loss": 0.0008, + "step": 50963 + }, + { + "epoch": 0.99, + "learning_rate": 2.2834064696516638e-09, + "loss": 0.0006, + "step": 50964 + }, + { + "epoch": 0.99, + "learning_rate": 2.2795231253155216e-09, + "loss": 0.1419, + "step": 50965 + }, + { + "epoch": 0.99, + "learning_rate": 2.2756397809793794e-09, + "loss": 0.0003, + "step": 50966 + }, + { + "epoch": 0.99, + "learning_rate": 2.2717564366432373e-09, + "loss": 1.1619, + "step": 50967 + }, + { + "epoch": 0.99, + "learning_rate": 2.2678730923070947e-09, + "loss": 0.0005, + "step": 50968 + }, + { + "epoch": 0.99, + "learning_rate": 2.2639897479709525e-09, + "loss": 0.0004, + "step": 50969 + }, + { + "epoch": 0.99, + "learning_rate": 2.26010640363481e-09, + "loss": 0.0008, + "step": 50970 + }, + { + "epoch": 0.99, + "learning_rate": 2.2562230592986678e-09, + "loss": 0.0025, + "step": 50971 + }, + { + "epoch": 0.99, + "learning_rate": 2.2523397149625256e-09, + "loss": 0.0004, + "step": 50972 + }, + { + "epoch": 0.99, + "learning_rate": 2.2484563706263834e-09, + "loss": 0.0004, + "step": 50973 + }, + { + "epoch": 0.99, + "learning_rate": 2.2445730262902412e-09, + "loss": 0.0004, + "step": 50974 + }, + { + "epoch": 0.99, + "learning_rate": 2.2406896819540987e-09, + "loss": 0.0005, + "step": 50975 + }, + { + "epoch": 0.99, + "learning_rate": 2.2368063376179565e-09, + "loss": 0.0003, + "step": 50976 + }, + { + "epoch": 0.99, + "learning_rate": 2.2329229932818143e-09, + "loss": 0.0004, + "step": 50977 + }, + { + "epoch": 0.99, + "learning_rate": 2.2290396489456717e-09, + "loss": 0.0004, + "step": 50978 + }, + { + "epoch": 0.99, + "learning_rate": 2.2251563046095296e-09, + "loss": 0.0003, + "step": 50979 + }, + { + "epoch": 0.99, + "learning_rate": 2.2212729602733874e-09, + "loss": 0.0004, + "step": 50980 + }, + { + "epoch": 0.99, + "learning_rate": 2.217389615937245e-09, + "loss": 0.0004, + "step": 50981 + }, + { + "epoch": 0.99, + "learning_rate": 2.2135062716011027e-09, + "loss": 0.0003, + "step": 50982 + }, + { + "epoch": 0.99, + "learning_rate": 2.2096229272649605e-09, + "loss": 0.0005, + "step": 50983 + }, + { + "epoch": 0.99, + "learning_rate": 2.2057395829288183e-09, + "loss": 0.0026, + "step": 50984 + }, + { + "epoch": 0.99, + "learning_rate": 2.201856238592676e-09, + "loss": 0.0004, + "step": 50985 + }, + { + "epoch": 0.99, + "learning_rate": 2.197972894256534e-09, + "loss": 0.0007, + "step": 50986 + }, + { + "epoch": 0.99, + "learning_rate": 2.194089549920391e-09, + "loss": 0.0027, + "step": 50987 + }, + { + "epoch": 0.99, + "learning_rate": 2.190206205584249e-09, + "loss": 0.0289, + "step": 50988 + }, + { + "epoch": 0.99, + "learning_rate": 2.1863228612481066e-09, + "loss": 0.0003, + "step": 50989 + }, + { + "epoch": 0.99, + "learning_rate": 2.1824395169119645e-09, + "loss": 0.0004, + "step": 50990 + }, + { + "epoch": 0.99, + "learning_rate": 2.1785561725758223e-09, + "loss": 0.0753, + "step": 50991 + }, + { + "epoch": 0.99, + "learning_rate": 2.17467282823968e-09, + "loss": 0.4366, + "step": 50992 + }, + { + "epoch": 0.99, + "learning_rate": 2.1707894839035376e-09, + "loss": 0.0006, + "step": 50993 + }, + { + "epoch": 0.99, + "learning_rate": 2.1669061395673954e-09, + "loss": 0.0015, + "step": 50994 + }, + { + "epoch": 0.99, + "learning_rate": 2.1630227952312532e-09, + "loss": 0.0005, + "step": 50995 + }, + { + "epoch": 0.99, + "learning_rate": 2.159139450895111e-09, + "loss": 0.0004, + "step": 50996 + }, + { + "epoch": 0.99, + "learning_rate": 2.1552561065589685e-09, + "loss": 0.0004, + "step": 50997 + }, + { + "epoch": 0.99, + "learning_rate": 2.1513727622228263e-09, + "loss": 0.0004, + "step": 50998 + }, + { + "epoch": 0.99, + "learning_rate": 2.1474894178866837e-09, + "loss": 0.0004, + "step": 50999 + }, + { + "epoch": 0.99, + "learning_rate": 2.1436060735505415e-09, + "loss": 2.3544, + "step": 51000 + }, + { + "epoch": 0.99, + "learning_rate": 2.1397227292143994e-09, + "loss": 0.0004, + "step": 51001 + }, + { + "epoch": 0.99, + "learning_rate": 2.135839384878257e-09, + "loss": 0.0004, + "step": 51002 + }, + { + "epoch": 0.99, + "learning_rate": 2.131956040542115e-09, + "loss": 0.0003, + "step": 51003 + }, + { + "epoch": 0.99, + "learning_rate": 2.1280726962059724e-09, + "loss": 0.0004, + "step": 51004 + }, + { + "epoch": 0.99, + "learning_rate": 2.1241893518698303e-09, + "loss": 0.0111, + "step": 51005 + }, + { + "epoch": 0.99, + "learning_rate": 2.120306007533688e-09, + "loss": 0.006, + "step": 51006 + }, + { + "epoch": 0.99, + "learning_rate": 2.1164226631975455e-09, + "loss": 0.0004, + "step": 51007 + }, + { + "epoch": 0.99, + "learning_rate": 2.1125393188614034e-09, + "loss": 0.0005, + "step": 51008 + }, + { + "epoch": 0.99, + "learning_rate": 2.108655974525261e-09, + "loss": 1.3659, + "step": 51009 + }, + { + "epoch": 0.99, + "learning_rate": 2.1047726301891186e-09, + "loss": 0.0004, + "step": 51010 + }, + { + "epoch": 0.99, + "learning_rate": 2.1008892858529764e-09, + "loss": 0.0005, + "step": 51011 + }, + { + "epoch": 0.99, + "learning_rate": 2.0970059415168343e-09, + "loss": 0.0005, + "step": 51012 + }, + { + "epoch": 0.99, + "learning_rate": 2.093122597180692e-09, + "loss": 0.0002, + "step": 51013 + }, + { + "epoch": 0.99, + "learning_rate": 2.08923925284455e-09, + "loss": 0.0004, + "step": 51014 + }, + { + "epoch": 0.99, + "learning_rate": 2.0853559085084073e-09, + "loss": 0.0003, + "step": 51015 + }, + { + "epoch": 0.99, + "learning_rate": 2.0814725641722648e-09, + "loss": 0.0005, + "step": 51016 + }, + { + "epoch": 0.99, + "learning_rate": 2.0775892198361226e-09, + "loss": 0.0005, + "step": 51017 + }, + { + "epoch": 0.99, + "learning_rate": 2.0737058754999804e-09, + "loss": 0.0006, + "step": 51018 + }, + { + "epoch": 0.99, + "learning_rate": 2.0698225311638383e-09, + "loss": 0.0004, + "step": 51019 + }, + { + "epoch": 0.99, + "learning_rate": 2.065939186827696e-09, + "loss": 0.0003, + "step": 51020 + }, + { + "epoch": 0.99, + "learning_rate": 2.0620558424915535e-09, + "loss": 0.0005, + "step": 51021 + }, + { + "epoch": 0.99, + "learning_rate": 2.0581724981554113e-09, + "loss": 0.0003, + "step": 51022 + }, + { + "epoch": 0.99, + "learning_rate": 2.054289153819269e-09, + "loss": 0.0007, + "step": 51023 + }, + { + "epoch": 0.99, + "learning_rate": 2.050405809483127e-09, + "loss": 0.0004, + "step": 51024 + }, + { + "epoch": 0.99, + "learning_rate": 2.046522465146985e-09, + "loss": 0.0007, + "step": 51025 + }, + { + "epoch": 0.99, + "learning_rate": 2.0426391208108422e-09, + "loss": 0.0003, + "step": 51026 + }, + { + "epoch": 0.99, + "learning_rate": 2.0387557764746997e-09, + "loss": 0.0003, + "step": 51027 + }, + { + "epoch": 0.99, + "learning_rate": 2.0348724321385575e-09, + "loss": 0.0004, + "step": 51028 + }, + { + "epoch": 0.99, + "learning_rate": 2.0309890878024153e-09, + "loss": 0.0003, + "step": 51029 + }, + { + "epoch": 0.99, + "learning_rate": 2.027105743466273e-09, + "loss": 0.0011, + "step": 51030 + }, + { + "epoch": 0.99, + "learning_rate": 2.023222399130131e-09, + "loss": 0.0004, + "step": 51031 + }, + { + "epoch": 0.99, + "learning_rate": 2.0193390547939884e-09, + "loss": 0.0003, + "step": 51032 + }, + { + "epoch": 0.99, + "learning_rate": 2.0154557104578462e-09, + "loss": 0.0003, + "step": 51033 + }, + { + "epoch": 0.99, + "learning_rate": 2.011572366121704e-09, + "loss": 0.0005, + "step": 51034 + }, + { + "epoch": 0.99, + "learning_rate": 2.007689021785562e-09, + "loss": 0.0005, + "step": 51035 + }, + { + "epoch": 0.99, + "learning_rate": 2.0038056774494193e-09, + "loss": 0.0005, + "step": 51036 + }, + { + "epoch": 0.99, + "learning_rate": 1.999922333113277e-09, + "loss": 0.9393, + "step": 51037 + }, + { + "epoch": 0.99, + "learning_rate": 1.9960389887771346e-09, + "loss": 0.0005, + "step": 51038 + }, + { + "epoch": 0.99, + "learning_rate": 1.9921556444409924e-09, + "loss": 0.0003, + "step": 51039 + }, + { + "epoch": 0.99, + "learning_rate": 1.9882723001048502e-09, + "loss": 0.0005, + "step": 51040 + }, + { + "epoch": 0.99, + "learning_rate": 1.984388955768708e-09, + "loss": 0.0003, + "step": 51041 + }, + { + "epoch": 0.99, + "learning_rate": 1.980505611432566e-09, + "loss": 0.0004, + "step": 51042 + }, + { + "epoch": 0.99, + "learning_rate": 1.9766222670964233e-09, + "loss": 0.0002, + "step": 51043 + }, + { + "epoch": 0.99, + "learning_rate": 1.972738922760281e-09, + "loss": 0.0005, + "step": 51044 + }, + { + "epoch": 0.99, + "learning_rate": 1.9688555784241385e-09, + "loss": 0.0004, + "step": 51045 + }, + { + "epoch": 0.99, + "learning_rate": 1.9649722340879964e-09, + "loss": 0.3355, + "step": 51046 + }, + { + "epoch": 0.99, + "learning_rate": 1.9610888897518542e-09, + "loss": 0.0004, + "step": 51047 + }, + { + "epoch": 0.99, + "learning_rate": 1.957205545415712e-09, + "loss": 0.0004, + "step": 51048 + }, + { + "epoch": 0.99, + "learning_rate": 1.9533222010795695e-09, + "loss": 0.3387, + "step": 51049 + }, + { + "epoch": 0.99, + "learning_rate": 1.9494388567434273e-09, + "loss": 0.0005, + "step": 51050 + }, + { + "epoch": 0.99, + "learning_rate": 1.945555512407285e-09, + "loss": 0.0004, + "step": 51051 + }, + { + "epoch": 0.99, + "learning_rate": 1.941672168071143e-09, + "loss": 0.0005, + "step": 51052 + }, + { + "epoch": 0.99, + "learning_rate": 1.9377888237350008e-09, + "loss": 0.1624, + "step": 51053 + }, + { + "epoch": 0.99, + "learning_rate": 1.933905479398858e-09, + "loss": 0.0004, + "step": 51054 + }, + { + "epoch": 0.99, + "learning_rate": 1.9300221350627156e-09, + "loss": 0.0003, + "step": 51055 + }, + { + "epoch": 0.99, + "learning_rate": 1.9261387907265734e-09, + "loss": 0.0003, + "step": 51056 + }, + { + "epoch": 0.99, + "learning_rate": 1.9222554463904313e-09, + "loss": 0.0004, + "step": 51057 + }, + { + "epoch": 0.99, + "learning_rate": 1.918372102054289e-09, + "loss": 1.1912, + "step": 51058 + }, + { + "epoch": 0.99, + "learning_rate": 1.914488757718147e-09, + "loss": 0.0003, + "step": 51059 + }, + { + "epoch": 0.99, + "learning_rate": 1.9106054133820044e-09, + "loss": 0.0003, + "step": 51060 + }, + { + "epoch": 0.99, + "learning_rate": 1.906722069045862e-09, + "loss": 1.0406, + "step": 51061 + }, + { + "epoch": 0.99, + "learning_rate": 1.90283872470972e-09, + "loss": 0.0003, + "step": 51062 + }, + { + "epoch": 0.99, + "learning_rate": 1.898955380373578e-09, + "loss": 0.0004, + "step": 51063 + }, + { + "epoch": 0.99, + "learning_rate": 1.8950720360374357e-09, + "loss": 0.0004, + "step": 51064 + }, + { + "epoch": 0.99, + "learning_rate": 1.891188691701293e-09, + "loss": 0.0004, + "step": 51065 + }, + { + "epoch": 0.99, + "learning_rate": 1.8873053473651505e-09, + "loss": 0.0037, + "step": 51066 + }, + { + "epoch": 0.99, + "learning_rate": 1.8834220030290083e-09, + "loss": 0.0005, + "step": 51067 + }, + { + "epoch": 0.99, + "learning_rate": 1.879538658692866e-09, + "loss": 0.0004, + "step": 51068 + }, + { + "epoch": 0.99, + "learning_rate": 1.875655314356724e-09, + "loss": 0.0005, + "step": 51069 + }, + { + "epoch": 0.99, + "learning_rate": 1.871771970020582e-09, + "loss": 0.0003, + "step": 51070 + }, + { + "epoch": 0.99, + "learning_rate": 1.8678886256844392e-09, + "loss": 0.0004, + "step": 51071 + }, + { + "epoch": 0.99, + "learning_rate": 1.864005281348297e-09, + "loss": 0.0015, + "step": 51072 + }, + { + "epoch": 0.99, + "learning_rate": 1.860121937012155e-09, + "loss": 0.0004, + "step": 51073 + }, + { + "epoch": 0.99, + "learning_rate": 1.8562385926760123e-09, + "loss": 0.0005, + "step": 51074 + }, + { + "epoch": 0.99, + "learning_rate": 1.8523552483398702e-09, + "loss": 0.0005, + "step": 51075 + }, + { + "epoch": 0.99, + "learning_rate": 1.8484719040037278e-09, + "loss": 0.0004, + "step": 51076 + }, + { + "epoch": 0.99, + "learning_rate": 1.8445885596675856e-09, + "loss": 0.0005, + "step": 51077 + }, + { + "epoch": 0.99, + "learning_rate": 1.8407052153314432e-09, + "loss": 0.0004, + "step": 51078 + }, + { + "epoch": 0.99, + "learning_rate": 1.836821870995301e-09, + "loss": 0.0005, + "step": 51079 + }, + { + "epoch": 0.99, + "learning_rate": 1.832938526659159e-09, + "loss": 0.0003, + "step": 51080 + }, + { + "epoch": 0.99, + "learning_rate": 1.8290551823230165e-09, + "loss": 0.0005, + "step": 51081 + }, + { + "epoch": 0.99, + "learning_rate": 1.8251718379868744e-09, + "loss": 0.0005, + "step": 51082 + }, + { + "epoch": 0.99, + "learning_rate": 1.8212884936507322e-09, + "loss": 0.0003, + "step": 51083 + }, + { + "epoch": 0.99, + "learning_rate": 1.8174051493145894e-09, + "loss": 0.0009, + "step": 51084 + }, + { + "epoch": 0.99, + "learning_rate": 1.8135218049784472e-09, + "loss": 0.0004, + "step": 51085 + }, + { + "epoch": 0.99, + "learning_rate": 1.809638460642305e-09, + "loss": 0.0003, + "step": 51086 + }, + { + "epoch": 0.99, + "learning_rate": 1.8057551163061627e-09, + "loss": 0.0003, + "step": 51087 + }, + { + "epoch": 0.99, + "learning_rate": 1.8018717719700205e-09, + "loss": 0.0003, + "step": 51088 + }, + { + "epoch": 0.99, + "learning_rate": 1.7979884276338783e-09, + "loss": 0.0183, + "step": 51089 + }, + { + "epoch": 0.99, + "learning_rate": 1.794105083297736e-09, + "loss": 0.0003, + "step": 51090 + }, + { + "epoch": 0.99, + "learning_rate": 1.7902217389615938e-09, + "loss": 0.0224, + "step": 51091 + }, + { + "epoch": 0.99, + "learning_rate": 1.7863383946254514e-09, + "loss": 0.0003, + "step": 51092 + }, + { + "epoch": 0.99, + "learning_rate": 1.7824550502893093e-09, + "loss": 0.0278, + "step": 51093 + }, + { + "epoch": 0.99, + "learning_rate": 1.7785717059531667e-09, + "loss": 0.0005, + "step": 51094 + }, + { + "epoch": 0.99, + "learning_rate": 1.7746883616170245e-09, + "loss": 0.0005, + "step": 51095 + }, + { + "epoch": 0.99, + "learning_rate": 1.7708050172808821e-09, + "loss": 0.0005, + "step": 51096 + }, + { + "epoch": 0.99, + "learning_rate": 1.76692167294474e-09, + "loss": 0.0004, + "step": 51097 + }, + { + "epoch": 0.99, + "learning_rate": 1.7630383286085976e-09, + "loss": 0.0006, + "step": 51098 + }, + { + "epoch": 0.99, + "learning_rate": 1.7591549842724554e-09, + "loss": 0.0005, + "step": 51099 + }, + { + "epoch": 0.99, + "learning_rate": 1.7552716399363132e-09, + "loss": 0.0005, + "step": 51100 + }, + { + "epoch": 0.99, + "learning_rate": 1.7513882956001709e-09, + "loss": 0.0009, + "step": 51101 + }, + { + "epoch": 0.99, + "learning_rate": 1.7475049512640287e-09, + "loss": 0.0005, + "step": 51102 + }, + { + "epoch": 0.99, + "learning_rate": 1.7436216069278861e-09, + "loss": 0.0004, + "step": 51103 + }, + { + "epoch": 0.99, + "learning_rate": 1.7397382625917437e-09, + "loss": 0.3448, + "step": 51104 + }, + { + "epoch": 0.99, + "learning_rate": 1.7358549182556016e-09, + "loss": 0.0003, + "step": 51105 + }, + { + "epoch": 0.99, + "learning_rate": 1.7319715739194594e-09, + "loss": 0.0006, + "step": 51106 + }, + { + "epoch": 0.99, + "learning_rate": 1.728088229583317e-09, + "loss": 0.0012, + "step": 51107 + }, + { + "epoch": 0.99, + "learning_rate": 1.7242048852471749e-09, + "loss": 0.0002, + "step": 51108 + }, + { + "epoch": 0.99, + "learning_rate": 1.7203215409110325e-09, + "loss": 0.0005, + "step": 51109 + }, + { + "epoch": 0.99, + "learning_rate": 1.7164381965748903e-09, + "loss": 0.0327, + "step": 51110 + }, + { + "epoch": 0.99, + "learning_rate": 1.7125548522387481e-09, + "loss": 0.0005, + "step": 51111 + }, + { + "epoch": 0.99, + "learning_rate": 1.7086715079026058e-09, + "loss": 1.3375, + "step": 51112 + }, + { + "epoch": 0.99, + "learning_rate": 1.7047881635664632e-09, + "loss": 0.0003, + "step": 51113 + }, + { + "epoch": 0.99, + "learning_rate": 1.700904819230321e-09, + "loss": 0.0003, + "step": 51114 + }, + { + "epoch": 0.99, + "learning_rate": 1.6970214748941786e-09, + "loss": 0.0002, + "step": 51115 + }, + { + "epoch": 0.99, + "learning_rate": 1.6931381305580365e-09, + "loss": 0.0005, + "step": 51116 + }, + { + "epoch": 0.99, + "learning_rate": 1.6892547862218943e-09, + "loss": 0.0004, + "step": 51117 + }, + { + "epoch": 0.99, + "learning_rate": 1.685371441885752e-09, + "loss": 0.0005, + "step": 51118 + }, + { + "epoch": 0.99, + "learning_rate": 1.6814880975496097e-09, + "loss": 0.0004, + "step": 51119 + }, + { + "epoch": 0.99, + "learning_rate": 1.6776047532134674e-09, + "loss": 0.0005, + "step": 51120 + }, + { + "epoch": 0.99, + "learning_rate": 1.6737214088773252e-09, + "loss": 0.0005, + "step": 51121 + }, + { + "epoch": 0.99, + "learning_rate": 1.669838064541183e-09, + "loss": 0.0007, + "step": 51122 + }, + { + "epoch": 0.99, + "learning_rate": 1.6659547202050405e-09, + "loss": 0.0004, + "step": 51123 + }, + { + "epoch": 0.99, + "learning_rate": 1.662071375868898e-09, + "loss": 0.0003, + "step": 51124 + }, + { + "epoch": 0.99, + "learning_rate": 1.658188031532756e-09, + "loss": 0.0004, + "step": 51125 + }, + { + "epoch": 0.99, + "learning_rate": 1.6543046871966135e-09, + "loss": 0.0005, + "step": 51126 + }, + { + "epoch": 0.99, + "learning_rate": 1.6504213428604714e-09, + "loss": 0.0005, + "step": 51127 + }, + { + "epoch": 0.99, + "learning_rate": 1.6465379985243292e-09, + "loss": 0.0003, + "step": 51128 + }, + { + "epoch": 0.99, + "learning_rate": 1.6426546541881868e-09, + "loss": 0.0007, + "step": 51129 + }, + { + "epoch": 0.99, + "learning_rate": 1.6387713098520446e-09, + "loss": 0.0004, + "step": 51130 + }, + { + "epoch": 0.99, + "learning_rate": 1.6348879655159023e-09, + "loss": 0.0003, + "step": 51131 + }, + { + "epoch": 0.99, + "learning_rate": 1.6310046211797597e-09, + "loss": 0.0005, + "step": 51132 + }, + { + "epoch": 0.99, + "learning_rate": 1.6271212768436175e-09, + "loss": 0.0005, + "step": 51133 + }, + { + "epoch": 0.99, + "learning_rate": 1.6232379325074753e-09, + "loss": 0.0292, + "step": 51134 + }, + { + "epoch": 0.99, + "learning_rate": 1.619354588171333e-09, + "loss": 0.0004, + "step": 51135 + }, + { + "epoch": 0.99, + "learning_rate": 1.6154712438351908e-09, + "loss": 0.0006, + "step": 51136 + }, + { + "epoch": 0.99, + "learning_rate": 1.6115878994990484e-09, + "loss": 0.0004, + "step": 51137 + }, + { + "epoch": 0.99, + "learning_rate": 1.6077045551629063e-09, + "loss": 0.0004, + "step": 51138 + }, + { + "epoch": 0.99, + "learning_rate": 1.603821210826764e-09, + "loss": 0.0003, + "step": 51139 + }, + { + "epoch": 0.99, + "learning_rate": 1.5999378664906217e-09, + "loss": 0.0002, + "step": 51140 + }, + { + "epoch": 0.99, + "learning_rate": 1.5960545221544795e-09, + "loss": 0.0004, + "step": 51141 + }, + { + "epoch": 0.99, + "learning_rate": 1.592171177818337e-09, + "loss": 0.0005, + "step": 51142 + }, + { + "epoch": 0.99, + "learning_rate": 1.5882878334821946e-09, + "loss": 0.0003, + "step": 51143 + }, + { + "epoch": 0.99, + "learning_rate": 1.5844044891460524e-09, + "loss": 0.0005, + "step": 51144 + }, + { + "epoch": 0.99, + "learning_rate": 1.5805211448099102e-09, + "loss": 0.2206, + "step": 51145 + }, + { + "epoch": 0.99, + "learning_rate": 1.5766378004737679e-09, + "loss": 0.0006, + "step": 51146 + }, + { + "epoch": 0.99, + "learning_rate": 1.5727544561376257e-09, + "loss": 0.8207, + "step": 51147 + }, + { + "epoch": 0.99, + "learning_rate": 1.5688711118014835e-09, + "loss": 0.0004, + "step": 51148 + }, + { + "epoch": 0.99, + "learning_rate": 1.5649877674653412e-09, + "loss": 1.3043, + "step": 51149 + }, + { + "epoch": 0.99, + "learning_rate": 1.5611044231291988e-09, + "loss": 0.0004, + "step": 51150 + }, + { + "epoch": 0.99, + "learning_rate": 1.5572210787930566e-09, + "loss": 0.0004, + "step": 51151 + }, + { + "epoch": 0.99, + "learning_rate": 1.5533377344569142e-09, + "loss": 0.0003, + "step": 51152 + }, + { + "epoch": 0.99, + "learning_rate": 1.549454390120772e-09, + "loss": 0.0004, + "step": 51153 + }, + { + "epoch": 0.99, + "learning_rate": 1.5455710457846297e-09, + "loss": 0.0003, + "step": 51154 + }, + { + "epoch": 0.99, + "learning_rate": 1.5416877014484873e-09, + "loss": 0.0005, + "step": 51155 + }, + { + "epoch": 0.99, + "learning_rate": 1.5378043571123451e-09, + "loss": 0.0003, + "step": 51156 + }, + { + "epoch": 0.99, + "learning_rate": 1.5339210127762028e-09, + "loss": 0.0003, + "step": 51157 + }, + { + "epoch": 0.99, + "learning_rate": 1.5300376684400606e-09, + "loss": 0.0004, + "step": 51158 + }, + { + "epoch": 0.99, + "learning_rate": 1.5261543241039182e-09, + "loss": 0.0003, + "step": 51159 + }, + { + "epoch": 0.99, + "learning_rate": 1.5222709797677758e-09, + "loss": 0.0005, + "step": 51160 + }, + { + "epoch": 0.99, + "learning_rate": 1.5183876354316337e-09, + "loss": 0.0003, + "step": 51161 + }, + { + "epoch": 0.99, + "learning_rate": 1.5145042910954915e-09, + "loss": 0.0004, + "step": 51162 + }, + { + "epoch": 0.99, + "learning_rate": 1.5106209467593491e-09, + "loss": 0.0005, + "step": 51163 + }, + { + "epoch": 0.99, + "learning_rate": 1.5067376024232068e-09, + "loss": 0.0005, + "step": 51164 + }, + { + "epoch": 0.99, + "learning_rate": 1.5028542580870646e-09, + "loss": 0.297, + "step": 51165 + }, + { + "epoch": 0.99, + "learning_rate": 1.4989709137509222e-09, + "loss": 0.0006, + "step": 51166 + }, + { + "epoch": 0.99, + "learning_rate": 1.49508756941478e-09, + "loss": 0.0003, + "step": 51167 + }, + { + "epoch": 0.99, + "learning_rate": 1.4912042250786377e-09, + "loss": 0.0006, + "step": 51168 + }, + { + "epoch": 0.99, + "learning_rate": 1.4873208807424953e-09, + "loss": 0.0004, + "step": 51169 + }, + { + "epoch": 0.99, + "learning_rate": 1.4834375364063531e-09, + "loss": 0.0003, + "step": 51170 + }, + { + "epoch": 0.99, + "learning_rate": 1.4795541920702107e-09, + "loss": 0.0003, + "step": 51171 + }, + { + "epoch": 0.99, + "learning_rate": 1.4756708477340686e-09, + "loss": 0.0002, + "step": 51172 + }, + { + "epoch": 0.99, + "learning_rate": 1.4717875033979262e-09, + "loss": 0.0003, + "step": 51173 + }, + { + "epoch": 0.99, + "learning_rate": 1.4679041590617838e-09, + "loss": 0.0003, + "step": 51174 + }, + { + "epoch": 0.99, + "learning_rate": 1.4640208147256417e-09, + "loss": 0.0008, + "step": 51175 + }, + { + "epoch": 0.99, + "learning_rate": 1.4601374703894995e-09, + "loss": 0.01, + "step": 51176 + }, + { + "epoch": 0.99, + "learning_rate": 1.4562541260533571e-09, + "loss": 0.0004, + "step": 51177 + }, + { + "epoch": 0.99, + "learning_rate": 1.4523707817172147e-09, + "loss": 0.0002, + "step": 51178 + }, + { + "epoch": 0.99, + "learning_rate": 1.4484874373810726e-09, + "loss": 0.0005, + "step": 51179 + }, + { + "epoch": 0.99, + "learning_rate": 1.4446040930449302e-09, + "loss": 0.0007, + "step": 51180 + }, + { + "epoch": 0.99, + "learning_rate": 1.440720748708788e-09, + "loss": 0.0002, + "step": 51181 + }, + { + "epoch": 0.99, + "learning_rate": 1.4368374043726456e-09, + "loss": 0.0003, + "step": 51182 + }, + { + "epoch": 0.99, + "learning_rate": 1.4329540600365033e-09, + "loss": 0.0398, + "step": 51183 + }, + { + "epoch": 0.99, + "learning_rate": 1.429070715700361e-09, + "loss": 0.0003, + "step": 51184 + }, + { + "epoch": 0.99, + "learning_rate": 1.4251873713642187e-09, + "loss": 0.0004, + "step": 51185 + }, + { + "epoch": 0.99, + "learning_rate": 1.4213040270280765e-09, + "loss": 0.0004, + "step": 51186 + }, + { + "epoch": 0.99, + "learning_rate": 1.4174206826919344e-09, + "loss": 0.0004, + "step": 51187 + }, + { + "epoch": 0.99, + "learning_rate": 1.4135373383557918e-09, + "loss": 0.0031, + "step": 51188 + }, + { + "epoch": 0.99, + "learning_rate": 1.4096539940196496e-09, + "loss": 0.0138, + "step": 51189 + }, + { + "epoch": 0.99, + "learning_rate": 1.4057706496835075e-09, + "loss": 0.0004, + "step": 51190 + }, + { + "epoch": 0.99, + "learning_rate": 1.401887305347365e-09, + "loss": 0.7128, + "step": 51191 + }, + { + "epoch": 0.99, + "learning_rate": 1.398003961011223e-09, + "loss": 0.0005, + "step": 51192 + }, + { + "epoch": 0.99, + "learning_rate": 1.3941206166750805e-09, + "loss": 0.0005, + "step": 51193 + }, + { + "epoch": 0.99, + "learning_rate": 1.3902372723389382e-09, + "loss": 0.0004, + "step": 51194 + }, + { + "epoch": 0.99, + "learning_rate": 1.386353928002796e-09, + "loss": 0.0004, + "step": 51195 + }, + { + "epoch": 0.99, + "learning_rate": 1.3824705836666536e-09, + "loss": 0.0003, + "step": 51196 + }, + { + "epoch": 0.99, + "learning_rate": 1.3785872393305112e-09, + "loss": 0.0004, + "step": 51197 + }, + { + "epoch": 0.99, + "learning_rate": 1.374703894994369e-09, + "loss": 0.0004, + "step": 51198 + }, + { + "epoch": 0.99, + "learning_rate": 1.3708205506582267e-09, + "loss": 0.0005, + "step": 51199 + }, + { + "epoch": 0.99, + "learning_rate": 1.3669372063220845e-09, + "loss": 0.0002, + "step": 51200 + }, + { + "epoch": 0.99, + "learning_rate": 1.3630538619859424e-09, + "loss": 0.1599, + "step": 51201 + }, + { + "epoch": 0.99, + "learning_rate": 1.3591705176497998e-09, + "loss": 0.0004, + "step": 51202 + }, + { + "epoch": 0.99, + "learning_rate": 1.3552871733136576e-09, + "loss": 0.0003, + "step": 51203 + }, + { + "epoch": 0.99, + "learning_rate": 1.3514038289775154e-09, + "loss": 0.0005, + "step": 51204 + }, + { + "epoch": 0.99, + "learning_rate": 1.347520484641373e-09, + "loss": 0.0004, + "step": 51205 + }, + { + "epoch": 0.99, + "learning_rate": 1.3436371403052309e-09, + "loss": 0.0003, + "step": 51206 + }, + { + "epoch": 0.99, + "learning_rate": 1.3397537959690885e-09, + "loss": 0.0004, + "step": 51207 + }, + { + "epoch": 0.99, + "learning_rate": 1.3358704516329461e-09, + "loss": 0.0026, + "step": 51208 + }, + { + "epoch": 0.99, + "learning_rate": 1.331987107296804e-09, + "loss": 0.0004, + "step": 51209 + }, + { + "epoch": 0.99, + "learning_rate": 1.3281037629606618e-09, + "loss": 0.0004, + "step": 51210 + }, + { + "epoch": 0.99, + "learning_rate": 1.3242204186245194e-09, + "loss": 0.0004, + "step": 51211 + }, + { + "epoch": 0.99, + "learning_rate": 1.320337074288377e-09, + "loss": 0.0005, + "step": 51212 + }, + { + "epoch": 0.99, + "learning_rate": 1.3164537299522349e-09, + "loss": 0.0005, + "step": 51213 + }, + { + "epoch": 0.99, + "learning_rate": 1.3125703856160925e-09, + "loss": 0.0004, + "step": 51214 + }, + { + "epoch": 0.99, + "learning_rate": 1.3086870412799503e-09, + "loss": 0.6843, + "step": 51215 + }, + { + "epoch": 0.99, + "learning_rate": 1.304803696943808e-09, + "loss": 0.0063, + "step": 51216 + }, + { + "epoch": 0.99, + "learning_rate": 1.3009203526076656e-09, + "loss": 1.2101, + "step": 51217 + }, + { + "epoch": 0.99, + "learning_rate": 1.2970370082715234e-09, + "loss": 0.1782, + "step": 51218 + }, + { + "epoch": 0.99, + "learning_rate": 1.293153663935381e-09, + "loss": 0.0007, + "step": 51219 + }, + { + "epoch": 0.99, + "learning_rate": 1.2892703195992389e-09, + "loss": 0.0005, + "step": 51220 + }, + { + "epoch": 0.99, + "learning_rate": 1.2853869752630967e-09, + "loss": 0.0004, + "step": 51221 + }, + { + "epoch": 0.99, + "learning_rate": 1.2815036309269541e-09, + "loss": 0.0003, + "step": 51222 + }, + { + "epoch": 0.99, + "learning_rate": 1.277620286590812e-09, + "loss": 0.0003, + "step": 51223 + }, + { + "epoch": 0.99, + "learning_rate": 1.2737369422546698e-09, + "loss": 0.0005, + "step": 51224 + }, + { + "epoch": 0.99, + "learning_rate": 1.2698535979185274e-09, + "loss": 0.0004, + "step": 51225 + }, + { + "epoch": 0.99, + "learning_rate": 1.265970253582385e-09, + "loss": 0.0004, + "step": 51226 + }, + { + "epoch": 0.99, + "learning_rate": 1.2620869092462429e-09, + "loss": 0.0006, + "step": 51227 + }, + { + "epoch": 0.99, + "learning_rate": 1.2582035649101005e-09, + "loss": 0.0004, + "step": 51228 + }, + { + "epoch": 0.99, + "learning_rate": 1.2543202205739583e-09, + "loss": 0.0004, + "step": 51229 + }, + { + "epoch": 0.99, + "learning_rate": 1.250436876237816e-09, + "loss": 0.0265, + "step": 51230 + }, + { + "epoch": 0.99, + "learning_rate": 1.2465535319016736e-09, + "loss": 0.0007, + "step": 51231 + }, + { + "epoch": 0.99, + "learning_rate": 1.2426701875655314e-09, + "loss": 0.0007, + "step": 51232 + }, + { + "epoch": 0.99, + "learning_rate": 1.238786843229389e-09, + "loss": 0.0003, + "step": 51233 + }, + { + "epoch": 0.99, + "learning_rate": 1.2349034988932468e-09, + "loss": 0.0003, + "step": 51234 + }, + { + "epoch": 0.99, + "learning_rate": 1.2310201545571047e-09, + "loss": 0.0003, + "step": 51235 + }, + { + "epoch": 0.99, + "learning_rate": 1.227136810220962e-09, + "loss": 0.0002, + "step": 51236 + }, + { + "epoch": 0.99, + "learning_rate": 1.22325346588482e-09, + "loss": 0.0006, + "step": 51237 + }, + { + "epoch": 0.99, + "learning_rate": 1.2193701215486778e-09, + "loss": 0.001, + "step": 51238 + }, + { + "epoch": 0.99, + "learning_rate": 1.2154867772125354e-09, + "loss": 0.0004, + "step": 51239 + }, + { + "epoch": 0.99, + "learning_rate": 1.2116034328763932e-09, + "loss": 0.0002, + "step": 51240 + }, + { + "epoch": 0.99, + "learning_rate": 1.2077200885402508e-09, + "loss": 0.0003, + "step": 51241 + }, + { + "epoch": 0.99, + "learning_rate": 1.2038367442041085e-09, + "loss": 0.0004, + "step": 51242 + }, + { + "epoch": 0.99, + "learning_rate": 1.1999533998679663e-09, + "loss": 0.0004, + "step": 51243 + }, + { + "epoch": 0.99, + "learning_rate": 1.196070055531824e-09, + "loss": 0.0004, + "step": 51244 + }, + { + "epoch": 0.99, + "learning_rate": 1.1921867111956817e-09, + "loss": 0.0002, + "step": 51245 + }, + { + "epoch": 0.99, + "learning_rate": 1.1883033668595394e-09, + "loss": 0.0022, + "step": 51246 + }, + { + "epoch": 0.99, + "learning_rate": 1.184420022523397e-09, + "loss": 0.0004, + "step": 51247 + }, + { + "epoch": 0.99, + "learning_rate": 1.1805366781872548e-09, + "loss": 0.0236, + "step": 51248 + }, + { + "epoch": 0.99, + "learning_rate": 1.1766533338511126e-09, + "loss": 0.0004, + "step": 51249 + }, + { + "epoch": 0.99, + "learning_rate": 1.1727699895149703e-09, + "loss": 0.0004, + "step": 51250 + }, + { + "epoch": 0.99, + "learning_rate": 1.1688866451788279e-09, + "loss": 1.4314, + "step": 51251 + }, + { + "epoch": 0.99, + "learning_rate": 1.1650033008426857e-09, + "loss": 0.0003, + "step": 51252 + }, + { + "epoch": 0.99, + "learning_rate": 1.1611199565065434e-09, + "loss": 0.0002, + "step": 51253 + }, + { + "epoch": 0.99, + "learning_rate": 1.1572366121704012e-09, + "loss": 0.6964, + "step": 51254 + }, + { + "epoch": 0.99, + "learning_rate": 1.1533532678342588e-09, + "loss": 0.0022, + "step": 51255 + }, + { + "epoch": 0.99, + "learning_rate": 1.1494699234981164e-09, + "loss": 0.0006, + "step": 51256 + }, + { + "epoch": 0.99, + "learning_rate": 1.1455865791619743e-09, + "loss": 0.0003, + "step": 51257 + }, + { + "epoch": 0.99, + "learning_rate": 1.1417032348258319e-09, + "loss": 0.0049, + "step": 51258 + }, + { + "epoch": 0.99, + "learning_rate": 1.1378198904896897e-09, + "loss": 0.0003, + "step": 51259 + }, + { + "epoch": 0.99, + "learning_rate": 1.1339365461535473e-09, + "loss": 0.0107, + "step": 51260 + }, + { + "epoch": 0.99, + "learning_rate": 1.130053201817405e-09, + "loss": 0.0004, + "step": 51261 + }, + { + "epoch": 0.99, + "learning_rate": 1.1261698574812628e-09, + "loss": 0.0006, + "step": 51262 + }, + { + "epoch": 0.99, + "learning_rate": 1.1222865131451206e-09, + "loss": 0.4274, + "step": 51263 + }, + { + "epoch": 0.99, + "learning_rate": 1.1184031688089782e-09, + "loss": 0.0013, + "step": 51264 + }, + { + "epoch": 0.99, + "learning_rate": 1.1145198244728359e-09, + "loss": 0.0004, + "step": 51265 + }, + { + "epoch": 0.99, + "learning_rate": 1.1106364801366937e-09, + "loss": 0.0003, + "step": 51266 + }, + { + "epoch": 0.99, + "learning_rate": 1.1067531358005513e-09, + "loss": 0.0005, + "step": 51267 + }, + { + "epoch": 0.99, + "learning_rate": 1.1028697914644092e-09, + "loss": 0.0004, + "step": 51268 + }, + { + "epoch": 0.99, + "learning_rate": 1.098986447128267e-09, + "loss": 0.0004, + "step": 51269 + }, + { + "epoch": 0.99, + "learning_rate": 1.0951031027921244e-09, + "loss": 0.0004, + "step": 51270 + }, + { + "epoch": 0.99, + "learning_rate": 1.0912197584559822e-09, + "loss": 0.0003, + "step": 51271 + }, + { + "epoch": 0.99, + "learning_rate": 1.08733641411984e-09, + "loss": 0.0005, + "step": 51272 + }, + { + "epoch": 0.99, + "learning_rate": 1.0834530697836977e-09, + "loss": 0.0008, + "step": 51273 + }, + { + "epoch": 0.99, + "learning_rate": 1.0795697254475555e-09, + "loss": 0.0006, + "step": 51274 + }, + { + "epoch": 0.99, + "learning_rate": 1.0756863811114131e-09, + "loss": 0.0004, + "step": 51275 + }, + { + "epoch": 0.99, + "learning_rate": 1.0718030367752708e-09, + "loss": 0.0004, + "step": 51276 + }, + { + "epoch": 0.99, + "learning_rate": 1.0679196924391286e-09, + "loss": 0.0004, + "step": 51277 + }, + { + "epoch": 0.99, + "learning_rate": 1.0640363481029862e-09, + "loss": 1.2301, + "step": 51278 + }, + { + "epoch": 0.99, + "learning_rate": 1.060153003766844e-09, + "loss": 0.0004, + "step": 51279 + }, + { + "epoch": 0.99, + "learning_rate": 1.0562696594307017e-09, + "loss": 0.1486, + "step": 51280 + }, + { + "epoch": 0.99, + "learning_rate": 1.0523863150945593e-09, + "loss": 0.0005, + "step": 51281 + }, + { + "epoch": 0.99, + "learning_rate": 1.0485029707584171e-09, + "loss": 0.1232, + "step": 51282 + }, + { + "epoch": 0.99, + "learning_rate": 1.044619626422275e-09, + "loss": 0.0692, + "step": 51283 + }, + { + "epoch": 0.99, + "learning_rate": 1.0407362820861324e-09, + "loss": 0.001, + "step": 51284 + }, + { + "epoch": 0.99, + "learning_rate": 1.0368529377499902e-09, + "loss": 0.0003, + "step": 51285 + }, + { + "epoch": 0.99, + "learning_rate": 1.032969593413848e-09, + "loss": 0.0004, + "step": 51286 + }, + { + "epoch": 0.99, + "learning_rate": 1.0290862490777057e-09, + "loss": 0.0027, + "step": 51287 + }, + { + "epoch": 0.99, + "learning_rate": 1.0252029047415635e-09, + "loss": 0.0004, + "step": 51288 + }, + { + "epoch": 0.99, + "learning_rate": 1.0213195604054211e-09, + "loss": 0.0004, + "step": 51289 + }, + { + "epoch": 0.99, + "learning_rate": 1.0174362160692787e-09, + "loss": 0.0907, + "step": 51290 + }, + { + "epoch": 0.99, + "learning_rate": 1.0135528717331366e-09, + "loss": 0.0003, + "step": 51291 + }, + { + "epoch": 0.99, + "learning_rate": 1.0096695273969942e-09, + "loss": 0.0006, + "step": 51292 + }, + { + "epoch": 0.99, + "learning_rate": 1.005786183060852e-09, + "loss": 0.0157, + "step": 51293 + }, + { + "epoch": 0.99, + "learning_rate": 1.0019028387247097e-09, + "loss": 0.7158, + "step": 51294 + }, + { + "epoch": 1.0, + "learning_rate": 9.980194943885673e-10, + "loss": 0.0005, + "step": 51295 + }, + { + "epoch": 1.0, + "learning_rate": 9.941361500524251e-10, + "loss": 0.0032, + "step": 51296 + }, + { + "epoch": 1.0, + "learning_rate": 9.90252805716283e-10, + "loss": 0.0006, + "step": 51297 + }, + { + "epoch": 1.0, + "learning_rate": 9.863694613801406e-10, + "loss": 0.0003, + "step": 51298 + }, + { + "epoch": 1.0, + "learning_rate": 9.824861170439982e-10, + "loss": 0.4375, + "step": 51299 + }, + { + "epoch": 1.0, + "learning_rate": 9.78602772707856e-10, + "loss": 0.0004, + "step": 51300 + }, + { + "epoch": 1.0, + "learning_rate": 9.747194283717136e-10, + "loss": 0.002, + "step": 51301 + }, + { + "epoch": 1.0, + "learning_rate": 9.708360840355715e-10, + "loss": 0.0003, + "step": 51302 + }, + { + "epoch": 1.0, + "learning_rate": 9.66952739699429e-10, + "loss": 0.0005, + "step": 51303 + }, + { + "epoch": 1.0, + "learning_rate": 9.630693953632867e-10, + "loss": 0.0005, + "step": 51304 + }, + { + "epoch": 1.0, + "learning_rate": 9.591860510271446e-10, + "loss": 0.0003, + "step": 51305 + }, + { + "epoch": 1.0, + "learning_rate": 9.553027066910022e-10, + "loss": 0.0003, + "step": 51306 + }, + { + "epoch": 1.0, + "learning_rate": 9.5141936235486e-10, + "loss": 0.0007, + "step": 51307 + }, + { + "epoch": 1.0, + "learning_rate": 9.475360180187178e-10, + "loss": 0.0003, + "step": 51308 + }, + { + "epoch": 1.0, + "learning_rate": 9.436526736825753e-10, + "loss": 0.0003, + "step": 51309 + }, + { + "epoch": 1.0, + "learning_rate": 9.39769329346433e-10, + "loss": 0.0003, + "step": 51310 + }, + { + "epoch": 1.0, + "learning_rate": 9.35885985010291e-10, + "loss": 0.0003, + "step": 51311 + }, + { + "epoch": 1.0, + "learning_rate": 9.320026406741485e-10, + "loss": 0.0005, + "step": 51312 + }, + { + "epoch": 1.0, + "learning_rate": 9.281192963380062e-10, + "loss": 0.0003, + "step": 51313 + }, + { + "epoch": 1.0, + "learning_rate": 9.242359520018639e-10, + "loss": 0.0004, + "step": 51314 + }, + { + "epoch": 1.0, + "learning_rate": 9.203526076657216e-10, + "loss": 1.1065, + "step": 51315 + }, + { + "epoch": 1.0, + "learning_rate": 9.164692633295794e-10, + "loss": 0.0364, + "step": 51316 + }, + { + "epoch": 1.0, + "learning_rate": 9.125859189934372e-10, + "loss": 0.0004, + "step": 51317 + }, + { + "epoch": 1.0, + "learning_rate": 9.087025746572947e-10, + "loss": 0.0004, + "step": 51318 + }, + { + "epoch": 1.0, + "learning_rate": 9.048192303211525e-10, + "loss": 0.0005, + "step": 51319 + }, + { + "epoch": 1.0, + "learning_rate": 9.009358859850103e-10, + "loss": 0.0003, + "step": 51320 + }, + { + "epoch": 1.0, + "learning_rate": 8.97052541648868e-10, + "loss": 0.0004, + "step": 51321 + }, + { + "epoch": 1.0, + "learning_rate": 8.931691973127257e-10, + "loss": 0.0182, + "step": 51322 + }, + { + "epoch": 1.0, + "learning_rate": 8.892858529765833e-10, + "loss": 0.0003, + "step": 51323 + }, + { + "epoch": 1.0, + "learning_rate": 8.854025086404411e-10, + "loss": 0.0003, + "step": 51324 + }, + { + "epoch": 1.0, + "learning_rate": 8.815191643042988e-10, + "loss": 0.0003, + "step": 51325 + }, + { + "epoch": 1.0, + "learning_rate": 8.776358199681566e-10, + "loss": 0.0005, + "step": 51326 + }, + { + "epoch": 1.0, + "learning_rate": 8.737524756320143e-10, + "loss": 0.0004, + "step": 51327 + }, + { + "epoch": 1.0, + "learning_rate": 8.698691312958719e-10, + "loss": 0.0004, + "step": 51328 + }, + { + "epoch": 1.0, + "learning_rate": 8.659857869597297e-10, + "loss": 0.0003, + "step": 51329 + }, + { + "epoch": 1.0, + "learning_rate": 8.621024426235874e-10, + "loss": 0.8114, + "step": 51330 + }, + { + "epoch": 1.0, + "learning_rate": 8.582190982874452e-10, + "loss": 0.0005, + "step": 51331 + }, + { + "epoch": 1.0, + "learning_rate": 8.543357539513029e-10, + "loss": 0.0005, + "step": 51332 + }, + { + "epoch": 1.0, + "learning_rate": 8.504524096151605e-10, + "loss": 0.0002, + "step": 51333 + }, + { + "epoch": 1.0, + "learning_rate": 8.465690652790182e-10, + "loss": 0.0003, + "step": 51334 + }, + { + "epoch": 1.0, + "learning_rate": 8.42685720942876e-10, + "loss": 0.0003, + "step": 51335 + }, + { + "epoch": 1.0, + "learning_rate": 8.388023766067337e-10, + "loss": 0.0004, + "step": 51336 + }, + { + "epoch": 1.0, + "learning_rate": 8.349190322705915e-10, + "loss": 0.2063, + "step": 51337 + }, + { + "epoch": 1.0, + "learning_rate": 8.31035687934449e-10, + "loss": 0.0004, + "step": 51338 + }, + { + "epoch": 1.0, + "learning_rate": 8.271523435983068e-10, + "loss": 0.6245, + "step": 51339 + }, + { + "epoch": 1.0, + "learning_rate": 8.232689992621646e-10, + "loss": 0.0005, + "step": 51340 + }, + { + "epoch": 1.0, + "learning_rate": 8.193856549260223e-10, + "loss": 0.0004, + "step": 51341 + }, + { + "epoch": 1.0, + "learning_rate": 8.155023105898798e-10, + "loss": 0.0003, + "step": 51342 + }, + { + "epoch": 1.0, + "learning_rate": 8.116189662537377e-10, + "loss": 0.0004, + "step": 51343 + }, + { + "epoch": 1.0, + "learning_rate": 8.077356219175954e-10, + "loss": 0.0004, + "step": 51344 + }, + { + "epoch": 1.0, + "learning_rate": 8.038522775814531e-10, + "loss": 0.0003, + "step": 51345 + }, + { + "epoch": 1.0, + "learning_rate": 7.999689332453109e-10, + "loss": 0.0004, + "step": 51346 + }, + { + "epoch": 1.0, + "learning_rate": 7.960855889091685e-10, + "loss": 0.0003, + "step": 51347 + }, + { + "epoch": 1.0, + "learning_rate": 7.922022445730262e-10, + "loss": 0.0005, + "step": 51348 + }, + { + "epoch": 1.0, + "learning_rate": 7.883189002368839e-10, + "loss": 0.0006, + "step": 51349 + }, + { + "epoch": 1.0, + "learning_rate": 7.844355559007418e-10, + "loss": 0.0004, + "step": 51350 + }, + { + "epoch": 1.0, + "learning_rate": 7.805522115645994e-10, + "loss": 0.0025, + "step": 51351 + }, + { + "epoch": 1.0, + "learning_rate": 7.766688672284571e-10, + "loss": 0.0003, + "step": 51352 + }, + { + "epoch": 1.0, + "learning_rate": 7.727855228923148e-10, + "loss": 0.0014, + "step": 51353 + }, + { + "epoch": 1.0, + "learning_rate": 7.689021785561726e-10, + "loss": 0.0004, + "step": 51354 + }, + { + "epoch": 1.0, + "learning_rate": 7.650188342200303e-10, + "loss": 0.1059, + "step": 51355 + }, + { + "epoch": 1.0, + "learning_rate": 7.611354898838879e-10, + "loss": 0.5825, + "step": 51356 + }, + { + "epoch": 1.0, + "learning_rate": 7.572521455477458e-10, + "loss": 0.0003, + "step": 51357 + }, + { + "epoch": 1.0, + "learning_rate": 7.533688012116034e-10, + "loss": 0.0003, + "step": 51358 + }, + { + "epoch": 1.0, + "learning_rate": 7.494854568754611e-10, + "loss": 0.0003, + "step": 51359 + }, + { + "epoch": 1.0, + "learning_rate": 7.456021125393188e-10, + "loss": 0.0007, + "step": 51360 + }, + { + "epoch": 1.0, + "learning_rate": 7.417187682031766e-10, + "loss": 0.0004, + "step": 51361 + }, + { + "epoch": 1.0, + "learning_rate": 7.378354238670343e-10, + "loss": 0.0007, + "step": 51362 + }, + { + "epoch": 1.0, + "learning_rate": 7.339520795308919e-10, + "loss": 0.0021, + "step": 51363 + }, + { + "epoch": 1.0, + "learning_rate": 7.300687351947497e-10, + "loss": 0.0007, + "step": 51364 + }, + { + "epoch": 1.0, + "learning_rate": 7.261853908586074e-10, + "loss": 0.0002, + "step": 51365 + }, + { + "epoch": 1.0, + "learning_rate": 7.223020465224651e-10, + "loss": 0.0003, + "step": 51366 + }, + { + "epoch": 1.0, + "learning_rate": 7.184187021863228e-10, + "loss": 0.0008, + "step": 51367 + }, + { + "epoch": 1.0, + "learning_rate": 7.145353578501805e-10, + "loss": 0.0004, + "step": 51368 + }, + { + "epoch": 1.0, + "learning_rate": 7.106520135140383e-10, + "loss": 0.0005, + "step": 51369 + }, + { + "epoch": 1.0, + "learning_rate": 7.067686691778959e-10, + "loss": 0.0005, + "step": 51370 + }, + { + "epoch": 1.0, + "learning_rate": 7.028853248417537e-10, + "loss": 0.0003, + "step": 51371 + }, + { + "epoch": 1.0, + "learning_rate": 6.990019805056115e-10, + "loss": 0.0009, + "step": 51372 + }, + { + "epoch": 1.0, + "learning_rate": 6.951186361694691e-10, + "loss": 0.0004, + "step": 51373 + }, + { + "epoch": 1.0, + "learning_rate": 6.912352918333268e-10, + "loss": 0.0006, + "step": 51374 + }, + { + "epoch": 1.0, + "learning_rate": 6.873519474971845e-10, + "loss": 0.0005, + "step": 51375 + }, + { + "epoch": 1.0, + "learning_rate": 6.834686031610423e-10, + "loss": 0.0003, + "step": 51376 + }, + { + "epoch": 1.0, + "learning_rate": 6.795852588248999e-10, + "loss": 0.0006, + "step": 51377 + }, + { + "epoch": 1.0, + "learning_rate": 6.757019144887577e-10, + "loss": 0.0003, + "step": 51378 + }, + { + "epoch": 1.0, + "learning_rate": 6.718185701526154e-10, + "loss": 0.0004, + "step": 51379 + }, + { + "epoch": 1.0, + "learning_rate": 6.679352258164731e-10, + "loss": 0.0003, + "step": 51380 + }, + { + "epoch": 1.0, + "learning_rate": 6.640518814803309e-10, + "loss": 0.0003, + "step": 51381 + }, + { + "epoch": 1.0, + "learning_rate": 6.601685371441885e-10, + "loss": 0.0003, + "step": 51382 + }, + { + "epoch": 1.0, + "learning_rate": 6.562851928080463e-10, + "loss": 0.0237, + "step": 51383 + }, + { + "epoch": 1.0, + "learning_rate": 6.52401848471904e-10, + "loss": 0.0006, + "step": 51384 + }, + { + "epoch": 1.0, + "learning_rate": 6.485185041357617e-10, + "loss": 0.0003, + "step": 51385 + }, + { + "epoch": 1.0, + "learning_rate": 6.446351597996194e-10, + "loss": 0.0002, + "step": 51386 + }, + { + "epoch": 1.0, + "learning_rate": 6.407518154634771e-10, + "loss": 0.002, + "step": 51387 + }, + { + "epoch": 1.0, + "learning_rate": 6.368684711273349e-10, + "loss": 0.0006, + "step": 51388 + }, + { + "epoch": 1.0, + "learning_rate": 6.329851267911925e-10, + "loss": 0.0003, + "step": 51389 + }, + { + "epoch": 1.0, + "learning_rate": 6.291017824550502e-10, + "loss": 0.0004, + "step": 51390 + }, + { + "epoch": 1.0, + "learning_rate": 6.25218438118908e-10, + "loss": 0.0003, + "step": 51391 + }, + { + "epoch": 1.0, + "learning_rate": 6.213350937827657e-10, + "loss": 0.0003, + "step": 51392 + }, + { + "epoch": 1.0, + "learning_rate": 6.174517494466234e-10, + "loss": 0.0003, + "step": 51393 + }, + { + "epoch": 1.0, + "learning_rate": 6.13568405110481e-10, + "loss": 0.0005, + "step": 51394 + }, + { + "epoch": 1.0, + "learning_rate": 6.096850607743389e-10, + "loss": 0.025, + "step": 51395 + }, + { + "epoch": 1.0, + "learning_rate": 6.058017164381966e-10, + "loss": 0.0008, + "step": 51396 + }, + { + "epoch": 1.0, + "learning_rate": 6.019183721020542e-10, + "loss": 1.1585, + "step": 51397 + }, + { + "epoch": 1.0, + "learning_rate": 5.98035027765912e-10, + "loss": 0.0003, + "step": 51398 + }, + { + "epoch": 1.0, + "learning_rate": 5.941516834297697e-10, + "loss": 0.0025, + "step": 51399 + }, + { + "epoch": 1.0, + "learning_rate": 5.902683390936274e-10, + "loss": 0.0004, + "step": 51400 + }, + { + "epoch": 1.0, + "learning_rate": 5.863849947574851e-10, + "loss": 0.0004, + "step": 51401 + }, + { + "epoch": 1.0, + "learning_rate": 5.825016504213429e-10, + "loss": 0.0032, + "step": 51402 + }, + { + "epoch": 1.0, + "learning_rate": 5.786183060852006e-10, + "loss": 0.0004, + "step": 51403 + }, + { + "epoch": 1.0, + "learning_rate": 5.747349617490582e-10, + "loss": 0.0004, + "step": 51404 + }, + { + "epoch": 1.0, + "learning_rate": 5.708516174129159e-10, + "loss": 0.0004, + "step": 51405 + }, + { + "epoch": 1.0, + "learning_rate": 5.669682730767737e-10, + "loss": 0.0004, + "step": 51406 + }, + { + "epoch": 1.0, + "learning_rate": 5.630849287406314e-10, + "loss": 0.6539, + "step": 51407 + }, + { + "epoch": 1.0, + "learning_rate": 5.592015844044891e-10, + "loss": 0.0006, + "step": 51408 + }, + { + "epoch": 1.0, + "learning_rate": 5.553182400683469e-10, + "loss": 0.0004, + "step": 51409 + }, + { + "epoch": 1.0, + "learning_rate": 5.514348957322046e-10, + "loss": 0.0005, + "step": 51410 + }, + { + "epoch": 1.0, + "learning_rate": 5.475515513960622e-10, + "loss": 0.0004, + "step": 51411 + }, + { + "epoch": 1.0, + "learning_rate": 5.4366820705992e-10, + "loss": 0.0014, + "step": 51412 + }, + { + "epoch": 1.0, + "learning_rate": 5.397848627237778e-10, + "loss": 0.0008, + "step": 51413 + }, + { + "epoch": 1.0, + "learning_rate": 5.359015183876354e-10, + "loss": 0.0301, + "step": 51414 + }, + { + "epoch": 1.0, + "learning_rate": 5.320181740514931e-10, + "loss": 0.0004, + "step": 51415 + }, + { + "epoch": 1.0, + "learning_rate": 5.281348297153508e-10, + "loss": 0.0003, + "step": 51416 + }, + { + "epoch": 1.0, + "learning_rate": 5.242514853792086e-10, + "loss": 0.0006, + "step": 51417 + }, + { + "epoch": 1.0, + "learning_rate": 5.203681410430662e-10, + "loss": 0.0003, + "step": 51418 + }, + { + "epoch": 1.0, + "learning_rate": 5.16484796706924e-10, + "loss": 0.0004, + "step": 51419 + }, + { + "epoch": 1.0, + "learning_rate": 5.126014523707817e-10, + "loss": 1.2416, + "step": 51420 + }, + { + "epoch": 1.0, + "learning_rate": 5.087181080346394e-10, + "loss": 0.0003, + "step": 51421 + }, + { + "epoch": 1.0, + "learning_rate": 5.048347636984971e-10, + "loss": 0.3944, + "step": 51422 + }, + { + "epoch": 1.0, + "learning_rate": 5.009514193623548e-10, + "loss": 0.0003, + "step": 51423 + }, + { + "epoch": 1.0, + "learning_rate": 4.970680750262126e-10, + "loss": 0.0007, + "step": 51424 + }, + { + "epoch": 1.0, + "learning_rate": 4.931847306900703e-10, + "loss": 0.0003, + "step": 51425 + }, + { + "epoch": 1.0, + "learning_rate": 4.89301386353928e-10, + "loss": 0.0005, + "step": 51426 + }, + { + "epoch": 1.0, + "learning_rate": 4.854180420177857e-10, + "loss": 0.0003, + "step": 51427 + }, + { + "epoch": 1.0, + "learning_rate": 4.815346976816434e-10, + "loss": 0.6588, + "step": 51428 + }, + { + "epoch": 1.0, + "learning_rate": 4.776513533455011e-10, + "loss": 0.0004, + "step": 51429 + }, + { + "epoch": 1.0, + "learning_rate": 4.737680090093589e-10, + "loss": 0.0003, + "step": 51430 + }, + { + "epoch": 1.0, + "learning_rate": 4.698846646732165e-10, + "loss": 0.0005, + "step": 51431 + }, + { + "epoch": 1.0, + "learning_rate": 4.660013203370743e-10, + "loss": 0.0003, + "step": 51432 + }, + { + "epoch": 1.0, + "learning_rate": 4.6211797600093195e-10, + "loss": 0.0004, + "step": 51433 + }, + { + "epoch": 1.0, + "learning_rate": 4.582346316647897e-10, + "loss": 0.0003, + "step": 51434 + }, + { + "epoch": 1.0, + "learning_rate": 4.5435128732864735e-10, + "loss": 0.0003, + "step": 51435 + }, + { + "epoch": 1.0, + "learning_rate": 4.5046794299250513e-10, + "loss": 0.0008, + "step": 51436 + }, + { + "epoch": 1.0, + "learning_rate": 4.4658459865636286e-10, + "loss": 0.0004, + "step": 51437 + }, + { + "epoch": 1.0, + "learning_rate": 4.4270125432022053e-10, + "loss": 0.0004, + "step": 51438 + }, + { + "epoch": 1.0, + "learning_rate": 4.388179099840783e-10, + "loss": 0.0004, + "step": 51439 + }, + { + "epoch": 1.0, + "learning_rate": 4.3493456564793593e-10, + "loss": 0.0004, + "step": 51440 + }, + { + "epoch": 1.0, + "learning_rate": 4.310512213117937e-10, + "loss": 0.0006, + "step": 51441 + }, + { + "epoch": 1.0, + "learning_rate": 4.2716787697565144e-10, + "loss": 0.0003, + "step": 51442 + }, + { + "epoch": 1.0, + "learning_rate": 4.232845326395091e-10, + "loss": 0.0003, + "step": 51443 + }, + { + "epoch": 1.0, + "learning_rate": 4.1940118830336684e-10, + "loss": 0.0004, + "step": 51444 + }, + { + "epoch": 1.0, + "learning_rate": 4.155178439672245e-10, + "loss": 0.003, + "step": 51445 + }, + { + "epoch": 1.0, + "learning_rate": 4.116344996310823e-10, + "loss": 0.8747, + "step": 51446 + }, + { + "epoch": 1.0, + "learning_rate": 4.077511552949399e-10, + "loss": 0.0005, + "step": 51447 + }, + { + "epoch": 1.0, + "learning_rate": 4.038678109587977e-10, + "loss": 0.0004, + "step": 51448 + }, + { + "epoch": 1.0, + "learning_rate": 3.9998446662265543e-10, + "loss": 0.0008, + "step": 51449 + }, + { + "epoch": 1.0, + "learning_rate": 3.961011222865131e-10, + "loss": 0.0003, + "step": 51450 + }, + { + "epoch": 1.0, + "learning_rate": 3.922177779503709e-10, + "loss": 0.0007, + "step": 51451 + }, + { + "epoch": 1.0, + "learning_rate": 3.8833443361422856e-10, + "loss": 0.0003, + "step": 51452 + }, + { + "epoch": 1.0, + "learning_rate": 3.844510892780863e-10, + "loss": 0.0004, + "step": 51453 + }, + { + "epoch": 1.0, + "learning_rate": 3.8056774494194396e-10, + "loss": 0.0005, + "step": 51454 + }, + { + "epoch": 1.0, + "learning_rate": 3.766844006058017e-10, + "loss": 0.0004, + "step": 51455 + }, + { + "epoch": 1.0, + "learning_rate": 3.728010562696594e-10, + "loss": 0.0003, + "step": 51456 + }, + { + "epoch": 1.0, + "learning_rate": 3.6891771193351714e-10, + "loss": 0.0003, + "step": 51457 + }, + { + "epoch": 1.0, + "learning_rate": 3.6503436759737487e-10, + "loss": 0.0209, + "step": 51458 + }, + { + "epoch": 1.0, + "learning_rate": 3.6115102326123255e-10, + "loss": 0.0004, + "step": 51459 + }, + { + "epoch": 1.0, + "learning_rate": 3.5726767892509027e-10, + "loss": 0.0004, + "step": 51460 + }, + { + "epoch": 1.0, + "learning_rate": 3.5338433458894795e-10, + "loss": 0.0005, + "step": 51461 + }, + { + "epoch": 1.0, + "learning_rate": 3.4950099025280573e-10, + "loss": 0.0004, + "step": 51462 + }, + { + "epoch": 1.0, + "learning_rate": 3.456176459166634e-10, + "loss": 0.0004, + "step": 51463 + }, + { + "epoch": 1.0, + "learning_rate": 3.4173430158052113e-10, + "loss": 0.0759, + "step": 51464 + }, + { + "epoch": 1.0, + "learning_rate": 3.3785095724437886e-10, + "loss": 0.0003, + "step": 51465 + }, + { + "epoch": 1.0, + "learning_rate": 3.3396761290823653e-10, + "loss": 0.0004, + "step": 51466 + }, + { + "epoch": 1.0, + "learning_rate": 3.3008426857209426e-10, + "loss": 0.0004, + "step": 51467 + }, + { + "epoch": 1.0, + "learning_rate": 3.26200924235952e-10, + "loss": 0.0003, + "step": 51468 + }, + { + "epoch": 1.0, + "learning_rate": 3.223175798998097e-10, + "loss": 0.0004, + "step": 51469 + }, + { + "epoch": 1.0, + "learning_rate": 3.1843423556366744e-10, + "loss": 0.0004, + "step": 51470 + }, + { + "epoch": 1.0, + "learning_rate": 3.145508912275251e-10, + "loss": 0.0003, + "step": 51471 + }, + { + "epoch": 1.0, + "learning_rate": 3.1066754689138285e-10, + "loss": 0.0004, + "step": 51472 + }, + { + "epoch": 1.0, + "learning_rate": 3.067842025552405e-10, + "loss": 0.6723, + "step": 51473 + }, + { + "epoch": 1.0, + "learning_rate": 3.029008582190983e-10, + "loss": 0.0208, + "step": 51474 + }, + { + "epoch": 1.0, + "learning_rate": 2.99017513882956e-10, + "loss": 0.0003, + "step": 51475 + }, + { + "epoch": 1.0, + "learning_rate": 2.951341695468137e-10, + "loss": 0.0004, + "step": 51476 + }, + { + "epoch": 1.0, + "learning_rate": 2.9125082521067143e-10, + "loss": 0.6062, + "step": 51477 + }, + { + "epoch": 1.0, + "learning_rate": 2.873674808745291e-10, + "loss": 0.0005, + "step": 51478 + }, + { + "epoch": 1.0, + "learning_rate": 2.8348413653838683e-10, + "loss": 0.0004, + "step": 51479 + }, + { + "epoch": 1.0, + "learning_rate": 2.7960079220224456e-10, + "loss": 0.7166, + "step": 51480 + }, + { + "epoch": 1.0, + "learning_rate": 2.757174478661023e-10, + "loss": 0.0051, + "step": 51481 + }, + { + "epoch": 1.0, + "learning_rate": 2.7183410352996e-10, + "loss": 0.0004, + "step": 51482 + }, + { + "epoch": 1.0, + "learning_rate": 2.679507591938177e-10, + "loss": 1.1116, + "step": 51483 + }, + { + "epoch": 1.0, + "learning_rate": 2.640674148576754e-10, + "loss": 0.0009, + "step": 51484 + }, + { + "epoch": 1.0, + "learning_rate": 2.601840705215331e-10, + "loss": 0.5882, + "step": 51485 + }, + { + "epoch": 1.0, + "learning_rate": 2.563007261853909e-10, + "loss": 0.0004, + "step": 51486 + }, + { + "epoch": 1.0, + "learning_rate": 2.5241738184924855e-10, + "loss": 0.0003, + "step": 51487 + }, + { + "epoch": 1.0, + "learning_rate": 2.485340375131063e-10, + "loss": 0.0003, + "step": 51488 + }, + { + "epoch": 1.0, + "learning_rate": 2.44650693176964e-10, + "loss": 0.0003, + "step": 51489 + }, + { + "epoch": 1.0, + "learning_rate": 2.407673488408217e-10, + "loss": 0.0004, + "step": 51490 + }, + { + "epoch": 1.0, + "learning_rate": 2.3688400450467946e-10, + "loss": 0.0006, + "step": 51491 + }, + { + "epoch": 1.0, + "learning_rate": 2.3300066016853714e-10, + "loss": 0.0009, + "step": 51492 + }, + { + "epoch": 1.0, + "learning_rate": 2.2911731583239486e-10, + "loss": 0.0005, + "step": 51493 + }, + { + "epoch": 1.0, + "learning_rate": 2.2523397149625256e-10, + "loss": 0.0004, + "step": 51494 + }, + { + "epoch": 1.0, + "learning_rate": 2.2135062716011027e-10, + "loss": 0.0002, + "step": 51495 + }, + { + "epoch": 1.0, + "learning_rate": 2.1746728282396797e-10, + "loss": 0.0002, + "step": 51496 + }, + { + "epoch": 1.0, + "learning_rate": 2.1358393848782572e-10, + "loss": 0.0004, + "step": 51497 + }, + { + "epoch": 1.0, + "learning_rate": 2.0970059415168342e-10, + "loss": 0.001, + "step": 51498 + }, + { + "epoch": 1.0, + "learning_rate": 2.0581724981554115e-10, + "loss": 0.0004, + "step": 51499 + }, + { + "epoch": 1.0, + "learning_rate": 2.0193390547939885e-10, + "loss": 0.0004, + "step": 51500 + }, + { + "epoch": 1.0, + "learning_rate": 1.9805056114325655e-10, + "loss": 0.4005, + "step": 51501 + }, + { + "epoch": 1.0, + "learning_rate": 1.9416721680711428e-10, + "loss": 0.0004, + "step": 51502 + }, + { + "epoch": 1.0, + "learning_rate": 1.9028387247097198e-10, + "loss": 0.0003, + "step": 51503 + }, + { + "epoch": 1.0, + "learning_rate": 1.864005281348297e-10, + "loss": 0.0011, + "step": 51504 + }, + { + "epoch": 1.0, + "learning_rate": 1.8251718379868744e-10, + "loss": 0.0003, + "step": 51505 + }, + { + "epoch": 1.0, + "learning_rate": 1.7863383946254514e-10, + "loss": 0.0005, + "step": 51506 + }, + { + "epoch": 1.0, + "learning_rate": 1.7475049512640286e-10, + "loss": 0.209, + "step": 51507 + }, + { + "epoch": 1.0, + "learning_rate": 1.7086715079026057e-10, + "loss": 0.0003, + "step": 51508 + }, + { + "epoch": 1.0, + "learning_rate": 1.6698380645411827e-10, + "loss": 0.0003, + "step": 51509 + }, + { + "epoch": 1.0, + "learning_rate": 1.63100462117976e-10, + "loss": 0.0256, + "step": 51510 + }, + { + "epoch": 1.0, + "learning_rate": 1.5921711778183372e-10, + "loss": 0.0006, + "step": 51511 + }, + { + "epoch": 1.0, + "learning_rate": 1.5533377344569142e-10, + "loss": 0.0004, + "step": 51512 + }, + { + "epoch": 1.0, + "learning_rate": 1.5145042910954915e-10, + "loss": 0.0011, + "step": 51513 + }, + { + "epoch": 1.0, + "learning_rate": 1.4756708477340685e-10, + "loss": 0.0004, + "step": 51514 + }, + { + "epoch": 1.0, + "learning_rate": 1.4368374043726455e-10, + "loss": 0.0009, + "step": 51515 + }, + { + "epoch": 1.0, + "learning_rate": 1.3980039610112228e-10, + "loss": 0.0005, + "step": 51516 + }, + { + "epoch": 1.0, + "learning_rate": 1.3591705176498e-10, + "loss": 0.0004, + "step": 51517 + }, + { + "epoch": 1.0, + "learning_rate": 1.320337074288377e-10, + "loss": 0.0004, + "step": 51518 + }, + { + "epoch": 1.0, + "learning_rate": 1.2815036309269544e-10, + "loss": 0.0003, + "step": 51519 + }, + { + "epoch": 1.0, + "learning_rate": 1.2426701875655314e-10, + "loss": 0.3211, + "step": 51520 + }, + { + "epoch": 1.0, + "learning_rate": 1.2038367442041084e-10, + "loss": 0.0003, + "step": 51521 + }, + { + "epoch": 1.0, + "learning_rate": 1.1650033008426857e-10, + "loss": 0.0005, + "step": 51522 + }, + { + "epoch": 1.0, + "learning_rate": 1.1261698574812628e-10, + "loss": 0.0004, + "step": 51523 + }, + { + "epoch": 1.0, + "learning_rate": 1.0873364141198398e-10, + "loss": 0.0003, + "step": 51524 + }, + { + "epoch": 1.0, + "learning_rate": 1.0485029707584171e-10, + "loss": 0.0016, + "step": 51525 + }, + { + "epoch": 1.0, + "learning_rate": 1.0096695273969943e-10, + "loss": 0.0005, + "step": 51526 + }, + { + "epoch": 1.0, + "learning_rate": 9.708360840355714e-11, + "loss": 0.0005, + "step": 51527 + }, + { + "epoch": 1.0, + "learning_rate": 9.320026406741485e-11, + "loss": 0.0004, + "step": 51528 + }, + { + "epoch": 1.0, + "learning_rate": 8.931691973127257e-11, + "loss": 0.0068, + "step": 51529 + }, + { + "epoch": 1.0, + "learning_rate": 8.543357539513028e-11, + "loss": 0.0003, + "step": 51530 + }, + { + "epoch": 1.0, + "learning_rate": 8.1550231058988e-11, + "loss": 0.0004, + "step": 51531 + }, + { + "epoch": 1.0, + "learning_rate": 7.766688672284571e-11, + "loss": 0.0004, + "step": 51532 + }, + { + "epoch": 1.0, + "learning_rate": 7.378354238670343e-11, + "loss": 0.0003, + "step": 51533 + }, + { + "epoch": 1.0, + "learning_rate": 6.990019805056114e-11, + "loss": 0.0004, + "step": 51534 + }, + { + "epoch": 1.0, + "learning_rate": 6.601685371441885e-11, + "loss": 0.0004, + "step": 51535 + }, + { + "epoch": 1.0, + "learning_rate": 6.213350937827657e-11, + "loss": 0.024, + "step": 51536 + }, + { + "epoch": 1.0, + "learning_rate": 5.825016504213428e-11, + "loss": 0.0003, + "step": 51537 + }, + { + "epoch": 1.0, + "learning_rate": 5.436682070599199e-11, + "loss": 0.0007, + "step": 51538 + }, + { + "epoch": 1.0, + "learning_rate": 5.048347636984971e-11, + "loss": 0.0005, + "step": 51539 + }, + { + "epoch": 1.0, + "learning_rate": 4.660013203370743e-11, + "loss": 0.0002, + "step": 51540 + }, + { + "epoch": 1.0, + "learning_rate": 4.271678769756514e-11, + "loss": 0.0003, + "step": 51541 + }, + { + "epoch": 1.0, + "learning_rate": 3.8833443361422856e-11, + "loss": 0.0003, + "step": 51542 + }, + { + "epoch": 1.0, + "learning_rate": 3.495009902528057e-11, + "loss": 0.0005, + "step": 51543 + }, + { + "epoch": 1.0, + "learning_rate": 3.1066754689138285e-11, + "loss": 0.0002, + "step": 51544 + }, + { + "epoch": 1.0, + "learning_rate": 2.7183410352995996e-11, + "loss": 0.0003, + "step": 51545 + }, + { + "epoch": 1.0, + "learning_rate": 2.3300066016853714e-11, + "loss": 0.0003, + "step": 51546 + }, + { + "epoch": 1.0, + "learning_rate": 1.9416721680711428e-11, + "loss": 0.0003, + "step": 51547 + }, + { + "epoch": 1.0, + "learning_rate": 1.5533377344569142e-11, + "loss": 0.0003, + "step": 51548 + }, + { + "epoch": 1.0, + "learning_rate": 1.1650033008426857e-11, + "loss": 0.0005, + "step": 51549 + }, + { + "epoch": 1.0, + "learning_rate": 7.766688672284571e-12, + "loss": 0.0009, + "step": 51550 + }, + { + "epoch": 1.0, + "learning_rate": 3.8833443361422856e-12, + "loss": 0.0004, + "step": 51551 + }, + { + "epoch": 1.0, + "learning_rate": 0.0, + "loss": 0.0003, + "step": 51552 + }, + { + "epoch": 1.0, + "eval_accuracy": 0.9822800279329609, + "eval_loss": 0.07964583486318588, + "eval_runtime": 448.4873, + "eval_samples_per_second": 102.175, + "eval_steps_per_second": 1.596, + "step": 51552 + } + ], + "logging_steps": 1, + "max_steps": 51552, + "num_train_epochs": 1, + "save_steps": 500, + "total_flos": 5.446815816909379e+16, + "trial_name": null, + "trial_params": null +}