diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,173240 @@ +{ + "best_metric": 0.5751461982727051, + "best_model_checkpoint": "clean_output/checkpoint-28860", + "epoch": 0.9999913381666363, + "eval_steps": 5772, + "global_step": 28862, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 2.0000000000000003e-06, + "loss": 1.1039, + "step": 1 + }, + { + "epoch": 0.0, + "learning_rate": 4.000000000000001e-06, + "loss": 1.059, + "step": 2 + }, + { + "epoch": 0.0, + "learning_rate": 6e-06, + "loss": 1.0878, + "step": 3 + }, + { + "epoch": 0.0, + "learning_rate": 8.000000000000001e-06, + "loss": 1.0608, + "step": 4 + }, + { + "epoch": 0.0, + "learning_rate": 1e-05, + "loss": 1.0106, + "step": 5 + }, + { + "epoch": 0.0, + "learning_rate": 1.2e-05, + "loss": 0.9002, + "step": 6 + }, + { + "epoch": 0.0, + "learning_rate": 1.4e-05, + "loss": 0.8761, + "step": 7 + }, + { + "epoch": 0.0, + "learning_rate": 1.6000000000000003e-05, + "loss": 0.8031, + "step": 8 + }, + { + "epoch": 0.0, + "learning_rate": 1.8e-05, + "loss": 0.7787, + "step": 9 + }, + { + "epoch": 0.0, + "learning_rate": 2e-05, + "loss": 0.7707, + "step": 10 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999999940718676e-05, + "loss": 0.7745, + "step": 11 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999999762874704e-05, + "loss": 0.7176, + "step": 12 + }, + { + "epoch": 0.0, + "learning_rate": 1.999999946646808e-05, + "loss": 0.7355, + "step": 13 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999999051498816e-05, + "loss": 0.7355, + "step": 14 + }, + { + "epoch": 0.0, + "learning_rate": 1.999999851796691e-05, + "loss": 0.7445, + "step": 15 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999997865872376e-05, + "loss": 0.7311, + "step": 16 + }, + { + "epoch": 0.0, + "learning_rate": 1.999999709521521e-05, + "loss": 0.7301, + "step": 17 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999996205995435e-05, + "loss": 0.7276, + "step": 18 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999995198213053e-05, + "loss": 0.7548, + "step": 19 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999994071868078e-05, + "loss": 0.695, + "step": 20 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999992826960523e-05, + "loss": 0.6671, + "step": 21 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999991463490405e-05, + "loss": 0.7124, + "step": 22 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999989981457735e-05, + "loss": 0.7277, + "step": 23 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999988380862533e-05, + "loss": 0.7145, + "step": 24 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999986661704822e-05, + "loss": 0.6726, + "step": 25 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999984823984616e-05, + "loss": 0.6888, + "step": 26 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999982867701943e-05, + "loss": 0.7278, + "step": 27 + }, + { + "epoch": 0.0, + "learning_rate": 1.999998079285682e-05, + "loss": 0.6938, + "step": 28 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999978599449277e-05, + "loss": 0.6874, + "step": 29 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999976287479336e-05, + "loss": 0.7285, + "step": 30 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999973856947025e-05, + "loss": 0.6764, + "step": 31 + }, + { + "epoch": 0.0, + "learning_rate": 1.999997130785238e-05, + "loss": 0.7189, + "step": 32 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999968640195417e-05, + "loss": 0.6773, + "step": 33 + }, + { + "epoch": 0.0, + "learning_rate": 1.999996585397618e-05, + "loss": 0.7218, + "step": 34 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999962949194697e-05, + "loss": 0.6938, + "step": 35 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999959925851006e-05, + "loss": 0.656, + "step": 36 + }, + { + "epoch": 0.0, + "learning_rate": 1.999995678394514e-05, + "loss": 0.7196, + "step": 37 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999953523477132e-05, + "loss": 0.7177, + "step": 38 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999950144447027e-05, + "loss": 0.7175, + "step": 39 + }, + { + "epoch": 0.0, + "learning_rate": 1.999994664685486e-05, + "loss": 0.6418, + "step": 40 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999943030700678e-05, + "loss": 0.6706, + "step": 41 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999939295984525e-05, + "loss": 0.7355, + "step": 42 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999935442706436e-05, + "loss": 0.7043, + "step": 43 + }, + { + "epoch": 0.0, + "learning_rate": 1.999993147086647e-05, + "loss": 0.7332, + "step": 44 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999927380464657e-05, + "loss": 0.6892, + "step": 45 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999923171501062e-05, + "loss": 0.7006, + "step": 46 + }, + { + "epoch": 0.0, + "learning_rate": 1.999991884397572e-05, + "loss": 0.7, + "step": 47 + }, + { + "epoch": 0.0, + "learning_rate": 1.99999143978887e-05, + "loss": 0.7009, + "step": 48 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999909833240038e-05, + "loss": 0.7425, + "step": 49 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999905150029798e-05, + "loss": 0.6946, + "step": 50 + }, + { + "epoch": 0.0, + "learning_rate": 1.999990034825803e-05, + "loss": 0.7225, + "step": 51 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999895427924797e-05, + "loss": 0.72, + "step": 52 + }, + { + "epoch": 0.0, + "learning_rate": 1.999989038903015e-05, + "loss": 0.7409, + "step": 53 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999885231574153e-05, + "loss": 0.6759, + "step": 54 + }, + { + "epoch": 0.0, + "learning_rate": 1.999987995555687e-05, + "loss": 0.6848, + "step": 55 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999874560978358e-05, + "loss": 0.6368, + "step": 56 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999869047838683e-05, + "loss": 0.6673, + "step": 57 + }, + { + "epoch": 0.0, + "learning_rate": 1.999986341613791e-05, + "loss": 0.6344, + "step": 58 + }, + { + "epoch": 0.0, + "learning_rate": 1.999985766587611e-05, + "loss": 0.7001, + "step": 59 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999851797053345e-05, + "loss": 0.6998, + "step": 60 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999845809669685e-05, + "loss": 0.67, + "step": 61 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999839703725206e-05, + "loss": 0.6732, + "step": 62 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999833479219974e-05, + "loss": 0.6711, + "step": 63 + }, + { + "epoch": 0.0, + "learning_rate": 1.999982713615407e-05, + "loss": 0.6905, + "step": 64 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999820674527565e-05, + "loss": 0.7061, + "step": 65 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999814094340534e-05, + "loss": 0.6912, + "step": 66 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999807395593057e-05, + "loss": 0.7137, + "step": 67 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999800578285217e-05, + "loss": 0.741, + "step": 68 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999793642417087e-05, + "loss": 0.6492, + "step": 69 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999786587988757e-05, + "loss": 0.6843, + "step": 70 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999779415000303e-05, + "loss": 0.6669, + "step": 71 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999772123451818e-05, + "loss": 0.6905, + "step": 72 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999764713343382e-05, + "loss": 0.725, + "step": 73 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999757184675087e-05, + "loss": 0.6838, + "step": 74 + }, + { + "epoch": 0.0, + "learning_rate": 1.999974953744702e-05, + "loss": 0.6803, + "step": 75 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999741771659276e-05, + "loss": 0.6766, + "step": 76 + }, + { + "epoch": 0.0, + "learning_rate": 1.999973388731194e-05, + "loss": 0.6656, + "step": 77 + }, + { + "epoch": 0.0, + "learning_rate": 1.999972588440511e-05, + "loss": 0.6682, + "step": 78 + }, + { + "epoch": 0.0, + "learning_rate": 1.999971776293888e-05, + "loss": 0.6963, + "step": 79 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999709522913346e-05, + "loss": 0.6526, + "step": 80 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999701164328607e-05, + "loss": 0.6638, + "step": 81 + }, + { + "epoch": 0.0, + "learning_rate": 1.999969268718476e-05, + "loss": 0.6587, + "step": 82 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999684091481907e-05, + "loss": 0.6862, + "step": 83 + }, + { + "epoch": 0.0, + "learning_rate": 1.999967537722015e-05, + "loss": 0.6593, + "step": 84 + }, + { + "epoch": 0.0, + "learning_rate": 1.999966654439959e-05, + "loss": 0.6967, + "step": 85 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999657593020333e-05, + "loss": 0.7101, + "step": 86 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999648523082488e-05, + "loss": 0.6885, + "step": 87 + }, + { + "epoch": 0.0, + "learning_rate": 1.999963933458616e-05, + "loss": 0.6838, + "step": 88 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999630027531457e-05, + "loss": 0.7213, + "step": 89 + }, + { + "epoch": 0.0, + "learning_rate": 1.999962060191849e-05, + "loss": 0.695, + "step": 90 + }, + { + "epoch": 0.0, + "learning_rate": 1.999961105774737e-05, + "loss": 0.6578, + "step": 91 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999601395018216e-05, + "loss": 0.6334, + "step": 92 + }, + { + "epoch": 0.0, + "learning_rate": 1.999959161373113e-05, + "loss": 0.7443, + "step": 93 + }, + { + "epoch": 0.0, + "learning_rate": 1.999958171388624e-05, + "loss": 0.6855, + "step": 94 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999571695483664e-05, + "loss": 0.6794, + "step": 95 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999561558523514e-05, + "loss": 0.6686, + "step": 96 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999551303005908e-05, + "loss": 0.6625, + "step": 97 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999540928930974e-05, + "loss": 0.6574, + "step": 98 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999530436298834e-05, + "loss": 0.5893, + "step": 99 + }, + { + "epoch": 0.0, + "learning_rate": 1.999951982510961e-05, + "loss": 0.6895, + "step": 100 + }, + { + "epoch": 0.0, + "learning_rate": 1.999950909536343e-05, + "loss": 0.6567, + "step": 101 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999498247060417e-05, + "loss": 0.659, + "step": 102 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999487280200703e-05, + "loss": 0.6648, + "step": 103 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999476194784423e-05, + "loss": 0.7062, + "step": 104 + }, + { + "epoch": 0.0, + "learning_rate": 1.99994649908117e-05, + "loss": 0.6743, + "step": 105 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999453668282668e-05, + "loss": 0.657, + "step": 106 + }, + { + "epoch": 0.0, + "learning_rate": 1.999944222719747e-05, + "loss": 0.7071, + "step": 107 + }, + { + "epoch": 0.0, + "learning_rate": 1.999943066755623e-05, + "loss": 0.6972, + "step": 108 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999418989359093e-05, + "loss": 0.6402, + "step": 109 + }, + { + "epoch": 0.0, + "learning_rate": 1.999940719260619e-05, + "loss": 0.6965, + "step": 110 + }, + { + "epoch": 0.0, + "learning_rate": 1.999939527729767e-05, + "loss": 0.6946, + "step": 111 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999383243433665e-05, + "loss": 0.6989, + "step": 112 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999371091014325e-05, + "loss": 0.7167, + "step": 113 + }, + { + "epoch": 0.0, + "learning_rate": 1.999935882003979e-05, + "loss": 0.715, + "step": 114 + }, + { + "epoch": 0.0, + "learning_rate": 1.999934643051021e-05, + "loss": 0.6478, + "step": 115 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999333922425727e-05, + "loss": 0.6596, + "step": 116 + }, + { + "epoch": 0.0, + "learning_rate": 1.999932129578649e-05, + "loss": 0.7149, + "step": 117 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999308550592655e-05, + "loss": 0.6807, + "step": 118 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999295686844363e-05, + "loss": 0.6778, + "step": 119 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999282704541772e-05, + "loss": 0.6956, + "step": 120 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999269603685035e-05, + "loss": 0.6992, + "step": 121 + }, + { + "epoch": 0.0, + "learning_rate": 1.999925638427431e-05, + "loss": 0.6458, + "step": 122 + }, + { + "epoch": 0.0, + "learning_rate": 1.999924304630975e-05, + "loss": 0.6654, + "step": 123 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999229589791517e-05, + "loss": 0.6751, + "step": 124 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999216014719766e-05, + "loss": 0.6912, + "step": 125 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999202321094658e-05, + "loss": 0.6785, + "step": 126 + }, + { + "epoch": 0.0, + "learning_rate": 1.999918850891636e-05, + "loss": 0.6706, + "step": 127 + }, + { + "epoch": 0.0, + "learning_rate": 1.999917457818503e-05, + "loss": 0.6205, + "step": 128 + }, + { + "epoch": 0.0, + "learning_rate": 1.999916052890084e-05, + "loss": 0.7155, + "step": 129 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999146361063954e-05, + "loss": 0.6338, + "step": 130 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999132074674534e-05, + "loss": 0.7315, + "step": 131 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999117669732756e-05, + "loss": 0.7305, + "step": 132 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999103146238793e-05, + "loss": 0.6543, + "step": 133 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999088504192808e-05, + "loss": 0.6456, + "step": 134 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999073743594984e-05, + "loss": 0.6311, + "step": 135 + }, + { + "epoch": 0.0, + "learning_rate": 1.999905886444549e-05, + "loss": 0.6616, + "step": 136 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999043866744502e-05, + "loss": 0.684, + "step": 137 + }, + { + "epoch": 0.0, + "learning_rate": 1.9999028750492204e-05, + "loss": 0.6658, + "step": 138 + }, + { + "epoch": 0.0, + "learning_rate": 1.999901351568877e-05, + "loss": 0.7399, + "step": 139 + }, + { + "epoch": 0.0, + "learning_rate": 1.9998998162334383e-05, + "loss": 0.6358, + "step": 140 + }, + { + "epoch": 0.0, + "learning_rate": 1.9998982690429224e-05, + "loss": 0.7194, + "step": 141 + }, + { + "epoch": 0.0, + "learning_rate": 1.9998967099973475e-05, + "loss": 0.6876, + "step": 142 + }, + { + "epoch": 0.0, + "learning_rate": 1.999895139096732e-05, + "loss": 0.7008, + "step": 143 + }, + { + "epoch": 0.0, + "learning_rate": 1.999893556341095e-05, + "loss": 0.6821, + "step": 144 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998919617304552e-05, + "loss": 0.6604, + "step": 145 + }, + { + "epoch": 0.01, + "learning_rate": 1.999890355264831e-05, + "loss": 0.669, + "step": 146 + }, + { + "epoch": 0.01, + "learning_rate": 1.999888736944242e-05, + "loss": 0.6264, + "step": 147 + }, + { + "epoch": 0.01, + "learning_rate": 1.999887106768707e-05, + "loss": 0.6856, + "step": 148 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998854647382454e-05, + "loss": 0.6742, + "step": 149 + }, + { + "epoch": 0.01, + "learning_rate": 1.999883810852877e-05, + "loss": 0.7097, + "step": 150 + }, + { + "epoch": 0.01, + "learning_rate": 1.999882145112621e-05, + "loss": 0.671, + "step": 151 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998804675174973e-05, + "loss": 0.7166, + "step": 152 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998787780675258e-05, + "loss": 0.6844, + "step": 153 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998770767627268e-05, + "loss": 0.6494, + "step": 154 + }, + { + "epoch": 0.01, + "learning_rate": 1.99987536360312e-05, + "loss": 0.6819, + "step": 155 + }, + { + "epoch": 0.01, + "learning_rate": 1.999873638588726e-05, + "loss": 0.6262, + "step": 156 + }, + { + "epoch": 0.01, + "learning_rate": 1.999871901719565e-05, + "loss": 0.6497, + "step": 157 + }, + { + "epoch": 0.01, + "learning_rate": 1.999870152995658e-05, + "loss": 0.7246, + "step": 158 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998683924170255e-05, + "loss": 0.6237, + "step": 159 + }, + { + "epoch": 0.01, + "learning_rate": 1.999866619983688e-05, + "loss": 0.6849, + "step": 160 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998648356956672e-05, + "loss": 0.669, + "step": 161 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998630395529838e-05, + "loss": 0.6396, + "step": 162 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998612315556593e-05, + "loss": 0.7026, + "step": 163 + }, + { + "epoch": 0.01, + "learning_rate": 1.999859411703715e-05, + "loss": 0.649, + "step": 164 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998575799971726e-05, + "loss": 0.6342, + "step": 165 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998557364360537e-05, + "loss": 0.6696, + "step": 166 + }, + { + "epoch": 0.01, + "learning_rate": 1.99985388102038e-05, + "loss": 0.758, + "step": 167 + }, + { + "epoch": 0.01, + "learning_rate": 1.999852013750174e-05, + "loss": 0.6685, + "step": 168 + }, + { + "epoch": 0.01, + "learning_rate": 1.999850134625458e-05, + "loss": 0.6515, + "step": 169 + }, + { + "epoch": 0.01, + "learning_rate": 1.999848243646253e-05, + "loss": 0.6701, + "step": 170 + }, + { + "epoch": 0.01, + "learning_rate": 1.999846340812583e-05, + "loss": 0.7115, + "step": 171 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998444261244695e-05, + "loss": 0.6693, + "step": 172 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998424995819354e-05, + "loss": 0.6831, + "step": 173 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998405611850036e-05, + "loss": 0.6355, + "step": 174 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998386109336974e-05, + "loss": 0.6397, + "step": 175 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998366488280398e-05, + "loss": 0.666, + "step": 176 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998346748680534e-05, + "loss": 0.7048, + "step": 177 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998326890537622e-05, + "loss": 0.692, + "step": 178 + }, + { + "epoch": 0.01, + "learning_rate": 1.99983069138519e-05, + "loss": 0.5899, + "step": 179 + }, + { + "epoch": 0.01, + "learning_rate": 1.99982868186236e-05, + "loss": 0.6942, + "step": 180 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998266604852965e-05, + "loss": 0.6529, + "step": 181 + }, + { + "epoch": 0.01, + "learning_rate": 1.999824627254023e-05, + "loss": 0.6145, + "step": 182 + }, + { + "epoch": 0.01, + "learning_rate": 1.999822582168563e-05, + "loss": 0.6123, + "step": 183 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998205252289425e-05, + "loss": 0.6338, + "step": 184 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998184564351846e-05, + "loss": 0.5915, + "step": 185 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998163757873138e-05, + "loss": 0.6495, + "step": 186 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998142832853554e-05, + "loss": 0.6947, + "step": 187 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998121789293342e-05, + "loss": 0.6541, + "step": 188 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998100627192743e-05, + "loss": 0.6577, + "step": 189 + }, + { + "epoch": 0.01, + "learning_rate": 1.9998079346552014e-05, + "loss": 0.6453, + "step": 190 + }, + { + "epoch": 0.01, + "learning_rate": 1.999805794737141e-05, + "loss": 0.642, + "step": 191 + }, + { + "epoch": 0.01, + "learning_rate": 1.999803642965118e-05, + "loss": 0.6259, + "step": 192 + }, + { + "epoch": 0.01, + "learning_rate": 1.999801479339158e-05, + "loss": 0.6648, + "step": 193 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997993038592866e-05, + "loss": 0.6516, + "step": 194 + }, + { + "epoch": 0.01, + "learning_rate": 1.99979711652553e-05, + "loss": 0.6825, + "step": 195 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997949173379138e-05, + "loss": 0.648, + "step": 196 + }, + { + "epoch": 0.01, + "learning_rate": 1.999792706296464e-05, + "loss": 0.7087, + "step": 197 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997904834012067e-05, + "loss": 0.6998, + "step": 198 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997882486521686e-05, + "loss": 0.7002, + "step": 199 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997860020493763e-05, + "loss": 0.6872, + "step": 200 + }, + { + "epoch": 0.01, + "learning_rate": 1.999783743592856e-05, + "loss": 0.6346, + "step": 201 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997814732826345e-05, + "loss": 0.6779, + "step": 202 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997791911187394e-05, + "loss": 0.6303, + "step": 203 + }, + { + "epoch": 0.01, + "learning_rate": 1.999776897101197e-05, + "loss": 0.7138, + "step": 204 + }, + { + "epoch": 0.01, + "learning_rate": 1.999774591230035e-05, + "loss": 0.6549, + "step": 205 + }, + { + "epoch": 0.01, + "learning_rate": 1.99977227350528e-05, + "loss": 0.6514, + "step": 206 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997699439269603e-05, + "loss": 0.7101, + "step": 207 + }, + { + "epoch": 0.01, + "learning_rate": 1.999767602495103e-05, + "loss": 0.7045, + "step": 208 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997652492097362e-05, + "loss": 0.6947, + "step": 209 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997628840708877e-05, + "loss": 0.6573, + "step": 210 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997605070785856e-05, + "loss": 0.6927, + "step": 211 + }, + { + "epoch": 0.01, + "learning_rate": 1.999758118232858e-05, + "loss": 0.7084, + "step": 212 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997557175337327e-05, + "loss": 0.637, + "step": 213 + }, + { + "epoch": 0.01, + "learning_rate": 1.999753304981239e-05, + "loss": 0.6459, + "step": 214 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997508805754055e-05, + "loss": 0.6703, + "step": 215 + }, + { + "epoch": 0.01, + "learning_rate": 1.99974844431626e-05, + "loss": 0.6845, + "step": 216 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997459962038325e-05, + "loss": 0.7065, + "step": 217 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997435362381513e-05, + "loss": 0.6916, + "step": 218 + }, + { + "epoch": 0.01, + "learning_rate": 1.999741064419246e-05, + "loss": 0.6717, + "step": 219 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997385807471455e-05, + "loss": 0.6564, + "step": 220 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997360852218795e-05, + "loss": 0.6881, + "step": 221 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997335778434776e-05, + "loss": 0.6871, + "step": 222 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997310586119694e-05, + "loss": 0.7128, + "step": 223 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997285275273847e-05, + "loss": 0.6689, + "step": 224 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997259845897537e-05, + "loss": 0.6682, + "step": 225 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997234297991065e-05, + "loss": 0.6399, + "step": 226 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997208631554736e-05, + "loss": 0.6845, + "step": 227 + }, + { + "epoch": 0.01, + "learning_rate": 1.999718284658885e-05, + "loss": 0.6598, + "step": 228 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997156943093716e-05, + "loss": 0.6531, + "step": 229 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997130921069638e-05, + "loss": 0.6963, + "step": 230 + }, + { + "epoch": 0.01, + "learning_rate": 1.999710478051693e-05, + "loss": 0.6536, + "step": 231 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997078521435897e-05, + "loss": 0.6364, + "step": 232 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997052143826852e-05, + "loss": 0.6612, + "step": 233 + }, + { + "epoch": 0.01, + "learning_rate": 1.9997025647690106e-05, + "loss": 0.6359, + "step": 234 + }, + { + "epoch": 0.01, + "learning_rate": 1.9996999033025973e-05, + "loss": 0.6627, + "step": 235 + }, + { + "epoch": 0.01, + "learning_rate": 1.9996972299834774e-05, + "loss": 0.6965, + "step": 236 + }, + { + "epoch": 0.01, + "learning_rate": 1.999694544811682e-05, + "loss": 0.6281, + "step": 237 + }, + { + "epoch": 0.01, + "learning_rate": 1.9996918477872432e-05, + "loss": 0.6628, + "step": 238 + }, + { + "epoch": 0.01, + "learning_rate": 1.999689138910193e-05, + "loss": 0.6152, + "step": 239 + }, + { + "epoch": 0.01, + "learning_rate": 1.9996864181805634e-05, + "loss": 0.7181, + "step": 240 + }, + { + "epoch": 0.01, + "learning_rate": 1.9996836855983866e-05, + "loss": 0.6723, + "step": 241 + }, + { + "epoch": 0.01, + "learning_rate": 1.999680941163695e-05, + "loss": 0.6562, + "step": 242 + }, + { + "epoch": 0.01, + "learning_rate": 1.9996781848765217e-05, + "loss": 0.676, + "step": 243 + }, + { + "epoch": 0.01, + "learning_rate": 1.999675416736899e-05, + "loss": 0.6982, + "step": 244 + }, + { + "epoch": 0.01, + "learning_rate": 1.999672636744859e-05, + "loss": 0.6426, + "step": 245 + }, + { + "epoch": 0.01, + "learning_rate": 1.9996698449004355e-05, + "loss": 0.6921, + "step": 246 + }, + { + "epoch": 0.01, + "learning_rate": 1.9996670412036615e-05, + "loss": 0.6698, + "step": 247 + }, + { + "epoch": 0.01, + "learning_rate": 1.9996642256545703e-05, + "loss": 0.7375, + "step": 248 + }, + { + "epoch": 0.01, + "learning_rate": 1.9996613982531947e-05, + "loss": 0.7026, + "step": 249 + }, + { + "epoch": 0.01, + "learning_rate": 1.9996585589995693e-05, + "loss": 0.6962, + "step": 250 + }, + { + "epoch": 0.01, + "learning_rate": 1.9996557078937264e-05, + "loss": 0.6152, + "step": 251 + }, + { + "epoch": 0.01, + "learning_rate": 1.999652844935701e-05, + "loss": 0.6328, + "step": 252 + }, + { + "epoch": 0.01, + "learning_rate": 1.999649970125526e-05, + "loss": 0.6748, + "step": 253 + }, + { + "epoch": 0.01, + "learning_rate": 1.9996470834632367e-05, + "loss": 0.6736, + "step": 254 + }, + { + "epoch": 0.01, + "learning_rate": 1.9996441849488664e-05, + "loss": 0.6989, + "step": 255 + }, + { + "epoch": 0.01, + "learning_rate": 1.9996412745824497e-05, + "loss": 0.7381, + "step": 256 + }, + { + "epoch": 0.01, + "learning_rate": 1.9996383523640214e-05, + "loss": 0.6741, + "step": 257 + }, + { + "epoch": 0.01, + "learning_rate": 1.9996354182936157e-05, + "loss": 0.7372, + "step": 258 + }, + { + "epoch": 0.01, + "learning_rate": 1.999632472371267e-05, + "loss": 0.6564, + "step": 259 + }, + { + "epoch": 0.01, + "learning_rate": 1.9996295145970116e-05, + "loss": 0.6507, + "step": 260 + }, + { + "epoch": 0.01, + "learning_rate": 1.9996265449708834e-05, + "loss": 0.6899, + "step": 261 + }, + { + "epoch": 0.01, + "learning_rate": 1.999623563492918e-05, + "loss": 0.654, + "step": 262 + }, + { + "epoch": 0.01, + "learning_rate": 1.999620570163151e-05, + "loss": 0.6122, + "step": 263 + }, + { + "epoch": 0.01, + "learning_rate": 1.999617564981617e-05, + "loss": 0.68, + "step": 264 + }, + { + "epoch": 0.01, + "learning_rate": 1.9996145479483528e-05, + "loss": 0.6505, + "step": 265 + }, + { + "epoch": 0.01, + "learning_rate": 1.9996115190633937e-05, + "loss": 0.629, + "step": 266 + }, + { + "epoch": 0.01, + "learning_rate": 1.999608478326775e-05, + "loss": 0.6506, + "step": 267 + }, + { + "epoch": 0.01, + "learning_rate": 1.9996054257385334e-05, + "loss": 0.6576, + "step": 268 + }, + { + "epoch": 0.01, + "learning_rate": 1.9996023612987054e-05, + "loss": 0.6864, + "step": 269 + }, + { + "epoch": 0.01, + "learning_rate": 1.9995992850073265e-05, + "loss": 0.6596, + "step": 270 + }, + { + "epoch": 0.01, + "learning_rate": 1.9995961968644337e-05, + "loss": 0.7001, + "step": 271 + }, + { + "epoch": 0.01, + "learning_rate": 1.9995930968700633e-05, + "loss": 0.6973, + "step": 272 + }, + { + "epoch": 0.01, + "learning_rate": 1.9995899850242525e-05, + "loss": 0.7016, + "step": 273 + }, + { + "epoch": 0.01, + "learning_rate": 1.999586861327038e-05, + "loss": 0.6668, + "step": 274 + }, + { + "epoch": 0.01, + "learning_rate": 1.9995837257784564e-05, + "loss": 0.6838, + "step": 275 + }, + { + "epoch": 0.01, + "learning_rate": 1.9995805783785457e-05, + "loss": 0.6747, + "step": 276 + }, + { + "epoch": 0.01, + "learning_rate": 1.9995774191273427e-05, + "loss": 0.6399, + "step": 277 + }, + { + "epoch": 0.01, + "learning_rate": 1.9995742480248847e-05, + "loss": 0.7069, + "step": 278 + }, + { + "epoch": 0.01, + "learning_rate": 1.9995710650712096e-05, + "loss": 0.6573, + "step": 279 + }, + { + "epoch": 0.01, + "learning_rate": 1.999567870266355e-05, + "loss": 0.6539, + "step": 280 + }, + { + "epoch": 0.01, + "learning_rate": 1.999564663610359e-05, + "loss": 0.6717, + "step": 281 + }, + { + "epoch": 0.01, + "learning_rate": 1.9995614451032593e-05, + "loss": 0.6501, + "step": 282 + }, + { + "epoch": 0.01, + "learning_rate": 1.9995582147450943e-05, + "loss": 0.681, + "step": 283 + }, + { + "epoch": 0.01, + "learning_rate": 1.9995549725359022e-05, + "loss": 0.6866, + "step": 284 + }, + { + "epoch": 0.01, + "learning_rate": 1.9995517184757217e-05, + "loss": 0.6517, + "step": 285 + }, + { + "epoch": 0.01, + "learning_rate": 1.9995484525645907e-05, + "loss": 0.669, + "step": 286 + }, + { + "epoch": 0.01, + "learning_rate": 1.9995451748025486e-05, + "loss": 0.6985, + "step": 287 + }, + { + "epoch": 0.01, + "learning_rate": 1.999541885189634e-05, + "loss": 0.6871, + "step": 288 + }, + { + "epoch": 0.01, + "learning_rate": 1.999538583725886e-05, + "loss": 0.6825, + "step": 289 + }, + { + "epoch": 0.01, + "learning_rate": 1.9995352704113434e-05, + "loss": 0.6675, + "step": 290 + }, + { + "epoch": 0.01, + "learning_rate": 1.9995319452460457e-05, + "loss": 0.6176, + "step": 291 + }, + { + "epoch": 0.01, + "learning_rate": 1.999528608230033e-05, + "loss": 0.6468, + "step": 292 + }, + { + "epoch": 0.01, + "learning_rate": 1.9995252593633436e-05, + "loss": 0.6797, + "step": 293 + }, + { + "epoch": 0.01, + "learning_rate": 1.999521898646018e-05, + "loss": 0.6408, + "step": 294 + }, + { + "epoch": 0.01, + "learning_rate": 1.999518526078096e-05, + "loss": 0.7437, + "step": 295 + }, + { + "epoch": 0.01, + "learning_rate": 1.9995151416596174e-05, + "loss": 0.6256, + "step": 296 + }, + { + "epoch": 0.01, + "learning_rate": 1.9995117453906224e-05, + "loss": 0.6528, + "step": 297 + }, + { + "epoch": 0.01, + "learning_rate": 1.9995083372711513e-05, + "loss": 0.6495, + "step": 298 + }, + { + "epoch": 0.01, + "learning_rate": 1.9995049173012448e-05, + "loss": 0.6608, + "step": 299 + }, + { + "epoch": 0.01, + "learning_rate": 1.9995014854809427e-05, + "loss": 0.6979, + "step": 300 + }, + { + "epoch": 0.01, + "learning_rate": 1.9994980418102862e-05, + "loss": 0.669, + "step": 301 + }, + { + "epoch": 0.01, + "learning_rate": 1.9994945862893162e-05, + "loss": 0.6566, + "step": 302 + }, + { + "epoch": 0.01, + "learning_rate": 1.9994911189180734e-05, + "loss": 0.6375, + "step": 303 + }, + { + "epoch": 0.01, + "learning_rate": 1.9994876396965987e-05, + "loss": 0.6745, + "step": 304 + }, + { + "epoch": 0.01, + "learning_rate": 1.9994841486249342e-05, + "loss": 0.6077, + "step": 305 + }, + { + "epoch": 0.01, + "learning_rate": 1.9994806457031206e-05, + "loss": 0.6828, + "step": 306 + }, + { + "epoch": 0.01, + "learning_rate": 1.9994771309311995e-05, + "loss": 0.6229, + "step": 307 + }, + { + "epoch": 0.01, + "learning_rate": 1.9994736043092126e-05, + "loss": 0.692, + "step": 308 + }, + { + "epoch": 0.01, + "learning_rate": 1.999470065837202e-05, + "loss": 0.725, + "step": 309 + }, + { + "epoch": 0.01, + "learning_rate": 1.9994665155152093e-05, + "loss": 0.67, + "step": 310 + }, + { + "epoch": 0.01, + "learning_rate": 1.9994629533432767e-05, + "loss": 0.6253, + "step": 311 + }, + { + "epoch": 0.01, + "learning_rate": 1.9994593793214467e-05, + "loss": 0.5849, + "step": 312 + }, + { + "epoch": 0.01, + "learning_rate": 1.999455793449761e-05, + "loss": 0.6863, + "step": 313 + }, + { + "epoch": 0.01, + "learning_rate": 1.9994521957282627e-05, + "loss": 0.6389, + "step": 314 + }, + { + "epoch": 0.01, + "learning_rate": 1.9994485861569946e-05, + "loss": 0.6762, + "step": 315 + }, + { + "epoch": 0.01, + "learning_rate": 1.9994449647359987e-05, + "loss": 0.6483, + "step": 316 + }, + { + "epoch": 0.01, + "learning_rate": 1.999441331465319e-05, + "loss": 0.6637, + "step": 317 + }, + { + "epoch": 0.01, + "learning_rate": 1.9994376863449978e-05, + "loss": 0.6964, + "step": 318 + }, + { + "epoch": 0.01, + "learning_rate": 1.9994340293750784e-05, + "loss": 0.6615, + "step": 319 + }, + { + "epoch": 0.01, + "learning_rate": 1.9994303605556045e-05, + "loss": 0.6757, + "step": 320 + }, + { + "epoch": 0.01, + "learning_rate": 1.9994266798866195e-05, + "loss": 0.7322, + "step": 321 + }, + { + "epoch": 0.01, + "learning_rate": 1.9994229873681663e-05, + "loss": 0.6741, + "step": 322 + }, + { + "epoch": 0.01, + "learning_rate": 1.9994192830002896e-05, + "loss": 0.6331, + "step": 323 + }, + { + "epoch": 0.01, + "learning_rate": 1.9994155667830333e-05, + "loss": 0.6537, + "step": 324 + }, + { + "epoch": 0.01, + "learning_rate": 1.9994118387164413e-05, + "loss": 0.6324, + "step": 325 + }, + { + "epoch": 0.01, + "learning_rate": 1.999408098800557e-05, + "loss": 0.7125, + "step": 326 + }, + { + "epoch": 0.01, + "learning_rate": 1.999404347035426e-05, + "loss": 0.6934, + "step": 327 + }, + { + "epoch": 0.01, + "learning_rate": 1.999400583421092e-05, + "loss": 0.6976, + "step": 328 + }, + { + "epoch": 0.01, + "learning_rate": 1.9993968079576002e-05, + "loss": 0.7064, + "step": 329 + }, + { + "epoch": 0.01, + "learning_rate": 1.9993930206449943e-05, + "loss": 0.6366, + "step": 330 + }, + { + "epoch": 0.01, + "learning_rate": 1.9993892214833203e-05, + "loss": 0.6612, + "step": 331 + }, + { + "epoch": 0.01, + "learning_rate": 1.9993854104726228e-05, + "loss": 0.6447, + "step": 332 + }, + { + "epoch": 0.01, + "learning_rate": 1.9993815876129474e-05, + "loss": 0.6572, + "step": 333 + }, + { + "epoch": 0.01, + "learning_rate": 1.9993777529043384e-05, + "loss": 0.6659, + "step": 334 + }, + { + "epoch": 0.01, + "learning_rate": 1.9993739063468424e-05, + "loss": 0.6001, + "step": 335 + }, + { + "epoch": 0.01, + "learning_rate": 1.9993700479405044e-05, + "loss": 0.6715, + "step": 336 + }, + { + "epoch": 0.01, + "learning_rate": 1.9993661776853704e-05, + "loss": 0.6839, + "step": 337 + }, + { + "epoch": 0.01, + "learning_rate": 1.999362295581486e-05, + "loss": 0.6628, + "step": 338 + }, + { + "epoch": 0.01, + "learning_rate": 1.9993584016288973e-05, + "loss": 0.6574, + "step": 339 + }, + { + "epoch": 0.01, + "learning_rate": 1.9993544958276506e-05, + "loss": 0.6423, + "step": 340 + }, + { + "epoch": 0.01, + "learning_rate": 1.9993505781777923e-05, + "loss": 0.6907, + "step": 341 + }, + { + "epoch": 0.01, + "learning_rate": 1.9993466486793685e-05, + "loss": 0.6485, + "step": 342 + }, + { + "epoch": 0.01, + "learning_rate": 1.9993427073324262e-05, + "loss": 0.6791, + "step": 343 + }, + { + "epoch": 0.01, + "learning_rate": 1.9993387541370116e-05, + "loss": 0.7051, + "step": 344 + }, + { + "epoch": 0.01, + "learning_rate": 1.9993347890931723e-05, + "loss": 0.6364, + "step": 345 + }, + { + "epoch": 0.01, + "learning_rate": 1.999330812200955e-05, + "loss": 0.6741, + "step": 346 + }, + { + "epoch": 0.01, + "learning_rate": 1.9993268234604063e-05, + "loss": 0.6663, + "step": 347 + }, + { + "epoch": 0.01, + "learning_rate": 1.999322822871574e-05, + "loss": 0.6749, + "step": 348 + }, + { + "epoch": 0.01, + "learning_rate": 1.9993188104345054e-05, + "loss": 0.6691, + "step": 349 + }, + { + "epoch": 0.01, + "learning_rate": 1.9993147861492486e-05, + "loss": 0.6295, + "step": 350 + }, + { + "epoch": 0.01, + "learning_rate": 1.9993107500158508e-05, + "loss": 0.6685, + "step": 351 + }, + { + "epoch": 0.01, + "learning_rate": 1.9993067020343597e-05, + "loss": 0.6714, + "step": 352 + }, + { + "epoch": 0.01, + "learning_rate": 1.9993026422048238e-05, + "loss": 0.6694, + "step": 353 + }, + { + "epoch": 0.01, + "learning_rate": 1.9992985705272906e-05, + "loss": 0.6869, + "step": 354 + }, + { + "epoch": 0.01, + "learning_rate": 1.999294487001809e-05, + "loss": 0.6464, + "step": 355 + }, + { + "epoch": 0.01, + "learning_rate": 1.999290391628427e-05, + "loss": 0.6531, + "step": 356 + }, + { + "epoch": 0.01, + "learning_rate": 1.9992862844071933e-05, + "loss": 0.6748, + "step": 357 + }, + { + "epoch": 0.01, + "learning_rate": 1.9992821653381568e-05, + "loss": 0.678, + "step": 358 + }, + { + "epoch": 0.01, + "learning_rate": 1.999278034421366e-05, + "loss": 0.662, + "step": 359 + }, + { + "epoch": 0.01, + "learning_rate": 1.99927389165687e-05, + "loss": 0.6468, + "step": 360 + }, + { + "epoch": 0.01, + "learning_rate": 1.9992697370447177e-05, + "loss": 0.6266, + "step": 361 + }, + { + "epoch": 0.01, + "learning_rate": 1.999265570584959e-05, + "loss": 0.6633, + "step": 362 + }, + { + "epoch": 0.01, + "learning_rate": 1.9992613922776424e-05, + "loss": 0.6867, + "step": 363 + }, + { + "epoch": 0.01, + "learning_rate": 1.9992572021228183e-05, + "loss": 0.6307, + "step": 364 + }, + { + "epoch": 0.01, + "learning_rate": 1.9992530001205356e-05, + "loss": 0.6664, + "step": 365 + }, + { + "epoch": 0.01, + "learning_rate": 1.999248786270845e-05, + "loss": 0.6466, + "step": 366 + }, + { + "epoch": 0.01, + "learning_rate": 1.999244560573796e-05, + "loss": 0.6394, + "step": 367 + }, + { + "epoch": 0.01, + "learning_rate": 1.9992403230294384e-05, + "loss": 0.6983, + "step": 368 + }, + { + "epoch": 0.01, + "learning_rate": 1.9992360736378226e-05, + "loss": 0.6417, + "step": 369 + }, + { + "epoch": 0.01, + "learning_rate": 1.9992318123989995e-05, + "loss": 0.6915, + "step": 370 + }, + { + "epoch": 0.01, + "learning_rate": 1.999227539313019e-05, + "loss": 0.6626, + "step": 371 + }, + { + "epoch": 0.01, + "learning_rate": 1.9992232543799322e-05, + "loss": 0.6646, + "step": 372 + }, + { + "epoch": 0.01, + "learning_rate": 1.9992189575997893e-05, + "loss": 0.6502, + "step": 373 + }, + { + "epoch": 0.01, + "learning_rate": 1.9992146489726417e-05, + "loss": 0.6562, + "step": 374 + }, + { + "epoch": 0.01, + "learning_rate": 1.9992103284985407e-05, + "loss": 0.6618, + "step": 375 + }, + { + "epoch": 0.01, + "learning_rate": 1.9992059961775373e-05, + "loss": 0.6231, + "step": 376 + }, + { + "epoch": 0.01, + "learning_rate": 1.9992016520096825e-05, + "loss": 0.7064, + "step": 377 + }, + { + "epoch": 0.01, + "learning_rate": 1.9991972959950284e-05, + "loss": 0.6356, + "step": 378 + }, + { + "epoch": 0.01, + "learning_rate": 1.999192928133626e-05, + "loss": 0.6997, + "step": 379 + }, + { + "epoch": 0.01, + "learning_rate": 1.999188548425528e-05, + "loss": 0.715, + "step": 380 + }, + { + "epoch": 0.01, + "learning_rate": 1.9991841568707854e-05, + "loss": 0.6737, + "step": 381 + }, + { + "epoch": 0.01, + "learning_rate": 1.9991797534694507e-05, + "loss": 0.6466, + "step": 382 + }, + { + "epoch": 0.01, + "learning_rate": 1.999175338221576e-05, + "loss": 0.6137, + "step": 383 + }, + { + "epoch": 0.01, + "learning_rate": 1.9991709111272138e-05, + "loss": 0.7074, + "step": 384 + }, + { + "epoch": 0.01, + "learning_rate": 1.9991664721864167e-05, + "loss": 0.6301, + "step": 385 + }, + { + "epoch": 0.01, + "learning_rate": 1.9991620213992366e-05, + "loss": 0.6615, + "step": 386 + }, + { + "epoch": 0.01, + "learning_rate": 1.999157558765727e-05, + "loss": 0.6592, + "step": 387 + }, + { + "epoch": 0.01, + "learning_rate": 1.9991530842859408e-05, + "loss": 0.6536, + "step": 388 + }, + { + "epoch": 0.01, + "learning_rate": 1.9991485979599305e-05, + "loss": 0.6525, + "step": 389 + }, + { + "epoch": 0.01, + "learning_rate": 1.99914409978775e-05, + "loss": 0.6904, + "step": 390 + }, + { + "epoch": 0.01, + "learning_rate": 1.9991395897694523e-05, + "loss": 0.6809, + "step": 391 + }, + { + "epoch": 0.01, + "learning_rate": 1.9991350679050904e-05, + "loss": 0.7001, + "step": 392 + }, + { + "epoch": 0.01, + "learning_rate": 1.999130534194719e-05, + "loss": 0.6559, + "step": 393 + }, + { + "epoch": 0.01, + "learning_rate": 1.9991259886383907e-05, + "loss": 0.7366, + "step": 394 + }, + { + "epoch": 0.01, + "learning_rate": 1.99912143123616e-05, + "loss": 0.6639, + "step": 395 + }, + { + "epoch": 0.01, + "learning_rate": 1.999116861988081e-05, + "loss": 0.6234, + "step": 396 + }, + { + "epoch": 0.01, + "learning_rate": 1.9991122808942075e-05, + "loss": 0.6446, + "step": 397 + }, + { + "epoch": 0.01, + "learning_rate": 1.999107687954594e-05, + "loss": 0.6334, + "step": 398 + }, + { + "epoch": 0.01, + "learning_rate": 1.999103083169295e-05, + "loss": 0.6646, + "step": 399 + }, + { + "epoch": 0.01, + "learning_rate": 1.9990984665383654e-05, + "loss": 0.6418, + "step": 400 + }, + { + "epoch": 0.01, + "learning_rate": 1.9990938380618594e-05, + "loss": 0.6635, + "step": 401 + }, + { + "epoch": 0.01, + "learning_rate": 1.999089197739832e-05, + "loss": 0.6835, + "step": 402 + }, + { + "epoch": 0.01, + "learning_rate": 1.9990845455723385e-05, + "loss": 0.6757, + "step": 403 + }, + { + "epoch": 0.01, + "learning_rate": 1.9990798815594336e-05, + "loss": 0.6286, + "step": 404 + }, + { + "epoch": 0.01, + "learning_rate": 1.999075205701173e-05, + "loss": 0.6338, + "step": 405 + }, + { + "epoch": 0.01, + "learning_rate": 1.9990705179976123e-05, + "loss": 0.7339, + "step": 406 + }, + { + "epoch": 0.01, + "learning_rate": 1.9990658184488062e-05, + "loss": 0.6696, + "step": 407 + }, + { + "epoch": 0.01, + "learning_rate": 1.9990611070548115e-05, + "loss": 0.6464, + "step": 408 + }, + { + "epoch": 0.01, + "learning_rate": 1.9990563838156835e-05, + "loss": 0.6404, + "step": 409 + }, + { + "epoch": 0.01, + "learning_rate": 1.9990516487314777e-05, + "loss": 0.6409, + "step": 410 + }, + { + "epoch": 0.01, + "learning_rate": 1.9990469018022513e-05, + "loss": 0.6854, + "step": 411 + }, + { + "epoch": 0.01, + "learning_rate": 1.99904214302806e-05, + "loss": 0.757, + "step": 412 + }, + { + "epoch": 0.01, + "learning_rate": 1.9990373724089602e-05, + "loss": 0.6987, + "step": 413 + }, + { + "epoch": 0.01, + "learning_rate": 1.9990325899450086e-05, + "loss": 0.6783, + "step": 414 + }, + { + "epoch": 0.01, + "learning_rate": 1.999027795636262e-05, + "loss": 0.6768, + "step": 415 + }, + { + "epoch": 0.01, + "learning_rate": 1.999022989482777e-05, + "loss": 0.6386, + "step": 416 + }, + { + "epoch": 0.01, + "learning_rate": 1.999018171484611e-05, + "loss": 0.6743, + "step": 417 + }, + { + "epoch": 0.01, + "learning_rate": 1.9990133416418206e-05, + "loss": 0.705, + "step": 418 + }, + { + "epoch": 0.01, + "learning_rate": 1.9990084999544628e-05, + "loss": 0.6619, + "step": 419 + }, + { + "epoch": 0.01, + "learning_rate": 1.999003646422596e-05, + "loss": 0.6282, + "step": 420 + }, + { + "epoch": 0.01, + "learning_rate": 1.998998781046277e-05, + "loss": 0.6502, + "step": 421 + }, + { + "epoch": 0.01, + "learning_rate": 1.998993903825564e-05, + "loss": 0.6198, + "step": 422 + }, + { + "epoch": 0.01, + "learning_rate": 1.9989890147605143e-05, + "loss": 0.6751, + "step": 423 + }, + { + "epoch": 0.01, + "learning_rate": 1.998984113851186e-05, + "loss": 0.6718, + "step": 424 + }, + { + "epoch": 0.01, + "learning_rate": 1.9989792010976376e-05, + "loss": 0.677, + "step": 425 + }, + { + "epoch": 0.01, + "learning_rate": 1.9989742764999268e-05, + "loss": 0.6689, + "step": 426 + }, + { + "epoch": 0.01, + "learning_rate": 1.9989693400581122e-05, + "loss": 0.6629, + "step": 427 + }, + { + "epoch": 0.01, + "learning_rate": 1.998964391772253e-05, + "loss": 0.648, + "step": 428 + }, + { + "epoch": 0.01, + "learning_rate": 1.9989594316424065e-05, + "loss": 0.652, + "step": 429 + }, + { + "epoch": 0.01, + "learning_rate": 1.9989544596686325e-05, + "loss": 0.6425, + "step": 430 + }, + { + "epoch": 0.01, + "learning_rate": 1.99894947585099e-05, + "loss": 0.6606, + "step": 431 + }, + { + "epoch": 0.01, + "learning_rate": 1.9989444801895374e-05, + "loss": 0.6397, + "step": 432 + }, + { + "epoch": 0.02, + "learning_rate": 1.9989394726843342e-05, + "loss": 0.6531, + "step": 433 + }, + { + "epoch": 0.02, + "learning_rate": 1.9989344533354403e-05, + "loss": 0.6618, + "step": 434 + }, + { + "epoch": 0.02, + "learning_rate": 1.9989294221429146e-05, + "loss": 0.6447, + "step": 435 + }, + { + "epoch": 0.02, + "learning_rate": 1.998924379106817e-05, + "loss": 0.646, + "step": 436 + }, + { + "epoch": 0.02, + "learning_rate": 1.998919324227207e-05, + "loss": 0.6244, + "step": 437 + }, + { + "epoch": 0.02, + "learning_rate": 1.998914257504145e-05, + "loss": 0.6767, + "step": 438 + }, + { + "epoch": 0.02, + "learning_rate": 1.9989091789376905e-05, + "loss": 0.6886, + "step": 439 + }, + { + "epoch": 0.02, + "learning_rate": 1.9989040885279044e-05, + "loss": 0.6911, + "step": 440 + }, + { + "epoch": 0.02, + "learning_rate": 1.998898986274847e-05, + "loss": 0.6695, + "step": 441 + }, + { + "epoch": 0.02, + "learning_rate": 1.998893872178578e-05, + "loss": 0.6494, + "step": 442 + }, + { + "epoch": 0.02, + "learning_rate": 1.9988887462391585e-05, + "loss": 0.6884, + "step": 443 + }, + { + "epoch": 0.02, + "learning_rate": 1.9988836084566495e-05, + "loss": 0.6403, + "step": 444 + }, + { + "epoch": 0.02, + "learning_rate": 1.9988784588311118e-05, + "loss": 0.6263, + "step": 445 + }, + { + "epoch": 0.02, + "learning_rate": 1.9988732973626065e-05, + "loss": 0.7104, + "step": 446 + }, + { + "epoch": 0.02, + "learning_rate": 1.9988681240511944e-05, + "loss": 0.6558, + "step": 447 + }, + { + "epoch": 0.02, + "learning_rate": 1.998862938896937e-05, + "loss": 0.7346, + "step": 448 + }, + { + "epoch": 0.02, + "learning_rate": 1.9988577418998963e-05, + "loss": 0.7029, + "step": 449 + }, + { + "epoch": 0.02, + "learning_rate": 1.9988525330601335e-05, + "loss": 0.6575, + "step": 450 + }, + { + "epoch": 0.02, + "learning_rate": 1.99884731237771e-05, + "loss": 0.6277, + "step": 451 + }, + { + "epoch": 0.02, + "learning_rate": 1.9988420798526885e-05, + "loss": 0.6278, + "step": 452 + }, + { + "epoch": 0.02, + "learning_rate": 1.9988368354851303e-05, + "loss": 0.6512, + "step": 453 + }, + { + "epoch": 0.02, + "learning_rate": 1.9988315792750977e-05, + "loss": 0.6582, + "step": 454 + }, + { + "epoch": 0.02, + "learning_rate": 1.9988263112226534e-05, + "loss": 0.6563, + "step": 455 + }, + { + "epoch": 0.02, + "learning_rate": 1.99882103132786e-05, + "loss": 0.6312, + "step": 456 + }, + { + "epoch": 0.02, + "learning_rate": 1.9988157395907796e-05, + "loss": 0.671, + "step": 457 + }, + { + "epoch": 0.02, + "learning_rate": 1.998810436011475e-05, + "loss": 0.7301, + "step": 458 + }, + { + "epoch": 0.02, + "learning_rate": 1.9988051205900088e-05, + "loss": 0.7009, + "step": 459 + }, + { + "epoch": 0.02, + "learning_rate": 1.9987997933264446e-05, + "loss": 0.684, + "step": 460 + }, + { + "epoch": 0.02, + "learning_rate": 1.998794454220846e-05, + "loss": 0.6436, + "step": 461 + }, + { + "epoch": 0.02, + "learning_rate": 1.998789103273275e-05, + "loss": 0.6916, + "step": 462 + }, + { + "epoch": 0.02, + "learning_rate": 1.9987837404837957e-05, + "loss": 0.6431, + "step": 463 + }, + { + "epoch": 0.02, + "learning_rate": 1.9987783658524717e-05, + "loss": 0.6918, + "step": 464 + }, + { + "epoch": 0.02, + "learning_rate": 1.9987729793793668e-05, + "loss": 0.6749, + "step": 465 + }, + { + "epoch": 0.02, + "learning_rate": 1.9987675810645452e-05, + "loss": 0.6272, + "step": 466 + }, + { + "epoch": 0.02, + "learning_rate": 1.9987621709080698e-05, + "loss": 0.6625, + "step": 467 + }, + { + "epoch": 0.02, + "learning_rate": 1.998756748910006e-05, + "loss": 0.6728, + "step": 468 + }, + { + "epoch": 0.02, + "learning_rate": 1.998751315070417e-05, + "loss": 0.6727, + "step": 469 + }, + { + "epoch": 0.02, + "learning_rate": 1.998745869389368e-05, + "loss": 0.7283, + "step": 470 + }, + { + "epoch": 0.02, + "learning_rate": 1.9987404118669233e-05, + "loss": 0.6727, + "step": 471 + }, + { + "epoch": 0.02, + "learning_rate": 1.9987349425031475e-05, + "loss": 0.6526, + "step": 472 + }, + { + "epoch": 0.02, + "learning_rate": 1.9987294612981055e-05, + "loss": 0.718, + "step": 473 + }, + { + "epoch": 0.02, + "learning_rate": 1.9987239682518628e-05, + "loss": 0.6871, + "step": 474 + }, + { + "epoch": 0.02, + "learning_rate": 1.9987184633644836e-05, + "loss": 0.6442, + "step": 475 + }, + { + "epoch": 0.02, + "learning_rate": 1.998712946636034e-05, + "loss": 0.6572, + "step": 476 + }, + { + "epoch": 0.02, + "learning_rate": 1.9987074180665784e-05, + "loss": 0.6738, + "step": 477 + }, + { + "epoch": 0.02, + "learning_rate": 1.9987018776561835e-05, + "loss": 0.6871, + "step": 478 + }, + { + "epoch": 0.02, + "learning_rate": 1.9986963254049144e-05, + "loss": 0.6738, + "step": 479 + }, + { + "epoch": 0.02, + "learning_rate": 1.998690761312837e-05, + "loss": 0.7051, + "step": 480 + }, + { + "epoch": 0.02, + "learning_rate": 1.9986851853800174e-05, + "loss": 0.657, + "step": 481 + }, + { + "epoch": 0.02, + "learning_rate": 1.9986795976065213e-05, + "loss": 0.6326, + "step": 482 + }, + { + "epoch": 0.02, + "learning_rate": 1.9986739979924153e-05, + "loss": 0.6632, + "step": 483 + }, + { + "epoch": 0.02, + "learning_rate": 1.9986683865377658e-05, + "loss": 0.6244, + "step": 484 + }, + { + "epoch": 0.02, + "learning_rate": 1.9986627632426393e-05, + "loss": 0.6894, + "step": 485 + }, + { + "epoch": 0.02, + "learning_rate": 1.9986571281071024e-05, + "loss": 0.669, + "step": 486 + }, + { + "epoch": 0.02, + "learning_rate": 1.998651481131222e-05, + "loss": 0.6596, + "step": 487 + }, + { + "epoch": 0.02, + "learning_rate": 1.9986458223150648e-05, + "loss": 0.735, + "step": 488 + }, + { + "epoch": 0.02, + "learning_rate": 1.9986401516586982e-05, + "loss": 0.6984, + "step": 489 + }, + { + "epoch": 0.02, + "learning_rate": 1.9986344691621892e-05, + "loss": 0.6437, + "step": 490 + }, + { + "epoch": 0.02, + "learning_rate": 1.998628774825605e-05, + "loss": 0.6491, + "step": 491 + }, + { + "epoch": 0.02, + "learning_rate": 1.998623068649014e-05, + "loss": 0.7071, + "step": 492 + }, + { + "epoch": 0.02, + "learning_rate": 1.998617350632483e-05, + "loss": 0.6113, + "step": 493 + }, + { + "epoch": 0.02, + "learning_rate": 1.9986116207760802e-05, + "loss": 0.5655, + "step": 494 + }, + { + "epoch": 0.02, + "learning_rate": 1.9986058790798735e-05, + "loss": 0.661, + "step": 495 + }, + { + "epoch": 0.02, + "learning_rate": 1.9986001255439307e-05, + "loss": 0.7126, + "step": 496 + }, + { + "epoch": 0.02, + "learning_rate": 1.99859436016832e-05, + "loss": 0.6351, + "step": 497 + }, + { + "epoch": 0.02, + "learning_rate": 1.99858858295311e-05, + "loss": 0.724, + "step": 498 + }, + { + "epoch": 0.02, + "learning_rate": 1.9985827938983695e-05, + "loss": 0.6657, + "step": 499 + }, + { + "epoch": 0.02, + "learning_rate": 1.998576993004166e-05, + "loss": 0.6827, + "step": 500 + }, + { + "epoch": 0.02, + "learning_rate": 1.9985711802705695e-05, + "loss": 0.6548, + "step": 501 + }, + { + "epoch": 0.02, + "learning_rate": 1.9985653556976485e-05, + "loss": 0.7073, + "step": 502 + }, + { + "epoch": 0.02, + "learning_rate": 1.9985595192854718e-05, + "loss": 0.6465, + "step": 503 + }, + { + "epoch": 0.02, + "learning_rate": 1.998553671034109e-05, + "loss": 0.6026, + "step": 504 + }, + { + "epoch": 0.02, + "learning_rate": 1.9985478109436294e-05, + "loss": 0.7391, + "step": 505 + }, + { + "epoch": 0.02, + "learning_rate": 1.998541939014102e-05, + "loss": 0.714, + "step": 506 + }, + { + "epoch": 0.02, + "learning_rate": 1.9985360552455973e-05, + "loss": 0.6015, + "step": 507 + }, + { + "epoch": 0.02, + "learning_rate": 1.998530159638184e-05, + "loss": 0.7485, + "step": 508 + }, + { + "epoch": 0.02, + "learning_rate": 1.9985242521919325e-05, + "loss": 0.7235, + "step": 509 + }, + { + "epoch": 0.02, + "learning_rate": 1.9985183329069132e-05, + "loss": 0.643, + "step": 510 + }, + { + "epoch": 0.02, + "learning_rate": 1.9985124017831956e-05, + "loss": 0.6729, + "step": 511 + }, + { + "epoch": 0.02, + "learning_rate": 1.9985064588208502e-05, + "loss": 0.6805, + "step": 512 + }, + { + "epoch": 0.02, + "learning_rate": 1.9985005040199482e-05, + "loss": 0.7176, + "step": 513 + }, + { + "epoch": 0.02, + "learning_rate": 1.998494537380559e-05, + "loss": 0.7054, + "step": 514 + }, + { + "epoch": 0.02, + "learning_rate": 1.9984885589027546e-05, + "loss": 0.7019, + "step": 515 + }, + { + "epoch": 0.02, + "learning_rate": 1.9984825685866048e-05, + "loss": 0.683, + "step": 516 + }, + { + "epoch": 0.02, + "learning_rate": 1.998476566432181e-05, + "loss": 0.7019, + "step": 517 + }, + { + "epoch": 0.02, + "learning_rate": 1.9984705524395545e-05, + "loss": 0.6943, + "step": 518 + }, + { + "epoch": 0.02, + "learning_rate": 1.998464526608797e-05, + "loss": 0.6749, + "step": 519 + }, + { + "epoch": 0.02, + "learning_rate": 1.998458488939979e-05, + "loss": 0.6843, + "step": 520 + }, + { + "epoch": 0.02, + "learning_rate": 1.9984524394331727e-05, + "loss": 0.7013, + "step": 521 + }, + { + "epoch": 0.02, + "learning_rate": 1.9984463780884492e-05, + "loss": 0.6499, + "step": 522 + }, + { + "epoch": 0.02, + "learning_rate": 1.9984403049058813e-05, + "loss": 0.6786, + "step": 523 + }, + { + "epoch": 0.02, + "learning_rate": 1.9984342198855407e-05, + "loss": 0.6882, + "step": 524 + }, + { + "epoch": 0.02, + "learning_rate": 1.9984281230274993e-05, + "loss": 0.7124, + "step": 525 + }, + { + "epoch": 0.02, + "learning_rate": 1.9984220143318292e-05, + "loss": 0.6805, + "step": 526 + }, + { + "epoch": 0.02, + "learning_rate": 1.9984158937986033e-05, + "loss": 0.5811, + "step": 527 + }, + { + "epoch": 0.02, + "learning_rate": 1.9984097614278938e-05, + "loss": 0.6887, + "step": 528 + }, + { + "epoch": 0.02, + "learning_rate": 1.9984036172197738e-05, + "loss": 0.6854, + "step": 529 + }, + { + "epoch": 0.02, + "learning_rate": 1.998397461174316e-05, + "loss": 0.6233, + "step": 530 + }, + { + "epoch": 0.02, + "learning_rate": 1.998391293291593e-05, + "loss": 0.6501, + "step": 531 + }, + { + "epoch": 0.02, + "learning_rate": 1.998385113571679e-05, + "loss": 0.6383, + "step": 532 + }, + { + "epoch": 0.02, + "learning_rate": 1.9983789220146458e-05, + "loss": 0.6274, + "step": 533 + }, + { + "epoch": 0.02, + "learning_rate": 1.9983727186205676e-05, + "loss": 0.6285, + "step": 534 + }, + { + "epoch": 0.02, + "learning_rate": 1.998366503389518e-05, + "loss": 0.7192, + "step": 535 + }, + { + "epoch": 0.02, + "learning_rate": 1.9983602763215705e-05, + "loss": 0.6715, + "step": 536 + }, + { + "epoch": 0.02, + "learning_rate": 1.998354037416799e-05, + "loss": 0.6664, + "step": 537 + }, + { + "epoch": 0.02, + "learning_rate": 1.9983477866752775e-05, + "loss": 0.6312, + "step": 538 + }, + { + "epoch": 0.02, + "learning_rate": 1.99834152409708e-05, + "loss": 0.6394, + "step": 539 + }, + { + "epoch": 0.02, + "learning_rate": 1.998335249682281e-05, + "loss": 0.6965, + "step": 540 + }, + { + "epoch": 0.02, + "learning_rate": 1.9983289634309546e-05, + "loss": 0.6828, + "step": 541 + }, + { + "epoch": 0.02, + "learning_rate": 1.9983226653431753e-05, + "loss": 0.6856, + "step": 542 + }, + { + "epoch": 0.02, + "learning_rate": 1.9983163554190182e-05, + "loss": 0.6557, + "step": 543 + }, + { + "epoch": 0.02, + "learning_rate": 1.9983100336585576e-05, + "loss": 0.6143, + "step": 544 + }, + { + "epoch": 0.02, + "learning_rate": 1.998303700061869e-05, + "loss": 0.6438, + "step": 545 + }, + { + "epoch": 0.02, + "learning_rate": 1.998297354629027e-05, + "loss": 0.6269, + "step": 546 + }, + { + "epoch": 0.02, + "learning_rate": 1.998290997360107e-05, + "loss": 0.6387, + "step": 547 + }, + { + "epoch": 0.02, + "learning_rate": 1.998284628255184e-05, + "loss": 0.6978, + "step": 548 + }, + { + "epoch": 0.02, + "learning_rate": 1.9982782473143343e-05, + "loss": 0.7045, + "step": 549 + }, + { + "epoch": 0.02, + "learning_rate": 1.9982718545376332e-05, + "loss": 0.6099, + "step": 550 + }, + { + "epoch": 0.02, + "learning_rate": 1.9982654499251565e-05, + "loss": 0.6118, + "step": 551 + }, + { + "epoch": 0.02, + "learning_rate": 1.9982590334769796e-05, + "loss": 0.687, + "step": 552 + }, + { + "epoch": 0.02, + "learning_rate": 1.9982526051931795e-05, + "loss": 0.6417, + "step": 553 + }, + { + "epoch": 0.02, + "learning_rate": 1.9982461650738317e-05, + "loss": 0.6631, + "step": 554 + }, + { + "epoch": 0.02, + "learning_rate": 1.998239713119013e-05, + "loss": 0.6352, + "step": 555 + }, + { + "epoch": 0.02, + "learning_rate": 1.9982332493287998e-05, + "loss": 0.6242, + "step": 556 + }, + { + "epoch": 0.02, + "learning_rate": 1.9982267737032685e-05, + "loss": 0.6579, + "step": 557 + }, + { + "epoch": 0.02, + "learning_rate": 1.998220286242496e-05, + "loss": 0.6848, + "step": 558 + }, + { + "epoch": 0.02, + "learning_rate": 1.9982137869465596e-05, + "loss": 0.6569, + "step": 559 + }, + { + "epoch": 0.02, + "learning_rate": 1.9982072758155352e-05, + "loss": 0.6796, + "step": 560 + }, + { + "epoch": 0.02, + "learning_rate": 1.9982007528495015e-05, + "loss": 0.6234, + "step": 561 + }, + { + "epoch": 0.02, + "learning_rate": 1.998194218048535e-05, + "loss": 0.6612, + "step": 562 + }, + { + "epoch": 0.02, + "learning_rate": 1.9981876714127132e-05, + "loss": 0.6573, + "step": 563 + }, + { + "epoch": 0.02, + "learning_rate": 1.998181112942114e-05, + "loss": 0.6689, + "step": 564 + }, + { + "epoch": 0.02, + "learning_rate": 1.9981745426368147e-05, + "loss": 0.6617, + "step": 565 + }, + { + "epoch": 0.02, + "learning_rate": 1.998167960496894e-05, + "loss": 0.6799, + "step": 566 + }, + { + "epoch": 0.02, + "learning_rate": 1.9981613665224292e-05, + "loss": 0.6492, + "step": 567 + }, + { + "epoch": 0.02, + "learning_rate": 1.9981547607134985e-05, + "loss": 0.6006, + "step": 568 + }, + { + "epoch": 0.02, + "learning_rate": 1.9981481430701806e-05, + "loss": 0.7015, + "step": 569 + }, + { + "epoch": 0.02, + "learning_rate": 1.998141513592554e-05, + "loss": 0.6743, + "step": 570 + }, + { + "epoch": 0.02, + "learning_rate": 1.998134872280697e-05, + "loss": 0.6573, + "step": 571 + }, + { + "epoch": 0.02, + "learning_rate": 1.9981282191346886e-05, + "loss": 0.6176, + "step": 572 + }, + { + "epoch": 0.02, + "learning_rate": 1.9981215541546072e-05, + "loss": 0.6557, + "step": 573 + }, + { + "epoch": 0.02, + "learning_rate": 1.9981148773405322e-05, + "loss": 0.7244, + "step": 574 + }, + { + "epoch": 0.02, + "learning_rate": 1.998108188692543e-05, + "loss": 0.6493, + "step": 575 + }, + { + "epoch": 0.02, + "learning_rate": 1.998101488210718e-05, + "loss": 0.6381, + "step": 576 + }, + { + "epoch": 0.02, + "learning_rate": 1.9980947758951376e-05, + "loss": 0.6693, + "step": 577 + }, + { + "epoch": 0.02, + "learning_rate": 1.9980880517458813e-05, + "loss": 0.6679, + "step": 578 + }, + { + "epoch": 0.02, + "learning_rate": 1.9980813157630283e-05, + "loss": 0.6581, + "step": 579 + }, + { + "epoch": 0.02, + "learning_rate": 1.9980745679466587e-05, + "loss": 0.7063, + "step": 580 + }, + { + "epoch": 0.02, + "learning_rate": 1.9980678082968527e-05, + "loss": 0.7262, + "step": 581 + }, + { + "epoch": 0.02, + "learning_rate": 1.9980610368136898e-05, + "loss": 0.7239, + "step": 582 + }, + { + "epoch": 0.02, + "learning_rate": 1.9980542534972512e-05, + "loss": 0.6892, + "step": 583 + }, + { + "epoch": 0.02, + "learning_rate": 1.9980474583476167e-05, + "loss": 0.6459, + "step": 584 + }, + { + "epoch": 0.02, + "learning_rate": 1.9980406513648673e-05, + "loss": 0.6314, + "step": 585 + }, + { + "epoch": 0.02, + "learning_rate": 1.998033832549083e-05, + "loss": 0.6919, + "step": 586 + }, + { + "epoch": 0.02, + "learning_rate": 1.9980270019003452e-05, + "loss": 0.6956, + "step": 587 + }, + { + "epoch": 0.02, + "learning_rate": 1.9980201594187353e-05, + "loss": 0.6729, + "step": 588 + }, + { + "epoch": 0.02, + "learning_rate": 1.9980133051043336e-05, + "loss": 0.6526, + "step": 589 + }, + { + "epoch": 0.02, + "learning_rate": 1.9980064389572215e-05, + "loss": 0.6537, + "step": 590 + }, + { + "epoch": 0.02, + "learning_rate": 1.997999560977481e-05, + "loss": 0.7245, + "step": 591 + }, + { + "epoch": 0.02, + "learning_rate": 1.9979926711651928e-05, + "loss": 0.6586, + "step": 592 + }, + { + "epoch": 0.02, + "learning_rate": 1.997985769520439e-05, + "loss": 0.6778, + "step": 593 + }, + { + "epoch": 0.02, + "learning_rate": 1.9979788560433016e-05, + "loss": 0.6635, + "step": 594 + }, + { + "epoch": 0.02, + "learning_rate": 1.9979719307338624e-05, + "loss": 0.6056, + "step": 595 + }, + { + "epoch": 0.02, + "learning_rate": 1.9979649935922033e-05, + "loss": 0.6642, + "step": 596 + }, + { + "epoch": 0.02, + "learning_rate": 1.997958044618407e-05, + "loss": 0.6176, + "step": 597 + }, + { + "epoch": 0.02, + "learning_rate": 1.9979510838125557e-05, + "loss": 0.6504, + "step": 598 + }, + { + "epoch": 0.02, + "learning_rate": 1.997944111174732e-05, + "loss": 0.6681, + "step": 599 + }, + { + "epoch": 0.02, + "learning_rate": 1.9979371267050184e-05, + "loss": 0.668, + "step": 600 + }, + { + "epoch": 0.02, + "learning_rate": 1.9979301304034978e-05, + "loss": 0.6805, + "step": 601 + }, + { + "epoch": 0.02, + "learning_rate": 1.9979231222702527e-05, + "loss": 0.5749, + "step": 602 + }, + { + "epoch": 0.02, + "learning_rate": 1.997916102305367e-05, + "loss": 0.6246, + "step": 603 + }, + { + "epoch": 0.02, + "learning_rate": 1.9979090705089232e-05, + "loss": 0.6548, + "step": 604 + }, + { + "epoch": 0.02, + "learning_rate": 1.9979020268810054e-05, + "loss": 0.6684, + "step": 605 + }, + { + "epoch": 0.02, + "learning_rate": 1.9978949714216965e-05, + "loss": 0.6862, + "step": 606 + }, + { + "epoch": 0.02, + "learning_rate": 1.9978879041310805e-05, + "loss": 0.6373, + "step": 607 + }, + { + "epoch": 0.02, + "learning_rate": 1.9978808250092408e-05, + "loss": 0.6562, + "step": 608 + }, + { + "epoch": 0.02, + "learning_rate": 1.997873734056262e-05, + "loss": 0.6862, + "step": 609 + }, + { + "epoch": 0.02, + "learning_rate": 1.9978666312722273e-05, + "loss": 0.6813, + "step": 610 + }, + { + "epoch": 0.02, + "learning_rate": 1.9978595166572216e-05, + "loss": 0.6866, + "step": 611 + }, + { + "epoch": 0.02, + "learning_rate": 1.9978523902113292e-05, + "loss": 0.6897, + "step": 612 + }, + { + "epoch": 0.02, + "learning_rate": 1.9978452519346343e-05, + "loss": 0.6791, + "step": 613 + }, + { + "epoch": 0.02, + "learning_rate": 1.9978381018272218e-05, + "loss": 0.6791, + "step": 614 + }, + { + "epoch": 0.02, + "learning_rate": 1.9978309398891758e-05, + "loss": 0.596, + "step": 615 + }, + { + "epoch": 0.02, + "learning_rate": 1.997823766120582e-05, + "loss": 0.7414, + "step": 616 + }, + { + "epoch": 0.02, + "learning_rate": 1.9978165805215255e-05, + "loss": 0.6518, + "step": 617 + }, + { + "epoch": 0.02, + "learning_rate": 1.9978093830920912e-05, + "loss": 0.7035, + "step": 618 + }, + { + "epoch": 0.02, + "learning_rate": 1.997802173832364e-05, + "loss": 0.687, + "step": 619 + }, + { + "epoch": 0.02, + "learning_rate": 1.99779495274243e-05, + "loss": 0.6969, + "step": 620 + }, + { + "epoch": 0.02, + "learning_rate": 1.9977877198223746e-05, + "loss": 0.6914, + "step": 621 + }, + { + "epoch": 0.02, + "learning_rate": 1.997780475072284e-05, + "loss": 0.6692, + "step": 622 + }, + { + "epoch": 0.02, + "learning_rate": 1.997773218492243e-05, + "loss": 0.6312, + "step": 623 + }, + { + "epoch": 0.02, + "learning_rate": 1.9977659500823387e-05, + "loss": 0.6515, + "step": 624 + }, + { + "epoch": 0.02, + "learning_rate": 1.9977586698426568e-05, + "loss": 0.6731, + "step": 625 + }, + { + "epoch": 0.02, + "learning_rate": 1.9977513777732837e-05, + "loss": 0.6746, + "step": 626 + }, + { + "epoch": 0.02, + "learning_rate": 1.9977440738743057e-05, + "loss": 0.666, + "step": 627 + }, + { + "epoch": 0.02, + "learning_rate": 1.9977367581458095e-05, + "loss": 0.6846, + "step": 628 + }, + { + "epoch": 0.02, + "learning_rate": 1.9977294305878823e-05, + "loss": 0.6311, + "step": 629 + }, + { + "epoch": 0.02, + "learning_rate": 1.9977220912006104e-05, + "loss": 0.7214, + "step": 630 + }, + { + "epoch": 0.02, + "learning_rate": 1.997714739984081e-05, + "loss": 0.6589, + "step": 631 + }, + { + "epoch": 0.02, + "learning_rate": 1.997707376938381e-05, + "loss": 0.6794, + "step": 632 + }, + { + "epoch": 0.02, + "learning_rate": 1.9977000020635978e-05, + "loss": 0.6651, + "step": 633 + }, + { + "epoch": 0.02, + "learning_rate": 1.9976926153598196e-05, + "loss": 0.6242, + "step": 634 + }, + { + "epoch": 0.02, + "learning_rate": 1.997685216827133e-05, + "loss": 0.636, + "step": 635 + }, + { + "epoch": 0.02, + "learning_rate": 1.997677806465626e-05, + "loss": 0.6702, + "step": 636 + }, + { + "epoch": 0.02, + "learning_rate": 1.9976703842753865e-05, + "loss": 0.7023, + "step": 637 + }, + { + "epoch": 0.02, + "learning_rate": 1.997662950256503e-05, + "loss": 0.7261, + "step": 638 + }, + { + "epoch": 0.02, + "learning_rate": 1.9976555044090628e-05, + "loss": 0.6894, + "step": 639 + }, + { + "epoch": 0.02, + "learning_rate": 1.9976480467331546e-05, + "loss": 0.6068, + "step": 640 + }, + { + "epoch": 0.02, + "learning_rate": 1.9976405772288667e-05, + "loss": 0.6743, + "step": 641 + }, + { + "epoch": 0.02, + "learning_rate": 1.997633095896288e-05, + "loss": 0.6967, + "step": 642 + }, + { + "epoch": 0.02, + "learning_rate": 1.9976256027355068e-05, + "loss": 0.6662, + "step": 643 + }, + { + "epoch": 0.02, + "learning_rate": 1.997618097746612e-05, + "loss": 0.6928, + "step": 644 + }, + { + "epoch": 0.02, + "learning_rate": 1.9976105809296925e-05, + "loss": 0.7312, + "step": 645 + }, + { + "epoch": 0.02, + "learning_rate": 1.9976030522848378e-05, + "loss": 0.6117, + "step": 646 + }, + { + "epoch": 0.02, + "learning_rate": 1.9975955118121367e-05, + "loss": 0.661, + "step": 647 + }, + { + "epoch": 0.02, + "learning_rate": 1.9975879595116793e-05, + "loss": 0.6827, + "step": 648 + }, + { + "epoch": 0.02, + "learning_rate": 1.9975803953835543e-05, + "loss": 0.6607, + "step": 649 + }, + { + "epoch": 0.02, + "learning_rate": 1.997572819427852e-05, + "loss": 0.6394, + "step": 650 + }, + { + "epoch": 0.02, + "learning_rate": 1.9975652316446618e-05, + "loss": 0.6767, + "step": 651 + }, + { + "epoch": 0.02, + "learning_rate": 1.9975576320340742e-05, + "loss": 0.6378, + "step": 652 + }, + { + "epoch": 0.02, + "learning_rate": 1.9975500205961786e-05, + "loss": 0.6641, + "step": 653 + }, + { + "epoch": 0.02, + "learning_rate": 1.9975423973310657e-05, + "loss": 0.634, + "step": 654 + }, + { + "epoch": 0.02, + "learning_rate": 1.9975347622388256e-05, + "loss": 0.6461, + "step": 655 + }, + { + "epoch": 0.02, + "learning_rate": 1.9975271153195496e-05, + "loss": 0.6987, + "step": 656 + }, + { + "epoch": 0.02, + "learning_rate": 1.997519456573327e-05, + "loss": 0.629, + "step": 657 + }, + { + "epoch": 0.02, + "learning_rate": 1.9975117860002497e-05, + "loss": 0.6563, + "step": 658 + }, + { + "epoch": 0.02, + "learning_rate": 1.9975041036004087e-05, + "loss": 0.6754, + "step": 659 + }, + { + "epoch": 0.02, + "learning_rate": 1.997496409373894e-05, + "loss": 0.583, + "step": 660 + }, + { + "epoch": 0.02, + "learning_rate": 1.997488703320798e-05, + "loss": 0.6448, + "step": 661 + }, + { + "epoch": 0.02, + "learning_rate": 1.9974809854412114e-05, + "loss": 0.6472, + "step": 662 + }, + { + "epoch": 0.02, + "learning_rate": 1.9974732557352258e-05, + "loss": 0.6221, + "step": 663 + }, + { + "epoch": 0.02, + "learning_rate": 1.9974655142029333e-05, + "loss": 0.6354, + "step": 664 + }, + { + "epoch": 0.02, + "learning_rate": 1.997457760844425e-05, + "loss": 0.6744, + "step": 665 + }, + { + "epoch": 0.02, + "learning_rate": 1.9974499956597933e-05, + "loss": 0.6218, + "step": 666 + }, + { + "epoch": 0.02, + "learning_rate": 1.99744221864913e-05, + "loss": 0.6858, + "step": 667 + }, + { + "epoch": 0.02, + "learning_rate": 1.9974344298125277e-05, + "loss": 0.7109, + "step": 668 + }, + { + "epoch": 0.02, + "learning_rate": 1.9974266291500785e-05, + "loss": 0.6245, + "step": 669 + }, + { + "epoch": 0.02, + "learning_rate": 1.9974188166618743e-05, + "loss": 0.7175, + "step": 670 + }, + { + "epoch": 0.02, + "learning_rate": 1.997410992348009e-05, + "loss": 0.6277, + "step": 671 + }, + { + "epoch": 0.02, + "learning_rate": 1.997403156208574e-05, + "loss": 0.6664, + "step": 672 + }, + { + "epoch": 0.02, + "learning_rate": 1.9973953082436635e-05, + "loss": 0.5916, + "step": 673 + }, + { + "epoch": 0.02, + "learning_rate": 1.9973874484533696e-05, + "loss": 0.6305, + "step": 674 + }, + { + "epoch": 0.02, + "learning_rate": 1.997379576837786e-05, + "loss": 0.7272, + "step": 675 + }, + { + "epoch": 0.02, + "learning_rate": 1.9973716933970053e-05, + "loss": 0.6461, + "step": 676 + }, + { + "epoch": 0.02, + "learning_rate": 1.997363798131122e-05, + "loss": 0.659, + "step": 677 + }, + { + "epoch": 0.02, + "learning_rate": 1.9973558910402287e-05, + "loss": 0.6459, + "step": 678 + }, + { + "epoch": 0.02, + "learning_rate": 1.99734797212442e-05, + "loss": 0.6481, + "step": 679 + }, + { + "epoch": 0.02, + "learning_rate": 1.9973400413837893e-05, + "loss": 0.6818, + "step": 680 + }, + { + "epoch": 0.02, + "learning_rate": 1.9973320988184312e-05, + "loss": 0.6896, + "step": 681 + }, + { + "epoch": 0.02, + "learning_rate": 1.997324144428439e-05, + "loss": 0.705, + "step": 682 + }, + { + "epoch": 0.02, + "learning_rate": 1.9973161782139074e-05, + "loss": 0.6069, + "step": 683 + }, + { + "epoch": 0.02, + "learning_rate": 1.997308200174931e-05, + "loss": 0.649, + "step": 684 + }, + { + "epoch": 0.02, + "learning_rate": 1.9973002103116045e-05, + "loss": 0.6244, + "step": 685 + }, + { + "epoch": 0.02, + "learning_rate": 1.997292208624022e-05, + "loss": 0.6134, + "step": 686 + }, + { + "epoch": 0.02, + "learning_rate": 1.997284195112279e-05, + "loss": 0.6361, + "step": 687 + }, + { + "epoch": 0.02, + "learning_rate": 1.9972761697764708e-05, + "loss": 0.6589, + "step": 688 + }, + { + "epoch": 0.02, + "learning_rate": 1.9972681326166913e-05, + "loss": 0.6722, + "step": 689 + }, + { + "epoch": 0.02, + "learning_rate": 1.997260083633037e-05, + "loss": 0.6137, + "step": 690 + }, + { + "epoch": 0.02, + "learning_rate": 1.9972520228256023e-05, + "loss": 0.655, + "step": 691 + }, + { + "epoch": 0.02, + "learning_rate": 1.997243950194484e-05, + "loss": 0.6788, + "step": 692 + }, + { + "epoch": 0.02, + "learning_rate": 1.9972358657397768e-05, + "loss": 0.6674, + "step": 693 + }, + { + "epoch": 0.02, + "learning_rate": 1.997227769461577e-05, + "loss": 0.6437, + "step": 694 + }, + { + "epoch": 0.02, + "learning_rate": 1.9972196613599802e-05, + "loss": 0.6946, + "step": 695 + }, + { + "epoch": 0.02, + "learning_rate": 1.997211541435083e-05, + "loss": 0.6197, + "step": 696 + }, + { + "epoch": 0.02, + "learning_rate": 1.9972034096869816e-05, + "loss": 0.6597, + "step": 697 + }, + { + "epoch": 0.02, + "learning_rate": 1.9971952661157727e-05, + "loss": 0.6862, + "step": 698 + }, + { + "epoch": 0.02, + "learning_rate": 1.9971871107215518e-05, + "loss": 0.6711, + "step": 699 + }, + { + "epoch": 0.02, + "learning_rate": 1.9971789435044166e-05, + "loss": 0.6499, + "step": 700 + }, + { + "epoch": 0.02, + "learning_rate": 1.9971707644644636e-05, + "loss": 0.667, + "step": 701 + }, + { + "epoch": 0.02, + "learning_rate": 1.9971625736017894e-05, + "loss": 0.6668, + "step": 702 + }, + { + "epoch": 0.02, + "learning_rate": 1.997154370916492e-05, + "loss": 0.6213, + "step": 703 + }, + { + "epoch": 0.02, + "learning_rate": 1.9971461564086677e-05, + "loss": 0.7301, + "step": 704 + }, + { + "epoch": 0.02, + "learning_rate": 1.9971379300784143e-05, + "loss": 0.6449, + "step": 705 + }, + { + "epoch": 0.02, + "learning_rate": 1.9971296919258297e-05, + "loss": 0.673, + "step": 706 + }, + { + "epoch": 0.02, + "learning_rate": 1.997121441951011e-05, + "loss": 0.6323, + "step": 707 + }, + { + "epoch": 0.02, + "learning_rate": 1.9971131801540563e-05, + "loss": 0.7592, + "step": 708 + }, + { + "epoch": 0.02, + "learning_rate": 1.9971049065350635e-05, + "loss": 0.6485, + "step": 709 + }, + { + "epoch": 0.02, + "learning_rate": 1.9970966210941303e-05, + "loss": 0.664, + "step": 710 + }, + { + "epoch": 0.02, + "learning_rate": 1.997088323831356e-05, + "loss": 0.6895, + "step": 711 + }, + { + "epoch": 0.02, + "learning_rate": 1.997080014746838e-05, + "loss": 0.6652, + "step": 712 + }, + { + "epoch": 0.02, + "learning_rate": 1.997071693840675e-05, + "loss": 0.666, + "step": 713 + }, + { + "epoch": 0.02, + "learning_rate": 1.997063361112966e-05, + "loss": 0.6135, + "step": 714 + }, + { + "epoch": 0.02, + "learning_rate": 1.9970550165638094e-05, + "loss": 0.6552, + "step": 715 + }, + { + "epoch": 0.02, + "learning_rate": 1.9970466601933042e-05, + "loss": 0.7183, + "step": 716 + }, + { + "epoch": 0.02, + "learning_rate": 1.99703829200155e-05, + "loss": 0.6539, + "step": 717 + }, + { + "epoch": 0.02, + "learning_rate": 1.9970299119886453e-05, + "loss": 0.6946, + "step": 718 + }, + { + "epoch": 0.02, + "learning_rate": 1.9970215201546897e-05, + "loss": 0.6823, + "step": 719 + }, + { + "epoch": 0.02, + "learning_rate": 1.997013116499783e-05, + "loss": 0.6968, + "step": 720 + }, + { + "epoch": 0.02, + "learning_rate": 1.9970047010240237e-05, + "loss": 0.6087, + "step": 721 + }, + { + "epoch": 0.03, + "learning_rate": 1.9969962737275136e-05, + "loss": 0.6283, + "step": 722 + }, + { + "epoch": 0.03, + "learning_rate": 1.996987834610351e-05, + "loss": 0.6209, + "step": 723 + }, + { + "epoch": 0.03, + "learning_rate": 1.996979383672636e-05, + "loss": 0.6954, + "step": 724 + }, + { + "epoch": 0.03, + "learning_rate": 1.9969709209144697e-05, + "loss": 0.6573, + "step": 725 + }, + { + "epoch": 0.03, + "learning_rate": 1.996962446335952e-05, + "loss": 0.6562, + "step": 726 + }, + { + "epoch": 0.03, + "learning_rate": 1.9969539599371832e-05, + "loss": 0.6646, + "step": 727 + }, + { + "epoch": 0.03, + "learning_rate": 1.996945461718264e-05, + "loss": 0.7025, + "step": 728 + }, + { + "epoch": 0.03, + "learning_rate": 1.9969369516792952e-05, + "loss": 0.652, + "step": 729 + }, + { + "epoch": 0.03, + "learning_rate": 1.996928429820378e-05, + "loss": 0.6749, + "step": 730 + }, + { + "epoch": 0.03, + "learning_rate": 1.9969198961416127e-05, + "loss": 0.6288, + "step": 731 + }, + { + "epoch": 0.03, + "learning_rate": 1.996911350643101e-05, + "loss": 0.6815, + "step": 732 + }, + { + "epoch": 0.03, + "learning_rate": 1.9969027933249445e-05, + "loss": 0.6958, + "step": 733 + }, + { + "epoch": 0.03, + "learning_rate": 1.9968942241872443e-05, + "loss": 0.6204, + "step": 734 + }, + { + "epoch": 0.03, + "learning_rate": 1.9968856432301016e-05, + "loss": 0.7274, + "step": 735 + }, + { + "epoch": 0.03, + "learning_rate": 1.9968770504536187e-05, + "loss": 0.6811, + "step": 736 + }, + { + "epoch": 0.03, + "learning_rate": 1.9968684458578973e-05, + "loss": 0.6852, + "step": 737 + }, + { + "epoch": 0.03, + "learning_rate": 1.9968598294430396e-05, + "loss": 0.6714, + "step": 738 + }, + { + "epoch": 0.03, + "learning_rate": 1.9968512012091473e-05, + "loss": 0.6398, + "step": 739 + }, + { + "epoch": 0.03, + "learning_rate": 1.996842561156323e-05, + "loss": 0.675, + "step": 740 + }, + { + "epoch": 0.03, + "learning_rate": 1.9968339092846693e-05, + "loss": 0.6102, + "step": 741 + }, + { + "epoch": 0.03, + "learning_rate": 1.9968252455942886e-05, + "loss": 0.6682, + "step": 742 + }, + { + "epoch": 0.03, + "learning_rate": 1.9968165700852835e-05, + "loss": 0.675, + "step": 743 + }, + { + "epoch": 0.03, + "learning_rate": 1.9968078827577572e-05, + "loss": 0.6789, + "step": 744 + }, + { + "epoch": 0.03, + "learning_rate": 1.9967991836118123e-05, + "loss": 0.6685, + "step": 745 + }, + { + "epoch": 0.03, + "learning_rate": 1.9967904726475524e-05, + "loss": 0.6302, + "step": 746 + }, + { + "epoch": 0.03, + "learning_rate": 1.99678174986508e-05, + "loss": 0.6546, + "step": 747 + }, + { + "epoch": 0.03, + "learning_rate": 1.9967730152644994e-05, + "loss": 0.6236, + "step": 748 + }, + { + "epoch": 0.03, + "learning_rate": 1.9967642688459133e-05, + "loss": 0.7276, + "step": 749 + }, + { + "epoch": 0.03, + "learning_rate": 1.9967555106094263e-05, + "loss": 0.6164, + "step": 750 + }, + { + "epoch": 0.03, + "learning_rate": 1.9967467405551418e-05, + "loss": 0.6692, + "step": 751 + }, + { + "epoch": 0.03, + "learning_rate": 1.996737958683164e-05, + "loss": 0.6237, + "step": 752 + }, + { + "epoch": 0.03, + "learning_rate": 1.9967291649935966e-05, + "loss": 0.7058, + "step": 753 + }, + { + "epoch": 0.03, + "learning_rate": 1.9967203594865437e-05, + "loss": 0.6501, + "step": 754 + }, + { + "epoch": 0.03, + "learning_rate": 1.9967115421621107e-05, + "loss": 0.6314, + "step": 755 + }, + { + "epoch": 0.03, + "learning_rate": 1.996702713020401e-05, + "loss": 0.6275, + "step": 756 + }, + { + "epoch": 0.03, + "learning_rate": 1.9966938720615202e-05, + "loss": 0.6657, + "step": 757 + }, + { + "epoch": 0.03, + "learning_rate": 1.9966850192855728e-05, + "loss": 0.6485, + "step": 758 + }, + { + "epoch": 0.03, + "learning_rate": 1.9966761546926633e-05, + "loss": 0.6413, + "step": 759 + }, + { + "epoch": 0.03, + "learning_rate": 1.9966672782828975e-05, + "loss": 0.6994, + "step": 760 + }, + { + "epoch": 0.03, + "learning_rate": 1.99665839005638e-05, + "loss": 0.571, + "step": 761 + }, + { + "epoch": 0.03, + "learning_rate": 1.9966494900132165e-05, + "loss": 0.6537, + "step": 762 + }, + { + "epoch": 0.03, + "learning_rate": 1.996640578153513e-05, + "loss": 0.6617, + "step": 763 + }, + { + "epoch": 0.03, + "learning_rate": 1.9966316544773742e-05, + "loss": 0.697, + "step": 764 + }, + { + "epoch": 0.03, + "learning_rate": 1.9966227189849068e-05, + "loss": 0.6728, + "step": 765 + }, + { + "epoch": 0.03, + "learning_rate": 1.996613771676216e-05, + "loss": 0.6724, + "step": 766 + }, + { + "epoch": 0.03, + "learning_rate": 1.996604812551408e-05, + "loss": 0.6865, + "step": 767 + }, + { + "epoch": 0.03, + "learning_rate": 1.99659584161059e-05, + "loss": 0.6182, + "step": 768 + }, + { + "epoch": 0.03, + "learning_rate": 1.9965868588538672e-05, + "loss": 0.664, + "step": 769 + }, + { + "epoch": 0.03, + "learning_rate": 1.9965778642813464e-05, + "loss": 0.6478, + "step": 770 + }, + { + "epoch": 0.03, + "learning_rate": 1.9965688578931344e-05, + "loss": 0.6195, + "step": 771 + }, + { + "epoch": 0.03, + "learning_rate": 1.9965598396893376e-05, + "loss": 0.62, + "step": 772 + }, + { + "epoch": 0.03, + "learning_rate": 1.9965508096700638e-05, + "loss": 0.6355, + "step": 773 + }, + { + "epoch": 0.03, + "learning_rate": 1.9965417678354193e-05, + "loss": 0.6178, + "step": 774 + }, + { + "epoch": 0.03, + "learning_rate": 1.9965327141855116e-05, + "loss": 0.6532, + "step": 775 + }, + { + "epoch": 0.03, + "learning_rate": 1.9965236487204476e-05, + "loss": 0.6551, + "step": 776 + }, + { + "epoch": 0.03, + "learning_rate": 1.9965145714403355e-05, + "loss": 0.5818, + "step": 777 + }, + { + "epoch": 0.03, + "learning_rate": 1.9965054823452824e-05, + "loss": 0.7093, + "step": 778 + }, + { + "epoch": 0.03, + "learning_rate": 1.9964963814353964e-05, + "loss": 0.5974, + "step": 779 + }, + { + "epoch": 0.03, + "learning_rate": 1.996487268710785e-05, + "loss": 0.678, + "step": 780 + }, + { + "epoch": 0.03, + "learning_rate": 1.9964781441715563e-05, + "loss": 0.6419, + "step": 781 + }, + { + "epoch": 0.03, + "learning_rate": 1.996469007817819e-05, + "loss": 0.6929, + "step": 782 + }, + { + "epoch": 0.03, + "learning_rate": 1.996459859649681e-05, + "loss": 0.6679, + "step": 783 + }, + { + "epoch": 0.03, + "learning_rate": 1.9964506996672506e-05, + "loss": 0.6728, + "step": 784 + }, + { + "epoch": 0.03, + "learning_rate": 1.996441527870637e-05, + "loss": 0.6373, + "step": 785 + }, + { + "epoch": 0.03, + "learning_rate": 1.9964323442599486e-05, + "loss": 0.6557, + "step": 786 + }, + { + "epoch": 0.03, + "learning_rate": 1.9964231488352942e-05, + "loss": 0.6519, + "step": 787 + }, + { + "epoch": 0.03, + "learning_rate": 1.9964139415967825e-05, + "loss": 0.6264, + "step": 788 + }, + { + "epoch": 0.03, + "learning_rate": 1.9964047225445235e-05, + "loss": 0.6571, + "step": 789 + }, + { + "epoch": 0.03, + "learning_rate": 1.9963954916786258e-05, + "loss": 0.7012, + "step": 790 + }, + { + "epoch": 0.03, + "learning_rate": 1.9963862489991992e-05, + "loss": 0.7036, + "step": 791 + }, + { + "epoch": 0.03, + "learning_rate": 1.996376994506353e-05, + "loss": 0.6963, + "step": 792 + }, + { + "epoch": 0.03, + "learning_rate": 1.9963677282001975e-05, + "loss": 0.6553, + "step": 793 + }, + { + "epoch": 0.03, + "learning_rate": 1.996358450080842e-05, + "loss": 0.7194, + "step": 794 + }, + { + "epoch": 0.03, + "learning_rate": 1.9963491601483966e-05, + "loss": 0.6633, + "step": 795 + }, + { + "epoch": 0.03, + "learning_rate": 1.9963398584029712e-05, + "loss": 0.6564, + "step": 796 + }, + { + "epoch": 0.03, + "learning_rate": 1.996330544844677e-05, + "loss": 0.7003, + "step": 797 + }, + { + "epoch": 0.03, + "learning_rate": 1.9963212194736237e-05, + "loss": 0.6697, + "step": 798 + }, + { + "epoch": 0.03, + "learning_rate": 1.9963118822899218e-05, + "loss": 0.6766, + "step": 799 + }, + { + "epoch": 0.03, + "learning_rate": 1.9963025332936824e-05, + "loss": 0.7033, + "step": 800 + }, + { + "epoch": 0.03, + "learning_rate": 1.996293172485016e-05, + "loss": 0.6664, + "step": 801 + }, + { + "epoch": 0.03, + "learning_rate": 1.9962837998640335e-05, + "loss": 0.6186, + "step": 802 + }, + { + "epoch": 0.03, + "learning_rate": 1.9962744154308466e-05, + "loss": 0.6845, + "step": 803 + }, + { + "epoch": 0.03, + "learning_rate": 1.996265019185566e-05, + "loss": 0.6507, + "step": 804 + }, + { + "epoch": 0.03, + "learning_rate": 1.9962556111283033e-05, + "loss": 0.6528, + "step": 805 + }, + { + "epoch": 0.03, + "learning_rate": 1.9962461912591702e-05, + "loss": 0.6812, + "step": 806 + }, + { + "epoch": 0.03, + "learning_rate": 1.9962367595782782e-05, + "loss": 0.6321, + "step": 807 + }, + { + "epoch": 0.03, + "learning_rate": 1.9962273160857394e-05, + "loss": 0.5897, + "step": 808 + }, + { + "epoch": 0.03, + "learning_rate": 1.996217860781665e-05, + "loss": 0.6878, + "step": 809 + }, + { + "epoch": 0.03, + "learning_rate": 1.996208393666168e-05, + "loss": 0.6513, + "step": 810 + }, + { + "epoch": 0.03, + "learning_rate": 1.9961989147393602e-05, + "loss": 0.6111, + "step": 811 + }, + { + "epoch": 0.03, + "learning_rate": 1.996189424001354e-05, + "loss": 0.6622, + "step": 812 + }, + { + "epoch": 0.03, + "learning_rate": 1.9961799214522624e-05, + "loss": 0.6152, + "step": 813 + }, + { + "epoch": 0.03, + "learning_rate": 1.9961704070921974e-05, + "loss": 0.6572, + "step": 814 + }, + { + "epoch": 0.03, + "learning_rate": 1.9961608809212717e-05, + "loss": 0.7035, + "step": 815 + }, + { + "epoch": 0.03, + "learning_rate": 1.9961513429395988e-05, + "loss": 0.6253, + "step": 816 + }, + { + "epoch": 0.03, + "learning_rate": 1.9961417931472918e-05, + "loss": 0.6329, + "step": 817 + }, + { + "epoch": 0.03, + "learning_rate": 1.9961322315444636e-05, + "loss": 0.6807, + "step": 818 + }, + { + "epoch": 0.03, + "learning_rate": 1.9961226581312277e-05, + "loss": 0.6351, + "step": 819 + }, + { + "epoch": 0.03, + "learning_rate": 1.9961130729076975e-05, + "loss": 0.6808, + "step": 820 + }, + { + "epoch": 0.03, + "learning_rate": 1.9961034758739866e-05, + "loss": 0.6376, + "step": 821 + }, + { + "epoch": 0.03, + "learning_rate": 1.9960938670302096e-05, + "loss": 0.6665, + "step": 822 + }, + { + "epoch": 0.03, + "learning_rate": 1.996084246376479e-05, + "loss": 0.7131, + "step": 823 + }, + { + "epoch": 0.03, + "learning_rate": 1.99607461391291e-05, + "loss": 0.6868, + "step": 824 + }, + { + "epoch": 0.03, + "learning_rate": 1.9960649696396165e-05, + "loss": 0.6807, + "step": 825 + }, + { + "epoch": 0.03, + "learning_rate": 1.9960553135567123e-05, + "loss": 0.7006, + "step": 826 + }, + { + "epoch": 0.03, + "learning_rate": 1.9960456456643125e-05, + "loss": 0.6536, + "step": 827 + }, + { + "epoch": 0.03, + "learning_rate": 1.996035965962532e-05, + "loss": 0.6801, + "step": 828 + }, + { + "epoch": 0.03, + "learning_rate": 1.9960262744514844e-05, + "loss": 0.6191, + "step": 829 + }, + { + "epoch": 0.03, + "learning_rate": 1.996016571131286e-05, + "loss": 0.6118, + "step": 830 + }, + { + "epoch": 0.03, + "learning_rate": 1.9960068560020507e-05, + "loss": 0.6537, + "step": 831 + }, + { + "epoch": 0.03, + "learning_rate": 1.9959971290638945e-05, + "loss": 0.6816, + "step": 832 + }, + { + "epoch": 0.03, + "learning_rate": 1.9959873903169322e-05, + "loss": 0.6334, + "step": 833 + }, + { + "epoch": 0.03, + "learning_rate": 1.9959776397612796e-05, + "loss": 0.6519, + "step": 834 + }, + { + "epoch": 0.03, + "learning_rate": 1.995967877397052e-05, + "loss": 0.6921, + "step": 835 + }, + { + "epoch": 0.03, + "learning_rate": 1.9959581032243653e-05, + "loss": 0.7153, + "step": 836 + }, + { + "epoch": 0.03, + "learning_rate": 1.9959483172433354e-05, + "loss": 0.6587, + "step": 837 + }, + { + "epoch": 0.03, + "learning_rate": 1.9959385194540784e-05, + "loss": 0.6968, + "step": 838 + }, + { + "epoch": 0.03, + "learning_rate": 1.9959287098567105e-05, + "loss": 0.6617, + "step": 839 + }, + { + "epoch": 0.03, + "learning_rate": 1.995918888451348e-05, + "loss": 0.7113, + "step": 840 + }, + { + "epoch": 0.03, + "learning_rate": 1.9959090552381067e-05, + "loss": 0.6243, + "step": 841 + }, + { + "epoch": 0.03, + "learning_rate": 1.995899210217104e-05, + "loss": 0.6312, + "step": 842 + }, + { + "epoch": 0.03, + "learning_rate": 1.9958893533884566e-05, + "loss": 0.6603, + "step": 843 + }, + { + "epoch": 0.03, + "learning_rate": 1.9958794847522806e-05, + "loss": 0.6749, + "step": 844 + }, + { + "epoch": 0.03, + "learning_rate": 1.9958696043086938e-05, + "loss": 0.6222, + "step": 845 + }, + { + "epoch": 0.03, + "learning_rate": 1.9958597120578133e-05, + "loss": 0.686, + "step": 846 + }, + { + "epoch": 0.03, + "learning_rate": 1.995849807999756e-05, + "loss": 0.6389, + "step": 847 + }, + { + "epoch": 0.03, + "learning_rate": 1.995839892134639e-05, + "loss": 0.6612, + "step": 848 + }, + { + "epoch": 0.03, + "learning_rate": 1.9958299644625807e-05, + "loss": 0.6377, + "step": 849 + }, + { + "epoch": 0.03, + "learning_rate": 1.9958200249836984e-05, + "loss": 0.6757, + "step": 850 + }, + { + "epoch": 0.03, + "learning_rate": 1.9958100736981102e-05, + "loss": 0.6573, + "step": 851 + }, + { + "epoch": 0.03, + "learning_rate": 1.9958001106059337e-05, + "loss": 0.6419, + "step": 852 + }, + { + "epoch": 0.03, + "learning_rate": 1.995790135707287e-05, + "loss": 0.6547, + "step": 853 + }, + { + "epoch": 0.03, + "learning_rate": 1.995780149002289e-05, + "loss": 0.7177, + "step": 854 + }, + { + "epoch": 0.03, + "learning_rate": 1.9957701504910573e-05, + "loss": 0.6589, + "step": 855 + }, + { + "epoch": 0.03, + "learning_rate": 1.9957601401737108e-05, + "loss": 0.6633, + "step": 856 + }, + { + "epoch": 0.03, + "learning_rate": 1.9957501180503686e-05, + "loss": 0.6528, + "step": 857 + }, + { + "epoch": 0.03, + "learning_rate": 1.9957400841211486e-05, + "loss": 0.6204, + "step": 858 + }, + { + "epoch": 0.03, + "learning_rate": 1.9957300383861708e-05, + "loss": 0.6685, + "step": 859 + }, + { + "epoch": 0.03, + "learning_rate": 1.9957199808455533e-05, + "loss": 0.6273, + "step": 860 + }, + { + "epoch": 0.03, + "learning_rate": 1.995709911499416e-05, + "loss": 0.6372, + "step": 861 + }, + { + "epoch": 0.03, + "learning_rate": 1.9956998303478783e-05, + "loss": 0.588, + "step": 862 + }, + { + "epoch": 0.03, + "learning_rate": 1.9956897373910593e-05, + "loss": 0.6503, + "step": 863 + }, + { + "epoch": 0.03, + "learning_rate": 1.995679632629079e-05, + "loss": 0.6776, + "step": 864 + }, + { + "epoch": 0.03, + "learning_rate": 1.9956695160620572e-05, + "loss": 0.6681, + "step": 865 + }, + { + "epoch": 0.03, + "learning_rate": 1.9956593876901137e-05, + "loss": 0.6227, + "step": 866 + }, + { + "epoch": 0.03, + "learning_rate": 1.9956492475133685e-05, + "loss": 0.6932, + "step": 867 + }, + { + "epoch": 0.03, + "learning_rate": 1.995639095531942e-05, + "loss": 0.678, + "step": 868 + }, + { + "epoch": 0.03, + "learning_rate": 1.9956289317459547e-05, + "loss": 0.6568, + "step": 869 + }, + { + "epoch": 0.03, + "learning_rate": 1.9956187561555273e-05, + "loss": 0.6827, + "step": 870 + }, + { + "epoch": 0.03, + "learning_rate": 1.9956085687607793e-05, + "loss": 0.7149, + "step": 871 + }, + { + "epoch": 0.03, + "learning_rate": 1.9955983695618327e-05, + "loss": 0.6758, + "step": 872 + }, + { + "epoch": 0.03, + "learning_rate": 1.9955881585588077e-05, + "loss": 0.6459, + "step": 873 + }, + { + "epoch": 0.03, + "learning_rate": 1.995577935751826e-05, + "loss": 0.724, + "step": 874 + }, + { + "epoch": 0.03, + "learning_rate": 1.9955677011410082e-05, + "loss": 0.6303, + "step": 875 + }, + { + "epoch": 0.03, + "learning_rate": 1.9955574547264763e-05, + "loss": 0.6415, + "step": 876 + }, + { + "epoch": 0.03, + "learning_rate": 1.995547196508351e-05, + "loss": 0.6768, + "step": 877 + }, + { + "epoch": 0.03, + "learning_rate": 1.9955369264867545e-05, + "loss": 0.5706, + "step": 878 + }, + { + "epoch": 0.03, + "learning_rate": 1.9955266446618083e-05, + "loss": 0.6614, + "step": 879 + }, + { + "epoch": 0.03, + "learning_rate": 1.995516351033634e-05, + "loss": 0.6229, + "step": 880 + }, + { + "epoch": 0.03, + "learning_rate": 1.9955060456023547e-05, + "loss": 0.6771, + "step": 881 + }, + { + "epoch": 0.03, + "learning_rate": 1.9954957283680916e-05, + "loss": 0.6815, + "step": 882 + }, + { + "epoch": 0.03, + "learning_rate": 1.995485399330967e-05, + "loss": 0.5953, + "step": 883 + }, + { + "epoch": 0.03, + "learning_rate": 1.9954750584911043e-05, + "loss": 0.6611, + "step": 884 + }, + { + "epoch": 0.03, + "learning_rate": 1.9954647058486252e-05, + "loss": 0.628, + "step": 885 + }, + { + "epoch": 0.03, + "learning_rate": 1.995454341403653e-05, + "loss": 0.6283, + "step": 886 + }, + { + "epoch": 0.03, + "learning_rate": 1.99544396515631e-05, + "loss": 0.7106, + "step": 887 + }, + { + "epoch": 0.03, + "learning_rate": 1.9954335771067196e-05, + "loss": 0.6685, + "step": 888 + }, + { + "epoch": 0.03, + "learning_rate": 1.995423177255005e-05, + "loss": 0.6758, + "step": 889 + }, + { + "epoch": 0.03, + "learning_rate": 1.9954127656012892e-05, + "loss": 0.6501, + "step": 890 + }, + { + "epoch": 0.03, + "learning_rate": 1.9954023421456962e-05, + "loss": 0.6767, + "step": 891 + }, + { + "epoch": 0.03, + "learning_rate": 1.995391906888349e-05, + "loss": 0.6599, + "step": 892 + }, + { + "epoch": 0.03, + "learning_rate": 1.9953814598293716e-05, + "loss": 0.62, + "step": 893 + }, + { + "epoch": 0.03, + "learning_rate": 1.9953710009688884e-05, + "loss": 0.6284, + "step": 894 + }, + { + "epoch": 0.03, + "learning_rate": 1.995360530307022e-05, + "loss": 0.5902, + "step": 895 + }, + { + "epoch": 0.03, + "learning_rate": 1.9953500478438976e-05, + "loss": 0.6139, + "step": 896 + }, + { + "epoch": 0.03, + "learning_rate": 1.9953395535796397e-05, + "loss": 0.6801, + "step": 897 + }, + { + "epoch": 0.03, + "learning_rate": 1.9953290475143715e-05, + "loss": 0.6635, + "step": 898 + }, + { + "epoch": 0.03, + "learning_rate": 1.995318529648219e-05, + "loss": 0.6484, + "step": 899 + }, + { + "epoch": 0.03, + "learning_rate": 1.995307999981306e-05, + "loss": 0.6516, + "step": 900 + }, + { + "epoch": 0.03, + "learning_rate": 1.9952974585137576e-05, + "loss": 0.6761, + "step": 901 + }, + { + "epoch": 0.03, + "learning_rate": 1.9952869052456986e-05, + "loss": 0.6572, + "step": 902 + }, + { + "epoch": 0.03, + "learning_rate": 1.9952763401772547e-05, + "loss": 0.649, + "step": 903 + }, + { + "epoch": 0.03, + "learning_rate": 1.9952657633085505e-05, + "loss": 0.6165, + "step": 904 + }, + { + "epoch": 0.03, + "learning_rate": 1.9952551746397117e-05, + "loss": 0.6816, + "step": 905 + }, + { + "epoch": 0.03, + "learning_rate": 1.995244574170864e-05, + "loss": 0.6575, + "step": 906 + }, + { + "epoch": 0.03, + "learning_rate": 1.9952339619021326e-05, + "loss": 0.6408, + "step": 907 + }, + { + "epoch": 0.03, + "learning_rate": 1.9952233378336436e-05, + "loss": 0.6727, + "step": 908 + }, + { + "epoch": 0.03, + "learning_rate": 1.995212701965523e-05, + "loss": 0.6615, + "step": 909 + }, + { + "epoch": 0.03, + "learning_rate": 1.995202054297897e-05, + "loss": 0.6523, + "step": 910 + }, + { + "epoch": 0.03, + "learning_rate": 1.9951913948308913e-05, + "loss": 0.6624, + "step": 911 + }, + { + "epoch": 0.03, + "learning_rate": 1.995180723564633e-05, + "loss": 0.6226, + "step": 912 + }, + { + "epoch": 0.03, + "learning_rate": 1.9951700404992484e-05, + "loss": 0.6941, + "step": 913 + }, + { + "epoch": 0.03, + "learning_rate": 1.995159345634864e-05, + "loss": 0.6587, + "step": 914 + }, + { + "epoch": 0.03, + "learning_rate": 1.995148638971607e-05, + "loss": 0.6709, + "step": 915 + }, + { + "epoch": 0.03, + "learning_rate": 1.9951379205096034e-05, + "loss": 0.6155, + "step": 916 + }, + { + "epoch": 0.03, + "learning_rate": 1.9951271902489814e-05, + "loss": 0.6745, + "step": 917 + }, + { + "epoch": 0.03, + "learning_rate": 1.9951164481898675e-05, + "loss": 0.5887, + "step": 918 + }, + { + "epoch": 0.03, + "learning_rate": 1.9951056943323892e-05, + "loss": 0.6985, + "step": 919 + }, + { + "epoch": 0.03, + "learning_rate": 1.9950949286766745e-05, + "loss": 0.6759, + "step": 920 + }, + { + "epoch": 0.03, + "learning_rate": 1.99508415122285e-05, + "loss": 0.6747, + "step": 921 + }, + { + "epoch": 0.03, + "learning_rate": 1.995073361971044e-05, + "loss": 0.6896, + "step": 922 + }, + { + "epoch": 0.03, + "learning_rate": 1.9950625609213855e-05, + "loss": 0.6642, + "step": 923 + }, + { + "epoch": 0.03, + "learning_rate": 1.995051748074001e-05, + "loss": 0.7297, + "step": 924 + }, + { + "epoch": 0.03, + "learning_rate": 1.995040923429019e-05, + "loss": 0.6708, + "step": 925 + }, + { + "epoch": 0.03, + "learning_rate": 1.995030086986568e-05, + "loss": 0.6658, + "step": 926 + }, + { + "epoch": 0.03, + "learning_rate": 1.9950192387467774e-05, + "loss": 0.5721, + "step": 927 + }, + { + "epoch": 0.03, + "learning_rate": 1.9950083787097744e-05, + "loss": 0.6448, + "step": 928 + }, + { + "epoch": 0.03, + "learning_rate": 1.994997506875689e-05, + "loss": 0.7138, + "step": 929 + }, + { + "epoch": 0.03, + "learning_rate": 1.994986623244649e-05, + "loss": 0.7068, + "step": 930 + }, + { + "epoch": 0.03, + "learning_rate": 1.9949757278167835e-05, + "loss": 0.6277, + "step": 931 + }, + { + "epoch": 0.03, + "learning_rate": 1.9949648205922228e-05, + "loss": 0.6207, + "step": 932 + }, + { + "epoch": 0.03, + "learning_rate": 1.9949539015710953e-05, + "loss": 0.6545, + "step": 933 + }, + { + "epoch": 0.03, + "learning_rate": 1.9949429707535306e-05, + "loss": 0.6758, + "step": 934 + }, + { + "epoch": 0.03, + "learning_rate": 1.9949320281396583e-05, + "loss": 0.6425, + "step": 935 + }, + { + "epoch": 0.03, + "learning_rate": 1.9949210737296084e-05, + "loss": 0.6833, + "step": 936 + }, + { + "epoch": 0.03, + "learning_rate": 1.9949101075235107e-05, + "loss": 0.6376, + "step": 937 + }, + { + "epoch": 0.03, + "learning_rate": 1.9948991295214947e-05, + "loss": 0.6198, + "step": 938 + }, + { + "epoch": 0.03, + "learning_rate": 1.9948881397236913e-05, + "loss": 0.6531, + "step": 939 + }, + { + "epoch": 0.03, + "learning_rate": 1.99487713813023e-05, + "loss": 0.5996, + "step": 940 + }, + { + "epoch": 0.03, + "learning_rate": 1.9948661247412423e-05, + "loss": 0.616, + "step": 941 + }, + { + "epoch": 0.03, + "learning_rate": 1.994855099556858e-05, + "loss": 0.6328, + "step": 942 + }, + { + "epoch": 0.03, + "learning_rate": 1.994844062577208e-05, + "loss": 0.6399, + "step": 943 + }, + { + "epoch": 0.03, + "learning_rate": 1.994833013802423e-05, + "loss": 0.6709, + "step": 944 + }, + { + "epoch": 0.03, + "learning_rate": 1.994821953232634e-05, + "loss": 0.6997, + "step": 945 + }, + { + "epoch": 0.03, + "learning_rate": 1.9948108808679727e-05, + "loss": 0.7059, + "step": 946 + }, + { + "epoch": 0.03, + "learning_rate": 1.99479979670857e-05, + "loss": 0.6378, + "step": 947 + }, + { + "epoch": 0.03, + "learning_rate": 1.994788700754557e-05, + "loss": 0.6833, + "step": 948 + }, + { + "epoch": 0.03, + "learning_rate": 1.994777593006066e-05, + "loss": 0.6088, + "step": 949 + }, + { + "epoch": 0.03, + "learning_rate": 1.9947664734632275e-05, + "loss": 0.6755, + "step": 950 + }, + { + "epoch": 0.03, + "learning_rate": 1.9947553421261743e-05, + "loss": 0.6743, + "step": 951 + }, + { + "epoch": 0.03, + "learning_rate": 1.9947441989950384e-05, + "loss": 0.6672, + "step": 952 + }, + { + "epoch": 0.03, + "learning_rate": 1.9947330440699516e-05, + "loss": 0.6452, + "step": 953 + }, + { + "epoch": 0.03, + "learning_rate": 1.994721877351046e-05, + "loss": 0.7122, + "step": 954 + }, + { + "epoch": 0.03, + "learning_rate": 1.9947106988384542e-05, + "loss": 0.6517, + "step": 955 + }, + { + "epoch": 0.03, + "learning_rate": 1.994699508532309e-05, + "loss": 0.6411, + "step": 956 + }, + { + "epoch": 0.03, + "learning_rate": 1.994688306432743e-05, + "loss": 0.6134, + "step": 957 + }, + { + "epoch": 0.03, + "learning_rate": 1.9946770925398885e-05, + "loss": 0.6593, + "step": 958 + }, + { + "epoch": 0.03, + "learning_rate": 1.9946658668538787e-05, + "loss": 0.6626, + "step": 959 + }, + { + "epoch": 0.03, + "learning_rate": 1.9946546293748474e-05, + "loss": 0.6254, + "step": 960 + }, + { + "epoch": 0.03, + "learning_rate": 1.9946433801029266e-05, + "loss": 0.5781, + "step": 961 + }, + { + "epoch": 0.03, + "learning_rate": 1.9946321190382503e-05, + "loss": 0.6458, + "step": 962 + }, + { + "epoch": 0.03, + "learning_rate": 1.9946208461809523e-05, + "loss": 0.6922, + "step": 963 + }, + { + "epoch": 0.03, + "learning_rate": 1.9946095615311657e-05, + "loss": 0.6487, + "step": 964 + }, + { + "epoch": 0.03, + "learning_rate": 1.9945982650890247e-05, + "loss": 0.6865, + "step": 965 + }, + { + "epoch": 0.03, + "learning_rate": 1.994586956854663e-05, + "loss": 0.6574, + "step": 966 + }, + { + "epoch": 0.03, + "learning_rate": 1.994575636828215e-05, + "loss": 0.652, + "step": 967 + }, + { + "epoch": 0.03, + "learning_rate": 1.994564305009815e-05, + "loss": 0.6921, + "step": 968 + }, + { + "epoch": 0.03, + "learning_rate": 1.9945529613995962e-05, + "loss": 0.6655, + "step": 969 + }, + { + "epoch": 0.03, + "learning_rate": 1.9945416059976944e-05, + "loss": 0.6271, + "step": 970 + }, + { + "epoch": 0.03, + "learning_rate": 1.9945302388042438e-05, + "loss": 0.6198, + "step": 971 + }, + { + "epoch": 0.03, + "learning_rate": 1.9945188598193787e-05, + "loss": 0.6322, + "step": 972 + }, + { + "epoch": 0.03, + "learning_rate": 1.994507469043235e-05, + "loss": 0.6348, + "step": 973 + }, + { + "epoch": 0.03, + "learning_rate": 1.994496066475947e-05, + "loss": 0.6567, + "step": 974 + }, + { + "epoch": 0.03, + "learning_rate": 1.99448465211765e-05, + "loss": 0.688, + "step": 975 + }, + { + "epoch": 0.03, + "learning_rate": 1.9944732259684794e-05, + "loss": 0.6371, + "step": 976 + }, + { + "epoch": 0.03, + "learning_rate": 1.9944617880285708e-05, + "loss": 0.6764, + "step": 977 + }, + { + "epoch": 0.03, + "learning_rate": 1.9944503382980594e-05, + "loss": 0.6615, + "step": 978 + }, + { + "epoch": 0.03, + "learning_rate": 1.9944388767770818e-05, + "loss": 0.654, + "step": 979 + }, + { + "epoch": 0.03, + "learning_rate": 1.994427403465773e-05, + "loss": 0.6322, + "step": 980 + }, + { + "epoch": 0.03, + "learning_rate": 1.994415918364269e-05, + "loss": 0.6361, + "step": 981 + }, + { + "epoch": 0.03, + "learning_rate": 1.994404421472707e-05, + "loss": 0.7075, + "step": 982 + }, + { + "epoch": 0.03, + "learning_rate": 1.9943929127912227e-05, + "loss": 0.6598, + "step": 983 + }, + { + "epoch": 0.03, + "learning_rate": 1.994381392319952e-05, + "loss": 0.6476, + "step": 984 + }, + { + "epoch": 0.03, + "learning_rate": 1.9943698600590325e-05, + "loss": 0.6707, + "step": 985 + }, + { + "epoch": 0.03, + "learning_rate": 1.9943583160085998e-05, + "loss": 0.6571, + "step": 986 + }, + { + "epoch": 0.03, + "learning_rate": 1.994346760168792e-05, + "loss": 0.6246, + "step": 987 + }, + { + "epoch": 0.03, + "learning_rate": 1.9943351925397453e-05, + "loss": 0.6975, + "step": 988 + }, + { + "epoch": 0.03, + "learning_rate": 1.994323613121597e-05, + "loss": 0.6214, + "step": 989 + }, + { + "epoch": 0.03, + "learning_rate": 1.9943120219144845e-05, + "loss": 0.6481, + "step": 990 + }, + { + "epoch": 0.03, + "learning_rate": 1.9943004189185452e-05, + "loss": 0.6499, + "step": 991 + }, + { + "epoch": 0.03, + "learning_rate": 1.9942888041339164e-05, + "loss": 0.6718, + "step": 992 + }, + { + "epoch": 0.03, + "learning_rate": 1.9942771775607364e-05, + "loss": 0.6454, + "step": 993 + }, + { + "epoch": 0.03, + "learning_rate": 1.9942655391991423e-05, + "loss": 0.647, + "step": 994 + }, + { + "epoch": 0.03, + "learning_rate": 1.9942538890492725e-05, + "loss": 0.6505, + "step": 995 + }, + { + "epoch": 0.03, + "learning_rate": 1.9942422271112655e-05, + "loss": 0.6634, + "step": 996 + }, + { + "epoch": 0.03, + "learning_rate": 1.994230553385259e-05, + "loss": 0.6945, + "step": 997 + }, + { + "epoch": 0.03, + "learning_rate": 1.9942188678713915e-05, + "loss": 0.6659, + "step": 998 + }, + { + "epoch": 0.03, + "learning_rate": 1.9942071705698016e-05, + "loss": 0.6857, + "step": 999 + }, + { + "epoch": 0.03, + "learning_rate": 1.9941954614806282e-05, + "loss": 0.6576, + "step": 1000 + }, + { + "epoch": 0.03, + "learning_rate": 1.9941837406040097e-05, + "loss": 0.6682, + "step": 1001 + }, + { + "epoch": 0.03, + "learning_rate": 1.9941720079400855e-05, + "loss": 0.7274, + "step": 1002 + }, + { + "epoch": 0.03, + "learning_rate": 1.9941602634889942e-05, + "loss": 0.667, + "step": 1003 + }, + { + "epoch": 0.03, + "learning_rate": 1.9941485072508756e-05, + "loss": 0.6634, + "step": 1004 + }, + { + "epoch": 0.03, + "learning_rate": 1.994136739225869e-05, + "loss": 0.6417, + "step": 1005 + }, + { + "epoch": 0.03, + "learning_rate": 1.9941249594141136e-05, + "loss": 0.6436, + "step": 1006 + }, + { + "epoch": 0.03, + "learning_rate": 1.994113167815749e-05, + "loss": 0.6596, + "step": 1007 + }, + { + "epoch": 0.03, + "learning_rate": 1.9941013644309154e-05, + "loss": 0.6626, + "step": 1008 + }, + { + "epoch": 0.03, + "learning_rate": 1.9940895492597527e-05, + "loss": 0.6991, + "step": 1009 + }, + { + "epoch": 0.03, + "learning_rate": 1.994077722302401e-05, + "loss": 0.7163, + "step": 1010 + }, + { + "epoch": 0.04, + "learning_rate": 1.9940658835590002e-05, + "loss": 0.6366, + "step": 1011 + }, + { + "epoch": 0.04, + "learning_rate": 1.994054033029691e-05, + "loss": 0.637, + "step": 1012 + }, + { + "epoch": 0.04, + "learning_rate": 1.9940421707146138e-05, + "loss": 0.6907, + "step": 1013 + }, + { + "epoch": 0.04, + "learning_rate": 1.9940302966139086e-05, + "loss": 0.5981, + "step": 1014 + }, + { + "epoch": 0.04, + "learning_rate": 1.9940184107277172e-05, + "loss": 0.6173, + "step": 1015 + }, + { + "epoch": 0.04, + "learning_rate": 1.99400651305618e-05, + "loss": 0.6585, + "step": 1016 + }, + { + "epoch": 0.04, + "learning_rate": 1.9939946035994385e-05, + "loss": 0.618, + "step": 1017 + }, + { + "epoch": 0.04, + "learning_rate": 1.993982682357633e-05, + "loss": 0.691, + "step": 1018 + }, + { + "epoch": 0.04, + "learning_rate": 1.993970749330906e-05, + "loss": 0.624, + "step": 1019 + }, + { + "epoch": 0.04, + "learning_rate": 1.993958804519398e-05, + "loss": 0.6919, + "step": 1020 + }, + { + "epoch": 0.04, + "learning_rate": 1.9939468479232512e-05, + "loss": 0.7062, + "step": 1021 + }, + { + "epoch": 0.04, + "learning_rate": 1.9939348795426068e-05, + "loss": 0.6964, + "step": 1022 + }, + { + "epoch": 0.04, + "learning_rate": 1.9939228993776076e-05, + "loss": 0.6498, + "step": 1023 + }, + { + "epoch": 0.04, + "learning_rate": 1.9939109074283947e-05, + "loss": 0.5902, + "step": 1024 + }, + { + "epoch": 0.04, + "learning_rate": 1.9938989036951108e-05, + "loss": 0.6298, + "step": 1025 + }, + { + "epoch": 0.04, + "learning_rate": 1.9938868881778983e-05, + "loss": 0.6774, + "step": 1026 + }, + { + "epoch": 0.04, + "learning_rate": 1.993874860876899e-05, + "loss": 0.6484, + "step": 1027 + }, + { + "epoch": 0.04, + "learning_rate": 1.9938628217922566e-05, + "loss": 0.6886, + "step": 1028 + }, + { + "epoch": 0.04, + "learning_rate": 1.993850770924113e-05, + "loss": 0.634, + "step": 1029 + }, + { + "epoch": 0.04, + "learning_rate": 1.993838708272611e-05, + "loss": 0.6976, + "step": 1030 + }, + { + "epoch": 0.04, + "learning_rate": 1.993826633837894e-05, + "loss": 0.6509, + "step": 1031 + }, + { + "epoch": 0.04, + "learning_rate": 1.9938145476201053e-05, + "loss": 0.6619, + "step": 1032 + }, + { + "epoch": 0.04, + "learning_rate": 1.9938024496193876e-05, + "loss": 0.6289, + "step": 1033 + }, + { + "epoch": 0.04, + "learning_rate": 1.9937903398358852e-05, + "loss": 0.7019, + "step": 1034 + }, + { + "epoch": 0.04, + "learning_rate": 1.9937782182697405e-05, + "loss": 0.607, + "step": 1035 + }, + { + "epoch": 0.04, + "learning_rate": 1.9937660849210982e-05, + "loss": 0.7335, + "step": 1036 + }, + { + "epoch": 0.04, + "learning_rate": 1.9937539397901022e-05, + "loss": 0.6915, + "step": 1037 + }, + { + "epoch": 0.04, + "learning_rate": 1.9937417828768958e-05, + "loss": 0.6806, + "step": 1038 + }, + { + "epoch": 0.04, + "learning_rate": 1.9937296141816235e-05, + "loss": 0.6355, + "step": 1039 + }, + { + "epoch": 0.04, + "learning_rate": 1.9937174337044295e-05, + "loss": 0.6796, + "step": 1040 + }, + { + "epoch": 0.04, + "learning_rate": 1.9937052414454584e-05, + "loss": 0.6276, + "step": 1041 + }, + { + "epoch": 0.04, + "learning_rate": 1.9936930374048544e-05, + "loss": 0.6477, + "step": 1042 + }, + { + "epoch": 0.04, + "learning_rate": 1.9936808215827624e-05, + "loss": 0.6175, + "step": 1043 + }, + { + "epoch": 0.04, + "learning_rate": 1.9936685939793274e-05, + "loss": 0.6403, + "step": 1044 + }, + { + "epoch": 0.04, + "learning_rate": 1.9936563545946945e-05, + "loss": 0.6573, + "step": 1045 + }, + { + "epoch": 0.04, + "learning_rate": 1.993644103429008e-05, + "loss": 0.6349, + "step": 1046 + }, + { + "epoch": 0.04, + "learning_rate": 1.9936318404824137e-05, + "loss": 0.6539, + "step": 1047 + }, + { + "epoch": 0.04, + "learning_rate": 1.9936195657550573e-05, + "loss": 0.648, + "step": 1048 + }, + { + "epoch": 0.04, + "learning_rate": 1.993607279247084e-05, + "loss": 0.6935, + "step": 1049 + }, + { + "epoch": 0.04, + "learning_rate": 1.9935949809586394e-05, + "loss": 0.6749, + "step": 1050 + }, + { + "epoch": 0.04, + "learning_rate": 1.9935826708898697e-05, + "loss": 0.6792, + "step": 1051 + }, + { + "epoch": 0.04, + "learning_rate": 1.99357034904092e-05, + "loss": 0.6409, + "step": 1052 + }, + { + "epoch": 0.04, + "learning_rate": 1.993558015411937e-05, + "loss": 0.6528, + "step": 1053 + }, + { + "epoch": 0.04, + "learning_rate": 1.993545670003067e-05, + "loss": 0.6629, + "step": 1054 + }, + { + "epoch": 0.04, + "learning_rate": 1.9935333128144564e-05, + "loss": 0.6447, + "step": 1055 + }, + { + "epoch": 0.04, + "learning_rate": 1.993520943846252e-05, + "loss": 0.5856, + "step": 1056 + }, + { + "epoch": 0.04, + "learning_rate": 1.993508563098599e-05, + "loss": 0.6782, + "step": 1057 + }, + { + "epoch": 0.04, + "learning_rate": 1.993496170571646e-05, + "loss": 0.6574, + "step": 1058 + }, + { + "epoch": 0.04, + "learning_rate": 1.9934837662655385e-05, + "loss": 0.7085, + "step": 1059 + }, + { + "epoch": 0.04, + "learning_rate": 1.9934713501804242e-05, + "loss": 0.6474, + "step": 1060 + }, + { + "epoch": 0.04, + "learning_rate": 1.9934589223164508e-05, + "loss": 0.6584, + "step": 1061 + }, + { + "epoch": 0.04, + "learning_rate": 1.9934464826737647e-05, + "loss": 0.6658, + "step": 1062 + }, + { + "epoch": 0.04, + "learning_rate": 1.993434031252514e-05, + "loss": 0.6565, + "step": 1063 + }, + { + "epoch": 0.04, + "learning_rate": 1.9934215680528463e-05, + "loss": 0.6951, + "step": 1064 + }, + { + "epoch": 0.04, + "learning_rate": 1.993409093074909e-05, + "loss": 0.6446, + "step": 1065 + }, + { + "epoch": 0.04, + "learning_rate": 1.9933966063188505e-05, + "loss": 0.67, + "step": 1066 + }, + { + "epoch": 0.04, + "learning_rate": 1.9933841077848184e-05, + "loss": 0.6092, + "step": 1067 + }, + { + "epoch": 0.04, + "learning_rate": 1.993371597472961e-05, + "loss": 0.6321, + "step": 1068 + }, + { + "epoch": 0.04, + "learning_rate": 1.9933590753834265e-05, + "loss": 0.6517, + "step": 1069 + }, + { + "epoch": 0.04, + "learning_rate": 1.9933465415163644e-05, + "loss": 0.6269, + "step": 1070 + }, + { + "epoch": 0.04, + "learning_rate": 1.9933339958719216e-05, + "loss": 0.6794, + "step": 1071 + }, + { + "epoch": 0.04, + "learning_rate": 1.993321438450248e-05, + "loss": 0.6821, + "step": 1072 + }, + { + "epoch": 0.04, + "learning_rate": 1.993308869251492e-05, + "loss": 0.6778, + "step": 1073 + }, + { + "epoch": 0.04, + "learning_rate": 1.9932962882758032e-05, + "loss": 0.6271, + "step": 1074 + }, + { + "epoch": 0.04, + "learning_rate": 1.99328369552333e-05, + "loss": 0.6348, + "step": 1075 + }, + { + "epoch": 0.04, + "learning_rate": 1.9932710909942224e-05, + "loss": 0.6483, + "step": 1076 + }, + { + "epoch": 0.04, + "learning_rate": 1.9932584746886293e-05, + "loss": 0.6324, + "step": 1077 + }, + { + "epoch": 0.04, + "learning_rate": 1.9932458466067005e-05, + "loss": 0.6037, + "step": 1078 + }, + { + "epoch": 0.04, + "learning_rate": 1.993233206748586e-05, + "loss": 0.698, + "step": 1079 + }, + { + "epoch": 0.04, + "learning_rate": 1.993220555114435e-05, + "loss": 0.6798, + "step": 1080 + }, + { + "epoch": 0.04, + "learning_rate": 1.9932078917043983e-05, + "loss": 0.7007, + "step": 1081 + }, + { + "epoch": 0.04, + "learning_rate": 1.993195216518625e-05, + "loss": 0.6736, + "step": 1082 + }, + { + "epoch": 0.04, + "learning_rate": 1.9931825295572665e-05, + "loss": 0.6602, + "step": 1083 + }, + { + "epoch": 0.04, + "learning_rate": 1.9931698308204727e-05, + "loss": 0.6736, + "step": 1084 + }, + { + "epoch": 0.04, + "learning_rate": 1.993157120308394e-05, + "loss": 0.6636, + "step": 1085 + }, + { + "epoch": 0.04, + "learning_rate": 1.9931443980211817e-05, + "loss": 0.676, + "step": 1086 + }, + { + "epoch": 0.04, + "learning_rate": 1.993131663958986e-05, + "loss": 0.6531, + "step": 1087 + }, + { + "epoch": 0.04, + "learning_rate": 1.9931189181219582e-05, + "loss": 0.6498, + "step": 1088 + }, + { + "epoch": 0.04, + "learning_rate": 1.993106160510249e-05, + "loss": 0.6325, + "step": 1089 + }, + { + "epoch": 0.04, + "learning_rate": 1.99309339112401e-05, + "loss": 0.6227, + "step": 1090 + }, + { + "epoch": 0.04, + "learning_rate": 1.993080609963393e-05, + "loss": 0.6344, + "step": 1091 + }, + { + "epoch": 0.04, + "learning_rate": 1.9930678170285486e-05, + "loss": 0.6421, + "step": 1092 + }, + { + "epoch": 0.04, + "learning_rate": 1.9930550123196295e-05, + "loss": 0.6824, + "step": 1093 + }, + { + "epoch": 0.04, + "learning_rate": 1.9930421958367865e-05, + "loss": 0.5911, + "step": 1094 + }, + { + "epoch": 0.04, + "learning_rate": 1.9930293675801726e-05, + "loss": 0.638, + "step": 1095 + }, + { + "epoch": 0.04, + "learning_rate": 1.993016527549939e-05, + "loss": 0.6445, + "step": 1096 + }, + { + "epoch": 0.04, + "learning_rate": 1.993003675746238e-05, + "loss": 0.6421, + "step": 1097 + }, + { + "epoch": 0.04, + "learning_rate": 1.992990812169223e-05, + "loss": 0.7435, + "step": 1098 + }, + { + "epoch": 0.04, + "learning_rate": 1.9929779368190453e-05, + "loss": 0.6612, + "step": 1099 + }, + { + "epoch": 0.04, + "learning_rate": 1.992965049695858e-05, + "loss": 0.6776, + "step": 1100 + }, + { + "epoch": 0.04, + "learning_rate": 1.9929521507998144e-05, + "loss": 0.7012, + "step": 1101 + }, + { + "epoch": 0.04, + "learning_rate": 1.9929392401310665e-05, + "loss": 0.6209, + "step": 1102 + }, + { + "epoch": 0.04, + "learning_rate": 1.992926317689768e-05, + "loss": 0.6061, + "step": 1103 + }, + { + "epoch": 0.04, + "learning_rate": 1.992913383476072e-05, + "loss": 0.6861, + "step": 1104 + }, + { + "epoch": 0.04, + "learning_rate": 1.9929004374901315e-05, + "loss": 0.6645, + "step": 1105 + }, + { + "epoch": 0.04, + "learning_rate": 1.9928874797321004e-05, + "loss": 0.6859, + "step": 1106 + }, + { + "epoch": 0.04, + "learning_rate": 1.9928745102021325e-05, + "loss": 0.6822, + "step": 1107 + }, + { + "epoch": 0.04, + "learning_rate": 1.992861528900381e-05, + "loss": 0.6597, + "step": 1108 + }, + { + "epoch": 0.04, + "learning_rate": 1.9928485358270003e-05, + "loss": 0.6764, + "step": 1109 + }, + { + "epoch": 0.04, + "learning_rate": 1.992835530982144e-05, + "loss": 0.6531, + "step": 1110 + }, + { + "epoch": 0.04, + "learning_rate": 1.992822514365967e-05, + "loss": 0.6519, + "step": 1111 + }, + { + "epoch": 0.04, + "learning_rate": 1.9928094859786228e-05, + "loss": 0.6316, + "step": 1112 + }, + { + "epoch": 0.04, + "learning_rate": 1.9927964458202664e-05, + "loss": 0.6524, + "step": 1113 + }, + { + "epoch": 0.04, + "learning_rate": 1.9927833938910522e-05, + "loss": 0.6522, + "step": 1114 + }, + { + "epoch": 0.04, + "learning_rate": 1.992770330191135e-05, + "loss": 0.6765, + "step": 1115 + }, + { + "epoch": 0.04, + "learning_rate": 1.992757254720669e-05, + "loss": 0.7068, + "step": 1116 + }, + { + "epoch": 0.04, + "learning_rate": 1.992744167479811e-05, + "loss": 0.6484, + "step": 1117 + }, + { + "epoch": 0.04, + "learning_rate": 1.9927310684687145e-05, + "loss": 0.6971, + "step": 1118 + }, + { + "epoch": 0.04, + "learning_rate": 1.9927179576875353e-05, + "loss": 0.6314, + "step": 1119 + }, + { + "epoch": 0.04, + "learning_rate": 1.992704835136429e-05, + "loss": 0.641, + "step": 1120 + }, + { + "epoch": 0.04, + "learning_rate": 1.992691700815551e-05, + "loss": 0.67, + "step": 1121 + }, + { + "epoch": 0.04, + "learning_rate": 1.9926785547250575e-05, + "loss": 0.6263, + "step": 1122 + }, + { + "epoch": 0.04, + "learning_rate": 1.9926653968651037e-05, + "loss": 0.6828, + "step": 1123 + }, + { + "epoch": 0.04, + "learning_rate": 1.992652227235846e-05, + "loss": 0.6033, + "step": 1124 + }, + { + "epoch": 0.04, + "learning_rate": 1.9926390458374406e-05, + "loss": 0.6729, + "step": 1125 + }, + { + "epoch": 0.04, + "learning_rate": 1.9926258526700433e-05, + "loss": 0.6233, + "step": 1126 + }, + { + "epoch": 0.04, + "learning_rate": 1.992612647733811e-05, + "loss": 0.6485, + "step": 1127 + }, + { + "epoch": 0.04, + "learning_rate": 1.9925994310289e-05, + "loss": 0.6452, + "step": 1128 + }, + { + "epoch": 0.04, + "learning_rate": 1.992586202555467e-05, + "loss": 0.6819, + "step": 1129 + }, + { + "epoch": 0.04, + "learning_rate": 1.9925729623136695e-05, + "loss": 0.6846, + "step": 1130 + }, + { + "epoch": 0.04, + "learning_rate": 1.992559710303663e-05, + "loss": 0.6311, + "step": 1131 + }, + { + "epoch": 0.04, + "learning_rate": 1.9925464465256064e-05, + "loss": 0.6223, + "step": 1132 + }, + { + "epoch": 0.04, + "learning_rate": 1.9925331709796556e-05, + "loss": 0.6002, + "step": 1133 + }, + { + "epoch": 0.04, + "learning_rate": 1.992519883665969e-05, + "loss": 0.6376, + "step": 1134 + }, + { + "epoch": 0.04, + "learning_rate": 1.992506584584703e-05, + "loss": 0.6576, + "step": 1135 + }, + { + "epoch": 0.04, + "learning_rate": 1.9924932737360162e-05, + "loss": 0.6465, + "step": 1136 + }, + { + "epoch": 0.04, + "learning_rate": 1.992479951120066e-05, + "loss": 0.6861, + "step": 1137 + }, + { + "epoch": 0.04, + "learning_rate": 1.9924666167370108e-05, + "loss": 0.6449, + "step": 1138 + }, + { + "epoch": 0.04, + "learning_rate": 1.992453270587008e-05, + "loss": 0.6907, + "step": 1139 + }, + { + "epoch": 0.04, + "learning_rate": 1.9924399126702166e-05, + "loss": 0.6556, + "step": 1140 + }, + { + "epoch": 0.04, + "learning_rate": 1.9924265429867943e-05, + "loss": 0.6818, + "step": 1141 + }, + { + "epoch": 0.04, + "learning_rate": 1.9924131615369e-05, + "loss": 0.646, + "step": 1142 + }, + { + "epoch": 0.04, + "learning_rate": 1.9923997683206925e-05, + "loss": 0.6933, + "step": 1143 + }, + { + "epoch": 0.04, + "learning_rate": 1.99238636333833e-05, + "loss": 0.6312, + "step": 1144 + }, + { + "epoch": 0.04, + "learning_rate": 1.992372946589972e-05, + "loss": 0.6395, + "step": 1145 + }, + { + "epoch": 0.04, + "learning_rate": 1.9923595180757773e-05, + "loss": 0.6488, + "step": 1146 + }, + { + "epoch": 0.04, + "learning_rate": 1.992346077795905e-05, + "loss": 0.6489, + "step": 1147 + }, + { + "epoch": 0.04, + "learning_rate": 1.9923326257505145e-05, + "loss": 0.6232, + "step": 1148 + }, + { + "epoch": 0.04, + "learning_rate": 1.992319161939766e-05, + "loss": 0.6601, + "step": 1149 + }, + { + "epoch": 0.04, + "learning_rate": 1.9923056863638183e-05, + "loss": 0.6524, + "step": 1150 + }, + { + "epoch": 0.04, + "learning_rate": 1.992292199022831e-05, + "loss": 0.6275, + "step": 1151 + }, + { + "epoch": 0.04, + "learning_rate": 1.992278699916965e-05, + "loss": 0.5776, + "step": 1152 + }, + { + "epoch": 0.04, + "learning_rate": 1.9922651890463793e-05, + "loss": 0.6589, + "step": 1153 + }, + { + "epoch": 0.04, + "learning_rate": 1.9922516664112352e-05, + "loss": 0.673, + "step": 1154 + }, + { + "epoch": 0.04, + "learning_rate": 1.9922381320116918e-05, + "loss": 0.6397, + "step": 1155 + }, + { + "epoch": 0.04, + "learning_rate": 1.9922245858479104e-05, + "loss": 0.6543, + "step": 1156 + }, + { + "epoch": 0.04, + "learning_rate": 1.9922110279200512e-05, + "loss": 0.6268, + "step": 1157 + }, + { + "epoch": 0.04, + "learning_rate": 1.9921974582282753e-05, + "loss": 0.6548, + "step": 1158 + }, + { + "epoch": 0.04, + "learning_rate": 1.992183876772743e-05, + "loss": 0.7301, + "step": 1159 + }, + { + "epoch": 0.04, + "learning_rate": 1.9921702835536164e-05, + "loss": 0.5919, + "step": 1160 + }, + { + "epoch": 0.04, + "learning_rate": 1.9921566785710557e-05, + "loss": 0.6387, + "step": 1161 + }, + { + "epoch": 0.04, + "learning_rate": 1.9921430618252222e-05, + "loss": 0.6725, + "step": 1162 + }, + { + "epoch": 0.04, + "learning_rate": 1.992129433316278e-05, + "loss": 0.6473, + "step": 1163 + }, + { + "epoch": 0.04, + "learning_rate": 1.9921157930443843e-05, + "loss": 0.6224, + "step": 1164 + }, + { + "epoch": 0.04, + "learning_rate": 1.9921021410097024e-05, + "loss": 0.7047, + "step": 1165 + }, + { + "epoch": 0.04, + "learning_rate": 1.992088477212395e-05, + "loss": 0.6174, + "step": 1166 + }, + { + "epoch": 0.04, + "learning_rate": 1.9920748016526238e-05, + "loss": 0.69, + "step": 1167 + }, + { + "epoch": 0.04, + "learning_rate": 1.9920611143305507e-05, + "loss": 0.6087, + "step": 1168 + }, + { + "epoch": 0.04, + "learning_rate": 1.9920474152463378e-05, + "loss": 0.6355, + "step": 1169 + }, + { + "epoch": 0.04, + "learning_rate": 1.9920337044001482e-05, + "loss": 0.6484, + "step": 1170 + }, + { + "epoch": 0.04, + "learning_rate": 1.992019981792144e-05, + "loss": 0.7094, + "step": 1171 + }, + { + "epoch": 0.04, + "learning_rate": 1.992006247422488e-05, + "loss": 0.7021, + "step": 1172 + }, + { + "epoch": 0.04, + "learning_rate": 1.991992501291343e-05, + "loss": 0.6468, + "step": 1173 + }, + { + "epoch": 0.04, + "learning_rate": 1.9919787433988725e-05, + "loss": 0.6814, + "step": 1174 + }, + { + "epoch": 0.04, + "learning_rate": 1.9919649737452385e-05, + "loss": 0.6521, + "step": 1175 + }, + { + "epoch": 0.04, + "learning_rate": 1.9919511923306053e-05, + "loss": 0.6325, + "step": 1176 + }, + { + "epoch": 0.04, + "learning_rate": 1.9919373991551355e-05, + "loss": 0.6266, + "step": 1177 + }, + { + "epoch": 0.04, + "learning_rate": 1.9919235942189933e-05, + "loss": 0.7159, + "step": 1178 + }, + { + "epoch": 0.04, + "learning_rate": 1.991909777522342e-05, + "loss": 0.6689, + "step": 1179 + }, + { + "epoch": 0.04, + "learning_rate": 1.9918959490653455e-05, + "loss": 0.6934, + "step": 1180 + }, + { + "epoch": 0.04, + "learning_rate": 1.991882108848168e-05, + "loss": 0.6841, + "step": 1181 + }, + { + "epoch": 0.04, + "learning_rate": 1.9918682568709732e-05, + "loss": 0.6274, + "step": 1182 + }, + { + "epoch": 0.04, + "learning_rate": 1.9918543931339255e-05, + "loss": 0.6321, + "step": 1183 + }, + { + "epoch": 0.04, + "learning_rate": 1.991840517637189e-05, + "loss": 0.665, + "step": 1184 + }, + { + "epoch": 0.04, + "learning_rate": 1.991826630380929e-05, + "loss": 0.6128, + "step": 1185 + }, + { + "epoch": 0.04, + "learning_rate": 1.9918127313653094e-05, + "loss": 0.6636, + "step": 1186 + }, + { + "epoch": 0.04, + "learning_rate": 1.991798820590495e-05, + "loss": 0.7125, + "step": 1187 + }, + { + "epoch": 0.04, + "learning_rate": 1.9917848980566515e-05, + "loss": 0.5833, + "step": 1188 + }, + { + "epoch": 0.04, + "learning_rate": 1.991770963763943e-05, + "loss": 0.6172, + "step": 1189 + }, + { + "epoch": 0.04, + "learning_rate": 1.991757017712535e-05, + "loss": 0.6579, + "step": 1190 + }, + { + "epoch": 0.04, + "learning_rate": 1.9917430599025934e-05, + "loss": 0.6499, + "step": 1191 + }, + { + "epoch": 0.04, + "learning_rate": 1.9917290903342826e-05, + "loss": 0.649, + "step": 1192 + }, + { + "epoch": 0.04, + "learning_rate": 1.9917151090077694e-05, + "loss": 0.673, + "step": 1193 + }, + { + "epoch": 0.04, + "learning_rate": 1.991701115923219e-05, + "loss": 0.6416, + "step": 1194 + }, + { + "epoch": 0.04, + "learning_rate": 1.9916871110807972e-05, + "loss": 0.6226, + "step": 1195 + }, + { + "epoch": 0.04, + "learning_rate": 1.9916730944806706e-05, + "loss": 0.6329, + "step": 1196 + }, + { + "epoch": 0.04, + "learning_rate": 1.9916590661230047e-05, + "loss": 0.6454, + "step": 1197 + }, + { + "epoch": 0.04, + "learning_rate": 1.9916450260079662e-05, + "loss": 0.6165, + "step": 1198 + }, + { + "epoch": 0.04, + "learning_rate": 1.9916309741357214e-05, + "loss": 0.6876, + "step": 1199 + }, + { + "epoch": 0.04, + "learning_rate": 1.991616910506437e-05, + "loss": 0.6788, + "step": 1200 + }, + { + "epoch": 0.04, + "learning_rate": 1.9916028351202798e-05, + "loss": 0.6536, + "step": 1201 + }, + { + "epoch": 0.04, + "learning_rate": 1.9915887479774164e-05, + "loss": 0.6663, + "step": 1202 + }, + { + "epoch": 0.04, + "learning_rate": 1.9915746490780145e-05, + "loss": 0.5825, + "step": 1203 + }, + { + "epoch": 0.04, + "learning_rate": 1.99156053842224e-05, + "loss": 0.7305, + "step": 1204 + }, + { + "epoch": 0.04, + "learning_rate": 1.9915464160102614e-05, + "loss": 0.6215, + "step": 1205 + }, + { + "epoch": 0.04, + "learning_rate": 1.991532281842246e-05, + "loss": 0.6503, + "step": 1206 + }, + { + "epoch": 0.04, + "learning_rate": 1.991518135918361e-05, + "loss": 0.6364, + "step": 1207 + }, + { + "epoch": 0.04, + "learning_rate": 1.991503978238774e-05, + "loss": 0.6243, + "step": 1208 + }, + { + "epoch": 0.04, + "learning_rate": 1.991489808803653e-05, + "loss": 0.6171, + "step": 1209 + }, + { + "epoch": 0.04, + "learning_rate": 1.9914756276131664e-05, + "loss": 0.6022, + "step": 1210 + }, + { + "epoch": 0.04, + "learning_rate": 1.991461434667482e-05, + "loss": 0.6931, + "step": 1211 + }, + { + "epoch": 0.04, + "learning_rate": 1.991447229966768e-05, + "loss": 0.6628, + "step": 1212 + }, + { + "epoch": 0.04, + "learning_rate": 1.9914330135111925e-05, + "loss": 0.6439, + "step": 1213 + }, + { + "epoch": 0.04, + "learning_rate": 1.991418785300925e-05, + "loss": 0.668, + "step": 1214 + }, + { + "epoch": 0.04, + "learning_rate": 1.9914045453361333e-05, + "loss": 0.6198, + "step": 1215 + }, + { + "epoch": 0.04, + "learning_rate": 1.9913902936169868e-05, + "loss": 0.6636, + "step": 1216 + }, + { + "epoch": 0.04, + "learning_rate": 1.9913760301436542e-05, + "loss": 0.6635, + "step": 1217 + }, + { + "epoch": 0.04, + "learning_rate": 1.9913617549163046e-05, + "loss": 0.6834, + "step": 1218 + }, + { + "epoch": 0.04, + "learning_rate": 1.9913474679351073e-05, + "loss": 0.5948, + "step": 1219 + }, + { + "epoch": 0.04, + "learning_rate": 1.991333169200232e-05, + "loss": 0.6185, + "step": 1220 + }, + { + "epoch": 0.04, + "learning_rate": 1.9913188587118477e-05, + "loss": 0.6185, + "step": 1221 + }, + { + "epoch": 0.04, + "learning_rate": 1.9913045364701244e-05, + "loss": 0.6673, + "step": 1222 + }, + { + "epoch": 0.04, + "learning_rate": 1.9912902024752318e-05, + "loss": 0.65, + "step": 1223 + }, + { + "epoch": 0.04, + "learning_rate": 1.9912758567273396e-05, + "loss": 0.6195, + "step": 1224 + }, + { + "epoch": 0.04, + "learning_rate": 1.9912614992266183e-05, + "loss": 0.688, + "step": 1225 + }, + { + "epoch": 0.04, + "learning_rate": 1.991247129973238e-05, + "loss": 0.6656, + "step": 1226 + }, + { + "epoch": 0.04, + "learning_rate": 1.9912327489673694e-05, + "loss": 0.6057, + "step": 1227 + }, + { + "epoch": 0.04, + "learning_rate": 1.9912183562091822e-05, + "loss": 0.6479, + "step": 1228 + }, + { + "epoch": 0.04, + "learning_rate": 1.9912039516988475e-05, + "loss": 0.7484, + "step": 1229 + }, + { + "epoch": 0.04, + "learning_rate": 1.991189535436536e-05, + "loss": 0.6628, + "step": 1230 + }, + { + "epoch": 0.04, + "learning_rate": 1.9911751074224187e-05, + "loss": 0.6569, + "step": 1231 + }, + { + "epoch": 0.04, + "learning_rate": 1.991160667656667e-05, + "loss": 0.6042, + "step": 1232 + }, + { + "epoch": 0.04, + "learning_rate": 1.9911462161394515e-05, + "loss": 0.6056, + "step": 1233 + }, + { + "epoch": 0.04, + "learning_rate": 1.991131752870944e-05, + "loss": 0.6185, + "step": 1234 + }, + { + "epoch": 0.04, + "learning_rate": 1.9911172778513156e-05, + "loss": 0.6059, + "step": 1235 + }, + { + "epoch": 0.04, + "learning_rate": 1.9911027910807383e-05, + "loss": 0.7182, + "step": 1236 + }, + { + "epoch": 0.04, + "learning_rate": 1.9910882925593834e-05, + "loss": 0.6209, + "step": 1237 + }, + { + "epoch": 0.04, + "learning_rate": 1.991073782287423e-05, + "loss": 0.688, + "step": 1238 + }, + { + "epoch": 0.04, + "learning_rate": 1.9910592602650295e-05, + "loss": 0.616, + "step": 1239 + }, + { + "epoch": 0.04, + "learning_rate": 1.9910447264923747e-05, + "loss": 0.629, + "step": 1240 + }, + { + "epoch": 0.04, + "learning_rate": 1.991030180969631e-05, + "loss": 0.6231, + "step": 1241 + }, + { + "epoch": 0.04, + "learning_rate": 1.9910156236969706e-05, + "loss": 0.65, + "step": 1242 + }, + { + "epoch": 0.04, + "learning_rate": 1.9910010546745668e-05, + "loss": 0.622, + "step": 1243 + }, + { + "epoch": 0.04, + "learning_rate": 1.9909864739025915e-05, + "loss": 0.6233, + "step": 1244 + }, + { + "epoch": 0.04, + "learning_rate": 1.990971881381218e-05, + "loss": 0.6408, + "step": 1245 + }, + { + "epoch": 0.04, + "learning_rate": 1.9909572771106195e-05, + "loss": 0.6481, + "step": 1246 + }, + { + "epoch": 0.04, + "learning_rate": 1.9909426610909686e-05, + "loss": 0.6068, + "step": 1247 + }, + { + "epoch": 0.04, + "learning_rate": 1.990928033322439e-05, + "loss": 0.638, + "step": 1248 + }, + { + "epoch": 0.04, + "learning_rate": 1.990913393805204e-05, + "loss": 0.6249, + "step": 1249 + }, + { + "epoch": 0.04, + "learning_rate": 1.9908987425394373e-05, + "loss": 0.6598, + "step": 1250 + }, + { + "epoch": 0.04, + "learning_rate": 1.9908840795253126e-05, + "loss": 0.6811, + "step": 1251 + }, + { + "epoch": 0.04, + "learning_rate": 1.9908694047630033e-05, + "loss": 0.665, + "step": 1252 + }, + { + "epoch": 0.04, + "learning_rate": 1.990854718252684e-05, + "loss": 0.7012, + "step": 1253 + }, + { + "epoch": 0.04, + "learning_rate": 1.9908400199945286e-05, + "loss": 0.6408, + "step": 1254 + }, + { + "epoch": 0.04, + "learning_rate": 1.9908253099887114e-05, + "loss": 0.7042, + "step": 1255 + }, + { + "epoch": 0.04, + "learning_rate": 1.9908105882354066e-05, + "loss": 0.6041, + "step": 1256 + }, + { + "epoch": 0.04, + "learning_rate": 1.990795854734789e-05, + "loss": 0.5998, + "step": 1257 + }, + { + "epoch": 0.04, + "learning_rate": 1.9907811094870332e-05, + "loss": 0.6611, + "step": 1258 + }, + { + "epoch": 0.04, + "learning_rate": 1.9907663524923137e-05, + "loss": 0.6815, + "step": 1259 + }, + { + "epoch": 0.04, + "learning_rate": 1.990751583750806e-05, + "loss": 0.6243, + "step": 1260 + }, + { + "epoch": 0.04, + "learning_rate": 1.990736803262685e-05, + "loss": 0.5945, + "step": 1261 + }, + { + "epoch": 0.04, + "learning_rate": 1.990722011028126e-05, + "loss": 0.6729, + "step": 1262 + }, + { + "epoch": 0.04, + "learning_rate": 1.990707207047304e-05, + "loss": 0.6078, + "step": 1263 + }, + { + "epoch": 0.04, + "learning_rate": 1.990692391320395e-05, + "loss": 0.6977, + "step": 1264 + }, + { + "epoch": 0.04, + "learning_rate": 1.9906775638475745e-05, + "loss": 0.6339, + "step": 1265 + }, + { + "epoch": 0.04, + "learning_rate": 1.9906627246290182e-05, + "loss": 0.6844, + "step": 1266 + }, + { + "epoch": 0.04, + "learning_rate": 1.990647873664902e-05, + "loss": 0.6349, + "step": 1267 + }, + { + "epoch": 0.04, + "learning_rate": 1.9906330109554023e-05, + "loss": 0.5935, + "step": 1268 + }, + { + "epoch": 0.04, + "learning_rate": 1.990618136500695e-05, + "loss": 0.6314, + "step": 1269 + }, + { + "epoch": 0.04, + "learning_rate": 1.9906032503009567e-05, + "loss": 0.5971, + "step": 1270 + }, + { + "epoch": 0.04, + "learning_rate": 1.9905883523563637e-05, + "loss": 0.5836, + "step": 1271 + }, + { + "epoch": 0.04, + "learning_rate": 1.9905734426670924e-05, + "loss": 0.6617, + "step": 1272 + }, + { + "epoch": 0.04, + "learning_rate": 1.99055852123332e-05, + "loss": 0.675, + "step": 1273 + }, + { + "epoch": 0.04, + "learning_rate": 1.9905435880552233e-05, + "loss": 0.6747, + "step": 1274 + }, + { + "epoch": 0.04, + "learning_rate": 1.9905286431329793e-05, + "loss": 0.6227, + "step": 1275 + }, + { + "epoch": 0.04, + "learning_rate": 1.9905136864667654e-05, + "loss": 0.6117, + "step": 1276 + }, + { + "epoch": 0.04, + "learning_rate": 1.9904987180567585e-05, + "loss": 0.6002, + "step": 1277 + }, + { + "epoch": 0.04, + "learning_rate": 1.9904837379031365e-05, + "loss": 0.6462, + "step": 1278 + }, + { + "epoch": 0.04, + "learning_rate": 1.9904687460060765e-05, + "loss": 0.6675, + "step": 1279 + }, + { + "epoch": 0.04, + "learning_rate": 1.9904537423657566e-05, + "loss": 0.6415, + "step": 1280 + }, + { + "epoch": 0.04, + "learning_rate": 1.990438726982355e-05, + "loss": 0.6785, + "step": 1281 + }, + { + "epoch": 0.04, + "learning_rate": 1.990423699856049e-05, + "loss": 0.642, + "step": 1282 + }, + { + "epoch": 0.04, + "learning_rate": 1.9904086609870176e-05, + "loss": 0.6322, + "step": 1283 + }, + { + "epoch": 0.04, + "learning_rate": 1.9903936103754383e-05, + "loss": 0.7202, + "step": 1284 + }, + { + "epoch": 0.04, + "learning_rate": 1.99037854802149e-05, + "loss": 0.6776, + "step": 1285 + }, + { + "epoch": 0.04, + "learning_rate": 1.990363473925351e-05, + "loss": 0.7208, + "step": 1286 + }, + { + "epoch": 0.04, + "learning_rate": 1.9903483880872005e-05, + "loss": 0.6708, + "step": 1287 + }, + { + "epoch": 0.04, + "learning_rate": 1.9903332905072167e-05, + "loss": 0.6082, + "step": 1288 + }, + { + "epoch": 0.04, + "learning_rate": 1.9903181811855795e-05, + "loss": 0.6612, + "step": 1289 + }, + { + "epoch": 0.04, + "learning_rate": 1.990303060122467e-05, + "loss": 0.6859, + "step": 1290 + }, + { + "epoch": 0.04, + "learning_rate": 1.9902879273180592e-05, + "loss": 0.6536, + "step": 1291 + }, + { + "epoch": 0.04, + "learning_rate": 1.9902727827725355e-05, + "loss": 0.6328, + "step": 1292 + }, + { + "epoch": 0.04, + "learning_rate": 1.9902576264860747e-05, + "loss": 0.6062, + "step": 1293 + }, + { + "epoch": 0.04, + "learning_rate": 1.9902424584588574e-05, + "loss": 0.6671, + "step": 1294 + }, + { + "epoch": 0.04, + "learning_rate": 1.990227278691063e-05, + "loss": 0.7005, + "step": 1295 + }, + { + "epoch": 0.04, + "learning_rate": 1.9902120871828717e-05, + "loss": 0.6873, + "step": 1296 + }, + { + "epoch": 0.04, + "learning_rate": 1.9901968839344635e-05, + "loss": 0.6075, + "step": 1297 + }, + { + "epoch": 0.04, + "learning_rate": 1.9901816689460188e-05, + "loss": 0.6664, + "step": 1298 + }, + { + "epoch": 0.05, + "learning_rate": 1.9901664422177177e-05, + "loss": 0.6847, + "step": 1299 + }, + { + "epoch": 0.05, + "learning_rate": 1.9901512037497405e-05, + "loss": 0.6691, + "step": 1300 + }, + { + "epoch": 0.05, + "learning_rate": 1.9901359535422686e-05, + "loss": 0.6783, + "step": 1301 + }, + { + "epoch": 0.05, + "learning_rate": 1.9901206915954824e-05, + "loss": 0.6504, + "step": 1302 + }, + { + "epoch": 0.05, + "learning_rate": 1.9901054179095626e-05, + "loss": 0.6447, + "step": 1303 + }, + { + "epoch": 0.05, + "learning_rate": 1.9900901324846907e-05, + "loss": 0.6051, + "step": 1304 + }, + { + "epoch": 0.05, + "learning_rate": 1.990074835321048e-05, + "loss": 0.6807, + "step": 1305 + }, + { + "epoch": 0.05, + "learning_rate": 1.9900595264188157e-05, + "loss": 0.7003, + "step": 1306 + }, + { + "epoch": 0.05, + "learning_rate": 1.9900442057781753e-05, + "loss": 0.6297, + "step": 1307 + }, + { + "epoch": 0.05, + "learning_rate": 1.9900288733993084e-05, + "loss": 0.6416, + "step": 1308 + }, + { + "epoch": 0.05, + "learning_rate": 1.9900135292823964e-05, + "loss": 0.6375, + "step": 1309 + }, + { + "epoch": 0.05, + "learning_rate": 1.989998173427622e-05, + "loss": 0.7014, + "step": 1310 + }, + { + "epoch": 0.05, + "learning_rate": 1.9899828058351668e-05, + "loss": 0.6584, + "step": 1311 + }, + { + "epoch": 0.05, + "learning_rate": 1.989967426505213e-05, + "loss": 0.6365, + "step": 1312 + }, + { + "epoch": 0.05, + "learning_rate": 1.9899520354379435e-05, + "loss": 0.6424, + "step": 1313 + }, + { + "epoch": 0.05, + "learning_rate": 1.98993663263354e-05, + "loss": 0.6478, + "step": 1314 + }, + { + "epoch": 0.05, + "learning_rate": 1.9899212180921854e-05, + "loss": 0.6692, + "step": 1315 + }, + { + "epoch": 0.05, + "learning_rate": 1.9899057918140628e-05, + "loss": 0.6653, + "step": 1316 + }, + { + "epoch": 0.05, + "learning_rate": 1.9898903537993544e-05, + "loss": 0.6362, + "step": 1317 + }, + { + "epoch": 0.05, + "learning_rate": 1.989874904048244e-05, + "loss": 0.6465, + "step": 1318 + }, + { + "epoch": 0.05, + "learning_rate": 1.989859442560914e-05, + "loss": 0.6551, + "step": 1319 + }, + { + "epoch": 0.05, + "learning_rate": 1.989843969337548e-05, + "loss": 0.5773, + "step": 1320 + }, + { + "epoch": 0.05, + "learning_rate": 1.98982848437833e-05, + "loss": 0.6539, + "step": 1321 + }, + { + "epoch": 0.05, + "learning_rate": 1.9898129876834434e-05, + "loss": 0.6845, + "step": 1322 + }, + { + "epoch": 0.05, + "learning_rate": 1.9897974792530714e-05, + "loss": 0.7116, + "step": 1323 + }, + { + "epoch": 0.05, + "learning_rate": 1.9897819590873985e-05, + "loss": 0.6396, + "step": 1324 + }, + { + "epoch": 0.05, + "learning_rate": 1.989766427186608e-05, + "loss": 0.6699, + "step": 1325 + }, + { + "epoch": 0.05, + "learning_rate": 1.9897508835508843e-05, + "loss": 0.6493, + "step": 1326 + }, + { + "epoch": 0.05, + "learning_rate": 1.9897353281804123e-05, + "loss": 0.6554, + "step": 1327 + }, + { + "epoch": 0.05, + "learning_rate": 1.9897197610753755e-05, + "loss": 0.6815, + "step": 1328 + }, + { + "epoch": 0.05, + "learning_rate": 1.989704182235959e-05, + "loss": 0.6426, + "step": 1329 + }, + { + "epoch": 0.05, + "learning_rate": 1.9896885916623478e-05, + "loss": 0.6327, + "step": 1330 + }, + { + "epoch": 0.05, + "learning_rate": 1.989672989354726e-05, + "loss": 0.6879, + "step": 1331 + }, + { + "epoch": 0.05, + "learning_rate": 1.9896573753132794e-05, + "loss": 0.6964, + "step": 1332 + }, + { + "epoch": 0.05, + "learning_rate": 1.9896417495381925e-05, + "loss": 0.6737, + "step": 1333 + }, + { + "epoch": 0.05, + "learning_rate": 1.9896261120296505e-05, + "loss": 0.6901, + "step": 1334 + }, + { + "epoch": 0.05, + "learning_rate": 1.9896104627878393e-05, + "loss": 0.6876, + "step": 1335 + }, + { + "epoch": 0.05, + "learning_rate": 1.9895948018129444e-05, + "loss": 0.6862, + "step": 1336 + }, + { + "epoch": 0.05, + "learning_rate": 1.989579129105151e-05, + "loss": 0.7041, + "step": 1337 + }, + { + "epoch": 0.05, + "learning_rate": 1.9895634446646453e-05, + "loss": 0.6725, + "step": 1338 + }, + { + "epoch": 0.05, + "learning_rate": 1.989547748491613e-05, + "loss": 0.662, + "step": 1339 + }, + { + "epoch": 0.05, + "learning_rate": 1.9895320405862403e-05, + "loss": 0.663, + "step": 1340 + }, + { + "epoch": 0.05, + "learning_rate": 1.989516320948714e-05, + "loss": 0.6535, + "step": 1341 + }, + { + "epoch": 0.05, + "learning_rate": 1.9895005895792194e-05, + "loss": 0.6184, + "step": 1342 + }, + { + "epoch": 0.05, + "learning_rate": 1.989484846477944e-05, + "loss": 0.63, + "step": 1343 + }, + { + "epoch": 0.05, + "learning_rate": 1.9894690916450737e-05, + "loss": 0.6764, + "step": 1344 + }, + { + "epoch": 0.05, + "learning_rate": 1.9894533250807958e-05, + "loss": 0.6407, + "step": 1345 + }, + { + "epoch": 0.05, + "learning_rate": 1.9894375467852972e-05, + "loss": 0.7016, + "step": 1346 + }, + { + "epoch": 0.05, + "learning_rate": 1.9894217567587647e-05, + "loss": 0.6326, + "step": 1347 + }, + { + "epoch": 0.05, + "learning_rate": 1.9894059550013852e-05, + "loss": 0.633, + "step": 1348 + }, + { + "epoch": 0.05, + "learning_rate": 1.9893901415133472e-05, + "loss": 0.6352, + "step": 1349 + }, + { + "epoch": 0.05, + "learning_rate": 1.9893743162948373e-05, + "loss": 0.6563, + "step": 1350 + }, + { + "epoch": 0.05, + "learning_rate": 1.9893584793460432e-05, + "loss": 0.6657, + "step": 1351 + }, + { + "epoch": 0.05, + "learning_rate": 1.9893426306671527e-05, + "loss": 0.6722, + "step": 1352 + }, + { + "epoch": 0.05, + "learning_rate": 1.989326770258354e-05, + "loss": 0.6753, + "step": 1353 + }, + { + "epoch": 0.05, + "learning_rate": 1.9893108981198348e-05, + "loss": 0.6914, + "step": 1354 + }, + { + "epoch": 0.05, + "learning_rate": 1.9892950142517834e-05, + "loss": 0.669, + "step": 1355 + }, + { + "epoch": 0.05, + "learning_rate": 1.9892791186543884e-05, + "loss": 0.6292, + "step": 1356 + }, + { + "epoch": 0.05, + "learning_rate": 1.989263211327838e-05, + "loss": 0.6698, + "step": 1357 + }, + { + "epoch": 0.05, + "learning_rate": 1.9892472922723205e-05, + "loss": 0.5943, + "step": 1358 + }, + { + "epoch": 0.05, + "learning_rate": 1.989231361488025e-05, + "loss": 0.6626, + "step": 1359 + }, + { + "epoch": 0.05, + "learning_rate": 1.9892154189751403e-05, + "loss": 0.6376, + "step": 1360 + }, + { + "epoch": 0.05, + "learning_rate": 1.9891994647338556e-05, + "loss": 0.6931, + "step": 1361 + }, + { + "epoch": 0.05, + "learning_rate": 1.98918349876436e-05, + "loss": 0.6318, + "step": 1362 + }, + { + "epoch": 0.05, + "learning_rate": 1.9891675210668423e-05, + "loss": 0.659, + "step": 1363 + }, + { + "epoch": 0.05, + "learning_rate": 1.9891515316414926e-05, + "loss": 0.6579, + "step": 1364 + }, + { + "epoch": 0.05, + "learning_rate": 1.9891355304885e-05, + "loss": 0.6273, + "step": 1365 + }, + { + "epoch": 0.05, + "learning_rate": 1.9891195176080548e-05, + "loss": 0.6335, + "step": 1366 + }, + { + "epoch": 0.05, + "learning_rate": 1.9891034930003463e-05, + "loss": 0.6412, + "step": 1367 + }, + { + "epoch": 0.05, + "learning_rate": 1.9890874566655648e-05, + "loss": 0.5981, + "step": 1368 + }, + { + "epoch": 0.05, + "learning_rate": 1.9890714086039e-05, + "loss": 0.6142, + "step": 1369 + }, + { + "epoch": 0.05, + "learning_rate": 1.9890553488155425e-05, + "loss": 0.6059, + "step": 1370 + }, + { + "epoch": 0.05, + "learning_rate": 1.9890392773006828e-05, + "loss": 0.6973, + "step": 1371 + }, + { + "epoch": 0.05, + "learning_rate": 1.9890231940595112e-05, + "loss": 0.619, + "step": 1372 + }, + { + "epoch": 0.05, + "learning_rate": 1.9890070990922187e-05, + "loss": 0.6237, + "step": 1373 + }, + { + "epoch": 0.05, + "learning_rate": 1.988990992398996e-05, + "loss": 0.6392, + "step": 1374 + }, + { + "epoch": 0.05, + "learning_rate": 1.9889748739800336e-05, + "loss": 0.6901, + "step": 1375 + }, + { + "epoch": 0.05, + "learning_rate": 1.9889587438355235e-05, + "loss": 0.7011, + "step": 1376 + }, + { + "epoch": 0.05, + "learning_rate": 1.9889426019656562e-05, + "loss": 0.6798, + "step": 1377 + }, + { + "epoch": 0.05, + "learning_rate": 1.9889264483706233e-05, + "loss": 0.6473, + "step": 1378 + }, + { + "epoch": 0.05, + "learning_rate": 1.9889102830506167e-05, + "loss": 0.7064, + "step": 1379 + }, + { + "epoch": 0.05, + "learning_rate": 1.9888941060058272e-05, + "loss": 0.6719, + "step": 1380 + }, + { + "epoch": 0.05, + "learning_rate": 1.9888779172364474e-05, + "loss": 0.6724, + "step": 1381 + }, + { + "epoch": 0.05, + "learning_rate": 1.988861716742669e-05, + "loss": 0.6901, + "step": 1382 + }, + { + "epoch": 0.05, + "learning_rate": 1.9888455045246838e-05, + "loss": 0.6484, + "step": 1383 + }, + { + "epoch": 0.05, + "learning_rate": 1.9888292805826843e-05, + "loss": 0.6231, + "step": 1384 + }, + { + "epoch": 0.05, + "learning_rate": 1.988813044916863e-05, + "loss": 0.6263, + "step": 1385 + }, + { + "epoch": 0.05, + "learning_rate": 1.988796797527412e-05, + "loss": 0.643, + "step": 1386 + }, + { + "epoch": 0.05, + "learning_rate": 1.9887805384145244e-05, + "loss": 0.6264, + "step": 1387 + }, + { + "epoch": 0.05, + "learning_rate": 1.9887642675783926e-05, + "loss": 0.669, + "step": 1388 + }, + { + "epoch": 0.05, + "learning_rate": 1.9887479850192094e-05, + "loss": 0.6464, + "step": 1389 + }, + { + "epoch": 0.05, + "learning_rate": 1.988731690737168e-05, + "loss": 0.6208, + "step": 1390 + }, + { + "epoch": 0.05, + "learning_rate": 1.988715384732462e-05, + "loss": 0.6935, + "step": 1391 + }, + { + "epoch": 0.05, + "learning_rate": 1.988699067005284e-05, + "loss": 0.6288, + "step": 1392 + }, + { + "epoch": 0.05, + "learning_rate": 1.9886827375558283e-05, + "loss": 0.612, + "step": 1393 + }, + { + "epoch": 0.05, + "learning_rate": 1.988666396384288e-05, + "loss": 0.6623, + "step": 1394 + }, + { + "epoch": 0.05, + "learning_rate": 1.9886500434908565e-05, + "loss": 0.6891, + "step": 1395 + }, + { + "epoch": 0.05, + "learning_rate": 1.9886336788757285e-05, + "loss": 0.6628, + "step": 1396 + }, + { + "epoch": 0.05, + "learning_rate": 1.9886173025390977e-05, + "loss": 0.6336, + "step": 1397 + }, + { + "epoch": 0.05, + "learning_rate": 1.9886009144811575e-05, + "loss": 0.6723, + "step": 1398 + }, + { + "epoch": 0.05, + "learning_rate": 1.9885845147021035e-05, + "loss": 0.6729, + "step": 1399 + }, + { + "epoch": 0.05, + "learning_rate": 1.988568103202129e-05, + "loss": 0.6553, + "step": 1400 + }, + { + "epoch": 0.05, + "learning_rate": 1.9885516799814298e-05, + "loss": 0.6421, + "step": 1401 + }, + { + "epoch": 0.05, + "learning_rate": 1.9885352450401994e-05, + "loss": 0.6021, + "step": 1402 + }, + { + "epoch": 0.05, + "learning_rate": 1.988518798378633e-05, + "loss": 0.6737, + "step": 1403 + }, + { + "epoch": 0.05, + "learning_rate": 1.9885023399969262e-05, + "loss": 0.6451, + "step": 1404 + }, + { + "epoch": 0.05, + "learning_rate": 1.9884858698952735e-05, + "loss": 0.6484, + "step": 1405 + }, + { + "epoch": 0.05, + "learning_rate": 1.9884693880738703e-05, + "loss": 0.6756, + "step": 1406 + }, + { + "epoch": 0.05, + "learning_rate": 1.9884528945329124e-05, + "loss": 0.6399, + "step": 1407 + }, + { + "epoch": 0.05, + "learning_rate": 1.9884363892725948e-05, + "loss": 0.6359, + "step": 1408 + }, + { + "epoch": 0.05, + "learning_rate": 1.9884198722931134e-05, + "loss": 0.6248, + "step": 1409 + }, + { + "epoch": 0.05, + "learning_rate": 1.988403343594664e-05, + "loss": 0.6312, + "step": 1410 + }, + { + "epoch": 0.05, + "learning_rate": 1.9883868031774425e-05, + "loss": 0.6324, + "step": 1411 + }, + { + "epoch": 0.05, + "learning_rate": 1.9883702510416456e-05, + "loss": 0.7058, + "step": 1412 + }, + { + "epoch": 0.05, + "learning_rate": 1.9883536871874688e-05, + "loss": 0.6388, + "step": 1413 + }, + { + "epoch": 0.05, + "learning_rate": 1.9883371116151088e-05, + "loss": 0.6312, + "step": 1414 + }, + { + "epoch": 0.05, + "learning_rate": 1.9883205243247622e-05, + "loss": 0.6651, + "step": 1415 + }, + { + "epoch": 0.05, + "learning_rate": 1.9883039253166255e-05, + "loss": 0.652, + "step": 1416 + }, + { + "epoch": 0.05, + "learning_rate": 1.9882873145908955e-05, + "loss": 0.6632, + "step": 1417 + }, + { + "epoch": 0.05, + "learning_rate": 1.988270692147769e-05, + "loss": 0.6767, + "step": 1418 + }, + { + "epoch": 0.05, + "learning_rate": 1.9882540579874437e-05, + "loss": 0.6731, + "step": 1419 + }, + { + "epoch": 0.05, + "learning_rate": 1.988237412110116e-05, + "loss": 0.6888, + "step": 1420 + }, + { + "epoch": 0.05, + "learning_rate": 1.988220754515984e-05, + "loss": 0.6435, + "step": 1421 + }, + { + "epoch": 0.05, + "learning_rate": 1.9882040852052444e-05, + "loss": 0.6407, + "step": 1422 + }, + { + "epoch": 0.05, + "learning_rate": 1.9881874041780956e-05, + "loss": 0.7255, + "step": 1423 + }, + { + "epoch": 0.05, + "learning_rate": 1.988170711434735e-05, + "loss": 0.7067, + "step": 1424 + }, + { + "epoch": 0.05, + "learning_rate": 1.9881540069753606e-05, + "loss": 0.6413, + "step": 1425 + }, + { + "epoch": 0.05, + "learning_rate": 1.9881372908001704e-05, + "loss": 0.6557, + "step": 1426 + }, + { + "epoch": 0.05, + "learning_rate": 1.988120562909363e-05, + "loss": 0.6536, + "step": 1427 + }, + { + "epoch": 0.05, + "learning_rate": 1.9881038233031356e-05, + "loss": 0.6743, + "step": 1428 + }, + { + "epoch": 0.05, + "learning_rate": 1.9880870719816882e-05, + "loss": 0.6251, + "step": 1429 + }, + { + "epoch": 0.05, + "learning_rate": 1.988070308945218e-05, + "loss": 0.6675, + "step": 1430 + }, + { + "epoch": 0.05, + "learning_rate": 1.9880535341939245e-05, + "loss": 0.6477, + "step": 1431 + }, + { + "epoch": 0.05, + "learning_rate": 1.9880367477280064e-05, + "loss": 0.6542, + "step": 1432 + }, + { + "epoch": 0.05, + "learning_rate": 1.9880199495476632e-05, + "loss": 0.6795, + "step": 1433 + }, + { + "epoch": 0.05, + "learning_rate": 1.9880031396530933e-05, + "loss": 0.6401, + "step": 1434 + }, + { + "epoch": 0.05, + "learning_rate": 1.9879863180444965e-05, + "loss": 0.7072, + "step": 1435 + }, + { + "epoch": 0.05, + "learning_rate": 1.987969484722072e-05, + "loss": 0.6383, + "step": 1436 + }, + { + "epoch": 0.05, + "learning_rate": 1.9879526396860194e-05, + "loss": 0.6869, + "step": 1437 + }, + { + "epoch": 0.05, + "learning_rate": 1.9879357829365385e-05, + "loss": 0.6173, + "step": 1438 + }, + { + "epoch": 0.05, + "learning_rate": 1.9879189144738294e-05, + "loss": 0.6392, + "step": 1439 + }, + { + "epoch": 0.05, + "learning_rate": 1.987902034298092e-05, + "loss": 0.6364, + "step": 1440 + }, + { + "epoch": 0.05, + "learning_rate": 1.9878851424095254e-05, + "loss": 0.6799, + "step": 1441 + }, + { + "epoch": 0.05, + "learning_rate": 1.9878682388083314e-05, + "loss": 0.6432, + "step": 1442 + }, + { + "epoch": 0.05, + "learning_rate": 1.9878513234947097e-05, + "loss": 0.6622, + "step": 1443 + }, + { + "epoch": 0.05, + "learning_rate": 1.987834396468861e-05, + "loss": 0.6867, + "step": 1444 + }, + { + "epoch": 0.05, + "learning_rate": 1.987817457730986e-05, + "loss": 0.6514, + "step": 1445 + }, + { + "epoch": 0.05, + "learning_rate": 1.9878005072812848e-05, + "loss": 0.6882, + "step": 1446 + }, + { + "epoch": 0.05, + "learning_rate": 1.9877835451199598e-05, + "loss": 0.7195, + "step": 1447 + }, + { + "epoch": 0.05, + "learning_rate": 1.9877665712472106e-05, + "loss": 0.7126, + "step": 1448 + }, + { + "epoch": 0.05, + "learning_rate": 1.98774958566324e-05, + "loss": 0.6164, + "step": 1449 + }, + { + "epoch": 0.05, + "learning_rate": 1.987732588368248e-05, + "loss": 0.6606, + "step": 1450 + }, + { + "epoch": 0.05, + "learning_rate": 1.9877155793624366e-05, + "loss": 0.7277, + "step": 1451 + }, + { + "epoch": 0.05, + "learning_rate": 1.9876985586460078e-05, + "loss": 0.6283, + "step": 1452 + }, + { + "epoch": 0.05, + "learning_rate": 1.987681526219163e-05, + "loss": 0.6189, + "step": 1453 + }, + { + "epoch": 0.05, + "learning_rate": 1.9876644820821044e-05, + "loss": 0.7051, + "step": 1454 + }, + { + "epoch": 0.05, + "learning_rate": 1.987647426235034e-05, + "loss": 0.6037, + "step": 1455 + }, + { + "epoch": 0.05, + "learning_rate": 1.987630358678154e-05, + "loss": 0.5958, + "step": 1456 + }, + { + "epoch": 0.05, + "learning_rate": 1.9876132794116666e-05, + "loss": 0.6899, + "step": 1457 + }, + { + "epoch": 0.05, + "learning_rate": 1.9875961884357743e-05, + "loss": 0.6467, + "step": 1458 + }, + { + "epoch": 0.05, + "learning_rate": 1.9875790857506797e-05, + "loss": 0.6572, + "step": 1459 + }, + { + "epoch": 0.05, + "learning_rate": 1.9875619713565863e-05, + "loss": 0.6796, + "step": 1460 + }, + { + "epoch": 0.05, + "learning_rate": 1.987544845253696e-05, + "loss": 0.6563, + "step": 1461 + }, + { + "epoch": 0.05, + "learning_rate": 1.9875277074422127e-05, + "loss": 0.6815, + "step": 1462 + }, + { + "epoch": 0.05, + "learning_rate": 1.9875105579223392e-05, + "loss": 0.6722, + "step": 1463 + }, + { + "epoch": 0.05, + "learning_rate": 1.9874933966942786e-05, + "loss": 0.6836, + "step": 1464 + }, + { + "epoch": 0.05, + "learning_rate": 1.9874762237582348e-05, + "loss": 0.6554, + "step": 1465 + }, + { + "epoch": 0.05, + "learning_rate": 1.9874590391144108e-05, + "loss": 0.6118, + "step": 1466 + }, + { + "epoch": 0.05, + "learning_rate": 1.9874418427630113e-05, + "loss": 0.5869, + "step": 1467 + }, + { + "epoch": 0.05, + "learning_rate": 1.9874246347042395e-05, + "loss": 0.5536, + "step": 1468 + }, + { + "epoch": 0.05, + "learning_rate": 1.987407414938299e-05, + "loss": 0.6216, + "step": 1469 + }, + { + "epoch": 0.05, + "learning_rate": 1.987390183465395e-05, + "loss": 0.6683, + "step": 1470 + }, + { + "epoch": 0.05, + "learning_rate": 1.9873729402857315e-05, + "loss": 0.7107, + "step": 1471 + }, + { + "epoch": 0.05, + "learning_rate": 1.9873556853995123e-05, + "loss": 0.6345, + "step": 1472 + }, + { + "epoch": 0.05, + "learning_rate": 1.9873384188069427e-05, + "loss": 0.6362, + "step": 1473 + }, + { + "epoch": 0.05, + "learning_rate": 1.987321140508227e-05, + "loss": 0.6946, + "step": 1474 + }, + { + "epoch": 0.05, + "learning_rate": 1.9873038505035705e-05, + "loss": 0.6397, + "step": 1475 + }, + { + "epoch": 0.05, + "learning_rate": 1.9872865487931776e-05, + "loss": 0.6781, + "step": 1476 + }, + { + "epoch": 0.05, + "learning_rate": 1.9872692353772538e-05, + "loss": 0.6732, + "step": 1477 + }, + { + "epoch": 0.05, + "learning_rate": 1.9872519102560045e-05, + "loss": 0.6368, + "step": 1478 + }, + { + "epoch": 0.05, + "learning_rate": 1.9872345734296348e-05, + "loss": 0.6446, + "step": 1479 + }, + { + "epoch": 0.05, + "learning_rate": 1.9872172248983505e-05, + "loss": 0.6964, + "step": 1480 + }, + { + "epoch": 0.05, + "learning_rate": 1.987199864662357e-05, + "loss": 0.6075, + "step": 1481 + }, + { + "epoch": 0.05, + "learning_rate": 1.9871824927218603e-05, + "loss": 0.6619, + "step": 1482 + }, + { + "epoch": 0.05, + "learning_rate": 1.9871651090770664e-05, + "loss": 0.6759, + "step": 1483 + }, + { + "epoch": 0.05, + "learning_rate": 1.9871477137281813e-05, + "loss": 0.7027, + "step": 1484 + }, + { + "epoch": 0.05, + "learning_rate": 1.9871303066754113e-05, + "loss": 0.6964, + "step": 1485 + }, + { + "epoch": 0.05, + "learning_rate": 1.9871128879189628e-05, + "loss": 0.6691, + "step": 1486 + }, + { + "epoch": 0.05, + "learning_rate": 1.9870954574590425e-05, + "loss": 0.6382, + "step": 1487 + }, + { + "epoch": 0.05, + "learning_rate": 1.9870780152958566e-05, + "loss": 0.6271, + "step": 1488 + }, + { + "epoch": 0.05, + "learning_rate": 1.9870605614296123e-05, + "loss": 0.6333, + "step": 1489 + }, + { + "epoch": 0.05, + "learning_rate": 1.9870430958605165e-05, + "loss": 0.589, + "step": 1490 + }, + { + "epoch": 0.05, + "learning_rate": 1.9870256185887758e-05, + "loss": 0.6758, + "step": 1491 + }, + { + "epoch": 0.05, + "learning_rate": 1.987008129614598e-05, + "loss": 0.6234, + "step": 1492 + }, + { + "epoch": 0.05, + "learning_rate": 1.9869906289381906e-05, + "loss": 0.6719, + "step": 1493 + }, + { + "epoch": 0.05, + "learning_rate": 1.9869731165597603e-05, + "loss": 0.6746, + "step": 1494 + }, + { + "epoch": 0.05, + "learning_rate": 1.9869555924795153e-05, + "loss": 0.6948, + "step": 1495 + }, + { + "epoch": 0.05, + "learning_rate": 1.9869380566976637e-05, + "loss": 0.6403, + "step": 1496 + }, + { + "epoch": 0.05, + "learning_rate": 1.9869205092144123e-05, + "loss": 0.649, + "step": 1497 + }, + { + "epoch": 0.05, + "learning_rate": 1.98690295002997e-05, + "loss": 0.6473, + "step": 1498 + }, + { + "epoch": 0.05, + "learning_rate": 1.9868853791445448e-05, + "loss": 0.72, + "step": 1499 + }, + { + "epoch": 0.05, + "learning_rate": 1.986867796558345e-05, + "loss": 0.597, + "step": 1500 + }, + { + "epoch": 0.05, + "learning_rate": 1.986850202271579e-05, + "loss": 0.6726, + "step": 1501 + }, + { + "epoch": 0.05, + "learning_rate": 1.986832596284456e-05, + "loss": 0.6268, + "step": 1502 + }, + { + "epoch": 0.05, + "learning_rate": 1.9868149785971837e-05, + "loss": 0.5721, + "step": 1503 + }, + { + "epoch": 0.05, + "learning_rate": 1.9867973492099715e-05, + "loss": 0.6725, + "step": 1504 + }, + { + "epoch": 0.05, + "learning_rate": 1.9867797081230285e-05, + "loss": 0.6535, + "step": 1505 + }, + { + "epoch": 0.05, + "learning_rate": 1.986762055336564e-05, + "loss": 0.6679, + "step": 1506 + }, + { + "epoch": 0.05, + "learning_rate": 1.9867443908507868e-05, + "loss": 0.636, + "step": 1507 + }, + { + "epoch": 0.05, + "learning_rate": 1.9867267146659067e-05, + "loss": 0.6293, + "step": 1508 + }, + { + "epoch": 0.05, + "learning_rate": 1.9867090267821333e-05, + "loss": 0.694, + "step": 1509 + }, + { + "epoch": 0.05, + "learning_rate": 1.986691327199676e-05, + "loss": 0.6236, + "step": 1510 + }, + { + "epoch": 0.05, + "learning_rate": 1.986673615918745e-05, + "loss": 0.6556, + "step": 1511 + }, + { + "epoch": 0.05, + "learning_rate": 1.98665589293955e-05, + "loss": 0.6188, + "step": 1512 + }, + { + "epoch": 0.05, + "learning_rate": 1.9866381582623012e-05, + "loss": 0.6471, + "step": 1513 + }, + { + "epoch": 0.05, + "learning_rate": 1.9866204118872093e-05, + "loss": 0.6375, + "step": 1514 + }, + { + "epoch": 0.05, + "learning_rate": 1.986602653814484e-05, + "loss": 0.6576, + "step": 1515 + }, + { + "epoch": 0.05, + "learning_rate": 1.9865848840443363e-05, + "loss": 0.6541, + "step": 1516 + }, + { + "epoch": 0.05, + "learning_rate": 1.9865671025769767e-05, + "loss": 0.6435, + "step": 1517 + }, + { + "epoch": 0.05, + "learning_rate": 1.986549309412616e-05, + "loss": 0.6192, + "step": 1518 + }, + { + "epoch": 0.05, + "learning_rate": 1.9865315045514653e-05, + "loss": 0.6498, + "step": 1519 + }, + { + "epoch": 0.05, + "learning_rate": 1.9865136879937357e-05, + "loss": 0.6623, + "step": 1520 + }, + { + "epoch": 0.05, + "learning_rate": 1.9864958597396385e-05, + "loss": 0.6449, + "step": 1521 + }, + { + "epoch": 0.05, + "learning_rate": 1.9864780197893848e-05, + "loss": 0.6395, + "step": 1522 + }, + { + "epoch": 0.05, + "learning_rate": 1.9864601681431862e-05, + "loss": 0.6753, + "step": 1523 + }, + { + "epoch": 0.05, + "learning_rate": 1.986442304801255e-05, + "loss": 0.5958, + "step": 1524 + }, + { + "epoch": 0.05, + "learning_rate": 1.986424429763802e-05, + "loss": 0.6662, + "step": 1525 + }, + { + "epoch": 0.05, + "learning_rate": 1.9864065430310392e-05, + "loss": 0.6639, + "step": 1526 + }, + { + "epoch": 0.05, + "learning_rate": 1.986388644603179e-05, + "loss": 0.6664, + "step": 1527 + }, + { + "epoch": 0.05, + "learning_rate": 1.9863707344804345e-05, + "loss": 0.6815, + "step": 1528 + }, + { + "epoch": 0.05, + "learning_rate": 1.9863528126630166e-05, + "loss": 0.6952, + "step": 1529 + }, + { + "epoch": 0.05, + "learning_rate": 1.9863348791511382e-05, + "loss": 0.669, + "step": 1530 + }, + { + "epoch": 0.05, + "learning_rate": 1.9863169339450126e-05, + "loss": 0.6493, + "step": 1531 + }, + { + "epoch": 0.05, + "learning_rate": 1.9862989770448517e-05, + "loss": 0.6283, + "step": 1532 + }, + { + "epoch": 0.05, + "learning_rate": 1.9862810084508687e-05, + "loss": 0.66, + "step": 1533 + }, + { + "epoch": 0.05, + "learning_rate": 1.986263028163277e-05, + "loss": 0.668, + "step": 1534 + }, + { + "epoch": 0.05, + "learning_rate": 1.986245036182289e-05, + "loss": 0.669, + "step": 1535 + }, + { + "epoch": 0.05, + "learning_rate": 1.986227032508119e-05, + "loss": 0.6989, + "step": 1536 + }, + { + "epoch": 0.05, + "learning_rate": 1.9862090171409795e-05, + "loss": 0.6742, + "step": 1537 + }, + { + "epoch": 0.05, + "learning_rate": 1.986190990081085e-05, + "loss": 0.6209, + "step": 1538 + }, + { + "epoch": 0.05, + "learning_rate": 1.986172951328648e-05, + "loss": 0.6729, + "step": 1539 + }, + { + "epoch": 0.05, + "learning_rate": 1.986154900883884e-05, + "loss": 0.6454, + "step": 1540 + }, + { + "epoch": 0.05, + "learning_rate": 1.986136838747006e-05, + "loss": 0.6318, + "step": 1541 + }, + { + "epoch": 0.05, + "learning_rate": 1.986118764918228e-05, + "loss": 0.632, + "step": 1542 + }, + { + "epoch": 0.05, + "learning_rate": 1.9861006793977648e-05, + "loss": 0.6394, + "step": 1543 + }, + { + "epoch": 0.05, + "learning_rate": 1.9860825821858304e-05, + "loss": 0.6525, + "step": 1544 + }, + { + "epoch": 0.05, + "learning_rate": 1.98606447328264e-05, + "loss": 0.6132, + "step": 1545 + }, + { + "epoch": 0.05, + "learning_rate": 1.9860463526884074e-05, + "loss": 0.7398, + "step": 1546 + }, + { + "epoch": 0.05, + "learning_rate": 1.9860282204033484e-05, + "loss": 0.6128, + "step": 1547 + }, + { + "epoch": 0.05, + "learning_rate": 1.986010076427677e-05, + "loss": 0.6755, + "step": 1548 + }, + { + "epoch": 0.05, + "learning_rate": 1.985991920761609e-05, + "loss": 0.6336, + "step": 1549 + }, + { + "epoch": 0.05, + "learning_rate": 1.98597375340536e-05, + "loss": 0.6816, + "step": 1550 + }, + { + "epoch": 0.05, + "learning_rate": 1.9859555743591443e-05, + "loss": 0.6598, + "step": 1551 + }, + { + "epoch": 0.05, + "learning_rate": 1.985937383623178e-05, + "loss": 0.6152, + "step": 1552 + }, + { + "epoch": 0.05, + "learning_rate": 1.985919181197677e-05, + "loss": 0.654, + "step": 1553 + }, + { + "epoch": 0.05, + "learning_rate": 1.985900967082857e-05, + "loss": 0.6337, + "step": 1554 + }, + { + "epoch": 0.05, + "learning_rate": 1.985882741278934e-05, + "loss": 0.6617, + "step": 1555 + }, + { + "epoch": 0.05, + "learning_rate": 1.9858645037861237e-05, + "loss": 0.6571, + "step": 1556 + }, + { + "epoch": 0.05, + "learning_rate": 1.9858462546046426e-05, + "loss": 0.6223, + "step": 1557 + }, + { + "epoch": 0.05, + "learning_rate": 1.985827993734707e-05, + "loss": 0.628, + "step": 1558 + }, + { + "epoch": 0.05, + "learning_rate": 1.9858097211765336e-05, + "loss": 0.64, + "step": 1559 + }, + { + "epoch": 0.05, + "learning_rate": 1.985791436930339e-05, + "loss": 0.6326, + "step": 1560 + }, + { + "epoch": 0.05, + "learning_rate": 1.9857731409963397e-05, + "loss": 0.6731, + "step": 1561 + }, + { + "epoch": 0.05, + "learning_rate": 1.985754833374753e-05, + "loss": 0.6663, + "step": 1562 + }, + { + "epoch": 0.05, + "learning_rate": 1.9857365140657954e-05, + "loss": 0.6838, + "step": 1563 + }, + { + "epoch": 0.05, + "learning_rate": 1.9857181830696848e-05, + "loss": 0.6229, + "step": 1564 + }, + { + "epoch": 0.05, + "learning_rate": 1.9856998403866378e-05, + "loss": 0.6276, + "step": 1565 + }, + { + "epoch": 0.05, + "learning_rate": 1.985681486016873e-05, + "loss": 0.6309, + "step": 1566 + }, + { + "epoch": 0.05, + "learning_rate": 1.9856631199606066e-05, + "loss": 0.6796, + "step": 1567 + }, + { + "epoch": 0.05, + "learning_rate": 1.985644742218057e-05, + "loss": 0.6719, + "step": 1568 + }, + { + "epoch": 0.05, + "learning_rate": 1.9856263527894426e-05, + "loss": 0.693, + "step": 1569 + }, + { + "epoch": 0.05, + "learning_rate": 1.9856079516749807e-05, + "loss": 0.6737, + "step": 1570 + }, + { + "epoch": 0.05, + "learning_rate": 1.98558953887489e-05, + "loss": 0.6907, + "step": 1571 + }, + { + "epoch": 0.05, + "learning_rate": 1.985571114389388e-05, + "loss": 0.6599, + "step": 1572 + }, + { + "epoch": 0.05, + "learning_rate": 1.9855526782186942e-05, + "loss": 0.6608, + "step": 1573 + }, + { + "epoch": 0.05, + "learning_rate": 1.9855342303630264e-05, + "loss": 0.628, + "step": 1574 + }, + { + "epoch": 0.05, + "learning_rate": 1.9855157708226035e-05, + "loss": 0.6486, + "step": 1575 + }, + { + "epoch": 0.05, + "learning_rate": 1.9854972995976446e-05, + "loss": 0.6874, + "step": 1576 + }, + { + "epoch": 0.05, + "learning_rate": 1.9854788166883687e-05, + "loss": 0.7012, + "step": 1577 + }, + { + "epoch": 0.05, + "learning_rate": 1.9854603220949946e-05, + "loss": 0.6682, + "step": 1578 + }, + { + "epoch": 0.05, + "learning_rate": 1.985441815817742e-05, + "loss": 0.6766, + "step": 1579 + }, + { + "epoch": 0.05, + "learning_rate": 1.98542329785683e-05, + "loss": 0.6982, + "step": 1580 + }, + { + "epoch": 0.05, + "learning_rate": 1.9854047682124782e-05, + "loss": 0.6698, + "step": 1581 + }, + { + "epoch": 0.05, + "learning_rate": 1.9853862268849063e-05, + "loss": 0.6369, + "step": 1582 + }, + { + "epoch": 0.05, + "learning_rate": 1.985367673874334e-05, + "loss": 0.6122, + "step": 1583 + }, + { + "epoch": 0.05, + "learning_rate": 1.9853491091809814e-05, + "loss": 0.6798, + "step": 1584 + }, + { + "epoch": 0.05, + "learning_rate": 1.985330532805069e-05, + "loss": 0.6697, + "step": 1585 + }, + { + "epoch": 0.05, + "learning_rate": 1.9853119447468167e-05, + "loss": 0.6557, + "step": 1586 + }, + { + "epoch": 0.05, + "learning_rate": 1.9852933450064446e-05, + "loss": 0.6646, + "step": 1587 + }, + { + "epoch": 0.06, + "learning_rate": 1.9852747335841736e-05, + "loss": 0.7025, + "step": 1588 + }, + { + "epoch": 0.06, + "learning_rate": 1.9852561104802238e-05, + "loss": 0.6149, + "step": 1589 + }, + { + "epoch": 0.06, + "learning_rate": 1.9852374756948173e-05, + "loss": 0.6556, + "step": 1590 + }, + { + "epoch": 0.06, + "learning_rate": 1.9852188292281736e-05, + "loss": 0.6084, + "step": 1591 + }, + { + "epoch": 0.06, + "learning_rate": 1.9852001710805145e-05, + "loss": 0.6217, + "step": 1592 + }, + { + "epoch": 0.06, + "learning_rate": 1.9851815012520614e-05, + "loss": 0.6503, + "step": 1593 + }, + { + "epoch": 0.06, + "learning_rate": 1.9851628197430347e-05, + "loss": 0.6302, + "step": 1594 + }, + { + "epoch": 0.06, + "learning_rate": 1.9851441265536572e-05, + "loss": 0.674, + "step": 1595 + }, + { + "epoch": 0.06, + "learning_rate": 1.9851254216841493e-05, + "loss": 0.6594, + "step": 1596 + }, + { + "epoch": 0.06, + "learning_rate": 1.9851067051347337e-05, + "loss": 0.6454, + "step": 1597 + }, + { + "epoch": 0.06, + "learning_rate": 1.9850879769056316e-05, + "loss": 0.682, + "step": 1598 + }, + { + "epoch": 0.06, + "learning_rate": 1.985069236997066e-05, + "loss": 0.6718, + "step": 1599 + }, + { + "epoch": 0.06, + "learning_rate": 1.985050485409258e-05, + "loss": 0.7154, + "step": 1600 + }, + { + "epoch": 0.06, + "learning_rate": 1.9850317221424308e-05, + "loss": 0.6944, + "step": 1601 + }, + { + "epoch": 0.06, + "learning_rate": 1.9850129471968057e-05, + "loss": 0.6619, + "step": 1602 + }, + { + "epoch": 0.06, + "learning_rate": 1.9849941605726068e-05, + "loss": 0.6105, + "step": 1603 + }, + { + "epoch": 0.06, + "learning_rate": 1.984975362270056e-05, + "loss": 0.6755, + "step": 1604 + }, + { + "epoch": 0.06, + "learning_rate": 1.984956552289376e-05, + "loss": 0.6717, + "step": 1605 + }, + { + "epoch": 0.06, + "learning_rate": 1.98493773063079e-05, + "loss": 0.6058, + "step": 1606 + }, + { + "epoch": 0.06, + "learning_rate": 1.9849188972945215e-05, + "loss": 0.6064, + "step": 1607 + }, + { + "epoch": 0.06, + "learning_rate": 1.9849000522807938e-05, + "loss": 0.6756, + "step": 1608 + }, + { + "epoch": 0.06, + "learning_rate": 1.9848811955898296e-05, + "loss": 0.6622, + "step": 1609 + }, + { + "epoch": 0.06, + "learning_rate": 1.984862327221853e-05, + "loss": 0.6317, + "step": 1610 + }, + { + "epoch": 0.06, + "learning_rate": 1.9848434471770878e-05, + "loss": 0.6827, + "step": 1611 + }, + { + "epoch": 0.06, + "learning_rate": 1.9848245554557577e-05, + "loss": 0.619, + "step": 1612 + }, + { + "epoch": 0.06, + "learning_rate": 1.9848056520580866e-05, + "loss": 0.651, + "step": 1613 + }, + { + "epoch": 0.06, + "learning_rate": 1.9847867369842987e-05, + "loss": 0.622, + "step": 1614 + }, + { + "epoch": 0.06, + "learning_rate": 1.9847678102346188e-05, + "loss": 0.7039, + "step": 1615 + }, + { + "epoch": 0.06, + "learning_rate": 1.98474887180927e-05, + "loss": 0.6355, + "step": 1616 + }, + { + "epoch": 0.06, + "learning_rate": 1.984729921708478e-05, + "loss": 0.6322, + "step": 1617 + }, + { + "epoch": 0.06, + "learning_rate": 1.9847109599324674e-05, + "loss": 0.677, + "step": 1618 + }, + { + "epoch": 0.06, + "learning_rate": 1.984691986481462e-05, + "loss": 0.6476, + "step": 1619 + }, + { + "epoch": 0.06, + "learning_rate": 1.9846730013556877e-05, + "loss": 0.6263, + "step": 1620 + }, + { + "epoch": 0.06, + "learning_rate": 1.9846540045553696e-05, + "loss": 0.6533, + "step": 1621 + }, + { + "epoch": 0.06, + "learning_rate": 1.9846349960807325e-05, + "loss": 0.6446, + "step": 1622 + }, + { + "epoch": 0.06, + "learning_rate": 1.9846159759320017e-05, + "loss": 0.6793, + "step": 1623 + }, + { + "epoch": 0.06, + "learning_rate": 1.9845969441094035e-05, + "loss": 0.7626, + "step": 1624 + }, + { + "epoch": 0.06, + "learning_rate": 1.9845779006131626e-05, + "loss": 0.6473, + "step": 1625 + }, + { + "epoch": 0.06, + "learning_rate": 1.9845588454435056e-05, + "loss": 0.6648, + "step": 1626 + }, + { + "epoch": 0.06, + "learning_rate": 1.9845397786006578e-05, + "loss": 0.6301, + "step": 1627 + }, + { + "epoch": 0.06, + "learning_rate": 1.9845207000848453e-05, + "loss": 0.7015, + "step": 1628 + }, + { + "epoch": 0.06, + "learning_rate": 1.9845016098962943e-05, + "loss": 0.5658, + "step": 1629 + }, + { + "epoch": 0.06, + "learning_rate": 1.9844825080352315e-05, + "loss": 0.5699, + "step": 1630 + }, + { + "epoch": 0.06, + "learning_rate": 1.9844633945018837e-05, + "loss": 0.5991, + "step": 1631 + }, + { + "epoch": 0.06, + "learning_rate": 1.9844442692964763e-05, + "loss": 0.6714, + "step": 1632 + }, + { + "epoch": 0.06, + "learning_rate": 1.9844251324192376e-05, + "loss": 0.6434, + "step": 1633 + }, + { + "epoch": 0.06, + "learning_rate": 1.9844059838703926e-05, + "loss": 0.6246, + "step": 1634 + }, + { + "epoch": 0.06, + "learning_rate": 1.98438682365017e-05, + "loss": 0.6685, + "step": 1635 + }, + { + "epoch": 0.06, + "learning_rate": 1.984367651758796e-05, + "loss": 0.6328, + "step": 1636 + }, + { + "epoch": 0.06, + "learning_rate": 1.984348468196499e-05, + "loss": 0.6532, + "step": 1637 + }, + { + "epoch": 0.06, + "learning_rate": 1.984329272963505e-05, + "loss": 0.6377, + "step": 1638 + }, + { + "epoch": 0.06, + "learning_rate": 1.9843100660600426e-05, + "loss": 0.6448, + "step": 1639 + }, + { + "epoch": 0.06, + "learning_rate": 1.984290847486339e-05, + "loss": 0.6868, + "step": 1640 + }, + { + "epoch": 0.06, + "learning_rate": 1.984271617242622e-05, + "loss": 0.6848, + "step": 1641 + }, + { + "epoch": 0.06, + "learning_rate": 1.9842523753291206e-05, + "loss": 0.616, + "step": 1642 + }, + { + "epoch": 0.06, + "learning_rate": 1.9842331217460618e-05, + "loss": 0.6908, + "step": 1643 + }, + { + "epoch": 0.06, + "learning_rate": 1.9842138564936744e-05, + "loss": 0.6943, + "step": 1644 + }, + { + "epoch": 0.06, + "learning_rate": 1.9841945795721863e-05, + "loss": 0.6651, + "step": 1645 + }, + { + "epoch": 0.06, + "learning_rate": 1.984175290981827e-05, + "loss": 0.7029, + "step": 1646 + }, + { + "epoch": 0.06, + "learning_rate": 1.9841559907228243e-05, + "loss": 0.6716, + "step": 1647 + }, + { + "epoch": 0.06, + "learning_rate": 1.9841366787954076e-05, + "loss": 0.6629, + "step": 1648 + }, + { + "epoch": 0.06, + "learning_rate": 1.9841173551998055e-05, + "loss": 0.6408, + "step": 1649 + }, + { + "epoch": 0.06, + "learning_rate": 1.9840980199362473e-05, + "loss": 0.6243, + "step": 1650 + }, + { + "epoch": 0.06, + "learning_rate": 1.984078673004962e-05, + "loss": 0.6464, + "step": 1651 + }, + { + "epoch": 0.06, + "learning_rate": 1.9840593144061794e-05, + "loss": 0.657, + "step": 1652 + }, + { + "epoch": 0.06, + "learning_rate": 1.9840399441401284e-05, + "loss": 0.6517, + "step": 1653 + }, + { + "epoch": 0.06, + "learning_rate": 1.9840205622070396e-05, + "loss": 0.6366, + "step": 1654 + }, + { + "epoch": 0.06, + "learning_rate": 1.984001168607142e-05, + "loss": 0.6209, + "step": 1655 + }, + { + "epoch": 0.06, + "learning_rate": 1.9839817633406656e-05, + "loss": 0.6138, + "step": 1656 + }, + { + "epoch": 0.06, + "learning_rate": 1.9839623464078407e-05, + "loss": 0.6765, + "step": 1657 + }, + { + "epoch": 0.06, + "learning_rate": 1.9839429178088976e-05, + "loss": 0.6673, + "step": 1658 + }, + { + "epoch": 0.06, + "learning_rate": 1.9839234775440667e-05, + "loss": 0.6125, + "step": 1659 + }, + { + "epoch": 0.06, + "learning_rate": 1.983904025613578e-05, + "loss": 0.6958, + "step": 1660 + }, + { + "epoch": 0.06, + "learning_rate": 1.9838845620176623e-05, + "loss": 0.6555, + "step": 1661 + }, + { + "epoch": 0.06, + "learning_rate": 1.9838650867565507e-05, + "loss": 0.6502, + "step": 1662 + }, + { + "epoch": 0.06, + "learning_rate": 1.983845599830474e-05, + "loss": 0.6443, + "step": 1663 + }, + { + "epoch": 0.06, + "learning_rate": 1.983826101239663e-05, + "loss": 0.6601, + "step": 1664 + }, + { + "epoch": 0.06, + "learning_rate": 1.9838065909843493e-05, + "loss": 0.6819, + "step": 1665 + }, + { + "epoch": 0.06, + "learning_rate": 1.9837870690647633e-05, + "loss": 0.7038, + "step": 1666 + }, + { + "epoch": 0.06, + "learning_rate": 1.9837675354811378e-05, + "loss": 0.6084, + "step": 1667 + }, + { + "epoch": 0.06, + "learning_rate": 1.9837479902337033e-05, + "loss": 0.5908, + "step": 1668 + }, + { + "epoch": 0.06, + "learning_rate": 1.983728433322692e-05, + "loss": 0.6706, + "step": 1669 + }, + { + "epoch": 0.06, + "learning_rate": 1.983708864748336e-05, + "loss": 0.7215, + "step": 1670 + }, + { + "epoch": 0.06, + "learning_rate": 1.9836892845108666e-05, + "loss": 0.6364, + "step": 1671 + }, + { + "epoch": 0.06, + "learning_rate": 1.9836696926105162e-05, + "loss": 0.6727, + "step": 1672 + }, + { + "epoch": 0.06, + "learning_rate": 1.9836500890475176e-05, + "loss": 0.6614, + "step": 1673 + }, + { + "epoch": 0.06, + "learning_rate": 1.9836304738221027e-05, + "loss": 0.6358, + "step": 1674 + }, + { + "epoch": 0.06, + "learning_rate": 1.9836108469345045e-05, + "loss": 0.6526, + "step": 1675 + }, + { + "epoch": 0.06, + "learning_rate": 1.9835912083849554e-05, + "loss": 0.6642, + "step": 1676 + }, + { + "epoch": 0.06, + "learning_rate": 1.983571558173688e-05, + "loss": 0.6378, + "step": 1677 + }, + { + "epoch": 0.06, + "learning_rate": 1.983551896300936e-05, + "loss": 0.6549, + "step": 1678 + }, + { + "epoch": 0.06, + "learning_rate": 1.9835322227669317e-05, + "loss": 0.6591, + "step": 1679 + }, + { + "epoch": 0.06, + "learning_rate": 1.9835125375719086e-05, + "loss": 0.6439, + "step": 1680 + }, + { + "epoch": 0.06, + "learning_rate": 1.9834928407161005e-05, + "loss": 0.6908, + "step": 1681 + }, + { + "epoch": 0.06, + "learning_rate": 1.9834731321997406e-05, + "loss": 0.6865, + "step": 1682 + }, + { + "epoch": 0.06, + "learning_rate": 1.9834534120230626e-05, + "loss": 0.6352, + "step": 1683 + }, + { + "epoch": 0.06, + "learning_rate": 1.9834336801863004e-05, + "loss": 0.6781, + "step": 1684 + }, + { + "epoch": 0.06, + "learning_rate": 1.983413936689688e-05, + "loss": 0.6983, + "step": 1685 + }, + { + "epoch": 0.06, + "learning_rate": 1.9833941815334588e-05, + "loss": 0.6352, + "step": 1686 + }, + { + "epoch": 0.06, + "learning_rate": 1.983374414717848e-05, + "loss": 0.7022, + "step": 1687 + }, + { + "epoch": 0.06, + "learning_rate": 1.9833546362430892e-05, + "loss": 0.6684, + "step": 1688 + }, + { + "epoch": 0.06, + "learning_rate": 1.983334846109418e-05, + "loss": 0.6555, + "step": 1689 + }, + { + "epoch": 0.06, + "learning_rate": 1.9833150443170675e-05, + "loss": 0.6848, + "step": 1690 + }, + { + "epoch": 0.06, + "learning_rate": 1.9832952308662733e-05, + "loss": 0.5992, + "step": 1691 + }, + { + "epoch": 0.06, + "learning_rate": 1.9832754057572706e-05, + "loss": 0.6612, + "step": 1692 + }, + { + "epoch": 0.06, + "learning_rate": 1.9832555689902942e-05, + "loss": 0.6513, + "step": 1693 + }, + { + "epoch": 0.06, + "learning_rate": 1.983235720565579e-05, + "loss": 0.6094, + "step": 1694 + }, + { + "epoch": 0.06, + "learning_rate": 1.9832158604833605e-05, + "loss": 0.5358, + "step": 1695 + }, + { + "epoch": 0.06, + "learning_rate": 1.9831959887438743e-05, + "loss": 0.6332, + "step": 1696 + }, + { + "epoch": 0.06, + "learning_rate": 1.9831761053473558e-05, + "loss": 0.6903, + "step": 1697 + }, + { + "epoch": 0.06, + "learning_rate": 1.9831562102940406e-05, + "loss": 0.6224, + "step": 1698 + }, + { + "epoch": 0.06, + "learning_rate": 1.9831363035841654e-05, + "loss": 0.708, + "step": 1699 + }, + { + "epoch": 0.06, + "learning_rate": 1.983116385217965e-05, + "loss": 0.6803, + "step": 1700 + }, + { + "epoch": 0.06, + "learning_rate": 1.9830964551956767e-05, + "loss": 0.6729, + "step": 1701 + }, + { + "epoch": 0.06, + "learning_rate": 1.9830765135175363e-05, + "loss": 0.6696, + "step": 1702 + }, + { + "epoch": 0.06, + "learning_rate": 1.98305656018378e-05, + "loss": 0.6447, + "step": 1703 + }, + { + "epoch": 0.06, + "learning_rate": 1.9830365951946448e-05, + "loss": 0.7428, + "step": 1704 + }, + { + "epoch": 0.06, + "learning_rate": 1.9830166185503674e-05, + "loss": 0.6939, + "step": 1705 + }, + { + "epoch": 0.06, + "learning_rate": 1.982996630251184e-05, + "loss": 0.6875, + "step": 1706 + }, + { + "epoch": 0.06, + "learning_rate": 1.9829766302973322e-05, + "loss": 0.6409, + "step": 1707 + }, + { + "epoch": 0.06, + "learning_rate": 1.982956618689049e-05, + "loss": 0.6107, + "step": 1708 + }, + { + "epoch": 0.06, + "learning_rate": 1.9829365954265717e-05, + "loss": 0.6183, + "step": 1709 + }, + { + "epoch": 0.06, + "learning_rate": 1.9829165605101375e-05, + "loss": 0.6833, + "step": 1710 + }, + { + "epoch": 0.06, + "learning_rate": 1.982896513939984e-05, + "loss": 0.6267, + "step": 1711 + }, + { + "epoch": 0.06, + "learning_rate": 1.9828764557163494e-05, + "loss": 0.6329, + "step": 1712 + }, + { + "epoch": 0.06, + "learning_rate": 1.9828563858394706e-05, + "loss": 0.6547, + "step": 1713 + }, + { + "epoch": 0.06, + "learning_rate": 1.9828363043095864e-05, + "loss": 0.5749, + "step": 1714 + }, + { + "epoch": 0.06, + "learning_rate": 1.9828162111269345e-05, + "loss": 0.6522, + "step": 1715 + }, + { + "epoch": 0.06, + "learning_rate": 1.982796106291753e-05, + "loss": 0.604, + "step": 1716 + }, + { + "epoch": 0.06, + "learning_rate": 1.98277598980428e-05, + "loss": 0.6603, + "step": 1717 + }, + { + "epoch": 0.06, + "learning_rate": 1.982755861664755e-05, + "loss": 0.6165, + "step": 1718 + }, + { + "epoch": 0.06, + "learning_rate": 1.9827357218734158e-05, + "loss": 0.6548, + "step": 1719 + }, + { + "epoch": 0.06, + "learning_rate": 1.9827155704305018e-05, + "loss": 0.6317, + "step": 1720 + }, + { + "epoch": 0.06, + "learning_rate": 1.9826954073362512e-05, + "loss": 0.6283, + "step": 1721 + }, + { + "epoch": 0.06, + "learning_rate": 1.9826752325909035e-05, + "loss": 0.6713, + "step": 1722 + }, + { + "epoch": 0.06, + "learning_rate": 1.982655046194698e-05, + "loss": 0.6847, + "step": 1723 + }, + { + "epoch": 0.06, + "learning_rate": 1.9826348481478736e-05, + "loss": 0.6297, + "step": 1724 + }, + { + "epoch": 0.06, + "learning_rate": 1.9826146384506702e-05, + "loss": 0.6341, + "step": 1725 + }, + { + "epoch": 0.06, + "learning_rate": 1.9825944171033272e-05, + "loss": 0.6742, + "step": 1726 + }, + { + "epoch": 0.06, + "learning_rate": 1.9825741841060844e-05, + "loss": 0.6974, + "step": 1727 + }, + { + "epoch": 0.06, + "learning_rate": 1.9825539394591818e-05, + "loss": 0.6195, + "step": 1728 + }, + { + "epoch": 0.06, + "learning_rate": 1.9825336831628593e-05, + "loss": 0.624, + "step": 1729 + }, + { + "epoch": 0.06, + "learning_rate": 1.982513415217357e-05, + "loss": 0.6598, + "step": 1730 + }, + { + "epoch": 0.06, + "learning_rate": 1.982493135622915e-05, + "loss": 0.6939, + "step": 1731 + }, + { + "epoch": 0.06, + "learning_rate": 1.9824728443797746e-05, + "loss": 0.6733, + "step": 1732 + }, + { + "epoch": 0.06, + "learning_rate": 1.9824525414881753e-05, + "loss": 0.6946, + "step": 1733 + }, + { + "epoch": 0.06, + "learning_rate": 1.9824322269483586e-05, + "loss": 0.6246, + "step": 1734 + }, + { + "epoch": 0.06, + "learning_rate": 1.982411900760565e-05, + "loss": 0.672, + "step": 1735 + }, + { + "epoch": 0.06, + "learning_rate": 1.9823915629250354e-05, + "loss": 0.6647, + "step": 1736 + }, + { + "epoch": 0.06, + "learning_rate": 1.982371213442011e-05, + "loss": 0.655, + "step": 1737 + }, + { + "epoch": 0.06, + "learning_rate": 1.9823508523117336e-05, + "loss": 0.6474, + "step": 1738 + }, + { + "epoch": 0.06, + "learning_rate": 1.982330479534444e-05, + "loss": 0.6522, + "step": 1739 + }, + { + "epoch": 0.06, + "learning_rate": 1.9823100951103837e-05, + "loss": 0.5937, + "step": 1740 + }, + { + "epoch": 0.06, + "learning_rate": 1.9822896990397948e-05, + "loss": 0.6453, + "step": 1741 + }, + { + "epoch": 0.06, + "learning_rate": 1.982269291322919e-05, + "loss": 0.6907, + "step": 1742 + }, + { + "epoch": 0.06, + "learning_rate": 1.982248871959998e-05, + "loss": 0.6383, + "step": 1743 + }, + { + "epoch": 0.06, + "learning_rate": 1.982228440951274e-05, + "loss": 0.6409, + "step": 1744 + }, + { + "epoch": 0.06, + "learning_rate": 1.9822079982969894e-05, + "loss": 0.6679, + "step": 1745 + }, + { + "epoch": 0.06, + "learning_rate": 1.9821875439973865e-05, + "loss": 0.6567, + "step": 1746 + }, + { + "epoch": 0.06, + "learning_rate": 1.9821670780527076e-05, + "loss": 0.6972, + "step": 1747 + }, + { + "epoch": 0.06, + "learning_rate": 1.982146600463196e-05, + "loss": 0.682, + "step": 1748 + }, + { + "epoch": 0.06, + "learning_rate": 1.9821261112290937e-05, + "loss": 0.6318, + "step": 1749 + }, + { + "epoch": 0.06, + "learning_rate": 1.982105610350644e-05, + "loss": 0.6345, + "step": 1750 + }, + { + "epoch": 0.06, + "learning_rate": 1.9820850978280897e-05, + "loss": 0.6752, + "step": 1751 + }, + { + "epoch": 0.06, + "learning_rate": 1.9820645736616745e-05, + "loss": 0.6217, + "step": 1752 + }, + { + "epoch": 0.06, + "learning_rate": 1.9820440378516415e-05, + "loss": 0.621, + "step": 1753 + }, + { + "epoch": 0.06, + "learning_rate": 1.982023490398234e-05, + "loss": 0.6486, + "step": 1754 + }, + { + "epoch": 0.06, + "learning_rate": 1.9820029313016956e-05, + "loss": 0.6138, + "step": 1755 + }, + { + "epoch": 0.06, + "learning_rate": 1.9819823605622705e-05, + "loss": 0.6629, + "step": 1756 + }, + { + "epoch": 0.06, + "learning_rate": 1.9819617781802024e-05, + "loss": 0.6557, + "step": 1757 + }, + { + "epoch": 0.06, + "learning_rate": 1.981941184155735e-05, + "loss": 0.6627, + "step": 1758 + }, + { + "epoch": 0.06, + "learning_rate": 1.9819205784891126e-05, + "loss": 0.6343, + "step": 1759 + }, + { + "epoch": 0.06, + "learning_rate": 1.9818999611805798e-05, + "loss": 0.6815, + "step": 1760 + }, + { + "epoch": 0.06, + "learning_rate": 1.9818793322303807e-05, + "loss": 0.6758, + "step": 1761 + }, + { + "epoch": 0.06, + "learning_rate": 1.98185869163876e-05, + "loss": 0.6688, + "step": 1762 + }, + { + "epoch": 0.06, + "learning_rate": 1.9818380394059627e-05, + "loss": 0.6287, + "step": 1763 + }, + { + "epoch": 0.06, + "learning_rate": 1.9818173755322334e-05, + "loss": 0.6486, + "step": 1764 + }, + { + "epoch": 0.06, + "learning_rate": 1.981796700017817e-05, + "loss": 0.6651, + "step": 1765 + }, + { + "epoch": 0.06, + "learning_rate": 1.981776012862959e-05, + "loss": 0.6541, + "step": 1766 + }, + { + "epoch": 0.06, + "learning_rate": 1.981755314067904e-05, + "loss": 0.6983, + "step": 1767 + }, + { + "epoch": 0.06, + "learning_rate": 1.981734603632898e-05, + "loss": 0.691, + "step": 1768 + }, + { + "epoch": 0.06, + "learning_rate": 1.9817138815581863e-05, + "loss": 0.7108, + "step": 1769 + }, + { + "epoch": 0.06, + "learning_rate": 1.9816931478440148e-05, + "loss": 0.6643, + "step": 1770 + }, + { + "epoch": 0.06, + "learning_rate": 1.981672402490629e-05, + "loss": 0.6701, + "step": 1771 + }, + { + "epoch": 0.06, + "learning_rate": 1.981651645498275e-05, + "loss": 0.6634, + "step": 1772 + }, + { + "epoch": 0.06, + "learning_rate": 1.9816308768671992e-05, + "loss": 0.6075, + "step": 1773 + }, + { + "epoch": 0.06, + "learning_rate": 1.9816100965976473e-05, + "loss": 0.6565, + "step": 1774 + }, + { + "epoch": 0.06, + "learning_rate": 1.9815893046898665e-05, + "loss": 0.6068, + "step": 1775 + }, + { + "epoch": 0.06, + "learning_rate": 1.9815685011441023e-05, + "loss": 0.636, + "step": 1776 + }, + { + "epoch": 0.06, + "learning_rate": 1.9815476859606018e-05, + "loss": 0.6016, + "step": 1777 + }, + { + "epoch": 0.06, + "learning_rate": 1.9815268591396123e-05, + "loss": 0.6395, + "step": 1778 + }, + { + "epoch": 0.06, + "learning_rate": 1.9815060206813797e-05, + "loss": 0.6853, + "step": 1779 + }, + { + "epoch": 0.06, + "learning_rate": 1.981485170586152e-05, + "loss": 0.6496, + "step": 1780 + }, + { + "epoch": 0.06, + "learning_rate": 1.9814643088541756e-05, + "loss": 0.6125, + "step": 1781 + }, + { + "epoch": 0.06, + "learning_rate": 1.9814434354856983e-05, + "loss": 0.698, + "step": 1782 + }, + { + "epoch": 0.06, + "learning_rate": 1.9814225504809677e-05, + "loss": 0.7012, + "step": 1783 + }, + { + "epoch": 0.06, + "learning_rate": 1.9814016538402314e-05, + "loss": 0.6877, + "step": 1784 + }, + { + "epoch": 0.06, + "learning_rate": 1.981380745563737e-05, + "loss": 0.6483, + "step": 1785 + }, + { + "epoch": 0.06, + "learning_rate": 1.9813598256517322e-05, + "loss": 0.692, + "step": 1786 + }, + { + "epoch": 0.06, + "learning_rate": 1.9813388941044656e-05, + "loss": 0.6808, + "step": 1787 + }, + { + "epoch": 0.06, + "learning_rate": 1.9813179509221847e-05, + "loss": 0.6846, + "step": 1788 + }, + { + "epoch": 0.06, + "learning_rate": 1.981296996105138e-05, + "loss": 0.669, + "step": 1789 + }, + { + "epoch": 0.06, + "learning_rate": 1.9812760296535744e-05, + "loss": 0.6212, + "step": 1790 + }, + { + "epoch": 0.06, + "learning_rate": 1.981255051567742e-05, + "loss": 0.6957, + "step": 1791 + }, + { + "epoch": 0.06, + "learning_rate": 1.9812340618478897e-05, + "loss": 0.6847, + "step": 1792 + }, + { + "epoch": 0.06, + "learning_rate": 1.9812130604942662e-05, + "loss": 0.6481, + "step": 1793 + }, + { + "epoch": 0.06, + "learning_rate": 1.9811920475071206e-05, + "loss": 0.6662, + "step": 1794 + }, + { + "epoch": 0.06, + "learning_rate": 1.981171022886702e-05, + "loss": 0.6987, + "step": 1795 + }, + { + "epoch": 0.06, + "learning_rate": 1.9811499866332605e-05, + "loss": 0.6446, + "step": 1796 + }, + { + "epoch": 0.06, + "learning_rate": 1.981128938747044e-05, + "loss": 0.6416, + "step": 1797 + }, + { + "epoch": 0.06, + "learning_rate": 1.981107879228303e-05, + "loss": 0.627, + "step": 1798 + }, + { + "epoch": 0.06, + "learning_rate": 1.9810868080772868e-05, + "loss": 0.6362, + "step": 1799 + }, + { + "epoch": 0.06, + "learning_rate": 1.9810657252942458e-05, + "loss": 0.6943, + "step": 1800 + }, + { + "epoch": 0.06, + "learning_rate": 1.9810446308794292e-05, + "loss": 0.6134, + "step": 1801 + }, + { + "epoch": 0.06, + "learning_rate": 1.9810235248330874e-05, + "loss": 0.6157, + "step": 1802 + }, + { + "epoch": 0.06, + "learning_rate": 1.981002407155471e-05, + "loss": 0.6391, + "step": 1803 + }, + { + "epoch": 0.06, + "learning_rate": 1.98098127784683e-05, + "loss": 0.6102, + "step": 1804 + }, + { + "epoch": 0.06, + "learning_rate": 1.9809601369074153e-05, + "loss": 0.6443, + "step": 1805 + }, + { + "epoch": 0.06, + "learning_rate": 1.9809389843374768e-05, + "loss": 0.669, + "step": 1806 + }, + { + "epoch": 0.06, + "learning_rate": 1.980917820137266e-05, + "loss": 0.673, + "step": 1807 + }, + { + "epoch": 0.06, + "learning_rate": 1.9808966443070334e-05, + "loss": 0.6509, + "step": 1808 + }, + { + "epoch": 0.06, + "learning_rate": 1.9808754568470303e-05, + "loss": 0.6335, + "step": 1809 + }, + { + "epoch": 0.06, + "learning_rate": 1.9808542577575077e-05, + "loss": 0.5754, + "step": 1810 + }, + { + "epoch": 0.06, + "learning_rate": 1.9808330470387177e-05, + "loss": 0.6934, + "step": 1811 + }, + { + "epoch": 0.06, + "learning_rate": 1.9808118246909105e-05, + "loss": 0.6484, + "step": 1812 + }, + { + "epoch": 0.06, + "learning_rate": 1.9807905907143387e-05, + "loss": 0.6079, + "step": 1813 + }, + { + "epoch": 0.06, + "learning_rate": 1.9807693451092537e-05, + "loss": 0.6721, + "step": 1814 + }, + { + "epoch": 0.06, + "learning_rate": 1.9807480878759073e-05, + "loss": 0.6284, + "step": 1815 + }, + { + "epoch": 0.06, + "learning_rate": 1.9807268190145515e-05, + "loss": 0.6307, + "step": 1816 + }, + { + "epoch": 0.06, + "learning_rate": 1.980705538525439e-05, + "loss": 0.656, + "step": 1817 + }, + { + "epoch": 0.06, + "learning_rate": 1.9806842464088216e-05, + "loss": 0.63, + "step": 1818 + }, + { + "epoch": 0.06, + "learning_rate": 1.980662942664952e-05, + "loss": 0.6083, + "step": 1819 + }, + { + "epoch": 0.06, + "learning_rate": 1.9806416272940824e-05, + "loss": 0.6887, + "step": 1820 + }, + { + "epoch": 0.06, + "learning_rate": 1.980620300296466e-05, + "loss": 0.6545, + "step": 1821 + }, + { + "epoch": 0.06, + "learning_rate": 1.9805989616723557e-05, + "loss": 0.7075, + "step": 1822 + }, + { + "epoch": 0.06, + "learning_rate": 1.980577611422004e-05, + "loss": 0.7079, + "step": 1823 + }, + { + "epoch": 0.06, + "learning_rate": 1.9805562495456644e-05, + "loss": 0.6022, + "step": 1824 + }, + { + "epoch": 0.06, + "learning_rate": 1.9805348760435896e-05, + "loss": 0.608, + "step": 1825 + }, + { + "epoch": 0.06, + "learning_rate": 1.9805134909160338e-05, + "loss": 0.657, + "step": 1826 + }, + { + "epoch": 0.06, + "learning_rate": 1.9804920941632503e-05, + "loss": 0.6542, + "step": 1827 + }, + { + "epoch": 0.06, + "learning_rate": 1.9804706857854925e-05, + "loss": 0.6589, + "step": 1828 + }, + { + "epoch": 0.06, + "learning_rate": 1.9804492657830145e-05, + "loss": 0.6494, + "step": 1829 + }, + { + "epoch": 0.06, + "learning_rate": 1.9804278341560702e-05, + "loss": 0.6328, + "step": 1830 + }, + { + "epoch": 0.06, + "learning_rate": 1.9804063909049133e-05, + "loss": 0.6306, + "step": 1831 + }, + { + "epoch": 0.06, + "learning_rate": 1.9803849360297992e-05, + "loss": 0.6331, + "step": 1832 + }, + { + "epoch": 0.06, + "learning_rate": 1.9803634695309808e-05, + "loss": 0.6643, + "step": 1833 + }, + { + "epoch": 0.06, + "learning_rate": 1.9803419914087138e-05, + "loss": 0.6672, + "step": 1834 + }, + { + "epoch": 0.06, + "learning_rate": 1.980320501663252e-05, + "loss": 0.6517, + "step": 1835 + }, + { + "epoch": 0.06, + "learning_rate": 1.9802990002948504e-05, + "loss": 0.6593, + "step": 1836 + }, + { + "epoch": 0.06, + "learning_rate": 1.9802774873037643e-05, + "loss": 0.6169, + "step": 1837 + }, + { + "epoch": 0.06, + "learning_rate": 1.9802559626902488e-05, + "loss": 0.6247, + "step": 1838 + }, + { + "epoch": 0.06, + "learning_rate": 1.9802344264545583e-05, + "loss": 0.6639, + "step": 1839 + }, + { + "epoch": 0.06, + "learning_rate": 1.980212878596949e-05, + "loss": 0.6209, + "step": 1840 + }, + { + "epoch": 0.06, + "learning_rate": 1.980191319117676e-05, + "loss": 0.6136, + "step": 1841 + }, + { + "epoch": 0.06, + "learning_rate": 1.980169748016995e-05, + "loss": 0.5871, + "step": 1842 + }, + { + "epoch": 0.06, + "learning_rate": 1.980148165295162e-05, + "loss": 0.592, + "step": 1843 + }, + { + "epoch": 0.06, + "learning_rate": 1.980126570952432e-05, + "loss": 0.5993, + "step": 1844 + }, + { + "epoch": 0.06, + "learning_rate": 1.980104964989062e-05, + "loss": 0.6877, + "step": 1845 + }, + { + "epoch": 0.06, + "learning_rate": 1.9800833474053077e-05, + "loss": 0.6383, + "step": 1846 + }, + { + "epoch": 0.06, + "learning_rate": 1.9800617182014256e-05, + "loss": 0.5955, + "step": 1847 + }, + { + "epoch": 0.06, + "learning_rate": 1.9800400773776718e-05, + "loss": 0.649, + "step": 1848 + }, + { + "epoch": 0.06, + "learning_rate": 1.9800184249343034e-05, + "loss": 0.6669, + "step": 1849 + }, + { + "epoch": 0.06, + "learning_rate": 1.9799967608715765e-05, + "loss": 0.6896, + "step": 1850 + }, + { + "epoch": 0.06, + "learning_rate": 1.9799750851897488e-05, + "loss": 0.6312, + "step": 1851 + }, + { + "epoch": 0.06, + "learning_rate": 1.9799533978890762e-05, + "loss": 0.6943, + "step": 1852 + }, + { + "epoch": 0.06, + "learning_rate": 1.979931698969817e-05, + "loss": 0.6839, + "step": 1853 + }, + { + "epoch": 0.06, + "learning_rate": 1.9799099884322274e-05, + "loss": 0.6102, + "step": 1854 + }, + { + "epoch": 0.06, + "learning_rate": 1.9798882662765658e-05, + "loss": 0.6801, + "step": 1855 + }, + { + "epoch": 0.06, + "learning_rate": 1.9798665325030887e-05, + "loss": 0.6297, + "step": 1856 + }, + { + "epoch": 0.06, + "learning_rate": 1.9798447871120547e-05, + "loss": 0.5974, + "step": 1857 + }, + { + "epoch": 0.06, + "learning_rate": 1.9798230301037212e-05, + "loss": 0.6171, + "step": 1858 + }, + { + "epoch": 0.06, + "learning_rate": 1.979801261478346e-05, + "loss": 0.6694, + "step": 1859 + }, + { + "epoch": 0.06, + "learning_rate": 1.9797794812361875e-05, + "loss": 0.5956, + "step": 1860 + }, + { + "epoch": 0.06, + "learning_rate": 1.979757689377504e-05, + "loss": 0.639, + "step": 1861 + }, + { + "epoch": 0.06, + "learning_rate": 1.9797358859025534e-05, + "loss": 0.6525, + "step": 1862 + }, + { + "epoch": 0.06, + "learning_rate": 1.9797140708115946e-05, + "loss": 0.6563, + "step": 1863 + }, + { + "epoch": 0.06, + "learning_rate": 1.9796922441048863e-05, + "loss": 0.6101, + "step": 1864 + }, + { + "epoch": 0.06, + "learning_rate": 1.979670405782687e-05, + "loss": 0.6311, + "step": 1865 + }, + { + "epoch": 0.06, + "learning_rate": 1.9796485558452557e-05, + "loss": 0.6436, + "step": 1866 + }, + { + "epoch": 0.06, + "learning_rate": 1.9796266942928514e-05, + "loss": 0.6838, + "step": 1867 + }, + { + "epoch": 0.06, + "learning_rate": 1.9796048211257335e-05, + "loss": 0.5818, + "step": 1868 + }, + { + "epoch": 0.06, + "learning_rate": 1.9795829363441614e-05, + "loss": 0.6486, + "step": 1869 + }, + { + "epoch": 0.06, + "learning_rate": 1.9795610399483945e-05, + "loss": 0.653, + "step": 1870 + }, + { + "epoch": 0.06, + "learning_rate": 1.979539131938692e-05, + "loss": 0.6771, + "step": 1871 + }, + { + "epoch": 0.06, + "learning_rate": 1.9795172123153142e-05, + "loss": 0.6628, + "step": 1872 + }, + { + "epoch": 0.06, + "learning_rate": 1.9794952810785207e-05, + "loss": 0.6289, + "step": 1873 + }, + { + "epoch": 0.06, + "learning_rate": 1.9794733382285714e-05, + "loss": 0.639, + "step": 1874 + }, + { + "epoch": 0.06, + "learning_rate": 1.979451383765727e-05, + "loss": 0.692, + "step": 1875 + }, + { + "epoch": 0.06, + "learning_rate": 1.979429417690247e-05, + "loss": 0.6382, + "step": 1876 + }, + { + "epoch": 0.07, + "learning_rate": 1.9794074400023923e-05, + "loss": 0.6595, + "step": 1877 + }, + { + "epoch": 0.07, + "learning_rate": 1.9793854507024237e-05, + "loss": 0.5874, + "step": 1878 + }, + { + "epoch": 0.07, + "learning_rate": 1.9793634497906017e-05, + "loss": 0.6658, + "step": 1879 + }, + { + "epoch": 0.07, + "learning_rate": 1.979341437267187e-05, + "loss": 0.6495, + "step": 1880 + }, + { + "epoch": 0.07, + "learning_rate": 1.9793194131324404e-05, + "loss": 0.6673, + "step": 1881 + }, + { + "epoch": 0.07, + "learning_rate": 1.979297377386624e-05, + "loss": 0.6384, + "step": 1882 + }, + { + "epoch": 0.07, + "learning_rate": 1.9792753300299976e-05, + "loss": 0.727, + "step": 1883 + }, + { + "epoch": 0.07, + "learning_rate": 1.9792532710628237e-05, + "loss": 0.584, + "step": 1884 + }, + { + "epoch": 0.07, + "learning_rate": 1.9792312004853634e-05, + "loss": 0.6538, + "step": 1885 + }, + { + "epoch": 0.07, + "learning_rate": 1.9792091182978787e-05, + "loss": 0.6244, + "step": 1886 + }, + { + "epoch": 0.07, + "learning_rate": 1.979187024500631e-05, + "loss": 0.6891, + "step": 1887 + }, + { + "epoch": 0.07, + "learning_rate": 1.9791649190938827e-05, + "loss": 0.6249, + "step": 1888 + }, + { + "epoch": 0.07, + "learning_rate": 1.9791428020778953e-05, + "loss": 0.6699, + "step": 1889 + }, + { + "epoch": 0.07, + "learning_rate": 1.9791206734529317e-05, + "loss": 0.6565, + "step": 1890 + }, + { + "epoch": 0.07, + "learning_rate": 1.9790985332192535e-05, + "loss": 0.6404, + "step": 1891 + }, + { + "epoch": 0.07, + "learning_rate": 1.979076381377124e-05, + "loss": 0.7028, + "step": 1892 + }, + { + "epoch": 0.07, + "learning_rate": 1.9790542179268053e-05, + "loss": 0.5966, + "step": 1893 + }, + { + "epoch": 0.07, + "learning_rate": 1.9790320428685605e-05, + "loss": 0.6158, + "step": 1894 + }, + { + "epoch": 0.07, + "learning_rate": 1.979009856202652e-05, + "loss": 0.6724, + "step": 1895 + }, + { + "epoch": 0.07, + "learning_rate": 1.9789876579293435e-05, + "loss": 0.6689, + "step": 1896 + }, + { + "epoch": 0.07, + "learning_rate": 1.978965448048898e-05, + "loss": 0.5927, + "step": 1897 + }, + { + "epoch": 0.07, + "learning_rate": 1.9789432265615785e-05, + "loss": 0.5469, + "step": 1898 + }, + { + "epoch": 0.07, + "learning_rate": 1.9789209934676488e-05, + "loss": 0.6034, + "step": 1899 + }, + { + "epoch": 0.07, + "learning_rate": 1.9788987487673725e-05, + "loss": 0.6556, + "step": 1900 + }, + { + "epoch": 0.07, + "learning_rate": 1.9788764924610128e-05, + "loss": 0.6426, + "step": 1901 + }, + { + "epoch": 0.07, + "learning_rate": 1.978854224548834e-05, + "loss": 0.6258, + "step": 1902 + }, + { + "epoch": 0.07, + "learning_rate": 1.9788319450311006e-05, + "loss": 0.6146, + "step": 1903 + }, + { + "epoch": 0.07, + "learning_rate": 1.978809653908076e-05, + "loss": 0.6152, + "step": 1904 + }, + { + "epoch": 0.07, + "learning_rate": 1.9787873511800245e-05, + "loss": 0.6898, + "step": 1905 + }, + { + "epoch": 0.07, + "learning_rate": 1.978765036847211e-05, + "loss": 0.6333, + "step": 1906 + }, + { + "epoch": 0.07, + "learning_rate": 1.9787427109099e-05, + "loss": 0.64, + "step": 1907 + }, + { + "epoch": 0.07, + "learning_rate": 1.9787203733683558e-05, + "loss": 0.6443, + "step": 1908 + }, + { + "epoch": 0.07, + "learning_rate": 1.9786980242228435e-05, + "loss": 0.6558, + "step": 1909 + }, + { + "epoch": 0.07, + "learning_rate": 1.978675663473628e-05, + "loss": 0.6615, + "step": 1910 + }, + { + "epoch": 0.07, + "learning_rate": 1.978653291120975e-05, + "loss": 0.6221, + "step": 1911 + }, + { + "epoch": 0.07, + "learning_rate": 1.9786309071651488e-05, + "loss": 0.62, + "step": 1912 + }, + { + "epoch": 0.07, + "learning_rate": 1.978608511606415e-05, + "loss": 0.6715, + "step": 1913 + }, + { + "epoch": 0.07, + "learning_rate": 1.9785861044450398e-05, + "loss": 0.6753, + "step": 1914 + }, + { + "epoch": 0.07, + "learning_rate": 1.9785636856812882e-05, + "loss": 0.6459, + "step": 1915 + }, + { + "epoch": 0.07, + "learning_rate": 1.9785412553154265e-05, + "loss": 0.6416, + "step": 1916 + }, + { + "epoch": 0.07, + "learning_rate": 1.97851881334772e-05, + "loss": 0.7021, + "step": 1917 + }, + { + "epoch": 0.07, + "learning_rate": 1.978496359778435e-05, + "loss": 0.6721, + "step": 1918 + }, + { + "epoch": 0.07, + "learning_rate": 1.9784738946078385e-05, + "loss": 0.6911, + "step": 1919 + }, + { + "epoch": 0.07, + "learning_rate": 1.978451417836196e-05, + "loss": 0.6565, + "step": 1920 + }, + { + "epoch": 0.07, + "learning_rate": 1.9784289294637737e-05, + "loss": 0.6327, + "step": 1921 + }, + { + "epoch": 0.07, + "learning_rate": 1.978406429490839e-05, + "loss": 0.6332, + "step": 1922 + }, + { + "epoch": 0.07, + "learning_rate": 1.9783839179176584e-05, + "loss": 0.6335, + "step": 1923 + }, + { + "epoch": 0.07, + "learning_rate": 1.978361394744499e-05, + "loss": 0.6471, + "step": 1924 + }, + { + "epoch": 0.07, + "learning_rate": 1.9783388599716272e-05, + "loss": 0.6429, + "step": 1925 + }, + { + "epoch": 0.07, + "learning_rate": 1.9783163135993108e-05, + "loss": 0.6452, + "step": 1926 + }, + { + "epoch": 0.07, + "learning_rate": 1.9782937556278173e-05, + "loss": 0.6815, + "step": 1927 + }, + { + "epoch": 0.07, + "learning_rate": 1.978271186057413e-05, + "loss": 0.6608, + "step": 1928 + }, + { + "epoch": 0.07, + "learning_rate": 1.9782486048883668e-05, + "loss": 0.6352, + "step": 1929 + }, + { + "epoch": 0.07, + "learning_rate": 1.978226012120946e-05, + "loss": 0.5929, + "step": 1930 + }, + { + "epoch": 0.07, + "learning_rate": 1.9782034077554182e-05, + "loss": 0.6814, + "step": 1931 + }, + { + "epoch": 0.07, + "learning_rate": 1.9781807917920515e-05, + "loss": 0.6718, + "step": 1932 + }, + { + "epoch": 0.07, + "learning_rate": 1.9781581642311144e-05, + "loss": 0.67, + "step": 1933 + }, + { + "epoch": 0.07, + "learning_rate": 1.9781355250728746e-05, + "loss": 0.6711, + "step": 1934 + }, + { + "epoch": 0.07, + "learning_rate": 1.9781128743176004e-05, + "loss": 0.621, + "step": 1935 + }, + { + "epoch": 0.07, + "learning_rate": 1.9780902119655616e-05, + "loss": 0.6603, + "step": 1936 + }, + { + "epoch": 0.07, + "learning_rate": 1.9780675380170257e-05, + "loss": 0.6392, + "step": 1937 + }, + { + "epoch": 0.07, + "learning_rate": 1.9780448524722615e-05, + "loss": 0.7097, + "step": 1938 + }, + { + "epoch": 0.07, + "learning_rate": 1.9780221553315387e-05, + "loss": 0.6351, + "step": 1939 + }, + { + "epoch": 0.07, + "learning_rate": 1.977999446595126e-05, + "loss": 0.6301, + "step": 1940 + }, + { + "epoch": 0.07, + "learning_rate": 1.9779767262632926e-05, + "loss": 0.6342, + "step": 1941 + }, + { + "epoch": 0.07, + "learning_rate": 1.9779539943363083e-05, + "loss": 0.6734, + "step": 1942 + }, + { + "epoch": 0.07, + "learning_rate": 1.977931250814442e-05, + "loss": 0.6906, + "step": 1943 + }, + { + "epoch": 0.07, + "learning_rate": 1.9779084956979634e-05, + "loss": 0.6511, + "step": 1944 + }, + { + "epoch": 0.07, + "learning_rate": 1.977885728987143e-05, + "loss": 0.5811, + "step": 1945 + }, + { + "epoch": 0.07, + "learning_rate": 1.97786295068225e-05, + "loss": 0.598, + "step": 1946 + }, + { + "epoch": 0.07, + "learning_rate": 1.977840160783555e-05, + "loss": 0.6097, + "step": 1947 + }, + { + "epoch": 0.07, + "learning_rate": 1.9778173592913274e-05, + "loss": 0.6418, + "step": 1948 + }, + { + "epoch": 0.07, + "learning_rate": 1.9777945462058383e-05, + "loss": 0.6943, + "step": 1949 + }, + { + "epoch": 0.07, + "learning_rate": 1.977771721527358e-05, + "loss": 0.6618, + "step": 1950 + }, + { + "epoch": 0.07, + "learning_rate": 1.977748885256157e-05, + "loss": 0.606, + "step": 1951 + }, + { + "epoch": 0.07, + "learning_rate": 1.977726037392506e-05, + "loss": 0.5941, + "step": 1952 + }, + { + "epoch": 0.07, + "learning_rate": 1.9777031779366763e-05, + "loss": 0.6305, + "step": 1953 + }, + { + "epoch": 0.07, + "learning_rate": 1.9776803068889388e-05, + "loss": 0.6461, + "step": 1954 + }, + { + "epoch": 0.07, + "learning_rate": 1.9776574242495638e-05, + "loss": 0.6318, + "step": 1955 + }, + { + "epoch": 0.07, + "learning_rate": 1.9776345300188238e-05, + "loss": 0.6588, + "step": 1956 + }, + { + "epoch": 0.07, + "learning_rate": 1.9776116241969895e-05, + "loss": 0.642, + "step": 1957 + }, + { + "epoch": 0.07, + "learning_rate": 1.977588706784333e-05, + "loss": 0.6645, + "step": 1958 + }, + { + "epoch": 0.07, + "learning_rate": 1.9775657777811253e-05, + "loss": 0.6195, + "step": 1959 + }, + { + "epoch": 0.07, + "learning_rate": 1.9775428371876392e-05, + "loss": 0.6399, + "step": 1960 + }, + { + "epoch": 0.07, + "learning_rate": 1.9775198850041457e-05, + "loss": 0.6571, + "step": 1961 + }, + { + "epoch": 0.07, + "learning_rate": 1.9774969212309176e-05, + "loss": 0.7086, + "step": 1962 + }, + { + "epoch": 0.07, + "learning_rate": 1.977473945868227e-05, + "loss": 0.681, + "step": 1963 + }, + { + "epoch": 0.07, + "learning_rate": 1.977450958916346e-05, + "loss": 0.6816, + "step": 1964 + }, + { + "epoch": 0.07, + "learning_rate": 1.9774279603755477e-05, + "loss": 0.6755, + "step": 1965 + }, + { + "epoch": 0.07, + "learning_rate": 1.977404950246104e-05, + "loss": 0.6826, + "step": 1966 + }, + { + "epoch": 0.07, + "learning_rate": 1.9773819285282888e-05, + "loss": 0.6688, + "step": 1967 + }, + { + "epoch": 0.07, + "learning_rate": 1.977358895222374e-05, + "loss": 0.6819, + "step": 1968 + }, + { + "epoch": 0.07, + "learning_rate": 1.9773358503286335e-05, + "loss": 0.6577, + "step": 1969 + }, + { + "epoch": 0.07, + "learning_rate": 1.97731279384734e-05, + "loss": 0.5945, + "step": 1970 + }, + { + "epoch": 0.07, + "learning_rate": 1.9772897257787668e-05, + "loss": 0.6507, + "step": 1971 + }, + { + "epoch": 0.07, + "learning_rate": 1.9772666461231878e-05, + "loss": 0.6488, + "step": 1972 + }, + { + "epoch": 0.07, + "learning_rate": 1.9772435548808767e-05, + "loss": 0.6168, + "step": 1973 + }, + { + "epoch": 0.07, + "learning_rate": 1.9772204520521066e-05, + "loss": 0.665, + "step": 1974 + }, + { + "epoch": 0.07, + "learning_rate": 1.977197337637152e-05, + "loss": 0.6329, + "step": 1975 + }, + { + "epoch": 0.07, + "learning_rate": 1.977174211636287e-05, + "loss": 0.6436, + "step": 1976 + }, + { + "epoch": 0.07, + "learning_rate": 1.9771510740497855e-05, + "loss": 0.6117, + "step": 1977 + }, + { + "epoch": 0.07, + "learning_rate": 1.977127924877922e-05, + "loss": 0.6598, + "step": 1978 + }, + { + "epoch": 0.07, + "learning_rate": 1.9771047641209704e-05, + "loss": 0.6906, + "step": 1979 + }, + { + "epoch": 0.07, + "learning_rate": 1.9770815917792062e-05, + "loss": 0.646, + "step": 1980 + }, + { + "epoch": 0.07, + "learning_rate": 1.9770584078529037e-05, + "loss": 0.6403, + "step": 1981 + }, + { + "epoch": 0.07, + "learning_rate": 1.9770352123423378e-05, + "loss": 0.6413, + "step": 1982 + }, + { + "epoch": 0.07, + "learning_rate": 1.9770120052477835e-05, + "loss": 0.6187, + "step": 1983 + }, + { + "epoch": 0.07, + "learning_rate": 1.976988786569516e-05, + "loss": 0.6322, + "step": 1984 + }, + { + "epoch": 0.07, + "learning_rate": 1.97696555630781e-05, + "loss": 0.6453, + "step": 1985 + }, + { + "epoch": 0.07, + "learning_rate": 1.976942314462942e-05, + "loss": 0.6194, + "step": 1986 + }, + { + "epoch": 0.07, + "learning_rate": 1.976919061035187e-05, + "loss": 0.6643, + "step": 1987 + }, + { + "epoch": 0.07, + "learning_rate": 1.9768957960248203e-05, + "loss": 0.6507, + "step": 1988 + }, + { + "epoch": 0.07, + "learning_rate": 1.9768725194321187e-05, + "loss": 0.6055, + "step": 1989 + }, + { + "epoch": 0.07, + "learning_rate": 1.9768492312573576e-05, + "loss": 0.7409, + "step": 1990 + }, + { + "epoch": 0.07, + "learning_rate": 1.976825931500813e-05, + "loss": 0.6888, + "step": 1991 + }, + { + "epoch": 0.07, + "learning_rate": 1.976802620162761e-05, + "loss": 0.6312, + "step": 1992 + }, + { + "epoch": 0.07, + "learning_rate": 1.9767792972434785e-05, + "loss": 0.6059, + "step": 1993 + }, + { + "epoch": 0.07, + "learning_rate": 1.976755962743242e-05, + "loss": 0.6474, + "step": 1994 + }, + { + "epoch": 0.07, + "learning_rate": 1.9767326166623277e-05, + "loss": 0.6474, + "step": 1995 + }, + { + "epoch": 0.07, + "learning_rate": 1.9767092590010128e-05, + "loss": 0.655, + "step": 1996 + }, + { + "epoch": 0.07, + "learning_rate": 1.976685889759574e-05, + "loss": 0.6314, + "step": 1997 + }, + { + "epoch": 0.07, + "learning_rate": 1.9766625089382884e-05, + "loss": 0.6017, + "step": 1998 + }, + { + "epoch": 0.07, + "learning_rate": 1.9766391165374333e-05, + "loss": 0.6662, + "step": 1999 + }, + { + "epoch": 0.07, + "learning_rate": 1.976615712557286e-05, + "loss": 0.6728, + "step": 2000 + }, + { + "epoch": 0.07, + "learning_rate": 1.976592296998124e-05, + "loss": 0.6309, + "step": 2001 + }, + { + "epoch": 0.07, + "learning_rate": 1.976568869860225e-05, + "loss": 0.5995, + "step": 2002 + }, + { + "epoch": 0.07, + "learning_rate": 1.976545431143867e-05, + "loss": 0.6118, + "step": 2003 + }, + { + "epoch": 0.07, + "learning_rate": 1.9765219808493274e-05, + "loss": 0.6591, + "step": 2004 + }, + { + "epoch": 0.07, + "learning_rate": 1.976498518976884e-05, + "loss": 0.6851, + "step": 2005 + }, + { + "epoch": 0.07, + "learning_rate": 1.976475045526816e-05, + "loss": 0.6285, + "step": 2006 + }, + { + "epoch": 0.07, + "learning_rate": 1.9764515604994006e-05, + "loss": 0.6283, + "step": 2007 + }, + { + "epoch": 0.07, + "learning_rate": 1.9764280638949168e-05, + "loss": 0.6426, + "step": 2008 + }, + { + "epoch": 0.07, + "learning_rate": 1.976404555713643e-05, + "loss": 0.6341, + "step": 2009 + }, + { + "epoch": 0.07, + "learning_rate": 1.9763810359558584e-05, + "loss": 0.6295, + "step": 2010 + }, + { + "epoch": 0.07, + "learning_rate": 1.9763575046218414e-05, + "loss": 0.7087, + "step": 2011 + }, + { + "epoch": 0.07, + "learning_rate": 1.976333961711871e-05, + "loss": 0.6454, + "step": 2012 + }, + { + "epoch": 0.07, + "learning_rate": 1.9763104072262266e-05, + "loss": 0.6878, + "step": 2013 + }, + { + "epoch": 0.07, + "learning_rate": 1.976286841165187e-05, + "loss": 0.6402, + "step": 2014 + }, + { + "epoch": 0.07, + "learning_rate": 1.976263263529032e-05, + "loss": 0.6457, + "step": 2015 + }, + { + "epoch": 0.07, + "learning_rate": 1.9762396743180407e-05, + "loss": 0.6479, + "step": 2016 + }, + { + "epoch": 0.07, + "learning_rate": 1.9762160735324937e-05, + "loss": 0.671, + "step": 2017 + }, + { + "epoch": 0.07, + "learning_rate": 1.97619246117267e-05, + "loss": 0.6706, + "step": 2018 + }, + { + "epoch": 0.07, + "learning_rate": 1.9761688372388496e-05, + "loss": 0.681, + "step": 2019 + }, + { + "epoch": 0.07, + "learning_rate": 1.976145201731313e-05, + "loss": 0.6944, + "step": 2020 + }, + { + "epoch": 0.07, + "learning_rate": 1.9761215546503402e-05, + "loss": 0.6079, + "step": 2021 + }, + { + "epoch": 0.07, + "learning_rate": 1.9760978959962113e-05, + "loss": 0.6505, + "step": 2022 + }, + { + "epoch": 0.07, + "learning_rate": 1.9760742257692075e-05, + "loss": 0.6477, + "step": 2023 + }, + { + "epoch": 0.07, + "learning_rate": 1.9760505439696086e-05, + "loss": 0.5803, + "step": 2024 + }, + { + "epoch": 0.07, + "learning_rate": 1.976026850597696e-05, + "loss": 0.6362, + "step": 2025 + }, + { + "epoch": 0.07, + "learning_rate": 1.9760031456537506e-05, + "loss": 0.6331, + "step": 2026 + }, + { + "epoch": 0.07, + "learning_rate": 1.975979429138053e-05, + "loss": 0.7165, + "step": 2027 + }, + { + "epoch": 0.07, + "learning_rate": 1.9759557010508845e-05, + "loss": 0.5964, + "step": 2028 + }, + { + "epoch": 0.07, + "learning_rate": 1.9759319613925266e-05, + "loss": 0.6509, + "step": 2029 + }, + { + "epoch": 0.07, + "learning_rate": 1.9759082101632613e-05, + "loss": 0.6478, + "step": 2030 + }, + { + "epoch": 0.07, + "learning_rate": 1.975884447363369e-05, + "loss": 0.6993, + "step": 2031 + }, + { + "epoch": 0.07, + "learning_rate": 1.9758606729931324e-05, + "loss": 0.6475, + "step": 2032 + }, + { + "epoch": 0.07, + "learning_rate": 1.975836887052833e-05, + "loss": 0.6435, + "step": 2033 + }, + { + "epoch": 0.07, + "learning_rate": 1.9758130895427526e-05, + "loss": 0.6801, + "step": 2034 + }, + { + "epoch": 0.07, + "learning_rate": 1.975789280463174e-05, + "loss": 0.6954, + "step": 2035 + }, + { + "epoch": 0.07, + "learning_rate": 1.9757654598143788e-05, + "loss": 0.6895, + "step": 2036 + }, + { + "epoch": 0.07, + "learning_rate": 1.9757416275966497e-05, + "loss": 0.7047, + "step": 2037 + }, + { + "epoch": 0.07, + "learning_rate": 1.9757177838102697e-05, + "loss": 0.6224, + "step": 2038 + }, + { + "epoch": 0.07, + "learning_rate": 1.9756939284555207e-05, + "loss": 0.6586, + "step": 2039 + }, + { + "epoch": 0.07, + "learning_rate": 1.975670061532686e-05, + "loss": 0.6825, + "step": 2040 + }, + { + "epoch": 0.07, + "learning_rate": 1.9756461830420486e-05, + "loss": 0.6305, + "step": 2041 + }, + { + "epoch": 0.07, + "learning_rate": 1.9756222929838914e-05, + "loss": 0.6808, + "step": 2042 + }, + { + "epoch": 0.07, + "learning_rate": 1.975598391358498e-05, + "loss": 0.6754, + "step": 2043 + }, + { + "epoch": 0.07, + "learning_rate": 1.975574478166151e-05, + "loss": 0.676, + "step": 2044 + }, + { + "epoch": 0.07, + "learning_rate": 1.975550553407135e-05, + "loss": 0.6589, + "step": 2045 + }, + { + "epoch": 0.07, + "learning_rate": 1.975526617081733e-05, + "loss": 0.643, + "step": 2046 + }, + { + "epoch": 0.07, + "learning_rate": 1.9755026691902286e-05, + "loss": 0.653, + "step": 2047 + }, + { + "epoch": 0.07, + "learning_rate": 1.9754787097329063e-05, + "loss": 0.6209, + "step": 2048 + }, + { + "epoch": 0.07, + "learning_rate": 1.97545473871005e-05, + "loss": 0.6699, + "step": 2049 + }, + { + "epoch": 0.07, + "learning_rate": 1.9754307561219434e-05, + "loss": 0.6348, + "step": 2050 + }, + { + "epoch": 0.07, + "learning_rate": 1.9754067619688716e-05, + "loss": 0.7143, + "step": 2051 + }, + { + "epoch": 0.07, + "learning_rate": 1.9753827562511186e-05, + "loss": 0.6228, + "step": 2052 + }, + { + "epoch": 0.07, + "learning_rate": 1.9753587389689692e-05, + "loss": 0.6521, + "step": 2053 + }, + { + "epoch": 0.07, + "learning_rate": 1.975334710122708e-05, + "loss": 0.6984, + "step": 2054 + }, + { + "epoch": 0.07, + "learning_rate": 1.9753106697126204e-05, + "loss": 0.7173, + "step": 2055 + }, + { + "epoch": 0.07, + "learning_rate": 1.9752866177389908e-05, + "loss": 0.6519, + "step": 2056 + }, + { + "epoch": 0.07, + "learning_rate": 1.9752625542021045e-05, + "loss": 0.6973, + "step": 2057 + }, + { + "epoch": 0.07, + "learning_rate": 1.975238479102247e-05, + "loss": 0.6537, + "step": 2058 + }, + { + "epoch": 0.07, + "learning_rate": 1.9752143924397035e-05, + "loss": 0.6217, + "step": 2059 + }, + { + "epoch": 0.07, + "learning_rate": 1.9751902942147597e-05, + "loss": 0.6881, + "step": 2060 + }, + { + "epoch": 0.07, + "learning_rate": 1.9751661844277016e-05, + "loss": 0.6414, + "step": 2061 + }, + { + "epoch": 0.07, + "learning_rate": 1.9751420630788146e-05, + "loss": 0.6493, + "step": 2062 + }, + { + "epoch": 0.07, + "learning_rate": 1.9751179301683853e-05, + "loss": 0.613, + "step": 2063 + }, + { + "epoch": 0.07, + "learning_rate": 1.975093785696699e-05, + "loss": 0.5898, + "step": 2064 + }, + { + "epoch": 0.07, + "learning_rate": 1.9750696296640424e-05, + "loss": 0.662, + "step": 2065 + }, + { + "epoch": 0.07, + "learning_rate": 1.975045462070702e-05, + "loss": 0.6276, + "step": 2066 + }, + { + "epoch": 0.07, + "learning_rate": 1.975021282916964e-05, + "loss": 0.6918, + "step": 2067 + }, + { + "epoch": 0.07, + "learning_rate": 1.9749970922031156e-05, + "loss": 0.6403, + "step": 2068 + }, + { + "epoch": 0.07, + "learning_rate": 1.9749728899294428e-05, + "loss": 0.6793, + "step": 2069 + }, + { + "epoch": 0.07, + "learning_rate": 1.9749486760962334e-05, + "loss": 0.6071, + "step": 2070 + }, + { + "epoch": 0.07, + "learning_rate": 1.974924450703774e-05, + "loss": 0.662, + "step": 2071 + }, + { + "epoch": 0.07, + "learning_rate": 1.9749002137523523e-05, + "loss": 0.6306, + "step": 2072 + }, + { + "epoch": 0.07, + "learning_rate": 1.9748759652422548e-05, + "loss": 0.5944, + "step": 2073 + }, + { + "epoch": 0.07, + "learning_rate": 1.97485170517377e-05, + "loss": 0.6209, + "step": 2074 + }, + { + "epoch": 0.07, + "learning_rate": 1.9748274335471845e-05, + "loss": 0.6691, + "step": 2075 + }, + { + "epoch": 0.07, + "learning_rate": 1.974803150362787e-05, + "loss": 0.6359, + "step": 2076 + }, + { + "epoch": 0.07, + "learning_rate": 1.974778855620865e-05, + "loss": 0.7043, + "step": 2077 + }, + { + "epoch": 0.07, + "learning_rate": 1.9747545493217063e-05, + "loss": 0.6533, + "step": 2078 + }, + { + "epoch": 0.07, + "learning_rate": 1.9747302314655998e-05, + "loss": 0.6483, + "step": 2079 + }, + { + "epoch": 0.07, + "learning_rate": 1.974705902052833e-05, + "loss": 0.6081, + "step": 2080 + }, + { + "epoch": 0.07, + "learning_rate": 1.9746815610836946e-05, + "loss": 0.6496, + "step": 2081 + }, + { + "epoch": 0.07, + "learning_rate": 1.9746572085584736e-05, + "loss": 0.5861, + "step": 2082 + }, + { + "epoch": 0.07, + "learning_rate": 1.9746328444774586e-05, + "loss": 0.6522, + "step": 2083 + }, + { + "epoch": 0.07, + "learning_rate": 1.974608468840938e-05, + "loss": 0.5862, + "step": 2084 + }, + { + "epoch": 0.07, + "learning_rate": 1.974584081649201e-05, + "loss": 0.6676, + "step": 2085 + }, + { + "epoch": 0.07, + "learning_rate": 1.974559682902537e-05, + "loss": 0.6554, + "step": 2086 + }, + { + "epoch": 0.07, + "learning_rate": 1.9745352726012354e-05, + "loss": 0.6628, + "step": 2087 + }, + { + "epoch": 0.07, + "learning_rate": 1.9745108507455853e-05, + "loss": 0.6908, + "step": 2088 + }, + { + "epoch": 0.07, + "learning_rate": 1.974486417335876e-05, + "loss": 0.673, + "step": 2089 + }, + { + "epoch": 0.07, + "learning_rate": 1.9744619723723977e-05, + "loss": 0.6773, + "step": 2090 + }, + { + "epoch": 0.07, + "learning_rate": 1.97443751585544e-05, + "loss": 0.597, + "step": 2091 + }, + { + "epoch": 0.07, + "learning_rate": 1.9744130477852924e-05, + "loss": 0.5708, + "step": 2092 + }, + { + "epoch": 0.07, + "learning_rate": 1.974388568162246e-05, + "loss": 0.6644, + "step": 2093 + }, + { + "epoch": 0.07, + "learning_rate": 1.9743640769865906e-05, + "loss": 0.6914, + "step": 2094 + }, + { + "epoch": 0.07, + "learning_rate": 1.9743395742586166e-05, + "loss": 0.638, + "step": 2095 + }, + { + "epoch": 0.07, + "learning_rate": 1.9743150599786138e-05, + "loss": 0.7225, + "step": 2096 + }, + { + "epoch": 0.07, + "learning_rate": 1.974290534146874e-05, + "loss": 0.634, + "step": 2097 + }, + { + "epoch": 0.07, + "learning_rate": 1.974265996763687e-05, + "loss": 0.6732, + "step": 2098 + }, + { + "epoch": 0.07, + "learning_rate": 1.9742414478293445e-05, + "loss": 0.6805, + "step": 2099 + }, + { + "epoch": 0.07, + "learning_rate": 1.974216887344137e-05, + "loss": 0.6495, + "step": 2100 + }, + { + "epoch": 0.07, + "learning_rate": 1.974192315308356e-05, + "loss": 0.6675, + "step": 2101 + }, + { + "epoch": 0.07, + "learning_rate": 1.9741677317222927e-05, + "loss": 0.5874, + "step": 2102 + }, + { + "epoch": 0.07, + "learning_rate": 1.9741431365862385e-05, + "loss": 0.6805, + "step": 2103 + }, + { + "epoch": 0.07, + "learning_rate": 1.9741185299004852e-05, + "loss": 0.6416, + "step": 2104 + }, + { + "epoch": 0.07, + "learning_rate": 1.9740939116653245e-05, + "loss": 0.6179, + "step": 2105 + }, + { + "epoch": 0.07, + "learning_rate": 1.9740692818810484e-05, + "loss": 0.7175, + "step": 2106 + }, + { + "epoch": 0.07, + "learning_rate": 1.9740446405479487e-05, + "loss": 0.6455, + "step": 2107 + }, + { + "epoch": 0.07, + "learning_rate": 1.9740199876663175e-05, + "loss": 0.6981, + "step": 2108 + }, + { + "epoch": 0.07, + "learning_rate": 1.9739953232364474e-05, + "loss": 0.6375, + "step": 2109 + }, + { + "epoch": 0.07, + "learning_rate": 1.9739706472586305e-05, + "loss": 0.6463, + "step": 2110 + }, + { + "epoch": 0.07, + "learning_rate": 1.9739459597331593e-05, + "loss": 0.6573, + "step": 2111 + }, + { + "epoch": 0.07, + "learning_rate": 1.9739212606603267e-05, + "loss": 0.6311, + "step": 2112 + }, + { + "epoch": 0.07, + "learning_rate": 1.9738965500404256e-05, + "loss": 0.6602, + "step": 2113 + }, + { + "epoch": 0.07, + "learning_rate": 1.9738718278737493e-05, + "loss": 0.6505, + "step": 2114 + }, + { + "epoch": 0.07, + "learning_rate": 1.9738470941605903e-05, + "loss": 0.6822, + "step": 2115 + }, + { + "epoch": 0.07, + "learning_rate": 1.9738223489012422e-05, + "loss": 0.6629, + "step": 2116 + }, + { + "epoch": 0.07, + "learning_rate": 1.973797592095998e-05, + "loss": 0.6268, + "step": 2117 + }, + { + "epoch": 0.07, + "learning_rate": 1.9737728237451513e-05, + "loss": 0.7028, + "step": 2118 + }, + { + "epoch": 0.07, + "learning_rate": 1.9737480438489964e-05, + "loss": 0.6609, + "step": 2119 + }, + { + "epoch": 0.07, + "learning_rate": 1.9737232524078264e-05, + "loss": 0.6327, + "step": 2120 + }, + { + "epoch": 0.07, + "learning_rate": 1.9736984494219354e-05, + "loss": 0.6604, + "step": 2121 + }, + { + "epoch": 0.07, + "learning_rate": 1.9736736348916177e-05, + "loss": 0.6645, + "step": 2122 + }, + { + "epoch": 0.07, + "learning_rate": 1.9736488088171675e-05, + "loss": 0.6796, + "step": 2123 + }, + { + "epoch": 0.07, + "learning_rate": 1.9736239711988786e-05, + "loss": 0.68, + "step": 2124 + }, + { + "epoch": 0.07, + "learning_rate": 1.9735991220370462e-05, + "loss": 0.6625, + "step": 2125 + }, + { + "epoch": 0.07, + "learning_rate": 1.9735742613319643e-05, + "loss": 0.679, + "step": 2126 + }, + { + "epoch": 0.07, + "learning_rate": 1.9735493890839284e-05, + "loss": 0.6868, + "step": 2127 + }, + { + "epoch": 0.07, + "learning_rate": 1.9735245052932326e-05, + "loss": 0.648, + "step": 2128 + }, + { + "epoch": 0.07, + "learning_rate": 1.9734996099601726e-05, + "loss": 0.6652, + "step": 2129 + }, + { + "epoch": 0.07, + "learning_rate": 1.973474703085043e-05, + "loss": 0.6854, + "step": 2130 + }, + { + "epoch": 0.07, + "learning_rate": 1.9734497846681392e-05, + "loss": 0.6477, + "step": 2131 + }, + { + "epoch": 0.07, + "learning_rate": 1.973424854709757e-05, + "loss": 0.6479, + "step": 2132 + }, + { + "epoch": 0.07, + "learning_rate": 1.973399913210192e-05, + "loss": 0.6387, + "step": 2133 + }, + { + "epoch": 0.07, + "learning_rate": 1.973374960169739e-05, + "loss": 0.5708, + "step": 2134 + }, + { + "epoch": 0.07, + "learning_rate": 1.973349995588695e-05, + "loss": 0.6536, + "step": 2135 + }, + { + "epoch": 0.07, + "learning_rate": 1.9733250194673555e-05, + "loss": 0.6217, + "step": 2136 + }, + { + "epoch": 0.07, + "learning_rate": 1.9733000318060166e-05, + "loss": 0.6324, + "step": 2137 + }, + { + "epoch": 0.07, + "learning_rate": 1.9732750326049746e-05, + "loss": 0.6407, + "step": 2138 + }, + { + "epoch": 0.07, + "learning_rate": 1.9732500218645256e-05, + "loss": 0.6235, + "step": 2139 + }, + { + "epoch": 0.07, + "learning_rate": 1.9732249995849665e-05, + "loss": 0.6167, + "step": 2140 + }, + { + "epoch": 0.07, + "learning_rate": 1.9731999657665942e-05, + "loss": 0.6248, + "step": 2141 + }, + { + "epoch": 0.07, + "learning_rate": 1.973174920409705e-05, + "loss": 0.596, + "step": 2142 + }, + { + "epoch": 0.07, + "learning_rate": 1.973149863514596e-05, + "loss": 0.5955, + "step": 2143 + }, + { + "epoch": 0.07, + "learning_rate": 1.9731247950815646e-05, + "loss": 0.6754, + "step": 2144 + }, + { + "epoch": 0.07, + "learning_rate": 1.9730997151109075e-05, + "loss": 0.5907, + "step": 2145 + }, + { + "epoch": 0.07, + "learning_rate": 1.9730746236029224e-05, + "loss": 0.6457, + "step": 2146 + }, + { + "epoch": 0.07, + "learning_rate": 1.9730495205579067e-05, + "loss": 0.6364, + "step": 2147 + }, + { + "epoch": 0.07, + "learning_rate": 1.973024405976158e-05, + "loss": 0.6198, + "step": 2148 + }, + { + "epoch": 0.07, + "learning_rate": 1.972999279857974e-05, + "loss": 0.646, + "step": 2149 + }, + { + "epoch": 0.07, + "learning_rate": 1.9729741422036528e-05, + "loss": 0.6881, + "step": 2150 + }, + { + "epoch": 0.07, + "learning_rate": 1.972948993013492e-05, + "loss": 0.6325, + "step": 2151 + }, + { + "epoch": 0.07, + "learning_rate": 1.9729238322877905e-05, + "loss": 0.6259, + "step": 2152 + }, + { + "epoch": 0.07, + "learning_rate": 1.972898660026846e-05, + "loss": 0.6526, + "step": 2153 + }, + { + "epoch": 0.07, + "learning_rate": 1.9728734762309574e-05, + "loss": 0.6604, + "step": 2154 + }, + { + "epoch": 0.07, + "learning_rate": 1.972848280900423e-05, + "loss": 0.6643, + "step": 2155 + }, + { + "epoch": 0.07, + "learning_rate": 1.9728230740355413e-05, + "loss": 0.6364, + "step": 2156 + }, + { + "epoch": 0.07, + "learning_rate": 1.9727978556366115e-05, + "loss": 0.607, + "step": 2157 + }, + { + "epoch": 0.07, + "learning_rate": 1.972772625703933e-05, + "loss": 0.6759, + "step": 2158 + }, + { + "epoch": 0.07, + "learning_rate": 1.9727473842378037e-05, + "loss": 0.6367, + "step": 2159 + }, + { + "epoch": 0.07, + "learning_rate": 1.972722131238524e-05, + "loss": 0.5954, + "step": 2160 + }, + { + "epoch": 0.07, + "learning_rate": 1.972696866706393e-05, + "loss": 0.6104, + "step": 2161 + }, + { + "epoch": 0.07, + "learning_rate": 1.9726715906417102e-05, + "loss": 0.6591, + "step": 2162 + }, + { + "epoch": 0.07, + "learning_rate": 1.972646303044775e-05, + "loss": 0.6548, + "step": 2163 + }, + { + "epoch": 0.07, + "learning_rate": 1.972621003915888e-05, + "loss": 0.6675, + "step": 2164 + }, + { + "epoch": 0.08, + "learning_rate": 1.972595693255348e-05, + "loss": 0.6534, + "step": 2165 + }, + { + "epoch": 0.08, + "learning_rate": 1.972570371063456e-05, + "loss": 0.6971, + "step": 2166 + }, + { + "epoch": 0.08, + "learning_rate": 1.972545037340512e-05, + "loss": 0.6474, + "step": 2167 + }, + { + "epoch": 0.08, + "learning_rate": 1.972519692086816e-05, + "loss": 0.5973, + "step": 2168 + }, + { + "epoch": 0.08, + "learning_rate": 1.9724943353026692e-05, + "loss": 0.6762, + "step": 2169 + }, + { + "epoch": 0.08, + "learning_rate": 1.972468966988372e-05, + "loss": 0.6234, + "step": 2170 + }, + { + "epoch": 0.08, + "learning_rate": 1.9724435871442244e-05, + "loss": 0.6374, + "step": 2171 + }, + { + "epoch": 0.08, + "learning_rate": 1.972418195770528e-05, + "loss": 0.5963, + "step": 2172 + }, + { + "epoch": 0.08, + "learning_rate": 1.9723927928675844e-05, + "loss": 0.678, + "step": 2173 + }, + { + "epoch": 0.08, + "learning_rate": 1.972367378435694e-05, + "loss": 0.6222, + "step": 2174 + }, + { + "epoch": 0.08, + "learning_rate": 1.9723419524751578e-05, + "loss": 0.6535, + "step": 2175 + }, + { + "epoch": 0.08, + "learning_rate": 1.972316514986278e-05, + "loss": 0.6727, + "step": 2176 + }, + { + "epoch": 0.08, + "learning_rate": 1.9722910659693557e-05, + "loss": 0.7144, + "step": 2177 + }, + { + "epoch": 0.08, + "learning_rate": 1.972265605424693e-05, + "loss": 0.641, + "step": 2178 + }, + { + "epoch": 0.08, + "learning_rate": 1.972240133352592e-05, + "loss": 0.6344, + "step": 2179 + }, + { + "epoch": 0.08, + "learning_rate": 1.9722146497533538e-05, + "loss": 0.6611, + "step": 2180 + }, + { + "epoch": 0.08, + "learning_rate": 1.9721891546272812e-05, + "loss": 0.666, + "step": 2181 + }, + { + "epoch": 0.08, + "learning_rate": 1.9721636479746765e-05, + "loss": 0.6884, + "step": 2182 + }, + { + "epoch": 0.08, + "learning_rate": 1.972138129795842e-05, + "loss": 0.6944, + "step": 2183 + }, + { + "epoch": 0.08, + "learning_rate": 1.9721126000910802e-05, + "loss": 0.7121, + "step": 2184 + }, + { + "epoch": 0.08, + "learning_rate": 1.9720870588606936e-05, + "loss": 0.6755, + "step": 2185 + }, + { + "epoch": 0.08, + "learning_rate": 1.9720615061049852e-05, + "loss": 0.6368, + "step": 2186 + }, + { + "epoch": 0.08, + "learning_rate": 1.9720359418242582e-05, + "loss": 0.676, + "step": 2187 + }, + { + "epoch": 0.08, + "learning_rate": 1.9720103660188154e-05, + "loss": 0.7082, + "step": 2188 + }, + { + "epoch": 0.08, + "learning_rate": 1.9719847786889602e-05, + "loss": 0.6201, + "step": 2189 + }, + { + "epoch": 0.08, + "learning_rate": 1.9719591798349954e-05, + "loss": 0.7122, + "step": 2190 + }, + { + "epoch": 0.08, + "learning_rate": 1.9719335694572253e-05, + "loss": 0.6616, + "step": 2191 + }, + { + "epoch": 0.08, + "learning_rate": 1.9719079475559538e-05, + "loss": 0.6671, + "step": 2192 + }, + { + "epoch": 0.08, + "learning_rate": 1.9718823141314834e-05, + "loss": 0.6449, + "step": 2193 + }, + { + "epoch": 0.08, + "learning_rate": 1.971856669184119e-05, + "loss": 0.621, + "step": 2194 + }, + { + "epoch": 0.08, + "learning_rate": 1.9718310127141642e-05, + "loss": 0.6277, + "step": 2195 + }, + { + "epoch": 0.08, + "learning_rate": 1.9718053447219235e-05, + "loss": 0.6049, + "step": 2196 + }, + { + "epoch": 0.08, + "learning_rate": 1.9717796652077014e-05, + "loss": 0.6165, + "step": 2197 + }, + { + "epoch": 0.08, + "learning_rate": 1.9717539741718016e-05, + "loss": 0.615, + "step": 2198 + }, + { + "epoch": 0.08, + "learning_rate": 1.9717282716145292e-05, + "loss": 0.663, + "step": 2199 + }, + { + "epoch": 0.08, + "learning_rate": 1.971702557536189e-05, + "loss": 0.7006, + "step": 2200 + }, + { + "epoch": 0.08, + "learning_rate": 1.971676831937086e-05, + "loss": 0.6513, + "step": 2201 + }, + { + "epoch": 0.08, + "learning_rate": 1.9716510948175245e-05, + "loss": 0.6503, + "step": 2202 + }, + { + "epoch": 0.08, + "learning_rate": 1.9716253461778105e-05, + "loss": 0.5981, + "step": 2203 + }, + { + "epoch": 0.08, + "learning_rate": 1.9715995860182485e-05, + "loss": 0.6222, + "step": 2204 + }, + { + "epoch": 0.08, + "learning_rate": 1.971573814339145e-05, + "loss": 0.6454, + "step": 2205 + }, + { + "epoch": 0.08, + "learning_rate": 1.971548031140804e-05, + "loss": 0.6357, + "step": 2206 + }, + { + "epoch": 0.08, + "learning_rate": 1.971522236423533e-05, + "loss": 0.6123, + "step": 2207 + }, + { + "epoch": 0.08, + "learning_rate": 1.9714964301876364e-05, + "loss": 0.6826, + "step": 2208 + }, + { + "epoch": 0.08, + "learning_rate": 1.9714706124334207e-05, + "loss": 0.6515, + "step": 2209 + }, + { + "epoch": 0.08, + "learning_rate": 1.971444783161192e-05, + "loss": 0.6262, + "step": 2210 + }, + { + "epoch": 0.08, + "learning_rate": 1.9714189423712567e-05, + "loss": 0.6912, + "step": 2211 + }, + { + "epoch": 0.08, + "learning_rate": 1.9713930900639206e-05, + "loss": 0.6184, + "step": 2212 + }, + { + "epoch": 0.08, + "learning_rate": 1.971367226239491e-05, + "loss": 0.6372, + "step": 2213 + }, + { + "epoch": 0.08, + "learning_rate": 1.971341350898274e-05, + "loss": 0.7006, + "step": 2214 + }, + { + "epoch": 0.08, + "learning_rate": 1.9713154640405765e-05, + "loss": 0.62, + "step": 2215 + }, + { + "epoch": 0.08, + "learning_rate": 1.971289565666705e-05, + "loss": 0.6528, + "step": 2216 + }, + { + "epoch": 0.08, + "learning_rate": 1.9712636557769678e-05, + "loss": 0.6698, + "step": 2217 + }, + { + "epoch": 0.08, + "learning_rate": 1.9712377343716712e-05, + "loss": 0.6152, + "step": 2218 + }, + { + "epoch": 0.08, + "learning_rate": 1.9712118014511223e-05, + "loss": 0.6091, + "step": 2219 + }, + { + "epoch": 0.08, + "learning_rate": 1.971185857015629e-05, + "loss": 0.6574, + "step": 2220 + }, + { + "epoch": 0.08, + "learning_rate": 1.9711599010654987e-05, + "loss": 0.6124, + "step": 2221 + }, + { + "epoch": 0.08, + "learning_rate": 1.9711339336010393e-05, + "loss": 0.6586, + "step": 2222 + }, + { + "epoch": 0.08, + "learning_rate": 1.971107954622559e-05, + "loss": 0.5973, + "step": 2223 + }, + { + "epoch": 0.08, + "learning_rate": 1.971081964130365e-05, + "loss": 0.6331, + "step": 2224 + }, + { + "epoch": 0.08, + "learning_rate": 1.971055962124766e-05, + "loss": 0.6098, + "step": 2225 + }, + { + "epoch": 0.08, + "learning_rate": 1.9710299486060703e-05, + "loss": 0.6335, + "step": 2226 + }, + { + "epoch": 0.08, + "learning_rate": 1.971003923574586e-05, + "loss": 0.6483, + "step": 2227 + }, + { + "epoch": 0.08, + "learning_rate": 1.970977887030622e-05, + "loss": 0.6137, + "step": 2228 + }, + { + "epoch": 0.08, + "learning_rate": 1.9709518389744868e-05, + "loss": 0.6718, + "step": 2229 + }, + { + "epoch": 0.08, + "learning_rate": 1.970925779406489e-05, + "loss": 0.6727, + "step": 2230 + }, + { + "epoch": 0.08, + "learning_rate": 1.9708997083269382e-05, + "loss": 0.6501, + "step": 2231 + }, + { + "epoch": 0.08, + "learning_rate": 1.9708736257361435e-05, + "loss": 0.6003, + "step": 2232 + }, + { + "epoch": 0.08, + "learning_rate": 1.9708475316344133e-05, + "loss": 0.6659, + "step": 2233 + }, + { + "epoch": 0.08, + "learning_rate": 1.9708214260220577e-05, + "loss": 0.5728, + "step": 2234 + }, + { + "epoch": 0.08, + "learning_rate": 1.970795308899386e-05, + "loss": 0.636, + "step": 2235 + }, + { + "epoch": 0.08, + "learning_rate": 1.9707691802667076e-05, + "loss": 0.6266, + "step": 2236 + }, + { + "epoch": 0.08, + "learning_rate": 1.9707430401243325e-05, + "loss": 0.684, + "step": 2237 + }, + { + "epoch": 0.08, + "learning_rate": 1.9707168884725713e-05, + "loss": 0.6765, + "step": 2238 + }, + { + "epoch": 0.08, + "learning_rate": 1.970690725311733e-05, + "loss": 0.6843, + "step": 2239 + }, + { + "epoch": 0.08, + "learning_rate": 1.970664550642128e-05, + "loss": 0.6361, + "step": 2240 + }, + { + "epoch": 0.08, + "learning_rate": 1.970638364464067e-05, + "loss": 0.6403, + "step": 2241 + }, + { + "epoch": 0.08, + "learning_rate": 1.9706121667778605e-05, + "loss": 0.6601, + "step": 2242 + }, + { + "epoch": 0.08, + "learning_rate": 1.970585957583819e-05, + "loss": 0.6392, + "step": 2243 + }, + { + "epoch": 0.08, + "learning_rate": 1.9705597368822528e-05, + "loss": 0.6143, + "step": 2244 + }, + { + "epoch": 0.08, + "learning_rate": 1.9705335046734736e-05, + "loss": 0.6056, + "step": 2245 + }, + { + "epoch": 0.08, + "learning_rate": 1.9705072609577915e-05, + "loss": 0.6505, + "step": 2246 + }, + { + "epoch": 0.08, + "learning_rate": 1.9704810057355185e-05, + "loss": 0.6225, + "step": 2247 + }, + { + "epoch": 0.08, + "learning_rate": 1.9704547390069653e-05, + "loss": 0.5879, + "step": 2248 + }, + { + "epoch": 0.08, + "learning_rate": 1.9704284607724435e-05, + "loss": 0.6255, + "step": 2249 + }, + { + "epoch": 0.08, + "learning_rate": 1.970402171032265e-05, + "loss": 0.6619, + "step": 2250 + }, + { + "epoch": 0.08, + "learning_rate": 1.9703758697867407e-05, + "loss": 0.6645, + "step": 2251 + }, + { + "epoch": 0.08, + "learning_rate": 1.9703495570361834e-05, + "loss": 0.6372, + "step": 2252 + }, + { + "epoch": 0.08, + "learning_rate": 1.9703232327809044e-05, + "loss": 0.6941, + "step": 2253 + }, + { + "epoch": 0.08, + "learning_rate": 1.9702968970212158e-05, + "loss": 0.6171, + "step": 2254 + }, + { + "epoch": 0.08, + "learning_rate": 1.9702705497574306e-05, + "loss": 0.7018, + "step": 2255 + }, + { + "epoch": 0.08, + "learning_rate": 1.9702441909898603e-05, + "loss": 0.6013, + "step": 2256 + }, + { + "epoch": 0.08, + "learning_rate": 1.9702178207188178e-05, + "loss": 0.6586, + "step": 2257 + }, + { + "epoch": 0.08, + "learning_rate": 1.9701914389446156e-05, + "loss": 0.696, + "step": 2258 + }, + { + "epoch": 0.08, + "learning_rate": 1.9701650456675663e-05, + "loss": 0.6375, + "step": 2259 + }, + { + "epoch": 0.08, + "learning_rate": 1.970138640887984e-05, + "loss": 0.6344, + "step": 2260 + }, + { + "epoch": 0.08, + "learning_rate": 1.9701122246061804e-05, + "loss": 0.6603, + "step": 2261 + }, + { + "epoch": 0.08, + "learning_rate": 1.9700857968224692e-05, + "loss": 0.6233, + "step": 2262 + }, + { + "epoch": 0.08, + "learning_rate": 1.9700593575371636e-05, + "loss": 0.6682, + "step": 2263 + }, + { + "epoch": 0.08, + "learning_rate": 1.9700329067505772e-05, + "loss": 0.5949, + "step": 2264 + }, + { + "epoch": 0.08, + "learning_rate": 1.9700064444630236e-05, + "loss": 0.6485, + "step": 2265 + }, + { + "epoch": 0.08, + "learning_rate": 1.9699799706748165e-05, + "loss": 0.6615, + "step": 2266 + }, + { + "epoch": 0.08, + "learning_rate": 1.96995348538627e-05, + "loss": 0.6824, + "step": 2267 + }, + { + "epoch": 0.08, + "learning_rate": 1.9699269885976976e-05, + "loss": 0.6091, + "step": 2268 + }, + { + "epoch": 0.08, + "learning_rate": 1.9699004803094143e-05, + "loss": 0.6602, + "step": 2269 + }, + { + "epoch": 0.08, + "learning_rate": 1.9698739605217335e-05, + "loss": 0.6149, + "step": 2270 + }, + { + "epoch": 0.08, + "learning_rate": 1.96984742923497e-05, + "loss": 0.6128, + "step": 2271 + }, + { + "epoch": 0.08, + "learning_rate": 1.9698208864494385e-05, + "loss": 0.6864, + "step": 2272 + }, + { + "epoch": 0.08, + "learning_rate": 1.9697943321654535e-05, + "loss": 0.5946, + "step": 2273 + }, + { + "epoch": 0.08, + "learning_rate": 1.96976776638333e-05, + "loss": 0.6462, + "step": 2274 + }, + { + "epoch": 0.08, + "learning_rate": 1.9697411891033828e-05, + "loss": 0.7159, + "step": 2275 + }, + { + "epoch": 0.08, + "learning_rate": 1.969714600325927e-05, + "loss": 0.5784, + "step": 2276 + }, + { + "epoch": 0.08, + "learning_rate": 1.969688000051278e-05, + "loss": 0.6593, + "step": 2277 + }, + { + "epoch": 0.08, + "learning_rate": 1.969661388279751e-05, + "loss": 0.6379, + "step": 2278 + }, + { + "epoch": 0.08, + "learning_rate": 1.969634765011662e-05, + "loss": 0.6413, + "step": 2279 + }, + { + "epoch": 0.08, + "learning_rate": 1.9696081302473257e-05, + "loss": 0.6062, + "step": 2280 + }, + { + "epoch": 0.08, + "learning_rate": 1.969581483987059e-05, + "loss": 0.6211, + "step": 2281 + }, + { + "epoch": 0.08, + "learning_rate": 1.9695548262311765e-05, + "loss": 0.6658, + "step": 2282 + }, + { + "epoch": 0.08, + "learning_rate": 1.9695281569799957e-05, + "loss": 0.6595, + "step": 2283 + }, + { + "epoch": 0.08, + "learning_rate": 1.969501476233832e-05, + "loss": 0.6879, + "step": 2284 + }, + { + "epoch": 0.08, + "learning_rate": 1.969474783993002e-05, + "loss": 0.568, + "step": 2285 + }, + { + "epoch": 0.08, + "learning_rate": 1.9694480802578217e-05, + "loss": 0.6625, + "step": 2286 + }, + { + "epoch": 0.08, + "learning_rate": 1.9694213650286083e-05, + "loss": 0.6992, + "step": 2287 + }, + { + "epoch": 0.08, + "learning_rate": 1.969394638305678e-05, + "loss": 0.6755, + "step": 2288 + }, + { + "epoch": 0.08, + "learning_rate": 1.9693679000893484e-05, + "loss": 0.6506, + "step": 2289 + }, + { + "epoch": 0.08, + "learning_rate": 1.9693411503799358e-05, + "loss": 0.6419, + "step": 2290 + }, + { + "epoch": 0.08, + "learning_rate": 1.969314389177758e-05, + "loss": 0.6772, + "step": 2291 + }, + { + "epoch": 0.08, + "learning_rate": 1.9692876164831314e-05, + "loss": 0.6185, + "step": 2292 + }, + { + "epoch": 0.08, + "learning_rate": 1.9692608322963743e-05, + "loss": 0.5849, + "step": 2293 + }, + { + "epoch": 0.08, + "learning_rate": 1.969234036617804e-05, + "loss": 0.6105, + "step": 2294 + }, + { + "epoch": 0.08, + "learning_rate": 1.9692072294477378e-05, + "loss": 0.6211, + "step": 2295 + }, + { + "epoch": 0.08, + "learning_rate": 1.969180410786494e-05, + "loss": 0.6509, + "step": 2296 + }, + { + "epoch": 0.08, + "learning_rate": 1.9691535806343905e-05, + "loss": 0.6455, + "step": 2297 + }, + { + "epoch": 0.08, + "learning_rate": 1.969126738991745e-05, + "loss": 0.6573, + "step": 2298 + }, + { + "epoch": 0.08, + "learning_rate": 1.969099885858876e-05, + "loss": 0.6929, + "step": 2299 + }, + { + "epoch": 0.08, + "learning_rate": 1.9690730212361026e-05, + "loss": 0.6488, + "step": 2300 + }, + { + "epoch": 0.08, + "learning_rate": 1.9690461451237423e-05, + "loss": 0.5831, + "step": 2301 + }, + { + "epoch": 0.08, + "learning_rate": 1.969019257522114e-05, + "loss": 0.6445, + "step": 2302 + }, + { + "epoch": 0.08, + "learning_rate": 1.9689923584315364e-05, + "loss": 0.6763, + "step": 2303 + }, + { + "epoch": 0.08, + "learning_rate": 1.968965447852329e-05, + "loss": 0.63, + "step": 2304 + }, + { + "epoch": 0.08, + "learning_rate": 1.9689385257848102e-05, + "loss": 0.6482, + "step": 2305 + }, + { + "epoch": 0.08, + "learning_rate": 1.9689115922292996e-05, + "loss": 0.691, + "step": 2306 + }, + { + "epoch": 0.08, + "learning_rate": 1.9688846471861163e-05, + "loss": 0.624, + "step": 2307 + }, + { + "epoch": 0.08, + "learning_rate": 1.96885769065558e-05, + "loss": 0.6146, + "step": 2308 + }, + { + "epoch": 0.08, + "learning_rate": 1.96883072263801e-05, + "loss": 0.5542, + "step": 2309 + }, + { + "epoch": 0.08, + "learning_rate": 1.968803743133726e-05, + "loss": 0.6864, + "step": 2310 + }, + { + "epoch": 0.08, + "learning_rate": 1.9687767521430485e-05, + "loss": 0.6508, + "step": 2311 + }, + { + "epoch": 0.08, + "learning_rate": 1.9687497496662972e-05, + "loss": 0.6303, + "step": 2312 + }, + { + "epoch": 0.08, + "learning_rate": 1.968722735703792e-05, + "loss": 0.6589, + "step": 2313 + }, + { + "epoch": 0.08, + "learning_rate": 1.968695710255853e-05, + "loss": 0.6575, + "step": 2314 + }, + { + "epoch": 0.08, + "learning_rate": 1.9686686733228014e-05, + "loss": 0.6417, + "step": 2315 + }, + { + "epoch": 0.08, + "learning_rate": 1.968641624904957e-05, + "loss": 0.7045, + "step": 2316 + }, + { + "epoch": 0.08, + "learning_rate": 1.968614565002641e-05, + "loss": 0.6264, + "step": 2317 + }, + { + "epoch": 0.08, + "learning_rate": 1.9685874936161738e-05, + "loss": 0.6893, + "step": 2318 + }, + { + "epoch": 0.08, + "learning_rate": 1.9685604107458768e-05, + "loss": 0.6542, + "step": 2319 + }, + { + "epoch": 0.08, + "learning_rate": 1.968533316392071e-05, + "loss": 0.6461, + "step": 2320 + }, + { + "epoch": 0.08, + "learning_rate": 1.9685062105550773e-05, + "loss": 0.645, + "step": 2321 + }, + { + "epoch": 0.08, + "learning_rate": 1.968479093235217e-05, + "loss": 0.6441, + "step": 2322 + }, + { + "epoch": 0.08, + "learning_rate": 1.9684519644328123e-05, + "loss": 0.6407, + "step": 2323 + }, + { + "epoch": 0.08, + "learning_rate": 1.9684248241481844e-05, + "loss": 0.6348, + "step": 2324 + }, + { + "epoch": 0.08, + "learning_rate": 1.9683976723816553e-05, + "loss": 0.6855, + "step": 2325 + }, + { + "epoch": 0.08, + "learning_rate": 1.9683705091335467e-05, + "loss": 0.6835, + "step": 2326 + }, + { + "epoch": 0.08, + "learning_rate": 1.9683433344041804e-05, + "loss": 0.6439, + "step": 2327 + }, + { + "epoch": 0.08, + "learning_rate": 1.9683161481938794e-05, + "loss": 0.6287, + "step": 2328 + }, + { + "epoch": 0.08, + "learning_rate": 1.9682889505029653e-05, + "loss": 0.6405, + "step": 2329 + }, + { + "epoch": 0.08, + "learning_rate": 1.9682617413317607e-05, + "loss": 0.6536, + "step": 2330 + }, + { + "epoch": 0.08, + "learning_rate": 1.9682345206805885e-05, + "loss": 0.6686, + "step": 2331 + }, + { + "epoch": 0.08, + "learning_rate": 1.9682072885497712e-05, + "loss": 0.5975, + "step": 2332 + }, + { + "epoch": 0.08, + "learning_rate": 1.9681800449396317e-05, + "loss": 0.6634, + "step": 2333 + }, + { + "epoch": 0.08, + "learning_rate": 1.968152789850493e-05, + "loss": 0.6204, + "step": 2334 + }, + { + "epoch": 0.08, + "learning_rate": 1.968125523282678e-05, + "loss": 0.6376, + "step": 2335 + }, + { + "epoch": 0.08, + "learning_rate": 1.9680982452365105e-05, + "loss": 0.6625, + "step": 2336 + }, + { + "epoch": 0.08, + "learning_rate": 1.9680709557123135e-05, + "loss": 0.6287, + "step": 2337 + }, + { + "epoch": 0.08, + "learning_rate": 1.968043654710411e-05, + "loss": 0.6437, + "step": 2338 + }, + { + "epoch": 0.08, + "learning_rate": 1.968016342231126e-05, + "loss": 0.6965, + "step": 2339 + }, + { + "epoch": 0.08, + "learning_rate": 1.967989018274783e-05, + "loss": 0.6205, + "step": 2340 + }, + { + "epoch": 0.08, + "learning_rate": 1.9679616828417058e-05, + "loss": 0.6088, + "step": 2341 + }, + { + "epoch": 0.08, + "learning_rate": 1.967934335932218e-05, + "loss": 0.6458, + "step": 2342 + }, + { + "epoch": 0.08, + "learning_rate": 1.9679069775466444e-05, + "loss": 0.6516, + "step": 2343 + }, + { + "epoch": 0.08, + "learning_rate": 1.967879607685309e-05, + "loss": 0.6275, + "step": 2344 + }, + { + "epoch": 0.08, + "learning_rate": 1.9678522263485368e-05, + "loss": 0.6128, + "step": 2345 + }, + { + "epoch": 0.08, + "learning_rate": 1.967824833536652e-05, + "loss": 0.6036, + "step": 2346 + }, + { + "epoch": 0.08, + "learning_rate": 1.967797429249979e-05, + "loss": 0.6548, + "step": 2347 + }, + { + "epoch": 0.08, + "learning_rate": 1.9677700134888438e-05, + "loss": 0.6545, + "step": 2348 + }, + { + "epoch": 0.08, + "learning_rate": 1.9677425862535708e-05, + "loss": 0.639, + "step": 2349 + }, + { + "epoch": 0.08, + "learning_rate": 1.967715147544485e-05, + "loss": 0.6142, + "step": 2350 + }, + { + "epoch": 0.08, + "learning_rate": 1.967687697361912e-05, + "loss": 0.6152, + "step": 2351 + }, + { + "epoch": 0.08, + "learning_rate": 1.9676602357061775e-05, + "loss": 0.6211, + "step": 2352 + }, + { + "epoch": 0.08, + "learning_rate": 1.9676327625776067e-05, + "loss": 0.6446, + "step": 2353 + }, + { + "epoch": 0.08, + "learning_rate": 1.9676052779765255e-05, + "loss": 0.7061, + "step": 2354 + }, + { + "epoch": 0.08, + "learning_rate": 1.9675777819032592e-05, + "loss": 0.6398, + "step": 2355 + }, + { + "epoch": 0.08, + "learning_rate": 1.9675502743581348e-05, + "loss": 0.6813, + "step": 2356 + }, + { + "epoch": 0.08, + "learning_rate": 1.9675227553414778e-05, + "loss": 0.7004, + "step": 2357 + }, + { + "epoch": 0.08, + "learning_rate": 1.9674952248536146e-05, + "loss": 0.6159, + "step": 2358 + }, + { + "epoch": 0.08, + "learning_rate": 1.9674676828948717e-05, + "loss": 0.6823, + "step": 2359 + }, + { + "epoch": 0.08, + "learning_rate": 1.9674401294655758e-05, + "loss": 0.6689, + "step": 2360 + }, + { + "epoch": 0.08, + "learning_rate": 1.9674125645660527e-05, + "loss": 0.6213, + "step": 2361 + }, + { + "epoch": 0.08, + "learning_rate": 1.9673849881966302e-05, + "loss": 0.6579, + "step": 2362 + }, + { + "epoch": 0.08, + "learning_rate": 1.967357400357635e-05, + "loss": 0.6596, + "step": 2363 + }, + { + "epoch": 0.08, + "learning_rate": 1.967329801049394e-05, + "loss": 0.5946, + "step": 2364 + }, + { + "epoch": 0.08, + "learning_rate": 1.967302190272235e-05, + "loss": 0.59, + "step": 2365 + }, + { + "epoch": 0.08, + "learning_rate": 1.967274568026484e-05, + "loss": 0.6563, + "step": 2366 + }, + { + "epoch": 0.08, + "learning_rate": 1.96724693431247e-05, + "loss": 0.6346, + "step": 2367 + }, + { + "epoch": 0.08, + "learning_rate": 1.9672192891305197e-05, + "loss": 0.6637, + "step": 2368 + }, + { + "epoch": 0.08, + "learning_rate": 1.967191632480961e-05, + "loss": 0.652, + "step": 2369 + }, + { + "epoch": 0.08, + "learning_rate": 1.9671639643641227e-05, + "loss": 0.659, + "step": 2370 + }, + { + "epoch": 0.08, + "learning_rate": 1.9671362847803316e-05, + "loss": 0.6262, + "step": 2371 + }, + { + "epoch": 0.08, + "learning_rate": 1.9671085937299166e-05, + "loss": 0.6316, + "step": 2372 + }, + { + "epoch": 0.08, + "learning_rate": 1.967080891213206e-05, + "loss": 0.6868, + "step": 2373 + }, + { + "epoch": 0.08, + "learning_rate": 1.9670531772305277e-05, + "loss": 0.5558, + "step": 2374 + }, + { + "epoch": 0.08, + "learning_rate": 1.9670254517822108e-05, + "loss": 0.6651, + "step": 2375 + }, + { + "epoch": 0.08, + "learning_rate": 1.9669977148685843e-05, + "loss": 0.7398, + "step": 2376 + }, + { + "epoch": 0.08, + "learning_rate": 1.966969966489976e-05, + "loss": 0.679, + "step": 2377 + }, + { + "epoch": 0.08, + "learning_rate": 1.966942206646716e-05, + "loss": 0.6307, + "step": 2378 + }, + { + "epoch": 0.08, + "learning_rate": 1.9669144353391326e-05, + "loss": 0.6484, + "step": 2379 + }, + { + "epoch": 0.08, + "learning_rate": 1.9668866525675553e-05, + "loss": 0.7205, + "step": 2380 + }, + { + "epoch": 0.08, + "learning_rate": 1.966858858332314e-05, + "loss": 0.6429, + "step": 2381 + }, + { + "epoch": 0.08, + "learning_rate": 1.9668310526337376e-05, + "loss": 0.6772, + "step": 2382 + }, + { + "epoch": 0.08, + "learning_rate": 1.9668032354721562e-05, + "loss": 0.6608, + "step": 2383 + }, + { + "epoch": 0.08, + "learning_rate": 1.966775406847899e-05, + "loss": 0.576, + "step": 2384 + }, + { + "epoch": 0.08, + "learning_rate": 1.966747566761297e-05, + "loss": 0.6594, + "step": 2385 + }, + { + "epoch": 0.08, + "learning_rate": 1.9667197152126794e-05, + "loss": 0.6165, + "step": 2386 + }, + { + "epoch": 0.08, + "learning_rate": 1.966691852202377e-05, + "loss": 0.6754, + "step": 2387 + }, + { + "epoch": 0.08, + "learning_rate": 1.9666639777307193e-05, + "loss": 0.6696, + "step": 2388 + }, + { + "epoch": 0.08, + "learning_rate": 1.9666360917980375e-05, + "loss": 0.6064, + "step": 2389 + }, + { + "epoch": 0.08, + "learning_rate": 1.966608194404662e-05, + "loss": 0.7055, + "step": 2390 + }, + { + "epoch": 0.08, + "learning_rate": 1.9665802855509236e-05, + "loss": 0.6496, + "step": 2391 + }, + { + "epoch": 0.08, + "learning_rate": 1.966552365237153e-05, + "loss": 0.6624, + "step": 2392 + }, + { + "epoch": 0.08, + "learning_rate": 1.9665244334636818e-05, + "loss": 0.6558, + "step": 2393 + }, + { + "epoch": 0.08, + "learning_rate": 1.9664964902308404e-05, + "loss": 0.6365, + "step": 2394 + }, + { + "epoch": 0.08, + "learning_rate": 1.9664685355389607e-05, + "loss": 0.6595, + "step": 2395 + }, + { + "epoch": 0.08, + "learning_rate": 1.966440569388374e-05, + "loss": 0.6099, + "step": 2396 + }, + { + "epoch": 0.08, + "learning_rate": 1.9664125917794116e-05, + "loss": 0.6556, + "step": 2397 + }, + { + "epoch": 0.08, + "learning_rate": 1.9663846027124057e-05, + "loss": 0.6563, + "step": 2398 + }, + { + "epoch": 0.08, + "learning_rate": 1.9663566021876875e-05, + "loss": 0.6486, + "step": 2399 + }, + { + "epoch": 0.08, + "learning_rate": 1.9663285902055893e-05, + "loss": 0.6313, + "step": 2400 + }, + { + "epoch": 0.08, + "learning_rate": 1.9663005667664435e-05, + "loss": 0.7002, + "step": 2401 + }, + { + "epoch": 0.08, + "learning_rate": 1.966272531870582e-05, + "loss": 0.6634, + "step": 2402 + }, + { + "epoch": 0.08, + "learning_rate": 1.9662444855183373e-05, + "loss": 0.6136, + "step": 2403 + }, + { + "epoch": 0.08, + "learning_rate": 1.966216427710042e-05, + "loss": 0.6273, + "step": 2404 + }, + { + "epoch": 0.08, + "learning_rate": 1.9661883584460288e-05, + "loss": 0.6624, + "step": 2405 + }, + { + "epoch": 0.08, + "learning_rate": 1.9661602777266303e-05, + "loss": 0.6488, + "step": 2406 + }, + { + "epoch": 0.08, + "learning_rate": 1.966132185552179e-05, + "loss": 0.6148, + "step": 2407 + }, + { + "epoch": 0.08, + "learning_rate": 1.966104081923009e-05, + "loss": 0.6318, + "step": 2408 + }, + { + "epoch": 0.08, + "learning_rate": 1.966075966839453e-05, + "loss": 0.6337, + "step": 2409 + }, + { + "epoch": 0.08, + "learning_rate": 1.966047840301844e-05, + "loss": 0.6249, + "step": 2410 + }, + { + "epoch": 0.08, + "learning_rate": 1.9660197023105162e-05, + "loss": 0.7171, + "step": 2411 + }, + { + "epoch": 0.08, + "learning_rate": 1.9659915528658025e-05, + "loss": 0.5855, + "step": 2412 + }, + { + "epoch": 0.08, + "learning_rate": 1.9659633919680372e-05, + "loss": 0.6123, + "step": 2413 + }, + { + "epoch": 0.08, + "learning_rate": 1.9659352196175537e-05, + "loss": 0.6755, + "step": 2414 + }, + { + "epoch": 0.08, + "learning_rate": 1.9659070358146863e-05, + "loss": 0.6762, + "step": 2415 + }, + { + "epoch": 0.08, + "learning_rate": 1.965878840559769e-05, + "loss": 0.6306, + "step": 2416 + }, + { + "epoch": 0.08, + "learning_rate": 1.9658506338531366e-05, + "loss": 0.6536, + "step": 2417 + }, + { + "epoch": 0.08, + "learning_rate": 1.9658224156951227e-05, + "loss": 0.6233, + "step": 2418 + }, + { + "epoch": 0.08, + "learning_rate": 1.9657941860860627e-05, + "loss": 0.6342, + "step": 2419 + }, + { + "epoch": 0.08, + "learning_rate": 1.9657659450262905e-05, + "loss": 0.6431, + "step": 2420 + }, + { + "epoch": 0.08, + "learning_rate": 1.9657376925161413e-05, + "loss": 0.6225, + "step": 2421 + }, + { + "epoch": 0.08, + "learning_rate": 1.9657094285559505e-05, + "loss": 0.6511, + "step": 2422 + }, + { + "epoch": 0.08, + "learning_rate": 1.9656811531460524e-05, + "loss": 0.6108, + "step": 2423 + }, + { + "epoch": 0.08, + "learning_rate": 1.965652866286783e-05, + "loss": 0.6491, + "step": 2424 + }, + { + "epoch": 0.08, + "learning_rate": 1.965624567978477e-05, + "loss": 0.6653, + "step": 2425 + }, + { + "epoch": 0.08, + "learning_rate": 1.9655962582214702e-05, + "loss": 0.6419, + "step": 2426 + }, + { + "epoch": 0.08, + "learning_rate": 1.965567937016099e-05, + "loss": 0.6838, + "step": 2427 + }, + { + "epoch": 0.08, + "learning_rate": 1.9655396043626975e-05, + "loss": 0.6447, + "step": 2428 + }, + { + "epoch": 0.08, + "learning_rate": 1.9655112602616027e-05, + "loss": 0.6391, + "step": 2429 + }, + { + "epoch": 0.08, + "learning_rate": 1.9654829047131508e-05, + "loss": 0.7095, + "step": 2430 + }, + { + "epoch": 0.08, + "learning_rate": 1.9654545377176778e-05, + "loss": 0.6124, + "step": 2431 + }, + { + "epoch": 0.08, + "learning_rate": 1.96542615927552e-05, + "loss": 0.7071, + "step": 2432 + }, + { + "epoch": 0.08, + "learning_rate": 1.9653977693870138e-05, + "loss": 0.6509, + "step": 2433 + }, + { + "epoch": 0.08, + "learning_rate": 1.9653693680524957e-05, + "loss": 0.7269, + "step": 2434 + }, + { + "epoch": 0.08, + "learning_rate": 1.965340955272302e-05, + "loss": 0.6307, + "step": 2435 + }, + { + "epoch": 0.08, + "learning_rate": 1.965312531046771e-05, + "loss": 0.6143, + "step": 2436 + }, + { + "epoch": 0.08, + "learning_rate": 1.9652840953762384e-05, + "loss": 0.6112, + "step": 2437 + }, + { + "epoch": 0.08, + "learning_rate": 1.965255648261042e-05, + "loss": 0.611, + "step": 2438 + }, + { + "epoch": 0.08, + "learning_rate": 1.9652271897015185e-05, + "loss": 0.6468, + "step": 2439 + }, + { + "epoch": 0.08, + "learning_rate": 1.965198719698006e-05, + "loss": 0.6241, + "step": 2440 + }, + { + "epoch": 0.08, + "learning_rate": 1.965170238250841e-05, + "loss": 0.6413, + "step": 2441 + }, + { + "epoch": 0.08, + "learning_rate": 1.9651417453603625e-05, + "loss": 0.6714, + "step": 2442 + }, + { + "epoch": 0.08, + "learning_rate": 1.9651132410269075e-05, + "loss": 0.6638, + "step": 2443 + }, + { + "epoch": 0.08, + "learning_rate": 1.965084725250814e-05, + "loss": 0.6673, + "step": 2444 + }, + { + "epoch": 0.08, + "learning_rate": 1.965056198032421e-05, + "loss": 0.6142, + "step": 2445 + }, + { + "epoch": 0.08, + "learning_rate": 1.965027659372065e-05, + "loss": 0.6838, + "step": 2446 + }, + { + "epoch": 0.08, + "learning_rate": 1.964999109270086e-05, + "loss": 0.66, + "step": 2447 + }, + { + "epoch": 0.08, + "learning_rate": 1.9649705477268215e-05, + "loss": 0.6516, + "step": 2448 + }, + { + "epoch": 0.08, + "learning_rate": 1.9649419747426105e-05, + "loss": 0.6575, + "step": 2449 + }, + { + "epoch": 0.08, + "learning_rate": 1.9649133903177918e-05, + "loss": 0.6742, + "step": 2450 + }, + { + "epoch": 0.08, + "learning_rate": 1.9648847944527042e-05, + "loss": 0.6536, + "step": 2451 + }, + { + "epoch": 0.08, + "learning_rate": 1.964856187147687e-05, + "loss": 0.7029, + "step": 2452 + }, + { + "epoch": 0.08, + "learning_rate": 1.964827568403079e-05, + "loss": 0.6345, + "step": 2453 + }, + { + "epoch": 0.09, + "learning_rate": 1.9647989382192195e-05, + "loss": 0.6208, + "step": 2454 + }, + { + "epoch": 0.09, + "learning_rate": 1.964770296596448e-05, + "loss": 0.6461, + "step": 2455 + }, + { + "epoch": 0.09, + "learning_rate": 1.9647416435351047e-05, + "loss": 0.6667, + "step": 2456 + }, + { + "epoch": 0.09, + "learning_rate": 1.9647129790355282e-05, + "loss": 0.6493, + "step": 2457 + }, + { + "epoch": 0.09, + "learning_rate": 1.9646843030980597e-05, + "loss": 0.6895, + "step": 2458 + }, + { + "epoch": 0.09, + "learning_rate": 1.9646556157230378e-05, + "loss": 0.6002, + "step": 2459 + }, + { + "epoch": 0.09, + "learning_rate": 1.9646269169108038e-05, + "loss": 0.6145, + "step": 2460 + }, + { + "epoch": 0.09, + "learning_rate": 1.9645982066616968e-05, + "loss": 0.6683, + "step": 2461 + }, + { + "epoch": 0.09, + "learning_rate": 1.9645694849760584e-05, + "loss": 0.6422, + "step": 2462 + }, + { + "epoch": 0.09, + "learning_rate": 1.9645407518542284e-05, + "loss": 0.6735, + "step": 2463 + }, + { + "epoch": 0.09, + "learning_rate": 1.9645120072965475e-05, + "loss": 0.6339, + "step": 2464 + }, + { + "epoch": 0.09, + "learning_rate": 1.9644832513033568e-05, + "loss": 0.6536, + "step": 2465 + }, + { + "epoch": 0.09, + "learning_rate": 1.964454483874997e-05, + "loss": 0.5935, + "step": 2466 + }, + { + "epoch": 0.09, + "learning_rate": 1.9644257050118092e-05, + "loss": 0.6051, + "step": 2467 + }, + { + "epoch": 0.09, + "learning_rate": 1.9643969147141348e-05, + "loss": 0.6445, + "step": 2468 + }, + { + "epoch": 0.09, + "learning_rate": 1.9643681129823152e-05, + "loss": 0.6039, + "step": 2469 + }, + { + "epoch": 0.09, + "learning_rate": 1.9643392998166912e-05, + "loss": 0.632, + "step": 2470 + }, + { + "epoch": 0.09, + "learning_rate": 1.964310475217605e-05, + "loss": 0.647, + "step": 2471 + }, + { + "epoch": 0.09, + "learning_rate": 1.9642816391853987e-05, + "loss": 0.6165, + "step": 2472 + }, + { + "epoch": 0.09, + "learning_rate": 1.9642527917204132e-05, + "loss": 0.6499, + "step": 2473 + }, + { + "epoch": 0.09, + "learning_rate": 1.9642239328229915e-05, + "loss": 0.6483, + "step": 2474 + }, + { + "epoch": 0.09, + "learning_rate": 1.964195062493475e-05, + "loss": 0.6338, + "step": 2475 + }, + { + "epoch": 0.09, + "learning_rate": 1.9641661807322066e-05, + "loss": 0.6835, + "step": 2476 + }, + { + "epoch": 0.09, + "learning_rate": 1.9641372875395285e-05, + "loss": 0.6518, + "step": 2477 + }, + { + "epoch": 0.09, + "learning_rate": 1.964108382915783e-05, + "loss": 0.6701, + "step": 2478 + }, + { + "epoch": 0.09, + "learning_rate": 1.9640794668613128e-05, + "loss": 0.604, + "step": 2479 + }, + { + "epoch": 0.09, + "learning_rate": 1.9640505393764614e-05, + "loss": 0.6215, + "step": 2480 + }, + { + "epoch": 0.09, + "learning_rate": 1.9640216004615712e-05, + "loss": 0.624, + "step": 2481 + }, + { + "epoch": 0.09, + "learning_rate": 1.963992650116985e-05, + "loss": 0.6407, + "step": 2482 + }, + { + "epoch": 0.09, + "learning_rate": 1.9639636883430467e-05, + "loss": 0.6325, + "step": 2483 + }, + { + "epoch": 0.09, + "learning_rate": 1.9639347151401e-05, + "loss": 0.635, + "step": 2484 + }, + { + "epoch": 0.09, + "learning_rate": 1.963905730508487e-05, + "loss": 0.607, + "step": 2485 + }, + { + "epoch": 0.09, + "learning_rate": 1.963876734448553e-05, + "loss": 0.6267, + "step": 2486 + }, + { + "epoch": 0.09, + "learning_rate": 1.9638477269606405e-05, + "loss": 0.646, + "step": 2487 + }, + { + "epoch": 0.09, + "learning_rate": 1.963818708045094e-05, + "loss": 0.5939, + "step": 2488 + }, + { + "epoch": 0.09, + "learning_rate": 1.9637896777022577e-05, + "loss": 0.6435, + "step": 2489 + }, + { + "epoch": 0.09, + "learning_rate": 1.9637606359324756e-05, + "loss": 0.6321, + "step": 2490 + }, + { + "epoch": 0.09, + "learning_rate": 1.9637315827360916e-05, + "loss": 0.6389, + "step": 2491 + }, + { + "epoch": 0.09, + "learning_rate": 1.963702518113451e-05, + "loss": 0.6848, + "step": 2492 + }, + { + "epoch": 0.09, + "learning_rate": 1.9636734420648977e-05, + "loss": 0.6075, + "step": 2493 + }, + { + "epoch": 0.09, + "learning_rate": 1.963644354590777e-05, + "loss": 0.6157, + "step": 2494 + }, + { + "epoch": 0.09, + "learning_rate": 1.963615255691433e-05, + "loss": 0.6214, + "step": 2495 + }, + { + "epoch": 0.09, + "learning_rate": 1.9635861453672113e-05, + "loss": 0.6631, + "step": 2496 + }, + { + "epoch": 0.09, + "learning_rate": 1.963557023618457e-05, + "loss": 0.6313, + "step": 2497 + }, + { + "epoch": 0.09, + "learning_rate": 1.9635278904455152e-05, + "loss": 0.6703, + "step": 2498 + }, + { + "epoch": 0.09, + "learning_rate": 1.9634987458487315e-05, + "loss": 0.635, + "step": 2499 + }, + { + "epoch": 0.09, + "learning_rate": 1.9634695898284515e-05, + "loss": 0.6346, + "step": 2500 + }, + { + "epoch": 0.09, + "learning_rate": 1.9634404223850202e-05, + "loss": 0.6277, + "step": 2501 + }, + { + "epoch": 0.09, + "learning_rate": 1.9634112435187844e-05, + "loss": 0.7033, + "step": 2502 + }, + { + "epoch": 0.09, + "learning_rate": 1.9633820532300894e-05, + "loss": 0.6695, + "step": 2503 + }, + { + "epoch": 0.09, + "learning_rate": 1.9633528515192816e-05, + "loss": 0.6626, + "step": 2504 + }, + { + "epoch": 0.09, + "learning_rate": 1.963323638386707e-05, + "loss": 0.6023, + "step": 2505 + }, + { + "epoch": 0.09, + "learning_rate": 1.9632944138327118e-05, + "loss": 0.6715, + "step": 2506 + }, + { + "epoch": 0.09, + "learning_rate": 1.9632651778576434e-05, + "loss": 0.6308, + "step": 2507 + }, + { + "epoch": 0.09, + "learning_rate": 1.9632359304618472e-05, + "loss": 0.638, + "step": 2508 + }, + { + "epoch": 0.09, + "learning_rate": 1.9632066716456708e-05, + "loss": 0.6387, + "step": 2509 + }, + { + "epoch": 0.09, + "learning_rate": 1.9631774014094607e-05, + "loss": 0.6195, + "step": 2510 + }, + { + "epoch": 0.09, + "learning_rate": 1.963148119753564e-05, + "loss": 0.6731, + "step": 2511 + }, + { + "epoch": 0.09, + "learning_rate": 1.9631188266783282e-05, + "loss": 0.6624, + "step": 2512 + }, + { + "epoch": 0.09, + "learning_rate": 1.9630895221841004e-05, + "loss": 0.7061, + "step": 2513 + }, + { + "epoch": 0.09, + "learning_rate": 1.963060206271228e-05, + "loss": 0.6501, + "step": 2514 + }, + { + "epoch": 0.09, + "learning_rate": 1.963030878940058e-05, + "loss": 0.6438, + "step": 2515 + }, + { + "epoch": 0.09, + "learning_rate": 1.9630015401909393e-05, + "loss": 0.6296, + "step": 2516 + }, + { + "epoch": 0.09, + "learning_rate": 1.962972190024219e-05, + "loss": 0.6144, + "step": 2517 + }, + { + "epoch": 0.09, + "learning_rate": 1.962942828440245e-05, + "loss": 0.6192, + "step": 2518 + }, + { + "epoch": 0.09, + "learning_rate": 1.962913455439366e-05, + "loss": 0.6291, + "step": 2519 + }, + { + "epoch": 0.09, + "learning_rate": 1.9628840710219298e-05, + "loss": 0.663, + "step": 2520 + }, + { + "epoch": 0.09, + "learning_rate": 1.9628546751882846e-05, + "loss": 0.6496, + "step": 2521 + }, + { + "epoch": 0.09, + "learning_rate": 1.9628252679387795e-05, + "loss": 0.6621, + "step": 2522 + }, + { + "epoch": 0.09, + "learning_rate": 1.962795849273763e-05, + "loss": 0.6489, + "step": 2523 + }, + { + "epoch": 0.09, + "learning_rate": 1.9627664191935833e-05, + "loss": 0.6585, + "step": 2524 + }, + { + "epoch": 0.09, + "learning_rate": 1.96273697769859e-05, + "loss": 0.6489, + "step": 2525 + }, + { + "epoch": 0.09, + "learning_rate": 1.962707524789132e-05, + "loss": 0.6375, + "step": 2526 + }, + { + "epoch": 0.09, + "learning_rate": 1.9626780604655583e-05, + "loss": 0.6967, + "step": 2527 + }, + { + "epoch": 0.09, + "learning_rate": 1.962648584728219e-05, + "loss": 0.6458, + "step": 2528 + }, + { + "epoch": 0.09, + "learning_rate": 1.9626190975774625e-05, + "loss": 0.7115, + "step": 2529 + }, + { + "epoch": 0.09, + "learning_rate": 1.9625895990136386e-05, + "loss": 0.6716, + "step": 2530 + }, + { + "epoch": 0.09, + "learning_rate": 1.962560089037098e-05, + "loss": 0.6522, + "step": 2531 + }, + { + "epoch": 0.09, + "learning_rate": 1.962530567648189e-05, + "loss": 0.6635, + "step": 2532 + }, + { + "epoch": 0.09, + "learning_rate": 1.9625010348472634e-05, + "loss": 0.6238, + "step": 2533 + }, + { + "epoch": 0.09, + "learning_rate": 1.96247149063467e-05, + "loss": 0.6241, + "step": 2534 + }, + { + "epoch": 0.09, + "learning_rate": 1.9624419350107598e-05, + "loss": 0.632, + "step": 2535 + }, + { + "epoch": 0.09, + "learning_rate": 1.9624123679758828e-05, + "loss": 0.5853, + "step": 2536 + }, + { + "epoch": 0.09, + "learning_rate": 1.9623827895303895e-05, + "loss": 0.6243, + "step": 2537 + }, + { + "epoch": 0.09, + "learning_rate": 1.9623531996746313e-05, + "loss": 0.5766, + "step": 2538 + }, + { + "epoch": 0.09, + "learning_rate": 1.962323598408958e-05, + "loss": 0.701, + "step": 2539 + }, + { + "epoch": 0.09, + "learning_rate": 1.9622939857337216e-05, + "loss": 0.6765, + "step": 2540 + }, + { + "epoch": 0.09, + "learning_rate": 1.9622643616492726e-05, + "loss": 0.6712, + "step": 2541 + }, + { + "epoch": 0.09, + "learning_rate": 1.962234726155962e-05, + "loss": 0.6085, + "step": 2542 + }, + { + "epoch": 0.09, + "learning_rate": 1.9622050792541417e-05, + "loss": 0.6496, + "step": 2543 + }, + { + "epoch": 0.09, + "learning_rate": 1.962175420944163e-05, + "loss": 0.6531, + "step": 2544 + }, + { + "epoch": 0.09, + "learning_rate": 1.9621457512263776e-05, + "loss": 0.6274, + "step": 2545 + }, + { + "epoch": 0.09, + "learning_rate": 1.962116070101137e-05, + "loss": 0.5921, + "step": 2546 + }, + { + "epoch": 0.09, + "learning_rate": 1.9620863775687934e-05, + "loss": 0.6233, + "step": 2547 + }, + { + "epoch": 0.09, + "learning_rate": 1.962056673629699e-05, + "loss": 0.6562, + "step": 2548 + }, + { + "epoch": 0.09, + "learning_rate": 1.9620269582842054e-05, + "loss": 0.6512, + "step": 2549 + }, + { + "epoch": 0.09, + "learning_rate": 1.961997231532665e-05, + "loss": 0.6094, + "step": 2550 + }, + { + "epoch": 0.09, + "learning_rate": 1.9619674933754308e-05, + "loss": 0.7113, + "step": 2551 + }, + { + "epoch": 0.09, + "learning_rate": 1.9619377438128552e-05, + "loss": 0.6229, + "step": 2552 + }, + { + "epoch": 0.09, + "learning_rate": 1.9619079828452906e-05, + "loss": 0.6474, + "step": 2553 + }, + { + "epoch": 0.09, + "learning_rate": 1.96187821047309e-05, + "loss": 0.6051, + "step": 2554 + }, + { + "epoch": 0.09, + "learning_rate": 1.9618484266966067e-05, + "loss": 0.6143, + "step": 2555 + }, + { + "epoch": 0.09, + "learning_rate": 1.9618186315161935e-05, + "loss": 0.6597, + "step": 2556 + }, + { + "epoch": 0.09, + "learning_rate": 1.9617888249322035e-05, + "loss": 0.668, + "step": 2557 + }, + { + "epoch": 0.09, + "learning_rate": 1.9617590069449904e-05, + "loss": 0.6574, + "step": 2558 + }, + { + "epoch": 0.09, + "learning_rate": 1.9617291775549077e-05, + "loss": 0.7242, + "step": 2559 + }, + { + "epoch": 0.09, + "learning_rate": 1.961699336762309e-05, + "loss": 0.6199, + "step": 2560 + }, + { + "epoch": 0.09, + "learning_rate": 1.961669484567548e-05, + "loss": 0.6537, + "step": 2561 + }, + { + "epoch": 0.09, + "learning_rate": 1.9616396209709786e-05, + "loss": 0.6306, + "step": 2562 + }, + { + "epoch": 0.09, + "learning_rate": 1.9616097459729553e-05, + "loss": 0.6368, + "step": 2563 + }, + { + "epoch": 0.09, + "learning_rate": 1.9615798595738323e-05, + "loss": 0.5995, + "step": 2564 + }, + { + "epoch": 0.09, + "learning_rate": 1.961549961773963e-05, + "loss": 0.6665, + "step": 2565 + }, + { + "epoch": 0.09, + "learning_rate": 1.961520052573703e-05, + "loss": 0.6442, + "step": 2566 + }, + { + "epoch": 0.09, + "learning_rate": 1.961490131973406e-05, + "loss": 0.6282, + "step": 2567 + }, + { + "epoch": 0.09, + "learning_rate": 1.9614601999734278e-05, + "loss": 0.654, + "step": 2568 + }, + { + "epoch": 0.09, + "learning_rate": 1.9614302565741222e-05, + "loss": 0.6534, + "step": 2569 + }, + { + "epoch": 0.09, + "learning_rate": 1.961400301775845e-05, + "loss": 0.6323, + "step": 2570 + }, + { + "epoch": 0.09, + "learning_rate": 1.9613703355789508e-05, + "loss": 0.6136, + "step": 2571 + }, + { + "epoch": 0.09, + "learning_rate": 1.961340357983795e-05, + "loss": 0.6763, + "step": 2572 + }, + { + "epoch": 0.09, + "learning_rate": 1.9613103689907338e-05, + "loss": 0.6529, + "step": 2573 + }, + { + "epoch": 0.09, + "learning_rate": 1.9612803686001218e-05, + "loss": 0.6389, + "step": 2574 + }, + { + "epoch": 0.09, + "learning_rate": 1.961250356812315e-05, + "loss": 0.629, + "step": 2575 + }, + { + "epoch": 0.09, + "learning_rate": 1.9612203336276688e-05, + "loss": 0.6543, + "step": 2576 + }, + { + "epoch": 0.09, + "learning_rate": 1.96119029904654e-05, + "loss": 0.6359, + "step": 2577 + }, + { + "epoch": 0.09, + "learning_rate": 1.9611602530692843e-05, + "loss": 0.6652, + "step": 2578 + }, + { + "epoch": 0.09, + "learning_rate": 1.961130195696258e-05, + "loss": 0.6808, + "step": 2579 + }, + { + "epoch": 0.09, + "learning_rate": 1.961100126927817e-05, + "loss": 0.6116, + "step": 2580 + }, + { + "epoch": 0.09, + "learning_rate": 1.9610700467643182e-05, + "loss": 0.6244, + "step": 2581 + }, + { + "epoch": 0.09, + "learning_rate": 1.961039955206119e-05, + "loss": 0.6722, + "step": 2582 + }, + { + "epoch": 0.09, + "learning_rate": 1.9610098522535745e-05, + "loss": 0.642, + "step": 2583 + }, + { + "epoch": 0.09, + "learning_rate": 1.9609797379070427e-05, + "loss": 0.6394, + "step": 2584 + }, + { + "epoch": 0.09, + "learning_rate": 1.9609496121668807e-05, + "loss": 0.6991, + "step": 2585 + }, + { + "epoch": 0.09, + "learning_rate": 1.960919475033446e-05, + "loss": 0.5908, + "step": 2586 + }, + { + "epoch": 0.09, + "learning_rate": 1.9608893265070943e-05, + "loss": 0.6498, + "step": 2587 + }, + { + "epoch": 0.09, + "learning_rate": 1.9608591665881845e-05, + "loss": 0.6697, + "step": 2588 + }, + { + "epoch": 0.09, + "learning_rate": 1.960828995277074e-05, + "loss": 0.5942, + "step": 2589 + }, + { + "epoch": 0.09, + "learning_rate": 1.96079881257412e-05, + "loss": 0.6464, + "step": 2590 + }, + { + "epoch": 0.09, + "learning_rate": 1.960768618479681e-05, + "loss": 0.588, + "step": 2591 + }, + { + "epoch": 0.09, + "learning_rate": 1.9607384129941143e-05, + "loss": 0.6606, + "step": 2592 + }, + { + "epoch": 0.09, + "learning_rate": 1.9607081961177785e-05, + "loss": 0.6773, + "step": 2593 + }, + { + "epoch": 0.09, + "learning_rate": 1.960677967851032e-05, + "loss": 0.6848, + "step": 2594 + }, + { + "epoch": 0.09, + "learning_rate": 1.9606477281942323e-05, + "loss": 0.6029, + "step": 2595 + }, + { + "epoch": 0.09, + "learning_rate": 1.9606174771477392e-05, + "loss": 0.6399, + "step": 2596 + }, + { + "epoch": 0.09, + "learning_rate": 1.9605872147119104e-05, + "loss": 0.6517, + "step": 2597 + }, + { + "epoch": 0.09, + "learning_rate": 1.9605569408871053e-05, + "loss": 0.601, + "step": 2598 + }, + { + "epoch": 0.09, + "learning_rate": 1.9605266556736823e-05, + "loss": 0.6026, + "step": 2599 + }, + { + "epoch": 0.09, + "learning_rate": 1.9604963590720007e-05, + "loss": 0.6839, + "step": 2600 + }, + { + "epoch": 0.09, + "learning_rate": 1.9604660510824198e-05, + "loss": 0.6355, + "step": 2601 + }, + { + "epoch": 0.09, + "learning_rate": 1.9604357317052988e-05, + "loss": 0.7125, + "step": 2602 + }, + { + "epoch": 0.09, + "learning_rate": 1.9604054009409975e-05, + "loss": 0.6094, + "step": 2603 + }, + { + "epoch": 0.09, + "learning_rate": 1.960375058789875e-05, + "loss": 0.6309, + "step": 2604 + }, + { + "epoch": 0.09, + "learning_rate": 1.9603447052522915e-05, + "loss": 0.6325, + "step": 2605 + }, + { + "epoch": 0.09, + "learning_rate": 1.9603143403286064e-05, + "loss": 0.6619, + "step": 2606 + }, + { + "epoch": 0.09, + "learning_rate": 1.9602839640191803e-05, + "loss": 0.6805, + "step": 2607 + }, + { + "epoch": 0.09, + "learning_rate": 1.9602535763243726e-05, + "loss": 0.5466, + "step": 2608 + }, + { + "epoch": 0.09, + "learning_rate": 1.9602231772445443e-05, + "loss": 0.6244, + "step": 2609 + }, + { + "epoch": 0.09, + "learning_rate": 1.960192766780056e-05, + "loss": 0.7076, + "step": 2610 + }, + { + "epoch": 0.09, + "learning_rate": 1.960162344931267e-05, + "loss": 0.5925, + "step": 2611 + }, + { + "epoch": 0.09, + "learning_rate": 1.960131911698539e-05, + "loss": 0.6809, + "step": 2612 + }, + { + "epoch": 0.09, + "learning_rate": 1.9601014670822328e-05, + "loss": 0.6642, + "step": 2613 + }, + { + "epoch": 0.09, + "learning_rate": 1.9600710110827093e-05, + "loss": 0.6569, + "step": 2614 + }, + { + "epoch": 0.09, + "learning_rate": 1.960040543700329e-05, + "loss": 0.7129, + "step": 2615 + }, + { + "epoch": 0.09, + "learning_rate": 1.960010064935454e-05, + "loss": 0.6078, + "step": 2616 + }, + { + "epoch": 0.09, + "learning_rate": 1.9599795747884452e-05, + "loss": 0.6601, + "step": 2617 + }, + { + "epoch": 0.09, + "learning_rate": 1.959949073259664e-05, + "loss": 0.6384, + "step": 2618 + }, + { + "epoch": 0.09, + "learning_rate": 1.9599185603494725e-05, + "loss": 0.6872, + "step": 2619 + }, + { + "epoch": 0.09, + "learning_rate": 1.959888036058232e-05, + "loss": 0.6482, + "step": 2620 + }, + { + "epoch": 0.09, + "learning_rate": 1.9598575003863043e-05, + "loss": 0.5938, + "step": 2621 + }, + { + "epoch": 0.09, + "learning_rate": 1.959826953334052e-05, + "loss": 0.629, + "step": 2622 + }, + { + "epoch": 0.09, + "learning_rate": 1.959796394901837e-05, + "loss": 0.6484, + "step": 2623 + }, + { + "epoch": 0.09, + "learning_rate": 1.9597658250900214e-05, + "loss": 0.6328, + "step": 2624 + }, + { + "epoch": 0.09, + "learning_rate": 1.959735243898968e-05, + "loss": 0.6658, + "step": 2625 + }, + { + "epoch": 0.09, + "learning_rate": 1.9597046513290394e-05, + "loss": 0.6356, + "step": 2626 + }, + { + "epoch": 0.09, + "learning_rate": 1.9596740473805976e-05, + "loss": 0.5979, + "step": 2627 + }, + { + "epoch": 0.09, + "learning_rate": 1.9596434320540063e-05, + "loss": 0.6407, + "step": 2628 + }, + { + "epoch": 0.09, + "learning_rate": 1.959612805349628e-05, + "loss": 0.6532, + "step": 2629 + }, + { + "epoch": 0.09, + "learning_rate": 1.9595821672678263e-05, + "loss": 0.665, + "step": 2630 + }, + { + "epoch": 0.09, + "learning_rate": 1.9595515178089636e-05, + "loss": 0.6219, + "step": 2631 + }, + { + "epoch": 0.09, + "learning_rate": 1.9595208569734042e-05, + "loss": 0.6687, + "step": 2632 + }, + { + "epoch": 0.09, + "learning_rate": 1.9594901847615113e-05, + "loss": 0.6375, + "step": 2633 + }, + { + "epoch": 0.09, + "learning_rate": 1.9594595011736485e-05, + "loss": 0.5864, + "step": 2634 + }, + { + "epoch": 0.09, + "learning_rate": 1.9594288062101793e-05, + "loss": 0.6177, + "step": 2635 + }, + { + "epoch": 0.09, + "learning_rate": 1.9593980998714682e-05, + "loss": 0.6532, + "step": 2636 + }, + { + "epoch": 0.09, + "learning_rate": 1.959367382157879e-05, + "loss": 0.6385, + "step": 2637 + }, + { + "epoch": 0.09, + "learning_rate": 1.9593366530697758e-05, + "loss": 0.6591, + "step": 2638 + }, + { + "epoch": 0.09, + "learning_rate": 1.9593059126075228e-05, + "loss": 0.6708, + "step": 2639 + }, + { + "epoch": 0.09, + "learning_rate": 1.9592751607714846e-05, + "loss": 0.5967, + "step": 2640 + }, + { + "epoch": 0.09, + "learning_rate": 1.959244397562026e-05, + "loss": 0.6308, + "step": 2641 + }, + { + "epoch": 0.09, + "learning_rate": 1.959213622979512e-05, + "loss": 0.6708, + "step": 2642 + }, + { + "epoch": 0.09, + "learning_rate": 1.9591828370243066e-05, + "loss": 0.5922, + "step": 2643 + }, + { + "epoch": 0.09, + "learning_rate": 1.959152039696776e-05, + "loss": 0.6431, + "step": 2644 + }, + { + "epoch": 0.09, + "learning_rate": 1.9591212309972838e-05, + "loss": 0.656, + "step": 2645 + }, + { + "epoch": 0.09, + "learning_rate": 1.9590904109261965e-05, + "loss": 0.6308, + "step": 2646 + }, + { + "epoch": 0.09, + "learning_rate": 1.9590595794838792e-05, + "loss": 0.6837, + "step": 2647 + }, + { + "epoch": 0.09, + "learning_rate": 1.959028736670697e-05, + "loss": 0.6679, + "step": 2648 + }, + { + "epoch": 0.09, + "learning_rate": 1.9589978824870164e-05, + "loss": 0.6359, + "step": 2649 + }, + { + "epoch": 0.09, + "learning_rate": 1.9589670169332025e-05, + "loss": 0.6262, + "step": 2650 + }, + { + "epoch": 0.09, + "learning_rate": 1.9589361400096215e-05, + "loss": 0.6332, + "step": 2651 + }, + { + "epoch": 0.09, + "learning_rate": 1.95890525171664e-05, + "loss": 0.6248, + "step": 2652 + }, + { + "epoch": 0.09, + "learning_rate": 1.958874352054623e-05, + "loss": 0.6816, + "step": 2653 + }, + { + "epoch": 0.09, + "learning_rate": 1.9588434410239378e-05, + "loss": 0.646, + "step": 2654 + }, + { + "epoch": 0.09, + "learning_rate": 1.9588125186249506e-05, + "loss": 0.688, + "step": 2655 + }, + { + "epoch": 0.09, + "learning_rate": 1.9587815848580283e-05, + "loss": 0.6323, + "step": 2656 + }, + { + "epoch": 0.09, + "learning_rate": 1.9587506397235374e-05, + "loss": 0.7012, + "step": 2657 + }, + { + "epoch": 0.09, + "learning_rate": 1.958719683221845e-05, + "loss": 0.6704, + "step": 2658 + }, + { + "epoch": 0.09, + "learning_rate": 1.9586887153533177e-05, + "loss": 0.6393, + "step": 2659 + }, + { + "epoch": 0.09, + "learning_rate": 1.958657736118323e-05, + "loss": 0.6744, + "step": 2660 + }, + { + "epoch": 0.09, + "learning_rate": 1.9586267455172282e-05, + "loss": 0.6782, + "step": 2661 + }, + { + "epoch": 0.09, + "learning_rate": 1.9585957435504003e-05, + "loss": 0.6519, + "step": 2662 + }, + { + "epoch": 0.09, + "learning_rate": 1.9585647302182077e-05, + "loss": 0.6364, + "step": 2663 + }, + { + "epoch": 0.09, + "learning_rate": 1.9585337055210175e-05, + "loss": 0.6572, + "step": 2664 + }, + { + "epoch": 0.09, + "learning_rate": 1.9585026694591978e-05, + "loss": 0.6484, + "step": 2665 + }, + { + "epoch": 0.09, + "learning_rate": 1.9584716220331162e-05, + "loss": 0.6856, + "step": 2666 + }, + { + "epoch": 0.09, + "learning_rate": 1.9584405632431413e-05, + "loss": 0.6852, + "step": 2667 + }, + { + "epoch": 0.09, + "learning_rate": 1.9584094930896407e-05, + "loss": 0.6405, + "step": 2668 + }, + { + "epoch": 0.09, + "learning_rate": 1.958378411572983e-05, + "loss": 0.6483, + "step": 2669 + }, + { + "epoch": 0.09, + "learning_rate": 1.9583473186935376e-05, + "loss": 0.6019, + "step": 2670 + }, + { + "epoch": 0.09, + "learning_rate": 1.958316214451672e-05, + "loss": 0.6268, + "step": 2671 + }, + { + "epoch": 0.09, + "learning_rate": 1.9582850988477554e-05, + "loss": 0.6486, + "step": 2672 + }, + { + "epoch": 0.09, + "learning_rate": 1.958253971882157e-05, + "loss": 0.5842, + "step": 2673 + }, + { + "epoch": 0.09, + "learning_rate": 1.958222833555245e-05, + "loss": 0.6209, + "step": 2674 + }, + { + "epoch": 0.09, + "learning_rate": 1.9581916838673898e-05, + "loss": 0.677, + "step": 2675 + }, + { + "epoch": 0.09, + "learning_rate": 1.9581605228189598e-05, + "loss": 0.6585, + "step": 2676 + }, + { + "epoch": 0.09, + "learning_rate": 1.9581293504103245e-05, + "loss": 0.6389, + "step": 2677 + }, + { + "epoch": 0.09, + "learning_rate": 1.958098166641854e-05, + "loss": 0.6431, + "step": 2678 + }, + { + "epoch": 0.09, + "learning_rate": 1.9580669715139176e-05, + "loss": 0.7201, + "step": 2679 + }, + { + "epoch": 0.09, + "learning_rate": 1.9580357650268853e-05, + "loss": 0.7021, + "step": 2680 + }, + { + "epoch": 0.09, + "learning_rate": 1.9580045471811272e-05, + "loss": 0.6655, + "step": 2681 + }, + { + "epoch": 0.09, + "learning_rate": 1.9579733179770134e-05, + "loss": 0.6091, + "step": 2682 + }, + { + "epoch": 0.09, + "learning_rate": 1.957942077414914e-05, + "loss": 0.6935, + "step": 2683 + }, + { + "epoch": 0.09, + "learning_rate": 1.957910825495199e-05, + "loss": 0.6861, + "step": 2684 + }, + { + "epoch": 0.09, + "learning_rate": 1.95787956221824e-05, + "loss": 0.6154, + "step": 2685 + }, + { + "epoch": 0.09, + "learning_rate": 1.9578482875844068e-05, + "loss": 0.6505, + "step": 2686 + }, + { + "epoch": 0.09, + "learning_rate": 1.9578170015940706e-05, + "loss": 0.6189, + "step": 2687 + }, + { + "epoch": 0.09, + "learning_rate": 1.957785704247602e-05, + "loss": 0.5898, + "step": 2688 + }, + { + "epoch": 0.09, + "learning_rate": 1.9577543955453725e-05, + "loss": 0.6318, + "step": 2689 + }, + { + "epoch": 0.09, + "learning_rate": 1.9577230754877526e-05, + "loss": 0.6819, + "step": 2690 + }, + { + "epoch": 0.09, + "learning_rate": 1.9576917440751147e-05, + "loss": 0.6584, + "step": 2691 + }, + { + "epoch": 0.09, + "learning_rate": 1.9576604013078296e-05, + "loss": 0.6755, + "step": 2692 + }, + { + "epoch": 0.09, + "learning_rate": 1.9576290471862685e-05, + "loss": 0.6354, + "step": 2693 + }, + { + "epoch": 0.09, + "learning_rate": 1.9575976817108044e-05, + "loss": 0.6703, + "step": 2694 + }, + { + "epoch": 0.09, + "learning_rate": 1.9575663048818078e-05, + "loss": 0.6471, + "step": 2695 + }, + { + "epoch": 0.09, + "learning_rate": 1.9575349166996516e-05, + "loss": 0.6442, + "step": 2696 + }, + { + "epoch": 0.09, + "learning_rate": 1.9575035171647077e-05, + "loss": 0.6109, + "step": 2697 + }, + { + "epoch": 0.09, + "learning_rate": 1.957472106277348e-05, + "loss": 0.6067, + "step": 2698 + }, + { + "epoch": 0.09, + "learning_rate": 1.9574406840379456e-05, + "loss": 0.712, + "step": 2699 + }, + { + "epoch": 0.09, + "learning_rate": 1.9574092504468728e-05, + "loss": 0.6462, + "step": 2700 + }, + { + "epoch": 0.09, + "learning_rate": 1.957377805504502e-05, + "loss": 0.6295, + "step": 2701 + }, + { + "epoch": 0.09, + "learning_rate": 1.957346349211206e-05, + "loss": 0.6998, + "step": 2702 + }, + { + "epoch": 0.09, + "learning_rate": 1.9573148815673587e-05, + "loss": 0.6651, + "step": 2703 + }, + { + "epoch": 0.09, + "learning_rate": 1.9572834025733318e-05, + "loss": 0.6651, + "step": 2704 + }, + { + "epoch": 0.09, + "learning_rate": 1.9572519122294994e-05, + "loss": 0.6137, + "step": 2705 + }, + { + "epoch": 0.09, + "learning_rate": 1.957220410536235e-05, + "loss": 0.6569, + "step": 2706 + }, + { + "epoch": 0.09, + "learning_rate": 1.9571888974939112e-05, + "loss": 0.6337, + "step": 2707 + }, + { + "epoch": 0.09, + "learning_rate": 1.9571573731029024e-05, + "loss": 0.6113, + "step": 2708 + }, + { + "epoch": 0.09, + "learning_rate": 1.9571258373635823e-05, + "loss": 0.5898, + "step": 2709 + }, + { + "epoch": 0.09, + "learning_rate": 1.957094290276324e-05, + "loss": 0.6605, + "step": 2710 + }, + { + "epoch": 0.09, + "learning_rate": 1.957062731841503e-05, + "loss": 0.6398, + "step": 2711 + }, + { + "epoch": 0.09, + "learning_rate": 1.9570311620594923e-05, + "loss": 0.6479, + "step": 2712 + }, + { + "epoch": 0.09, + "learning_rate": 1.9569995809306663e-05, + "loss": 0.5832, + "step": 2713 + }, + { + "epoch": 0.09, + "learning_rate": 1.9569679884554e-05, + "loss": 0.6633, + "step": 2714 + }, + { + "epoch": 0.09, + "learning_rate": 1.9569363846340672e-05, + "loss": 0.5929, + "step": 2715 + }, + { + "epoch": 0.09, + "learning_rate": 1.9569047694670433e-05, + "loss": 0.6923, + "step": 2716 + }, + { + "epoch": 0.09, + "learning_rate": 1.956873142954703e-05, + "loss": 0.6365, + "step": 2717 + }, + { + "epoch": 0.09, + "learning_rate": 1.9568415050974207e-05, + "loss": 0.6549, + "step": 2718 + }, + { + "epoch": 0.09, + "learning_rate": 1.9568098558955725e-05, + "loss": 0.6108, + "step": 2719 + }, + { + "epoch": 0.09, + "learning_rate": 1.9567781953495326e-05, + "loss": 0.6289, + "step": 2720 + }, + { + "epoch": 0.09, + "learning_rate": 1.9567465234596772e-05, + "loss": 0.584, + "step": 2721 + }, + { + "epoch": 0.09, + "learning_rate": 1.9567148402263813e-05, + "loss": 0.66, + "step": 2722 + }, + { + "epoch": 0.09, + "learning_rate": 1.956683145650021e-05, + "loss": 0.6591, + "step": 2723 + }, + { + "epoch": 0.09, + "learning_rate": 1.9566514397309713e-05, + "loss": 0.6642, + "step": 2724 + }, + { + "epoch": 0.09, + "learning_rate": 1.956619722469609e-05, + "loss": 0.6585, + "step": 2725 + }, + { + "epoch": 0.09, + "learning_rate": 1.9565879938663096e-05, + "loss": 0.6457, + "step": 2726 + }, + { + "epoch": 0.09, + "learning_rate": 1.9565562539214497e-05, + "loss": 0.6501, + "step": 2727 + }, + { + "epoch": 0.09, + "learning_rate": 1.9565245026354048e-05, + "loss": 0.6403, + "step": 2728 + }, + { + "epoch": 0.09, + "learning_rate": 1.9564927400085523e-05, + "loss": 0.6898, + "step": 2729 + }, + { + "epoch": 0.09, + "learning_rate": 1.9564609660412684e-05, + "loss": 0.6217, + "step": 2730 + }, + { + "epoch": 0.09, + "learning_rate": 1.9564291807339296e-05, + "loss": 0.5731, + "step": 2731 + }, + { + "epoch": 0.09, + "learning_rate": 1.9563973840869136e-05, + "loss": 0.619, + "step": 2732 + }, + { + "epoch": 0.09, + "learning_rate": 1.956365576100596e-05, + "loss": 0.6802, + "step": 2733 + }, + { + "epoch": 0.09, + "learning_rate": 1.956333756775355e-05, + "loss": 0.6326, + "step": 2734 + }, + { + "epoch": 0.09, + "learning_rate": 1.9563019261115674e-05, + "loss": 0.6635, + "step": 2735 + }, + { + "epoch": 0.09, + "learning_rate": 1.956270084109611e-05, + "loss": 0.6747, + "step": 2736 + }, + { + "epoch": 0.09, + "learning_rate": 1.9562382307698628e-05, + "loss": 0.6393, + "step": 2737 + }, + { + "epoch": 0.09, + "learning_rate": 1.956206366092701e-05, + "loss": 0.6167, + "step": 2738 + }, + { + "epoch": 0.09, + "learning_rate": 1.956174490078503e-05, + "loss": 0.6309, + "step": 2739 + }, + { + "epoch": 0.09, + "learning_rate": 1.956142602727647e-05, + "loss": 0.5782, + "step": 2740 + }, + { + "epoch": 0.09, + "learning_rate": 1.956110704040511e-05, + "loss": 0.6235, + "step": 2741 + }, + { + "epoch": 0.1, + "learning_rate": 1.9560787940174725e-05, + "loss": 0.6865, + "step": 2742 + }, + { + "epoch": 0.1, + "learning_rate": 1.9560468726589107e-05, + "loss": 0.6216, + "step": 2743 + }, + { + "epoch": 0.1, + "learning_rate": 1.9560149399652042e-05, + "loss": 0.6084, + "step": 2744 + }, + { + "epoch": 0.1, + "learning_rate": 1.955982995936731e-05, + "loss": 0.6352, + "step": 2745 + }, + { + "epoch": 0.1, + "learning_rate": 1.95595104057387e-05, + "loss": 0.6544, + "step": 2746 + }, + { + "epoch": 0.1, + "learning_rate": 1.955919073877e-05, + "loss": 0.6926, + "step": 2747 + }, + { + "epoch": 0.1, + "learning_rate": 1.9558870958465005e-05, + "loss": 0.7066, + "step": 2748 + }, + { + "epoch": 0.1, + "learning_rate": 1.95585510648275e-05, + "loss": 0.6209, + "step": 2749 + }, + { + "epoch": 0.1, + "learning_rate": 1.955823105786128e-05, + "loss": 0.6425, + "step": 2750 + }, + { + "epoch": 0.1, + "learning_rate": 1.9557910937570143e-05, + "loss": 0.6129, + "step": 2751 + }, + { + "epoch": 0.1, + "learning_rate": 1.9557590703957874e-05, + "loss": 0.719, + "step": 2752 + }, + { + "epoch": 0.1, + "learning_rate": 1.9557270357028285e-05, + "loss": 0.6424, + "step": 2753 + }, + { + "epoch": 0.1, + "learning_rate": 1.9556949896785162e-05, + "loss": 0.6297, + "step": 2754 + }, + { + "epoch": 0.1, + "learning_rate": 1.955662932323231e-05, + "loss": 0.6891, + "step": 2755 + }, + { + "epoch": 0.1, + "learning_rate": 1.9556308636373525e-05, + "loss": 0.63, + "step": 2756 + }, + { + "epoch": 0.1, + "learning_rate": 1.9555987836212615e-05, + "loss": 0.6266, + "step": 2757 + }, + { + "epoch": 0.1, + "learning_rate": 1.955566692275338e-05, + "loss": 0.6845, + "step": 2758 + }, + { + "epoch": 0.1, + "learning_rate": 1.9555345895999626e-05, + "loss": 0.6472, + "step": 2759 + }, + { + "epoch": 0.1, + "learning_rate": 1.9555024755955158e-05, + "loss": 0.6683, + "step": 2760 + }, + { + "epoch": 0.1, + "learning_rate": 1.9554703502623783e-05, + "loss": 0.5818, + "step": 2761 + }, + { + "epoch": 0.1, + "learning_rate": 1.9554382136009315e-05, + "loss": 0.617, + "step": 2762 + }, + { + "epoch": 0.1, + "learning_rate": 1.955406065611556e-05, + "loss": 0.6291, + "step": 2763 + }, + { + "epoch": 0.1, + "learning_rate": 1.9553739062946327e-05, + "loss": 0.6285, + "step": 2764 + }, + { + "epoch": 0.1, + "learning_rate": 1.9553417356505435e-05, + "loss": 0.6387, + "step": 2765 + }, + { + "epoch": 0.1, + "learning_rate": 1.9553095536796692e-05, + "loss": 0.7261, + "step": 2766 + }, + { + "epoch": 0.1, + "learning_rate": 1.955277360382392e-05, + "loss": 0.6218, + "step": 2767 + }, + { + "epoch": 0.1, + "learning_rate": 1.955245155759093e-05, + "loss": 0.6988, + "step": 2768 + }, + { + "epoch": 0.1, + "learning_rate": 1.9552129398101543e-05, + "loss": 0.597, + "step": 2769 + }, + { + "epoch": 0.1, + "learning_rate": 1.955180712535958e-05, + "loss": 0.6237, + "step": 2770 + }, + { + "epoch": 0.1, + "learning_rate": 1.9551484739368856e-05, + "loss": 0.6066, + "step": 2771 + }, + { + "epoch": 0.1, + "learning_rate": 1.9551162240133203e-05, + "loss": 0.6079, + "step": 2772 + }, + { + "epoch": 0.1, + "learning_rate": 1.9550839627656438e-05, + "loss": 0.6488, + "step": 2773 + }, + { + "epoch": 0.1, + "learning_rate": 1.955051690194239e-05, + "loss": 0.6178, + "step": 2774 + }, + { + "epoch": 0.1, + "learning_rate": 1.955019406299488e-05, + "loss": 0.5575, + "step": 2775 + }, + { + "epoch": 0.1, + "learning_rate": 1.954987111081774e-05, + "loss": 0.6515, + "step": 2776 + }, + { + "epoch": 0.1, + "learning_rate": 1.9549548045414794e-05, + "loss": 0.644, + "step": 2777 + }, + { + "epoch": 0.1, + "learning_rate": 1.9549224866789874e-05, + "loss": 0.6518, + "step": 2778 + }, + { + "epoch": 0.1, + "learning_rate": 1.9548901574946816e-05, + "loss": 0.6289, + "step": 2779 + }, + { + "epoch": 0.1, + "learning_rate": 1.954857816988945e-05, + "loss": 0.6311, + "step": 2780 + }, + { + "epoch": 0.1, + "learning_rate": 1.9548254651621614e-05, + "loss": 0.6149, + "step": 2781 + }, + { + "epoch": 0.1, + "learning_rate": 1.9547931020147137e-05, + "loss": 0.623, + "step": 2782 + }, + { + "epoch": 0.1, + "learning_rate": 1.954760727546986e-05, + "loss": 0.6721, + "step": 2783 + }, + { + "epoch": 0.1, + "learning_rate": 1.9547283417593625e-05, + "loss": 0.6467, + "step": 2784 + }, + { + "epoch": 0.1, + "learning_rate": 1.9546959446522263e-05, + "loss": 0.6447, + "step": 2785 + }, + { + "epoch": 0.1, + "learning_rate": 1.954663536225962e-05, + "loss": 0.632, + "step": 2786 + }, + { + "epoch": 0.1, + "learning_rate": 1.9546311164809538e-05, + "loss": 0.6277, + "step": 2787 + }, + { + "epoch": 0.1, + "learning_rate": 1.954598685417586e-05, + "loss": 0.6762, + "step": 2788 + }, + { + "epoch": 0.1, + "learning_rate": 1.954566243036244e-05, + "loss": 0.597, + "step": 2789 + }, + { + "epoch": 0.1, + "learning_rate": 1.954533789337311e-05, + "loss": 0.6238, + "step": 2790 + }, + { + "epoch": 0.1, + "learning_rate": 1.9545013243211723e-05, + "loss": 0.6793, + "step": 2791 + }, + { + "epoch": 0.1, + "learning_rate": 1.9544688479882135e-05, + "loss": 0.6244, + "step": 2792 + }, + { + "epoch": 0.1, + "learning_rate": 1.9544363603388187e-05, + "loss": 0.6815, + "step": 2793 + }, + { + "epoch": 0.1, + "learning_rate": 1.9544038613733733e-05, + "loss": 0.5783, + "step": 2794 + }, + { + "epoch": 0.1, + "learning_rate": 1.9543713510922633e-05, + "loss": 0.6111, + "step": 2795 + }, + { + "epoch": 0.1, + "learning_rate": 1.9543388294958733e-05, + "loss": 0.6687, + "step": 2796 + }, + { + "epoch": 0.1, + "learning_rate": 1.9543062965845895e-05, + "loss": 0.6304, + "step": 2797 + }, + { + "epoch": 0.1, + "learning_rate": 1.954273752358797e-05, + "loss": 0.6509, + "step": 2798 + }, + { + "epoch": 0.1, + "learning_rate": 1.9542411968188824e-05, + "loss": 0.6234, + "step": 2799 + }, + { + "epoch": 0.1, + "learning_rate": 1.954208629965231e-05, + "loss": 0.6132, + "step": 2800 + }, + { + "epoch": 0.1, + "learning_rate": 1.9541760517982294e-05, + "loss": 0.6042, + "step": 2801 + }, + { + "epoch": 0.1, + "learning_rate": 1.9541434623182636e-05, + "loss": 0.6635, + "step": 2802 + }, + { + "epoch": 0.1, + "learning_rate": 1.9541108615257198e-05, + "loss": 0.6475, + "step": 2803 + }, + { + "epoch": 0.1, + "learning_rate": 1.954078249420985e-05, + "loss": 0.6577, + "step": 2804 + }, + { + "epoch": 0.1, + "learning_rate": 1.9540456260044454e-05, + "loss": 0.6458, + "step": 2805 + }, + { + "epoch": 0.1, + "learning_rate": 1.9540129912764888e-05, + "loss": 0.6328, + "step": 2806 + }, + { + "epoch": 0.1, + "learning_rate": 1.9539803452375005e-05, + "loss": 0.6905, + "step": 2807 + }, + { + "epoch": 0.1, + "learning_rate": 1.953947687887869e-05, + "loss": 0.6322, + "step": 2808 + }, + { + "epoch": 0.1, + "learning_rate": 1.9539150192279807e-05, + "loss": 0.6796, + "step": 2809 + }, + { + "epoch": 0.1, + "learning_rate": 1.953882339258223e-05, + "loss": 0.6208, + "step": 2810 + }, + { + "epoch": 0.1, + "learning_rate": 1.9538496479789834e-05, + "loss": 0.655, + "step": 2811 + }, + { + "epoch": 0.1, + "learning_rate": 1.95381694539065e-05, + "loss": 0.6464, + "step": 2812 + }, + { + "epoch": 0.1, + "learning_rate": 1.95378423149361e-05, + "loss": 0.6313, + "step": 2813 + }, + { + "epoch": 0.1, + "learning_rate": 1.953751506288251e-05, + "loss": 0.6682, + "step": 2814 + }, + { + "epoch": 0.1, + "learning_rate": 1.9537187697749615e-05, + "loss": 0.6181, + "step": 2815 + }, + { + "epoch": 0.1, + "learning_rate": 1.95368602195413e-05, + "loss": 0.6531, + "step": 2816 + }, + { + "epoch": 0.1, + "learning_rate": 1.953653262826144e-05, + "loss": 0.6319, + "step": 2817 + }, + { + "epoch": 0.1, + "learning_rate": 1.9536204923913922e-05, + "loss": 0.6597, + "step": 2818 + }, + { + "epoch": 0.1, + "learning_rate": 1.953587710650263e-05, + "loss": 0.6444, + "step": 2819 + }, + { + "epoch": 0.1, + "learning_rate": 1.9535549176031455e-05, + "loss": 0.598, + "step": 2820 + }, + { + "epoch": 0.1, + "learning_rate": 1.9535221132504277e-05, + "loss": 0.6913, + "step": 2821 + }, + { + "epoch": 0.1, + "learning_rate": 1.9534892975924995e-05, + "loss": 0.6836, + "step": 2822 + }, + { + "epoch": 0.1, + "learning_rate": 1.9534564706297494e-05, + "loss": 0.6893, + "step": 2823 + }, + { + "epoch": 0.1, + "learning_rate": 1.9534236323625667e-05, + "loss": 0.6624, + "step": 2824 + }, + { + "epoch": 0.1, + "learning_rate": 1.9533907827913406e-05, + "loss": 0.6024, + "step": 2825 + }, + { + "epoch": 0.1, + "learning_rate": 1.953357921916461e-05, + "loss": 0.6448, + "step": 2826 + }, + { + "epoch": 0.1, + "learning_rate": 1.9533250497383172e-05, + "loss": 0.6559, + "step": 2827 + }, + { + "epoch": 0.1, + "learning_rate": 1.9532921662572988e-05, + "loss": 0.6198, + "step": 2828 + }, + { + "epoch": 0.1, + "learning_rate": 1.9532592714737956e-05, + "loss": 0.6704, + "step": 2829 + }, + { + "epoch": 0.1, + "learning_rate": 1.9532263653881983e-05, + "loss": 0.6756, + "step": 2830 + }, + { + "epoch": 0.1, + "learning_rate": 1.9531934480008968e-05, + "loss": 0.724, + "step": 2831 + }, + { + "epoch": 0.1, + "learning_rate": 1.9531605193122805e-05, + "loss": 0.6679, + "step": 2832 + }, + { + "epoch": 0.1, + "learning_rate": 1.9531275793227407e-05, + "loss": 0.6936, + "step": 2833 + }, + { + "epoch": 0.1, + "learning_rate": 1.953094628032668e-05, + "loss": 0.573, + "step": 2834 + }, + { + "epoch": 0.1, + "learning_rate": 1.953061665442453e-05, + "loss": 0.6127, + "step": 2835 + }, + { + "epoch": 0.1, + "learning_rate": 1.9530286915524858e-05, + "loss": 0.6848, + "step": 2836 + }, + { + "epoch": 0.1, + "learning_rate": 1.9529957063631578e-05, + "loss": 0.6984, + "step": 2837 + }, + { + "epoch": 0.1, + "learning_rate": 1.9529627098748606e-05, + "loss": 0.6324, + "step": 2838 + }, + { + "epoch": 0.1, + "learning_rate": 1.9529297020879848e-05, + "loss": 0.6237, + "step": 2839 + }, + { + "epoch": 0.1, + "learning_rate": 1.9528966830029217e-05, + "loss": 0.6467, + "step": 2840 + }, + { + "epoch": 0.1, + "learning_rate": 1.9528636526200634e-05, + "loss": 0.6685, + "step": 2841 + }, + { + "epoch": 0.1, + "learning_rate": 1.9528306109398012e-05, + "loss": 0.6563, + "step": 2842 + }, + { + "epoch": 0.1, + "learning_rate": 1.9527975579625264e-05, + "loss": 0.731, + "step": 2843 + }, + { + "epoch": 0.1, + "learning_rate": 1.952764493688631e-05, + "loss": 0.6585, + "step": 2844 + }, + { + "epoch": 0.1, + "learning_rate": 1.952731418118508e-05, + "loss": 0.696, + "step": 2845 + }, + { + "epoch": 0.1, + "learning_rate": 1.9526983312525486e-05, + "loss": 0.7009, + "step": 2846 + }, + { + "epoch": 0.1, + "learning_rate": 1.9526652330911452e-05, + "loss": 0.6506, + "step": 2847 + }, + { + "epoch": 0.1, + "learning_rate": 1.9526321236346902e-05, + "loss": 0.6041, + "step": 2848 + }, + { + "epoch": 0.1, + "learning_rate": 1.9525990028835765e-05, + "loss": 0.6767, + "step": 2849 + }, + { + "epoch": 0.1, + "learning_rate": 1.9525658708381962e-05, + "loss": 0.6112, + "step": 2850 + }, + { + "epoch": 0.1, + "learning_rate": 1.952532727498943e-05, + "loss": 0.62, + "step": 2851 + }, + { + "epoch": 0.1, + "learning_rate": 1.9524995728662092e-05, + "loss": 0.6768, + "step": 2852 + }, + { + "epoch": 0.1, + "learning_rate": 1.9524664069403882e-05, + "loss": 0.6304, + "step": 2853 + }, + { + "epoch": 0.1, + "learning_rate": 1.9524332297218724e-05, + "loss": 0.682, + "step": 2854 + }, + { + "epoch": 0.1, + "learning_rate": 1.9524000412110563e-05, + "loss": 0.6622, + "step": 2855 + }, + { + "epoch": 0.1, + "learning_rate": 1.952366841408333e-05, + "loss": 0.6274, + "step": 2856 + }, + { + "epoch": 0.1, + "learning_rate": 1.952333630314096e-05, + "loss": 0.6717, + "step": 2857 + }, + { + "epoch": 0.1, + "learning_rate": 1.952300407928739e-05, + "loss": 0.6291, + "step": 2858 + }, + { + "epoch": 0.1, + "learning_rate": 1.952267174252656e-05, + "loss": 0.6333, + "step": 2859 + }, + { + "epoch": 0.1, + "learning_rate": 1.9522339292862412e-05, + "loss": 0.6463, + "step": 2860 + }, + { + "epoch": 0.1, + "learning_rate": 1.9522006730298885e-05, + "loss": 0.6926, + "step": 2861 + }, + { + "epoch": 0.1, + "learning_rate": 1.952167405483992e-05, + "loss": 0.6034, + "step": 2862 + }, + { + "epoch": 0.1, + "learning_rate": 1.9521341266489465e-05, + "loss": 0.6216, + "step": 2863 + }, + { + "epoch": 0.1, + "learning_rate": 1.952100836525147e-05, + "loss": 0.6206, + "step": 2864 + }, + { + "epoch": 0.1, + "learning_rate": 1.952067535112987e-05, + "loss": 0.6007, + "step": 2865 + }, + { + "epoch": 0.1, + "learning_rate": 1.9520342224128623e-05, + "loss": 0.6337, + "step": 2866 + }, + { + "epoch": 0.1, + "learning_rate": 1.9520008984251676e-05, + "loss": 0.632, + "step": 2867 + }, + { + "epoch": 0.1, + "learning_rate": 1.9519675631502978e-05, + "loss": 0.6735, + "step": 2868 + }, + { + "epoch": 0.1, + "learning_rate": 1.9519342165886486e-05, + "loss": 0.6077, + "step": 2869 + }, + { + "epoch": 0.1, + "learning_rate": 1.951900858740615e-05, + "loss": 0.591, + "step": 2870 + }, + { + "epoch": 0.1, + "learning_rate": 1.9518674896065925e-05, + "loss": 0.5599, + "step": 2871 + }, + { + "epoch": 0.1, + "learning_rate": 1.9518341091869767e-05, + "loss": 0.6671, + "step": 2872 + }, + { + "epoch": 0.1, + "learning_rate": 1.9518007174821635e-05, + "loss": 0.6408, + "step": 2873 + }, + { + "epoch": 0.1, + "learning_rate": 1.9517673144925485e-05, + "loss": 0.6097, + "step": 2874 + }, + { + "epoch": 0.1, + "learning_rate": 1.9517339002185284e-05, + "loss": 0.6445, + "step": 2875 + }, + { + "epoch": 0.1, + "learning_rate": 1.9517004746604988e-05, + "loss": 0.6357, + "step": 2876 + }, + { + "epoch": 0.1, + "learning_rate": 1.951667037818856e-05, + "loss": 0.6399, + "step": 2877 + }, + { + "epoch": 0.1, + "learning_rate": 1.951633589693997e-05, + "loss": 0.6776, + "step": 2878 + }, + { + "epoch": 0.1, + "learning_rate": 1.9516001302863173e-05, + "loss": 0.6565, + "step": 2879 + }, + { + "epoch": 0.1, + "learning_rate": 1.9515666595962147e-05, + "loss": 0.6183, + "step": 2880 + }, + { + "epoch": 0.1, + "learning_rate": 1.9515331776240858e-05, + "loss": 0.6782, + "step": 2881 + }, + { + "epoch": 0.1, + "learning_rate": 1.9514996843703272e-05, + "loss": 0.6518, + "step": 2882 + }, + { + "epoch": 0.1, + "learning_rate": 1.9514661798353362e-05, + "loss": 0.6313, + "step": 2883 + }, + { + "epoch": 0.1, + "learning_rate": 1.9514326640195103e-05, + "loss": 0.6545, + "step": 2884 + }, + { + "epoch": 0.1, + "learning_rate": 1.951399136923246e-05, + "loss": 0.6188, + "step": 2885 + }, + { + "epoch": 0.1, + "learning_rate": 1.951365598546942e-05, + "loss": 0.6785, + "step": 2886 + }, + { + "epoch": 0.1, + "learning_rate": 1.9513320488909948e-05, + "loss": 0.6182, + "step": 2887 + }, + { + "epoch": 0.1, + "learning_rate": 1.951298487955803e-05, + "loss": 0.6473, + "step": 2888 + }, + { + "epoch": 0.1, + "learning_rate": 1.9512649157417645e-05, + "loss": 0.6272, + "step": 2889 + }, + { + "epoch": 0.1, + "learning_rate": 1.9512313322492767e-05, + "loss": 0.5942, + "step": 2890 + }, + { + "epoch": 0.1, + "learning_rate": 1.9511977374787382e-05, + "loss": 0.6619, + "step": 2891 + }, + { + "epoch": 0.1, + "learning_rate": 1.9511641314305473e-05, + "loss": 0.6752, + "step": 2892 + }, + { + "epoch": 0.1, + "learning_rate": 1.951130514105102e-05, + "loss": 0.6497, + "step": 2893 + }, + { + "epoch": 0.1, + "learning_rate": 1.951096885502802e-05, + "loss": 0.6138, + "step": 2894 + }, + { + "epoch": 0.1, + "learning_rate": 1.9510632456240446e-05, + "loss": 0.6298, + "step": 2895 + }, + { + "epoch": 0.1, + "learning_rate": 1.95102959446923e-05, + "loss": 0.6372, + "step": 2896 + }, + { + "epoch": 0.1, + "learning_rate": 1.950995932038756e-05, + "loss": 0.6444, + "step": 2897 + }, + { + "epoch": 0.1, + "learning_rate": 1.9509622583330222e-05, + "loss": 0.6476, + "step": 2898 + }, + { + "epoch": 0.1, + "learning_rate": 1.950928573352428e-05, + "loss": 0.648, + "step": 2899 + }, + { + "epoch": 0.1, + "learning_rate": 1.950894877097373e-05, + "loss": 0.6717, + "step": 2900 + }, + { + "epoch": 0.1, + "learning_rate": 1.9508611695682557e-05, + "loss": 0.6462, + "step": 2901 + }, + { + "epoch": 0.1, + "learning_rate": 1.9508274507654767e-05, + "loss": 0.6252, + "step": 2902 + }, + { + "epoch": 0.1, + "learning_rate": 1.9507937206894355e-05, + "loss": 0.6384, + "step": 2903 + }, + { + "epoch": 0.1, + "learning_rate": 1.950759979340532e-05, + "loss": 0.6555, + "step": 2904 + }, + { + "epoch": 0.1, + "learning_rate": 1.9507262267191662e-05, + "loss": 0.6148, + "step": 2905 + }, + { + "epoch": 0.1, + "learning_rate": 1.950692462825738e-05, + "loss": 0.6039, + "step": 2906 + }, + { + "epoch": 0.1, + "learning_rate": 1.9506586876606485e-05, + "loss": 0.5911, + "step": 2907 + }, + { + "epoch": 0.1, + "learning_rate": 1.9506249012242974e-05, + "loss": 0.6076, + "step": 2908 + }, + { + "epoch": 0.1, + "learning_rate": 1.9505911035170854e-05, + "loss": 0.6519, + "step": 2909 + }, + { + "epoch": 0.1, + "learning_rate": 1.950557294539414e-05, + "loss": 0.6645, + "step": 2910 + }, + { + "epoch": 0.1, + "learning_rate": 1.9505234742916827e-05, + "loss": 0.6329, + "step": 2911 + }, + { + "epoch": 0.1, + "learning_rate": 1.9504896427742934e-05, + "loss": 0.6529, + "step": 2912 + }, + { + "epoch": 0.1, + "learning_rate": 1.9504557999876473e-05, + "loss": 0.682, + "step": 2913 + }, + { + "epoch": 0.1, + "learning_rate": 1.9504219459321448e-05, + "loss": 0.6165, + "step": 2914 + }, + { + "epoch": 0.1, + "learning_rate": 1.9503880806081882e-05, + "loss": 0.6951, + "step": 2915 + }, + { + "epoch": 0.1, + "learning_rate": 1.9503542040161788e-05, + "loss": 0.6626, + "step": 2916 + }, + { + "epoch": 0.1, + "learning_rate": 1.950320316156518e-05, + "loss": 0.642, + "step": 2917 + }, + { + "epoch": 0.1, + "learning_rate": 1.9502864170296073e-05, + "loss": 0.6248, + "step": 2918 + }, + { + "epoch": 0.1, + "learning_rate": 1.9502525066358496e-05, + "loss": 0.6212, + "step": 2919 + }, + { + "epoch": 0.1, + "learning_rate": 1.950218584975646e-05, + "loss": 0.6539, + "step": 2920 + }, + { + "epoch": 0.1, + "learning_rate": 1.9501846520493993e-05, + "loss": 0.6314, + "step": 2921 + }, + { + "epoch": 0.1, + "learning_rate": 1.950150707857511e-05, + "loss": 0.5868, + "step": 2922 + }, + { + "epoch": 0.1, + "learning_rate": 1.9501167524003846e-05, + "loss": 0.6768, + "step": 2923 + }, + { + "epoch": 0.1, + "learning_rate": 1.9500827856784223e-05, + "loss": 0.6489, + "step": 2924 + }, + { + "epoch": 0.1, + "learning_rate": 1.9500488076920266e-05, + "loss": 0.6414, + "step": 2925 + }, + { + "epoch": 0.1, + "learning_rate": 1.9500148184416004e-05, + "loss": 0.6657, + "step": 2926 + }, + { + "epoch": 0.1, + "learning_rate": 1.9499808179275466e-05, + "loss": 0.5883, + "step": 2927 + }, + { + "epoch": 0.1, + "learning_rate": 1.9499468061502687e-05, + "loss": 0.6605, + "step": 2928 + }, + { + "epoch": 0.1, + "learning_rate": 1.9499127831101696e-05, + "loss": 0.6914, + "step": 2929 + }, + { + "epoch": 0.1, + "learning_rate": 1.9498787488076527e-05, + "loss": 0.649, + "step": 2930 + }, + { + "epoch": 0.1, + "learning_rate": 1.949844703243122e-05, + "loss": 0.6413, + "step": 2931 + }, + { + "epoch": 0.1, + "learning_rate": 1.9498106464169805e-05, + "loss": 0.6226, + "step": 2932 + }, + { + "epoch": 0.1, + "learning_rate": 1.9497765783296323e-05, + "loss": 0.6956, + "step": 2933 + }, + { + "epoch": 0.1, + "learning_rate": 1.9497424989814814e-05, + "loss": 0.6488, + "step": 2934 + }, + { + "epoch": 0.1, + "learning_rate": 1.9497084083729315e-05, + "loss": 0.6563, + "step": 2935 + }, + { + "epoch": 0.1, + "learning_rate": 1.949674306504387e-05, + "loss": 0.6346, + "step": 2936 + }, + { + "epoch": 0.1, + "learning_rate": 1.9496401933762526e-05, + "loss": 0.6351, + "step": 2937 + }, + { + "epoch": 0.1, + "learning_rate": 1.9496060689889323e-05, + "loss": 0.6696, + "step": 2938 + }, + { + "epoch": 0.1, + "learning_rate": 1.9495719333428308e-05, + "loss": 0.6481, + "step": 2939 + }, + { + "epoch": 0.1, + "learning_rate": 1.9495377864383526e-05, + "loss": 0.637, + "step": 2940 + }, + { + "epoch": 0.1, + "learning_rate": 1.949503628275903e-05, + "loss": 0.6508, + "step": 2941 + }, + { + "epoch": 0.1, + "learning_rate": 1.9494694588558863e-05, + "loss": 0.6682, + "step": 2942 + }, + { + "epoch": 0.1, + "learning_rate": 1.949435278178709e-05, + "loss": 0.65, + "step": 2943 + }, + { + "epoch": 0.1, + "learning_rate": 1.9494010862447745e-05, + "loss": 0.6324, + "step": 2944 + }, + { + "epoch": 0.1, + "learning_rate": 1.9493668830544897e-05, + "loss": 0.6406, + "step": 2945 + }, + { + "epoch": 0.1, + "learning_rate": 1.9493326686082592e-05, + "loss": 0.6587, + "step": 2946 + }, + { + "epoch": 0.1, + "learning_rate": 1.9492984429064893e-05, + "loss": 0.6883, + "step": 2947 + }, + { + "epoch": 0.1, + "learning_rate": 1.9492642059495854e-05, + "loss": 0.6353, + "step": 2948 + }, + { + "epoch": 0.1, + "learning_rate": 1.9492299577379534e-05, + "loss": 0.6333, + "step": 2949 + }, + { + "epoch": 0.1, + "learning_rate": 1.9491956982719994e-05, + "loss": 0.6484, + "step": 2950 + }, + { + "epoch": 0.1, + "learning_rate": 1.94916142755213e-05, + "loss": 0.5977, + "step": 2951 + }, + { + "epoch": 0.1, + "learning_rate": 1.949127145578751e-05, + "loss": 0.679, + "step": 2952 + }, + { + "epoch": 0.1, + "learning_rate": 1.9490928523522692e-05, + "loss": 0.7095, + "step": 2953 + }, + { + "epoch": 0.1, + "learning_rate": 1.9490585478730904e-05, + "loss": 0.6252, + "step": 2954 + }, + { + "epoch": 0.1, + "learning_rate": 1.9490242321416227e-05, + "loss": 0.6887, + "step": 2955 + }, + { + "epoch": 0.1, + "learning_rate": 1.948989905158272e-05, + "loss": 0.6389, + "step": 2956 + }, + { + "epoch": 0.1, + "learning_rate": 1.948955566923445e-05, + "loss": 0.6223, + "step": 2957 + }, + { + "epoch": 0.1, + "learning_rate": 1.94892121743755e-05, + "loss": 0.6817, + "step": 2958 + }, + { + "epoch": 0.1, + "learning_rate": 1.9488868567009935e-05, + "loss": 0.6624, + "step": 2959 + }, + { + "epoch": 0.1, + "learning_rate": 1.9488524847141825e-05, + "loss": 0.6844, + "step": 2960 + }, + { + "epoch": 0.1, + "learning_rate": 1.9488181014775255e-05, + "loss": 0.6694, + "step": 2961 + }, + { + "epoch": 0.1, + "learning_rate": 1.9487837069914294e-05, + "loss": 0.6936, + "step": 2962 + }, + { + "epoch": 0.1, + "learning_rate": 1.948749301256302e-05, + "loss": 0.6617, + "step": 2963 + }, + { + "epoch": 0.1, + "learning_rate": 1.9487148842725517e-05, + "loss": 0.6485, + "step": 2964 + }, + { + "epoch": 0.1, + "learning_rate": 1.9486804560405863e-05, + "loss": 0.6164, + "step": 2965 + }, + { + "epoch": 0.1, + "learning_rate": 1.948646016560814e-05, + "loss": 0.6194, + "step": 2966 + }, + { + "epoch": 0.1, + "learning_rate": 1.9486115658336433e-05, + "loss": 0.7146, + "step": 2967 + }, + { + "epoch": 0.1, + "learning_rate": 1.9485771038594822e-05, + "loss": 0.5839, + "step": 2968 + }, + { + "epoch": 0.1, + "learning_rate": 1.94854263063874e-05, + "loss": 0.6575, + "step": 2969 + }, + { + "epoch": 0.1, + "learning_rate": 1.9485081461718245e-05, + "loss": 0.5793, + "step": 2970 + }, + { + "epoch": 0.1, + "learning_rate": 1.9484736504591454e-05, + "loss": 0.6651, + "step": 2971 + }, + { + "epoch": 0.1, + "learning_rate": 1.948439143501111e-05, + "loss": 0.7193, + "step": 2972 + }, + { + "epoch": 0.1, + "learning_rate": 1.948404625298131e-05, + "loss": 0.6561, + "step": 2973 + }, + { + "epoch": 0.1, + "learning_rate": 1.9483700958506143e-05, + "loss": 0.6226, + "step": 2974 + }, + { + "epoch": 0.1, + "learning_rate": 1.9483355551589706e-05, + "loss": 0.645, + "step": 2975 + }, + { + "epoch": 0.1, + "learning_rate": 1.9483010032236092e-05, + "loss": 0.6416, + "step": 2976 + }, + { + "epoch": 0.1, + "learning_rate": 1.94826644004494e-05, + "loss": 0.6335, + "step": 2977 + }, + { + "epoch": 0.1, + "learning_rate": 1.948231865623372e-05, + "loss": 0.628, + "step": 2978 + }, + { + "epoch": 0.1, + "learning_rate": 1.9481972799593164e-05, + "loss": 0.6177, + "step": 2979 + }, + { + "epoch": 0.1, + "learning_rate": 1.948162683053182e-05, + "loss": 0.6396, + "step": 2980 + }, + { + "epoch": 0.1, + "learning_rate": 1.9481280749053798e-05, + "loss": 0.6138, + "step": 2981 + }, + { + "epoch": 0.1, + "learning_rate": 1.94809345551632e-05, + "loss": 0.6541, + "step": 2982 + }, + { + "epoch": 0.1, + "learning_rate": 1.9480588248864126e-05, + "loss": 0.6375, + "step": 2983 + }, + { + "epoch": 0.1, + "learning_rate": 1.948024183016069e-05, + "loss": 0.6352, + "step": 2984 + }, + { + "epoch": 0.1, + "learning_rate": 1.9479895299056992e-05, + "loss": 0.6467, + "step": 2985 + }, + { + "epoch": 0.1, + "learning_rate": 1.9479548655557145e-05, + "loss": 0.6427, + "step": 2986 + }, + { + "epoch": 0.1, + "learning_rate": 1.9479201899665255e-05, + "loss": 0.7015, + "step": 2987 + }, + { + "epoch": 0.1, + "learning_rate": 1.9478855031385435e-05, + "loss": 0.6062, + "step": 2988 + }, + { + "epoch": 0.1, + "learning_rate": 1.94785080507218e-05, + "loss": 0.6458, + "step": 2989 + }, + { + "epoch": 0.1, + "learning_rate": 1.947816095767846e-05, + "loss": 0.6326, + "step": 2990 + }, + { + "epoch": 0.1, + "learning_rate": 1.9477813752259533e-05, + "loss": 0.6358, + "step": 2991 + }, + { + "epoch": 0.1, + "learning_rate": 1.947746643446913e-05, + "loss": 0.6853, + "step": 2992 + }, + { + "epoch": 0.1, + "learning_rate": 1.9477119004311376e-05, + "loss": 0.674, + "step": 2993 + }, + { + "epoch": 0.1, + "learning_rate": 1.947677146179039e-05, + "loss": 0.6589, + "step": 2994 + }, + { + "epoch": 0.1, + "learning_rate": 1.9476423806910286e-05, + "loss": 0.6283, + "step": 2995 + }, + { + "epoch": 0.1, + "learning_rate": 1.9476076039675195e-05, + "loss": 0.6294, + "step": 2996 + }, + { + "epoch": 0.1, + "learning_rate": 1.9475728160089234e-05, + "loss": 0.6335, + "step": 2997 + }, + { + "epoch": 0.1, + "learning_rate": 1.9475380168156527e-05, + "loss": 0.6314, + "step": 2998 + }, + { + "epoch": 0.1, + "learning_rate": 1.9475032063881202e-05, + "loss": 0.6668, + "step": 2999 + }, + { + "epoch": 0.1, + "learning_rate": 1.9474683847267384e-05, + "loss": 0.5716, + "step": 3000 + }, + { + "epoch": 0.1, + "learning_rate": 1.9474335518319206e-05, + "loss": 0.5958, + "step": 3001 + }, + { + "epoch": 0.1, + "learning_rate": 1.9473987077040795e-05, + "loss": 0.6297, + "step": 3002 + }, + { + "epoch": 0.1, + "learning_rate": 1.9473638523436285e-05, + "loss": 0.6791, + "step": 3003 + }, + { + "epoch": 0.1, + "learning_rate": 1.94732898575098e-05, + "loss": 0.6715, + "step": 3004 + }, + { + "epoch": 0.1, + "learning_rate": 1.9472941079265486e-05, + "loss": 0.6935, + "step": 3005 + }, + { + "epoch": 0.1, + "learning_rate": 1.9472592188707467e-05, + "loss": 0.7065, + "step": 3006 + }, + { + "epoch": 0.1, + "learning_rate": 1.947224318583989e-05, + "loss": 0.667, + "step": 3007 + }, + { + "epoch": 0.1, + "learning_rate": 1.9471894070666884e-05, + "loss": 0.6577, + "step": 3008 + }, + { + "epoch": 0.1, + "learning_rate": 1.9471544843192593e-05, + "loss": 0.6942, + "step": 3009 + }, + { + "epoch": 0.1, + "learning_rate": 1.9471195503421158e-05, + "loss": 0.6628, + "step": 3010 + }, + { + "epoch": 0.1, + "learning_rate": 1.9470846051356715e-05, + "loss": 0.6345, + "step": 3011 + }, + { + "epoch": 0.1, + "learning_rate": 1.9470496487003414e-05, + "loss": 0.6421, + "step": 3012 + }, + { + "epoch": 0.1, + "learning_rate": 1.9470146810365397e-05, + "loss": 0.6375, + "step": 3013 + }, + { + "epoch": 0.1, + "learning_rate": 1.946979702144681e-05, + "loss": 0.6728, + "step": 3014 + }, + { + "epoch": 0.1, + "learning_rate": 1.94694471202518e-05, + "loss": 0.698, + "step": 3015 + }, + { + "epoch": 0.1, + "learning_rate": 1.9469097106784513e-05, + "loss": 0.6699, + "step": 3016 + }, + { + "epoch": 0.1, + "learning_rate": 1.9468746981049102e-05, + "loss": 0.6403, + "step": 3017 + }, + { + "epoch": 0.1, + "learning_rate": 1.946839674304972e-05, + "loss": 0.6336, + "step": 3018 + }, + { + "epoch": 0.1, + "learning_rate": 1.9468046392790516e-05, + "loss": 0.6554, + "step": 3019 + }, + { + "epoch": 0.1, + "learning_rate": 1.9467695930275642e-05, + "loss": 0.6653, + "step": 3020 + }, + { + "epoch": 0.1, + "learning_rate": 1.946734535550926e-05, + "loss": 0.6416, + "step": 3021 + }, + { + "epoch": 0.1, + "learning_rate": 1.946699466849552e-05, + "loss": 0.593, + "step": 3022 + }, + { + "epoch": 0.1, + "learning_rate": 1.9466643869238585e-05, + "loss": 0.6224, + "step": 3023 + }, + { + "epoch": 0.1, + "learning_rate": 1.9466292957742608e-05, + "loss": 0.5788, + "step": 3024 + }, + { + "epoch": 0.1, + "learning_rate": 1.9465941934011757e-05, + "loss": 0.6412, + "step": 3025 + }, + { + "epoch": 0.1, + "learning_rate": 1.946559079805019e-05, + "loss": 0.5931, + "step": 3026 + }, + { + "epoch": 0.1, + "learning_rate": 1.9465239549862068e-05, + "loss": 0.6723, + "step": 3027 + }, + { + "epoch": 0.1, + "learning_rate": 1.9464888189451558e-05, + "loss": 0.6886, + "step": 3028 + }, + { + "epoch": 0.1, + "learning_rate": 1.9464536716822823e-05, + "loss": 0.5871, + "step": 3029 + }, + { + "epoch": 0.1, + "learning_rate": 1.9464185131980034e-05, + "loss": 0.6522, + "step": 3030 + }, + { + "epoch": 0.11, + "learning_rate": 1.9463833434927358e-05, + "loss": 0.6113, + "step": 3031 + }, + { + "epoch": 0.11, + "learning_rate": 1.9463481625668966e-05, + "loss": 0.6701, + "step": 3032 + }, + { + "epoch": 0.11, + "learning_rate": 1.9463129704209026e-05, + "loss": 0.6714, + "step": 3033 + }, + { + "epoch": 0.11, + "learning_rate": 1.9462777670551715e-05, + "loss": 0.6528, + "step": 3034 + }, + { + "epoch": 0.11, + "learning_rate": 1.9462425524701204e-05, + "loss": 0.6543, + "step": 3035 + }, + { + "epoch": 0.11, + "learning_rate": 1.9462073266661666e-05, + "loss": 0.5957, + "step": 3036 + }, + { + "epoch": 0.11, + "learning_rate": 1.9461720896437284e-05, + "loss": 0.638, + "step": 3037 + }, + { + "epoch": 0.11, + "learning_rate": 1.9461368414032228e-05, + "loss": 0.6218, + "step": 3038 + }, + { + "epoch": 0.11, + "learning_rate": 1.9461015819450678e-05, + "loss": 0.6295, + "step": 3039 + }, + { + "epoch": 0.11, + "learning_rate": 1.9460663112696823e-05, + "loss": 0.6267, + "step": 3040 + }, + { + "epoch": 0.11, + "learning_rate": 1.946031029377484e-05, + "loss": 0.6694, + "step": 3041 + }, + { + "epoch": 0.11, + "learning_rate": 1.9459957362688902e-05, + "loss": 0.6847, + "step": 3042 + }, + { + "epoch": 0.11, + "learning_rate": 1.9459604319443213e-05, + "loss": 0.6347, + "step": 3043 + }, + { + "epoch": 0.11, + "learning_rate": 1.9459251164041945e-05, + "loss": 0.6352, + "step": 3044 + }, + { + "epoch": 0.11, + "learning_rate": 1.9458897896489283e-05, + "loss": 0.5886, + "step": 3045 + }, + { + "epoch": 0.11, + "learning_rate": 1.9458544516789425e-05, + "loss": 0.6914, + "step": 3046 + }, + { + "epoch": 0.11, + "learning_rate": 1.945819102494656e-05, + "loss": 0.6448, + "step": 3047 + }, + { + "epoch": 0.11, + "learning_rate": 1.945783742096487e-05, + "loss": 0.6415, + "step": 3048 + }, + { + "epoch": 0.11, + "learning_rate": 1.9457483704848555e-05, + "loss": 0.6407, + "step": 3049 + }, + { + "epoch": 0.11, + "learning_rate": 1.9457129876601807e-05, + "loss": 0.6142, + "step": 3050 + }, + { + "epoch": 0.11, + "learning_rate": 1.9456775936228825e-05, + "loss": 0.5882, + "step": 3051 + }, + { + "epoch": 0.11, + "learning_rate": 1.9456421883733797e-05, + "loss": 0.6539, + "step": 3052 + }, + { + "epoch": 0.11, + "learning_rate": 1.9456067719120924e-05, + "loss": 0.6023, + "step": 3053 + }, + { + "epoch": 0.11, + "learning_rate": 1.945571344239441e-05, + "loss": 0.6728, + "step": 3054 + }, + { + "epoch": 0.11, + "learning_rate": 1.945535905355845e-05, + "loss": 0.6222, + "step": 3055 + }, + { + "epoch": 0.11, + "learning_rate": 1.9455004552617248e-05, + "loss": 0.6741, + "step": 3056 + }, + { + "epoch": 0.11, + "learning_rate": 1.9454649939575002e-05, + "loss": 0.661, + "step": 3057 + }, + { + "epoch": 0.11, + "learning_rate": 1.945429521443593e-05, + "loss": 0.6496, + "step": 3058 + }, + { + "epoch": 0.11, + "learning_rate": 1.945394037720422e-05, + "loss": 0.6755, + "step": 3059 + }, + { + "epoch": 0.11, + "learning_rate": 1.945358542788409e-05, + "loss": 0.6241, + "step": 3060 + }, + { + "epoch": 0.11, + "learning_rate": 1.9453230366479746e-05, + "loss": 0.6432, + "step": 3061 + }, + { + "epoch": 0.11, + "learning_rate": 1.94528751929954e-05, + "loss": 0.6157, + "step": 3062 + }, + { + "epoch": 0.11, + "learning_rate": 1.9452519907435256e-05, + "loss": 0.6187, + "step": 3063 + }, + { + "epoch": 0.11, + "learning_rate": 1.9452164509803535e-05, + "loss": 0.6488, + "step": 3064 + }, + { + "epoch": 0.11, + "learning_rate": 1.9451809000104446e-05, + "loss": 0.6612, + "step": 3065 + }, + { + "epoch": 0.11, + "learning_rate": 1.94514533783422e-05, + "loss": 0.6838, + "step": 3066 + }, + { + "epoch": 0.11, + "learning_rate": 1.9451097644521023e-05, + "loss": 0.634, + "step": 3067 + }, + { + "epoch": 0.11, + "learning_rate": 1.945074179864513e-05, + "loss": 0.5979, + "step": 3068 + }, + { + "epoch": 0.11, + "learning_rate": 1.945038584071873e-05, + "loss": 0.6853, + "step": 3069 + }, + { + "epoch": 0.11, + "learning_rate": 1.9450029770746058e-05, + "loss": 0.651, + "step": 3070 + }, + { + "epoch": 0.11, + "learning_rate": 1.9449673588731325e-05, + "loss": 0.6535, + "step": 3071 + }, + { + "epoch": 0.11, + "learning_rate": 1.944931729467876e-05, + "loss": 0.6404, + "step": 3072 + }, + { + "epoch": 0.11, + "learning_rate": 1.9448960888592582e-05, + "loss": 0.6389, + "step": 3073 + }, + { + "epoch": 0.11, + "learning_rate": 1.9448604370477022e-05, + "loss": 0.6477, + "step": 3074 + }, + { + "epoch": 0.11, + "learning_rate": 1.9448247740336303e-05, + "loss": 0.6357, + "step": 3075 + }, + { + "epoch": 0.11, + "learning_rate": 1.9447890998174657e-05, + "loss": 0.6639, + "step": 3076 + }, + { + "epoch": 0.11, + "learning_rate": 1.9447534143996312e-05, + "loss": 0.5919, + "step": 3077 + }, + { + "epoch": 0.11, + "learning_rate": 1.9447177177805497e-05, + "loss": 0.617, + "step": 3078 + }, + { + "epoch": 0.11, + "learning_rate": 1.9446820099606446e-05, + "loss": 0.6443, + "step": 3079 + }, + { + "epoch": 0.11, + "learning_rate": 1.9446462909403392e-05, + "loss": 0.6581, + "step": 3080 + }, + { + "epoch": 0.11, + "learning_rate": 1.9446105607200573e-05, + "loss": 0.6251, + "step": 3081 + }, + { + "epoch": 0.11, + "learning_rate": 1.9445748193002217e-05, + "loss": 0.6437, + "step": 3082 + }, + { + "epoch": 0.11, + "learning_rate": 1.9445390666812574e-05, + "loss": 0.6047, + "step": 3083 + }, + { + "epoch": 0.11, + "learning_rate": 1.944503302863587e-05, + "loss": 0.6008, + "step": 3084 + }, + { + "epoch": 0.11, + "learning_rate": 1.9444675278476354e-05, + "loss": 0.6747, + "step": 3085 + }, + { + "epoch": 0.11, + "learning_rate": 1.944431741633827e-05, + "loss": 0.6692, + "step": 3086 + }, + { + "epoch": 0.11, + "learning_rate": 1.944395944222585e-05, + "loss": 0.6599, + "step": 3087 + }, + { + "epoch": 0.11, + "learning_rate": 1.944360135614334e-05, + "loss": 0.6431, + "step": 3088 + }, + { + "epoch": 0.11, + "learning_rate": 1.9443243158095e-05, + "loss": 0.6313, + "step": 3089 + }, + { + "epoch": 0.11, + "learning_rate": 1.944288484808506e-05, + "loss": 0.6328, + "step": 3090 + }, + { + "epoch": 0.11, + "learning_rate": 1.944252642611778e-05, + "loss": 0.6597, + "step": 3091 + }, + { + "epoch": 0.11, + "learning_rate": 1.94421678921974e-05, + "loss": 0.7125, + "step": 3092 + }, + { + "epoch": 0.11, + "learning_rate": 1.9441809246328174e-05, + "loss": 0.6483, + "step": 3093 + }, + { + "epoch": 0.11, + "learning_rate": 1.9441450488514357e-05, + "loss": 0.6538, + "step": 3094 + }, + { + "epoch": 0.11, + "learning_rate": 1.9441091618760202e-05, + "loss": 0.6629, + "step": 3095 + }, + { + "epoch": 0.11, + "learning_rate": 1.9440732637069962e-05, + "loss": 0.651, + "step": 3096 + }, + { + "epoch": 0.11, + "learning_rate": 1.9440373543447896e-05, + "loss": 0.6338, + "step": 3097 + }, + { + "epoch": 0.11, + "learning_rate": 1.9440014337898256e-05, + "loss": 0.6601, + "step": 3098 + }, + { + "epoch": 0.11, + "learning_rate": 1.9439655020425305e-05, + "loss": 0.6394, + "step": 3099 + }, + { + "epoch": 0.11, + "learning_rate": 1.9439295591033304e-05, + "loss": 0.6131, + "step": 3100 + }, + { + "epoch": 0.11, + "learning_rate": 1.9438936049726512e-05, + "loss": 0.6369, + "step": 3101 + }, + { + "epoch": 0.11, + "learning_rate": 1.9438576396509196e-05, + "loss": 0.6314, + "step": 3102 + }, + { + "epoch": 0.11, + "learning_rate": 1.9438216631385613e-05, + "loss": 0.6551, + "step": 3103 + }, + { + "epoch": 0.11, + "learning_rate": 1.9437856754360033e-05, + "loss": 0.6567, + "step": 3104 + }, + { + "epoch": 0.11, + "learning_rate": 1.9437496765436722e-05, + "loss": 0.6271, + "step": 3105 + }, + { + "epoch": 0.11, + "learning_rate": 1.9437136664619953e-05, + "loss": 0.5671, + "step": 3106 + }, + { + "epoch": 0.11, + "learning_rate": 1.9436776451913986e-05, + "loss": 0.6519, + "step": 3107 + }, + { + "epoch": 0.11, + "learning_rate": 1.9436416127323095e-05, + "loss": 0.5807, + "step": 3108 + }, + { + "epoch": 0.11, + "learning_rate": 1.943605569085156e-05, + "loss": 0.6495, + "step": 3109 + }, + { + "epoch": 0.11, + "learning_rate": 1.9435695142503645e-05, + "loss": 0.6915, + "step": 3110 + }, + { + "epoch": 0.11, + "learning_rate": 1.9435334482283626e-05, + "loss": 0.6565, + "step": 3111 + }, + { + "epoch": 0.11, + "learning_rate": 1.943497371019578e-05, + "loss": 0.6466, + "step": 3112 + }, + { + "epoch": 0.11, + "learning_rate": 1.943461282624439e-05, + "loss": 0.6629, + "step": 3113 + }, + { + "epoch": 0.11, + "learning_rate": 1.9434251830433728e-05, + "loss": 0.6518, + "step": 3114 + }, + { + "epoch": 0.11, + "learning_rate": 1.9433890722768077e-05, + "loss": 0.6832, + "step": 3115 + }, + { + "epoch": 0.11, + "learning_rate": 1.9433529503251716e-05, + "loss": 0.6896, + "step": 3116 + }, + { + "epoch": 0.11, + "learning_rate": 1.943316817188893e-05, + "loss": 0.6675, + "step": 3117 + }, + { + "epoch": 0.11, + "learning_rate": 1.9432806728684e-05, + "loss": 0.6286, + "step": 3118 + }, + { + "epoch": 0.11, + "learning_rate": 1.9432445173641216e-05, + "loss": 0.6674, + "step": 3119 + }, + { + "epoch": 0.11, + "learning_rate": 1.9432083506764864e-05, + "loss": 0.6316, + "step": 3120 + }, + { + "epoch": 0.11, + "learning_rate": 1.9431721728059228e-05, + "loss": 0.6473, + "step": 3121 + }, + { + "epoch": 0.11, + "learning_rate": 1.94313598375286e-05, + "loss": 0.6282, + "step": 3122 + }, + { + "epoch": 0.11, + "learning_rate": 1.943099783517727e-05, + "loss": 0.6587, + "step": 3123 + }, + { + "epoch": 0.11, + "learning_rate": 1.943063572100953e-05, + "loss": 0.645, + "step": 3124 + }, + { + "epoch": 0.11, + "learning_rate": 1.9430273495029675e-05, + "loss": 0.6508, + "step": 3125 + }, + { + "epoch": 0.11, + "learning_rate": 1.9429911157242e-05, + "loss": 0.6414, + "step": 3126 + }, + { + "epoch": 0.11, + "learning_rate": 1.9429548707650795e-05, + "loss": 0.6116, + "step": 3127 + }, + { + "epoch": 0.11, + "learning_rate": 1.9429186146260366e-05, + "loss": 0.6113, + "step": 3128 + }, + { + "epoch": 0.11, + "learning_rate": 1.9428823473075008e-05, + "loss": 0.638, + "step": 3129 + }, + { + "epoch": 0.11, + "learning_rate": 1.9428460688099015e-05, + "loss": 0.6345, + "step": 3130 + }, + { + "epoch": 0.11, + "learning_rate": 1.94280977913367e-05, + "loss": 0.5896, + "step": 3131 + }, + { + "epoch": 0.11, + "learning_rate": 1.9427734782792352e-05, + "loss": 0.6514, + "step": 3132 + }, + { + "epoch": 0.11, + "learning_rate": 1.9427371662470286e-05, + "loss": 0.7311, + "step": 3133 + }, + { + "epoch": 0.11, + "learning_rate": 1.9427008430374802e-05, + "loss": 0.6387, + "step": 3134 + }, + { + "epoch": 0.11, + "learning_rate": 1.9426645086510207e-05, + "loss": 0.6737, + "step": 3135 + }, + { + "epoch": 0.11, + "learning_rate": 1.942628163088081e-05, + "loss": 0.6173, + "step": 3136 + }, + { + "epoch": 0.11, + "learning_rate": 1.9425918063490922e-05, + "loss": 0.6257, + "step": 3137 + }, + { + "epoch": 0.11, + "learning_rate": 1.942555438434485e-05, + "loss": 0.6192, + "step": 3138 + }, + { + "epoch": 0.11, + "learning_rate": 1.9425190593446906e-05, + "loss": 0.6783, + "step": 3139 + }, + { + "epoch": 0.11, + "learning_rate": 1.942482669080141e-05, + "loss": 0.6251, + "step": 3140 + }, + { + "epoch": 0.11, + "learning_rate": 1.9424462676412664e-05, + "loss": 0.6449, + "step": 3141 + }, + { + "epoch": 0.11, + "learning_rate": 1.9424098550284997e-05, + "loss": 0.6743, + "step": 3142 + }, + { + "epoch": 0.11, + "learning_rate": 1.9423734312422717e-05, + "loss": 0.6623, + "step": 3143 + }, + { + "epoch": 0.11, + "learning_rate": 1.9423369962830147e-05, + "loss": 0.6346, + "step": 3144 + }, + { + "epoch": 0.11, + "learning_rate": 1.9423005501511603e-05, + "loss": 0.6562, + "step": 3145 + }, + { + "epoch": 0.11, + "learning_rate": 1.942264092847141e-05, + "loss": 0.6426, + "step": 3146 + }, + { + "epoch": 0.11, + "learning_rate": 1.942227624371389e-05, + "loss": 0.6003, + "step": 3147 + }, + { + "epoch": 0.11, + "learning_rate": 1.9421911447243365e-05, + "loss": 0.6501, + "step": 3148 + }, + { + "epoch": 0.11, + "learning_rate": 1.942154653906416e-05, + "loss": 0.6335, + "step": 3149 + }, + { + "epoch": 0.11, + "learning_rate": 1.9421181519180606e-05, + "loss": 0.6445, + "step": 3150 + }, + { + "epoch": 0.11, + "learning_rate": 1.9420816387597024e-05, + "loss": 0.6382, + "step": 3151 + }, + { + "epoch": 0.11, + "learning_rate": 1.9420451144317745e-05, + "loss": 0.6755, + "step": 3152 + }, + { + "epoch": 0.11, + "learning_rate": 1.9420085789347106e-05, + "loss": 0.6448, + "step": 3153 + }, + { + "epoch": 0.11, + "learning_rate": 1.941972032268943e-05, + "loss": 0.619, + "step": 3154 + }, + { + "epoch": 0.11, + "learning_rate": 1.9419354744349054e-05, + "loss": 0.6582, + "step": 3155 + }, + { + "epoch": 0.11, + "learning_rate": 1.9418989054330314e-05, + "loss": 0.6275, + "step": 3156 + }, + { + "epoch": 0.11, + "learning_rate": 1.941862325263754e-05, + "loss": 0.6265, + "step": 3157 + }, + { + "epoch": 0.11, + "learning_rate": 1.9418257339275075e-05, + "loss": 0.5854, + "step": 3158 + }, + { + "epoch": 0.11, + "learning_rate": 1.9417891314247256e-05, + "loss": 0.698, + "step": 3159 + }, + { + "epoch": 0.11, + "learning_rate": 1.9417525177558418e-05, + "loss": 0.6824, + "step": 3160 + }, + { + "epoch": 0.11, + "learning_rate": 1.9417158929212907e-05, + "loss": 0.6686, + "step": 3161 + }, + { + "epoch": 0.11, + "learning_rate": 1.9416792569215067e-05, + "loss": 0.6721, + "step": 3162 + }, + { + "epoch": 0.11, + "learning_rate": 1.9416426097569238e-05, + "loss": 0.5964, + "step": 3163 + }, + { + "epoch": 0.11, + "learning_rate": 1.9416059514279764e-05, + "loss": 0.6744, + "step": 3164 + }, + { + "epoch": 0.11, + "learning_rate": 1.941569281935099e-05, + "loss": 0.6743, + "step": 3165 + }, + { + "epoch": 0.11, + "learning_rate": 1.9415326012787275e-05, + "loss": 0.678, + "step": 3166 + }, + { + "epoch": 0.11, + "learning_rate": 1.9414959094592954e-05, + "loss": 0.6114, + "step": 3167 + }, + { + "epoch": 0.11, + "learning_rate": 1.9414592064772386e-05, + "loss": 0.6124, + "step": 3168 + }, + { + "epoch": 0.11, + "learning_rate": 1.9414224923329918e-05, + "loss": 0.6545, + "step": 3169 + }, + { + "epoch": 0.11, + "learning_rate": 1.9413857670269903e-05, + "loss": 0.6617, + "step": 3170 + }, + { + "epoch": 0.11, + "learning_rate": 1.94134903055967e-05, + "loss": 0.6378, + "step": 3171 + }, + { + "epoch": 0.11, + "learning_rate": 1.9413122829314657e-05, + "loss": 0.6551, + "step": 3172 + }, + { + "epoch": 0.11, + "learning_rate": 1.941275524142814e-05, + "loss": 0.6292, + "step": 3173 + }, + { + "epoch": 0.11, + "learning_rate": 1.9412387541941497e-05, + "loss": 0.6375, + "step": 3174 + }, + { + "epoch": 0.11, + "learning_rate": 1.9412019730859097e-05, + "loss": 0.6796, + "step": 3175 + }, + { + "epoch": 0.11, + "learning_rate": 1.9411651808185294e-05, + "loss": 0.6432, + "step": 3176 + }, + { + "epoch": 0.11, + "learning_rate": 1.9411283773924455e-05, + "loss": 0.5815, + "step": 3177 + }, + { + "epoch": 0.11, + "learning_rate": 1.9410915628080943e-05, + "loss": 0.5916, + "step": 3178 + }, + { + "epoch": 0.11, + "learning_rate": 1.941054737065912e-05, + "loss": 0.6141, + "step": 3179 + }, + { + "epoch": 0.11, + "learning_rate": 1.941017900166335e-05, + "loss": 0.5911, + "step": 3180 + }, + { + "epoch": 0.11, + "learning_rate": 1.940981052109801e-05, + "loss": 0.6455, + "step": 3181 + }, + { + "epoch": 0.11, + "learning_rate": 1.9409441928967457e-05, + "loss": 0.6442, + "step": 3182 + }, + { + "epoch": 0.11, + "learning_rate": 1.9409073225276073e-05, + "loss": 0.6025, + "step": 3183 + }, + { + "epoch": 0.11, + "learning_rate": 1.940870441002822e-05, + "loss": 0.6165, + "step": 3184 + }, + { + "epoch": 0.11, + "learning_rate": 1.9408335483228272e-05, + "loss": 0.6409, + "step": 3185 + }, + { + "epoch": 0.11, + "learning_rate": 1.9407966444880608e-05, + "loss": 0.6806, + "step": 3186 + }, + { + "epoch": 0.11, + "learning_rate": 1.94075972949896e-05, + "loss": 0.5893, + "step": 3187 + }, + { + "epoch": 0.11, + "learning_rate": 1.9407228033559628e-05, + "loss": 0.5674, + "step": 3188 + }, + { + "epoch": 0.11, + "learning_rate": 1.9406858660595064e-05, + "loss": 0.6596, + "step": 3189 + }, + { + "epoch": 0.11, + "learning_rate": 1.9406489176100292e-05, + "loss": 0.6762, + "step": 3190 + }, + { + "epoch": 0.11, + "learning_rate": 1.940611958007969e-05, + "loss": 0.6767, + "step": 3191 + }, + { + "epoch": 0.11, + "learning_rate": 1.9405749872537645e-05, + "loss": 0.6326, + "step": 3192 + }, + { + "epoch": 0.11, + "learning_rate": 1.9405380053478534e-05, + "loss": 0.5791, + "step": 3193 + }, + { + "epoch": 0.11, + "learning_rate": 1.9405010122906746e-05, + "loss": 0.5877, + "step": 3194 + }, + { + "epoch": 0.11, + "learning_rate": 1.9404640080826665e-05, + "loss": 0.6365, + "step": 3195 + }, + { + "epoch": 0.11, + "learning_rate": 1.940426992724268e-05, + "loss": 0.6996, + "step": 3196 + }, + { + "epoch": 0.11, + "learning_rate": 1.9403899662159177e-05, + "loss": 0.6283, + "step": 3197 + }, + { + "epoch": 0.11, + "learning_rate": 1.9403529285580547e-05, + "loss": 0.6357, + "step": 3198 + }, + { + "epoch": 0.11, + "learning_rate": 1.9403158797511182e-05, + "loss": 0.6243, + "step": 3199 + }, + { + "epoch": 0.11, + "learning_rate": 1.9402788197955476e-05, + "loss": 0.62, + "step": 3200 + }, + { + "epoch": 0.11, + "learning_rate": 1.940241748691782e-05, + "loss": 0.6419, + "step": 3201 + }, + { + "epoch": 0.11, + "learning_rate": 1.9402046664402612e-05, + "loss": 0.6246, + "step": 3202 + }, + { + "epoch": 0.11, + "learning_rate": 1.9401675730414246e-05, + "loss": 0.59, + "step": 3203 + }, + { + "epoch": 0.11, + "learning_rate": 1.940130468495712e-05, + "loss": 0.6738, + "step": 3204 + }, + { + "epoch": 0.11, + "learning_rate": 1.940093352803564e-05, + "loss": 0.6733, + "step": 3205 + }, + { + "epoch": 0.11, + "learning_rate": 1.9400562259654194e-05, + "loss": 0.6233, + "step": 3206 + }, + { + "epoch": 0.11, + "learning_rate": 1.9400190879817192e-05, + "loss": 0.5503, + "step": 3207 + }, + { + "epoch": 0.11, + "learning_rate": 1.9399819388529038e-05, + "loss": 0.6588, + "step": 3208 + }, + { + "epoch": 0.11, + "learning_rate": 1.9399447785794133e-05, + "loss": 0.6376, + "step": 3209 + }, + { + "epoch": 0.11, + "learning_rate": 1.9399076071616886e-05, + "loss": 0.6789, + "step": 3210 + }, + { + "epoch": 0.11, + "learning_rate": 1.9398704246001697e-05, + "loss": 0.6527, + "step": 3211 + }, + { + "epoch": 0.11, + "learning_rate": 1.939833230895299e-05, + "loss": 0.6706, + "step": 3212 + }, + { + "epoch": 0.11, + "learning_rate": 1.9397960260475154e-05, + "loss": 0.6729, + "step": 3213 + }, + { + "epoch": 0.11, + "learning_rate": 1.9397588100572612e-05, + "loss": 0.6613, + "step": 3214 + }, + { + "epoch": 0.11, + "learning_rate": 1.9397215829249777e-05, + "loss": 0.6424, + "step": 3215 + }, + { + "epoch": 0.11, + "learning_rate": 1.9396843446511065e-05, + "loss": 0.6657, + "step": 3216 + }, + { + "epoch": 0.11, + "learning_rate": 1.9396470952360882e-05, + "loss": 0.644, + "step": 3217 + }, + { + "epoch": 0.11, + "learning_rate": 1.939609834680365e-05, + "loss": 0.5904, + "step": 3218 + }, + { + "epoch": 0.11, + "learning_rate": 1.9395725629843786e-05, + "loss": 0.6298, + "step": 3219 + }, + { + "epoch": 0.11, + "learning_rate": 1.9395352801485708e-05, + "loss": 0.6621, + "step": 3220 + }, + { + "epoch": 0.11, + "learning_rate": 1.9394979861733843e-05, + "loss": 0.665, + "step": 3221 + }, + { + "epoch": 0.11, + "learning_rate": 1.9394606810592603e-05, + "loss": 0.6663, + "step": 3222 + }, + { + "epoch": 0.11, + "learning_rate": 1.939423364806641e-05, + "loss": 0.6324, + "step": 3223 + }, + { + "epoch": 0.11, + "learning_rate": 1.9393860374159703e-05, + "loss": 0.7051, + "step": 3224 + }, + { + "epoch": 0.11, + "learning_rate": 1.939348698887689e-05, + "loss": 0.6807, + "step": 3225 + }, + { + "epoch": 0.11, + "learning_rate": 1.939311349222241e-05, + "loss": 0.6581, + "step": 3226 + }, + { + "epoch": 0.11, + "learning_rate": 1.9392739884200687e-05, + "loss": 0.627, + "step": 3227 + }, + { + "epoch": 0.11, + "learning_rate": 1.939236616481615e-05, + "loss": 0.6897, + "step": 3228 + }, + { + "epoch": 0.11, + "learning_rate": 1.939199233407323e-05, + "loss": 0.6474, + "step": 3229 + }, + { + "epoch": 0.11, + "learning_rate": 1.9391618391976363e-05, + "loss": 0.645, + "step": 3230 + }, + { + "epoch": 0.11, + "learning_rate": 1.9391244338529977e-05, + "loss": 0.6322, + "step": 3231 + }, + { + "epoch": 0.11, + "learning_rate": 1.9390870173738508e-05, + "loss": 0.617, + "step": 3232 + }, + { + "epoch": 0.11, + "learning_rate": 1.9390495897606398e-05, + "loss": 0.6526, + "step": 3233 + }, + { + "epoch": 0.11, + "learning_rate": 1.9390121510138074e-05, + "loss": 0.6691, + "step": 3234 + }, + { + "epoch": 0.11, + "learning_rate": 1.9389747011337987e-05, + "loss": 0.6229, + "step": 3235 + }, + { + "epoch": 0.11, + "learning_rate": 1.9389372401210567e-05, + "loss": 0.6199, + "step": 3236 + }, + { + "epoch": 0.11, + "learning_rate": 1.9388997679760263e-05, + "loss": 0.5942, + "step": 3237 + }, + { + "epoch": 0.11, + "learning_rate": 1.938862284699151e-05, + "loss": 0.6264, + "step": 3238 + }, + { + "epoch": 0.11, + "learning_rate": 1.938824790290876e-05, + "loss": 0.6392, + "step": 3239 + }, + { + "epoch": 0.11, + "learning_rate": 1.9387872847516452e-05, + "loss": 0.5896, + "step": 3240 + }, + { + "epoch": 0.11, + "learning_rate": 1.9387497680819037e-05, + "loss": 0.6363, + "step": 3241 + }, + { + "epoch": 0.11, + "learning_rate": 1.9387122402820965e-05, + "loss": 0.7295, + "step": 3242 + }, + { + "epoch": 0.11, + "learning_rate": 1.938674701352668e-05, + "loss": 0.6591, + "step": 3243 + }, + { + "epoch": 0.11, + "learning_rate": 1.938637151294063e-05, + "loss": 0.637, + "step": 3244 + }, + { + "epoch": 0.11, + "learning_rate": 1.9385995901067276e-05, + "loss": 0.6126, + "step": 3245 + }, + { + "epoch": 0.11, + "learning_rate": 1.938562017791107e-05, + "loss": 0.6596, + "step": 3246 + }, + { + "epoch": 0.11, + "learning_rate": 1.938524434347646e-05, + "loss": 0.6384, + "step": 3247 + }, + { + "epoch": 0.11, + "learning_rate": 1.9384868397767906e-05, + "loss": 0.6283, + "step": 3248 + }, + { + "epoch": 0.11, + "learning_rate": 1.9384492340789868e-05, + "loss": 0.6618, + "step": 3249 + }, + { + "epoch": 0.11, + "learning_rate": 1.9384116172546798e-05, + "loss": 0.6021, + "step": 3250 + }, + { + "epoch": 0.11, + "learning_rate": 1.9383739893043162e-05, + "loss": 0.6354, + "step": 3251 + }, + { + "epoch": 0.11, + "learning_rate": 1.938336350228342e-05, + "loss": 0.6577, + "step": 3252 + }, + { + "epoch": 0.11, + "learning_rate": 1.9382987000272035e-05, + "loss": 0.5928, + "step": 3253 + }, + { + "epoch": 0.11, + "learning_rate": 1.9382610387013464e-05, + "loss": 0.613, + "step": 3254 + }, + { + "epoch": 0.11, + "learning_rate": 1.9382233662512182e-05, + "loss": 0.5817, + "step": 3255 + }, + { + "epoch": 0.11, + "learning_rate": 1.938185682677265e-05, + "loss": 0.6563, + "step": 3256 + }, + { + "epoch": 0.11, + "learning_rate": 1.938147987979934e-05, + "loss": 0.6562, + "step": 3257 + }, + { + "epoch": 0.11, + "learning_rate": 1.9381102821596712e-05, + "loss": 0.6055, + "step": 3258 + }, + { + "epoch": 0.11, + "learning_rate": 1.938072565216925e-05, + "loss": 0.606, + "step": 3259 + }, + { + "epoch": 0.11, + "learning_rate": 1.9380348371521417e-05, + "loss": 0.5991, + "step": 3260 + }, + { + "epoch": 0.11, + "learning_rate": 1.9379970979657682e-05, + "loss": 0.5861, + "step": 3261 + }, + { + "epoch": 0.11, + "learning_rate": 1.9379593476582533e-05, + "loss": 0.5849, + "step": 3262 + }, + { + "epoch": 0.11, + "learning_rate": 1.9379215862300435e-05, + "loss": 0.6591, + "step": 3263 + }, + { + "epoch": 0.11, + "learning_rate": 1.9378838136815864e-05, + "loss": 0.6198, + "step": 3264 + }, + { + "epoch": 0.11, + "learning_rate": 1.937846030013331e-05, + "loss": 0.579, + "step": 3265 + }, + { + "epoch": 0.11, + "learning_rate": 1.9378082352257243e-05, + "loss": 0.6293, + "step": 3266 + }, + { + "epoch": 0.11, + "learning_rate": 1.9377704293192144e-05, + "loss": 0.64, + "step": 3267 + }, + { + "epoch": 0.11, + "learning_rate": 1.9377326122942498e-05, + "loss": 0.6227, + "step": 3268 + }, + { + "epoch": 0.11, + "learning_rate": 1.937694784151279e-05, + "loss": 0.6723, + "step": 3269 + }, + { + "epoch": 0.11, + "learning_rate": 1.9376569448907505e-05, + "loss": 0.5972, + "step": 3270 + }, + { + "epoch": 0.11, + "learning_rate": 1.9376190945131125e-05, + "loss": 0.6178, + "step": 3271 + }, + { + "epoch": 0.11, + "learning_rate": 1.937581233018814e-05, + "loss": 0.5915, + "step": 3272 + }, + { + "epoch": 0.11, + "learning_rate": 1.9375433604083042e-05, + "loss": 0.633, + "step": 3273 + }, + { + "epoch": 0.11, + "learning_rate": 1.9375054766820317e-05, + "loss": 0.6703, + "step": 3274 + }, + { + "epoch": 0.11, + "learning_rate": 1.9374675818404454e-05, + "loss": 0.5989, + "step": 3275 + }, + { + "epoch": 0.11, + "learning_rate": 1.937429675883996e-05, + "loss": 0.6374, + "step": 3276 + }, + { + "epoch": 0.11, + "learning_rate": 1.937391758813131e-05, + "loss": 0.6051, + "step": 3277 + }, + { + "epoch": 0.11, + "learning_rate": 1.937353830628301e-05, + "loss": 0.6732, + "step": 3278 + }, + { + "epoch": 0.11, + "learning_rate": 1.937315891329956e-05, + "loss": 0.5908, + "step": 3279 + }, + { + "epoch": 0.11, + "learning_rate": 1.9372779409185453e-05, + "loss": 0.6661, + "step": 3280 + }, + { + "epoch": 0.11, + "learning_rate": 1.9372399793945193e-05, + "loss": 0.6091, + "step": 3281 + }, + { + "epoch": 0.11, + "learning_rate": 1.937202006758327e-05, + "loss": 0.6655, + "step": 3282 + }, + { + "epoch": 0.11, + "learning_rate": 1.9371640230104197e-05, + "loss": 0.664, + "step": 3283 + }, + { + "epoch": 0.11, + "learning_rate": 1.9371260281512473e-05, + "loss": 0.6435, + "step": 3284 + }, + { + "epoch": 0.11, + "learning_rate": 1.9370880221812606e-05, + "loss": 0.6417, + "step": 3285 + }, + { + "epoch": 0.11, + "learning_rate": 1.9370500051009097e-05, + "loss": 0.6282, + "step": 3286 + }, + { + "epoch": 0.11, + "learning_rate": 1.937011976910646e-05, + "loss": 0.6341, + "step": 3287 + }, + { + "epoch": 0.11, + "learning_rate": 1.9369739376109197e-05, + "loss": 0.6755, + "step": 3288 + }, + { + "epoch": 0.11, + "learning_rate": 1.9369358872021818e-05, + "loss": 0.6856, + "step": 3289 + }, + { + "epoch": 0.11, + "learning_rate": 1.9368978256848843e-05, + "loss": 0.6295, + "step": 3290 + }, + { + "epoch": 0.11, + "learning_rate": 1.9368597530594775e-05, + "loss": 0.6399, + "step": 3291 + }, + { + "epoch": 0.11, + "learning_rate": 1.9368216693264133e-05, + "loss": 0.6023, + "step": 3292 + }, + { + "epoch": 0.11, + "learning_rate": 1.936783574486143e-05, + "loss": 0.669, + "step": 3293 + }, + { + "epoch": 0.11, + "learning_rate": 1.9367454685391188e-05, + "loss": 0.6061, + "step": 3294 + }, + { + "epoch": 0.11, + "learning_rate": 1.9367073514857917e-05, + "loss": 0.6133, + "step": 3295 + }, + { + "epoch": 0.11, + "learning_rate": 1.936669223326614e-05, + "loss": 0.6474, + "step": 3296 + }, + { + "epoch": 0.11, + "learning_rate": 1.936631084062038e-05, + "loss": 0.5922, + "step": 3297 + }, + { + "epoch": 0.11, + "learning_rate": 1.9365929336925156e-05, + "loss": 0.6521, + "step": 3298 + }, + { + "epoch": 0.11, + "learning_rate": 1.936554772218499e-05, + "loss": 0.6581, + "step": 3299 + }, + { + "epoch": 0.11, + "learning_rate": 1.9365165996404412e-05, + "loss": 0.6236, + "step": 3300 + }, + { + "epoch": 0.11, + "learning_rate": 1.936478415958794e-05, + "loss": 0.62, + "step": 3301 + }, + { + "epoch": 0.11, + "learning_rate": 1.9364402211740106e-05, + "loss": 0.638, + "step": 3302 + }, + { + "epoch": 0.11, + "learning_rate": 1.936402015286544e-05, + "loss": 0.6888, + "step": 3303 + }, + { + "epoch": 0.11, + "learning_rate": 1.9363637982968467e-05, + "loss": 0.6667, + "step": 3304 + }, + { + "epoch": 0.11, + "learning_rate": 1.936325570205372e-05, + "loss": 0.6613, + "step": 3305 + }, + { + "epoch": 0.11, + "learning_rate": 1.9362873310125735e-05, + "loss": 0.6506, + "step": 3306 + }, + { + "epoch": 0.11, + "learning_rate": 1.936249080718904e-05, + "loss": 0.7132, + "step": 3307 + }, + { + "epoch": 0.11, + "learning_rate": 1.9362108193248176e-05, + "loss": 0.6212, + "step": 3308 + }, + { + "epoch": 0.11, + "learning_rate": 1.9361725468307674e-05, + "loss": 0.6384, + "step": 3309 + }, + { + "epoch": 0.11, + "learning_rate": 1.9361342632372076e-05, + "loss": 0.6507, + "step": 3310 + }, + { + "epoch": 0.11, + "learning_rate": 1.9360959685445916e-05, + "loss": 0.6545, + "step": 3311 + }, + { + "epoch": 0.11, + "learning_rate": 1.936057662753374e-05, + "loss": 0.6433, + "step": 3312 + }, + { + "epoch": 0.11, + "learning_rate": 1.9360193458640086e-05, + "loss": 0.6219, + "step": 3313 + }, + { + "epoch": 0.11, + "learning_rate": 1.93598101787695e-05, + "loss": 0.6703, + "step": 3314 + }, + { + "epoch": 0.11, + "learning_rate": 1.9359426787926518e-05, + "loss": 0.6763, + "step": 3315 + }, + { + "epoch": 0.11, + "learning_rate": 1.9359043286115695e-05, + "loss": 0.6481, + "step": 3316 + }, + { + "epoch": 0.11, + "learning_rate": 1.9358659673341577e-05, + "loss": 0.682, + "step": 3317 + }, + { + "epoch": 0.11, + "learning_rate": 1.9358275949608707e-05, + "loss": 0.6546, + "step": 3318 + }, + { + "epoch": 0.11, + "learning_rate": 1.9357892114921637e-05, + "loss": 0.6033, + "step": 3319 + }, + { + "epoch": 0.12, + "learning_rate": 1.9357508169284922e-05, + "loss": 0.6829, + "step": 3320 + }, + { + "epoch": 0.12, + "learning_rate": 1.9357124112703104e-05, + "loss": 0.5963, + "step": 3321 + }, + { + "epoch": 0.12, + "learning_rate": 1.9356739945180746e-05, + "loss": 0.6401, + "step": 3322 + }, + { + "epoch": 0.12, + "learning_rate": 1.9356355666722405e-05, + "loss": 0.7062, + "step": 3323 + }, + { + "epoch": 0.12, + "learning_rate": 1.9355971277332624e-05, + "loss": 0.6604, + "step": 3324 + }, + { + "epoch": 0.12, + "learning_rate": 1.935558677701597e-05, + "loss": 0.6527, + "step": 3325 + }, + { + "epoch": 0.12, + "learning_rate": 1.9355202165777002e-05, + "loss": 0.6968, + "step": 3326 + }, + { + "epoch": 0.12, + "learning_rate": 1.9354817443620275e-05, + "loss": 0.6418, + "step": 3327 + }, + { + "epoch": 0.12, + "learning_rate": 1.9354432610550357e-05, + "loss": 0.5997, + "step": 3328 + }, + { + "epoch": 0.12, + "learning_rate": 1.9354047666571805e-05, + "loss": 0.6172, + "step": 3329 + }, + { + "epoch": 0.12, + "learning_rate": 1.9353662611689183e-05, + "loss": 0.634, + "step": 3330 + }, + { + "epoch": 0.12, + "learning_rate": 1.935327744590706e-05, + "loss": 0.6374, + "step": 3331 + }, + { + "epoch": 0.12, + "learning_rate": 1.935289216923e-05, + "loss": 0.6322, + "step": 3332 + }, + { + "epoch": 0.12, + "learning_rate": 1.9352506781662578e-05, + "loss": 0.6685, + "step": 3333 + }, + { + "epoch": 0.12, + "learning_rate": 1.935212128320935e-05, + "loss": 0.6815, + "step": 3334 + }, + { + "epoch": 0.12, + "learning_rate": 1.9351735673874895e-05, + "loss": 0.619, + "step": 3335 + }, + { + "epoch": 0.12, + "learning_rate": 1.9351349953663787e-05, + "loss": 0.6465, + "step": 3336 + }, + { + "epoch": 0.12, + "learning_rate": 1.9350964122580592e-05, + "loss": 0.6616, + "step": 3337 + }, + { + "epoch": 0.12, + "learning_rate": 1.9350578180629892e-05, + "loss": 0.6217, + "step": 3338 + }, + { + "epoch": 0.12, + "learning_rate": 1.9350192127816253e-05, + "loss": 0.6642, + "step": 3339 + }, + { + "epoch": 0.12, + "learning_rate": 1.9349805964144264e-05, + "loss": 0.6855, + "step": 3340 + }, + { + "epoch": 0.12, + "learning_rate": 1.9349419689618494e-05, + "loss": 0.6196, + "step": 3341 + }, + { + "epoch": 0.12, + "learning_rate": 1.934903330424353e-05, + "loss": 0.6437, + "step": 3342 + }, + { + "epoch": 0.12, + "learning_rate": 1.9348646808023948e-05, + "loss": 0.5858, + "step": 3343 + }, + { + "epoch": 0.12, + "learning_rate": 1.934826020096433e-05, + "loss": 0.6265, + "step": 3344 + }, + { + "epoch": 0.12, + "learning_rate": 1.9347873483069264e-05, + "loss": 0.6286, + "step": 3345 + }, + { + "epoch": 0.12, + "learning_rate": 1.9347486654343332e-05, + "loss": 0.6339, + "step": 3346 + }, + { + "epoch": 0.12, + "learning_rate": 1.934709971479112e-05, + "loss": 0.6554, + "step": 3347 + }, + { + "epoch": 0.12, + "learning_rate": 1.934671266441722e-05, + "loss": 0.6675, + "step": 3348 + }, + { + "epoch": 0.12, + "learning_rate": 1.9346325503226214e-05, + "loss": 0.6689, + "step": 3349 + }, + { + "epoch": 0.12, + "learning_rate": 1.93459382312227e-05, + "loss": 0.6458, + "step": 3350 + }, + { + "epoch": 0.12, + "learning_rate": 1.9345550848411263e-05, + "loss": 0.6135, + "step": 3351 + }, + { + "epoch": 0.12, + "learning_rate": 1.93451633547965e-05, + "loss": 0.6529, + "step": 3352 + }, + { + "epoch": 0.12, + "learning_rate": 1.9344775750383e-05, + "loss": 0.6056, + "step": 3353 + }, + { + "epoch": 0.12, + "learning_rate": 1.9344388035175365e-05, + "loss": 0.597, + "step": 3354 + }, + { + "epoch": 0.12, + "learning_rate": 1.9344000209178188e-05, + "loss": 0.6397, + "step": 3355 + }, + { + "epoch": 0.12, + "learning_rate": 1.9343612272396067e-05, + "loss": 0.6755, + "step": 3356 + }, + { + "epoch": 0.12, + "learning_rate": 1.9343224224833607e-05, + "loss": 0.6014, + "step": 3357 + }, + { + "epoch": 0.12, + "learning_rate": 1.9342836066495402e-05, + "loss": 0.7102, + "step": 3358 + }, + { + "epoch": 0.12, + "learning_rate": 1.934244779738606e-05, + "loss": 0.6745, + "step": 3359 + }, + { + "epoch": 0.12, + "learning_rate": 1.9342059417510177e-05, + "loss": 0.6311, + "step": 3360 + }, + { + "epoch": 0.12, + "learning_rate": 1.934167092687236e-05, + "loss": 0.6236, + "step": 3361 + }, + { + "epoch": 0.12, + "learning_rate": 1.9341282325477223e-05, + "loss": 0.632, + "step": 3362 + }, + { + "epoch": 0.12, + "learning_rate": 1.9340893613329365e-05, + "loss": 0.6323, + "step": 3363 + }, + { + "epoch": 0.12, + "learning_rate": 1.9340504790433396e-05, + "loss": 0.6377, + "step": 3364 + }, + { + "epoch": 0.12, + "learning_rate": 1.9340115856793927e-05, + "loss": 0.6846, + "step": 3365 + }, + { + "epoch": 0.12, + "learning_rate": 1.933972681241557e-05, + "loss": 0.6436, + "step": 3366 + }, + { + "epoch": 0.12, + "learning_rate": 1.9339337657302938e-05, + "loss": 0.6397, + "step": 3367 + }, + { + "epoch": 0.12, + "learning_rate": 1.933894839146064e-05, + "loss": 0.6935, + "step": 3368 + }, + { + "epoch": 0.12, + "learning_rate": 1.9338559014893298e-05, + "loss": 0.7015, + "step": 3369 + }, + { + "epoch": 0.12, + "learning_rate": 1.9338169527605523e-05, + "loss": 0.617, + "step": 3370 + }, + { + "epoch": 0.12, + "learning_rate": 1.9337779929601938e-05, + "loss": 0.6717, + "step": 3371 + }, + { + "epoch": 0.12, + "learning_rate": 1.9337390220887156e-05, + "loss": 0.6833, + "step": 3372 + }, + { + "epoch": 0.12, + "learning_rate": 1.9337000401465805e-05, + "loss": 0.6686, + "step": 3373 + }, + { + "epoch": 0.12, + "learning_rate": 1.9336610471342503e-05, + "loss": 0.6675, + "step": 3374 + }, + { + "epoch": 0.12, + "learning_rate": 1.933622043052187e-05, + "loss": 0.6235, + "step": 3375 + }, + { + "epoch": 0.12, + "learning_rate": 1.9335830279008534e-05, + "loss": 0.6326, + "step": 3376 + }, + { + "epoch": 0.12, + "learning_rate": 1.933544001680712e-05, + "loss": 0.6081, + "step": 3377 + }, + { + "epoch": 0.12, + "learning_rate": 1.933504964392226e-05, + "loss": 0.6052, + "step": 3378 + }, + { + "epoch": 0.12, + "learning_rate": 1.933465916035857e-05, + "loss": 0.5826, + "step": 3379 + }, + { + "epoch": 0.12, + "learning_rate": 1.9334268566120692e-05, + "loss": 0.6249, + "step": 3380 + }, + { + "epoch": 0.12, + "learning_rate": 1.9333877861213253e-05, + "loss": 0.6743, + "step": 3381 + }, + { + "epoch": 0.12, + "learning_rate": 1.933348704564088e-05, + "loss": 0.638, + "step": 3382 + }, + { + "epoch": 0.12, + "learning_rate": 1.9333096119408215e-05, + "loss": 0.6389, + "step": 3383 + }, + { + "epoch": 0.12, + "learning_rate": 1.933270508251989e-05, + "loss": 0.6544, + "step": 3384 + }, + { + "epoch": 0.12, + "learning_rate": 1.9332313934980538e-05, + "loss": 0.6731, + "step": 3385 + }, + { + "epoch": 0.12, + "learning_rate": 1.93319226767948e-05, + "loss": 0.6993, + "step": 3386 + }, + { + "epoch": 0.12, + "learning_rate": 1.9331531307967313e-05, + "loss": 0.6707, + "step": 3387 + }, + { + "epoch": 0.12, + "learning_rate": 1.9331139828502718e-05, + "loss": 0.6287, + "step": 3388 + }, + { + "epoch": 0.12, + "learning_rate": 1.9330748238405655e-05, + "loss": 0.6412, + "step": 3389 + }, + { + "epoch": 0.12, + "learning_rate": 1.933035653768077e-05, + "loss": 0.6444, + "step": 3390 + }, + { + "epoch": 0.12, + "learning_rate": 1.9329964726332705e-05, + "loss": 0.6195, + "step": 3391 + }, + { + "epoch": 0.12, + "learning_rate": 1.9329572804366104e-05, + "loss": 0.6171, + "step": 3392 + }, + { + "epoch": 0.12, + "learning_rate": 1.932918077178562e-05, + "loss": 0.5822, + "step": 3393 + }, + { + "epoch": 0.12, + "learning_rate": 1.932878862859589e-05, + "loss": 0.6316, + "step": 3394 + }, + { + "epoch": 0.12, + "learning_rate": 1.932839637480157e-05, + "loss": 0.6493, + "step": 3395 + }, + { + "epoch": 0.12, + "learning_rate": 1.9328004010407317e-05, + "loss": 0.6224, + "step": 3396 + }, + { + "epoch": 0.12, + "learning_rate": 1.9327611535417774e-05, + "loss": 0.6474, + "step": 3397 + }, + { + "epoch": 0.12, + "learning_rate": 1.9327218949837596e-05, + "loss": 0.6281, + "step": 3398 + }, + { + "epoch": 0.12, + "learning_rate": 1.9326826253671437e-05, + "loss": 0.6359, + "step": 3399 + }, + { + "epoch": 0.12, + "learning_rate": 1.9326433446923957e-05, + "loss": 0.6705, + "step": 3400 + }, + { + "epoch": 0.12, + "learning_rate": 1.932604052959981e-05, + "loss": 0.6422, + "step": 3401 + }, + { + "epoch": 0.12, + "learning_rate": 1.9325647501703654e-05, + "loss": 0.6011, + "step": 3402 + }, + { + "epoch": 0.12, + "learning_rate": 1.9325254363240146e-05, + "loss": 0.6095, + "step": 3403 + }, + { + "epoch": 0.12, + "learning_rate": 1.932486111421396e-05, + "loss": 0.5911, + "step": 3404 + }, + { + "epoch": 0.12, + "learning_rate": 1.932446775462974e-05, + "loss": 0.6536, + "step": 3405 + }, + { + "epoch": 0.12, + "learning_rate": 1.9324074284492162e-05, + "loss": 0.6033, + "step": 3406 + }, + { + "epoch": 0.12, + "learning_rate": 1.932368070380589e-05, + "loss": 0.586, + "step": 3407 + }, + { + "epoch": 0.12, + "learning_rate": 1.9323287012575593e-05, + "loss": 0.6715, + "step": 3408 + }, + { + "epoch": 0.12, + "learning_rate": 1.932289321080593e-05, + "loss": 0.652, + "step": 3409 + }, + { + "epoch": 0.12, + "learning_rate": 1.932249929850157e-05, + "loss": 0.6563, + "step": 3410 + }, + { + "epoch": 0.12, + "learning_rate": 1.9322105275667194e-05, + "loss": 0.6465, + "step": 3411 + }, + { + "epoch": 0.12, + "learning_rate": 1.9321711142307466e-05, + "loss": 0.668, + "step": 3412 + }, + { + "epoch": 0.12, + "learning_rate": 1.932131689842706e-05, + "loss": 0.6796, + "step": 3413 + }, + { + "epoch": 0.12, + "learning_rate": 1.932092254403065e-05, + "loss": 0.6049, + "step": 3414 + }, + { + "epoch": 0.12, + "learning_rate": 1.9320528079122915e-05, + "loss": 0.5967, + "step": 3415 + }, + { + "epoch": 0.12, + "learning_rate": 1.9320133503708527e-05, + "loss": 0.6737, + "step": 3416 + }, + { + "epoch": 0.12, + "learning_rate": 1.9319738817792165e-05, + "loss": 0.6311, + "step": 3417 + }, + { + "epoch": 0.12, + "learning_rate": 1.9319344021378512e-05, + "loss": 0.6811, + "step": 3418 + }, + { + "epoch": 0.12, + "learning_rate": 1.9318949114472247e-05, + "loss": 0.6369, + "step": 3419 + }, + { + "epoch": 0.12, + "learning_rate": 1.931855409707805e-05, + "loss": 0.6605, + "step": 3420 + }, + { + "epoch": 0.12, + "learning_rate": 1.9318158969200607e-05, + "loss": 0.6505, + "step": 3421 + }, + { + "epoch": 0.12, + "learning_rate": 1.93177637308446e-05, + "loss": 0.6729, + "step": 3422 + }, + { + "epoch": 0.12, + "learning_rate": 1.9317368382014717e-05, + "loss": 0.6551, + "step": 3423 + }, + { + "epoch": 0.12, + "learning_rate": 1.9316972922715648e-05, + "loss": 0.6233, + "step": 3424 + }, + { + "epoch": 0.12, + "learning_rate": 1.931657735295208e-05, + "loss": 0.6027, + "step": 3425 + }, + { + "epoch": 0.12, + "learning_rate": 1.93161816727287e-05, + "loss": 0.6027, + "step": 3426 + }, + { + "epoch": 0.12, + "learning_rate": 1.93157858820502e-05, + "loss": 0.6537, + "step": 3427 + }, + { + "epoch": 0.12, + "learning_rate": 1.9315389980921275e-05, + "loss": 0.6645, + "step": 3428 + }, + { + "epoch": 0.12, + "learning_rate": 1.9314993969346617e-05, + "loss": 0.6535, + "step": 3429 + }, + { + "epoch": 0.12, + "learning_rate": 1.931459784733092e-05, + "loss": 0.6463, + "step": 3430 + }, + { + "epoch": 0.12, + "learning_rate": 1.9314201614878887e-05, + "loss": 0.6478, + "step": 3431 + }, + { + "epoch": 0.12, + "learning_rate": 1.931380527199521e-05, + "loss": 0.6534, + "step": 3432 + }, + { + "epoch": 0.12, + "learning_rate": 1.931340881868459e-05, + "loss": 0.6188, + "step": 3433 + }, + { + "epoch": 0.12, + "learning_rate": 1.9313012254951726e-05, + "loss": 0.6882, + "step": 3434 + }, + { + "epoch": 0.12, + "learning_rate": 1.9312615580801317e-05, + "loss": 0.6225, + "step": 3435 + }, + { + "epoch": 0.12, + "learning_rate": 1.9312218796238073e-05, + "loss": 0.6897, + "step": 3436 + }, + { + "epoch": 0.12, + "learning_rate": 1.9311821901266696e-05, + "loss": 0.6053, + "step": 3437 + }, + { + "epoch": 0.12, + "learning_rate": 1.931142489589189e-05, + "loss": 0.5912, + "step": 3438 + }, + { + "epoch": 0.12, + "learning_rate": 1.9311027780118363e-05, + "loss": 0.668, + "step": 3439 + }, + { + "epoch": 0.12, + "learning_rate": 1.9310630553950823e-05, + "loss": 0.6329, + "step": 3440 + }, + { + "epoch": 0.12, + "learning_rate": 1.931023321739398e-05, + "loss": 0.6015, + "step": 3441 + }, + { + "epoch": 0.12, + "learning_rate": 1.9309835770452544e-05, + "loss": 0.6658, + "step": 3442 + }, + { + "epoch": 0.12, + "learning_rate": 1.9309438213131232e-05, + "loss": 0.5799, + "step": 3443 + }, + { + "epoch": 0.12, + "learning_rate": 1.9309040545434747e-05, + "loss": 0.6378, + "step": 3444 + }, + { + "epoch": 0.12, + "learning_rate": 1.9308642767367813e-05, + "loss": 0.672, + "step": 3445 + }, + { + "epoch": 0.12, + "learning_rate": 1.9308244878935145e-05, + "loss": 0.6353, + "step": 3446 + }, + { + "epoch": 0.12, + "learning_rate": 1.930784688014146e-05, + "loss": 0.6407, + "step": 3447 + }, + { + "epoch": 0.12, + "learning_rate": 1.930744877099147e-05, + "loss": 0.6239, + "step": 3448 + }, + { + "epoch": 0.12, + "learning_rate": 1.9307050551489904e-05, + "loss": 0.6383, + "step": 3449 + }, + { + "epoch": 0.12, + "learning_rate": 1.9306652221641483e-05, + "loss": 0.6459, + "step": 3450 + }, + { + "epoch": 0.12, + "learning_rate": 1.9306253781450923e-05, + "loss": 0.6462, + "step": 3451 + }, + { + "epoch": 0.12, + "learning_rate": 1.9305855230922955e-05, + "loss": 0.6353, + "step": 3452 + }, + { + "epoch": 0.12, + "learning_rate": 1.93054565700623e-05, + "loss": 0.6448, + "step": 3453 + }, + { + "epoch": 0.12, + "learning_rate": 1.9305057798873684e-05, + "loss": 0.6127, + "step": 3454 + }, + { + "epoch": 0.12, + "learning_rate": 1.930465891736184e-05, + "loss": 0.6316, + "step": 3455 + }, + { + "epoch": 0.12, + "learning_rate": 1.9304259925531494e-05, + "loss": 0.6279, + "step": 3456 + }, + { + "epoch": 0.12, + "learning_rate": 1.9303860823387373e-05, + "loss": 0.6389, + "step": 3457 + }, + { + "epoch": 0.12, + "learning_rate": 1.9303461610934215e-05, + "loss": 0.6613, + "step": 3458 + }, + { + "epoch": 0.12, + "learning_rate": 1.930306228817675e-05, + "loss": 0.6455, + "step": 3459 + }, + { + "epoch": 0.12, + "learning_rate": 1.9302662855119717e-05, + "loss": 0.6429, + "step": 3460 + }, + { + "epoch": 0.12, + "learning_rate": 1.9302263311767842e-05, + "loss": 0.6442, + "step": 3461 + }, + { + "epoch": 0.12, + "learning_rate": 1.930186365812587e-05, + "loss": 0.6459, + "step": 3462 + }, + { + "epoch": 0.12, + "learning_rate": 1.930146389419854e-05, + "loss": 0.6174, + "step": 3463 + }, + { + "epoch": 0.12, + "learning_rate": 1.9301064019990586e-05, + "loss": 0.6398, + "step": 3464 + }, + { + "epoch": 0.12, + "learning_rate": 1.930066403550675e-05, + "loss": 0.6347, + "step": 3465 + }, + { + "epoch": 0.12, + "learning_rate": 1.9300263940751784e-05, + "loss": 0.6361, + "step": 3466 + }, + { + "epoch": 0.12, + "learning_rate": 1.929986373573042e-05, + "loss": 0.6777, + "step": 3467 + }, + { + "epoch": 0.12, + "learning_rate": 1.9299463420447405e-05, + "loss": 0.6388, + "step": 3468 + }, + { + "epoch": 0.12, + "learning_rate": 1.929906299490749e-05, + "loss": 0.6093, + "step": 3469 + }, + { + "epoch": 0.12, + "learning_rate": 1.9298662459115417e-05, + "loss": 0.6863, + "step": 3470 + }, + { + "epoch": 0.12, + "learning_rate": 1.9298261813075943e-05, + "loss": 0.6607, + "step": 3471 + }, + { + "epoch": 0.12, + "learning_rate": 1.9297861056793807e-05, + "loss": 0.6256, + "step": 3472 + }, + { + "epoch": 0.12, + "learning_rate": 1.9297460190273768e-05, + "loss": 0.6855, + "step": 3473 + }, + { + "epoch": 0.12, + "learning_rate": 1.929705921352058e-05, + "loss": 0.6737, + "step": 3474 + }, + { + "epoch": 0.12, + "learning_rate": 1.929665812653899e-05, + "loss": 0.6624, + "step": 3475 + }, + { + "epoch": 0.12, + "learning_rate": 1.9296256929333758e-05, + "loss": 0.6209, + "step": 3476 + }, + { + "epoch": 0.12, + "learning_rate": 1.9295855621909645e-05, + "loss": 0.6104, + "step": 3477 + }, + { + "epoch": 0.12, + "learning_rate": 1.92954542042714e-05, + "loss": 0.6308, + "step": 3478 + }, + { + "epoch": 0.12, + "learning_rate": 1.9295052676423788e-05, + "loss": 0.6467, + "step": 3479 + }, + { + "epoch": 0.12, + "learning_rate": 1.9294651038371568e-05, + "loss": 0.617, + "step": 3480 + }, + { + "epoch": 0.12, + "learning_rate": 1.92942492901195e-05, + "loss": 0.645, + "step": 3481 + }, + { + "epoch": 0.12, + "learning_rate": 1.929384743167235e-05, + "loss": 0.6796, + "step": 3482 + }, + { + "epoch": 0.12, + "learning_rate": 1.9293445463034888e-05, + "loss": 0.6553, + "step": 3483 + }, + { + "epoch": 0.12, + "learning_rate": 1.929304338421187e-05, + "loss": 0.5978, + "step": 3484 + }, + { + "epoch": 0.12, + "learning_rate": 1.9292641195208065e-05, + "loss": 0.6432, + "step": 3485 + }, + { + "epoch": 0.12, + "learning_rate": 1.9292238896028242e-05, + "loss": 0.6035, + "step": 3486 + }, + { + "epoch": 0.12, + "learning_rate": 1.9291836486677175e-05, + "loss": 0.6622, + "step": 3487 + }, + { + "epoch": 0.12, + "learning_rate": 1.929143396715963e-05, + "loss": 0.6101, + "step": 3488 + }, + { + "epoch": 0.12, + "learning_rate": 1.9291031337480386e-05, + "loss": 0.6265, + "step": 3489 + }, + { + "epoch": 0.12, + "learning_rate": 1.929062859764421e-05, + "loss": 0.6967, + "step": 3490 + }, + { + "epoch": 0.12, + "learning_rate": 1.929022574765588e-05, + "loss": 0.6182, + "step": 3491 + }, + { + "epoch": 0.12, + "learning_rate": 1.9289822787520168e-05, + "loss": 0.6165, + "step": 3492 + }, + { + "epoch": 0.12, + "learning_rate": 1.928941971724186e-05, + "loss": 0.66, + "step": 3493 + }, + { + "epoch": 0.12, + "learning_rate": 1.9289016536825726e-05, + "loss": 0.5948, + "step": 3494 + }, + { + "epoch": 0.12, + "learning_rate": 1.928861324627655e-05, + "loss": 0.6492, + "step": 3495 + }, + { + "epoch": 0.12, + "learning_rate": 1.928820984559912e-05, + "loss": 0.6539, + "step": 3496 + }, + { + "epoch": 0.12, + "learning_rate": 1.9287806334798207e-05, + "loss": 0.7062, + "step": 3497 + }, + { + "epoch": 0.12, + "learning_rate": 1.9287402713878602e-05, + "loss": 0.6414, + "step": 3498 + }, + { + "epoch": 0.12, + "learning_rate": 1.928699898284509e-05, + "loss": 0.701, + "step": 3499 + }, + { + "epoch": 0.12, + "learning_rate": 1.9286595141702455e-05, + "loss": 0.6014, + "step": 3500 + }, + { + "epoch": 0.12, + "learning_rate": 1.928619119045549e-05, + "loss": 0.679, + "step": 3501 + }, + { + "epoch": 0.12, + "learning_rate": 1.928578712910898e-05, + "loss": 0.6202, + "step": 3502 + }, + { + "epoch": 0.12, + "learning_rate": 1.9285382957667716e-05, + "loss": 0.6077, + "step": 3503 + }, + { + "epoch": 0.12, + "learning_rate": 1.9284978676136494e-05, + "loss": 0.6577, + "step": 3504 + }, + { + "epoch": 0.12, + "learning_rate": 1.92845742845201e-05, + "loss": 0.6834, + "step": 3505 + }, + { + "epoch": 0.12, + "learning_rate": 1.9284169782823333e-05, + "loss": 0.5994, + "step": 3506 + }, + { + "epoch": 0.12, + "learning_rate": 1.928376517105099e-05, + "loss": 0.6636, + "step": 3507 + }, + { + "epoch": 0.12, + "learning_rate": 1.9283360449207867e-05, + "loss": 0.7007, + "step": 3508 + }, + { + "epoch": 0.12, + "learning_rate": 1.9282955617298766e-05, + "loss": 0.6246, + "step": 3509 + }, + { + "epoch": 0.12, + "learning_rate": 1.9282550675328477e-05, + "loss": 0.5976, + "step": 3510 + }, + { + "epoch": 0.12, + "learning_rate": 1.928214562330181e-05, + "loss": 0.6229, + "step": 3511 + }, + { + "epoch": 0.12, + "learning_rate": 1.9281740461223566e-05, + "loss": 0.5942, + "step": 3512 + }, + { + "epoch": 0.12, + "learning_rate": 1.9281335189098547e-05, + "loss": 0.6169, + "step": 3513 + }, + { + "epoch": 0.12, + "learning_rate": 1.9280929806931558e-05, + "loss": 0.6122, + "step": 3514 + }, + { + "epoch": 0.12, + "learning_rate": 1.9280524314727406e-05, + "loss": 0.6919, + "step": 3515 + }, + { + "epoch": 0.12, + "learning_rate": 1.9280118712490896e-05, + "loss": 0.6176, + "step": 3516 + }, + { + "epoch": 0.12, + "learning_rate": 1.9279713000226842e-05, + "loss": 0.6365, + "step": 3517 + }, + { + "epoch": 0.12, + "learning_rate": 1.9279307177940046e-05, + "loss": 0.6951, + "step": 3518 + }, + { + "epoch": 0.12, + "learning_rate": 1.9278901245635332e-05, + "loss": 0.674, + "step": 3519 + }, + { + "epoch": 0.12, + "learning_rate": 1.92784952033175e-05, + "loss": 0.6064, + "step": 3520 + }, + { + "epoch": 0.12, + "learning_rate": 1.9278089050991374e-05, + "loss": 0.7077, + "step": 3521 + }, + { + "epoch": 0.12, + "learning_rate": 1.9277682788661763e-05, + "loss": 0.6504, + "step": 3522 + }, + { + "epoch": 0.12, + "learning_rate": 1.927727641633349e-05, + "loss": 0.6712, + "step": 3523 + }, + { + "epoch": 0.12, + "learning_rate": 1.9276869934011366e-05, + "loss": 0.5404, + "step": 3524 + }, + { + "epoch": 0.12, + "learning_rate": 1.927646334170022e-05, + "loss": 0.659, + "step": 3525 + }, + { + "epoch": 0.12, + "learning_rate": 1.9276056639404856e-05, + "loss": 0.6261, + "step": 3526 + }, + { + "epoch": 0.12, + "learning_rate": 1.9275649827130115e-05, + "loss": 0.6584, + "step": 3527 + }, + { + "epoch": 0.12, + "learning_rate": 1.9275242904880804e-05, + "loss": 0.6334, + "step": 3528 + }, + { + "epoch": 0.12, + "learning_rate": 1.9274835872661758e-05, + "loss": 0.6577, + "step": 3529 + }, + { + "epoch": 0.12, + "learning_rate": 1.9274428730477805e-05, + "loss": 0.6606, + "step": 3530 + }, + { + "epoch": 0.12, + "learning_rate": 1.9274021478333762e-05, + "loss": 0.6789, + "step": 3531 + }, + { + "epoch": 0.12, + "learning_rate": 1.9273614116234465e-05, + "loss": 0.659, + "step": 3532 + }, + { + "epoch": 0.12, + "learning_rate": 1.9273206644184738e-05, + "loss": 0.6356, + "step": 3533 + }, + { + "epoch": 0.12, + "learning_rate": 1.9272799062189417e-05, + "loss": 0.6559, + "step": 3534 + }, + { + "epoch": 0.12, + "learning_rate": 1.9272391370253335e-05, + "loss": 0.591, + "step": 3535 + }, + { + "epoch": 0.12, + "learning_rate": 1.927198356838132e-05, + "loss": 0.6612, + "step": 3536 + }, + { + "epoch": 0.12, + "learning_rate": 1.9271575656578214e-05, + "loss": 0.6269, + "step": 3537 + }, + { + "epoch": 0.12, + "learning_rate": 1.9271167634848852e-05, + "loss": 0.6208, + "step": 3538 + }, + { + "epoch": 0.12, + "learning_rate": 1.9270759503198065e-05, + "loss": 0.6615, + "step": 3539 + }, + { + "epoch": 0.12, + "learning_rate": 1.92703512616307e-05, + "loss": 0.6508, + "step": 3540 + }, + { + "epoch": 0.12, + "learning_rate": 1.926994291015159e-05, + "loss": 0.622, + "step": 3541 + }, + { + "epoch": 0.12, + "learning_rate": 1.9269534448765583e-05, + "loss": 0.6332, + "step": 3542 + }, + { + "epoch": 0.12, + "learning_rate": 1.9269125877477517e-05, + "loss": 0.6467, + "step": 3543 + }, + { + "epoch": 0.12, + "learning_rate": 1.9268717196292242e-05, + "loss": 0.6294, + "step": 3544 + }, + { + "epoch": 0.12, + "learning_rate": 1.9268308405214594e-05, + "loss": 0.6296, + "step": 3545 + }, + { + "epoch": 0.12, + "learning_rate": 1.9267899504249433e-05, + "loss": 0.6464, + "step": 3546 + }, + { + "epoch": 0.12, + "learning_rate": 1.9267490493401592e-05, + "loss": 0.6748, + "step": 3547 + }, + { + "epoch": 0.12, + "learning_rate": 1.9267081372675932e-05, + "loss": 0.6313, + "step": 3548 + }, + { + "epoch": 0.12, + "learning_rate": 1.9266672142077295e-05, + "loss": 0.5971, + "step": 3549 + }, + { + "epoch": 0.12, + "learning_rate": 1.9266262801610543e-05, + "loss": 0.6157, + "step": 3550 + }, + { + "epoch": 0.12, + "learning_rate": 1.926585335128052e-05, + "loss": 0.6312, + "step": 3551 + }, + { + "epoch": 0.12, + "learning_rate": 1.9265443791092087e-05, + "loss": 0.6147, + "step": 3552 + }, + { + "epoch": 0.12, + "learning_rate": 1.9265034121050094e-05, + "loss": 0.6934, + "step": 3553 + }, + { + "epoch": 0.12, + "learning_rate": 1.9264624341159403e-05, + "loss": 0.6358, + "step": 3554 + }, + { + "epoch": 0.12, + "learning_rate": 1.926421445142487e-05, + "loss": 0.6143, + "step": 3555 + }, + { + "epoch": 0.12, + "learning_rate": 1.9263804451851356e-05, + "loss": 0.6727, + "step": 3556 + }, + { + "epoch": 0.12, + "learning_rate": 1.926339434244372e-05, + "loss": 0.621, + "step": 3557 + }, + { + "epoch": 0.12, + "learning_rate": 1.926298412320683e-05, + "loss": 0.6666, + "step": 3558 + }, + { + "epoch": 0.12, + "learning_rate": 1.926257379414554e-05, + "loss": 0.599, + "step": 3559 + }, + { + "epoch": 0.12, + "learning_rate": 1.9262163355264723e-05, + "loss": 0.6553, + "step": 3560 + }, + { + "epoch": 0.12, + "learning_rate": 1.9261752806569243e-05, + "loss": 0.6134, + "step": 3561 + }, + { + "epoch": 0.12, + "learning_rate": 1.9261342148063968e-05, + "loss": 0.6209, + "step": 3562 + }, + { + "epoch": 0.12, + "learning_rate": 1.9260931379753763e-05, + "loss": 0.6152, + "step": 3563 + }, + { + "epoch": 0.12, + "learning_rate": 1.9260520501643504e-05, + "loss": 0.6339, + "step": 3564 + }, + { + "epoch": 0.12, + "learning_rate": 1.926010951373806e-05, + "loss": 0.7084, + "step": 3565 + }, + { + "epoch": 0.12, + "learning_rate": 1.92596984160423e-05, + "loss": 0.6156, + "step": 3566 + }, + { + "epoch": 0.12, + "learning_rate": 1.9259287208561102e-05, + "loss": 0.6346, + "step": 3567 + }, + { + "epoch": 0.12, + "learning_rate": 1.9258875891299348e-05, + "loss": 0.6646, + "step": 3568 + }, + { + "epoch": 0.12, + "learning_rate": 1.9258464464261903e-05, + "loss": 0.5862, + "step": 3569 + }, + { + "epoch": 0.12, + "learning_rate": 1.925805292745365e-05, + "loss": 0.6484, + "step": 3570 + }, + { + "epoch": 0.12, + "learning_rate": 1.9257641280879468e-05, + "loss": 0.6522, + "step": 3571 + }, + { + "epoch": 0.12, + "learning_rate": 1.9257229524544236e-05, + "loss": 0.6649, + "step": 3572 + }, + { + "epoch": 0.12, + "learning_rate": 1.9256817658452837e-05, + "loss": 0.6234, + "step": 3573 + }, + { + "epoch": 0.12, + "learning_rate": 1.925640568261016e-05, + "loss": 0.6634, + "step": 3574 + }, + { + "epoch": 0.12, + "learning_rate": 1.9255993597021077e-05, + "loss": 0.627, + "step": 3575 + }, + { + "epoch": 0.12, + "learning_rate": 1.9255581401690488e-05, + "loss": 0.6454, + "step": 3576 + }, + { + "epoch": 0.12, + "learning_rate": 1.925516909662327e-05, + "loss": 0.7241, + "step": 3577 + }, + { + "epoch": 0.12, + "learning_rate": 1.9254756681824314e-05, + "loss": 0.6622, + "step": 3578 + }, + { + "epoch": 0.12, + "learning_rate": 1.925434415729851e-05, + "loss": 0.6459, + "step": 3579 + }, + { + "epoch": 0.12, + "learning_rate": 1.9253931523050753e-05, + "loss": 0.6871, + "step": 3580 + }, + { + "epoch": 0.12, + "learning_rate": 1.9253518779085926e-05, + "loss": 0.6547, + "step": 3581 + }, + { + "epoch": 0.12, + "learning_rate": 1.9253105925408934e-05, + "loss": 0.6655, + "step": 3582 + }, + { + "epoch": 0.12, + "learning_rate": 1.925269296202466e-05, + "loss": 0.6344, + "step": 3583 + }, + { + "epoch": 0.12, + "learning_rate": 1.9252279888938013e-05, + "loss": 0.6313, + "step": 3584 + }, + { + "epoch": 0.12, + "learning_rate": 1.925186670615388e-05, + "loss": 0.6583, + "step": 3585 + }, + { + "epoch": 0.12, + "learning_rate": 1.925145341367716e-05, + "loss": 0.681, + "step": 3586 + }, + { + "epoch": 0.12, + "learning_rate": 1.9251040011512762e-05, + "loss": 0.6666, + "step": 3587 + }, + { + "epoch": 0.12, + "learning_rate": 1.925062649966558e-05, + "loss": 0.6688, + "step": 3588 + }, + { + "epoch": 0.12, + "learning_rate": 1.925021287814052e-05, + "loss": 0.6795, + "step": 3589 + }, + { + "epoch": 0.12, + "learning_rate": 1.924979914694248e-05, + "loss": 0.617, + "step": 3590 + }, + { + "epoch": 0.12, + "learning_rate": 1.9249385306076377e-05, + "loss": 0.6466, + "step": 3591 + }, + { + "epoch": 0.12, + "learning_rate": 1.9248971355547103e-05, + "loss": 0.6773, + "step": 3592 + }, + { + "epoch": 0.12, + "learning_rate": 1.924855729535958e-05, + "loss": 0.67, + "step": 3593 + }, + { + "epoch": 0.12, + "learning_rate": 1.924814312551871e-05, + "loss": 0.6373, + "step": 3594 + }, + { + "epoch": 0.12, + "learning_rate": 1.92477288460294e-05, + "loss": 0.6707, + "step": 3595 + }, + { + "epoch": 0.12, + "learning_rate": 1.9247314456896568e-05, + "loss": 0.6144, + "step": 3596 + }, + { + "epoch": 0.12, + "learning_rate": 1.924689995812513e-05, + "loss": 0.6219, + "step": 3597 + }, + { + "epoch": 0.12, + "learning_rate": 1.924648534971999e-05, + "loss": 0.6173, + "step": 3598 + }, + { + "epoch": 0.12, + "learning_rate": 1.9246070631686072e-05, + "loss": 0.5784, + "step": 3599 + }, + { + "epoch": 0.12, + "learning_rate": 1.924565580402829e-05, + "loss": 0.561, + "step": 3600 + }, + { + "epoch": 0.12, + "learning_rate": 1.924524086675156e-05, + "loss": 0.5706, + "step": 3601 + }, + { + "epoch": 0.12, + "learning_rate": 1.9244825819860805e-05, + "loss": 0.6255, + "step": 3602 + }, + { + "epoch": 0.12, + "learning_rate": 1.924441066336095e-05, + "loss": 0.6934, + "step": 3603 + }, + { + "epoch": 0.12, + "learning_rate": 1.9243995397256908e-05, + "loss": 0.6467, + "step": 3604 + }, + { + "epoch": 0.12, + "learning_rate": 1.9243580021553606e-05, + "loss": 0.6096, + "step": 3605 + }, + { + "epoch": 0.12, + "learning_rate": 1.924316453625597e-05, + "loss": 0.6346, + "step": 3606 + }, + { + "epoch": 0.12, + "learning_rate": 1.9242748941368927e-05, + "loss": 0.639, + "step": 3607 + }, + { + "epoch": 0.13, + "learning_rate": 1.9242333236897406e-05, + "loss": 0.6182, + "step": 3608 + }, + { + "epoch": 0.13, + "learning_rate": 1.924191742284633e-05, + "loss": 0.6393, + "step": 3609 + }, + { + "epoch": 0.13, + "learning_rate": 1.924150149922063e-05, + "loss": 0.6537, + "step": 3610 + }, + { + "epoch": 0.13, + "learning_rate": 1.9241085466025242e-05, + "loss": 0.6607, + "step": 3611 + }, + { + "epoch": 0.13, + "learning_rate": 1.9240669323265092e-05, + "loss": 0.6256, + "step": 3612 + }, + { + "epoch": 0.13, + "learning_rate": 1.9240253070945122e-05, + "loss": 0.615, + "step": 3613 + }, + { + "epoch": 0.13, + "learning_rate": 1.9239836709070264e-05, + "loss": 0.646, + "step": 3614 + }, + { + "epoch": 0.13, + "learning_rate": 1.923942023764545e-05, + "loss": 0.5895, + "step": 3615 + }, + { + "epoch": 0.13, + "learning_rate": 1.9239003656675623e-05, + "loss": 0.5995, + "step": 3616 + }, + { + "epoch": 0.13, + "learning_rate": 1.9238586966165716e-05, + "loss": 0.6305, + "step": 3617 + }, + { + "epoch": 0.13, + "learning_rate": 1.9238170166120677e-05, + "loss": 0.6609, + "step": 3618 + }, + { + "epoch": 0.13, + "learning_rate": 1.9237753256545445e-05, + "loss": 0.6777, + "step": 3619 + }, + { + "epoch": 0.13, + "learning_rate": 1.923733623744496e-05, + "loss": 0.6328, + "step": 3620 + }, + { + "epoch": 0.13, + "learning_rate": 1.923691910882417e-05, + "loss": 0.6708, + "step": 3621 + }, + { + "epoch": 0.13, + "learning_rate": 1.923650187068802e-05, + "loss": 0.5624, + "step": 3622 + }, + { + "epoch": 0.13, + "learning_rate": 1.9236084523041456e-05, + "loss": 0.6226, + "step": 3623 + }, + { + "epoch": 0.13, + "learning_rate": 1.9235667065889425e-05, + "loss": 0.6176, + "step": 3624 + }, + { + "epoch": 0.13, + "learning_rate": 1.9235249499236878e-05, + "loss": 0.6382, + "step": 3625 + }, + { + "epoch": 0.13, + "learning_rate": 1.9234831823088768e-05, + "loss": 0.6266, + "step": 3626 + }, + { + "epoch": 0.13, + "learning_rate": 1.923441403745004e-05, + "loss": 0.5934, + "step": 3627 + }, + { + "epoch": 0.13, + "learning_rate": 1.9233996142325653e-05, + "loss": 0.6023, + "step": 3628 + }, + { + "epoch": 0.13, + "learning_rate": 1.9233578137720562e-05, + "loss": 0.6225, + "step": 3629 + }, + { + "epoch": 0.13, + "learning_rate": 1.9233160023639722e-05, + "loss": 0.6817, + "step": 3630 + }, + { + "epoch": 0.13, + "learning_rate": 1.923274180008809e-05, + "loss": 0.6336, + "step": 3631 + }, + { + "epoch": 0.13, + "learning_rate": 1.9232323467070625e-05, + "loss": 0.6227, + "step": 3632 + }, + { + "epoch": 0.13, + "learning_rate": 1.9231905024592285e-05, + "loss": 0.6769, + "step": 3633 + }, + { + "epoch": 0.13, + "learning_rate": 1.9231486472658034e-05, + "loss": 0.7383, + "step": 3634 + }, + { + "epoch": 0.13, + "learning_rate": 1.923106781127283e-05, + "loss": 0.6784, + "step": 3635 + }, + { + "epoch": 0.13, + "learning_rate": 1.923064904044164e-05, + "loss": 0.6241, + "step": 3636 + }, + { + "epoch": 0.13, + "learning_rate": 1.9230230160169434e-05, + "loss": 0.6516, + "step": 3637 + }, + { + "epoch": 0.13, + "learning_rate": 1.922981117046117e-05, + "loss": 0.6549, + "step": 3638 + }, + { + "epoch": 0.13, + "learning_rate": 1.9229392071321818e-05, + "loss": 0.6759, + "step": 3639 + }, + { + "epoch": 0.13, + "learning_rate": 1.9228972862756347e-05, + "loss": 0.5907, + "step": 3640 + }, + { + "epoch": 0.13, + "learning_rate": 1.922855354476973e-05, + "loss": 0.6055, + "step": 3641 + }, + { + "epoch": 0.13, + "learning_rate": 1.9228134117366938e-05, + "loss": 0.62, + "step": 3642 + }, + { + "epoch": 0.13, + "learning_rate": 1.922771458055294e-05, + "loss": 0.66, + "step": 3643 + }, + { + "epoch": 0.13, + "learning_rate": 1.922729493433271e-05, + "loss": 0.637, + "step": 3644 + }, + { + "epoch": 0.13, + "learning_rate": 1.922687517871123e-05, + "loss": 0.6915, + "step": 3645 + }, + { + "epoch": 0.13, + "learning_rate": 1.922645531369347e-05, + "loss": 0.6701, + "step": 3646 + }, + { + "epoch": 0.13, + "learning_rate": 1.922603533928441e-05, + "loss": 0.6512, + "step": 3647 + }, + { + "epoch": 0.13, + "learning_rate": 1.9225615255489035e-05, + "loss": 0.6439, + "step": 3648 + }, + { + "epoch": 0.13, + "learning_rate": 1.9225195062312317e-05, + "loss": 0.6646, + "step": 3649 + }, + { + "epoch": 0.13, + "learning_rate": 1.9224774759759245e-05, + "loss": 0.6171, + "step": 3650 + }, + { + "epoch": 0.13, + "learning_rate": 1.9224354347834794e-05, + "loss": 0.5985, + "step": 3651 + }, + { + "epoch": 0.13, + "learning_rate": 1.9223933826543956e-05, + "loss": 0.6831, + "step": 3652 + }, + { + "epoch": 0.13, + "learning_rate": 1.9223513195891713e-05, + "loss": 0.5749, + "step": 3653 + }, + { + "epoch": 0.13, + "learning_rate": 1.9223092455883056e-05, + "loss": 0.5947, + "step": 3654 + }, + { + "epoch": 0.13, + "learning_rate": 1.9222671606522965e-05, + "loss": 0.6524, + "step": 3655 + }, + { + "epoch": 0.13, + "learning_rate": 1.9222250647816443e-05, + "loss": 0.6512, + "step": 3656 + }, + { + "epoch": 0.13, + "learning_rate": 1.9221829579768467e-05, + "loss": 0.5757, + "step": 3657 + }, + { + "epoch": 0.13, + "learning_rate": 1.9221408402384042e-05, + "loss": 0.6958, + "step": 3658 + }, + { + "epoch": 0.13, + "learning_rate": 1.922098711566815e-05, + "loss": 0.591, + "step": 3659 + }, + { + "epoch": 0.13, + "learning_rate": 1.9220565719625793e-05, + "loss": 0.672, + "step": 3660 + }, + { + "epoch": 0.13, + "learning_rate": 1.922014421426196e-05, + "loss": 0.6865, + "step": 3661 + }, + { + "epoch": 0.13, + "learning_rate": 1.9219722599581662e-05, + "loss": 0.6643, + "step": 3662 + }, + { + "epoch": 0.13, + "learning_rate": 1.9219300875589885e-05, + "loss": 0.6537, + "step": 3663 + }, + { + "epoch": 0.13, + "learning_rate": 1.9218879042291636e-05, + "loss": 0.6543, + "step": 3664 + }, + { + "epoch": 0.13, + "learning_rate": 1.9218457099691913e-05, + "loss": 0.6541, + "step": 3665 + }, + { + "epoch": 0.13, + "learning_rate": 1.9218035047795718e-05, + "loss": 0.611, + "step": 3666 + }, + { + "epoch": 0.13, + "learning_rate": 1.9217612886608058e-05, + "loss": 0.65, + "step": 3667 + }, + { + "epoch": 0.13, + "learning_rate": 1.921719061613394e-05, + "loss": 0.6005, + "step": 3668 + }, + { + "epoch": 0.13, + "learning_rate": 1.9216768236378362e-05, + "loss": 0.6494, + "step": 3669 + }, + { + "epoch": 0.13, + "learning_rate": 1.921634574734634e-05, + "loss": 0.6575, + "step": 3670 + }, + { + "epoch": 0.13, + "learning_rate": 1.921592314904288e-05, + "loss": 0.5845, + "step": 3671 + }, + { + "epoch": 0.13, + "learning_rate": 1.9215500441472992e-05, + "loss": 0.6844, + "step": 3672 + }, + { + "epoch": 0.13, + "learning_rate": 1.9215077624641688e-05, + "loss": 0.7066, + "step": 3673 + }, + { + "epoch": 0.13, + "learning_rate": 1.9214654698553986e-05, + "loss": 0.6956, + "step": 3674 + }, + { + "epoch": 0.13, + "learning_rate": 1.9214231663214893e-05, + "loss": 0.641, + "step": 3675 + }, + { + "epoch": 0.13, + "learning_rate": 1.9213808518629428e-05, + "loss": 0.6717, + "step": 3676 + }, + { + "epoch": 0.13, + "learning_rate": 1.9213385264802605e-05, + "loss": 0.6116, + "step": 3677 + }, + { + "epoch": 0.13, + "learning_rate": 1.9212961901739448e-05, + "loss": 0.6594, + "step": 3678 + }, + { + "epoch": 0.13, + "learning_rate": 1.9212538429444972e-05, + "loss": 0.6755, + "step": 3679 + }, + { + "epoch": 0.13, + "learning_rate": 1.9212114847924202e-05, + "loss": 0.6518, + "step": 3680 + }, + { + "epoch": 0.13, + "learning_rate": 1.9211691157182152e-05, + "loss": 0.6125, + "step": 3681 + }, + { + "epoch": 0.13, + "learning_rate": 1.9211267357223853e-05, + "loss": 0.6842, + "step": 3682 + }, + { + "epoch": 0.13, + "learning_rate": 1.9210843448054327e-05, + "loss": 0.5969, + "step": 3683 + }, + { + "epoch": 0.13, + "learning_rate": 1.9210419429678598e-05, + "loss": 0.7185, + "step": 3684 + }, + { + "epoch": 0.13, + "learning_rate": 1.9209995302101697e-05, + "loss": 0.6229, + "step": 3685 + }, + { + "epoch": 0.13, + "learning_rate": 1.9209571065328653e-05, + "loss": 0.6258, + "step": 3686 + }, + { + "epoch": 0.13, + "learning_rate": 1.9209146719364494e-05, + "loss": 0.597, + "step": 3687 + }, + { + "epoch": 0.13, + "learning_rate": 1.9208722264214247e-05, + "loss": 0.6166, + "step": 3688 + }, + { + "epoch": 0.13, + "learning_rate": 1.920829769988295e-05, + "loss": 0.7169, + "step": 3689 + }, + { + "epoch": 0.13, + "learning_rate": 1.920787302637564e-05, + "loss": 0.6631, + "step": 3690 + }, + { + "epoch": 0.13, + "learning_rate": 1.920744824369734e-05, + "loss": 0.6677, + "step": 3691 + }, + { + "epoch": 0.13, + "learning_rate": 1.92070233518531e-05, + "loss": 0.5927, + "step": 3692 + }, + { + "epoch": 0.13, + "learning_rate": 1.9206598350847946e-05, + "loss": 0.6265, + "step": 3693 + }, + { + "epoch": 0.13, + "learning_rate": 1.9206173240686925e-05, + "loss": 0.6505, + "step": 3694 + }, + { + "epoch": 0.13, + "learning_rate": 1.9205748021375072e-05, + "loss": 0.6285, + "step": 3695 + }, + { + "epoch": 0.13, + "learning_rate": 1.9205322692917434e-05, + "loss": 0.6863, + "step": 3696 + }, + { + "epoch": 0.13, + "learning_rate": 1.920489725531905e-05, + "loss": 0.6177, + "step": 3697 + }, + { + "epoch": 0.13, + "learning_rate": 1.920447170858496e-05, + "loss": 0.6005, + "step": 3698 + }, + { + "epoch": 0.13, + "learning_rate": 1.920404605272022e-05, + "loss": 0.5945, + "step": 3699 + }, + { + "epoch": 0.13, + "learning_rate": 1.9203620287729867e-05, + "loss": 0.6326, + "step": 3700 + }, + { + "epoch": 0.13, + "learning_rate": 1.9203194413618958e-05, + "loss": 0.6354, + "step": 3701 + }, + { + "epoch": 0.13, + "learning_rate": 1.9202768430392532e-05, + "loss": 0.6226, + "step": 3702 + }, + { + "epoch": 0.13, + "learning_rate": 1.9202342338055646e-05, + "loss": 0.6588, + "step": 3703 + }, + { + "epoch": 0.13, + "learning_rate": 1.9201916136613353e-05, + "loss": 0.5926, + "step": 3704 + }, + { + "epoch": 0.13, + "learning_rate": 1.92014898260707e-05, + "loss": 0.613, + "step": 3705 + }, + { + "epoch": 0.13, + "learning_rate": 1.9201063406432748e-05, + "loss": 0.6444, + "step": 3706 + }, + { + "epoch": 0.13, + "learning_rate": 1.9200636877704548e-05, + "loss": 0.6631, + "step": 3707 + }, + { + "epoch": 0.13, + "learning_rate": 1.920021023989116e-05, + "loss": 0.6598, + "step": 3708 + }, + { + "epoch": 0.13, + "learning_rate": 1.919978349299764e-05, + "loss": 0.6985, + "step": 3709 + }, + { + "epoch": 0.13, + "learning_rate": 1.9199356637029052e-05, + "loss": 0.6473, + "step": 3710 + }, + { + "epoch": 0.13, + "learning_rate": 1.919892967199045e-05, + "loss": 0.6514, + "step": 3711 + }, + { + "epoch": 0.13, + "learning_rate": 1.91985025978869e-05, + "loss": 0.7051, + "step": 3712 + }, + { + "epoch": 0.13, + "learning_rate": 1.9198075414723472e-05, + "loss": 0.5915, + "step": 3713 + }, + { + "epoch": 0.13, + "learning_rate": 1.919764812250522e-05, + "loss": 0.6206, + "step": 3714 + }, + { + "epoch": 0.13, + "learning_rate": 1.9197220721237212e-05, + "loss": 0.6574, + "step": 3715 + }, + { + "epoch": 0.13, + "learning_rate": 1.919679321092452e-05, + "loss": 0.6789, + "step": 3716 + }, + { + "epoch": 0.13, + "learning_rate": 1.919636559157221e-05, + "loss": 0.6544, + "step": 3717 + }, + { + "epoch": 0.13, + "learning_rate": 1.9195937863185352e-05, + "loss": 0.6609, + "step": 3718 + }, + { + "epoch": 0.13, + "learning_rate": 1.9195510025769023e-05, + "loss": 0.6577, + "step": 3719 + }, + { + "epoch": 0.13, + "learning_rate": 1.9195082079328284e-05, + "loss": 0.666, + "step": 3720 + }, + { + "epoch": 0.13, + "learning_rate": 1.9194654023868215e-05, + "loss": 0.6149, + "step": 3721 + }, + { + "epoch": 0.13, + "learning_rate": 1.9194225859393897e-05, + "loss": 0.6568, + "step": 3722 + }, + { + "epoch": 0.13, + "learning_rate": 1.9193797585910394e-05, + "loss": 0.6317, + "step": 3723 + }, + { + "epoch": 0.13, + "learning_rate": 1.9193369203422792e-05, + "loss": 0.6275, + "step": 3724 + }, + { + "epoch": 0.13, + "learning_rate": 1.9192940711936173e-05, + "loss": 0.5831, + "step": 3725 + }, + { + "epoch": 0.13, + "learning_rate": 1.9192512111455606e-05, + "loss": 0.6363, + "step": 3726 + }, + { + "epoch": 0.13, + "learning_rate": 1.9192083401986186e-05, + "loss": 0.6325, + "step": 3727 + }, + { + "epoch": 0.13, + "learning_rate": 1.9191654583532987e-05, + "loss": 0.6149, + "step": 3728 + }, + { + "epoch": 0.13, + "learning_rate": 1.9191225656101094e-05, + "loss": 0.6465, + "step": 3729 + }, + { + "epoch": 0.13, + "learning_rate": 1.9190796619695594e-05, + "loss": 0.6257, + "step": 3730 + }, + { + "epoch": 0.13, + "learning_rate": 1.9190367474321572e-05, + "loss": 0.5962, + "step": 3731 + }, + { + "epoch": 0.13, + "learning_rate": 1.918993821998412e-05, + "loss": 0.5845, + "step": 3732 + }, + { + "epoch": 0.13, + "learning_rate": 1.9189508856688325e-05, + "loss": 0.6539, + "step": 3733 + }, + { + "epoch": 0.13, + "learning_rate": 1.9189079384439278e-05, + "loss": 0.6777, + "step": 3734 + }, + { + "epoch": 0.13, + "learning_rate": 1.918864980324207e-05, + "loss": 0.6349, + "step": 3735 + }, + { + "epoch": 0.13, + "learning_rate": 1.9188220113101794e-05, + "loss": 0.6206, + "step": 3736 + }, + { + "epoch": 0.13, + "learning_rate": 1.9187790314023546e-05, + "loss": 0.6574, + "step": 3737 + }, + { + "epoch": 0.13, + "learning_rate": 1.9187360406012422e-05, + "loss": 0.6468, + "step": 3738 + }, + { + "epoch": 0.13, + "learning_rate": 1.9186930389073518e-05, + "loss": 0.6193, + "step": 3739 + }, + { + "epoch": 0.13, + "learning_rate": 1.9186500263211934e-05, + "loss": 0.6254, + "step": 3740 + }, + { + "epoch": 0.13, + "learning_rate": 1.9186070028432765e-05, + "loss": 0.5945, + "step": 3741 + }, + { + "epoch": 0.13, + "learning_rate": 1.918563968474112e-05, + "loss": 0.6568, + "step": 3742 + }, + { + "epoch": 0.13, + "learning_rate": 1.9185209232142093e-05, + "loss": 0.6227, + "step": 3743 + }, + { + "epoch": 0.13, + "learning_rate": 1.9184778670640792e-05, + "loss": 0.6731, + "step": 3744 + }, + { + "epoch": 0.13, + "learning_rate": 1.9184348000242322e-05, + "loss": 0.6525, + "step": 3745 + }, + { + "epoch": 0.13, + "learning_rate": 1.9183917220951788e-05, + "loss": 0.7041, + "step": 3746 + }, + { + "epoch": 0.13, + "learning_rate": 1.9183486332774297e-05, + "loss": 0.656, + "step": 3747 + }, + { + "epoch": 0.13, + "learning_rate": 1.918305533571496e-05, + "loss": 0.6159, + "step": 3748 + }, + { + "epoch": 0.13, + "learning_rate": 1.918262422977888e-05, + "loss": 0.6323, + "step": 3749 + }, + { + "epoch": 0.13, + "learning_rate": 1.9182193014971177e-05, + "loss": 0.6577, + "step": 3750 + }, + { + "epoch": 0.13, + "learning_rate": 1.918176169129696e-05, + "loss": 0.6238, + "step": 3751 + }, + { + "epoch": 0.13, + "learning_rate": 1.918133025876135e-05, + "loss": 0.6313, + "step": 3752 + }, + { + "epoch": 0.13, + "learning_rate": 1.9180898717369448e-05, + "loss": 0.6812, + "step": 3753 + }, + { + "epoch": 0.13, + "learning_rate": 1.918046706712638e-05, + "loss": 0.6005, + "step": 3754 + }, + { + "epoch": 0.13, + "learning_rate": 1.918003530803726e-05, + "loss": 0.6429, + "step": 3755 + }, + { + "epoch": 0.13, + "learning_rate": 1.917960344010721e-05, + "loss": 0.6391, + "step": 3756 + }, + { + "epoch": 0.13, + "learning_rate": 1.9179171463341345e-05, + "loss": 0.6729, + "step": 3757 + }, + { + "epoch": 0.13, + "learning_rate": 1.9178739377744792e-05, + "loss": 0.6574, + "step": 3758 + }, + { + "epoch": 0.13, + "learning_rate": 1.9178307183322675e-05, + "loss": 0.6385, + "step": 3759 + }, + { + "epoch": 0.13, + "learning_rate": 1.9177874880080118e-05, + "loss": 0.594, + "step": 3760 + }, + { + "epoch": 0.13, + "learning_rate": 1.917744246802224e-05, + "loss": 0.5916, + "step": 3761 + }, + { + "epoch": 0.13, + "learning_rate": 1.9177009947154174e-05, + "loss": 0.6113, + "step": 3762 + }, + { + "epoch": 0.13, + "learning_rate": 1.9176577317481043e-05, + "loss": 0.7035, + "step": 3763 + }, + { + "epoch": 0.13, + "learning_rate": 1.9176144579007983e-05, + "loss": 0.6481, + "step": 3764 + }, + { + "epoch": 0.13, + "learning_rate": 1.917571173174012e-05, + "loss": 0.6794, + "step": 3765 + }, + { + "epoch": 0.13, + "learning_rate": 1.9175278775682587e-05, + "loss": 0.6077, + "step": 3766 + }, + { + "epoch": 0.13, + "learning_rate": 1.9174845710840517e-05, + "loss": 0.6436, + "step": 3767 + }, + { + "epoch": 0.13, + "learning_rate": 1.9174412537219046e-05, + "loss": 0.5757, + "step": 3768 + }, + { + "epoch": 0.13, + "learning_rate": 1.917397925482331e-05, + "loss": 0.6204, + "step": 3769 + }, + { + "epoch": 0.13, + "learning_rate": 1.917354586365844e-05, + "loss": 0.6332, + "step": 3770 + }, + { + "epoch": 0.13, + "learning_rate": 1.9173112363729585e-05, + "loss": 0.6573, + "step": 3771 + }, + { + "epoch": 0.13, + "learning_rate": 1.9172678755041873e-05, + "loss": 0.689, + "step": 3772 + }, + { + "epoch": 0.13, + "learning_rate": 1.9172245037600456e-05, + "loss": 0.6012, + "step": 3773 + }, + { + "epoch": 0.13, + "learning_rate": 1.9171811211410467e-05, + "loss": 0.6595, + "step": 3774 + }, + { + "epoch": 0.13, + "learning_rate": 1.9171377276477058e-05, + "loss": 0.7174, + "step": 3775 + }, + { + "epoch": 0.13, + "learning_rate": 1.9170943232805366e-05, + "loss": 0.6624, + "step": 3776 + }, + { + "epoch": 0.13, + "learning_rate": 1.917050908040054e-05, + "loss": 0.6229, + "step": 3777 + }, + { + "epoch": 0.13, + "learning_rate": 1.9170074819267733e-05, + "loss": 0.5394, + "step": 3778 + }, + { + "epoch": 0.13, + "learning_rate": 1.9169640449412083e-05, + "loss": 0.6392, + "step": 3779 + }, + { + "epoch": 0.13, + "learning_rate": 1.916920597083875e-05, + "loss": 0.6307, + "step": 3780 + }, + { + "epoch": 0.13, + "learning_rate": 1.916877138355288e-05, + "loss": 0.6088, + "step": 3781 + }, + { + "epoch": 0.13, + "learning_rate": 1.9168336687559624e-05, + "loss": 0.6509, + "step": 3782 + }, + { + "epoch": 0.13, + "learning_rate": 1.916790188286414e-05, + "loss": 0.6344, + "step": 3783 + }, + { + "epoch": 0.13, + "learning_rate": 1.9167466969471583e-05, + "loss": 0.6266, + "step": 3784 + }, + { + "epoch": 0.13, + "learning_rate": 1.916703194738711e-05, + "loss": 0.62, + "step": 3785 + }, + { + "epoch": 0.13, + "learning_rate": 1.9166596816615875e-05, + "loss": 0.6925, + "step": 3786 + }, + { + "epoch": 0.13, + "learning_rate": 1.9166161577163035e-05, + "loss": 0.6077, + "step": 3787 + }, + { + "epoch": 0.13, + "learning_rate": 1.916572622903376e-05, + "loss": 0.6358, + "step": 3788 + }, + { + "epoch": 0.13, + "learning_rate": 1.9165290772233206e-05, + "loss": 0.6389, + "step": 3789 + }, + { + "epoch": 0.13, + "learning_rate": 1.916485520676653e-05, + "loss": 0.6659, + "step": 3790 + }, + { + "epoch": 0.13, + "learning_rate": 1.9164419532638906e-05, + "loss": 0.6682, + "step": 3791 + }, + { + "epoch": 0.13, + "learning_rate": 1.9163983749855495e-05, + "loss": 0.6526, + "step": 3792 + }, + { + "epoch": 0.13, + "learning_rate": 1.9163547858421463e-05, + "loss": 0.5878, + "step": 3793 + }, + { + "epoch": 0.13, + "learning_rate": 1.9163111858341982e-05, + "loss": 0.6109, + "step": 3794 + }, + { + "epoch": 0.13, + "learning_rate": 1.9162675749622214e-05, + "loss": 0.6518, + "step": 3795 + }, + { + "epoch": 0.13, + "learning_rate": 1.9162239532267336e-05, + "loss": 0.6496, + "step": 3796 + }, + { + "epoch": 0.13, + "learning_rate": 1.916180320628252e-05, + "loss": 0.6427, + "step": 3797 + }, + { + "epoch": 0.13, + "learning_rate": 1.9161366771672937e-05, + "loss": 0.5929, + "step": 3798 + }, + { + "epoch": 0.13, + "learning_rate": 1.916093022844376e-05, + "loss": 0.6421, + "step": 3799 + }, + { + "epoch": 0.13, + "learning_rate": 1.9160493576600167e-05, + "loss": 0.6179, + "step": 3800 + }, + { + "epoch": 0.13, + "learning_rate": 1.9160056816147334e-05, + "loss": 0.5858, + "step": 3801 + }, + { + "epoch": 0.13, + "learning_rate": 1.9159619947090443e-05, + "loss": 0.6815, + "step": 3802 + }, + { + "epoch": 0.13, + "learning_rate": 1.915918296943467e-05, + "loss": 0.6215, + "step": 3803 + }, + { + "epoch": 0.13, + "learning_rate": 1.915874588318519e-05, + "loss": 0.6062, + "step": 3804 + }, + { + "epoch": 0.13, + "learning_rate": 1.91583086883472e-05, + "loss": 0.6598, + "step": 3805 + }, + { + "epoch": 0.13, + "learning_rate": 1.9157871384925872e-05, + "loss": 0.6362, + "step": 3806 + }, + { + "epoch": 0.13, + "learning_rate": 1.9157433972926395e-05, + "loss": 0.6623, + "step": 3807 + }, + { + "epoch": 0.13, + "learning_rate": 1.915699645235395e-05, + "loss": 0.6719, + "step": 3808 + }, + { + "epoch": 0.13, + "learning_rate": 1.915655882321373e-05, + "loss": 0.5919, + "step": 3809 + }, + { + "epoch": 0.13, + "learning_rate": 1.9156121085510922e-05, + "loss": 0.6205, + "step": 3810 + }, + { + "epoch": 0.13, + "learning_rate": 1.915568323925072e-05, + "loss": 0.5998, + "step": 3811 + }, + { + "epoch": 0.13, + "learning_rate": 1.9155245284438308e-05, + "loss": 0.6651, + "step": 3812 + }, + { + "epoch": 0.13, + "learning_rate": 1.9154807221078883e-05, + "loss": 0.6624, + "step": 3813 + }, + { + "epoch": 0.13, + "learning_rate": 1.9154369049177634e-05, + "loss": 0.6807, + "step": 3814 + }, + { + "epoch": 0.13, + "learning_rate": 1.9153930768739762e-05, + "loss": 0.6779, + "step": 3815 + }, + { + "epoch": 0.13, + "learning_rate": 1.915349237977046e-05, + "loss": 0.6564, + "step": 3816 + }, + { + "epoch": 0.13, + "learning_rate": 1.915305388227493e-05, + "loss": 0.6271, + "step": 3817 + }, + { + "epoch": 0.13, + "learning_rate": 1.9152615276258364e-05, + "loss": 0.6339, + "step": 3818 + }, + { + "epoch": 0.13, + "learning_rate": 1.9152176561725966e-05, + "loss": 0.5899, + "step": 3819 + }, + { + "epoch": 0.13, + "learning_rate": 1.915173773868294e-05, + "loss": 0.6577, + "step": 3820 + }, + { + "epoch": 0.13, + "learning_rate": 1.9151298807134485e-05, + "loss": 0.6209, + "step": 3821 + }, + { + "epoch": 0.13, + "learning_rate": 1.9150859767085805e-05, + "loss": 0.6298, + "step": 3822 + }, + { + "epoch": 0.13, + "learning_rate": 1.9150420618542103e-05, + "loss": 0.6075, + "step": 3823 + }, + { + "epoch": 0.13, + "learning_rate": 1.91499813615086e-05, + "loss": 0.6377, + "step": 3824 + }, + { + "epoch": 0.13, + "learning_rate": 1.9149541995990483e-05, + "loss": 0.6406, + "step": 3825 + }, + { + "epoch": 0.13, + "learning_rate": 1.9149102521992976e-05, + "loss": 0.6463, + "step": 3826 + }, + { + "epoch": 0.13, + "learning_rate": 1.9148662939521282e-05, + "loss": 0.6505, + "step": 3827 + }, + { + "epoch": 0.13, + "learning_rate": 1.914822324858062e-05, + "loss": 0.6287, + "step": 3828 + }, + { + "epoch": 0.13, + "learning_rate": 1.9147783449176195e-05, + "loss": 0.6351, + "step": 3829 + }, + { + "epoch": 0.13, + "learning_rate": 1.9147343541313227e-05, + "loss": 0.6339, + "step": 3830 + }, + { + "epoch": 0.13, + "learning_rate": 1.914690352499693e-05, + "loss": 0.6259, + "step": 3831 + }, + { + "epoch": 0.13, + "learning_rate": 1.9146463400232516e-05, + "loss": 0.6544, + "step": 3832 + }, + { + "epoch": 0.13, + "learning_rate": 1.9146023167025216e-05, + "loss": 0.6233, + "step": 3833 + }, + { + "epoch": 0.13, + "learning_rate": 1.9145582825380236e-05, + "loss": 0.6616, + "step": 3834 + }, + { + "epoch": 0.13, + "learning_rate": 1.9145142375302805e-05, + "loss": 0.6211, + "step": 3835 + }, + { + "epoch": 0.13, + "learning_rate": 1.9144701816798143e-05, + "loss": 0.6586, + "step": 3836 + }, + { + "epoch": 0.13, + "learning_rate": 1.914426114987147e-05, + "loss": 0.6269, + "step": 3837 + }, + { + "epoch": 0.13, + "learning_rate": 1.9143820374528017e-05, + "loss": 0.6643, + "step": 3838 + }, + { + "epoch": 0.13, + "learning_rate": 1.9143379490773003e-05, + "loss": 0.5995, + "step": 3839 + }, + { + "epoch": 0.13, + "learning_rate": 1.914293849861166e-05, + "loss": 0.6285, + "step": 3840 + }, + { + "epoch": 0.13, + "learning_rate": 1.9142497398049215e-05, + "loss": 0.5983, + "step": 3841 + }, + { + "epoch": 0.13, + "learning_rate": 1.9142056189090897e-05, + "loss": 0.5782, + "step": 3842 + }, + { + "epoch": 0.13, + "learning_rate": 1.9141614871741943e-05, + "loss": 0.6357, + "step": 3843 + }, + { + "epoch": 0.13, + "learning_rate": 1.9141173446007575e-05, + "loss": 0.5978, + "step": 3844 + }, + { + "epoch": 0.13, + "learning_rate": 1.9140731911893034e-05, + "loss": 0.6542, + "step": 3845 + }, + { + "epoch": 0.13, + "learning_rate": 1.9140290269403555e-05, + "loss": 0.6591, + "step": 3846 + }, + { + "epoch": 0.13, + "learning_rate": 1.9139848518544372e-05, + "loss": 0.6603, + "step": 3847 + }, + { + "epoch": 0.13, + "learning_rate": 1.913940665932072e-05, + "loss": 0.6546, + "step": 3848 + }, + { + "epoch": 0.13, + "learning_rate": 1.913896469173784e-05, + "loss": 0.6439, + "step": 3849 + }, + { + "epoch": 0.13, + "learning_rate": 1.9138522615800976e-05, + "loss": 0.6116, + "step": 3850 + }, + { + "epoch": 0.13, + "learning_rate": 1.9138080431515366e-05, + "loss": 0.6876, + "step": 3851 + }, + { + "epoch": 0.13, + "learning_rate": 1.9137638138886253e-05, + "loss": 0.5811, + "step": 3852 + }, + { + "epoch": 0.13, + "learning_rate": 1.9137195737918878e-05, + "loss": 0.707, + "step": 3853 + }, + { + "epoch": 0.13, + "learning_rate": 1.913675322861849e-05, + "loss": 0.6908, + "step": 3854 + }, + { + "epoch": 0.13, + "learning_rate": 1.9136310610990336e-05, + "loss": 0.6895, + "step": 3855 + }, + { + "epoch": 0.13, + "learning_rate": 1.9135867885039662e-05, + "loss": 0.5792, + "step": 3856 + }, + { + "epoch": 0.13, + "learning_rate": 1.9135425050771715e-05, + "loss": 0.5842, + "step": 3857 + }, + { + "epoch": 0.13, + "learning_rate": 1.913498210819175e-05, + "loss": 0.627, + "step": 3858 + }, + { + "epoch": 0.13, + "learning_rate": 1.9134539057305016e-05, + "loss": 0.6787, + "step": 3859 + }, + { + "epoch": 0.13, + "learning_rate": 1.9134095898116766e-05, + "loss": 0.5951, + "step": 3860 + }, + { + "epoch": 0.13, + "learning_rate": 1.9133652630632253e-05, + "loss": 0.676, + "step": 3861 + }, + { + "epoch": 0.13, + "learning_rate": 1.9133209254856733e-05, + "loss": 0.6486, + "step": 3862 + }, + { + "epoch": 0.13, + "learning_rate": 1.9132765770795467e-05, + "loss": 0.651, + "step": 3863 + }, + { + "epoch": 0.13, + "learning_rate": 1.9132322178453708e-05, + "loss": 0.6353, + "step": 3864 + }, + { + "epoch": 0.13, + "learning_rate": 1.9131878477836716e-05, + "loss": 0.5975, + "step": 3865 + }, + { + "epoch": 0.13, + "learning_rate": 1.9131434668949756e-05, + "loss": 0.6854, + "step": 3866 + }, + { + "epoch": 0.13, + "learning_rate": 1.9130990751798085e-05, + "loss": 0.6725, + "step": 3867 + }, + { + "epoch": 0.13, + "learning_rate": 1.9130546726386967e-05, + "loss": 0.6279, + "step": 3868 + }, + { + "epoch": 0.13, + "learning_rate": 1.913010259272167e-05, + "loss": 0.6576, + "step": 3869 + }, + { + "epoch": 0.13, + "learning_rate": 1.9129658350807453e-05, + "loss": 0.6419, + "step": 3870 + }, + { + "epoch": 0.13, + "learning_rate": 1.912921400064959e-05, + "loss": 0.5909, + "step": 3871 + }, + { + "epoch": 0.13, + "learning_rate": 1.9128769542253346e-05, + "loss": 0.6865, + "step": 3872 + }, + { + "epoch": 0.13, + "learning_rate": 1.9128324975623994e-05, + "loss": 0.6023, + "step": 3873 + }, + { + "epoch": 0.13, + "learning_rate": 1.9127880300766796e-05, + "loss": 0.6546, + "step": 3874 + }, + { + "epoch": 0.13, + "learning_rate": 1.9127435517687034e-05, + "loss": 0.6876, + "step": 3875 + }, + { + "epoch": 0.13, + "learning_rate": 1.9126990626389976e-05, + "loss": 0.6535, + "step": 3876 + }, + { + "epoch": 0.13, + "learning_rate": 1.91265456268809e-05, + "loss": 0.698, + "step": 3877 + }, + { + "epoch": 0.13, + "learning_rate": 1.912610051916508e-05, + "loss": 0.6202, + "step": 3878 + }, + { + "epoch": 0.13, + "learning_rate": 1.9125655303247793e-05, + "loss": 0.6237, + "step": 3879 + }, + { + "epoch": 0.13, + "learning_rate": 1.9125209979134318e-05, + "loss": 0.6398, + "step": 3880 + }, + { + "epoch": 0.13, + "learning_rate": 1.9124764546829937e-05, + "loss": 0.604, + "step": 3881 + }, + { + "epoch": 0.13, + "learning_rate": 1.912431900633993e-05, + "loss": 0.6902, + "step": 3882 + }, + { + "epoch": 0.13, + "learning_rate": 1.9123873357669577e-05, + "loss": 0.5979, + "step": 3883 + }, + { + "epoch": 0.13, + "learning_rate": 1.9123427600824164e-05, + "loss": 0.5798, + "step": 3884 + }, + { + "epoch": 0.13, + "learning_rate": 1.9122981735808977e-05, + "loss": 0.6988, + "step": 3885 + }, + { + "epoch": 0.13, + "learning_rate": 1.9122535762629297e-05, + "loss": 0.6156, + "step": 3886 + }, + { + "epoch": 0.13, + "learning_rate": 1.912208968129042e-05, + "loss": 0.6435, + "step": 3887 + }, + { + "epoch": 0.13, + "learning_rate": 1.9121643491797627e-05, + "loss": 0.6971, + "step": 3888 + }, + { + "epoch": 0.13, + "learning_rate": 1.9121197194156212e-05, + "loss": 0.6296, + "step": 3889 + }, + { + "epoch": 0.13, + "learning_rate": 1.912075078837147e-05, + "loss": 0.6518, + "step": 3890 + }, + { + "epoch": 0.13, + "learning_rate": 1.9120304274448685e-05, + "loss": 0.6229, + "step": 3891 + }, + { + "epoch": 0.13, + "learning_rate": 1.9119857652393157e-05, + "loss": 0.6008, + "step": 3892 + }, + { + "epoch": 0.13, + "learning_rate": 1.9119410922210177e-05, + "loss": 0.6446, + "step": 3893 + }, + { + "epoch": 0.13, + "learning_rate": 1.911896408390505e-05, + "loss": 0.5959, + "step": 3894 + }, + { + "epoch": 0.13, + "learning_rate": 1.9118517137483063e-05, + "loss": 0.6638, + "step": 3895 + }, + { + "epoch": 0.13, + "learning_rate": 1.9118070082949524e-05, + "loss": 0.6597, + "step": 3896 + }, + { + "epoch": 0.14, + "learning_rate": 1.911762292030973e-05, + "loss": 0.5972, + "step": 3897 + }, + { + "epoch": 0.14, + "learning_rate": 1.911717564956898e-05, + "loss": 0.6057, + "step": 3898 + }, + { + "epoch": 0.14, + "learning_rate": 1.911672827073258e-05, + "loss": 0.6261, + "step": 3899 + }, + { + "epoch": 0.14, + "learning_rate": 1.9116280783805835e-05, + "loss": 0.6355, + "step": 3900 + }, + { + "epoch": 0.14, + "learning_rate": 1.9115833188794046e-05, + "loss": 0.6133, + "step": 3901 + }, + { + "epoch": 0.14, + "learning_rate": 1.9115385485702528e-05, + "loss": 0.7078, + "step": 3902 + }, + { + "epoch": 0.14, + "learning_rate": 1.9114937674536578e-05, + "loss": 0.6106, + "step": 3903 + }, + { + "epoch": 0.14, + "learning_rate": 1.9114489755301517e-05, + "loss": 0.6625, + "step": 3904 + }, + { + "epoch": 0.14, + "learning_rate": 1.9114041728002645e-05, + "loss": 0.6528, + "step": 3905 + }, + { + "epoch": 0.14, + "learning_rate": 1.911359359264528e-05, + "loss": 0.6805, + "step": 3906 + }, + { + "epoch": 0.14, + "learning_rate": 1.911314534923474e-05, + "loss": 0.6697, + "step": 3907 + }, + { + "epoch": 0.14, + "learning_rate": 1.9112696997776328e-05, + "loss": 0.6653, + "step": 3908 + }, + { + "epoch": 0.14, + "learning_rate": 1.9112248538275365e-05, + "loss": 0.6068, + "step": 3909 + }, + { + "epoch": 0.14, + "learning_rate": 1.9111799970737172e-05, + "loss": 0.6357, + "step": 3910 + }, + { + "epoch": 0.14, + "learning_rate": 1.9111351295167063e-05, + "loss": 0.6725, + "step": 3911 + }, + { + "epoch": 0.14, + "learning_rate": 1.911090251157036e-05, + "loss": 0.6202, + "step": 3912 + }, + { + "epoch": 0.14, + "learning_rate": 1.9110453619952377e-05, + "loss": 0.695, + "step": 3913 + }, + { + "epoch": 0.14, + "learning_rate": 1.9110004620318446e-05, + "loss": 0.6066, + "step": 3914 + }, + { + "epoch": 0.14, + "learning_rate": 1.9109555512673882e-05, + "loss": 0.6183, + "step": 3915 + }, + { + "epoch": 0.14, + "learning_rate": 1.910910629702402e-05, + "loss": 0.6301, + "step": 3916 + }, + { + "epoch": 0.14, + "learning_rate": 1.9108656973374174e-05, + "loss": 0.663, + "step": 3917 + }, + { + "epoch": 0.14, + "learning_rate": 1.910820754172968e-05, + "loss": 0.5878, + "step": 3918 + }, + { + "epoch": 0.14, + "learning_rate": 1.9107758002095863e-05, + "loss": 0.6255, + "step": 3919 + }, + { + "epoch": 0.14, + "learning_rate": 1.9107308354478055e-05, + "loss": 0.7236, + "step": 3920 + }, + { + "epoch": 0.14, + "learning_rate": 1.910685859888158e-05, + "loss": 0.6553, + "step": 3921 + }, + { + "epoch": 0.14, + "learning_rate": 1.910640873531178e-05, + "loss": 0.633, + "step": 3922 + }, + { + "epoch": 0.14, + "learning_rate": 1.9105958763773988e-05, + "loss": 0.6552, + "step": 3923 + }, + { + "epoch": 0.14, + "learning_rate": 1.910550868427353e-05, + "loss": 0.6341, + "step": 3924 + }, + { + "epoch": 0.14, + "learning_rate": 1.910505849681575e-05, + "loss": 0.6355, + "step": 3925 + }, + { + "epoch": 0.14, + "learning_rate": 1.910460820140599e-05, + "loss": 0.6183, + "step": 3926 + }, + { + "epoch": 0.14, + "learning_rate": 1.9104157798049576e-05, + "loss": 0.6458, + "step": 3927 + }, + { + "epoch": 0.14, + "learning_rate": 1.910370728675185e-05, + "loss": 0.5981, + "step": 3928 + }, + { + "epoch": 0.14, + "learning_rate": 1.9103256667518165e-05, + "loss": 0.6502, + "step": 3929 + }, + { + "epoch": 0.14, + "learning_rate": 1.9102805940353857e-05, + "loss": 0.6209, + "step": 3930 + }, + { + "epoch": 0.14, + "learning_rate": 1.9102355105264266e-05, + "loss": 0.6309, + "step": 3931 + }, + { + "epoch": 0.14, + "learning_rate": 1.910190416225474e-05, + "loss": 0.6314, + "step": 3932 + }, + { + "epoch": 0.14, + "learning_rate": 1.910145311133063e-05, + "loss": 0.633, + "step": 3933 + }, + { + "epoch": 0.14, + "learning_rate": 1.9101001952497275e-05, + "loss": 0.6243, + "step": 3934 + }, + { + "epoch": 0.14, + "learning_rate": 1.9100550685760034e-05, + "loss": 0.6358, + "step": 3935 + }, + { + "epoch": 0.14, + "learning_rate": 1.9100099311124252e-05, + "loss": 0.6968, + "step": 3936 + }, + { + "epoch": 0.14, + "learning_rate": 1.9099647828595277e-05, + "loss": 0.6636, + "step": 3937 + }, + { + "epoch": 0.14, + "learning_rate": 1.909919623817847e-05, + "loss": 0.6561, + "step": 3938 + }, + { + "epoch": 0.14, + "learning_rate": 1.9098744539879178e-05, + "loss": 0.6008, + "step": 3939 + }, + { + "epoch": 0.14, + "learning_rate": 1.9098292733702762e-05, + "loss": 0.6923, + "step": 3940 + }, + { + "epoch": 0.14, + "learning_rate": 1.9097840819654574e-05, + "loss": 0.6311, + "step": 3941 + }, + { + "epoch": 0.14, + "learning_rate": 1.909738879773997e-05, + "loss": 0.6134, + "step": 3942 + }, + { + "epoch": 0.14, + "learning_rate": 1.9096936667964323e-05, + "loss": 0.5899, + "step": 3943 + }, + { + "epoch": 0.14, + "learning_rate": 1.909648443033298e-05, + "loss": 0.6275, + "step": 3944 + }, + { + "epoch": 0.14, + "learning_rate": 1.9096032084851308e-05, + "loss": 0.668, + "step": 3945 + }, + { + "epoch": 0.14, + "learning_rate": 1.909557963152467e-05, + "loss": 0.6349, + "step": 3946 + }, + { + "epoch": 0.14, + "learning_rate": 1.9095127070358422e-05, + "loss": 0.5979, + "step": 3947 + }, + { + "epoch": 0.14, + "learning_rate": 1.9094674401357944e-05, + "loss": 0.7024, + "step": 3948 + }, + { + "epoch": 0.14, + "learning_rate": 1.9094221624528595e-05, + "loss": 0.6902, + "step": 3949 + }, + { + "epoch": 0.14, + "learning_rate": 1.9093768739875743e-05, + "loss": 0.5834, + "step": 3950 + }, + { + "epoch": 0.14, + "learning_rate": 1.9093315747404763e-05, + "loss": 0.6319, + "step": 3951 + }, + { + "epoch": 0.14, + "learning_rate": 1.909286264712102e-05, + "loss": 0.6641, + "step": 3952 + }, + { + "epoch": 0.14, + "learning_rate": 1.9092409439029884e-05, + "loss": 0.6019, + "step": 3953 + }, + { + "epoch": 0.14, + "learning_rate": 1.9091956123136736e-05, + "loss": 0.582, + "step": 3954 + }, + { + "epoch": 0.14, + "learning_rate": 1.9091502699446944e-05, + "loss": 0.6662, + "step": 3955 + }, + { + "epoch": 0.14, + "learning_rate": 1.9091049167965886e-05, + "loss": 0.7051, + "step": 3956 + }, + { + "epoch": 0.14, + "learning_rate": 1.9090595528698944e-05, + "loss": 0.5981, + "step": 3957 + }, + { + "epoch": 0.14, + "learning_rate": 1.909014178165149e-05, + "loss": 0.6675, + "step": 3958 + }, + { + "epoch": 0.14, + "learning_rate": 1.9089687926828908e-05, + "loss": 0.6593, + "step": 3959 + }, + { + "epoch": 0.14, + "learning_rate": 1.9089233964236575e-05, + "loss": 0.6613, + "step": 3960 + }, + { + "epoch": 0.14, + "learning_rate": 1.9088779893879875e-05, + "loss": 0.6395, + "step": 3961 + }, + { + "epoch": 0.14, + "learning_rate": 1.9088325715764192e-05, + "loss": 0.6406, + "step": 3962 + }, + { + "epoch": 0.14, + "learning_rate": 1.9087871429894914e-05, + "loss": 0.6465, + "step": 3963 + }, + { + "epoch": 0.14, + "learning_rate": 1.908741703627742e-05, + "loss": 0.6108, + "step": 3964 + }, + { + "epoch": 0.14, + "learning_rate": 1.9086962534917103e-05, + "loss": 0.6598, + "step": 3965 + }, + { + "epoch": 0.14, + "learning_rate": 1.908650792581935e-05, + "loss": 0.6917, + "step": 3966 + }, + { + "epoch": 0.14, + "learning_rate": 1.9086053208989552e-05, + "loss": 0.6389, + "step": 3967 + }, + { + "epoch": 0.14, + "learning_rate": 1.90855983844331e-05, + "loss": 0.6618, + "step": 3968 + }, + { + "epoch": 0.14, + "learning_rate": 1.9085143452155385e-05, + "loss": 0.6187, + "step": 3969 + }, + { + "epoch": 0.14, + "learning_rate": 1.90846884121618e-05, + "loss": 0.6455, + "step": 3970 + }, + { + "epoch": 0.14, + "learning_rate": 1.908423326445774e-05, + "loss": 0.6189, + "step": 3971 + }, + { + "epoch": 0.14, + "learning_rate": 1.9083778009048607e-05, + "loss": 0.611, + "step": 3972 + }, + { + "epoch": 0.14, + "learning_rate": 1.9083322645939795e-05, + "loss": 0.6764, + "step": 3973 + }, + { + "epoch": 0.14, + "learning_rate": 1.90828671751367e-05, + "loss": 0.6589, + "step": 3974 + }, + { + "epoch": 0.14, + "learning_rate": 1.9082411596644728e-05, + "loss": 0.6173, + "step": 3975 + }, + { + "epoch": 0.14, + "learning_rate": 1.9081955910469272e-05, + "loss": 0.6596, + "step": 3976 + }, + { + "epoch": 0.14, + "learning_rate": 1.9081500116615746e-05, + "loss": 0.6464, + "step": 3977 + }, + { + "epoch": 0.14, + "learning_rate": 1.9081044215089542e-05, + "loss": 0.6103, + "step": 3978 + }, + { + "epoch": 0.14, + "learning_rate": 1.9080588205896076e-05, + "loss": 0.6375, + "step": 3979 + }, + { + "epoch": 0.14, + "learning_rate": 1.9080132089040745e-05, + "loss": 0.6073, + "step": 3980 + }, + { + "epoch": 0.14, + "learning_rate": 1.9079675864528966e-05, + "loss": 0.6651, + "step": 3981 + }, + { + "epoch": 0.14, + "learning_rate": 1.9079219532366144e-05, + "loss": 0.6647, + "step": 3982 + }, + { + "epoch": 0.14, + "learning_rate": 1.9078763092557685e-05, + "loss": 0.6983, + "step": 3983 + }, + { + "epoch": 0.14, + "learning_rate": 1.907830654510901e-05, + "loss": 0.6581, + "step": 3984 + }, + { + "epoch": 0.14, + "learning_rate": 1.9077849890025524e-05, + "loss": 0.7043, + "step": 3985 + }, + { + "epoch": 0.14, + "learning_rate": 1.9077393127312646e-05, + "loss": 0.6311, + "step": 3986 + }, + { + "epoch": 0.14, + "learning_rate": 1.9076936256975785e-05, + "loss": 0.6409, + "step": 3987 + }, + { + "epoch": 0.14, + "learning_rate": 1.9076479279020366e-05, + "loss": 0.6163, + "step": 3988 + }, + { + "epoch": 0.14, + "learning_rate": 1.9076022193451803e-05, + "loss": 0.6504, + "step": 3989 + }, + { + "epoch": 0.14, + "learning_rate": 1.9075565000275514e-05, + "loss": 0.6449, + "step": 3990 + }, + { + "epoch": 0.14, + "learning_rate": 1.907510769949692e-05, + "loss": 0.6375, + "step": 3991 + }, + { + "epoch": 0.14, + "learning_rate": 1.907465029112145e-05, + "loss": 0.6007, + "step": 3992 + }, + { + "epoch": 0.14, + "learning_rate": 1.9074192775154517e-05, + "loss": 0.5889, + "step": 3993 + }, + { + "epoch": 0.14, + "learning_rate": 1.907373515160155e-05, + "loss": 0.7103, + "step": 3994 + }, + { + "epoch": 0.14, + "learning_rate": 1.9073277420467975e-05, + "loss": 0.6192, + "step": 3995 + }, + { + "epoch": 0.14, + "learning_rate": 1.9072819581759216e-05, + "loss": 0.611, + "step": 3996 + }, + { + "epoch": 0.14, + "learning_rate": 1.9072361635480706e-05, + "loss": 0.642, + "step": 3997 + }, + { + "epoch": 0.14, + "learning_rate": 1.907190358163787e-05, + "loss": 0.6667, + "step": 3998 + }, + { + "epoch": 0.14, + "learning_rate": 1.9071445420236147e-05, + "loss": 0.6411, + "step": 3999 + }, + { + "epoch": 0.14, + "learning_rate": 1.907098715128096e-05, + "loss": 0.608, + "step": 4000 + }, + { + "epoch": 0.14, + "learning_rate": 1.9070528774777743e-05, + "loss": 0.6342, + "step": 4001 + }, + { + "epoch": 0.14, + "learning_rate": 1.9070070290731933e-05, + "loss": 0.6088, + "step": 4002 + }, + { + "epoch": 0.14, + "learning_rate": 1.906961169914897e-05, + "loss": 0.672, + "step": 4003 + }, + { + "epoch": 0.14, + "learning_rate": 1.9069153000034286e-05, + "loss": 0.6732, + "step": 4004 + }, + { + "epoch": 0.14, + "learning_rate": 1.906869419339332e-05, + "loss": 0.6268, + "step": 4005 + }, + { + "epoch": 0.14, + "learning_rate": 1.9068235279231513e-05, + "loss": 0.6503, + "step": 4006 + }, + { + "epoch": 0.14, + "learning_rate": 1.90677762575543e-05, + "loss": 0.6347, + "step": 4007 + }, + { + "epoch": 0.14, + "learning_rate": 1.9067317128367134e-05, + "loss": 0.6503, + "step": 4008 + }, + { + "epoch": 0.14, + "learning_rate": 1.9066857891675454e-05, + "loss": 0.6599, + "step": 4009 + }, + { + "epoch": 0.14, + "learning_rate": 1.90663985474847e-05, + "loss": 0.6487, + "step": 4010 + }, + { + "epoch": 0.14, + "learning_rate": 1.9065939095800327e-05, + "loss": 0.6538, + "step": 4011 + }, + { + "epoch": 0.14, + "learning_rate": 1.9065479536627774e-05, + "loss": 0.6295, + "step": 4012 + }, + { + "epoch": 0.14, + "learning_rate": 1.9065019869972497e-05, + "loss": 0.6518, + "step": 4013 + }, + { + "epoch": 0.14, + "learning_rate": 1.906456009583994e-05, + "loss": 0.5956, + "step": 4014 + }, + { + "epoch": 0.14, + "learning_rate": 1.9064100214235553e-05, + "loss": 0.7012, + "step": 4015 + }, + { + "epoch": 0.14, + "learning_rate": 1.9063640225164794e-05, + "loss": 0.7303, + "step": 4016 + }, + { + "epoch": 0.14, + "learning_rate": 1.9063180128633116e-05, + "loss": 0.6168, + "step": 4017 + }, + { + "epoch": 0.14, + "learning_rate": 1.906271992464597e-05, + "loss": 0.6944, + "step": 4018 + }, + { + "epoch": 0.14, + "learning_rate": 1.906225961320882e-05, + "loss": 0.6517, + "step": 4019 + }, + { + "epoch": 0.14, + "learning_rate": 1.9061799194327114e-05, + "loss": 0.6199, + "step": 4020 + }, + { + "epoch": 0.14, + "learning_rate": 1.9061338668006317e-05, + "loss": 0.6153, + "step": 4021 + }, + { + "epoch": 0.14, + "learning_rate": 1.9060878034251887e-05, + "loss": 0.6122, + "step": 4022 + }, + { + "epoch": 0.14, + "learning_rate": 1.9060417293069288e-05, + "loss": 0.654, + "step": 4023 + }, + { + "epoch": 0.14, + "learning_rate": 1.9059956444463975e-05, + "loss": 0.6551, + "step": 4024 + }, + { + "epoch": 0.14, + "learning_rate": 1.9059495488441423e-05, + "loss": 0.621, + "step": 4025 + }, + { + "epoch": 0.14, + "learning_rate": 1.905903442500709e-05, + "loss": 0.5993, + "step": 4026 + }, + { + "epoch": 0.14, + "learning_rate": 1.9058573254166443e-05, + "loss": 0.633, + "step": 4027 + }, + { + "epoch": 0.14, + "learning_rate": 1.9058111975924948e-05, + "loss": 0.6867, + "step": 4028 + }, + { + "epoch": 0.14, + "learning_rate": 1.9057650590288085e-05, + "loss": 0.6468, + "step": 4029 + }, + { + "epoch": 0.14, + "learning_rate": 1.9057189097261308e-05, + "loss": 0.6375, + "step": 4030 + }, + { + "epoch": 0.14, + "learning_rate": 1.9056727496850103e-05, + "loss": 0.6471, + "step": 4031 + }, + { + "epoch": 0.14, + "learning_rate": 1.9056265789059932e-05, + "loss": 0.6697, + "step": 4032 + }, + { + "epoch": 0.14, + "learning_rate": 1.9055803973896277e-05, + "loss": 0.6398, + "step": 4033 + }, + { + "epoch": 0.14, + "learning_rate": 1.905534205136461e-05, + "loss": 0.6665, + "step": 4034 + }, + { + "epoch": 0.14, + "learning_rate": 1.9054880021470406e-05, + "loss": 0.62, + "step": 4035 + }, + { + "epoch": 0.14, + "learning_rate": 1.905441788421915e-05, + "loss": 0.667, + "step": 4036 + }, + { + "epoch": 0.14, + "learning_rate": 1.9053955639616308e-05, + "loss": 0.6272, + "step": 4037 + }, + { + "epoch": 0.14, + "learning_rate": 1.9053493287667372e-05, + "loss": 0.5821, + "step": 4038 + }, + { + "epoch": 0.14, + "learning_rate": 1.9053030828377823e-05, + "loss": 0.6451, + "step": 4039 + }, + { + "epoch": 0.14, + "learning_rate": 1.905256826175314e-05, + "loss": 0.5887, + "step": 4040 + }, + { + "epoch": 0.14, + "learning_rate": 1.9052105587798806e-05, + "loss": 0.5971, + "step": 4041 + }, + { + "epoch": 0.14, + "learning_rate": 1.905164280652031e-05, + "loss": 0.6256, + "step": 4042 + }, + { + "epoch": 0.14, + "learning_rate": 1.9051179917923144e-05, + "loss": 0.5889, + "step": 4043 + }, + { + "epoch": 0.14, + "learning_rate": 1.9050716922012786e-05, + "loss": 0.6163, + "step": 4044 + }, + { + "epoch": 0.14, + "learning_rate": 1.905025381879473e-05, + "loss": 0.6403, + "step": 4045 + }, + { + "epoch": 0.14, + "learning_rate": 1.9049790608274462e-05, + "loss": 0.6922, + "step": 4046 + }, + { + "epoch": 0.14, + "learning_rate": 1.9049327290457485e-05, + "loss": 0.62, + "step": 4047 + }, + { + "epoch": 0.14, + "learning_rate": 1.904886386534928e-05, + "loss": 0.6614, + "step": 4048 + }, + { + "epoch": 0.14, + "learning_rate": 1.904840033295535e-05, + "loss": 0.6164, + "step": 4049 + }, + { + "epoch": 0.14, + "learning_rate": 1.904793669328119e-05, + "loss": 0.6431, + "step": 4050 + }, + { + "epoch": 0.14, + "learning_rate": 1.904747294633229e-05, + "loss": 0.638, + "step": 4051 + }, + { + "epoch": 0.14, + "learning_rate": 1.9047009092114156e-05, + "loss": 0.6435, + "step": 4052 + }, + { + "epoch": 0.14, + "learning_rate": 1.9046545130632282e-05, + "loss": 0.6341, + "step": 4053 + }, + { + "epoch": 0.14, + "learning_rate": 1.9046081061892178e-05, + "loss": 0.6041, + "step": 4054 + }, + { + "epoch": 0.14, + "learning_rate": 1.9045616885899335e-05, + "loss": 0.5987, + "step": 4055 + }, + { + "epoch": 0.14, + "learning_rate": 1.9045152602659257e-05, + "loss": 0.6747, + "step": 4056 + }, + { + "epoch": 0.14, + "learning_rate": 1.904468821217746e-05, + "loss": 0.6419, + "step": 4057 + }, + { + "epoch": 0.14, + "learning_rate": 1.904422371445944e-05, + "loss": 0.6232, + "step": 4058 + }, + { + "epoch": 0.14, + "learning_rate": 1.9043759109510708e-05, + "loss": 0.6513, + "step": 4059 + }, + { + "epoch": 0.14, + "learning_rate": 1.904329439733677e-05, + "loss": 0.5927, + "step": 4060 + }, + { + "epoch": 0.14, + "learning_rate": 1.9042829577943136e-05, + "loss": 0.6291, + "step": 4061 + }, + { + "epoch": 0.14, + "learning_rate": 1.904236465133532e-05, + "loss": 0.6292, + "step": 4062 + }, + { + "epoch": 0.14, + "learning_rate": 1.904189961751883e-05, + "loss": 0.6559, + "step": 4063 + }, + { + "epoch": 0.14, + "learning_rate": 1.9041434476499184e-05, + "loss": 0.6931, + "step": 4064 + }, + { + "epoch": 0.14, + "learning_rate": 1.9040969228281893e-05, + "loss": 0.6202, + "step": 4065 + }, + { + "epoch": 0.14, + "learning_rate": 1.9040503872872477e-05, + "loss": 0.6605, + "step": 4066 + }, + { + "epoch": 0.14, + "learning_rate": 1.904003841027645e-05, + "loss": 0.6155, + "step": 4067 + }, + { + "epoch": 0.14, + "learning_rate": 1.903957284049933e-05, + "loss": 0.661, + "step": 4068 + }, + { + "epoch": 0.14, + "learning_rate": 1.9039107163546644e-05, + "loss": 0.61, + "step": 4069 + }, + { + "epoch": 0.14, + "learning_rate": 1.9038641379423906e-05, + "loss": 0.6403, + "step": 4070 + }, + { + "epoch": 0.14, + "learning_rate": 1.903817548813664e-05, + "loss": 0.639, + "step": 4071 + }, + { + "epoch": 0.14, + "learning_rate": 1.903770948969037e-05, + "loss": 0.6393, + "step": 4072 + }, + { + "epoch": 0.14, + "learning_rate": 1.903724338409062e-05, + "loss": 0.6198, + "step": 4073 + }, + { + "epoch": 0.14, + "learning_rate": 1.9036777171342918e-05, + "loss": 0.6075, + "step": 4074 + }, + { + "epoch": 0.14, + "learning_rate": 1.9036310851452792e-05, + "loss": 0.6036, + "step": 4075 + }, + { + "epoch": 0.14, + "learning_rate": 1.903584442442577e-05, + "loss": 0.6659, + "step": 4076 + }, + { + "epoch": 0.14, + "learning_rate": 1.9035377890267384e-05, + "loss": 0.6759, + "step": 4077 + }, + { + "epoch": 0.14, + "learning_rate": 1.903491124898316e-05, + "loss": 0.6318, + "step": 4078 + }, + { + "epoch": 0.14, + "learning_rate": 1.9034444500578636e-05, + "loss": 0.6493, + "step": 4079 + }, + { + "epoch": 0.14, + "learning_rate": 1.9033977645059342e-05, + "loss": 0.6346, + "step": 4080 + }, + { + "epoch": 0.14, + "learning_rate": 1.9033510682430814e-05, + "loss": 0.6803, + "step": 4081 + }, + { + "epoch": 0.14, + "learning_rate": 1.9033043612698592e-05, + "loss": 0.673, + "step": 4082 + }, + { + "epoch": 0.14, + "learning_rate": 1.903257643586821e-05, + "loss": 0.6357, + "step": 4083 + }, + { + "epoch": 0.14, + "learning_rate": 1.9032109151945207e-05, + "loss": 0.6437, + "step": 4084 + }, + { + "epoch": 0.14, + "learning_rate": 1.9031641760935126e-05, + "loss": 0.5928, + "step": 4085 + }, + { + "epoch": 0.14, + "learning_rate": 1.9031174262843506e-05, + "loss": 0.6547, + "step": 4086 + }, + { + "epoch": 0.14, + "learning_rate": 1.9030706657675893e-05, + "loss": 0.6781, + "step": 4087 + }, + { + "epoch": 0.14, + "learning_rate": 1.9030238945437823e-05, + "loss": 0.6277, + "step": 4088 + }, + { + "epoch": 0.14, + "learning_rate": 1.9029771126134854e-05, + "loss": 0.6325, + "step": 4089 + }, + { + "epoch": 0.14, + "learning_rate": 1.9029303199772523e-05, + "loss": 0.713, + "step": 4090 + }, + { + "epoch": 0.14, + "learning_rate": 1.902883516635638e-05, + "loss": 0.655, + "step": 4091 + }, + { + "epoch": 0.14, + "learning_rate": 1.9028367025891973e-05, + "loss": 0.6807, + "step": 4092 + }, + { + "epoch": 0.14, + "learning_rate": 1.9027898778384856e-05, + "loss": 0.6796, + "step": 4093 + }, + { + "epoch": 0.14, + "learning_rate": 1.9027430423840578e-05, + "loss": 0.6629, + "step": 4094 + }, + { + "epoch": 0.14, + "learning_rate": 1.902696196226469e-05, + "loss": 0.7129, + "step": 4095 + }, + { + "epoch": 0.14, + "learning_rate": 1.9026493393662752e-05, + "loss": 0.6411, + "step": 4096 + }, + { + "epoch": 0.14, + "learning_rate": 1.902602471804032e-05, + "loss": 0.6645, + "step": 4097 + }, + { + "epoch": 0.14, + "learning_rate": 1.902555593540294e-05, + "loss": 0.6381, + "step": 4098 + }, + { + "epoch": 0.14, + "learning_rate": 1.9025087045756177e-05, + "loss": 0.6052, + "step": 4099 + }, + { + "epoch": 0.14, + "learning_rate": 1.9024618049105593e-05, + "loss": 0.6606, + "step": 4100 + }, + { + "epoch": 0.14, + "learning_rate": 1.9024148945456747e-05, + "loss": 0.6137, + "step": 4101 + }, + { + "epoch": 0.14, + "learning_rate": 1.9023679734815198e-05, + "loss": 0.6335, + "step": 4102 + }, + { + "epoch": 0.14, + "learning_rate": 1.902321041718651e-05, + "loss": 0.6881, + "step": 4103 + }, + { + "epoch": 0.14, + "learning_rate": 1.902274099257625e-05, + "loss": 0.658, + "step": 4104 + }, + { + "epoch": 0.14, + "learning_rate": 1.902227146098998e-05, + "loss": 0.592, + "step": 4105 + }, + { + "epoch": 0.14, + "learning_rate": 1.902180182243327e-05, + "loss": 0.6976, + "step": 4106 + }, + { + "epoch": 0.14, + "learning_rate": 1.9021332076911684e-05, + "loss": 0.6376, + "step": 4107 + }, + { + "epoch": 0.14, + "learning_rate": 1.9020862224430797e-05, + "loss": 0.6188, + "step": 4108 + }, + { + "epoch": 0.14, + "learning_rate": 1.902039226499618e-05, + "loss": 0.6052, + "step": 4109 + }, + { + "epoch": 0.14, + "learning_rate": 1.9019922198613394e-05, + "loss": 0.5609, + "step": 4110 + }, + { + "epoch": 0.14, + "learning_rate": 1.9019452025288025e-05, + "loss": 0.6355, + "step": 4111 + }, + { + "epoch": 0.14, + "learning_rate": 1.9018981745025644e-05, + "loss": 0.6591, + "step": 4112 + }, + { + "epoch": 0.14, + "learning_rate": 1.901851135783182e-05, + "loss": 0.6937, + "step": 4113 + }, + { + "epoch": 0.14, + "learning_rate": 1.901804086371214e-05, + "loss": 0.6168, + "step": 4114 + }, + { + "epoch": 0.14, + "learning_rate": 1.9017570262672175e-05, + "loss": 0.656, + "step": 4115 + }, + { + "epoch": 0.14, + "learning_rate": 1.9017099554717512e-05, + "loss": 0.6188, + "step": 4116 + }, + { + "epoch": 0.14, + "learning_rate": 1.901662873985372e-05, + "loss": 0.6604, + "step": 4117 + }, + { + "epoch": 0.14, + "learning_rate": 1.901615781808639e-05, + "loss": 0.6229, + "step": 4118 + }, + { + "epoch": 0.14, + "learning_rate": 1.9015686789421107e-05, + "loss": 0.6513, + "step": 4119 + }, + { + "epoch": 0.14, + "learning_rate": 1.901521565386345e-05, + "loss": 0.6697, + "step": 4120 + }, + { + "epoch": 0.14, + "learning_rate": 1.901474441141901e-05, + "loss": 0.6556, + "step": 4121 + }, + { + "epoch": 0.14, + "learning_rate": 1.9014273062093368e-05, + "loss": 0.656, + "step": 4122 + }, + { + "epoch": 0.14, + "learning_rate": 1.9013801605892113e-05, + "loss": 0.6601, + "step": 4123 + }, + { + "epoch": 0.14, + "learning_rate": 1.9013330042820844e-05, + "loss": 0.6682, + "step": 4124 + }, + { + "epoch": 0.14, + "learning_rate": 1.901285837288514e-05, + "loss": 0.6552, + "step": 4125 + }, + { + "epoch": 0.14, + "learning_rate": 1.9012386596090603e-05, + "loss": 0.6507, + "step": 4126 + }, + { + "epoch": 0.14, + "learning_rate": 1.9011914712442822e-05, + "loss": 0.6359, + "step": 4127 + }, + { + "epoch": 0.14, + "learning_rate": 1.9011442721947388e-05, + "loss": 0.6273, + "step": 4128 + }, + { + "epoch": 0.14, + "learning_rate": 1.9010970624609904e-05, + "loss": 0.6152, + "step": 4129 + }, + { + "epoch": 0.14, + "learning_rate": 1.9010498420435962e-05, + "loss": 0.6587, + "step": 4130 + }, + { + "epoch": 0.14, + "learning_rate": 1.9010026109431165e-05, + "loss": 0.6307, + "step": 4131 + }, + { + "epoch": 0.14, + "learning_rate": 1.900955369160111e-05, + "loss": 0.6808, + "step": 4132 + }, + { + "epoch": 0.14, + "learning_rate": 1.90090811669514e-05, + "loss": 0.6513, + "step": 4133 + }, + { + "epoch": 0.14, + "learning_rate": 1.9008608535487634e-05, + "loss": 0.6641, + "step": 4134 + }, + { + "epoch": 0.14, + "learning_rate": 1.900813579721542e-05, + "loss": 0.6858, + "step": 4135 + }, + { + "epoch": 0.14, + "learning_rate": 1.900766295214036e-05, + "loss": 0.6285, + "step": 4136 + }, + { + "epoch": 0.14, + "learning_rate": 1.9007190000268058e-05, + "loss": 0.6544, + "step": 4137 + }, + { + "epoch": 0.14, + "learning_rate": 1.9006716941604128e-05, + "loss": 0.6587, + "step": 4138 + }, + { + "epoch": 0.14, + "learning_rate": 1.9006243776154174e-05, + "loss": 0.6401, + "step": 4139 + }, + { + "epoch": 0.14, + "learning_rate": 1.900577050392381e-05, + "loss": 0.601, + "step": 4140 + }, + { + "epoch": 0.14, + "learning_rate": 1.900529712491864e-05, + "loss": 0.6526, + "step": 4141 + }, + { + "epoch": 0.14, + "learning_rate": 1.9004823639144283e-05, + "loss": 0.6794, + "step": 4142 + }, + { + "epoch": 0.14, + "learning_rate": 1.9004350046606352e-05, + "loss": 0.6188, + "step": 4143 + }, + { + "epoch": 0.14, + "learning_rate": 1.9003876347310455e-05, + "loss": 0.573, + "step": 4144 + }, + { + "epoch": 0.14, + "learning_rate": 1.900340254126222e-05, + "loss": 0.6221, + "step": 4145 + }, + { + "epoch": 0.14, + "learning_rate": 1.9002928628467256e-05, + "loss": 0.6362, + "step": 4146 + }, + { + "epoch": 0.14, + "learning_rate": 1.9002454608931183e-05, + "loss": 0.6268, + "step": 4147 + }, + { + "epoch": 0.14, + "learning_rate": 1.9001980482659625e-05, + "loss": 0.6159, + "step": 4148 + }, + { + "epoch": 0.14, + "learning_rate": 1.9001506249658198e-05, + "loss": 0.5981, + "step": 4149 + }, + { + "epoch": 0.14, + "learning_rate": 1.900103190993253e-05, + "loss": 0.6814, + "step": 4150 + }, + { + "epoch": 0.14, + "learning_rate": 1.9000557463488244e-05, + "loss": 0.564, + "step": 4151 + }, + { + "epoch": 0.14, + "learning_rate": 1.900008291033096e-05, + "loss": 0.6632, + "step": 4152 + }, + { + "epoch": 0.14, + "learning_rate": 1.899960825046631e-05, + "loss": 0.6754, + "step": 4153 + }, + { + "epoch": 0.14, + "learning_rate": 1.8999133483899917e-05, + "loss": 0.6119, + "step": 4154 + }, + { + "epoch": 0.14, + "learning_rate": 1.8998658610637415e-05, + "loss": 0.6749, + "step": 4155 + }, + { + "epoch": 0.14, + "learning_rate": 1.899818363068443e-05, + "loss": 0.7039, + "step": 4156 + }, + { + "epoch": 0.14, + "learning_rate": 1.8997708544046597e-05, + "loss": 0.6297, + "step": 4157 + }, + { + "epoch": 0.14, + "learning_rate": 1.899723335072955e-05, + "loss": 0.6651, + "step": 4158 + }, + { + "epoch": 0.14, + "learning_rate": 1.899675805073891e-05, + "loss": 0.6856, + "step": 4159 + }, + { + "epoch": 0.14, + "learning_rate": 1.899628264408033e-05, + "loss": 0.5886, + "step": 4160 + }, + { + "epoch": 0.14, + "learning_rate": 1.899580713075944e-05, + "loss": 0.6282, + "step": 4161 + }, + { + "epoch": 0.14, + "learning_rate": 1.8995331510781873e-05, + "loss": 0.6643, + "step": 4162 + }, + { + "epoch": 0.14, + "learning_rate": 1.8994855784153274e-05, + "loss": 0.6436, + "step": 4163 + }, + { + "epoch": 0.14, + "learning_rate": 1.899437995087928e-05, + "loss": 0.6595, + "step": 4164 + }, + { + "epoch": 0.14, + "learning_rate": 1.8993904010965535e-05, + "loss": 0.6276, + "step": 4165 + }, + { + "epoch": 0.14, + "learning_rate": 1.8993427964417677e-05, + "loss": 0.6201, + "step": 4166 + }, + { + "epoch": 0.14, + "learning_rate": 1.899295181124136e-05, + "loss": 0.6319, + "step": 4167 + }, + { + "epoch": 0.14, + "learning_rate": 1.8992475551442216e-05, + "loss": 0.6688, + "step": 4168 + }, + { + "epoch": 0.14, + "learning_rate": 1.8991999185025902e-05, + "loss": 0.5875, + "step": 4169 + }, + { + "epoch": 0.14, + "learning_rate": 1.8991522711998063e-05, + "loss": 0.6285, + "step": 4170 + }, + { + "epoch": 0.14, + "learning_rate": 1.899104613236435e-05, + "loss": 0.692, + "step": 4171 + }, + { + "epoch": 0.14, + "learning_rate": 1.8990569446130406e-05, + "loss": 0.6631, + "step": 4172 + }, + { + "epoch": 0.14, + "learning_rate": 1.8990092653301894e-05, + "loss": 0.6737, + "step": 4173 + }, + { + "epoch": 0.14, + "learning_rate": 1.898961575388446e-05, + "loss": 0.6217, + "step": 4174 + }, + { + "epoch": 0.14, + "learning_rate": 1.8989138747883754e-05, + "loss": 0.6948, + "step": 4175 + }, + { + "epoch": 0.14, + "learning_rate": 1.8988661635305444e-05, + "loss": 0.6258, + "step": 4176 + }, + { + "epoch": 0.14, + "learning_rate": 1.8988184416155173e-05, + "loss": 0.6474, + "step": 4177 + }, + { + "epoch": 0.14, + "learning_rate": 1.898770709043861e-05, + "loss": 0.6622, + "step": 4178 + }, + { + "epoch": 0.14, + "learning_rate": 1.8987229658161408e-05, + "loss": 0.619, + "step": 4179 + }, + { + "epoch": 0.14, + "learning_rate": 1.898675211932923e-05, + "loss": 0.6656, + "step": 4180 + }, + { + "epoch": 0.14, + "learning_rate": 1.8986274473947738e-05, + "loss": 0.6032, + "step": 4181 + }, + { + "epoch": 0.14, + "learning_rate": 1.8985796722022596e-05, + "loss": 0.6324, + "step": 4182 + }, + { + "epoch": 0.14, + "learning_rate": 1.8985318863559463e-05, + "loss": 0.681, + "step": 4183 + }, + { + "epoch": 0.14, + "learning_rate": 1.898484089856401e-05, + "loss": 0.6984, + "step": 4184 + }, + { + "epoch": 0.14, + "learning_rate": 1.8984362827041903e-05, + "loss": 0.6549, + "step": 4185 + }, + { + "epoch": 0.15, + "learning_rate": 1.898388464899881e-05, + "loss": 0.6517, + "step": 4186 + }, + { + "epoch": 0.15, + "learning_rate": 1.8983406364440396e-05, + "loss": 0.6544, + "step": 4187 + }, + { + "epoch": 0.15, + "learning_rate": 1.8982927973372338e-05, + "loss": 0.6675, + "step": 4188 + }, + { + "epoch": 0.15, + "learning_rate": 1.8982449475800308e-05, + "loss": 0.6113, + "step": 4189 + }, + { + "epoch": 0.15, + "learning_rate": 1.8981970871729972e-05, + "loss": 0.5703, + "step": 4190 + }, + { + "epoch": 0.15, + "learning_rate": 1.898149216116701e-05, + "loss": 0.6622, + "step": 4191 + }, + { + "epoch": 0.15, + "learning_rate": 1.89810133441171e-05, + "loss": 0.6143, + "step": 4192 + }, + { + "epoch": 0.15, + "learning_rate": 1.898053442058591e-05, + "loss": 0.592, + "step": 4193 + }, + { + "epoch": 0.15, + "learning_rate": 1.898005539057913e-05, + "loss": 0.5827, + "step": 4194 + }, + { + "epoch": 0.15, + "learning_rate": 1.897957625410243e-05, + "loss": 0.6293, + "step": 4195 + }, + { + "epoch": 0.15, + "learning_rate": 1.8979097011161497e-05, + "loss": 0.6419, + "step": 4196 + }, + { + "epoch": 0.15, + "learning_rate": 1.897861766176201e-05, + "loss": 0.6656, + "step": 4197 + }, + { + "epoch": 0.15, + "learning_rate": 1.897813820590965e-05, + "loss": 0.6738, + "step": 4198 + }, + { + "epoch": 0.15, + "learning_rate": 1.8977658643610106e-05, + "loss": 0.6589, + "step": 4199 + }, + { + "epoch": 0.15, + "learning_rate": 1.8977178974869065e-05, + "loss": 0.5942, + "step": 4200 + }, + { + "epoch": 0.15, + "learning_rate": 1.8976699199692206e-05, + "loss": 0.6655, + "step": 4201 + }, + { + "epoch": 0.15, + "learning_rate": 1.8976219318085224e-05, + "loss": 0.6473, + "step": 4202 + }, + { + "epoch": 0.15, + "learning_rate": 1.8975739330053807e-05, + "loss": 0.618, + "step": 4203 + }, + { + "epoch": 0.15, + "learning_rate": 1.8975259235603646e-05, + "loss": 0.6405, + "step": 4204 + }, + { + "epoch": 0.15, + "learning_rate": 1.8974779034740432e-05, + "loss": 0.6672, + "step": 4205 + }, + { + "epoch": 0.15, + "learning_rate": 1.8974298727469863e-05, + "loss": 0.5964, + "step": 4206 + }, + { + "epoch": 0.15, + "learning_rate": 1.8973818313797627e-05, + "loss": 0.6645, + "step": 4207 + }, + { + "epoch": 0.15, + "learning_rate": 1.897333779372942e-05, + "loss": 0.6293, + "step": 4208 + }, + { + "epoch": 0.15, + "learning_rate": 1.897285716727095e-05, + "loss": 0.7272, + "step": 4209 + }, + { + "epoch": 0.15, + "learning_rate": 1.89723764344279e-05, + "loss": 0.6197, + "step": 4210 + }, + { + "epoch": 0.15, + "learning_rate": 1.897189559520598e-05, + "loss": 0.6793, + "step": 4211 + }, + { + "epoch": 0.15, + "learning_rate": 1.897141464961089e-05, + "loss": 0.6443, + "step": 4212 + }, + { + "epoch": 0.15, + "learning_rate": 1.8970933597648326e-05, + "loss": 0.6052, + "step": 4213 + }, + { + "epoch": 0.15, + "learning_rate": 1.8970452439324002e-05, + "loss": 0.7044, + "step": 4214 + }, + { + "epoch": 0.15, + "learning_rate": 1.8969971174643615e-05, + "loss": 0.6483, + "step": 4215 + }, + { + "epoch": 0.15, + "learning_rate": 1.8969489803612868e-05, + "loss": 0.6647, + "step": 4216 + }, + { + "epoch": 0.15, + "learning_rate": 1.8969008326237473e-05, + "loss": 0.6118, + "step": 4217 + }, + { + "epoch": 0.15, + "learning_rate": 1.8968526742523147e-05, + "loss": 0.6658, + "step": 4218 + }, + { + "epoch": 0.15, + "learning_rate": 1.8968045052475583e-05, + "loss": 0.6035, + "step": 4219 + }, + { + "epoch": 0.15, + "learning_rate": 1.8967563256100503e-05, + "loss": 0.6004, + "step": 4220 + }, + { + "epoch": 0.15, + "learning_rate": 1.8967081353403614e-05, + "loss": 0.6045, + "step": 4221 + }, + { + "epoch": 0.15, + "learning_rate": 1.8966599344390636e-05, + "loss": 0.6089, + "step": 4222 + }, + { + "epoch": 0.15, + "learning_rate": 1.896611722906728e-05, + "loss": 0.6888, + "step": 4223 + }, + { + "epoch": 0.15, + "learning_rate": 1.896563500743926e-05, + "loss": 0.6392, + "step": 4224 + }, + { + "epoch": 0.15, + "learning_rate": 1.89651526795123e-05, + "loss": 0.7264, + "step": 4225 + }, + { + "epoch": 0.15, + "learning_rate": 1.8964670245292108e-05, + "loss": 0.6189, + "step": 4226 + }, + { + "epoch": 0.15, + "learning_rate": 1.896418770478441e-05, + "loss": 0.6222, + "step": 4227 + }, + { + "epoch": 0.15, + "learning_rate": 1.896370505799493e-05, + "loss": 0.6814, + "step": 4228 + }, + { + "epoch": 0.15, + "learning_rate": 1.8963222304929386e-05, + "loss": 0.622, + "step": 4229 + }, + { + "epoch": 0.15, + "learning_rate": 1.8962739445593504e-05, + "loss": 0.6694, + "step": 4230 + }, + { + "epoch": 0.15, + "learning_rate": 1.8962256479993008e-05, + "loss": 0.6516, + "step": 4231 + }, + { + "epoch": 0.15, + "learning_rate": 1.8961773408133625e-05, + "loss": 0.653, + "step": 4232 + }, + { + "epoch": 0.15, + "learning_rate": 1.8961290230021077e-05, + "loss": 0.6049, + "step": 4233 + }, + { + "epoch": 0.15, + "learning_rate": 1.89608069456611e-05, + "loss": 0.5989, + "step": 4234 + }, + { + "epoch": 0.15, + "learning_rate": 1.896032355505942e-05, + "loss": 0.6146, + "step": 4235 + }, + { + "epoch": 0.15, + "learning_rate": 1.8959840058221772e-05, + "loss": 0.6547, + "step": 4236 + }, + { + "epoch": 0.15, + "learning_rate": 1.8959356455153886e-05, + "loss": 0.6499, + "step": 4237 + }, + { + "epoch": 0.15, + "learning_rate": 1.8958872745861495e-05, + "loss": 0.7389, + "step": 4238 + }, + { + "epoch": 0.15, + "learning_rate": 1.8958388930350332e-05, + "loss": 0.6316, + "step": 4239 + }, + { + "epoch": 0.15, + "learning_rate": 1.895790500862614e-05, + "loss": 0.6885, + "step": 4240 + }, + { + "epoch": 0.15, + "learning_rate": 1.895742098069465e-05, + "loss": 0.6124, + "step": 4241 + }, + { + "epoch": 0.15, + "learning_rate": 1.89569368465616e-05, + "loss": 0.6298, + "step": 4242 + }, + { + "epoch": 0.15, + "learning_rate": 1.895645260623274e-05, + "loss": 0.6333, + "step": 4243 + }, + { + "epoch": 0.15, + "learning_rate": 1.89559682597138e-05, + "loss": 0.656, + "step": 4244 + }, + { + "epoch": 0.15, + "learning_rate": 1.8955483807010524e-05, + "loss": 0.6397, + "step": 4245 + }, + { + "epoch": 0.15, + "learning_rate": 1.8954999248128664e-05, + "loss": 0.5894, + "step": 4246 + }, + { + "epoch": 0.15, + "learning_rate": 1.8954514583073958e-05, + "loss": 0.6656, + "step": 4247 + }, + { + "epoch": 0.15, + "learning_rate": 1.8954029811852153e-05, + "loss": 0.5952, + "step": 4248 + }, + { + "epoch": 0.15, + "learning_rate": 1.8953544934469e-05, + "loss": 0.6878, + "step": 4249 + }, + { + "epoch": 0.15, + "learning_rate": 1.8953059950930243e-05, + "loss": 0.7441, + "step": 4250 + }, + { + "epoch": 0.15, + "learning_rate": 1.8952574861241638e-05, + "loss": 0.6165, + "step": 4251 + }, + { + "epoch": 0.15, + "learning_rate": 1.8952089665408932e-05, + "loss": 0.6481, + "step": 4252 + }, + { + "epoch": 0.15, + "learning_rate": 1.8951604363437874e-05, + "loss": 0.6031, + "step": 4253 + }, + { + "epoch": 0.15, + "learning_rate": 1.8951118955334226e-05, + "loss": 0.677, + "step": 4254 + }, + { + "epoch": 0.15, + "learning_rate": 1.8950633441103742e-05, + "loss": 0.6364, + "step": 4255 + }, + { + "epoch": 0.15, + "learning_rate": 1.895014782075217e-05, + "loss": 0.6256, + "step": 4256 + }, + { + "epoch": 0.15, + "learning_rate": 1.8949662094285276e-05, + "loss": 0.6145, + "step": 4257 + }, + { + "epoch": 0.15, + "learning_rate": 1.894917626170882e-05, + "loss": 0.6472, + "step": 4258 + }, + { + "epoch": 0.15, + "learning_rate": 1.8948690323028557e-05, + "loss": 0.681, + "step": 4259 + }, + { + "epoch": 0.15, + "learning_rate": 1.8948204278250245e-05, + "loss": 0.6159, + "step": 4260 + }, + { + "epoch": 0.15, + "learning_rate": 1.8947718127379658e-05, + "loss": 0.677, + "step": 4261 + }, + { + "epoch": 0.15, + "learning_rate": 1.894723187042255e-05, + "loss": 0.6159, + "step": 4262 + }, + { + "epoch": 0.15, + "learning_rate": 1.8946745507384695e-05, + "loss": 0.6841, + "step": 4263 + }, + { + "epoch": 0.15, + "learning_rate": 1.894625903827185e-05, + "loss": 0.6628, + "step": 4264 + }, + { + "epoch": 0.15, + "learning_rate": 1.8945772463089786e-05, + "loss": 0.6127, + "step": 4265 + }, + { + "epoch": 0.15, + "learning_rate": 1.8945285781844274e-05, + "loss": 0.6559, + "step": 4266 + }, + { + "epoch": 0.15, + "learning_rate": 1.8944798994541085e-05, + "loss": 0.6338, + "step": 4267 + }, + { + "epoch": 0.15, + "learning_rate": 1.8944312101185987e-05, + "loss": 0.6606, + "step": 4268 + }, + { + "epoch": 0.15, + "learning_rate": 1.8943825101784752e-05, + "loss": 0.6752, + "step": 4269 + }, + { + "epoch": 0.15, + "learning_rate": 1.894333799634316e-05, + "loss": 0.6199, + "step": 4270 + }, + { + "epoch": 0.15, + "learning_rate": 1.8942850784866988e-05, + "loss": 0.5722, + "step": 4271 + }, + { + "epoch": 0.15, + "learning_rate": 1.8942363467361998e-05, + "loss": 0.7209, + "step": 4272 + }, + { + "epoch": 0.15, + "learning_rate": 1.894187604383398e-05, + "loss": 0.6353, + "step": 4273 + }, + { + "epoch": 0.15, + "learning_rate": 1.894138851428871e-05, + "loss": 0.5975, + "step": 4274 + }, + { + "epoch": 0.15, + "learning_rate": 1.894090087873197e-05, + "loss": 0.5835, + "step": 4275 + }, + { + "epoch": 0.15, + "learning_rate": 1.8940413137169537e-05, + "loss": 0.618, + "step": 4276 + }, + { + "epoch": 0.15, + "learning_rate": 1.89399252896072e-05, + "loss": 0.6829, + "step": 4277 + }, + { + "epoch": 0.15, + "learning_rate": 1.8939437336050735e-05, + "loss": 0.6055, + "step": 4278 + }, + { + "epoch": 0.15, + "learning_rate": 1.8938949276505933e-05, + "loss": 0.5941, + "step": 4279 + }, + { + "epoch": 0.15, + "learning_rate": 1.893846111097858e-05, + "loss": 0.6655, + "step": 4280 + }, + { + "epoch": 0.15, + "learning_rate": 1.8937972839474466e-05, + "loss": 0.6436, + "step": 4281 + }, + { + "epoch": 0.15, + "learning_rate": 1.8937484461999375e-05, + "loss": 0.6575, + "step": 4282 + }, + { + "epoch": 0.15, + "learning_rate": 1.89369959785591e-05, + "loss": 0.6134, + "step": 4283 + }, + { + "epoch": 0.15, + "learning_rate": 1.8936507389159435e-05, + "loss": 0.6771, + "step": 4284 + }, + { + "epoch": 0.15, + "learning_rate": 1.893601869380617e-05, + "loss": 0.6386, + "step": 4285 + }, + { + "epoch": 0.15, + "learning_rate": 1.8935529892505092e-05, + "loss": 0.617, + "step": 4286 + }, + { + "epoch": 0.15, + "learning_rate": 1.8935040985262013e-05, + "loss": 0.6482, + "step": 4287 + }, + { + "epoch": 0.15, + "learning_rate": 1.8934551972082714e-05, + "loss": 0.6253, + "step": 4288 + }, + { + "epoch": 0.15, + "learning_rate": 1.8934062852973e-05, + "loss": 0.6816, + "step": 4289 + }, + { + "epoch": 0.15, + "learning_rate": 1.893357362793867e-05, + "loss": 0.6939, + "step": 4290 + }, + { + "epoch": 0.15, + "learning_rate": 1.8933084296985526e-05, + "loss": 0.631, + "step": 4291 + }, + { + "epoch": 0.15, + "learning_rate": 1.8932594860119365e-05, + "loss": 0.6405, + "step": 4292 + }, + { + "epoch": 0.15, + "learning_rate": 1.893210531734599e-05, + "loss": 0.6074, + "step": 4293 + }, + { + "epoch": 0.15, + "learning_rate": 1.893161566867121e-05, + "loss": 0.6463, + "step": 4294 + }, + { + "epoch": 0.15, + "learning_rate": 1.8931125914100827e-05, + "loss": 0.6453, + "step": 4295 + }, + { + "epoch": 0.15, + "learning_rate": 1.8930636053640648e-05, + "loss": 0.6458, + "step": 4296 + }, + { + "epoch": 0.15, + "learning_rate": 1.8930146087296482e-05, + "loss": 0.6064, + "step": 4297 + }, + { + "epoch": 0.15, + "learning_rate": 1.892965601507414e-05, + "loss": 0.6245, + "step": 4298 + }, + { + "epoch": 0.15, + "learning_rate": 1.8929165836979428e-05, + "loss": 0.6141, + "step": 4299 + }, + { + "epoch": 0.15, + "learning_rate": 1.8928675553018157e-05, + "loss": 0.6584, + "step": 4300 + }, + { + "epoch": 0.15, + "learning_rate": 1.8928185163196146e-05, + "loss": 0.6928, + "step": 4301 + }, + { + "epoch": 0.15, + "learning_rate": 1.8927694667519204e-05, + "loss": 0.6837, + "step": 4302 + }, + { + "epoch": 0.15, + "learning_rate": 1.8927204065993145e-05, + "loss": 0.5881, + "step": 4303 + }, + { + "epoch": 0.15, + "learning_rate": 1.8926713358623794e-05, + "loss": 0.6035, + "step": 4304 + }, + { + "epoch": 0.15, + "learning_rate": 1.892622254541696e-05, + "loss": 0.6291, + "step": 4305 + }, + { + "epoch": 0.15, + "learning_rate": 1.8925731626378468e-05, + "loss": 0.6199, + "step": 4306 + }, + { + "epoch": 0.15, + "learning_rate": 1.8925240601514138e-05, + "loss": 0.6259, + "step": 4307 + }, + { + "epoch": 0.15, + "learning_rate": 1.8924749470829785e-05, + "loss": 0.6371, + "step": 4308 + }, + { + "epoch": 0.15, + "learning_rate": 1.892425823433124e-05, + "loss": 0.6955, + "step": 4309 + }, + { + "epoch": 0.15, + "learning_rate": 1.8923766892024326e-05, + "loss": 0.6374, + "step": 4310 + }, + { + "epoch": 0.15, + "learning_rate": 1.8923275443914867e-05, + "loss": 0.6175, + "step": 4311 + }, + { + "epoch": 0.15, + "learning_rate": 1.8922783890008686e-05, + "loss": 0.6878, + "step": 4312 + }, + { + "epoch": 0.15, + "learning_rate": 1.8922292230311618e-05, + "loss": 0.6107, + "step": 4313 + }, + { + "epoch": 0.15, + "learning_rate": 1.8921800464829488e-05, + "loss": 0.638, + "step": 4314 + }, + { + "epoch": 0.15, + "learning_rate": 1.8921308593568126e-05, + "loss": 0.6852, + "step": 4315 + }, + { + "epoch": 0.15, + "learning_rate": 1.892081661653337e-05, + "loss": 0.665, + "step": 4316 + }, + { + "epoch": 0.15, + "learning_rate": 1.892032453373104e-05, + "loss": 0.6673, + "step": 4317 + }, + { + "epoch": 0.15, + "learning_rate": 1.8919832345166985e-05, + "loss": 0.6803, + "step": 4318 + }, + { + "epoch": 0.15, + "learning_rate": 1.8919340050847032e-05, + "loss": 0.6089, + "step": 4319 + }, + { + "epoch": 0.15, + "learning_rate": 1.891884765077702e-05, + "loss": 0.5858, + "step": 4320 + }, + { + "epoch": 0.15, + "learning_rate": 1.8918355144962782e-05, + "loss": 0.5712, + "step": 4321 + }, + { + "epoch": 0.15, + "learning_rate": 1.8917862533410166e-05, + "loss": 0.6607, + "step": 4322 + }, + { + "epoch": 0.15, + "learning_rate": 1.891736981612501e-05, + "loss": 0.6221, + "step": 4323 + }, + { + "epoch": 0.15, + "learning_rate": 1.8916876993113153e-05, + "loss": 0.6366, + "step": 4324 + }, + { + "epoch": 0.15, + "learning_rate": 1.8916384064380437e-05, + "loss": 0.6863, + "step": 4325 + }, + { + "epoch": 0.15, + "learning_rate": 1.8915891029932713e-05, + "loss": 0.6455, + "step": 4326 + }, + { + "epoch": 0.15, + "learning_rate": 1.891539788977582e-05, + "loss": 0.6925, + "step": 4327 + }, + { + "epoch": 0.15, + "learning_rate": 1.8914904643915607e-05, + "loss": 0.6613, + "step": 4328 + }, + { + "epoch": 0.15, + "learning_rate": 1.891441129235792e-05, + "loss": 0.6849, + "step": 4329 + }, + { + "epoch": 0.15, + "learning_rate": 1.8913917835108612e-05, + "loss": 0.6883, + "step": 4330 + }, + { + "epoch": 0.15, + "learning_rate": 1.8913424272173536e-05, + "loss": 0.6859, + "step": 4331 + }, + { + "epoch": 0.15, + "learning_rate": 1.8912930603558536e-05, + "loss": 0.6543, + "step": 4332 + }, + { + "epoch": 0.15, + "learning_rate": 1.8912436829269464e-05, + "loss": 0.6374, + "step": 4333 + }, + { + "epoch": 0.15, + "learning_rate": 1.891194294931219e-05, + "loss": 0.6377, + "step": 4334 + }, + { + "epoch": 0.15, + "learning_rate": 1.8911448963692547e-05, + "loss": 0.5917, + "step": 4335 + }, + { + "epoch": 0.15, + "learning_rate": 1.891095487241641e-05, + "loss": 0.7067, + "step": 4336 + }, + { + "epoch": 0.15, + "learning_rate": 1.8910460675489628e-05, + "loss": 0.6268, + "step": 4337 + }, + { + "epoch": 0.15, + "learning_rate": 1.8909966372918067e-05, + "loss": 0.6289, + "step": 4338 + }, + { + "epoch": 0.15, + "learning_rate": 1.890947196470758e-05, + "loss": 0.6673, + "step": 4339 + }, + { + "epoch": 0.15, + "learning_rate": 1.8908977450864032e-05, + "loss": 0.673, + "step": 4340 + }, + { + "epoch": 0.15, + "learning_rate": 1.8908482831393288e-05, + "loss": 0.6226, + "step": 4341 + }, + { + "epoch": 0.15, + "learning_rate": 1.890798810630121e-05, + "loss": 0.5689, + "step": 4342 + }, + { + "epoch": 0.15, + "learning_rate": 1.8907493275593664e-05, + "loss": 0.6906, + "step": 4343 + }, + { + "epoch": 0.15, + "learning_rate": 1.890699833927652e-05, + "loss": 0.6734, + "step": 4344 + }, + { + "epoch": 0.15, + "learning_rate": 1.890650329735564e-05, + "loss": 0.6492, + "step": 4345 + }, + { + "epoch": 0.15, + "learning_rate": 1.89060081498369e-05, + "loss": 0.6499, + "step": 4346 + }, + { + "epoch": 0.15, + "learning_rate": 1.8905512896726165e-05, + "loss": 0.623, + "step": 4347 + }, + { + "epoch": 0.15, + "learning_rate": 1.890501753802931e-05, + "loss": 0.5874, + "step": 4348 + }, + { + "epoch": 0.15, + "learning_rate": 1.8904522073752204e-05, + "loss": 0.6331, + "step": 4349 + }, + { + "epoch": 0.15, + "learning_rate": 1.8904026503900725e-05, + "loss": 0.6395, + "step": 4350 + }, + { + "epoch": 0.15, + "learning_rate": 1.8903530828480752e-05, + "loss": 0.6712, + "step": 4351 + }, + { + "epoch": 0.15, + "learning_rate": 1.8903035047498156e-05, + "loss": 0.6248, + "step": 4352 + }, + { + "epoch": 0.15, + "learning_rate": 1.8902539160958815e-05, + "loss": 0.6903, + "step": 4353 + }, + { + "epoch": 0.15, + "learning_rate": 1.8902043168868612e-05, + "loss": 0.6346, + "step": 4354 + }, + { + "epoch": 0.15, + "learning_rate": 1.890154707123343e-05, + "loss": 0.6945, + "step": 4355 + }, + { + "epoch": 0.15, + "learning_rate": 1.8901050868059142e-05, + "loss": 0.5838, + "step": 4356 + }, + { + "epoch": 0.15, + "learning_rate": 1.8900554559351638e-05, + "loss": 0.6672, + "step": 4357 + }, + { + "epoch": 0.15, + "learning_rate": 1.89000581451168e-05, + "loss": 0.6411, + "step": 4358 + }, + { + "epoch": 0.15, + "learning_rate": 1.8899561625360513e-05, + "loss": 0.6598, + "step": 4359 + }, + { + "epoch": 0.15, + "learning_rate": 1.889906500008867e-05, + "loss": 0.6287, + "step": 4360 + }, + { + "epoch": 0.15, + "learning_rate": 1.8898568269307147e-05, + "loss": 0.6903, + "step": 4361 + }, + { + "epoch": 0.15, + "learning_rate": 1.8898071433021842e-05, + "loss": 0.6893, + "step": 4362 + }, + { + "epoch": 0.15, + "learning_rate": 1.8897574491238647e-05, + "loss": 0.6423, + "step": 4363 + }, + { + "epoch": 0.15, + "learning_rate": 1.889707744396345e-05, + "loss": 0.6528, + "step": 4364 + }, + { + "epoch": 0.15, + "learning_rate": 1.8896580291202145e-05, + "loss": 0.6276, + "step": 4365 + }, + { + "epoch": 0.15, + "learning_rate": 1.8896083032960627e-05, + "loss": 0.6621, + "step": 4366 + }, + { + "epoch": 0.15, + "learning_rate": 1.8895585669244785e-05, + "loss": 0.6076, + "step": 4367 + }, + { + "epoch": 0.15, + "learning_rate": 1.889508820006053e-05, + "loss": 0.6158, + "step": 4368 + }, + { + "epoch": 0.15, + "learning_rate": 1.889459062541375e-05, + "loss": 0.6009, + "step": 4369 + }, + { + "epoch": 0.15, + "learning_rate": 1.8894092945310345e-05, + "loss": 0.6723, + "step": 4370 + }, + { + "epoch": 0.15, + "learning_rate": 1.889359515975622e-05, + "loss": 0.6458, + "step": 4371 + }, + { + "epoch": 0.15, + "learning_rate": 1.8893097268757268e-05, + "loss": 0.7086, + "step": 4372 + }, + { + "epoch": 0.15, + "learning_rate": 1.8892599272319402e-05, + "loss": 0.6264, + "step": 4373 + }, + { + "epoch": 0.15, + "learning_rate": 1.889210117044852e-05, + "loss": 0.6897, + "step": 4374 + }, + { + "epoch": 0.15, + "learning_rate": 1.889160296315053e-05, + "loss": 0.6235, + "step": 4375 + }, + { + "epoch": 0.15, + "learning_rate": 1.8891104650431346e-05, + "loss": 0.6086, + "step": 4376 + }, + { + "epoch": 0.15, + "learning_rate": 1.8890606232296863e-05, + "loss": 0.6784, + "step": 4377 + }, + { + "epoch": 0.15, + "learning_rate": 1.8890107708752996e-05, + "loss": 0.6273, + "step": 4378 + }, + { + "epoch": 0.15, + "learning_rate": 1.8889609079805656e-05, + "loss": 0.6547, + "step": 4379 + }, + { + "epoch": 0.15, + "learning_rate": 1.8889110345460757e-05, + "loss": 0.6157, + "step": 4380 + }, + { + "epoch": 0.15, + "learning_rate": 1.888861150572421e-05, + "loss": 0.6341, + "step": 4381 + }, + { + "epoch": 0.15, + "learning_rate": 1.8888112560601928e-05, + "loss": 0.671, + "step": 4382 + }, + { + "epoch": 0.15, + "learning_rate": 1.888761351009983e-05, + "loss": 0.6093, + "step": 4383 + }, + { + "epoch": 0.15, + "learning_rate": 1.888711435422383e-05, + "loss": 0.6383, + "step": 4384 + }, + { + "epoch": 0.15, + "learning_rate": 1.8886615092979848e-05, + "loss": 0.6059, + "step": 4385 + }, + { + "epoch": 0.15, + "learning_rate": 1.8886115726373798e-05, + "loss": 0.6007, + "step": 4386 + }, + { + "epoch": 0.15, + "learning_rate": 1.888561625441161e-05, + "loss": 0.6803, + "step": 4387 + }, + { + "epoch": 0.15, + "learning_rate": 1.88851166770992e-05, + "loss": 0.6458, + "step": 4388 + }, + { + "epoch": 0.15, + "learning_rate": 1.8884616994442493e-05, + "loss": 0.674, + "step": 4389 + }, + { + "epoch": 0.15, + "learning_rate": 1.888411720644741e-05, + "loss": 0.6404, + "step": 4390 + }, + { + "epoch": 0.15, + "learning_rate": 1.8883617313119878e-05, + "loss": 0.6791, + "step": 4391 + }, + { + "epoch": 0.15, + "learning_rate": 1.888311731446583e-05, + "loss": 0.6104, + "step": 4392 + }, + { + "epoch": 0.15, + "learning_rate": 1.888261721049118e-05, + "loss": 0.6435, + "step": 4393 + }, + { + "epoch": 0.15, + "learning_rate": 1.8882117001201875e-05, + "loss": 0.5999, + "step": 4394 + }, + { + "epoch": 0.15, + "learning_rate": 1.8881616686603836e-05, + "loss": 0.671, + "step": 4395 + }, + { + "epoch": 0.15, + "learning_rate": 1.8881116266702992e-05, + "loss": 0.7054, + "step": 4396 + }, + { + "epoch": 0.15, + "learning_rate": 1.8880615741505284e-05, + "loss": 0.6924, + "step": 4397 + }, + { + "epoch": 0.15, + "learning_rate": 1.8880115111016638e-05, + "loss": 0.6334, + "step": 4398 + }, + { + "epoch": 0.15, + "learning_rate": 1.8879614375242998e-05, + "loss": 0.5868, + "step": 4399 + }, + { + "epoch": 0.15, + "learning_rate": 1.8879113534190296e-05, + "loss": 0.6344, + "step": 4400 + }, + { + "epoch": 0.15, + "learning_rate": 1.8878612587864473e-05, + "loss": 0.623, + "step": 4401 + }, + { + "epoch": 0.15, + "learning_rate": 1.8878111536271458e-05, + "loss": 0.628, + "step": 4402 + }, + { + "epoch": 0.15, + "learning_rate": 1.887761037941721e-05, + "loss": 0.5686, + "step": 4403 + }, + { + "epoch": 0.15, + "learning_rate": 1.8877109117307653e-05, + "loss": 0.5985, + "step": 4404 + }, + { + "epoch": 0.15, + "learning_rate": 1.8876607749948742e-05, + "loss": 0.6493, + "step": 4405 + }, + { + "epoch": 0.15, + "learning_rate": 1.8876106277346414e-05, + "loss": 0.6479, + "step": 4406 + }, + { + "epoch": 0.15, + "learning_rate": 1.8875604699506622e-05, + "loss": 0.613, + "step": 4407 + }, + { + "epoch": 0.15, + "learning_rate": 1.8875103016435305e-05, + "loss": 0.6591, + "step": 4408 + }, + { + "epoch": 0.15, + "learning_rate": 1.8874601228138417e-05, + "loss": 0.6735, + "step": 4409 + }, + { + "epoch": 0.15, + "learning_rate": 1.8874099334621904e-05, + "loss": 0.5728, + "step": 4410 + }, + { + "epoch": 0.15, + "learning_rate": 1.887359733589172e-05, + "loss": 0.6601, + "step": 4411 + }, + { + "epoch": 0.15, + "learning_rate": 1.887309523195381e-05, + "loss": 0.6768, + "step": 4412 + }, + { + "epoch": 0.15, + "learning_rate": 1.887259302281413e-05, + "loss": 0.6327, + "step": 4413 + }, + { + "epoch": 0.15, + "learning_rate": 1.887209070847864e-05, + "loss": 0.6291, + "step": 4414 + }, + { + "epoch": 0.15, + "learning_rate": 1.8871588288953294e-05, + "loss": 0.6538, + "step": 4415 + }, + { + "epoch": 0.15, + "learning_rate": 1.8871085764244044e-05, + "loss": 0.6636, + "step": 4416 + }, + { + "epoch": 0.15, + "learning_rate": 1.887058313435685e-05, + "loss": 0.6006, + "step": 4417 + }, + { + "epoch": 0.15, + "learning_rate": 1.887008039929767e-05, + "loss": 0.6389, + "step": 4418 + }, + { + "epoch": 0.15, + "learning_rate": 1.8869577559072466e-05, + "loss": 0.6179, + "step": 4419 + }, + { + "epoch": 0.15, + "learning_rate": 1.8869074613687203e-05, + "loss": 0.5969, + "step": 4420 + }, + { + "epoch": 0.15, + "learning_rate": 1.8868571563147834e-05, + "loss": 0.6172, + "step": 4421 + }, + { + "epoch": 0.15, + "learning_rate": 1.886806840746034e-05, + "loss": 0.6062, + "step": 4422 + }, + { + "epoch": 0.15, + "learning_rate": 1.886756514663067e-05, + "loss": 0.6441, + "step": 4423 + }, + { + "epoch": 0.15, + "learning_rate": 1.8867061780664803e-05, + "loss": 0.621, + "step": 4424 + }, + { + "epoch": 0.15, + "learning_rate": 1.8866558309568694e-05, + "loss": 0.6762, + "step": 4425 + }, + { + "epoch": 0.15, + "learning_rate": 1.886605473334833e-05, + "loss": 0.6155, + "step": 4426 + }, + { + "epoch": 0.15, + "learning_rate": 1.8865551052009663e-05, + "loss": 0.6206, + "step": 4427 + }, + { + "epoch": 0.15, + "learning_rate": 1.8865047265558675e-05, + "loss": 0.6616, + "step": 4428 + }, + { + "epoch": 0.15, + "learning_rate": 1.886454337400134e-05, + "loss": 0.6188, + "step": 4429 + }, + { + "epoch": 0.15, + "learning_rate": 1.8864039377343628e-05, + "loss": 0.608, + "step": 4430 + }, + { + "epoch": 0.15, + "learning_rate": 1.8863535275591516e-05, + "loss": 0.642, + "step": 4431 + }, + { + "epoch": 0.15, + "learning_rate": 1.886303106875098e-05, + "loss": 0.6063, + "step": 4432 + }, + { + "epoch": 0.15, + "learning_rate": 1.8862526756828e-05, + "loss": 0.6434, + "step": 4433 + }, + { + "epoch": 0.15, + "learning_rate": 1.8862022339828555e-05, + "loss": 0.6001, + "step": 4434 + }, + { + "epoch": 0.15, + "learning_rate": 1.8861517817758623e-05, + "loss": 0.636, + "step": 4435 + }, + { + "epoch": 0.15, + "learning_rate": 1.886101319062419e-05, + "loss": 0.6476, + "step": 4436 + }, + { + "epoch": 0.15, + "learning_rate": 1.8860508458431235e-05, + "loss": 0.699, + "step": 4437 + }, + { + "epoch": 0.15, + "learning_rate": 1.8860003621185744e-05, + "loss": 0.657, + "step": 4438 + }, + { + "epoch": 0.15, + "learning_rate": 1.88594986788937e-05, + "loss": 0.6434, + "step": 4439 + }, + { + "epoch": 0.15, + "learning_rate": 1.8858993631561092e-05, + "loss": 0.6641, + "step": 4440 + }, + { + "epoch": 0.15, + "learning_rate": 1.885848847919391e-05, + "loss": 0.597, + "step": 4441 + }, + { + "epoch": 0.15, + "learning_rate": 1.885798322179814e-05, + "loss": 0.5973, + "step": 4442 + }, + { + "epoch": 0.15, + "learning_rate": 1.8857477859379775e-05, + "loss": 0.5977, + "step": 4443 + }, + { + "epoch": 0.15, + "learning_rate": 1.8856972391944804e-05, + "loss": 0.6285, + "step": 4444 + }, + { + "epoch": 0.15, + "learning_rate": 1.8856466819499218e-05, + "loss": 0.6459, + "step": 4445 + }, + { + "epoch": 0.15, + "learning_rate": 1.8855961142049018e-05, + "loss": 0.6266, + "step": 4446 + }, + { + "epoch": 0.15, + "learning_rate": 1.8855455359600197e-05, + "loss": 0.6671, + "step": 4447 + }, + { + "epoch": 0.15, + "learning_rate": 1.885494947215875e-05, + "loss": 0.6866, + "step": 4448 + }, + { + "epoch": 0.15, + "learning_rate": 1.8854443479730674e-05, + "loss": 0.6193, + "step": 4449 + }, + { + "epoch": 0.15, + "learning_rate": 1.885393738232197e-05, + "loss": 0.6525, + "step": 4450 + }, + { + "epoch": 0.15, + "learning_rate": 1.8853431179938634e-05, + "loss": 0.652, + "step": 4451 + }, + { + "epoch": 0.15, + "learning_rate": 1.8852924872586677e-05, + "loss": 0.5822, + "step": 4452 + }, + { + "epoch": 0.15, + "learning_rate": 1.8852418460272095e-05, + "loss": 0.6193, + "step": 4453 + }, + { + "epoch": 0.15, + "learning_rate": 1.8851911943000894e-05, + "loss": 0.6075, + "step": 4454 + }, + { + "epoch": 0.15, + "learning_rate": 1.885140532077908e-05, + "loss": 0.6229, + "step": 4455 + }, + { + "epoch": 0.15, + "learning_rate": 1.8850898593612657e-05, + "loss": 0.6761, + "step": 4456 + }, + { + "epoch": 0.15, + "learning_rate": 1.8850391761507638e-05, + "loss": 0.6135, + "step": 4457 + }, + { + "epoch": 0.15, + "learning_rate": 1.8849884824470023e-05, + "loss": 0.6637, + "step": 4458 + }, + { + "epoch": 0.15, + "learning_rate": 1.8849377782505835e-05, + "loss": 0.6291, + "step": 4459 + }, + { + "epoch": 0.15, + "learning_rate": 1.8848870635621075e-05, + "loss": 0.5853, + "step": 4460 + }, + { + "epoch": 0.15, + "learning_rate": 1.8848363383821758e-05, + "loss": 0.7012, + "step": 4461 + }, + { + "epoch": 0.15, + "learning_rate": 1.8847856027113903e-05, + "loss": 0.6112, + "step": 4462 + }, + { + "epoch": 0.15, + "learning_rate": 1.8847348565503522e-05, + "loss": 0.5669, + "step": 4463 + }, + { + "epoch": 0.15, + "learning_rate": 1.884684099899663e-05, + "loss": 0.6863, + "step": 4464 + }, + { + "epoch": 0.15, + "learning_rate": 1.8846333327599252e-05, + "loss": 0.6849, + "step": 4465 + }, + { + "epoch": 0.15, + "learning_rate": 1.8845825551317394e-05, + "loss": 0.6629, + "step": 4466 + }, + { + "epoch": 0.15, + "learning_rate": 1.884531767015709e-05, + "loss": 0.6243, + "step": 4467 + }, + { + "epoch": 0.15, + "learning_rate": 1.884480968412435e-05, + "loss": 0.6144, + "step": 4468 + }, + { + "epoch": 0.15, + "learning_rate": 1.8844301593225208e-05, + "loss": 0.6015, + "step": 4469 + }, + { + "epoch": 0.15, + "learning_rate": 1.884379339746568e-05, + "loss": 0.5922, + "step": 4470 + }, + { + "epoch": 0.15, + "learning_rate": 1.8843285096851796e-05, + "loss": 0.6388, + "step": 4471 + }, + { + "epoch": 0.15, + "learning_rate": 1.8842776691389576e-05, + "loss": 0.6173, + "step": 4472 + }, + { + "epoch": 0.15, + "learning_rate": 1.8842268181085056e-05, + "loss": 0.6087, + "step": 4473 + }, + { + "epoch": 0.16, + "learning_rate": 1.8841759565944258e-05, + "loss": 0.6534, + "step": 4474 + }, + { + "epoch": 0.16, + "learning_rate": 1.884125084597322e-05, + "loss": 0.6406, + "step": 4475 + }, + { + "epoch": 0.16, + "learning_rate": 1.8840742021177964e-05, + "loss": 0.7058, + "step": 4476 + }, + { + "epoch": 0.16, + "learning_rate": 1.884023309156453e-05, + "loss": 0.6814, + "step": 4477 + }, + { + "epoch": 0.16, + "learning_rate": 1.883972405713895e-05, + "loss": 0.6511, + "step": 4478 + }, + { + "epoch": 0.16, + "learning_rate": 1.883921491790726e-05, + "loss": 0.6577, + "step": 4479 + }, + { + "epoch": 0.16, + "learning_rate": 1.8838705673875496e-05, + "loss": 0.6537, + "step": 4480 + }, + { + "epoch": 0.16, + "learning_rate": 1.883819632504969e-05, + "loss": 0.6587, + "step": 4481 + }, + { + "epoch": 0.16, + "learning_rate": 1.883768687143589e-05, + "loss": 0.6319, + "step": 4482 + }, + { + "epoch": 0.16, + "learning_rate": 1.8837177313040135e-05, + "loss": 0.6394, + "step": 4483 + }, + { + "epoch": 0.16, + "learning_rate": 1.883666764986846e-05, + "loss": 0.6163, + "step": 4484 + }, + { + "epoch": 0.16, + "learning_rate": 1.883615788192691e-05, + "loss": 0.6488, + "step": 4485 + }, + { + "epoch": 0.16, + "learning_rate": 1.8835648009221534e-05, + "loss": 0.6313, + "step": 4486 + }, + { + "epoch": 0.16, + "learning_rate": 1.8835138031758375e-05, + "loss": 0.6001, + "step": 4487 + }, + { + "epoch": 0.16, + "learning_rate": 1.8834627949543475e-05, + "loss": 0.6135, + "step": 4488 + }, + { + "epoch": 0.16, + "learning_rate": 1.8834117762582885e-05, + "loss": 0.6066, + "step": 4489 + }, + { + "epoch": 0.16, + "learning_rate": 1.8833607470882652e-05, + "loss": 0.6166, + "step": 4490 + }, + { + "epoch": 0.16, + "learning_rate": 1.883309707444883e-05, + "loss": 0.6219, + "step": 4491 + }, + { + "epoch": 0.16, + "learning_rate": 1.883258657328747e-05, + "loss": 0.6499, + "step": 4492 + }, + { + "epoch": 0.16, + "learning_rate": 1.883207596740462e-05, + "loss": 0.6376, + "step": 4493 + }, + { + "epoch": 0.16, + "learning_rate": 1.8831565256806338e-05, + "loss": 0.6352, + "step": 4494 + }, + { + "epoch": 0.16, + "learning_rate": 1.883105444149868e-05, + "loss": 0.6154, + "step": 4495 + }, + { + "epoch": 0.16, + "learning_rate": 1.88305435214877e-05, + "loss": 0.6241, + "step": 4496 + }, + { + "epoch": 0.16, + "learning_rate": 1.8830032496779452e-05, + "loss": 0.6692, + "step": 4497 + }, + { + "epoch": 0.16, + "learning_rate": 1.882952136738e-05, + "loss": 0.6401, + "step": 4498 + }, + { + "epoch": 0.16, + "learning_rate": 1.8829010133295403e-05, + "loss": 0.6696, + "step": 4499 + }, + { + "epoch": 0.16, + "learning_rate": 1.8828498794531723e-05, + "loss": 0.7034, + "step": 4500 + }, + { + "epoch": 0.16, + "learning_rate": 1.8827987351095022e-05, + "loss": 0.699, + "step": 4501 + }, + { + "epoch": 0.16, + "learning_rate": 1.882747580299136e-05, + "loss": 0.5925, + "step": 4502 + }, + { + "epoch": 0.16, + "learning_rate": 1.882696415022681e-05, + "loss": 0.6076, + "step": 4503 + }, + { + "epoch": 0.16, + "learning_rate": 1.8826452392807432e-05, + "loss": 0.6311, + "step": 4504 + }, + { + "epoch": 0.16, + "learning_rate": 1.8825940530739296e-05, + "loss": 0.6197, + "step": 4505 + }, + { + "epoch": 0.16, + "learning_rate": 1.882542856402847e-05, + "loss": 0.649, + "step": 4506 + }, + { + "epoch": 0.16, + "learning_rate": 1.8824916492681024e-05, + "loss": 0.6053, + "step": 4507 + }, + { + "epoch": 0.16, + "learning_rate": 1.882440431670303e-05, + "loss": 0.6143, + "step": 4508 + }, + { + "epoch": 0.16, + "learning_rate": 1.882389203610056e-05, + "loss": 0.687, + "step": 4509 + }, + { + "epoch": 0.16, + "learning_rate": 1.8823379650879686e-05, + "loss": 0.6606, + "step": 4510 + }, + { + "epoch": 0.16, + "learning_rate": 1.882286716104648e-05, + "loss": 0.6303, + "step": 4511 + }, + { + "epoch": 0.16, + "learning_rate": 1.8822354566607032e-05, + "loss": 0.6182, + "step": 4512 + }, + { + "epoch": 0.16, + "learning_rate": 1.8821841867567406e-05, + "loss": 0.6272, + "step": 4513 + }, + { + "epoch": 0.16, + "learning_rate": 1.8821329063933686e-05, + "loss": 0.6385, + "step": 4514 + }, + { + "epoch": 0.16, + "learning_rate": 1.882081615571195e-05, + "loss": 0.6478, + "step": 4515 + }, + { + "epoch": 0.16, + "learning_rate": 1.882030314290828e-05, + "loss": 0.6246, + "step": 4516 + }, + { + "epoch": 0.16, + "learning_rate": 1.881979002552876e-05, + "loss": 0.6197, + "step": 4517 + }, + { + "epoch": 0.16, + "learning_rate": 1.881927680357947e-05, + "loss": 0.6118, + "step": 4518 + }, + { + "epoch": 0.16, + "learning_rate": 1.88187634770665e-05, + "loss": 0.6615, + "step": 4519 + }, + { + "epoch": 0.16, + "learning_rate": 1.881825004599593e-05, + "loss": 0.6255, + "step": 4520 + }, + { + "epoch": 0.16, + "learning_rate": 1.8817736510373854e-05, + "loss": 0.6337, + "step": 4521 + }, + { + "epoch": 0.16, + "learning_rate": 1.8817222870206353e-05, + "loss": 0.6347, + "step": 4522 + }, + { + "epoch": 0.16, + "learning_rate": 1.8816709125499522e-05, + "loss": 0.6617, + "step": 4523 + }, + { + "epoch": 0.16, + "learning_rate": 1.8816195276259454e-05, + "loss": 0.6327, + "step": 4524 + }, + { + "epoch": 0.16, + "learning_rate": 1.8815681322492238e-05, + "loss": 0.6751, + "step": 4525 + }, + { + "epoch": 0.16, + "learning_rate": 1.8815167264203968e-05, + "loss": 0.635, + "step": 4526 + }, + { + "epoch": 0.16, + "learning_rate": 1.8814653101400736e-05, + "loss": 0.6233, + "step": 4527 + }, + { + "epoch": 0.16, + "learning_rate": 1.881413883408864e-05, + "loss": 0.6467, + "step": 4528 + }, + { + "epoch": 0.16, + "learning_rate": 1.8813624462273782e-05, + "loss": 0.6309, + "step": 4529 + }, + { + "epoch": 0.16, + "learning_rate": 1.8813109985962254e-05, + "loss": 0.6967, + "step": 4530 + }, + { + "epoch": 0.16, + "learning_rate": 1.881259540516016e-05, + "loss": 0.6916, + "step": 4531 + }, + { + "epoch": 0.16, + "learning_rate": 1.88120807198736e-05, + "loss": 0.6608, + "step": 4532 + }, + { + "epoch": 0.16, + "learning_rate": 1.8811565930108674e-05, + "loss": 0.6772, + "step": 4533 + }, + { + "epoch": 0.16, + "learning_rate": 1.881105103587149e-05, + "loss": 0.5767, + "step": 4534 + }, + { + "epoch": 0.16, + "learning_rate": 1.881053603716815e-05, + "loss": 0.6495, + "step": 4535 + }, + { + "epoch": 0.16, + "learning_rate": 1.8810020934004755e-05, + "loss": 0.5983, + "step": 4536 + }, + { + "epoch": 0.16, + "learning_rate": 1.8809505726387423e-05, + "loss": 0.6248, + "step": 4537 + }, + { + "epoch": 0.16, + "learning_rate": 1.880899041432225e-05, + "loss": 0.6307, + "step": 4538 + }, + { + "epoch": 0.16, + "learning_rate": 1.880847499781536e-05, + "loss": 0.6595, + "step": 4539 + }, + { + "epoch": 0.16, + "learning_rate": 1.880795947687285e-05, + "loss": 0.6481, + "step": 4540 + }, + { + "epoch": 0.16, + "learning_rate": 1.880744385150084e-05, + "loss": 0.6185, + "step": 4541 + }, + { + "epoch": 0.16, + "learning_rate": 1.8806928121705442e-05, + "loss": 0.6153, + "step": 4542 + }, + { + "epoch": 0.16, + "learning_rate": 1.880641228749277e-05, + "loss": 0.5983, + "step": 4543 + }, + { + "epoch": 0.16, + "learning_rate": 1.8805896348868942e-05, + "loss": 0.6498, + "step": 4544 + }, + { + "epoch": 0.16, + "learning_rate": 1.880538030584007e-05, + "loss": 0.6225, + "step": 4545 + }, + { + "epoch": 0.16, + "learning_rate": 1.8804864158412276e-05, + "loss": 0.613, + "step": 4546 + }, + { + "epoch": 0.16, + "learning_rate": 1.8804347906591683e-05, + "loss": 0.595, + "step": 4547 + }, + { + "epoch": 0.16, + "learning_rate": 1.8803831550384407e-05, + "loss": 0.6815, + "step": 4548 + }, + { + "epoch": 0.16, + "learning_rate": 1.880331508979657e-05, + "loss": 0.6927, + "step": 4549 + }, + { + "epoch": 0.16, + "learning_rate": 1.8802798524834293e-05, + "loss": 0.6391, + "step": 4550 + }, + { + "epoch": 0.16, + "learning_rate": 1.8802281855503706e-05, + "loss": 0.6836, + "step": 4551 + }, + { + "epoch": 0.16, + "learning_rate": 1.8801765081810936e-05, + "loss": 0.6605, + "step": 4552 + }, + { + "epoch": 0.16, + "learning_rate": 1.88012482037621e-05, + "loss": 0.6957, + "step": 4553 + }, + { + "epoch": 0.16, + "learning_rate": 1.880073122136334e-05, + "loss": 0.5803, + "step": 4554 + }, + { + "epoch": 0.16, + "learning_rate": 1.8800214134620774e-05, + "loss": 0.6001, + "step": 4555 + }, + { + "epoch": 0.16, + "learning_rate": 1.879969694354054e-05, + "loss": 0.6333, + "step": 4556 + }, + { + "epoch": 0.16, + "learning_rate": 1.8799179648128768e-05, + "loss": 0.6637, + "step": 4557 + }, + { + "epoch": 0.16, + "learning_rate": 1.8798662248391585e-05, + "loss": 0.6181, + "step": 4558 + }, + { + "epoch": 0.16, + "learning_rate": 1.8798144744335135e-05, + "loss": 0.5929, + "step": 4559 + }, + { + "epoch": 0.16, + "learning_rate": 1.8797627135965547e-05, + "loss": 0.6561, + "step": 4560 + }, + { + "epoch": 0.16, + "learning_rate": 1.8797109423288962e-05, + "loss": 0.6157, + "step": 4561 + }, + { + "epoch": 0.16, + "learning_rate": 1.8796591606311514e-05, + "loss": 0.6055, + "step": 4562 + }, + { + "epoch": 0.16, + "learning_rate": 1.8796073685039347e-05, + "loss": 0.6434, + "step": 4563 + }, + { + "epoch": 0.16, + "learning_rate": 1.8795555659478596e-05, + "loss": 0.6937, + "step": 4564 + }, + { + "epoch": 0.16, + "learning_rate": 1.879503752963541e-05, + "loss": 0.6251, + "step": 4565 + }, + { + "epoch": 0.16, + "learning_rate": 1.8794519295515927e-05, + "loss": 0.6459, + "step": 4566 + }, + { + "epoch": 0.16, + "learning_rate": 1.8794000957126295e-05, + "loss": 0.6614, + "step": 4567 + }, + { + "epoch": 0.16, + "learning_rate": 1.8793482514472653e-05, + "loss": 0.5986, + "step": 4568 + }, + { + "epoch": 0.16, + "learning_rate": 1.879296396756115e-05, + "loss": 0.6259, + "step": 4569 + }, + { + "epoch": 0.16, + "learning_rate": 1.8792445316397946e-05, + "loss": 0.619, + "step": 4570 + }, + { + "epoch": 0.16, + "learning_rate": 1.8791926560989172e-05, + "loss": 0.6704, + "step": 4571 + }, + { + "epoch": 0.16, + "learning_rate": 1.879140770134099e-05, + "loss": 0.6914, + "step": 4572 + }, + { + "epoch": 0.16, + "learning_rate": 1.8790888737459546e-05, + "loss": 0.603, + "step": 4573 + }, + { + "epoch": 0.16, + "learning_rate": 1.8790369669351e-05, + "loss": 0.5983, + "step": 4574 + }, + { + "epoch": 0.16, + "learning_rate": 1.87898504970215e-05, + "loss": 0.6937, + "step": 4575 + }, + { + "epoch": 0.16, + "learning_rate": 1.87893312204772e-05, + "loss": 0.6285, + "step": 4576 + }, + { + "epoch": 0.16, + "learning_rate": 1.878881183972426e-05, + "loss": 0.6473, + "step": 4577 + }, + { + "epoch": 0.16, + "learning_rate": 1.878829235476884e-05, + "loss": 0.6365, + "step": 4578 + }, + { + "epoch": 0.16, + "learning_rate": 1.8787772765617096e-05, + "loss": 0.6719, + "step": 4579 + }, + { + "epoch": 0.16, + "learning_rate": 1.878725307227519e-05, + "loss": 0.616, + "step": 4580 + }, + { + "epoch": 0.16, + "learning_rate": 1.8786733274749283e-05, + "loss": 0.6429, + "step": 4581 + }, + { + "epoch": 0.16, + "learning_rate": 1.8786213373045536e-05, + "loss": 0.6197, + "step": 4582 + }, + { + "epoch": 0.16, + "learning_rate": 1.8785693367170114e-05, + "loss": 0.6349, + "step": 4583 + }, + { + "epoch": 0.16, + "learning_rate": 1.8785173257129188e-05, + "loss": 0.6803, + "step": 4584 + }, + { + "epoch": 0.16, + "learning_rate": 1.878465304292892e-05, + "loss": 0.6506, + "step": 4585 + }, + { + "epoch": 0.16, + "learning_rate": 1.878413272457547e-05, + "loss": 0.6678, + "step": 4586 + }, + { + "epoch": 0.16, + "learning_rate": 1.878361230207502e-05, + "loss": 0.6773, + "step": 4587 + }, + { + "epoch": 0.16, + "learning_rate": 1.8783091775433732e-05, + "loss": 0.6854, + "step": 4588 + }, + { + "epoch": 0.16, + "learning_rate": 1.8782571144657784e-05, + "loss": 0.6919, + "step": 4589 + }, + { + "epoch": 0.16, + "learning_rate": 1.8782050409753344e-05, + "loss": 0.6507, + "step": 4590 + }, + { + "epoch": 0.16, + "learning_rate": 1.8781529570726587e-05, + "loss": 0.6797, + "step": 4591 + }, + { + "epoch": 0.16, + "learning_rate": 1.878100862758369e-05, + "loss": 0.6184, + "step": 4592 + }, + { + "epoch": 0.16, + "learning_rate": 1.8780487580330823e-05, + "loss": 0.6315, + "step": 4593 + }, + { + "epoch": 0.16, + "learning_rate": 1.8779966428974168e-05, + "loss": 0.6429, + "step": 4594 + }, + { + "epoch": 0.16, + "learning_rate": 1.877944517351991e-05, + "loss": 0.6331, + "step": 4595 + }, + { + "epoch": 0.16, + "learning_rate": 1.877892381397422e-05, + "loss": 0.6128, + "step": 4596 + }, + { + "epoch": 0.16, + "learning_rate": 1.877840235034328e-05, + "loss": 0.637, + "step": 4597 + }, + { + "epoch": 0.16, + "learning_rate": 1.877788078263328e-05, + "loss": 0.6693, + "step": 4598 + }, + { + "epoch": 0.16, + "learning_rate": 1.8777359110850397e-05, + "loss": 0.5934, + "step": 4599 + }, + { + "epoch": 0.16, + "learning_rate": 1.877683733500082e-05, + "loss": 0.6201, + "step": 4600 + }, + { + "epoch": 0.16, + "learning_rate": 1.877631545509073e-05, + "loss": 0.6459, + "step": 4601 + }, + { + "epoch": 0.16, + "learning_rate": 1.8775793471126324e-05, + "loss": 0.6777, + "step": 4602 + }, + { + "epoch": 0.16, + "learning_rate": 1.877527138311378e-05, + "loss": 0.6089, + "step": 4603 + }, + { + "epoch": 0.16, + "learning_rate": 1.8774749191059295e-05, + "loss": 0.6307, + "step": 4604 + }, + { + "epoch": 0.16, + "learning_rate": 1.8774226894969057e-05, + "loss": 0.6375, + "step": 4605 + }, + { + "epoch": 0.16, + "learning_rate": 1.8773704494849262e-05, + "loss": 0.5783, + "step": 4606 + }, + { + "epoch": 0.16, + "learning_rate": 1.8773181990706103e-05, + "loss": 0.5945, + "step": 4607 + }, + { + "epoch": 0.16, + "learning_rate": 1.877265938254577e-05, + "loss": 0.6209, + "step": 4608 + }, + { + "epoch": 0.16, + "learning_rate": 1.8772136670374463e-05, + "loss": 0.6447, + "step": 4609 + }, + { + "epoch": 0.16, + "learning_rate": 1.8771613854198376e-05, + "loss": 0.6229, + "step": 4610 + }, + { + "epoch": 0.16, + "learning_rate": 1.8771090934023715e-05, + "loss": 0.6713, + "step": 4611 + }, + { + "epoch": 0.16, + "learning_rate": 1.8770567909856675e-05, + "loss": 0.6003, + "step": 4612 + }, + { + "epoch": 0.16, + "learning_rate": 1.8770044781703456e-05, + "loss": 0.6639, + "step": 4613 + }, + { + "epoch": 0.16, + "learning_rate": 1.876952154957026e-05, + "loss": 0.6266, + "step": 4614 + }, + { + "epoch": 0.16, + "learning_rate": 1.8768998213463298e-05, + "loss": 0.6224, + "step": 4615 + }, + { + "epoch": 0.16, + "learning_rate": 1.8768474773388766e-05, + "loss": 0.6273, + "step": 4616 + }, + { + "epoch": 0.16, + "learning_rate": 1.8767951229352873e-05, + "loss": 0.6622, + "step": 4617 + }, + { + "epoch": 0.16, + "learning_rate": 1.876742758136183e-05, + "loss": 0.6282, + "step": 4618 + }, + { + "epoch": 0.16, + "learning_rate": 1.8766903829421838e-05, + "loss": 0.6765, + "step": 4619 + }, + { + "epoch": 0.16, + "learning_rate": 1.8766379973539113e-05, + "loss": 0.6341, + "step": 4620 + }, + { + "epoch": 0.16, + "learning_rate": 1.8765856013719863e-05, + "loss": 0.6545, + "step": 4621 + }, + { + "epoch": 0.16, + "learning_rate": 1.8765331949970303e-05, + "loss": 0.6753, + "step": 4622 + }, + { + "epoch": 0.16, + "learning_rate": 1.8764807782296644e-05, + "loss": 0.7012, + "step": 4623 + }, + { + "epoch": 0.16, + "learning_rate": 1.8764283510705098e-05, + "loss": 0.6463, + "step": 4624 + }, + { + "epoch": 0.16, + "learning_rate": 1.8763759135201887e-05, + "loss": 0.6487, + "step": 4625 + }, + { + "epoch": 0.16, + "learning_rate": 1.8763234655793226e-05, + "loss": 0.5993, + "step": 4626 + }, + { + "epoch": 0.16, + "learning_rate": 1.8762710072485332e-05, + "loss": 0.6291, + "step": 4627 + }, + { + "epoch": 0.16, + "learning_rate": 1.8762185385284422e-05, + "loss": 0.6347, + "step": 4628 + }, + { + "epoch": 0.16, + "learning_rate": 1.8761660594196724e-05, + "loss": 0.6497, + "step": 4629 + }, + { + "epoch": 0.16, + "learning_rate": 1.8761135699228454e-05, + "loss": 0.6642, + "step": 4630 + }, + { + "epoch": 0.16, + "learning_rate": 1.876061070038584e-05, + "loss": 0.6679, + "step": 4631 + }, + { + "epoch": 0.16, + "learning_rate": 1.87600855976751e-05, + "loss": 0.6631, + "step": 4632 + }, + { + "epoch": 0.16, + "learning_rate": 1.8759560391102467e-05, + "loss": 0.6467, + "step": 4633 + }, + { + "epoch": 0.16, + "learning_rate": 1.8759035080674162e-05, + "loss": 0.631, + "step": 4634 + }, + { + "epoch": 0.16, + "learning_rate": 1.8758509666396417e-05, + "loss": 0.6175, + "step": 4635 + }, + { + "epoch": 0.16, + "learning_rate": 1.875798414827546e-05, + "loss": 0.6333, + "step": 4636 + }, + { + "epoch": 0.16, + "learning_rate": 1.875745852631752e-05, + "loss": 0.6398, + "step": 4637 + }, + { + "epoch": 0.16, + "learning_rate": 1.8756932800528837e-05, + "loss": 0.6353, + "step": 4638 + }, + { + "epoch": 0.16, + "learning_rate": 1.8756406970915634e-05, + "loss": 0.6882, + "step": 4639 + }, + { + "epoch": 0.16, + "learning_rate": 1.8755881037484148e-05, + "loss": 0.6597, + "step": 4640 + }, + { + "epoch": 0.16, + "learning_rate": 1.8755355000240622e-05, + "loss": 0.5771, + "step": 4641 + }, + { + "epoch": 0.16, + "learning_rate": 1.875482885919128e-05, + "loss": 0.6046, + "step": 4642 + }, + { + "epoch": 0.16, + "learning_rate": 1.875430261434237e-05, + "loss": 0.6418, + "step": 4643 + }, + { + "epoch": 0.16, + "learning_rate": 1.875377626570013e-05, + "loss": 0.6215, + "step": 4644 + }, + { + "epoch": 0.16, + "learning_rate": 1.8753249813270796e-05, + "loss": 0.6367, + "step": 4645 + }, + { + "epoch": 0.16, + "learning_rate": 1.8752723257060612e-05, + "loss": 0.6234, + "step": 4646 + }, + { + "epoch": 0.16, + "learning_rate": 1.8752196597075824e-05, + "loss": 0.6305, + "step": 4647 + }, + { + "epoch": 0.16, + "learning_rate": 1.8751669833322673e-05, + "loss": 0.532, + "step": 4648 + }, + { + "epoch": 0.16, + "learning_rate": 1.8751142965807406e-05, + "loss": 0.6598, + "step": 4649 + }, + { + "epoch": 0.16, + "learning_rate": 1.8750615994536268e-05, + "loss": 0.6816, + "step": 4650 + }, + { + "epoch": 0.16, + "learning_rate": 1.8750088919515507e-05, + "loss": 0.6687, + "step": 4651 + }, + { + "epoch": 0.16, + "learning_rate": 1.874956174075137e-05, + "loss": 0.6969, + "step": 4652 + }, + { + "epoch": 0.16, + "learning_rate": 1.8749034458250116e-05, + "loss": 0.6736, + "step": 4653 + }, + { + "epoch": 0.16, + "learning_rate": 1.8748507072017988e-05, + "loss": 0.6353, + "step": 4654 + }, + { + "epoch": 0.16, + "learning_rate": 1.8747979582061244e-05, + "loss": 0.6241, + "step": 4655 + }, + { + "epoch": 0.16, + "learning_rate": 1.8747451988386136e-05, + "loss": 0.6942, + "step": 4656 + }, + { + "epoch": 0.16, + "learning_rate": 1.874692429099892e-05, + "loss": 0.6654, + "step": 4657 + }, + { + "epoch": 0.16, + "learning_rate": 1.874639648990585e-05, + "loss": 0.6547, + "step": 4658 + }, + { + "epoch": 0.16, + "learning_rate": 1.874586858511318e-05, + "loss": 0.6351, + "step": 4659 + }, + { + "epoch": 0.16, + "learning_rate": 1.874534057662718e-05, + "loss": 0.6086, + "step": 4660 + }, + { + "epoch": 0.16, + "learning_rate": 1.8744812464454105e-05, + "loss": 0.6218, + "step": 4661 + }, + { + "epoch": 0.16, + "learning_rate": 1.874428424860021e-05, + "loss": 0.663, + "step": 4662 + }, + { + "epoch": 0.16, + "learning_rate": 1.874375592907177e-05, + "loss": 0.5909, + "step": 4663 + }, + { + "epoch": 0.16, + "learning_rate": 1.874322750587504e-05, + "loss": 0.6045, + "step": 4664 + }, + { + "epoch": 0.16, + "learning_rate": 1.8742698979016287e-05, + "loss": 0.6865, + "step": 4665 + }, + { + "epoch": 0.16, + "learning_rate": 1.8742170348501782e-05, + "loss": 0.6368, + "step": 4666 + }, + { + "epoch": 0.16, + "learning_rate": 1.8741641614337783e-05, + "loss": 0.6492, + "step": 4667 + }, + { + "epoch": 0.16, + "learning_rate": 1.874111277653057e-05, + "loss": 0.6659, + "step": 4668 + }, + { + "epoch": 0.16, + "learning_rate": 1.8740583835086403e-05, + "loss": 0.6404, + "step": 4669 + }, + { + "epoch": 0.16, + "learning_rate": 1.8740054790011558e-05, + "loss": 0.6611, + "step": 4670 + }, + { + "epoch": 0.16, + "learning_rate": 1.873952564131231e-05, + "loss": 0.6248, + "step": 4671 + }, + { + "epoch": 0.16, + "learning_rate": 1.873899638899493e-05, + "loss": 0.6344, + "step": 4672 + }, + { + "epoch": 0.16, + "learning_rate": 1.873846703306569e-05, + "loss": 0.6667, + "step": 4673 + }, + { + "epoch": 0.16, + "learning_rate": 1.873793757353087e-05, + "loss": 0.6642, + "step": 4674 + }, + { + "epoch": 0.16, + "learning_rate": 1.873740801039675e-05, + "loss": 0.6537, + "step": 4675 + }, + { + "epoch": 0.16, + "learning_rate": 1.87368783436696e-05, + "loss": 0.6235, + "step": 4676 + }, + { + "epoch": 0.16, + "learning_rate": 1.8736348573355708e-05, + "loss": 0.5861, + "step": 4677 + }, + { + "epoch": 0.16, + "learning_rate": 1.8735818699461353e-05, + "loss": 0.6135, + "step": 4678 + }, + { + "epoch": 0.16, + "learning_rate": 1.8735288721992816e-05, + "loss": 0.6752, + "step": 4679 + }, + { + "epoch": 0.16, + "learning_rate": 1.8734758640956378e-05, + "loss": 0.6307, + "step": 4680 + }, + { + "epoch": 0.16, + "learning_rate": 1.8734228456358327e-05, + "loss": 0.6368, + "step": 4681 + }, + { + "epoch": 0.16, + "learning_rate": 1.8733698168204952e-05, + "loss": 0.6201, + "step": 4682 + }, + { + "epoch": 0.16, + "learning_rate": 1.8733167776502535e-05, + "loss": 0.6876, + "step": 4683 + }, + { + "epoch": 0.16, + "learning_rate": 1.873263728125737e-05, + "loss": 0.6247, + "step": 4684 + }, + { + "epoch": 0.16, + "learning_rate": 1.873210668247574e-05, + "loss": 0.6363, + "step": 4685 + }, + { + "epoch": 0.16, + "learning_rate": 1.8731575980163938e-05, + "loss": 0.6401, + "step": 4686 + }, + { + "epoch": 0.16, + "learning_rate": 1.8731045174328258e-05, + "loss": 0.6085, + "step": 4687 + }, + { + "epoch": 0.16, + "learning_rate": 1.8730514264974994e-05, + "loss": 0.6299, + "step": 4688 + }, + { + "epoch": 0.16, + "learning_rate": 1.872998325211044e-05, + "loss": 0.7117, + "step": 4689 + }, + { + "epoch": 0.16, + "learning_rate": 1.872945213574089e-05, + "loss": 0.6276, + "step": 4690 + }, + { + "epoch": 0.16, + "learning_rate": 1.872892091587264e-05, + "loss": 0.6059, + "step": 4691 + }, + { + "epoch": 0.16, + "learning_rate": 1.8728389592511993e-05, + "loss": 0.6398, + "step": 4692 + }, + { + "epoch": 0.16, + "learning_rate": 1.8727858165665244e-05, + "loss": 0.6197, + "step": 4693 + }, + { + "epoch": 0.16, + "learning_rate": 1.8727326635338696e-05, + "loss": 0.6469, + "step": 4694 + }, + { + "epoch": 0.16, + "learning_rate": 1.8726795001538654e-05, + "loss": 0.606, + "step": 4695 + }, + { + "epoch": 0.16, + "learning_rate": 1.8726263264271413e-05, + "loss": 0.6706, + "step": 4696 + }, + { + "epoch": 0.16, + "learning_rate": 1.8725731423543285e-05, + "loss": 0.593, + "step": 4697 + }, + { + "epoch": 0.16, + "learning_rate": 1.8725199479360572e-05, + "loss": 0.6001, + "step": 4698 + }, + { + "epoch": 0.16, + "learning_rate": 1.8724667431729583e-05, + "loss": 0.6003, + "step": 4699 + }, + { + "epoch": 0.16, + "learning_rate": 1.872413528065662e-05, + "loss": 0.6181, + "step": 4700 + }, + { + "epoch": 0.16, + "learning_rate": 1.8723603026148e-05, + "loss": 0.6552, + "step": 4701 + }, + { + "epoch": 0.16, + "learning_rate": 1.8723070668210036e-05, + "loss": 0.6534, + "step": 4702 + }, + { + "epoch": 0.16, + "learning_rate": 1.8722538206849027e-05, + "loss": 0.6742, + "step": 4703 + }, + { + "epoch": 0.16, + "learning_rate": 1.8722005642071298e-05, + "loss": 0.7013, + "step": 4704 + }, + { + "epoch": 0.16, + "learning_rate": 1.872147297388316e-05, + "loss": 0.6227, + "step": 4705 + }, + { + "epoch": 0.16, + "learning_rate": 1.872094020229092e-05, + "loss": 0.7003, + "step": 4706 + }, + { + "epoch": 0.16, + "learning_rate": 1.8720407327300907e-05, + "loss": 0.6637, + "step": 4707 + }, + { + "epoch": 0.16, + "learning_rate": 1.8719874348919433e-05, + "loss": 0.6504, + "step": 4708 + }, + { + "epoch": 0.16, + "learning_rate": 1.871934126715282e-05, + "loss": 0.6045, + "step": 4709 + }, + { + "epoch": 0.16, + "learning_rate": 1.8718808082007385e-05, + "loss": 0.6592, + "step": 4710 + }, + { + "epoch": 0.16, + "learning_rate": 1.871827479348945e-05, + "loss": 0.6477, + "step": 4711 + }, + { + "epoch": 0.16, + "learning_rate": 1.8717741401605338e-05, + "loss": 0.6106, + "step": 4712 + }, + { + "epoch": 0.16, + "learning_rate": 1.8717207906361375e-05, + "loss": 0.6168, + "step": 4713 + }, + { + "epoch": 0.16, + "learning_rate": 1.8716674307763884e-05, + "loss": 0.6469, + "step": 4714 + }, + { + "epoch": 0.16, + "learning_rate": 1.8716140605819192e-05, + "loss": 0.6426, + "step": 4715 + }, + { + "epoch": 0.16, + "learning_rate": 1.8715606800533627e-05, + "loss": 0.611, + "step": 4716 + }, + { + "epoch": 0.16, + "learning_rate": 1.871507289191352e-05, + "loss": 0.663, + "step": 4717 + }, + { + "epoch": 0.16, + "learning_rate": 1.8714538879965198e-05, + "loss": 0.6219, + "step": 4718 + }, + { + "epoch": 0.16, + "learning_rate": 1.8714004764694994e-05, + "loss": 0.6435, + "step": 4719 + }, + { + "epoch": 0.16, + "learning_rate": 1.871347054610924e-05, + "loss": 0.5847, + "step": 4720 + }, + { + "epoch": 0.16, + "learning_rate": 1.871293622421427e-05, + "loss": 0.6238, + "step": 4721 + }, + { + "epoch": 0.16, + "learning_rate": 1.8712401799016418e-05, + "loss": 0.6204, + "step": 4722 + }, + { + "epoch": 0.16, + "learning_rate": 1.8711867270522024e-05, + "loss": 0.6781, + "step": 4723 + }, + { + "epoch": 0.16, + "learning_rate": 1.871133263873742e-05, + "loss": 0.614, + "step": 4724 + }, + { + "epoch": 0.16, + "learning_rate": 1.871079790366895e-05, + "loss": 0.5951, + "step": 4725 + }, + { + "epoch": 0.16, + "learning_rate": 1.8710263065322952e-05, + "loss": 0.6438, + "step": 4726 + }, + { + "epoch": 0.16, + "learning_rate": 1.8709728123705765e-05, + "loss": 0.6295, + "step": 4727 + }, + { + "epoch": 0.16, + "learning_rate": 1.8709193078823735e-05, + "loss": 0.5874, + "step": 4728 + }, + { + "epoch": 0.16, + "learning_rate": 1.8708657930683202e-05, + "loss": 0.6966, + "step": 4729 + }, + { + "epoch": 0.16, + "learning_rate": 1.8708122679290515e-05, + "loss": 0.6314, + "step": 4730 + }, + { + "epoch": 0.16, + "learning_rate": 1.8707587324652016e-05, + "loss": 0.6398, + "step": 4731 + }, + { + "epoch": 0.16, + "learning_rate": 1.870705186677405e-05, + "loss": 0.6707, + "step": 4732 + }, + { + "epoch": 0.16, + "learning_rate": 1.8706516305662977e-05, + "loss": 0.7148, + "step": 4733 + }, + { + "epoch": 0.16, + "learning_rate": 1.870598064132514e-05, + "loss": 0.6196, + "step": 4734 + }, + { + "epoch": 0.16, + "learning_rate": 1.8705444873766882e-05, + "loss": 0.6429, + "step": 4735 + }, + { + "epoch": 0.16, + "learning_rate": 1.870490900299457e-05, + "loss": 0.5796, + "step": 4736 + }, + { + "epoch": 0.16, + "learning_rate": 1.8704373029014547e-05, + "loss": 0.6406, + "step": 4737 + }, + { + "epoch": 0.16, + "learning_rate": 1.8703836951833166e-05, + "loss": 0.612, + "step": 4738 + }, + { + "epoch": 0.16, + "learning_rate": 1.8703300771456793e-05, + "loss": 0.6977, + "step": 4739 + }, + { + "epoch": 0.16, + "learning_rate": 1.870276448789178e-05, + "loss": 0.6248, + "step": 4740 + }, + { + "epoch": 0.16, + "learning_rate": 1.870222810114448e-05, + "loss": 0.6579, + "step": 4741 + }, + { + "epoch": 0.16, + "learning_rate": 1.870169161122126e-05, + "loss": 0.643, + "step": 4742 + }, + { + "epoch": 0.16, + "learning_rate": 1.8701155018128484e-05, + "loss": 0.6169, + "step": 4743 + }, + { + "epoch": 0.16, + "learning_rate": 1.87006183218725e-05, + "loss": 0.6065, + "step": 4744 + }, + { + "epoch": 0.16, + "learning_rate": 1.8700081522459682e-05, + "loss": 0.6399, + "step": 4745 + }, + { + "epoch": 0.16, + "learning_rate": 1.8699544619896393e-05, + "loss": 0.6522, + "step": 4746 + }, + { + "epoch": 0.16, + "learning_rate": 1.8699007614189e-05, + "loss": 0.6503, + "step": 4747 + }, + { + "epoch": 0.16, + "learning_rate": 1.8698470505343863e-05, + "loss": 0.5965, + "step": 4748 + }, + { + "epoch": 0.16, + "learning_rate": 1.8697933293367357e-05, + "loss": 0.6617, + "step": 4749 + }, + { + "epoch": 0.16, + "learning_rate": 1.869739597826585e-05, + "loss": 0.6681, + "step": 4750 + }, + { + "epoch": 0.16, + "learning_rate": 1.869685856004571e-05, + "loss": 0.6624, + "step": 4751 + }, + { + "epoch": 0.16, + "learning_rate": 1.869632103871331e-05, + "loss": 0.7247, + "step": 4752 + }, + { + "epoch": 0.16, + "learning_rate": 1.869578341427502e-05, + "loss": 0.6279, + "step": 4753 + }, + { + "epoch": 0.16, + "learning_rate": 1.869524568673722e-05, + "loss": 0.7001, + "step": 4754 + }, + { + "epoch": 0.16, + "learning_rate": 1.8694707856106284e-05, + "loss": 0.6289, + "step": 4755 + }, + { + "epoch": 0.16, + "learning_rate": 1.8694169922388586e-05, + "loss": 0.5541, + "step": 4756 + }, + { + "epoch": 0.16, + "learning_rate": 1.8693631885590505e-05, + "loss": 0.6316, + "step": 4757 + }, + { + "epoch": 0.16, + "learning_rate": 1.869309374571842e-05, + "loss": 0.6254, + "step": 4758 + }, + { + "epoch": 0.16, + "learning_rate": 1.8692555502778715e-05, + "loss": 0.7052, + "step": 4759 + }, + { + "epoch": 0.16, + "learning_rate": 1.8692017156777765e-05, + "loss": 0.6439, + "step": 4760 + }, + { + "epoch": 0.16, + "learning_rate": 1.869147870772196e-05, + "loss": 0.6367, + "step": 4761 + }, + { + "epoch": 0.16, + "learning_rate": 1.8690940155617676e-05, + "loss": 0.6039, + "step": 4762 + }, + { + "epoch": 0.17, + "learning_rate": 1.8690401500471303e-05, + "loss": 0.6797, + "step": 4763 + }, + { + "epoch": 0.17, + "learning_rate": 1.868986274228923e-05, + "loss": 0.6068, + "step": 4764 + }, + { + "epoch": 0.17, + "learning_rate": 1.8689323881077838e-05, + "loss": 0.6014, + "step": 4765 + }, + { + "epoch": 0.17, + "learning_rate": 1.868878491684352e-05, + "loss": 0.6244, + "step": 4766 + }, + { + "epoch": 0.17, + "learning_rate": 1.868824584959267e-05, + "loss": 0.5863, + "step": 4767 + }, + { + "epoch": 0.17, + "learning_rate": 1.8687706679331673e-05, + "loss": 0.7018, + "step": 4768 + }, + { + "epoch": 0.17, + "learning_rate": 1.8687167406066917e-05, + "loss": 0.6306, + "step": 4769 + }, + { + "epoch": 0.17, + "learning_rate": 1.8686628029804807e-05, + "loss": 0.6188, + "step": 4770 + }, + { + "epoch": 0.17, + "learning_rate": 1.8686088550551735e-05, + "loss": 0.655, + "step": 4771 + }, + { + "epoch": 0.17, + "learning_rate": 1.868554896831409e-05, + "loss": 0.6787, + "step": 4772 + }, + { + "epoch": 0.17, + "learning_rate": 1.868500928309828e-05, + "loss": 0.6495, + "step": 4773 + }, + { + "epoch": 0.17, + "learning_rate": 1.8684469494910694e-05, + "loss": 0.651, + "step": 4774 + }, + { + "epoch": 0.17, + "learning_rate": 1.8683929603757738e-05, + "loss": 0.618, + "step": 4775 + }, + { + "epoch": 0.17, + "learning_rate": 1.8683389609645812e-05, + "loss": 0.6496, + "step": 4776 + }, + { + "epoch": 0.17, + "learning_rate": 1.8682849512581315e-05, + "loss": 0.609, + "step": 4777 + }, + { + "epoch": 0.17, + "learning_rate": 1.868230931257066e-05, + "loss": 0.6372, + "step": 4778 + }, + { + "epoch": 0.17, + "learning_rate": 1.8681769009620237e-05, + "loss": 0.6401, + "step": 4779 + }, + { + "epoch": 0.17, + "learning_rate": 1.8681228603736462e-05, + "loss": 0.6011, + "step": 4780 + }, + { + "epoch": 0.17, + "learning_rate": 1.8680688094925742e-05, + "loss": 0.6102, + "step": 4781 + }, + { + "epoch": 0.17, + "learning_rate": 1.8680147483194484e-05, + "loss": 0.6712, + "step": 4782 + }, + { + "epoch": 0.17, + "learning_rate": 1.8679606768549093e-05, + "loss": 0.6547, + "step": 4783 + }, + { + "epoch": 0.17, + "learning_rate": 1.867906595099599e-05, + "loss": 0.6247, + "step": 4784 + }, + { + "epoch": 0.17, + "learning_rate": 1.8678525030541578e-05, + "loss": 0.6567, + "step": 4785 + }, + { + "epoch": 0.17, + "learning_rate": 1.867798400719227e-05, + "loss": 0.6171, + "step": 4786 + }, + { + "epoch": 0.17, + "learning_rate": 1.867744288095449e-05, + "loss": 0.5696, + "step": 4787 + }, + { + "epoch": 0.17, + "learning_rate": 1.8676901651834645e-05, + "loss": 0.6543, + "step": 4788 + }, + { + "epoch": 0.17, + "learning_rate": 1.8676360319839153e-05, + "loss": 0.6076, + "step": 4789 + }, + { + "epoch": 0.17, + "learning_rate": 1.8675818884974434e-05, + "loss": 0.6193, + "step": 4790 + }, + { + "epoch": 0.17, + "learning_rate": 1.867527734724691e-05, + "loss": 0.6167, + "step": 4791 + }, + { + "epoch": 0.17, + "learning_rate": 1.8674735706662998e-05, + "loss": 0.6661, + "step": 4792 + }, + { + "epoch": 0.17, + "learning_rate": 1.8674193963229116e-05, + "loss": 0.6836, + "step": 4793 + }, + { + "epoch": 0.17, + "learning_rate": 1.8673652116951698e-05, + "loss": 0.6105, + "step": 4794 + }, + { + "epoch": 0.17, + "learning_rate": 1.867311016783716e-05, + "loss": 0.6166, + "step": 4795 + }, + { + "epoch": 0.17, + "learning_rate": 1.8672568115891926e-05, + "loss": 0.6272, + "step": 4796 + }, + { + "epoch": 0.17, + "learning_rate": 1.867202596112243e-05, + "loss": 0.673, + "step": 4797 + }, + { + "epoch": 0.17, + "learning_rate": 1.8671483703535092e-05, + "loss": 0.6683, + "step": 4798 + }, + { + "epoch": 0.17, + "learning_rate": 1.8670941343136347e-05, + "loss": 0.6155, + "step": 4799 + }, + { + "epoch": 0.17, + "learning_rate": 1.8670398879932626e-05, + "loss": 0.6422, + "step": 4800 + }, + { + "epoch": 0.17, + "learning_rate": 1.8669856313930358e-05, + "loss": 0.6163, + "step": 4801 + }, + { + "epoch": 0.17, + "learning_rate": 1.8669313645135973e-05, + "loss": 0.6298, + "step": 4802 + }, + { + "epoch": 0.17, + "learning_rate": 1.866877087355591e-05, + "loss": 0.6707, + "step": 4803 + }, + { + "epoch": 0.17, + "learning_rate": 1.8668227999196605e-05, + "loss": 0.6075, + "step": 4804 + }, + { + "epoch": 0.17, + "learning_rate": 1.8667685022064486e-05, + "loss": 0.6265, + "step": 4805 + }, + { + "epoch": 0.17, + "learning_rate": 1.8667141942165998e-05, + "loss": 0.6372, + "step": 4806 + }, + { + "epoch": 0.17, + "learning_rate": 1.8666598759507582e-05, + "loss": 0.6325, + "step": 4807 + }, + { + "epoch": 0.17, + "learning_rate": 1.866605547409567e-05, + "loss": 0.7276, + "step": 4808 + }, + { + "epoch": 0.17, + "learning_rate": 1.866551208593671e-05, + "loss": 0.6292, + "step": 4809 + }, + { + "epoch": 0.17, + "learning_rate": 1.8664968595037143e-05, + "loss": 0.7128, + "step": 4810 + }, + { + "epoch": 0.17, + "learning_rate": 1.866442500140341e-05, + "loss": 0.6886, + "step": 4811 + }, + { + "epoch": 0.17, + "learning_rate": 1.866388130504196e-05, + "loss": 0.6813, + "step": 4812 + }, + { + "epoch": 0.17, + "learning_rate": 1.8663337505959233e-05, + "loss": 0.6535, + "step": 4813 + }, + { + "epoch": 0.17, + "learning_rate": 1.8662793604161687e-05, + "loss": 0.5794, + "step": 4814 + }, + { + "epoch": 0.17, + "learning_rate": 1.866224959965576e-05, + "loss": 0.6694, + "step": 4815 + }, + { + "epoch": 0.17, + "learning_rate": 1.8661705492447905e-05, + "loss": 0.6601, + "step": 4816 + }, + { + "epoch": 0.17, + "learning_rate": 1.8661161282544577e-05, + "loss": 0.6957, + "step": 4817 + }, + { + "epoch": 0.17, + "learning_rate": 1.8660616969952227e-05, + "loss": 0.6236, + "step": 4818 + }, + { + "epoch": 0.17, + "learning_rate": 1.8660072554677304e-05, + "loss": 0.7016, + "step": 4819 + }, + { + "epoch": 0.17, + "learning_rate": 1.8659528036726268e-05, + "loss": 0.5994, + "step": 4820 + }, + { + "epoch": 0.17, + "learning_rate": 1.865898341610557e-05, + "loss": 0.6827, + "step": 4821 + }, + { + "epoch": 0.17, + "learning_rate": 1.8658438692821673e-05, + "loss": 0.6862, + "step": 4822 + }, + { + "epoch": 0.17, + "learning_rate": 1.865789386688103e-05, + "loss": 0.6264, + "step": 4823 + }, + { + "epoch": 0.17, + "learning_rate": 1.8657348938290105e-05, + "loss": 0.6515, + "step": 4824 + }, + { + "epoch": 0.17, + "learning_rate": 1.8656803907055358e-05, + "loss": 0.5885, + "step": 4825 + }, + { + "epoch": 0.17, + "learning_rate": 1.8656258773183246e-05, + "loss": 0.6854, + "step": 4826 + }, + { + "epoch": 0.17, + "learning_rate": 1.8655713536680235e-05, + "loss": 0.6263, + "step": 4827 + }, + { + "epoch": 0.17, + "learning_rate": 1.8655168197552796e-05, + "loss": 0.612, + "step": 4828 + }, + { + "epoch": 0.17, + "learning_rate": 1.8654622755807386e-05, + "loss": 0.631, + "step": 4829 + }, + { + "epoch": 0.17, + "learning_rate": 1.8654077211450474e-05, + "loss": 0.6431, + "step": 4830 + }, + { + "epoch": 0.17, + "learning_rate": 1.8653531564488528e-05, + "loss": 0.6326, + "step": 4831 + }, + { + "epoch": 0.17, + "learning_rate": 1.8652985814928025e-05, + "loss": 0.5824, + "step": 4832 + }, + { + "epoch": 0.17, + "learning_rate": 1.8652439962775423e-05, + "loss": 0.6111, + "step": 4833 + }, + { + "epoch": 0.17, + "learning_rate": 1.86518940080372e-05, + "loss": 0.6223, + "step": 4834 + }, + { + "epoch": 0.17, + "learning_rate": 1.8651347950719833e-05, + "loss": 0.63, + "step": 4835 + }, + { + "epoch": 0.17, + "learning_rate": 1.865080179082979e-05, + "loss": 0.6183, + "step": 4836 + }, + { + "epoch": 0.17, + "learning_rate": 1.865025552837355e-05, + "loss": 0.6273, + "step": 4837 + }, + { + "epoch": 0.17, + "learning_rate": 1.8649709163357585e-05, + "loss": 0.6433, + "step": 4838 + }, + { + "epoch": 0.17, + "learning_rate": 1.8649162695788378e-05, + "loss": 0.5928, + "step": 4839 + }, + { + "epoch": 0.17, + "learning_rate": 1.8648616125672405e-05, + "loss": 0.638, + "step": 4840 + }, + { + "epoch": 0.17, + "learning_rate": 1.8648069453016148e-05, + "loss": 0.6406, + "step": 4841 + }, + { + "epoch": 0.17, + "learning_rate": 1.8647522677826086e-05, + "loss": 0.6403, + "step": 4842 + }, + { + "epoch": 0.17, + "learning_rate": 1.8646975800108705e-05, + "loss": 0.6449, + "step": 4843 + }, + { + "epoch": 0.17, + "learning_rate": 1.864642881987049e-05, + "loss": 0.6871, + "step": 4844 + }, + { + "epoch": 0.17, + "learning_rate": 1.8645881737117915e-05, + "loss": 0.6721, + "step": 4845 + }, + { + "epoch": 0.17, + "learning_rate": 1.8645334551857485e-05, + "loss": 0.6574, + "step": 4846 + }, + { + "epoch": 0.17, + "learning_rate": 1.864478726409567e-05, + "loss": 0.6076, + "step": 4847 + }, + { + "epoch": 0.17, + "learning_rate": 1.864423987383897e-05, + "loss": 0.6159, + "step": 4848 + }, + { + "epoch": 0.17, + "learning_rate": 1.8643692381093873e-05, + "loss": 0.5847, + "step": 4849 + }, + { + "epoch": 0.17, + "learning_rate": 1.8643144785866863e-05, + "loss": 0.628, + "step": 4850 + }, + { + "epoch": 0.17, + "learning_rate": 1.864259708816444e-05, + "loss": 0.6153, + "step": 4851 + }, + { + "epoch": 0.17, + "learning_rate": 1.86420492879931e-05, + "loss": 0.677, + "step": 4852 + }, + { + "epoch": 0.17, + "learning_rate": 1.8641501385359327e-05, + "loss": 0.7157, + "step": 4853 + }, + { + "epoch": 0.17, + "learning_rate": 1.864095338026963e-05, + "loss": 0.6272, + "step": 4854 + }, + { + "epoch": 0.17, + "learning_rate": 1.8640405272730496e-05, + "loss": 0.6213, + "step": 4855 + }, + { + "epoch": 0.17, + "learning_rate": 1.8639857062748428e-05, + "loss": 0.6728, + "step": 4856 + }, + { + "epoch": 0.17, + "learning_rate": 1.8639308750329925e-05, + "loss": 0.6185, + "step": 4857 + }, + { + "epoch": 0.17, + "learning_rate": 1.8638760335481486e-05, + "loss": 0.6255, + "step": 4858 + }, + { + "epoch": 0.17, + "learning_rate": 1.8638211818209616e-05, + "loss": 0.6245, + "step": 4859 + }, + { + "epoch": 0.17, + "learning_rate": 1.8637663198520818e-05, + "loss": 0.6785, + "step": 4860 + }, + { + "epoch": 0.17, + "learning_rate": 1.86371144764216e-05, + "loss": 0.6226, + "step": 4861 + }, + { + "epoch": 0.17, + "learning_rate": 1.8636565651918455e-05, + "loss": 0.5986, + "step": 4862 + }, + { + "epoch": 0.17, + "learning_rate": 1.863601672501791e-05, + "loss": 0.6621, + "step": 4863 + }, + { + "epoch": 0.17, + "learning_rate": 1.8635467695726454e-05, + "loss": 0.6364, + "step": 4864 + }, + { + "epoch": 0.17, + "learning_rate": 1.8634918564050606e-05, + "loss": 0.6405, + "step": 4865 + }, + { + "epoch": 0.17, + "learning_rate": 1.8634369329996875e-05, + "loss": 0.6418, + "step": 4866 + }, + { + "epoch": 0.17, + "learning_rate": 1.8633819993571775e-05, + "loss": 0.6417, + "step": 4867 + }, + { + "epoch": 0.17, + "learning_rate": 1.8633270554781818e-05, + "loss": 0.6937, + "step": 4868 + }, + { + "epoch": 0.17, + "learning_rate": 1.8632721013633513e-05, + "loss": 0.6393, + "step": 4869 + }, + { + "epoch": 0.17, + "learning_rate": 1.8632171370133386e-05, + "loss": 0.6328, + "step": 4870 + }, + { + "epoch": 0.17, + "learning_rate": 1.8631621624287945e-05, + "loss": 0.6575, + "step": 4871 + }, + { + "epoch": 0.17, + "learning_rate": 1.863107177610371e-05, + "loss": 0.5902, + "step": 4872 + }, + { + "epoch": 0.17, + "learning_rate": 1.86305218255872e-05, + "loss": 0.6626, + "step": 4873 + }, + { + "epoch": 0.17, + "learning_rate": 1.8629971772744936e-05, + "loss": 0.6392, + "step": 4874 + }, + { + "epoch": 0.17, + "learning_rate": 1.862942161758344e-05, + "loss": 0.6641, + "step": 4875 + }, + { + "epoch": 0.17, + "learning_rate": 1.862887136010923e-05, + "loss": 0.6244, + "step": 4876 + }, + { + "epoch": 0.17, + "learning_rate": 1.8628321000328845e-05, + "loss": 0.6355, + "step": 4877 + }, + { + "epoch": 0.17, + "learning_rate": 1.8627770538248793e-05, + "loss": 0.6341, + "step": 4878 + }, + { + "epoch": 0.17, + "learning_rate": 1.8627219973875608e-05, + "loss": 0.6511, + "step": 4879 + }, + { + "epoch": 0.17, + "learning_rate": 1.8626669307215815e-05, + "loss": 0.6921, + "step": 4880 + }, + { + "epoch": 0.17, + "learning_rate": 1.8626118538275947e-05, + "loss": 0.6519, + "step": 4881 + }, + { + "epoch": 0.17, + "learning_rate": 1.862556766706253e-05, + "loss": 0.6392, + "step": 4882 + }, + { + "epoch": 0.17, + "learning_rate": 1.86250166935821e-05, + "loss": 0.6559, + "step": 4883 + }, + { + "epoch": 0.17, + "learning_rate": 1.8624465617841182e-05, + "loss": 0.6266, + "step": 4884 + }, + { + "epoch": 0.17, + "learning_rate": 1.8623914439846318e-05, + "loss": 0.6388, + "step": 4885 + }, + { + "epoch": 0.17, + "learning_rate": 1.8623363159604037e-05, + "loss": 0.5824, + "step": 4886 + }, + { + "epoch": 0.17, + "learning_rate": 1.8622811777120878e-05, + "loss": 0.6654, + "step": 4887 + }, + { + "epoch": 0.17, + "learning_rate": 1.8622260292403377e-05, + "loss": 0.6111, + "step": 4888 + }, + { + "epoch": 0.17, + "learning_rate": 1.862170870545807e-05, + "loss": 0.6833, + "step": 4889 + }, + { + "epoch": 0.17, + "learning_rate": 1.8621157016291506e-05, + "loss": 0.6175, + "step": 4890 + }, + { + "epoch": 0.17, + "learning_rate": 1.8620605224910215e-05, + "loss": 0.607, + "step": 4891 + }, + { + "epoch": 0.17, + "learning_rate": 1.8620053331320745e-05, + "loss": 0.6195, + "step": 4892 + }, + { + "epoch": 0.17, + "learning_rate": 1.861950133552964e-05, + "loss": 0.6027, + "step": 4893 + }, + { + "epoch": 0.17, + "learning_rate": 1.861894923754344e-05, + "loss": 0.608, + "step": 4894 + }, + { + "epoch": 0.17, + "learning_rate": 1.8618397037368698e-05, + "loss": 0.623, + "step": 4895 + }, + { + "epoch": 0.17, + "learning_rate": 1.8617844735011953e-05, + "loss": 0.6617, + "step": 4896 + }, + { + "epoch": 0.17, + "learning_rate": 1.8617292330479757e-05, + "loss": 0.6446, + "step": 4897 + }, + { + "epoch": 0.17, + "learning_rate": 1.861673982377866e-05, + "loss": 0.6466, + "step": 4898 + }, + { + "epoch": 0.17, + "learning_rate": 1.8616187214915214e-05, + "loss": 0.6343, + "step": 4899 + }, + { + "epoch": 0.17, + "learning_rate": 1.8615634503895968e-05, + "loss": 0.6784, + "step": 4900 + }, + { + "epoch": 0.17, + "learning_rate": 1.8615081690727476e-05, + "loss": 0.6467, + "step": 4901 + }, + { + "epoch": 0.17, + "learning_rate": 1.861452877541629e-05, + "loss": 0.5737, + "step": 4902 + }, + { + "epoch": 0.17, + "learning_rate": 1.8613975757968974e-05, + "loss": 0.6416, + "step": 4903 + }, + { + "epoch": 0.17, + "learning_rate": 1.8613422638392077e-05, + "loss": 0.6959, + "step": 4904 + }, + { + "epoch": 0.17, + "learning_rate": 1.8612869416692154e-05, + "loss": 0.6301, + "step": 4905 + }, + { + "epoch": 0.17, + "learning_rate": 1.8612316092875772e-05, + "loss": 0.6246, + "step": 4906 + }, + { + "epoch": 0.17, + "learning_rate": 1.861176266694949e-05, + "loss": 0.6276, + "step": 4907 + }, + { + "epoch": 0.17, + "learning_rate": 1.8611209138919865e-05, + "loss": 0.6958, + "step": 4908 + }, + { + "epoch": 0.17, + "learning_rate": 1.8610655508793462e-05, + "loss": 0.6177, + "step": 4909 + }, + { + "epoch": 0.17, + "learning_rate": 1.8610101776576844e-05, + "loss": 0.6507, + "step": 4910 + }, + { + "epoch": 0.17, + "learning_rate": 1.860954794227658e-05, + "loss": 0.6072, + "step": 4911 + }, + { + "epoch": 0.17, + "learning_rate": 1.8608994005899233e-05, + "loss": 0.6369, + "step": 4912 + }, + { + "epoch": 0.17, + "learning_rate": 1.8608439967451372e-05, + "loss": 0.6859, + "step": 4913 + }, + { + "epoch": 0.17, + "learning_rate": 1.8607885826939568e-05, + "loss": 0.6586, + "step": 4914 + }, + { + "epoch": 0.17, + "learning_rate": 1.8607331584370384e-05, + "loss": 0.6591, + "step": 4915 + }, + { + "epoch": 0.17, + "learning_rate": 1.86067772397504e-05, + "loss": 0.576, + "step": 4916 + }, + { + "epoch": 0.17, + "learning_rate": 1.860622279308618e-05, + "loss": 0.6781, + "step": 4917 + }, + { + "epoch": 0.17, + "learning_rate": 1.8605668244384306e-05, + "loss": 0.6332, + "step": 4918 + }, + { + "epoch": 0.17, + "learning_rate": 1.8605113593651343e-05, + "loss": 0.6963, + "step": 4919 + }, + { + "epoch": 0.17, + "learning_rate": 1.860455884089388e-05, + "loss": 0.6394, + "step": 4920 + }, + { + "epoch": 0.17, + "learning_rate": 1.8604003986118483e-05, + "loss": 0.6333, + "step": 4921 + }, + { + "epoch": 0.17, + "learning_rate": 1.8603449029331734e-05, + "loss": 0.5868, + "step": 4922 + }, + { + "epoch": 0.17, + "learning_rate": 1.8602893970540216e-05, + "loss": 0.6599, + "step": 4923 + }, + { + "epoch": 0.17, + "learning_rate": 1.8602338809750504e-05, + "loss": 0.6761, + "step": 4924 + }, + { + "epoch": 0.17, + "learning_rate": 1.8601783546969187e-05, + "loss": 0.6136, + "step": 4925 + }, + { + "epoch": 0.17, + "learning_rate": 1.8601228182202842e-05, + "loss": 0.6627, + "step": 4926 + }, + { + "epoch": 0.17, + "learning_rate": 1.8600672715458057e-05, + "loss": 0.6485, + "step": 4927 + }, + { + "epoch": 0.17, + "learning_rate": 1.860011714674142e-05, + "loss": 0.6324, + "step": 4928 + }, + { + "epoch": 0.17, + "learning_rate": 1.859956147605951e-05, + "loss": 0.6264, + "step": 4929 + }, + { + "epoch": 0.17, + "learning_rate": 1.859900570341892e-05, + "loss": 0.6234, + "step": 4930 + }, + { + "epoch": 0.17, + "learning_rate": 1.8598449828826244e-05, + "loss": 0.6551, + "step": 4931 + }, + { + "epoch": 0.17, + "learning_rate": 1.8597893852288066e-05, + "loss": 0.6321, + "step": 4932 + }, + { + "epoch": 0.17, + "learning_rate": 1.859733777381098e-05, + "loss": 0.6324, + "step": 4933 + }, + { + "epoch": 0.17, + "learning_rate": 1.859678159340158e-05, + "loss": 0.6407, + "step": 4934 + }, + { + "epoch": 0.17, + "learning_rate": 1.8596225311066458e-05, + "loss": 0.6994, + "step": 4935 + }, + { + "epoch": 0.17, + "learning_rate": 1.859566892681221e-05, + "loss": 0.6406, + "step": 4936 + }, + { + "epoch": 0.17, + "learning_rate": 1.859511244064544e-05, + "loss": 0.6509, + "step": 4937 + }, + { + "epoch": 0.17, + "learning_rate": 1.859455585257273e-05, + "loss": 0.6904, + "step": 4938 + }, + { + "epoch": 0.17, + "learning_rate": 1.8593999162600692e-05, + "loss": 0.5893, + "step": 4939 + }, + { + "epoch": 0.17, + "learning_rate": 1.859344237073592e-05, + "loss": 0.6898, + "step": 4940 + }, + { + "epoch": 0.17, + "learning_rate": 1.859288547698502e-05, + "loss": 0.645, + "step": 4941 + }, + { + "epoch": 0.17, + "learning_rate": 1.8592328481354592e-05, + "loss": 0.6249, + "step": 4942 + }, + { + "epoch": 0.17, + "learning_rate": 1.8591771383851243e-05, + "loss": 0.6808, + "step": 4943 + }, + { + "epoch": 0.17, + "learning_rate": 1.8591214184481574e-05, + "loss": 0.6308, + "step": 4944 + }, + { + "epoch": 0.17, + "learning_rate": 1.8590656883252192e-05, + "loss": 0.6344, + "step": 4945 + }, + { + "epoch": 0.17, + "learning_rate": 1.8590099480169707e-05, + "loss": 0.6396, + "step": 4946 + }, + { + "epoch": 0.17, + "learning_rate": 1.8589541975240726e-05, + "loss": 0.6251, + "step": 4947 + }, + { + "epoch": 0.17, + "learning_rate": 1.858898436847186e-05, + "loss": 0.6302, + "step": 4948 + }, + { + "epoch": 0.17, + "learning_rate": 1.8588426659869716e-05, + "loss": 0.6778, + "step": 4949 + }, + { + "epoch": 0.17, + "learning_rate": 1.858786884944091e-05, + "loss": 0.5824, + "step": 4950 + }, + { + "epoch": 0.17, + "learning_rate": 1.8587310937192057e-05, + "loss": 0.6394, + "step": 4951 + }, + { + "epoch": 0.17, + "learning_rate": 1.858675292312977e-05, + "loss": 0.66, + "step": 4952 + }, + { + "epoch": 0.17, + "learning_rate": 1.8586194807260663e-05, + "loss": 0.64, + "step": 4953 + }, + { + "epoch": 0.17, + "learning_rate": 1.8585636589591356e-05, + "loss": 0.6473, + "step": 4954 + }, + { + "epoch": 0.17, + "learning_rate": 1.8585078270128466e-05, + "loss": 0.6018, + "step": 4955 + }, + { + "epoch": 0.17, + "learning_rate": 1.8584519848878612e-05, + "loss": 0.6786, + "step": 4956 + }, + { + "epoch": 0.17, + "learning_rate": 1.858396132584842e-05, + "loss": 0.6455, + "step": 4957 + }, + { + "epoch": 0.17, + "learning_rate": 1.8583402701044502e-05, + "loss": 0.6583, + "step": 4958 + }, + { + "epoch": 0.17, + "learning_rate": 1.858284397447349e-05, + "loss": 0.6634, + "step": 4959 + }, + { + "epoch": 0.17, + "learning_rate": 1.8582285146142005e-05, + "loss": 0.5984, + "step": 4960 + }, + { + "epoch": 0.17, + "learning_rate": 1.858172621605667e-05, + "loss": 0.6435, + "step": 4961 + }, + { + "epoch": 0.17, + "learning_rate": 1.858116718422412e-05, + "loss": 0.6318, + "step": 4962 + }, + { + "epoch": 0.17, + "learning_rate": 1.8580608050650976e-05, + "loss": 0.6207, + "step": 4963 + }, + { + "epoch": 0.17, + "learning_rate": 1.858004881534387e-05, + "loss": 0.6283, + "step": 4964 + }, + { + "epoch": 0.17, + "learning_rate": 1.8579489478309426e-05, + "loss": 0.6391, + "step": 4965 + }, + { + "epoch": 0.17, + "learning_rate": 1.8578930039554285e-05, + "loss": 0.6847, + "step": 4966 + }, + { + "epoch": 0.17, + "learning_rate": 1.8578370499085077e-05, + "loss": 0.5995, + "step": 4967 + }, + { + "epoch": 0.17, + "learning_rate": 1.8577810856908434e-05, + "loss": 0.6289, + "step": 4968 + }, + { + "epoch": 0.17, + "learning_rate": 1.8577251113030992e-05, + "loss": 0.6787, + "step": 4969 + }, + { + "epoch": 0.17, + "learning_rate": 1.8576691267459388e-05, + "loss": 0.6348, + "step": 4970 + }, + { + "epoch": 0.17, + "learning_rate": 1.8576131320200258e-05, + "loss": 0.6417, + "step": 4971 + }, + { + "epoch": 0.17, + "learning_rate": 1.8575571271260244e-05, + "loss": 0.6903, + "step": 4972 + }, + { + "epoch": 0.17, + "learning_rate": 1.8575011120645987e-05, + "loss": 0.6281, + "step": 4973 + }, + { + "epoch": 0.17, + "learning_rate": 1.8574450868364123e-05, + "loss": 0.6278, + "step": 4974 + }, + { + "epoch": 0.17, + "learning_rate": 1.8573890514421294e-05, + "loss": 0.6262, + "step": 4975 + }, + { + "epoch": 0.17, + "learning_rate": 1.8573330058824154e-05, + "loss": 0.644, + "step": 4976 + }, + { + "epoch": 0.17, + "learning_rate": 1.8572769501579336e-05, + "loss": 0.6526, + "step": 4977 + }, + { + "epoch": 0.17, + "learning_rate": 1.8572208842693492e-05, + "loss": 0.6892, + "step": 4978 + }, + { + "epoch": 0.17, + "learning_rate": 1.8571648082173266e-05, + "loss": 0.6126, + "step": 4979 + }, + { + "epoch": 0.17, + "learning_rate": 1.857108722002531e-05, + "loss": 0.6129, + "step": 4980 + }, + { + "epoch": 0.17, + "learning_rate": 1.8570526256256275e-05, + "loss": 0.678, + "step": 4981 + }, + { + "epoch": 0.17, + "learning_rate": 1.856996519087281e-05, + "loss": 0.6563, + "step": 4982 + }, + { + "epoch": 0.17, + "learning_rate": 1.8569404023881562e-05, + "loss": 0.6785, + "step": 4983 + }, + { + "epoch": 0.17, + "learning_rate": 1.856884275528919e-05, + "loss": 0.6541, + "step": 4984 + }, + { + "epoch": 0.17, + "learning_rate": 1.856828138510235e-05, + "loss": 0.6504, + "step": 4985 + }, + { + "epoch": 0.17, + "learning_rate": 1.8567719913327696e-05, + "loss": 0.6369, + "step": 4986 + }, + { + "epoch": 0.17, + "learning_rate": 1.8567158339971882e-05, + "loss": 0.5985, + "step": 4987 + }, + { + "epoch": 0.17, + "learning_rate": 1.856659666504157e-05, + "loss": 0.637, + "step": 4988 + }, + { + "epoch": 0.17, + "learning_rate": 1.8566034888543414e-05, + "loss": 0.6113, + "step": 4989 + }, + { + "epoch": 0.17, + "learning_rate": 1.8565473010484082e-05, + "loss": 0.6329, + "step": 4990 + }, + { + "epoch": 0.17, + "learning_rate": 1.8564911030870234e-05, + "loss": 0.6476, + "step": 4991 + }, + { + "epoch": 0.17, + "learning_rate": 1.8564348949708525e-05, + "loss": 0.6659, + "step": 4992 + }, + { + "epoch": 0.17, + "learning_rate": 1.856378676700563e-05, + "loss": 0.6513, + "step": 4993 + }, + { + "epoch": 0.17, + "learning_rate": 1.8563224482768205e-05, + "loss": 0.641, + "step": 4994 + }, + { + "epoch": 0.17, + "learning_rate": 1.8562662097002925e-05, + "loss": 0.6503, + "step": 4995 + }, + { + "epoch": 0.17, + "learning_rate": 1.8562099609716454e-05, + "loss": 0.6154, + "step": 4996 + }, + { + "epoch": 0.17, + "learning_rate": 1.856153702091546e-05, + "loss": 0.6116, + "step": 4997 + }, + { + "epoch": 0.17, + "learning_rate": 1.8560974330606615e-05, + "loss": 0.6905, + "step": 4998 + }, + { + "epoch": 0.17, + "learning_rate": 1.8560411538796587e-05, + "loss": 0.5852, + "step": 4999 + }, + { + "epoch": 0.17, + "learning_rate": 1.855984864549205e-05, + "loss": 0.6535, + "step": 5000 + }, + { + "epoch": 0.17, + "learning_rate": 1.8559285650699685e-05, + "loss": 0.6599, + "step": 5001 + }, + { + "epoch": 0.17, + "learning_rate": 1.8558722554426157e-05, + "loss": 0.6151, + "step": 5002 + }, + { + "epoch": 0.17, + "learning_rate": 1.8558159356678146e-05, + "loss": 0.6342, + "step": 5003 + }, + { + "epoch": 0.17, + "learning_rate": 1.855759605746233e-05, + "loss": 0.6576, + "step": 5004 + }, + { + "epoch": 0.17, + "learning_rate": 1.8557032656785393e-05, + "loss": 0.6348, + "step": 5005 + }, + { + "epoch": 0.17, + "learning_rate": 1.8556469154654006e-05, + "loss": 0.6403, + "step": 5006 + }, + { + "epoch": 0.17, + "learning_rate": 1.8555905551074848e-05, + "loss": 0.6104, + "step": 5007 + }, + { + "epoch": 0.17, + "learning_rate": 1.8555341846054615e-05, + "loss": 0.6184, + "step": 5008 + }, + { + "epoch": 0.17, + "learning_rate": 1.8554778039599973e-05, + "loss": 0.6524, + "step": 5009 + }, + { + "epoch": 0.17, + "learning_rate": 1.855421413171762e-05, + "loss": 0.6368, + "step": 5010 + }, + { + "epoch": 0.17, + "learning_rate": 1.8553650122414236e-05, + "loss": 0.5921, + "step": 5011 + }, + { + "epoch": 0.17, + "learning_rate": 1.8553086011696514e-05, + "loss": 0.6647, + "step": 5012 + }, + { + "epoch": 0.17, + "learning_rate": 1.8552521799571133e-05, + "loss": 0.5958, + "step": 5013 + }, + { + "epoch": 0.17, + "learning_rate": 1.8551957486044788e-05, + "loss": 0.6236, + "step": 5014 + }, + { + "epoch": 0.17, + "learning_rate": 1.8551393071124168e-05, + "loss": 0.6452, + "step": 5015 + }, + { + "epoch": 0.17, + "learning_rate": 1.8550828554815968e-05, + "loss": 0.6482, + "step": 5016 + }, + { + "epoch": 0.17, + "learning_rate": 1.8550263937126875e-05, + "loss": 0.6734, + "step": 5017 + }, + { + "epoch": 0.17, + "learning_rate": 1.854969921806359e-05, + "loss": 0.6055, + "step": 5018 + }, + { + "epoch": 0.17, + "learning_rate": 1.8549134397632805e-05, + "loss": 0.6271, + "step": 5019 + }, + { + "epoch": 0.17, + "learning_rate": 1.8548569475841215e-05, + "loss": 0.6439, + "step": 5020 + }, + { + "epoch": 0.17, + "learning_rate": 1.854800445269552e-05, + "loss": 0.6649, + "step": 5021 + }, + { + "epoch": 0.17, + "learning_rate": 1.8547439328202422e-05, + "loss": 0.6743, + "step": 5022 + }, + { + "epoch": 0.17, + "learning_rate": 1.8546874102368613e-05, + "loss": 0.6517, + "step": 5023 + }, + { + "epoch": 0.17, + "learning_rate": 1.8546308775200807e-05, + "loss": 0.6482, + "step": 5024 + }, + { + "epoch": 0.17, + "learning_rate": 1.854574334670569e-05, + "loss": 0.6178, + "step": 5025 + }, + { + "epoch": 0.17, + "learning_rate": 1.8545177816889983e-05, + "loss": 0.6224, + "step": 5026 + }, + { + "epoch": 0.17, + "learning_rate": 1.854461218576038e-05, + "loss": 0.628, + "step": 5027 + }, + { + "epoch": 0.17, + "learning_rate": 1.8544046453323593e-05, + "loss": 0.6526, + "step": 5028 + }, + { + "epoch": 0.17, + "learning_rate": 1.8543480619586324e-05, + "loss": 0.6347, + "step": 5029 + }, + { + "epoch": 0.17, + "learning_rate": 1.8542914684555287e-05, + "loss": 0.6512, + "step": 5030 + }, + { + "epoch": 0.17, + "learning_rate": 1.8542348648237186e-05, + "loss": 0.6266, + "step": 5031 + }, + { + "epoch": 0.17, + "learning_rate": 1.854178251063874e-05, + "loss": 0.6673, + "step": 5032 + }, + { + "epoch": 0.17, + "learning_rate": 1.8541216271766657e-05, + "loss": 0.6002, + "step": 5033 + }, + { + "epoch": 0.17, + "learning_rate": 1.8540649931627646e-05, + "loss": 0.6051, + "step": 5034 + }, + { + "epoch": 0.17, + "learning_rate": 1.854008349022843e-05, + "loss": 0.6765, + "step": 5035 + }, + { + "epoch": 0.17, + "learning_rate": 1.853951694757572e-05, + "loss": 0.6413, + "step": 5036 + }, + { + "epoch": 0.17, + "learning_rate": 1.8538950303676233e-05, + "loss": 0.6338, + "step": 5037 + }, + { + "epoch": 0.17, + "learning_rate": 1.853838355853669e-05, + "loss": 0.6795, + "step": 5038 + }, + { + "epoch": 0.17, + "learning_rate": 1.8537816712163805e-05, + "loss": 0.6271, + "step": 5039 + }, + { + "epoch": 0.17, + "learning_rate": 1.853724976456431e-05, + "loss": 0.7059, + "step": 5040 + }, + { + "epoch": 0.17, + "learning_rate": 1.853668271574491e-05, + "loss": 0.6024, + "step": 5041 + }, + { + "epoch": 0.17, + "learning_rate": 1.853611556571234e-05, + "loss": 0.5582, + "step": 5042 + }, + { + "epoch": 0.17, + "learning_rate": 1.8535548314473325e-05, + "loss": 0.62, + "step": 5043 + }, + { + "epoch": 0.17, + "learning_rate": 1.8534980962034587e-05, + "loss": 0.6341, + "step": 5044 + }, + { + "epoch": 0.17, + "learning_rate": 1.853441350840285e-05, + "loss": 0.6586, + "step": 5045 + }, + { + "epoch": 0.17, + "learning_rate": 1.853384595358485e-05, + "loss": 0.6135, + "step": 5046 + }, + { + "epoch": 0.17, + "learning_rate": 1.8533278297587303e-05, + "loss": 0.6441, + "step": 5047 + }, + { + "epoch": 0.17, + "learning_rate": 1.8532710540416955e-05, + "loss": 0.677, + "step": 5048 + }, + { + "epoch": 0.17, + "learning_rate": 1.8532142682080524e-05, + "loss": 0.6522, + "step": 5049 + }, + { + "epoch": 0.17, + "learning_rate": 1.8531574722584752e-05, + "loss": 0.6021, + "step": 5050 + }, + { + "epoch": 0.18, + "learning_rate": 1.853100666193637e-05, + "loss": 0.6689, + "step": 5051 + }, + { + "epoch": 0.18, + "learning_rate": 1.853043850014211e-05, + "loss": 0.6417, + "step": 5052 + }, + { + "epoch": 0.18, + "learning_rate": 1.8529870237208705e-05, + "loss": 0.6356, + "step": 5053 + }, + { + "epoch": 0.18, + "learning_rate": 1.8529301873142906e-05, + "loss": 0.5657, + "step": 5054 + }, + { + "epoch": 0.18, + "learning_rate": 1.852873340795144e-05, + "loss": 0.6434, + "step": 5055 + }, + { + "epoch": 0.18, + "learning_rate": 1.8528164841641052e-05, + "loss": 0.6285, + "step": 5056 + }, + { + "epoch": 0.18, + "learning_rate": 1.8527596174218483e-05, + "loss": 0.6835, + "step": 5057 + }, + { + "epoch": 0.18, + "learning_rate": 1.852702740569047e-05, + "loss": 0.6155, + "step": 5058 + }, + { + "epoch": 0.18, + "learning_rate": 1.8526458536063762e-05, + "loss": 0.5861, + "step": 5059 + }, + { + "epoch": 0.18, + "learning_rate": 1.85258895653451e-05, + "loss": 0.6335, + "step": 5060 + }, + { + "epoch": 0.18, + "learning_rate": 1.8525320493541238e-05, + "loss": 0.6317, + "step": 5061 + }, + { + "epoch": 0.18, + "learning_rate": 1.8524751320658913e-05, + "loss": 0.5732, + "step": 5062 + }, + { + "epoch": 0.18, + "learning_rate": 1.852418204670488e-05, + "loss": 0.65, + "step": 5063 + }, + { + "epoch": 0.18, + "learning_rate": 1.852361267168588e-05, + "loss": 0.6622, + "step": 5064 + }, + { + "epoch": 0.18, + "learning_rate": 1.8523043195608676e-05, + "loss": 0.6054, + "step": 5065 + }, + { + "epoch": 0.18, + "learning_rate": 1.852247361848001e-05, + "loss": 0.599, + "step": 5066 + }, + { + "epoch": 0.18, + "learning_rate": 1.8521903940306634e-05, + "loss": 0.604, + "step": 5067 + }, + { + "epoch": 0.18, + "learning_rate": 1.8521334161095314e-05, + "loss": 0.6226, + "step": 5068 + }, + { + "epoch": 0.18, + "learning_rate": 1.8520764280852793e-05, + "loss": 0.6235, + "step": 5069 + }, + { + "epoch": 0.18, + "learning_rate": 1.8520194299585832e-05, + "loss": 0.653, + "step": 5070 + }, + { + "epoch": 0.18, + "learning_rate": 1.8519624217301194e-05, + "loss": 0.6452, + "step": 5071 + }, + { + "epoch": 0.18, + "learning_rate": 1.8519054034005633e-05, + "loss": 0.6288, + "step": 5072 + }, + { + "epoch": 0.18, + "learning_rate": 1.8518483749705906e-05, + "loss": 0.6194, + "step": 5073 + }, + { + "epoch": 0.18, + "learning_rate": 1.851791336440878e-05, + "loss": 0.6708, + "step": 5074 + }, + { + "epoch": 0.18, + "learning_rate": 1.8517342878121016e-05, + "loss": 0.61, + "step": 5075 + }, + { + "epoch": 0.18, + "learning_rate": 1.8516772290849378e-05, + "loss": 0.6361, + "step": 5076 + }, + { + "epoch": 0.18, + "learning_rate": 1.851620160260063e-05, + "loss": 0.6389, + "step": 5077 + }, + { + "epoch": 0.18, + "learning_rate": 1.851563081338154e-05, + "loss": 0.6148, + "step": 5078 + }, + { + "epoch": 0.18, + "learning_rate": 1.851505992319887e-05, + "loss": 0.62, + "step": 5079 + }, + { + "epoch": 0.18, + "learning_rate": 1.85144889320594e-05, + "loss": 0.589, + "step": 5080 + }, + { + "epoch": 0.18, + "learning_rate": 1.851391783996989e-05, + "loss": 0.6127, + "step": 5081 + }, + { + "epoch": 0.18, + "learning_rate": 1.8513346646937114e-05, + "loss": 0.6169, + "step": 5082 + }, + { + "epoch": 0.18, + "learning_rate": 1.8512775352967843e-05, + "loss": 0.6628, + "step": 5083 + }, + { + "epoch": 0.18, + "learning_rate": 1.8512203958068853e-05, + "loss": 0.6337, + "step": 5084 + }, + { + "epoch": 0.18, + "learning_rate": 1.8511632462246914e-05, + "loss": 0.6706, + "step": 5085 + }, + { + "epoch": 0.18, + "learning_rate": 1.8511060865508806e-05, + "loss": 0.6683, + "step": 5086 + }, + { + "epoch": 0.18, + "learning_rate": 1.8510489167861308e-05, + "loss": 0.6436, + "step": 5087 + }, + { + "epoch": 0.18, + "learning_rate": 1.8509917369311193e-05, + "loss": 0.6487, + "step": 5088 + }, + { + "epoch": 0.18, + "learning_rate": 1.8509345469865245e-05, + "loss": 0.6121, + "step": 5089 + }, + { + "epoch": 0.18, + "learning_rate": 1.850877346953024e-05, + "loss": 0.6836, + "step": 5090 + }, + { + "epoch": 0.18, + "learning_rate": 1.8508201368312957e-05, + "loss": 0.608, + "step": 5091 + }, + { + "epoch": 0.18, + "learning_rate": 1.850762916622019e-05, + "loss": 0.6609, + "step": 5092 + }, + { + "epoch": 0.18, + "learning_rate": 1.8507056863258714e-05, + "loss": 0.6125, + "step": 5093 + }, + { + "epoch": 0.18, + "learning_rate": 1.850648445943532e-05, + "loss": 0.6084, + "step": 5094 + }, + { + "epoch": 0.18, + "learning_rate": 1.850591195475679e-05, + "loss": 0.6206, + "step": 5095 + }, + { + "epoch": 0.18, + "learning_rate": 1.8505339349229913e-05, + "loss": 0.6178, + "step": 5096 + }, + { + "epoch": 0.18, + "learning_rate": 1.850476664286148e-05, + "loss": 0.5591, + "step": 5097 + }, + { + "epoch": 0.18, + "learning_rate": 1.8504193835658283e-05, + "loss": 0.6332, + "step": 5098 + }, + { + "epoch": 0.18, + "learning_rate": 1.8503620927627107e-05, + "loss": 0.6145, + "step": 5099 + }, + { + "epoch": 0.18, + "learning_rate": 1.8503047918774745e-05, + "loss": 0.6896, + "step": 5100 + }, + { + "epoch": 0.18, + "learning_rate": 1.8502474809108e-05, + "loss": 0.6257, + "step": 5101 + }, + { + "epoch": 0.18, + "learning_rate": 1.8501901598633653e-05, + "loss": 0.6531, + "step": 5102 + }, + { + "epoch": 0.18, + "learning_rate": 1.8501328287358514e-05, + "loss": 0.6335, + "step": 5103 + }, + { + "epoch": 0.18, + "learning_rate": 1.850075487528937e-05, + "loss": 0.6241, + "step": 5104 + }, + { + "epoch": 0.18, + "learning_rate": 1.8500181362433026e-05, + "loss": 0.6448, + "step": 5105 + }, + { + "epoch": 0.18, + "learning_rate": 1.8499607748796276e-05, + "loss": 0.6397, + "step": 5106 + }, + { + "epoch": 0.18, + "learning_rate": 1.849903403438593e-05, + "loss": 0.6156, + "step": 5107 + }, + { + "epoch": 0.18, + "learning_rate": 1.8498460219208776e-05, + "loss": 0.6609, + "step": 5108 + }, + { + "epoch": 0.18, + "learning_rate": 1.8497886303271632e-05, + "loss": 0.65, + "step": 5109 + }, + { + "epoch": 0.18, + "learning_rate": 1.849731228658129e-05, + "loss": 0.6586, + "step": 5110 + }, + { + "epoch": 0.18, + "learning_rate": 1.8496738169144568e-05, + "loss": 0.652, + "step": 5111 + }, + { + "epoch": 0.18, + "learning_rate": 1.8496163950968264e-05, + "loss": 0.6973, + "step": 5112 + }, + { + "epoch": 0.18, + "learning_rate": 1.8495589632059187e-05, + "loss": 0.6392, + "step": 5113 + }, + { + "epoch": 0.18, + "learning_rate": 1.8495015212424153e-05, + "loss": 0.6167, + "step": 5114 + }, + { + "epoch": 0.18, + "learning_rate": 1.849444069206996e-05, + "loss": 0.6068, + "step": 5115 + }, + { + "epoch": 0.18, + "learning_rate": 1.849386607100343e-05, + "loss": 0.6233, + "step": 5116 + }, + { + "epoch": 0.18, + "learning_rate": 1.8493291349231376e-05, + "loss": 0.5714, + "step": 5117 + }, + { + "epoch": 0.18, + "learning_rate": 1.849271652676061e-05, + "loss": 0.6973, + "step": 5118 + }, + { + "epoch": 0.18, + "learning_rate": 1.8492141603597942e-05, + "loss": 0.6571, + "step": 5119 + }, + { + "epoch": 0.18, + "learning_rate": 1.8491566579750194e-05, + "loss": 0.5916, + "step": 5120 + }, + { + "epoch": 0.18, + "learning_rate": 1.849099145522418e-05, + "loss": 0.6601, + "step": 5121 + }, + { + "epoch": 0.18, + "learning_rate": 1.8490416230026724e-05, + "loss": 0.6694, + "step": 5122 + }, + { + "epoch": 0.18, + "learning_rate": 1.8489840904164645e-05, + "loss": 0.6444, + "step": 5123 + }, + { + "epoch": 0.18, + "learning_rate": 1.848926547764476e-05, + "loss": 0.6017, + "step": 5124 + }, + { + "epoch": 0.18, + "learning_rate": 1.848868995047389e-05, + "loss": 0.5687, + "step": 5125 + }, + { + "epoch": 0.18, + "learning_rate": 1.8488114322658866e-05, + "loss": 0.6634, + "step": 5126 + }, + { + "epoch": 0.18, + "learning_rate": 1.848753859420651e-05, + "loss": 0.6491, + "step": 5127 + }, + { + "epoch": 0.18, + "learning_rate": 1.8486962765123645e-05, + "loss": 0.6484, + "step": 5128 + }, + { + "epoch": 0.18, + "learning_rate": 1.84863868354171e-05, + "loss": 0.6399, + "step": 5129 + }, + { + "epoch": 0.18, + "learning_rate": 1.848581080509371e-05, + "loss": 0.6515, + "step": 5130 + }, + { + "epoch": 0.18, + "learning_rate": 1.8485234674160292e-05, + "loss": 0.6454, + "step": 5131 + }, + { + "epoch": 0.18, + "learning_rate": 1.8484658442623685e-05, + "loss": 0.6725, + "step": 5132 + }, + { + "epoch": 0.18, + "learning_rate": 1.848408211049072e-05, + "loss": 0.633, + "step": 5133 + }, + { + "epoch": 0.18, + "learning_rate": 1.848350567776823e-05, + "loss": 0.6044, + "step": 5134 + }, + { + "epoch": 0.18, + "learning_rate": 1.8482929144463043e-05, + "loss": 0.6112, + "step": 5135 + }, + { + "epoch": 0.18, + "learning_rate": 1.8482352510582004e-05, + "loss": 0.6521, + "step": 5136 + }, + { + "epoch": 0.18, + "learning_rate": 1.8481775776131944e-05, + "loss": 0.6052, + "step": 5137 + }, + { + "epoch": 0.18, + "learning_rate": 1.8481198941119703e-05, + "loss": 0.5778, + "step": 5138 + }, + { + "epoch": 0.18, + "learning_rate": 1.8480622005552126e-05, + "loss": 0.6449, + "step": 5139 + }, + { + "epoch": 0.18, + "learning_rate": 1.8480044969436038e-05, + "loss": 0.5935, + "step": 5140 + }, + { + "epoch": 0.18, + "learning_rate": 1.84794678327783e-05, + "loss": 0.6354, + "step": 5141 + }, + { + "epoch": 0.18, + "learning_rate": 1.847889059558573e-05, + "loss": 0.6621, + "step": 5142 + }, + { + "epoch": 0.18, + "learning_rate": 1.8478313257865196e-05, + "loss": 0.6497, + "step": 5143 + }, + { + "epoch": 0.18, + "learning_rate": 1.8477735819623534e-05, + "loss": 0.6684, + "step": 5144 + }, + { + "epoch": 0.18, + "learning_rate": 1.8477158280867586e-05, + "loss": 0.6679, + "step": 5145 + }, + { + "epoch": 0.18, + "learning_rate": 1.8476580641604202e-05, + "loss": 0.6654, + "step": 5146 + }, + { + "epoch": 0.18, + "learning_rate": 1.8476002901840234e-05, + "loss": 0.6525, + "step": 5147 + }, + { + "epoch": 0.18, + "learning_rate": 1.8475425061582525e-05, + "loss": 0.6045, + "step": 5148 + }, + { + "epoch": 0.18, + "learning_rate": 1.8474847120837937e-05, + "loss": 0.6455, + "step": 5149 + }, + { + "epoch": 0.18, + "learning_rate": 1.8474269079613313e-05, + "loss": 0.5865, + "step": 5150 + }, + { + "epoch": 0.18, + "learning_rate": 1.8473690937915508e-05, + "loss": 0.6515, + "step": 5151 + }, + { + "epoch": 0.18, + "learning_rate": 1.847311269575138e-05, + "loss": 0.6764, + "step": 5152 + }, + { + "epoch": 0.18, + "learning_rate": 1.8472534353127778e-05, + "loss": 0.6533, + "step": 5153 + }, + { + "epoch": 0.18, + "learning_rate": 1.8471955910051567e-05, + "loss": 0.6341, + "step": 5154 + }, + { + "epoch": 0.18, + "learning_rate": 1.84713773665296e-05, + "loss": 0.5798, + "step": 5155 + }, + { + "epoch": 0.18, + "learning_rate": 1.847079872256874e-05, + "loss": 0.6157, + "step": 5156 + }, + { + "epoch": 0.18, + "learning_rate": 1.8470219978175843e-05, + "loss": 0.6162, + "step": 5157 + }, + { + "epoch": 0.18, + "learning_rate": 1.846964113335777e-05, + "loss": 0.6663, + "step": 5158 + }, + { + "epoch": 0.18, + "learning_rate": 1.8469062188121395e-05, + "loss": 0.6063, + "step": 5159 + }, + { + "epoch": 0.18, + "learning_rate": 1.8468483142473572e-05, + "loss": 0.6261, + "step": 5160 + }, + { + "epoch": 0.18, + "learning_rate": 1.8467903996421168e-05, + "loss": 0.6164, + "step": 5161 + }, + { + "epoch": 0.18, + "learning_rate": 1.8467324749971046e-05, + "loss": 0.6112, + "step": 5162 + }, + { + "epoch": 0.18, + "learning_rate": 1.8466745403130085e-05, + "loss": 0.6183, + "step": 5163 + }, + { + "epoch": 0.18, + "learning_rate": 1.8466165955905145e-05, + "loss": 0.5857, + "step": 5164 + }, + { + "epoch": 0.18, + "learning_rate": 1.8465586408303094e-05, + "loss": 0.5694, + "step": 5165 + }, + { + "epoch": 0.18, + "learning_rate": 1.846500676033081e-05, + "loss": 0.6465, + "step": 5166 + }, + { + "epoch": 0.18, + "learning_rate": 1.846442701199516e-05, + "loss": 0.6296, + "step": 5167 + }, + { + "epoch": 0.18, + "learning_rate": 1.8463847163303022e-05, + "loss": 0.6506, + "step": 5168 + }, + { + "epoch": 0.18, + "learning_rate": 1.846326721426127e-05, + "loss": 0.5876, + "step": 5169 + }, + { + "epoch": 0.18, + "learning_rate": 1.846268716487678e-05, + "loss": 0.6111, + "step": 5170 + }, + { + "epoch": 0.18, + "learning_rate": 1.8462107015156424e-05, + "loss": 0.6232, + "step": 5171 + }, + { + "epoch": 0.18, + "learning_rate": 1.846152676510709e-05, + "loss": 0.5749, + "step": 5172 + }, + { + "epoch": 0.18, + "learning_rate": 1.846094641473565e-05, + "loss": 0.6499, + "step": 5173 + }, + { + "epoch": 0.18, + "learning_rate": 1.8460365964048985e-05, + "loss": 0.5915, + "step": 5174 + }, + { + "epoch": 0.18, + "learning_rate": 1.845978541305398e-05, + "loss": 0.6209, + "step": 5175 + }, + { + "epoch": 0.18, + "learning_rate": 1.8459204761757518e-05, + "loss": 0.6339, + "step": 5176 + }, + { + "epoch": 0.18, + "learning_rate": 1.8458624010166485e-05, + "loss": 0.6393, + "step": 5177 + }, + { + "epoch": 0.18, + "learning_rate": 1.845804315828776e-05, + "loss": 0.6321, + "step": 5178 + }, + { + "epoch": 0.18, + "learning_rate": 1.8457462206128236e-05, + "loss": 0.6312, + "step": 5179 + }, + { + "epoch": 0.18, + "learning_rate": 1.84568811536948e-05, + "loss": 0.6091, + "step": 5180 + }, + { + "epoch": 0.18, + "learning_rate": 1.8456300000994337e-05, + "loss": 0.6902, + "step": 5181 + }, + { + "epoch": 0.18, + "learning_rate": 1.845571874803374e-05, + "loss": 0.5848, + "step": 5182 + }, + { + "epoch": 0.18, + "learning_rate": 1.8455137394819905e-05, + "loss": 0.6137, + "step": 5183 + }, + { + "epoch": 0.18, + "learning_rate": 1.8454555941359717e-05, + "loss": 0.6372, + "step": 5184 + }, + { + "epoch": 0.18, + "learning_rate": 1.8453974387660073e-05, + "loss": 0.6288, + "step": 5185 + }, + { + "epoch": 0.18, + "learning_rate": 1.8453392733727867e-05, + "loss": 0.614, + "step": 5186 + }, + { + "epoch": 0.18, + "learning_rate": 1.8452810979570003e-05, + "loss": 0.6513, + "step": 5187 + }, + { + "epoch": 0.18, + "learning_rate": 1.8452229125193366e-05, + "loss": 0.6328, + "step": 5188 + }, + { + "epoch": 0.18, + "learning_rate": 1.8451647170604863e-05, + "loss": 0.6564, + "step": 5189 + }, + { + "epoch": 0.18, + "learning_rate": 1.845106511581139e-05, + "loss": 0.6346, + "step": 5190 + }, + { + "epoch": 0.18, + "learning_rate": 1.845048296081985e-05, + "loss": 0.6593, + "step": 5191 + }, + { + "epoch": 0.18, + "learning_rate": 1.8449900705637145e-05, + "loss": 0.6498, + "step": 5192 + }, + { + "epoch": 0.18, + "learning_rate": 1.844931835027018e-05, + "loss": 0.6864, + "step": 5193 + }, + { + "epoch": 0.18, + "learning_rate": 1.8448735894725853e-05, + "loss": 0.5876, + "step": 5194 + }, + { + "epoch": 0.18, + "learning_rate": 1.844815333901108e-05, + "loss": 0.6697, + "step": 5195 + }, + { + "epoch": 0.18, + "learning_rate": 1.8447570683132757e-05, + "loss": 0.6027, + "step": 5196 + }, + { + "epoch": 0.18, + "learning_rate": 1.8446987927097797e-05, + "loss": 0.6443, + "step": 5197 + }, + { + "epoch": 0.18, + "learning_rate": 1.844640507091311e-05, + "loss": 0.6046, + "step": 5198 + }, + { + "epoch": 0.18, + "learning_rate": 1.844582211458561e-05, + "loss": 0.568, + "step": 5199 + }, + { + "epoch": 0.18, + "learning_rate": 1.8445239058122202e-05, + "loss": 0.6224, + "step": 5200 + }, + { + "epoch": 0.18, + "learning_rate": 1.8444655901529804e-05, + "loss": 0.5947, + "step": 5201 + }, + { + "epoch": 0.18, + "learning_rate": 1.8444072644815322e-05, + "loss": 0.5833, + "step": 5202 + }, + { + "epoch": 0.18, + "learning_rate": 1.8443489287985683e-05, + "loss": 0.6598, + "step": 5203 + }, + { + "epoch": 0.18, + "learning_rate": 1.84429058310478e-05, + "loss": 0.6007, + "step": 5204 + }, + { + "epoch": 0.18, + "learning_rate": 1.844232227400858e-05, + "loss": 0.681, + "step": 5205 + }, + { + "epoch": 0.18, + "learning_rate": 1.8441738616874953e-05, + "loss": 0.6806, + "step": 5206 + }, + { + "epoch": 0.18, + "learning_rate": 1.8441154859653836e-05, + "loss": 0.6228, + "step": 5207 + }, + { + "epoch": 0.18, + "learning_rate": 1.844057100235215e-05, + "loss": 0.6561, + "step": 5208 + }, + { + "epoch": 0.18, + "learning_rate": 1.8439987044976817e-05, + "loss": 0.6179, + "step": 5209 + }, + { + "epoch": 0.18, + "learning_rate": 1.843940298753476e-05, + "loss": 0.6608, + "step": 5210 + }, + { + "epoch": 0.18, + "learning_rate": 1.8438818830032908e-05, + "loss": 0.6272, + "step": 5211 + }, + { + "epoch": 0.18, + "learning_rate": 1.8438234572478184e-05, + "loss": 0.6894, + "step": 5212 + }, + { + "epoch": 0.18, + "learning_rate": 1.8437650214877508e-05, + "loss": 0.6399, + "step": 5213 + }, + { + "epoch": 0.18, + "learning_rate": 1.8437065757237823e-05, + "loss": 0.6325, + "step": 5214 + }, + { + "epoch": 0.18, + "learning_rate": 1.8436481199566045e-05, + "loss": 0.6544, + "step": 5215 + }, + { + "epoch": 0.18, + "learning_rate": 1.843589654186911e-05, + "loss": 0.6256, + "step": 5216 + }, + { + "epoch": 0.18, + "learning_rate": 1.8435311784153954e-05, + "loss": 0.6227, + "step": 5217 + }, + { + "epoch": 0.18, + "learning_rate": 1.8434726926427506e-05, + "loss": 0.6938, + "step": 5218 + }, + { + "epoch": 0.18, + "learning_rate": 1.8434141968696696e-05, + "loss": 0.592, + "step": 5219 + }, + { + "epoch": 0.18, + "learning_rate": 1.843355691096847e-05, + "loss": 0.5702, + "step": 5220 + }, + { + "epoch": 0.18, + "learning_rate": 1.8432971753249753e-05, + "loss": 0.629, + "step": 5221 + }, + { + "epoch": 0.18, + "learning_rate": 1.8432386495547486e-05, + "loss": 0.6424, + "step": 5222 + }, + { + "epoch": 0.18, + "learning_rate": 1.8431801137868617e-05, + "loss": 0.65, + "step": 5223 + }, + { + "epoch": 0.18, + "learning_rate": 1.8431215680220076e-05, + "loss": 0.6578, + "step": 5224 + }, + { + "epoch": 0.18, + "learning_rate": 1.8430630122608807e-05, + "loss": 0.6707, + "step": 5225 + }, + { + "epoch": 0.18, + "learning_rate": 1.8430044465041754e-05, + "loss": 0.5872, + "step": 5226 + }, + { + "epoch": 0.18, + "learning_rate": 1.842945870752586e-05, + "loss": 0.6775, + "step": 5227 + }, + { + "epoch": 0.18, + "learning_rate": 1.842887285006807e-05, + "loss": 0.5764, + "step": 5228 + }, + { + "epoch": 0.18, + "learning_rate": 1.8428286892675327e-05, + "loss": 0.6497, + "step": 5229 + }, + { + "epoch": 0.18, + "learning_rate": 1.8427700835354585e-05, + "loss": 0.6664, + "step": 5230 + }, + { + "epoch": 0.18, + "learning_rate": 1.8427114678112785e-05, + "loss": 0.6248, + "step": 5231 + }, + { + "epoch": 0.18, + "learning_rate": 1.8426528420956883e-05, + "loss": 0.5956, + "step": 5232 + }, + { + "epoch": 0.18, + "learning_rate": 1.8425942063893824e-05, + "loss": 0.6241, + "step": 5233 + }, + { + "epoch": 0.18, + "learning_rate": 1.8425355606930564e-05, + "loss": 0.636, + "step": 5234 + }, + { + "epoch": 0.18, + "learning_rate": 1.8424769050074056e-05, + "loss": 0.5955, + "step": 5235 + }, + { + "epoch": 0.18, + "learning_rate": 1.8424182393331255e-05, + "loss": 0.6467, + "step": 5236 + }, + { + "epoch": 0.18, + "learning_rate": 1.842359563670911e-05, + "loss": 0.6269, + "step": 5237 + }, + { + "epoch": 0.18, + "learning_rate": 1.842300878021459e-05, + "loss": 0.6287, + "step": 5238 + }, + { + "epoch": 0.18, + "learning_rate": 1.842242182385464e-05, + "loss": 0.5745, + "step": 5239 + }, + { + "epoch": 0.18, + "learning_rate": 1.8421834767636226e-05, + "loss": 0.6379, + "step": 5240 + }, + { + "epoch": 0.18, + "learning_rate": 1.842124761156631e-05, + "loss": 0.6701, + "step": 5241 + }, + { + "epoch": 0.18, + "learning_rate": 1.8420660355651847e-05, + "loss": 0.6352, + "step": 5242 + }, + { + "epoch": 0.18, + "learning_rate": 1.8420072999899806e-05, + "loss": 0.6335, + "step": 5243 + }, + { + "epoch": 0.18, + "learning_rate": 1.841948554431715e-05, + "loss": 0.6113, + "step": 5244 + }, + { + "epoch": 0.18, + "learning_rate": 1.8418897988910836e-05, + "loss": 0.5564, + "step": 5245 + }, + { + "epoch": 0.18, + "learning_rate": 1.841831033368784e-05, + "loss": 0.6172, + "step": 5246 + }, + { + "epoch": 0.18, + "learning_rate": 1.8417722578655123e-05, + "loss": 0.6325, + "step": 5247 + }, + { + "epoch": 0.18, + "learning_rate": 1.8417134723819662e-05, + "loss": 0.6347, + "step": 5248 + }, + { + "epoch": 0.18, + "learning_rate": 1.841654676918842e-05, + "loss": 0.6454, + "step": 5249 + }, + { + "epoch": 0.18, + "learning_rate": 1.8415958714768363e-05, + "loss": 0.6612, + "step": 5250 + }, + { + "epoch": 0.18, + "learning_rate": 1.8415370560566473e-05, + "loss": 0.652, + "step": 5251 + }, + { + "epoch": 0.18, + "learning_rate": 1.841478230658972e-05, + "loss": 0.6302, + "step": 5252 + }, + { + "epoch": 0.18, + "learning_rate": 1.8414193952845077e-05, + "loss": 0.6295, + "step": 5253 + }, + { + "epoch": 0.18, + "learning_rate": 1.8413605499339522e-05, + "loss": 0.5553, + "step": 5254 + }, + { + "epoch": 0.18, + "learning_rate": 1.841301694608003e-05, + "loss": 0.629, + "step": 5255 + }, + { + "epoch": 0.18, + "learning_rate": 1.841242829307358e-05, + "loss": 0.6141, + "step": 5256 + }, + { + "epoch": 0.18, + "learning_rate": 1.8411839540327147e-05, + "loss": 0.6072, + "step": 5257 + }, + { + "epoch": 0.18, + "learning_rate": 1.841125068784772e-05, + "loss": 0.6766, + "step": 5258 + }, + { + "epoch": 0.18, + "learning_rate": 1.8410661735642273e-05, + "loss": 0.6383, + "step": 5259 + }, + { + "epoch": 0.18, + "learning_rate": 1.8410072683717794e-05, + "loss": 0.6479, + "step": 5260 + }, + { + "epoch": 0.18, + "learning_rate": 1.8409483532081263e-05, + "loss": 0.7031, + "step": 5261 + }, + { + "epoch": 0.18, + "learning_rate": 1.8408894280739668e-05, + "loss": 0.6543, + "step": 5262 + }, + { + "epoch": 0.18, + "learning_rate": 1.840830492969999e-05, + "loss": 0.6176, + "step": 5263 + }, + { + "epoch": 0.18, + "learning_rate": 1.8407715478969225e-05, + "loss": 0.6847, + "step": 5264 + }, + { + "epoch": 0.18, + "learning_rate": 1.8407125928554356e-05, + "loss": 0.6233, + "step": 5265 + }, + { + "epoch": 0.18, + "learning_rate": 1.8406536278462375e-05, + "loss": 0.6128, + "step": 5266 + }, + { + "epoch": 0.18, + "learning_rate": 1.8405946528700268e-05, + "loss": 0.6528, + "step": 5267 + }, + { + "epoch": 0.18, + "learning_rate": 1.8405356679275034e-05, + "loss": 0.6934, + "step": 5268 + }, + { + "epoch": 0.18, + "learning_rate": 1.8404766730193664e-05, + "loss": 0.6482, + "step": 5269 + }, + { + "epoch": 0.18, + "learning_rate": 1.8404176681463153e-05, + "loss": 0.6541, + "step": 5270 + }, + { + "epoch": 0.18, + "learning_rate": 1.8403586533090495e-05, + "loss": 0.6486, + "step": 5271 + }, + { + "epoch": 0.18, + "learning_rate": 1.840299628508269e-05, + "loss": 0.6694, + "step": 5272 + }, + { + "epoch": 0.18, + "learning_rate": 1.8402405937446734e-05, + "loss": 0.6169, + "step": 5273 + }, + { + "epoch": 0.18, + "learning_rate": 1.8401815490189623e-05, + "loss": 0.6511, + "step": 5274 + }, + { + "epoch": 0.18, + "learning_rate": 1.8401224943318362e-05, + "loss": 0.648, + "step": 5275 + }, + { + "epoch": 0.18, + "learning_rate": 1.8400634296839953e-05, + "loss": 0.653, + "step": 5276 + }, + { + "epoch": 0.18, + "learning_rate": 1.8400043550761396e-05, + "loss": 0.6628, + "step": 5277 + }, + { + "epoch": 0.18, + "learning_rate": 1.83994527050897e-05, + "loss": 0.6057, + "step": 5278 + }, + { + "epoch": 0.18, + "learning_rate": 1.8398861759831862e-05, + "loss": 0.6145, + "step": 5279 + }, + { + "epoch": 0.18, + "learning_rate": 1.8398270714994898e-05, + "loss": 0.6096, + "step": 5280 + }, + { + "epoch": 0.18, + "learning_rate": 1.839767957058581e-05, + "loss": 0.6358, + "step": 5281 + }, + { + "epoch": 0.18, + "learning_rate": 1.8397088326611606e-05, + "loss": 0.6298, + "step": 5282 + }, + { + "epoch": 0.18, + "learning_rate": 1.8396496983079295e-05, + "loss": 0.6825, + "step": 5283 + }, + { + "epoch": 0.18, + "learning_rate": 1.8395905539995896e-05, + "loss": 0.6321, + "step": 5284 + }, + { + "epoch": 0.18, + "learning_rate": 1.8395313997368412e-05, + "loss": 0.5516, + "step": 5285 + }, + { + "epoch": 0.18, + "learning_rate": 1.839472235520386e-05, + "loss": 0.6402, + "step": 5286 + }, + { + "epoch": 0.18, + "learning_rate": 1.8394130613509256e-05, + "loss": 0.6358, + "step": 5287 + }, + { + "epoch": 0.18, + "learning_rate": 1.839353877229162e-05, + "loss": 0.6274, + "step": 5288 + }, + { + "epoch": 0.18, + "learning_rate": 1.8392946831557957e-05, + "loss": 0.6851, + "step": 5289 + }, + { + "epoch": 0.18, + "learning_rate": 1.8392354791315297e-05, + "loss": 0.6237, + "step": 5290 + }, + { + "epoch": 0.18, + "learning_rate": 1.8391762651570654e-05, + "loss": 0.6342, + "step": 5291 + }, + { + "epoch": 0.18, + "learning_rate": 1.8391170412331047e-05, + "loss": 0.6866, + "step": 5292 + }, + { + "epoch": 0.18, + "learning_rate": 1.83905780736035e-05, + "loss": 0.5956, + "step": 5293 + }, + { + "epoch": 0.18, + "learning_rate": 1.8389985635395037e-05, + "loss": 0.6685, + "step": 5294 + }, + { + "epoch": 0.18, + "learning_rate": 1.838939309771268e-05, + "loss": 0.5411, + "step": 5295 + }, + { + "epoch": 0.18, + "learning_rate": 1.8388800460563458e-05, + "loss": 0.62, + "step": 5296 + }, + { + "epoch": 0.18, + "learning_rate": 1.838820772395439e-05, + "loss": 0.6467, + "step": 5297 + }, + { + "epoch": 0.18, + "learning_rate": 1.8387614887892507e-05, + "loss": 0.6472, + "step": 5298 + }, + { + "epoch": 0.18, + "learning_rate": 1.8387021952384848e-05, + "loss": 0.6617, + "step": 5299 + }, + { + "epoch": 0.18, + "learning_rate": 1.8386428917438425e-05, + "loss": 0.6391, + "step": 5300 + }, + { + "epoch": 0.18, + "learning_rate": 1.8385835783060284e-05, + "loss": 0.621, + "step": 5301 + }, + { + "epoch": 0.18, + "learning_rate": 1.8385242549257447e-05, + "loss": 0.6018, + "step": 5302 + }, + { + "epoch": 0.18, + "learning_rate": 1.8384649216036957e-05, + "loss": 0.6267, + "step": 5303 + }, + { + "epoch": 0.18, + "learning_rate": 1.838405578340584e-05, + "loss": 0.6975, + "step": 5304 + }, + { + "epoch": 0.18, + "learning_rate": 1.838346225137114e-05, + "loss": 0.6732, + "step": 5305 + }, + { + "epoch": 0.18, + "learning_rate": 1.8382868619939886e-05, + "loss": 0.6426, + "step": 5306 + }, + { + "epoch": 0.18, + "learning_rate": 1.838227488911912e-05, + "loss": 0.6068, + "step": 5307 + }, + { + "epoch": 0.18, + "learning_rate": 1.8381681058915887e-05, + "loss": 0.7103, + "step": 5308 + }, + { + "epoch": 0.18, + "learning_rate": 1.8381087129337215e-05, + "loss": 0.6001, + "step": 5309 + }, + { + "epoch": 0.18, + "learning_rate": 1.8380493100390157e-05, + "loss": 0.6526, + "step": 5310 + }, + { + "epoch": 0.18, + "learning_rate": 1.8379898972081754e-05, + "loss": 0.6783, + "step": 5311 + }, + { + "epoch": 0.18, + "learning_rate": 1.8379304744419042e-05, + "loss": 0.6001, + "step": 5312 + }, + { + "epoch": 0.18, + "learning_rate": 1.8378710417409076e-05, + "loss": 0.6538, + "step": 5313 + }, + { + "epoch": 0.18, + "learning_rate": 1.83781159910589e-05, + "loss": 0.6162, + "step": 5314 + }, + { + "epoch": 0.18, + "learning_rate": 1.8377521465375557e-05, + "loss": 0.5948, + "step": 5315 + }, + { + "epoch": 0.18, + "learning_rate": 1.83769268403661e-05, + "loss": 0.6637, + "step": 5316 + }, + { + "epoch": 0.18, + "learning_rate": 1.837633211603758e-05, + "loss": 0.669, + "step": 5317 + }, + { + "epoch": 0.18, + "learning_rate": 1.8375737292397046e-05, + "loss": 0.6244, + "step": 5318 + }, + { + "epoch": 0.18, + "learning_rate": 1.8375142369451554e-05, + "loss": 0.6745, + "step": 5319 + }, + { + "epoch": 0.18, + "learning_rate": 1.837454734720815e-05, + "loss": 0.6252, + "step": 5320 + }, + { + "epoch": 0.18, + "learning_rate": 1.83739522256739e-05, + "loss": 0.6304, + "step": 5321 + }, + { + "epoch": 0.18, + "learning_rate": 1.837335700485585e-05, + "loss": 0.6036, + "step": 5322 + }, + { + "epoch": 0.18, + "learning_rate": 1.8372761684761057e-05, + "loss": 0.6431, + "step": 5323 + }, + { + "epoch": 0.18, + "learning_rate": 1.837216626539658e-05, + "loss": 0.662, + "step": 5324 + }, + { + "epoch": 0.18, + "learning_rate": 1.8371570746769488e-05, + "loss": 0.6586, + "step": 5325 + }, + { + "epoch": 0.18, + "learning_rate": 1.8370975128886833e-05, + "loss": 0.6235, + "step": 5326 + }, + { + "epoch": 0.18, + "learning_rate": 1.8370379411755677e-05, + "loss": 0.6707, + "step": 5327 + }, + { + "epoch": 0.18, + "learning_rate": 1.836978359538309e-05, + "loss": 0.6383, + "step": 5328 + }, + { + "epoch": 0.18, + "learning_rate": 1.8369187679776125e-05, + "loss": 0.6676, + "step": 5329 + }, + { + "epoch": 0.18, + "learning_rate": 1.8368591664941854e-05, + "loss": 0.6325, + "step": 5330 + }, + { + "epoch": 0.18, + "learning_rate": 1.836799555088734e-05, + "loss": 0.6878, + "step": 5331 + }, + { + "epoch": 0.18, + "learning_rate": 1.836739933761966e-05, + "loss": 0.6528, + "step": 5332 + }, + { + "epoch": 0.18, + "learning_rate": 1.8366803025145867e-05, + "loss": 0.6124, + "step": 5333 + }, + { + "epoch": 0.18, + "learning_rate": 1.8366206613473045e-05, + "loss": 0.6244, + "step": 5334 + }, + { + "epoch": 0.18, + "learning_rate": 1.8365610102608263e-05, + "loss": 0.69, + "step": 5335 + }, + { + "epoch": 0.18, + "learning_rate": 1.8365013492558587e-05, + "loss": 0.6223, + "step": 5336 + }, + { + "epoch": 0.18, + "learning_rate": 1.8364416783331093e-05, + "loss": 0.6159, + "step": 5337 + }, + { + "epoch": 0.18, + "learning_rate": 1.8363819974932863e-05, + "loss": 0.6099, + "step": 5338 + }, + { + "epoch": 0.18, + "learning_rate": 1.836322306737096e-05, + "loss": 0.6502, + "step": 5339 + }, + { + "epoch": 0.19, + "learning_rate": 1.8362626060652472e-05, + "loss": 0.5467, + "step": 5340 + }, + { + "epoch": 0.19, + "learning_rate": 1.836202895478447e-05, + "loss": 0.6283, + "step": 5341 + }, + { + "epoch": 0.19, + "learning_rate": 1.836143174977404e-05, + "loss": 0.6195, + "step": 5342 + }, + { + "epoch": 0.19, + "learning_rate": 1.836083444562826e-05, + "loss": 0.6126, + "step": 5343 + }, + { + "epoch": 0.19, + "learning_rate": 1.8360237042354207e-05, + "loss": 0.7186, + "step": 5344 + }, + { + "epoch": 0.19, + "learning_rate": 1.835963953995897e-05, + "loss": 0.5851, + "step": 5345 + }, + { + "epoch": 0.19, + "learning_rate": 1.8359041938449636e-05, + "loss": 0.5955, + "step": 5346 + }, + { + "epoch": 0.19, + "learning_rate": 1.835844423783328e-05, + "loss": 0.6371, + "step": 5347 + }, + { + "epoch": 0.19, + "learning_rate": 1.8357846438116995e-05, + "loss": 0.6714, + "step": 5348 + }, + { + "epoch": 0.19, + "learning_rate": 1.835724853930787e-05, + "loss": 0.6596, + "step": 5349 + }, + { + "epoch": 0.19, + "learning_rate": 1.8356650541412987e-05, + "loss": 0.6761, + "step": 5350 + }, + { + "epoch": 0.19, + "learning_rate": 1.8356052444439445e-05, + "loss": 0.6088, + "step": 5351 + }, + { + "epoch": 0.19, + "learning_rate": 1.8355454248394328e-05, + "loss": 0.6246, + "step": 5352 + }, + { + "epoch": 0.19, + "learning_rate": 1.8354855953284733e-05, + "loss": 0.6227, + "step": 5353 + }, + { + "epoch": 0.19, + "learning_rate": 1.835425755911775e-05, + "loss": 0.6622, + "step": 5354 + }, + { + "epoch": 0.19, + "learning_rate": 1.835365906590048e-05, + "loss": 0.6466, + "step": 5355 + }, + { + "epoch": 0.19, + "learning_rate": 1.835306047364001e-05, + "loss": 0.6467, + "step": 5356 + }, + { + "epoch": 0.19, + "learning_rate": 1.835246178234344e-05, + "loss": 0.5771, + "step": 5357 + }, + { + "epoch": 0.19, + "learning_rate": 1.835186299201787e-05, + "loss": 0.6301, + "step": 5358 + }, + { + "epoch": 0.19, + "learning_rate": 1.8351264102670405e-05, + "loss": 0.6632, + "step": 5359 + }, + { + "epoch": 0.19, + "learning_rate": 1.8350665114308138e-05, + "loss": 0.649, + "step": 5360 + }, + { + "epoch": 0.19, + "learning_rate": 1.8350066026938168e-05, + "loss": 0.6598, + "step": 5361 + }, + { + "epoch": 0.19, + "learning_rate": 1.8349466840567604e-05, + "loss": 0.6782, + "step": 5362 + }, + { + "epoch": 0.19, + "learning_rate": 1.834886755520355e-05, + "loss": 0.5737, + "step": 5363 + }, + { + "epoch": 0.19, + "learning_rate": 1.8348268170853106e-05, + "loss": 0.6499, + "step": 5364 + }, + { + "epoch": 0.19, + "learning_rate": 1.834766868752339e-05, + "loss": 0.6001, + "step": 5365 + }, + { + "epoch": 0.19, + "learning_rate": 1.8347069105221493e-05, + "loss": 0.6542, + "step": 5366 + }, + { + "epoch": 0.19, + "learning_rate": 1.8346469423954535e-05, + "loss": 0.6349, + "step": 5367 + }, + { + "epoch": 0.19, + "learning_rate": 1.834586964372963e-05, + "loss": 0.6157, + "step": 5368 + }, + { + "epoch": 0.19, + "learning_rate": 1.8345269764553877e-05, + "loss": 0.6233, + "step": 5369 + }, + { + "epoch": 0.19, + "learning_rate": 1.8344669786434393e-05, + "loss": 0.6544, + "step": 5370 + }, + { + "epoch": 0.19, + "learning_rate": 1.8344069709378294e-05, + "loss": 0.6545, + "step": 5371 + }, + { + "epoch": 0.19, + "learning_rate": 1.8343469533392696e-05, + "loss": 0.599, + "step": 5372 + }, + { + "epoch": 0.19, + "learning_rate": 1.834286925848471e-05, + "loss": 0.7031, + "step": 5373 + }, + { + "epoch": 0.19, + "learning_rate": 1.8342268884661452e-05, + "loss": 0.6785, + "step": 5374 + }, + { + "epoch": 0.19, + "learning_rate": 1.834166841193005e-05, + "loss": 0.6267, + "step": 5375 + }, + { + "epoch": 0.19, + "learning_rate": 1.834106784029761e-05, + "loss": 0.636, + "step": 5376 + }, + { + "epoch": 0.19, + "learning_rate": 1.8340467169771266e-05, + "loss": 0.6181, + "step": 5377 + }, + { + "epoch": 0.19, + "learning_rate": 1.833986640035813e-05, + "loss": 0.6342, + "step": 5378 + }, + { + "epoch": 0.19, + "learning_rate": 1.8339265532065328e-05, + "loss": 0.6083, + "step": 5379 + }, + { + "epoch": 0.19, + "learning_rate": 1.833866456489998e-05, + "loss": 0.6292, + "step": 5380 + }, + { + "epoch": 0.19, + "learning_rate": 1.8338063498869218e-05, + "loss": 0.6312, + "step": 5381 + }, + { + "epoch": 0.19, + "learning_rate": 1.8337462333980166e-05, + "loss": 0.6259, + "step": 5382 + }, + { + "epoch": 0.19, + "learning_rate": 1.8336861070239954e-05, + "loss": 0.6167, + "step": 5383 + }, + { + "epoch": 0.19, + "learning_rate": 1.8336259707655702e-05, + "loss": 0.696, + "step": 5384 + }, + { + "epoch": 0.19, + "learning_rate": 1.833565824623455e-05, + "loss": 0.6203, + "step": 5385 + }, + { + "epoch": 0.19, + "learning_rate": 1.833505668598362e-05, + "loss": 0.6843, + "step": 5386 + }, + { + "epoch": 0.19, + "learning_rate": 1.8334455026910056e-05, + "loss": 0.6276, + "step": 5387 + }, + { + "epoch": 0.19, + "learning_rate": 1.833385326902098e-05, + "loss": 0.577, + "step": 5388 + }, + { + "epoch": 0.19, + "learning_rate": 1.8333251412323535e-05, + "loss": 0.6386, + "step": 5389 + }, + { + "epoch": 0.19, + "learning_rate": 1.8332649456824847e-05, + "loss": 0.6484, + "step": 5390 + }, + { + "epoch": 0.19, + "learning_rate": 1.8332047402532064e-05, + "loss": 0.6522, + "step": 5391 + }, + { + "epoch": 0.19, + "learning_rate": 1.8331445249452316e-05, + "loss": 0.6399, + "step": 5392 + }, + { + "epoch": 0.19, + "learning_rate": 1.8330842997592748e-05, + "loss": 0.5963, + "step": 5393 + }, + { + "epoch": 0.19, + "learning_rate": 1.8330240646960494e-05, + "loss": 0.6274, + "step": 5394 + }, + { + "epoch": 0.19, + "learning_rate": 1.83296381975627e-05, + "loss": 0.6197, + "step": 5395 + }, + { + "epoch": 0.19, + "learning_rate": 1.832903564940651e-05, + "loss": 0.5964, + "step": 5396 + }, + { + "epoch": 0.19, + "learning_rate": 1.8328433002499065e-05, + "loss": 0.6141, + "step": 5397 + }, + { + "epoch": 0.19, + "learning_rate": 1.832783025684751e-05, + "loss": 0.6741, + "step": 5398 + }, + { + "epoch": 0.19, + "learning_rate": 1.8327227412458994e-05, + "loss": 0.6568, + "step": 5399 + }, + { + "epoch": 0.19, + "learning_rate": 1.8326624469340662e-05, + "loss": 0.6958, + "step": 5400 + }, + { + "epoch": 0.19, + "learning_rate": 1.8326021427499668e-05, + "loss": 0.6332, + "step": 5401 + }, + { + "epoch": 0.19, + "learning_rate": 1.8325418286943153e-05, + "loss": 0.664, + "step": 5402 + }, + { + "epoch": 0.19, + "learning_rate": 1.8324815047678274e-05, + "loss": 0.643, + "step": 5403 + }, + { + "epoch": 0.19, + "learning_rate": 1.832421170971218e-05, + "loss": 0.6761, + "step": 5404 + }, + { + "epoch": 0.19, + "learning_rate": 1.8323608273052028e-05, + "loss": 0.6394, + "step": 5405 + }, + { + "epoch": 0.19, + "learning_rate": 1.832300473770497e-05, + "loss": 0.6174, + "step": 5406 + }, + { + "epoch": 0.19, + "learning_rate": 1.8322401103678163e-05, + "loss": 0.6466, + "step": 5407 + }, + { + "epoch": 0.19, + "learning_rate": 1.8321797370978764e-05, + "loss": 0.6128, + "step": 5408 + }, + { + "epoch": 0.19, + "learning_rate": 1.8321193539613924e-05, + "loss": 0.6315, + "step": 5409 + }, + { + "epoch": 0.19, + "learning_rate": 1.8320589609590813e-05, + "loss": 0.6512, + "step": 5410 + }, + { + "epoch": 0.19, + "learning_rate": 1.8319985580916588e-05, + "loss": 0.5846, + "step": 5411 + }, + { + "epoch": 0.19, + "learning_rate": 1.8319381453598406e-05, + "loss": 0.6276, + "step": 5412 + }, + { + "epoch": 0.19, + "learning_rate": 1.831877722764343e-05, + "loss": 0.5678, + "step": 5413 + }, + { + "epoch": 0.19, + "learning_rate": 1.8318172903058834e-05, + "loss": 0.6427, + "step": 5414 + }, + { + "epoch": 0.19, + "learning_rate": 1.8317568479851772e-05, + "loss": 0.6722, + "step": 5415 + }, + { + "epoch": 0.19, + "learning_rate": 1.831696395802941e-05, + "loss": 0.6378, + "step": 5416 + }, + { + "epoch": 0.19, + "learning_rate": 1.8316359337598928e-05, + "loss": 0.6209, + "step": 5417 + }, + { + "epoch": 0.19, + "learning_rate": 1.831575461856748e-05, + "loss": 0.6602, + "step": 5418 + }, + { + "epoch": 0.19, + "learning_rate": 1.8315149800942243e-05, + "loss": 0.6578, + "step": 5419 + }, + { + "epoch": 0.19, + "learning_rate": 1.8314544884730385e-05, + "loss": 0.6519, + "step": 5420 + }, + { + "epoch": 0.19, + "learning_rate": 1.8313939869939084e-05, + "loss": 0.636, + "step": 5421 + }, + { + "epoch": 0.19, + "learning_rate": 1.8313334756575503e-05, + "loss": 0.6368, + "step": 5422 + }, + { + "epoch": 0.19, + "learning_rate": 1.8312729544646824e-05, + "loss": 0.638, + "step": 5423 + }, + { + "epoch": 0.19, + "learning_rate": 1.831212423416022e-05, + "loss": 0.6661, + "step": 5424 + }, + { + "epoch": 0.19, + "learning_rate": 1.8311518825122873e-05, + "loss": 0.666, + "step": 5425 + }, + { + "epoch": 0.19, + "learning_rate": 1.831091331754195e-05, + "loss": 0.6202, + "step": 5426 + }, + { + "epoch": 0.19, + "learning_rate": 1.831030771142464e-05, + "loss": 0.6605, + "step": 5427 + }, + { + "epoch": 0.19, + "learning_rate": 1.8309702006778118e-05, + "loss": 0.7051, + "step": 5428 + }, + { + "epoch": 0.19, + "learning_rate": 1.8309096203609566e-05, + "loss": 0.5795, + "step": 5429 + }, + { + "epoch": 0.19, + "learning_rate": 1.8308490301926167e-05, + "loss": 0.652, + "step": 5430 + }, + { + "epoch": 0.19, + "learning_rate": 1.830788430173511e-05, + "loss": 0.6556, + "step": 5431 + }, + { + "epoch": 0.19, + "learning_rate": 1.830727820304357e-05, + "loss": 0.6892, + "step": 5432 + }, + { + "epoch": 0.19, + "learning_rate": 1.830667200585874e-05, + "loss": 0.6471, + "step": 5433 + }, + { + "epoch": 0.19, + "learning_rate": 1.8306065710187804e-05, + "loss": 0.6777, + "step": 5434 + }, + { + "epoch": 0.19, + "learning_rate": 1.830545931603795e-05, + "loss": 0.6327, + "step": 5435 + }, + { + "epoch": 0.19, + "learning_rate": 1.830485282341637e-05, + "loss": 0.67, + "step": 5436 + }, + { + "epoch": 0.19, + "learning_rate": 1.830424623233026e-05, + "loss": 0.6638, + "step": 5437 + }, + { + "epoch": 0.19, + "learning_rate": 1.8303639542786806e-05, + "loss": 0.6431, + "step": 5438 + }, + { + "epoch": 0.19, + "learning_rate": 1.8303032754793192e-05, + "loss": 0.6163, + "step": 5439 + }, + { + "epoch": 0.19, + "learning_rate": 1.830242586835663e-05, + "loss": 0.6604, + "step": 5440 + }, + { + "epoch": 0.19, + "learning_rate": 1.8301818883484303e-05, + "loss": 0.6012, + "step": 5441 + }, + { + "epoch": 0.19, + "learning_rate": 1.830121180018341e-05, + "loss": 0.6359, + "step": 5442 + }, + { + "epoch": 0.19, + "learning_rate": 1.8300604618461154e-05, + "loss": 0.6157, + "step": 5443 + }, + { + "epoch": 0.19, + "learning_rate": 1.8299997338324725e-05, + "loss": 0.6677, + "step": 5444 + }, + { + "epoch": 0.19, + "learning_rate": 1.8299389959781333e-05, + "loss": 0.6564, + "step": 5445 + }, + { + "epoch": 0.19, + "learning_rate": 1.829878248283817e-05, + "loss": 0.6511, + "step": 5446 + }, + { + "epoch": 0.19, + "learning_rate": 1.8298174907502442e-05, + "loss": 0.6636, + "step": 5447 + }, + { + "epoch": 0.19, + "learning_rate": 1.829756723378136e-05, + "loss": 0.5845, + "step": 5448 + }, + { + "epoch": 0.19, + "learning_rate": 1.8296959461682117e-05, + "loss": 0.6389, + "step": 5449 + }, + { + "epoch": 0.19, + "learning_rate": 1.8296351591211924e-05, + "loss": 0.6301, + "step": 5450 + }, + { + "epoch": 0.19, + "learning_rate": 1.829574362237799e-05, + "loss": 0.6651, + "step": 5451 + }, + { + "epoch": 0.19, + "learning_rate": 1.829513555518752e-05, + "loss": 0.6036, + "step": 5452 + }, + { + "epoch": 0.19, + "learning_rate": 1.8294527389647722e-05, + "loss": 0.6285, + "step": 5453 + }, + { + "epoch": 0.19, + "learning_rate": 1.8293919125765812e-05, + "loss": 0.6885, + "step": 5454 + }, + { + "epoch": 0.19, + "learning_rate": 1.8293310763548998e-05, + "loss": 0.6097, + "step": 5455 + }, + { + "epoch": 0.19, + "learning_rate": 1.8292702303004496e-05, + "loss": 0.6041, + "step": 5456 + }, + { + "epoch": 0.19, + "learning_rate": 1.8292093744139513e-05, + "loss": 0.5934, + "step": 5457 + }, + { + "epoch": 0.19, + "learning_rate": 1.8291485086961273e-05, + "loss": 0.6735, + "step": 5458 + }, + { + "epoch": 0.19, + "learning_rate": 1.8290876331476988e-05, + "loss": 0.6487, + "step": 5459 + }, + { + "epoch": 0.19, + "learning_rate": 1.8290267477693876e-05, + "loss": 0.6333, + "step": 5460 + }, + { + "epoch": 0.19, + "learning_rate": 1.8289658525619157e-05, + "loss": 0.6538, + "step": 5461 + }, + { + "epoch": 0.19, + "learning_rate": 1.8289049475260044e-05, + "loss": 0.6631, + "step": 5462 + }, + { + "epoch": 0.19, + "learning_rate": 1.828844032662377e-05, + "loss": 0.6722, + "step": 5463 + }, + { + "epoch": 0.19, + "learning_rate": 1.828783107971755e-05, + "loss": 0.6439, + "step": 5464 + }, + { + "epoch": 0.19, + "learning_rate": 1.828722173454861e-05, + "loss": 0.6113, + "step": 5465 + }, + { + "epoch": 0.19, + "learning_rate": 1.828661229112417e-05, + "loss": 0.6688, + "step": 5466 + }, + { + "epoch": 0.19, + "learning_rate": 1.8286002749451458e-05, + "loss": 0.5986, + "step": 5467 + }, + { + "epoch": 0.19, + "learning_rate": 1.82853931095377e-05, + "loss": 0.648, + "step": 5468 + }, + { + "epoch": 0.19, + "learning_rate": 1.828478337139013e-05, + "loss": 0.6518, + "step": 5469 + }, + { + "epoch": 0.19, + "learning_rate": 1.828417353501597e-05, + "loss": 0.6205, + "step": 5470 + }, + { + "epoch": 0.19, + "learning_rate": 1.8283563600422453e-05, + "loss": 0.6601, + "step": 5471 + }, + { + "epoch": 0.19, + "learning_rate": 1.8282953567616814e-05, + "loss": 0.6496, + "step": 5472 + }, + { + "epoch": 0.19, + "learning_rate": 1.828234343660628e-05, + "loss": 0.5873, + "step": 5473 + }, + { + "epoch": 0.19, + "learning_rate": 1.8281733207398086e-05, + "loss": 0.6425, + "step": 5474 + }, + { + "epoch": 0.19, + "learning_rate": 1.828112287999947e-05, + "loss": 0.627, + "step": 5475 + }, + { + "epoch": 0.19, + "learning_rate": 1.828051245441767e-05, + "loss": 0.6386, + "step": 5476 + }, + { + "epoch": 0.19, + "learning_rate": 1.8279901930659914e-05, + "loss": 0.6222, + "step": 5477 + }, + { + "epoch": 0.19, + "learning_rate": 1.827929130873345e-05, + "loss": 0.6334, + "step": 5478 + }, + { + "epoch": 0.19, + "learning_rate": 1.8278680588645513e-05, + "loss": 0.6453, + "step": 5479 + }, + { + "epoch": 0.19, + "learning_rate": 1.827806977040335e-05, + "loss": 0.6294, + "step": 5480 + }, + { + "epoch": 0.19, + "learning_rate": 1.827745885401419e-05, + "loss": 0.6221, + "step": 5481 + }, + { + "epoch": 0.19, + "learning_rate": 1.8276847839485287e-05, + "loss": 0.6733, + "step": 5482 + }, + { + "epoch": 0.19, + "learning_rate": 1.8276236726823886e-05, + "loss": 0.6213, + "step": 5483 + }, + { + "epoch": 0.19, + "learning_rate": 1.8275625516037225e-05, + "loss": 0.634, + "step": 5484 + }, + { + "epoch": 0.19, + "learning_rate": 1.8275014207132555e-05, + "loss": 0.6766, + "step": 5485 + }, + { + "epoch": 0.19, + "learning_rate": 1.8274402800117125e-05, + "loss": 0.643, + "step": 5486 + }, + { + "epoch": 0.19, + "learning_rate": 1.8273791294998184e-05, + "loss": 0.6178, + "step": 5487 + }, + { + "epoch": 0.19, + "learning_rate": 1.8273179691782978e-05, + "loss": 0.6375, + "step": 5488 + }, + { + "epoch": 0.19, + "learning_rate": 1.827256799047876e-05, + "loss": 0.6277, + "step": 5489 + }, + { + "epoch": 0.19, + "learning_rate": 1.8271956191092788e-05, + "loss": 0.6202, + "step": 5490 + }, + { + "epoch": 0.19, + "learning_rate": 1.827134429363231e-05, + "loss": 0.604, + "step": 5491 + }, + { + "epoch": 0.19, + "learning_rate": 1.8270732298104584e-05, + "loss": 0.6512, + "step": 5492 + }, + { + "epoch": 0.19, + "learning_rate": 1.827012020451686e-05, + "loss": 0.6152, + "step": 5493 + }, + { + "epoch": 0.19, + "learning_rate": 1.82695080128764e-05, + "loss": 0.6622, + "step": 5494 + }, + { + "epoch": 0.19, + "learning_rate": 1.826889572319046e-05, + "loss": 0.5792, + "step": 5495 + }, + { + "epoch": 0.19, + "learning_rate": 1.8268283335466304e-05, + "loss": 0.7125, + "step": 5496 + }, + { + "epoch": 0.19, + "learning_rate": 1.826767084971119e-05, + "loss": 0.6577, + "step": 5497 + }, + { + "epoch": 0.19, + "learning_rate": 1.826705826593238e-05, + "loss": 0.6308, + "step": 5498 + }, + { + "epoch": 0.19, + "learning_rate": 1.826644558413713e-05, + "loss": 0.5865, + "step": 5499 + }, + { + "epoch": 0.19, + "learning_rate": 1.8265832804332717e-05, + "loss": 0.6244, + "step": 5500 + }, + { + "epoch": 0.19, + "learning_rate": 1.8265219926526398e-05, + "loss": 0.6203, + "step": 5501 + }, + { + "epoch": 0.19, + "learning_rate": 1.826460695072544e-05, + "loss": 0.6474, + "step": 5502 + }, + { + "epoch": 0.19, + "learning_rate": 1.8263993876937114e-05, + "loss": 0.6529, + "step": 5503 + }, + { + "epoch": 0.19, + "learning_rate": 1.826338070516869e-05, + "loss": 0.6141, + "step": 5504 + }, + { + "epoch": 0.19, + "learning_rate": 1.8262767435427428e-05, + "loss": 0.64, + "step": 5505 + }, + { + "epoch": 0.19, + "learning_rate": 1.8262154067720606e-05, + "loss": 0.6458, + "step": 5506 + }, + { + "epoch": 0.19, + "learning_rate": 1.82615406020555e-05, + "loss": 0.6538, + "step": 5507 + }, + { + "epoch": 0.19, + "learning_rate": 1.8260927038439375e-05, + "loss": 0.6771, + "step": 5508 + }, + { + "epoch": 0.19, + "learning_rate": 1.826031337687951e-05, + "loss": 0.5957, + "step": 5509 + }, + { + "epoch": 0.19, + "learning_rate": 1.825969961738318e-05, + "loss": 0.5753, + "step": 5510 + }, + { + "epoch": 0.19, + "learning_rate": 1.8259085759957667e-05, + "loss": 0.6326, + "step": 5511 + }, + { + "epoch": 0.19, + "learning_rate": 1.825847180461024e-05, + "loss": 0.6056, + "step": 5512 + }, + { + "epoch": 0.19, + "learning_rate": 1.8257857751348188e-05, + "loss": 0.6173, + "step": 5513 + }, + { + "epoch": 0.19, + "learning_rate": 1.825724360017878e-05, + "loss": 0.6031, + "step": 5514 + }, + { + "epoch": 0.19, + "learning_rate": 1.825662935110931e-05, + "loss": 0.6386, + "step": 5515 + }, + { + "epoch": 0.19, + "learning_rate": 1.825601500414705e-05, + "loss": 0.6342, + "step": 5516 + }, + { + "epoch": 0.19, + "learning_rate": 1.825540055929929e-05, + "loss": 0.5765, + "step": 5517 + }, + { + "epoch": 0.19, + "learning_rate": 1.8254786016573313e-05, + "loss": 0.6222, + "step": 5518 + }, + { + "epoch": 0.19, + "learning_rate": 1.8254171375976403e-05, + "loss": 0.6798, + "step": 5519 + }, + { + "epoch": 0.19, + "learning_rate": 1.8253556637515852e-05, + "loss": 0.5926, + "step": 5520 + }, + { + "epoch": 0.19, + "learning_rate": 1.8252941801198946e-05, + "loss": 0.6688, + "step": 5521 + }, + { + "epoch": 0.19, + "learning_rate": 1.8252326867032973e-05, + "loss": 0.6777, + "step": 5522 + }, + { + "epoch": 0.19, + "learning_rate": 1.825171183502523e-05, + "loss": 0.6393, + "step": 5523 + }, + { + "epoch": 0.19, + "learning_rate": 1.8251096705183e-05, + "loss": 0.6157, + "step": 5524 + }, + { + "epoch": 0.19, + "learning_rate": 1.8250481477513583e-05, + "loss": 0.6484, + "step": 5525 + }, + { + "epoch": 0.19, + "learning_rate": 1.824986615202427e-05, + "loss": 0.6149, + "step": 5526 + }, + { + "epoch": 0.19, + "learning_rate": 1.824925072872236e-05, + "loss": 0.6351, + "step": 5527 + }, + { + "epoch": 0.19, + "learning_rate": 1.8248635207615147e-05, + "loss": 0.6013, + "step": 5528 + }, + { + "epoch": 0.19, + "learning_rate": 1.824801958870993e-05, + "loss": 0.6152, + "step": 5529 + }, + { + "epoch": 0.19, + "learning_rate": 1.8247403872014e-05, + "loss": 0.6026, + "step": 5530 + }, + { + "epoch": 0.19, + "learning_rate": 1.8246788057534672e-05, + "loss": 0.6801, + "step": 5531 + }, + { + "epoch": 0.19, + "learning_rate": 1.8246172145279237e-05, + "loss": 0.6636, + "step": 5532 + }, + { + "epoch": 0.19, + "learning_rate": 1.8245556135255e-05, + "loss": 0.6327, + "step": 5533 + }, + { + "epoch": 0.19, + "learning_rate": 1.8244940027469263e-05, + "loss": 0.6373, + "step": 5534 + }, + { + "epoch": 0.19, + "learning_rate": 1.8244323821929334e-05, + "loss": 0.6658, + "step": 5535 + }, + { + "epoch": 0.19, + "learning_rate": 1.8243707518642514e-05, + "loss": 0.6185, + "step": 5536 + }, + { + "epoch": 0.19, + "learning_rate": 1.8243091117616115e-05, + "loss": 0.5985, + "step": 5537 + }, + { + "epoch": 0.19, + "learning_rate": 1.8242474618857442e-05, + "loss": 0.6476, + "step": 5538 + }, + { + "epoch": 0.19, + "learning_rate": 1.8241858022373807e-05, + "loss": 0.6566, + "step": 5539 + }, + { + "epoch": 0.19, + "learning_rate": 1.824124132817252e-05, + "loss": 0.6255, + "step": 5540 + }, + { + "epoch": 0.19, + "learning_rate": 1.824062453626089e-05, + "loss": 0.6315, + "step": 5541 + }, + { + "epoch": 0.19, + "learning_rate": 1.824000764664623e-05, + "loss": 0.6915, + "step": 5542 + }, + { + "epoch": 0.19, + "learning_rate": 1.823939065933586e-05, + "loss": 0.6583, + "step": 5543 + }, + { + "epoch": 0.19, + "learning_rate": 1.823877357433709e-05, + "loss": 0.7038, + "step": 5544 + }, + { + "epoch": 0.19, + "learning_rate": 1.8238156391657234e-05, + "loss": 0.6627, + "step": 5545 + }, + { + "epoch": 0.19, + "learning_rate": 1.8237539111303615e-05, + "loss": 0.6746, + "step": 5546 + }, + { + "epoch": 0.19, + "learning_rate": 1.8236921733283547e-05, + "loss": 0.6617, + "step": 5547 + }, + { + "epoch": 0.19, + "learning_rate": 1.8236304257604357e-05, + "loss": 0.6575, + "step": 5548 + }, + { + "epoch": 0.19, + "learning_rate": 1.8235686684273358e-05, + "loss": 0.6495, + "step": 5549 + }, + { + "epoch": 0.19, + "learning_rate": 1.8235069013297875e-05, + "loss": 0.6438, + "step": 5550 + }, + { + "epoch": 0.19, + "learning_rate": 1.8234451244685232e-05, + "loss": 0.677, + "step": 5551 + }, + { + "epoch": 0.19, + "learning_rate": 1.8233833378442752e-05, + "loss": 0.6836, + "step": 5552 + }, + { + "epoch": 0.19, + "learning_rate": 1.823321541457776e-05, + "loss": 0.6971, + "step": 5553 + }, + { + "epoch": 0.19, + "learning_rate": 1.8232597353097587e-05, + "loss": 0.6726, + "step": 5554 + }, + { + "epoch": 0.19, + "learning_rate": 1.8231979194009556e-05, + "loss": 0.6364, + "step": 5555 + }, + { + "epoch": 0.19, + "learning_rate": 1.8231360937321e-05, + "loss": 0.6137, + "step": 5556 + }, + { + "epoch": 0.19, + "learning_rate": 1.8230742583039245e-05, + "loss": 0.6449, + "step": 5557 + }, + { + "epoch": 0.19, + "learning_rate": 1.8230124131171626e-05, + "loss": 0.6651, + "step": 5558 + }, + { + "epoch": 0.19, + "learning_rate": 1.8229505581725476e-05, + "loss": 0.6005, + "step": 5559 + }, + { + "epoch": 0.19, + "learning_rate": 1.8228886934708127e-05, + "loss": 0.6244, + "step": 5560 + }, + { + "epoch": 0.19, + "learning_rate": 1.822826819012691e-05, + "loss": 0.669, + "step": 5561 + }, + { + "epoch": 0.19, + "learning_rate": 1.822764934798917e-05, + "loss": 0.653, + "step": 5562 + }, + { + "epoch": 0.19, + "learning_rate": 1.8227030408302236e-05, + "loss": 0.643, + "step": 5563 + }, + { + "epoch": 0.19, + "learning_rate": 1.822641137107345e-05, + "loss": 0.6253, + "step": 5564 + }, + { + "epoch": 0.19, + "learning_rate": 1.822579223631015e-05, + "loss": 0.6401, + "step": 5565 + }, + { + "epoch": 0.19, + "learning_rate": 1.8225173004019675e-05, + "loss": 0.6873, + "step": 5566 + }, + { + "epoch": 0.19, + "learning_rate": 1.8224553674209372e-05, + "loss": 0.6521, + "step": 5567 + }, + { + "epoch": 0.19, + "learning_rate": 1.822393424688658e-05, + "loss": 0.6154, + "step": 5568 + }, + { + "epoch": 0.19, + "learning_rate": 1.8223314722058647e-05, + "loss": 0.6674, + "step": 5569 + }, + { + "epoch": 0.19, + "learning_rate": 1.8222695099732912e-05, + "loss": 0.6535, + "step": 5570 + }, + { + "epoch": 0.19, + "learning_rate": 1.8222075379916728e-05, + "loss": 0.6556, + "step": 5571 + }, + { + "epoch": 0.19, + "learning_rate": 1.822145556261744e-05, + "loss": 0.5962, + "step": 5572 + }, + { + "epoch": 0.19, + "learning_rate": 1.822083564784239e-05, + "loss": 0.6828, + "step": 5573 + }, + { + "epoch": 0.19, + "learning_rate": 1.8220215635598938e-05, + "loss": 0.6538, + "step": 5574 + }, + { + "epoch": 0.19, + "learning_rate": 1.821959552589443e-05, + "loss": 0.6265, + "step": 5575 + }, + { + "epoch": 0.19, + "learning_rate": 1.821897531873622e-05, + "loss": 0.659, + "step": 5576 + }, + { + "epoch": 0.19, + "learning_rate": 1.8218355014131662e-05, + "loss": 0.6303, + "step": 5577 + }, + { + "epoch": 0.19, + "learning_rate": 1.8217734612088108e-05, + "loss": 0.6235, + "step": 5578 + }, + { + "epoch": 0.19, + "learning_rate": 1.8217114112612912e-05, + "loss": 0.6286, + "step": 5579 + }, + { + "epoch": 0.19, + "learning_rate": 1.8216493515713437e-05, + "loss": 0.5933, + "step": 5580 + }, + { + "epoch": 0.19, + "learning_rate": 1.8215872821397034e-05, + "loss": 0.648, + "step": 5581 + }, + { + "epoch": 0.19, + "learning_rate": 1.821525202967107e-05, + "loss": 0.6492, + "step": 5582 + }, + { + "epoch": 0.19, + "learning_rate": 1.8214631140542896e-05, + "loss": 0.6445, + "step": 5583 + }, + { + "epoch": 0.19, + "learning_rate": 1.821401015401988e-05, + "loss": 0.6458, + "step": 5584 + }, + { + "epoch": 0.19, + "learning_rate": 1.8213389070109385e-05, + "loss": 0.657, + "step": 5585 + }, + { + "epoch": 0.19, + "learning_rate": 1.8212767888818772e-05, + "loss": 0.6497, + "step": 5586 + }, + { + "epoch": 0.19, + "learning_rate": 1.8212146610155407e-05, + "loss": 0.6569, + "step": 5587 + }, + { + "epoch": 0.19, + "learning_rate": 1.821152523412665e-05, + "loss": 0.5769, + "step": 5588 + }, + { + "epoch": 0.19, + "learning_rate": 1.821090376073988e-05, + "loss": 0.6527, + "step": 5589 + }, + { + "epoch": 0.19, + "learning_rate": 1.8210282190002458e-05, + "loss": 0.6758, + "step": 5590 + }, + { + "epoch": 0.19, + "learning_rate": 1.8209660521921753e-05, + "loss": 0.6408, + "step": 5591 + }, + { + "epoch": 0.19, + "learning_rate": 1.8209038756505137e-05, + "loss": 0.6058, + "step": 5592 + }, + { + "epoch": 0.19, + "learning_rate": 1.8208416893759984e-05, + "loss": 0.705, + "step": 5593 + }, + { + "epoch": 0.19, + "learning_rate": 1.8207794933693663e-05, + "loss": 0.6479, + "step": 5594 + }, + { + "epoch": 0.19, + "learning_rate": 1.820717287631355e-05, + "loss": 0.6443, + "step": 5595 + }, + { + "epoch": 0.19, + "learning_rate": 1.8206550721627022e-05, + "loss": 0.6557, + "step": 5596 + }, + { + "epoch": 0.19, + "learning_rate": 1.8205928469641454e-05, + "loss": 0.6964, + "step": 5597 + }, + { + "epoch": 0.19, + "learning_rate": 1.8205306120364222e-05, + "loss": 0.6388, + "step": 5598 + }, + { + "epoch": 0.19, + "learning_rate": 1.8204683673802708e-05, + "loss": 0.6353, + "step": 5599 + }, + { + "epoch": 0.19, + "learning_rate": 1.8204061129964288e-05, + "loss": 0.6237, + "step": 5600 + }, + { + "epoch": 0.19, + "learning_rate": 1.8203438488856348e-05, + "loss": 0.6607, + "step": 5601 + }, + { + "epoch": 0.19, + "learning_rate": 1.8202815750486264e-05, + "loss": 0.6388, + "step": 5602 + }, + { + "epoch": 0.19, + "learning_rate": 1.8202192914861423e-05, + "loss": 0.6502, + "step": 5603 + }, + { + "epoch": 0.19, + "learning_rate": 1.820156998198921e-05, + "loss": 0.635, + "step": 5604 + }, + { + "epoch": 0.19, + "learning_rate": 1.820094695187701e-05, + "loss": 0.6079, + "step": 5605 + }, + { + "epoch": 0.19, + "learning_rate": 1.820032382453221e-05, + "loss": 0.6103, + "step": 5606 + }, + { + "epoch": 0.19, + "learning_rate": 1.81997005999622e-05, + "loss": 0.6061, + "step": 5607 + }, + { + "epoch": 0.19, + "learning_rate": 1.819907727817436e-05, + "loss": 0.6136, + "step": 5608 + }, + { + "epoch": 0.19, + "learning_rate": 1.8198453859176093e-05, + "loss": 0.6008, + "step": 5609 + }, + { + "epoch": 0.19, + "learning_rate": 1.8197830342974783e-05, + "loss": 0.6617, + "step": 5610 + }, + { + "epoch": 0.19, + "learning_rate": 1.819720672957782e-05, + "loss": 0.6672, + "step": 5611 + }, + { + "epoch": 0.19, + "learning_rate": 1.8196583018992608e-05, + "loss": 0.6834, + "step": 5612 + }, + { + "epoch": 0.19, + "learning_rate": 1.819595921122653e-05, + "loss": 0.6469, + "step": 5613 + }, + { + "epoch": 0.19, + "learning_rate": 1.8195335306286993e-05, + "loss": 0.6241, + "step": 5614 + }, + { + "epoch": 0.19, + "learning_rate": 1.8194711304181384e-05, + "loss": 0.5881, + "step": 5615 + }, + { + "epoch": 0.19, + "learning_rate": 1.819408720491711e-05, + "loss": 0.6256, + "step": 5616 + }, + { + "epoch": 0.19, + "learning_rate": 1.8193463008501565e-05, + "loss": 0.6255, + "step": 5617 + }, + { + "epoch": 0.19, + "learning_rate": 1.819283871494215e-05, + "loss": 0.6257, + "step": 5618 + }, + { + "epoch": 0.19, + "learning_rate": 1.819221432424627e-05, + "loss": 0.5905, + "step": 5619 + }, + { + "epoch": 0.19, + "learning_rate": 1.8191589836421322e-05, + "loss": 0.6378, + "step": 5620 + }, + { + "epoch": 0.19, + "learning_rate": 1.819096525147472e-05, + "loss": 0.6903, + "step": 5621 + }, + { + "epoch": 0.19, + "learning_rate": 1.819034056941386e-05, + "loss": 0.6382, + "step": 5622 + }, + { + "epoch": 0.19, + "learning_rate": 1.818971579024615e-05, + "loss": 0.6435, + "step": 5623 + }, + { + "epoch": 0.19, + "learning_rate": 1.8189090913979e-05, + "loss": 0.6316, + "step": 5624 + }, + { + "epoch": 0.19, + "learning_rate": 1.8188465940619823e-05, + "loss": 0.6905, + "step": 5625 + }, + { + "epoch": 0.19, + "learning_rate": 1.818784087017602e-05, + "loss": 0.7193, + "step": 5626 + }, + { + "epoch": 0.19, + "learning_rate": 1.8187215702655004e-05, + "loss": 0.6179, + "step": 5627 + }, + { + "epoch": 0.19, + "learning_rate": 1.8186590438064192e-05, + "loss": 0.6333, + "step": 5628 + }, + { + "epoch": 0.2, + "learning_rate": 1.8185965076410994e-05, + "loss": 0.7022, + "step": 5629 + }, + { + "epoch": 0.2, + "learning_rate": 1.8185339617702822e-05, + "loss": 0.673, + "step": 5630 + }, + { + "epoch": 0.2, + "learning_rate": 1.8184714061947098e-05, + "loss": 0.6772, + "step": 5631 + }, + { + "epoch": 0.2, + "learning_rate": 1.8184088409151233e-05, + "loss": 0.6865, + "step": 5632 + }, + { + "epoch": 0.2, + "learning_rate": 1.818346265932265e-05, + "loss": 0.6913, + "step": 5633 + }, + { + "epoch": 0.2, + "learning_rate": 1.818283681246876e-05, + "loss": 0.6006, + "step": 5634 + }, + { + "epoch": 0.2, + "learning_rate": 1.818221086859699e-05, + "loss": 0.5941, + "step": 5635 + }, + { + "epoch": 0.2, + "learning_rate": 1.818158482771476e-05, + "loss": 0.6682, + "step": 5636 + }, + { + "epoch": 0.2, + "learning_rate": 1.8180958689829493e-05, + "loss": 0.6147, + "step": 5637 + }, + { + "epoch": 0.2, + "learning_rate": 1.818033245494861e-05, + "loss": 0.5888, + "step": 5638 + }, + { + "epoch": 0.2, + "learning_rate": 1.817970612307954e-05, + "loss": 0.6053, + "step": 5639 + }, + { + "epoch": 0.2, + "learning_rate": 1.8179079694229704e-05, + "loss": 0.6374, + "step": 5640 + }, + { + "epoch": 0.2, + "learning_rate": 1.8178453168406535e-05, + "loss": 0.5984, + "step": 5641 + }, + { + "epoch": 0.2, + "learning_rate": 1.8177826545617454e-05, + "loss": 0.6772, + "step": 5642 + }, + { + "epoch": 0.2, + "learning_rate": 1.8177199825869897e-05, + "loss": 0.6536, + "step": 5643 + }, + { + "epoch": 0.2, + "learning_rate": 1.817657300917129e-05, + "loss": 0.6478, + "step": 5644 + }, + { + "epoch": 0.2, + "learning_rate": 1.8175946095529066e-05, + "loss": 0.5984, + "step": 5645 + }, + { + "epoch": 0.2, + "learning_rate": 1.8175319084950663e-05, + "loss": 0.6705, + "step": 5646 + }, + { + "epoch": 0.2, + "learning_rate": 1.8174691977443505e-05, + "loss": 0.6436, + "step": 5647 + }, + { + "epoch": 0.2, + "learning_rate": 1.8174064773015035e-05, + "loss": 0.6075, + "step": 5648 + }, + { + "epoch": 0.2, + "learning_rate": 1.8173437471672688e-05, + "loss": 0.6667, + "step": 5649 + }, + { + "epoch": 0.2, + "learning_rate": 1.81728100734239e-05, + "loss": 0.572, + "step": 5650 + }, + { + "epoch": 0.2, + "learning_rate": 1.8172182578276104e-05, + "loss": 0.6472, + "step": 5651 + }, + { + "epoch": 0.2, + "learning_rate": 1.8171554986236756e-05, + "loss": 0.6339, + "step": 5652 + }, + { + "epoch": 0.2, + "learning_rate": 1.8170927297313277e-05, + "loss": 0.6363, + "step": 5653 + }, + { + "epoch": 0.2, + "learning_rate": 1.8170299511513122e-05, + "loss": 0.6336, + "step": 5654 + }, + { + "epoch": 0.2, + "learning_rate": 1.8169671628843732e-05, + "loss": 0.6678, + "step": 5655 + }, + { + "epoch": 0.2, + "learning_rate": 1.8169043649312553e-05, + "loss": 0.616, + "step": 5656 + }, + { + "epoch": 0.2, + "learning_rate": 1.8168415572927022e-05, + "loss": 0.6423, + "step": 5657 + }, + { + "epoch": 0.2, + "learning_rate": 1.8167787399694594e-05, + "loss": 0.6564, + "step": 5658 + }, + { + "epoch": 0.2, + "learning_rate": 1.8167159129622715e-05, + "loss": 0.6705, + "step": 5659 + }, + { + "epoch": 0.2, + "learning_rate": 1.816653076271883e-05, + "loss": 0.6319, + "step": 5660 + }, + { + "epoch": 0.2, + "learning_rate": 1.8165902298990393e-05, + "loss": 0.6624, + "step": 5661 + }, + { + "epoch": 0.2, + "learning_rate": 1.8165273738444855e-05, + "loss": 0.6135, + "step": 5662 + }, + { + "epoch": 0.2, + "learning_rate": 1.8164645081089668e-05, + "loss": 0.6441, + "step": 5663 + }, + { + "epoch": 0.2, + "learning_rate": 1.8164016326932286e-05, + "loss": 0.6864, + "step": 5664 + }, + { + "epoch": 0.2, + "learning_rate": 1.816338747598016e-05, + "loss": 0.6524, + "step": 5665 + }, + { + "epoch": 0.2, + "learning_rate": 1.816275852824075e-05, + "loss": 0.6269, + "step": 5666 + }, + { + "epoch": 0.2, + "learning_rate": 1.8162129483721515e-05, + "loss": 0.6116, + "step": 5667 + }, + { + "epoch": 0.2, + "learning_rate": 1.8161500342429907e-05, + "loss": 0.6031, + "step": 5668 + }, + { + "epoch": 0.2, + "learning_rate": 1.816087110437339e-05, + "loss": 0.643, + "step": 5669 + }, + { + "epoch": 0.2, + "learning_rate": 1.8160241769559422e-05, + "loss": 0.5983, + "step": 5670 + }, + { + "epoch": 0.2, + "learning_rate": 1.815961233799546e-05, + "loss": 0.641, + "step": 5671 + }, + { + "epoch": 0.2, + "learning_rate": 1.815898280968898e-05, + "loss": 0.637, + "step": 5672 + }, + { + "epoch": 0.2, + "learning_rate": 1.815835318464743e-05, + "loss": 0.6298, + "step": 5673 + }, + { + "epoch": 0.2, + "learning_rate": 1.8157723462878288e-05, + "loss": 0.7178, + "step": 5674 + }, + { + "epoch": 0.2, + "learning_rate": 1.815709364438901e-05, + "loss": 0.668, + "step": 5675 + }, + { + "epoch": 0.2, + "learning_rate": 1.8156463729187073e-05, + "loss": 0.616, + "step": 5676 + }, + { + "epoch": 0.2, + "learning_rate": 1.8155833717279938e-05, + "loss": 0.6202, + "step": 5677 + }, + { + "epoch": 0.2, + "learning_rate": 1.8155203608675077e-05, + "loss": 0.6328, + "step": 5678 + }, + { + "epoch": 0.2, + "learning_rate": 1.815457340337996e-05, + "loss": 0.6795, + "step": 5679 + }, + { + "epoch": 0.2, + "learning_rate": 1.815394310140206e-05, + "loss": 0.5134, + "step": 5680 + }, + { + "epoch": 0.2, + "learning_rate": 1.8153312702748854e-05, + "loss": 0.593, + "step": 5681 + }, + { + "epoch": 0.2, + "learning_rate": 1.815268220742781e-05, + "loss": 0.6712, + "step": 5682 + }, + { + "epoch": 0.2, + "learning_rate": 1.8152051615446402e-05, + "loss": 0.6376, + "step": 5683 + }, + { + "epoch": 0.2, + "learning_rate": 1.8151420926812113e-05, + "loss": 0.6416, + "step": 5684 + }, + { + "epoch": 0.2, + "learning_rate": 1.8150790141532414e-05, + "loss": 0.6131, + "step": 5685 + }, + { + "epoch": 0.2, + "learning_rate": 1.8150159259614788e-05, + "loss": 0.6331, + "step": 5686 + }, + { + "epoch": 0.2, + "learning_rate": 1.8149528281066714e-05, + "loss": 0.6571, + "step": 5687 + }, + { + "epoch": 0.2, + "learning_rate": 1.8148897205895675e-05, + "loss": 0.661, + "step": 5688 + }, + { + "epoch": 0.2, + "learning_rate": 1.814826603410915e-05, + "loss": 0.6878, + "step": 5689 + }, + { + "epoch": 0.2, + "learning_rate": 1.8147634765714625e-05, + "loss": 0.609, + "step": 5690 + }, + { + "epoch": 0.2, + "learning_rate": 1.814700340071958e-05, + "loss": 0.6181, + "step": 5691 + }, + { + "epoch": 0.2, + "learning_rate": 1.8146371939131504e-05, + "loss": 0.6766, + "step": 5692 + }, + { + "epoch": 0.2, + "learning_rate": 1.8145740380957887e-05, + "loss": 0.6108, + "step": 5693 + }, + { + "epoch": 0.2, + "learning_rate": 1.814510872620621e-05, + "loss": 0.6255, + "step": 5694 + }, + { + "epoch": 0.2, + "learning_rate": 1.8144476974883968e-05, + "loss": 0.6319, + "step": 5695 + }, + { + "epoch": 0.2, + "learning_rate": 1.8143845126998645e-05, + "loss": 0.6559, + "step": 5696 + }, + { + "epoch": 0.2, + "learning_rate": 1.814321318255774e-05, + "loss": 0.6219, + "step": 5697 + }, + { + "epoch": 0.2, + "learning_rate": 1.814258114156874e-05, + "loss": 0.673, + "step": 5698 + }, + { + "epoch": 0.2, + "learning_rate": 1.8141949004039138e-05, + "loss": 0.6578, + "step": 5699 + }, + { + "epoch": 0.2, + "learning_rate": 1.8141316769976435e-05, + "loss": 0.637, + "step": 5700 + }, + { + "epoch": 0.2, + "learning_rate": 1.814068443938812e-05, + "loss": 0.6665, + "step": 5701 + }, + { + "epoch": 0.2, + "learning_rate": 1.814005201228169e-05, + "loss": 0.6677, + "step": 5702 + }, + { + "epoch": 0.2, + "learning_rate": 1.8139419488664654e-05, + "loss": 0.6171, + "step": 5703 + }, + { + "epoch": 0.2, + "learning_rate": 1.81387868685445e-05, + "loss": 0.6328, + "step": 5704 + }, + { + "epoch": 0.2, + "learning_rate": 1.813815415192873e-05, + "loss": 0.6259, + "step": 5705 + }, + { + "epoch": 0.2, + "learning_rate": 1.813752133882485e-05, + "loss": 0.6429, + "step": 5706 + }, + { + "epoch": 0.2, + "learning_rate": 1.813688842924036e-05, + "loss": 0.5939, + "step": 5707 + }, + { + "epoch": 0.2, + "learning_rate": 1.813625542318276e-05, + "loss": 0.6557, + "step": 5708 + }, + { + "epoch": 0.2, + "learning_rate": 1.813562232065957e-05, + "loss": 0.61, + "step": 5709 + }, + { + "epoch": 0.2, + "learning_rate": 1.8134989121678277e-05, + "loss": 0.6052, + "step": 5710 + }, + { + "epoch": 0.2, + "learning_rate": 1.81343558262464e-05, + "loss": 0.6129, + "step": 5711 + }, + { + "epoch": 0.2, + "learning_rate": 1.8133722434371444e-05, + "loss": 0.641, + "step": 5712 + }, + { + "epoch": 0.2, + "learning_rate": 1.8133088946060916e-05, + "loss": 0.6223, + "step": 5713 + }, + { + "epoch": 0.2, + "learning_rate": 1.8132455361322337e-05, + "loss": 0.5894, + "step": 5714 + }, + { + "epoch": 0.2, + "learning_rate": 1.813182168016321e-05, + "loss": 0.6749, + "step": 5715 + }, + { + "epoch": 0.2, + "learning_rate": 1.813118790259105e-05, + "loss": 0.648, + "step": 5716 + }, + { + "epoch": 0.2, + "learning_rate": 1.813055402861337e-05, + "loss": 0.6845, + "step": 5717 + }, + { + "epoch": 0.2, + "learning_rate": 1.8129920058237685e-05, + "loss": 0.6029, + "step": 5718 + }, + { + "epoch": 0.2, + "learning_rate": 1.8129285991471514e-05, + "loss": 0.6168, + "step": 5719 + }, + { + "epoch": 0.2, + "learning_rate": 1.8128651828322376e-05, + "loss": 0.6008, + "step": 5720 + }, + { + "epoch": 0.2, + "learning_rate": 1.812801756879779e-05, + "loss": 0.6453, + "step": 5721 + }, + { + "epoch": 0.2, + "learning_rate": 1.8127383212905267e-05, + "loss": 0.6513, + "step": 5722 + }, + { + "epoch": 0.2, + "learning_rate": 1.8126748760652343e-05, + "loss": 0.5887, + "step": 5723 + }, + { + "epoch": 0.2, + "learning_rate": 1.8126114212046527e-05, + "loss": 0.5915, + "step": 5724 + }, + { + "epoch": 0.2, + "learning_rate": 1.812547956709535e-05, + "loss": 0.6419, + "step": 5725 + }, + { + "epoch": 0.2, + "learning_rate": 1.812484482580633e-05, + "loss": 0.626, + "step": 5726 + }, + { + "epoch": 0.2, + "learning_rate": 1.8124209988187e-05, + "loss": 0.6393, + "step": 5727 + }, + { + "epoch": 0.2, + "learning_rate": 1.812357505424488e-05, + "loss": 0.5963, + "step": 5728 + }, + { + "epoch": 0.2, + "learning_rate": 1.8122940023987504e-05, + "loss": 0.6992, + "step": 5729 + }, + { + "epoch": 0.2, + "learning_rate": 1.8122304897422397e-05, + "loss": 0.6667, + "step": 5730 + }, + { + "epoch": 0.2, + "learning_rate": 1.812166967455709e-05, + "loss": 0.6285, + "step": 5731 + }, + { + "epoch": 0.2, + "learning_rate": 1.812103435539912e-05, + "loss": 0.6022, + "step": 5732 + }, + { + "epoch": 0.2, + "learning_rate": 1.812039893995601e-05, + "loss": 0.6563, + "step": 5733 + }, + { + "epoch": 0.2, + "learning_rate": 1.81197634282353e-05, + "loss": 0.6084, + "step": 5734 + }, + { + "epoch": 0.2, + "learning_rate": 1.8119127820244522e-05, + "loss": 0.633, + "step": 5735 + }, + { + "epoch": 0.2, + "learning_rate": 1.8118492115991212e-05, + "loss": 0.6605, + "step": 5736 + }, + { + "epoch": 0.2, + "learning_rate": 1.811785631548291e-05, + "loss": 0.6291, + "step": 5737 + }, + { + "epoch": 0.2, + "learning_rate": 1.8117220418727154e-05, + "loss": 0.5887, + "step": 5738 + }, + { + "epoch": 0.2, + "learning_rate": 1.8116584425731477e-05, + "loss": 0.6236, + "step": 5739 + }, + { + "epoch": 0.2, + "learning_rate": 1.8115948336503427e-05, + "loss": 0.6938, + "step": 5740 + }, + { + "epoch": 0.2, + "learning_rate": 1.811531215105054e-05, + "loss": 0.6681, + "step": 5741 + }, + { + "epoch": 0.2, + "learning_rate": 1.8114675869380366e-05, + "loss": 0.6302, + "step": 5742 + }, + { + "epoch": 0.2, + "learning_rate": 1.8114039491500442e-05, + "loss": 0.6404, + "step": 5743 + }, + { + "epoch": 0.2, + "learning_rate": 1.8113403017418318e-05, + "loss": 0.6375, + "step": 5744 + }, + { + "epoch": 0.2, + "learning_rate": 1.811276644714153e-05, + "loss": 0.6292, + "step": 5745 + }, + { + "epoch": 0.2, + "learning_rate": 1.811212978067764e-05, + "loss": 0.6025, + "step": 5746 + }, + { + "epoch": 0.2, + "learning_rate": 1.8111493018034187e-05, + "loss": 0.6345, + "step": 5747 + }, + { + "epoch": 0.2, + "learning_rate": 1.8110856159218727e-05, + "loss": 0.6681, + "step": 5748 + }, + { + "epoch": 0.2, + "learning_rate": 1.8110219204238804e-05, + "loss": 0.6284, + "step": 5749 + }, + { + "epoch": 0.2, + "learning_rate": 1.8109582153101972e-05, + "loss": 0.7254, + "step": 5750 + }, + { + "epoch": 0.2, + "learning_rate": 1.8108945005815784e-05, + "loss": 0.6527, + "step": 5751 + }, + { + "epoch": 0.2, + "learning_rate": 1.81083077623878e-05, + "loss": 0.6655, + "step": 5752 + }, + { + "epoch": 0.2, + "learning_rate": 1.8107670422825567e-05, + "loss": 0.6253, + "step": 5753 + }, + { + "epoch": 0.2, + "learning_rate": 1.8107032987136644e-05, + "loss": 0.5821, + "step": 5754 + }, + { + "epoch": 0.2, + "learning_rate": 1.810639545532859e-05, + "loss": 0.5844, + "step": 5755 + }, + { + "epoch": 0.2, + "learning_rate": 1.8105757827408964e-05, + "loss": 0.644, + "step": 5756 + }, + { + "epoch": 0.2, + "learning_rate": 1.8105120103385327e-05, + "loss": 0.5669, + "step": 5757 + }, + { + "epoch": 0.2, + "learning_rate": 1.8104482283265236e-05, + "loss": 0.6485, + "step": 5758 + }, + { + "epoch": 0.2, + "learning_rate": 1.8103844367056257e-05, + "loss": 0.6757, + "step": 5759 + }, + { + "epoch": 0.2, + "learning_rate": 1.8103206354765946e-05, + "loss": 0.6231, + "step": 5760 + }, + { + "epoch": 0.2, + "learning_rate": 1.810256824640188e-05, + "loss": 0.6973, + "step": 5761 + }, + { + "epoch": 0.2, + "learning_rate": 1.8101930041971613e-05, + "loss": 0.6406, + "step": 5762 + }, + { + "epoch": 0.2, + "learning_rate": 1.810129174148272e-05, + "loss": 0.6171, + "step": 5763 + }, + { + "epoch": 0.2, + "learning_rate": 1.8100653344942762e-05, + "loss": 0.5669, + "step": 5764 + }, + { + "epoch": 0.2, + "learning_rate": 1.8100014852359312e-05, + "loss": 0.6671, + "step": 5765 + }, + { + "epoch": 0.2, + "learning_rate": 1.809937626373994e-05, + "loss": 0.6568, + "step": 5766 + }, + { + "epoch": 0.2, + "learning_rate": 1.809873757909222e-05, + "loss": 0.6303, + "step": 5767 + }, + { + "epoch": 0.2, + "learning_rate": 1.8098098798423715e-05, + "loss": 0.6279, + "step": 5768 + }, + { + "epoch": 0.2, + "learning_rate": 1.8097459921742007e-05, + "loss": 0.5785, + "step": 5769 + }, + { + "epoch": 0.2, + "learning_rate": 1.8096820949054668e-05, + "loss": 0.6485, + "step": 5770 + }, + { + "epoch": 0.2, + "learning_rate": 1.8096181880369273e-05, + "loss": 0.6257, + "step": 5771 + }, + { + "epoch": 0.2, + "learning_rate": 1.8095542715693402e-05, + "loss": 0.629, + "step": 5772 + }, + { + "epoch": 0.2, + "eval_loss": 0.580484926700592, + "eval_runtime": 4925.8584, + "eval_samples_per_second": 111.989, + "eval_steps_per_second": 37.33, + "step": 5772 + }, + { + "epoch": 0.2, + "learning_rate": 1.8094903455034634e-05, + "loss": 0.6303, + "step": 5773 + }, + { + "epoch": 0.2, + "learning_rate": 1.809426409840054e-05, + "loss": 0.6349, + "step": 5774 + }, + { + "epoch": 0.2, + "learning_rate": 1.809362464579871e-05, + "loss": 0.6056, + "step": 5775 + }, + { + "epoch": 0.2, + "learning_rate": 1.809298509723672e-05, + "loss": 0.6424, + "step": 5776 + }, + { + "epoch": 0.2, + "learning_rate": 1.8092345452722152e-05, + "loss": 0.6212, + "step": 5777 + }, + { + "epoch": 0.2, + "learning_rate": 1.8091705712262594e-05, + "loss": 0.6177, + "step": 5778 + }, + { + "epoch": 0.2, + "learning_rate": 1.809106587586563e-05, + "loss": 0.6557, + "step": 5779 + }, + { + "epoch": 0.2, + "learning_rate": 1.809042594353884e-05, + "loss": 0.6419, + "step": 5780 + }, + { + "epoch": 0.2, + "learning_rate": 1.808978591528982e-05, + "loss": 0.652, + "step": 5781 + }, + { + "epoch": 0.2, + "learning_rate": 1.8089145791126156e-05, + "loss": 0.5965, + "step": 5782 + }, + { + "epoch": 0.2, + "learning_rate": 1.808850557105543e-05, + "loss": 0.5975, + "step": 5783 + }, + { + "epoch": 0.2, + "learning_rate": 1.808786525508524e-05, + "loss": 0.6019, + "step": 5784 + }, + { + "epoch": 0.2, + "learning_rate": 1.808722484322318e-05, + "loss": 0.6316, + "step": 5785 + }, + { + "epoch": 0.2, + "learning_rate": 1.8086584335476835e-05, + "loss": 0.6188, + "step": 5786 + }, + { + "epoch": 0.2, + "learning_rate": 1.8085943731853807e-05, + "loss": 0.6465, + "step": 5787 + }, + { + "epoch": 0.2, + "learning_rate": 1.8085303032361686e-05, + "loss": 0.6494, + "step": 5788 + }, + { + "epoch": 0.2, + "learning_rate": 1.8084662237008065e-05, + "loss": 0.6187, + "step": 5789 + }, + { + "epoch": 0.2, + "learning_rate": 1.808402134580055e-05, + "loss": 0.6777, + "step": 5790 + }, + { + "epoch": 0.2, + "learning_rate": 1.8083380358746736e-05, + "loss": 0.592, + "step": 5791 + }, + { + "epoch": 0.2, + "learning_rate": 1.808273927585422e-05, + "loss": 0.675, + "step": 5792 + }, + { + "epoch": 0.2, + "learning_rate": 1.808209809713061e-05, + "loss": 0.6473, + "step": 5793 + }, + { + "epoch": 0.2, + "learning_rate": 1.80814568225835e-05, + "loss": 0.6049, + "step": 5794 + }, + { + "epoch": 0.2, + "learning_rate": 1.8080815452220495e-05, + "loss": 0.6355, + "step": 5795 + }, + { + "epoch": 0.2, + "learning_rate": 1.8080173986049204e-05, + "loss": 0.6665, + "step": 5796 + }, + { + "epoch": 0.2, + "learning_rate": 1.8079532424077222e-05, + "loss": 0.6552, + "step": 5797 + }, + { + "epoch": 0.2, + "learning_rate": 1.807889076631217e-05, + "loss": 0.5823, + "step": 5798 + }, + { + "epoch": 0.2, + "learning_rate": 1.8078249012761646e-05, + "loss": 0.6406, + "step": 5799 + }, + { + "epoch": 0.2, + "learning_rate": 1.807760716343326e-05, + "loss": 0.5953, + "step": 5800 + }, + { + "epoch": 0.2, + "learning_rate": 1.8076965218334622e-05, + "loss": 0.6558, + "step": 5801 + }, + { + "epoch": 0.2, + "learning_rate": 1.8076323177473346e-05, + "loss": 0.6123, + "step": 5802 + }, + { + "epoch": 0.2, + "learning_rate": 1.807568104085704e-05, + "loss": 0.6494, + "step": 5803 + }, + { + "epoch": 0.2, + "learning_rate": 1.807503880849332e-05, + "loss": 0.6335, + "step": 5804 + }, + { + "epoch": 0.2, + "learning_rate": 1.80743964803898e-05, + "loss": 0.6866, + "step": 5805 + }, + { + "epoch": 0.2, + "learning_rate": 1.8073754056554097e-05, + "loss": 0.652, + "step": 5806 + }, + { + "epoch": 0.2, + "learning_rate": 1.8073111536993825e-05, + "loss": 0.6657, + "step": 5807 + }, + { + "epoch": 0.2, + "learning_rate": 1.8072468921716604e-05, + "loss": 0.675, + "step": 5808 + }, + { + "epoch": 0.2, + "learning_rate": 1.8071826210730054e-05, + "loss": 0.6383, + "step": 5809 + }, + { + "epoch": 0.2, + "learning_rate": 1.8071183404041788e-05, + "loss": 0.6181, + "step": 5810 + }, + { + "epoch": 0.2, + "learning_rate": 1.8070540501659436e-05, + "loss": 0.6427, + "step": 5811 + }, + { + "epoch": 0.2, + "learning_rate": 1.8069897503590618e-05, + "loss": 0.6114, + "step": 5812 + }, + { + "epoch": 0.2, + "learning_rate": 1.8069254409842957e-05, + "loss": 0.6551, + "step": 5813 + }, + { + "epoch": 0.2, + "learning_rate": 1.8068611220424074e-05, + "loss": 0.6589, + "step": 5814 + }, + { + "epoch": 0.2, + "learning_rate": 1.80679679353416e-05, + "loss": 0.6764, + "step": 5815 + }, + { + "epoch": 0.2, + "learning_rate": 1.8067324554603162e-05, + "loss": 0.6316, + "step": 5816 + }, + { + "epoch": 0.2, + "learning_rate": 1.806668107821638e-05, + "loss": 0.6187, + "step": 5817 + }, + { + "epoch": 0.2, + "learning_rate": 1.8066037506188896e-05, + "loss": 0.6209, + "step": 5818 + }, + { + "epoch": 0.2, + "learning_rate": 1.8065393838528332e-05, + "loss": 0.6849, + "step": 5819 + }, + { + "epoch": 0.2, + "learning_rate": 1.806475007524232e-05, + "loss": 0.6178, + "step": 5820 + }, + { + "epoch": 0.2, + "learning_rate": 1.8064106216338495e-05, + "loss": 0.6413, + "step": 5821 + }, + { + "epoch": 0.2, + "learning_rate": 1.8063462261824488e-05, + "loss": 0.6736, + "step": 5822 + }, + { + "epoch": 0.2, + "learning_rate": 1.8062818211707935e-05, + "loss": 0.6468, + "step": 5823 + }, + { + "epoch": 0.2, + "learning_rate": 1.8062174065996477e-05, + "loss": 0.6868, + "step": 5824 + }, + { + "epoch": 0.2, + "learning_rate": 1.806152982469774e-05, + "loss": 0.647, + "step": 5825 + }, + { + "epoch": 0.2, + "learning_rate": 1.8060885487819374e-05, + "loss": 0.5567, + "step": 5826 + }, + { + "epoch": 0.2, + "learning_rate": 1.8060241055369015e-05, + "loss": 0.6259, + "step": 5827 + }, + { + "epoch": 0.2, + "learning_rate": 1.8059596527354298e-05, + "loss": 0.6644, + "step": 5828 + }, + { + "epoch": 0.2, + "learning_rate": 1.805895190378287e-05, + "loss": 0.6277, + "step": 5829 + }, + { + "epoch": 0.2, + "learning_rate": 1.8058307184662377e-05, + "loss": 0.6441, + "step": 5830 + }, + { + "epoch": 0.2, + "learning_rate": 1.8057662370000452e-05, + "loss": 0.6719, + "step": 5831 + }, + { + "epoch": 0.2, + "learning_rate": 1.8057017459804747e-05, + "loss": 0.6236, + "step": 5832 + }, + { + "epoch": 0.2, + "learning_rate": 1.805637245408291e-05, + "loss": 0.6351, + "step": 5833 + }, + { + "epoch": 0.2, + "learning_rate": 1.8055727352842587e-05, + "loss": 0.6931, + "step": 5834 + }, + { + "epoch": 0.2, + "learning_rate": 1.8055082156091425e-05, + "loss": 0.5984, + "step": 5835 + }, + { + "epoch": 0.2, + "learning_rate": 1.8054436863837074e-05, + "loss": 0.6663, + "step": 5836 + }, + { + "epoch": 0.2, + "learning_rate": 1.8053791476087186e-05, + "loss": 0.6301, + "step": 5837 + }, + { + "epoch": 0.2, + "learning_rate": 1.805314599284941e-05, + "loss": 0.6531, + "step": 5838 + }, + { + "epoch": 0.2, + "learning_rate": 1.8052500414131403e-05, + "loss": 0.5841, + "step": 5839 + }, + { + "epoch": 0.2, + "learning_rate": 1.8051854739940817e-05, + "loss": 0.649, + "step": 5840 + }, + { + "epoch": 0.2, + "learning_rate": 1.8051208970285304e-05, + "loss": 0.676, + "step": 5841 + }, + { + "epoch": 0.2, + "learning_rate": 1.805056310517253e-05, + "loss": 0.6285, + "step": 5842 + }, + { + "epoch": 0.2, + "learning_rate": 1.8049917144610138e-05, + "loss": 0.6587, + "step": 5843 + }, + { + "epoch": 0.2, + "learning_rate": 1.8049271088605803e-05, + "loss": 0.6402, + "step": 5844 + }, + { + "epoch": 0.2, + "learning_rate": 1.8048624937167174e-05, + "loss": 0.6738, + "step": 5845 + }, + { + "epoch": 0.2, + "learning_rate": 1.804797869030191e-05, + "loss": 0.6242, + "step": 5846 + }, + { + "epoch": 0.2, + "learning_rate": 1.8047332348017686e-05, + "loss": 0.6853, + "step": 5847 + }, + { + "epoch": 0.2, + "learning_rate": 1.804668591032215e-05, + "loss": 0.6479, + "step": 5848 + }, + { + "epoch": 0.2, + "learning_rate": 1.804603937722298e-05, + "loss": 0.6085, + "step": 5849 + }, + { + "epoch": 0.2, + "learning_rate": 1.804539274872783e-05, + "loss": 0.5331, + "step": 5850 + }, + { + "epoch": 0.2, + "learning_rate": 1.8044746024844374e-05, + "loss": 0.6677, + "step": 5851 + }, + { + "epoch": 0.2, + "learning_rate": 1.8044099205580276e-05, + "loss": 0.6521, + "step": 5852 + }, + { + "epoch": 0.2, + "learning_rate": 1.8043452290943206e-05, + "loss": 0.6397, + "step": 5853 + }, + { + "epoch": 0.2, + "learning_rate": 1.8042805280940835e-05, + "loss": 0.6639, + "step": 5854 + }, + { + "epoch": 0.2, + "learning_rate": 1.8042158175580833e-05, + "loss": 0.6779, + "step": 5855 + }, + { + "epoch": 0.2, + "learning_rate": 1.8041510974870874e-05, + "loss": 0.612, + "step": 5856 + }, + { + "epoch": 0.2, + "learning_rate": 1.804086367881863e-05, + "loss": 0.6291, + "step": 5857 + }, + { + "epoch": 0.2, + "learning_rate": 1.804021628743177e-05, + "loss": 0.6329, + "step": 5858 + }, + { + "epoch": 0.2, + "learning_rate": 1.8039568800717977e-05, + "loss": 0.6307, + "step": 5859 + }, + { + "epoch": 0.2, + "learning_rate": 1.8038921218684932e-05, + "loss": 0.6249, + "step": 5860 + }, + { + "epoch": 0.2, + "learning_rate": 1.8038273541340297e-05, + "loss": 0.6098, + "step": 5861 + }, + { + "epoch": 0.2, + "learning_rate": 1.8037625768691768e-05, + "loss": 0.6316, + "step": 5862 + }, + { + "epoch": 0.2, + "learning_rate": 1.8036977900747014e-05, + "loss": 0.6839, + "step": 5863 + }, + { + "epoch": 0.2, + "learning_rate": 1.8036329937513723e-05, + "loss": 0.5936, + "step": 5864 + }, + { + "epoch": 0.2, + "learning_rate": 1.8035681878999573e-05, + "loss": 0.6425, + "step": 5865 + }, + { + "epoch": 0.2, + "learning_rate": 1.8035033725212248e-05, + "loss": 0.6753, + "step": 5866 + }, + { + "epoch": 0.2, + "learning_rate": 1.8034385476159436e-05, + "loss": 0.6094, + "step": 5867 + }, + { + "epoch": 0.2, + "learning_rate": 1.8033737131848818e-05, + "loss": 0.588, + "step": 5868 + }, + { + "epoch": 0.2, + "learning_rate": 1.8033088692288084e-05, + "loss": 0.6909, + "step": 5869 + }, + { + "epoch": 0.2, + "learning_rate": 1.8032440157484926e-05, + "loss": 0.6004, + "step": 5870 + }, + { + "epoch": 0.2, + "learning_rate": 1.8031791527447024e-05, + "loss": 0.6062, + "step": 5871 + }, + { + "epoch": 0.2, + "learning_rate": 1.8031142802182074e-05, + "loss": 0.6192, + "step": 5872 + }, + { + "epoch": 0.2, + "learning_rate": 1.803049398169777e-05, + "loss": 0.6976, + "step": 5873 + }, + { + "epoch": 0.2, + "learning_rate": 1.8029845066001798e-05, + "loss": 0.6532, + "step": 5874 + }, + { + "epoch": 0.2, + "learning_rate": 1.8029196055101857e-05, + "loss": 0.6215, + "step": 5875 + }, + { + "epoch": 0.2, + "learning_rate": 1.802854694900564e-05, + "loss": 0.6501, + "step": 5876 + }, + { + "epoch": 0.2, + "learning_rate": 1.8027897747720837e-05, + "loss": 0.6465, + "step": 5877 + }, + { + "epoch": 0.2, + "learning_rate": 1.8027248451255156e-05, + "loss": 0.6206, + "step": 5878 + }, + { + "epoch": 0.2, + "learning_rate": 1.802659905961629e-05, + "loss": 0.6583, + "step": 5879 + }, + { + "epoch": 0.2, + "learning_rate": 1.802594957281194e-05, + "loss": 0.6112, + "step": 5880 + }, + { + "epoch": 0.2, + "learning_rate": 1.80252999908498e-05, + "loss": 0.6552, + "step": 5881 + }, + { + "epoch": 0.2, + "learning_rate": 1.802465031373758e-05, + "loss": 0.6148, + "step": 5882 + }, + { + "epoch": 0.2, + "learning_rate": 1.8024000541482978e-05, + "loss": 0.6512, + "step": 5883 + }, + { + "epoch": 0.2, + "learning_rate": 1.80233506740937e-05, + "loss": 0.6459, + "step": 5884 + }, + { + "epoch": 0.2, + "learning_rate": 1.8022700711577447e-05, + "loss": 0.6096, + "step": 5885 + }, + { + "epoch": 0.2, + "learning_rate": 1.8022050653941932e-05, + "loss": 0.6018, + "step": 5886 + }, + { + "epoch": 0.2, + "learning_rate": 1.802140050119486e-05, + "loss": 0.6165, + "step": 5887 + }, + { + "epoch": 0.2, + "learning_rate": 1.802075025334393e-05, + "loss": 0.6897, + "step": 5888 + }, + { + "epoch": 0.2, + "learning_rate": 1.8020099910396867e-05, + "loss": 0.6179, + "step": 5889 + }, + { + "epoch": 0.2, + "learning_rate": 1.8019449472361374e-05, + "loss": 0.626, + "step": 5890 + }, + { + "epoch": 0.2, + "learning_rate": 1.801879893924516e-05, + "loss": 0.6289, + "step": 5891 + }, + { + "epoch": 0.2, + "learning_rate": 1.8018148311055944e-05, + "loss": 0.6233, + "step": 5892 + }, + { + "epoch": 0.2, + "learning_rate": 1.8017497587801434e-05, + "loss": 0.6527, + "step": 5893 + }, + { + "epoch": 0.2, + "learning_rate": 1.8016846769489347e-05, + "loss": 0.6625, + "step": 5894 + }, + { + "epoch": 0.2, + "learning_rate": 1.8016195856127403e-05, + "loss": 0.6024, + "step": 5895 + }, + { + "epoch": 0.2, + "learning_rate": 1.8015544847723314e-05, + "loss": 0.6915, + "step": 5896 + }, + { + "epoch": 0.2, + "learning_rate": 1.80148937442848e-05, + "loss": 0.6812, + "step": 5897 + }, + { + "epoch": 0.2, + "learning_rate": 1.8014242545819587e-05, + "loss": 0.6524, + "step": 5898 + }, + { + "epoch": 0.2, + "learning_rate": 1.8013591252335386e-05, + "loss": 0.6321, + "step": 5899 + }, + { + "epoch": 0.2, + "learning_rate": 1.8012939863839926e-05, + "loss": 0.6187, + "step": 5900 + }, + { + "epoch": 0.2, + "learning_rate": 1.8012288380340925e-05, + "loss": 0.6792, + "step": 5901 + }, + { + "epoch": 0.2, + "learning_rate": 1.8011636801846112e-05, + "loss": 0.61, + "step": 5902 + }, + { + "epoch": 0.2, + "learning_rate": 1.801098512836321e-05, + "loss": 0.6305, + "step": 5903 + }, + { + "epoch": 0.2, + "learning_rate": 1.8010333359899945e-05, + "loss": 0.6004, + "step": 5904 + }, + { + "epoch": 0.2, + "learning_rate": 1.8009681496464045e-05, + "loss": 0.6494, + "step": 5905 + }, + { + "epoch": 0.2, + "learning_rate": 1.8009029538063235e-05, + "loss": 0.647, + "step": 5906 + }, + { + "epoch": 0.2, + "learning_rate": 1.8008377484705252e-05, + "loss": 0.6361, + "step": 5907 + }, + { + "epoch": 0.2, + "learning_rate": 1.8007725336397823e-05, + "loss": 0.6355, + "step": 5908 + }, + { + "epoch": 0.2, + "learning_rate": 1.8007073093148683e-05, + "loss": 0.6973, + "step": 5909 + }, + { + "epoch": 0.2, + "learning_rate": 1.8006420754965557e-05, + "loss": 0.6393, + "step": 5910 + }, + { + "epoch": 0.2, + "learning_rate": 1.8005768321856188e-05, + "loss": 0.6004, + "step": 5911 + }, + { + "epoch": 0.2, + "learning_rate": 1.8005115793828307e-05, + "loss": 0.6088, + "step": 5912 + }, + { + "epoch": 0.2, + "learning_rate": 1.800446317088965e-05, + "loss": 0.6198, + "step": 5913 + }, + { + "epoch": 0.2, + "learning_rate": 1.8003810453047958e-05, + "loss": 0.634, + "step": 5914 + }, + { + "epoch": 0.2, + "learning_rate": 1.800315764031097e-05, + "loss": 0.6331, + "step": 5915 + }, + { + "epoch": 0.2, + "learning_rate": 1.8002504732686423e-05, + "loss": 0.66, + "step": 5916 + }, + { + "epoch": 0.21, + "learning_rate": 1.800185173018206e-05, + "loss": 0.6476, + "step": 5917 + }, + { + "epoch": 0.21, + "learning_rate": 1.8001198632805617e-05, + "loss": 0.5753, + "step": 5918 + }, + { + "epoch": 0.21, + "learning_rate": 1.800054544056485e-05, + "loss": 0.5939, + "step": 5919 + }, + { + "epoch": 0.21, + "learning_rate": 1.799989215346749e-05, + "loss": 0.6588, + "step": 5920 + }, + { + "epoch": 0.21, + "learning_rate": 1.7999238771521294e-05, + "loss": 0.6462, + "step": 5921 + }, + { + "epoch": 0.21, + "learning_rate": 1.7998585294733997e-05, + "loss": 0.6502, + "step": 5922 + }, + { + "epoch": 0.21, + "learning_rate": 1.799793172311336e-05, + "loss": 0.668, + "step": 5923 + }, + { + "epoch": 0.21, + "learning_rate": 1.7997278056667122e-05, + "loss": 0.5748, + "step": 5924 + }, + { + "epoch": 0.21, + "learning_rate": 1.7996624295403037e-05, + "loss": 0.6025, + "step": 5925 + }, + { + "epoch": 0.21, + "learning_rate": 1.7995970439328854e-05, + "loss": 0.6748, + "step": 5926 + }, + { + "epoch": 0.21, + "learning_rate": 1.7995316488452324e-05, + "loss": 0.6589, + "step": 5927 + }, + { + "epoch": 0.21, + "learning_rate": 1.7994662442781206e-05, + "loss": 0.6584, + "step": 5928 + }, + { + "epoch": 0.21, + "learning_rate": 1.7994008302323253e-05, + "loss": 0.5808, + "step": 5929 + }, + { + "epoch": 0.21, + "learning_rate": 1.7993354067086216e-05, + "loss": 0.6148, + "step": 5930 + }, + { + "epoch": 0.21, + "learning_rate": 1.7992699737077857e-05, + "loss": 0.6087, + "step": 5931 + }, + { + "epoch": 0.21, + "learning_rate": 1.799204531230593e-05, + "loss": 0.6354, + "step": 5932 + }, + { + "epoch": 0.21, + "learning_rate": 1.7991390792778198e-05, + "loss": 0.5697, + "step": 5933 + }, + { + "epoch": 0.21, + "learning_rate": 1.7990736178502418e-05, + "loss": 0.602, + "step": 5934 + }, + { + "epoch": 0.21, + "learning_rate": 1.7990081469486348e-05, + "loss": 0.6029, + "step": 5935 + }, + { + "epoch": 0.21, + "learning_rate": 1.798942666573776e-05, + "loss": 0.6255, + "step": 5936 + }, + { + "epoch": 0.21, + "learning_rate": 1.7988771767264413e-05, + "loss": 0.6387, + "step": 5937 + }, + { + "epoch": 0.21, + "learning_rate": 1.7988116774074068e-05, + "loss": 0.6293, + "step": 5938 + }, + { + "epoch": 0.21, + "learning_rate": 1.7987461686174496e-05, + "loss": 0.6464, + "step": 5939 + }, + { + "epoch": 0.21, + "learning_rate": 1.798680650357346e-05, + "loss": 0.5912, + "step": 5940 + }, + { + "epoch": 0.21, + "learning_rate": 1.7986151226278726e-05, + "loss": 0.6229, + "step": 5941 + }, + { + "epoch": 0.21, + "learning_rate": 1.798549585429807e-05, + "loss": 0.6987, + "step": 5942 + }, + { + "epoch": 0.21, + "learning_rate": 1.798484038763926e-05, + "loss": 0.6536, + "step": 5943 + }, + { + "epoch": 0.21, + "learning_rate": 1.7984184826310062e-05, + "loss": 0.5952, + "step": 5944 + }, + { + "epoch": 0.21, + "learning_rate": 1.798352917031826e-05, + "loss": 0.6453, + "step": 5945 + }, + { + "epoch": 0.21, + "learning_rate": 1.7982873419671615e-05, + "loss": 0.5765, + "step": 5946 + }, + { + "epoch": 0.21, + "learning_rate": 1.7982217574377905e-05, + "loss": 0.6254, + "step": 5947 + }, + { + "epoch": 0.21, + "learning_rate": 1.7981561634444914e-05, + "loss": 0.6603, + "step": 5948 + }, + { + "epoch": 0.21, + "learning_rate": 1.7980905599880412e-05, + "loss": 0.6411, + "step": 5949 + }, + { + "epoch": 0.21, + "learning_rate": 1.798024947069218e-05, + "loss": 0.6461, + "step": 5950 + }, + { + "epoch": 0.21, + "learning_rate": 1.797959324688799e-05, + "loss": 0.603, + "step": 5951 + }, + { + "epoch": 0.21, + "learning_rate": 1.797893692847563e-05, + "loss": 0.6164, + "step": 5952 + }, + { + "epoch": 0.21, + "learning_rate": 1.7978280515462878e-05, + "loss": 0.6803, + "step": 5953 + }, + { + "epoch": 0.21, + "learning_rate": 1.7977624007857523e-05, + "loss": 0.6689, + "step": 5954 + }, + { + "epoch": 0.21, + "learning_rate": 1.797696740566734e-05, + "loss": 0.6412, + "step": 5955 + }, + { + "epoch": 0.21, + "learning_rate": 1.7976310708900115e-05, + "loss": 0.6871, + "step": 5956 + }, + { + "epoch": 0.21, + "learning_rate": 1.797565391756364e-05, + "loss": 0.6548, + "step": 5957 + }, + { + "epoch": 0.21, + "learning_rate": 1.7974997031665698e-05, + "loss": 0.6671, + "step": 5958 + }, + { + "epoch": 0.21, + "learning_rate": 1.797434005121408e-05, + "loss": 0.5975, + "step": 5959 + }, + { + "epoch": 0.21, + "learning_rate": 1.797368297621657e-05, + "loss": 0.622, + "step": 5960 + }, + { + "epoch": 0.21, + "learning_rate": 1.7973025806680962e-05, + "loss": 0.606, + "step": 5961 + }, + { + "epoch": 0.21, + "learning_rate": 1.7972368542615046e-05, + "loss": 0.6799, + "step": 5962 + }, + { + "epoch": 0.21, + "learning_rate": 1.7971711184026618e-05, + "loss": 0.6124, + "step": 5963 + }, + { + "epoch": 0.21, + "learning_rate": 1.7971053730923466e-05, + "loss": 0.6949, + "step": 5964 + }, + { + "epoch": 0.21, + "learning_rate": 1.7970396183313396e-05, + "loss": 0.6079, + "step": 5965 + }, + { + "epoch": 0.21, + "learning_rate": 1.796973854120419e-05, + "loss": 0.6227, + "step": 5966 + }, + { + "epoch": 0.21, + "learning_rate": 1.7969080804603653e-05, + "loss": 0.6879, + "step": 5967 + }, + { + "epoch": 0.21, + "learning_rate": 1.7968422973519584e-05, + "loss": 0.6429, + "step": 5968 + }, + { + "epoch": 0.21, + "learning_rate": 1.796776504795978e-05, + "loss": 0.6307, + "step": 5969 + }, + { + "epoch": 0.21, + "learning_rate": 1.796710702793204e-05, + "loss": 0.5842, + "step": 5970 + }, + { + "epoch": 0.21, + "learning_rate": 1.796644891344417e-05, + "loss": 0.5808, + "step": 5971 + }, + { + "epoch": 0.21, + "learning_rate": 1.796579070450397e-05, + "loss": 0.6307, + "step": 5972 + }, + { + "epoch": 0.21, + "learning_rate": 1.796513240111924e-05, + "loss": 0.6474, + "step": 5973 + }, + { + "epoch": 0.21, + "learning_rate": 1.7964474003297797e-05, + "loss": 0.6618, + "step": 5974 + }, + { + "epoch": 0.21, + "learning_rate": 1.7963815511047435e-05, + "loss": 0.6607, + "step": 5975 + }, + { + "epoch": 0.21, + "learning_rate": 1.796315692437597e-05, + "loss": 0.6114, + "step": 5976 + }, + { + "epoch": 0.21, + "learning_rate": 1.79624982432912e-05, + "loss": 0.5861, + "step": 5977 + }, + { + "epoch": 0.21, + "learning_rate": 1.7961839467800947e-05, + "loss": 0.7041, + "step": 5978 + }, + { + "epoch": 0.21, + "learning_rate": 1.7961180597913014e-05, + "loss": 0.5995, + "step": 5979 + }, + { + "epoch": 0.21, + "learning_rate": 1.796052163363521e-05, + "loss": 0.644, + "step": 5980 + }, + { + "epoch": 0.21, + "learning_rate": 1.7959862574975356e-05, + "loss": 0.6936, + "step": 5981 + }, + { + "epoch": 0.21, + "learning_rate": 1.7959203421941257e-05, + "loss": 0.6726, + "step": 5982 + }, + { + "epoch": 0.21, + "learning_rate": 1.795854417454074e-05, + "loss": 0.6409, + "step": 5983 + }, + { + "epoch": 0.21, + "learning_rate": 1.7957884832781607e-05, + "loss": 0.6081, + "step": 5984 + }, + { + "epoch": 0.21, + "learning_rate": 1.7957225396671685e-05, + "loss": 0.7048, + "step": 5985 + }, + { + "epoch": 0.21, + "learning_rate": 1.7956565866218793e-05, + "loss": 0.6027, + "step": 5986 + }, + { + "epoch": 0.21, + "learning_rate": 1.7955906241430745e-05, + "loss": 0.5902, + "step": 5987 + }, + { + "epoch": 0.21, + "learning_rate": 1.7955246522315365e-05, + "loss": 0.6269, + "step": 5988 + }, + { + "epoch": 0.21, + "learning_rate": 1.7954586708880475e-05, + "loss": 0.6093, + "step": 5989 + }, + { + "epoch": 0.21, + "learning_rate": 1.7953926801133894e-05, + "loss": 0.5901, + "step": 5990 + }, + { + "epoch": 0.21, + "learning_rate": 1.7953266799083452e-05, + "loss": 0.6239, + "step": 5991 + }, + { + "epoch": 0.21, + "learning_rate": 1.795260670273697e-05, + "loss": 0.6087, + "step": 5992 + }, + { + "epoch": 0.21, + "learning_rate": 1.7951946512102275e-05, + "loss": 0.6619, + "step": 5993 + }, + { + "epoch": 0.21, + "learning_rate": 1.7951286227187193e-05, + "loss": 0.6683, + "step": 5994 + }, + { + "epoch": 0.21, + "learning_rate": 1.795062584799956e-05, + "loss": 0.6281, + "step": 5995 + }, + { + "epoch": 0.21, + "learning_rate": 1.7949965374547195e-05, + "loss": 0.6256, + "step": 5996 + }, + { + "epoch": 0.21, + "learning_rate": 1.7949304806837936e-05, + "loss": 0.678, + "step": 5997 + }, + { + "epoch": 0.21, + "learning_rate": 1.794864414487961e-05, + "loss": 0.6704, + "step": 5998 + }, + { + "epoch": 0.21, + "learning_rate": 1.7947983388680053e-05, + "loss": 0.6584, + "step": 5999 + }, + { + "epoch": 0.21, + "learning_rate": 1.7947322538247104e-05, + "loss": 0.6378, + "step": 6000 + }, + { + "epoch": 0.21, + "learning_rate": 1.7946661593588586e-05, + "loss": 0.6467, + "step": 6001 + }, + { + "epoch": 0.21, + "learning_rate": 1.7946000554712347e-05, + "loss": 0.6209, + "step": 6002 + }, + { + "epoch": 0.21, + "learning_rate": 1.7945339421626217e-05, + "loss": 0.6077, + "step": 6003 + }, + { + "epoch": 0.21, + "learning_rate": 1.794467819433804e-05, + "loss": 0.6547, + "step": 6004 + }, + { + "epoch": 0.21, + "learning_rate": 1.794401687285565e-05, + "loss": 0.6817, + "step": 6005 + }, + { + "epoch": 0.21, + "learning_rate": 1.7943355457186892e-05, + "loss": 0.6022, + "step": 6006 + }, + { + "epoch": 0.21, + "learning_rate": 1.7942693947339606e-05, + "loss": 0.62, + "step": 6007 + }, + { + "epoch": 0.21, + "learning_rate": 1.7942032343321637e-05, + "loss": 0.6712, + "step": 6008 + }, + { + "epoch": 0.21, + "learning_rate": 1.7941370645140827e-05, + "loss": 0.64, + "step": 6009 + }, + { + "epoch": 0.21, + "learning_rate": 1.794070885280502e-05, + "loss": 0.5979, + "step": 6010 + }, + { + "epoch": 0.21, + "learning_rate": 1.7940046966322068e-05, + "loss": 0.657, + "step": 6011 + }, + { + "epoch": 0.21, + "learning_rate": 1.7939384985699812e-05, + "loss": 0.6252, + "step": 6012 + }, + { + "epoch": 0.21, + "learning_rate": 1.7938722910946108e-05, + "loss": 0.6284, + "step": 6013 + }, + { + "epoch": 0.21, + "learning_rate": 1.7938060742068798e-05, + "loss": 0.6244, + "step": 6014 + }, + { + "epoch": 0.21, + "learning_rate": 1.7937398479075736e-05, + "loss": 0.6034, + "step": 6015 + }, + { + "epoch": 0.21, + "learning_rate": 1.7936736121974776e-05, + "loss": 0.6191, + "step": 6016 + }, + { + "epoch": 0.21, + "learning_rate": 1.793607367077377e-05, + "loss": 0.661, + "step": 6017 + }, + { + "epoch": 0.21, + "learning_rate": 1.7935411125480567e-05, + "loss": 0.6471, + "step": 6018 + }, + { + "epoch": 0.21, + "learning_rate": 1.7934748486103027e-05, + "loss": 0.6087, + "step": 6019 + }, + { + "epoch": 0.21, + "learning_rate": 1.7934085752649012e-05, + "loss": 0.7051, + "step": 6020 + }, + { + "epoch": 0.21, + "learning_rate": 1.793342292512637e-05, + "loss": 0.6202, + "step": 6021 + }, + { + "epoch": 0.21, + "learning_rate": 1.7932760003542965e-05, + "loss": 0.6091, + "step": 6022 + }, + { + "epoch": 0.21, + "learning_rate": 1.7932096987906652e-05, + "loss": 0.6299, + "step": 6023 + }, + { + "epoch": 0.21, + "learning_rate": 1.79314338782253e-05, + "loss": 0.6402, + "step": 6024 + }, + { + "epoch": 0.21, + "learning_rate": 1.793077067450676e-05, + "loss": 0.6261, + "step": 6025 + }, + { + "epoch": 0.21, + "learning_rate": 1.7930107376758905e-05, + "loss": 0.6514, + "step": 6026 + }, + { + "epoch": 0.21, + "learning_rate": 1.7929443984989595e-05, + "loss": 0.6106, + "step": 6027 + }, + { + "epoch": 0.21, + "learning_rate": 1.7928780499206696e-05, + "loss": 0.6187, + "step": 6028 + }, + { + "epoch": 0.21, + "learning_rate": 1.792811691941807e-05, + "loss": 0.6798, + "step": 6029 + }, + { + "epoch": 0.21, + "learning_rate": 1.7927453245631595e-05, + "loss": 0.6504, + "step": 6030 + }, + { + "epoch": 0.21, + "learning_rate": 1.792678947785513e-05, + "loss": 0.6717, + "step": 6031 + }, + { + "epoch": 0.21, + "learning_rate": 1.792612561609655e-05, + "loss": 0.5778, + "step": 6032 + }, + { + "epoch": 0.21, + "learning_rate": 1.7925461660363724e-05, + "loss": 0.6299, + "step": 6033 + }, + { + "epoch": 0.21, + "learning_rate": 1.7924797610664524e-05, + "loss": 0.6197, + "step": 6034 + }, + { + "epoch": 0.21, + "learning_rate": 1.7924133467006825e-05, + "loss": 0.5911, + "step": 6035 + }, + { + "epoch": 0.21, + "learning_rate": 1.7923469229398495e-05, + "loss": 0.6851, + "step": 6036 + }, + { + "epoch": 0.21, + "learning_rate": 1.7922804897847418e-05, + "loss": 0.5903, + "step": 6037 + }, + { + "epoch": 0.21, + "learning_rate": 1.7922140472361464e-05, + "loss": 0.6348, + "step": 6038 + }, + { + "epoch": 0.21, + "learning_rate": 1.792147595294851e-05, + "loss": 0.5905, + "step": 6039 + }, + { + "epoch": 0.21, + "learning_rate": 1.7920811339616447e-05, + "loss": 0.6915, + "step": 6040 + }, + { + "epoch": 0.21, + "learning_rate": 1.7920146632373142e-05, + "loss": 0.6434, + "step": 6041 + }, + { + "epoch": 0.21, + "learning_rate": 1.7919481831226477e-05, + "loss": 0.6245, + "step": 6042 + }, + { + "epoch": 0.21, + "learning_rate": 1.7918816936184336e-05, + "loss": 0.6414, + "step": 6043 + }, + { + "epoch": 0.21, + "learning_rate": 1.7918151947254607e-05, + "loss": 0.6844, + "step": 6044 + }, + { + "epoch": 0.21, + "learning_rate": 1.791748686444517e-05, + "loss": 0.6872, + "step": 6045 + }, + { + "epoch": 0.21, + "learning_rate": 1.7916821687763907e-05, + "loss": 0.6197, + "step": 6046 + }, + { + "epoch": 0.21, + "learning_rate": 1.7916156417218712e-05, + "loss": 0.5847, + "step": 6047 + }, + { + "epoch": 0.21, + "learning_rate": 1.7915491052817465e-05, + "loss": 0.671, + "step": 6048 + }, + { + "epoch": 0.21, + "learning_rate": 1.791482559456806e-05, + "loss": 0.6758, + "step": 6049 + }, + { + "epoch": 0.21, + "learning_rate": 1.7914160042478386e-05, + "loss": 0.6553, + "step": 6050 + }, + { + "epoch": 0.21, + "learning_rate": 1.7913494396556334e-05, + "loss": 0.6147, + "step": 6051 + }, + { + "epoch": 0.21, + "learning_rate": 1.7912828656809794e-05, + "loss": 0.6582, + "step": 6052 + }, + { + "epoch": 0.21, + "learning_rate": 1.791216282324666e-05, + "loss": 0.66, + "step": 6053 + }, + { + "epoch": 0.21, + "learning_rate": 1.7911496895874827e-05, + "loss": 0.6284, + "step": 6054 + }, + { + "epoch": 0.21, + "learning_rate": 1.791083087470219e-05, + "loss": 0.6522, + "step": 6055 + }, + { + "epoch": 0.21, + "learning_rate": 1.7910164759736646e-05, + "loss": 0.6486, + "step": 6056 + }, + { + "epoch": 0.21, + "learning_rate": 1.7909498550986092e-05, + "loss": 0.6004, + "step": 6057 + }, + { + "epoch": 0.21, + "learning_rate": 1.7908832248458427e-05, + "loss": 0.6341, + "step": 6058 + }, + { + "epoch": 0.21, + "learning_rate": 1.7908165852161552e-05, + "loss": 0.6242, + "step": 6059 + }, + { + "epoch": 0.21, + "learning_rate": 1.7907499362103364e-05, + "loss": 0.6163, + "step": 6060 + }, + { + "epoch": 0.21, + "learning_rate": 1.7906832778291772e-05, + "loss": 0.6706, + "step": 6061 + }, + { + "epoch": 0.21, + "learning_rate": 1.7906166100734676e-05, + "loss": 0.6161, + "step": 6062 + }, + { + "epoch": 0.21, + "learning_rate": 1.7905499329439977e-05, + "loss": 0.6132, + "step": 6063 + }, + { + "epoch": 0.21, + "learning_rate": 1.790483246441558e-05, + "loss": 0.6337, + "step": 6064 + }, + { + "epoch": 0.21, + "learning_rate": 1.7904165505669398e-05, + "loss": 0.6938, + "step": 6065 + }, + { + "epoch": 0.21, + "learning_rate": 1.790349845320934e-05, + "loss": 0.6556, + "step": 6066 + }, + { + "epoch": 0.21, + "learning_rate": 1.7902831307043303e-05, + "loss": 0.6465, + "step": 6067 + }, + { + "epoch": 0.21, + "learning_rate": 1.7902164067179204e-05, + "loss": 0.6381, + "step": 6068 + }, + { + "epoch": 0.21, + "learning_rate": 1.7901496733624953e-05, + "loss": 0.5602, + "step": 6069 + }, + { + "epoch": 0.21, + "learning_rate": 1.7900829306388465e-05, + "loss": 0.6365, + "step": 6070 + }, + { + "epoch": 0.21, + "learning_rate": 1.7900161785477652e-05, + "loss": 0.6503, + "step": 6071 + }, + { + "epoch": 0.21, + "learning_rate": 1.7899494170900427e-05, + "loss": 0.6849, + "step": 6072 + }, + { + "epoch": 0.21, + "learning_rate": 1.7898826462664703e-05, + "loss": 0.677, + "step": 6073 + }, + { + "epoch": 0.21, + "learning_rate": 1.78981586607784e-05, + "loss": 0.6381, + "step": 6074 + }, + { + "epoch": 0.21, + "learning_rate": 1.7897490765249438e-05, + "loss": 0.6655, + "step": 6075 + }, + { + "epoch": 0.21, + "learning_rate": 1.789682277608573e-05, + "loss": 0.6685, + "step": 6076 + }, + { + "epoch": 0.21, + "learning_rate": 1.7896154693295197e-05, + "loss": 0.6341, + "step": 6077 + }, + { + "epoch": 0.21, + "learning_rate": 1.7895486516885766e-05, + "loss": 0.6617, + "step": 6078 + }, + { + "epoch": 0.21, + "learning_rate": 1.789481824686535e-05, + "loss": 0.6477, + "step": 6079 + }, + { + "epoch": 0.21, + "learning_rate": 1.7894149883241877e-05, + "loss": 0.6438, + "step": 6080 + }, + { + "epoch": 0.21, + "learning_rate": 1.7893481426023273e-05, + "loss": 0.5927, + "step": 6081 + }, + { + "epoch": 0.21, + "learning_rate": 1.7892812875217462e-05, + "loss": 0.6468, + "step": 6082 + }, + { + "epoch": 0.21, + "learning_rate": 1.789214423083237e-05, + "loss": 0.6987, + "step": 6083 + }, + { + "epoch": 0.21, + "learning_rate": 1.7891475492875924e-05, + "loss": 0.6358, + "step": 6084 + }, + { + "epoch": 0.21, + "learning_rate": 1.789080666135605e-05, + "loss": 0.6404, + "step": 6085 + }, + { + "epoch": 0.21, + "learning_rate": 1.7890137736280687e-05, + "loss": 0.6292, + "step": 6086 + }, + { + "epoch": 0.21, + "learning_rate": 1.7889468717657753e-05, + "loss": 0.6323, + "step": 6087 + }, + { + "epoch": 0.21, + "learning_rate": 1.788879960549519e-05, + "loss": 0.6202, + "step": 6088 + }, + { + "epoch": 0.21, + "learning_rate": 1.788813039980093e-05, + "loss": 0.6311, + "step": 6089 + }, + { + "epoch": 0.21, + "learning_rate": 1.7887461100582907e-05, + "loss": 0.5722, + "step": 6090 + }, + { + "epoch": 0.21, + "learning_rate": 1.788679170784905e-05, + "loss": 0.6735, + "step": 6091 + }, + { + "epoch": 0.21, + "learning_rate": 1.7886122221607304e-05, + "loss": 0.5911, + "step": 6092 + }, + { + "epoch": 0.21, + "learning_rate": 1.7885452641865605e-05, + "loss": 0.6326, + "step": 6093 + }, + { + "epoch": 0.21, + "learning_rate": 1.7884782968631885e-05, + "loss": 0.6038, + "step": 6094 + }, + { + "epoch": 0.21, + "learning_rate": 1.788411320191409e-05, + "loss": 0.6091, + "step": 6095 + }, + { + "epoch": 0.21, + "learning_rate": 1.7883443341720162e-05, + "loss": 0.6572, + "step": 6096 + }, + { + "epoch": 0.21, + "learning_rate": 1.788277338805804e-05, + "loss": 0.6086, + "step": 6097 + }, + { + "epoch": 0.21, + "learning_rate": 1.7882103340935665e-05, + "loss": 0.6069, + "step": 6098 + }, + { + "epoch": 0.21, + "learning_rate": 1.7881433200360983e-05, + "loss": 0.6172, + "step": 6099 + }, + { + "epoch": 0.21, + "learning_rate": 1.7880762966341945e-05, + "loss": 0.6956, + "step": 6100 + }, + { + "epoch": 0.21, + "learning_rate": 1.788009263888649e-05, + "loss": 0.5686, + "step": 6101 + }, + { + "epoch": 0.21, + "learning_rate": 1.7879422218002568e-05, + "loss": 0.628, + "step": 6102 + }, + { + "epoch": 0.21, + "learning_rate": 1.787875170369813e-05, + "loss": 0.6615, + "step": 6103 + }, + { + "epoch": 0.21, + "learning_rate": 1.787808109598112e-05, + "loss": 0.6263, + "step": 6104 + }, + { + "epoch": 0.21, + "learning_rate": 1.78774103948595e-05, + "loss": 0.629, + "step": 6105 + }, + { + "epoch": 0.21, + "learning_rate": 1.787673960034121e-05, + "loss": 0.5994, + "step": 6106 + }, + { + "epoch": 0.21, + "learning_rate": 1.7876068712434207e-05, + "loss": 0.6324, + "step": 6107 + }, + { + "epoch": 0.21, + "learning_rate": 1.7875397731146446e-05, + "loss": 0.6764, + "step": 6108 + }, + { + "epoch": 0.21, + "learning_rate": 1.7874726656485887e-05, + "loss": 0.6457, + "step": 6109 + }, + { + "epoch": 0.21, + "learning_rate": 1.7874055488460478e-05, + "loss": 0.673, + "step": 6110 + }, + { + "epoch": 0.21, + "learning_rate": 1.787338422707818e-05, + "loss": 0.5814, + "step": 6111 + }, + { + "epoch": 0.21, + "learning_rate": 1.7872712872346952e-05, + "loss": 0.6448, + "step": 6112 + }, + { + "epoch": 0.21, + "learning_rate": 1.7872041424274758e-05, + "loss": 0.6421, + "step": 6113 + }, + { + "epoch": 0.21, + "learning_rate": 1.7871369882869554e-05, + "loss": 0.6754, + "step": 6114 + }, + { + "epoch": 0.21, + "learning_rate": 1.78706982481393e-05, + "loss": 0.6385, + "step": 6115 + }, + { + "epoch": 0.21, + "learning_rate": 1.787002652009196e-05, + "loss": 0.6419, + "step": 6116 + }, + { + "epoch": 0.21, + "learning_rate": 1.7869354698735506e-05, + "loss": 0.6331, + "step": 6117 + }, + { + "epoch": 0.21, + "learning_rate": 1.7868682784077892e-05, + "loss": 0.65, + "step": 6118 + }, + { + "epoch": 0.21, + "learning_rate": 1.786801077612709e-05, + "loss": 0.6352, + "step": 6119 + }, + { + "epoch": 0.21, + "learning_rate": 1.786733867489107e-05, + "loss": 0.5773, + "step": 6120 + }, + { + "epoch": 0.21, + "learning_rate": 1.7866666480377795e-05, + "loss": 0.6385, + "step": 6121 + }, + { + "epoch": 0.21, + "learning_rate": 1.786599419259524e-05, + "loss": 0.6192, + "step": 6122 + }, + { + "epoch": 0.21, + "learning_rate": 1.786532181155137e-05, + "loss": 0.667, + "step": 6123 + }, + { + "epoch": 0.21, + "learning_rate": 1.7864649337254163e-05, + "loss": 0.6562, + "step": 6124 + }, + { + "epoch": 0.21, + "learning_rate": 1.786397676971159e-05, + "loss": 0.5974, + "step": 6125 + }, + { + "epoch": 0.21, + "learning_rate": 1.786330410893162e-05, + "loss": 0.6057, + "step": 6126 + }, + { + "epoch": 0.21, + "learning_rate": 1.786263135492224e-05, + "loss": 0.5961, + "step": 6127 + }, + { + "epoch": 0.21, + "learning_rate": 1.7861958507691414e-05, + "loss": 0.639, + "step": 6128 + }, + { + "epoch": 0.21, + "learning_rate": 1.7861285567247123e-05, + "loss": 0.6695, + "step": 6129 + }, + { + "epoch": 0.21, + "learning_rate": 1.7860612533597352e-05, + "loss": 0.6303, + "step": 6130 + }, + { + "epoch": 0.21, + "learning_rate": 1.7859939406750075e-05, + "loss": 0.6925, + "step": 6131 + }, + { + "epoch": 0.21, + "learning_rate": 1.785926618671327e-05, + "loss": 0.6145, + "step": 6132 + }, + { + "epoch": 0.21, + "learning_rate": 1.785859287349492e-05, + "loss": 0.6683, + "step": 6133 + }, + { + "epoch": 0.21, + "learning_rate": 1.7857919467103016e-05, + "loss": 0.5773, + "step": 6134 + }, + { + "epoch": 0.21, + "learning_rate": 1.7857245967545534e-05, + "loss": 0.5925, + "step": 6135 + }, + { + "epoch": 0.21, + "learning_rate": 1.7856572374830464e-05, + "loss": 0.6471, + "step": 6136 + }, + { + "epoch": 0.21, + "learning_rate": 1.785589868896579e-05, + "loss": 0.6532, + "step": 6137 + }, + { + "epoch": 0.21, + "learning_rate": 1.7855224909959493e-05, + "loss": 0.6343, + "step": 6138 + }, + { + "epoch": 0.21, + "learning_rate": 1.7854551037819573e-05, + "loss": 0.6929, + "step": 6139 + }, + { + "epoch": 0.21, + "learning_rate": 1.7853877072554012e-05, + "loss": 0.626, + "step": 6140 + }, + { + "epoch": 0.21, + "learning_rate": 1.785320301417081e-05, + "loss": 0.6681, + "step": 6141 + }, + { + "epoch": 0.21, + "learning_rate": 1.7852528862677943e-05, + "loss": 0.6007, + "step": 6142 + }, + { + "epoch": 0.21, + "learning_rate": 1.7851854618083416e-05, + "loss": 0.5735, + "step": 6143 + }, + { + "epoch": 0.21, + "learning_rate": 1.785118028039522e-05, + "loss": 0.6079, + "step": 6144 + }, + { + "epoch": 0.21, + "learning_rate": 1.785050584962135e-05, + "loss": 0.6605, + "step": 6145 + }, + { + "epoch": 0.21, + "learning_rate": 1.78498313257698e-05, + "loss": 0.6478, + "step": 6146 + }, + { + "epoch": 0.21, + "learning_rate": 1.7849156708848573e-05, + "loss": 0.6279, + "step": 6147 + }, + { + "epoch": 0.21, + "learning_rate": 1.7848481998865665e-05, + "loss": 0.6629, + "step": 6148 + }, + { + "epoch": 0.21, + "learning_rate": 1.7847807195829072e-05, + "loss": 0.623, + "step": 6149 + }, + { + "epoch": 0.21, + "learning_rate": 1.7847132299746798e-05, + "loss": 0.6877, + "step": 6150 + }, + { + "epoch": 0.21, + "learning_rate": 1.784645731062684e-05, + "loss": 0.6204, + "step": 6151 + }, + { + "epoch": 0.21, + "learning_rate": 1.7845782228477212e-05, + "loss": 0.6084, + "step": 6152 + }, + { + "epoch": 0.21, + "learning_rate": 1.7845107053305906e-05, + "loss": 0.6416, + "step": 6153 + }, + { + "epoch": 0.21, + "learning_rate": 1.7844431785120934e-05, + "loss": 0.6478, + "step": 6154 + }, + { + "epoch": 0.21, + "learning_rate": 1.7843756423930296e-05, + "loss": 0.5702, + "step": 6155 + }, + { + "epoch": 0.21, + "learning_rate": 1.7843080969742004e-05, + "loss": 0.6489, + "step": 6156 + }, + { + "epoch": 0.21, + "learning_rate": 1.784240542256407e-05, + "loss": 0.644, + "step": 6157 + }, + { + "epoch": 0.21, + "learning_rate": 1.7841729782404494e-05, + "loss": 0.6528, + "step": 6158 + }, + { + "epoch": 0.21, + "learning_rate": 1.7841054049271295e-05, + "loss": 0.6442, + "step": 6159 + }, + { + "epoch": 0.21, + "learning_rate": 1.784037822317248e-05, + "loss": 0.6461, + "step": 6160 + }, + { + "epoch": 0.21, + "learning_rate": 1.7839702304116063e-05, + "loss": 0.6876, + "step": 6161 + }, + { + "epoch": 0.21, + "learning_rate": 1.783902629211006e-05, + "loss": 0.6156, + "step": 6162 + }, + { + "epoch": 0.21, + "learning_rate": 1.7838350187162482e-05, + "loss": 0.5995, + "step": 6163 + }, + { + "epoch": 0.21, + "learning_rate": 1.7837673989281346e-05, + "loss": 0.6038, + "step": 6164 + }, + { + "epoch": 0.21, + "learning_rate": 1.7836997698474672e-05, + "loss": 0.6558, + "step": 6165 + }, + { + "epoch": 0.21, + "learning_rate": 1.7836321314750472e-05, + "loss": 0.6285, + "step": 6166 + }, + { + "epoch": 0.21, + "learning_rate": 1.7835644838116776e-05, + "loss": 0.6205, + "step": 6167 + }, + { + "epoch": 0.21, + "learning_rate": 1.7834968268581595e-05, + "loss": 0.6318, + "step": 6168 + }, + { + "epoch": 0.21, + "learning_rate": 1.7834291606152957e-05, + "loss": 0.702, + "step": 6169 + }, + { + "epoch": 0.21, + "learning_rate": 1.7833614850838876e-05, + "loss": 0.6477, + "step": 6170 + }, + { + "epoch": 0.21, + "learning_rate": 1.7832938002647385e-05, + "loss": 0.6632, + "step": 6171 + }, + { + "epoch": 0.21, + "learning_rate": 1.7832261061586504e-05, + "loss": 0.5773, + "step": 6172 + }, + { + "epoch": 0.21, + "learning_rate": 1.7831584027664262e-05, + "loss": 0.6615, + "step": 6173 + }, + { + "epoch": 0.21, + "learning_rate": 1.7830906900888687e-05, + "loss": 0.629, + "step": 6174 + }, + { + "epoch": 0.21, + "learning_rate": 1.7830229681267797e-05, + "loss": 0.6246, + "step": 6175 + }, + { + "epoch": 0.21, + "learning_rate": 1.7829552368809633e-05, + "loss": 0.6372, + "step": 6176 + }, + { + "epoch": 0.21, + "learning_rate": 1.782887496352222e-05, + "loss": 0.5479, + "step": 6177 + }, + { + "epoch": 0.21, + "learning_rate": 1.7828197465413595e-05, + "loss": 0.6194, + "step": 6178 + }, + { + "epoch": 0.21, + "learning_rate": 1.7827519874491784e-05, + "loss": 0.6537, + "step": 6179 + }, + { + "epoch": 0.21, + "learning_rate": 1.7826842190764822e-05, + "loss": 0.6131, + "step": 6180 + }, + { + "epoch": 0.21, + "learning_rate": 1.782616441424074e-05, + "loss": 0.6647, + "step": 6181 + }, + { + "epoch": 0.21, + "learning_rate": 1.7825486544927587e-05, + "loss": 0.6643, + "step": 6182 + }, + { + "epoch": 0.21, + "learning_rate": 1.7824808582833387e-05, + "loss": 0.622, + "step": 6183 + }, + { + "epoch": 0.21, + "learning_rate": 1.7824130527966183e-05, + "loss": 0.6473, + "step": 6184 + }, + { + "epoch": 0.21, + "learning_rate": 1.7823452380334017e-05, + "loss": 0.6291, + "step": 6185 + }, + { + "epoch": 0.21, + "learning_rate": 1.7822774139944924e-05, + "loss": 0.6328, + "step": 6186 + }, + { + "epoch": 0.21, + "learning_rate": 1.7822095806806946e-05, + "loss": 0.617, + "step": 6187 + }, + { + "epoch": 0.21, + "learning_rate": 1.7821417380928133e-05, + "loss": 0.6025, + "step": 6188 + }, + { + "epoch": 0.21, + "learning_rate": 1.782073886231652e-05, + "loss": 0.5982, + "step": 6189 + }, + { + "epoch": 0.21, + "learning_rate": 1.7820060250980155e-05, + "loss": 0.6339, + "step": 6190 + }, + { + "epoch": 0.21, + "learning_rate": 1.781938154692708e-05, + "loss": 0.593, + "step": 6191 + }, + { + "epoch": 0.21, + "learning_rate": 1.7818702750165346e-05, + "loss": 0.6542, + "step": 6192 + }, + { + "epoch": 0.21, + "learning_rate": 1.7818023860703003e-05, + "loss": 0.6551, + "step": 6193 + }, + { + "epoch": 0.21, + "learning_rate": 1.7817344878548092e-05, + "loss": 0.6236, + "step": 6194 + }, + { + "epoch": 0.21, + "learning_rate": 1.7816665803708675e-05, + "loss": 0.6038, + "step": 6195 + }, + { + "epoch": 0.21, + "learning_rate": 1.7815986636192794e-05, + "loss": 0.6341, + "step": 6196 + }, + { + "epoch": 0.21, + "learning_rate": 1.7815307376008504e-05, + "loss": 0.6515, + "step": 6197 + }, + { + "epoch": 0.21, + "learning_rate": 1.7814628023163858e-05, + "loss": 0.6307, + "step": 6198 + }, + { + "epoch": 0.21, + "learning_rate": 1.7813948577666912e-05, + "loss": 0.6308, + "step": 6199 + }, + { + "epoch": 0.21, + "learning_rate": 1.781326903952572e-05, + "loss": 0.6149, + "step": 6200 + }, + { + "epoch": 0.21, + "learning_rate": 1.781258940874834e-05, + "loss": 0.6056, + "step": 6201 + }, + { + "epoch": 0.21, + "learning_rate": 1.781190968534283e-05, + "loss": 0.5867, + "step": 6202 + }, + { + "epoch": 0.21, + "learning_rate": 1.781122986931725e-05, + "loss": 0.6762, + "step": 6203 + }, + { + "epoch": 0.21, + "learning_rate": 1.781054996067966e-05, + "loss": 0.6363, + "step": 6204 + }, + { + "epoch": 0.21, + "learning_rate": 1.7809869959438115e-05, + "loss": 0.6786, + "step": 6205 + }, + { + "epoch": 0.22, + "learning_rate": 1.780918986560068e-05, + "loss": 0.6414, + "step": 6206 + }, + { + "epoch": 0.22, + "learning_rate": 1.7808509679175427e-05, + "loss": 0.6723, + "step": 6207 + }, + { + "epoch": 0.22, + "learning_rate": 1.7807829400170414e-05, + "loss": 0.6461, + "step": 6208 + }, + { + "epoch": 0.22, + "learning_rate": 1.7807149028593703e-05, + "loss": 0.6517, + "step": 6209 + }, + { + "epoch": 0.22, + "learning_rate": 1.7806468564453366e-05, + "loss": 0.6254, + "step": 6210 + }, + { + "epoch": 0.22, + "learning_rate": 1.780578800775747e-05, + "loss": 0.6789, + "step": 6211 + }, + { + "epoch": 0.22, + "learning_rate": 1.780510735851408e-05, + "loss": 0.6261, + "step": 6212 + }, + { + "epoch": 0.22, + "learning_rate": 1.7804426616731268e-05, + "loss": 0.6679, + "step": 6213 + }, + { + "epoch": 0.22, + "learning_rate": 1.7803745782417107e-05, + "loss": 0.6047, + "step": 6214 + }, + { + "epoch": 0.22, + "learning_rate": 1.780306485557967e-05, + "loss": 0.6531, + "step": 6215 + }, + { + "epoch": 0.22, + "learning_rate": 1.7802383836227027e-05, + "loss": 0.6411, + "step": 6216 + }, + { + "epoch": 0.22, + "learning_rate": 1.7801702724367253e-05, + "loss": 0.6697, + "step": 6217 + }, + { + "epoch": 0.22, + "learning_rate": 1.7801021520008423e-05, + "loss": 0.6687, + "step": 6218 + }, + { + "epoch": 0.22, + "learning_rate": 1.7800340223158615e-05, + "loss": 0.6406, + "step": 6219 + }, + { + "epoch": 0.22, + "learning_rate": 1.779965883382591e-05, + "loss": 0.6704, + "step": 6220 + }, + { + "epoch": 0.22, + "learning_rate": 1.779897735201838e-05, + "loss": 0.6434, + "step": 6221 + }, + { + "epoch": 0.22, + "learning_rate": 1.7798295777744105e-05, + "loss": 0.6008, + "step": 6222 + }, + { + "epoch": 0.22, + "learning_rate": 1.7797614111011175e-05, + "loss": 0.6264, + "step": 6223 + }, + { + "epoch": 0.22, + "learning_rate": 1.779693235182766e-05, + "loss": 0.6435, + "step": 6224 + }, + { + "epoch": 0.22, + "learning_rate": 1.779625050020165e-05, + "loss": 0.6582, + "step": 6225 + }, + { + "epoch": 0.22, + "learning_rate": 1.779556855614123e-05, + "loss": 0.6374, + "step": 6226 + }, + { + "epoch": 0.22, + "learning_rate": 1.7794886519654482e-05, + "loss": 0.6624, + "step": 6227 + }, + { + "epoch": 0.22, + "learning_rate": 1.7794204390749493e-05, + "loss": 0.6432, + "step": 6228 + }, + { + "epoch": 0.22, + "learning_rate": 1.779352216943435e-05, + "loss": 0.5938, + "step": 6229 + }, + { + "epoch": 0.22, + "learning_rate": 1.779283985571715e-05, + "loss": 0.6533, + "step": 6230 + }, + { + "epoch": 0.22, + "learning_rate": 1.7792157449605967e-05, + "loss": 0.6807, + "step": 6231 + }, + { + "epoch": 0.22, + "learning_rate": 1.7791474951108905e-05, + "loss": 0.6599, + "step": 6232 + }, + { + "epoch": 0.22, + "learning_rate": 1.779079236023405e-05, + "loss": 0.6318, + "step": 6233 + }, + { + "epoch": 0.22, + "learning_rate": 1.7790109676989496e-05, + "loss": 0.6176, + "step": 6234 + }, + { + "epoch": 0.22, + "learning_rate": 1.7789426901383335e-05, + "loss": 0.6133, + "step": 6235 + }, + { + "epoch": 0.22, + "learning_rate": 1.7788744033423668e-05, + "loss": 0.649, + "step": 6236 + }, + { + "epoch": 0.22, + "learning_rate": 1.7788061073118584e-05, + "loss": 0.6679, + "step": 6237 + }, + { + "epoch": 0.22, + "learning_rate": 1.7787378020476193e-05, + "loss": 0.6258, + "step": 6238 + }, + { + "epoch": 0.22, + "learning_rate": 1.7786694875504575e-05, + "loss": 0.5994, + "step": 6239 + }, + { + "epoch": 0.22, + "learning_rate": 1.778601163821184e-05, + "loss": 0.6717, + "step": 6240 + }, + { + "epoch": 0.22, + "learning_rate": 1.778532830860609e-05, + "loss": 0.6276, + "step": 6241 + }, + { + "epoch": 0.22, + "learning_rate": 1.7784644886695427e-05, + "loss": 0.5737, + "step": 6242 + }, + { + "epoch": 0.22, + "learning_rate": 1.7783961372487947e-05, + "loss": 0.6178, + "step": 6243 + }, + { + "epoch": 0.22, + "learning_rate": 1.778327776599176e-05, + "loss": 0.6661, + "step": 6244 + }, + { + "epoch": 0.22, + "learning_rate": 1.778259406721497e-05, + "loss": 0.603, + "step": 6245 + }, + { + "epoch": 0.22, + "learning_rate": 1.778191027616568e-05, + "loss": 0.6039, + "step": 6246 + }, + { + "epoch": 0.22, + "learning_rate": 1.7781226392851997e-05, + "loss": 0.6035, + "step": 6247 + }, + { + "epoch": 0.22, + "learning_rate": 1.778054241728204e-05, + "loss": 0.6409, + "step": 6248 + }, + { + "epoch": 0.22, + "learning_rate": 1.7779858349463904e-05, + "loss": 0.6917, + "step": 6249 + }, + { + "epoch": 0.22, + "learning_rate": 1.7779174189405708e-05, + "loss": 0.6479, + "step": 6250 + }, + { + "epoch": 0.22, + "learning_rate": 1.777848993711556e-05, + "loss": 0.6668, + "step": 6251 + }, + { + "epoch": 0.22, + "learning_rate": 1.7777805592601575e-05, + "loss": 0.6926, + "step": 6252 + }, + { + "epoch": 0.22, + "learning_rate": 1.7777121155871864e-05, + "loss": 0.638, + "step": 6253 + }, + { + "epoch": 0.22, + "learning_rate": 1.7776436626934543e-05, + "loss": 0.6134, + "step": 6254 + }, + { + "epoch": 0.22, + "learning_rate": 1.777575200579773e-05, + "loss": 0.6788, + "step": 6255 + }, + { + "epoch": 0.22, + "learning_rate": 1.7775067292469545e-05, + "loss": 0.641, + "step": 6256 + }, + { + "epoch": 0.22, + "learning_rate": 1.7774382486958094e-05, + "loss": 0.6338, + "step": 6257 + }, + { + "epoch": 0.22, + "learning_rate": 1.7773697589271508e-05, + "loss": 0.6775, + "step": 6258 + }, + { + "epoch": 0.22, + "learning_rate": 1.7773012599417902e-05, + "loss": 0.6311, + "step": 6259 + }, + { + "epoch": 0.22, + "learning_rate": 1.77723275174054e-05, + "loss": 0.6247, + "step": 6260 + }, + { + "epoch": 0.22, + "learning_rate": 1.777164234324212e-05, + "loss": 0.6408, + "step": 6261 + }, + { + "epoch": 0.22, + "learning_rate": 1.7770957076936195e-05, + "loss": 0.6323, + "step": 6262 + }, + { + "epoch": 0.22, + "learning_rate": 1.777027171849574e-05, + "loss": 0.6206, + "step": 6263 + }, + { + "epoch": 0.22, + "learning_rate": 1.7769586267928883e-05, + "loss": 0.6192, + "step": 6264 + }, + { + "epoch": 0.22, + "learning_rate": 1.7768900725243753e-05, + "loss": 0.6557, + "step": 6265 + }, + { + "epoch": 0.22, + "learning_rate": 1.776821509044848e-05, + "loss": 0.5892, + "step": 6266 + }, + { + "epoch": 0.22, + "learning_rate": 1.7767529363551188e-05, + "loss": 0.5731, + "step": 6267 + }, + { + "epoch": 0.22, + "learning_rate": 1.776684354456001e-05, + "loss": 0.6482, + "step": 6268 + }, + { + "epoch": 0.22, + "learning_rate": 1.7766157633483075e-05, + "loss": 0.6386, + "step": 6269 + }, + { + "epoch": 0.22, + "learning_rate": 1.7765471630328518e-05, + "loss": 0.6781, + "step": 6270 + }, + { + "epoch": 0.22, + "learning_rate": 1.7764785535104474e-05, + "loss": 0.626, + "step": 6271 + }, + { + "epoch": 0.22, + "learning_rate": 1.7764099347819073e-05, + "loss": 0.6474, + "step": 6272 + }, + { + "epoch": 0.22, + "learning_rate": 1.776341306848045e-05, + "loss": 0.6227, + "step": 6273 + }, + { + "epoch": 0.22, + "learning_rate": 1.7762726697096748e-05, + "loss": 0.606, + "step": 6274 + }, + { + "epoch": 0.22, + "learning_rate": 1.7762040233676102e-05, + "loss": 0.689, + "step": 6275 + }, + { + "epoch": 0.22, + "learning_rate": 1.7761353678226644e-05, + "loss": 0.6072, + "step": 6276 + }, + { + "epoch": 0.22, + "learning_rate": 1.7760667030756526e-05, + "loss": 0.6837, + "step": 6277 + }, + { + "epoch": 0.22, + "learning_rate": 1.775998029127388e-05, + "loss": 0.6248, + "step": 6278 + }, + { + "epoch": 0.22, + "learning_rate": 1.775929345978685e-05, + "loss": 0.6791, + "step": 6279 + }, + { + "epoch": 0.22, + "learning_rate": 1.7758606536303586e-05, + "loss": 0.6327, + "step": 6280 + }, + { + "epoch": 0.22, + "learning_rate": 1.775791952083222e-05, + "loss": 0.6113, + "step": 6281 + }, + { + "epoch": 0.22, + "learning_rate": 1.775723241338091e-05, + "loss": 0.6094, + "step": 6282 + }, + { + "epoch": 0.22, + "learning_rate": 1.7756545213957793e-05, + "loss": 0.6435, + "step": 6283 + }, + { + "epoch": 0.22, + "learning_rate": 1.7755857922571023e-05, + "loss": 0.6563, + "step": 6284 + }, + { + "epoch": 0.22, + "learning_rate": 1.7755170539228744e-05, + "loss": 0.6195, + "step": 6285 + }, + { + "epoch": 0.22, + "learning_rate": 1.775448306393911e-05, + "loss": 0.609, + "step": 6286 + }, + { + "epoch": 0.22, + "learning_rate": 1.7753795496710267e-05, + "loss": 0.6576, + "step": 6287 + }, + { + "epoch": 0.22, + "learning_rate": 1.7753107837550373e-05, + "loss": 0.6118, + "step": 6288 + }, + { + "epoch": 0.22, + "learning_rate": 1.7752420086467577e-05, + "loss": 0.6389, + "step": 6289 + }, + { + "epoch": 0.22, + "learning_rate": 1.775173224347003e-05, + "loss": 0.6157, + "step": 6290 + }, + { + "epoch": 0.22, + "learning_rate": 1.7751044308565894e-05, + "loss": 0.6306, + "step": 6291 + }, + { + "epoch": 0.22, + "learning_rate": 1.7750356281763326e-05, + "loss": 0.6314, + "step": 6292 + }, + { + "epoch": 0.22, + "learning_rate": 1.7749668163070474e-05, + "loss": 0.6166, + "step": 6293 + }, + { + "epoch": 0.22, + "learning_rate": 1.7748979952495507e-05, + "loss": 0.5925, + "step": 6294 + }, + { + "epoch": 0.22, + "learning_rate": 1.774829165004658e-05, + "loss": 0.6589, + "step": 6295 + }, + { + "epoch": 0.22, + "learning_rate": 1.774760325573185e-05, + "loss": 0.6165, + "step": 6296 + }, + { + "epoch": 0.22, + "learning_rate": 1.7746914769559488e-05, + "loss": 0.5919, + "step": 6297 + }, + { + "epoch": 0.22, + "learning_rate": 1.7746226191537647e-05, + "loss": 0.6593, + "step": 6298 + }, + { + "epoch": 0.22, + "learning_rate": 1.77455375216745e-05, + "loss": 0.6533, + "step": 6299 + }, + { + "epoch": 0.22, + "learning_rate": 1.7744848759978202e-05, + "loss": 0.6723, + "step": 6300 + }, + { + "epoch": 0.22, + "learning_rate": 1.774415990645693e-05, + "loss": 0.6303, + "step": 6301 + }, + { + "epoch": 0.22, + "learning_rate": 1.774347096111884e-05, + "loss": 0.656, + "step": 6302 + }, + { + "epoch": 0.22, + "learning_rate": 1.774278192397211e-05, + "loss": 0.6594, + "step": 6303 + }, + { + "epoch": 0.22, + "learning_rate": 1.7742092795024906e-05, + "loss": 0.6584, + "step": 6304 + }, + { + "epoch": 0.22, + "learning_rate": 1.7741403574285398e-05, + "loss": 0.5816, + "step": 6305 + }, + { + "epoch": 0.22, + "learning_rate": 1.7740714261761756e-05, + "loss": 0.6293, + "step": 6306 + }, + { + "epoch": 0.22, + "learning_rate": 1.7740024857462158e-05, + "loss": 0.6605, + "step": 6307 + }, + { + "epoch": 0.22, + "learning_rate": 1.773933536139477e-05, + "loss": 0.6526, + "step": 6308 + }, + { + "epoch": 0.22, + "learning_rate": 1.7738645773567774e-05, + "loss": 0.6455, + "step": 6309 + }, + { + "epoch": 0.22, + "learning_rate": 1.773795609398934e-05, + "loss": 0.6057, + "step": 6310 + }, + { + "epoch": 0.22, + "learning_rate": 1.7737266322667647e-05, + "loss": 0.6522, + "step": 6311 + }, + { + "epoch": 0.22, + "learning_rate": 1.773657645961088e-05, + "loss": 0.6662, + "step": 6312 + }, + { + "epoch": 0.22, + "learning_rate": 1.7735886504827207e-05, + "loss": 0.5417, + "step": 6313 + }, + { + "epoch": 0.22, + "learning_rate": 1.7735196458324816e-05, + "loss": 0.7134, + "step": 6314 + }, + { + "epoch": 0.22, + "learning_rate": 1.7734506320111885e-05, + "loss": 0.678, + "step": 6315 + }, + { + "epoch": 0.22, + "learning_rate": 1.7733816090196598e-05, + "loss": 0.6079, + "step": 6316 + }, + { + "epoch": 0.22, + "learning_rate": 1.7733125768587135e-05, + "loss": 0.6184, + "step": 6317 + }, + { + "epoch": 0.22, + "learning_rate": 1.7732435355291685e-05, + "loss": 0.6572, + "step": 6318 + }, + { + "epoch": 0.22, + "learning_rate": 1.7731744850318438e-05, + "loss": 0.6413, + "step": 6319 + }, + { + "epoch": 0.22, + "learning_rate": 1.7731054253675568e-05, + "loss": 0.6775, + "step": 6320 + }, + { + "epoch": 0.22, + "learning_rate": 1.7730363565371274e-05, + "loss": 0.6046, + "step": 6321 + }, + { + "epoch": 0.22, + "learning_rate": 1.7729672785413737e-05, + "loss": 0.6735, + "step": 6322 + }, + { + "epoch": 0.22, + "learning_rate": 1.7728981913811155e-05, + "loss": 0.6362, + "step": 6323 + }, + { + "epoch": 0.22, + "learning_rate": 1.7728290950571714e-05, + "loss": 0.6304, + "step": 6324 + }, + { + "epoch": 0.22, + "learning_rate": 1.7727599895703606e-05, + "loss": 0.6117, + "step": 6325 + }, + { + "epoch": 0.22, + "learning_rate": 1.7726908749215028e-05, + "loss": 0.6547, + "step": 6326 + }, + { + "epoch": 0.22, + "learning_rate": 1.7726217511114168e-05, + "loss": 0.6525, + "step": 6327 + }, + { + "epoch": 0.22, + "learning_rate": 1.7725526181409232e-05, + "loss": 0.5855, + "step": 6328 + }, + { + "epoch": 0.22, + "learning_rate": 1.7724834760108403e-05, + "loss": 0.6075, + "step": 6329 + }, + { + "epoch": 0.22, + "learning_rate": 1.772414324721989e-05, + "loss": 0.6118, + "step": 6330 + }, + { + "epoch": 0.22, + "learning_rate": 1.772345164275189e-05, + "loss": 0.6547, + "step": 6331 + }, + { + "epoch": 0.22, + "learning_rate": 1.7722759946712598e-05, + "loss": 0.5965, + "step": 6332 + }, + { + "epoch": 0.22, + "learning_rate": 1.7722068159110216e-05, + "loss": 0.6437, + "step": 6333 + }, + { + "epoch": 0.22, + "learning_rate": 1.7721376279952948e-05, + "loss": 0.6355, + "step": 6334 + }, + { + "epoch": 0.22, + "learning_rate": 1.7720684309249e-05, + "loss": 0.6536, + "step": 6335 + }, + { + "epoch": 0.22, + "learning_rate": 1.771999224700657e-05, + "loss": 0.6447, + "step": 6336 + }, + { + "epoch": 0.22, + "learning_rate": 1.771930009323387e-05, + "loss": 0.6461, + "step": 6337 + }, + { + "epoch": 0.22, + "learning_rate": 1.77186078479391e-05, + "loss": 0.5968, + "step": 6338 + }, + { + "epoch": 0.22, + "learning_rate": 1.7717915511130465e-05, + "loss": 0.7068, + "step": 6339 + }, + { + "epoch": 0.22, + "learning_rate": 1.7717223082816183e-05, + "loss": 0.6066, + "step": 6340 + }, + { + "epoch": 0.22, + "learning_rate": 1.7716530563004458e-05, + "loss": 0.622, + "step": 6341 + }, + { + "epoch": 0.22, + "learning_rate": 1.7715837951703504e-05, + "loss": 0.655, + "step": 6342 + }, + { + "epoch": 0.22, + "learning_rate": 1.7715145248921525e-05, + "loss": 0.6378, + "step": 6343 + }, + { + "epoch": 0.22, + "learning_rate": 1.7714452454666744e-05, + "loss": 0.6497, + "step": 6344 + }, + { + "epoch": 0.22, + "learning_rate": 1.771375956894737e-05, + "loss": 0.6836, + "step": 6345 + }, + { + "epoch": 0.22, + "learning_rate": 1.771306659177162e-05, + "loss": 0.661, + "step": 6346 + }, + { + "epoch": 0.22, + "learning_rate": 1.7712373523147704e-05, + "loss": 0.6046, + "step": 6347 + }, + { + "epoch": 0.22, + "learning_rate": 1.7711680363083845e-05, + "loss": 0.622, + "step": 6348 + }, + { + "epoch": 0.22, + "learning_rate": 1.771098711158826e-05, + "loss": 0.7245, + "step": 6349 + }, + { + "epoch": 0.22, + "learning_rate": 1.771029376866917e-05, + "loss": 0.6822, + "step": 6350 + }, + { + "epoch": 0.22, + "learning_rate": 1.7709600334334794e-05, + "loss": 0.6306, + "step": 6351 + }, + { + "epoch": 0.22, + "learning_rate": 1.770890680859335e-05, + "loss": 0.604, + "step": 6352 + }, + { + "epoch": 0.22, + "learning_rate": 1.7708213191453065e-05, + "loss": 0.6336, + "step": 6353 + }, + { + "epoch": 0.22, + "learning_rate": 1.7707519482922165e-05, + "loss": 0.6488, + "step": 6354 + }, + { + "epoch": 0.22, + "learning_rate": 1.770682568300887e-05, + "loss": 0.6491, + "step": 6355 + }, + { + "epoch": 0.22, + "learning_rate": 1.7706131791721406e-05, + "loss": 0.6283, + "step": 6356 + }, + { + "epoch": 0.22, + "learning_rate": 1.7705437809068e-05, + "loss": 0.6717, + "step": 6357 + }, + { + "epoch": 0.22, + "learning_rate": 1.7704743735056883e-05, + "loss": 0.6395, + "step": 6358 + }, + { + "epoch": 0.22, + "learning_rate": 1.7704049569696284e-05, + "loss": 0.6365, + "step": 6359 + }, + { + "epoch": 0.22, + "learning_rate": 1.770335531299443e-05, + "loss": 0.6563, + "step": 6360 + }, + { + "epoch": 0.22, + "learning_rate": 1.7702660964959557e-05, + "loss": 0.637, + "step": 6361 + }, + { + "epoch": 0.22, + "learning_rate": 1.7701966525599893e-05, + "loss": 0.6878, + "step": 6362 + }, + { + "epoch": 0.22, + "learning_rate": 1.7701271994923667e-05, + "loss": 0.6833, + "step": 6363 + }, + { + "epoch": 0.22, + "learning_rate": 1.770057737293913e-05, + "loss": 0.5652, + "step": 6364 + }, + { + "epoch": 0.22, + "learning_rate": 1.7699882659654498e-05, + "loss": 0.6598, + "step": 6365 + }, + { + "epoch": 0.22, + "learning_rate": 1.7699187855078018e-05, + "loss": 0.5691, + "step": 6366 + }, + { + "epoch": 0.22, + "learning_rate": 1.769849295921793e-05, + "loss": 0.5826, + "step": 6367 + }, + { + "epoch": 0.22, + "learning_rate": 1.7697797972082465e-05, + "loss": 0.5988, + "step": 6368 + }, + { + "epoch": 0.22, + "learning_rate": 1.769710289367987e-05, + "loss": 0.6696, + "step": 6369 + }, + { + "epoch": 0.22, + "learning_rate": 1.7696407724018384e-05, + "loss": 0.657, + "step": 6370 + }, + { + "epoch": 0.22, + "learning_rate": 1.7695712463106245e-05, + "loss": 0.6536, + "step": 6371 + }, + { + "epoch": 0.22, + "learning_rate": 1.7695017110951703e-05, + "loss": 0.6693, + "step": 6372 + }, + { + "epoch": 0.22, + "learning_rate": 1.7694321667563e-05, + "loss": 0.6919, + "step": 6373 + }, + { + "epoch": 0.22, + "learning_rate": 1.7693626132948378e-05, + "loss": 0.5516, + "step": 6374 + }, + { + "epoch": 0.22, + "learning_rate": 1.7692930507116084e-05, + "loss": 0.6466, + "step": 6375 + }, + { + "epoch": 0.22, + "learning_rate": 1.769223479007437e-05, + "loss": 0.6162, + "step": 6376 + }, + { + "epoch": 0.22, + "learning_rate": 1.769153898183148e-05, + "loss": 0.598, + "step": 6377 + }, + { + "epoch": 0.22, + "learning_rate": 1.7690843082395666e-05, + "loss": 0.6393, + "step": 6378 + }, + { + "epoch": 0.22, + "learning_rate": 1.7690147091775177e-05, + "loss": 0.6404, + "step": 6379 + }, + { + "epoch": 0.22, + "learning_rate": 1.768945100997827e-05, + "loss": 0.6197, + "step": 6380 + }, + { + "epoch": 0.22, + "learning_rate": 1.768875483701319e-05, + "loss": 0.6315, + "step": 6381 + }, + { + "epoch": 0.22, + "learning_rate": 1.76880585728882e-05, + "loss": 0.6745, + "step": 6382 + }, + { + "epoch": 0.22, + "learning_rate": 1.7687362217611545e-05, + "loss": 0.609, + "step": 6383 + }, + { + "epoch": 0.22, + "learning_rate": 1.768666577119149e-05, + "loss": 0.6607, + "step": 6384 + }, + { + "epoch": 0.22, + "learning_rate": 1.7685969233636286e-05, + "loss": 0.6393, + "step": 6385 + }, + { + "epoch": 0.22, + "learning_rate": 1.7685272604954195e-05, + "loss": 0.6545, + "step": 6386 + }, + { + "epoch": 0.22, + "learning_rate": 1.7684575885153474e-05, + "loss": 0.6277, + "step": 6387 + }, + { + "epoch": 0.22, + "learning_rate": 1.7683879074242388e-05, + "loss": 0.5958, + "step": 6388 + }, + { + "epoch": 0.22, + "learning_rate": 1.7683182172229192e-05, + "loss": 0.6146, + "step": 6389 + }, + { + "epoch": 0.22, + "learning_rate": 1.7682485179122157e-05, + "loss": 0.6337, + "step": 6390 + }, + { + "epoch": 0.22, + "learning_rate": 1.7681788094929535e-05, + "loss": 0.6648, + "step": 6391 + }, + { + "epoch": 0.22, + "learning_rate": 1.7681090919659604e-05, + "loss": 0.6125, + "step": 6392 + }, + { + "epoch": 0.22, + "learning_rate": 1.768039365332062e-05, + "loss": 0.6527, + "step": 6393 + }, + { + "epoch": 0.22, + "learning_rate": 1.7679696295920852e-05, + "loss": 0.6653, + "step": 6394 + }, + { + "epoch": 0.22, + "learning_rate": 1.7678998847468572e-05, + "loss": 0.6559, + "step": 6395 + }, + { + "epoch": 0.22, + "learning_rate": 1.7678301307972048e-05, + "loss": 0.6422, + "step": 6396 + }, + { + "epoch": 0.22, + "learning_rate": 1.7677603677439546e-05, + "loss": 0.6412, + "step": 6397 + }, + { + "epoch": 0.22, + "learning_rate": 1.767690595587934e-05, + "loss": 0.6402, + "step": 6398 + }, + { + "epoch": 0.22, + "learning_rate": 1.7676208143299706e-05, + "loss": 0.5953, + "step": 6399 + }, + { + "epoch": 0.22, + "learning_rate": 1.7675510239708912e-05, + "loss": 0.6393, + "step": 6400 + }, + { + "epoch": 0.22, + "learning_rate": 1.7674812245115233e-05, + "loss": 0.6043, + "step": 6401 + }, + { + "epoch": 0.22, + "learning_rate": 1.767411415952695e-05, + "loss": 0.6521, + "step": 6402 + }, + { + "epoch": 0.22, + "learning_rate": 1.7673415982952333e-05, + "loss": 0.6097, + "step": 6403 + }, + { + "epoch": 0.22, + "learning_rate": 1.7672717715399664e-05, + "loss": 0.7108, + "step": 6404 + }, + { + "epoch": 0.22, + "learning_rate": 1.767201935687722e-05, + "loss": 0.5815, + "step": 6405 + }, + { + "epoch": 0.22, + "learning_rate": 1.767132090739328e-05, + "loss": 0.6251, + "step": 6406 + }, + { + "epoch": 0.22, + "learning_rate": 1.7670622366956126e-05, + "loss": 0.6521, + "step": 6407 + }, + { + "epoch": 0.22, + "learning_rate": 1.7669923735574045e-05, + "loss": 0.6249, + "step": 6408 + }, + { + "epoch": 0.22, + "learning_rate": 1.7669225013255312e-05, + "loss": 0.7024, + "step": 6409 + }, + { + "epoch": 0.22, + "learning_rate": 1.7668526200008212e-05, + "loss": 0.6622, + "step": 6410 + }, + { + "epoch": 0.22, + "learning_rate": 1.7667827295841037e-05, + "loss": 0.5927, + "step": 6411 + }, + { + "epoch": 0.22, + "learning_rate": 1.7667128300762073e-05, + "loss": 0.5946, + "step": 6412 + }, + { + "epoch": 0.22, + "learning_rate": 1.7666429214779597e-05, + "loss": 0.5833, + "step": 6413 + }, + { + "epoch": 0.22, + "learning_rate": 1.7665730037901907e-05, + "loss": 0.6634, + "step": 6414 + }, + { + "epoch": 0.22, + "learning_rate": 1.766503077013729e-05, + "loss": 0.6608, + "step": 6415 + }, + { + "epoch": 0.22, + "learning_rate": 1.766433141149404e-05, + "loss": 0.6102, + "step": 6416 + }, + { + "epoch": 0.22, + "learning_rate": 1.7663631961980444e-05, + "loss": 0.6371, + "step": 6417 + }, + { + "epoch": 0.22, + "learning_rate": 1.7662932421604796e-05, + "loss": 0.5829, + "step": 6418 + }, + { + "epoch": 0.22, + "learning_rate": 1.766223279037539e-05, + "loss": 0.6739, + "step": 6419 + }, + { + "epoch": 0.22, + "learning_rate": 1.766153306830052e-05, + "loss": 0.6459, + "step": 6420 + }, + { + "epoch": 0.22, + "learning_rate": 1.7660833255388486e-05, + "loss": 0.6202, + "step": 6421 + }, + { + "epoch": 0.22, + "learning_rate": 1.7660133351647582e-05, + "loss": 0.6812, + "step": 6422 + }, + { + "epoch": 0.22, + "learning_rate": 1.7659433357086108e-05, + "loss": 0.6098, + "step": 6423 + }, + { + "epoch": 0.22, + "learning_rate": 1.765873327171236e-05, + "loss": 0.6911, + "step": 6424 + }, + { + "epoch": 0.22, + "learning_rate": 1.7658033095534643e-05, + "loss": 0.5746, + "step": 6425 + }, + { + "epoch": 0.22, + "learning_rate": 1.7657332828561255e-05, + "loss": 0.6476, + "step": 6426 + }, + { + "epoch": 0.22, + "learning_rate": 1.76566324708005e-05, + "loss": 0.6205, + "step": 6427 + }, + { + "epoch": 0.22, + "learning_rate": 1.7655932022260682e-05, + "loss": 0.677, + "step": 6428 + }, + { + "epoch": 0.22, + "learning_rate": 1.7655231482950107e-05, + "loss": 0.6709, + "step": 6429 + }, + { + "epoch": 0.22, + "learning_rate": 1.7654530852877075e-05, + "loss": 0.6492, + "step": 6430 + }, + { + "epoch": 0.22, + "learning_rate": 1.7653830132049898e-05, + "loss": 0.6276, + "step": 6431 + }, + { + "epoch": 0.22, + "learning_rate": 1.7653129320476882e-05, + "loss": 0.6605, + "step": 6432 + }, + { + "epoch": 0.22, + "learning_rate": 1.7652428418166336e-05, + "loss": 0.6458, + "step": 6433 + }, + { + "epoch": 0.22, + "learning_rate": 1.7651727425126574e-05, + "loss": 0.6309, + "step": 6434 + }, + { + "epoch": 0.22, + "learning_rate": 1.76510263413659e-05, + "loss": 0.6636, + "step": 6435 + }, + { + "epoch": 0.22, + "learning_rate": 1.765032516689263e-05, + "loss": 0.6406, + "step": 6436 + }, + { + "epoch": 0.22, + "learning_rate": 1.7649623901715084e-05, + "loss": 0.6791, + "step": 6437 + }, + { + "epoch": 0.22, + "learning_rate": 1.7648922545841567e-05, + "loss": 0.6589, + "step": 6438 + }, + { + "epoch": 0.22, + "learning_rate": 1.7648221099280395e-05, + "loss": 0.6564, + "step": 6439 + }, + { + "epoch": 0.22, + "learning_rate": 1.7647519562039885e-05, + "loss": 0.6246, + "step": 6440 + }, + { + "epoch": 0.22, + "learning_rate": 1.764681793412836e-05, + "loss": 0.6476, + "step": 6441 + }, + { + "epoch": 0.22, + "learning_rate": 1.7646116215554134e-05, + "loss": 0.6927, + "step": 6442 + }, + { + "epoch": 0.22, + "learning_rate": 1.7645414406325527e-05, + "loss": 0.6752, + "step": 6443 + }, + { + "epoch": 0.22, + "learning_rate": 1.7644712506450862e-05, + "loss": 0.6573, + "step": 6444 + }, + { + "epoch": 0.22, + "learning_rate": 1.764401051593846e-05, + "loss": 0.6245, + "step": 6445 + }, + { + "epoch": 0.22, + "learning_rate": 1.764330843479664e-05, + "loss": 0.664, + "step": 6446 + }, + { + "epoch": 0.22, + "learning_rate": 1.7642606263033735e-05, + "loss": 0.6486, + "step": 6447 + }, + { + "epoch": 0.22, + "learning_rate": 1.7641904000658062e-05, + "loss": 0.5877, + "step": 6448 + }, + { + "epoch": 0.22, + "learning_rate": 1.7641201647677952e-05, + "loss": 0.6907, + "step": 6449 + }, + { + "epoch": 0.22, + "learning_rate": 1.764049920410173e-05, + "loss": 0.6861, + "step": 6450 + }, + { + "epoch": 0.22, + "learning_rate": 1.763979666993772e-05, + "loss": 0.6867, + "step": 6451 + }, + { + "epoch": 0.22, + "learning_rate": 1.763909404519426e-05, + "loss": 0.6527, + "step": 6452 + }, + { + "epoch": 0.22, + "learning_rate": 1.7638391329879677e-05, + "loss": 0.6752, + "step": 6453 + }, + { + "epoch": 0.22, + "learning_rate": 1.7637688524002302e-05, + "loss": 0.6367, + "step": 6454 + }, + { + "epoch": 0.22, + "learning_rate": 1.7636985627570468e-05, + "loss": 0.675, + "step": 6455 + }, + { + "epoch": 0.22, + "learning_rate": 1.7636282640592505e-05, + "loss": 0.6748, + "step": 6456 + }, + { + "epoch": 0.22, + "learning_rate": 1.7635579563076753e-05, + "loss": 0.5962, + "step": 6457 + }, + { + "epoch": 0.22, + "learning_rate": 1.763487639503155e-05, + "loss": 0.585, + "step": 6458 + }, + { + "epoch": 0.22, + "learning_rate": 1.7634173136465228e-05, + "loss": 0.6575, + "step": 6459 + }, + { + "epoch": 0.22, + "learning_rate": 1.7633469787386122e-05, + "loss": 0.6399, + "step": 6460 + }, + { + "epoch": 0.22, + "learning_rate": 1.7632766347802576e-05, + "loss": 0.6907, + "step": 6461 + }, + { + "epoch": 0.22, + "learning_rate": 1.7632062817722934e-05, + "loss": 0.6834, + "step": 6462 + }, + { + "epoch": 0.22, + "learning_rate": 1.7631359197155528e-05, + "loss": 0.6881, + "step": 6463 + }, + { + "epoch": 0.22, + "learning_rate": 1.763065548610871e-05, + "loss": 0.6117, + "step": 6464 + }, + { + "epoch": 0.22, + "learning_rate": 1.7629951684590813e-05, + "loss": 0.6307, + "step": 6465 + }, + { + "epoch": 0.22, + "learning_rate": 1.762924779261019e-05, + "loss": 0.6526, + "step": 6466 + }, + { + "epoch": 0.22, + "learning_rate": 1.7628543810175183e-05, + "loss": 0.6274, + "step": 6467 + }, + { + "epoch": 0.22, + "learning_rate": 1.7627839737294138e-05, + "loss": 0.6567, + "step": 6468 + }, + { + "epoch": 0.22, + "learning_rate": 1.7627135573975402e-05, + "loss": 0.6109, + "step": 6469 + }, + { + "epoch": 0.22, + "learning_rate": 1.762643132022733e-05, + "loss": 0.6882, + "step": 6470 + }, + { + "epoch": 0.22, + "learning_rate": 1.7625726976058265e-05, + "loss": 0.6601, + "step": 6471 + }, + { + "epoch": 0.22, + "learning_rate": 1.762502254147656e-05, + "loss": 0.6306, + "step": 6472 + }, + { + "epoch": 0.22, + "learning_rate": 1.7624318016490565e-05, + "loss": 0.6456, + "step": 6473 + }, + { + "epoch": 0.22, + "learning_rate": 1.7623613401108638e-05, + "loss": 0.6722, + "step": 6474 + }, + { + "epoch": 0.22, + "learning_rate": 1.7622908695339127e-05, + "loss": 0.5628, + "step": 6475 + }, + { + "epoch": 0.22, + "learning_rate": 1.7622203899190394e-05, + "loss": 0.6852, + "step": 6476 + }, + { + "epoch": 0.22, + "learning_rate": 1.762149901267079e-05, + "loss": 0.6222, + "step": 6477 + }, + { + "epoch": 0.22, + "learning_rate": 1.7620794035788673e-05, + "loss": 0.6415, + "step": 6478 + }, + { + "epoch": 0.22, + "learning_rate": 1.7620088968552405e-05, + "loss": 0.6762, + "step": 6479 + }, + { + "epoch": 0.22, + "learning_rate": 1.7619383810970343e-05, + "loss": 0.6548, + "step": 6480 + }, + { + "epoch": 0.22, + "learning_rate": 1.7618678563050845e-05, + "loss": 0.6462, + "step": 6481 + }, + { + "epoch": 0.22, + "learning_rate": 1.7617973224802276e-05, + "loss": 0.6201, + "step": 6482 + }, + { + "epoch": 0.22, + "learning_rate": 1.7617267796232998e-05, + "loss": 0.6712, + "step": 6483 + }, + { + "epoch": 0.22, + "learning_rate": 1.7616562277351373e-05, + "loss": 0.6239, + "step": 6484 + }, + { + "epoch": 0.22, + "learning_rate": 1.7615856668165767e-05, + "loss": 0.611, + "step": 6485 + }, + { + "epoch": 0.22, + "learning_rate": 1.7615150968684548e-05, + "loss": 0.6264, + "step": 6486 + }, + { + "epoch": 0.22, + "learning_rate": 1.761444517891608e-05, + "loss": 0.6335, + "step": 6487 + }, + { + "epoch": 0.22, + "learning_rate": 1.7613739298868732e-05, + "loss": 0.6559, + "step": 6488 + }, + { + "epoch": 0.22, + "learning_rate": 1.7613033328550872e-05, + "loss": 0.6428, + "step": 6489 + }, + { + "epoch": 0.22, + "learning_rate": 1.761232726797087e-05, + "loss": 0.678, + "step": 6490 + }, + { + "epoch": 0.22, + "learning_rate": 1.7611621117137104e-05, + "loss": 0.608, + "step": 6491 + }, + { + "epoch": 0.22, + "learning_rate": 1.761091487605794e-05, + "loss": 0.654, + "step": 6492 + }, + { + "epoch": 0.22, + "learning_rate": 1.761020854474175e-05, + "loss": 0.6302, + "step": 6493 + }, + { + "epoch": 0.22, + "learning_rate": 1.760950212319691e-05, + "loss": 0.6077, + "step": 6494 + }, + { + "epoch": 0.23, + "learning_rate": 1.7608795611431796e-05, + "loss": 0.6231, + "step": 6495 + }, + { + "epoch": 0.23, + "learning_rate": 1.7608089009454787e-05, + "loss": 0.6681, + "step": 6496 + }, + { + "epoch": 0.23, + "learning_rate": 1.7607382317274257e-05, + "loss": 0.6383, + "step": 6497 + }, + { + "epoch": 0.23, + "learning_rate": 1.7606675534898586e-05, + "loss": 0.6991, + "step": 6498 + }, + { + "epoch": 0.23, + "learning_rate": 1.7605968662336156e-05, + "loss": 0.6879, + "step": 6499 + }, + { + "epoch": 0.23, + "learning_rate": 1.7605261699595345e-05, + "loss": 0.6172, + "step": 6500 + }, + { + "epoch": 0.23, + "learning_rate": 1.7604554646684537e-05, + "loss": 0.6621, + "step": 6501 + }, + { + "epoch": 0.23, + "learning_rate": 1.7603847503612113e-05, + "loss": 0.6532, + "step": 6502 + }, + { + "epoch": 0.23, + "learning_rate": 1.760314027038646e-05, + "loss": 0.6292, + "step": 6503 + }, + { + "epoch": 0.23, + "learning_rate": 1.7602432947015958e-05, + "loss": 0.6177, + "step": 6504 + }, + { + "epoch": 0.23, + "learning_rate": 1.7601725533508994e-05, + "loss": 0.656, + "step": 6505 + }, + { + "epoch": 0.23, + "learning_rate": 1.7601018029873963e-05, + "loss": 0.6029, + "step": 6506 + }, + { + "epoch": 0.23, + "learning_rate": 1.7600310436119245e-05, + "loss": 0.6543, + "step": 6507 + }, + { + "epoch": 0.23, + "learning_rate": 1.7599602752253232e-05, + "loss": 0.6431, + "step": 6508 + }, + { + "epoch": 0.23, + "learning_rate": 1.7598894978284316e-05, + "loss": 0.6072, + "step": 6509 + }, + { + "epoch": 0.23, + "learning_rate": 1.7598187114220887e-05, + "loss": 0.5566, + "step": 6510 + }, + { + "epoch": 0.23, + "learning_rate": 1.759747916007134e-05, + "loss": 0.5789, + "step": 6511 + }, + { + "epoch": 0.23, + "learning_rate": 1.7596771115844063e-05, + "loss": 0.6472, + "step": 6512 + }, + { + "epoch": 0.23, + "learning_rate": 1.7596062981547456e-05, + "loss": 0.6042, + "step": 6513 + }, + { + "epoch": 0.23, + "learning_rate": 1.759535475718991e-05, + "loss": 0.6776, + "step": 6514 + }, + { + "epoch": 0.23, + "learning_rate": 1.759464644277983e-05, + "loss": 0.6492, + "step": 6515 + }, + { + "epoch": 0.23, + "learning_rate": 1.759393803832561e-05, + "loss": 0.6801, + "step": 6516 + }, + { + "epoch": 0.23, + "learning_rate": 1.7593229543835643e-05, + "loss": 0.6543, + "step": 6517 + }, + { + "epoch": 0.23, + "learning_rate": 1.7592520959318338e-05, + "loss": 0.6248, + "step": 6518 + }, + { + "epoch": 0.23, + "learning_rate": 1.7591812284782092e-05, + "loss": 0.6491, + "step": 6519 + }, + { + "epoch": 0.23, + "learning_rate": 1.759110352023531e-05, + "loss": 0.6699, + "step": 6520 + }, + { + "epoch": 0.23, + "learning_rate": 1.759039466568639e-05, + "loss": 0.6308, + "step": 6521 + }, + { + "epoch": 0.23, + "learning_rate": 1.7589685721143737e-05, + "loss": 0.5761, + "step": 6522 + }, + { + "epoch": 0.23, + "learning_rate": 1.758897668661576e-05, + "loss": 0.6326, + "step": 6523 + }, + { + "epoch": 0.23, + "learning_rate": 1.758826756211087e-05, + "loss": 0.6412, + "step": 6524 + }, + { + "epoch": 0.23, + "learning_rate": 1.7587558347637462e-05, + "loss": 0.6907, + "step": 6525 + }, + { + "epoch": 0.23, + "learning_rate": 1.7586849043203955e-05, + "loss": 0.629, + "step": 6526 + }, + { + "epoch": 0.23, + "learning_rate": 1.7586139648818755e-05, + "loss": 0.633, + "step": 6527 + }, + { + "epoch": 0.23, + "learning_rate": 1.7585430164490273e-05, + "loss": 0.6385, + "step": 6528 + }, + { + "epoch": 0.23, + "learning_rate": 1.758472059022692e-05, + "loss": 0.6714, + "step": 6529 + }, + { + "epoch": 0.23, + "learning_rate": 1.7584010926037107e-05, + "loss": 0.6368, + "step": 6530 + }, + { + "epoch": 0.23, + "learning_rate": 1.758330117192925e-05, + "loss": 0.6554, + "step": 6531 + }, + { + "epoch": 0.23, + "learning_rate": 1.7582591327911772e-05, + "loss": 0.6563, + "step": 6532 + }, + { + "epoch": 0.23, + "learning_rate": 1.758188139399308e-05, + "loss": 0.6228, + "step": 6533 + }, + { + "epoch": 0.23, + "learning_rate": 1.7581171370181588e-05, + "loss": 0.6011, + "step": 6534 + }, + { + "epoch": 0.23, + "learning_rate": 1.7580461256485722e-05, + "loss": 0.6267, + "step": 6535 + }, + { + "epoch": 0.23, + "learning_rate": 1.7579751052913897e-05, + "loss": 0.6103, + "step": 6536 + }, + { + "epoch": 0.23, + "learning_rate": 1.7579040759474537e-05, + "loss": 0.6608, + "step": 6537 + }, + { + "epoch": 0.23, + "learning_rate": 1.757833037617606e-05, + "loss": 0.6, + "step": 6538 + }, + { + "epoch": 0.23, + "learning_rate": 1.757761990302689e-05, + "loss": 0.6233, + "step": 6539 + }, + { + "epoch": 0.23, + "learning_rate": 1.757690934003545e-05, + "loss": 0.68, + "step": 6540 + }, + { + "epoch": 0.23, + "learning_rate": 1.7576198687210167e-05, + "loss": 0.6524, + "step": 6541 + }, + { + "epoch": 0.23, + "learning_rate": 1.7575487944559463e-05, + "loss": 0.6324, + "step": 6542 + }, + { + "epoch": 0.23, + "learning_rate": 1.7574777112091767e-05, + "loss": 0.6019, + "step": 6543 + }, + { + "epoch": 0.23, + "learning_rate": 1.7574066189815505e-05, + "loss": 0.5972, + "step": 6544 + }, + { + "epoch": 0.23, + "learning_rate": 1.7573355177739107e-05, + "loss": 0.6349, + "step": 6545 + }, + { + "epoch": 0.23, + "learning_rate": 1.7572644075871003e-05, + "loss": 0.6115, + "step": 6546 + }, + { + "epoch": 0.23, + "learning_rate": 1.7571932884219626e-05, + "loss": 0.6363, + "step": 6547 + }, + { + "epoch": 0.23, + "learning_rate": 1.7571221602793405e-05, + "loss": 0.652, + "step": 6548 + }, + { + "epoch": 0.23, + "learning_rate": 1.757051023160077e-05, + "loss": 0.5956, + "step": 6549 + }, + { + "epoch": 0.23, + "learning_rate": 1.7569798770650166e-05, + "loss": 0.6463, + "step": 6550 + }, + { + "epoch": 0.23, + "learning_rate": 1.756908721995002e-05, + "loss": 0.626, + "step": 6551 + }, + { + "epoch": 0.23, + "learning_rate": 1.756837557950877e-05, + "loss": 0.6216, + "step": 6552 + }, + { + "epoch": 0.23, + "learning_rate": 1.756766384933485e-05, + "loss": 0.6405, + "step": 6553 + }, + { + "epoch": 0.23, + "learning_rate": 1.7566952029436707e-05, + "loss": 0.6408, + "step": 6554 + }, + { + "epoch": 0.23, + "learning_rate": 1.7566240119822772e-05, + "loss": 0.574, + "step": 6555 + }, + { + "epoch": 0.23, + "learning_rate": 1.7565528120501492e-05, + "loss": 0.5897, + "step": 6556 + }, + { + "epoch": 0.23, + "learning_rate": 1.7564816031481303e-05, + "loss": 0.612, + "step": 6557 + }, + { + "epoch": 0.23, + "learning_rate": 1.7564103852770652e-05, + "loss": 0.598, + "step": 6558 + }, + { + "epoch": 0.23, + "learning_rate": 1.756339158437798e-05, + "loss": 0.646, + "step": 6559 + }, + { + "epoch": 0.23, + "learning_rate": 1.7562679226311733e-05, + "loss": 0.6237, + "step": 6560 + }, + { + "epoch": 0.23, + "learning_rate": 1.756196677858036e-05, + "loss": 0.6396, + "step": 6561 + }, + { + "epoch": 0.23, + "learning_rate": 1.75612542411923e-05, + "loss": 0.6275, + "step": 6562 + }, + { + "epoch": 0.23, + "learning_rate": 1.756054161415601e-05, + "loss": 0.6215, + "step": 6563 + }, + { + "epoch": 0.23, + "learning_rate": 1.755982889747993e-05, + "loss": 0.6609, + "step": 6564 + }, + { + "epoch": 0.23, + "learning_rate": 1.7559116091172522e-05, + "loss": 0.6471, + "step": 6565 + }, + { + "epoch": 0.23, + "learning_rate": 1.7558403195242225e-05, + "loss": 0.5921, + "step": 6566 + }, + { + "epoch": 0.23, + "learning_rate": 1.7557690209697496e-05, + "loss": 0.6094, + "step": 6567 + }, + { + "epoch": 0.23, + "learning_rate": 1.7556977134546795e-05, + "loss": 0.6785, + "step": 6568 + }, + { + "epoch": 0.23, + "learning_rate": 1.7556263969798567e-05, + "loss": 0.6889, + "step": 6569 + }, + { + "epoch": 0.23, + "learning_rate": 1.7555550715461268e-05, + "loss": 0.6313, + "step": 6570 + }, + { + "epoch": 0.23, + "learning_rate": 1.7554837371543363e-05, + "loss": 0.6561, + "step": 6571 + }, + { + "epoch": 0.23, + "learning_rate": 1.75541239380533e-05, + "loss": 0.6363, + "step": 6572 + }, + { + "epoch": 0.23, + "learning_rate": 1.7553410414999545e-05, + "loss": 0.6707, + "step": 6573 + }, + { + "epoch": 0.23, + "learning_rate": 1.755269680239055e-05, + "loss": 0.6483, + "step": 6574 + }, + { + "epoch": 0.23, + "learning_rate": 1.7551983100234783e-05, + "loss": 0.6195, + "step": 6575 + }, + { + "epoch": 0.23, + "learning_rate": 1.7551269308540704e-05, + "loss": 0.6627, + "step": 6576 + }, + { + "epoch": 0.23, + "learning_rate": 1.7550555427316773e-05, + "loss": 0.7067, + "step": 6577 + }, + { + "epoch": 0.23, + "learning_rate": 1.7549841456571458e-05, + "loss": 0.6018, + "step": 6578 + }, + { + "epoch": 0.23, + "learning_rate": 1.7549127396313223e-05, + "loss": 0.6673, + "step": 6579 + }, + { + "epoch": 0.23, + "learning_rate": 1.7548413246550527e-05, + "loss": 0.6228, + "step": 6580 + }, + { + "epoch": 0.23, + "learning_rate": 1.7547699007291848e-05, + "loss": 0.6495, + "step": 6581 + }, + { + "epoch": 0.23, + "learning_rate": 1.754698467854565e-05, + "loss": 0.6689, + "step": 6582 + }, + { + "epoch": 0.23, + "learning_rate": 1.7546270260320397e-05, + "loss": 0.6248, + "step": 6583 + }, + { + "epoch": 0.23, + "learning_rate": 1.7545555752624566e-05, + "loss": 0.7273, + "step": 6584 + }, + { + "epoch": 0.23, + "learning_rate": 1.7544841155466627e-05, + "loss": 0.6258, + "step": 6585 + }, + { + "epoch": 0.23, + "learning_rate": 1.7544126468855052e-05, + "loss": 0.6265, + "step": 6586 + }, + { + "epoch": 0.23, + "learning_rate": 1.7543411692798313e-05, + "loss": 0.6296, + "step": 6587 + }, + { + "epoch": 0.23, + "learning_rate": 1.754269682730489e-05, + "loss": 0.6506, + "step": 6588 + }, + { + "epoch": 0.23, + "learning_rate": 1.754198187238325e-05, + "loss": 0.5766, + "step": 6589 + }, + { + "epoch": 0.23, + "learning_rate": 1.7541266828041877e-05, + "loss": 0.5604, + "step": 6590 + }, + { + "epoch": 0.23, + "learning_rate": 1.7540551694289246e-05, + "loss": 0.6479, + "step": 6591 + }, + { + "epoch": 0.23, + "learning_rate": 1.7539836471133833e-05, + "loss": 0.5989, + "step": 6592 + }, + { + "epoch": 0.23, + "learning_rate": 1.7539121158584124e-05, + "loss": 0.6472, + "step": 6593 + }, + { + "epoch": 0.23, + "learning_rate": 1.7538405756648594e-05, + "loss": 0.648, + "step": 6594 + }, + { + "epoch": 0.23, + "learning_rate": 1.753769026533573e-05, + "loss": 0.6633, + "step": 6595 + }, + { + "epoch": 0.23, + "learning_rate": 1.753697468465401e-05, + "loss": 0.6617, + "step": 6596 + }, + { + "epoch": 0.23, + "learning_rate": 1.7536259014611926e-05, + "loss": 0.6036, + "step": 6597 + }, + { + "epoch": 0.23, + "learning_rate": 1.7535543255217952e-05, + "loss": 0.6557, + "step": 6598 + }, + { + "epoch": 0.23, + "learning_rate": 1.7534827406480582e-05, + "loss": 0.6843, + "step": 6599 + }, + { + "epoch": 0.23, + "learning_rate": 1.75341114684083e-05, + "loss": 0.6294, + "step": 6600 + }, + { + "epoch": 0.23, + "learning_rate": 1.7533395441009598e-05, + "loss": 0.6637, + "step": 6601 + }, + { + "epoch": 0.23, + "learning_rate": 1.7532679324292966e-05, + "loss": 0.6083, + "step": 6602 + }, + { + "epoch": 0.23, + "learning_rate": 1.7531963118266887e-05, + "loss": 0.6062, + "step": 6603 + }, + { + "epoch": 0.23, + "learning_rate": 1.753124682293986e-05, + "loss": 0.6649, + "step": 6604 + }, + { + "epoch": 0.23, + "learning_rate": 1.7530530438320373e-05, + "loss": 0.6269, + "step": 6605 + }, + { + "epoch": 0.23, + "learning_rate": 1.7529813964416923e-05, + "loss": 0.6623, + "step": 6606 + }, + { + "epoch": 0.23, + "learning_rate": 1.7529097401238003e-05, + "loss": 0.6698, + "step": 6607 + }, + { + "epoch": 0.23, + "learning_rate": 1.7528380748792106e-05, + "loss": 0.6123, + "step": 6608 + }, + { + "epoch": 0.23, + "learning_rate": 1.7527664007087738e-05, + "loss": 0.5865, + "step": 6609 + }, + { + "epoch": 0.23, + "learning_rate": 1.7526947176133388e-05, + "loss": 0.6372, + "step": 6610 + }, + { + "epoch": 0.23, + "learning_rate": 1.7526230255937555e-05, + "loss": 0.5839, + "step": 6611 + }, + { + "epoch": 0.23, + "learning_rate": 1.752551324650874e-05, + "loss": 0.5986, + "step": 6612 + }, + { + "epoch": 0.23, + "learning_rate": 1.752479614785545e-05, + "loss": 0.6381, + "step": 6613 + }, + { + "epoch": 0.23, + "learning_rate": 1.752407895998618e-05, + "loss": 0.6409, + "step": 6614 + }, + { + "epoch": 0.23, + "learning_rate": 1.752336168290944e-05, + "loss": 0.6156, + "step": 6615 + }, + { + "epoch": 0.23, + "learning_rate": 1.7522644316633727e-05, + "loss": 0.5945, + "step": 6616 + }, + { + "epoch": 0.23, + "learning_rate": 1.752192686116755e-05, + "loss": 0.5627, + "step": 6617 + }, + { + "epoch": 0.23, + "learning_rate": 1.7521209316519413e-05, + "loss": 0.6541, + "step": 6618 + }, + { + "epoch": 0.23, + "learning_rate": 1.7520491682697827e-05, + "loss": 0.6903, + "step": 6619 + }, + { + "epoch": 0.23, + "learning_rate": 1.7519773959711298e-05, + "loss": 0.6634, + "step": 6620 + }, + { + "epoch": 0.23, + "learning_rate": 1.7519056147568338e-05, + "loss": 0.6273, + "step": 6621 + }, + { + "epoch": 0.23, + "learning_rate": 1.7518338246277454e-05, + "loss": 0.6537, + "step": 6622 + }, + { + "epoch": 0.23, + "learning_rate": 1.751762025584716e-05, + "loss": 0.707, + "step": 6623 + }, + { + "epoch": 0.23, + "learning_rate": 1.7516902176285968e-05, + "loss": 0.5949, + "step": 6624 + }, + { + "epoch": 0.23, + "learning_rate": 1.751618400760239e-05, + "loss": 0.6586, + "step": 6625 + }, + { + "epoch": 0.23, + "learning_rate": 1.7515465749804945e-05, + "loss": 0.64, + "step": 6626 + }, + { + "epoch": 0.23, + "learning_rate": 1.7514747402902147e-05, + "loss": 0.6597, + "step": 6627 + }, + { + "epoch": 0.23, + "learning_rate": 1.751402896690251e-05, + "loss": 0.5763, + "step": 6628 + }, + { + "epoch": 0.23, + "learning_rate": 1.7513310441814555e-05, + "loss": 0.6046, + "step": 6629 + }, + { + "epoch": 0.23, + "learning_rate": 1.75125918276468e-05, + "loss": 0.6151, + "step": 6630 + }, + { + "epoch": 0.23, + "learning_rate": 1.7511873124407768e-05, + "loss": 0.6908, + "step": 6631 + }, + { + "epoch": 0.23, + "learning_rate": 1.7511154332105972e-05, + "loss": 0.6292, + "step": 6632 + }, + { + "epoch": 0.23, + "learning_rate": 1.7510435450749945e-05, + "loss": 0.6235, + "step": 6633 + }, + { + "epoch": 0.23, + "learning_rate": 1.7509716480348203e-05, + "loss": 0.6401, + "step": 6634 + }, + { + "epoch": 0.23, + "learning_rate": 1.7508997420909272e-05, + "loss": 0.5997, + "step": 6635 + }, + { + "epoch": 0.23, + "learning_rate": 1.750827827244168e-05, + "loss": 0.65, + "step": 6636 + }, + { + "epoch": 0.23, + "learning_rate": 1.7507559034953946e-05, + "loss": 0.6, + "step": 6637 + }, + { + "epoch": 0.23, + "learning_rate": 1.7506839708454606e-05, + "loss": 0.6987, + "step": 6638 + }, + { + "epoch": 0.23, + "learning_rate": 1.7506120292952186e-05, + "loss": 0.6972, + "step": 6639 + }, + { + "epoch": 0.23, + "learning_rate": 1.7505400788455215e-05, + "loss": 0.6238, + "step": 6640 + }, + { + "epoch": 0.23, + "learning_rate": 1.750468119497222e-05, + "loss": 0.605, + "step": 6641 + }, + { + "epoch": 0.23, + "learning_rate": 1.750396151251174e-05, + "loss": 0.597, + "step": 6642 + }, + { + "epoch": 0.23, + "learning_rate": 1.7503241741082296e-05, + "loss": 0.5905, + "step": 6643 + }, + { + "epoch": 0.23, + "learning_rate": 1.7502521880692435e-05, + "loss": 0.6056, + "step": 6644 + }, + { + "epoch": 0.23, + "learning_rate": 1.7501801931350688e-05, + "loss": 0.6601, + "step": 6645 + }, + { + "epoch": 0.23, + "learning_rate": 1.750108189306559e-05, + "loss": 0.6572, + "step": 6646 + }, + { + "epoch": 0.23, + "learning_rate": 1.7500361765845672e-05, + "loss": 0.6582, + "step": 6647 + }, + { + "epoch": 0.23, + "learning_rate": 1.749964154969948e-05, + "loss": 0.6464, + "step": 6648 + }, + { + "epoch": 0.23, + "learning_rate": 1.7498921244635553e-05, + "loss": 0.7006, + "step": 6649 + }, + { + "epoch": 0.23, + "learning_rate": 1.7498200850662424e-05, + "loss": 0.7104, + "step": 6650 + }, + { + "epoch": 0.23, + "learning_rate": 1.749748036778864e-05, + "loss": 0.7081, + "step": 6651 + }, + { + "epoch": 0.23, + "learning_rate": 1.7496759796022742e-05, + "loss": 0.6217, + "step": 6652 + }, + { + "epoch": 0.23, + "learning_rate": 1.7496039135373273e-05, + "loss": 0.6178, + "step": 6653 + }, + { + "epoch": 0.23, + "learning_rate": 1.7495318385848777e-05, + "loss": 0.6351, + "step": 6654 + }, + { + "epoch": 0.23, + "learning_rate": 1.7494597547457803e-05, + "loss": 0.6739, + "step": 6655 + }, + { + "epoch": 0.23, + "learning_rate": 1.749387662020889e-05, + "loss": 0.6695, + "step": 6656 + }, + { + "epoch": 0.23, + "learning_rate": 1.7493155604110594e-05, + "loss": 0.5767, + "step": 6657 + }, + { + "epoch": 0.23, + "learning_rate": 1.749243449917146e-05, + "loss": 0.6349, + "step": 6658 + }, + { + "epoch": 0.23, + "learning_rate": 1.7491713305400033e-05, + "loss": 0.5978, + "step": 6659 + }, + { + "epoch": 0.23, + "learning_rate": 1.749099202280487e-05, + "loss": 0.6239, + "step": 6660 + }, + { + "epoch": 0.23, + "learning_rate": 1.7490270651394515e-05, + "loss": 0.6827, + "step": 6661 + }, + { + "epoch": 0.23, + "learning_rate": 1.748954919117753e-05, + "loss": 0.6375, + "step": 6662 + }, + { + "epoch": 0.23, + "learning_rate": 1.748882764216247e-05, + "loss": 0.6619, + "step": 6663 + }, + { + "epoch": 0.23, + "learning_rate": 1.7488106004357882e-05, + "loss": 0.637, + "step": 6664 + }, + { + "epoch": 0.23, + "learning_rate": 1.748738427777232e-05, + "loss": 0.677, + "step": 6665 + }, + { + "epoch": 0.23, + "learning_rate": 1.748666246241435e-05, + "loss": 0.5787, + "step": 6666 + }, + { + "epoch": 0.23, + "learning_rate": 1.748594055829253e-05, + "loss": 0.647, + "step": 6667 + }, + { + "epoch": 0.23, + "learning_rate": 1.7485218565415406e-05, + "loss": 0.6353, + "step": 6668 + }, + { + "epoch": 0.23, + "learning_rate": 1.7484496483791552e-05, + "loss": 0.6571, + "step": 6669 + }, + { + "epoch": 0.23, + "learning_rate": 1.748377431342952e-05, + "loss": 0.6632, + "step": 6670 + }, + { + "epoch": 0.23, + "learning_rate": 1.7483052054337883e-05, + "loss": 0.6068, + "step": 6671 + }, + { + "epoch": 0.23, + "learning_rate": 1.748232970652519e-05, + "loss": 0.6071, + "step": 6672 + }, + { + "epoch": 0.23, + "learning_rate": 1.748160727000002e-05, + "loss": 0.6405, + "step": 6673 + }, + { + "epoch": 0.23, + "learning_rate": 1.748088474477093e-05, + "loss": 0.6543, + "step": 6674 + }, + { + "epoch": 0.23, + "learning_rate": 1.7480162130846487e-05, + "loss": 0.6251, + "step": 6675 + }, + { + "epoch": 0.23, + "learning_rate": 1.747943942823526e-05, + "loss": 0.6537, + "step": 6676 + }, + { + "epoch": 0.23, + "learning_rate": 1.7478716636945815e-05, + "loss": 0.5749, + "step": 6677 + }, + { + "epoch": 0.23, + "learning_rate": 1.747799375698673e-05, + "loss": 0.6233, + "step": 6678 + }, + { + "epoch": 0.23, + "learning_rate": 1.7477270788366562e-05, + "loss": 0.6271, + "step": 6679 + }, + { + "epoch": 0.23, + "learning_rate": 1.7476547731093893e-05, + "loss": 0.6247, + "step": 6680 + }, + { + "epoch": 0.23, + "learning_rate": 1.747582458517729e-05, + "loss": 0.6103, + "step": 6681 + }, + { + "epoch": 0.23, + "learning_rate": 1.7475101350625335e-05, + "loss": 0.7034, + "step": 6682 + }, + { + "epoch": 0.23, + "learning_rate": 1.7474378027446595e-05, + "loss": 0.644, + "step": 6683 + }, + { + "epoch": 0.23, + "learning_rate": 1.7473654615649647e-05, + "loss": 0.642, + "step": 6684 + }, + { + "epoch": 0.23, + "learning_rate": 1.747293111524307e-05, + "loss": 0.5946, + "step": 6685 + }, + { + "epoch": 0.23, + "learning_rate": 1.7472207526235442e-05, + "loss": 0.6624, + "step": 6686 + }, + { + "epoch": 0.23, + "learning_rate": 1.747148384863534e-05, + "loss": 0.6322, + "step": 6687 + }, + { + "epoch": 0.23, + "learning_rate": 1.747076008245135e-05, + "loss": 0.7134, + "step": 6688 + }, + { + "epoch": 0.23, + "learning_rate": 1.7470036227692044e-05, + "loss": 0.6537, + "step": 6689 + }, + { + "epoch": 0.23, + "learning_rate": 1.7469312284366008e-05, + "loss": 0.6668, + "step": 6690 + }, + { + "epoch": 0.23, + "learning_rate": 1.7468588252481827e-05, + "loss": 0.5963, + "step": 6691 + }, + { + "epoch": 0.23, + "learning_rate": 1.7467864132048087e-05, + "loss": 0.6229, + "step": 6692 + }, + { + "epoch": 0.23, + "learning_rate": 1.746713992307337e-05, + "loss": 0.6782, + "step": 6693 + }, + { + "epoch": 0.23, + "learning_rate": 1.7466415625566263e-05, + "loss": 0.6403, + "step": 6694 + }, + { + "epoch": 0.23, + "learning_rate": 1.746569123953535e-05, + "loss": 0.6173, + "step": 6695 + }, + { + "epoch": 0.23, + "learning_rate": 1.7464966764989228e-05, + "loss": 0.6264, + "step": 6696 + }, + { + "epoch": 0.23, + "learning_rate": 1.7464242201936483e-05, + "loss": 0.6028, + "step": 6697 + }, + { + "epoch": 0.23, + "learning_rate": 1.7463517550385698e-05, + "loss": 0.6936, + "step": 6698 + }, + { + "epoch": 0.23, + "learning_rate": 1.7462792810345477e-05, + "loss": 0.6039, + "step": 6699 + }, + { + "epoch": 0.23, + "learning_rate": 1.7462067981824403e-05, + "loss": 0.6242, + "step": 6700 + }, + { + "epoch": 0.23, + "learning_rate": 1.7461343064831074e-05, + "loss": 0.6196, + "step": 6701 + }, + { + "epoch": 0.23, + "learning_rate": 1.7460618059374085e-05, + "loss": 0.6713, + "step": 6702 + }, + { + "epoch": 0.23, + "learning_rate": 1.7459892965462035e-05, + "loss": 0.6245, + "step": 6703 + }, + { + "epoch": 0.23, + "learning_rate": 1.7459167783103512e-05, + "loss": 0.6267, + "step": 6704 + }, + { + "epoch": 0.23, + "learning_rate": 1.745844251230712e-05, + "loss": 0.6442, + "step": 6705 + }, + { + "epoch": 0.23, + "learning_rate": 1.7457717153081456e-05, + "loss": 0.6309, + "step": 6706 + }, + { + "epoch": 0.23, + "learning_rate": 1.7456991705435125e-05, + "loss": 0.6471, + "step": 6707 + }, + { + "epoch": 0.23, + "learning_rate": 1.7456266169376718e-05, + "loss": 0.6059, + "step": 6708 + }, + { + "epoch": 0.23, + "learning_rate": 1.745554054491485e-05, + "loss": 0.6136, + "step": 6709 + }, + { + "epoch": 0.23, + "learning_rate": 1.7454814832058112e-05, + "loss": 0.6857, + "step": 6710 + }, + { + "epoch": 0.23, + "learning_rate": 1.745408903081512e-05, + "loss": 0.6067, + "step": 6711 + }, + { + "epoch": 0.23, + "learning_rate": 1.745336314119447e-05, + "loss": 0.6463, + "step": 6712 + }, + { + "epoch": 0.23, + "learning_rate": 1.7452637163204767e-05, + "loss": 0.6169, + "step": 6713 + }, + { + "epoch": 0.23, + "learning_rate": 1.745191109685463e-05, + "loss": 0.638, + "step": 6714 + }, + { + "epoch": 0.23, + "learning_rate": 1.7451184942152656e-05, + "loss": 0.646, + "step": 6715 + }, + { + "epoch": 0.23, + "learning_rate": 1.745045869910746e-05, + "loss": 0.6044, + "step": 6716 + }, + { + "epoch": 0.23, + "learning_rate": 1.744973236772765e-05, + "loss": 0.6452, + "step": 6717 + }, + { + "epoch": 0.23, + "learning_rate": 1.744900594802184e-05, + "loss": 0.6111, + "step": 6718 + }, + { + "epoch": 0.23, + "learning_rate": 1.744827943999864e-05, + "loss": 0.6416, + "step": 6719 + }, + { + "epoch": 0.23, + "learning_rate": 1.744755284366667e-05, + "loss": 0.6212, + "step": 6720 + }, + { + "epoch": 0.23, + "learning_rate": 1.7446826159034537e-05, + "loss": 0.6357, + "step": 6721 + }, + { + "epoch": 0.23, + "learning_rate": 1.7446099386110854e-05, + "loss": 0.5872, + "step": 6722 + }, + { + "epoch": 0.23, + "learning_rate": 1.7445372524904248e-05, + "loss": 0.6537, + "step": 6723 + }, + { + "epoch": 0.23, + "learning_rate": 1.7444645575423334e-05, + "loss": 0.6271, + "step": 6724 + }, + { + "epoch": 0.23, + "learning_rate": 1.7443918537676728e-05, + "loss": 0.65, + "step": 6725 + }, + { + "epoch": 0.23, + "learning_rate": 1.744319141167305e-05, + "loss": 0.6103, + "step": 6726 + }, + { + "epoch": 0.23, + "learning_rate": 1.7442464197420926e-05, + "loss": 0.6022, + "step": 6727 + }, + { + "epoch": 0.23, + "learning_rate": 1.744173689492897e-05, + "loss": 0.6396, + "step": 6728 + }, + { + "epoch": 0.23, + "learning_rate": 1.744100950420581e-05, + "loss": 0.6491, + "step": 6729 + }, + { + "epoch": 0.23, + "learning_rate": 1.7440282025260068e-05, + "loss": 0.633, + "step": 6730 + }, + { + "epoch": 0.23, + "learning_rate": 1.7439554458100374e-05, + "loss": 0.6026, + "step": 6731 + }, + { + "epoch": 0.23, + "learning_rate": 1.7438826802735348e-05, + "loss": 0.607, + "step": 6732 + }, + { + "epoch": 0.23, + "learning_rate": 1.7438099059173622e-05, + "loss": 0.6487, + "step": 6733 + }, + { + "epoch": 0.23, + "learning_rate": 1.7437371227423824e-05, + "loss": 0.6469, + "step": 6734 + }, + { + "epoch": 0.23, + "learning_rate": 1.7436643307494575e-05, + "loss": 0.658, + "step": 6735 + }, + { + "epoch": 0.23, + "learning_rate": 1.743591529939452e-05, + "loss": 0.6315, + "step": 6736 + }, + { + "epoch": 0.23, + "learning_rate": 1.7435187203132277e-05, + "loss": 0.6734, + "step": 6737 + }, + { + "epoch": 0.23, + "learning_rate": 1.743445901871649e-05, + "loss": 0.6226, + "step": 6738 + }, + { + "epoch": 0.23, + "learning_rate": 1.743373074615578e-05, + "loss": 0.6198, + "step": 6739 + }, + { + "epoch": 0.23, + "learning_rate": 1.743300238545879e-05, + "loss": 0.6421, + "step": 6740 + }, + { + "epoch": 0.23, + "learning_rate": 1.7432273936634158e-05, + "loss": 0.7019, + "step": 6741 + }, + { + "epoch": 0.23, + "learning_rate": 1.743154539969051e-05, + "loss": 0.6001, + "step": 6742 + }, + { + "epoch": 0.23, + "learning_rate": 1.74308167746365e-05, + "loss": 0.6469, + "step": 6743 + }, + { + "epoch": 0.23, + "learning_rate": 1.7430088061480746e-05, + "loss": 0.6506, + "step": 6744 + }, + { + "epoch": 0.23, + "learning_rate": 1.7429359260231907e-05, + "loss": 0.6372, + "step": 6745 + }, + { + "epoch": 0.23, + "learning_rate": 1.7428630370898614e-05, + "loss": 0.6678, + "step": 6746 + }, + { + "epoch": 0.23, + "learning_rate": 1.7427901393489507e-05, + "loss": 0.5693, + "step": 6747 + }, + { + "epoch": 0.23, + "learning_rate": 1.7427172328013236e-05, + "loss": 0.6868, + "step": 6748 + }, + { + "epoch": 0.23, + "learning_rate": 1.7426443174478444e-05, + "loss": 0.6466, + "step": 6749 + }, + { + "epoch": 0.23, + "learning_rate": 1.7425713932893767e-05, + "loss": 0.6224, + "step": 6750 + }, + { + "epoch": 0.23, + "learning_rate": 1.7424984603267866e-05, + "loss": 0.7055, + "step": 6751 + }, + { + "epoch": 0.23, + "learning_rate": 1.7424255185609373e-05, + "loss": 0.616, + "step": 6752 + }, + { + "epoch": 0.23, + "learning_rate": 1.7423525679926945e-05, + "loss": 0.6298, + "step": 6753 + }, + { + "epoch": 0.23, + "learning_rate": 1.742279608622923e-05, + "loss": 0.6185, + "step": 6754 + }, + { + "epoch": 0.23, + "learning_rate": 1.7422066404524874e-05, + "loss": 0.5859, + "step": 6755 + }, + { + "epoch": 0.23, + "learning_rate": 1.7421336634822538e-05, + "loss": 0.5945, + "step": 6756 + }, + { + "epoch": 0.23, + "learning_rate": 1.7420606777130866e-05, + "loss": 0.6867, + "step": 6757 + }, + { + "epoch": 0.23, + "learning_rate": 1.7419876831458512e-05, + "loss": 0.6982, + "step": 6758 + }, + { + "epoch": 0.23, + "learning_rate": 1.741914679781413e-05, + "loss": 0.6303, + "step": 6759 + }, + { + "epoch": 0.23, + "learning_rate": 1.741841667620638e-05, + "loss": 0.637, + "step": 6760 + }, + { + "epoch": 0.23, + "learning_rate": 1.7417686466643918e-05, + "loss": 0.6113, + "step": 6761 + }, + { + "epoch": 0.23, + "learning_rate": 1.7416956169135396e-05, + "loss": 0.6315, + "step": 6762 + }, + { + "epoch": 0.23, + "learning_rate": 1.7416225783689478e-05, + "loss": 0.619, + "step": 6763 + }, + { + "epoch": 0.23, + "learning_rate": 1.741549531031482e-05, + "loss": 0.633, + "step": 6764 + }, + { + "epoch": 0.23, + "learning_rate": 1.7414764749020088e-05, + "loss": 0.6452, + "step": 6765 + }, + { + "epoch": 0.23, + "learning_rate": 1.7414034099813938e-05, + "loss": 0.6571, + "step": 6766 + }, + { + "epoch": 0.23, + "learning_rate": 1.7413303362705034e-05, + "loss": 0.6084, + "step": 6767 + }, + { + "epoch": 0.23, + "learning_rate": 1.741257253770204e-05, + "loss": 0.6733, + "step": 6768 + }, + { + "epoch": 0.23, + "learning_rate": 1.7411841624813627e-05, + "loss": 0.6564, + "step": 6769 + }, + { + "epoch": 0.23, + "learning_rate": 1.741111062404845e-05, + "loss": 0.6414, + "step": 6770 + }, + { + "epoch": 0.23, + "learning_rate": 1.7410379535415182e-05, + "loss": 0.5946, + "step": 6771 + }, + { + "epoch": 0.23, + "learning_rate": 1.740964835892249e-05, + "loss": 0.6238, + "step": 6772 + }, + { + "epoch": 0.23, + "learning_rate": 1.7408917094579047e-05, + "loss": 0.6207, + "step": 6773 + }, + { + "epoch": 0.23, + "learning_rate": 1.740818574239352e-05, + "loss": 0.6265, + "step": 6774 + }, + { + "epoch": 0.23, + "learning_rate": 1.7407454302374577e-05, + "loss": 0.6165, + "step": 6775 + }, + { + "epoch": 0.23, + "learning_rate": 1.7406722774530892e-05, + "loss": 0.6588, + "step": 6776 + }, + { + "epoch": 0.23, + "learning_rate": 1.740599115887114e-05, + "loss": 0.6033, + "step": 6777 + }, + { + "epoch": 0.23, + "learning_rate": 1.7405259455403993e-05, + "loss": 0.5982, + "step": 6778 + }, + { + "epoch": 0.23, + "learning_rate": 1.740452766413813e-05, + "loss": 0.6315, + "step": 6779 + }, + { + "epoch": 0.23, + "learning_rate": 1.7403795785082222e-05, + "loss": 0.625, + "step": 6780 + }, + { + "epoch": 0.23, + "learning_rate": 1.7403063818244952e-05, + "loss": 0.5925, + "step": 6781 + }, + { + "epoch": 0.23, + "learning_rate": 1.7402331763634994e-05, + "loss": 0.6105, + "step": 6782 + }, + { + "epoch": 0.24, + "learning_rate": 1.7401599621261028e-05, + "loss": 0.5946, + "step": 6783 + }, + { + "epoch": 0.24, + "learning_rate": 1.740086739113174e-05, + "loss": 0.6859, + "step": 6784 + }, + { + "epoch": 0.24, + "learning_rate": 1.7400135073255802e-05, + "loss": 0.6187, + "step": 6785 + }, + { + "epoch": 0.24, + "learning_rate": 1.7399402667641903e-05, + "loss": 0.6162, + "step": 6786 + }, + { + "epoch": 0.24, + "learning_rate": 1.739867017429872e-05, + "loss": 0.6249, + "step": 6787 + }, + { + "epoch": 0.24, + "learning_rate": 1.739793759323495e-05, + "loss": 0.609, + "step": 6788 + }, + { + "epoch": 0.24, + "learning_rate": 1.739720492445927e-05, + "loss": 0.623, + "step": 6789 + }, + { + "epoch": 0.24, + "learning_rate": 1.7396472167980368e-05, + "loss": 0.6454, + "step": 6790 + }, + { + "epoch": 0.24, + "learning_rate": 1.739573932380693e-05, + "loss": 0.6191, + "step": 6791 + }, + { + "epoch": 0.24, + "learning_rate": 1.739500639194765e-05, + "loss": 0.6999, + "step": 6792 + }, + { + "epoch": 0.24, + "learning_rate": 1.739427337241121e-05, + "loss": 0.6477, + "step": 6793 + }, + { + "epoch": 0.24, + "learning_rate": 1.739354026520631e-05, + "loss": 0.6512, + "step": 6794 + }, + { + "epoch": 0.24, + "learning_rate": 1.7392807070341634e-05, + "loss": 0.6271, + "step": 6795 + }, + { + "epoch": 0.24, + "learning_rate": 1.7392073787825875e-05, + "loss": 0.6856, + "step": 6796 + }, + { + "epoch": 0.24, + "learning_rate": 1.739134041766774e-05, + "loss": 0.6433, + "step": 6797 + }, + { + "epoch": 0.24, + "learning_rate": 1.7390606959875905e-05, + "loss": 0.6207, + "step": 6798 + }, + { + "epoch": 0.24, + "learning_rate": 1.738987341445908e-05, + "loss": 0.6029, + "step": 6799 + }, + { + "epoch": 0.24, + "learning_rate": 1.7389139781425955e-05, + "loss": 0.6481, + "step": 6800 + }, + { + "epoch": 0.24, + "learning_rate": 1.7388406060785233e-05, + "loss": 0.6695, + "step": 6801 + }, + { + "epoch": 0.24, + "learning_rate": 1.7387672252545607e-05, + "loss": 0.6001, + "step": 6802 + }, + { + "epoch": 0.24, + "learning_rate": 1.7386938356715784e-05, + "loss": 0.5765, + "step": 6803 + }, + { + "epoch": 0.24, + "learning_rate": 1.7386204373304463e-05, + "loss": 0.6723, + "step": 6804 + }, + { + "epoch": 0.24, + "learning_rate": 1.7385470302320343e-05, + "loss": 0.5645, + "step": 6805 + }, + { + "epoch": 0.24, + "learning_rate": 1.738473614377213e-05, + "loss": 0.6174, + "step": 6806 + }, + { + "epoch": 0.24, + "learning_rate": 1.738400189766853e-05, + "loss": 0.6581, + "step": 6807 + }, + { + "epoch": 0.24, + "learning_rate": 1.7383267564018247e-05, + "loss": 0.5981, + "step": 6808 + }, + { + "epoch": 0.24, + "learning_rate": 1.7382533142829987e-05, + "loss": 0.5718, + "step": 6809 + }, + { + "epoch": 0.24, + "learning_rate": 1.7381798634112457e-05, + "loss": 0.6519, + "step": 6810 + }, + { + "epoch": 0.24, + "learning_rate": 1.7381064037874367e-05, + "loss": 0.644, + "step": 6811 + }, + { + "epoch": 0.24, + "learning_rate": 1.7380329354124424e-05, + "loss": 0.6225, + "step": 6812 + }, + { + "epoch": 0.24, + "learning_rate": 1.7379594582871342e-05, + "loss": 0.6521, + "step": 6813 + }, + { + "epoch": 0.24, + "learning_rate": 1.737885972412383e-05, + "loss": 0.6754, + "step": 6814 + }, + { + "epoch": 0.24, + "learning_rate": 1.73781247778906e-05, + "loss": 0.6349, + "step": 6815 + }, + { + "epoch": 0.24, + "learning_rate": 1.737738974418037e-05, + "loss": 0.5538, + "step": 6816 + }, + { + "epoch": 0.24, + "learning_rate": 1.737665462300185e-05, + "loss": 0.6383, + "step": 6817 + }, + { + "epoch": 0.24, + "learning_rate": 1.7375919414363764e-05, + "loss": 0.7244, + "step": 6818 + }, + { + "epoch": 0.24, + "learning_rate": 1.7375184118274818e-05, + "loss": 0.6671, + "step": 6819 + }, + { + "epoch": 0.24, + "learning_rate": 1.7374448734743733e-05, + "loss": 0.5907, + "step": 6820 + }, + { + "epoch": 0.24, + "learning_rate": 1.737371326377923e-05, + "loss": 0.6405, + "step": 6821 + }, + { + "epoch": 0.24, + "learning_rate": 1.737297770539003e-05, + "loss": 0.6657, + "step": 6822 + }, + { + "epoch": 0.24, + "learning_rate": 1.7372242059584856e-05, + "loss": 0.6453, + "step": 6823 + }, + { + "epoch": 0.24, + "learning_rate": 1.737150632637242e-05, + "loss": 0.6544, + "step": 6824 + }, + { + "epoch": 0.24, + "learning_rate": 1.7370770505761453e-05, + "loss": 0.5818, + "step": 6825 + }, + { + "epoch": 0.24, + "learning_rate": 1.737003459776068e-05, + "loss": 0.5649, + "step": 6826 + }, + { + "epoch": 0.24, + "learning_rate": 1.7369298602378825e-05, + "loss": 0.6453, + "step": 6827 + }, + { + "epoch": 0.24, + "learning_rate": 1.7368562519624607e-05, + "loss": 0.6156, + "step": 6828 + }, + { + "epoch": 0.24, + "learning_rate": 1.736782634950676e-05, + "loss": 0.6042, + "step": 6829 + }, + { + "epoch": 0.24, + "learning_rate": 1.7367090092034017e-05, + "loss": 0.5912, + "step": 6830 + }, + { + "epoch": 0.24, + "learning_rate": 1.7366353747215097e-05, + "loss": 0.6403, + "step": 6831 + }, + { + "epoch": 0.24, + "learning_rate": 1.7365617315058735e-05, + "loss": 0.6638, + "step": 6832 + }, + { + "epoch": 0.24, + "learning_rate": 1.7364880795573665e-05, + "loss": 0.6613, + "step": 6833 + }, + { + "epoch": 0.24, + "learning_rate": 1.7364144188768613e-05, + "loss": 0.6351, + "step": 6834 + }, + { + "epoch": 0.24, + "learning_rate": 1.736340749465232e-05, + "loss": 0.6348, + "step": 6835 + }, + { + "epoch": 0.24, + "learning_rate": 1.7362670713233512e-05, + "loss": 0.5969, + "step": 6836 + }, + { + "epoch": 0.24, + "learning_rate": 1.736193384452093e-05, + "loss": 0.6439, + "step": 6837 + }, + { + "epoch": 0.24, + "learning_rate": 1.7361196888523313e-05, + "loss": 0.6714, + "step": 6838 + }, + { + "epoch": 0.24, + "learning_rate": 1.7360459845249393e-05, + "loss": 0.627, + "step": 6839 + }, + { + "epoch": 0.24, + "learning_rate": 1.7359722714707908e-05, + "loss": 0.6611, + "step": 6840 + }, + { + "epoch": 0.24, + "learning_rate": 1.7358985496907603e-05, + "loss": 0.6019, + "step": 6841 + }, + { + "epoch": 0.24, + "learning_rate": 1.7358248191857212e-05, + "loss": 0.6155, + "step": 6842 + }, + { + "epoch": 0.24, + "learning_rate": 1.7357510799565484e-05, + "loss": 0.6334, + "step": 6843 + }, + { + "epoch": 0.24, + "learning_rate": 1.735677332004116e-05, + "loss": 0.6433, + "step": 6844 + }, + { + "epoch": 0.24, + "learning_rate": 1.7356035753292973e-05, + "loss": 0.6148, + "step": 6845 + }, + { + "epoch": 0.24, + "learning_rate": 1.7355298099329684e-05, + "loss": 0.5963, + "step": 6846 + }, + { + "epoch": 0.24, + "learning_rate": 1.7354560358160034e-05, + "loss": 0.6312, + "step": 6847 + }, + { + "epoch": 0.24, + "learning_rate": 1.7353822529792762e-05, + "loss": 0.7055, + "step": 6848 + }, + { + "epoch": 0.24, + "learning_rate": 1.7353084614236622e-05, + "loss": 0.6214, + "step": 6849 + }, + { + "epoch": 0.24, + "learning_rate": 1.7352346611500365e-05, + "loss": 0.6055, + "step": 6850 + }, + { + "epoch": 0.24, + "learning_rate": 1.7351608521592735e-05, + "loss": 0.6584, + "step": 6851 + }, + { + "epoch": 0.24, + "learning_rate": 1.7350870344522487e-05, + "loss": 0.6257, + "step": 6852 + }, + { + "epoch": 0.24, + "learning_rate": 1.7350132080298374e-05, + "loss": 0.6403, + "step": 6853 + }, + { + "epoch": 0.24, + "learning_rate": 1.7349393728929146e-05, + "loss": 0.6088, + "step": 6854 + }, + { + "epoch": 0.24, + "learning_rate": 1.7348655290423558e-05, + "loss": 0.6572, + "step": 6855 + }, + { + "epoch": 0.24, + "learning_rate": 1.7347916764790365e-05, + "loss": 0.5875, + "step": 6856 + }, + { + "epoch": 0.24, + "learning_rate": 1.7347178152038323e-05, + "loss": 0.615, + "step": 6857 + }, + { + "epoch": 0.24, + "learning_rate": 1.7346439452176193e-05, + "loss": 0.6306, + "step": 6858 + }, + { + "epoch": 0.24, + "learning_rate": 1.7345700665212726e-05, + "loss": 0.6788, + "step": 6859 + }, + { + "epoch": 0.24, + "learning_rate": 1.734496179115669e-05, + "loss": 0.6644, + "step": 6860 + }, + { + "epoch": 0.24, + "learning_rate": 1.734422283001684e-05, + "loss": 0.6157, + "step": 6861 + }, + { + "epoch": 0.24, + "learning_rate": 1.734348378180193e-05, + "loss": 0.568, + "step": 6862 + }, + { + "epoch": 0.24, + "learning_rate": 1.734274464652074e-05, + "loss": 0.6315, + "step": 6863 + }, + { + "epoch": 0.24, + "learning_rate": 1.734200542418202e-05, + "loss": 0.6535, + "step": 6864 + }, + { + "epoch": 0.24, + "learning_rate": 1.7341266114794536e-05, + "loss": 0.5823, + "step": 6865 + }, + { + "epoch": 0.24, + "learning_rate": 1.7340526718367056e-05, + "loss": 0.6544, + "step": 6866 + }, + { + "epoch": 0.24, + "learning_rate": 1.733978723490835e-05, + "loss": 0.6396, + "step": 6867 + }, + { + "epoch": 0.24, + "learning_rate": 1.7339047664427175e-05, + "loss": 0.6074, + "step": 6868 + }, + { + "epoch": 0.24, + "learning_rate": 1.7338308006932312e-05, + "loss": 0.6772, + "step": 6869 + }, + { + "epoch": 0.24, + "learning_rate": 1.733756826243252e-05, + "loss": 0.5861, + "step": 6870 + }, + { + "epoch": 0.24, + "learning_rate": 1.7336828430936577e-05, + "loss": 0.6661, + "step": 6871 + }, + { + "epoch": 0.24, + "learning_rate": 1.733608851245325e-05, + "loss": 0.5953, + "step": 6872 + }, + { + "epoch": 0.24, + "learning_rate": 1.7335348506991314e-05, + "loss": 0.6436, + "step": 6873 + }, + { + "epoch": 0.24, + "learning_rate": 1.7334608414559544e-05, + "loss": 0.6079, + "step": 6874 + }, + { + "epoch": 0.24, + "learning_rate": 1.7333868235166713e-05, + "loss": 0.6513, + "step": 6875 + }, + { + "epoch": 0.24, + "learning_rate": 1.7333127968821593e-05, + "loss": 0.6282, + "step": 6876 + }, + { + "epoch": 0.24, + "learning_rate": 1.7332387615532966e-05, + "loss": 0.6171, + "step": 6877 + }, + { + "epoch": 0.24, + "learning_rate": 1.733164717530961e-05, + "loss": 0.6322, + "step": 6878 + }, + { + "epoch": 0.24, + "learning_rate": 1.73309066481603e-05, + "loss": 0.7119, + "step": 6879 + }, + { + "epoch": 0.24, + "learning_rate": 1.7330166034093817e-05, + "loss": 0.6067, + "step": 6880 + }, + { + "epoch": 0.24, + "learning_rate": 1.7329425333118948e-05, + "loss": 0.6384, + "step": 6881 + }, + { + "epoch": 0.24, + "learning_rate": 1.7328684545244468e-05, + "loss": 0.6739, + "step": 6882 + }, + { + "epoch": 0.24, + "learning_rate": 1.732794367047916e-05, + "loss": 0.6481, + "step": 6883 + }, + { + "epoch": 0.24, + "learning_rate": 1.7327202708831812e-05, + "loss": 0.6381, + "step": 6884 + }, + { + "epoch": 0.24, + "learning_rate": 1.7326461660311206e-05, + "loss": 0.6723, + "step": 6885 + }, + { + "epoch": 0.24, + "learning_rate": 1.732572052492613e-05, + "loss": 0.651, + "step": 6886 + }, + { + "epoch": 0.24, + "learning_rate": 1.7324979302685364e-05, + "loss": 0.6283, + "step": 6887 + }, + { + "epoch": 0.24, + "learning_rate": 1.7324237993597708e-05, + "loss": 0.65, + "step": 6888 + }, + { + "epoch": 0.24, + "learning_rate": 1.7323496597671943e-05, + "loss": 0.6462, + "step": 6889 + }, + { + "epoch": 0.24, + "learning_rate": 1.7322755114916865e-05, + "loss": 0.6717, + "step": 6890 + }, + { + "epoch": 0.24, + "learning_rate": 1.7322013545341262e-05, + "loss": 0.7049, + "step": 6891 + }, + { + "epoch": 0.24, + "learning_rate": 1.7321271888953923e-05, + "loss": 0.6053, + "step": 6892 + }, + { + "epoch": 0.24, + "learning_rate": 1.7320530145763643e-05, + "loss": 0.579, + "step": 6893 + }, + { + "epoch": 0.24, + "learning_rate": 1.731978831577922e-05, + "loss": 0.6561, + "step": 6894 + }, + { + "epoch": 0.24, + "learning_rate": 1.7319046399009446e-05, + "loss": 0.6072, + "step": 6895 + }, + { + "epoch": 0.24, + "learning_rate": 1.731830439546312e-05, + "loss": 0.6094, + "step": 6896 + }, + { + "epoch": 0.24, + "learning_rate": 1.7317562305149035e-05, + "loss": 0.5793, + "step": 6897 + }, + { + "epoch": 0.24, + "learning_rate": 1.7316820128075998e-05, + "loss": 0.5948, + "step": 6898 + }, + { + "epoch": 0.24, + "learning_rate": 1.7316077864252797e-05, + "loss": 0.6639, + "step": 6899 + }, + { + "epoch": 0.24, + "learning_rate": 1.731533551368824e-05, + "loss": 0.6487, + "step": 6900 + }, + { + "epoch": 0.24, + "learning_rate": 1.7314593076391123e-05, + "loss": 0.6349, + "step": 6901 + }, + { + "epoch": 0.24, + "learning_rate": 1.7313850552370256e-05, + "loss": 0.6179, + "step": 6902 + }, + { + "epoch": 0.24, + "learning_rate": 1.7313107941634436e-05, + "loss": 0.6028, + "step": 6903 + }, + { + "epoch": 0.24, + "learning_rate": 1.731236524419247e-05, + "loss": 0.6647, + "step": 6904 + }, + { + "epoch": 0.24, + "learning_rate": 1.731162246005317e-05, + "loss": 0.6205, + "step": 6905 + }, + { + "epoch": 0.24, + "learning_rate": 1.731087958922533e-05, + "loss": 0.6908, + "step": 6906 + }, + { + "epoch": 0.24, + "learning_rate": 1.7310136631717766e-05, + "loss": 0.6657, + "step": 6907 + }, + { + "epoch": 0.24, + "learning_rate": 1.7309393587539286e-05, + "loss": 0.6275, + "step": 6908 + }, + { + "epoch": 0.24, + "learning_rate": 1.73086504566987e-05, + "loss": 0.662, + "step": 6909 + }, + { + "epoch": 0.24, + "learning_rate": 1.7307907239204815e-05, + "loss": 0.6319, + "step": 6910 + }, + { + "epoch": 0.24, + "learning_rate": 1.7307163935066445e-05, + "loss": 0.6216, + "step": 6911 + }, + { + "epoch": 0.24, + "learning_rate": 1.73064205442924e-05, + "loss": 0.6182, + "step": 6912 + }, + { + "epoch": 0.24, + "learning_rate": 1.7305677066891503e-05, + "loss": 0.6192, + "step": 6913 + }, + { + "epoch": 0.24, + "learning_rate": 1.730493350287256e-05, + "loss": 0.6308, + "step": 6914 + }, + { + "epoch": 0.24, + "learning_rate": 1.7304189852244388e-05, + "loss": 0.635, + "step": 6915 + }, + { + "epoch": 0.24, + "learning_rate": 1.7303446115015806e-05, + "loss": 0.6627, + "step": 6916 + }, + { + "epoch": 0.24, + "learning_rate": 1.730270229119563e-05, + "loss": 0.6944, + "step": 6917 + }, + { + "epoch": 0.24, + "learning_rate": 1.7301958380792684e-05, + "loss": 0.6359, + "step": 6918 + }, + { + "epoch": 0.24, + "learning_rate": 1.7301214383815783e-05, + "loss": 0.6364, + "step": 6919 + }, + { + "epoch": 0.24, + "learning_rate": 1.730047030027375e-05, + "loss": 0.6147, + "step": 6920 + }, + { + "epoch": 0.24, + "learning_rate": 1.7299726130175406e-05, + "loss": 0.6108, + "step": 6921 + }, + { + "epoch": 0.24, + "learning_rate": 1.729898187352957e-05, + "loss": 0.6873, + "step": 6922 + }, + { + "epoch": 0.24, + "learning_rate": 1.7298237530345076e-05, + "loss": 0.6483, + "step": 6923 + }, + { + "epoch": 0.24, + "learning_rate": 1.7297493100630746e-05, + "loss": 0.6569, + "step": 6924 + }, + { + "epoch": 0.24, + "learning_rate": 1.7296748584395397e-05, + "loss": 0.6068, + "step": 6925 + }, + { + "epoch": 0.24, + "learning_rate": 1.7296003981647865e-05, + "loss": 0.6434, + "step": 6926 + }, + { + "epoch": 0.24, + "learning_rate": 1.729525929239698e-05, + "loss": 0.6264, + "step": 6927 + }, + { + "epoch": 0.24, + "learning_rate": 1.7294514516651565e-05, + "loss": 0.6193, + "step": 6928 + }, + { + "epoch": 0.24, + "learning_rate": 1.7293769654420452e-05, + "loss": 0.6554, + "step": 6929 + }, + { + "epoch": 0.24, + "learning_rate": 1.7293024705712477e-05, + "loss": 0.6278, + "step": 6930 + }, + { + "epoch": 0.24, + "learning_rate": 1.729227967053646e-05, + "loss": 0.5601, + "step": 6931 + }, + { + "epoch": 0.24, + "learning_rate": 1.729153454890125e-05, + "loss": 0.6853, + "step": 6932 + }, + { + "epoch": 0.24, + "learning_rate": 1.7290789340815674e-05, + "loss": 0.651, + "step": 6933 + }, + { + "epoch": 0.24, + "learning_rate": 1.7290044046288564e-05, + "loss": 0.6347, + "step": 6934 + }, + { + "epoch": 0.24, + "learning_rate": 1.7289298665328763e-05, + "loss": 0.6564, + "step": 6935 + }, + { + "epoch": 0.24, + "learning_rate": 1.7288553197945105e-05, + "loss": 0.6649, + "step": 6936 + }, + { + "epoch": 0.24, + "learning_rate": 1.728780764414643e-05, + "loss": 0.6278, + "step": 6937 + }, + { + "epoch": 0.24, + "learning_rate": 1.728706200394157e-05, + "loss": 0.5986, + "step": 6938 + }, + { + "epoch": 0.24, + "learning_rate": 1.7286316277339378e-05, + "loss": 0.6638, + "step": 6939 + }, + { + "epoch": 0.24, + "learning_rate": 1.7285570464348687e-05, + "loss": 0.6764, + "step": 6940 + }, + { + "epoch": 0.24, + "learning_rate": 1.728482456497834e-05, + "loss": 0.5743, + "step": 6941 + }, + { + "epoch": 0.24, + "learning_rate": 1.728407857923719e-05, + "loss": 0.5939, + "step": 6942 + }, + { + "epoch": 0.24, + "learning_rate": 1.7283332507134064e-05, + "loss": 0.6059, + "step": 6943 + }, + { + "epoch": 0.24, + "learning_rate": 1.7282586348677824e-05, + "loss": 0.6017, + "step": 6944 + }, + { + "epoch": 0.24, + "learning_rate": 1.7281840103877306e-05, + "loss": 0.6258, + "step": 6945 + }, + { + "epoch": 0.24, + "learning_rate": 1.7281093772741365e-05, + "loss": 0.593, + "step": 6946 + }, + { + "epoch": 0.24, + "learning_rate": 1.7280347355278845e-05, + "loss": 0.6945, + "step": 6947 + }, + { + "epoch": 0.24, + "learning_rate": 1.72796008514986e-05, + "loss": 0.6077, + "step": 6948 + }, + { + "epoch": 0.24, + "learning_rate": 1.7278854261409478e-05, + "loss": 0.615, + "step": 6949 + }, + { + "epoch": 0.24, + "learning_rate": 1.7278107585020326e-05, + "loss": 0.6148, + "step": 6950 + }, + { + "epoch": 0.24, + "learning_rate": 1.7277360822340008e-05, + "loss": 0.6681, + "step": 6951 + }, + { + "epoch": 0.24, + "learning_rate": 1.7276613973377366e-05, + "loss": 0.6641, + "step": 6952 + }, + { + "epoch": 0.24, + "learning_rate": 1.7275867038141265e-05, + "loss": 0.631, + "step": 6953 + }, + { + "epoch": 0.24, + "learning_rate": 1.7275120016640553e-05, + "loss": 0.6825, + "step": 6954 + }, + { + "epoch": 0.24, + "learning_rate": 1.727437290888409e-05, + "loss": 0.6334, + "step": 6955 + }, + { + "epoch": 0.24, + "learning_rate": 1.727362571488074e-05, + "loss": 0.6486, + "step": 6956 + }, + { + "epoch": 0.24, + "learning_rate": 1.727287843463935e-05, + "loss": 0.5864, + "step": 6957 + }, + { + "epoch": 0.24, + "learning_rate": 1.7272131068168786e-05, + "loss": 0.639, + "step": 6958 + }, + { + "epoch": 0.24, + "learning_rate": 1.7271383615477913e-05, + "loss": 0.6301, + "step": 6959 + }, + { + "epoch": 0.24, + "learning_rate": 1.7270636076575585e-05, + "loss": 0.5978, + "step": 6960 + }, + { + "epoch": 0.24, + "learning_rate": 1.726988845147067e-05, + "loss": 0.6067, + "step": 6961 + }, + { + "epoch": 0.24, + "learning_rate": 1.726914074017203e-05, + "loss": 0.6769, + "step": 6962 + }, + { + "epoch": 0.24, + "learning_rate": 1.7268392942688534e-05, + "loss": 0.6115, + "step": 6963 + }, + { + "epoch": 0.24, + "learning_rate": 1.7267645059029042e-05, + "loss": 0.6074, + "step": 6964 + }, + { + "epoch": 0.24, + "learning_rate": 1.7266897089202426e-05, + "loss": 0.6171, + "step": 6965 + }, + { + "epoch": 0.24, + "learning_rate": 1.7266149033217554e-05, + "loss": 0.6428, + "step": 6966 + }, + { + "epoch": 0.24, + "learning_rate": 1.7265400891083288e-05, + "loss": 0.6598, + "step": 6967 + }, + { + "epoch": 0.24, + "learning_rate": 1.726465266280851e-05, + "loss": 0.6384, + "step": 6968 + }, + { + "epoch": 0.24, + "learning_rate": 1.726390434840208e-05, + "loss": 0.7376, + "step": 6969 + }, + { + "epoch": 0.24, + "learning_rate": 1.7263155947872875e-05, + "loss": 0.6122, + "step": 6970 + }, + { + "epoch": 0.24, + "learning_rate": 1.726240746122977e-05, + "loss": 0.6478, + "step": 6971 + }, + { + "epoch": 0.24, + "learning_rate": 1.726165888848164e-05, + "loss": 0.614, + "step": 6972 + }, + { + "epoch": 0.24, + "learning_rate": 1.7260910229637354e-05, + "loss": 0.6423, + "step": 6973 + }, + { + "epoch": 0.24, + "learning_rate": 1.7260161484705796e-05, + "loss": 0.6707, + "step": 6974 + }, + { + "epoch": 0.24, + "learning_rate": 1.7259412653695836e-05, + "loss": 0.6231, + "step": 6975 + }, + { + "epoch": 0.24, + "learning_rate": 1.7258663736616358e-05, + "loss": 0.5897, + "step": 6976 + }, + { + "epoch": 0.24, + "learning_rate": 1.725791473347624e-05, + "loss": 0.6641, + "step": 6977 + }, + { + "epoch": 0.24, + "learning_rate": 1.7257165644284358e-05, + "loss": 0.643, + "step": 6978 + }, + { + "epoch": 0.24, + "learning_rate": 1.7256416469049597e-05, + "loss": 0.6509, + "step": 6979 + }, + { + "epoch": 0.24, + "learning_rate": 1.7255667207780842e-05, + "loss": 0.6698, + "step": 6980 + }, + { + "epoch": 0.24, + "learning_rate": 1.7254917860486974e-05, + "loss": 0.6137, + "step": 6981 + }, + { + "epoch": 0.24, + "learning_rate": 1.7254168427176873e-05, + "loss": 0.6175, + "step": 6982 + }, + { + "epoch": 0.24, + "learning_rate": 1.7253418907859433e-05, + "loss": 0.5888, + "step": 6983 + }, + { + "epoch": 0.24, + "learning_rate": 1.7252669302543533e-05, + "loss": 0.5839, + "step": 6984 + }, + { + "epoch": 0.24, + "learning_rate": 1.7251919611238065e-05, + "loss": 0.6059, + "step": 6985 + }, + { + "epoch": 0.24, + "learning_rate": 1.725116983395192e-05, + "loss": 0.6618, + "step": 6986 + }, + { + "epoch": 0.24, + "learning_rate": 1.725041997069398e-05, + "loss": 0.6582, + "step": 6987 + }, + { + "epoch": 0.24, + "learning_rate": 1.724967002147314e-05, + "loss": 0.5658, + "step": 6988 + }, + { + "epoch": 0.24, + "learning_rate": 1.724891998629829e-05, + "loss": 0.671, + "step": 6989 + }, + { + "epoch": 0.24, + "learning_rate": 1.7248169865178325e-05, + "loss": 0.6272, + "step": 6990 + }, + { + "epoch": 0.24, + "learning_rate": 1.724741965812214e-05, + "loss": 0.6298, + "step": 6991 + }, + { + "epoch": 0.24, + "learning_rate": 1.724666936513862e-05, + "loss": 0.5934, + "step": 6992 + }, + { + "epoch": 0.24, + "learning_rate": 1.7245918986236672e-05, + "loss": 0.6672, + "step": 6993 + }, + { + "epoch": 0.24, + "learning_rate": 1.724516852142519e-05, + "loss": 0.6537, + "step": 6994 + }, + { + "epoch": 0.24, + "learning_rate": 1.7244417970713066e-05, + "loss": 0.6168, + "step": 6995 + }, + { + "epoch": 0.24, + "learning_rate": 1.7243667334109204e-05, + "loss": 0.6464, + "step": 6996 + }, + { + "epoch": 0.24, + "learning_rate": 1.7242916611622506e-05, + "loss": 0.6394, + "step": 6997 + }, + { + "epoch": 0.24, + "learning_rate": 1.7242165803261866e-05, + "loss": 0.661, + "step": 6998 + }, + { + "epoch": 0.24, + "learning_rate": 1.7241414909036188e-05, + "loss": 0.6316, + "step": 6999 + }, + { + "epoch": 0.24, + "learning_rate": 1.7240663928954377e-05, + "loss": 0.6344, + "step": 7000 + }, + { + "epoch": 0.24, + "learning_rate": 1.7239912863025336e-05, + "loss": 0.5946, + "step": 7001 + }, + { + "epoch": 0.24, + "learning_rate": 1.723916171125797e-05, + "loss": 0.6378, + "step": 7002 + }, + { + "epoch": 0.24, + "learning_rate": 1.723841047366118e-05, + "loss": 0.6469, + "step": 7003 + }, + { + "epoch": 0.24, + "learning_rate": 1.7237659150243882e-05, + "loss": 0.6304, + "step": 7004 + }, + { + "epoch": 0.24, + "learning_rate": 1.723690774101498e-05, + "loss": 0.6455, + "step": 7005 + }, + { + "epoch": 0.24, + "learning_rate": 1.7236156245983378e-05, + "loss": 0.6328, + "step": 7006 + }, + { + "epoch": 0.24, + "learning_rate": 1.7235404665157994e-05, + "loss": 0.5842, + "step": 7007 + }, + { + "epoch": 0.24, + "learning_rate": 1.7234652998547732e-05, + "loss": 0.6784, + "step": 7008 + }, + { + "epoch": 0.24, + "learning_rate": 1.7233901246161507e-05, + "loss": 0.6678, + "step": 7009 + }, + { + "epoch": 0.24, + "learning_rate": 1.7233149408008232e-05, + "loss": 0.657, + "step": 7010 + }, + { + "epoch": 0.24, + "learning_rate": 1.7232397484096822e-05, + "loss": 0.6292, + "step": 7011 + }, + { + "epoch": 0.24, + "learning_rate": 1.7231645474436187e-05, + "loss": 0.6667, + "step": 7012 + }, + { + "epoch": 0.24, + "learning_rate": 1.7230893379035252e-05, + "loss": 0.6068, + "step": 7013 + }, + { + "epoch": 0.24, + "learning_rate": 1.7230141197902924e-05, + "loss": 0.6535, + "step": 7014 + }, + { + "epoch": 0.24, + "learning_rate": 1.722938893104813e-05, + "loss": 0.7011, + "step": 7015 + }, + { + "epoch": 0.24, + "learning_rate": 1.7228636578479784e-05, + "loss": 0.6284, + "step": 7016 + }, + { + "epoch": 0.24, + "learning_rate": 1.7227884140206807e-05, + "loss": 0.6575, + "step": 7017 + }, + { + "epoch": 0.24, + "learning_rate": 1.7227131616238117e-05, + "loss": 0.5928, + "step": 7018 + }, + { + "epoch": 0.24, + "learning_rate": 1.7226379006582643e-05, + "loss": 0.64, + "step": 7019 + }, + { + "epoch": 0.24, + "learning_rate": 1.7225626311249305e-05, + "loss": 0.6157, + "step": 7020 + }, + { + "epoch": 0.24, + "learning_rate": 1.722487353024702e-05, + "loss": 0.6619, + "step": 7021 + }, + { + "epoch": 0.24, + "learning_rate": 1.7224120663584728e-05, + "loss": 0.5835, + "step": 7022 + }, + { + "epoch": 0.24, + "learning_rate": 1.7223367711271345e-05, + "loss": 0.6873, + "step": 7023 + }, + { + "epoch": 0.24, + "learning_rate": 1.72226146733158e-05, + "loss": 0.6788, + "step": 7024 + }, + { + "epoch": 0.24, + "learning_rate": 1.7221861549727017e-05, + "loss": 0.6171, + "step": 7025 + }, + { + "epoch": 0.24, + "learning_rate": 1.7221108340513935e-05, + "loss": 0.5934, + "step": 7026 + }, + { + "epoch": 0.24, + "learning_rate": 1.7220355045685476e-05, + "loss": 0.6629, + "step": 7027 + }, + { + "epoch": 0.24, + "learning_rate": 1.7219601665250576e-05, + "loss": 0.6945, + "step": 7028 + }, + { + "epoch": 0.24, + "learning_rate": 1.7218848199218165e-05, + "loss": 0.6407, + "step": 7029 + }, + { + "epoch": 0.24, + "learning_rate": 1.7218094647597174e-05, + "loss": 0.6337, + "step": 7030 + }, + { + "epoch": 0.24, + "learning_rate": 1.721734101039654e-05, + "loss": 0.6256, + "step": 7031 + }, + { + "epoch": 0.24, + "learning_rate": 1.7216587287625204e-05, + "loss": 0.6273, + "step": 7032 + }, + { + "epoch": 0.24, + "learning_rate": 1.7215833479292095e-05, + "loss": 0.6622, + "step": 7033 + }, + { + "epoch": 0.24, + "learning_rate": 1.7215079585406147e-05, + "loss": 0.6437, + "step": 7034 + }, + { + "epoch": 0.24, + "learning_rate": 1.721432560597631e-05, + "loss": 0.6611, + "step": 7035 + }, + { + "epoch": 0.24, + "learning_rate": 1.7213571541011512e-05, + "loss": 0.5795, + "step": 7036 + }, + { + "epoch": 0.24, + "learning_rate": 1.7212817390520697e-05, + "loss": 0.6562, + "step": 7037 + }, + { + "epoch": 0.24, + "learning_rate": 1.7212063154512812e-05, + "loss": 0.6013, + "step": 7038 + }, + { + "epoch": 0.24, + "learning_rate": 1.7211308832996792e-05, + "loss": 0.5932, + "step": 7039 + }, + { + "epoch": 0.24, + "learning_rate": 1.7210554425981585e-05, + "loss": 0.5979, + "step": 7040 + }, + { + "epoch": 0.24, + "learning_rate": 1.7209799933476135e-05, + "loss": 0.6197, + "step": 7041 + }, + { + "epoch": 0.24, + "learning_rate": 1.720904535548938e-05, + "loss": 0.6662, + "step": 7042 + }, + { + "epoch": 0.24, + "learning_rate": 1.720829069203028e-05, + "loss": 0.6921, + "step": 7043 + }, + { + "epoch": 0.24, + "learning_rate": 1.7207535943107774e-05, + "loss": 0.6181, + "step": 7044 + }, + { + "epoch": 0.24, + "learning_rate": 1.720678110873081e-05, + "loss": 0.6114, + "step": 7045 + }, + { + "epoch": 0.24, + "learning_rate": 1.720602618890834e-05, + "loss": 0.6669, + "step": 7046 + }, + { + "epoch": 0.24, + "learning_rate": 1.7205271183649313e-05, + "loss": 0.6351, + "step": 7047 + }, + { + "epoch": 0.24, + "learning_rate": 1.7204516092962684e-05, + "loss": 0.6177, + "step": 7048 + }, + { + "epoch": 0.24, + "learning_rate": 1.72037609168574e-05, + "loss": 0.6093, + "step": 7049 + }, + { + "epoch": 0.24, + "learning_rate": 1.720300565534242e-05, + "loss": 0.5606, + "step": 7050 + }, + { + "epoch": 0.24, + "learning_rate": 1.7202250308426695e-05, + "loss": 0.6213, + "step": 7051 + }, + { + "epoch": 0.24, + "learning_rate": 1.720149487611918e-05, + "loss": 0.6739, + "step": 7052 + }, + { + "epoch": 0.24, + "learning_rate": 1.7200739358428835e-05, + "loss": 0.6829, + "step": 7053 + }, + { + "epoch": 0.24, + "learning_rate": 1.7199983755364614e-05, + "loss": 0.6354, + "step": 7054 + }, + { + "epoch": 0.24, + "learning_rate": 1.719922806693548e-05, + "loss": 0.5687, + "step": 7055 + }, + { + "epoch": 0.24, + "learning_rate": 1.7198472293150393e-05, + "loss": 0.6239, + "step": 7056 + }, + { + "epoch": 0.24, + "learning_rate": 1.7197716434018307e-05, + "loss": 0.6505, + "step": 7057 + }, + { + "epoch": 0.24, + "learning_rate": 1.7196960489548186e-05, + "loss": 0.6178, + "step": 7058 + }, + { + "epoch": 0.24, + "learning_rate": 1.7196204459748996e-05, + "loss": 0.7034, + "step": 7059 + }, + { + "epoch": 0.24, + "learning_rate": 1.71954483446297e-05, + "loss": 0.6357, + "step": 7060 + }, + { + "epoch": 0.24, + "learning_rate": 1.719469214419926e-05, + "loss": 0.6111, + "step": 7061 + }, + { + "epoch": 0.24, + "learning_rate": 1.7193935858466642e-05, + "loss": 0.6344, + "step": 7062 + }, + { + "epoch": 0.24, + "learning_rate": 1.719317948744082e-05, + "loss": 0.6561, + "step": 7063 + }, + { + "epoch": 0.24, + "learning_rate": 1.719242303113075e-05, + "loss": 0.6659, + "step": 7064 + }, + { + "epoch": 0.24, + "learning_rate": 1.719166648954541e-05, + "loss": 0.6382, + "step": 7065 + }, + { + "epoch": 0.24, + "learning_rate": 1.719090986269376e-05, + "loss": 0.6096, + "step": 7066 + }, + { + "epoch": 0.24, + "learning_rate": 1.7190153150584784e-05, + "loss": 0.6564, + "step": 7067 + }, + { + "epoch": 0.24, + "learning_rate": 1.7189396353227444e-05, + "loss": 0.6307, + "step": 7068 + }, + { + "epoch": 0.24, + "learning_rate": 1.7188639470630716e-05, + "loss": 0.5997, + "step": 7069 + }, + { + "epoch": 0.24, + "learning_rate": 1.7187882502803575e-05, + "loss": 0.6543, + "step": 7070 + }, + { + "epoch": 0.24, + "learning_rate": 1.718712544975499e-05, + "loss": 0.6414, + "step": 7071 + }, + { + "epoch": 0.25, + "learning_rate": 1.7186368311493945e-05, + "loss": 0.6906, + "step": 7072 + }, + { + "epoch": 0.25, + "learning_rate": 1.718561108802941e-05, + "loss": 0.6863, + "step": 7073 + }, + { + "epoch": 0.25, + "learning_rate": 1.7184853779370367e-05, + "loss": 0.6222, + "step": 7074 + }, + { + "epoch": 0.25, + "learning_rate": 1.7184096385525792e-05, + "loss": 0.5705, + "step": 7075 + }, + { + "epoch": 0.25, + "learning_rate": 1.718333890650467e-05, + "loss": 0.6609, + "step": 7076 + }, + { + "epoch": 0.25, + "learning_rate": 1.7182581342315977e-05, + "loss": 0.6778, + "step": 7077 + }, + { + "epoch": 0.25, + "learning_rate": 1.7181823692968694e-05, + "loss": 0.6335, + "step": 7078 + }, + { + "epoch": 0.25, + "learning_rate": 1.718106595847181e-05, + "loss": 0.6375, + "step": 7079 + }, + { + "epoch": 0.25, + "learning_rate": 1.71803081388343e-05, + "loss": 0.6369, + "step": 7080 + }, + { + "epoch": 0.25, + "learning_rate": 1.717955023406516e-05, + "loss": 0.6502, + "step": 7081 + }, + { + "epoch": 0.25, + "learning_rate": 1.7178792244173365e-05, + "loss": 0.6374, + "step": 7082 + }, + { + "epoch": 0.25, + "learning_rate": 1.7178034169167906e-05, + "loss": 0.6791, + "step": 7083 + }, + { + "epoch": 0.25, + "learning_rate": 1.7177276009057774e-05, + "loss": 0.6623, + "step": 7084 + }, + { + "epoch": 0.25, + "learning_rate": 1.7176517763851954e-05, + "loss": 0.651, + "step": 7085 + }, + { + "epoch": 0.25, + "learning_rate": 1.717575943355944e-05, + "loss": 0.6669, + "step": 7086 + }, + { + "epoch": 0.25, + "learning_rate": 1.7175001018189223e-05, + "loss": 0.6912, + "step": 7087 + }, + { + "epoch": 0.25, + "learning_rate": 1.7174242517750285e-05, + "loss": 0.6329, + "step": 7088 + }, + { + "epoch": 0.25, + "learning_rate": 1.7173483932251632e-05, + "loss": 0.5797, + "step": 7089 + }, + { + "epoch": 0.25, + "learning_rate": 1.717272526170225e-05, + "loss": 0.5742, + "step": 7090 + }, + { + "epoch": 0.25, + "learning_rate": 1.7171966506111135e-05, + "loss": 0.6223, + "step": 7091 + }, + { + "epoch": 0.25, + "learning_rate": 1.717120766548729e-05, + "loss": 0.5795, + "step": 7092 + }, + { + "epoch": 0.25, + "learning_rate": 1.7170448739839703e-05, + "loss": 0.6894, + "step": 7093 + }, + { + "epoch": 0.25, + "learning_rate": 1.7169689729177375e-05, + "loss": 0.6554, + "step": 7094 + }, + { + "epoch": 0.25, + "learning_rate": 1.7168930633509307e-05, + "loss": 0.6732, + "step": 7095 + }, + { + "epoch": 0.25, + "learning_rate": 1.7168171452844498e-05, + "loss": 0.6471, + "step": 7096 + }, + { + "epoch": 0.25, + "learning_rate": 1.7167412187191944e-05, + "loss": 0.6029, + "step": 7097 + }, + { + "epoch": 0.25, + "learning_rate": 1.7166652836560657e-05, + "loss": 0.5949, + "step": 7098 + }, + { + "epoch": 0.25, + "learning_rate": 1.7165893400959636e-05, + "loss": 0.6052, + "step": 7099 + }, + { + "epoch": 0.25, + "learning_rate": 1.7165133880397876e-05, + "loss": 0.6365, + "step": 7100 + }, + { + "epoch": 0.25, + "learning_rate": 1.7164374274884397e-05, + "loss": 0.6492, + "step": 7101 + }, + { + "epoch": 0.25, + "learning_rate": 1.7163614584428194e-05, + "loss": 0.6299, + "step": 7102 + }, + { + "epoch": 0.25, + "learning_rate": 1.716285480903828e-05, + "loss": 0.5664, + "step": 7103 + }, + { + "epoch": 0.25, + "learning_rate": 1.7162094948723664e-05, + "loss": 0.6242, + "step": 7104 + }, + { + "epoch": 0.25, + "learning_rate": 1.7161335003493347e-05, + "loss": 0.6231, + "step": 7105 + }, + { + "epoch": 0.25, + "learning_rate": 1.7160574973356346e-05, + "loss": 0.6273, + "step": 7106 + }, + { + "epoch": 0.25, + "learning_rate": 1.7159814858321673e-05, + "loss": 0.6583, + "step": 7107 + }, + { + "epoch": 0.25, + "learning_rate": 1.7159054658398334e-05, + "loss": 0.6034, + "step": 7108 + }, + { + "epoch": 0.25, + "learning_rate": 1.715829437359535e-05, + "loss": 0.6757, + "step": 7109 + }, + { + "epoch": 0.25, + "learning_rate": 1.7157534003921728e-05, + "loss": 0.6061, + "step": 7110 + }, + { + "epoch": 0.25, + "learning_rate": 1.715677354938649e-05, + "loss": 0.6398, + "step": 7111 + }, + { + "epoch": 0.25, + "learning_rate": 1.7156013009998643e-05, + "loss": 0.6032, + "step": 7112 + }, + { + "epoch": 0.25, + "learning_rate": 1.715525238576721e-05, + "loss": 0.5969, + "step": 7113 + }, + { + "epoch": 0.25, + "learning_rate": 1.7154491676701207e-05, + "loss": 0.6044, + "step": 7114 + }, + { + "epoch": 0.25, + "learning_rate": 1.7153730882809657e-05, + "loss": 0.5904, + "step": 7115 + }, + { + "epoch": 0.25, + "learning_rate": 1.7152970004101582e-05, + "loss": 0.6128, + "step": 7116 + }, + { + "epoch": 0.25, + "learning_rate": 1.7152209040585993e-05, + "loss": 0.6268, + "step": 7117 + }, + { + "epoch": 0.25, + "learning_rate": 1.715144799227192e-05, + "loss": 0.6444, + "step": 7118 + }, + { + "epoch": 0.25, + "learning_rate": 1.7150686859168385e-05, + "loss": 0.6038, + "step": 7119 + }, + { + "epoch": 0.25, + "learning_rate": 1.7149925641284414e-05, + "loss": 0.6378, + "step": 7120 + }, + { + "epoch": 0.25, + "learning_rate": 1.7149164338629027e-05, + "loss": 0.5909, + "step": 7121 + }, + { + "epoch": 0.25, + "learning_rate": 1.7148402951211253e-05, + "loss": 0.6211, + "step": 7122 + }, + { + "epoch": 0.25, + "learning_rate": 1.714764147904012e-05, + "loss": 0.6685, + "step": 7123 + }, + { + "epoch": 0.25, + "learning_rate": 1.7146879922124654e-05, + "loss": 0.5957, + "step": 7124 + }, + { + "epoch": 0.25, + "learning_rate": 1.7146118280473887e-05, + "loss": 0.6094, + "step": 7125 + }, + { + "epoch": 0.25, + "learning_rate": 1.7145356554096848e-05, + "loss": 0.6411, + "step": 7126 + }, + { + "epoch": 0.25, + "learning_rate": 1.714459474300257e-05, + "loss": 0.5905, + "step": 7127 + }, + { + "epoch": 0.25, + "learning_rate": 1.7143832847200078e-05, + "loss": 0.6147, + "step": 7128 + }, + { + "epoch": 0.25, + "learning_rate": 1.7143070866698416e-05, + "loss": 0.6282, + "step": 7129 + }, + { + "epoch": 0.25, + "learning_rate": 1.7142308801506612e-05, + "loss": 0.6253, + "step": 7130 + }, + { + "epoch": 0.25, + "learning_rate": 1.71415466516337e-05, + "loss": 0.6601, + "step": 7131 + }, + { + "epoch": 0.25, + "learning_rate": 1.7140784417088717e-05, + "loss": 0.6211, + "step": 7132 + }, + { + "epoch": 0.25, + "learning_rate": 1.7140022097880704e-05, + "loss": 0.7028, + "step": 7133 + }, + { + "epoch": 0.25, + "learning_rate": 1.7139259694018697e-05, + "loss": 0.68, + "step": 7134 + }, + { + "epoch": 0.25, + "learning_rate": 1.7138497205511732e-05, + "loss": 0.6434, + "step": 7135 + }, + { + "epoch": 0.25, + "learning_rate": 1.7137734632368855e-05, + "loss": 0.632, + "step": 7136 + }, + { + "epoch": 0.25, + "learning_rate": 1.7136971974599107e-05, + "loss": 0.6176, + "step": 7137 + }, + { + "epoch": 0.25, + "learning_rate": 1.7136209232211526e-05, + "loss": 0.6703, + "step": 7138 + }, + { + "epoch": 0.25, + "learning_rate": 1.7135446405215156e-05, + "loss": 0.6412, + "step": 7139 + }, + { + "epoch": 0.25, + "learning_rate": 1.7134683493619042e-05, + "loss": 0.6427, + "step": 7140 + }, + { + "epoch": 0.25, + "learning_rate": 1.713392049743223e-05, + "loss": 0.6519, + "step": 7141 + }, + { + "epoch": 0.25, + "learning_rate": 1.713315741666377e-05, + "loss": 0.6481, + "step": 7142 + }, + { + "epoch": 0.25, + "learning_rate": 1.71323942513227e-05, + "loss": 0.5857, + "step": 7143 + }, + { + "epoch": 0.25, + "learning_rate": 1.7131631001418077e-05, + "loss": 0.6075, + "step": 7144 + }, + { + "epoch": 0.25, + "learning_rate": 1.7130867666958945e-05, + "loss": 0.6417, + "step": 7145 + }, + { + "epoch": 0.25, + "learning_rate": 1.713010424795436e-05, + "loss": 0.6392, + "step": 7146 + }, + { + "epoch": 0.25, + "learning_rate": 1.7129340744413366e-05, + "loss": 0.6638, + "step": 7147 + }, + { + "epoch": 0.25, + "learning_rate": 1.7128577156345017e-05, + "loss": 0.6127, + "step": 7148 + }, + { + "epoch": 0.25, + "learning_rate": 1.7127813483758373e-05, + "loss": 0.6706, + "step": 7149 + }, + { + "epoch": 0.25, + "learning_rate": 1.7127049726662482e-05, + "loss": 0.6709, + "step": 7150 + }, + { + "epoch": 0.25, + "learning_rate": 1.7126285885066398e-05, + "loss": 0.6109, + "step": 7151 + }, + { + "epoch": 0.25, + "learning_rate": 1.712552195897918e-05, + "loss": 0.6753, + "step": 7152 + }, + { + "epoch": 0.25, + "learning_rate": 1.712475794840989e-05, + "loss": 0.6299, + "step": 7153 + }, + { + "epoch": 0.25, + "learning_rate": 1.7123993853367576e-05, + "loss": 0.6945, + "step": 7154 + }, + { + "epoch": 0.25, + "learning_rate": 1.7123229673861308e-05, + "loss": 0.6333, + "step": 7155 + }, + { + "epoch": 0.25, + "learning_rate": 1.7122465409900136e-05, + "loss": 0.6473, + "step": 7156 + }, + { + "epoch": 0.25, + "learning_rate": 1.7121701061493134e-05, + "loss": 0.6674, + "step": 7157 + }, + { + "epoch": 0.25, + "learning_rate": 1.712093662864935e-05, + "loss": 0.6157, + "step": 7158 + }, + { + "epoch": 0.25, + "learning_rate": 1.712017211137786e-05, + "loss": 0.7164, + "step": 7159 + }, + { + "epoch": 0.25, + "learning_rate": 1.7119407509687717e-05, + "loss": 0.6115, + "step": 7160 + }, + { + "epoch": 0.25, + "learning_rate": 1.7118642823587994e-05, + "loss": 0.6253, + "step": 7161 + }, + { + "epoch": 0.25, + "learning_rate": 1.7117878053087757e-05, + "loss": 0.6583, + "step": 7162 + }, + { + "epoch": 0.25, + "learning_rate": 1.711711319819607e-05, + "loss": 0.6231, + "step": 7163 + }, + { + "epoch": 0.25, + "learning_rate": 1.7116348258922002e-05, + "loss": 0.5644, + "step": 7164 + }, + { + "epoch": 0.25, + "learning_rate": 1.7115583235274625e-05, + "loss": 0.6451, + "step": 7165 + }, + { + "epoch": 0.25, + "learning_rate": 1.7114818127263007e-05, + "loss": 0.6186, + "step": 7166 + }, + { + "epoch": 0.25, + "learning_rate": 1.711405293489622e-05, + "loss": 0.6263, + "step": 7167 + }, + { + "epoch": 0.25, + "learning_rate": 1.7113287658183332e-05, + "loss": 0.6513, + "step": 7168 + }, + { + "epoch": 0.25, + "learning_rate": 1.7112522297133425e-05, + "loss": 0.6422, + "step": 7169 + }, + { + "epoch": 0.25, + "learning_rate": 1.7111756851755567e-05, + "loss": 0.6996, + "step": 7170 + }, + { + "epoch": 0.25, + "learning_rate": 1.7110991322058835e-05, + "loss": 0.6154, + "step": 7171 + }, + { + "epoch": 0.25, + "learning_rate": 1.7110225708052306e-05, + "loss": 0.6399, + "step": 7172 + }, + { + "epoch": 0.25, + "learning_rate": 1.7109460009745056e-05, + "loss": 0.595, + "step": 7173 + }, + { + "epoch": 0.25, + "learning_rate": 1.7108694227146167e-05, + "loss": 0.6339, + "step": 7174 + }, + { + "epoch": 0.25, + "learning_rate": 1.7107928360264714e-05, + "loss": 0.6493, + "step": 7175 + }, + { + "epoch": 0.25, + "learning_rate": 1.7107162409109775e-05, + "loss": 0.5986, + "step": 7176 + }, + { + "epoch": 0.25, + "learning_rate": 1.710639637369044e-05, + "loss": 0.6685, + "step": 7177 + }, + { + "epoch": 0.25, + "learning_rate": 1.7105630254015785e-05, + "loss": 0.6891, + "step": 7178 + }, + { + "epoch": 0.25, + "learning_rate": 1.7104864050094895e-05, + "loss": 0.6484, + "step": 7179 + }, + { + "epoch": 0.25, + "learning_rate": 1.7104097761936852e-05, + "loss": 0.5876, + "step": 7180 + }, + { + "epoch": 0.25, + "learning_rate": 1.7103331389550745e-05, + "loss": 0.6628, + "step": 7181 + }, + { + "epoch": 0.25, + "learning_rate": 1.710256493294566e-05, + "loss": 0.6561, + "step": 7182 + }, + { + "epoch": 0.25, + "learning_rate": 1.7101798392130678e-05, + "loss": 0.6768, + "step": 7183 + }, + { + "epoch": 0.25, + "learning_rate": 1.7101031767114897e-05, + "loss": 0.5898, + "step": 7184 + }, + { + "epoch": 0.25, + "learning_rate": 1.7100265057907398e-05, + "loss": 0.632, + "step": 7185 + }, + { + "epoch": 0.25, + "learning_rate": 1.7099498264517275e-05, + "loss": 0.6579, + "step": 7186 + }, + { + "epoch": 0.25, + "learning_rate": 1.7098731386953623e-05, + "loss": 0.6018, + "step": 7187 + }, + { + "epoch": 0.25, + "learning_rate": 1.7097964425225528e-05, + "loss": 0.5938, + "step": 7188 + }, + { + "epoch": 0.25, + "learning_rate": 1.7097197379342084e-05, + "loss": 0.6963, + "step": 7189 + }, + { + "epoch": 0.25, + "learning_rate": 1.709643024931239e-05, + "loss": 0.6188, + "step": 7190 + }, + { + "epoch": 0.25, + "learning_rate": 1.7095663035145537e-05, + "loss": 0.6098, + "step": 7191 + }, + { + "epoch": 0.25, + "learning_rate": 1.7094895736850625e-05, + "loss": 0.6948, + "step": 7192 + }, + { + "epoch": 0.25, + "learning_rate": 1.7094128354436745e-05, + "loss": 0.669, + "step": 7193 + }, + { + "epoch": 0.25, + "learning_rate": 1.7093360887913002e-05, + "loss": 0.6653, + "step": 7194 + }, + { + "epoch": 0.25, + "learning_rate": 1.7092593337288493e-05, + "loss": 0.6697, + "step": 7195 + }, + { + "epoch": 0.25, + "learning_rate": 1.7091825702572315e-05, + "loss": 0.5986, + "step": 7196 + }, + { + "epoch": 0.25, + "learning_rate": 1.7091057983773574e-05, + "loss": 0.6774, + "step": 7197 + }, + { + "epoch": 0.25, + "learning_rate": 1.7090290180901373e-05, + "loss": 0.6736, + "step": 7198 + }, + { + "epoch": 0.25, + "learning_rate": 1.7089522293964807e-05, + "loss": 0.6267, + "step": 7199 + }, + { + "epoch": 0.25, + "learning_rate": 1.7088754322972987e-05, + "loss": 0.6084, + "step": 7200 + }, + { + "epoch": 0.25, + "learning_rate": 1.708798626793502e-05, + "loss": 0.5697, + "step": 7201 + }, + { + "epoch": 0.25, + "learning_rate": 1.708721812886001e-05, + "loss": 0.603, + "step": 7202 + }, + { + "epoch": 0.25, + "learning_rate": 1.708644990575706e-05, + "loss": 0.7185, + "step": 7203 + }, + { + "epoch": 0.25, + "learning_rate": 1.7085681598635283e-05, + "loss": 0.6192, + "step": 7204 + }, + { + "epoch": 0.25, + "learning_rate": 1.708491320750379e-05, + "loss": 0.613, + "step": 7205 + }, + { + "epoch": 0.25, + "learning_rate": 1.7084144732371685e-05, + "loss": 0.6589, + "step": 7206 + }, + { + "epoch": 0.25, + "learning_rate": 1.7083376173248085e-05, + "loss": 0.6781, + "step": 7207 + }, + { + "epoch": 0.25, + "learning_rate": 1.70826075301421e-05, + "loss": 0.5949, + "step": 7208 + }, + { + "epoch": 0.25, + "learning_rate": 1.7081838803062844e-05, + "loss": 0.6666, + "step": 7209 + }, + { + "epoch": 0.25, + "learning_rate": 1.7081069992019424e-05, + "loss": 0.6469, + "step": 7210 + }, + { + "epoch": 0.25, + "learning_rate": 1.708030109702097e-05, + "loss": 0.6149, + "step": 7211 + }, + { + "epoch": 0.25, + "learning_rate": 1.7079532118076585e-05, + "loss": 0.6274, + "step": 7212 + }, + { + "epoch": 0.25, + "learning_rate": 1.7078763055195393e-05, + "loss": 0.6552, + "step": 7213 + }, + { + "epoch": 0.25, + "learning_rate": 1.707799390838651e-05, + "loss": 0.6516, + "step": 7214 + }, + { + "epoch": 0.25, + "learning_rate": 1.7077224677659055e-05, + "loss": 0.5999, + "step": 7215 + }, + { + "epoch": 0.25, + "learning_rate": 1.707645536302215e-05, + "loss": 0.6535, + "step": 7216 + }, + { + "epoch": 0.25, + "learning_rate": 1.7075685964484913e-05, + "loss": 0.656, + "step": 7217 + }, + { + "epoch": 0.25, + "learning_rate": 1.7074916482056468e-05, + "loss": 0.6211, + "step": 7218 + }, + { + "epoch": 0.25, + "learning_rate": 1.7074146915745943e-05, + "loss": 0.6363, + "step": 7219 + }, + { + "epoch": 0.25, + "learning_rate": 1.707337726556245e-05, + "loss": 0.6607, + "step": 7220 + }, + { + "epoch": 0.25, + "learning_rate": 1.7072607531515125e-05, + "loss": 0.6326, + "step": 7221 + }, + { + "epoch": 0.25, + "learning_rate": 1.7071837713613094e-05, + "loss": 0.5892, + "step": 7222 + }, + { + "epoch": 0.25, + "learning_rate": 1.7071067811865477e-05, + "loss": 0.6658, + "step": 7223 + }, + { + "epoch": 0.25, + "learning_rate": 1.707029782628141e-05, + "loss": 0.6128, + "step": 7224 + }, + { + "epoch": 0.25, + "learning_rate": 1.7069527756870014e-05, + "loss": 0.631, + "step": 7225 + }, + { + "epoch": 0.25, + "learning_rate": 1.7068757603640423e-05, + "loss": 0.6278, + "step": 7226 + }, + { + "epoch": 0.25, + "learning_rate": 1.706798736660177e-05, + "loss": 0.5707, + "step": 7227 + }, + { + "epoch": 0.25, + "learning_rate": 1.7067217045763186e-05, + "loss": 0.6106, + "step": 7228 + }, + { + "epoch": 0.25, + "learning_rate": 1.7066446641133806e-05, + "loss": 0.6783, + "step": 7229 + }, + { + "epoch": 0.25, + "learning_rate": 1.706567615272276e-05, + "loss": 0.624, + "step": 7230 + }, + { + "epoch": 0.25, + "learning_rate": 1.7064905580539184e-05, + "loss": 0.6327, + "step": 7231 + }, + { + "epoch": 0.25, + "learning_rate": 1.7064134924592218e-05, + "loss": 0.6593, + "step": 7232 + }, + { + "epoch": 0.25, + "learning_rate": 1.7063364184890994e-05, + "loss": 0.639, + "step": 7233 + }, + { + "epoch": 0.25, + "learning_rate": 1.7062593361444655e-05, + "loss": 0.6177, + "step": 7234 + }, + { + "epoch": 0.25, + "learning_rate": 1.7061822454262333e-05, + "loss": 0.668, + "step": 7235 + }, + { + "epoch": 0.25, + "learning_rate": 1.7061051463353176e-05, + "loss": 0.5952, + "step": 7236 + }, + { + "epoch": 0.25, + "learning_rate": 1.7060280388726322e-05, + "loss": 0.6316, + "step": 7237 + }, + { + "epoch": 0.25, + "learning_rate": 1.705950923039091e-05, + "loss": 0.6098, + "step": 7238 + }, + { + "epoch": 0.25, + "learning_rate": 1.705873798835609e-05, + "loss": 0.578, + "step": 7239 + }, + { + "epoch": 0.25, + "learning_rate": 1.7057966662630997e-05, + "loss": 0.6958, + "step": 7240 + }, + { + "epoch": 0.25, + "learning_rate": 1.7057195253224782e-05, + "loss": 0.6674, + "step": 7241 + }, + { + "epoch": 0.25, + "learning_rate": 1.7056423760146592e-05, + "loss": 0.6025, + "step": 7242 + }, + { + "epoch": 0.25, + "learning_rate": 1.705565218340557e-05, + "loss": 0.7283, + "step": 7243 + }, + { + "epoch": 0.25, + "learning_rate": 1.7054880523010865e-05, + "loss": 0.65, + "step": 7244 + }, + { + "epoch": 0.25, + "learning_rate": 1.705410877897163e-05, + "loss": 0.6569, + "step": 7245 + }, + { + "epoch": 0.25, + "learning_rate": 1.705333695129701e-05, + "loss": 0.6201, + "step": 7246 + }, + { + "epoch": 0.25, + "learning_rate": 1.7052565039996158e-05, + "loss": 0.6257, + "step": 7247 + }, + { + "epoch": 0.25, + "learning_rate": 1.705179304507823e-05, + "loss": 0.6353, + "step": 7248 + }, + { + "epoch": 0.25, + "learning_rate": 1.705102096655237e-05, + "loss": 0.5971, + "step": 7249 + }, + { + "epoch": 0.25, + "learning_rate": 1.7050248804427735e-05, + "loss": 0.6157, + "step": 7250 + }, + { + "epoch": 0.25, + "learning_rate": 1.7049476558713487e-05, + "loss": 0.6184, + "step": 7251 + }, + { + "epoch": 0.25, + "learning_rate": 1.7048704229418775e-05, + "loss": 0.6451, + "step": 7252 + }, + { + "epoch": 0.25, + "learning_rate": 1.7047931816552753e-05, + "loss": 0.6183, + "step": 7253 + }, + { + "epoch": 0.25, + "learning_rate": 1.7047159320124592e-05, + "loss": 0.5745, + "step": 7254 + }, + { + "epoch": 0.25, + "learning_rate": 1.7046386740143435e-05, + "loss": 0.6655, + "step": 7255 + }, + { + "epoch": 0.25, + "learning_rate": 1.7045614076618457e-05, + "loss": 0.6387, + "step": 7256 + }, + { + "epoch": 0.25, + "learning_rate": 1.7044841329558804e-05, + "loss": 0.6728, + "step": 7257 + }, + { + "epoch": 0.25, + "learning_rate": 1.7044068498973652e-05, + "loss": 0.6436, + "step": 7258 + }, + { + "epoch": 0.25, + "learning_rate": 1.7043295584872153e-05, + "loss": 0.6377, + "step": 7259 + }, + { + "epoch": 0.25, + "learning_rate": 1.7042522587263475e-05, + "loss": 0.616, + "step": 7260 + }, + { + "epoch": 0.25, + "learning_rate": 1.7041749506156783e-05, + "loss": 0.654, + "step": 7261 + }, + { + "epoch": 0.25, + "learning_rate": 1.704097634156124e-05, + "loss": 0.637, + "step": 7262 + }, + { + "epoch": 0.25, + "learning_rate": 1.704020309348602e-05, + "loss": 0.6368, + "step": 7263 + }, + { + "epoch": 0.25, + "learning_rate": 1.703942976194029e-05, + "loss": 0.6298, + "step": 7264 + }, + { + "epoch": 0.25, + "learning_rate": 1.7038656346933206e-05, + "loss": 0.637, + "step": 7265 + }, + { + "epoch": 0.25, + "learning_rate": 1.7037882848473956e-05, + "loss": 0.693, + "step": 7266 + }, + { + "epoch": 0.25, + "learning_rate": 1.7037109266571695e-05, + "loss": 0.6053, + "step": 7267 + }, + { + "epoch": 0.25, + "learning_rate": 1.7036335601235604e-05, + "loss": 0.623, + "step": 7268 + }, + { + "epoch": 0.25, + "learning_rate": 1.7035561852474853e-05, + "loss": 0.6727, + "step": 7269 + }, + { + "epoch": 0.25, + "learning_rate": 1.7034788020298618e-05, + "loss": 0.6631, + "step": 7270 + }, + { + "epoch": 0.25, + "learning_rate": 1.7034014104716073e-05, + "loss": 0.5819, + "step": 7271 + }, + { + "epoch": 0.25, + "learning_rate": 1.7033240105736388e-05, + "loss": 0.6455, + "step": 7272 + }, + { + "epoch": 0.25, + "learning_rate": 1.7032466023368748e-05, + "loss": 0.6517, + "step": 7273 + }, + { + "epoch": 0.25, + "learning_rate": 1.7031691857622326e-05, + "loss": 0.6571, + "step": 7274 + }, + { + "epoch": 0.25, + "learning_rate": 1.70309176085063e-05, + "loss": 0.6488, + "step": 7275 + }, + { + "epoch": 0.25, + "learning_rate": 1.7030143276029856e-05, + "loss": 0.6405, + "step": 7276 + }, + { + "epoch": 0.25, + "learning_rate": 1.7029368860202167e-05, + "loss": 0.6108, + "step": 7277 + }, + { + "epoch": 0.25, + "learning_rate": 1.7028594361032417e-05, + "loss": 0.6288, + "step": 7278 + }, + { + "epoch": 0.25, + "learning_rate": 1.7027819778529796e-05, + "loss": 0.623, + "step": 7279 + }, + { + "epoch": 0.25, + "learning_rate": 1.7027045112703474e-05, + "loss": 0.6164, + "step": 7280 + }, + { + "epoch": 0.25, + "learning_rate": 1.7026270363562646e-05, + "loss": 0.6471, + "step": 7281 + }, + { + "epoch": 0.25, + "learning_rate": 1.7025495531116497e-05, + "loss": 0.6126, + "step": 7282 + }, + { + "epoch": 0.25, + "learning_rate": 1.7024720615374208e-05, + "loss": 0.6374, + "step": 7283 + }, + { + "epoch": 0.25, + "learning_rate": 1.702394561634497e-05, + "loss": 0.6152, + "step": 7284 + }, + { + "epoch": 0.25, + "learning_rate": 1.702317053403797e-05, + "loss": 0.64, + "step": 7285 + }, + { + "epoch": 0.25, + "learning_rate": 1.70223953684624e-05, + "loss": 0.6337, + "step": 7286 + }, + { + "epoch": 0.25, + "learning_rate": 1.702162011962745e-05, + "loss": 0.6074, + "step": 7287 + }, + { + "epoch": 0.25, + "learning_rate": 1.702084478754231e-05, + "loss": 0.6261, + "step": 7288 + }, + { + "epoch": 0.25, + "learning_rate": 1.7020069372216176e-05, + "loss": 0.6281, + "step": 7289 + }, + { + "epoch": 0.25, + "learning_rate": 1.7019293873658238e-05, + "loss": 0.6633, + "step": 7290 + }, + { + "epoch": 0.25, + "learning_rate": 1.7018518291877693e-05, + "loss": 0.6457, + "step": 7291 + }, + { + "epoch": 0.25, + "learning_rate": 1.7017742626883734e-05, + "loss": 0.6095, + "step": 7292 + }, + { + "epoch": 0.25, + "learning_rate": 1.7016966878685556e-05, + "loss": 0.5947, + "step": 7293 + }, + { + "epoch": 0.25, + "learning_rate": 1.7016191047292364e-05, + "loss": 0.652, + "step": 7294 + }, + { + "epoch": 0.25, + "learning_rate": 1.701541513271335e-05, + "loss": 0.6476, + "step": 7295 + }, + { + "epoch": 0.25, + "learning_rate": 1.7014639134957713e-05, + "loss": 0.6219, + "step": 7296 + }, + { + "epoch": 0.25, + "learning_rate": 1.701386305403466e-05, + "loss": 0.6376, + "step": 7297 + }, + { + "epoch": 0.25, + "learning_rate": 1.7013086889953384e-05, + "loss": 0.6355, + "step": 7298 + }, + { + "epoch": 0.25, + "learning_rate": 1.701231064272309e-05, + "loss": 0.6442, + "step": 7299 + }, + { + "epoch": 0.25, + "learning_rate": 1.7011534312352985e-05, + "loss": 0.6562, + "step": 7300 + }, + { + "epoch": 0.25, + "learning_rate": 1.701075789885227e-05, + "loss": 0.6008, + "step": 7301 + }, + { + "epoch": 0.25, + "learning_rate": 1.7009981402230152e-05, + "loss": 0.6091, + "step": 7302 + }, + { + "epoch": 0.25, + "learning_rate": 1.700920482249584e-05, + "loss": 0.648, + "step": 7303 + }, + { + "epoch": 0.25, + "learning_rate": 1.7008428159658536e-05, + "loss": 0.6102, + "step": 7304 + }, + { + "epoch": 0.25, + "learning_rate": 1.700765141372745e-05, + "loss": 0.6142, + "step": 7305 + }, + { + "epoch": 0.25, + "learning_rate": 1.7006874584711787e-05, + "loss": 0.6118, + "step": 7306 + }, + { + "epoch": 0.25, + "learning_rate": 1.700609767262077e-05, + "loss": 0.6632, + "step": 7307 + }, + { + "epoch": 0.25, + "learning_rate": 1.7005320677463598e-05, + "loss": 0.6528, + "step": 7308 + }, + { + "epoch": 0.25, + "learning_rate": 1.700454359924949e-05, + "loss": 0.5996, + "step": 7309 + }, + { + "epoch": 0.25, + "learning_rate": 1.7003766437987654e-05, + "loss": 0.6821, + "step": 7310 + }, + { + "epoch": 0.25, + "learning_rate": 1.7002989193687307e-05, + "loss": 0.589, + "step": 7311 + }, + { + "epoch": 0.25, + "learning_rate": 1.7002211866357667e-05, + "loss": 0.6182, + "step": 7312 + }, + { + "epoch": 0.25, + "learning_rate": 1.7001434456007945e-05, + "loss": 0.5621, + "step": 7313 + }, + { + "epoch": 0.25, + "learning_rate": 1.7000656962647362e-05, + "loss": 0.6091, + "step": 7314 + }, + { + "epoch": 0.25, + "learning_rate": 1.6999879386285133e-05, + "loss": 0.6873, + "step": 7315 + }, + { + "epoch": 0.25, + "learning_rate": 1.6999101726930483e-05, + "loss": 0.6215, + "step": 7316 + }, + { + "epoch": 0.25, + "learning_rate": 1.6998323984592625e-05, + "loss": 0.6241, + "step": 7317 + }, + { + "epoch": 0.25, + "learning_rate": 1.6997546159280785e-05, + "loss": 0.638, + "step": 7318 + }, + { + "epoch": 0.25, + "learning_rate": 1.6996768251004182e-05, + "loss": 0.662, + "step": 7319 + }, + { + "epoch": 0.25, + "learning_rate": 1.6995990259772042e-05, + "loss": 0.6223, + "step": 7320 + }, + { + "epoch": 0.25, + "learning_rate": 1.6995212185593585e-05, + "loss": 0.6307, + "step": 7321 + }, + { + "epoch": 0.25, + "learning_rate": 1.6994434028478038e-05, + "loss": 0.6611, + "step": 7322 + }, + { + "epoch": 0.25, + "learning_rate": 1.6993655788434632e-05, + "loss": 0.6568, + "step": 7323 + }, + { + "epoch": 0.25, + "learning_rate": 1.6992877465472585e-05, + "loss": 0.6576, + "step": 7324 + }, + { + "epoch": 0.25, + "learning_rate": 1.699209905960113e-05, + "loss": 0.5888, + "step": 7325 + }, + { + "epoch": 0.25, + "learning_rate": 1.6991320570829502e-05, + "loss": 0.5923, + "step": 7326 + }, + { + "epoch": 0.25, + "learning_rate": 1.6990541999166917e-05, + "loss": 0.6525, + "step": 7327 + }, + { + "epoch": 0.25, + "learning_rate": 1.6989763344622615e-05, + "loss": 0.5845, + "step": 7328 + }, + { + "epoch": 0.25, + "learning_rate": 1.698898460720583e-05, + "loss": 0.6414, + "step": 7329 + }, + { + "epoch": 0.25, + "learning_rate": 1.698820578692579e-05, + "loss": 0.6175, + "step": 7330 + }, + { + "epoch": 0.25, + "learning_rate": 1.6987426883791728e-05, + "loss": 0.6449, + "step": 7331 + }, + { + "epoch": 0.25, + "learning_rate": 1.6986647897812884e-05, + "loss": 0.6431, + "step": 7332 + }, + { + "epoch": 0.25, + "learning_rate": 1.698586882899849e-05, + "loss": 0.6615, + "step": 7333 + }, + { + "epoch": 0.25, + "learning_rate": 1.698508967735778e-05, + "loss": 0.5945, + "step": 7334 + }, + { + "epoch": 0.25, + "learning_rate": 1.69843104429e-05, + "loss": 0.6761, + "step": 7335 + }, + { + "epoch": 0.25, + "learning_rate": 1.6983531125634386e-05, + "loss": 0.6744, + "step": 7336 + }, + { + "epoch": 0.25, + "learning_rate": 1.6982751725570173e-05, + "loss": 0.6188, + "step": 7337 + }, + { + "epoch": 0.25, + "learning_rate": 1.6981972242716604e-05, + "loss": 0.6159, + "step": 7338 + }, + { + "epoch": 0.25, + "learning_rate": 1.6981192677082926e-05, + "loss": 0.6443, + "step": 7339 + }, + { + "epoch": 0.25, + "learning_rate": 1.6980413028678374e-05, + "loss": 0.6435, + "step": 7340 + }, + { + "epoch": 0.25, + "learning_rate": 1.6979633297512197e-05, + "loss": 0.6636, + "step": 7341 + }, + { + "epoch": 0.25, + "learning_rate": 1.6978853483593636e-05, + "loss": 0.6257, + "step": 7342 + }, + { + "epoch": 0.25, + "learning_rate": 1.697807358693194e-05, + "loss": 0.7056, + "step": 7343 + }, + { + "epoch": 0.25, + "learning_rate": 1.6977293607536355e-05, + "loss": 0.63, + "step": 7344 + }, + { + "epoch": 0.25, + "learning_rate": 1.6976513545416127e-05, + "loss": 0.6317, + "step": 7345 + }, + { + "epoch": 0.25, + "learning_rate": 1.6975733400580506e-05, + "loss": 0.6227, + "step": 7346 + }, + { + "epoch": 0.25, + "learning_rate": 1.6974953173038745e-05, + "loss": 0.6214, + "step": 7347 + }, + { + "epoch": 0.25, + "learning_rate": 1.6974172862800084e-05, + "loss": 0.6449, + "step": 7348 + }, + { + "epoch": 0.25, + "learning_rate": 1.6973392469873788e-05, + "loss": 0.6523, + "step": 7349 + }, + { + "epoch": 0.25, + "learning_rate": 1.6972611994269097e-05, + "loss": 0.6759, + "step": 7350 + }, + { + "epoch": 0.25, + "learning_rate": 1.6971831435995275e-05, + "loss": 0.635, + "step": 7351 + }, + { + "epoch": 0.25, + "learning_rate": 1.6971050795061564e-05, + "loss": 0.6138, + "step": 7352 + }, + { + "epoch": 0.25, + "learning_rate": 1.6970270071477238e-05, + "loss": 0.6123, + "step": 7353 + }, + { + "epoch": 0.25, + "learning_rate": 1.6969489265251536e-05, + "loss": 0.5839, + "step": 7354 + }, + { + "epoch": 0.25, + "learning_rate": 1.6968708376393724e-05, + "loss": 0.6106, + "step": 7355 + }, + { + "epoch": 0.25, + "learning_rate": 1.696792740491306e-05, + "loss": 0.6357, + "step": 7356 + }, + { + "epoch": 0.25, + "learning_rate": 1.6967146350818802e-05, + "loss": 0.6181, + "step": 7357 + }, + { + "epoch": 0.25, + "learning_rate": 1.6966365214120207e-05, + "loss": 0.6175, + "step": 7358 + }, + { + "epoch": 0.25, + "learning_rate": 1.696558399482654e-05, + "loss": 0.6117, + "step": 7359 + }, + { + "epoch": 0.26, + "learning_rate": 1.696480269294707e-05, + "loss": 0.6425, + "step": 7360 + }, + { + "epoch": 0.26, + "learning_rate": 1.696402130849105e-05, + "loss": 0.6314, + "step": 7361 + }, + { + "epoch": 0.26, + "learning_rate": 1.6963239841467745e-05, + "loss": 0.6281, + "step": 7362 + }, + { + "epoch": 0.26, + "learning_rate": 1.6962458291886426e-05, + "loss": 0.6499, + "step": 7363 + }, + { + "epoch": 0.26, + "learning_rate": 1.6961676659756356e-05, + "loss": 0.6684, + "step": 7364 + }, + { + "epoch": 0.26, + "learning_rate": 1.69608949450868e-05, + "loss": 0.6122, + "step": 7365 + }, + { + "epoch": 0.26, + "learning_rate": 1.6960113147887032e-05, + "loss": 0.6781, + "step": 7366 + }, + { + "epoch": 0.26, + "learning_rate": 1.6959331268166318e-05, + "loss": 0.6128, + "step": 7367 + }, + { + "epoch": 0.26, + "learning_rate": 1.6958549305933926e-05, + "loss": 0.6566, + "step": 7368 + }, + { + "epoch": 0.26, + "learning_rate": 1.6957767261199132e-05, + "loss": 0.6426, + "step": 7369 + }, + { + "epoch": 0.26, + "learning_rate": 1.6956985133971206e-05, + "loss": 0.6444, + "step": 7370 + }, + { + "epoch": 0.26, + "learning_rate": 1.695620292425942e-05, + "loss": 0.6836, + "step": 7371 + }, + { + "epoch": 0.26, + "learning_rate": 1.6955420632073046e-05, + "loss": 0.6323, + "step": 7372 + }, + { + "epoch": 0.26, + "learning_rate": 1.6954638257421362e-05, + "loss": 0.6504, + "step": 7373 + }, + { + "epoch": 0.26, + "learning_rate": 1.6953855800313643e-05, + "loss": 0.6173, + "step": 7374 + }, + { + "epoch": 0.26, + "learning_rate": 1.6953073260759172e-05, + "loss": 0.6319, + "step": 7375 + }, + { + "epoch": 0.26, + "learning_rate": 1.6952290638767217e-05, + "loss": 0.648, + "step": 7376 + }, + { + "epoch": 0.26, + "learning_rate": 1.6951507934347063e-05, + "loss": 0.5749, + "step": 7377 + }, + { + "epoch": 0.26, + "learning_rate": 1.695072514750799e-05, + "loss": 0.6145, + "step": 7378 + }, + { + "epoch": 0.26, + "learning_rate": 1.6949942278259278e-05, + "loss": 0.676, + "step": 7379 + }, + { + "epoch": 0.26, + "learning_rate": 1.6949159326610204e-05, + "loss": 0.619, + "step": 7380 + }, + { + "epoch": 0.26, + "learning_rate": 1.6948376292570062e-05, + "loss": 0.5778, + "step": 7381 + }, + { + "epoch": 0.26, + "learning_rate": 1.6947593176148126e-05, + "loss": 0.6152, + "step": 7382 + }, + { + "epoch": 0.26, + "learning_rate": 1.6946809977353682e-05, + "loss": 0.5872, + "step": 7383 + }, + { + "epoch": 0.26, + "learning_rate": 1.694602669619602e-05, + "loss": 0.628, + "step": 7384 + }, + { + "epoch": 0.26, + "learning_rate": 1.6945243332684427e-05, + "loss": 0.6489, + "step": 7385 + }, + { + "epoch": 0.26, + "learning_rate": 1.6944459886828186e-05, + "loss": 0.7078, + "step": 7386 + }, + { + "epoch": 0.26, + "learning_rate": 1.694367635863659e-05, + "loss": 0.588, + "step": 7387 + }, + { + "epoch": 0.26, + "learning_rate": 1.6942892748118928e-05, + "loss": 0.6331, + "step": 7388 + }, + { + "epoch": 0.26, + "learning_rate": 1.6942109055284485e-05, + "loss": 0.6284, + "step": 7389 + }, + { + "epoch": 0.26, + "learning_rate": 1.694132528014256e-05, + "loss": 0.6317, + "step": 7390 + }, + { + "epoch": 0.26, + "learning_rate": 1.6940541422702445e-05, + "loss": 0.5889, + "step": 7391 + }, + { + "epoch": 0.26, + "learning_rate": 1.6939757482973425e-05, + "loss": 0.6238, + "step": 7392 + }, + { + "epoch": 0.26, + "learning_rate": 1.6938973460964808e-05, + "loss": 0.6512, + "step": 7393 + }, + { + "epoch": 0.26, + "learning_rate": 1.6938189356685882e-05, + "loss": 0.6436, + "step": 7394 + }, + { + "epoch": 0.26, + "learning_rate": 1.6937405170145943e-05, + "loss": 0.6523, + "step": 7395 + }, + { + "epoch": 0.26, + "learning_rate": 1.693662090135429e-05, + "loss": 0.6494, + "step": 7396 + }, + { + "epoch": 0.26, + "learning_rate": 1.693583655032022e-05, + "loss": 0.6254, + "step": 7397 + }, + { + "epoch": 0.26, + "learning_rate": 1.6935052117053033e-05, + "loss": 0.6572, + "step": 7398 + }, + { + "epoch": 0.26, + "learning_rate": 1.693426760156203e-05, + "loss": 0.625, + "step": 7399 + }, + { + "epoch": 0.26, + "learning_rate": 1.6933483003856517e-05, + "loss": 0.597, + "step": 7400 + }, + { + "epoch": 0.26, + "learning_rate": 1.693269832394579e-05, + "loss": 0.6277, + "step": 7401 + }, + { + "epoch": 0.26, + "learning_rate": 1.693191356183915e-05, + "loss": 0.5998, + "step": 7402 + }, + { + "epoch": 0.26, + "learning_rate": 1.6931128717545914e-05, + "loss": 0.6669, + "step": 7403 + }, + { + "epoch": 0.26, + "learning_rate": 1.6930343791075373e-05, + "loss": 0.6331, + "step": 7404 + }, + { + "epoch": 0.26, + "learning_rate": 1.6929558782436842e-05, + "loss": 0.6884, + "step": 7405 + }, + { + "epoch": 0.26, + "learning_rate": 1.692877369163963e-05, + "loss": 0.6979, + "step": 7406 + }, + { + "epoch": 0.26, + "learning_rate": 1.6927988518693034e-05, + "loss": 0.6245, + "step": 7407 + }, + { + "epoch": 0.26, + "learning_rate": 1.692720326360637e-05, + "loss": 0.6556, + "step": 7408 + }, + { + "epoch": 0.26, + "learning_rate": 1.692641792638895e-05, + "loss": 0.6452, + "step": 7409 + }, + { + "epoch": 0.26, + "learning_rate": 1.6925632507050087e-05, + "loss": 0.6156, + "step": 7410 + }, + { + "epoch": 0.26, + "learning_rate": 1.6924847005599084e-05, + "loss": 0.656, + "step": 7411 + }, + { + "epoch": 0.26, + "learning_rate": 1.6924061422045265e-05, + "loss": 0.6654, + "step": 7412 + }, + { + "epoch": 0.26, + "learning_rate": 1.6923275756397938e-05, + "loss": 0.6352, + "step": 7413 + }, + { + "epoch": 0.26, + "learning_rate": 1.6922490008666416e-05, + "loss": 0.669, + "step": 7414 + }, + { + "epoch": 0.26, + "learning_rate": 1.6921704178860018e-05, + "loss": 0.6086, + "step": 7415 + }, + { + "epoch": 0.26, + "learning_rate": 1.6920918266988063e-05, + "loss": 0.6775, + "step": 7416 + }, + { + "epoch": 0.26, + "learning_rate": 1.6920132273059866e-05, + "loss": 0.6257, + "step": 7417 + }, + { + "epoch": 0.26, + "learning_rate": 1.6919346197084748e-05, + "loss": 0.5923, + "step": 7418 + }, + { + "epoch": 0.26, + "learning_rate": 1.691856003907203e-05, + "loss": 0.6184, + "step": 7419 + }, + { + "epoch": 0.26, + "learning_rate": 1.6917773799031026e-05, + "loss": 0.6582, + "step": 7420 + }, + { + "epoch": 0.26, + "learning_rate": 1.691698747697106e-05, + "loss": 0.6897, + "step": 7421 + }, + { + "epoch": 0.26, + "learning_rate": 1.6916201072901465e-05, + "loss": 0.6685, + "step": 7422 + }, + { + "epoch": 0.26, + "learning_rate": 1.6915414586831553e-05, + "loss": 0.6625, + "step": 7423 + }, + { + "epoch": 0.26, + "learning_rate": 1.6914628018770652e-05, + "loss": 0.6749, + "step": 7424 + }, + { + "epoch": 0.26, + "learning_rate": 1.6913841368728095e-05, + "loss": 0.6036, + "step": 7425 + }, + { + "epoch": 0.26, + "learning_rate": 1.6913054636713196e-05, + "loss": 0.6688, + "step": 7426 + }, + { + "epoch": 0.26, + "learning_rate": 1.6912267822735293e-05, + "loss": 0.5863, + "step": 7427 + }, + { + "epoch": 0.26, + "learning_rate": 1.691148092680371e-05, + "loss": 0.5703, + "step": 7428 + }, + { + "epoch": 0.26, + "learning_rate": 1.6910693948927777e-05, + "loss": 0.6317, + "step": 7429 + }, + { + "epoch": 0.26, + "learning_rate": 1.6909906889116822e-05, + "loss": 0.619, + "step": 7430 + }, + { + "epoch": 0.26, + "learning_rate": 1.6909119747380184e-05, + "loss": 0.6391, + "step": 7431 + }, + { + "epoch": 0.26, + "learning_rate": 1.690833252372719e-05, + "loss": 0.7282, + "step": 7432 + }, + { + "epoch": 0.26, + "learning_rate": 1.6907545218167176e-05, + "loss": 0.6539, + "step": 7433 + }, + { + "epoch": 0.26, + "learning_rate": 1.6906757830709475e-05, + "loss": 0.6133, + "step": 7434 + }, + { + "epoch": 0.26, + "learning_rate": 1.690597036136342e-05, + "loss": 0.6649, + "step": 7435 + }, + { + "epoch": 0.26, + "learning_rate": 1.6905182810138353e-05, + "loss": 0.6155, + "step": 7436 + }, + { + "epoch": 0.26, + "learning_rate": 1.6904395177043608e-05, + "loss": 0.617, + "step": 7437 + }, + { + "epoch": 0.26, + "learning_rate": 1.6903607462088526e-05, + "loss": 0.5995, + "step": 7438 + }, + { + "epoch": 0.26, + "learning_rate": 1.690281966528244e-05, + "loss": 0.6814, + "step": 7439 + }, + { + "epoch": 0.26, + "learning_rate": 1.6902031786634697e-05, + "loss": 0.637, + "step": 7440 + }, + { + "epoch": 0.26, + "learning_rate": 1.690124382615464e-05, + "loss": 0.6163, + "step": 7441 + }, + { + "epoch": 0.26, + "learning_rate": 1.6900455783851603e-05, + "loss": 0.5606, + "step": 7442 + }, + { + "epoch": 0.26, + "learning_rate": 1.689966765973493e-05, + "loss": 0.6134, + "step": 7443 + }, + { + "epoch": 0.26, + "learning_rate": 1.689887945381398e-05, + "loss": 0.6659, + "step": 7444 + }, + { + "epoch": 0.26, + "learning_rate": 1.6898091166098077e-05, + "loss": 0.6286, + "step": 7445 + }, + { + "epoch": 0.26, + "learning_rate": 1.689730279659658e-05, + "loss": 0.584, + "step": 7446 + }, + { + "epoch": 0.26, + "learning_rate": 1.6896514345318834e-05, + "loss": 0.6608, + "step": 7447 + }, + { + "epoch": 0.26, + "learning_rate": 1.6895725812274184e-05, + "loss": 0.6723, + "step": 7448 + }, + { + "epoch": 0.26, + "learning_rate": 1.6894937197471987e-05, + "loss": 0.6883, + "step": 7449 + }, + { + "epoch": 0.26, + "learning_rate": 1.6894148500921583e-05, + "loss": 0.6146, + "step": 7450 + }, + { + "epoch": 0.26, + "learning_rate": 1.6893359722632326e-05, + "loss": 0.6362, + "step": 7451 + }, + { + "epoch": 0.26, + "learning_rate": 1.6892570862613572e-05, + "loss": 0.6392, + "step": 7452 + }, + { + "epoch": 0.26, + "learning_rate": 1.6891781920874672e-05, + "loss": 0.682, + "step": 7453 + }, + { + "epoch": 0.26, + "learning_rate": 1.6890992897424973e-05, + "loss": 0.6216, + "step": 7454 + }, + { + "epoch": 0.26, + "learning_rate": 1.6890203792273844e-05, + "loss": 0.6017, + "step": 7455 + }, + { + "epoch": 0.26, + "learning_rate": 1.688941460543063e-05, + "loss": 0.686, + "step": 7456 + }, + { + "epoch": 0.26, + "learning_rate": 1.688862533690469e-05, + "loss": 0.6104, + "step": 7457 + }, + { + "epoch": 0.26, + "learning_rate": 1.688783598670538e-05, + "loss": 0.6388, + "step": 7458 + }, + { + "epoch": 0.26, + "learning_rate": 1.6887046554842066e-05, + "loss": 0.6543, + "step": 7459 + }, + { + "epoch": 0.26, + "learning_rate": 1.68862570413241e-05, + "loss": 0.5787, + "step": 7460 + }, + { + "epoch": 0.26, + "learning_rate": 1.6885467446160845e-05, + "loss": 0.6616, + "step": 7461 + }, + { + "epoch": 0.26, + "learning_rate": 1.6884677769361667e-05, + "loss": 0.6271, + "step": 7462 + }, + { + "epoch": 0.26, + "learning_rate": 1.6883888010935924e-05, + "loss": 0.6452, + "step": 7463 + }, + { + "epoch": 0.26, + "learning_rate": 1.6883098170892975e-05, + "loss": 0.6672, + "step": 7464 + }, + { + "epoch": 0.26, + "learning_rate": 1.6882308249242197e-05, + "loss": 0.6159, + "step": 7465 + }, + { + "epoch": 0.26, + "learning_rate": 1.6881518245992944e-05, + "loss": 0.5754, + "step": 7466 + }, + { + "epoch": 0.26, + "learning_rate": 1.688072816115459e-05, + "loss": 0.6591, + "step": 7467 + }, + { + "epoch": 0.26, + "learning_rate": 1.6879937994736498e-05, + "loss": 0.6613, + "step": 7468 + }, + { + "epoch": 0.26, + "learning_rate": 1.687914774674804e-05, + "loss": 0.6145, + "step": 7469 + }, + { + "epoch": 0.26, + "learning_rate": 1.687835741719858e-05, + "loss": 0.6292, + "step": 7470 + }, + { + "epoch": 0.26, + "learning_rate": 1.6877567006097494e-05, + "loss": 0.6315, + "step": 7471 + }, + { + "epoch": 0.26, + "learning_rate": 1.687677651345415e-05, + "loss": 0.6473, + "step": 7472 + }, + { + "epoch": 0.26, + "learning_rate": 1.687598593927792e-05, + "loss": 0.7176, + "step": 7473 + }, + { + "epoch": 0.26, + "learning_rate": 1.6875195283578178e-05, + "loss": 0.6524, + "step": 7474 + }, + { + "epoch": 0.26, + "learning_rate": 1.68744045463643e-05, + "loss": 0.5979, + "step": 7475 + }, + { + "epoch": 0.26, + "learning_rate": 1.6873613727645662e-05, + "loss": 0.6477, + "step": 7476 + }, + { + "epoch": 0.26, + "learning_rate": 1.6872822827431635e-05, + "loss": 0.6444, + "step": 7477 + }, + { + "epoch": 0.26, + "learning_rate": 1.68720318457316e-05, + "loss": 0.6494, + "step": 7478 + }, + { + "epoch": 0.26, + "learning_rate": 1.6871240782554937e-05, + "loss": 0.5808, + "step": 7479 + }, + { + "epoch": 0.26, + "learning_rate": 1.687044963791102e-05, + "loss": 0.625, + "step": 7480 + }, + { + "epoch": 0.26, + "learning_rate": 1.6869658411809232e-05, + "loss": 0.6904, + "step": 7481 + }, + { + "epoch": 0.26, + "learning_rate": 1.686886710425895e-05, + "loss": 0.664, + "step": 7482 + }, + { + "epoch": 0.26, + "learning_rate": 1.6868075715269566e-05, + "loss": 0.6704, + "step": 7483 + }, + { + "epoch": 0.26, + "learning_rate": 1.6867284244850452e-05, + "loss": 0.6466, + "step": 7484 + }, + { + "epoch": 0.26, + "learning_rate": 1.6866492693010997e-05, + "loss": 0.6463, + "step": 7485 + }, + { + "epoch": 0.26, + "learning_rate": 1.6865701059760583e-05, + "loss": 0.637, + "step": 7486 + }, + { + "epoch": 0.26, + "learning_rate": 1.6864909345108602e-05, + "loss": 0.6489, + "step": 7487 + }, + { + "epoch": 0.26, + "learning_rate": 1.6864117549064432e-05, + "loss": 0.6508, + "step": 7488 + }, + { + "epoch": 0.26, + "learning_rate": 1.686332567163747e-05, + "loss": 0.6511, + "step": 7489 + }, + { + "epoch": 0.26, + "learning_rate": 1.6862533712837097e-05, + "loss": 0.6368, + "step": 7490 + }, + { + "epoch": 0.26, + "learning_rate": 1.6861741672672706e-05, + "loss": 0.6577, + "step": 7491 + }, + { + "epoch": 0.26, + "learning_rate": 1.6860949551153687e-05, + "loss": 0.6114, + "step": 7492 + }, + { + "epoch": 0.26, + "learning_rate": 1.6860157348289435e-05, + "loss": 0.6154, + "step": 7493 + }, + { + "epoch": 0.26, + "learning_rate": 1.6859365064089336e-05, + "loss": 0.6466, + "step": 7494 + }, + { + "epoch": 0.26, + "learning_rate": 1.6858572698562788e-05, + "loss": 0.6137, + "step": 7495 + }, + { + "epoch": 0.26, + "learning_rate": 1.6857780251719183e-05, + "loss": 0.6315, + "step": 7496 + }, + { + "epoch": 0.26, + "learning_rate": 1.685698772356792e-05, + "loss": 0.6619, + "step": 7497 + }, + { + "epoch": 0.26, + "learning_rate": 1.6856195114118394e-05, + "loss": 0.6531, + "step": 7498 + }, + { + "epoch": 0.26, + "learning_rate": 1.685540242338e-05, + "loss": 0.6301, + "step": 7499 + }, + { + "epoch": 0.26, + "learning_rate": 1.6854609651362137e-05, + "loss": 0.6248, + "step": 7500 + }, + { + "epoch": 0.26, + "learning_rate": 1.6853816798074207e-05, + "loss": 0.6332, + "step": 7501 + }, + { + "epoch": 0.26, + "learning_rate": 1.685302386352561e-05, + "loss": 0.6999, + "step": 7502 + }, + { + "epoch": 0.26, + "learning_rate": 1.6852230847725745e-05, + "loss": 0.5905, + "step": 7503 + }, + { + "epoch": 0.26, + "learning_rate": 1.6851437750684014e-05, + "loss": 0.6329, + "step": 7504 + }, + { + "epoch": 0.26, + "learning_rate": 1.6850644572409824e-05, + "loss": 0.664, + "step": 7505 + }, + { + "epoch": 0.26, + "learning_rate": 1.6849851312912574e-05, + "loss": 0.6062, + "step": 7506 + }, + { + "epoch": 0.26, + "learning_rate": 1.6849057972201672e-05, + "loss": 0.6127, + "step": 7507 + }, + { + "epoch": 0.26, + "learning_rate": 1.6848264550286525e-05, + "loss": 0.5974, + "step": 7508 + }, + { + "epoch": 0.26, + "learning_rate": 1.684747104717654e-05, + "loss": 0.6171, + "step": 7509 + }, + { + "epoch": 0.26, + "learning_rate": 1.6846677462881116e-05, + "loss": 0.6236, + "step": 7510 + }, + { + "epoch": 0.26, + "learning_rate": 1.684588379740968e-05, + "loss": 0.5907, + "step": 7511 + }, + { + "epoch": 0.26, + "learning_rate": 1.6845090050771628e-05, + "loss": 0.6249, + "step": 7512 + }, + { + "epoch": 0.26, + "learning_rate": 1.6844296222976368e-05, + "loss": 0.6252, + "step": 7513 + }, + { + "epoch": 0.26, + "learning_rate": 1.6843502314033323e-05, + "loss": 0.6609, + "step": 7514 + }, + { + "epoch": 0.26, + "learning_rate": 1.6842708323951904e-05, + "loss": 0.6262, + "step": 7515 + }, + { + "epoch": 0.26, + "learning_rate": 1.6841914252741516e-05, + "loss": 0.5856, + "step": 7516 + }, + { + "epoch": 0.26, + "learning_rate": 1.6841120100411584e-05, + "loss": 0.6316, + "step": 7517 + }, + { + "epoch": 0.26, + "learning_rate": 1.6840325866971517e-05, + "loss": 0.6284, + "step": 7518 + }, + { + "epoch": 0.26, + "learning_rate": 1.6839531552430736e-05, + "loss": 0.661, + "step": 7519 + }, + { + "epoch": 0.26, + "learning_rate": 1.6838737156798653e-05, + "loss": 0.6628, + "step": 7520 + }, + { + "epoch": 0.26, + "learning_rate": 1.683794268008469e-05, + "loss": 0.6244, + "step": 7521 + }, + { + "epoch": 0.26, + "learning_rate": 1.683714812229827e-05, + "loss": 0.6368, + "step": 7522 + }, + { + "epoch": 0.26, + "learning_rate": 1.6836353483448807e-05, + "loss": 0.6858, + "step": 7523 + }, + { + "epoch": 0.26, + "learning_rate": 1.6835558763545728e-05, + "loss": 0.6845, + "step": 7524 + }, + { + "epoch": 0.26, + "learning_rate": 1.6834763962598452e-05, + "loss": 0.5765, + "step": 7525 + }, + { + "epoch": 0.26, + "learning_rate": 1.68339690806164e-05, + "loss": 0.652, + "step": 7526 + }, + { + "epoch": 0.26, + "learning_rate": 1.6833174117609002e-05, + "loss": 0.5468, + "step": 7527 + }, + { + "epoch": 0.26, + "learning_rate": 1.683237907358568e-05, + "loss": 0.7273, + "step": 7528 + }, + { + "epoch": 0.26, + "learning_rate": 1.6831583948555863e-05, + "loss": 0.6211, + "step": 7529 + }, + { + "epoch": 0.26, + "learning_rate": 1.6830788742528975e-05, + "loss": 0.6394, + "step": 7530 + }, + { + "epoch": 0.26, + "learning_rate": 1.6829993455514445e-05, + "loss": 0.6083, + "step": 7531 + }, + { + "epoch": 0.26, + "learning_rate": 1.6829198087521705e-05, + "loss": 0.6699, + "step": 7532 + }, + { + "epoch": 0.26, + "learning_rate": 1.682840263856018e-05, + "loss": 0.6207, + "step": 7533 + }, + { + "epoch": 0.26, + "learning_rate": 1.6827607108639304e-05, + "loss": 0.6394, + "step": 7534 + }, + { + "epoch": 0.26, + "learning_rate": 1.6826811497768513e-05, + "loss": 0.6235, + "step": 7535 + }, + { + "epoch": 0.26, + "learning_rate": 1.682601580595723e-05, + "loss": 0.6883, + "step": 7536 + }, + { + "epoch": 0.26, + "learning_rate": 1.6825220033214897e-05, + "loss": 0.6533, + "step": 7537 + }, + { + "epoch": 0.26, + "learning_rate": 1.6824424179550947e-05, + "loss": 0.6835, + "step": 7538 + }, + { + "epoch": 0.26, + "learning_rate": 1.6823628244974816e-05, + "loss": 0.6695, + "step": 7539 + }, + { + "epoch": 0.26, + "learning_rate": 1.682283222949594e-05, + "loss": 0.5917, + "step": 7540 + }, + { + "epoch": 0.26, + "learning_rate": 1.682203613312375e-05, + "loss": 0.7009, + "step": 7541 + }, + { + "epoch": 0.26, + "learning_rate": 1.68212399558677e-05, + "loss": 0.6497, + "step": 7542 + }, + { + "epoch": 0.26, + "learning_rate": 1.682044369773722e-05, + "loss": 0.6498, + "step": 7543 + }, + { + "epoch": 0.26, + "learning_rate": 1.681964735874175e-05, + "loss": 0.6564, + "step": 7544 + }, + { + "epoch": 0.26, + "learning_rate": 1.6818850938890735e-05, + "loss": 0.6482, + "step": 7545 + }, + { + "epoch": 0.26, + "learning_rate": 1.6818054438193615e-05, + "loss": 0.585, + "step": 7546 + }, + { + "epoch": 0.26, + "learning_rate": 1.6817257856659837e-05, + "loss": 0.6494, + "step": 7547 + }, + { + "epoch": 0.26, + "learning_rate": 1.6816461194298842e-05, + "loss": 0.7678, + "step": 7548 + }, + { + "epoch": 0.26, + "learning_rate": 1.681566445112008e-05, + "loss": 0.5734, + "step": 7549 + }, + { + "epoch": 0.26, + "learning_rate": 1.681486762713299e-05, + "loss": 0.6589, + "step": 7550 + }, + { + "epoch": 0.26, + "learning_rate": 1.6814070722347024e-05, + "loss": 0.5806, + "step": 7551 + }, + { + "epoch": 0.26, + "learning_rate": 1.681327373677163e-05, + "loss": 0.6014, + "step": 7552 + }, + { + "epoch": 0.26, + "learning_rate": 1.6812476670416257e-05, + "loss": 0.6026, + "step": 7553 + }, + { + "epoch": 0.26, + "learning_rate": 1.6811679523290358e-05, + "loss": 0.6519, + "step": 7554 + }, + { + "epoch": 0.26, + "learning_rate": 1.6810882295403373e-05, + "loss": 0.6264, + "step": 7555 + }, + { + "epoch": 0.26, + "learning_rate": 1.681008498676477e-05, + "loss": 0.6839, + "step": 7556 + }, + { + "epoch": 0.26, + "learning_rate": 1.6809287597383992e-05, + "loss": 0.6282, + "step": 7557 + }, + { + "epoch": 0.26, + "learning_rate": 1.6808490127270498e-05, + "loss": 0.6158, + "step": 7558 + }, + { + "epoch": 0.26, + "learning_rate": 1.680769257643374e-05, + "loss": 0.6586, + "step": 7559 + }, + { + "epoch": 0.26, + "learning_rate": 1.6806894944883173e-05, + "loss": 0.6373, + "step": 7560 + }, + { + "epoch": 0.26, + "learning_rate": 1.6806097232628258e-05, + "loss": 0.6018, + "step": 7561 + }, + { + "epoch": 0.26, + "learning_rate": 1.680529943967845e-05, + "loss": 0.6907, + "step": 7562 + }, + { + "epoch": 0.26, + "learning_rate": 1.680450156604321e-05, + "loss": 0.6197, + "step": 7563 + }, + { + "epoch": 0.26, + "learning_rate": 1.680370361173199e-05, + "loss": 0.59, + "step": 7564 + }, + { + "epoch": 0.26, + "learning_rate": 1.6802905576754263e-05, + "loss": 0.6058, + "step": 7565 + }, + { + "epoch": 0.26, + "learning_rate": 1.680210746111948e-05, + "loss": 0.6178, + "step": 7566 + }, + { + "epoch": 0.26, + "learning_rate": 1.6801309264837112e-05, + "loss": 0.701, + "step": 7567 + }, + { + "epoch": 0.26, + "learning_rate": 1.6800510987916617e-05, + "loss": 0.6167, + "step": 7568 + }, + { + "epoch": 0.26, + "learning_rate": 1.6799712630367463e-05, + "loss": 0.63, + "step": 7569 + }, + { + "epoch": 0.26, + "learning_rate": 1.6798914192199115e-05, + "loss": 0.6019, + "step": 7570 + }, + { + "epoch": 0.26, + "learning_rate": 1.6798115673421034e-05, + "loss": 0.6163, + "step": 7571 + }, + { + "epoch": 0.26, + "learning_rate": 1.67973170740427e-05, + "loss": 0.6617, + "step": 7572 + }, + { + "epoch": 0.26, + "learning_rate": 1.6796518394073568e-05, + "loss": 0.6574, + "step": 7573 + }, + { + "epoch": 0.26, + "learning_rate": 1.6795719633523112e-05, + "loss": 0.6299, + "step": 7574 + }, + { + "epoch": 0.26, + "learning_rate": 1.6794920792400805e-05, + "loss": 0.6297, + "step": 7575 + }, + { + "epoch": 0.26, + "learning_rate": 1.6794121870716117e-05, + "loss": 0.6475, + "step": 7576 + }, + { + "epoch": 0.26, + "learning_rate": 1.6793322868478518e-05, + "loss": 0.6566, + "step": 7577 + }, + { + "epoch": 0.26, + "learning_rate": 1.679252378569748e-05, + "loss": 0.6302, + "step": 7578 + }, + { + "epoch": 0.26, + "learning_rate": 1.6791724622382486e-05, + "loss": 0.6159, + "step": 7579 + }, + { + "epoch": 0.26, + "learning_rate": 1.6790925378543002e-05, + "loss": 0.6636, + "step": 7580 + }, + { + "epoch": 0.26, + "learning_rate": 1.6790126054188507e-05, + "loss": 0.6183, + "step": 7581 + }, + { + "epoch": 0.26, + "learning_rate": 1.6789326649328478e-05, + "loss": 0.619, + "step": 7582 + }, + { + "epoch": 0.26, + "learning_rate": 1.6788527163972396e-05, + "loss": 0.6323, + "step": 7583 + }, + { + "epoch": 0.26, + "learning_rate": 1.6787727598129733e-05, + "loss": 0.6319, + "step": 7584 + }, + { + "epoch": 0.26, + "learning_rate": 1.6786927951809975e-05, + "loss": 0.6489, + "step": 7585 + }, + { + "epoch": 0.26, + "learning_rate": 1.67861282250226e-05, + "loss": 0.6439, + "step": 7586 + }, + { + "epoch": 0.26, + "learning_rate": 1.678532841777709e-05, + "loss": 0.6295, + "step": 7587 + }, + { + "epoch": 0.26, + "learning_rate": 1.6784528530082927e-05, + "loss": 0.6918, + "step": 7588 + }, + { + "epoch": 0.26, + "learning_rate": 1.6783728561949596e-05, + "loss": 0.6112, + "step": 7589 + }, + { + "epoch": 0.26, + "learning_rate": 1.6782928513386583e-05, + "loss": 0.6791, + "step": 7590 + }, + { + "epoch": 0.26, + "learning_rate": 1.6782128384403372e-05, + "loss": 0.6296, + "step": 7591 + }, + { + "epoch": 0.26, + "learning_rate": 1.678132817500945e-05, + "loss": 0.6411, + "step": 7592 + }, + { + "epoch": 0.26, + "learning_rate": 1.6780527885214303e-05, + "loss": 0.6683, + "step": 7593 + }, + { + "epoch": 0.26, + "learning_rate": 1.6779727515027418e-05, + "loss": 0.6256, + "step": 7594 + }, + { + "epoch": 0.26, + "learning_rate": 1.677892706445829e-05, + "loss": 0.6708, + "step": 7595 + }, + { + "epoch": 0.26, + "learning_rate": 1.6778126533516406e-05, + "loss": 0.6229, + "step": 7596 + }, + { + "epoch": 0.26, + "learning_rate": 1.677732592221126e-05, + "loss": 0.6145, + "step": 7597 + }, + { + "epoch": 0.26, + "learning_rate": 1.677652523055234e-05, + "loss": 0.6392, + "step": 7598 + }, + { + "epoch": 0.26, + "learning_rate": 1.6775724458549138e-05, + "loss": 0.6069, + "step": 7599 + }, + { + "epoch": 0.26, + "learning_rate": 1.6774923606211154e-05, + "loss": 0.6342, + "step": 7600 + }, + { + "epoch": 0.26, + "learning_rate": 1.677412267354788e-05, + "loss": 0.6288, + "step": 7601 + }, + { + "epoch": 0.26, + "learning_rate": 1.6773321660568813e-05, + "loss": 0.5799, + "step": 7602 + }, + { + "epoch": 0.26, + "learning_rate": 1.6772520567283447e-05, + "loss": 0.6064, + "step": 7603 + }, + { + "epoch": 0.26, + "learning_rate": 1.6771719393701286e-05, + "loss": 0.6453, + "step": 7604 + }, + { + "epoch": 0.26, + "learning_rate": 1.6770918139831822e-05, + "loss": 0.6659, + "step": 7605 + }, + { + "epoch": 0.26, + "learning_rate": 1.677011680568456e-05, + "loss": 0.6164, + "step": 7606 + }, + { + "epoch": 0.26, + "learning_rate": 1.6769315391268997e-05, + "loss": 0.6224, + "step": 7607 + }, + { + "epoch": 0.26, + "learning_rate": 1.676851389659464e-05, + "loss": 0.6352, + "step": 7608 + }, + { + "epoch": 0.26, + "learning_rate": 1.6767712321670985e-05, + "loss": 0.6689, + "step": 7609 + }, + { + "epoch": 0.26, + "learning_rate": 1.6766910666507544e-05, + "loss": 0.5952, + "step": 7610 + }, + { + "epoch": 0.26, + "learning_rate": 1.6766108931113812e-05, + "loss": 0.6321, + "step": 7611 + }, + { + "epoch": 0.26, + "learning_rate": 1.6765307115499305e-05, + "loss": 0.6475, + "step": 7612 + }, + { + "epoch": 0.26, + "learning_rate": 1.6764505219673518e-05, + "loss": 0.6751, + "step": 7613 + }, + { + "epoch": 0.26, + "learning_rate": 1.676370324364597e-05, + "loss": 0.6979, + "step": 7614 + }, + { + "epoch": 0.26, + "learning_rate": 1.676290118742616e-05, + "loss": 0.6563, + "step": 7615 + }, + { + "epoch": 0.26, + "learning_rate": 1.67620990510236e-05, + "loss": 0.6386, + "step": 7616 + }, + { + "epoch": 0.26, + "learning_rate": 1.6761296834447804e-05, + "loss": 0.6635, + "step": 7617 + }, + { + "epoch": 0.26, + "learning_rate": 1.6760494537708282e-05, + "loss": 0.6462, + "step": 7618 + }, + { + "epoch": 0.26, + "learning_rate": 1.6759692160814544e-05, + "loss": 0.5732, + "step": 7619 + }, + { + "epoch": 0.26, + "learning_rate": 1.6758889703776104e-05, + "loss": 0.6457, + "step": 7620 + }, + { + "epoch": 0.26, + "learning_rate": 1.6758087166602476e-05, + "loss": 0.6229, + "step": 7621 + }, + { + "epoch": 0.26, + "learning_rate": 1.6757284549303176e-05, + "loss": 0.6478, + "step": 7622 + }, + { + "epoch": 0.26, + "learning_rate": 1.6756481851887723e-05, + "loss": 0.6374, + "step": 7623 + }, + { + "epoch": 0.26, + "learning_rate": 1.6755679074365626e-05, + "loss": 0.6694, + "step": 7624 + }, + { + "epoch": 0.26, + "learning_rate": 1.675487621674641e-05, + "loss": 0.6553, + "step": 7625 + }, + { + "epoch": 0.26, + "learning_rate": 1.675407327903959e-05, + "loss": 0.6589, + "step": 7626 + }, + { + "epoch": 0.26, + "learning_rate": 1.6753270261254687e-05, + "loss": 0.6437, + "step": 7627 + }, + { + "epoch": 0.26, + "learning_rate": 1.6752467163401226e-05, + "loss": 0.649, + "step": 7628 + }, + { + "epoch": 0.26, + "learning_rate": 1.6751663985488722e-05, + "loss": 0.6168, + "step": 7629 + }, + { + "epoch": 0.26, + "learning_rate": 1.67508607275267e-05, + "loss": 0.6582, + "step": 7630 + }, + { + "epoch": 0.26, + "learning_rate": 1.6750057389524682e-05, + "loss": 0.6226, + "step": 7631 + }, + { + "epoch": 0.26, + "learning_rate": 1.67492539714922e-05, + "loss": 0.6452, + "step": 7632 + }, + { + "epoch": 0.26, + "learning_rate": 1.6748450473438773e-05, + "loss": 0.6101, + "step": 7633 + }, + { + "epoch": 0.26, + "learning_rate": 1.674764689537393e-05, + "loss": 0.6024, + "step": 7634 + }, + { + "epoch": 0.26, + "learning_rate": 1.6746843237307195e-05, + "loss": 0.6164, + "step": 7635 + }, + { + "epoch": 0.26, + "learning_rate": 1.6746039499248096e-05, + "loss": 0.6315, + "step": 7636 + }, + { + "epoch": 0.26, + "learning_rate": 1.6745235681206166e-05, + "loss": 0.6428, + "step": 7637 + }, + { + "epoch": 0.26, + "learning_rate": 1.674443178319094e-05, + "loss": 0.6774, + "step": 7638 + }, + { + "epoch": 0.26, + "learning_rate": 1.674362780521194e-05, + "loss": 0.6459, + "step": 7639 + }, + { + "epoch": 0.26, + "learning_rate": 1.6742823747278698e-05, + "loss": 0.6525, + "step": 7640 + }, + { + "epoch": 0.26, + "learning_rate": 1.6742019609400756e-05, + "loss": 0.6083, + "step": 7641 + }, + { + "epoch": 0.26, + "learning_rate": 1.674121539158764e-05, + "loss": 0.6771, + "step": 7642 + }, + { + "epoch": 0.26, + "learning_rate": 1.674041109384889e-05, + "loss": 0.6199, + "step": 7643 + }, + { + "epoch": 0.26, + "learning_rate": 1.6739606716194036e-05, + "loss": 0.6204, + "step": 7644 + }, + { + "epoch": 0.26, + "learning_rate": 1.6738802258632622e-05, + "loss": 0.6013, + "step": 7645 + }, + { + "epoch": 0.26, + "learning_rate": 1.6737997721174178e-05, + "loss": 0.6486, + "step": 7646 + }, + { + "epoch": 0.26, + "learning_rate": 1.6737193103828252e-05, + "loss": 0.6048, + "step": 7647 + }, + { + "epoch": 0.26, + "learning_rate": 1.673638840660438e-05, + "loss": 0.6451, + "step": 7648 + }, + { + "epoch": 0.27, + "learning_rate": 1.67355836295121e-05, + "loss": 0.6486, + "step": 7649 + }, + { + "epoch": 0.27, + "learning_rate": 1.6734778772560954e-05, + "loss": 0.668, + "step": 7650 + }, + { + "epoch": 0.27, + "learning_rate": 1.673397383576049e-05, + "loss": 0.5881, + "step": 7651 + }, + { + "epoch": 0.27, + "learning_rate": 1.6733168819120244e-05, + "loss": 0.6121, + "step": 7652 + }, + { + "epoch": 0.27, + "learning_rate": 1.6732363722649765e-05, + "loss": 0.6149, + "step": 7653 + }, + { + "epoch": 0.27, + "learning_rate": 1.67315585463586e-05, + "loss": 0.6227, + "step": 7654 + }, + { + "epoch": 0.27, + "learning_rate": 1.673075329025629e-05, + "loss": 0.5831, + "step": 7655 + }, + { + "epoch": 0.27, + "learning_rate": 1.6729947954352387e-05, + "loss": 0.6537, + "step": 7656 + }, + { + "epoch": 0.27, + "learning_rate": 1.6729142538656434e-05, + "loss": 0.6498, + "step": 7657 + }, + { + "epoch": 0.27, + "learning_rate": 1.6728337043177987e-05, + "loss": 0.6214, + "step": 7658 + }, + { + "epoch": 0.27, + "learning_rate": 1.672753146792659e-05, + "loss": 0.6434, + "step": 7659 + }, + { + "epoch": 0.27, + "learning_rate": 1.6726725812911803e-05, + "loss": 0.591, + "step": 7660 + }, + { + "epoch": 0.27, + "learning_rate": 1.672592007814317e-05, + "loss": 0.6201, + "step": 7661 + }, + { + "epoch": 0.27, + "learning_rate": 1.6725114263630245e-05, + "loss": 0.6479, + "step": 7662 + }, + { + "epoch": 0.27, + "learning_rate": 1.672430836938258e-05, + "loss": 0.6507, + "step": 7663 + }, + { + "epoch": 0.27, + "learning_rate": 1.6723502395409737e-05, + "loss": 0.6556, + "step": 7664 + }, + { + "epoch": 0.27, + "learning_rate": 1.6722696341721267e-05, + "loss": 0.5714, + "step": 7665 + }, + { + "epoch": 0.27, + "learning_rate": 1.672189020832673e-05, + "loss": 0.6272, + "step": 7666 + }, + { + "epoch": 0.27, + "learning_rate": 1.6721083995235678e-05, + "loss": 0.6292, + "step": 7667 + }, + { + "epoch": 0.27, + "learning_rate": 1.672027770245767e-05, + "loss": 0.6034, + "step": 7668 + }, + { + "epoch": 0.27, + "learning_rate": 1.6719471330002277e-05, + "loss": 0.6665, + "step": 7669 + }, + { + "epoch": 0.27, + "learning_rate": 1.6718664877879046e-05, + "loss": 0.6498, + "step": 7670 + }, + { + "epoch": 0.27, + "learning_rate": 1.6717858346097543e-05, + "loss": 0.6197, + "step": 7671 + }, + { + "epoch": 0.27, + "learning_rate": 1.6717051734667334e-05, + "loss": 0.5976, + "step": 7672 + }, + { + "epoch": 0.27, + "learning_rate": 1.6716245043597976e-05, + "loss": 0.6317, + "step": 7673 + }, + { + "epoch": 0.27, + "learning_rate": 1.671543827289904e-05, + "loss": 0.6078, + "step": 7674 + }, + { + "epoch": 0.27, + "learning_rate": 1.6714631422580088e-05, + "loss": 0.6317, + "step": 7675 + }, + { + "epoch": 0.27, + "learning_rate": 1.6713824492650684e-05, + "loss": 0.6429, + "step": 7676 + }, + { + "epoch": 0.27, + "learning_rate": 1.67130174831204e-05, + "loss": 0.6714, + "step": 7677 + }, + { + "epoch": 0.27, + "learning_rate": 1.67122103939988e-05, + "loss": 0.6499, + "step": 7678 + }, + { + "epoch": 0.27, + "learning_rate": 1.671140322529546e-05, + "loss": 0.6318, + "step": 7679 + }, + { + "epoch": 0.27, + "learning_rate": 1.671059597701994e-05, + "loss": 0.5943, + "step": 7680 + }, + { + "epoch": 0.27, + "learning_rate": 1.6709788649181817e-05, + "loss": 0.6454, + "step": 7681 + }, + { + "epoch": 0.27, + "learning_rate": 1.670898124179066e-05, + "loss": 0.6095, + "step": 7682 + }, + { + "epoch": 0.27, + "learning_rate": 1.6708173754856044e-05, + "loss": 0.6791, + "step": 7683 + }, + { + "epoch": 0.27, + "learning_rate": 1.6707366188387543e-05, + "loss": 0.6097, + "step": 7684 + }, + { + "epoch": 0.27, + "learning_rate": 1.670655854239473e-05, + "loss": 0.655, + "step": 7685 + }, + { + "epoch": 0.27, + "learning_rate": 1.6705750816887182e-05, + "loss": 0.6669, + "step": 7686 + }, + { + "epoch": 0.27, + "learning_rate": 1.6704943011874478e-05, + "loss": 0.6122, + "step": 7687 + }, + { + "epoch": 0.27, + "learning_rate": 1.6704135127366187e-05, + "loss": 0.6989, + "step": 7688 + }, + { + "epoch": 0.27, + "learning_rate": 1.67033271633719e-05, + "loss": 0.6387, + "step": 7689 + }, + { + "epoch": 0.27, + "learning_rate": 1.6702519119901183e-05, + "loss": 0.642, + "step": 7690 + }, + { + "epoch": 0.27, + "learning_rate": 1.6701710996963627e-05, + "loss": 0.619, + "step": 7691 + }, + { + "epoch": 0.27, + "learning_rate": 1.670090279456881e-05, + "loss": 0.6384, + "step": 7692 + }, + { + "epoch": 0.27, + "learning_rate": 1.6700094512726312e-05, + "loss": 0.6127, + "step": 7693 + }, + { + "epoch": 0.27, + "learning_rate": 1.669928615144572e-05, + "loss": 0.6568, + "step": 7694 + }, + { + "epoch": 0.27, + "learning_rate": 1.6698477710736615e-05, + "loss": 0.6714, + "step": 7695 + }, + { + "epoch": 0.27, + "learning_rate": 1.669766919060858e-05, + "loss": 0.6279, + "step": 7696 + }, + { + "epoch": 0.27, + "learning_rate": 1.6696860591071205e-05, + "loss": 0.6449, + "step": 7697 + }, + { + "epoch": 0.27, + "learning_rate": 1.669605191213408e-05, + "loss": 0.6193, + "step": 7698 + }, + { + "epoch": 0.27, + "learning_rate": 1.6695243153806787e-05, + "loss": 0.5965, + "step": 7699 + }, + { + "epoch": 0.27, + "learning_rate": 1.6694434316098917e-05, + "loss": 0.6316, + "step": 7700 + }, + { + "epoch": 0.27, + "learning_rate": 1.6693625399020058e-05, + "loss": 0.5819, + "step": 7701 + }, + { + "epoch": 0.27, + "learning_rate": 1.6692816402579806e-05, + "loss": 0.6918, + "step": 7702 + }, + { + "epoch": 0.27, + "learning_rate": 1.669200732678775e-05, + "loss": 0.5988, + "step": 7703 + }, + { + "epoch": 0.27, + "learning_rate": 1.6691198171653475e-05, + "loss": 0.6192, + "step": 7704 + }, + { + "epoch": 0.27, + "learning_rate": 1.6690388937186586e-05, + "loss": 0.6333, + "step": 7705 + }, + { + "epoch": 0.27, + "learning_rate": 1.668957962339667e-05, + "loss": 0.6409, + "step": 7706 + }, + { + "epoch": 0.27, + "learning_rate": 1.668877023029333e-05, + "loss": 0.6259, + "step": 7707 + }, + { + "epoch": 0.27, + "learning_rate": 1.6687960757886156e-05, + "loss": 0.6048, + "step": 7708 + }, + { + "epoch": 0.27, + "learning_rate": 1.668715120618474e-05, + "loss": 0.6374, + "step": 7709 + }, + { + "epoch": 0.27, + "learning_rate": 1.6686341575198694e-05, + "loss": 0.7457, + "step": 7710 + }, + { + "epoch": 0.27, + "learning_rate": 1.668553186493761e-05, + "loss": 0.6033, + "step": 7711 + }, + { + "epoch": 0.27, + "learning_rate": 1.668472207541109e-05, + "loss": 0.6525, + "step": 7712 + }, + { + "epoch": 0.27, + "learning_rate": 1.6683912206628728e-05, + "loss": 0.5833, + "step": 7713 + }, + { + "epoch": 0.27, + "learning_rate": 1.6683102258600133e-05, + "loss": 0.6839, + "step": 7714 + }, + { + "epoch": 0.27, + "learning_rate": 1.6682292231334912e-05, + "loss": 0.6265, + "step": 7715 + }, + { + "epoch": 0.27, + "learning_rate": 1.6681482124842658e-05, + "loss": 0.6093, + "step": 7716 + }, + { + "epoch": 0.27, + "learning_rate": 1.6680671939132983e-05, + "loss": 0.7036, + "step": 7717 + }, + { + "epoch": 0.27, + "learning_rate": 1.667986167421549e-05, + "loss": 0.6379, + "step": 7718 + }, + { + "epoch": 0.27, + "learning_rate": 1.667905133009979e-05, + "loss": 0.672, + "step": 7719 + }, + { + "epoch": 0.27, + "learning_rate": 1.6678240906795484e-05, + "loss": 0.6148, + "step": 7720 + }, + { + "epoch": 0.27, + "learning_rate": 1.6677430404312186e-05, + "loss": 0.5953, + "step": 7721 + }, + { + "epoch": 0.27, + "learning_rate": 1.6676619822659504e-05, + "loss": 0.6249, + "step": 7722 + }, + { + "epoch": 0.27, + "learning_rate": 1.6675809161847046e-05, + "loss": 0.6359, + "step": 7723 + }, + { + "epoch": 0.27, + "learning_rate": 1.6674998421884424e-05, + "loss": 0.6871, + "step": 7724 + }, + { + "epoch": 0.27, + "learning_rate": 1.6674187602781254e-05, + "loss": 0.6104, + "step": 7725 + }, + { + "epoch": 0.27, + "learning_rate": 1.6673376704547148e-05, + "loss": 0.6286, + "step": 7726 + }, + { + "epoch": 0.27, + "learning_rate": 1.667256572719172e-05, + "loss": 0.6596, + "step": 7727 + }, + { + "epoch": 0.27, + "learning_rate": 1.667175467072458e-05, + "loss": 0.607, + "step": 7728 + }, + { + "epoch": 0.27, + "learning_rate": 1.6670943535155353e-05, + "loss": 0.6645, + "step": 7729 + }, + { + "epoch": 0.27, + "learning_rate": 1.667013232049365e-05, + "loss": 0.6464, + "step": 7730 + }, + { + "epoch": 0.27, + "learning_rate": 1.666932102674909e-05, + "loss": 0.5897, + "step": 7731 + }, + { + "epoch": 0.27, + "learning_rate": 1.666850965393129e-05, + "loss": 0.6346, + "step": 7732 + }, + { + "epoch": 0.27, + "learning_rate": 1.666769820204988e-05, + "loss": 0.6064, + "step": 7733 + }, + { + "epoch": 0.27, + "learning_rate": 1.666688667111447e-05, + "loss": 0.6003, + "step": 7734 + }, + { + "epoch": 0.27, + "learning_rate": 1.6666075061134682e-05, + "loss": 0.6139, + "step": 7735 + }, + { + "epoch": 0.27, + "learning_rate": 1.6665263372120144e-05, + "loss": 0.6037, + "step": 7736 + }, + { + "epoch": 0.27, + "learning_rate": 1.6664451604080475e-05, + "loss": 0.6523, + "step": 7737 + }, + { + "epoch": 0.27, + "learning_rate": 1.6663639757025306e-05, + "loss": 0.6384, + "step": 7738 + }, + { + "epoch": 0.27, + "learning_rate": 1.6662827830964254e-05, + "loss": 0.6765, + "step": 7739 + }, + { + "epoch": 0.27, + "learning_rate": 1.666201582590695e-05, + "loss": 0.5676, + "step": 7740 + }, + { + "epoch": 0.27, + "learning_rate": 1.666120374186302e-05, + "loss": 0.6612, + "step": 7741 + }, + { + "epoch": 0.27, + "learning_rate": 1.6660391578842095e-05, + "loss": 0.662, + "step": 7742 + }, + { + "epoch": 0.27, + "learning_rate": 1.66595793368538e-05, + "loss": 0.6481, + "step": 7743 + }, + { + "epoch": 0.27, + "learning_rate": 1.665876701590777e-05, + "loss": 0.6164, + "step": 7744 + }, + { + "epoch": 0.27, + "learning_rate": 1.6657954616013635e-05, + "loss": 0.6137, + "step": 7745 + }, + { + "epoch": 0.27, + "learning_rate": 1.6657142137181023e-05, + "loss": 0.5964, + "step": 7746 + }, + { + "epoch": 0.27, + "learning_rate": 1.665632957941957e-05, + "loss": 0.6588, + "step": 7747 + }, + { + "epoch": 0.27, + "learning_rate": 1.6655516942738912e-05, + "loss": 0.6223, + "step": 7748 + }, + { + "epoch": 0.27, + "learning_rate": 1.6654704227148676e-05, + "loss": 0.6722, + "step": 7749 + }, + { + "epoch": 0.27, + "learning_rate": 1.665389143265851e-05, + "loss": 0.6562, + "step": 7750 + }, + { + "epoch": 0.27, + "learning_rate": 1.6653078559278038e-05, + "loss": 0.6743, + "step": 7751 + }, + { + "epoch": 0.27, + "learning_rate": 1.6652265607016906e-05, + "loss": 0.653, + "step": 7752 + }, + { + "epoch": 0.27, + "learning_rate": 1.665145257588475e-05, + "loss": 0.6384, + "step": 7753 + }, + { + "epoch": 0.27, + "learning_rate": 1.665063946589121e-05, + "loss": 0.6315, + "step": 7754 + }, + { + "epoch": 0.27, + "learning_rate": 1.6649826277045926e-05, + "loss": 0.6089, + "step": 7755 + }, + { + "epoch": 0.27, + "learning_rate": 1.664901300935854e-05, + "loss": 0.5965, + "step": 7756 + }, + { + "epoch": 0.27, + "learning_rate": 1.6648199662838692e-05, + "loss": 0.6674, + "step": 7757 + }, + { + "epoch": 0.27, + "learning_rate": 1.6647386237496025e-05, + "loss": 0.6195, + "step": 7758 + }, + { + "epoch": 0.27, + "learning_rate": 1.664657273334019e-05, + "loss": 0.6307, + "step": 7759 + }, + { + "epoch": 0.27, + "learning_rate": 1.6645759150380824e-05, + "loss": 0.6885, + "step": 7760 + }, + { + "epoch": 0.27, + "learning_rate": 1.6644945488627578e-05, + "loss": 0.6738, + "step": 7761 + }, + { + "epoch": 0.27, + "learning_rate": 1.6644131748090097e-05, + "loss": 0.5674, + "step": 7762 + }, + { + "epoch": 0.27, + "learning_rate": 1.664331792877803e-05, + "loss": 0.6348, + "step": 7763 + }, + { + "epoch": 0.27, + "learning_rate": 1.6642504030701024e-05, + "loss": 0.6172, + "step": 7764 + }, + { + "epoch": 0.27, + "learning_rate": 1.664169005386873e-05, + "loss": 0.6958, + "step": 7765 + }, + { + "epoch": 0.27, + "learning_rate": 1.66408759982908e-05, + "loss": 0.6656, + "step": 7766 + }, + { + "epoch": 0.27, + "learning_rate": 1.664006186397688e-05, + "loss": 0.6277, + "step": 7767 + }, + { + "epoch": 0.27, + "learning_rate": 1.663924765093663e-05, + "loss": 0.6193, + "step": 7768 + }, + { + "epoch": 0.27, + "learning_rate": 1.6638433359179703e-05, + "loss": 0.6386, + "step": 7769 + }, + { + "epoch": 0.27, + "learning_rate": 1.6637618988715746e-05, + "loss": 0.5694, + "step": 7770 + }, + { + "epoch": 0.27, + "learning_rate": 1.663680453955442e-05, + "loss": 0.6247, + "step": 7771 + }, + { + "epoch": 0.27, + "learning_rate": 1.6635990011705386e-05, + "loss": 0.6747, + "step": 7772 + }, + { + "epoch": 0.27, + "learning_rate": 1.663517540517829e-05, + "loss": 0.6445, + "step": 7773 + }, + { + "epoch": 0.27, + "learning_rate": 1.6634360719982798e-05, + "loss": 0.6315, + "step": 7774 + }, + { + "epoch": 0.27, + "learning_rate": 1.6633545956128564e-05, + "loss": 0.667, + "step": 7775 + }, + { + "epoch": 0.27, + "learning_rate": 1.6632731113625257e-05, + "loss": 0.5812, + "step": 7776 + }, + { + "epoch": 0.27, + "learning_rate": 1.6631916192482528e-05, + "loss": 0.673, + "step": 7777 + }, + { + "epoch": 0.27, + "learning_rate": 1.6631101192710045e-05, + "loss": 0.6085, + "step": 7778 + }, + { + "epoch": 0.27, + "learning_rate": 1.6630286114317468e-05, + "loss": 0.6176, + "step": 7779 + }, + { + "epoch": 0.27, + "learning_rate": 1.6629470957314464e-05, + "loss": 0.63, + "step": 7780 + }, + { + "epoch": 0.27, + "learning_rate": 1.6628655721710695e-05, + "loss": 0.6555, + "step": 7781 + }, + { + "epoch": 0.27, + "learning_rate": 1.6627840407515824e-05, + "loss": 0.6037, + "step": 7782 + }, + { + "epoch": 0.27, + "learning_rate": 1.6627025014739522e-05, + "loss": 0.6599, + "step": 7783 + }, + { + "epoch": 0.27, + "learning_rate": 1.6626209543391458e-05, + "loss": 0.6258, + "step": 7784 + }, + { + "epoch": 0.27, + "learning_rate": 1.6625393993481294e-05, + "loss": 0.6276, + "step": 7785 + }, + { + "epoch": 0.27, + "learning_rate": 1.6624578365018704e-05, + "loss": 0.5492, + "step": 7786 + }, + { + "epoch": 0.27, + "learning_rate": 1.662376265801336e-05, + "loss": 0.575, + "step": 7787 + }, + { + "epoch": 0.27, + "learning_rate": 1.6622946872474926e-05, + "loss": 0.5956, + "step": 7788 + }, + { + "epoch": 0.27, + "learning_rate": 1.6622131008413083e-05, + "loss": 0.6005, + "step": 7789 + }, + { + "epoch": 0.27, + "learning_rate": 1.6621315065837497e-05, + "loss": 0.6094, + "step": 7790 + }, + { + "epoch": 0.27, + "learning_rate": 1.6620499044757846e-05, + "loss": 0.6437, + "step": 7791 + }, + { + "epoch": 0.27, + "learning_rate": 1.6619682945183805e-05, + "loss": 0.6222, + "step": 7792 + }, + { + "epoch": 0.27, + "learning_rate": 1.6618866767125046e-05, + "loss": 0.6464, + "step": 7793 + }, + { + "epoch": 0.27, + "learning_rate": 1.661805051059125e-05, + "loss": 0.6552, + "step": 7794 + }, + { + "epoch": 0.27, + "learning_rate": 1.6617234175592095e-05, + "loss": 0.6483, + "step": 7795 + }, + { + "epoch": 0.27, + "learning_rate": 1.6616417762137253e-05, + "loss": 0.6252, + "step": 7796 + }, + { + "epoch": 0.27, + "learning_rate": 1.6615601270236416e-05, + "loss": 0.5911, + "step": 7797 + }, + { + "epoch": 0.27, + "learning_rate": 1.661478469989925e-05, + "loss": 0.6174, + "step": 7798 + }, + { + "epoch": 0.27, + "learning_rate": 1.6613968051135446e-05, + "loss": 0.6333, + "step": 7799 + }, + { + "epoch": 0.27, + "learning_rate": 1.6613151323954688e-05, + "loss": 0.6151, + "step": 7800 + }, + { + "epoch": 0.27, + "learning_rate": 1.6612334518366654e-05, + "loss": 0.6279, + "step": 7801 + }, + { + "epoch": 0.27, + "learning_rate": 1.6611517634381025e-05, + "loss": 0.6625, + "step": 7802 + }, + { + "epoch": 0.27, + "learning_rate": 1.6610700672007494e-05, + "loss": 0.6214, + "step": 7803 + }, + { + "epoch": 0.27, + "learning_rate": 1.6609883631255744e-05, + "loss": 0.6427, + "step": 7804 + }, + { + "epoch": 0.27, + "learning_rate": 1.660906651213546e-05, + "loss": 0.6828, + "step": 7805 + }, + { + "epoch": 0.27, + "learning_rate": 1.6608249314656337e-05, + "loss": 0.6497, + "step": 7806 + }, + { + "epoch": 0.27, + "learning_rate": 1.6607432038828052e-05, + "loss": 0.6679, + "step": 7807 + }, + { + "epoch": 0.27, + "learning_rate": 1.660661468466031e-05, + "loss": 0.6315, + "step": 7808 + }, + { + "epoch": 0.27, + "learning_rate": 1.6605797252162784e-05, + "loss": 0.6594, + "step": 7809 + }, + { + "epoch": 0.27, + "learning_rate": 1.660497974134518e-05, + "loss": 0.6017, + "step": 7810 + }, + { + "epoch": 0.27, + "learning_rate": 1.6604162152217186e-05, + "loss": 0.6074, + "step": 7811 + }, + { + "epoch": 0.27, + "learning_rate": 1.6603344484788494e-05, + "loss": 0.6308, + "step": 7812 + }, + { + "epoch": 0.27, + "learning_rate": 1.6602526739068803e-05, + "loss": 0.6208, + "step": 7813 + }, + { + "epoch": 0.27, + "learning_rate": 1.6601708915067805e-05, + "loss": 0.637, + "step": 7814 + }, + { + "epoch": 0.27, + "learning_rate": 1.6600891012795193e-05, + "loss": 0.6344, + "step": 7815 + }, + { + "epoch": 0.27, + "learning_rate": 1.660007303226067e-05, + "loss": 0.5901, + "step": 7816 + }, + { + "epoch": 0.27, + "learning_rate": 1.659925497347393e-05, + "loss": 0.6437, + "step": 7817 + }, + { + "epoch": 0.27, + "learning_rate": 1.6598436836444678e-05, + "loss": 0.6312, + "step": 7818 + }, + { + "epoch": 0.27, + "learning_rate": 1.659761862118261e-05, + "loss": 0.6622, + "step": 7819 + }, + { + "epoch": 0.27, + "learning_rate": 1.6596800327697423e-05, + "loss": 0.6692, + "step": 7820 + }, + { + "epoch": 0.27, + "learning_rate": 1.6595981955998826e-05, + "loss": 0.6164, + "step": 7821 + }, + { + "epoch": 0.27, + "learning_rate": 1.659516350609652e-05, + "loss": 0.6089, + "step": 7822 + }, + { + "epoch": 0.27, + "learning_rate": 1.6594344978000204e-05, + "loss": 0.648, + "step": 7823 + }, + { + "epoch": 0.27, + "learning_rate": 1.659352637171959e-05, + "loss": 0.5927, + "step": 7824 + }, + { + "epoch": 0.27, + "learning_rate": 1.659270768726438e-05, + "loss": 0.6513, + "step": 7825 + }, + { + "epoch": 0.27, + "learning_rate": 1.6591888924644276e-05, + "loss": 0.6063, + "step": 7826 + }, + { + "epoch": 0.27, + "learning_rate": 1.6591070083868993e-05, + "loss": 0.6912, + "step": 7827 + }, + { + "epoch": 0.27, + "learning_rate": 1.659025116494824e-05, + "loss": 0.6305, + "step": 7828 + }, + { + "epoch": 0.27, + "learning_rate": 1.6589432167891717e-05, + "loss": 0.6166, + "step": 7829 + }, + { + "epoch": 0.27, + "learning_rate": 1.6588613092709143e-05, + "loss": 0.6202, + "step": 7830 + }, + { + "epoch": 0.27, + "learning_rate": 1.6587793939410226e-05, + "loss": 0.5826, + "step": 7831 + }, + { + "epoch": 0.27, + "learning_rate": 1.6586974708004677e-05, + "loss": 0.6218, + "step": 7832 + }, + { + "epoch": 0.27, + "learning_rate": 1.6586155398502213e-05, + "loss": 0.6031, + "step": 7833 + }, + { + "epoch": 0.27, + "learning_rate": 1.658533601091254e-05, + "loss": 0.6426, + "step": 7834 + }, + { + "epoch": 0.27, + "learning_rate": 1.6584516545245385e-05, + "loss": 0.6553, + "step": 7835 + }, + { + "epoch": 0.27, + "learning_rate": 1.6583697001510453e-05, + "loss": 0.6593, + "step": 7836 + }, + { + "epoch": 0.27, + "learning_rate": 1.6582877379717464e-05, + "loss": 0.6104, + "step": 7837 + }, + { + "epoch": 0.27, + "learning_rate": 1.658205767987614e-05, + "loss": 0.6599, + "step": 7838 + }, + { + "epoch": 0.27, + "learning_rate": 1.658123790199619e-05, + "loss": 0.683, + "step": 7839 + }, + { + "epoch": 0.27, + "learning_rate": 1.6580418046087344e-05, + "loss": 0.6497, + "step": 7840 + }, + { + "epoch": 0.27, + "learning_rate": 1.6579598112159313e-05, + "loss": 0.6041, + "step": 7841 + }, + { + "epoch": 0.27, + "learning_rate": 1.6578778100221827e-05, + "loss": 0.6833, + "step": 7842 + }, + { + "epoch": 0.27, + "learning_rate": 1.6577958010284604e-05, + "loss": 0.6789, + "step": 7843 + }, + { + "epoch": 0.27, + "learning_rate": 1.6577137842357368e-05, + "loss": 0.5845, + "step": 7844 + }, + { + "epoch": 0.27, + "learning_rate": 1.6576317596449843e-05, + "loss": 0.6212, + "step": 7845 + }, + { + "epoch": 0.27, + "learning_rate": 1.657549727257175e-05, + "loss": 0.6256, + "step": 7846 + }, + { + "epoch": 0.27, + "learning_rate": 1.6574676870732824e-05, + "loss": 0.6167, + "step": 7847 + }, + { + "epoch": 0.27, + "learning_rate": 1.6573856390942782e-05, + "loss": 0.6683, + "step": 7848 + }, + { + "epoch": 0.27, + "learning_rate": 1.6573035833211363e-05, + "loss": 0.6322, + "step": 7849 + }, + { + "epoch": 0.27, + "learning_rate": 1.6572215197548285e-05, + "loss": 0.595, + "step": 7850 + }, + { + "epoch": 0.27, + "learning_rate": 1.6571394483963278e-05, + "loss": 0.6118, + "step": 7851 + }, + { + "epoch": 0.27, + "learning_rate": 1.657057369246608e-05, + "loss": 0.6383, + "step": 7852 + }, + { + "epoch": 0.27, + "learning_rate": 1.656975282306642e-05, + "loss": 0.5938, + "step": 7853 + }, + { + "epoch": 0.27, + "learning_rate": 1.656893187577403e-05, + "loss": 0.7081, + "step": 7854 + }, + { + "epoch": 0.27, + "learning_rate": 1.6568110850598643e-05, + "loss": 0.6119, + "step": 7855 + }, + { + "epoch": 0.27, + "learning_rate": 1.656728974754999e-05, + "loss": 0.6356, + "step": 7856 + }, + { + "epoch": 0.27, + "learning_rate": 1.6566468566637812e-05, + "loss": 0.6757, + "step": 7857 + }, + { + "epoch": 0.27, + "learning_rate": 1.6565647307871843e-05, + "loss": 0.6284, + "step": 7858 + }, + { + "epoch": 0.27, + "learning_rate": 1.656482597126182e-05, + "loss": 0.6083, + "step": 7859 + }, + { + "epoch": 0.27, + "learning_rate": 1.6564004556817478e-05, + "loss": 0.6336, + "step": 7860 + }, + { + "epoch": 0.27, + "learning_rate": 1.656318306454856e-05, + "loss": 0.6323, + "step": 7861 + }, + { + "epoch": 0.27, + "learning_rate": 1.6562361494464806e-05, + "loss": 0.6295, + "step": 7862 + }, + { + "epoch": 0.27, + "learning_rate": 1.6561539846575953e-05, + "loss": 0.5708, + "step": 7863 + }, + { + "epoch": 0.27, + "learning_rate": 1.6560718120891742e-05, + "loss": 0.6139, + "step": 7864 + }, + { + "epoch": 0.27, + "learning_rate": 1.6559896317421924e-05, + "loss": 0.5982, + "step": 7865 + }, + { + "epoch": 0.27, + "learning_rate": 1.6559074436176236e-05, + "loss": 0.6454, + "step": 7866 + }, + { + "epoch": 0.27, + "learning_rate": 1.655825247716442e-05, + "loss": 0.6047, + "step": 7867 + }, + { + "epoch": 0.27, + "learning_rate": 1.6557430440396225e-05, + "loss": 0.6217, + "step": 7868 + }, + { + "epoch": 0.27, + "learning_rate": 1.6556608325881397e-05, + "loss": 0.5812, + "step": 7869 + }, + { + "epoch": 0.27, + "learning_rate": 1.6555786133629683e-05, + "loss": 0.6048, + "step": 7870 + }, + { + "epoch": 0.27, + "learning_rate": 1.6554963863650834e-05, + "loss": 0.6626, + "step": 7871 + }, + { + "epoch": 0.27, + "learning_rate": 1.6554141515954592e-05, + "loss": 0.6731, + "step": 7872 + }, + { + "epoch": 0.27, + "learning_rate": 1.6553319090550717e-05, + "loss": 0.6185, + "step": 7873 + }, + { + "epoch": 0.27, + "learning_rate": 1.655249658744895e-05, + "loss": 0.647, + "step": 7874 + }, + { + "epoch": 0.27, + "learning_rate": 1.655167400665905e-05, + "loss": 0.6475, + "step": 7875 + }, + { + "epoch": 0.27, + "learning_rate": 1.6550851348190762e-05, + "loss": 0.6396, + "step": 7876 + }, + { + "epoch": 0.27, + "learning_rate": 1.655002861205385e-05, + "loss": 0.6052, + "step": 7877 + }, + { + "epoch": 0.27, + "learning_rate": 1.654920579825806e-05, + "loss": 0.693, + "step": 7878 + }, + { + "epoch": 0.27, + "learning_rate": 1.654838290681315e-05, + "loss": 0.5504, + "step": 7879 + }, + { + "epoch": 0.27, + "learning_rate": 1.654755993772888e-05, + "loss": 0.6233, + "step": 7880 + }, + { + "epoch": 0.27, + "learning_rate": 1.6546736891014998e-05, + "loss": 0.6338, + "step": 7881 + }, + { + "epoch": 0.27, + "learning_rate": 1.6545913766681273e-05, + "loss": 0.6177, + "step": 7882 + }, + { + "epoch": 0.27, + "learning_rate": 1.6545090564737457e-05, + "loss": 0.629, + "step": 7883 + }, + { + "epoch": 0.27, + "learning_rate": 1.6544267285193317e-05, + "loss": 0.6147, + "step": 7884 + }, + { + "epoch": 0.27, + "learning_rate": 1.6543443928058607e-05, + "loss": 0.6221, + "step": 7885 + }, + { + "epoch": 0.27, + "learning_rate": 1.6542620493343093e-05, + "loss": 0.607, + "step": 7886 + }, + { + "epoch": 0.27, + "learning_rate": 1.6541796981056535e-05, + "loss": 0.6246, + "step": 7887 + }, + { + "epoch": 0.27, + "learning_rate": 1.6540973391208698e-05, + "loss": 0.641, + "step": 7888 + }, + { + "epoch": 0.27, + "learning_rate": 1.654014972380935e-05, + "loss": 0.6546, + "step": 7889 + }, + { + "epoch": 0.27, + "learning_rate": 1.6539325978868253e-05, + "loss": 0.6291, + "step": 7890 + }, + { + "epoch": 0.27, + "learning_rate": 1.653850215639517e-05, + "loss": 0.6041, + "step": 7891 + }, + { + "epoch": 0.27, + "learning_rate": 1.6537678256399877e-05, + "loss": 0.6542, + "step": 7892 + }, + { + "epoch": 0.27, + "learning_rate": 1.653685427889214e-05, + "loss": 0.6243, + "step": 7893 + }, + { + "epoch": 0.27, + "learning_rate": 1.6536030223881722e-05, + "loss": 0.5855, + "step": 7894 + }, + { + "epoch": 0.27, + "learning_rate": 1.6535206091378396e-05, + "loss": 0.626, + "step": 7895 + }, + { + "epoch": 0.27, + "learning_rate": 1.653438188139194e-05, + "loss": 0.6278, + "step": 7896 + }, + { + "epoch": 0.27, + "learning_rate": 1.653355759393212e-05, + "loss": 0.658, + "step": 7897 + }, + { + "epoch": 0.27, + "learning_rate": 1.6532733229008705e-05, + "loss": 0.6138, + "step": 7898 + }, + { + "epoch": 0.27, + "learning_rate": 1.6531908786631477e-05, + "loss": 0.6011, + "step": 7899 + }, + { + "epoch": 0.27, + "learning_rate": 1.653108426681021e-05, + "loss": 0.6283, + "step": 7900 + }, + { + "epoch": 0.27, + "learning_rate": 1.6530259669554674e-05, + "loss": 0.6035, + "step": 7901 + }, + { + "epoch": 0.27, + "learning_rate": 1.6529434994874648e-05, + "loss": 0.6471, + "step": 7902 + }, + { + "epoch": 0.27, + "learning_rate": 1.652861024277991e-05, + "loss": 0.6544, + "step": 7903 + }, + { + "epoch": 0.27, + "learning_rate": 1.6527785413280243e-05, + "loss": 0.6361, + "step": 7904 + }, + { + "epoch": 0.27, + "learning_rate": 1.652696050638542e-05, + "loss": 0.64, + "step": 7905 + }, + { + "epoch": 0.27, + "learning_rate": 1.6526135522105223e-05, + "loss": 0.6237, + "step": 7906 + }, + { + "epoch": 0.27, + "learning_rate": 1.6525310460449434e-05, + "loss": 0.6452, + "step": 7907 + }, + { + "epoch": 0.27, + "learning_rate": 1.6524485321427834e-05, + "loss": 0.6615, + "step": 7908 + }, + { + "epoch": 0.27, + "learning_rate": 1.6523660105050208e-05, + "loss": 0.6474, + "step": 7909 + }, + { + "epoch": 0.27, + "learning_rate": 1.6522834811326338e-05, + "loss": 0.6503, + "step": 7910 + }, + { + "epoch": 0.27, + "learning_rate": 1.652200944026601e-05, + "loss": 0.5794, + "step": 7911 + }, + { + "epoch": 0.27, + "learning_rate": 1.652118399187901e-05, + "loss": 0.6297, + "step": 7912 + }, + { + "epoch": 0.27, + "learning_rate": 1.6520358466175127e-05, + "loss": 0.698, + "step": 7913 + }, + { + "epoch": 0.27, + "learning_rate": 1.6519532863164142e-05, + "loss": 0.6603, + "step": 7914 + }, + { + "epoch": 0.27, + "learning_rate": 1.651870718285585e-05, + "loss": 0.6367, + "step": 7915 + }, + { + "epoch": 0.27, + "learning_rate": 1.6517881425260038e-05, + "loss": 0.6009, + "step": 7916 + }, + { + "epoch": 0.27, + "learning_rate": 1.6517055590386496e-05, + "loss": 0.6663, + "step": 7917 + }, + { + "epoch": 0.27, + "learning_rate": 1.6516229678245016e-05, + "loss": 0.5758, + "step": 7918 + }, + { + "epoch": 0.27, + "learning_rate": 1.651540368884539e-05, + "loss": 0.6794, + "step": 7919 + }, + { + "epoch": 0.27, + "learning_rate": 1.6514577622197413e-05, + "loss": 0.6177, + "step": 7920 + }, + { + "epoch": 0.27, + "learning_rate": 1.6513751478310873e-05, + "loss": 0.6127, + "step": 7921 + }, + { + "epoch": 0.27, + "learning_rate": 1.6512925257195572e-05, + "loss": 0.5998, + "step": 7922 + }, + { + "epoch": 0.27, + "learning_rate": 1.6512098958861305e-05, + "loss": 0.6112, + "step": 7923 + }, + { + "epoch": 0.27, + "learning_rate": 1.6511272583317864e-05, + "loss": 0.6855, + "step": 7924 + }, + { + "epoch": 0.27, + "learning_rate": 1.651044613057505e-05, + "loss": 0.6003, + "step": 7925 + }, + { + "epoch": 0.27, + "learning_rate": 1.6509619600642664e-05, + "loss": 0.5903, + "step": 7926 + }, + { + "epoch": 0.27, + "learning_rate": 1.6508792993530502e-05, + "loss": 0.6443, + "step": 7927 + }, + { + "epoch": 0.27, + "learning_rate": 1.6507966309248363e-05, + "loss": 0.6382, + "step": 7928 + }, + { + "epoch": 0.27, + "learning_rate": 1.6507139547806053e-05, + "loss": 0.6247, + "step": 7929 + }, + { + "epoch": 0.27, + "learning_rate": 1.6506312709213373e-05, + "loss": 0.6137, + "step": 7930 + }, + { + "epoch": 0.27, + "learning_rate": 1.650548579348012e-05, + "loss": 0.6014, + "step": 7931 + }, + { + "epoch": 0.27, + "learning_rate": 1.6504658800616107e-05, + "loss": 0.6581, + "step": 7932 + }, + { + "epoch": 0.27, + "learning_rate": 1.650383173063114e-05, + "loss": 0.6092, + "step": 7933 + }, + { + "epoch": 0.27, + "learning_rate": 1.6503004583535016e-05, + "loss": 0.6469, + "step": 7934 + }, + { + "epoch": 0.27, + "learning_rate": 1.6502177359337546e-05, + "loss": 0.6202, + "step": 7935 + }, + { + "epoch": 0.27, + "learning_rate": 1.6501350058048538e-05, + "loss": 0.6317, + "step": 7936 + }, + { + "epoch": 0.27, + "learning_rate": 1.6500522679677803e-05, + "loss": 0.6248, + "step": 7937 + }, + { + "epoch": 0.28, + "learning_rate": 1.6499695224235144e-05, + "loss": 0.646, + "step": 7938 + }, + { + "epoch": 0.28, + "learning_rate": 1.6498867691730377e-05, + "loss": 0.6699, + "step": 7939 + }, + { + "epoch": 0.28, + "learning_rate": 1.6498040082173315e-05, + "loss": 0.6395, + "step": 7940 + }, + { + "epoch": 0.28, + "learning_rate": 1.6497212395573766e-05, + "loss": 0.646, + "step": 7941 + }, + { + "epoch": 0.28, + "learning_rate": 1.6496384631941547e-05, + "loss": 0.6802, + "step": 7942 + }, + { + "epoch": 0.28, + "learning_rate": 1.649555679128647e-05, + "loss": 0.6028, + "step": 7943 + }, + { + "epoch": 0.28, + "learning_rate": 1.649472887361835e-05, + "loss": 0.6653, + "step": 7944 + }, + { + "epoch": 0.28, + "learning_rate": 1.6493900878947002e-05, + "loss": 0.6289, + "step": 7945 + }, + { + "epoch": 0.28, + "learning_rate": 1.6493072807282246e-05, + "loss": 0.6502, + "step": 7946 + }, + { + "epoch": 0.28, + "learning_rate": 1.6492244658633895e-05, + "loss": 0.6247, + "step": 7947 + }, + { + "epoch": 0.28, + "learning_rate": 1.6491416433011774e-05, + "loss": 0.6685, + "step": 7948 + }, + { + "epoch": 0.28, + "learning_rate": 1.64905881304257e-05, + "loss": 0.5878, + "step": 7949 + }, + { + "epoch": 0.28, + "learning_rate": 1.6489759750885492e-05, + "loss": 0.6586, + "step": 7950 + }, + { + "epoch": 0.28, + "learning_rate": 1.648893129440097e-05, + "loss": 0.6386, + "step": 7951 + }, + { + "epoch": 0.28, + "learning_rate": 1.648810276098196e-05, + "loss": 0.6332, + "step": 7952 + }, + { + "epoch": 0.28, + "learning_rate": 1.6487274150638287e-05, + "loss": 0.6368, + "step": 7953 + }, + { + "epoch": 0.28, + "learning_rate": 1.6486445463379774e-05, + "loss": 0.651, + "step": 7954 + }, + { + "epoch": 0.28, + "learning_rate": 1.648561669921624e-05, + "loss": 0.6504, + "step": 7955 + }, + { + "epoch": 0.28, + "learning_rate": 1.6484787858157515e-05, + "loss": 0.6203, + "step": 7956 + }, + { + "epoch": 0.28, + "learning_rate": 1.648395894021343e-05, + "loss": 0.6677, + "step": 7957 + }, + { + "epoch": 0.28, + "learning_rate": 1.648312994539381e-05, + "loss": 0.619, + "step": 7958 + }, + { + "epoch": 0.28, + "learning_rate": 1.648230087370848e-05, + "loss": 0.6378, + "step": 7959 + }, + { + "epoch": 0.28, + "learning_rate": 1.6481471725167277e-05, + "loss": 0.6519, + "step": 7960 + }, + { + "epoch": 0.28, + "learning_rate": 1.648064249978002e-05, + "loss": 0.625, + "step": 7961 + }, + { + "epoch": 0.28, + "learning_rate": 1.6479813197556557e-05, + "loss": 0.6508, + "step": 7962 + }, + { + "epoch": 0.28, + "learning_rate": 1.647898381850671e-05, + "loss": 0.6144, + "step": 7963 + }, + { + "epoch": 0.28, + "learning_rate": 1.647815436264031e-05, + "loss": 0.6874, + "step": 7964 + }, + { + "epoch": 0.28, + "learning_rate": 1.6477324829967196e-05, + "loss": 0.6561, + "step": 7965 + }, + { + "epoch": 0.28, + "learning_rate": 1.6476495220497205e-05, + "loss": 0.6343, + "step": 7966 + }, + { + "epoch": 0.28, + "learning_rate": 1.6475665534240166e-05, + "loss": 0.6284, + "step": 7967 + }, + { + "epoch": 0.28, + "learning_rate": 1.6474835771205927e-05, + "loss": 0.6205, + "step": 7968 + }, + { + "epoch": 0.28, + "learning_rate": 1.6474005931404312e-05, + "loss": 0.6276, + "step": 7969 + }, + { + "epoch": 0.28, + "learning_rate": 1.647317601484517e-05, + "loss": 0.641, + "step": 7970 + }, + { + "epoch": 0.28, + "learning_rate": 1.6472346021538338e-05, + "loss": 0.6405, + "step": 7971 + }, + { + "epoch": 0.28, + "learning_rate": 1.6471515951493656e-05, + "loss": 0.6308, + "step": 7972 + }, + { + "epoch": 0.28, + "learning_rate": 1.647068580472097e-05, + "loss": 0.6501, + "step": 7973 + }, + { + "epoch": 0.28, + "learning_rate": 1.646985558123011e-05, + "loss": 0.665, + "step": 7974 + }, + { + "epoch": 0.28, + "learning_rate": 1.6469025281030932e-05, + "loss": 0.5859, + "step": 7975 + }, + { + "epoch": 0.28, + "learning_rate": 1.6468194904133278e-05, + "loss": 0.6746, + "step": 7976 + }, + { + "epoch": 0.28, + "learning_rate": 1.6467364450546988e-05, + "loss": 0.619, + "step": 7977 + }, + { + "epoch": 0.28, + "learning_rate": 1.646653392028191e-05, + "loss": 0.6483, + "step": 7978 + }, + { + "epoch": 0.28, + "learning_rate": 1.6465703313347894e-05, + "loss": 0.6663, + "step": 7979 + }, + { + "epoch": 0.28, + "learning_rate": 1.646487262975479e-05, + "loss": 0.6478, + "step": 7980 + }, + { + "epoch": 0.28, + "learning_rate": 1.646404186951244e-05, + "loss": 0.6613, + "step": 7981 + }, + { + "epoch": 0.28, + "learning_rate": 1.6463211032630693e-05, + "loss": 0.6027, + "step": 7982 + }, + { + "epoch": 0.28, + "learning_rate": 1.6462380119119408e-05, + "loss": 0.6143, + "step": 7983 + }, + { + "epoch": 0.28, + "learning_rate": 1.646154912898843e-05, + "loss": 0.6567, + "step": 7984 + }, + { + "epoch": 0.28, + "learning_rate": 1.646071806224761e-05, + "loss": 0.6534, + "step": 7985 + }, + { + "epoch": 0.28, + "learning_rate": 1.645988691890681e-05, + "loss": 0.6163, + "step": 7986 + }, + { + "epoch": 0.28, + "learning_rate": 1.6459055698975877e-05, + "loss": 0.6674, + "step": 7987 + }, + { + "epoch": 0.28, + "learning_rate": 1.6458224402464666e-05, + "loss": 0.5981, + "step": 7988 + }, + { + "epoch": 0.28, + "learning_rate": 1.6457393029383038e-05, + "loss": 0.647, + "step": 7989 + }, + { + "epoch": 0.28, + "learning_rate": 1.6456561579740843e-05, + "loss": 0.5749, + "step": 7990 + }, + { + "epoch": 0.28, + "learning_rate": 1.6455730053547947e-05, + "loss": 0.6143, + "step": 7991 + }, + { + "epoch": 0.28, + "learning_rate": 1.6454898450814203e-05, + "loss": 0.6245, + "step": 7992 + }, + { + "epoch": 0.28, + "learning_rate": 1.6454066771549473e-05, + "loss": 0.6115, + "step": 7993 + }, + { + "epoch": 0.28, + "learning_rate": 1.6453235015763615e-05, + "loss": 0.5967, + "step": 7994 + }, + { + "epoch": 0.28, + "learning_rate": 1.6452403183466493e-05, + "loss": 0.6433, + "step": 7995 + }, + { + "epoch": 0.28, + "learning_rate": 1.645157127466797e-05, + "loss": 0.6455, + "step": 7996 + }, + { + "epoch": 0.28, + "learning_rate": 1.645073928937791e-05, + "loss": 0.6114, + "step": 7997 + }, + { + "epoch": 0.28, + "learning_rate": 1.644990722760617e-05, + "loss": 0.5969, + "step": 7998 + }, + { + "epoch": 0.28, + "learning_rate": 1.6449075089362626e-05, + "loss": 0.625, + "step": 7999 + }, + { + "epoch": 0.28, + "learning_rate": 1.6448242874657136e-05, + "loss": 0.6566, + "step": 8000 + }, + { + "epoch": 0.28, + "learning_rate": 1.6447410583499573e-05, + "loss": 0.5944, + "step": 8001 + }, + { + "epoch": 0.28, + "learning_rate": 1.6446578215899797e-05, + "loss": 0.6102, + "step": 8002 + }, + { + "epoch": 0.28, + "learning_rate": 1.644574577186768e-05, + "loss": 0.6233, + "step": 8003 + }, + { + "epoch": 0.28, + "learning_rate": 1.64449132514131e-05, + "loss": 0.6547, + "step": 8004 + }, + { + "epoch": 0.28, + "learning_rate": 1.6444080654545915e-05, + "loss": 0.6376, + "step": 8005 + }, + { + "epoch": 0.28, + "learning_rate": 1.6443247981276005e-05, + "loss": 0.6446, + "step": 8006 + }, + { + "epoch": 0.28, + "learning_rate": 1.644241523161324e-05, + "loss": 0.6292, + "step": 8007 + }, + { + "epoch": 0.28, + "learning_rate": 1.644158240556749e-05, + "loss": 0.6598, + "step": 8008 + }, + { + "epoch": 0.28, + "learning_rate": 1.6440749503148634e-05, + "loss": 0.6112, + "step": 8009 + }, + { + "epoch": 0.28, + "learning_rate": 1.6439916524366543e-05, + "loss": 0.6426, + "step": 8010 + }, + { + "epoch": 0.28, + "learning_rate": 1.6439083469231096e-05, + "loss": 0.5837, + "step": 8011 + }, + { + "epoch": 0.28, + "learning_rate": 1.6438250337752166e-05, + "loss": 0.6745, + "step": 8012 + }, + { + "epoch": 0.28, + "learning_rate": 1.6437417129939638e-05, + "loss": 0.6378, + "step": 8013 + }, + { + "epoch": 0.28, + "learning_rate": 1.6436583845803385e-05, + "loss": 0.6576, + "step": 8014 + }, + { + "epoch": 0.28, + "learning_rate": 1.643575048535329e-05, + "loss": 0.6171, + "step": 8015 + }, + { + "epoch": 0.28, + "learning_rate": 1.643491704859923e-05, + "loss": 0.6731, + "step": 8016 + }, + { + "epoch": 0.28, + "learning_rate": 1.6434083535551088e-05, + "loss": 0.6229, + "step": 8017 + }, + { + "epoch": 0.28, + "learning_rate": 1.6433249946218748e-05, + "loss": 0.6528, + "step": 8018 + }, + { + "epoch": 0.28, + "learning_rate": 1.6432416280612087e-05, + "loss": 0.6031, + "step": 8019 + }, + { + "epoch": 0.28, + "learning_rate": 1.6431582538741e-05, + "loss": 0.6512, + "step": 8020 + }, + { + "epoch": 0.28, + "learning_rate": 1.6430748720615363e-05, + "loss": 0.6566, + "step": 8021 + }, + { + "epoch": 0.28, + "learning_rate": 1.6429914826245066e-05, + "loss": 0.5827, + "step": 8022 + }, + { + "epoch": 0.28, + "learning_rate": 1.6429080855639995e-05, + "loss": 0.658, + "step": 8023 + }, + { + "epoch": 0.28, + "learning_rate": 1.642824680881004e-05, + "loss": 0.6372, + "step": 8024 + }, + { + "epoch": 0.28, + "learning_rate": 1.642741268576508e-05, + "loss": 0.674, + "step": 8025 + }, + { + "epoch": 0.28, + "learning_rate": 1.642657848651502e-05, + "loss": 0.6408, + "step": 8026 + }, + { + "epoch": 0.28, + "learning_rate": 1.6425744211069736e-05, + "loss": 0.6458, + "step": 8027 + }, + { + "epoch": 0.28, + "learning_rate": 1.6424909859439128e-05, + "loss": 0.6762, + "step": 8028 + }, + { + "epoch": 0.28, + "learning_rate": 1.6424075431633088e-05, + "loss": 0.6486, + "step": 8029 + }, + { + "epoch": 0.28, + "learning_rate": 1.6423240927661507e-05, + "loss": 0.6647, + "step": 8030 + }, + { + "epoch": 0.28, + "learning_rate": 1.6422406347534278e-05, + "loss": 0.617, + "step": 8031 + }, + { + "epoch": 0.28, + "learning_rate": 1.6421571691261297e-05, + "loss": 0.6249, + "step": 8032 + }, + { + "epoch": 0.28, + "learning_rate": 1.642073695885246e-05, + "loss": 0.6239, + "step": 8033 + }, + { + "epoch": 0.28, + "learning_rate": 1.6419902150317666e-05, + "loss": 0.6321, + "step": 8034 + }, + { + "epoch": 0.28, + "learning_rate": 1.6419067265666808e-05, + "loss": 0.5991, + "step": 8035 + }, + { + "epoch": 0.28, + "learning_rate": 1.641823230490979e-05, + "loss": 0.6039, + "step": 8036 + }, + { + "epoch": 0.28, + "learning_rate": 1.6417397268056507e-05, + "loss": 0.6359, + "step": 8037 + }, + { + "epoch": 0.28, + "learning_rate": 1.6416562155116863e-05, + "loss": 0.6382, + "step": 8038 + }, + { + "epoch": 0.28, + "learning_rate": 1.641572696610076e-05, + "loss": 0.6272, + "step": 8039 + }, + { + "epoch": 0.28, + "learning_rate": 1.641489170101809e-05, + "loss": 0.6732, + "step": 8040 + }, + { + "epoch": 0.28, + "learning_rate": 1.641405635987877e-05, + "loss": 0.6332, + "step": 8041 + }, + { + "epoch": 0.28, + "learning_rate": 1.6413220942692697e-05, + "loss": 0.6668, + "step": 8042 + }, + { + "epoch": 0.28, + "learning_rate": 1.6412385449469778e-05, + "loss": 0.69, + "step": 8043 + }, + { + "epoch": 0.28, + "learning_rate": 1.6411549880219916e-05, + "loss": 0.6704, + "step": 8044 + }, + { + "epoch": 0.28, + "learning_rate": 1.641071423495302e-05, + "loss": 0.6307, + "step": 8045 + }, + { + "epoch": 0.28, + "learning_rate": 1.6409878513678997e-05, + "loss": 0.655, + "step": 8046 + }, + { + "epoch": 0.28, + "learning_rate": 1.6409042716407758e-05, + "loss": 0.659, + "step": 8047 + }, + { + "epoch": 0.28, + "learning_rate": 1.6408206843149206e-05, + "loss": 0.6386, + "step": 8048 + }, + { + "epoch": 0.28, + "learning_rate": 1.640737089391326e-05, + "loss": 0.6765, + "step": 8049 + }, + { + "epoch": 0.28, + "learning_rate": 1.6406534868709824e-05, + "loss": 0.63, + "step": 8050 + }, + { + "epoch": 0.28, + "learning_rate": 1.640569876754881e-05, + "loss": 0.6166, + "step": 8051 + }, + { + "epoch": 0.28, + "learning_rate": 1.640486259044014e-05, + "loss": 0.6767, + "step": 8052 + }, + { + "epoch": 0.28, + "learning_rate": 1.6404026337393716e-05, + "loss": 0.6523, + "step": 8053 + }, + { + "epoch": 0.28, + "learning_rate": 1.6403190008419462e-05, + "loss": 0.6328, + "step": 8054 + }, + { + "epoch": 0.28, + "learning_rate": 1.640235360352729e-05, + "loss": 0.6181, + "step": 8055 + }, + { + "epoch": 0.28, + "learning_rate": 1.6401517122727117e-05, + "loss": 0.5848, + "step": 8056 + }, + { + "epoch": 0.28, + "learning_rate": 1.6400680566028858e-05, + "loss": 0.599, + "step": 8057 + }, + { + "epoch": 0.28, + "learning_rate": 1.639984393344244e-05, + "loss": 0.6471, + "step": 8058 + }, + { + "epoch": 0.28, + "learning_rate": 1.639900722497777e-05, + "loss": 0.6742, + "step": 8059 + }, + { + "epoch": 0.28, + "learning_rate": 1.6398170440644777e-05, + "loss": 0.6534, + "step": 8060 + }, + { + "epoch": 0.28, + "learning_rate": 1.639733358045338e-05, + "loss": 0.607, + "step": 8061 + }, + { + "epoch": 0.28, + "learning_rate": 1.6396496644413502e-05, + "loss": 0.5887, + "step": 8062 + }, + { + "epoch": 0.28, + "learning_rate": 1.6395659632535064e-05, + "loss": 0.6035, + "step": 8063 + }, + { + "epoch": 0.28, + "learning_rate": 1.639482254482799e-05, + "loss": 0.5801, + "step": 8064 + }, + { + "epoch": 0.28, + "learning_rate": 1.6393985381302203e-05, + "loss": 0.6195, + "step": 8065 + }, + { + "epoch": 0.28, + "learning_rate": 1.6393148141967633e-05, + "loss": 0.693, + "step": 8066 + }, + { + "epoch": 0.28, + "learning_rate": 1.6392310826834206e-05, + "loss": 0.6161, + "step": 8067 + }, + { + "epoch": 0.28, + "learning_rate": 1.6391473435911845e-05, + "loss": 0.6177, + "step": 8068 + }, + { + "epoch": 0.28, + "learning_rate": 1.6390635969210485e-05, + "loss": 0.6563, + "step": 8069 + }, + { + "epoch": 0.28, + "learning_rate": 1.6389798426740045e-05, + "loss": 0.6332, + "step": 8070 + }, + { + "epoch": 0.28, + "learning_rate": 1.6388960808510467e-05, + "loss": 0.6309, + "step": 8071 + }, + { + "epoch": 0.28, + "learning_rate": 1.6388123114531675e-05, + "loss": 0.5357, + "step": 8072 + }, + { + "epoch": 0.28, + "learning_rate": 1.63872853448136e-05, + "loss": 0.6483, + "step": 8073 + }, + { + "epoch": 0.28, + "learning_rate": 1.638644749936618e-05, + "loss": 0.6951, + "step": 8074 + }, + { + "epoch": 0.28, + "learning_rate": 1.6385609578199346e-05, + "loss": 0.7481, + "step": 8075 + }, + { + "epoch": 0.28, + "learning_rate": 1.6384771581323035e-05, + "loss": 0.6424, + "step": 8076 + }, + { + "epoch": 0.28, + "learning_rate": 1.6383933508747173e-05, + "loss": 0.6279, + "step": 8077 + }, + { + "epoch": 0.28, + "learning_rate": 1.638309536048171e-05, + "loss": 0.6761, + "step": 8078 + }, + { + "epoch": 0.28, + "learning_rate": 1.6382257136536574e-05, + "loss": 0.6329, + "step": 8079 + }, + { + "epoch": 0.28, + "learning_rate": 1.6381418836921706e-05, + "loss": 0.6714, + "step": 8080 + }, + { + "epoch": 0.28, + "learning_rate": 1.6380580461647046e-05, + "loss": 0.6604, + "step": 8081 + }, + { + "epoch": 0.28, + "learning_rate": 1.6379742010722536e-05, + "loss": 0.5978, + "step": 8082 + }, + { + "epoch": 0.28, + "learning_rate": 1.6378903484158112e-05, + "loss": 0.6504, + "step": 8083 + }, + { + "epoch": 0.28, + "learning_rate": 1.6378064881963715e-05, + "loss": 0.6263, + "step": 8084 + }, + { + "epoch": 0.28, + "learning_rate": 1.637722620414929e-05, + "loss": 0.6673, + "step": 8085 + }, + { + "epoch": 0.28, + "learning_rate": 1.6376387450724784e-05, + "loss": 0.6432, + "step": 8086 + }, + { + "epoch": 0.28, + "learning_rate": 1.637554862170014e-05, + "loss": 0.6625, + "step": 8087 + }, + { + "epoch": 0.28, + "learning_rate": 1.63747097170853e-05, + "loss": 0.6586, + "step": 8088 + }, + { + "epoch": 0.28, + "learning_rate": 1.637387073689021e-05, + "loss": 0.5652, + "step": 8089 + }, + { + "epoch": 0.28, + "learning_rate": 1.6373031681124823e-05, + "loss": 0.6221, + "step": 8090 + }, + { + "epoch": 0.28, + "learning_rate": 1.637219254979908e-05, + "loss": 0.606, + "step": 8091 + }, + { + "epoch": 0.28, + "learning_rate": 1.6371353342922937e-05, + "loss": 0.5977, + "step": 8092 + }, + { + "epoch": 0.28, + "learning_rate": 1.637051406050634e-05, + "loss": 0.6148, + "step": 8093 + }, + { + "epoch": 0.28, + "learning_rate": 1.636967470255924e-05, + "loss": 0.6038, + "step": 8094 + }, + { + "epoch": 0.28, + "learning_rate": 1.6368835269091587e-05, + "loss": 0.595, + "step": 8095 + }, + { + "epoch": 0.28, + "learning_rate": 1.6367995760113333e-05, + "loss": 0.6389, + "step": 8096 + }, + { + "epoch": 0.28, + "learning_rate": 1.6367156175634438e-05, + "loss": 0.6401, + "step": 8097 + }, + { + "epoch": 0.28, + "learning_rate": 1.6366316515664852e-05, + "loss": 0.6256, + "step": 8098 + }, + { + "epoch": 0.28, + "learning_rate": 1.636547678021453e-05, + "loss": 0.6419, + "step": 8099 + }, + { + "epoch": 0.28, + "learning_rate": 1.6364636969293426e-05, + "loss": 0.5943, + "step": 8100 + }, + { + "epoch": 0.28, + "learning_rate": 1.63637970829115e-05, + "loss": 0.6838, + "step": 8101 + }, + { + "epoch": 0.28, + "learning_rate": 1.636295712107871e-05, + "loss": 0.5847, + "step": 8102 + }, + { + "epoch": 0.28, + "learning_rate": 1.6362117083805017e-05, + "loss": 0.5692, + "step": 8103 + }, + { + "epoch": 0.28, + "learning_rate": 1.6361276971100373e-05, + "loss": 0.6138, + "step": 8104 + }, + { + "epoch": 0.28, + "learning_rate": 1.6360436782974748e-05, + "loss": 0.6284, + "step": 8105 + }, + { + "epoch": 0.28, + "learning_rate": 1.6359596519438094e-05, + "loss": 0.609, + "step": 8106 + }, + { + "epoch": 0.28, + "learning_rate": 1.6358756180500383e-05, + "loss": 0.6093, + "step": 8107 + }, + { + "epoch": 0.28, + "learning_rate": 1.635791576617157e-05, + "loss": 0.5721, + "step": 8108 + }, + { + "epoch": 0.28, + "learning_rate": 1.6357075276461625e-05, + "loss": 0.6667, + "step": 8109 + }, + { + "epoch": 0.28, + "learning_rate": 1.6356234711380513e-05, + "loss": 0.6835, + "step": 8110 + }, + { + "epoch": 0.28, + "learning_rate": 1.6355394070938192e-05, + "loss": 0.6158, + "step": 8111 + }, + { + "epoch": 0.28, + "learning_rate": 1.6354553355144637e-05, + "loss": 0.6131, + "step": 8112 + }, + { + "epoch": 0.28, + "learning_rate": 1.6353712564009815e-05, + "loss": 0.6103, + "step": 8113 + }, + { + "epoch": 0.28, + "learning_rate": 1.6352871697543692e-05, + "loss": 0.6127, + "step": 8114 + }, + { + "epoch": 0.28, + "learning_rate": 1.6352030755756237e-05, + "loss": 0.6372, + "step": 8115 + }, + { + "epoch": 0.28, + "learning_rate": 1.6351189738657426e-05, + "loss": 0.6116, + "step": 8116 + }, + { + "epoch": 0.28, + "learning_rate": 1.6350348646257224e-05, + "loss": 0.6367, + "step": 8117 + }, + { + "epoch": 0.28, + "learning_rate": 1.6349507478565608e-05, + "loss": 0.6094, + "step": 8118 + }, + { + "epoch": 0.28, + "learning_rate": 1.6348666235592546e-05, + "loss": 0.634, + "step": 8119 + }, + { + "epoch": 0.28, + "learning_rate": 1.6347824917348014e-05, + "loss": 0.6546, + "step": 8120 + }, + { + "epoch": 0.28, + "learning_rate": 1.6346983523841988e-05, + "loss": 0.6382, + "step": 8121 + }, + { + "epoch": 0.28, + "learning_rate": 1.6346142055084447e-05, + "loss": 0.6302, + "step": 8122 + }, + { + "epoch": 0.28, + "learning_rate": 1.634530051108536e-05, + "loss": 0.6917, + "step": 8123 + }, + { + "epoch": 0.28, + "learning_rate": 1.6344458891854706e-05, + "loss": 0.6047, + "step": 8124 + }, + { + "epoch": 0.28, + "learning_rate": 1.6343617197402472e-05, + "loss": 0.6168, + "step": 8125 + }, + { + "epoch": 0.28, + "learning_rate": 1.634277542773863e-05, + "loss": 0.6281, + "step": 8126 + }, + { + "epoch": 0.28, + "learning_rate": 1.634193358287316e-05, + "loss": 0.6512, + "step": 8127 + }, + { + "epoch": 0.28, + "learning_rate": 1.6341091662816048e-05, + "loss": 0.6393, + "step": 8128 + }, + { + "epoch": 0.28, + "learning_rate": 1.6340249667577268e-05, + "loss": 0.6632, + "step": 8129 + }, + { + "epoch": 0.28, + "learning_rate": 1.633940759716681e-05, + "loss": 0.6592, + "step": 8130 + }, + { + "epoch": 0.28, + "learning_rate": 1.6338565451594654e-05, + "loss": 0.6596, + "step": 8131 + }, + { + "epoch": 0.28, + "learning_rate": 1.633772323087079e-05, + "loss": 0.6414, + "step": 8132 + }, + { + "epoch": 0.28, + "learning_rate": 1.6336880935005198e-05, + "loss": 0.5967, + "step": 8133 + }, + { + "epoch": 0.28, + "learning_rate": 1.6336038564007864e-05, + "loss": 0.6307, + "step": 8134 + }, + { + "epoch": 0.28, + "learning_rate": 1.633519611788878e-05, + "loss": 0.6052, + "step": 8135 + }, + { + "epoch": 0.28, + "learning_rate": 1.633435359665793e-05, + "loss": 0.622, + "step": 8136 + }, + { + "epoch": 0.28, + "learning_rate": 1.633351100032531e-05, + "loss": 0.6712, + "step": 8137 + }, + { + "epoch": 0.28, + "learning_rate": 1.6332668328900904e-05, + "loss": 0.6662, + "step": 8138 + }, + { + "epoch": 0.28, + "learning_rate": 1.6331825582394698e-05, + "loss": 0.6198, + "step": 8139 + }, + { + "epoch": 0.28, + "learning_rate": 1.6330982760816697e-05, + "loss": 0.597, + "step": 8140 + }, + { + "epoch": 0.28, + "learning_rate": 1.6330139864176882e-05, + "loss": 0.6469, + "step": 8141 + }, + { + "epoch": 0.28, + "learning_rate": 1.6329296892485252e-05, + "loss": 0.6647, + "step": 8142 + }, + { + "epoch": 0.28, + "learning_rate": 1.6328453845751803e-05, + "loss": 0.6141, + "step": 8143 + }, + { + "epoch": 0.28, + "learning_rate": 1.6327610723986524e-05, + "loss": 0.6282, + "step": 8144 + }, + { + "epoch": 0.28, + "learning_rate": 1.632676752719942e-05, + "loss": 0.6089, + "step": 8145 + }, + { + "epoch": 0.28, + "learning_rate": 1.632592425540048e-05, + "loss": 0.5493, + "step": 8146 + }, + { + "epoch": 0.28, + "learning_rate": 1.632508090859971e-05, + "loss": 0.671, + "step": 8147 + }, + { + "epoch": 0.28, + "learning_rate": 1.63242374868071e-05, + "loss": 0.6613, + "step": 8148 + }, + { + "epoch": 0.28, + "learning_rate": 1.6323393990032656e-05, + "loss": 0.5778, + "step": 8149 + }, + { + "epoch": 0.28, + "learning_rate": 1.632255041828638e-05, + "loss": 0.6235, + "step": 8150 + }, + { + "epoch": 0.28, + "learning_rate": 1.6321706771578266e-05, + "loss": 0.6955, + "step": 8151 + }, + { + "epoch": 0.28, + "learning_rate": 1.6320863049918322e-05, + "loss": 0.6161, + "step": 8152 + }, + { + "epoch": 0.28, + "learning_rate": 1.632001925331655e-05, + "loss": 0.6184, + "step": 8153 + }, + { + "epoch": 0.28, + "learning_rate": 1.631917538178296e-05, + "loss": 0.6645, + "step": 8154 + }, + { + "epoch": 0.28, + "learning_rate": 1.631833143532755e-05, + "loss": 0.6574, + "step": 8155 + }, + { + "epoch": 0.28, + "learning_rate": 1.6317487413960328e-05, + "loss": 0.6558, + "step": 8156 + }, + { + "epoch": 0.28, + "learning_rate": 1.6316643317691298e-05, + "loss": 0.5963, + "step": 8157 + }, + { + "epoch": 0.28, + "learning_rate": 1.631579914653047e-05, + "loss": 0.6218, + "step": 8158 + }, + { + "epoch": 0.28, + "learning_rate": 1.6314954900487858e-05, + "loss": 0.6447, + "step": 8159 + }, + { + "epoch": 0.28, + "learning_rate": 1.6314110579573466e-05, + "loss": 0.6744, + "step": 8160 + }, + { + "epoch": 0.28, + "learning_rate": 1.6313266183797305e-05, + "loss": 0.5793, + "step": 8161 + }, + { + "epoch": 0.28, + "learning_rate": 1.631242171316939e-05, + "loss": 0.6586, + "step": 8162 + }, + { + "epoch": 0.28, + "learning_rate": 1.6311577167699725e-05, + "loss": 0.5962, + "step": 8163 + }, + { + "epoch": 0.28, + "learning_rate": 1.6310732547398332e-05, + "loss": 0.6702, + "step": 8164 + }, + { + "epoch": 0.28, + "learning_rate": 1.6309887852275223e-05, + "loss": 0.6715, + "step": 8165 + }, + { + "epoch": 0.28, + "learning_rate": 1.630904308234041e-05, + "loss": 0.5938, + "step": 8166 + }, + { + "epoch": 0.28, + "learning_rate": 1.6308198237603904e-05, + "loss": 0.614, + "step": 8167 + }, + { + "epoch": 0.28, + "learning_rate": 1.6307353318075736e-05, + "loss": 0.6132, + "step": 8168 + }, + { + "epoch": 0.28, + "learning_rate": 1.6306508323765912e-05, + "loss": 0.6791, + "step": 8169 + }, + { + "epoch": 0.28, + "learning_rate": 1.6305663254684455e-05, + "loss": 0.681, + "step": 8170 + }, + { + "epoch": 0.28, + "learning_rate": 1.6304818110841382e-05, + "loss": 0.6863, + "step": 8171 + }, + { + "epoch": 0.28, + "learning_rate": 1.6303972892246717e-05, + "loss": 0.5871, + "step": 8172 + }, + { + "epoch": 0.28, + "learning_rate": 1.630312759891048e-05, + "loss": 0.6711, + "step": 8173 + }, + { + "epoch": 0.28, + "learning_rate": 1.6302282230842688e-05, + "loss": 0.7095, + "step": 8174 + }, + { + "epoch": 0.28, + "learning_rate": 1.630143678805337e-05, + "loss": 0.7288, + "step": 8175 + }, + { + "epoch": 0.28, + "learning_rate": 1.630059127055255e-05, + "loss": 0.6837, + "step": 8176 + }, + { + "epoch": 0.28, + "learning_rate": 1.6299745678350245e-05, + "loss": 0.5905, + "step": 8177 + }, + { + "epoch": 0.28, + "learning_rate": 1.6298900011456487e-05, + "loss": 0.6663, + "step": 8178 + }, + { + "epoch": 0.28, + "learning_rate": 1.6298054269881305e-05, + "loss": 0.645, + "step": 8179 + }, + { + "epoch": 0.28, + "learning_rate": 1.6297208453634718e-05, + "loss": 0.5918, + "step": 8180 + }, + { + "epoch": 0.28, + "learning_rate": 1.6296362562726763e-05, + "loss": 0.6146, + "step": 8181 + }, + { + "epoch": 0.28, + "learning_rate": 1.629551659716746e-05, + "loss": 0.6172, + "step": 8182 + }, + { + "epoch": 0.28, + "learning_rate": 1.6294670556966846e-05, + "loss": 0.6153, + "step": 8183 + }, + { + "epoch": 0.28, + "learning_rate": 1.629382444213495e-05, + "loss": 0.6271, + "step": 8184 + }, + { + "epoch": 0.28, + "learning_rate": 1.6292978252681805e-05, + "loss": 0.6781, + "step": 8185 + }, + { + "epoch": 0.28, + "learning_rate": 1.629213198861744e-05, + "loss": 0.6255, + "step": 8186 + }, + { + "epoch": 0.28, + "learning_rate": 1.629128564995189e-05, + "loss": 0.607, + "step": 8187 + }, + { + "epoch": 0.28, + "learning_rate": 1.629043923669519e-05, + "loss": 0.679, + "step": 8188 + }, + { + "epoch": 0.28, + "learning_rate": 1.628959274885738e-05, + "loss": 0.6551, + "step": 8189 + }, + { + "epoch": 0.28, + "learning_rate": 1.6288746186448487e-05, + "loss": 0.6479, + "step": 8190 + }, + { + "epoch": 0.28, + "learning_rate": 1.6287899549478554e-05, + "loss": 0.6219, + "step": 8191 + }, + { + "epoch": 0.28, + "learning_rate": 1.6287052837957617e-05, + "loss": 0.6528, + "step": 8192 + }, + { + "epoch": 0.28, + "learning_rate": 1.6286206051895716e-05, + "loss": 0.6181, + "step": 8193 + }, + { + "epoch": 0.28, + "learning_rate": 1.6285359191302892e-05, + "loss": 0.6683, + "step": 8194 + }, + { + "epoch": 0.28, + "learning_rate": 1.628451225618918e-05, + "loss": 0.596, + "step": 8195 + }, + { + "epoch": 0.28, + "learning_rate": 1.628366524656463e-05, + "loss": 0.71, + "step": 8196 + }, + { + "epoch": 0.28, + "learning_rate": 1.6282818162439274e-05, + "loss": 0.6628, + "step": 8197 + }, + { + "epoch": 0.28, + "learning_rate": 1.6281971003823166e-05, + "loss": 0.6477, + "step": 8198 + }, + { + "epoch": 0.28, + "learning_rate": 1.6281123770726343e-05, + "loss": 0.6322, + "step": 8199 + }, + { + "epoch": 0.28, + "learning_rate": 1.6280276463158854e-05, + "loss": 0.6558, + "step": 8200 + }, + { + "epoch": 0.28, + "learning_rate": 1.6279429081130738e-05, + "loss": 0.6153, + "step": 8201 + }, + { + "epoch": 0.28, + "learning_rate": 1.627858162465205e-05, + "loss": 0.6831, + "step": 8202 + }, + { + "epoch": 0.28, + "learning_rate": 1.6277734093732833e-05, + "loss": 0.5911, + "step": 8203 + }, + { + "epoch": 0.28, + "learning_rate": 1.627688648838314e-05, + "loss": 0.5865, + "step": 8204 + }, + { + "epoch": 0.28, + "learning_rate": 1.6276038808613015e-05, + "loss": 0.6659, + "step": 8205 + }, + { + "epoch": 0.28, + "learning_rate": 1.627519105443251e-05, + "loss": 0.6715, + "step": 8206 + }, + { + "epoch": 0.28, + "learning_rate": 1.6274343225851678e-05, + "loss": 0.6811, + "step": 8207 + }, + { + "epoch": 0.28, + "learning_rate": 1.627349532288057e-05, + "loss": 0.6408, + "step": 8208 + }, + { + "epoch": 0.28, + "learning_rate": 1.6272647345529238e-05, + "loss": 0.5871, + "step": 8209 + }, + { + "epoch": 0.28, + "learning_rate": 1.6271799293807736e-05, + "loss": 0.6408, + "step": 8210 + }, + { + "epoch": 0.28, + "learning_rate": 1.6270951167726123e-05, + "loss": 0.62, + "step": 8211 + }, + { + "epoch": 0.28, + "learning_rate": 1.627010296729445e-05, + "loss": 0.6397, + "step": 8212 + }, + { + "epoch": 0.28, + "learning_rate": 1.6269254692522775e-05, + "loss": 0.6993, + "step": 8213 + }, + { + "epoch": 0.28, + "learning_rate": 1.626840634342115e-05, + "loss": 0.6274, + "step": 8214 + }, + { + "epoch": 0.28, + "learning_rate": 1.6267557919999647e-05, + "loss": 0.67, + "step": 8215 + }, + { + "epoch": 0.28, + "learning_rate": 1.626670942226831e-05, + "loss": 0.6389, + "step": 8216 + }, + { + "epoch": 0.28, + "learning_rate": 1.6265860850237202e-05, + "loss": 0.5989, + "step": 8217 + }, + { + "epoch": 0.28, + "learning_rate": 1.6265012203916396e-05, + "loss": 0.5683, + "step": 8218 + }, + { + "epoch": 0.28, + "learning_rate": 1.626416348331594e-05, + "loss": 0.6371, + "step": 8219 + }, + { + "epoch": 0.28, + "learning_rate": 1.62633146884459e-05, + "loss": 0.6564, + "step": 8220 + }, + { + "epoch": 0.28, + "learning_rate": 1.6262465819316345e-05, + "loss": 0.6231, + "step": 8221 + }, + { + "epoch": 0.28, + "learning_rate": 1.6261616875937337e-05, + "loss": 0.6622, + "step": 8222 + }, + { + "epoch": 0.28, + "learning_rate": 1.6260767858318934e-05, + "loss": 0.6184, + "step": 8223 + }, + { + "epoch": 0.28, + "learning_rate": 1.6259918766471216e-05, + "loss": 0.6559, + "step": 8224 + }, + { + "epoch": 0.28, + "learning_rate": 1.6259069600404234e-05, + "loss": 0.6088, + "step": 8225 + }, + { + "epoch": 0.29, + "learning_rate": 1.625822036012807e-05, + "loss": 0.607, + "step": 8226 + }, + { + "epoch": 0.29, + "learning_rate": 1.6257371045652784e-05, + "loss": 0.6245, + "step": 8227 + }, + { + "epoch": 0.29, + "learning_rate": 1.625652165698845e-05, + "loss": 0.6457, + "step": 8228 + }, + { + "epoch": 0.29, + "learning_rate": 1.6255672194145136e-05, + "loss": 0.6252, + "step": 8229 + }, + { + "epoch": 0.29, + "learning_rate": 1.6254822657132917e-05, + "loss": 0.6222, + "step": 8230 + }, + { + "epoch": 0.29, + "learning_rate": 1.625397304596186e-05, + "loss": 0.6337, + "step": 8231 + }, + { + "epoch": 0.29, + "learning_rate": 1.6253123360642043e-05, + "loss": 0.6531, + "step": 8232 + }, + { + "epoch": 0.29, + "learning_rate": 1.6252273601183538e-05, + "loss": 0.6185, + "step": 8233 + }, + { + "epoch": 0.29, + "learning_rate": 1.625142376759642e-05, + "loss": 0.6432, + "step": 8234 + }, + { + "epoch": 0.29, + "learning_rate": 1.6250573859890768e-05, + "loss": 0.5832, + "step": 8235 + }, + { + "epoch": 0.29, + "learning_rate": 1.624972387807665e-05, + "loss": 0.6229, + "step": 8236 + }, + { + "epoch": 0.29, + "learning_rate": 1.6248873822164154e-05, + "loss": 0.5955, + "step": 8237 + }, + { + "epoch": 0.29, + "learning_rate": 1.624802369216335e-05, + "loss": 0.6419, + "step": 8238 + }, + { + "epoch": 0.29, + "learning_rate": 1.6247173488084327e-05, + "loss": 0.6439, + "step": 8239 + }, + { + "epoch": 0.29, + "learning_rate": 1.6246323209937157e-05, + "loss": 0.6447, + "step": 8240 + }, + { + "epoch": 0.29, + "learning_rate": 1.6245472857731924e-05, + "loss": 0.6102, + "step": 8241 + }, + { + "epoch": 0.29, + "learning_rate": 1.6244622431478706e-05, + "loss": 0.6074, + "step": 8242 + }, + { + "epoch": 0.29, + "learning_rate": 1.6243771931187594e-05, + "loss": 0.6463, + "step": 8243 + }, + { + "epoch": 0.29, + "learning_rate": 1.624292135686867e-05, + "loss": 0.617, + "step": 8244 + }, + { + "epoch": 0.29, + "learning_rate": 1.624207070853201e-05, + "loss": 0.6578, + "step": 8245 + }, + { + "epoch": 0.29, + "learning_rate": 1.6241219986187706e-05, + "loss": 0.5577, + "step": 8246 + }, + { + "epoch": 0.29, + "learning_rate": 1.6240369189845847e-05, + "loss": 0.621, + "step": 8247 + }, + { + "epoch": 0.29, + "learning_rate": 1.6239518319516513e-05, + "loss": 0.6058, + "step": 8248 + }, + { + "epoch": 0.29, + "learning_rate": 1.62386673752098e-05, + "loss": 0.5958, + "step": 8249 + }, + { + "epoch": 0.29, + "learning_rate": 1.623781635693579e-05, + "loss": 0.6554, + "step": 8250 + }, + { + "epoch": 0.29, + "learning_rate": 1.6236965264704577e-05, + "loss": 0.6143, + "step": 8251 + }, + { + "epoch": 0.29, + "learning_rate": 1.6236114098526256e-05, + "loss": 0.6122, + "step": 8252 + }, + { + "epoch": 0.29, + "learning_rate": 1.623526285841091e-05, + "loss": 0.6759, + "step": 8253 + }, + { + "epoch": 0.29, + "learning_rate": 1.6234411544368632e-05, + "loss": 0.6408, + "step": 8254 + }, + { + "epoch": 0.29, + "learning_rate": 1.6233560156409523e-05, + "loss": 0.6582, + "step": 8255 + }, + { + "epoch": 0.29, + "learning_rate": 1.6232708694543672e-05, + "loss": 0.6105, + "step": 8256 + }, + { + "epoch": 0.29, + "learning_rate": 1.6231857158781173e-05, + "loss": 0.6563, + "step": 8257 + }, + { + "epoch": 0.29, + "learning_rate": 1.623100554913213e-05, + "loss": 0.6428, + "step": 8258 + }, + { + "epoch": 0.29, + "learning_rate": 1.623015386560663e-05, + "loss": 0.6245, + "step": 8259 + }, + { + "epoch": 0.29, + "learning_rate": 1.622930210821477e-05, + "loss": 0.6143, + "step": 8260 + }, + { + "epoch": 0.29, + "learning_rate": 1.6228450276966657e-05, + "loss": 0.6807, + "step": 8261 + }, + { + "epoch": 0.29, + "learning_rate": 1.6227598371872392e-05, + "loss": 0.6306, + "step": 8262 + }, + { + "epoch": 0.29, + "learning_rate": 1.6226746392942065e-05, + "loss": 0.6256, + "step": 8263 + }, + { + "epoch": 0.29, + "learning_rate": 1.6225894340185782e-05, + "loss": 0.6505, + "step": 8264 + }, + { + "epoch": 0.29, + "learning_rate": 1.6225042213613645e-05, + "loss": 0.6198, + "step": 8265 + }, + { + "epoch": 0.29, + "learning_rate": 1.6224190013235763e-05, + "loss": 0.65, + "step": 8266 + }, + { + "epoch": 0.29, + "learning_rate": 1.622333773906223e-05, + "loss": 0.7053, + "step": 8267 + }, + { + "epoch": 0.29, + "learning_rate": 1.622248539110316e-05, + "loss": 0.6433, + "step": 8268 + }, + { + "epoch": 0.29, + "learning_rate": 1.622163296936865e-05, + "loss": 0.6244, + "step": 8269 + }, + { + "epoch": 0.29, + "learning_rate": 1.6220780473868812e-05, + "loss": 0.6631, + "step": 8270 + }, + { + "epoch": 0.29, + "learning_rate": 1.6219927904613753e-05, + "loss": 0.6333, + "step": 8271 + }, + { + "epoch": 0.29, + "learning_rate": 1.621907526161358e-05, + "loss": 0.6711, + "step": 8272 + }, + { + "epoch": 0.29, + "learning_rate": 1.6218222544878402e-05, + "loss": 0.621, + "step": 8273 + }, + { + "epoch": 0.29, + "learning_rate": 1.621736975441833e-05, + "loss": 0.6296, + "step": 8274 + }, + { + "epoch": 0.29, + "learning_rate": 1.6216516890243476e-05, + "loss": 0.6538, + "step": 8275 + }, + { + "epoch": 0.29, + "learning_rate": 1.621566395236395e-05, + "loss": 0.6755, + "step": 8276 + }, + { + "epoch": 0.29, + "learning_rate": 1.6214810940789862e-05, + "loss": 0.5693, + "step": 8277 + }, + { + "epoch": 0.29, + "learning_rate": 1.6213957855531334e-05, + "loss": 0.669, + "step": 8278 + }, + { + "epoch": 0.29, + "learning_rate": 1.621310469659847e-05, + "loss": 0.5954, + "step": 8279 + }, + { + "epoch": 0.29, + "learning_rate": 1.6212251464001392e-05, + "loss": 0.5718, + "step": 8280 + }, + { + "epoch": 0.29, + "learning_rate": 1.6211398157750213e-05, + "loss": 0.5975, + "step": 8281 + }, + { + "epoch": 0.29, + "learning_rate": 1.6210544777855052e-05, + "loss": 0.6284, + "step": 8282 + }, + { + "epoch": 0.29, + "learning_rate": 1.620969132432603e-05, + "loss": 0.6308, + "step": 8283 + }, + { + "epoch": 0.29, + "learning_rate": 1.6208837797173255e-05, + "loss": 0.6407, + "step": 8284 + }, + { + "epoch": 0.29, + "learning_rate": 1.620798419640686e-05, + "loss": 0.6456, + "step": 8285 + }, + { + "epoch": 0.29, + "learning_rate": 1.6207130522036954e-05, + "loss": 0.6151, + "step": 8286 + }, + { + "epoch": 0.29, + "learning_rate": 1.620627677407367e-05, + "loss": 0.5913, + "step": 8287 + }, + { + "epoch": 0.29, + "learning_rate": 1.620542295252712e-05, + "loss": 0.66, + "step": 8288 + }, + { + "epoch": 0.29, + "learning_rate": 1.620456905740743e-05, + "loss": 0.616, + "step": 8289 + }, + { + "epoch": 0.29, + "learning_rate": 1.620371508872473e-05, + "loss": 0.71, + "step": 8290 + }, + { + "epoch": 0.29, + "learning_rate": 1.6202861046489133e-05, + "loss": 0.6259, + "step": 8291 + }, + { + "epoch": 0.29, + "learning_rate": 1.6202006930710775e-05, + "loss": 0.6497, + "step": 8292 + }, + { + "epoch": 0.29, + "learning_rate": 1.620115274139978e-05, + "loss": 0.605, + "step": 8293 + }, + { + "epoch": 0.29, + "learning_rate": 1.620029847856627e-05, + "loss": 0.6556, + "step": 8294 + }, + { + "epoch": 0.29, + "learning_rate": 1.6199444142220382e-05, + "loss": 0.5994, + "step": 8295 + }, + { + "epoch": 0.29, + "learning_rate": 1.6198589732372243e-05, + "loss": 0.6477, + "step": 8296 + }, + { + "epoch": 0.29, + "learning_rate": 1.619773524903198e-05, + "loss": 0.6831, + "step": 8297 + }, + { + "epoch": 0.29, + "learning_rate": 1.6196880692209723e-05, + "loss": 0.6739, + "step": 8298 + }, + { + "epoch": 0.29, + "learning_rate": 1.619602606191561e-05, + "loss": 0.5811, + "step": 8299 + }, + { + "epoch": 0.29, + "learning_rate": 1.6195171358159768e-05, + "loss": 0.5595, + "step": 8300 + }, + { + "epoch": 0.29, + "learning_rate": 1.6194316580952335e-05, + "loss": 0.6556, + "step": 8301 + }, + { + "epoch": 0.29, + "learning_rate": 1.6193461730303442e-05, + "loss": 0.6456, + "step": 8302 + }, + { + "epoch": 0.29, + "learning_rate": 1.6192606806223223e-05, + "loss": 0.6279, + "step": 8303 + }, + { + "epoch": 0.29, + "learning_rate": 1.6191751808721815e-05, + "loss": 0.6427, + "step": 8304 + }, + { + "epoch": 0.29, + "learning_rate": 1.6190896737809363e-05, + "loss": 0.6261, + "step": 8305 + }, + { + "epoch": 0.29, + "learning_rate": 1.6190041593495998e-05, + "loss": 0.6424, + "step": 8306 + }, + { + "epoch": 0.29, + "learning_rate": 1.6189186375791855e-05, + "loss": 0.6725, + "step": 8307 + }, + { + "epoch": 0.29, + "learning_rate": 1.618833108470708e-05, + "loss": 0.6418, + "step": 8308 + }, + { + "epoch": 0.29, + "learning_rate": 1.6187475720251812e-05, + "loss": 0.6635, + "step": 8309 + }, + { + "epoch": 0.29, + "learning_rate": 1.618662028243619e-05, + "loss": 0.6664, + "step": 8310 + }, + { + "epoch": 0.29, + "learning_rate": 1.618576477127036e-05, + "loss": 0.6533, + "step": 8311 + }, + { + "epoch": 0.29, + "learning_rate": 1.6184909186764466e-05, + "loss": 0.6782, + "step": 8312 + }, + { + "epoch": 0.29, + "learning_rate": 1.6184053528928648e-05, + "loss": 0.6866, + "step": 8313 + }, + { + "epoch": 0.29, + "learning_rate": 1.618319779777305e-05, + "loss": 0.6734, + "step": 8314 + }, + { + "epoch": 0.29, + "learning_rate": 1.6182341993307824e-05, + "loss": 0.668, + "step": 8315 + }, + { + "epoch": 0.29, + "learning_rate": 1.618148611554311e-05, + "loss": 0.6288, + "step": 8316 + }, + { + "epoch": 0.29, + "learning_rate": 1.6180630164489063e-05, + "loss": 0.6247, + "step": 8317 + }, + { + "epoch": 0.29, + "learning_rate": 1.6179774140155824e-05, + "loss": 0.5951, + "step": 8318 + }, + { + "epoch": 0.29, + "learning_rate": 1.617891804255354e-05, + "loss": 0.6301, + "step": 8319 + }, + { + "epoch": 0.29, + "learning_rate": 1.6178061871692374e-05, + "loss": 0.6889, + "step": 8320 + }, + { + "epoch": 0.29, + "learning_rate": 1.6177205627582467e-05, + "loss": 0.6315, + "step": 8321 + }, + { + "epoch": 0.29, + "learning_rate": 1.6176349310233972e-05, + "loss": 0.6185, + "step": 8322 + }, + { + "epoch": 0.29, + "learning_rate": 1.6175492919657047e-05, + "loss": 0.6645, + "step": 8323 + }, + { + "epoch": 0.29, + "learning_rate": 1.6174636455861837e-05, + "loss": 0.5885, + "step": 8324 + }, + { + "epoch": 0.29, + "learning_rate": 1.61737799188585e-05, + "loss": 0.6144, + "step": 8325 + }, + { + "epoch": 0.29, + "learning_rate": 1.6172923308657195e-05, + "loss": 0.6207, + "step": 8326 + }, + { + "epoch": 0.29, + "learning_rate": 1.6172066625268074e-05, + "loss": 0.6642, + "step": 8327 + }, + { + "epoch": 0.29, + "learning_rate": 1.6171209868701297e-05, + "loss": 0.6125, + "step": 8328 + }, + { + "epoch": 0.29, + "learning_rate": 1.6170353038967017e-05, + "loss": 0.6316, + "step": 8329 + }, + { + "epoch": 0.29, + "learning_rate": 1.6169496136075396e-05, + "loss": 0.658, + "step": 8330 + }, + { + "epoch": 0.29, + "learning_rate": 1.6168639160036595e-05, + "loss": 0.6788, + "step": 8331 + }, + { + "epoch": 0.29, + "learning_rate": 1.6167782110860775e-05, + "loss": 0.5938, + "step": 8332 + }, + { + "epoch": 0.29, + "learning_rate": 1.6166924988558097e-05, + "loss": 0.6189, + "step": 8333 + }, + { + "epoch": 0.29, + "learning_rate": 1.616606779313872e-05, + "loss": 0.6447, + "step": 8334 + }, + { + "epoch": 0.29, + "learning_rate": 1.616521052461281e-05, + "loss": 0.6113, + "step": 8335 + }, + { + "epoch": 0.29, + "learning_rate": 1.616435318299053e-05, + "loss": 0.6751, + "step": 8336 + }, + { + "epoch": 0.29, + "learning_rate": 1.6163495768282046e-05, + "loss": 0.6131, + "step": 8337 + }, + { + "epoch": 0.29, + "learning_rate": 1.616263828049752e-05, + "loss": 0.6102, + "step": 8338 + }, + { + "epoch": 0.29, + "learning_rate": 1.616178071964712e-05, + "loss": 0.6669, + "step": 8339 + }, + { + "epoch": 0.29, + "learning_rate": 1.616092308574102e-05, + "loss": 0.632, + "step": 8340 + }, + { + "epoch": 0.29, + "learning_rate": 1.616006537878938e-05, + "loss": 0.6449, + "step": 8341 + }, + { + "epoch": 0.29, + "learning_rate": 1.6159207598802375e-05, + "loss": 0.6921, + "step": 8342 + }, + { + "epoch": 0.29, + "learning_rate": 1.615834974579017e-05, + "loss": 0.6544, + "step": 8343 + }, + { + "epoch": 0.29, + "learning_rate": 1.615749181976294e-05, + "loss": 0.6406, + "step": 8344 + }, + { + "epoch": 0.29, + "learning_rate": 1.6156633820730854e-05, + "loss": 0.6402, + "step": 8345 + }, + { + "epoch": 0.29, + "learning_rate": 1.6155775748704088e-05, + "loss": 0.6167, + "step": 8346 + }, + { + "epoch": 0.29, + "learning_rate": 1.615491760369281e-05, + "loss": 0.6301, + "step": 8347 + }, + { + "epoch": 0.29, + "learning_rate": 1.6154059385707203e-05, + "loss": 0.6058, + "step": 8348 + }, + { + "epoch": 0.29, + "learning_rate": 1.6153201094757433e-05, + "loss": 0.6144, + "step": 8349 + }, + { + "epoch": 0.29, + "learning_rate": 1.6152342730853677e-05, + "loss": 0.6807, + "step": 8350 + }, + { + "epoch": 0.29, + "learning_rate": 1.615148429400612e-05, + "loss": 0.5992, + "step": 8351 + }, + { + "epoch": 0.29, + "learning_rate": 1.6150625784224935e-05, + "loss": 0.6073, + "step": 8352 + }, + { + "epoch": 0.29, + "learning_rate": 1.6149767201520297e-05, + "loss": 0.5958, + "step": 8353 + }, + { + "epoch": 0.29, + "learning_rate": 1.6148908545902396e-05, + "loss": 0.6226, + "step": 8354 + }, + { + "epoch": 0.29, + "learning_rate": 1.6148049817381403e-05, + "loss": 0.6486, + "step": 8355 + }, + { + "epoch": 0.29, + "learning_rate": 1.6147191015967498e-05, + "loss": 0.6541, + "step": 8356 + }, + { + "epoch": 0.29, + "learning_rate": 1.6146332141670874e-05, + "loss": 0.6543, + "step": 8357 + }, + { + "epoch": 0.29, + "learning_rate": 1.61454731945017e-05, + "loss": 0.6031, + "step": 8358 + }, + { + "epoch": 0.29, + "learning_rate": 1.6144614174470172e-05, + "loss": 0.6029, + "step": 8359 + }, + { + "epoch": 0.29, + "learning_rate": 1.6143755081586467e-05, + "loss": 0.6308, + "step": 8360 + }, + { + "epoch": 0.29, + "learning_rate": 1.614289591586078e-05, + "loss": 0.6094, + "step": 8361 + }, + { + "epoch": 0.29, + "learning_rate": 1.6142036677303283e-05, + "loss": 0.6498, + "step": 8362 + }, + { + "epoch": 0.29, + "learning_rate": 1.6141177365924177e-05, + "loss": 0.638, + "step": 8363 + }, + { + "epoch": 0.29, + "learning_rate": 1.614031798173364e-05, + "loss": 0.6368, + "step": 8364 + }, + { + "epoch": 0.29, + "learning_rate": 1.613945852474187e-05, + "loss": 0.649, + "step": 8365 + }, + { + "epoch": 0.29, + "learning_rate": 1.613859899495905e-05, + "loss": 0.6454, + "step": 8366 + }, + { + "epoch": 0.29, + "learning_rate": 1.6137739392395375e-05, + "loss": 0.6224, + "step": 8367 + }, + { + "epoch": 0.29, + "learning_rate": 1.6136879717061034e-05, + "loss": 0.5716, + "step": 8368 + }, + { + "epoch": 0.29, + "learning_rate": 1.6136019968966225e-05, + "loss": 0.6236, + "step": 8369 + }, + { + "epoch": 0.29, + "learning_rate": 1.613516014812113e-05, + "loss": 0.6942, + "step": 8370 + }, + { + "epoch": 0.29, + "learning_rate": 1.6134300254535958e-05, + "loss": 0.598, + "step": 8371 + }, + { + "epoch": 0.29, + "learning_rate": 1.6133440288220893e-05, + "loss": 0.6812, + "step": 8372 + }, + { + "epoch": 0.29, + "learning_rate": 1.6132580249186133e-05, + "loss": 0.5564, + "step": 8373 + }, + { + "epoch": 0.29, + "learning_rate": 1.6131720137441878e-05, + "loss": 0.6742, + "step": 8374 + }, + { + "epoch": 0.29, + "learning_rate": 1.6130859952998324e-05, + "loss": 0.6243, + "step": 8375 + }, + { + "epoch": 0.29, + "learning_rate": 1.612999969586567e-05, + "loss": 0.6111, + "step": 8376 + }, + { + "epoch": 0.29, + "learning_rate": 1.6129139366054115e-05, + "loss": 0.6265, + "step": 8377 + }, + { + "epoch": 0.29, + "learning_rate": 1.6128278963573858e-05, + "loss": 0.6676, + "step": 8378 + }, + { + "epoch": 0.29, + "learning_rate": 1.61274184884351e-05, + "loss": 0.6519, + "step": 8379 + }, + { + "epoch": 0.29, + "learning_rate": 1.612655794064805e-05, + "loss": 0.6416, + "step": 8380 + }, + { + "epoch": 0.29, + "learning_rate": 1.6125697320222902e-05, + "loss": 0.6415, + "step": 8381 + }, + { + "epoch": 0.29, + "learning_rate": 1.6124836627169866e-05, + "loss": 0.6477, + "step": 8382 + }, + { + "epoch": 0.29, + "learning_rate": 1.612397586149914e-05, + "loss": 0.6094, + "step": 8383 + }, + { + "epoch": 0.29, + "learning_rate": 1.6123115023220933e-05, + "loss": 0.6227, + "step": 8384 + }, + { + "epoch": 0.29, + "learning_rate": 1.6122254112345457e-05, + "loss": 0.6336, + "step": 8385 + }, + { + "epoch": 0.29, + "learning_rate": 1.612139312888291e-05, + "loss": 0.6291, + "step": 8386 + }, + { + "epoch": 0.29, + "learning_rate": 1.6120532072843505e-05, + "loss": 0.6688, + "step": 8387 + }, + { + "epoch": 0.29, + "learning_rate": 1.6119670944237448e-05, + "loss": 0.6314, + "step": 8388 + }, + { + "epoch": 0.29, + "learning_rate": 1.6118809743074954e-05, + "loss": 0.6103, + "step": 8389 + }, + { + "epoch": 0.29, + "learning_rate": 1.6117948469366226e-05, + "loss": 0.6504, + "step": 8390 + }, + { + "epoch": 0.29, + "learning_rate": 1.6117087123121483e-05, + "loss": 0.6423, + "step": 8391 + }, + { + "epoch": 0.29, + "learning_rate": 1.6116225704350933e-05, + "loss": 0.6472, + "step": 8392 + }, + { + "epoch": 0.29, + "learning_rate": 1.6115364213064788e-05, + "loss": 0.656, + "step": 8393 + }, + { + "epoch": 0.29, + "learning_rate": 1.6114502649273263e-05, + "loss": 0.6088, + "step": 8394 + }, + { + "epoch": 0.29, + "learning_rate": 1.611364101298658e-05, + "loss": 0.5975, + "step": 8395 + }, + { + "epoch": 0.29, + "learning_rate": 1.6112779304214944e-05, + "loss": 0.5862, + "step": 8396 + }, + { + "epoch": 0.29, + "learning_rate": 1.611191752296858e-05, + "loss": 0.6508, + "step": 8397 + }, + { + "epoch": 0.29, + "learning_rate": 1.6111055669257702e-05, + "loss": 0.6312, + "step": 8398 + }, + { + "epoch": 0.29, + "learning_rate": 1.611019374309253e-05, + "loss": 0.6655, + "step": 8399 + }, + { + "epoch": 0.29, + "learning_rate": 1.6109331744483278e-05, + "loss": 0.6267, + "step": 8400 + }, + { + "epoch": 0.29, + "learning_rate": 1.610846967344017e-05, + "loss": 0.5996, + "step": 8401 + }, + { + "epoch": 0.29, + "learning_rate": 1.610760752997343e-05, + "loss": 0.6052, + "step": 8402 + }, + { + "epoch": 0.29, + "learning_rate": 1.6106745314093274e-05, + "loss": 0.6528, + "step": 8403 + }, + { + "epoch": 0.29, + "learning_rate": 1.6105883025809925e-05, + "loss": 0.6144, + "step": 8404 + }, + { + "epoch": 0.29, + "learning_rate": 1.610502066513361e-05, + "loss": 0.6449, + "step": 8405 + }, + { + "epoch": 0.29, + "learning_rate": 1.6104158232074555e-05, + "loss": 0.6166, + "step": 8406 + }, + { + "epoch": 0.29, + "learning_rate": 1.610329572664298e-05, + "loss": 0.6202, + "step": 8407 + }, + { + "epoch": 0.29, + "learning_rate": 1.6102433148849117e-05, + "loss": 0.6128, + "step": 8408 + }, + { + "epoch": 0.29, + "learning_rate": 1.6101570498703184e-05, + "loss": 0.6698, + "step": 8409 + }, + { + "epoch": 0.29, + "learning_rate": 1.610070777621542e-05, + "loss": 0.6275, + "step": 8410 + }, + { + "epoch": 0.29, + "learning_rate": 1.6099844981396044e-05, + "loss": 0.636, + "step": 8411 + }, + { + "epoch": 0.29, + "learning_rate": 1.609898211425529e-05, + "loss": 0.6345, + "step": 8412 + }, + { + "epoch": 0.29, + "learning_rate": 1.6098119174803385e-05, + "loss": 0.6075, + "step": 8413 + }, + { + "epoch": 0.29, + "learning_rate": 1.6097256163050568e-05, + "loss": 0.6459, + "step": 8414 + }, + { + "epoch": 0.29, + "learning_rate": 1.6096393079007064e-05, + "loss": 0.6596, + "step": 8415 + }, + { + "epoch": 0.29, + "learning_rate": 1.6095529922683108e-05, + "loss": 0.5957, + "step": 8416 + }, + { + "epoch": 0.29, + "learning_rate": 1.6094666694088935e-05, + "loss": 0.6858, + "step": 8417 + }, + { + "epoch": 0.29, + "learning_rate": 1.6093803393234778e-05, + "loss": 0.5846, + "step": 8418 + }, + { + "epoch": 0.29, + "learning_rate": 1.6092940020130872e-05, + "loss": 0.6153, + "step": 8419 + }, + { + "epoch": 0.29, + "learning_rate": 1.6092076574787453e-05, + "loss": 0.7032, + "step": 8420 + }, + { + "epoch": 0.29, + "learning_rate": 1.6091213057214766e-05, + "loss": 0.5707, + "step": 8421 + }, + { + "epoch": 0.29, + "learning_rate": 1.6090349467423038e-05, + "loss": 0.6473, + "step": 8422 + }, + { + "epoch": 0.29, + "learning_rate": 1.6089485805422513e-05, + "loss": 0.627, + "step": 8423 + }, + { + "epoch": 0.29, + "learning_rate": 1.6088622071223433e-05, + "loss": 0.6092, + "step": 8424 + }, + { + "epoch": 0.29, + "learning_rate": 1.6087758264836032e-05, + "loss": 0.5783, + "step": 8425 + }, + { + "epoch": 0.29, + "learning_rate": 1.6086894386270558e-05, + "loss": 0.6421, + "step": 8426 + }, + { + "epoch": 0.29, + "learning_rate": 1.608603043553725e-05, + "loss": 0.6207, + "step": 8427 + }, + { + "epoch": 0.29, + "learning_rate": 1.608516641264635e-05, + "loss": 0.6003, + "step": 8428 + }, + { + "epoch": 0.29, + "learning_rate": 1.608430231760811e-05, + "loss": 0.5959, + "step": 8429 + }, + { + "epoch": 0.29, + "learning_rate": 1.6083438150432767e-05, + "loss": 0.655, + "step": 8430 + }, + { + "epoch": 0.29, + "learning_rate": 1.6082573911130567e-05, + "loss": 0.655, + "step": 8431 + }, + { + "epoch": 0.29, + "learning_rate": 1.6081709599711765e-05, + "loss": 0.6236, + "step": 8432 + }, + { + "epoch": 0.29, + "learning_rate": 1.60808452161866e-05, + "loss": 0.6568, + "step": 8433 + }, + { + "epoch": 0.29, + "learning_rate": 1.6079980760565317e-05, + "loss": 0.6106, + "step": 8434 + }, + { + "epoch": 0.29, + "learning_rate": 1.6079116232858173e-05, + "loss": 0.6334, + "step": 8435 + }, + { + "epoch": 0.29, + "learning_rate": 1.6078251633075417e-05, + "loss": 0.6641, + "step": 8436 + }, + { + "epoch": 0.29, + "learning_rate": 1.60773869612273e-05, + "loss": 0.6867, + "step": 8437 + }, + { + "epoch": 0.29, + "learning_rate": 1.6076522217324075e-05, + "loss": 0.6155, + "step": 8438 + }, + { + "epoch": 0.29, + "learning_rate": 1.607565740137599e-05, + "loss": 0.6202, + "step": 8439 + }, + { + "epoch": 0.29, + "learning_rate": 1.60747925133933e-05, + "loss": 0.6393, + "step": 8440 + }, + { + "epoch": 0.29, + "learning_rate": 1.6073927553386258e-05, + "loss": 0.6736, + "step": 8441 + }, + { + "epoch": 0.29, + "learning_rate": 1.6073062521365126e-05, + "loss": 0.6268, + "step": 8442 + }, + { + "epoch": 0.29, + "learning_rate": 1.607219741734015e-05, + "loss": 0.6114, + "step": 8443 + }, + { + "epoch": 0.29, + "learning_rate": 1.6071332241321595e-05, + "loss": 0.6904, + "step": 8444 + }, + { + "epoch": 0.29, + "learning_rate": 1.6070466993319717e-05, + "loss": 0.6587, + "step": 8445 + }, + { + "epoch": 0.29, + "learning_rate": 1.606960167334477e-05, + "loss": 0.6383, + "step": 8446 + }, + { + "epoch": 0.29, + "learning_rate": 1.606873628140702e-05, + "loss": 0.6195, + "step": 8447 + }, + { + "epoch": 0.29, + "learning_rate": 1.606787081751673e-05, + "loss": 0.6349, + "step": 8448 + }, + { + "epoch": 0.29, + "learning_rate": 1.6067005281684145e-05, + "loss": 0.6915, + "step": 8449 + }, + { + "epoch": 0.29, + "learning_rate": 1.6066139673919544e-05, + "loss": 0.6387, + "step": 8450 + }, + { + "epoch": 0.29, + "learning_rate": 1.6065273994233185e-05, + "loss": 0.6451, + "step": 8451 + }, + { + "epoch": 0.29, + "learning_rate": 1.6064408242635325e-05, + "loss": 0.6732, + "step": 8452 + }, + { + "epoch": 0.29, + "learning_rate": 1.6063542419136237e-05, + "loss": 0.6031, + "step": 8453 + }, + { + "epoch": 0.29, + "learning_rate": 1.606267652374618e-05, + "loss": 0.6114, + "step": 8454 + }, + { + "epoch": 0.29, + "learning_rate": 1.6061810556475425e-05, + "loss": 0.6244, + "step": 8455 + }, + { + "epoch": 0.29, + "learning_rate": 1.6060944517334237e-05, + "loss": 0.5949, + "step": 8456 + }, + { + "epoch": 0.29, + "learning_rate": 1.6060078406332888e-05, + "loss": 0.6989, + "step": 8457 + }, + { + "epoch": 0.29, + "learning_rate": 1.605921222348164e-05, + "loss": 0.6243, + "step": 8458 + }, + { + "epoch": 0.29, + "learning_rate": 1.6058345968790767e-05, + "loss": 0.6172, + "step": 8459 + }, + { + "epoch": 0.29, + "learning_rate": 1.6057479642270538e-05, + "loss": 0.5963, + "step": 8460 + }, + { + "epoch": 0.29, + "learning_rate": 1.605661324393123e-05, + "loss": 0.631, + "step": 8461 + }, + { + "epoch": 0.29, + "learning_rate": 1.6055746773783102e-05, + "loss": 0.6607, + "step": 8462 + }, + { + "epoch": 0.29, + "learning_rate": 1.6054880231836444e-05, + "loss": 0.6065, + "step": 8463 + }, + { + "epoch": 0.29, + "learning_rate": 1.6054013618101515e-05, + "loss": 0.6292, + "step": 8464 + }, + { + "epoch": 0.29, + "learning_rate": 1.6053146932588597e-05, + "loss": 0.6129, + "step": 8465 + }, + { + "epoch": 0.29, + "learning_rate": 1.6052280175307967e-05, + "loss": 0.6217, + "step": 8466 + }, + { + "epoch": 0.29, + "learning_rate": 1.60514133462699e-05, + "loss": 0.6098, + "step": 8467 + }, + { + "epoch": 0.29, + "learning_rate": 1.605054644548467e-05, + "loss": 0.6564, + "step": 8468 + }, + { + "epoch": 0.29, + "learning_rate": 1.604967947296256e-05, + "loss": 0.6022, + "step": 8469 + }, + { + "epoch": 0.29, + "learning_rate": 1.6048812428713848e-05, + "loss": 0.6144, + "step": 8470 + }, + { + "epoch": 0.29, + "learning_rate": 1.604794531274881e-05, + "loss": 0.6713, + "step": 8471 + }, + { + "epoch": 0.29, + "learning_rate": 1.604707812507773e-05, + "loss": 0.6304, + "step": 8472 + }, + { + "epoch": 0.29, + "learning_rate": 1.604621086571089e-05, + "loss": 0.6301, + "step": 8473 + }, + { + "epoch": 0.29, + "learning_rate": 1.604534353465857e-05, + "loss": 0.5976, + "step": 8474 + }, + { + "epoch": 0.29, + "learning_rate": 1.604447613193106e-05, + "loss": 0.6292, + "step": 8475 + }, + { + "epoch": 0.29, + "learning_rate": 1.6043608657538638e-05, + "loss": 0.6138, + "step": 8476 + }, + { + "epoch": 0.29, + "learning_rate": 1.6042741111491583e-05, + "loss": 0.6475, + "step": 8477 + }, + { + "epoch": 0.29, + "learning_rate": 1.6041873493800194e-05, + "loss": 0.644, + "step": 8478 + }, + { + "epoch": 0.29, + "learning_rate": 1.604100580447475e-05, + "loss": 0.6122, + "step": 8479 + }, + { + "epoch": 0.29, + "learning_rate": 1.6040138043525543e-05, + "loss": 0.6361, + "step": 8480 + }, + { + "epoch": 0.29, + "learning_rate": 1.6039270210962855e-05, + "loss": 0.628, + "step": 8481 + }, + { + "epoch": 0.29, + "learning_rate": 1.603840230679698e-05, + "loss": 0.6848, + "step": 8482 + }, + { + "epoch": 0.29, + "learning_rate": 1.603753433103821e-05, + "loss": 0.6256, + "step": 8483 + }, + { + "epoch": 0.29, + "learning_rate": 1.6036666283696832e-05, + "loss": 0.663, + "step": 8484 + }, + { + "epoch": 0.29, + "learning_rate": 1.6035798164783132e-05, + "loss": 0.6775, + "step": 8485 + }, + { + "epoch": 0.29, + "learning_rate": 1.6034929974307417e-05, + "loss": 0.5744, + "step": 8486 + }, + { + "epoch": 0.29, + "learning_rate": 1.6034061712279973e-05, + "loss": 0.6789, + "step": 8487 + }, + { + "epoch": 0.29, + "learning_rate": 1.603319337871109e-05, + "loss": 0.5675, + "step": 8488 + }, + { + "epoch": 0.29, + "learning_rate": 1.6032324973611072e-05, + "loss": 0.6305, + "step": 8489 + }, + { + "epoch": 0.29, + "learning_rate": 1.6031456496990206e-05, + "loss": 0.6686, + "step": 8490 + }, + { + "epoch": 0.29, + "learning_rate": 1.6030587948858796e-05, + "loss": 0.6364, + "step": 8491 + }, + { + "epoch": 0.29, + "learning_rate": 1.6029719329227136e-05, + "loss": 0.6537, + "step": 8492 + }, + { + "epoch": 0.29, + "learning_rate": 1.6028850638105527e-05, + "loss": 0.5896, + "step": 8493 + }, + { + "epoch": 0.29, + "learning_rate": 1.6027981875504267e-05, + "loss": 0.633, + "step": 8494 + }, + { + "epoch": 0.29, + "learning_rate": 1.6027113041433657e-05, + "loss": 0.6763, + "step": 8495 + }, + { + "epoch": 0.29, + "learning_rate": 1.6026244135903993e-05, + "loss": 0.6118, + "step": 8496 + }, + { + "epoch": 0.29, + "learning_rate": 1.6025375158925586e-05, + "loss": 0.6585, + "step": 8497 + }, + { + "epoch": 0.29, + "learning_rate": 1.602450611050873e-05, + "loss": 0.6542, + "step": 8498 + }, + { + "epoch": 0.29, + "learning_rate": 1.6023636990663737e-05, + "loss": 0.6252, + "step": 8499 + }, + { + "epoch": 0.29, + "learning_rate": 1.6022767799400908e-05, + "loss": 0.6174, + "step": 8500 + }, + { + "epoch": 0.29, + "learning_rate": 1.6021898536730546e-05, + "loss": 0.6147, + "step": 8501 + }, + { + "epoch": 0.29, + "learning_rate": 1.602102920266296e-05, + "loss": 0.6626, + "step": 8502 + }, + { + "epoch": 0.29, + "learning_rate": 1.6020159797208457e-05, + "loss": 0.6421, + "step": 8503 + }, + { + "epoch": 0.29, + "learning_rate": 1.6019290320377344e-05, + "loss": 0.6215, + "step": 8504 + }, + { + "epoch": 0.29, + "learning_rate": 1.6018420772179928e-05, + "loss": 0.6444, + "step": 8505 + }, + { + "epoch": 0.29, + "learning_rate": 1.601755115262652e-05, + "loss": 0.6452, + "step": 8506 + }, + { + "epoch": 0.29, + "learning_rate": 1.6016681461727434e-05, + "loss": 0.6855, + "step": 8507 + }, + { + "epoch": 0.29, + "learning_rate": 1.6015811699492974e-05, + "loss": 0.6099, + "step": 8508 + }, + { + "epoch": 0.29, + "learning_rate": 1.601494186593346e-05, + "loss": 0.6086, + "step": 8509 + }, + { + "epoch": 0.29, + "learning_rate": 1.60140719610592e-05, + "loss": 0.6399, + "step": 8510 + }, + { + "epoch": 0.29, + "learning_rate": 1.601320198488051e-05, + "loss": 0.618, + "step": 8511 + }, + { + "epoch": 0.29, + "learning_rate": 1.60123319374077e-05, + "loss": 0.6569, + "step": 8512 + }, + { + "epoch": 0.29, + "learning_rate": 1.6011461818651093e-05, + "loss": 0.6306, + "step": 8513 + }, + { + "epoch": 0.29, + "learning_rate": 1.6010591628621003e-05, + "loss": 0.6703, + "step": 8514 + }, + { + "epoch": 0.3, + "learning_rate": 1.600972136732774e-05, + "loss": 0.6712, + "step": 8515 + }, + { + "epoch": 0.3, + "learning_rate": 1.600885103478163e-05, + "loss": 0.5944, + "step": 8516 + }, + { + "epoch": 0.3, + "learning_rate": 1.6007980630992995e-05, + "loss": 0.5941, + "step": 8517 + }, + { + "epoch": 0.3, + "learning_rate": 1.6007110155972144e-05, + "loss": 0.6588, + "step": 8518 + }, + { + "epoch": 0.3, + "learning_rate": 1.6006239609729402e-05, + "loss": 0.6818, + "step": 8519 + }, + { + "epoch": 0.3, + "learning_rate": 1.6005368992275093e-05, + "loss": 0.6255, + "step": 8520 + }, + { + "epoch": 0.3, + "learning_rate": 1.600449830361954e-05, + "loss": 0.6112, + "step": 8521 + }, + { + "epoch": 0.3, + "learning_rate": 1.6003627543773062e-05, + "loss": 0.6146, + "step": 8522 + }, + { + "epoch": 0.3, + "learning_rate": 1.6002756712745985e-05, + "loss": 0.6184, + "step": 8523 + }, + { + "epoch": 0.3, + "learning_rate": 1.6001885810548635e-05, + "loss": 0.6405, + "step": 8524 + }, + { + "epoch": 0.3, + "learning_rate": 1.6001014837191336e-05, + "loss": 0.5897, + "step": 8525 + }, + { + "epoch": 0.3, + "learning_rate": 1.6000143792684414e-05, + "loss": 0.6467, + "step": 8526 + }, + { + "epoch": 0.3, + "learning_rate": 1.5999272677038196e-05, + "loss": 0.6132, + "step": 8527 + }, + { + "epoch": 0.3, + "learning_rate": 1.599840149026301e-05, + "loss": 0.6617, + "step": 8528 + }, + { + "epoch": 0.3, + "learning_rate": 1.599753023236919e-05, + "loss": 0.6143, + "step": 8529 + }, + { + "epoch": 0.3, + "learning_rate": 1.5996658903367063e-05, + "loss": 0.6864, + "step": 8530 + }, + { + "epoch": 0.3, + "learning_rate": 1.5995787503266958e-05, + "loss": 0.63, + "step": 8531 + }, + { + "epoch": 0.3, + "learning_rate": 1.5994916032079203e-05, + "loss": 0.6505, + "step": 8532 + }, + { + "epoch": 0.3, + "learning_rate": 1.599404448981414e-05, + "loss": 0.623, + "step": 8533 + }, + { + "epoch": 0.3, + "learning_rate": 1.5993172876482095e-05, + "loss": 0.6317, + "step": 8534 + }, + { + "epoch": 0.3, + "learning_rate": 1.5992301192093403e-05, + "loss": 0.6146, + "step": 8535 + }, + { + "epoch": 0.3, + "learning_rate": 1.59914294366584e-05, + "loss": 0.582, + "step": 8536 + }, + { + "epoch": 0.3, + "learning_rate": 1.5990557610187426e-05, + "loss": 0.6596, + "step": 8537 + }, + { + "epoch": 0.3, + "learning_rate": 1.598968571269081e-05, + "loss": 0.6601, + "step": 8538 + }, + { + "epoch": 0.3, + "learning_rate": 1.5988813744178893e-05, + "loss": 0.5259, + "step": 8539 + }, + { + "epoch": 0.3, + "learning_rate": 1.598794170466201e-05, + "loss": 0.6102, + "step": 8540 + }, + { + "epoch": 0.3, + "learning_rate": 1.5987069594150512e-05, + "loss": 0.6778, + "step": 8541 + }, + { + "epoch": 0.3, + "learning_rate": 1.5986197412654724e-05, + "loss": 0.6166, + "step": 8542 + }, + { + "epoch": 0.3, + "learning_rate": 1.5985325160184995e-05, + "loss": 0.632, + "step": 8543 + }, + { + "epoch": 0.3, + "learning_rate": 1.5984452836751666e-05, + "loss": 0.5737, + "step": 8544 + }, + { + "epoch": 0.3, + "learning_rate": 1.5983580442365077e-05, + "loss": 0.6429, + "step": 8545 + }, + { + "epoch": 0.3, + "learning_rate": 1.598270797703557e-05, + "loss": 0.5876, + "step": 8546 + }, + { + "epoch": 0.3, + "learning_rate": 1.598183544077349e-05, + "loss": 0.6827, + "step": 8547 + }, + { + "epoch": 0.3, + "learning_rate": 1.598096283358919e-05, + "loss": 0.6173, + "step": 8548 + }, + { + "epoch": 0.3, + "learning_rate": 1.5980090155493005e-05, + "loss": 0.693, + "step": 8549 + }, + { + "epoch": 0.3, + "learning_rate": 1.597921740649529e-05, + "loss": 0.6117, + "step": 8550 + }, + { + "epoch": 0.3, + "learning_rate": 1.597834458660639e-05, + "loss": 0.6648, + "step": 8551 + }, + { + "epoch": 0.3, + "learning_rate": 1.5977471695836646e-05, + "loss": 0.6623, + "step": 8552 + }, + { + "epoch": 0.3, + "learning_rate": 1.597659873419642e-05, + "loss": 0.6843, + "step": 8553 + }, + { + "epoch": 0.3, + "learning_rate": 1.5975725701696055e-05, + "loss": 0.6097, + "step": 8554 + }, + { + "epoch": 0.3, + "learning_rate": 1.5974852598345897e-05, + "loss": 0.6347, + "step": 8555 + }, + { + "epoch": 0.3, + "learning_rate": 1.5973979424156304e-05, + "loss": 0.6365, + "step": 8556 + }, + { + "epoch": 0.3, + "learning_rate": 1.5973106179137634e-05, + "loss": 0.6571, + "step": 8557 + }, + { + "epoch": 0.3, + "learning_rate": 1.597223286330023e-05, + "loss": 0.6471, + "step": 8558 + }, + { + "epoch": 0.3, + "learning_rate": 1.597135947665445e-05, + "loss": 0.6337, + "step": 8559 + }, + { + "epoch": 0.3, + "learning_rate": 1.597048601921065e-05, + "loss": 0.6187, + "step": 8560 + }, + { + "epoch": 0.3, + "learning_rate": 1.596961249097919e-05, + "loss": 0.5679, + "step": 8561 + }, + { + "epoch": 0.3, + "learning_rate": 1.5968738891970416e-05, + "loss": 0.6155, + "step": 8562 + }, + { + "epoch": 0.3, + "learning_rate": 1.5967865222194693e-05, + "loss": 0.5902, + "step": 8563 + }, + { + "epoch": 0.3, + "learning_rate": 1.596699148166238e-05, + "loss": 0.6357, + "step": 8564 + }, + { + "epoch": 0.3, + "learning_rate": 1.5966117670383832e-05, + "loss": 0.6512, + "step": 8565 + }, + { + "epoch": 0.3, + "learning_rate": 1.596524378836942e-05, + "loss": 0.5978, + "step": 8566 + }, + { + "epoch": 0.3, + "learning_rate": 1.5964369835629486e-05, + "loss": 0.6965, + "step": 8567 + }, + { + "epoch": 0.3, + "learning_rate": 1.596349581217441e-05, + "loss": 0.5754, + "step": 8568 + }, + { + "epoch": 0.3, + "learning_rate": 1.5962621718014545e-05, + "loss": 0.683, + "step": 8569 + }, + { + "epoch": 0.3, + "learning_rate": 1.5961747553160255e-05, + "loss": 0.5958, + "step": 8570 + }, + { + "epoch": 0.3, + "learning_rate": 1.596087331762191e-05, + "loss": 0.6585, + "step": 8571 + }, + { + "epoch": 0.3, + "learning_rate": 1.595999901140987e-05, + "loss": 0.6791, + "step": 8572 + }, + { + "epoch": 0.3, + "learning_rate": 1.59591246345345e-05, + "loss": 0.6666, + "step": 8573 + }, + { + "epoch": 0.3, + "learning_rate": 1.595825018700617e-05, + "loss": 0.6281, + "step": 8574 + }, + { + "epoch": 0.3, + "learning_rate": 1.595737566883525e-05, + "loss": 0.6231, + "step": 8575 + }, + { + "epoch": 0.3, + "learning_rate": 1.59565010800321e-05, + "loss": 0.646, + "step": 8576 + }, + { + "epoch": 0.3, + "learning_rate": 1.5955626420607096e-05, + "loss": 0.6236, + "step": 8577 + }, + { + "epoch": 0.3, + "learning_rate": 1.595475169057061e-05, + "loss": 0.6115, + "step": 8578 + }, + { + "epoch": 0.3, + "learning_rate": 1.595387688993301e-05, + "loss": 0.6647, + "step": 8579 + }, + { + "epoch": 0.3, + "learning_rate": 1.5953002018704666e-05, + "loss": 0.6317, + "step": 8580 + }, + { + "epoch": 0.3, + "learning_rate": 1.595212707689595e-05, + "loss": 0.6766, + "step": 8581 + }, + { + "epoch": 0.3, + "learning_rate": 1.5951252064517242e-05, + "loss": 0.6041, + "step": 8582 + }, + { + "epoch": 0.3, + "learning_rate": 1.5950376981578913e-05, + "loss": 0.6954, + "step": 8583 + }, + { + "epoch": 0.3, + "learning_rate": 1.5949501828091335e-05, + "loss": 0.6139, + "step": 8584 + }, + { + "epoch": 0.3, + "learning_rate": 1.5948626604064887e-05, + "loss": 0.613, + "step": 8585 + }, + { + "epoch": 0.3, + "learning_rate": 1.5947751309509945e-05, + "loss": 0.6989, + "step": 8586 + }, + { + "epoch": 0.3, + "learning_rate": 1.5946875944436887e-05, + "loss": 0.5928, + "step": 8587 + }, + { + "epoch": 0.3, + "learning_rate": 1.5946000508856093e-05, + "loss": 0.6554, + "step": 8588 + }, + { + "epoch": 0.3, + "learning_rate": 1.5945125002777942e-05, + "loss": 0.6468, + "step": 8589 + }, + { + "epoch": 0.3, + "learning_rate": 1.5944249426212813e-05, + "loss": 0.6109, + "step": 8590 + }, + { + "epoch": 0.3, + "learning_rate": 1.5943373779171087e-05, + "loss": 0.5914, + "step": 8591 + }, + { + "epoch": 0.3, + "learning_rate": 1.5942498061663148e-05, + "loss": 0.6252, + "step": 8592 + }, + { + "epoch": 0.3, + "learning_rate": 1.5941622273699375e-05, + "loss": 0.619, + "step": 8593 + }, + { + "epoch": 0.3, + "learning_rate": 1.5940746415290155e-05, + "loss": 0.6376, + "step": 8594 + }, + { + "epoch": 0.3, + "learning_rate": 1.593987048644587e-05, + "loss": 0.6099, + "step": 8595 + }, + { + "epoch": 0.3, + "learning_rate": 1.5938994487176906e-05, + "loss": 0.594, + "step": 8596 + }, + { + "epoch": 0.3, + "learning_rate": 1.593811841749365e-05, + "loss": 0.6313, + "step": 8597 + }, + { + "epoch": 0.3, + "learning_rate": 1.593724227740649e-05, + "loss": 0.5589, + "step": 8598 + }, + { + "epoch": 0.3, + "learning_rate": 1.593636606692581e-05, + "loss": 0.6197, + "step": 8599 + }, + { + "epoch": 0.3, + "learning_rate": 1.5935489786062005e-05, + "loss": 0.6529, + "step": 8600 + }, + { + "epoch": 0.3, + "learning_rate": 1.5934613434825455e-05, + "loss": 0.617, + "step": 8601 + }, + { + "epoch": 0.3, + "learning_rate": 1.593373701322656e-05, + "loss": 0.6696, + "step": 8602 + }, + { + "epoch": 0.3, + "learning_rate": 1.59328605212757e-05, + "loss": 0.607, + "step": 8603 + }, + { + "epoch": 0.3, + "learning_rate": 1.5931983958983275e-05, + "loss": 0.698, + "step": 8604 + }, + { + "epoch": 0.3, + "learning_rate": 1.5931107326359684e-05, + "loss": 0.6519, + "step": 8605 + }, + { + "epoch": 0.3, + "learning_rate": 1.5930230623415305e-05, + "loss": 0.6118, + "step": 8606 + }, + { + "epoch": 0.3, + "learning_rate": 1.5929353850160544e-05, + "loss": 0.6438, + "step": 8607 + }, + { + "epoch": 0.3, + "learning_rate": 1.592847700660579e-05, + "loss": 0.6106, + "step": 8608 + }, + { + "epoch": 0.3, + "learning_rate": 1.592760009276144e-05, + "loss": 0.6024, + "step": 8609 + }, + { + "epoch": 0.3, + "learning_rate": 1.5926723108637895e-05, + "loss": 0.6005, + "step": 8610 + }, + { + "epoch": 0.3, + "learning_rate": 1.592584605424555e-05, + "loss": 0.7332, + "step": 8611 + }, + { + "epoch": 0.3, + "learning_rate": 1.5924968929594804e-05, + "loss": 0.6257, + "step": 8612 + }, + { + "epoch": 0.3, + "learning_rate": 1.5924091734696057e-05, + "loss": 0.6208, + "step": 8613 + }, + { + "epoch": 0.3, + "learning_rate": 1.5923214469559706e-05, + "loss": 0.6376, + "step": 8614 + }, + { + "epoch": 0.3, + "learning_rate": 1.5922337134196158e-05, + "loss": 0.6303, + "step": 8615 + }, + { + "epoch": 0.3, + "learning_rate": 1.5921459728615808e-05, + "loss": 0.6366, + "step": 8616 + }, + { + "epoch": 0.3, + "learning_rate": 1.5920582252829064e-05, + "loss": 0.6524, + "step": 8617 + }, + { + "epoch": 0.3, + "learning_rate": 1.591970470684633e-05, + "loss": 0.643, + "step": 8618 + }, + { + "epoch": 0.3, + "learning_rate": 1.5918827090678006e-05, + "loss": 0.6509, + "step": 8619 + }, + { + "epoch": 0.3, + "learning_rate": 1.5917949404334497e-05, + "loss": 0.5954, + "step": 8620 + }, + { + "epoch": 0.3, + "learning_rate": 1.5917071647826215e-05, + "loss": 0.5931, + "step": 8621 + }, + { + "epoch": 0.3, + "learning_rate": 1.591619382116356e-05, + "loss": 0.6175, + "step": 8622 + }, + { + "epoch": 0.3, + "learning_rate": 1.5915315924356946e-05, + "loss": 0.6329, + "step": 8623 + }, + { + "epoch": 0.3, + "learning_rate": 1.591443795741678e-05, + "loss": 0.6298, + "step": 8624 + }, + { + "epoch": 0.3, + "learning_rate": 1.591355992035347e-05, + "loss": 0.6398, + "step": 8625 + }, + { + "epoch": 0.3, + "learning_rate": 1.5912681813177422e-05, + "loss": 0.6196, + "step": 8626 + }, + { + "epoch": 0.3, + "learning_rate": 1.5911803635899056e-05, + "loss": 0.6198, + "step": 8627 + }, + { + "epoch": 0.3, + "learning_rate": 1.5910925388528777e-05, + "loss": 0.615, + "step": 8628 + }, + { + "epoch": 0.3, + "learning_rate": 1.5910047071076998e-05, + "loss": 0.6401, + "step": 8629 + }, + { + "epoch": 0.3, + "learning_rate": 1.590916868355414e-05, + "loss": 0.613, + "step": 8630 + }, + { + "epoch": 0.3, + "learning_rate": 1.590829022597061e-05, + "loss": 0.5991, + "step": 8631 + }, + { + "epoch": 0.3, + "learning_rate": 1.5907411698336828e-05, + "loss": 0.6193, + "step": 8632 + }, + { + "epoch": 0.3, + "learning_rate": 1.5906533100663203e-05, + "loss": 0.6428, + "step": 8633 + }, + { + "epoch": 0.3, + "learning_rate": 1.590565443296016e-05, + "loss": 0.5701, + "step": 8634 + }, + { + "epoch": 0.3, + "learning_rate": 1.590477569523811e-05, + "loss": 0.6651, + "step": 8635 + }, + { + "epoch": 0.3, + "learning_rate": 1.5903896887507476e-05, + "loss": 0.6232, + "step": 8636 + }, + { + "epoch": 0.3, + "learning_rate": 1.5903018009778676e-05, + "loss": 0.5938, + "step": 8637 + }, + { + "epoch": 0.3, + "learning_rate": 1.5902139062062126e-05, + "loss": 0.6866, + "step": 8638 + }, + { + "epoch": 0.3, + "learning_rate": 1.5901260044368257e-05, + "loss": 0.6288, + "step": 8639 + }, + { + "epoch": 0.3, + "learning_rate": 1.590038095670748e-05, + "loss": 0.6545, + "step": 8640 + }, + { + "epoch": 0.3, + "learning_rate": 1.589950179909023e-05, + "loss": 0.6483, + "step": 8641 + }, + { + "epoch": 0.3, + "learning_rate": 1.5898622571526917e-05, + "loss": 0.5837, + "step": 8642 + }, + { + "epoch": 0.3, + "learning_rate": 1.5897743274027972e-05, + "loss": 0.6561, + "step": 8643 + }, + { + "epoch": 0.3, + "learning_rate": 1.5896863906603825e-05, + "loss": 0.7057, + "step": 8644 + }, + { + "epoch": 0.3, + "learning_rate": 1.589598446926489e-05, + "loss": 0.6458, + "step": 8645 + }, + { + "epoch": 0.3, + "learning_rate": 1.5895104962021607e-05, + "loss": 0.6277, + "step": 8646 + }, + { + "epoch": 0.3, + "learning_rate": 1.589422538488439e-05, + "loss": 0.6143, + "step": 8647 + }, + { + "epoch": 0.3, + "learning_rate": 1.589334573786368e-05, + "loss": 0.5908, + "step": 8648 + }, + { + "epoch": 0.3, + "learning_rate": 1.58924660209699e-05, + "loss": 0.664, + "step": 8649 + }, + { + "epoch": 0.3, + "learning_rate": 1.5891586234213484e-05, + "loss": 0.6761, + "step": 8650 + }, + { + "epoch": 0.3, + "learning_rate": 1.5890706377604855e-05, + "loss": 0.6244, + "step": 8651 + }, + { + "epoch": 0.3, + "learning_rate": 1.5889826451154453e-05, + "loss": 0.6746, + "step": 8652 + }, + { + "epoch": 0.3, + "learning_rate": 1.5888946454872707e-05, + "loss": 0.6106, + "step": 8653 + }, + { + "epoch": 0.3, + "learning_rate": 1.5888066388770052e-05, + "loss": 0.63, + "step": 8654 + }, + { + "epoch": 0.3, + "learning_rate": 1.5887186252856924e-05, + "loss": 0.5461, + "step": 8655 + }, + { + "epoch": 0.3, + "learning_rate": 1.588630604714375e-05, + "loss": 0.6755, + "step": 8656 + }, + { + "epoch": 0.3, + "learning_rate": 1.5885425771640974e-05, + "loss": 0.6881, + "step": 8657 + }, + { + "epoch": 0.3, + "learning_rate": 1.588454542635903e-05, + "loss": 0.6613, + "step": 8658 + }, + { + "epoch": 0.3, + "learning_rate": 1.5883665011308357e-05, + "loss": 0.6069, + "step": 8659 + }, + { + "epoch": 0.3, + "learning_rate": 1.5882784526499393e-05, + "loss": 0.6373, + "step": 8660 + }, + { + "epoch": 0.3, + "learning_rate": 1.5881903971942574e-05, + "loss": 0.652, + "step": 8661 + }, + { + "epoch": 0.3, + "learning_rate": 1.5881023347648348e-05, + "loss": 0.6753, + "step": 8662 + }, + { + "epoch": 0.3, + "learning_rate": 1.588014265362715e-05, + "loss": 0.7159, + "step": 8663 + }, + { + "epoch": 0.3, + "learning_rate": 1.587926188988942e-05, + "loss": 0.6025, + "step": 8664 + }, + { + "epoch": 0.3, + "learning_rate": 1.58783810564456e-05, + "loss": 0.6146, + "step": 8665 + }, + { + "epoch": 0.3, + "learning_rate": 1.587750015330614e-05, + "loss": 0.6301, + "step": 8666 + }, + { + "epoch": 0.3, + "learning_rate": 1.587661918048148e-05, + "loss": 0.643, + "step": 8667 + }, + { + "epoch": 0.3, + "learning_rate": 1.5875738137982065e-05, + "loss": 0.6219, + "step": 8668 + }, + { + "epoch": 0.3, + "learning_rate": 1.5874857025818342e-05, + "loss": 0.6265, + "step": 8669 + }, + { + "epoch": 0.3, + "learning_rate": 1.5873975844000758e-05, + "loss": 0.6598, + "step": 8670 + }, + { + "epoch": 0.3, + "learning_rate": 1.5873094592539756e-05, + "loss": 0.6316, + "step": 8671 + }, + { + "epoch": 0.3, + "learning_rate": 1.5872213271445795e-05, + "loss": 0.6395, + "step": 8672 + }, + { + "epoch": 0.3, + "learning_rate": 1.5871331880729314e-05, + "loss": 0.629, + "step": 8673 + }, + { + "epoch": 0.3, + "learning_rate": 1.587045042040076e-05, + "loss": 0.6711, + "step": 8674 + }, + { + "epoch": 0.3, + "learning_rate": 1.58695688904706e-05, + "loss": 0.6624, + "step": 8675 + }, + { + "epoch": 0.3, + "learning_rate": 1.586868729094927e-05, + "loss": 0.6413, + "step": 8676 + }, + { + "epoch": 0.3, + "learning_rate": 1.586780562184723e-05, + "loss": 0.6206, + "step": 8677 + }, + { + "epoch": 0.3, + "learning_rate": 1.586692388317493e-05, + "loss": 0.6452, + "step": 8678 + }, + { + "epoch": 0.3, + "learning_rate": 1.5866042074942827e-05, + "loss": 0.5941, + "step": 8679 + }, + { + "epoch": 0.3, + "learning_rate": 1.5865160197161378e-05, + "loss": 0.6719, + "step": 8680 + }, + { + "epoch": 0.3, + "learning_rate": 1.586427824984103e-05, + "loss": 0.6269, + "step": 8681 + }, + { + "epoch": 0.3, + "learning_rate": 1.5863396232992245e-05, + "loss": 0.6844, + "step": 8682 + }, + { + "epoch": 0.3, + "learning_rate": 1.5862514146625483e-05, + "loss": 0.6197, + "step": 8683 + }, + { + "epoch": 0.3, + "learning_rate": 1.58616319907512e-05, + "loss": 0.6275, + "step": 8684 + }, + { + "epoch": 0.3, + "learning_rate": 1.586074976537985e-05, + "loss": 0.6116, + "step": 8685 + }, + { + "epoch": 0.3, + "learning_rate": 1.5859867470521906e-05, + "loss": 0.6438, + "step": 8686 + }, + { + "epoch": 0.3, + "learning_rate": 1.5858985106187815e-05, + "loss": 0.636, + "step": 8687 + }, + { + "epoch": 0.3, + "learning_rate": 1.5858102672388044e-05, + "loss": 0.617, + "step": 8688 + }, + { + "epoch": 0.3, + "learning_rate": 1.5857220169133055e-05, + "loss": 0.6658, + "step": 8689 + }, + { + "epoch": 0.3, + "learning_rate": 1.5856337596433314e-05, + "loss": 0.6577, + "step": 8690 + }, + { + "epoch": 0.3, + "learning_rate": 1.585545495429928e-05, + "loss": 0.6874, + "step": 8691 + }, + { + "epoch": 0.3, + "learning_rate": 1.5854572242741424e-05, + "loss": 0.6086, + "step": 8692 + }, + { + "epoch": 0.3, + "learning_rate": 1.5853689461770206e-05, + "loss": 0.642, + "step": 8693 + }, + { + "epoch": 0.3, + "learning_rate": 1.585280661139609e-05, + "loss": 0.5947, + "step": 8694 + }, + { + "epoch": 0.3, + "learning_rate": 1.5851923691629553e-05, + "loss": 0.691, + "step": 8695 + }, + { + "epoch": 0.3, + "learning_rate": 1.5851040702481056e-05, + "loss": 0.6144, + "step": 8696 + }, + { + "epoch": 0.3, + "learning_rate": 1.585015764396107e-05, + "loss": 0.6448, + "step": 8697 + }, + { + "epoch": 0.3, + "learning_rate": 1.5849274516080068e-05, + "loss": 0.636, + "step": 8698 + }, + { + "epoch": 0.3, + "learning_rate": 1.584839131884851e-05, + "loss": 0.5914, + "step": 8699 + }, + { + "epoch": 0.3, + "learning_rate": 1.5847508052276884e-05, + "loss": 0.609, + "step": 8700 + }, + { + "epoch": 0.3, + "learning_rate": 1.5846624716375646e-05, + "loss": 0.6179, + "step": 8701 + }, + { + "epoch": 0.3, + "learning_rate": 1.5845741311155278e-05, + "loss": 0.638, + "step": 8702 + }, + { + "epoch": 0.3, + "learning_rate": 1.584485783662625e-05, + "loss": 0.6384, + "step": 8703 + }, + { + "epoch": 0.3, + "learning_rate": 1.584397429279904e-05, + "loss": 0.5932, + "step": 8704 + }, + { + "epoch": 0.3, + "learning_rate": 1.5843090679684123e-05, + "loss": 0.5766, + "step": 8705 + }, + { + "epoch": 0.3, + "learning_rate": 1.5842206997291976e-05, + "loss": 0.6848, + "step": 8706 + }, + { + "epoch": 0.3, + "learning_rate": 1.584132324563307e-05, + "loss": 0.5924, + "step": 8707 + }, + { + "epoch": 0.3, + "learning_rate": 1.584043942471789e-05, + "loss": 0.6284, + "step": 8708 + }, + { + "epoch": 0.3, + "learning_rate": 1.5839555534556913e-05, + "loss": 0.6147, + "step": 8709 + }, + { + "epoch": 0.3, + "learning_rate": 1.5838671575160618e-05, + "loss": 0.5985, + "step": 8710 + }, + { + "epoch": 0.3, + "learning_rate": 1.5837787546539485e-05, + "loss": 0.6344, + "step": 8711 + }, + { + "epoch": 0.3, + "learning_rate": 1.5836903448703997e-05, + "loss": 0.619, + "step": 8712 + }, + { + "epoch": 0.3, + "learning_rate": 1.5836019281664632e-05, + "loss": 0.6738, + "step": 8713 + }, + { + "epoch": 0.3, + "learning_rate": 1.583513504543188e-05, + "loss": 0.6401, + "step": 8714 + }, + { + "epoch": 0.3, + "learning_rate": 1.5834250740016215e-05, + "loss": 0.6963, + "step": 8715 + }, + { + "epoch": 0.3, + "learning_rate": 1.583336636542813e-05, + "loss": 0.6185, + "step": 8716 + }, + { + "epoch": 0.3, + "learning_rate": 1.5832481921678108e-05, + "loss": 0.5791, + "step": 8717 + }, + { + "epoch": 0.3, + "learning_rate": 1.5831597408776634e-05, + "loss": 0.6872, + "step": 8718 + }, + { + "epoch": 0.3, + "learning_rate": 1.5830712826734193e-05, + "loss": 0.6593, + "step": 8719 + }, + { + "epoch": 0.3, + "learning_rate": 1.5829828175561282e-05, + "loss": 0.668, + "step": 8720 + }, + { + "epoch": 0.3, + "learning_rate": 1.582894345526838e-05, + "loss": 0.7414, + "step": 8721 + }, + { + "epoch": 0.3, + "learning_rate": 1.5828058665865976e-05, + "loss": 0.6154, + "step": 8722 + }, + { + "epoch": 0.3, + "learning_rate": 1.5827173807364567e-05, + "loss": 0.6456, + "step": 8723 + }, + { + "epoch": 0.3, + "learning_rate": 1.5826288879774645e-05, + "loss": 0.6198, + "step": 8724 + }, + { + "epoch": 0.3, + "learning_rate": 1.5825403883106692e-05, + "loss": 0.6948, + "step": 8725 + }, + { + "epoch": 0.3, + "learning_rate": 1.5824518817371212e-05, + "loss": 0.6138, + "step": 8726 + }, + { + "epoch": 0.3, + "learning_rate": 1.582363368257869e-05, + "loss": 0.5739, + "step": 8727 + }, + { + "epoch": 0.3, + "learning_rate": 1.582274847873962e-05, + "loss": 0.5841, + "step": 8728 + }, + { + "epoch": 0.3, + "learning_rate": 1.582186320586451e-05, + "loss": 0.5634, + "step": 8729 + }, + { + "epoch": 0.3, + "learning_rate": 1.5820977863963842e-05, + "loss": 0.587, + "step": 8730 + }, + { + "epoch": 0.3, + "learning_rate": 1.582009245304812e-05, + "loss": 0.6274, + "step": 8731 + }, + { + "epoch": 0.3, + "learning_rate": 1.5819206973127837e-05, + "loss": 0.6916, + "step": 8732 + }, + { + "epoch": 0.3, + "learning_rate": 1.5818321424213495e-05, + "loss": 0.6705, + "step": 8733 + }, + { + "epoch": 0.3, + "learning_rate": 1.5817435806315593e-05, + "loss": 0.5973, + "step": 8734 + }, + { + "epoch": 0.3, + "learning_rate": 1.581655011944463e-05, + "loss": 0.5865, + "step": 8735 + }, + { + "epoch": 0.3, + "learning_rate": 1.5815664363611105e-05, + "loss": 0.6643, + "step": 8736 + }, + { + "epoch": 0.3, + "learning_rate": 1.5814778538825525e-05, + "loss": 0.6083, + "step": 8737 + }, + { + "epoch": 0.3, + "learning_rate": 1.5813892645098388e-05, + "loss": 0.6288, + "step": 8738 + }, + { + "epoch": 0.3, + "learning_rate": 1.58130066824402e-05, + "loss": 0.5992, + "step": 8739 + }, + { + "epoch": 0.3, + "learning_rate": 1.5812120650861464e-05, + "loss": 0.6888, + "step": 8740 + }, + { + "epoch": 0.3, + "learning_rate": 1.5811234550372683e-05, + "loss": 0.646, + "step": 8741 + }, + { + "epoch": 0.3, + "learning_rate": 1.581034838098437e-05, + "loss": 0.6387, + "step": 8742 + }, + { + "epoch": 0.3, + "learning_rate": 1.5809462142707024e-05, + "loss": 0.5663, + "step": 8743 + }, + { + "epoch": 0.3, + "learning_rate": 1.5808575835551153e-05, + "loss": 0.6733, + "step": 8744 + }, + { + "epoch": 0.3, + "learning_rate": 1.5807689459527274e-05, + "loss": 0.6237, + "step": 8745 + }, + { + "epoch": 0.3, + "learning_rate": 1.5806803014645885e-05, + "loss": 0.6311, + "step": 8746 + }, + { + "epoch": 0.3, + "learning_rate": 1.58059165009175e-05, + "loss": 0.5718, + "step": 8747 + }, + { + "epoch": 0.3, + "learning_rate": 1.580502991835263e-05, + "loss": 0.6615, + "step": 8748 + }, + { + "epoch": 0.3, + "learning_rate": 1.580414326696179e-05, + "loss": 0.6613, + "step": 8749 + }, + { + "epoch": 0.3, + "learning_rate": 1.5803256546755486e-05, + "loss": 0.5902, + "step": 8750 + }, + { + "epoch": 0.3, + "learning_rate": 1.580236975774424e-05, + "loss": 0.5513, + "step": 8751 + }, + { + "epoch": 0.3, + "learning_rate": 1.5801482899938556e-05, + "loss": 0.6556, + "step": 8752 + }, + { + "epoch": 0.3, + "learning_rate": 1.5800595973348954e-05, + "loss": 0.6468, + "step": 8753 + }, + { + "epoch": 0.3, + "learning_rate": 1.579970897798595e-05, + "loss": 0.6156, + "step": 8754 + }, + { + "epoch": 0.3, + "learning_rate": 1.5798821913860058e-05, + "loss": 0.6162, + "step": 8755 + }, + { + "epoch": 0.3, + "learning_rate": 1.57979347809818e-05, + "loss": 0.6559, + "step": 8756 + }, + { + "epoch": 0.3, + "learning_rate": 1.5797047579361686e-05, + "loss": 0.6418, + "step": 8757 + }, + { + "epoch": 0.3, + "learning_rate": 1.5796160309010244e-05, + "loss": 0.6323, + "step": 8758 + }, + { + "epoch": 0.3, + "learning_rate": 1.5795272969937985e-05, + "loss": 0.6762, + "step": 8759 + }, + { + "epoch": 0.3, + "learning_rate": 1.5794385562155436e-05, + "loss": 0.604, + "step": 8760 + }, + { + "epoch": 0.3, + "learning_rate": 1.5793498085673115e-05, + "loss": 0.6536, + "step": 8761 + }, + { + "epoch": 0.3, + "learning_rate": 1.579261054050155e-05, + "loss": 0.6435, + "step": 8762 + }, + { + "epoch": 0.3, + "learning_rate": 1.5791722926651253e-05, + "loss": 0.6369, + "step": 8763 + }, + { + "epoch": 0.3, + "learning_rate": 1.5790835244132758e-05, + "loss": 0.6605, + "step": 8764 + }, + { + "epoch": 0.3, + "learning_rate": 1.578994749295659e-05, + "loss": 0.6888, + "step": 8765 + }, + { + "epoch": 0.3, + "learning_rate": 1.578905967313326e-05, + "loss": 0.6403, + "step": 8766 + }, + { + "epoch": 0.3, + "learning_rate": 1.578817178467331e-05, + "loss": 0.6039, + "step": 8767 + }, + { + "epoch": 0.3, + "learning_rate": 1.578728382758726e-05, + "loss": 0.677, + "step": 8768 + }, + { + "epoch": 0.3, + "learning_rate": 1.578639580188564e-05, + "loss": 0.6724, + "step": 8769 + }, + { + "epoch": 0.3, + "learning_rate": 1.578550770757898e-05, + "loss": 0.6353, + "step": 8770 + }, + { + "epoch": 0.3, + "learning_rate": 1.5784619544677804e-05, + "loss": 0.691, + "step": 8771 + }, + { + "epoch": 0.3, + "learning_rate": 1.5783731313192646e-05, + "loss": 0.6791, + "step": 8772 + }, + { + "epoch": 0.3, + "learning_rate": 1.578284301313404e-05, + "loss": 0.6295, + "step": 8773 + }, + { + "epoch": 0.3, + "learning_rate": 1.5781954644512513e-05, + "loss": 0.6811, + "step": 8774 + }, + { + "epoch": 0.3, + "learning_rate": 1.57810662073386e-05, + "loss": 0.6333, + "step": 8775 + }, + { + "epoch": 0.3, + "learning_rate": 1.578017770162283e-05, + "loss": 0.6775, + "step": 8776 + }, + { + "epoch": 0.3, + "learning_rate": 1.5779289127375744e-05, + "loss": 0.6088, + "step": 8777 + }, + { + "epoch": 0.3, + "learning_rate": 1.5778400484607876e-05, + "loss": 0.68, + "step": 8778 + }, + { + "epoch": 0.3, + "learning_rate": 1.577751177332976e-05, + "loss": 0.6197, + "step": 8779 + }, + { + "epoch": 0.3, + "learning_rate": 1.5776622993551935e-05, + "loss": 0.619, + "step": 8780 + }, + { + "epoch": 0.3, + "learning_rate": 1.5775734145284933e-05, + "loss": 0.5962, + "step": 8781 + }, + { + "epoch": 0.3, + "learning_rate": 1.5774845228539298e-05, + "loss": 0.628, + "step": 8782 + }, + { + "epoch": 0.3, + "learning_rate": 1.577395624332557e-05, + "loss": 0.6278, + "step": 8783 + }, + { + "epoch": 0.3, + "learning_rate": 1.577306718965428e-05, + "loss": 0.6022, + "step": 8784 + }, + { + "epoch": 0.3, + "learning_rate": 1.5772178067535984e-05, + "loss": 0.5669, + "step": 8785 + }, + { + "epoch": 0.3, + "learning_rate": 1.577128887698121e-05, + "loss": 0.6849, + "step": 8786 + }, + { + "epoch": 0.3, + "learning_rate": 1.5770399618000508e-05, + "loss": 0.6074, + "step": 8787 + }, + { + "epoch": 0.3, + "learning_rate": 1.5769510290604417e-05, + "loss": 0.6703, + "step": 8788 + }, + { + "epoch": 0.3, + "learning_rate": 1.5768620894803483e-05, + "loss": 0.5874, + "step": 8789 + }, + { + "epoch": 0.3, + "learning_rate": 1.5767731430608253e-05, + "loss": 0.6427, + "step": 8790 + }, + { + "epoch": 0.3, + "learning_rate": 1.576684189802927e-05, + "loss": 0.7125, + "step": 8791 + }, + { + "epoch": 0.3, + "learning_rate": 1.576595229707708e-05, + "loss": 0.6505, + "step": 8792 + }, + { + "epoch": 0.3, + "learning_rate": 1.576506262776223e-05, + "loss": 0.6272, + "step": 8793 + }, + { + "epoch": 0.3, + "learning_rate": 1.5764172890095273e-05, + "loss": 0.6346, + "step": 8794 + }, + { + "epoch": 0.3, + "learning_rate": 1.5763283084086755e-05, + "loss": 0.6675, + "step": 8795 + }, + { + "epoch": 0.3, + "learning_rate": 1.5762393209747226e-05, + "loss": 0.6318, + "step": 8796 + }, + { + "epoch": 0.3, + "learning_rate": 1.576150326708723e-05, + "loss": 0.6546, + "step": 8797 + }, + { + "epoch": 0.3, + "learning_rate": 1.576061325611733e-05, + "loss": 0.5844, + "step": 8798 + }, + { + "epoch": 0.3, + "learning_rate": 1.5759723176848073e-05, + "loss": 0.5911, + "step": 8799 + }, + { + "epoch": 0.3, + "learning_rate": 1.575883302929001e-05, + "loss": 0.6118, + "step": 8800 + }, + { + "epoch": 0.3, + "learning_rate": 1.5757942813453693e-05, + "loss": 0.6215, + "step": 8801 + }, + { + "epoch": 0.3, + "learning_rate": 1.5757052529349687e-05, + "loss": 0.6754, + "step": 8802 + }, + { + "epoch": 0.31, + "learning_rate": 1.5756162176988533e-05, + "loss": 0.6408, + "step": 8803 + }, + { + "epoch": 0.31, + "learning_rate": 1.57552717563808e-05, + "loss": 0.6272, + "step": 8804 + }, + { + "epoch": 0.31, + "learning_rate": 1.575438126753704e-05, + "loss": 0.6272, + "step": 8805 + }, + { + "epoch": 0.31, + "learning_rate": 1.5753490710467807e-05, + "loss": 0.6325, + "step": 8806 + }, + { + "epoch": 0.31, + "learning_rate": 1.5752600085183666e-05, + "loss": 0.6382, + "step": 8807 + }, + { + "epoch": 0.31, + "learning_rate": 1.5751709391695175e-05, + "loss": 0.6404, + "step": 8808 + }, + { + "epoch": 0.31, + "learning_rate": 1.5750818630012892e-05, + "loss": 0.6909, + "step": 8809 + }, + { + "epoch": 0.31, + "learning_rate": 1.574992780014738e-05, + "loss": 0.595, + "step": 8810 + }, + { + "epoch": 0.31, + "learning_rate": 1.57490369021092e-05, + "loss": 0.6623, + "step": 8811 + }, + { + "epoch": 0.31, + "learning_rate": 1.574814593590891e-05, + "loss": 0.6069, + "step": 8812 + }, + { + "epoch": 0.31, + "learning_rate": 1.5747254901557087e-05, + "loss": 0.6081, + "step": 8813 + }, + { + "epoch": 0.31, + "learning_rate": 1.574636379906428e-05, + "loss": 0.6867, + "step": 8814 + }, + { + "epoch": 0.31, + "learning_rate": 1.5745472628441066e-05, + "loss": 0.6511, + "step": 8815 + }, + { + "epoch": 0.31, + "learning_rate": 1.5744581389698005e-05, + "loss": 0.647, + "step": 8816 + }, + { + "epoch": 0.31, + "learning_rate": 1.5743690082845662e-05, + "loss": 0.6221, + "step": 8817 + }, + { + "epoch": 0.31, + "learning_rate": 1.5742798707894608e-05, + "loss": 0.6469, + "step": 8818 + }, + { + "epoch": 0.31, + "learning_rate": 1.574190726485541e-05, + "loss": 0.6167, + "step": 8819 + }, + { + "epoch": 0.31, + "learning_rate": 1.574101575373864e-05, + "loss": 0.6373, + "step": 8820 + }, + { + "epoch": 0.31, + "learning_rate": 1.5740124174554863e-05, + "loss": 0.6337, + "step": 8821 + }, + { + "epoch": 0.31, + "learning_rate": 1.5739232527314657e-05, + "loss": 0.5832, + "step": 8822 + }, + { + "epoch": 0.31, + "learning_rate": 1.5738340812028586e-05, + "loss": 0.6087, + "step": 8823 + }, + { + "epoch": 0.31, + "learning_rate": 1.5737449028707224e-05, + "loss": 0.6079, + "step": 8824 + }, + { + "epoch": 0.31, + "learning_rate": 1.573655717736115e-05, + "loss": 0.6545, + "step": 8825 + }, + { + "epoch": 0.31, + "learning_rate": 1.5735665258000933e-05, + "loss": 0.6502, + "step": 8826 + }, + { + "epoch": 0.31, + "learning_rate": 1.573477327063715e-05, + "loss": 0.601, + "step": 8827 + }, + { + "epoch": 0.31, + "learning_rate": 1.5733881215280373e-05, + "loss": 0.6633, + "step": 8828 + }, + { + "epoch": 0.31, + "learning_rate": 1.5732989091941178e-05, + "loss": 0.6072, + "step": 8829 + }, + { + "epoch": 0.31, + "learning_rate": 1.573209690063015e-05, + "loss": 0.6105, + "step": 8830 + }, + { + "epoch": 0.31, + "learning_rate": 1.5731204641357857e-05, + "loss": 0.6476, + "step": 8831 + }, + { + "epoch": 0.31, + "learning_rate": 1.5730312314134888e-05, + "loss": 0.6675, + "step": 8832 + }, + { + "epoch": 0.31, + "learning_rate": 1.5729419918971815e-05, + "loss": 0.6042, + "step": 8833 + }, + { + "epoch": 0.31, + "learning_rate": 1.5728527455879225e-05, + "loss": 0.6166, + "step": 8834 + }, + { + "epoch": 0.31, + "learning_rate": 1.572763492486769e-05, + "loss": 0.6422, + "step": 8835 + }, + { + "epoch": 0.31, + "learning_rate": 1.57267423259478e-05, + "loss": 0.5889, + "step": 8836 + }, + { + "epoch": 0.31, + "learning_rate": 1.572584965913013e-05, + "loss": 0.632, + "step": 8837 + }, + { + "epoch": 0.31, + "learning_rate": 1.572495692442528e-05, + "loss": 0.6383, + "step": 8838 + }, + { + "epoch": 0.31, + "learning_rate": 1.5724064121843815e-05, + "loss": 0.6455, + "step": 8839 + }, + { + "epoch": 0.31, + "learning_rate": 1.5723171251396332e-05, + "loss": 0.6279, + "step": 8840 + }, + { + "epoch": 0.31, + "learning_rate": 1.5722278313093413e-05, + "loss": 0.5854, + "step": 8841 + }, + { + "epoch": 0.31, + "learning_rate": 1.5721385306945645e-05, + "loss": 0.6143, + "step": 8842 + }, + { + "epoch": 0.31, + "learning_rate": 1.572049223296362e-05, + "loss": 0.6113, + "step": 8843 + }, + { + "epoch": 0.31, + "learning_rate": 1.571959909115792e-05, + "loss": 0.6469, + "step": 8844 + }, + { + "epoch": 0.31, + "learning_rate": 1.571870588153914e-05, + "loss": 0.5998, + "step": 8845 + }, + { + "epoch": 0.31, + "learning_rate": 1.5717812604117867e-05, + "loss": 0.6691, + "step": 8846 + }, + { + "epoch": 0.31, + "learning_rate": 1.571691925890469e-05, + "loss": 0.6825, + "step": 8847 + }, + { + "epoch": 0.31, + "learning_rate": 1.5716025845910207e-05, + "loss": 0.633, + "step": 8848 + }, + { + "epoch": 0.31, + "learning_rate": 1.5715132365145e-05, + "loss": 0.6573, + "step": 8849 + }, + { + "epoch": 0.31, + "learning_rate": 1.5714238816619677e-05, + "loss": 0.6178, + "step": 8850 + }, + { + "epoch": 0.31, + "learning_rate": 1.571334520034482e-05, + "loss": 0.6145, + "step": 8851 + }, + { + "epoch": 0.31, + "learning_rate": 1.571245151633103e-05, + "loss": 0.6371, + "step": 8852 + }, + { + "epoch": 0.31, + "learning_rate": 1.57115577645889e-05, + "loss": 0.6464, + "step": 8853 + }, + { + "epoch": 0.31, + "learning_rate": 1.5710663945129026e-05, + "loss": 0.6533, + "step": 8854 + }, + { + "epoch": 0.31, + "learning_rate": 1.5709770057962012e-05, + "loss": 0.6443, + "step": 8855 + }, + { + "epoch": 0.31, + "learning_rate": 1.5708876103098444e-05, + "loss": 0.6006, + "step": 8856 + }, + { + "epoch": 0.31, + "learning_rate": 1.5707982080548934e-05, + "loss": 0.5768, + "step": 8857 + }, + { + "epoch": 0.31, + "learning_rate": 1.5707087990324073e-05, + "loss": 0.5783, + "step": 8858 + }, + { + "epoch": 0.31, + "learning_rate": 1.5706193832434463e-05, + "loss": 0.6239, + "step": 8859 + }, + { + "epoch": 0.31, + "learning_rate": 1.5705299606890712e-05, + "loss": 0.7271, + "step": 8860 + }, + { + "epoch": 0.31, + "learning_rate": 1.570440531370341e-05, + "loss": 0.6131, + "step": 8861 + }, + { + "epoch": 0.31, + "learning_rate": 1.5703510952883172e-05, + "loss": 0.6724, + "step": 8862 + }, + { + "epoch": 0.31, + "learning_rate": 1.5702616524440596e-05, + "loss": 0.6381, + "step": 8863 + }, + { + "epoch": 0.31, + "learning_rate": 1.5701722028386286e-05, + "loss": 0.6803, + "step": 8864 + }, + { + "epoch": 0.31, + "learning_rate": 1.570082746473085e-05, + "loss": 0.6018, + "step": 8865 + }, + { + "epoch": 0.31, + "learning_rate": 1.569993283348489e-05, + "loss": 0.5792, + "step": 8866 + }, + { + "epoch": 0.31, + "learning_rate": 1.569903813465902e-05, + "loss": 0.6568, + "step": 8867 + }, + { + "epoch": 0.31, + "learning_rate": 1.569814336826384e-05, + "loss": 0.5923, + "step": 8868 + }, + { + "epoch": 0.31, + "learning_rate": 1.5697248534309963e-05, + "loss": 0.6365, + "step": 8869 + }, + { + "epoch": 0.31, + "learning_rate": 1.5696353632808e-05, + "loss": 0.6496, + "step": 8870 + }, + { + "epoch": 0.31, + "learning_rate": 1.5695458663768554e-05, + "loss": 0.644, + "step": 8871 + }, + { + "epoch": 0.31, + "learning_rate": 1.5694563627202245e-05, + "loss": 0.6524, + "step": 8872 + }, + { + "epoch": 0.31, + "learning_rate": 1.569366852311968e-05, + "loss": 0.6332, + "step": 8873 + }, + { + "epoch": 0.31, + "learning_rate": 1.569277335153147e-05, + "loss": 0.6805, + "step": 8874 + }, + { + "epoch": 0.31, + "learning_rate": 1.5691878112448233e-05, + "loss": 0.5999, + "step": 8875 + }, + { + "epoch": 0.31, + "learning_rate": 1.5690982805880577e-05, + "loss": 0.6708, + "step": 8876 + }, + { + "epoch": 0.31, + "learning_rate": 1.5690087431839126e-05, + "loss": 0.5845, + "step": 8877 + }, + { + "epoch": 0.31, + "learning_rate": 1.5689191990334487e-05, + "loss": 0.6219, + "step": 8878 + }, + { + "epoch": 0.31, + "learning_rate": 1.568829648137728e-05, + "loss": 0.6225, + "step": 8879 + }, + { + "epoch": 0.31, + "learning_rate": 1.5687400904978124e-05, + "loss": 0.5981, + "step": 8880 + }, + { + "epoch": 0.31, + "learning_rate": 1.5686505261147634e-05, + "loss": 0.6825, + "step": 8881 + }, + { + "epoch": 0.31, + "learning_rate": 1.568560954989643e-05, + "loss": 0.6751, + "step": 8882 + }, + { + "epoch": 0.31, + "learning_rate": 1.5684713771235135e-05, + "loss": 0.6208, + "step": 8883 + }, + { + "epoch": 0.31, + "learning_rate": 1.5683817925174366e-05, + "loss": 0.6593, + "step": 8884 + }, + { + "epoch": 0.31, + "learning_rate": 1.5682922011724747e-05, + "loss": 0.6601, + "step": 8885 + }, + { + "epoch": 0.31, + "learning_rate": 1.5682026030896897e-05, + "loss": 0.5804, + "step": 8886 + }, + { + "epoch": 0.31, + "learning_rate": 1.568112998270144e-05, + "loss": 0.6305, + "step": 8887 + }, + { + "epoch": 0.31, + "learning_rate": 1.5680233867149e-05, + "loss": 0.6878, + "step": 8888 + }, + { + "epoch": 0.31, + "learning_rate": 1.5679337684250205e-05, + "loss": 0.6912, + "step": 8889 + }, + { + "epoch": 0.31, + "learning_rate": 1.567844143401567e-05, + "loss": 0.6429, + "step": 8890 + }, + { + "epoch": 0.31, + "learning_rate": 1.5677545116456036e-05, + "loss": 0.6548, + "step": 8891 + }, + { + "epoch": 0.31, + "learning_rate": 1.5676648731581922e-05, + "loss": 0.6318, + "step": 8892 + }, + { + "epoch": 0.31, + "learning_rate": 1.5675752279403954e-05, + "loss": 0.6024, + "step": 8893 + }, + { + "epoch": 0.31, + "learning_rate": 1.5674855759932764e-05, + "loss": 0.6368, + "step": 8894 + }, + { + "epoch": 0.31, + "learning_rate": 1.567395917317898e-05, + "loss": 0.6384, + "step": 8895 + }, + { + "epoch": 0.31, + "learning_rate": 1.5673062519153233e-05, + "loss": 0.5812, + "step": 8896 + }, + { + "epoch": 0.31, + "learning_rate": 1.5672165797866154e-05, + "loss": 0.6393, + "step": 8897 + }, + { + "epoch": 0.31, + "learning_rate": 1.5671269009328373e-05, + "loss": 0.5753, + "step": 8898 + }, + { + "epoch": 0.31, + "learning_rate": 1.567037215355052e-05, + "loss": 0.5944, + "step": 8899 + }, + { + "epoch": 0.31, + "learning_rate": 1.566947523054324e-05, + "loss": 0.6254, + "step": 8900 + }, + { + "epoch": 0.31, + "learning_rate": 1.5668578240317153e-05, + "loss": 0.6614, + "step": 8901 + }, + { + "epoch": 0.31, + "learning_rate": 1.56676811828829e-05, + "loss": 0.6209, + "step": 8902 + }, + { + "epoch": 0.31, + "learning_rate": 1.566678405825112e-05, + "loss": 0.6352, + "step": 8903 + }, + { + "epoch": 0.31, + "learning_rate": 1.5665886866432445e-05, + "loss": 0.6514, + "step": 8904 + }, + { + "epoch": 0.31, + "learning_rate": 1.5664989607437515e-05, + "loss": 0.6315, + "step": 8905 + }, + { + "epoch": 0.31, + "learning_rate": 1.5664092281276964e-05, + "loss": 0.6231, + "step": 8906 + }, + { + "epoch": 0.31, + "learning_rate": 1.5663194887961437e-05, + "loss": 0.6118, + "step": 8907 + }, + { + "epoch": 0.31, + "learning_rate": 1.566229742750157e-05, + "loss": 0.6374, + "step": 8908 + }, + { + "epoch": 0.31, + "learning_rate": 1.5661399899908003e-05, + "loss": 0.6627, + "step": 8909 + }, + { + "epoch": 0.31, + "learning_rate": 1.566050230519138e-05, + "loss": 0.6455, + "step": 8910 + }, + { + "epoch": 0.31, + "learning_rate": 1.565960464336234e-05, + "loss": 0.5618, + "step": 8911 + }, + { + "epoch": 0.31, + "learning_rate": 1.565870691443153e-05, + "loss": 0.679, + "step": 8912 + }, + { + "epoch": 0.31, + "learning_rate": 1.565780911840959e-05, + "loss": 0.6177, + "step": 8913 + }, + { + "epoch": 0.31, + "learning_rate": 1.5656911255307164e-05, + "loss": 0.6907, + "step": 8914 + }, + { + "epoch": 0.31, + "learning_rate": 1.5656013325134897e-05, + "loss": 0.6334, + "step": 8915 + }, + { + "epoch": 0.31, + "learning_rate": 1.565511532790344e-05, + "loss": 0.6411, + "step": 8916 + }, + { + "epoch": 0.31, + "learning_rate": 1.565421726362344e-05, + "loss": 0.5995, + "step": 8917 + }, + { + "epoch": 0.31, + "learning_rate": 1.565331913230554e-05, + "loss": 0.6506, + "step": 8918 + }, + { + "epoch": 0.31, + "learning_rate": 1.5652420933960392e-05, + "loss": 0.633, + "step": 8919 + }, + { + "epoch": 0.31, + "learning_rate": 1.565152266859864e-05, + "loss": 0.6835, + "step": 8920 + }, + { + "epoch": 0.31, + "learning_rate": 1.5650624336230936e-05, + "loss": 0.6199, + "step": 8921 + }, + { + "epoch": 0.31, + "learning_rate": 1.5649725936867936e-05, + "loss": 0.6083, + "step": 8922 + }, + { + "epoch": 0.31, + "learning_rate": 1.5648827470520286e-05, + "loss": 0.5663, + "step": 8923 + }, + { + "epoch": 0.31, + "learning_rate": 1.5647928937198642e-05, + "loss": 0.5544, + "step": 8924 + }, + { + "epoch": 0.31, + "learning_rate": 1.5647030336913657e-05, + "loss": 0.6479, + "step": 8925 + }, + { + "epoch": 0.31, + "learning_rate": 1.5646131669675982e-05, + "loss": 0.6049, + "step": 8926 + }, + { + "epoch": 0.31, + "learning_rate": 1.5645232935496274e-05, + "loss": 0.6449, + "step": 8927 + }, + { + "epoch": 0.31, + "learning_rate": 1.5644334134385187e-05, + "loss": 0.6602, + "step": 8928 + }, + { + "epoch": 0.31, + "learning_rate": 1.564343526635338e-05, + "loss": 0.5799, + "step": 8929 + }, + { + "epoch": 0.31, + "learning_rate": 1.5642536331411507e-05, + "loss": 0.6002, + "step": 8930 + }, + { + "epoch": 0.31, + "learning_rate": 1.564163732957023e-05, + "loss": 0.5949, + "step": 8931 + }, + { + "epoch": 0.31, + "learning_rate": 1.5640738260840206e-05, + "loss": 0.6793, + "step": 8932 + }, + { + "epoch": 0.31, + "learning_rate": 1.5639839125232096e-05, + "loss": 0.5545, + "step": 8933 + }, + { + "epoch": 0.31, + "learning_rate": 1.5638939922756555e-05, + "loss": 0.6307, + "step": 8934 + }, + { + "epoch": 0.31, + "learning_rate": 1.563804065342425e-05, + "loss": 0.6568, + "step": 8935 + }, + { + "epoch": 0.31, + "learning_rate": 1.5637141317245838e-05, + "loss": 0.614, + "step": 8936 + }, + { + "epoch": 0.31, + "learning_rate": 1.5636241914231988e-05, + "loss": 0.6413, + "step": 8937 + }, + { + "epoch": 0.31, + "learning_rate": 1.563534244439336e-05, + "loss": 0.6472, + "step": 8938 + }, + { + "epoch": 0.31, + "learning_rate": 1.5634442907740617e-05, + "loss": 0.5852, + "step": 8939 + }, + { + "epoch": 0.31, + "learning_rate": 1.5633543304284426e-05, + "loss": 0.6204, + "step": 8940 + }, + { + "epoch": 0.31, + "learning_rate": 1.5632643634035455e-05, + "loss": 0.6374, + "step": 8941 + }, + { + "epoch": 0.31, + "learning_rate": 1.5631743897004367e-05, + "loss": 0.6492, + "step": 8942 + }, + { + "epoch": 0.31, + "learning_rate": 1.5630844093201827e-05, + "loss": 0.6314, + "step": 8943 + }, + { + "epoch": 0.31, + "learning_rate": 1.5629944222638512e-05, + "loss": 0.6363, + "step": 8944 + }, + { + "epoch": 0.31, + "learning_rate": 1.5629044285325084e-05, + "loss": 0.6415, + "step": 8945 + }, + { + "epoch": 0.31, + "learning_rate": 1.562814428127222e-05, + "loss": 0.6458, + "step": 8946 + }, + { + "epoch": 0.31, + "learning_rate": 1.562724421049058e-05, + "loss": 0.648, + "step": 8947 + }, + { + "epoch": 0.31, + "learning_rate": 1.5626344072990842e-05, + "loss": 0.5763, + "step": 8948 + }, + { + "epoch": 0.31, + "learning_rate": 1.562544386878368e-05, + "loss": 0.5904, + "step": 8949 + }, + { + "epoch": 0.31, + "learning_rate": 1.562454359787976e-05, + "loss": 0.6567, + "step": 8950 + }, + { + "epoch": 0.31, + "learning_rate": 1.562364326028977e-05, + "loss": 0.6079, + "step": 8951 + }, + { + "epoch": 0.31, + "learning_rate": 1.5622742856024368e-05, + "loss": 0.6309, + "step": 8952 + }, + { + "epoch": 0.31, + "learning_rate": 1.5621842385094237e-05, + "loss": 0.6191, + "step": 8953 + }, + { + "epoch": 0.31, + "learning_rate": 1.5620941847510054e-05, + "loss": 0.6293, + "step": 8954 + }, + { + "epoch": 0.31, + "learning_rate": 1.5620041243282494e-05, + "loss": 0.6605, + "step": 8955 + }, + { + "epoch": 0.31, + "learning_rate": 1.5619140572422237e-05, + "loss": 0.6446, + "step": 8956 + }, + { + "epoch": 0.31, + "learning_rate": 1.5618239834939962e-05, + "loss": 0.6179, + "step": 8957 + }, + { + "epoch": 0.31, + "learning_rate": 1.5617339030846345e-05, + "loss": 0.5993, + "step": 8958 + }, + { + "epoch": 0.31, + "learning_rate": 1.561643816015207e-05, + "loss": 0.5899, + "step": 8959 + }, + { + "epoch": 0.31, + "learning_rate": 1.561553722286781e-05, + "loss": 0.5926, + "step": 8960 + }, + { + "epoch": 0.31, + "learning_rate": 1.5614636219004254e-05, + "loss": 0.6315, + "step": 8961 + }, + { + "epoch": 0.31, + "learning_rate": 1.5613735148572088e-05, + "loss": 0.5757, + "step": 8962 + }, + { + "epoch": 0.31, + "learning_rate": 1.5612834011581987e-05, + "loss": 0.5722, + "step": 8963 + }, + { + "epoch": 0.31, + "learning_rate": 1.5611932808044637e-05, + "loss": 0.6541, + "step": 8964 + }, + { + "epoch": 0.31, + "learning_rate": 1.5611031537970728e-05, + "loss": 0.6613, + "step": 8965 + }, + { + "epoch": 0.31, + "learning_rate": 1.561013020137094e-05, + "loss": 0.6097, + "step": 8966 + }, + { + "epoch": 0.31, + "learning_rate": 1.5609228798255958e-05, + "loss": 0.6276, + "step": 8967 + }, + { + "epoch": 0.31, + "learning_rate": 1.560832732863648e-05, + "loss": 0.6603, + "step": 8968 + }, + { + "epoch": 0.31, + "learning_rate": 1.5607425792523183e-05, + "loss": 0.654, + "step": 8969 + }, + { + "epoch": 0.31, + "learning_rate": 1.5606524189926758e-05, + "loss": 0.5973, + "step": 8970 + }, + { + "epoch": 0.31, + "learning_rate": 1.5605622520857902e-05, + "loss": 0.6316, + "step": 8971 + }, + { + "epoch": 0.31, + "learning_rate": 1.5604720785327296e-05, + "loss": 0.6524, + "step": 8972 + }, + { + "epoch": 0.31, + "learning_rate": 1.5603818983345635e-05, + "loss": 0.658, + "step": 8973 + }, + { + "epoch": 0.31, + "learning_rate": 1.5602917114923613e-05, + "loss": 0.6661, + "step": 8974 + }, + { + "epoch": 0.31, + "learning_rate": 1.560201518007192e-05, + "loss": 0.6117, + "step": 8975 + }, + { + "epoch": 0.31, + "learning_rate": 1.560111317880125e-05, + "loss": 0.6355, + "step": 8976 + }, + { + "epoch": 0.31, + "learning_rate": 1.5600211111122297e-05, + "loss": 0.6879, + "step": 8977 + }, + { + "epoch": 0.31, + "learning_rate": 1.559930897704576e-05, + "loss": 0.5768, + "step": 8978 + }, + { + "epoch": 0.31, + "learning_rate": 1.5598406776582326e-05, + "loss": 0.66, + "step": 8979 + }, + { + "epoch": 0.31, + "learning_rate": 1.55975045097427e-05, + "loss": 0.6819, + "step": 8980 + }, + { + "epoch": 0.31, + "learning_rate": 1.559660217653758e-05, + "loss": 0.6336, + "step": 8981 + }, + { + "epoch": 0.31, + "learning_rate": 1.5595699776977662e-05, + "loss": 0.6161, + "step": 8982 + }, + { + "epoch": 0.31, + "learning_rate": 1.5594797311073643e-05, + "loss": 0.6323, + "step": 8983 + }, + { + "epoch": 0.31, + "learning_rate": 1.5593894778836224e-05, + "loss": 0.6817, + "step": 8984 + }, + { + "epoch": 0.31, + "learning_rate": 1.559299218027611e-05, + "loss": 0.6605, + "step": 8985 + }, + { + "epoch": 0.31, + "learning_rate": 1.5592089515403993e-05, + "loss": 0.6552, + "step": 8986 + }, + { + "epoch": 0.31, + "learning_rate": 1.559118678423058e-05, + "loss": 0.6244, + "step": 8987 + }, + { + "epoch": 0.31, + "learning_rate": 1.5590283986766582e-05, + "loss": 0.6201, + "step": 8988 + }, + { + "epoch": 0.31, + "learning_rate": 1.5589381123022687e-05, + "loss": 0.65, + "step": 8989 + }, + { + "epoch": 0.31, + "learning_rate": 1.5588478193009615e-05, + "loss": 0.6646, + "step": 8990 + }, + { + "epoch": 0.31, + "learning_rate": 1.558757519673806e-05, + "loss": 0.653, + "step": 8991 + }, + { + "epoch": 0.31, + "learning_rate": 1.5586672134218735e-05, + "loss": 0.6515, + "step": 8992 + }, + { + "epoch": 0.31, + "learning_rate": 1.5585769005462344e-05, + "loss": 0.6735, + "step": 8993 + }, + { + "epoch": 0.31, + "learning_rate": 1.5584865810479594e-05, + "loss": 0.5845, + "step": 8994 + }, + { + "epoch": 0.31, + "learning_rate": 1.5583962549281196e-05, + "loss": 0.6413, + "step": 8995 + }, + { + "epoch": 0.31, + "learning_rate": 1.5583059221877863e-05, + "loss": 0.6474, + "step": 8996 + }, + { + "epoch": 0.31, + "learning_rate": 1.5582155828280293e-05, + "loss": 0.5978, + "step": 8997 + }, + { + "epoch": 0.31, + "learning_rate": 1.558125236849921e-05, + "loss": 0.6067, + "step": 8998 + }, + { + "epoch": 0.31, + "learning_rate": 1.5580348842545314e-05, + "loss": 0.6326, + "step": 8999 + }, + { + "epoch": 0.31, + "learning_rate": 1.5579445250429328e-05, + "loss": 0.6415, + "step": 9000 + }, + { + "epoch": 0.31, + "learning_rate": 1.557854159216196e-05, + "loss": 0.6146, + "step": 9001 + }, + { + "epoch": 0.31, + "learning_rate": 1.557763786775392e-05, + "loss": 0.5799, + "step": 9002 + }, + { + "epoch": 0.31, + "learning_rate": 1.5576734077215933e-05, + "loss": 0.6095, + "step": 9003 + }, + { + "epoch": 0.31, + "learning_rate": 1.5575830220558702e-05, + "loss": 0.6138, + "step": 9004 + }, + { + "epoch": 0.31, + "learning_rate": 1.557492629779296e-05, + "loss": 0.6461, + "step": 9005 + }, + { + "epoch": 0.31, + "learning_rate": 1.5574022308929406e-05, + "loss": 0.6589, + "step": 9006 + }, + { + "epoch": 0.31, + "learning_rate": 1.557311825397877e-05, + "loss": 0.6264, + "step": 9007 + }, + { + "epoch": 0.31, + "learning_rate": 1.5572214132951767e-05, + "loss": 0.6638, + "step": 9008 + }, + { + "epoch": 0.31, + "learning_rate": 1.5571309945859116e-05, + "loss": 0.6347, + "step": 9009 + }, + { + "epoch": 0.31, + "learning_rate": 1.557040569271154e-05, + "loss": 0.5865, + "step": 9010 + }, + { + "epoch": 0.31, + "learning_rate": 1.5569501373519754e-05, + "loss": 0.6467, + "step": 9011 + }, + { + "epoch": 0.31, + "learning_rate": 1.5568596988294486e-05, + "loss": 0.6476, + "step": 9012 + }, + { + "epoch": 0.31, + "learning_rate": 1.556769253704646e-05, + "loss": 0.7084, + "step": 9013 + }, + { + "epoch": 0.31, + "learning_rate": 1.556678801978639e-05, + "loss": 0.6249, + "step": 9014 + }, + { + "epoch": 0.31, + "learning_rate": 1.5565883436525005e-05, + "loss": 0.6765, + "step": 9015 + }, + { + "epoch": 0.31, + "learning_rate": 1.556497878727304e-05, + "loss": 0.6444, + "step": 9016 + }, + { + "epoch": 0.31, + "learning_rate": 1.5564074072041204e-05, + "loss": 0.6426, + "step": 9017 + }, + { + "epoch": 0.31, + "learning_rate": 1.556316929084023e-05, + "loss": 0.6479, + "step": 9018 + }, + { + "epoch": 0.31, + "learning_rate": 1.5562264443680852e-05, + "loss": 0.6413, + "step": 9019 + }, + { + "epoch": 0.31, + "learning_rate": 1.556135953057379e-05, + "loss": 0.604, + "step": 9020 + }, + { + "epoch": 0.31, + "learning_rate": 1.5560454551529775e-05, + "loss": 0.572, + "step": 9021 + }, + { + "epoch": 0.31, + "learning_rate": 1.555954950655954e-05, + "loss": 0.6181, + "step": 9022 + }, + { + "epoch": 0.31, + "learning_rate": 1.555864439567381e-05, + "loss": 0.6478, + "step": 9023 + }, + { + "epoch": 0.31, + "learning_rate": 1.5557739218883317e-05, + "loss": 0.6062, + "step": 9024 + }, + { + "epoch": 0.31, + "learning_rate": 1.55568339761988e-05, + "loss": 0.6262, + "step": 9025 + }, + { + "epoch": 0.31, + "learning_rate": 1.5555928667630984e-05, + "loss": 0.6546, + "step": 9026 + }, + { + "epoch": 0.31, + "learning_rate": 1.5555023293190608e-05, + "loss": 0.6776, + "step": 9027 + }, + { + "epoch": 0.31, + "learning_rate": 1.5554117852888402e-05, + "loss": 0.6202, + "step": 9028 + }, + { + "epoch": 0.31, + "learning_rate": 1.55532123467351e-05, + "loss": 0.6612, + "step": 9029 + }, + { + "epoch": 0.31, + "learning_rate": 1.5552306774741443e-05, + "loss": 0.643, + "step": 9030 + }, + { + "epoch": 0.31, + "learning_rate": 1.5551401136918167e-05, + "loss": 0.6383, + "step": 9031 + }, + { + "epoch": 0.31, + "learning_rate": 1.5550495433276007e-05, + "loss": 0.6424, + "step": 9032 + }, + { + "epoch": 0.31, + "learning_rate": 1.5549589663825702e-05, + "loss": 0.6011, + "step": 9033 + }, + { + "epoch": 0.31, + "learning_rate": 1.5548683828577993e-05, + "loss": 0.6408, + "step": 9034 + }, + { + "epoch": 0.31, + "learning_rate": 1.5547777927543616e-05, + "loss": 0.6453, + "step": 9035 + }, + { + "epoch": 0.31, + "learning_rate": 1.5546871960733313e-05, + "loss": 0.6841, + "step": 9036 + }, + { + "epoch": 0.31, + "learning_rate": 1.554596592815783e-05, + "loss": 0.6146, + "step": 9037 + }, + { + "epoch": 0.31, + "learning_rate": 1.55450598298279e-05, + "loss": 0.6198, + "step": 9038 + }, + { + "epoch": 0.31, + "learning_rate": 1.5544153665754277e-05, + "loss": 0.6379, + "step": 9039 + }, + { + "epoch": 0.31, + "learning_rate": 1.5543247435947694e-05, + "loss": 0.6631, + "step": 9040 + }, + { + "epoch": 0.31, + "learning_rate": 1.55423411404189e-05, + "loss": 0.6342, + "step": 9041 + }, + { + "epoch": 0.31, + "learning_rate": 1.5541434779178645e-05, + "loss": 0.6571, + "step": 9042 + }, + { + "epoch": 0.31, + "learning_rate": 1.5540528352237666e-05, + "loss": 0.6542, + "step": 9043 + }, + { + "epoch": 0.31, + "learning_rate": 1.5539621859606718e-05, + "loss": 0.6657, + "step": 9044 + }, + { + "epoch": 0.31, + "learning_rate": 1.5538715301296547e-05, + "loss": 0.6223, + "step": 9045 + }, + { + "epoch": 0.31, + "learning_rate": 1.5537808677317893e-05, + "loss": 0.5735, + "step": 9046 + }, + { + "epoch": 0.31, + "learning_rate": 1.5536901987681518e-05, + "loss": 0.6402, + "step": 9047 + }, + { + "epoch": 0.31, + "learning_rate": 1.553599523239816e-05, + "loss": 0.5785, + "step": 9048 + }, + { + "epoch": 0.31, + "learning_rate": 1.553508841147858e-05, + "loss": 0.646, + "step": 9049 + }, + { + "epoch": 0.31, + "learning_rate": 1.5534181524933523e-05, + "loss": 0.6175, + "step": 9050 + }, + { + "epoch": 0.31, + "learning_rate": 1.5533274572773743e-05, + "loss": 0.7057, + "step": 9051 + }, + { + "epoch": 0.31, + "learning_rate": 1.5532367555009994e-05, + "loss": 0.6005, + "step": 9052 + }, + { + "epoch": 0.31, + "learning_rate": 1.5531460471653033e-05, + "loss": 0.66, + "step": 9053 + }, + { + "epoch": 0.31, + "learning_rate": 1.5530553322713605e-05, + "loss": 0.6592, + "step": 9054 + }, + { + "epoch": 0.31, + "learning_rate": 1.5529646108202473e-05, + "loss": 0.618, + "step": 9055 + }, + { + "epoch": 0.31, + "learning_rate": 1.552873882813039e-05, + "loss": 0.664, + "step": 9056 + }, + { + "epoch": 0.31, + "learning_rate": 1.552783148250812e-05, + "loss": 0.651, + "step": 9057 + }, + { + "epoch": 0.31, + "learning_rate": 1.5526924071346406e-05, + "loss": 0.6043, + "step": 9058 + }, + { + "epoch": 0.31, + "learning_rate": 1.5526016594656025e-05, + "loss": 0.6294, + "step": 9059 + }, + { + "epoch": 0.31, + "learning_rate": 1.552510905244772e-05, + "loss": 0.6318, + "step": 9060 + }, + { + "epoch": 0.31, + "learning_rate": 1.552420144473226e-05, + "loss": 0.606, + "step": 9061 + }, + { + "epoch": 0.31, + "learning_rate": 1.5523293771520406e-05, + "loss": 0.6333, + "step": 9062 + }, + { + "epoch": 0.31, + "learning_rate": 1.5522386032822914e-05, + "loss": 0.601, + "step": 9063 + }, + { + "epoch": 0.31, + "learning_rate": 1.552147822865055e-05, + "loss": 0.6382, + "step": 9064 + }, + { + "epoch": 0.31, + "learning_rate": 1.5520570359014078e-05, + "loss": 0.641, + "step": 9065 + }, + { + "epoch": 0.31, + "learning_rate": 1.551966242392426e-05, + "loss": 0.6304, + "step": 9066 + }, + { + "epoch": 0.31, + "learning_rate": 1.5518754423391864e-05, + "loss": 0.6186, + "step": 9067 + }, + { + "epoch": 0.31, + "learning_rate": 1.5517846357427654e-05, + "loss": 0.591, + "step": 9068 + }, + { + "epoch": 0.31, + "learning_rate": 1.5516938226042388e-05, + "loss": 0.6369, + "step": 9069 + }, + { + "epoch": 0.31, + "learning_rate": 1.5516030029246845e-05, + "loss": 0.5944, + "step": 9070 + }, + { + "epoch": 0.31, + "learning_rate": 1.551512176705179e-05, + "loss": 0.6455, + "step": 9071 + }, + { + "epoch": 0.31, + "learning_rate": 1.5514213439467988e-05, + "loss": 0.6206, + "step": 9072 + }, + { + "epoch": 0.31, + "learning_rate": 1.551330504650621e-05, + "loss": 0.617, + "step": 9073 + }, + { + "epoch": 0.31, + "learning_rate": 1.5512396588177225e-05, + "loss": 0.6208, + "step": 9074 + }, + { + "epoch": 0.31, + "learning_rate": 1.5511488064491807e-05, + "loss": 0.6396, + "step": 9075 + }, + { + "epoch": 0.31, + "learning_rate": 1.5510579475460724e-05, + "loss": 0.6092, + "step": 9076 + }, + { + "epoch": 0.31, + "learning_rate": 1.5509670821094755e-05, + "loss": 0.6375, + "step": 9077 + }, + { + "epoch": 0.31, + "learning_rate": 1.5508762101404666e-05, + "loss": 0.6081, + "step": 9078 + }, + { + "epoch": 0.31, + "learning_rate": 1.5507853316401235e-05, + "loss": 0.6306, + "step": 9079 + }, + { + "epoch": 0.31, + "learning_rate": 1.5506944466095233e-05, + "loss": 0.663, + "step": 9080 + }, + { + "epoch": 0.31, + "learning_rate": 1.550603555049744e-05, + "loss": 0.6635, + "step": 9081 + }, + { + "epoch": 0.31, + "learning_rate": 1.5505126569618628e-05, + "loss": 0.6064, + "step": 9082 + }, + { + "epoch": 0.31, + "learning_rate": 1.5504217523469576e-05, + "loss": 0.6549, + "step": 9083 + }, + { + "epoch": 0.31, + "learning_rate": 1.5503308412061064e-05, + "loss": 0.6173, + "step": 9084 + }, + { + "epoch": 0.31, + "learning_rate": 1.550239923540387e-05, + "loss": 0.6257, + "step": 9085 + }, + { + "epoch": 0.31, + "learning_rate": 1.5501489993508773e-05, + "loss": 0.6059, + "step": 9086 + }, + { + "epoch": 0.31, + "learning_rate": 1.550058068638655e-05, + "loss": 0.6051, + "step": 9087 + }, + { + "epoch": 0.31, + "learning_rate": 1.5499671314047983e-05, + "loss": 0.6417, + "step": 9088 + }, + { + "epoch": 0.31, + "learning_rate": 1.549876187650386e-05, + "loss": 0.5869, + "step": 9089 + }, + { + "epoch": 0.31, + "learning_rate": 1.5497852373764958e-05, + "loss": 0.6417, + "step": 9090 + }, + { + "epoch": 0.31, + "learning_rate": 1.5496942805842063e-05, + "loss": 0.6179, + "step": 9091 + }, + { + "epoch": 0.32, + "learning_rate": 1.5496033172745955e-05, + "loss": 0.627, + "step": 9092 + }, + { + "epoch": 0.32, + "learning_rate": 1.549512347448742e-05, + "loss": 0.6005, + "step": 9093 + }, + { + "epoch": 0.32, + "learning_rate": 1.5494213711077244e-05, + "loss": 0.6038, + "step": 9094 + }, + { + "epoch": 0.32, + "learning_rate": 1.5493303882526217e-05, + "loss": 0.5947, + "step": 9095 + }, + { + "epoch": 0.32, + "learning_rate": 1.5492393988845126e-05, + "loss": 0.6148, + "step": 9096 + }, + { + "epoch": 0.32, + "learning_rate": 1.549148403004475e-05, + "loss": 0.613, + "step": 9097 + }, + { + "epoch": 0.32, + "learning_rate": 1.549057400613589e-05, + "loss": 0.6539, + "step": 9098 + }, + { + "epoch": 0.32, + "learning_rate": 1.5489663917129325e-05, + "loss": 0.6152, + "step": 9099 + }, + { + "epoch": 0.32, + "learning_rate": 1.5488753763035852e-05, + "loss": 0.6374, + "step": 9100 + }, + { + "epoch": 0.32, + "learning_rate": 1.5487843543866257e-05, + "loss": 0.6437, + "step": 9101 + }, + { + "epoch": 0.32, + "learning_rate": 1.548693325963134e-05, + "loss": 0.6097, + "step": 9102 + }, + { + "epoch": 0.32, + "learning_rate": 1.5486022910341884e-05, + "loss": 0.6485, + "step": 9103 + }, + { + "epoch": 0.32, + "learning_rate": 1.548511249600869e-05, + "loss": 0.6745, + "step": 9104 + }, + { + "epoch": 0.32, + "learning_rate": 1.5484202016642546e-05, + "loss": 0.651, + "step": 9105 + }, + { + "epoch": 0.32, + "learning_rate": 1.5483291472254248e-05, + "loss": 0.5727, + "step": 9106 + }, + { + "epoch": 0.32, + "learning_rate": 1.5482380862854596e-05, + "loss": 0.6204, + "step": 9107 + }, + { + "epoch": 0.32, + "learning_rate": 1.5481470188454384e-05, + "loss": 0.6566, + "step": 9108 + }, + { + "epoch": 0.32, + "learning_rate": 1.5480559449064404e-05, + "loss": 0.5982, + "step": 9109 + }, + { + "epoch": 0.32, + "learning_rate": 1.5479648644695463e-05, + "loss": 0.6564, + "step": 9110 + }, + { + "epoch": 0.32, + "learning_rate": 1.5478737775358357e-05, + "loss": 0.6047, + "step": 9111 + }, + { + "epoch": 0.32, + "learning_rate": 1.5477826841063883e-05, + "loss": 0.6421, + "step": 9112 + }, + { + "epoch": 0.32, + "learning_rate": 1.547691584182284e-05, + "loss": 0.6014, + "step": 9113 + }, + { + "epoch": 0.32, + "learning_rate": 1.547600477764603e-05, + "loss": 0.662, + "step": 9114 + }, + { + "epoch": 0.32, + "learning_rate": 1.5475093648544262e-05, + "loss": 0.6635, + "step": 9115 + }, + { + "epoch": 0.32, + "learning_rate": 1.5474182454528328e-05, + "loss": 0.6397, + "step": 9116 + }, + { + "epoch": 0.32, + "learning_rate": 1.547327119560904e-05, + "loss": 0.6617, + "step": 9117 + }, + { + "epoch": 0.32, + "learning_rate": 1.5472359871797194e-05, + "loss": 0.6081, + "step": 9118 + }, + { + "epoch": 0.32, + "learning_rate": 1.5471448483103602e-05, + "loss": 0.6691, + "step": 9119 + }, + { + "epoch": 0.32, + "learning_rate": 1.5470537029539066e-05, + "loss": 0.6868, + "step": 9120 + }, + { + "epoch": 0.32, + "learning_rate": 1.5469625511114395e-05, + "loss": 0.6485, + "step": 9121 + }, + { + "epoch": 0.32, + "learning_rate": 1.546871392784039e-05, + "loss": 0.6274, + "step": 9122 + }, + { + "epoch": 0.32, + "learning_rate": 1.5467802279727867e-05, + "loss": 0.5905, + "step": 9123 + }, + { + "epoch": 0.32, + "learning_rate": 1.546689056678763e-05, + "loss": 0.6225, + "step": 9124 + }, + { + "epoch": 0.32, + "learning_rate": 1.546597878903049e-05, + "loss": 0.6731, + "step": 9125 + }, + { + "epoch": 0.32, + "learning_rate": 1.5465066946467255e-05, + "loss": 0.5876, + "step": 9126 + }, + { + "epoch": 0.32, + "learning_rate": 1.546415503910874e-05, + "loss": 0.641, + "step": 9127 + }, + { + "epoch": 0.32, + "learning_rate": 1.5463243066965756e-05, + "loss": 0.6217, + "step": 9128 + }, + { + "epoch": 0.32, + "learning_rate": 1.5462331030049115e-05, + "loss": 0.5912, + "step": 9129 + }, + { + "epoch": 0.32, + "learning_rate": 1.5461418928369628e-05, + "loss": 0.6161, + "step": 9130 + }, + { + "epoch": 0.32, + "learning_rate": 1.546050676193811e-05, + "loss": 0.6481, + "step": 9131 + }, + { + "epoch": 0.32, + "learning_rate": 1.5459594530765377e-05, + "loss": 0.632, + "step": 9132 + }, + { + "epoch": 0.32, + "learning_rate": 1.5458682234862245e-05, + "loss": 0.611, + "step": 9133 + }, + { + "epoch": 0.32, + "learning_rate": 1.545776987423953e-05, + "loss": 0.6602, + "step": 9134 + }, + { + "epoch": 0.32, + "learning_rate": 1.5456857448908048e-05, + "loss": 0.6169, + "step": 9135 + }, + { + "epoch": 0.32, + "learning_rate": 1.545594495887862e-05, + "loss": 0.664, + "step": 9136 + }, + { + "epoch": 0.32, + "learning_rate": 1.5455032404162063e-05, + "loss": 0.6383, + "step": 9137 + }, + { + "epoch": 0.32, + "learning_rate": 1.5454119784769192e-05, + "loss": 0.6271, + "step": 9138 + }, + { + "epoch": 0.32, + "learning_rate": 1.5453207100710834e-05, + "loss": 0.6333, + "step": 9139 + }, + { + "epoch": 0.32, + "learning_rate": 1.5452294351997807e-05, + "loss": 0.606, + "step": 9140 + }, + { + "epoch": 0.32, + "learning_rate": 1.5451381538640933e-05, + "loss": 0.6053, + "step": 9141 + }, + { + "epoch": 0.32, + "learning_rate": 1.5450468660651038e-05, + "loss": 0.6557, + "step": 9142 + }, + { + "epoch": 0.32, + "learning_rate": 1.544955571803894e-05, + "loss": 0.6667, + "step": 9143 + }, + { + "epoch": 0.32, + "learning_rate": 1.544864271081546e-05, + "loss": 0.5926, + "step": 9144 + }, + { + "epoch": 0.32, + "learning_rate": 1.5447729638991437e-05, + "loss": 0.593, + "step": 9145 + }, + { + "epoch": 0.32, + "learning_rate": 1.5446816502577685e-05, + "loss": 0.6389, + "step": 9146 + }, + { + "epoch": 0.32, + "learning_rate": 1.544590330158503e-05, + "loss": 0.6862, + "step": 9147 + }, + { + "epoch": 0.32, + "learning_rate": 1.5444990036024306e-05, + "loss": 0.5867, + "step": 9148 + }, + { + "epoch": 0.32, + "learning_rate": 1.5444076705906336e-05, + "loss": 0.6665, + "step": 9149 + }, + { + "epoch": 0.32, + "learning_rate": 1.5443163311241945e-05, + "loss": 0.6467, + "step": 9150 + }, + { + "epoch": 0.32, + "learning_rate": 1.5442249852041975e-05, + "loss": 0.6248, + "step": 9151 + }, + { + "epoch": 0.32, + "learning_rate": 1.5441336328317244e-05, + "loss": 0.6923, + "step": 9152 + }, + { + "epoch": 0.32, + "learning_rate": 1.5440422740078587e-05, + "loss": 0.662, + "step": 9153 + }, + { + "epoch": 0.32, + "learning_rate": 1.543950908733684e-05, + "loss": 0.6051, + "step": 9154 + }, + { + "epoch": 0.32, + "learning_rate": 1.5438595370102828e-05, + "loss": 0.6581, + "step": 9155 + }, + { + "epoch": 0.32, + "learning_rate": 1.543768158838739e-05, + "loss": 0.5961, + "step": 9156 + }, + { + "epoch": 0.32, + "learning_rate": 1.543676774220136e-05, + "loss": 0.6077, + "step": 9157 + }, + { + "epoch": 0.32, + "learning_rate": 1.543585383155557e-05, + "loss": 0.6622, + "step": 9158 + }, + { + "epoch": 0.32, + "learning_rate": 1.543493985646085e-05, + "loss": 0.6022, + "step": 9159 + }, + { + "epoch": 0.32, + "learning_rate": 1.543402581692805e-05, + "loss": 0.6445, + "step": 9160 + }, + { + "epoch": 0.32, + "learning_rate": 1.5433111712967998e-05, + "loss": 0.6549, + "step": 9161 + }, + { + "epoch": 0.32, + "learning_rate": 1.5432197544591532e-05, + "loss": 0.6064, + "step": 9162 + }, + { + "epoch": 0.32, + "learning_rate": 1.5431283311809497e-05, + "loss": 0.6452, + "step": 9163 + }, + { + "epoch": 0.32, + "learning_rate": 1.5430369014632724e-05, + "loss": 0.5994, + "step": 9164 + }, + { + "epoch": 0.32, + "learning_rate": 1.5429454653072055e-05, + "loss": 0.59, + "step": 9165 + }, + { + "epoch": 0.32, + "learning_rate": 1.5428540227138335e-05, + "loss": 0.6181, + "step": 9166 + }, + { + "epoch": 0.32, + "learning_rate": 1.5427625736842404e-05, + "loss": 0.6275, + "step": 9167 + }, + { + "epoch": 0.32, + "learning_rate": 1.5426711182195106e-05, + "loss": 0.67, + "step": 9168 + }, + { + "epoch": 0.32, + "learning_rate": 1.5425796563207277e-05, + "loss": 0.6268, + "step": 9169 + }, + { + "epoch": 0.32, + "learning_rate": 1.5424881879889772e-05, + "loss": 0.6392, + "step": 9170 + }, + { + "epoch": 0.32, + "learning_rate": 1.5423967132253424e-05, + "loss": 0.6388, + "step": 9171 + }, + { + "epoch": 0.32, + "learning_rate": 1.5423052320309087e-05, + "loss": 0.6161, + "step": 9172 + }, + { + "epoch": 0.32, + "learning_rate": 1.54221374440676e-05, + "loss": 0.6416, + "step": 9173 + }, + { + "epoch": 0.32, + "learning_rate": 1.542122250353982e-05, + "loss": 0.6276, + "step": 9174 + }, + { + "epoch": 0.32, + "learning_rate": 1.542030749873659e-05, + "loss": 0.6375, + "step": 9175 + }, + { + "epoch": 0.32, + "learning_rate": 1.5419392429668757e-05, + "loss": 0.6341, + "step": 9176 + }, + { + "epoch": 0.32, + "learning_rate": 1.541847729634717e-05, + "loss": 0.6094, + "step": 9177 + }, + { + "epoch": 0.32, + "learning_rate": 1.5417562098782682e-05, + "loss": 0.6376, + "step": 9178 + }, + { + "epoch": 0.32, + "learning_rate": 1.5416646836986137e-05, + "loss": 0.6039, + "step": 9179 + }, + { + "epoch": 0.32, + "learning_rate": 1.5415731510968397e-05, + "loss": 0.6229, + "step": 9180 + }, + { + "epoch": 0.32, + "learning_rate": 1.541481612074031e-05, + "loss": 0.6606, + "step": 9181 + }, + { + "epoch": 0.32, + "learning_rate": 1.5413900666312723e-05, + "loss": 0.6227, + "step": 9182 + }, + { + "epoch": 0.32, + "learning_rate": 1.5412985147696497e-05, + "loss": 0.6199, + "step": 9183 + }, + { + "epoch": 0.32, + "learning_rate": 1.5412069564902484e-05, + "loss": 0.6208, + "step": 9184 + }, + { + "epoch": 0.32, + "learning_rate": 1.5411153917941542e-05, + "loss": 0.6064, + "step": 9185 + }, + { + "epoch": 0.32, + "learning_rate": 1.5410238206824525e-05, + "loss": 0.709, + "step": 9186 + }, + { + "epoch": 0.32, + "learning_rate": 1.540932243156229e-05, + "loss": 0.6131, + "step": 9187 + }, + { + "epoch": 0.32, + "learning_rate": 1.5408406592165693e-05, + "loss": 0.657, + "step": 9188 + }, + { + "epoch": 0.32, + "learning_rate": 1.5407490688645593e-05, + "loss": 0.6773, + "step": 9189 + }, + { + "epoch": 0.32, + "learning_rate": 1.5406574721012854e-05, + "loss": 0.6014, + "step": 9190 + }, + { + "epoch": 0.32, + "learning_rate": 1.540565868927833e-05, + "loss": 0.651, + "step": 9191 + }, + { + "epoch": 0.32, + "learning_rate": 1.5404742593452886e-05, + "loss": 0.6056, + "step": 9192 + }, + { + "epoch": 0.32, + "learning_rate": 1.5403826433547378e-05, + "loss": 0.5953, + "step": 9193 + }, + { + "epoch": 0.32, + "learning_rate": 1.5402910209572673e-05, + "loss": 0.6549, + "step": 9194 + }, + { + "epoch": 0.32, + "learning_rate": 1.540199392153964e-05, + "loss": 0.6328, + "step": 9195 + }, + { + "epoch": 0.32, + "learning_rate": 1.5401077569459123e-05, + "loss": 0.6188, + "step": 9196 + }, + { + "epoch": 0.32, + "learning_rate": 1.540016115334201e-05, + "loss": 0.6127, + "step": 9197 + }, + { + "epoch": 0.32, + "learning_rate": 1.539924467319915e-05, + "loss": 0.6185, + "step": 9198 + }, + { + "epoch": 0.32, + "learning_rate": 1.5398328129041415e-05, + "loss": 0.6161, + "step": 9199 + }, + { + "epoch": 0.32, + "learning_rate": 1.539741152087967e-05, + "loss": 0.6006, + "step": 9200 + }, + { + "epoch": 0.32, + "learning_rate": 1.5396494848724785e-05, + "loss": 0.6231, + "step": 9201 + }, + { + "epoch": 0.32, + "learning_rate": 1.5395578112587628e-05, + "loss": 0.6741, + "step": 9202 + }, + { + "epoch": 0.32, + "learning_rate": 1.5394661312479064e-05, + "loss": 0.5954, + "step": 9203 + }, + { + "epoch": 0.32, + "learning_rate": 1.5393744448409967e-05, + "loss": 0.6292, + "step": 9204 + }, + { + "epoch": 0.32, + "learning_rate": 1.5392827520391208e-05, + "loss": 0.6527, + "step": 9205 + }, + { + "epoch": 0.32, + "learning_rate": 1.5391910528433655e-05, + "loss": 0.6166, + "step": 9206 + }, + { + "epoch": 0.32, + "learning_rate": 1.5390993472548185e-05, + "loss": 0.6189, + "step": 9207 + }, + { + "epoch": 0.32, + "learning_rate": 1.5390076352745663e-05, + "loss": 0.5953, + "step": 9208 + }, + { + "epoch": 0.32, + "learning_rate": 1.5389159169036967e-05, + "loss": 0.5873, + "step": 9209 + }, + { + "epoch": 0.32, + "learning_rate": 1.538824192143298e-05, + "loss": 0.5989, + "step": 9210 + }, + { + "epoch": 0.32, + "learning_rate": 1.538732460994456e-05, + "loss": 0.6531, + "step": 9211 + }, + { + "epoch": 0.32, + "learning_rate": 1.5386407234582598e-05, + "loss": 0.7412, + "step": 9212 + }, + { + "epoch": 0.32, + "learning_rate": 1.538548979535796e-05, + "loss": 0.6161, + "step": 9213 + }, + { + "epoch": 0.32, + "learning_rate": 1.5384572292281527e-05, + "loss": 0.6057, + "step": 9214 + }, + { + "epoch": 0.32, + "learning_rate": 1.5383654725364183e-05, + "loss": 0.5928, + "step": 9215 + }, + { + "epoch": 0.32, + "learning_rate": 1.53827370946168e-05, + "loss": 0.6399, + "step": 9216 + }, + { + "epoch": 0.32, + "learning_rate": 1.5381819400050257e-05, + "loss": 0.6473, + "step": 9217 + }, + { + "epoch": 0.32, + "learning_rate": 1.538090164167544e-05, + "loss": 0.6004, + "step": 9218 + }, + { + "epoch": 0.32, + "learning_rate": 1.5379983819503226e-05, + "loss": 0.6921, + "step": 9219 + }, + { + "epoch": 0.32, + "learning_rate": 1.5379065933544495e-05, + "loss": 0.6278, + "step": 9220 + }, + { + "epoch": 0.32, + "learning_rate": 1.5378147983810136e-05, + "loss": 0.6243, + "step": 9221 + }, + { + "epoch": 0.32, + "learning_rate": 1.5377229970311032e-05, + "loss": 0.6204, + "step": 9222 + }, + { + "epoch": 0.32, + "learning_rate": 1.537631189305806e-05, + "loss": 0.6686, + "step": 9223 + }, + { + "epoch": 0.32, + "learning_rate": 1.5375393752062108e-05, + "loss": 0.6589, + "step": 9224 + }, + { + "epoch": 0.32, + "learning_rate": 1.537447554733407e-05, + "loss": 0.6431, + "step": 9225 + }, + { + "epoch": 0.32, + "learning_rate": 1.5373557278884822e-05, + "loss": 0.6665, + "step": 9226 + }, + { + "epoch": 0.32, + "learning_rate": 1.5372638946725252e-05, + "loss": 0.6325, + "step": 9227 + }, + { + "epoch": 0.32, + "learning_rate": 1.5371720550866256e-05, + "loss": 0.6434, + "step": 9228 + }, + { + "epoch": 0.32, + "learning_rate": 1.5370802091318714e-05, + "loss": 0.6248, + "step": 9229 + }, + { + "epoch": 0.32, + "learning_rate": 1.536988356809352e-05, + "loss": 0.6254, + "step": 9230 + }, + { + "epoch": 0.32, + "learning_rate": 1.5368964981201563e-05, + "loss": 0.5734, + "step": 9231 + }, + { + "epoch": 0.32, + "learning_rate": 1.5368046330653736e-05, + "loss": 0.6119, + "step": 9232 + }, + { + "epoch": 0.32, + "learning_rate": 1.5367127616460927e-05, + "loss": 0.6842, + "step": 9233 + }, + { + "epoch": 0.32, + "learning_rate": 1.536620883863403e-05, + "loss": 0.5954, + "step": 9234 + }, + { + "epoch": 0.32, + "learning_rate": 1.5365289997183943e-05, + "loss": 0.6619, + "step": 9235 + }, + { + "epoch": 0.32, + "learning_rate": 1.5364371092121554e-05, + "loss": 0.6261, + "step": 9236 + }, + { + "epoch": 0.32, + "learning_rate": 1.536345212345776e-05, + "loss": 0.6088, + "step": 9237 + }, + { + "epoch": 0.32, + "learning_rate": 1.5362533091203454e-05, + "loss": 0.642, + "step": 9238 + }, + { + "epoch": 0.32, + "learning_rate": 1.536161399536954e-05, + "loss": 0.6076, + "step": 9239 + }, + { + "epoch": 0.32, + "learning_rate": 1.5360694835966903e-05, + "loss": 0.6196, + "step": 9240 + }, + { + "epoch": 0.32, + "learning_rate": 1.5359775613006448e-05, + "loss": 0.6702, + "step": 9241 + }, + { + "epoch": 0.32, + "learning_rate": 1.5358856326499078e-05, + "loss": 0.5974, + "step": 9242 + }, + { + "epoch": 0.32, + "learning_rate": 1.5357936976455684e-05, + "loss": 0.5836, + "step": 9243 + }, + { + "epoch": 0.32, + "learning_rate": 1.535701756288717e-05, + "loss": 0.6618, + "step": 9244 + }, + { + "epoch": 0.32, + "learning_rate": 1.5356098085804436e-05, + "loss": 0.5984, + "step": 9245 + }, + { + "epoch": 0.32, + "learning_rate": 1.5355178545218382e-05, + "loss": 0.6838, + "step": 9246 + }, + { + "epoch": 0.32, + "learning_rate": 1.5354258941139915e-05, + "loss": 0.6293, + "step": 9247 + }, + { + "epoch": 0.32, + "learning_rate": 1.5353339273579933e-05, + "loss": 0.7126, + "step": 9248 + }, + { + "epoch": 0.32, + "learning_rate": 1.535241954254934e-05, + "loss": 0.6282, + "step": 9249 + }, + { + "epoch": 0.32, + "learning_rate": 1.5351499748059046e-05, + "loss": 0.6147, + "step": 9250 + }, + { + "epoch": 0.32, + "learning_rate": 1.5350579890119952e-05, + "loss": 0.6189, + "step": 9251 + }, + { + "epoch": 0.32, + "learning_rate": 1.5349659968742963e-05, + "loss": 0.6814, + "step": 9252 + }, + { + "epoch": 0.32, + "learning_rate": 1.534873998393899e-05, + "loss": 0.6546, + "step": 9253 + }, + { + "epoch": 0.32, + "learning_rate": 1.534781993571894e-05, + "loss": 0.6613, + "step": 9254 + }, + { + "epoch": 0.32, + "learning_rate": 1.5346899824093717e-05, + "loss": 0.6403, + "step": 9255 + }, + { + "epoch": 0.32, + "learning_rate": 1.5345979649074233e-05, + "loss": 0.6334, + "step": 9256 + }, + { + "epoch": 0.32, + "learning_rate": 1.5345059410671396e-05, + "loss": 0.5932, + "step": 9257 + }, + { + "epoch": 0.32, + "learning_rate": 1.5344139108896122e-05, + "loss": 0.618, + "step": 9258 + }, + { + "epoch": 0.32, + "learning_rate": 1.5343218743759317e-05, + "loss": 0.6503, + "step": 9259 + }, + { + "epoch": 0.32, + "learning_rate": 1.5342298315271892e-05, + "loss": 0.6024, + "step": 9260 + }, + { + "epoch": 0.32, + "learning_rate": 1.5341377823444762e-05, + "loss": 0.6124, + "step": 9261 + }, + { + "epoch": 0.32, + "learning_rate": 1.5340457268288845e-05, + "loss": 0.6848, + "step": 9262 + }, + { + "epoch": 0.32, + "learning_rate": 1.533953664981505e-05, + "loss": 0.5913, + "step": 9263 + }, + { + "epoch": 0.32, + "learning_rate": 1.5338615968034294e-05, + "loss": 0.6256, + "step": 9264 + }, + { + "epoch": 0.32, + "learning_rate": 1.533769522295749e-05, + "loss": 0.6263, + "step": 9265 + }, + { + "epoch": 0.32, + "learning_rate": 1.533677441459556e-05, + "loss": 0.5887, + "step": 9266 + }, + { + "epoch": 0.32, + "learning_rate": 1.5335853542959417e-05, + "loss": 0.6686, + "step": 9267 + }, + { + "epoch": 0.32, + "learning_rate": 1.5334932608059978e-05, + "loss": 0.6905, + "step": 9268 + }, + { + "epoch": 0.32, + "learning_rate": 1.5334011609908167e-05, + "loss": 0.5804, + "step": 9269 + }, + { + "epoch": 0.32, + "learning_rate": 1.53330905485149e-05, + "loss": 0.6002, + "step": 9270 + }, + { + "epoch": 0.32, + "learning_rate": 1.53321694238911e-05, + "loss": 0.5858, + "step": 9271 + }, + { + "epoch": 0.32, + "learning_rate": 1.5331248236047684e-05, + "loss": 0.6541, + "step": 9272 + }, + { + "epoch": 0.32, + "learning_rate": 1.5330326984995575e-05, + "loss": 0.6335, + "step": 9273 + }, + { + "epoch": 0.32, + "learning_rate": 1.5329405670745695e-05, + "loss": 0.6221, + "step": 9274 + }, + { + "epoch": 0.32, + "learning_rate": 1.5328484293308977e-05, + "loss": 0.6625, + "step": 9275 + }, + { + "epoch": 0.32, + "learning_rate": 1.532756285269633e-05, + "loss": 0.6233, + "step": 9276 + }, + { + "epoch": 0.32, + "learning_rate": 1.532664134891869e-05, + "loss": 0.6902, + "step": 9277 + }, + { + "epoch": 0.32, + "learning_rate": 1.5325719781986976e-05, + "loss": 0.6785, + "step": 9278 + }, + { + "epoch": 0.32, + "learning_rate": 1.532479815191212e-05, + "loss": 0.6719, + "step": 9279 + }, + { + "epoch": 0.32, + "learning_rate": 1.5323876458705043e-05, + "loss": 0.6357, + "step": 9280 + }, + { + "epoch": 0.32, + "learning_rate": 1.5322954702376677e-05, + "loss": 0.6311, + "step": 9281 + }, + { + "epoch": 0.32, + "learning_rate": 1.5322032882937946e-05, + "loss": 0.6503, + "step": 9282 + }, + { + "epoch": 0.32, + "learning_rate": 1.5321111000399788e-05, + "loss": 0.6684, + "step": 9283 + }, + { + "epoch": 0.32, + "learning_rate": 1.5320189054773127e-05, + "loss": 0.6735, + "step": 9284 + }, + { + "epoch": 0.32, + "learning_rate": 1.5319267046068893e-05, + "loss": 0.6982, + "step": 9285 + }, + { + "epoch": 0.32, + "learning_rate": 1.5318344974298017e-05, + "loss": 0.6692, + "step": 9286 + }, + { + "epoch": 0.32, + "learning_rate": 1.5317422839471437e-05, + "loss": 0.6402, + "step": 9287 + }, + { + "epoch": 0.32, + "learning_rate": 1.5316500641600083e-05, + "loss": 0.6444, + "step": 9288 + }, + { + "epoch": 0.32, + "learning_rate": 1.5315578380694885e-05, + "loss": 0.67, + "step": 9289 + }, + { + "epoch": 0.32, + "learning_rate": 1.5314656056766787e-05, + "loss": 0.668, + "step": 9290 + }, + { + "epoch": 0.32, + "learning_rate": 1.5313733669826715e-05, + "loss": 0.6583, + "step": 9291 + }, + { + "epoch": 0.32, + "learning_rate": 1.5312811219885606e-05, + "loss": 0.6381, + "step": 9292 + }, + { + "epoch": 0.32, + "learning_rate": 1.53118887069544e-05, + "loss": 0.6969, + "step": 9293 + }, + { + "epoch": 0.32, + "learning_rate": 1.5310966131044037e-05, + "loss": 0.6568, + "step": 9294 + }, + { + "epoch": 0.32, + "learning_rate": 1.5310043492165453e-05, + "loss": 0.6118, + "step": 9295 + }, + { + "epoch": 0.32, + "learning_rate": 1.530912079032958e-05, + "loss": 0.6508, + "step": 9296 + }, + { + "epoch": 0.32, + "learning_rate": 1.5308198025547366e-05, + "loss": 0.6233, + "step": 9297 + }, + { + "epoch": 0.32, + "learning_rate": 1.5307275197829756e-05, + "loss": 0.6386, + "step": 9298 + }, + { + "epoch": 0.32, + "learning_rate": 1.530635230718768e-05, + "loss": 0.6541, + "step": 9299 + }, + { + "epoch": 0.32, + "learning_rate": 1.530542935363208e-05, + "loss": 0.6315, + "step": 9300 + }, + { + "epoch": 0.32, + "learning_rate": 1.530450633717391e-05, + "loss": 0.6135, + "step": 9301 + }, + { + "epoch": 0.32, + "learning_rate": 1.5303583257824107e-05, + "loss": 0.6732, + "step": 9302 + }, + { + "epoch": 0.32, + "learning_rate": 1.5302660115593613e-05, + "loss": 0.6116, + "step": 9303 + }, + { + "epoch": 0.32, + "learning_rate": 1.5301736910493375e-05, + "loss": 0.6312, + "step": 9304 + }, + { + "epoch": 0.32, + "learning_rate": 1.530081364253434e-05, + "loss": 0.615, + "step": 9305 + }, + { + "epoch": 0.32, + "learning_rate": 1.5299890311727456e-05, + "loss": 0.649, + "step": 9306 + }, + { + "epoch": 0.32, + "learning_rate": 1.5298966918083667e-05, + "loss": 0.628, + "step": 9307 + }, + { + "epoch": 0.32, + "learning_rate": 1.529804346161392e-05, + "loss": 0.6774, + "step": 9308 + }, + { + "epoch": 0.32, + "learning_rate": 1.5297119942329166e-05, + "loss": 0.6119, + "step": 9309 + }, + { + "epoch": 0.32, + "learning_rate": 1.5296196360240355e-05, + "loss": 0.6406, + "step": 9310 + }, + { + "epoch": 0.32, + "learning_rate": 1.5295272715358436e-05, + "loss": 0.6469, + "step": 9311 + }, + { + "epoch": 0.32, + "learning_rate": 1.5294349007694364e-05, + "loss": 0.6174, + "step": 9312 + }, + { + "epoch": 0.32, + "learning_rate": 1.5293425237259082e-05, + "loss": 0.635, + "step": 9313 + }, + { + "epoch": 0.32, + "learning_rate": 1.5292501404063548e-05, + "loss": 0.6237, + "step": 9314 + }, + { + "epoch": 0.32, + "learning_rate": 1.5291577508118715e-05, + "loss": 0.5885, + "step": 9315 + }, + { + "epoch": 0.32, + "learning_rate": 1.5290653549435542e-05, + "loss": 0.625, + "step": 9316 + }, + { + "epoch": 0.32, + "learning_rate": 1.5289729528024974e-05, + "loss": 0.6494, + "step": 9317 + }, + { + "epoch": 0.32, + "learning_rate": 1.528880544389797e-05, + "loss": 0.6219, + "step": 9318 + }, + { + "epoch": 0.32, + "learning_rate": 1.528788129706549e-05, + "loss": 0.6403, + "step": 9319 + }, + { + "epoch": 0.32, + "learning_rate": 1.5286957087538487e-05, + "loss": 0.6056, + "step": 9320 + }, + { + "epoch": 0.32, + "learning_rate": 1.5286032815327918e-05, + "loss": 0.6929, + "step": 9321 + }, + { + "epoch": 0.32, + "learning_rate": 1.5285108480444747e-05, + "loss": 0.5985, + "step": 9322 + }, + { + "epoch": 0.32, + "learning_rate": 1.5284184082899926e-05, + "loss": 0.6785, + "step": 9323 + }, + { + "epoch": 0.32, + "learning_rate": 1.5283259622704417e-05, + "loss": 0.6178, + "step": 9324 + }, + { + "epoch": 0.32, + "learning_rate": 1.5282335099869183e-05, + "loss": 0.6164, + "step": 9325 + }, + { + "epoch": 0.32, + "learning_rate": 1.528141051440519e-05, + "loss": 0.6311, + "step": 9326 + }, + { + "epoch": 0.32, + "learning_rate": 1.5280485866323383e-05, + "loss": 0.5928, + "step": 9327 + }, + { + "epoch": 0.32, + "learning_rate": 1.5279561155634747e-05, + "loss": 0.63, + "step": 9328 + }, + { + "epoch": 0.32, + "learning_rate": 1.527863638235023e-05, + "loss": 0.6409, + "step": 9329 + }, + { + "epoch": 0.32, + "learning_rate": 1.5277711546480797e-05, + "loss": 0.6277, + "step": 9330 + }, + { + "epoch": 0.32, + "learning_rate": 1.5276786648037424e-05, + "loss": 0.6225, + "step": 9331 + }, + { + "epoch": 0.32, + "learning_rate": 1.5275861687031067e-05, + "loss": 0.5904, + "step": 9332 + }, + { + "epoch": 0.32, + "learning_rate": 1.52749366634727e-05, + "loss": 0.6653, + "step": 9333 + }, + { + "epoch": 0.32, + "learning_rate": 1.527401157737328e-05, + "loss": 0.6118, + "step": 9334 + }, + { + "epoch": 0.32, + "learning_rate": 1.5273086428743785e-05, + "loss": 0.6659, + "step": 9335 + }, + { + "epoch": 0.32, + "learning_rate": 1.5272161217595174e-05, + "loss": 0.6243, + "step": 9336 + }, + { + "epoch": 0.32, + "learning_rate": 1.527123594393843e-05, + "loss": 0.6369, + "step": 9337 + }, + { + "epoch": 0.32, + "learning_rate": 1.5270310607784513e-05, + "loss": 0.629, + "step": 9338 + }, + { + "epoch": 0.32, + "learning_rate": 1.5269385209144394e-05, + "loss": 0.6539, + "step": 9339 + }, + { + "epoch": 0.32, + "learning_rate": 1.526845974802905e-05, + "loss": 0.6481, + "step": 9340 + }, + { + "epoch": 0.32, + "learning_rate": 1.5267534224449452e-05, + "loss": 0.6171, + "step": 9341 + }, + { + "epoch": 0.32, + "learning_rate": 1.526660863841657e-05, + "loss": 0.5997, + "step": 9342 + }, + { + "epoch": 0.32, + "learning_rate": 1.526568298994138e-05, + "loss": 0.6346, + "step": 9343 + }, + { + "epoch": 0.32, + "learning_rate": 1.5264757279034864e-05, + "loss": 0.6294, + "step": 9344 + }, + { + "epoch": 0.32, + "learning_rate": 1.5263831505707983e-05, + "loss": 0.6448, + "step": 9345 + }, + { + "epoch": 0.32, + "learning_rate": 1.5262905669971724e-05, + "loss": 0.6814, + "step": 9346 + }, + { + "epoch": 0.32, + "learning_rate": 1.526197977183706e-05, + "loss": 0.6075, + "step": 9347 + }, + { + "epoch": 0.32, + "learning_rate": 1.5261053811314967e-05, + "loss": 0.6397, + "step": 9348 + }, + { + "epoch": 0.32, + "learning_rate": 1.5260127788416428e-05, + "loss": 0.6576, + "step": 9349 + }, + { + "epoch": 0.32, + "learning_rate": 1.525920170315242e-05, + "loss": 0.6592, + "step": 9350 + }, + { + "epoch": 0.32, + "learning_rate": 1.5258275555533923e-05, + "loss": 0.6046, + "step": 9351 + }, + { + "epoch": 0.32, + "learning_rate": 1.5257349345571917e-05, + "loss": 0.6372, + "step": 9352 + }, + { + "epoch": 0.32, + "learning_rate": 1.5256423073277384e-05, + "loss": 0.6185, + "step": 9353 + }, + { + "epoch": 0.32, + "learning_rate": 1.5255496738661305e-05, + "loss": 0.6268, + "step": 9354 + }, + { + "epoch": 0.32, + "learning_rate": 1.5254570341734664e-05, + "loss": 0.6159, + "step": 9355 + }, + { + "epoch": 0.32, + "learning_rate": 1.5253643882508447e-05, + "loss": 0.595, + "step": 9356 + }, + { + "epoch": 0.32, + "learning_rate": 1.5252717360993635e-05, + "loss": 0.6025, + "step": 9357 + }, + { + "epoch": 0.32, + "learning_rate": 1.5251790777201211e-05, + "loss": 0.5851, + "step": 9358 + }, + { + "epoch": 0.32, + "learning_rate": 1.5250864131142169e-05, + "loss": 0.6327, + "step": 9359 + }, + { + "epoch": 0.32, + "learning_rate": 1.5249937422827486e-05, + "loss": 0.6213, + "step": 9360 + }, + { + "epoch": 0.32, + "learning_rate": 1.5249010652268155e-05, + "loss": 0.6101, + "step": 9361 + }, + { + "epoch": 0.32, + "learning_rate": 1.5248083819475163e-05, + "loss": 0.5986, + "step": 9362 + }, + { + "epoch": 0.32, + "learning_rate": 1.5247156924459499e-05, + "loss": 0.6173, + "step": 9363 + }, + { + "epoch": 0.32, + "learning_rate": 1.5246229967232151e-05, + "loss": 0.6795, + "step": 9364 + }, + { + "epoch": 0.32, + "learning_rate": 1.5245302947804113e-05, + "loss": 0.6485, + "step": 9365 + }, + { + "epoch": 0.32, + "learning_rate": 1.5244375866186367e-05, + "loss": 0.6434, + "step": 9366 + }, + { + "epoch": 0.32, + "learning_rate": 1.5243448722389915e-05, + "loss": 0.6291, + "step": 9367 + }, + { + "epoch": 0.32, + "learning_rate": 1.5242521516425748e-05, + "loss": 0.6168, + "step": 9368 + }, + { + "epoch": 0.32, + "learning_rate": 1.5241594248304852e-05, + "loss": 0.6151, + "step": 9369 + }, + { + "epoch": 0.32, + "learning_rate": 1.5240666918038227e-05, + "loss": 0.6205, + "step": 9370 + }, + { + "epoch": 0.32, + "learning_rate": 1.5239739525636866e-05, + "loss": 0.6525, + "step": 9371 + }, + { + "epoch": 0.32, + "learning_rate": 1.5238812071111767e-05, + "loss": 0.6977, + "step": 9372 + }, + { + "epoch": 0.32, + "learning_rate": 1.5237884554473918e-05, + "loss": 0.6289, + "step": 9373 + }, + { + "epoch": 0.32, + "learning_rate": 1.5236956975734328e-05, + "loss": 0.5968, + "step": 9374 + }, + { + "epoch": 0.32, + "learning_rate": 1.5236029334903983e-05, + "loss": 0.6393, + "step": 9375 + }, + { + "epoch": 0.32, + "learning_rate": 1.5235101631993891e-05, + "loss": 0.6216, + "step": 9376 + }, + { + "epoch": 0.32, + "learning_rate": 1.5234173867015046e-05, + "loss": 0.6956, + "step": 9377 + }, + { + "epoch": 0.32, + "learning_rate": 1.5233246039978447e-05, + "loss": 0.6204, + "step": 9378 + }, + { + "epoch": 0.32, + "learning_rate": 1.5232318150895095e-05, + "loss": 0.5522, + "step": 9379 + }, + { + "epoch": 0.32, + "learning_rate": 1.5231390199775997e-05, + "loss": 0.6534, + "step": 9380 + }, + { + "epoch": 0.33, + "learning_rate": 1.5230462186632147e-05, + "loss": 0.5782, + "step": 9381 + }, + { + "epoch": 0.33, + "learning_rate": 1.522953411147455e-05, + "loss": 0.6396, + "step": 9382 + }, + { + "epoch": 0.33, + "learning_rate": 1.5228605974314214e-05, + "loss": 0.5976, + "step": 9383 + }, + { + "epoch": 0.33, + "learning_rate": 1.5227677775162138e-05, + "loss": 0.6411, + "step": 9384 + }, + { + "epoch": 0.33, + "learning_rate": 1.5226749514029329e-05, + "loss": 0.6108, + "step": 9385 + }, + { + "epoch": 0.33, + "learning_rate": 1.5225821190926793e-05, + "loss": 0.6492, + "step": 9386 + }, + { + "epoch": 0.33, + "learning_rate": 1.5224892805865534e-05, + "loss": 0.6589, + "step": 9387 + }, + { + "epoch": 0.33, + "learning_rate": 1.5223964358856567e-05, + "loss": 0.7096, + "step": 9388 + }, + { + "epoch": 0.33, + "learning_rate": 1.522303584991089e-05, + "loss": 0.6469, + "step": 9389 + }, + { + "epoch": 0.33, + "learning_rate": 1.5222107279039513e-05, + "loss": 0.6965, + "step": 9390 + }, + { + "epoch": 0.33, + "learning_rate": 1.5221178646253454e-05, + "loss": 0.6008, + "step": 9391 + }, + { + "epoch": 0.33, + "learning_rate": 1.5220249951563714e-05, + "loss": 0.6579, + "step": 9392 + }, + { + "epoch": 0.33, + "learning_rate": 1.5219321194981307e-05, + "loss": 0.6628, + "step": 9393 + }, + { + "epoch": 0.33, + "learning_rate": 1.5218392376517248e-05, + "loss": 0.6208, + "step": 9394 + }, + { + "epoch": 0.33, + "learning_rate": 1.5217463496182543e-05, + "loss": 0.6451, + "step": 9395 + }, + { + "epoch": 0.33, + "learning_rate": 1.5216534553988206e-05, + "loss": 0.6245, + "step": 9396 + }, + { + "epoch": 0.33, + "learning_rate": 1.5215605549945261e-05, + "loss": 0.6604, + "step": 9397 + }, + { + "epoch": 0.33, + "learning_rate": 1.5214676484064707e-05, + "loss": 0.6367, + "step": 9398 + }, + { + "epoch": 0.33, + "learning_rate": 1.5213747356357569e-05, + "loss": 0.5502, + "step": 9399 + }, + { + "epoch": 0.33, + "learning_rate": 1.5212818166834859e-05, + "loss": 0.6618, + "step": 9400 + }, + { + "epoch": 0.33, + "learning_rate": 1.52118889155076e-05, + "loss": 0.6653, + "step": 9401 + }, + { + "epoch": 0.33, + "learning_rate": 1.5210959602386801e-05, + "loss": 0.6098, + "step": 9402 + }, + { + "epoch": 0.33, + "learning_rate": 1.5210030227483485e-05, + "loss": 0.7012, + "step": 9403 + }, + { + "epoch": 0.33, + "learning_rate": 1.520910079080867e-05, + "loss": 0.6329, + "step": 9404 + }, + { + "epoch": 0.33, + "learning_rate": 1.5208171292373375e-05, + "loss": 0.6477, + "step": 9405 + }, + { + "epoch": 0.33, + "learning_rate": 1.520724173218862e-05, + "loss": 0.6379, + "step": 9406 + }, + { + "epoch": 0.33, + "learning_rate": 1.520631211026543e-05, + "loss": 0.6963, + "step": 9407 + }, + { + "epoch": 0.33, + "learning_rate": 1.5205382426614821e-05, + "loss": 0.5887, + "step": 9408 + }, + { + "epoch": 0.33, + "learning_rate": 1.520445268124782e-05, + "loss": 0.6322, + "step": 9409 + }, + { + "epoch": 0.33, + "learning_rate": 1.5203522874175448e-05, + "loss": 0.5572, + "step": 9410 + }, + { + "epoch": 0.33, + "learning_rate": 1.520259300540873e-05, + "loss": 0.6034, + "step": 9411 + }, + { + "epoch": 0.33, + "learning_rate": 1.5201663074958695e-05, + "loss": 0.6132, + "step": 9412 + }, + { + "epoch": 0.33, + "learning_rate": 1.5200733082836356e-05, + "loss": 0.6829, + "step": 9413 + }, + { + "epoch": 0.33, + "learning_rate": 1.519980302905275e-05, + "loss": 0.6199, + "step": 9414 + }, + { + "epoch": 0.33, + "learning_rate": 1.5198872913618905e-05, + "loss": 0.6534, + "step": 9415 + }, + { + "epoch": 0.33, + "learning_rate": 1.5197942736545845e-05, + "loss": 0.6109, + "step": 9416 + }, + { + "epoch": 0.33, + "learning_rate": 1.5197012497844594e-05, + "loss": 0.67, + "step": 9417 + }, + { + "epoch": 0.33, + "learning_rate": 1.519608219752619e-05, + "loss": 0.652, + "step": 9418 + }, + { + "epoch": 0.33, + "learning_rate": 1.5195151835601656e-05, + "loss": 0.5577, + "step": 9419 + }, + { + "epoch": 0.33, + "learning_rate": 1.5194221412082024e-05, + "loss": 0.6446, + "step": 9420 + }, + { + "epoch": 0.33, + "learning_rate": 1.5193290926978331e-05, + "loss": 0.632, + "step": 9421 + }, + { + "epoch": 0.33, + "learning_rate": 1.51923603803016e-05, + "loss": 0.6234, + "step": 9422 + }, + { + "epoch": 0.33, + "learning_rate": 1.5191429772062867e-05, + "loss": 0.6538, + "step": 9423 + }, + { + "epoch": 0.33, + "learning_rate": 1.519049910227317e-05, + "loss": 0.65, + "step": 9424 + }, + { + "epoch": 0.33, + "learning_rate": 1.5189568370943541e-05, + "loss": 0.6546, + "step": 9425 + }, + { + "epoch": 0.33, + "learning_rate": 1.5188637578085011e-05, + "loss": 0.6284, + "step": 9426 + }, + { + "epoch": 0.33, + "learning_rate": 1.5187706723708621e-05, + "loss": 0.6734, + "step": 9427 + }, + { + "epoch": 0.33, + "learning_rate": 1.5186775807825407e-05, + "loss": 0.6786, + "step": 9428 + }, + { + "epoch": 0.33, + "learning_rate": 1.51858448304464e-05, + "loss": 0.6837, + "step": 9429 + }, + { + "epoch": 0.33, + "learning_rate": 1.5184913791582645e-05, + "loss": 0.6118, + "step": 9430 + }, + { + "epoch": 0.33, + "learning_rate": 1.518398269124518e-05, + "loss": 0.6043, + "step": 9431 + }, + { + "epoch": 0.33, + "learning_rate": 1.5183051529445038e-05, + "loss": 0.5735, + "step": 9432 + }, + { + "epoch": 0.33, + "learning_rate": 1.5182120306193269e-05, + "loss": 0.6286, + "step": 9433 + }, + { + "epoch": 0.33, + "learning_rate": 1.5181189021500906e-05, + "loss": 0.6817, + "step": 9434 + }, + { + "epoch": 0.33, + "learning_rate": 1.5180257675378988e-05, + "loss": 0.6365, + "step": 9435 + }, + { + "epoch": 0.33, + "learning_rate": 1.5179326267838567e-05, + "loss": 0.6547, + "step": 9436 + }, + { + "epoch": 0.33, + "learning_rate": 1.5178394798890682e-05, + "loss": 0.6574, + "step": 9437 + }, + { + "epoch": 0.33, + "learning_rate": 1.5177463268546374e-05, + "loss": 0.6089, + "step": 9438 + }, + { + "epoch": 0.33, + "learning_rate": 1.5176531676816688e-05, + "loss": 0.58, + "step": 9439 + }, + { + "epoch": 0.33, + "learning_rate": 1.5175600023712675e-05, + "loss": 0.6802, + "step": 9440 + }, + { + "epoch": 0.33, + "learning_rate": 1.5174668309245371e-05, + "loss": 0.6403, + "step": 9441 + }, + { + "epoch": 0.33, + "learning_rate": 1.5173736533425834e-05, + "loss": 0.6552, + "step": 9442 + }, + { + "epoch": 0.33, + "learning_rate": 1.5172804696265102e-05, + "loss": 0.6161, + "step": 9443 + }, + { + "epoch": 0.33, + "learning_rate": 1.5171872797774225e-05, + "loss": 0.6483, + "step": 9444 + }, + { + "epoch": 0.33, + "learning_rate": 1.5170940837964259e-05, + "loss": 0.6428, + "step": 9445 + }, + { + "epoch": 0.33, + "learning_rate": 1.5170008816846247e-05, + "loss": 0.6841, + "step": 9446 + }, + { + "epoch": 0.33, + "learning_rate": 1.5169076734431238e-05, + "loss": 0.6262, + "step": 9447 + }, + { + "epoch": 0.33, + "learning_rate": 1.5168144590730285e-05, + "loss": 0.6321, + "step": 9448 + }, + { + "epoch": 0.33, + "learning_rate": 1.5167212385754441e-05, + "loss": 0.6262, + "step": 9449 + }, + { + "epoch": 0.33, + "learning_rate": 1.5166280119514758e-05, + "loss": 0.6549, + "step": 9450 + }, + { + "epoch": 0.33, + "learning_rate": 1.5165347792022286e-05, + "loss": 0.6615, + "step": 9451 + }, + { + "epoch": 0.33, + "learning_rate": 1.5164415403288088e-05, + "loss": 0.6546, + "step": 9452 + }, + { + "epoch": 0.33, + "learning_rate": 1.5163482953323208e-05, + "loss": 0.6482, + "step": 9453 + }, + { + "epoch": 0.33, + "learning_rate": 1.5162550442138706e-05, + "loss": 0.6069, + "step": 9454 + }, + { + "epoch": 0.33, + "learning_rate": 1.5161617869745636e-05, + "loss": 0.6831, + "step": 9455 + }, + { + "epoch": 0.33, + "learning_rate": 1.516068523615506e-05, + "loss": 0.6085, + "step": 9456 + }, + { + "epoch": 0.33, + "learning_rate": 1.515975254137803e-05, + "loss": 0.68, + "step": 9457 + }, + { + "epoch": 0.33, + "learning_rate": 1.5158819785425612e-05, + "loss": 0.6499, + "step": 9458 + }, + { + "epoch": 0.33, + "learning_rate": 1.5157886968308852e-05, + "loss": 0.6163, + "step": 9459 + }, + { + "epoch": 0.33, + "learning_rate": 1.515695409003882e-05, + "loss": 0.6289, + "step": 9460 + }, + { + "epoch": 0.33, + "learning_rate": 1.5156021150626576e-05, + "loss": 0.6077, + "step": 9461 + }, + { + "epoch": 0.33, + "learning_rate": 1.5155088150083175e-05, + "loss": 0.5708, + "step": 9462 + }, + { + "epoch": 0.33, + "learning_rate": 1.5154155088419684e-05, + "loss": 0.6571, + "step": 9463 + }, + { + "epoch": 0.33, + "learning_rate": 1.5153221965647167e-05, + "loss": 0.6003, + "step": 9464 + }, + { + "epoch": 0.33, + "learning_rate": 1.5152288781776681e-05, + "loss": 0.663, + "step": 9465 + }, + { + "epoch": 0.33, + "learning_rate": 1.5151355536819296e-05, + "loss": 0.5954, + "step": 9466 + }, + { + "epoch": 0.33, + "learning_rate": 1.5150422230786075e-05, + "loss": 0.6301, + "step": 9467 + }, + { + "epoch": 0.33, + "learning_rate": 1.5149488863688082e-05, + "loss": 0.6541, + "step": 9468 + }, + { + "epoch": 0.33, + "learning_rate": 1.5148555435536386e-05, + "loss": 0.6727, + "step": 9469 + }, + { + "epoch": 0.33, + "learning_rate": 1.514762194634205e-05, + "loss": 0.6582, + "step": 9470 + }, + { + "epoch": 0.33, + "learning_rate": 1.5146688396116144e-05, + "loss": 0.666, + "step": 9471 + }, + { + "epoch": 0.33, + "learning_rate": 1.5145754784869737e-05, + "loss": 0.6291, + "step": 9472 + }, + { + "epoch": 0.33, + "learning_rate": 1.5144821112613901e-05, + "loss": 0.5997, + "step": 9473 + }, + { + "epoch": 0.33, + "learning_rate": 1.5143887379359696e-05, + "loss": 0.6027, + "step": 9474 + }, + { + "epoch": 0.33, + "learning_rate": 1.5142953585118205e-05, + "loss": 0.6381, + "step": 9475 + }, + { + "epoch": 0.33, + "learning_rate": 1.514201972990049e-05, + "loss": 0.5898, + "step": 9476 + }, + { + "epoch": 0.33, + "learning_rate": 1.5141085813717629e-05, + "loss": 0.6413, + "step": 9477 + }, + { + "epoch": 0.33, + "learning_rate": 1.514015183658069e-05, + "loss": 0.6826, + "step": 9478 + }, + { + "epoch": 0.33, + "learning_rate": 1.513921779850075e-05, + "loss": 0.6223, + "step": 9479 + }, + { + "epoch": 0.33, + "learning_rate": 1.513828369948888e-05, + "loss": 0.6809, + "step": 9480 + }, + { + "epoch": 0.33, + "learning_rate": 1.513734953955616e-05, + "loss": 0.5912, + "step": 9481 + }, + { + "epoch": 0.33, + "learning_rate": 1.513641531871366e-05, + "loss": 0.7068, + "step": 9482 + }, + { + "epoch": 0.33, + "learning_rate": 1.5135481036972457e-05, + "loss": 0.6273, + "step": 9483 + }, + { + "epoch": 0.33, + "learning_rate": 1.5134546694343635e-05, + "loss": 0.6226, + "step": 9484 + }, + { + "epoch": 0.33, + "learning_rate": 1.5133612290838262e-05, + "loss": 0.6416, + "step": 9485 + }, + { + "epoch": 0.33, + "learning_rate": 1.5132677826467421e-05, + "loss": 0.6602, + "step": 9486 + }, + { + "epoch": 0.33, + "learning_rate": 1.5131743301242196e-05, + "loss": 0.622, + "step": 9487 + }, + { + "epoch": 0.33, + "learning_rate": 1.5130808715173659e-05, + "loss": 0.6701, + "step": 9488 + }, + { + "epoch": 0.33, + "learning_rate": 1.5129874068272896e-05, + "loss": 0.6654, + "step": 9489 + }, + { + "epoch": 0.33, + "learning_rate": 1.5128939360550985e-05, + "loss": 0.6009, + "step": 9490 + }, + { + "epoch": 0.33, + "learning_rate": 1.512800459201901e-05, + "loss": 0.6294, + "step": 9491 + }, + { + "epoch": 0.33, + "learning_rate": 1.5127069762688056e-05, + "loss": 0.6223, + "step": 9492 + }, + { + "epoch": 0.33, + "learning_rate": 1.5126134872569202e-05, + "loss": 0.6903, + "step": 9493 + }, + { + "epoch": 0.33, + "learning_rate": 1.5125199921673534e-05, + "loss": 0.6854, + "step": 9494 + }, + { + "epoch": 0.33, + "learning_rate": 1.5124264910012139e-05, + "loss": 0.6295, + "step": 9495 + }, + { + "epoch": 0.33, + "learning_rate": 1.5123329837596101e-05, + "loss": 0.6235, + "step": 9496 + }, + { + "epoch": 0.33, + "learning_rate": 1.5122394704436505e-05, + "loss": 0.6625, + "step": 9497 + }, + { + "epoch": 0.33, + "learning_rate": 1.512145951054444e-05, + "loss": 0.5883, + "step": 9498 + }, + { + "epoch": 0.33, + "learning_rate": 1.5120524255930998e-05, + "loss": 0.6126, + "step": 9499 + }, + { + "epoch": 0.33, + "learning_rate": 1.511958894060726e-05, + "loss": 0.6061, + "step": 9500 + }, + { + "epoch": 0.33, + "learning_rate": 1.5118653564584318e-05, + "loss": 0.6304, + "step": 9501 + }, + { + "epoch": 0.33, + "learning_rate": 1.5117718127873264e-05, + "loss": 0.6322, + "step": 9502 + }, + { + "epoch": 0.33, + "learning_rate": 1.511678263048519e-05, + "loss": 0.617, + "step": 9503 + }, + { + "epoch": 0.33, + "learning_rate": 1.511584707243118e-05, + "loss": 0.6636, + "step": 9504 + }, + { + "epoch": 0.33, + "learning_rate": 1.5114911453722336e-05, + "loss": 0.6395, + "step": 9505 + }, + { + "epoch": 0.33, + "learning_rate": 1.5113975774369744e-05, + "loss": 0.6013, + "step": 9506 + }, + { + "epoch": 0.33, + "learning_rate": 1.5113040034384501e-05, + "loss": 0.6378, + "step": 9507 + }, + { + "epoch": 0.33, + "learning_rate": 1.51121042337777e-05, + "loss": 0.6162, + "step": 9508 + }, + { + "epoch": 0.33, + "learning_rate": 1.5111168372560436e-05, + "loss": 0.6945, + "step": 9509 + }, + { + "epoch": 0.33, + "learning_rate": 1.5110232450743806e-05, + "loss": 0.6893, + "step": 9510 + }, + { + "epoch": 0.33, + "learning_rate": 1.5109296468338906e-05, + "loss": 0.5834, + "step": 9511 + }, + { + "epoch": 0.33, + "learning_rate": 1.5108360425356834e-05, + "loss": 0.6633, + "step": 9512 + }, + { + "epoch": 0.33, + "learning_rate": 1.5107424321808684e-05, + "loss": 0.6432, + "step": 9513 + }, + { + "epoch": 0.33, + "learning_rate": 1.5106488157705558e-05, + "loss": 0.5838, + "step": 9514 + }, + { + "epoch": 0.33, + "learning_rate": 1.5105551933058558e-05, + "loss": 0.5578, + "step": 9515 + }, + { + "epoch": 0.33, + "learning_rate": 1.5104615647878778e-05, + "loss": 0.6147, + "step": 9516 + }, + { + "epoch": 0.33, + "learning_rate": 1.5103679302177327e-05, + "loss": 0.6041, + "step": 9517 + }, + { + "epoch": 0.33, + "learning_rate": 1.5102742895965299e-05, + "loss": 0.6021, + "step": 9518 + }, + { + "epoch": 0.33, + "learning_rate": 1.5101806429253795e-05, + "loss": 0.6538, + "step": 9519 + }, + { + "epoch": 0.33, + "learning_rate": 1.5100869902053927e-05, + "loss": 0.5898, + "step": 9520 + }, + { + "epoch": 0.33, + "learning_rate": 1.5099933314376793e-05, + "loss": 0.6778, + "step": 9521 + }, + { + "epoch": 0.33, + "learning_rate": 1.5098996666233497e-05, + "loss": 0.5752, + "step": 9522 + }, + { + "epoch": 0.33, + "learning_rate": 1.5098059957635145e-05, + "loss": 0.6617, + "step": 9523 + }, + { + "epoch": 0.33, + "learning_rate": 1.5097123188592844e-05, + "loss": 0.6522, + "step": 9524 + }, + { + "epoch": 0.33, + "learning_rate": 1.50961863591177e-05, + "loss": 0.6211, + "step": 9525 + }, + { + "epoch": 0.33, + "learning_rate": 1.5095249469220821e-05, + "loss": 0.638, + "step": 9526 + }, + { + "epoch": 0.33, + "learning_rate": 1.5094312518913312e-05, + "loss": 0.6425, + "step": 9527 + }, + { + "epoch": 0.33, + "learning_rate": 1.5093375508206282e-05, + "loss": 0.6217, + "step": 9528 + }, + { + "epoch": 0.33, + "learning_rate": 1.5092438437110846e-05, + "loss": 0.6881, + "step": 9529 + }, + { + "epoch": 0.33, + "learning_rate": 1.5091501305638107e-05, + "loss": 0.6465, + "step": 9530 + }, + { + "epoch": 0.33, + "learning_rate": 1.509056411379918e-05, + "loss": 0.6618, + "step": 9531 + }, + { + "epoch": 0.33, + "learning_rate": 1.508962686160518e-05, + "loss": 0.6242, + "step": 9532 + }, + { + "epoch": 0.33, + "learning_rate": 1.508868954906721e-05, + "loss": 0.5907, + "step": 9533 + }, + { + "epoch": 0.33, + "learning_rate": 1.508775217619639e-05, + "loss": 0.6012, + "step": 9534 + }, + { + "epoch": 0.33, + "learning_rate": 1.5086814743003833e-05, + "loss": 0.65, + "step": 9535 + }, + { + "epoch": 0.33, + "learning_rate": 1.508587724950065e-05, + "loss": 0.6322, + "step": 9536 + }, + { + "epoch": 0.33, + "learning_rate": 1.5084939695697962e-05, + "loss": 0.5988, + "step": 9537 + }, + { + "epoch": 0.33, + "learning_rate": 1.5084002081606878e-05, + "loss": 0.6992, + "step": 9538 + }, + { + "epoch": 0.33, + "learning_rate": 1.5083064407238524e-05, + "loss": 0.679, + "step": 9539 + }, + { + "epoch": 0.33, + "learning_rate": 1.5082126672604003e-05, + "loss": 0.6157, + "step": 9540 + }, + { + "epoch": 0.33, + "learning_rate": 1.5081188877714445e-05, + "loss": 0.6228, + "step": 9541 + }, + { + "epoch": 0.33, + "learning_rate": 1.5080251022580968e-05, + "loss": 0.6548, + "step": 9542 + }, + { + "epoch": 0.33, + "learning_rate": 1.5079313107214683e-05, + "loss": 0.6741, + "step": 9543 + }, + { + "epoch": 0.33, + "learning_rate": 1.5078375131626719e-05, + "loss": 0.6326, + "step": 9544 + }, + { + "epoch": 0.33, + "learning_rate": 1.5077437095828193e-05, + "loss": 0.6151, + "step": 9545 + }, + { + "epoch": 0.33, + "learning_rate": 1.5076498999830229e-05, + "loss": 0.6264, + "step": 9546 + }, + { + "epoch": 0.33, + "learning_rate": 1.5075560843643944e-05, + "loss": 0.5832, + "step": 9547 + }, + { + "epoch": 0.33, + "learning_rate": 1.507462262728047e-05, + "loss": 0.6465, + "step": 9548 + }, + { + "epoch": 0.33, + "learning_rate": 1.5073684350750921e-05, + "loss": 0.6397, + "step": 9549 + }, + { + "epoch": 0.33, + "learning_rate": 1.5072746014066427e-05, + "loss": 0.6626, + "step": 9550 + }, + { + "epoch": 0.33, + "learning_rate": 1.5071807617238112e-05, + "loss": 0.5935, + "step": 9551 + }, + { + "epoch": 0.33, + "learning_rate": 1.5070869160277099e-05, + "loss": 0.6904, + "step": 9552 + }, + { + "epoch": 0.33, + "learning_rate": 1.5069930643194521e-05, + "loss": 0.6426, + "step": 9553 + }, + { + "epoch": 0.33, + "learning_rate": 1.5068992066001503e-05, + "loss": 0.6975, + "step": 9554 + }, + { + "epoch": 0.33, + "learning_rate": 1.5068053428709165e-05, + "loss": 0.6426, + "step": 9555 + }, + { + "epoch": 0.33, + "learning_rate": 1.5067114731328647e-05, + "loss": 0.6234, + "step": 9556 + }, + { + "epoch": 0.33, + "learning_rate": 1.5066175973871076e-05, + "loss": 0.5986, + "step": 9557 + }, + { + "epoch": 0.33, + "learning_rate": 1.5065237156347578e-05, + "loss": 0.6045, + "step": 9558 + }, + { + "epoch": 0.33, + "learning_rate": 1.5064298278769285e-05, + "loss": 0.6424, + "step": 9559 + }, + { + "epoch": 0.33, + "learning_rate": 1.5063359341147332e-05, + "loss": 0.6383, + "step": 9560 + }, + { + "epoch": 0.33, + "learning_rate": 1.5062420343492846e-05, + "loss": 0.6186, + "step": 9561 + }, + { + "epoch": 0.33, + "learning_rate": 1.5061481285816963e-05, + "loss": 0.6245, + "step": 9562 + }, + { + "epoch": 0.33, + "learning_rate": 1.5060542168130818e-05, + "loss": 0.6472, + "step": 9563 + }, + { + "epoch": 0.33, + "learning_rate": 1.5059602990445543e-05, + "loss": 0.5976, + "step": 9564 + }, + { + "epoch": 0.33, + "learning_rate": 1.5058663752772274e-05, + "loss": 0.6281, + "step": 9565 + }, + { + "epoch": 0.33, + "learning_rate": 1.505772445512215e-05, + "loss": 0.6061, + "step": 9566 + }, + { + "epoch": 0.33, + "learning_rate": 1.5056785097506301e-05, + "loss": 0.646, + "step": 9567 + }, + { + "epoch": 0.33, + "learning_rate": 1.5055845679935868e-05, + "loss": 0.682, + "step": 9568 + }, + { + "epoch": 0.33, + "learning_rate": 1.5054906202421991e-05, + "loss": 0.69, + "step": 9569 + }, + { + "epoch": 0.33, + "learning_rate": 1.5053966664975806e-05, + "loss": 0.6716, + "step": 9570 + }, + { + "epoch": 0.33, + "learning_rate": 1.5053027067608452e-05, + "loss": 0.6794, + "step": 9571 + }, + { + "epoch": 0.33, + "learning_rate": 1.5052087410331071e-05, + "loss": 0.6297, + "step": 9572 + }, + { + "epoch": 0.33, + "learning_rate": 1.50511476931548e-05, + "loss": 0.5939, + "step": 9573 + }, + { + "epoch": 0.33, + "learning_rate": 1.5050207916090787e-05, + "loss": 0.6007, + "step": 9574 + }, + { + "epoch": 0.33, + "learning_rate": 1.5049268079150168e-05, + "loss": 0.6615, + "step": 9575 + }, + { + "epoch": 0.33, + "learning_rate": 1.5048328182344087e-05, + "loss": 0.6007, + "step": 9576 + }, + { + "epoch": 0.33, + "learning_rate": 1.5047388225683694e-05, + "loss": 0.6485, + "step": 9577 + }, + { + "epoch": 0.33, + "learning_rate": 1.5046448209180126e-05, + "loss": 0.5741, + "step": 9578 + }, + { + "epoch": 0.33, + "learning_rate": 1.5045508132844531e-05, + "loss": 0.6506, + "step": 9579 + }, + { + "epoch": 0.33, + "learning_rate": 1.5044567996688056e-05, + "loss": 0.6531, + "step": 9580 + }, + { + "epoch": 0.33, + "learning_rate": 1.5043627800721843e-05, + "loss": 0.7069, + "step": 9581 + }, + { + "epoch": 0.33, + "learning_rate": 1.5042687544957044e-05, + "loss": 0.6328, + "step": 9582 + }, + { + "epoch": 0.33, + "learning_rate": 1.5041747229404803e-05, + "loss": 0.6804, + "step": 9583 + }, + { + "epoch": 0.33, + "learning_rate": 1.5040806854076273e-05, + "loss": 0.6554, + "step": 9584 + }, + { + "epoch": 0.33, + "learning_rate": 1.5039866418982603e-05, + "loss": 0.6476, + "step": 9585 + }, + { + "epoch": 0.33, + "learning_rate": 1.5038925924134939e-05, + "loss": 0.6512, + "step": 9586 + }, + { + "epoch": 0.33, + "learning_rate": 1.5037985369544432e-05, + "loss": 0.6192, + "step": 9587 + }, + { + "epoch": 0.33, + "learning_rate": 1.5037044755222237e-05, + "loss": 0.6341, + "step": 9588 + }, + { + "epoch": 0.33, + "learning_rate": 1.5036104081179506e-05, + "loss": 0.627, + "step": 9589 + }, + { + "epoch": 0.33, + "learning_rate": 1.5035163347427389e-05, + "loss": 0.6454, + "step": 9590 + }, + { + "epoch": 0.33, + "learning_rate": 1.503422255397704e-05, + "loss": 0.6309, + "step": 9591 + }, + { + "epoch": 0.33, + "learning_rate": 1.5033281700839614e-05, + "loss": 0.6569, + "step": 9592 + }, + { + "epoch": 0.33, + "learning_rate": 1.5032340788026267e-05, + "loss": 0.6544, + "step": 9593 + }, + { + "epoch": 0.33, + "learning_rate": 1.5031399815548155e-05, + "loss": 0.6702, + "step": 9594 + }, + { + "epoch": 0.33, + "learning_rate": 1.5030458783416436e-05, + "loss": 0.6308, + "step": 9595 + }, + { + "epoch": 0.33, + "learning_rate": 1.502951769164226e-05, + "loss": 0.6047, + "step": 9596 + }, + { + "epoch": 0.33, + "learning_rate": 1.502857654023679e-05, + "loss": 0.5766, + "step": 9597 + }, + { + "epoch": 0.33, + "learning_rate": 1.5027635329211187e-05, + "loss": 0.5964, + "step": 9598 + }, + { + "epoch": 0.33, + "learning_rate": 1.5026694058576602e-05, + "loss": 0.5834, + "step": 9599 + }, + { + "epoch": 0.33, + "learning_rate": 1.5025752728344204e-05, + "loss": 0.6379, + "step": 9600 + }, + { + "epoch": 0.33, + "learning_rate": 1.502481133852515e-05, + "loss": 0.6613, + "step": 9601 + }, + { + "epoch": 0.33, + "learning_rate": 1.50238698891306e-05, + "loss": 0.6698, + "step": 9602 + }, + { + "epoch": 0.33, + "learning_rate": 1.5022928380171715e-05, + "loss": 0.5862, + "step": 9603 + }, + { + "epoch": 0.33, + "learning_rate": 1.5021986811659665e-05, + "loss": 0.608, + "step": 9604 + }, + { + "epoch": 0.33, + "learning_rate": 1.5021045183605605e-05, + "loss": 0.6368, + "step": 9605 + }, + { + "epoch": 0.33, + "learning_rate": 1.5020103496020704e-05, + "loss": 0.6252, + "step": 9606 + }, + { + "epoch": 0.33, + "learning_rate": 1.5019161748916125e-05, + "loss": 0.6265, + "step": 9607 + }, + { + "epoch": 0.33, + "learning_rate": 1.5018219942303036e-05, + "loss": 0.6213, + "step": 9608 + }, + { + "epoch": 0.33, + "learning_rate": 1.5017278076192598e-05, + "loss": 0.6622, + "step": 9609 + }, + { + "epoch": 0.33, + "learning_rate": 1.5016336150595984e-05, + "loss": 0.6479, + "step": 9610 + }, + { + "epoch": 0.33, + "learning_rate": 1.501539416552436e-05, + "loss": 0.6642, + "step": 9611 + }, + { + "epoch": 0.33, + "learning_rate": 1.5014452120988892e-05, + "loss": 0.6376, + "step": 9612 + }, + { + "epoch": 0.33, + "learning_rate": 1.501351001700075e-05, + "loss": 0.6492, + "step": 9613 + }, + { + "epoch": 0.33, + "learning_rate": 1.5012567853571107e-05, + "loss": 0.625, + "step": 9614 + }, + { + "epoch": 0.33, + "learning_rate": 1.5011625630711128e-05, + "loss": 0.6264, + "step": 9615 + }, + { + "epoch": 0.33, + "learning_rate": 1.5010683348431992e-05, + "loss": 0.6841, + "step": 9616 + }, + { + "epoch": 0.33, + "learning_rate": 1.5009741006744862e-05, + "loss": 0.6185, + "step": 9617 + }, + { + "epoch": 0.33, + "learning_rate": 1.5008798605660916e-05, + "loss": 0.6979, + "step": 9618 + }, + { + "epoch": 0.33, + "learning_rate": 1.5007856145191329e-05, + "loss": 0.5906, + "step": 9619 + }, + { + "epoch": 0.33, + "learning_rate": 1.500691362534727e-05, + "loss": 0.6479, + "step": 9620 + }, + { + "epoch": 0.33, + "learning_rate": 1.5005971046139915e-05, + "loss": 0.6666, + "step": 9621 + }, + { + "epoch": 0.33, + "learning_rate": 1.5005028407580443e-05, + "loss": 0.5868, + "step": 9622 + }, + { + "epoch": 0.33, + "learning_rate": 1.5004085709680027e-05, + "loss": 0.6342, + "step": 9623 + }, + { + "epoch": 0.33, + "learning_rate": 1.5003142952449845e-05, + "loss": 0.6242, + "step": 9624 + }, + { + "epoch": 0.33, + "learning_rate": 1.5002200135901075e-05, + "loss": 0.6748, + "step": 9625 + }, + { + "epoch": 0.33, + "learning_rate": 1.5001257260044892e-05, + "loss": 0.606, + "step": 9626 + }, + { + "epoch": 0.33, + "learning_rate": 1.500031432489248e-05, + "loss": 0.6427, + "step": 9627 + }, + { + "epoch": 0.33, + "learning_rate": 1.4999371330455017e-05, + "loss": 0.6953, + "step": 9628 + }, + { + "epoch": 0.33, + "learning_rate": 1.4998428276743679e-05, + "loss": 0.6525, + "step": 9629 + }, + { + "epoch": 0.33, + "learning_rate": 1.4997485163769652e-05, + "loss": 0.6556, + "step": 9630 + }, + { + "epoch": 0.33, + "learning_rate": 1.499654199154412e-05, + "loss": 0.6183, + "step": 9631 + }, + { + "epoch": 0.33, + "learning_rate": 1.4995598760078258e-05, + "loss": 0.6257, + "step": 9632 + }, + { + "epoch": 0.33, + "learning_rate": 1.4994655469383256e-05, + "loss": 0.648, + "step": 9633 + }, + { + "epoch": 0.33, + "learning_rate": 1.4993712119470294e-05, + "loss": 0.6158, + "step": 9634 + }, + { + "epoch": 0.33, + "learning_rate": 1.4992768710350558e-05, + "loss": 0.6619, + "step": 9635 + }, + { + "epoch": 0.33, + "learning_rate": 1.4991825242035232e-05, + "loss": 0.6417, + "step": 9636 + }, + { + "epoch": 0.33, + "learning_rate": 1.4990881714535504e-05, + "loss": 0.6677, + "step": 9637 + }, + { + "epoch": 0.33, + "learning_rate": 1.4989938127862558e-05, + "loss": 0.6462, + "step": 9638 + }, + { + "epoch": 0.33, + "learning_rate": 1.4988994482027587e-05, + "loss": 0.6453, + "step": 9639 + }, + { + "epoch": 0.33, + "learning_rate": 1.498805077704177e-05, + "loss": 0.611, + "step": 9640 + }, + { + "epoch": 0.33, + "learning_rate": 1.4987107012916307e-05, + "loss": 0.5948, + "step": 9641 + }, + { + "epoch": 0.33, + "learning_rate": 1.4986163189662377e-05, + "loss": 0.6242, + "step": 9642 + }, + { + "epoch": 0.33, + "learning_rate": 1.4985219307291177e-05, + "loss": 0.7034, + "step": 9643 + }, + { + "epoch": 0.33, + "learning_rate": 1.4984275365813895e-05, + "loss": 0.6165, + "step": 9644 + }, + { + "epoch": 0.33, + "learning_rate": 1.4983331365241724e-05, + "loss": 0.673, + "step": 9645 + }, + { + "epoch": 0.33, + "learning_rate": 1.4982387305585855e-05, + "loss": 0.7053, + "step": 9646 + }, + { + "epoch": 0.33, + "learning_rate": 1.4981443186857482e-05, + "loss": 0.6397, + "step": 9647 + }, + { + "epoch": 0.33, + "learning_rate": 1.49804990090678e-05, + "loss": 0.6804, + "step": 9648 + }, + { + "epoch": 0.33, + "learning_rate": 1.4979554772228e-05, + "loss": 0.6417, + "step": 9649 + }, + { + "epoch": 0.33, + "learning_rate": 1.497861047634928e-05, + "loss": 0.6332, + "step": 9650 + }, + { + "epoch": 0.33, + "learning_rate": 1.4977666121442835e-05, + "loss": 0.6448, + "step": 9651 + }, + { + "epoch": 0.33, + "learning_rate": 1.497672170751986e-05, + "loss": 0.6741, + "step": 9652 + }, + { + "epoch": 0.33, + "learning_rate": 1.4975777234591553e-05, + "loss": 0.6571, + "step": 9653 + }, + { + "epoch": 0.33, + "learning_rate": 1.4974832702669116e-05, + "loss": 0.5846, + "step": 9654 + }, + { + "epoch": 0.33, + "learning_rate": 1.4973888111763742e-05, + "loss": 0.6227, + "step": 9655 + }, + { + "epoch": 0.33, + "learning_rate": 1.497294346188663e-05, + "loss": 0.6647, + "step": 9656 + }, + { + "epoch": 0.33, + "learning_rate": 1.4971998753048986e-05, + "loss": 0.6125, + "step": 9657 + }, + { + "epoch": 0.33, + "learning_rate": 1.4971053985262005e-05, + "loss": 0.6173, + "step": 9658 + }, + { + "epoch": 0.33, + "learning_rate": 1.4970109158536892e-05, + "loss": 0.659, + "step": 9659 + }, + { + "epoch": 0.33, + "learning_rate": 1.496916427288485e-05, + "loss": 0.6388, + "step": 9660 + }, + { + "epoch": 0.33, + "learning_rate": 1.4968219328317076e-05, + "loss": 0.6203, + "step": 9661 + }, + { + "epoch": 0.33, + "learning_rate": 1.4967274324844776e-05, + "loss": 0.6646, + "step": 9662 + }, + { + "epoch": 0.33, + "learning_rate": 1.4966329262479158e-05, + "loss": 0.6426, + "step": 9663 + }, + { + "epoch": 0.33, + "learning_rate": 1.4965384141231425e-05, + "loss": 0.6573, + "step": 9664 + }, + { + "epoch": 0.33, + "learning_rate": 1.4964438961112777e-05, + "loss": 0.61, + "step": 9665 + }, + { + "epoch": 0.33, + "learning_rate": 1.496349372213443e-05, + "loss": 0.6441, + "step": 9666 + }, + { + "epoch": 0.33, + "learning_rate": 1.4962548424307586e-05, + "loss": 0.6465, + "step": 9667 + }, + { + "epoch": 0.33, + "learning_rate": 1.4961603067643449e-05, + "loss": 0.6254, + "step": 9668 + }, + { + "epoch": 0.34, + "learning_rate": 1.4960657652153234e-05, + "loss": 0.6888, + "step": 9669 + }, + { + "epoch": 0.34, + "learning_rate": 1.4959712177848146e-05, + "loss": 0.5963, + "step": 9670 + }, + { + "epoch": 0.34, + "learning_rate": 1.4958766644739396e-05, + "loss": 0.6593, + "step": 9671 + }, + { + "epoch": 0.34, + "learning_rate": 1.4957821052838195e-05, + "loss": 0.5854, + "step": 9672 + }, + { + "epoch": 0.34, + "learning_rate": 1.4956875402155755e-05, + "loss": 0.6429, + "step": 9673 + }, + { + "epoch": 0.34, + "learning_rate": 1.4955929692703283e-05, + "loss": 0.5908, + "step": 9674 + }, + { + "epoch": 0.34, + "learning_rate": 1.4954983924492e-05, + "loss": 0.6236, + "step": 9675 + }, + { + "epoch": 0.34, + "learning_rate": 1.4954038097533113e-05, + "loss": 0.6449, + "step": 9676 + }, + { + "epoch": 0.34, + "learning_rate": 1.4953092211837831e-05, + "loss": 0.6587, + "step": 9677 + }, + { + "epoch": 0.34, + "learning_rate": 1.4952146267417385e-05, + "loss": 0.586, + "step": 9678 + }, + { + "epoch": 0.34, + "learning_rate": 1.4951200264282977e-05, + "loss": 0.668, + "step": 9679 + }, + { + "epoch": 0.34, + "learning_rate": 1.4950254202445822e-05, + "loss": 0.6099, + "step": 9680 + }, + { + "epoch": 0.34, + "learning_rate": 1.4949308081917147e-05, + "loss": 0.6622, + "step": 9681 + }, + { + "epoch": 0.34, + "learning_rate": 1.4948361902708161e-05, + "loss": 0.669, + "step": 9682 + }, + { + "epoch": 0.34, + "learning_rate": 1.4947415664830085e-05, + "loss": 0.6325, + "step": 9683 + }, + { + "epoch": 0.34, + "learning_rate": 1.494646936829414e-05, + "loss": 0.6315, + "step": 9684 + }, + { + "epoch": 0.34, + "learning_rate": 1.4945523013111542e-05, + "loss": 0.6173, + "step": 9685 + }, + { + "epoch": 0.34, + "learning_rate": 1.494457659929351e-05, + "loss": 0.6118, + "step": 9686 + }, + { + "epoch": 0.34, + "learning_rate": 1.4943630126851272e-05, + "loss": 0.6288, + "step": 9687 + }, + { + "epoch": 0.34, + "learning_rate": 1.4942683595796043e-05, + "loss": 0.6556, + "step": 9688 + }, + { + "epoch": 0.34, + "learning_rate": 1.4941737006139045e-05, + "loss": 0.6252, + "step": 9689 + }, + { + "epoch": 0.34, + "learning_rate": 1.4940790357891509e-05, + "loss": 0.661, + "step": 9690 + }, + { + "epoch": 0.34, + "learning_rate": 1.493984365106465e-05, + "loss": 0.6013, + "step": 9691 + }, + { + "epoch": 0.34, + "learning_rate": 1.4938896885669694e-05, + "loss": 0.6687, + "step": 9692 + }, + { + "epoch": 0.34, + "learning_rate": 1.493795006171787e-05, + "loss": 0.5984, + "step": 9693 + }, + { + "epoch": 0.34, + "learning_rate": 1.4937003179220402e-05, + "loss": 0.6283, + "step": 9694 + }, + { + "epoch": 0.34, + "learning_rate": 1.4936056238188515e-05, + "loss": 0.6164, + "step": 9695 + }, + { + "epoch": 0.34, + "learning_rate": 1.4935109238633437e-05, + "loss": 0.5823, + "step": 9696 + }, + { + "epoch": 0.34, + "learning_rate": 1.4934162180566395e-05, + "loss": 0.6244, + "step": 9697 + }, + { + "epoch": 0.34, + "learning_rate": 1.493321506399862e-05, + "loss": 0.7202, + "step": 9698 + }, + { + "epoch": 0.34, + "learning_rate": 1.4932267888941338e-05, + "loss": 0.7007, + "step": 9699 + }, + { + "epoch": 0.34, + "learning_rate": 1.4931320655405785e-05, + "loss": 0.5885, + "step": 9700 + }, + { + "epoch": 0.34, + "learning_rate": 1.4930373363403184e-05, + "loss": 0.6518, + "step": 9701 + }, + { + "epoch": 0.34, + "learning_rate": 1.492942601294477e-05, + "loss": 0.5849, + "step": 9702 + }, + { + "epoch": 0.34, + "learning_rate": 1.4928478604041776e-05, + "loss": 0.6209, + "step": 9703 + }, + { + "epoch": 0.34, + "learning_rate": 1.4927531136705433e-05, + "loss": 0.6623, + "step": 9704 + }, + { + "epoch": 0.34, + "learning_rate": 1.4926583610946974e-05, + "loss": 0.6603, + "step": 9705 + }, + { + "epoch": 0.34, + "learning_rate": 1.4925636026777637e-05, + "loss": 0.6063, + "step": 9706 + }, + { + "epoch": 0.34, + "learning_rate": 1.492468838420865e-05, + "loss": 0.6411, + "step": 9707 + }, + { + "epoch": 0.34, + "learning_rate": 1.4923740683251255e-05, + "loss": 0.6238, + "step": 9708 + }, + { + "epoch": 0.34, + "learning_rate": 1.4922792923916687e-05, + "loss": 0.6547, + "step": 9709 + }, + { + "epoch": 0.34, + "learning_rate": 1.492184510621618e-05, + "loss": 0.6175, + "step": 9710 + }, + { + "epoch": 0.34, + "learning_rate": 1.4920897230160971e-05, + "loss": 0.639, + "step": 9711 + }, + { + "epoch": 0.34, + "learning_rate": 1.4919949295762304e-05, + "loss": 0.6006, + "step": 9712 + }, + { + "epoch": 0.34, + "learning_rate": 1.491900130303141e-05, + "loss": 0.623, + "step": 9713 + }, + { + "epoch": 0.34, + "learning_rate": 1.4918053251979535e-05, + "loss": 0.6377, + "step": 9714 + }, + { + "epoch": 0.34, + "learning_rate": 1.491710514261792e-05, + "loss": 0.6461, + "step": 9715 + }, + { + "epoch": 0.34, + "learning_rate": 1.49161569749578e-05, + "loss": 0.7113, + "step": 9716 + }, + { + "epoch": 0.34, + "learning_rate": 1.4915208749010421e-05, + "loss": 0.635, + "step": 9717 + }, + { + "epoch": 0.34, + "learning_rate": 1.4914260464787027e-05, + "loss": 0.6375, + "step": 9718 + }, + { + "epoch": 0.34, + "learning_rate": 1.4913312122298855e-05, + "loss": 0.5736, + "step": 9719 + }, + { + "epoch": 0.34, + "learning_rate": 1.4912363721557154e-05, + "loss": 0.7045, + "step": 9720 + }, + { + "epoch": 0.34, + "learning_rate": 1.4911415262573168e-05, + "loss": 0.6477, + "step": 9721 + }, + { + "epoch": 0.34, + "learning_rate": 1.4910466745358139e-05, + "loss": 0.653, + "step": 9722 + }, + { + "epoch": 0.34, + "learning_rate": 1.4909518169923316e-05, + "loss": 0.6612, + "step": 9723 + }, + { + "epoch": 0.34, + "learning_rate": 1.4908569536279944e-05, + "loss": 0.6164, + "step": 9724 + }, + { + "epoch": 0.34, + "learning_rate": 1.4907620844439272e-05, + "loss": 0.6305, + "step": 9725 + }, + { + "epoch": 0.34, + "learning_rate": 1.4906672094412546e-05, + "loss": 0.6005, + "step": 9726 + }, + { + "epoch": 0.34, + "learning_rate": 1.4905723286211013e-05, + "loss": 0.6395, + "step": 9727 + }, + { + "epoch": 0.34, + "learning_rate": 1.4904774419845928e-05, + "loss": 0.598, + "step": 9728 + }, + { + "epoch": 0.34, + "learning_rate": 1.4903825495328538e-05, + "loss": 0.6672, + "step": 9729 + }, + { + "epoch": 0.34, + "learning_rate": 1.490287651267009e-05, + "loss": 0.688, + "step": 9730 + }, + { + "epoch": 0.34, + "learning_rate": 1.490192747188184e-05, + "loss": 0.5966, + "step": 9731 + }, + { + "epoch": 0.34, + "learning_rate": 1.490097837297504e-05, + "loss": 0.6172, + "step": 9732 + }, + { + "epoch": 0.34, + "learning_rate": 1.4900029215960942e-05, + "loss": 0.6336, + "step": 9733 + }, + { + "epoch": 0.34, + "learning_rate": 1.4899080000850799e-05, + "loss": 0.6319, + "step": 9734 + }, + { + "epoch": 0.34, + "learning_rate": 1.4898130727655863e-05, + "loss": 0.5606, + "step": 9735 + }, + { + "epoch": 0.34, + "learning_rate": 1.4897181396387392e-05, + "loss": 0.6385, + "step": 9736 + }, + { + "epoch": 0.34, + "learning_rate": 1.489623200705664e-05, + "loss": 0.5649, + "step": 9737 + }, + { + "epoch": 0.34, + "learning_rate": 1.4895282559674869e-05, + "loss": 0.6452, + "step": 9738 + }, + { + "epoch": 0.34, + "learning_rate": 1.4894333054253325e-05, + "loss": 0.592, + "step": 9739 + }, + { + "epoch": 0.34, + "learning_rate": 1.4893383490803272e-05, + "loss": 0.6259, + "step": 9740 + }, + { + "epoch": 0.34, + "learning_rate": 1.4892433869335969e-05, + "loss": 0.6197, + "step": 9741 + }, + { + "epoch": 0.34, + "learning_rate": 1.4891484189862673e-05, + "loss": 0.5842, + "step": 9742 + }, + { + "epoch": 0.34, + "learning_rate": 1.4890534452394643e-05, + "loss": 0.6536, + "step": 9743 + }, + { + "epoch": 0.34, + "learning_rate": 1.4889584656943143e-05, + "loss": 0.6295, + "step": 9744 + }, + { + "epoch": 0.34, + "learning_rate": 1.4888634803519431e-05, + "loss": 0.6113, + "step": 9745 + }, + { + "epoch": 0.34, + "learning_rate": 1.4887684892134766e-05, + "loss": 0.5939, + "step": 9746 + }, + { + "epoch": 0.34, + "learning_rate": 1.4886734922800416e-05, + "loss": 0.6028, + "step": 9747 + }, + { + "epoch": 0.34, + "learning_rate": 1.4885784895527642e-05, + "loss": 0.6551, + "step": 9748 + }, + { + "epoch": 0.34, + "learning_rate": 1.4884834810327706e-05, + "loss": 0.6407, + "step": 9749 + }, + { + "epoch": 0.34, + "learning_rate": 1.4883884667211879e-05, + "loss": 0.6516, + "step": 9750 + }, + { + "epoch": 0.34, + "learning_rate": 1.4882934466191414e-05, + "loss": 0.619, + "step": 9751 + }, + { + "epoch": 0.34, + "learning_rate": 1.4881984207277589e-05, + "loss": 0.6203, + "step": 9752 + }, + { + "epoch": 0.34, + "learning_rate": 1.4881033890481664e-05, + "loss": 0.6866, + "step": 9753 + }, + { + "epoch": 0.34, + "learning_rate": 1.4880083515814906e-05, + "loss": 0.6385, + "step": 9754 + }, + { + "epoch": 0.34, + "learning_rate": 1.4879133083288587e-05, + "loss": 0.67, + "step": 9755 + }, + { + "epoch": 0.34, + "learning_rate": 1.4878182592913973e-05, + "loss": 0.586, + "step": 9756 + }, + { + "epoch": 0.34, + "learning_rate": 1.4877232044702335e-05, + "loss": 0.6252, + "step": 9757 + }, + { + "epoch": 0.34, + "learning_rate": 1.4876281438664934e-05, + "loss": 0.6189, + "step": 9758 + }, + { + "epoch": 0.34, + "learning_rate": 1.4875330774813055e-05, + "loss": 0.6101, + "step": 9759 + }, + { + "epoch": 0.34, + "learning_rate": 1.4874380053157961e-05, + "loss": 0.6112, + "step": 9760 + }, + { + "epoch": 0.34, + "learning_rate": 1.4873429273710924e-05, + "loss": 0.6159, + "step": 9761 + }, + { + "epoch": 0.34, + "learning_rate": 1.487247843648322e-05, + "loss": 0.5884, + "step": 9762 + }, + { + "epoch": 0.34, + "learning_rate": 1.4871527541486122e-05, + "loss": 0.6222, + "step": 9763 + }, + { + "epoch": 0.34, + "learning_rate": 1.4870576588730896e-05, + "loss": 0.6415, + "step": 9764 + }, + { + "epoch": 0.34, + "learning_rate": 1.4869625578228828e-05, + "loss": 0.6589, + "step": 9765 + }, + { + "epoch": 0.34, + "learning_rate": 1.4868674509991188e-05, + "loss": 0.6415, + "step": 9766 + }, + { + "epoch": 0.34, + "learning_rate": 1.486772338402925e-05, + "loss": 0.6508, + "step": 9767 + }, + { + "epoch": 0.34, + "learning_rate": 1.4866772200354298e-05, + "loss": 0.6447, + "step": 9768 + }, + { + "epoch": 0.34, + "learning_rate": 1.4865820958977603e-05, + "loss": 0.6224, + "step": 9769 + }, + { + "epoch": 0.34, + "learning_rate": 1.4864869659910444e-05, + "loss": 0.5935, + "step": 9770 + }, + { + "epoch": 0.34, + "learning_rate": 1.4863918303164103e-05, + "loss": 0.6199, + "step": 9771 + }, + { + "epoch": 0.34, + "learning_rate": 1.4862966888749859e-05, + "loss": 0.6077, + "step": 9772 + }, + { + "epoch": 0.34, + "learning_rate": 1.4862015416678985e-05, + "loss": 0.6437, + "step": 9773 + }, + { + "epoch": 0.34, + "learning_rate": 1.4861063886962774e-05, + "loss": 0.6134, + "step": 9774 + }, + { + "epoch": 0.34, + "learning_rate": 1.4860112299612499e-05, + "loss": 0.6437, + "step": 9775 + }, + { + "epoch": 0.34, + "learning_rate": 1.4859160654639441e-05, + "loss": 0.5943, + "step": 9776 + }, + { + "epoch": 0.34, + "learning_rate": 1.4858208952054893e-05, + "loss": 0.6009, + "step": 9777 + }, + { + "epoch": 0.34, + "learning_rate": 1.4857257191870132e-05, + "loss": 0.7042, + "step": 9778 + }, + { + "epoch": 0.34, + "learning_rate": 1.4856305374096435e-05, + "loss": 0.6642, + "step": 9779 + }, + { + "epoch": 0.34, + "learning_rate": 1.4855353498745102e-05, + "loss": 0.6209, + "step": 9780 + }, + { + "epoch": 0.34, + "learning_rate": 1.485440156582741e-05, + "loss": 0.5917, + "step": 9781 + }, + { + "epoch": 0.34, + "learning_rate": 1.485344957535464e-05, + "loss": 0.5827, + "step": 9782 + }, + { + "epoch": 0.34, + "learning_rate": 1.4852497527338094e-05, + "loss": 0.6099, + "step": 9783 + }, + { + "epoch": 0.34, + "learning_rate": 1.4851545421789048e-05, + "loss": 0.6215, + "step": 9784 + }, + { + "epoch": 0.34, + "learning_rate": 1.4850593258718793e-05, + "loss": 0.5637, + "step": 9785 + }, + { + "epoch": 0.34, + "learning_rate": 1.484964103813862e-05, + "loss": 0.6192, + "step": 9786 + }, + { + "epoch": 0.34, + "learning_rate": 1.4848688760059819e-05, + "loss": 0.6386, + "step": 9787 + }, + { + "epoch": 0.34, + "learning_rate": 1.4847736424493677e-05, + "loss": 0.6581, + "step": 9788 + }, + { + "epoch": 0.34, + "learning_rate": 1.4846784031451486e-05, + "loss": 0.6456, + "step": 9789 + }, + { + "epoch": 0.34, + "learning_rate": 1.4845831580944543e-05, + "loss": 0.6489, + "step": 9790 + }, + { + "epoch": 0.34, + "learning_rate": 1.4844879072984135e-05, + "loss": 0.6163, + "step": 9791 + }, + { + "epoch": 0.34, + "learning_rate": 1.4843926507581556e-05, + "loss": 0.6782, + "step": 9792 + }, + { + "epoch": 0.34, + "learning_rate": 1.4842973884748102e-05, + "loss": 0.631, + "step": 9793 + }, + { + "epoch": 0.34, + "learning_rate": 1.4842021204495065e-05, + "loss": 0.6368, + "step": 9794 + }, + { + "epoch": 0.34, + "learning_rate": 1.4841068466833742e-05, + "loss": 0.6468, + "step": 9795 + }, + { + "epoch": 0.34, + "learning_rate": 1.4840115671775428e-05, + "loss": 0.6078, + "step": 9796 + }, + { + "epoch": 0.34, + "learning_rate": 1.483916281933142e-05, + "loss": 0.6731, + "step": 9797 + }, + { + "epoch": 0.34, + "learning_rate": 1.4838209909513012e-05, + "loss": 0.6269, + "step": 9798 + }, + { + "epoch": 0.34, + "learning_rate": 1.4837256942331514e-05, + "loss": 0.6163, + "step": 9799 + }, + { + "epoch": 0.34, + "learning_rate": 1.4836303917798207e-05, + "loss": 0.6307, + "step": 9800 + }, + { + "epoch": 0.34, + "learning_rate": 1.48353508359244e-05, + "loss": 0.5507, + "step": 9801 + }, + { + "epoch": 0.34, + "learning_rate": 1.4834397696721396e-05, + "loss": 0.6993, + "step": 9802 + }, + { + "epoch": 0.34, + "learning_rate": 1.483344450020049e-05, + "loss": 0.6368, + "step": 9803 + }, + { + "epoch": 0.34, + "learning_rate": 1.4832491246372985e-05, + "loss": 0.5999, + "step": 9804 + }, + { + "epoch": 0.34, + "learning_rate": 1.4831537935250185e-05, + "loss": 0.6203, + "step": 9805 + }, + { + "epoch": 0.34, + "learning_rate": 1.4830584566843387e-05, + "loss": 0.6309, + "step": 9806 + }, + { + "epoch": 0.34, + "learning_rate": 1.48296311411639e-05, + "loss": 0.6172, + "step": 9807 + }, + { + "epoch": 0.34, + "learning_rate": 1.4828677658223028e-05, + "loss": 0.6496, + "step": 9808 + }, + { + "epoch": 0.34, + "learning_rate": 1.4827724118032074e-05, + "loss": 0.6364, + "step": 9809 + }, + { + "epoch": 0.34, + "learning_rate": 1.4826770520602341e-05, + "loss": 0.6546, + "step": 9810 + }, + { + "epoch": 0.34, + "learning_rate": 1.482581686594514e-05, + "loss": 0.6819, + "step": 9811 + }, + { + "epoch": 0.34, + "learning_rate": 1.4824863154071774e-05, + "loss": 0.6588, + "step": 9812 + }, + { + "epoch": 0.34, + "learning_rate": 1.482390938499355e-05, + "loss": 0.6, + "step": 9813 + }, + { + "epoch": 0.34, + "learning_rate": 1.482295555872178e-05, + "loss": 0.6456, + "step": 9814 + }, + { + "epoch": 0.34, + "learning_rate": 1.4822001675267772e-05, + "loss": 0.6362, + "step": 9815 + }, + { + "epoch": 0.34, + "learning_rate": 1.4821047734642833e-05, + "loss": 0.6577, + "step": 9816 + }, + { + "epoch": 0.34, + "learning_rate": 1.4820093736858274e-05, + "loss": 0.6391, + "step": 9817 + }, + { + "epoch": 0.34, + "learning_rate": 1.4819139681925408e-05, + "loss": 0.6909, + "step": 9818 + }, + { + "epoch": 0.34, + "learning_rate": 1.4818185569855541e-05, + "loss": 0.6151, + "step": 9819 + }, + { + "epoch": 0.34, + "learning_rate": 1.4817231400659995e-05, + "loss": 0.6735, + "step": 9820 + }, + { + "epoch": 0.34, + "learning_rate": 1.4816277174350071e-05, + "loss": 0.5816, + "step": 9821 + }, + { + "epoch": 0.34, + "learning_rate": 1.4815322890937091e-05, + "loss": 0.6338, + "step": 9822 + }, + { + "epoch": 0.34, + "learning_rate": 1.4814368550432368e-05, + "loss": 0.6367, + "step": 9823 + }, + { + "epoch": 0.34, + "learning_rate": 1.4813414152847213e-05, + "loss": 0.6253, + "step": 9824 + }, + { + "epoch": 0.34, + "learning_rate": 1.4812459698192947e-05, + "loss": 0.6251, + "step": 9825 + }, + { + "epoch": 0.34, + "learning_rate": 1.481150518648088e-05, + "loss": 0.6261, + "step": 9826 + }, + { + "epoch": 0.34, + "learning_rate": 1.4810550617722336e-05, + "loss": 0.6246, + "step": 9827 + }, + { + "epoch": 0.34, + "learning_rate": 1.4809595991928628e-05, + "loss": 0.6254, + "step": 9828 + }, + { + "epoch": 0.34, + "learning_rate": 1.4808641309111074e-05, + "loss": 0.6407, + "step": 9829 + }, + { + "epoch": 0.34, + "learning_rate": 1.4807686569280995e-05, + "loss": 0.6551, + "step": 9830 + }, + { + "epoch": 0.34, + "learning_rate": 1.4806731772449712e-05, + "loss": 0.6378, + "step": 9831 + }, + { + "epoch": 0.34, + "learning_rate": 1.480577691862854e-05, + "loss": 0.6582, + "step": 9832 + }, + { + "epoch": 0.34, + "learning_rate": 1.4804822007828805e-05, + "loss": 0.6875, + "step": 9833 + }, + { + "epoch": 0.34, + "learning_rate": 1.4803867040061828e-05, + "loss": 0.6292, + "step": 9834 + }, + { + "epoch": 0.34, + "learning_rate": 1.4802912015338928e-05, + "loss": 0.553, + "step": 9835 + }, + { + "epoch": 0.34, + "learning_rate": 1.480195693367143e-05, + "loss": 0.5683, + "step": 9836 + }, + { + "epoch": 0.34, + "learning_rate": 1.4801001795070661e-05, + "loss": 0.614, + "step": 9837 + }, + { + "epoch": 0.34, + "learning_rate": 1.4800046599547941e-05, + "loss": 0.548, + "step": 9838 + }, + { + "epoch": 0.34, + "learning_rate": 1.4799091347114595e-05, + "loss": 0.6669, + "step": 9839 + }, + { + "epoch": 0.34, + "learning_rate": 1.4798136037781954e-05, + "loss": 0.6467, + "step": 9840 + }, + { + "epoch": 0.34, + "learning_rate": 1.4797180671561337e-05, + "loss": 0.6347, + "step": 9841 + }, + { + "epoch": 0.34, + "learning_rate": 1.4796225248464073e-05, + "loss": 0.6694, + "step": 9842 + }, + { + "epoch": 0.34, + "learning_rate": 1.4795269768501496e-05, + "loss": 0.6744, + "step": 9843 + }, + { + "epoch": 0.34, + "learning_rate": 1.4794314231684927e-05, + "loss": 0.6322, + "step": 9844 + }, + { + "epoch": 0.34, + "learning_rate": 1.4793358638025699e-05, + "loss": 0.6414, + "step": 9845 + }, + { + "epoch": 0.34, + "learning_rate": 1.4792402987535144e-05, + "loss": 0.6129, + "step": 9846 + }, + { + "epoch": 0.34, + "learning_rate": 1.4791447280224585e-05, + "loss": 0.6299, + "step": 9847 + }, + { + "epoch": 0.34, + "learning_rate": 1.4790491516105356e-05, + "loss": 0.6229, + "step": 9848 + }, + { + "epoch": 0.34, + "learning_rate": 1.4789535695188795e-05, + "loss": 0.6395, + "step": 9849 + }, + { + "epoch": 0.34, + "learning_rate": 1.4788579817486226e-05, + "loss": 0.6161, + "step": 9850 + }, + { + "epoch": 0.34, + "learning_rate": 1.4787623883008986e-05, + "loss": 0.6327, + "step": 9851 + }, + { + "epoch": 0.34, + "learning_rate": 1.478666789176841e-05, + "loss": 0.62, + "step": 9852 + }, + { + "epoch": 0.34, + "learning_rate": 1.4785711843775828e-05, + "loss": 0.6543, + "step": 9853 + }, + { + "epoch": 0.34, + "learning_rate": 1.478475573904258e-05, + "loss": 0.6756, + "step": 9854 + }, + { + "epoch": 0.34, + "learning_rate": 1.4783799577580001e-05, + "loss": 0.5924, + "step": 9855 + }, + { + "epoch": 0.34, + "learning_rate": 1.4782843359399426e-05, + "loss": 0.5746, + "step": 9856 + }, + { + "epoch": 0.34, + "learning_rate": 1.478188708451219e-05, + "loss": 0.612, + "step": 9857 + }, + { + "epoch": 0.34, + "learning_rate": 1.4780930752929638e-05, + "loss": 0.634, + "step": 9858 + }, + { + "epoch": 0.34, + "learning_rate": 1.4779974364663101e-05, + "loss": 0.6128, + "step": 9859 + }, + { + "epoch": 0.34, + "learning_rate": 1.4779017919723919e-05, + "loss": 0.7026, + "step": 9860 + }, + { + "epoch": 0.34, + "learning_rate": 1.477806141812344e-05, + "loss": 0.6368, + "step": 9861 + }, + { + "epoch": 0.34, + "learning_rate": 1.4777104859872995e-05, + "loss": 0.6115, + "step": 9862 + }, + { + "epoch": 0.34, + "learning_rate": 1.4776148244983928e-05, + "loss": 0.6303, + "step": 9863 + }, + { + "epoch": 0.34, + "learning_rate": 1.4775191573467584e-05, + "loss": 0.6847, + "step": 9864 + }, + { + "epoch": 0.34, + "learning_rate": 1.4774234845335303e-05, + "loss": 0.5724, + "step": 9865 + }, + { + "epoch": 0.34, + "learning_rate": 1.4773278060598426e-05, + "loss": 0.6563, + "step": 9866 + }, + { + "epoch": 0.34, + "learning_rate": 1.4772321219268304e-05, + "loss": 0.6775, + "step": 9867 + }, + { + "epoch": 0.34, + "learning_rate": 1.4771364321356272e-05, + "loss": 0.6743, + "step": 9868 + }, + { + "epoch": 0.34, + "learning_rate": 1.4770407366873682e-05, + "loss": 0.6289, + "step": 9869 + }, + { + "epoch": 0.34, + "learning_rate": 1.4769450355831878e-05, + "loss": 0.6661, + "step": 9870 + }, + { + "epoch": 0.34, + "learning_rate": 1.4768493288242207e-05, + "loss": 0.6976, + "step": 9871 + }, + { + "epoch": 0.34, + "learning_rate": 1.4767536164116017e-05, + "loss": 0.6584, + "step": 9872 + }, + { + "epoch": 0.34, + "learning_rate": 1.4766578983464654e-05, + "loss": 0.6189, + "step": 9873 + }, + { + "epoch": 0.34, + "learning_rate": 1.4765621746299465e-05, + "loss": 0.6222, + "step": 9874 + }, + { + "epoch": 0.34, + "learning_rate": 1.4764664452631806e-05, + "loss": 0.6383, + "step": 9875 + }, + { + "epoch": 0.34, + "learning_rate": 1.4763707102473019e-05, + "loss": 0.6349, + "step": 9876 + }, + { + "epoch": 0.34, + "learning_rate": 1.476274969583446e-05, + "loss": 0.6371, + "step": 9877 + }, + { + "epoch": 0.34, + "learning_rate": 1.4761792232727477e-05, + "loss": 0.6011, + "step": 9878 + }, + { + "epoch": 0.34, + "learning_rate": 1.4760834713163426e-05, + "loss": 0.6435, + "step": 9879 + }, + { + "epoch": 0.34, + "learning_rate": 1.4759877137153653e-05, + "loss": 0.6341, + "step": 9880 + }, + { + "epoch": 0.34, + "learning_rate": 1.4758919504709517e-05, + "loss": 0.6621, + "step": 9881 + }, + { + "epoch": 0.34, + "learning_rate": 1.4757961815842372e-05, + "loss": 0.5841, + "step": 9882 + }, + { + "epoch": 0.34, + "learning_rate": 1.475700407056357e-05, + "loss": 0.6329, + "step": 9883 + }, + { + "epoch": 0.34, + "learning_rate": 1.4756046268884468e-05, + "loss": 0.6323, + "step": 9884 + }, + { + "epoch": 0.34, + "learning_rate": 1.4755088410816418e-05, + "loss": 0.5998, + "step": 9885 + }, + { + "epoch": 0.34, + "learning_rate": 1.4754130496370782e-05, + "loss": 0.6351, + "step": 9886 + }, + { + "epoch": 0.34, + "learning_rate": 1.4753172525558914e-05, + "loss": 0.6256, + "step": 9887 + }, + { + "epoch": 0.34, + "learning_rate": 1.4752214498392174e-05, + "loss": 0.6203, + "step": 9888 + }, + { + "epoch": 0.34, + "learning_rate": 1.4751256414881918e-05, + "loss": 0.6279, + "step": 9889 + }, + { + "epoch": 0.34, + "learning_rate": 1.4750298275039509e-05, + "loss": 0.6158, + "step": 9890 + }, + { + "epoch": 0.34, + "learning_rate": 1.4749340078876302e-05, + "loss": 0.6584, + "step": 9891 + }, + { + "epoch": 0.34, + "learning_rate": 1.4748381826403662e-05, + "loss": 0.5687, + "step": 9892 + }, + { + "epoch": 0.34, + "learning_rate": 1.474742351763295e-05, + "loss": 0.6637, + "step": 9893 + }, + { + "epoch": 0.34, + "learning_rate": 1.4746465152575524e-05, + "loss": 0.6316, + "step": 9894 + }, + { + "epoch": 0.34, + "learning_rate": 1.4745506731242748e-05, + "loss": 0.6731, + "step": 9895 + }, + { + "epoch": 0.34, + "learning_rate": 1.4744548253645992e-05, + "loss": 0.6013, + "step": 9896 + }, + { + "epoch": 0.34, + "learning_rate": 1.4743589719796612e-05, + "loss": 0.5539, + "step": 9897 + }, + { + "epoch": 0.34, + "learning_rate": 1.4742631129705974e-05, + "loss": 0.6044, + "step": 9898 + }, + { + "epoch": 0.34, + "learning_rate": 1.4741672483385445e-05, + "loss": 0.6121, + "step": 9899 + }, + { + "epoch": 0.34, + "learning_rate": 1.4740713780846392e-05, + "loss": 0.641, + "step": 9900 + }, + { + "epoch": 0.34, + "learning_rate": 1.4739755022100176e-05, + "loss": 0.7026, + "step": 9901 + }, + { + "epoch": 0.34, + "learning_rate": 1.4738796207158175e-05, + "loss": 0.6224, + "step": 9902 + }, + { + "epoch": 0.34, + "learning_rate": 1.4737837336031744e-05, + "loss": 0.5836, + "step": 9903 + }, + { + "epoch": 0.34, + "learning_rate": 1.4736878408732263e-05, + "loss": 0.6135, + "step": 9904 + }, + { + "epoch": 0.34, + "learning_rate": 1.4735919425271093e-05, + "loss": 0.633, + "step": 9905 + }, + { + "epoch": 0.34, + "learning_rate": 1.4734960385659608e-05, + "loss": 0.6398, + "step": 9906 + }, + { + "epoch": 0.34, + "learning_rate": 1.4734001289909179e-05, + "loss": 0.6633, + "step": 9907 + }, + { + "epoch": 0.34, + "learning_rate": 1.4733042138031175e-05, + "loss": 0.6397, + "step": 9908 + }, + { + "epoch": 0.34, + "learning_rate": 1.4732082930036968e-05, + "loss": 0.6258, + "step": 9909 + }, + { + "epoch": 0.34, + "learning_rate": 1.4731123665937937e-05, + "loss": 0.619, + "step": 9910 + }, + { + "epoch": 0.34, + "learning_rate": 1.4730164345745444e-05, + "loss": 0.6204, + "step": 9911 + }, + { + "epoch": 0.34, + "learning_rate": 1.4729204969470869e-05, + "loss": 0.6627, + "step": 9912 + }, + { + "epoch": 0.34, + "learning_rate": 1.4728245537125591e-05, + "loss": 0.5899, + "step": 9913 + }, + { + "epoch": 0.34, + "learning_rate": 1.472728604872098e-05, + "loss": 0.6381, + "step": 9914 + }, + { + "epoch": 0.34, + "learning_rate": 1.4726326504268412e-05, + "loss": 0.6489, + "step": 9915 + }, + { + "epoch": 0.34, + "learning_rate": 1.4725366903779264e-05, + "loss": 0.6137, + "step": 9916 + }, + { + "epoch": 0.34, + "learning_rate": 1.4724407247264911e-05, + "loss": 0.6524, + "step": 9917 + }, + { + "epoch": 0.34, + "learning_rate": 1.4723447534736738e-05, + "loss": 0.6513, + "step": 9918 + }, + { + "epoch": 0.34, + "learning_rate": 1.4722487766206117e-05, + "loss": 0.6484, + "step": 9919 + }, + { + "epoch": 0.34, + "learning_rate": 1.472152794168443e-05, + "loss": 0.6329, + "step": 9920 + }, + { + "epoch": 0.34, + "learning_rate": 1.4720568061183058e-05, + "loss": 0.5981, + "step": 9921 + }, + { + "epoch": 0.34, + "learning_rate": 1.4719608124713378e-05, + "loss": 0.6175, + "step": 9922 + }, + { + "epoch": 0.34, + "learning_rate": 1.4718648132286773e-05, + "loss": 0.6434, + "step": 9923 + }, + { + "epoch": 0.34, + "learning_rate": 1.4717688083914628e-05, + "loss": 0.659, + "step": 9924 + }, + { + "epoch": 0.34, + "learning_rate": 1.4716727979608321e-05, + "loss": 0.6441, + "step": 9925 + }, + { + "epoch": 0.34, + "learning_rate": 1.4715767819379236e-05, + "loss": 0.6059, + "step": 9926 + }, + { + "epoch": 0.34, + "learning_rate": 1.4714807603238762e-05, + "loss": 0.6485, + "step": 9927 + }, + { + "epoch": 0.34, + "learning_rate": 1.4713847331198276e-05, + "loss": 0.6839, + "step": 9928 + }, + { + "epoch": 0.34, + "learning_rate": 1.4712887003269165e-05, + "loss": 0.6023, + "step": 9929 + }, + { + "epoch": 0.34, + "learning_rate": 1.4711926619462821e-05, + "loss": 0.6645, + "step": 9930 + }, + { + "epoch": 0.34, + "learning_rate": 1.4710966179790624e-05, + "loss": 0.6435, + "step": 9931 + }, + { + "epoch": 0.34, + "learning_rate": 1.4710005684263966e-05, + "loss": 0.6357, + "step": 9932 + }, + { + "epoch": 0.34, + "learning_rate": 1.470904513289423e-05, + "loss": 0.5675, + "step": 9933 + }, + { + "epoch": 0.34, + "learning_rate": 1.4708084525692808e-05, + "loss": 0.6611, + "step": 9934 + }, + { + "epoch": 0.34, + "learning_rate": 1.470712386267109e-05, + "loss": 0.6291, + "step": 9935 + }, + { + "epoch": 0.34, + "learning_rate": 1.4706163143840462e-05, + "loss": 0.6493, + "step": 9936 + }, + { + "epoch": 0.34, + "learning_rate": 1.4705202369212315e-05, + "loss": 0.6555, + "step": 9937 + }, + { + "epoch": 0.34, + "learning_rate": 1.4704241538798043e-05, + "loss": 0.6278, + "step": 9938 + }, + { + "epoch": 0.34, + "learning_rate": 1.4703280652609037e-05, + "loss": 0.6531, + "step": 9939 + }, + { + "epoch": 0.34, + "learning_rate": 1.4702319710656689e-05, + "loss": 0.6191, + "step": 9940 + }, + { + "epoch": 0.34, + "learning_rate": 1.4701358712952393e-05, + "loss": 0.6742, + "step": 9941 + }, + { + "epoch": 0.34, + "learning_rate": 1.4700397659507543e-05, + "loss": 0.6177, + "step": 9942 + }, + { + "epoch": 0.34, + "learning_rate": 1.4699436550333532e-05, + "loss": 0.5482, + "step": 9943 + }, + { + "epoch": 0.34, + "learning_rate": 1.4698475385441755e-05, + "loss": 0.6526, + "step": 9944 + }, + { + "epoch": 0.34, + "learning_rate": 1.4697514164843609e-05, + "loss": 0.641, + "step": 9945 + }, + { + "epoch": 0.34, + "learning_rate": 1.469655288855049e-05, + "loss": 0.6531, + "step": 9946 + }, + { + "epoch": 0.34, + "learning_rate": 1.4695591556573797e-05, + "loss": 0.6713, + "step": 9947 + }, + { + "epoch": 0.34, + "learning_rate": 1.4694630168924926e-05, + "loss": 0.626, + "step": 9948 + }, + { + "epoch": 0.34, + "learning_rate": 1.4693668725615272e-05, + "loss": 0.639, + "step": 9949 + }, + { + "epoch": 0.34, + "learning_rate": 1.469270722665624e-05, + "loss": 0.7042, + "step": 9950 + }, + { + "epoch": 0.34, + "learning_rate": 1.469174567205923e-05, + "loss": 0.6308, + "step": 9951 + }, + { + "epoch": 0.34, + "learning_rate": 1.4690784061835638e-05, + "loss": 0.6198, + "step": 9952 + }, + { + "epoch": 0.34, + "learning_rate": 1.4689822395996864e-05, + "loss": 0.6339, + "step": 9953 + }, + { + "epoch": 0.34, + "learning_rate": 1.4688860674554317e-05, + "loss": 0.6036, + "step": 9954 + }, + { + "epoch": 0.34, + "learning_rate": 1.4687898897519394e-05, + "loss": 0.6941, + "step": 9955 + }, + { + "epoch": 0.34, + "learning_rate": 1.46869370649035e-05, + "loss": 0.6411, + "step": 9956 + }, + { + "epoch": 0.34, + "learning_rate": 1.4685975176718037e-05, + "loss": 0.6254, + "step": 9957 + }, + { + "epoch": 0.35, + "learning_rate": 1.468501323297441e-05, + "loss": 0.5907, + "step": 9958 + }, + { + "epoch": 0.35, + "learning_rate": 1.4684051233684025e-05, + "loss": 0.6272, + "step": 9959 + }, + { + "epoch": 0.35, + "learning_rate": 1.4683089178858288e-05, + "loss": 0.6849, + "step": 9960 + }, + { + "epoch": 0.35, + "learning_rate": 1.4682127068508604e-05, + "loss": 0.6365, + "step": 9961 + }, + { + "epoch": 0.35, + "learning_rate": 1.468116490264638e-05, + "loss": 0.7223, + "step": 9962 + }, + { + "epoch": 0.35, + "learning_rate": 1.4680202681283027e-05, + "loss": 0.6494, + "step": 9963 + }, + { + "epoch": 0.35, + "learning_rate": 1.467924040442995e-05, + "loss": 0.6024, + "step": 9964 + }, + { + "epoch": 0.35, + "learning_rate": 1.4678278072098555e-05, + "loss": 0.648, + "step": 9965 + }, + { + "epoch": 0.35, + "learning_rate": 1.467731568430026e-05, + "loss": 0.6236, + "step": 9966 + }, + { + "epoch": 0.35, + "learning_rate": 1.4676353241046468e-05, + "loss": 0.6064, + "step": 9967 + }, + { + "epoch": 0.35, + "learning_rate": 1.4675390742348592e-05, + "loss": 0.6481, + "step": 9968 + }, + { + "epoch": 0.35, + "learning_rate": 1.4674428188218049e-05, + "loss": 0.5998, + "step": 9969 + }, + { + "epoch": 0.35, + "learning_rate": 1.4673465578666242e-05, + "loss": 0.678, + "step": 9970 + }, + { + "epoch": 0.35, + "learning_rate": 1.4672502913704589e-05, + "loss": 0.6292, + "step": 9971 + }, + { + "epoch": 0.35, + "learning_rate": 1.4671540193344507e-05, + "loss": 0.6227, + "step": 9972 + }, + { + "epoch": 0.35, + "learning_rate": 1.4670577417597403e-05, + "loss": 0.6468, + "step": 9973 + }, + { + "epoch": 0.35, + "learning_rate": 1.4669614586474694e-05, + "loss": 0.6949, + "step": 9974 + }, + { + "epoch": 0.35, + "learning_rate": 1.4668651699987802e-05, + "loss": 0.6386, + "step": 9975 + }, + { + "epoch": 0.35, + "learning_rate": 1.4667688758148134e-05, + "loss": 0.6379, + "step": 9976 + }, + { + "epoch": 0.35, + "learning_rate": 1.4666725760967115e-05, + "loss": 0.5971, + "step": 9977 + }, + { + "epoch": 0.35, + "learning_rate": 1.4665762708456155e-05, + "loss": 0.6611, + "step": 9978 + }, + { + "epoch": 0.35, + "learning_rate": 1.4664799600626678e-05, + "loss": 0.6519, + "step": 9979 + }, + { + "epoch": 0.35, + "learning_rate": 1.46638364374901e-05, + "loss": 0.613, + "step": 9980 + }, + { + "epoch": 0.35, + "learning_rate": 1.466287321905784e-05, + "loss": 0.6184, + "step": 9981 + }, + { + "epoch": 0.35, + "learning_rate": 1.4661909945341321e-05, + "loss": 0.6473, + "step": 9982 + }, + { + "epoch": 0.35, + "learning_rate": 1.4660946616351964e-05, + "loss": 0.6248, + "step": 9983 + }, + { + "epoch": 0.35, + "learning_rate": 1.4659983232101185e-05, + "loss": 0.6371, + "step": 9984 + }, + { + "epoch": 0.35, + "learning_rate": 1.4659019792600411e-05, + "loss": 0.6531, + "step": 9985 + }, + { + "epoch": 0.35, + "learning_rate": 1.4658056297861065e-05, + "loss": 0.6715, + "step": 9986 + }, + { + "epoch": 0.35, + "learning_rate": 1.4657092747894568e-05, + "loss": 0.6352, + "step": 9987 + }, + { + "epoch": 0.35, + "learning_rate": 1.4656129142712346e-05, + "loss": 0.5826, + "step": 9988 + }, + { + "epoch": 0.35, + "learning_rate": 1.4655165482325821e-05, + "loss": 0.6761, + "step": 9989 + }, + { + "epoch": 0.35, + "learning_rate": 1.4654201766746422e-05, + "loss": 0.7039, + "step": 9990 + }, + { + "epoch": 0.35, + "learning_rate": 1.4653237995985572e-05, + "loss": 0.6376, + "step": 9991 + }, + { + "epoch": 0.35, + "learning_rate": 1.4652274170054703e-05, + "loss": 0.6207, + "step": 9992 + }, + { + "epoch": 0.35, + "learning_rate": 1.4651310288965235e-05, + "loss": 0.5697, + "step": 9993 + }, + { + "epoch": 0.35, + "learning_rate": 1.4650346352728599e-05, + "loss": 0.6231, + "step": 9994 + }, + { + "epoch": 0.35, + "learning_rate": 1.4649382361356229e-05, + "loss": 0.6809, + "step": 9995 + }, + { + "epoch": 0.35, + "learning_rate": 1.4648418314859546e-05, + "loss": 0.611, + "step": 9996 + }, + { + "epoch": 0.35, + "learning_rate": 1.4647454213249983e-05, + "loss": 0.6764, + "step": 9997 + }, + { + "epoch": 0.35, + "learning_rate": 1.4646490056538974e-05, + "loss": 0.7005, + "step": 9998 + }, + { + "epoch": 0.35, + "learning_rate": 1.4645525844737944e-05, + "loss": 0.6246, + "step": 9999 + }, + { + "epoch": 0.35, + "learning_rate": 1.464456157785833e-05, + "loss": 0.6288, + "step": 10000 + }, + { + "epoch": 0.35, + "learning_rate": 1.4643597255911564e-05, + "loss": 0.6672, + "step": 10001 + }, + { + "epoch": 0.35, + "learning_rate": 1.4642632878909078e-05, + "loss": 0.623, + "step": 10002 + }, + { + "epoch": 0.35, + "learning_rate": 1.4641668446862304e-05, + "loss": 0.6369, + "step": 10003 + }, + { + "epoch": 0.35, + "learning_rate": 1.4640703959782682e-05, + "loss": 0.6539, + "step": 10004 + }, + { + "epoch": 0.35, + "learning_rate": 1.4639739417681643e-05, + "loss": 0.6407, + "step": 10005 + }, + { + "epoch": 0.35, + "learning_rate": 1.4638774820570625e-05, + "loss": 0.5602, + "step": 10006 + }, + { + "epoch": 0.35, + "learning_rate": 1.4637810168461062e-05, + "loss": 0.7274, + "step": 10007 + }, + { + "epoch": 0.35, + "learning_rate": 1.4636845461364396e-05, + "loss": 0.6346, + "step": 10008 + }, + { + "epoch": 0.35, + "learning_rate": 1.4635880699292053e-05, + "loss": 0.6309, + "step": 10009 + }, + { + "epoch": 0.35, + "learning_rate": 1.4634915882255486e-05, + "loss": 0.6171, + "step": 10010 + }, + { + "epoch": 0.35, + "learning_rate": 1.463395101026613e-05, + "loss": 0.584, + "step": 10011 + }, + { + "epoch": 0.35, + "learning_rate": 1.4632986083335417e-05, + "loss": 0.6473, + "step": 10012 + }, + { + "epoch": 0.35, + "learning_rate": 1.4632021101474798e-05, + "loss": 0.6206, + "step": 10013 + }, + { + "epoch": 0.35, + "learning_rate": 1.4631056064695708e-05, + "loss": 0.6511, + "step": 10014 + }, + { + "epoch": 0.35, + "learning_rate": 1.4630090973009588e-05, + "loss": 0.6317, + "step": 10015 + }, + { + "epoch": 0.35, + "learning_rate": 1.4629125826427883e-05, + "loss": 0.599, + "step": 10016 + }, + { + "epoch": 0.35, + "learning_rate": 1.462816062496204e-05, + "loss": 0.6705, + "step": 10017 + }, + { + "epoch": 0.35, + "learning_rate": 1.462719536862349e-05, + "loss": 0.6891, + "step": 10018 + }, + { + "epoch": 0.35, + "learning_rate": 1.4626230057423692e-05, + "loss": 0.6033, + "step": 10019 + }, + { + "epoch": 0.35, + "learning_rate": 1.4625264691374084e-05, + "loss": 0.6575, + "step": 10020 + }, + { + "epoch": 0.35, + "learning_rate": 1.4624299270486106e-05, + "loss": 0.5686, + "step": 10021 + }, + { + "epoch": 0.35, + "learning_rate": 1.4623333794771217e-05, + "loss": 0.6304, + "step": 10022 + }, + { + "epoch": 0.35, + "learning_rate": 1.4622368264240859e-05, + "loss": 0.6323, + "step": 10023 + }, + { + "epoch": 0.35, + "learning_rate": 1.462140267890647e-05, + "loss": 0.6793, + "step": 10024 + }, + { + "epoch": 0.35, + "learning_rate": 1.462043703877951e-05, + "loss": 0.6523, + "step": 10025 + }, + { + "epoch": 0.35, + "learning_rate": 1.4619471343871428e-05, + "loss": 0.6321, + "step": 10026 + }, + { + "epoch": 0.35, + "learning_rate": 1.4618505594193661e-05, + "loss": 0.6581, + "step": 10027 + }, + { + "epoch": 0.35, + "learning_rate": 1.4617539789757676e-05, + "loss": 0.6506, + "step": 10028 + }, + { + "epoch": 0.35, + "learning_rate": 1.4616573930574913e-05, + "loss": 0.5897, + "step": 10029 + }, + { + "epoch": 0.35, + "learning_rate": 1.4615608016656823e-05, + "loss": 0.7071, + "step": 10030 + }, + { + "epoch": 0.35, + "learning_rate": 1.4614642048014864e-05, + "loss": 0.6471, + "step": 10031 + }, + { + "epoch": 0.35, + "learning_rate": 1.4613676024660488e-05, + "loss": 0.6842, + "step": 10032 + }, + { + "epoch": 0.35, + "learning_rate": 1.4612709946605139e-05, + "loss": 0.6356, + "step": 10033 + }, + { + "epoch": 0.35, + "learning_rate": 1.4611743813860285e-05, + "loss": 0.6502, + "step": 10034 + }, + { + "epoch": 0.35, + "learning_rate": 1.4610777626437373e-05, + "loss": 0.6471, + "step": 10035 + }, + { + "epoch": 0.35, + "learning_rate": 1.4609811384347858e-05, + "loss": 0.6052, + "step": 10036 + }, + { + "epoch": 0.35, + "learning_rate": 1.4608845087603198e-05, + "loss": 0.6033, + "step": 10037 + }, + { + "epoch": 0.35, + "learning_rate": 1.4607878736214854e-05, + "loss": 0.6504, + "step": 10038 + }, + { + "epoch": 0.35, + "learning_rate": 1.4606912330194272e-05, + "loss": 0.5833, + "step": 10039 + }, + { + "epoch": 0.35, + "learning_rate": 1.460594586955292e-05, + "loss": 0.5938, + "step": 10040 + }, + { + "epoch": 0.35, + "learning_rate": 1.4604979354302251e-05, + "loss": 0.6515, + "step": 10041 + }, + { + "epoch": 0.35, + "learning_rate": 1.4604012784453727e-05, + "loss": 0.638, + "step": 10042 + }, + { + "epoch": 0.35, + "learning_rate": 1.4603046160018808e-05, + "loss": 0.6554, + "step": 10043 + }, + { + "epoch": 0.35, + "learning_rate": 1.4602079481008955e-05, + "loss": 0.6333, + "step": 10044 + }, + { + "epoch": 0.35, + "learning_rate": 1.4601112747435626e-05, + "loss": 0.6262, + "step": 10045 + }, + { + "epoch": 0.35, + "learning_rate": 1.4600145959310286e-05, + "loss": 0.5912, + "step": 10046 + }, + { + "epoch": 0.35, + "learning_rate": 1.4599179116644397e-05, + "loss": 0.6217, + "step": 10047 + }, + { + "epoch": 0.35, + "learning_rate": 1.4598212219449421e-05, + "loss": 0.6036, + "step": 10048 + }, + { + "epoch": 0.35, + "learning_rate": 1.4597245267736821e-05, + "loss": 0.6861, + "step": 10049 + }, + { + "epoch": 0.35, + "learning_rate": 1.4596278261518066e-05, + "loss": 0.6415, + "step": 10050 + }, + { + "epoch": 0.35, + "learning_rate": 1.4595311200804616e-05, + "loss": 0.6703, + "step": 10051 + }, + { + "epoch": 0.35, + "learning_rate": 1.4594344085607937e-05, + "loss": 0.5677, + "step": 10052 + }, + { + "epoch": 0.35, + "learning_rate": 1.4593376915939499e-05, + "loss": 0.6312, + "step": 10053 + }, + { + "epoch": 0.35, + "learning_rate": 1.4592409691810767e-05, + "loss": 0.5867, + "step": 10054 + }, + { + "epoch": 0.35, + "learning_rate": 1.4591442413233208e-05, + "loss": 0.6792, + "step": 10055 + }, + { + "epoch": 0.35, + "learning_rate": 1.4590475080218291e-05, + "loss": 0.6338, + "step": 10056 + }, + { + "epoch": 0.35, + "learning_rate": 1.4589507692777484e-05, + "loss": 0.6363, + "step": 10057 + }, + { + "epoch": 0.35, + "learning_rate": 1.4588540250922259e-05, + "loss": 0.6719, + "step": 10058 + }, + { + "epoch": 0.35, + "learning_rate": 1.4587572754664088e-05, + "loss": 0.589, + "step": 10059 + }, + { + "epoch": 0.35, + "learning_rate": 1.4586605204014432e-05, + "loss": 0.6572, + "step": 10060 + }, + { + "epoch": 0.35, + "learning_rate": 1.4585637598984772e-05, + "loss": 0.6083, + "step": 10061 + }, + { + "epoch": 0.35, + "learning_rate": 1.458466993958658e-05, + "loss": 0.5982, + "step": 10062 + }, + { + "epoch": 0.35, + "learning_rate": 1.4583702225831324e-05, + "loss": 0.6355, + "step": 10063 + }, + { + "epoch": 0.35, + "learning_rate": 1.4582734457730479e-05, + "loss": 0.6915, + "step": 10064 + }, + { + "epoch": 0.35, + "learning_rate": 1.4581766635295522e-05, + "loss": 0.6941, + "step": 10065 + }, + { + "epoch": 0.35, + "learning_rate": 1.4580798758537922e-05, + "loss": 0.6812, + "step": 10066 + }, + { + "epoch": 0.35, + "learning_rate": 1.4579830827469162e-05, + "loss": 0.6195, + "step": 10067 + }, + { + "epoch": 0.35, + "learning_rate": 1.4578862842100711e-05, + "loss": 0.6344, + "step": 10068 + }, + { + "epoch": 0.35, + "learning_rate": 1.457789480244405e-05, + "loss": 0.6497, + "step": 10069 + }, + { + "epoch": 0.35, + "learning_rate": 1.4576926708510657e-05, + "loss": 0.6534, + "step": 10070 + }, + { + "epoch": 0.35, + "learning_rate": 1.4575958560312004e-05, + "loss": 0.6944, + "step": 10071 + }, + { + "epoch": 0.35, + "learning_rate": 1.4574990357859575e-05, + "loss": 0.6053, + "step": 10072 + }, + { + "epoch": 0.35, + "learning_rate": 1.4574022101164848e-05, + "loss": 0.5922, + "step": 10073 + }, + { + "epoch": 0.35, + "learning_rate": 1.4573053790239304e-05, + "loss": 0.6624, + "step": 10074 + }, + { + "epoch": 0.35, + "learning_rate": 1.4572085425094423e-05, + "loss": 0.6518, + "step": 10075 + }, + { + "epoch": 0.35, + "learning_rate": 1.4571117005741684e-05, + "loss": 0.7102, + "step": 10076 + }, + { + "epoch": 0.35, + "learning_rate": 1.457014853219257e-05, + "loss": 0.6667, + "step": 10077 + }, + { + "epoch": 0.35, + "learning_rate": 1.4569180004458563e-05, + "loss": 0.6418, + "step": 10078 + }, + { + "epoch": 0.35, + "learning_rate": 1.456821142255115e-05, + "loss": 0.6763, + "step": 10079 + }, + { + "epoch": 0.35, + "learning_rate": 1.456724278648181e-05, + "loss": 0.649, + "step": 10080 + }, + { + "epoch": 0.35, + "learning_rate": 1.456627409626203e-05, + "loss": 0.5909, + "step": 10081 + }, + { + "epoch": 0.35, + "learning_rate": 1.4565305351903293e-05, + "loss": 0.658, + "step": 10082 + }, + { + "epoch": 0.35, + "learning_rate": 1.4564336553417086e-05, + "loss": 0.5867, + "step": 10083 + }, + { + "epoch": 0.35, + "learning_rate": 1.4563367700814896e-05, + "loss": 0.6569, + "step": 10084 + }, + { + "epoch": 0.35, + "learning_rate": 1.456239879410821e-05, + "loss": 0.6494, + "step": 10085 + }, + { + "epoch": 0.35, + "learning_rate": 1.4561429833308513e-05, + "loss": 0.6581, + "step": 10086 + }, + { + "epoch": 0.35, + "learning_rate": 1.4560460818427297e-05, + "loss": 0.6472, + "step": 10087 + }, + { + "epoch": 0.35, + "learning_rate": 1.4559491749476048e-05, + "loss": 0.6553, + "step": 10088 + }, + { + "epoch": 0.35, + "learning_rate": 1.4558522626466255e-05, + "loss": 0.6463, + "step": 10089 + }, + { + "epoch": 0.35, + "learning_rate": 1.4557553449409411e-05, + "loss": 0.6478, + "step": 10090 + }, + { + "epoch": 0.35, + "learning_rate": 1.455658421831701e-05, + "loss": 0.5779, + "step": 10091 + }, + { + "epoch": 0.35, + "learning_rate": 1.4555614933200533e-05, + "loss": 0.6444, + "step": 10092 + }, + { + "epoch": 0.35, + "learning_rate": 1.455464559407148e-05, + "loss": 0.6379, + "step": 10093 + }, + { + "epoch": 0.35, + "learning_rate": 1.4553676200941342e-05, + "loss": 0.6499, + "step": 10094 + }, + { + "epoch": 0.35, + "learning_rate": 1.455270675382161e-05, + "loss": 0.6058, + "step": 10095 + }, + { + "epoch": 0.35, + "learning_rate": 1.455173725272378e-05, + "loss": 0.5847, + "step": 10096 + }, + { + "epoch": 0.35, + "learning_rate": 1.4550767697659352e-05, + "loss": 0.6006, + "step": 10097 + }, + { + "epoch": 0.35, + "learning_rate": 1.4549798088639813e-05, + "loss": 0.5841, + "step": 10098 + }, + { + "epoch": 0.35, + "learning_rate": 1.454882842567666e-05, + "loss": 0.613, + "step": 10099 + }, + { + "epoch": 0.35, + "learning_rate": 1.4547858708781397e-05, + "loss": 0.624, + "step": 10100 + }, + { + "epoch": 0.35, + "learning_rate": 1.4546888937965514e-05, + "loss": 0.6499, + "step": 10101 + }, + { + "epoch": 0.35, + "learning_rate": 1.4545919113240508e-05, + "loss": 0.5806, + "step": 10102 + }, + { + "epoch": 0.35, + "learning_rate": 1.4544949234617882e-05, + "loss": 0.6062, + "step": 10103 + }, + { + "epoch": 0.35, + "learning_rate": 1.4543979302109135e-05, + "loss": 0.6135, + "step": 10104 + }, + { + "epoch": 0.35, + "learning_rate": 1.454300931572576e-05, + "loss": 0.6584, + "step": 10105 + }, + { + "epoch": 0.35, + "learning_rate": 1.4542039275479267e-05, + "loss": 0.6912, + "step": 10106 + }, + { + "epoch": 0.35, + "learning_rate": 1.4541069181381156e-05, + "loss": 0.706, + "step": 10107 + }, + { + "epoch": 0.35, + "learning_rate": 1.4540099033442918e-05, + "loss": 0.5459, + "step": 10108 + }, + { + "epoch": 0.35, + "learning_rate": 1.4539128831676066e-05, + "loss": 0.6603, + "step": 10109 + }, + { + "epoch": 0.35, + "learning_rate": 1.4538158576092101e-05, + "loss": 0.6211, + "step": 10110 + }, + { + "epoch": 0.35, + "learning_rate": 1.4537188266702522e-05, + "loss": 0.6358, + "step": 10111 + }, + { + "epoch": 0.35, + "learning_rate": 1.4536217903518842e-05, + "loss": 0.6493, + "step": 10112 + }, + { + "epoch": 0.35, + "learning_rate": 1.4535247486552555e-05, + "loss": 0.6194, + "step": 10113 + }, + { + "epoch": 0.35, + "learning_rate": 1.4534277015815172e-05, + "loss": 0.6164, + "step": 10114 + }, + { + "epoch": 0.35, + "learning_rate": 1.4533306491318202e-05, + "loss": 0.5681, + "step": 10115 + }, + { + "epoch": 0.35, + "learning_rate": 1.453233591307315e-05, + "loss": 0.6312, + "step": 10116 + }, + { + "epoch": 0.35, + "learning_rate": 1.4531365281091518e-05, + "loss": 0.6229, + "step": 10117 + }, + { + "epoch": 0.35, + "learning_rate": 1.453039459538482e-05, + "loss": 0.5896, + "step": 10118 + }, + { + "epoch": 0.35, + "learning_rate": 1.4529423855964566e-05, + "loss": 0.639, + "step": 10119 + }, + { + "epoch": 0.35, + "learning_rate": 1.4528453062842258e-05, + "loss": 0.6431, + "step": 10120 + }, + { + "epoch": 0.35, + "learning_rate": 1.4527482216029414e-05, + "loss": 0.6438, + "step": 10121 + }, + { + "epoch": 0.35, + "learning_rate": 1.4526511315537541e-05, + "loss": 0.6397, + "step": 10122 + }, + { + "epoch": 0.35, + "learning_rate": 1.4525540361378145e-05, + "loss": 0.6532, + "step": 10123 + }, + { + "epoch": 0.35, + "learning_rate": 1.452456935356275e-05, + "loss": 0.6399, + "step": 10124 + }, + { + "epoch": 0.35, + "learning_rate": 1.4523598292102858e-05, + "loss": 0.6066, + "step": 10125 + }, + { + "epoch": 0.35, + "learning_rate": 1.4522627177009985e-05, + "loss": 0.6156, + "step": 10126 + }, + { + "epoch": 0.35, + "learning_rate": 1.4521656008295647e-05, + "loss": 0.7049, + "step": 10127 + }, + { + "epoch": 0.35, + "learning_rate": 1.452068478597136e-05, + "loss": 0.6816, + "step": 10128 + }, + { + "epoch": 0.35, + "learning_rate": 1.451971351004863e-05, + "loss": 0.6216, + "step": 10129 + }, + { + "epoch": 0.35, + "learning_rate": 1.4518742180538985e-05, + "loss": 0.6118, + "step": 10130 + }, + { + "epoch": 0.35, + "learning_rate": 1.4517770797453933e-05, + "loss": 0.6715, + "step": 10131 + }, + { + "epoch": 0.35, + "learning_rate": 1.4516799360804992e-05, + "loss": 0.6333, + "step": 10132 + }, + { + "epoch": 0.35, + "learning_rate": 1.451582787060368e-05, + "loss": 0.606, + "step": 10133 + }, + { + "epoch": 0.35, + "learning_rate": 1.4514856326861519e-05, + "loss": 0.6584, + "step": 10134 + }, + { + "epoch": 0.35, + "learning_rate": 1.4513884729590025e-05, + "loss": 0.6787, + "step": 10135 + }, + { + "epoch": 0.35, + "learning_rate": 1.4512913078800714e-05, + "loss": 0.682, + "step": 10136 + }, + { + "epoch": 0.35, + "learning_rate": 1.4511941374505112e-05, + "loss": 0.7002, + "step": 10137 + }, + { + "epoch": 0.35, + "learning_rate": 1.4510969616714739e-05, + "loss": 0.6724, + "step": 10138 + }, + { + "epoch": 0.35, + "learning_rate": 1.4509997805441109e-05, + "loss": 0.6589, + "step": 10139 + }, + { + "epoch": 0.35, + "learning_rate": 1.4509025940695756e-05, + "loss": 0.6554, + "step": 10140 + }, + { + "epoch": 0.35, + "learning_rate": 1.4508054022490195e-05, + "loss": 0.6106, + "step": 10141 + }, + { + "epoch": 0.35, + "learning_rate": 1.4507082050835947e-05, + "loss": 0.6755, + "step": 10142 + }, + { + "epoch": 0.35, + "learning_rate": 1.4506110025744544e-05, + "loss": 0.6052, + "step": 10143 + }, + { + "epoch": 0.35, + "learning_rate": 1.4505137947227506e-05, + "loss": 0.5701, + "step": 10144 + }, + { + "epoch": 0.35, + "learning_rate": 1.4504165815296356e-05, + "loss": 0.6466, + "step": 10145 + }, + { + "epoch": 0.35, + "learning_rate": 1.4503193629962626e-05, + "loss": 0.6237, + "step": 10146 + }, + { + "epoch": 0.35, + "learning_rate": 1.4502221391237836e-05, + "loss": 0.6111, + "step": 10147 + }, + { + "epoch": 0.35, + "learning_rate": 1.4501249099133516e-05, + "loss": 0.6638, + "step": 10148 + }, + { + "epoch": 0.35, + "learning_rate": 1.4500276753661195e-05, + "loss": 0.6022, + "step": 10149 + }, + { + "epoch": 0.35, + "learning_rate": 1.4499304354832403e-05, + "loss": 0.6385, + "step": 10150 + }, + { + "epoch": 0.35, + "learning_rate": 1.4498331902658663e-05, + "loss": 0.6712, + "step": 10151 + }, + { + "epoch": 0.35, + "learning_rate": 1.4497359397151507e-05, + "loss": 0.6183, + "step": 10152 + }, + { + "epoch": 0.35, + "learning_rate": 1.4496386838322468e-05, + "loss": 0.6354, + "step": 10153 + }, + { + "epoch": 0.35, + "learning_rate": 1.4495414226183073e-05, + "loss": 0.6228, + "step": 10154 + }, + { + "epoch": 0.35, + "learning_rate": 1.449444156074486e-05, + "loss": 0.6894, + "step": 10155 + }, + { + "epoch": 0.35, + "learning_rate": 1.4493468842019351e-05, + "loss": 0.615, + "step": 10156 + }, + { + "epoch": 0.35, + "learning_rate": 1.4492496070018088e-05, + "loss": 0.6556, + "step": 10157 + }, + { + "epoch": 0.35, + "learning_rate": 1.44915232447526e-05, + "loss": 0.6381, + "step": 10158 + }, + { + "epoch": 0.35, + "learning_rate": 1.4490550366234424e-05, + "loss": 0.6215, + "step": 10159 + }, + { + "epoch": 0.35, + "learning_rate": 1.4489577434475091e-05, + "loss": 0.65, + "step": 10160 + }, + { + "epoch": 0.35, + "learning_rate": 1.448860444948614e-05, + "loss": 0.617, + "step": 10161 + }, + { + "epoch": 0.35, + "learning_rate": 1.4487631411279104e-05, + "loss": 0.6535, + "step": 10162 + }, + { + "epoch": 0.35, + "learning_rate": 1.4486658319865521e-05, + "loss": 0.6945, + "step": 10163 + }, + { + "epoch": 0.35, + "learning_rate": 1.4485685175256927e-05, + "loss": 0.6421, + "step": 10164 + }, + { + "epoch": 0.35, + "learning_rate": 1.4484711977464861e-05, + "loss": 0.616, + "step": 10165 + }, + { + "epoch": 0.35, + "learning_rate": 1.4483738726500862e-05, + "loss": 0.5814, + "step": 10166 + }, + { + "epoch": 0.35, + "learning_rate": 1.4482765422376468e-05, + "loss": 0.6427, + "step": 10167 + }, + { + "epoch": 0.35, + "learning_rate": 1.4481792065103219e-05, + "loss": 0.5951, + "step": 10168 + }, + { + "epoch": 0.35, + "learning_rate": 1.4480818654692657e-05, + "loss": 0.6482, + "step": 10169 + }, + { + "epoch": 0.35, + "learning_rate": 1.4479845191156318e-05, + "loss": 0.6004, + "step": 10170 + }, + { + "epoch": 0.35, + "learning_rate": 1.447887167450575e-05, + "loss": 0.6456, + "step": 10171 + }, + { + "epoch": 0.35, + "learning_rate": 1.4477898104752495e-05, + "loss": 0.6394, + "step": 10172 + }, + { + "epoch": 0.35, + "learning_rate": 1.447692448190809e-05, + "loss": 0.6615, + "step": 10173 + }, + { + "epoch": 0.35, + "learning_rate": 1.4475950805984082e-05, + "loss": 0.6589, + "step": 10174 + }, + { + "epoch": 0.35, + "learning_rate": 1.4474977076992017e-05, + "loss": 0.5973, + "step": 10175 + }, + { + "epoch": 0.35, + "learning_rate": 1.4474003294943436e-05, + "loss": 0.6298, + "step": 10176 + }, + { + "epoch": 0.35, + "learning_rate": 1.4473029459849885e-05, + "loss": 0.6636, + "step": 10177 + }, + { + "epoch": 0.35, + "learning_rate": 1.4472055571722914e-05, + "loss": 0.6247, + "step": 10178 + }, + { + "epoch": 0.35, + "learning_rate": 1.4471081630574066e-05, + "loss": 0.6382, + "step": 10179 + }, + { + "epoch": 0.35, + "learning_rate": 1.447010763641489e-05, + "loss": 0.6822, + "step": 10180 + }, + { + "epoch": 0.35, + "learning_rate": 1.4469133589256932e-05, + "loss": 0.6129, + "step": 10181 + }, + { + "epoch": 0.35, + "learning_rate": 1.4468159489111741e-05, + "loss": 0.5896, + "step": 10182 + }, + { + "epoch": 0.35, + "learning_rate": 1.446718533599087e-05, + "loss": 0.6289, + "step": 10183 + }, + { + "epoch": 0.35, + "learning_rate": 1.4466211129905864e-05, + "loss": 0.6272, + "step": 10184 + }, + { + "epoch": 0.35, + "learning_rate": 1.4465236870868275e-05, + "loss": 0.6737, + "step": 10185 + }, + { + "epoch": 0.35, + "learning_rate": 1.4464262558889654e-05, + "loss": 0.6627, + "step": 10186 + }, + { + "epoch": 0.35, + "learning_rate": 1.4463288193981558e-05, + "loss": 0.6575, + "step": 10187 + }, + { + "epoch": 0.35, + "learning_rate": 1.4462313776155528e-05, + "loss": 0.5965, + "step": 10188 + }, + { + "epoch": 0.35, + "learning_rate": 1.4461339305423125e-05, + "loss": 0.7005, + "step": 10189 + }, + { + "epoch": 0.35, + "learning_rate": 1.4460364781795904e-05, + "loss": 0.6835, + "step": 10190 + }, + { + "epoch": 0.35, + "learning_rate": 1.4459390205285413e-05, + "loss": 0.6313, + "step": 10191 + }, + { + "epoch": 0.35, + "learning_rate": 1.4458415575903211e-05, + "loss": 0.6799, + "step": 10192 + }, + { + "epoch": 0.35, + "learning_rate": 1.4457440893660852e-05, + "loss": 0.6559, + "step": 10193 + }, + { + "epoch": 0.35, + "learning_rate": 1.4456466158569892e-05, + "loss": 0.6169, + "step": 10194 + }, + { + "epoch": 0.35, + "learning_rate": 1.4455491370641888e-05, + "loss": 0.5935, + "step": 10195 + }, + { + "epoch": 0.35, + "learning_rate": 1.44545165298884e-05, + "loss": 0.5657, + "step": 10196 + }, + { + "epoch": 0.35, + "learning_rate": 1.4453541636320983e-05, + "loss": 0.5984, + "step": 10197 + }, + { + "epoch": 0.35, + "learning_rate": 1.4452566689951194e-05, + "loss": 0.5665, + "step": 10198 + }, + { + "epoch": 0.35, + "learning_rate": 1.4451591690790596e-05, + "loss": 0.5847, + "step": 10199 + }, + { + "epoch": 0.35, + "learning_rate": 1.4450616638850745e-05, + "loss": 0.6322, + "step": 10200 + }, + { + "epoch": 0.35, + "learning_rate": 1.4449641534143207e-05, + "loss": 0.6209, + "step": 10201 + }, + { + "epoch": 0.35, + "learning_rate": 1.444866637667954e-05, + "loss": 0.5886, + "step": 10202 + }, + { + "epoch": 0.35, + "learning_rate": 1.4447691166471303e-05, + "loss": 0.6162, + "step": 10203 + }, + { + "epoch": 0.35, + "learning_rate": 1.444671590353006e-05, + "loss": 0.6167, + "step": 10204 + }, + { + "epoch": 0.35, + "learning_rate": 1.4445740587867377e-05, + "loss": 0.648, + "step": 10205 + }, + { + "epoch": 0.35, + "learning_rate": 1.4444765219494814e-05, + "loss": 0.6566, + "step": 10206 + }, + { + "epoch": 0.35, + "learning_rate": 1.4443789798423938e-05, + "loss": 0.6185, + "step": 10207 + }, + { + "epoch": 0.35, + "learning_rate": 1.4442814324666312e-05, + "loss": 0.6628, + "step": 10208 + }, + { + "epoch": 0.35, + "learning_rate": 1.44418387982335e-05, + "loss": 0.6841, + "step": 10209 + }, + { + "epoch": 0.35, + "learning_rate": 1.4440863219137074e-05, + "loss": 0.6444, + "step": 10210 + }, + { + "epoch": 0.35, + "learning_rate": 1.4439887587388595e-05, + "loss": 0.6475, + "step": 10211 + }, + { + "epoch": 0.35, + "learning_rate": 1.4438911902999633e-05, + "loss": 0.6006, + "step": 10212 + }, + { + "epoch": 0.35, + "learning_rate": 1.4437936165981752e-05, + "loss": 0.6265, + "step": 10213 + }, + { + "epoch": 0.35, + "learning_rate": 1.4436960376346527e-05, + "loss": 0.6156, + "step": 10214 + }, + { + "epoch": 0.35, + "learning_rate": 1.4435984534105522e-05, + "loss": 0.5972, + "step": 10215 + }, + { + "epoch": 0.35, + "learning_rate": 1.4435008639270312e-05, + "loss": 0.6759, + "step": 10216 + }, + { + "epoch": 0.35, + "learning_rate": 1.4434032691852463e-05, + "loss": 0.6811, + "step": 10217 + }, + { + "epoch": 0.35, + "learning_rate": 1.4433056691863545e-05, + "loss": 0.6585, + "step": 10218 + }, + { + "epoch": 0.35, + "learning_rate": 1.4432080639315131e-05, + "loss": 0.6364, + "step": 10219 + }, + { + "epoch": 0.35, + "learning_rate": 1.44311045342188e-05, + "loss": 0.6815, + "step": 10220 + }, + { + "epoch": 0.35, + "learning_rate": 1.4430128376586114e-05, + "loss": 0.5986, + "step": 10221 + }, + { + "epoch": 0.35, + "learning_rate": 1.4429152166428655e-05, + "loss": 0.6235, + "step": 10222 + }, + { + "epoch": 0.35, + "learning_rate": 1.4428175903757993e-05, + "loss": 0.6271, + "step": 10223 + }, + { + "epoch": 0.35, + "learning_rate": 1.4427199588585706e-05, + "loss": 0.5914, + "step": 10224 + }, + { + "epoch": 0.35, + "learning_rate": 1.4426223220923366e-05, + "loss": 0.6809, + "step": 10225 + }, + { + "epoch": 0.35, + "learning_rate": 1.4425246800782549e-05, + "loss": 0.6691, + "step": 10226 + }, + { + "epoch": 0.35, + "learning_rate": 1.4424270328174834e-05, + "loss": 0.5852, + "step": 10227 + }, + { + "epoch": 0.35, + "learning_rate": 1.4423293803111799e-05, + "loss": 0.5891, + "step": 10228 + }, + { + "epoch": 0.35, + "learning_rate": 1.4422317225605019e-05, + "loss": 0.6848, + "step": 10229 + }, + { + "epoch": 0.35, + "learning_rate": 1.4421340595666074e-05, + "loss": 0.5899, + "step": 10230 + }, + { + "epoch": 0.35, + "learning_rate": 1.4420363913306545e-05, + "loss": 0.5838, + "step": 10231 + }, + { + "epoch": 0.35, + "learning_rate": 1.4419387178538008e-05, + "loss": 0.6072, + "step": 10232 + }, + { + "epoch": 0.35, + "learning_rate": 1.4418410391372046e-05, + "loss": 0.6771, + "step": 10233 + }, + { + "epoch": 0.35, + "learning_rate": 1.4417433551820241e-05, + "loss": 0.5519, + "step": 10234 + }, + { + "epoch": 0.35, + "learning_rate": 1.4416456659894172e-05, + "loss": 0.6159, + "step": 10235 + }, + { + "epoch": 0.35, + "learning_rate": 1.441547971560542e-05, + "loss": 0.6803, + "step": 10236 + }, + { + "epoch": 0.35, + "learning_rate": 1.4414502718965575e-05, + "loss": 0.6687, + "step": 10237 + }, + { + "epoch": 0.35, + "learning_rate": 1.4413525669986212e-05, + "loss": 0.7016, + "step": 10238 + }, + { + "epoch": 0.35, + "learning_rate": 1.4412548568678921e-05, + "loss": 0.619, + "step": 10239 + }, + { + "epoch": 0.35, + "learning_rate": 1.4411571415055285e-05, + "loss": 0.6438, + "step": 10240 + }, + { + "epoch": 0.35, + "learning_rate": 1.4410594209126887e-05, + "loss": 0.6663, + "step": 10241 + }, + { + "epoch": 0.35, + "learning_rate": 1.4409616950905316e-05, + "loss": 0.647, + "step": 10242 + }, + { + "epoch": 0.35, + "learning_rate": 1.440863964040216e-05, + "loss": 0.6509, + "step": 10243 + }, + { + "epoch": 0.35, + "learning_rate": 1.4407662277629003e-05, + "loss": 0.65, + "step": 10244 + }, + { + "epoch": 0.35, + "learning_rate": 1.4406684862597434e-05, + "loss": 0.6534, + "step": 10245 + }, + { + "epoch": 0.35, + "learning_rate": 1.4405707395319042e-05, + "loss": 0.6421, + "step": 10246 + }, + { + "epoch": 0.36, + "learning_rate": 1.4404729875805414e-05, + "loss": 0.6838, + "step": 10247 + }, + { + "epoch": 0.36, + "learning_rate": 1.4403752304068141e-05, + "loss": 0.69, + "step": 10248 + }, + { + "epoch": 0.36, + "learning_rate": 1.4402774680118816e-05, + "loss": 0.6939, + "step": 10249 + }, + { + "epoch": 0.36, + "learning_rate": 1.4401797003969025e-05, + "loss": 0.6017, + "step": 10250 + }, + { + "epoch": 0.36, + "learning_rate": 1.4400819275630364e-05, + "loss": 0.6591, + "step": 10251 + }, + { + "epoch": 0.36, + "learning_rate": 1.4399841495114423e-05, + "loss": 0.6531, + "step": 10252 + }, + { + "epoch": 0.36, + "learning_rate": 1.4398863662432797e-05, + "loss": 0.6389, + "step": 10253 + }, + { + "epoch": 0.36, + "learning_rate": 1.4397885777597073e-05, + "loss": 0.6553, + "step": 10254 + }, + { + "epoch": 0.36, + "learning_rate": 1.4396907840618855e-05, + "loss": 0.6607, + "step": 10255 + }, + { + "epoch": 0.36, + "learning_rate": 1.4395929851509731e-05, + "loss": 0.6665, + "step": 10256 + }, + { + "epoch": 0.36, + "learning_rate": 1.4394951810281295e-05, + "loss": 0.6465, + "step": 10257 + }, + { + "epoch": 0.36, + "learning_rate": 1.4393973716945149e-05, + "loss": 0.6479, + "step": 10258 + }, + { + "epoch": 0.36, + "learning_rate": 1.4392995571512886e-05, + "loss": 0.6449, + "step": 10259 + }, + { + "epoch": 0.36, + "learning_rate": 1.4392017373996099e-05, + "loss": 0.6467, + "step": 10260 + }, + { + "epoch": 0.36, + "learning_rate": 1.4391039124406394e-05, + "loss": 0.6043, + "step": 10261 + }, + { + "epoch": 0.36, + "learning_rate": 1.4390060822755367e-05, + "loss": 0.6193, + "step": 10262 + }, + { + "epoch": 0.36, + "learning_rate": 1.438908246905461e-05, + "loss": 0.605, + "step": 10263 + }, + { + "epoch": 0.36, + "learning_rate": 1.4388104063315733e-05, + "loss": 0.5687, + "step": 10264 + }, + { + "epoch": 0.36, + "learning_rate": 1.4387125605550329e-05, + "loss": 0.6481, + "step": 10265 + }, + { + "epoch": 0.36, + "learning_rate": 1.438614709577e-05, + "loss": 0.6256, + "step": 10266 + }, + { + "epoch": 0.36, + "learning_rate": 1.4385168533986353e-05, + "loss": 0.6267, + "step": 10267 + }, + { + "epoch": 0.36, + "learning_rate": 1.4384189920210985e-05, + "loss": 0.5785, + "step": 10268 + }, + { + "epoch": 0.36, + "learning_rate": 1.4383211254455494e-05, + "loss": 0.6261, + "step": 10269 + }, + { + "epoch": 0.36, + "learning_rate": 1.4382232536731496e-05, + "loss": 0.6631, + "step": 10270 + }, + { + "epoch": 0.36, + "learning_rate": 1.4381253767050583e-05, + "loss": 0.6445, + "step": 10271 + }, + { + "epoch": 0.36, + "learning_rate": 1.4380274945424365e-05, + "loss": 0.609, + "step": 10272 + }, + { + "epoch": 0.36, + "learning_rate": 1.4379296071864446e-05, + "loss": 0.6068, + "step": 10273 + }, + { + "epoch": 0.36, + "learning_rate": 1.4378317146382434e-05, + "loss": 0.613, + "step": 10274 + }, + { + "epoch": 0.36, + "learning_rate": 1.4377338168989933e-05, + "loss": 0.6381, + "step": 10275 + }, + { + "epoch": 0.36, + "learning_rate": 1.437635913969855e-05, + "loss": 0.6645, + "step": 10276 + }, + { + "epoch": 0.36, + "learning_rate": 1.4375380058519895e-05, + "loss": 0.651, + "step": 10277 + }, + { + "epoch": 0.36, + "learning_rate": 1.4374400925465573e-05, + "loss": 0.6405, + "step": 10278 + }, + { + "epoch": 0.36, + "learning_rate": 1.4373421740547193e-05, + "loss": 0.6217, + "step": 10279 + }, + { + "epoch": 0.36, + "learning_rate": 1.4372442503776369e-05, + "loss": 0.6217, + "step": 10280 + }, + { + "epoch": 0.36, + "learning_rate": 1.4371463215164707e-05, + "loss": 0.6481, + "step": 10281 + }, + { + "epoch": 0.36, + "learning_rate": 1.4370483874723817e-05, + "loss": 0.6079, + "step": 10282 + }, + { + "epoch": 0.36, + "learning_rate": 1.4369504482465314e-05, + "loss": 0.6557, + "step": 10283 + }, + { + "epoch": 0.36, + "learning_rate": 1.4368525038400808e-05, + "loss": 0.6195, + "step": 10284 + }, + { + "epoch": 0.36, + "learning_rate": 1.4367545542541908e-05, + "loss": 0.6377, + "step": 10285 + }, + { + "epoch": 0.36, + "learning_rate": 1.4366565994900234e-05, + "loss": 0.5845, + "step": 10286 + }, + { + "epoch": 0.36, + "learning_rate": 1.4365586395487395e-05, + "loss": 0.6108, + "step": 10287 + }, + { + "epoch": 0.36, + "learning_rate": 1.4364606744315006e-05, + "loss": 0.61, + "step": 10288 + }, + { + "epoch": 0.36, + "learning_rate": 1.4363627041394686e-05, + "loss": 0.6339, + "step": 10289 + }, + { + "epoch": 0.36, + "learning_rate": 1.4362647286738045e-05, + "loss": 0.5748, + "step": 10290 + }, + { + "epoch": 0.36, + "learning_rate": 1.43616674803567e-05, + "loss": 0.6341, + "step": 10291 + }, + { + "epoch": 0.36, + "learning_rate": 1.4360687622262273e-05, + "loss": 0.6117, + "step": 10292 + }, + { + "epoch": 0.36, + "learning_rate": 1.4359707712466375e-05, + "loss": 0.6316, + "step": 10293 + }, + { + "epoch": 0.36, + "learning_rate": 1.435872775098063e-05, + "loss": 0.6365, + "step": 10294 + }, + { + "epoch": 0.36, + "learning_rate": 1.4357747737816655e-05, + "loss": 0.69, + "step": 10295 + }, + { + "epoch": 0.36, + "learning_rate": 1.4356767672986063e-05, + "loss": 0.6593, + "step": 10296 + }, + { + "epoch": 0.36, + "learning_rate": 1.435578755650048e-05, + "loss": 0.6512, + "step": 10297 + }, + { + "epoch": 0.36, + "learning_rate": 1.4354807388371528e-05, + "loss": 0.6281, + "step": 10298 + }, + { + "epoch": 0.36, + "learning_rate": 1.4353827168610823e-05, + "loss": 0.6364, + "step": 10299 + }, + { + "epoch": 0.36, + "learning_rate": 1.435284689722999e-05, + "loss": 0.623, + "step": 10300 + }, + { + "epoch": 0.36, + "learning_rate": 1.4351866574240651e-05, + "loss": 0.605, + "step": 10301 + }, + { + "epoch": 0.36, + "learning_rate": 1.4350886199654431e-05, + "loss": 0.5913, + "step": 10302 + }, + { + "epoch": 0.36, + "learning_rate": 1.4349905773482945e-05, + "loss": 0.6379, + "step": 10303 + }, + { + "epoch": 0.36, + "learning_rate": 1.434892529573783e-05, + "loss": 0.6112, + "step": 10304 + }, + { + "epoch": 0.36, + "learning_rate": 1.4347944766430702e-05, + "loss": 0.6299, + "step": 10305 + }, + { + "epoch": 0.36, + "learning_rate": 1.4346964185573184e-05, + "loss": 0.6677, + "step": 10306 + }, + { + "epoch": 0.36, + "learning_rate": 1.4345983553176914e-05, + "loss": 0.579, + "step": 10307 + }, + { + "epoch": 0.36, + "learning_rate": 1.4345002869253506e-05, + "loss": 0.5946, + "step": 10308 + }, + { + "epoch": 0.36, + "learning_rate": 1.4344022133814594e-05, + "loss": 0.6198, + "step": 10309 + }, + { + "epoch": 0.36, + "learning_rate": 1.4343041346871807e-05, + "loss": 0.6209, + "step": 10310 + }, + { + "epoch": 0.36, + "learning_rate": 1.4342060508436768e-05, + "loss": 0.6296, + "step": 10311 + }, + { + "epoch": 0.36, + "learning_rate": 1.434107961852111e-05, + "loss": 0.6445, + "step": 10312 + }, + { + "epoch": 0.36, + "learning_rate": 1.434009867713646e-05, + "loss": 0.6366, + "step": 10313 + }, + { + "epoch": 0.36, + "learning_rate": 1.4339117684294453e-05, + "loss": 0.663, + "step": 10314 + }, + { + "epoch": 0.36, + "learning_rate": 1.4338136640006712e-05, + "loss": 0.5345, + "step": 10315 + }, + { + "epoch": 0.36, + "learning_rate": 1.433715554428488e-05, + "loss": 0.677, + "step": 10316 + }, + { + "epoch": 0.36, + "learning_rate": 1.4336174397140576e-05, + "loss": 0.6828, + "step": 10317 + }, + { + "epoch": 0.36, + "learning_rate": 1.4335193198585443e-05, + "loss": 0.657, + "step": 10318 + }, + { + "epoch": 0.36, + "learning_rate": 1.4334211948631111e-05, + "loss": 0.653, + "step": 10319 + }, + { + "epoch": 0.36, + "learning_rate": 1.4333230647289211e-05, + "loss": 0.6265, + "step": 10320 + }, + { + "epoch": 0.36, + "learning_rate": 1.4332249294571383e-05, + "loss": 0.6272, + "step": 10321 + }, + { + "epoch": 0.36, + "learning_rate": 1.4331267890489257e-05, + "loss": 0.5772, + "step": 10322 + }, + { + "epoch": 0.36, + "learning_rate": 1.4330286435054471e-05, + "loss": 0.6236, + "step": 10323 + }, + { + "epoch": 0.36, + "learning_rate": 1.4329304928278665e-05, + "loss": 0.6419, + "step": 10324 + }, + { + "epoch": 0.36, + "learning_rate": 1.4328323370173467e-05, + "loss": 0.63, + "step": 10325 + }, + { + "epoch": 0.36, + "learning_rate": 1.4327341760750524e-05, + "loss": 0.6453, + "step": 10326 + }, + { + "epoch": 0.36, + "learning_rate": 1.4326360100021468e-05, + "loss": 0.6572, + "step": 10327 + }, + { + "epoch": 0.36, + "learning_rate": 1.4325378387997941e-05, + "loss": 0.668, + "step": 10328 + }, + { + "epoch": 0.36, + "learning_rate": 1.4324396624691581e-05, + "loss": 0.6568, + "step": 10329 + }, + { + "epoch": 0.36, + "learning_rate": 1.4323414810114031e-05, + "loss": 0.6114, + "step": 10330 + }, + { + "epoch": 0.36, + "learning_rate": 1.4322432944276927e-05, + "loss": 0.6324, + "step": 10331 + }, + { + "epoch": 0.36, + "learning_rate": 1.4321451027191913e-05, + "loss": 0.6446, + "step": 10332 + }, + { + "epoch": 0.36, + "learning_rate": 1.4320469058870633e-05, + "loss": 0.7105, + "step": 10333 + }, + { + "epoch": 0.36, + "learning_rate": 1.4319487039324723e-05, + "loss": 0.6655, + "step": 10334 + }, + { + "epoch": 0.36, + "learning_rate": 1.4318504968565832e-05, + "loss": 0.6413, + "step": 10335 + }, + { + "epoch": 0.36, + "learning_rate": 1.43175228466056e-05, + "loss": 0.6827, + "step": 10336 + }, + { + "epoch": 0.36, + "learning_rate": 1.4316540673455675e-05, + "loss": 0.6467, + "step": 10337 + }, + { + "epoch": 0.36, + "learning_rate": 1.4315558449127698e-05, + "loss": 0.6553, + "step": 10338 + }, + { + "epoch": 0.36, + "learning_rate": 1.4314576173633319e-05, + "loss": 0.6719, + "step": 10339 + }, + { + "epoch": 0.36, + "learning_rate": 1.4313593846984179e-05, + "loss": 0.6332, + "step": 10340 + }, + { + "epoch": 0.36, + "learning_rate": 1.4312611469191928e-05, + "loss": 0.6271, + "step": 10341 + }, + { + "epoch": 0.36, + "learning_rate": 1.4311629040268214e-05, + "loss": 0.671, + "step": 10342 + }, + { + "epoch": 0.36, + "learning_rate": 1.4310646560224682e-05, + "loss": 0.621, + "step": 10343 + }, + { + "epoch": 0.36, + "learning_rate": 1.430966402907298e-05, + "loss": 0.6129, + "step": 10344 + }, + { + "epoch": 0.36, + "learning_rate": 1.4308681446824764e-05, + "loss": 0.5969, + "step": 10345 + }, + { + "epoch": 0.36, + "learning_rate": 1.4307698813491676e-05, + "loss": 0.6021, + "step": 10346 + }, + { + "epoch": 0.36, + "learning_rate": 1.4306716129085367e-05, + "loss": 0.5758, + "step": 10347 + }, + { + "epoch": 0.36, + "learning_rate": 1.4305733393617494e-05, + "loss": 0.6085, + "step": 10348 + }, + { + "epoch": 0.36, + "learning_rate": 1.4304750607099705e-05, + "loss": 0.5801, + "step": 10349 + }, + { + "epoch": 0.36, + "learning_rate": 1.4303767769543649e-05, + "loss": 0.6254, + "step": 10350 + }, + { + "epoch": 0.36, + "learning_rate": 1.4302784880960985e-05, + "loss": 0.6402, + "step": 10351 + }, + { + "epoch": 0.36, + "learning_rate": 1.4301801941363363e-05, + "loss": 0.6245, + "step": 10352 + }, + { + "epoch": 0.36, + "learning_rate": 1.4300818950762435e-05, + "loss": 0.6581, + "step": 10353 + }, + { + "epoch": 0.36, + "learning_rate": 1.4299835909169857e-05, + "loss": 0.65, + "step": 10354 + }, + { + "epoch": 0.36, + "learning_rate": 1.4298852816597288e-05, + "loss": 0.5855, + "step": 10355 + }, + { + "epoch": 0.36, + "learning_rate": 1.4297869673056377e-05, + "loss": 0.6822, + "step": 10356 + }, + { + "epoch": 0.36, + "learning_rate": 1.4296886478558789e-05, + "loss": 0.6395, + "step": 10357 + }, + { + "epoch": 0.36, + "learning_rate": 1.4295903233116172e-05, + "loss": 0.5695, + "step": 10358 + }, + { + "epoch": 0.36, + "learning_rate": 1.4294919936740189e-05, + "loss": 0.6164, + "step": 10359 + }, + { + "epoch": 0.36, + "learning_rate": 1.4293936589442499e-05, + "loss": 0.5871, + "step": 10360 + }, + { + "epoch": 0.36, + "learning_rate": 1.4292953191234759e-05, + "loss": 0.6307, + "step": 10361 + }, + { + "epoch": 0.36, + "learning_rate": 1.4291969742128625e-05, + "loss": 0.6327, + "step": 10362 + }, + { + "epoch": 0.36, + "learning_rate": 1.4290986242135763e-05, + "loss": 0.6473, + "step": 10363 + }, + { + "epoch": 0.36, + "learning_rate": 1.4290002691267831e-05, + "loss": 0.6319, + "step": 10364 + }, + { + "epoch": 0.36, + "learning_rate": 1.4289019089536487e-05, + "loss": 0.6173, + "step": 10365 + }, + { + "epoch": 0.36, + "learning_rate": 1.42880354369534e-05, + "loss": 0.6907, + "step": 10366 + }, + { + "epoch": 0.36, + "learning_rate": 1.428705173353023e-05, + "loss": 0.6176, + "step": 10367 + }, + { + "epoch": 0.36, + "learning_rate": 1.4286067979278631e-05, + "loss": 0.6073, + "step": 10368 + }, + { + "epoch": 0.36, + "learning_rate": 1.428508417421028e-05, + "loss": 0.6136, + "step": 10369 + }, + { + "epoch": 0.36, + "learning_rate": 1.4284100318336836e-05, + "loss": 0.5826, + "step": 10370 + }, + { + "epoch": 0.36, + "learning_rate": 1.4283116411669956e-05, + "loss": 0.6264, + "step": 10371 + }, + { + "epoch": 0.36, + "learning_rate": 1.428213245422132e-05, + "loss": 0.5915, + "step": 10372 + }, + { + "epoch": 0.36, + "learning_rate": 1.4281148446002589e-05, + "loss": 0.6432, + "step": 10373 + }, + { + "epoch": 0.36, + "learning_rate": 1.428016438702542e-05, + "loss": 0.5966, + "step": 10374 + }, + { + "epoch": 0.36, + "learning_rate": 1.4279180277301493e-05, + "loss": 0.7162, + "step": 10375 + }, + { + "epoch": 0.36, + "learning_rate": 1.4278196116842468e-05, + "loss": 0.6615, + "step": 10376 + }, + { + "epoch": 0.36, + "learning_rate": 1.4277211905660015e-05, + "loss": 0.6531, + "step": 10377 + }, + { + "epoch": 0.36, + "learning_rate": 1.4276227643765807e-05, + "loss": 0.6114, + "step": 10378 + }, + { + "epoch": 0.36, + "learning_rate": 1.4275243331171513e-05, + "loss": 0.6118, + "step": 10379 + }, + { + "epoch": 0.36, + "learning_rate": 1.4274258967888797e-05, + "loss": 0.6298, + "step": 10380 + }, + { + "epoch": 0.36, + "learning_rate": 1.4273274553929335e-05, + "loss": 0.6565, + "step": 10381 + }, + { + "epoch": 0.36, + "learning_rate": 1.4272290089304796e-05, + "loss": 0.6455, + "step": 10382 + }, + { + "epoch": 0.36, + "learning_rate": 1.4271305574026856e-05, + "loss": 0.6146, + "step": 10383 + }, + { + "epoch": 0.36, + "learning_rate": 1.4270321008107185e-05, + "loss": 0.6082, + "step": 10384 + }, + { + "epoch": 0.36, + "learning_rate": 1.4269336391557456e-05, + "loss": 0.6483, + "step": 10385 + }, + { + "epoch": 0.36, + "learning_rate": 1.4268351724389342e-05, + "loss": 0.6219, + "step": 10386 + }, + { + "epoch": 0.36, + "learning_rate": 1.4267367006614519e-05, + "loss": 0.6292, + "step": 10387 + }, + { + "epoch": 0.36, + "learning_rate": 1.4266382238244664e-05, + "loss": 0.5824, + "step": 10388 + }, + { + "epoch": 0.36, + "learning_rate": 1.4265397419291449e-05, + "loss": 0.6292, + "step": 10389 + }, + { + "epoch": 0.36, + "learning_rate": 1.4264412549766551e-05, + "loss": 0.6351, + "step": 10390 + }, + { + "epoch": 0.36, + "learning_rate": 1.426342762968165e-05, + "loss": 0.6609, + "step": 10391 + }, + { + "epoch": 0.36, + "learning_rate": 1.4262442659048419e-05, + "loss": 0.6349, + "step": 10392 + }, + { + "epoch": 0.36, + "learning_rate": 1.426145763787854e-05, + "loss": 0.6738, + "step": 10393 + }, + { + "epoch": 0.36, + "learning_rate": 1.426047256618369e-05, + "loss": 0.6708, + "step": 10394 + }, + { + "epoch": 0.36, + "learning_rate": 1.4259487443975546e-05, + "loss": 0.6791, + "step": 10395 + }, + { + "epoch": 0.36, + "learning_rate": 1.425850227126579e-05, + "loss": 0.6636, + "step": 10396 + }, + { + "epoch": 0.36, + "learning_rate": 1.4257517048066108e-05, + "loss": 0.5987, + "step": 10397 + }, + { + "epoch": 0.36, + "learning_rate": 1.4256531774388169e-05, + "loss": 0.6028, + "step": 10398 + }, + { + "epoch": 0.36, + "learning_rate": 1.4255546450243665e-05, + "loss": 0.6374, + "step": 10399 + }, + { + "epoch": 0.36, + "learning_rate": 1.4254561075644273e-05, + "loss": 0.6203, + "step": 10400 + }, + { + "epoch": 0.36, + "learning_rate": 1.4253575650601677e-05, + "loss": 0.6457, + "step": 10401 + }, + { + "epoch": 0.36, + "learning_rate": 1.4252590175127562e-05, + "loss": 0.613, + "step": 10402 + }, + { + "epoch": 0.36, + "learning_rate": 1.4251604649233612e-05, + "loss": 0.6504, + "step": 10403 + }, + { + "epoch": 0.36, + "learning_rate": 1.425061907293151e-05, + "loss": 0.5912, + "step": 10404 + }, + { + "epoch": 0.36, + "learning_rate": 1.4249633446232937e-05, + "loss": 0.6707, + "step": 10405 + }, + { + "epoch": 0.36, + "learning_rate": 1.424864776914959e-05, + "loss": 0.6375, + "step": 10406 + }, + { + "epoch": 0.36, + "learning_rate": 1.4247662041693147e-05, + "loss": 0.6312, + "step": 10407 + }, + { + "epoch": 0.36, + "learning_rate": 1.4246676263875296e-05, + "loss": 0.6015, + "step": 10408 + }, + { + "epoch": 0.36, + "learning_rate": 1.4245690435707728e-05, + "loss": 0.6278, + "step": 10409 + }, + { + "epoch": 0.36, + "learning_rate": 1.4244704557202127e-05, + "loss": 0.6799, + "step": 10410 + }, + { + "epoch": 0.36, + "learning_rate": 1.4243718628370187e-05, + "loss": 0.5768, + "step": 10411 + }, + { + "epoch": 0.36, + "learning_rate": 1.4242732649223592e-05, + "loss": 0.6157, + "step": 10412 + }, + { + "epoch": 0.36, + "learning_rate": 1.4241746619774033e-05, + "loss": 0.619, + "step": 10413 + }, + { + "epoch": 0.36, + "learning_rate": 1.4240760540033204e-05, + "loss": 0.5696, + "step": 10414 + }, + { + "epoch": 0.36, + "learning_rate": 1.4239774410012794e-05, + "loss": 0.6541, + "step": 10415 + }, + { + "epoch": 0.36, + "learning_rate": 1.4238788229724494e-05, + "loss": 0.6158, + "step": 10416 + }, + { + "epoch": 0.36, + "learning_rate": 1.423780199918e-05, + "loss": 0.6052, + "step": 10417 + }, + { + "epoch": 0.36, + "learning_rate": 1.4236815718390999e-05, + "loss": 0.6011, + "step": 10418 + }, + { + "epoch": 0.36, + "learning_rate": 1.423582938736919e-05, + "loss": 0.648, + "step": 10419 + }, + { + "epoch": 0.36, + "learning_rate": 1.4234843006126265e-05, + "loss": 0.6317, + "step": 10420 + }, + { + "epoch": 0.36, + "learning_rate": 1.4233856574673918e-05, + "loss": 0.6141, + "step": 10421 + }, + { + "epoch": 0.36, + "learning_rate": 1.4232870093023845e-05, + "loss": 0.6667, + "step": 10422 + }, + { + "epoch": 0.36, + "learning_rate": 1.4231883561187747e-05, + "loss": 0.6248, + "step": 10423 + }, + { + "epoch": 0.36, + "learning_rate": 1.423089697917731e-05, + "loss": 0.652, + "step": 10424 + }, + { + "epoch": 0.36, + "learning_rate": 1.4229910347004241e-05, + "loss": 0.6416, + "step": 10425 + }, + { + "epoch": 0.36, + "learning_rate": 1.4228923664680235e-05, + "loss": 0.6136, + "step": 10426 + }, + { + "epoch": 0.36, + "learning_rate": 1.4227936932216986e-05, + "loss": 0.6797, + "step": 10427 + }, + { + "epoch": 0.36, + "learning_rate": 1.4226950149626198e-05, + "loss": 0.6129, + "step": 10428 + }, + { + "epoch": 0.36, + "learning_rate": 1.4225963316919569e-05, + "loss": 0.6285, + "step": 10429 + }, + { + "epoch": 0.36, + "learning_rate": 1.4224976434108796e-05, + "loss": 0.6156, + "step": 10430 + }, + { + "epoch": 0.36, + "learning_rate": 1.4223989501205586e-05, + "loss": 0.6048, + "step": 10431 + }, + { + "epoch": 0.36, + "learning_rate": 1.4223002518221638e-05, + "loss": 0.6523, + "step": 10432 + }, + { + "epoch": 0.36, + "learning_rate": 1.4222015485168649e-05, + "loss": 0.6432, + "step": 10433 + }, + { + "epoch": 0.36, + "learning_rate": 1.4221028402058329e-05, + "loss": 0.629, + "step": 10434 + }, + { + "epoch": 0.36, + "learning_rate": 1.4220041268902378e-05, + "loss": 0.6358, + "step": 10435 + }, + { + "epoch": 0.36, + "learning_rate": 1.4219054085712495e-05, + "loss": 0.6381, + "step": 10436 + }, + { + "epoch": 0.36, + "learning_rate": 1.4218066852500391e-05, + "loss": 0.6309, + "step": 10437 + }, + { + "epoch": 0.36, + "learning_rate": 1.4217079569277771e-05, + "loss": 0.6936, + "step": 10438 + }, + { + "epoch": 0.36, + "learning_rate": 1.4216092236056338e-05, + "loss": 0.6094, + "step": 10439 + }, + { + "epoch": 0.36, + "learning_rate": 1.4215104852847794e-05, + "loss": 0.679, + "step": 10440 + }, + { + "epoch": 0.36, + "learning_rate": 1.4214117419663853e-05, + "loss": 0.6018, + "step": 10441 + }, + { + "epoch": 0.36, + "learning_rate": 1.4213129936516219e-05, + "loss": 0.6242, + "step": 10442 + }, + { + "epoch": 0.36, + "learning_rate": 1.42121424034166e-05, + "loss": 0.6087, + "step": 10443 + }, + { + "epoch": 0.36, + "learning_rate": 1.4211154820376705e-05, + "loss": 0.712, + "step": 10444 + }, + { + "epoch": 0.36, + "learning_rate": 1.421016718740824e-05, + "loss": 0.6286, + "step": 10445 + }, + { + "epoch": 0.36, + "learning_rate": 1.4209179504522919e-05, + "loss": 0.6323, + "step": 10446 + }, + { + "epoch": 0.36, + "learning_rate": 1.420819177173245e-05, + "loss": 0.6035, + "step": 10447 + }, + { + "epoch": 0.36, + "learning_rate": 1.4207203989048544e-05, + "loss": 0.6812, + "step": 10448 + }, + { + "epoch": 0.36, + "learning_rate": 1.420621615648291e-05, + "loss": 0.6713, + "step": 10449 + }, + { + "epoch": 0.36, + "learning_rate": 1.4205228274047267e-05, + "loss": 0.6315, + "step": 10450 + }, + { + "epoch": 0.36, + "learning_rate": 1.4204240341753321e-05, + "loss": 0.6407, + "step": 10451 + }, + { + "epoch": 0.36, + "learning_rate": 1.4203252359612787e-05, + "loss": 0.5906, + "step": 10452 + }, + { + "epoch": 0.36, + "learning_rate": 1.420226432763738e-05, + "loss": 0.632, + "step": 10453 + }, + { + "epoch": 0.36, + "learning_rate": 1.4201276245838812e-05, + "loss": 0.6074, + "step": 10454 + }, + { + "epoch": 0.36, + "learning_rate": 1.4200288114228799e-05, + "loss": 0.6328, + "step": 10455 + }, + { + "epoch": 0.36, + "learning_rate": 1.4199299932819062e-05, + "loss": 0.6733, + "step": 10456 + }, + { + "epoch": 0.36, + "learning_rate": 1.4198311701621308e-05, + "loss": 0.6147, + "step": 10457 + }, + { + "epoch": 0.36, + "learning_rate": 1.4197323420647258e-05, + "loss": 0.6128, + "step": 10458 + }, + { + "epoch": 0.36, + "learning_rate": 1.4196335089908631e-05, + "loss": 0.5887, + "step": 10459 + }, + { + "epoch": 0.36, + "learning_rate": 1.4195346709417141e-05, + "loss": 0.6764, + "step": 10460 + }, + { + "epoch": 0.36, + "learning_rate": 1.4194358279184508e-05, + "loss": 0.65, + "step": 10461 + }, + { + "epoch": 0.36, + "learning_rate": 1.4193369799222456e-05, + "loss": 0.6304, + "step": 10462 + }, + { + "epoch": 0.36, + "learning_rate": 1.4192381269542697e-05, + "loss": 0.671, + "step": 10463 + }, + { + "epoch": 0.36, + "learning_rate": 1.4191392690156956e-05, + "loss": 0.6125, + "step": 10464 + }, + { + "epoch": 0.36, + "learning_rate": 1.4190404061076952e-05, + "loss": 0.6411, + "step": 10465 + }, + { + "epoch": 0.36, + "learning_rate": 1.4189415382314407e-05, + "loss": 0.6789, + "step": 10466 + }, + { + "epoch": 0.36, + "learning_rate": 1.418842665388104e-05, + "loss": 0.6514, + "step": 10467 + }, + { + "epoch": 0.36, + "learning_rate": 1.4187437875788581e-05, + "loss": 0.6005, + "step": 10468 + }, + { + "epoch": 0.36, + "learning_rate": 1.418644904804875e-05, + "loss": 0.6062, + "step": 10469 + }, + { + "epoch": 0.36, + "learning_rate": 1.4185460170673263e-05, + "loss": 0.6622, + "step": 10470 + }, + { + "epoch": 0.36, + "learning_rate": 1.4184471243673859e-05, + "loss": 0.6373, + "step": 10471 + }, + { + "epoch": 0.36, + "learning_rate": 1.418348226706225e-05, + "loss": 0.6313, + "step": 10472 + }, + { + "epoch": 0.36, + "learning_rate": 1.4182493240850169e-05, + "loss": 0.6579, + "step": 10473 + }, + { + "epoch": 0.36, + "learning_rate": 1.4181504165049336e-05, + "loss": 0.6454, + "step": 10474 + }, + { + "epoch": 0.36, + "learning_rate": 1.4180515039671485e-05, + "loss": 0.6082, + "step": 10475 + }, + { + "epoch": 0.36, + "learning_rate": 1.4179525864728338e-05, + "loss": 0.6902, + "step": 10476 + }, + { + "epoch": 0.36, + "learning_rate": 1.4178536640231625e-05, + "loss": 0.6198, + "step": 10477 + }, + { + "epoch": 0.36, + "learning_rate": 1.4177547366193076e-05, + "loss": 0.5814, + "step": 10478 + }, + { + "epoch": 0.36, + "learning_rate": 1.4176558042624418e-05, + "loss": 0.6171, + "step": 10479 + }, + { + "epoch": 0.36, + "learning_rate": 1.4175568669537379e-05, + "loss": 0.6463, + "step": 10480 + }, + { + "epoch": 0.36, + "learning_rate": 1.4174579246943693e-05, + "loss": 0.6133, + "step": 10481 + }, + { + "epoch": 0.36, + "learning_rate": 1.4173589774855087e-05, + "loss": 0.6176, + "step": 10482 + }, + { + "epoch": 0.36, + "learning_rate": 1.4172600253283296e-05, + "loss": 0.6017, + "step": 10483 + }, + { + "epoch": 0.36, + "learning_rate": 1.4171610682240054e-05, + "loss": 0.5933, + "step": 10484 + }, + { + "epoch": 0.36, + "learning_rate": 1.4170621061737084e-05, + "loss": 0.6267, + "step": 10485 + }, + { + "epoch": 0.36, + "learning_rate": 1.4169631391786129e-05, + "loss": 0.6105, + "step": 10486 + }, + { + "epoch": 0.36, + "learning_rate": 1.416864167239892e-05, + "loss": 0.6237, + "step": 10487 + }, + { + "epoch": 0.36, + "learning_rate": 1.416765190358719e-05, + "loss": 0.6021, + "step": 10488 + }, + { + "epoch": 0.36, + "learning_rate": 1.4166662085362673e-05, + "loss": 0.6587, + "step": 10489 + }, + { + "epoch": 0.36, + "learning_rate": 1.4165672217737108e-05, + "loss": 0.62, + "step": 10490 + }, + { + "epoch": 0.36, + "learning_rate": 1.4164682300722228e-05, + "loss": 0.5843, + "step": 10491 + }, + { + "epoch": 0.36, + "learning_rate": 1.416369233432977e-05, + "loss": 0.638, + "step": 10492 + }, + { + "epoch": 0.36, + "learning_rate": 1.4162702318571473e-05, + "loss": 0.6897, + "step": 10493 + }, + { + "epoch": 0.36, + "learning_rate": 1.4161712253459075e-05, + "loss": 0.652, + "step": 10494 + }, + { + "epoch": 0.36, + "learning_rate": 1.4160722139004312e-05, + "loss": 0.5983, + "step": 10495 + }, + { + "epoch": 0.36, + "learning_rate": 1.4159731975218928e-05, + "loss": 0.6619, + "step": 10496 + }, + { + "epoch": 0.36, + "learning_rate": 1.4158741762114656e-05, + "loss": 0.5781, + "step": 10497 + }, + { + "epoch": 0.36, + "learning_rate": 1.4157751499703241e-05, + "loss": 0.6553, + "step": 10498 + }, + { + "epoch": 0.36, + "learning_rate": 1.4156761187996425e-05, + "loss": 0.6358, + "step": 10499 + }, + { + "epoch": 0.36, + "learning_rate": 1.4155770827005943e-05, + "loss": 0.6291, + "step": 10500 + }, + { + "epoch": 0.36, + "learning_rate": 1.4154780416743541e-05, + "loss": 0.6042, + "step": 10501 + }, + { + "epoch": 0.36, + "learning_rate": 1.4153789957220964e-05, + "loss": 0.6911, + "step": 10502 + }, + { + "epoch": 0.36, + "learning_rate": 1.415279944844995e-05, + "loss": 0.6703, + "step": 10503 + }, + { + "epoch": 0.36, + "learning_rate": 1.4151808890442247e-05, + "loss": 0.6829, + "step": 10504 + }, + { + "epoch": 0.36, + "learning_rate": 1.4150818283209595e-05, + "loss": 0.6876, + "step": 10505 + }, + { + "epoch": 0.36, + "learning_rate": 1.4149827626763744e-05, + "loss": 0.6137, + "step": 10506 + }, + { + "epoch": 0.36, + "learning_rate": 1.4148836921116435e-05, + "loss": 0.6552, + "step": 10507 + }, + { + "epoch": 0.36, + "learning_rate": 1.4147846166279418e-05, + "loss": 0.6458, + "step": 10508 + }, + { + "epoch": 0.36, + "learning_rate": 1.4146855362264435e-05, + "loss": 0.6009, + "step": 10509 + }, + { + "epoch": 0.36, + "learning_rate": 1.4145864509083238e-05, + "loss": 0.6189, + "step": 10510 + }, + { + "epoch": 0.36, + "learning_rate": 1.4144873606747571e-05, + "loss": 0.6423, + "step": 10511 + }, + { + "epoch": 0.36, + "learning_rate": 1.4143882655269185e-05, + "loss": 0.6179, + "step": 10512 + }, + { + "epoch": 0.36, + "learning_rate": 1.4142891654659829e-05, + "loss": 0.5811, + "step": 10513 + }, + { + "epoch": 0.36, + "learning_rate": 1.4141900604931252e-05, + "loss": 0.6129, + "step": 10514 + }, + { + "epoch": 0.36, + "learning_rate": 1.4140909506095201e-05, + "loss": 0.6075, + "step": 10515 + }, + { + "epoch": 0.36, + "learning_rate": 1.4139918358163434e-05, + "loss": 0.5947, + "step": 10516 + }, + { + "epoch": 0.36, + "learning_rate": 1.4138927161147693e-05, + "loss": 0.601, + "step": 10517 + }, + { + "epoch": 0.36, + "learning_rate": 1.4137935915059737e-05, + "loss": 0.6222, + "step": 10518 + }, + { + "epoch": 0.36, + "learning_rate": 1.4136944619911317e-05, + "loss": 0.6348, + "step": 10519 + }, + { + "epoch": 0.36, + "learning_rate": 1.4135953275714184e-05, + "loss": 0.6178, + "step": 10520 + }, + { + "epoch": 0.36, + "learning_rate": 1.4134961882480091e-05, + "loss": 0.6376, + "step": 10521 + }, + { + "epoch": 0.36, + "learning_rate": 1.4133970440220799e-05, + "loss": 0.609, + "step": 10522 + }, + { + "epoch": 0.36, + "learning_rate": 1.4132978948948055e-05, + "loss": 0.6565, + "step": 10523 + }, + { + "epoch": 0.36, + "learning_rate": 1.4131987408673618e-05, + "loss": 0.6222, + "step": 10524 + }, + { + "epoch": 0.36, + "learning_rate": 1.4130995819409243e-05, + "loss": 0.6863, + "step": 10525 + }, + { + "epoch": 0.36, + "learning_rate": 1.4130004181166686e-05, + "loss": 0.5793, + "step": 10526 + }, + { + "epoch": 0.36, + "learning_rate": 1.4129012493957706e-05, + "loss": 0.5768, + "step": 10527 + }, + { + "epoch": 0.36, + "learning_rate": 1.412802075779406e-05, + "loss": 0.616, + "step": 10528 + }, + { + "epoch": 0.36, + "learning_rate": 1.4127028972687504e-05, + "loss": 0.6982, + "step": 10529 + }, + { + "epoch": 0.36, + "learning_rate": 1.41260371386498e-05, + "loss": 0.6356, + "step": 10530 + }, + { + "epoch": 0.36, + "learning_rate": 1.4125045255692707e-05, + "loss": 0.7041, + "step": 10531 + }, + { + "epoch": 0.36, + "learning_rate": 1.4124053323827983e-05, + "loss": 0.6457, + "step": 10532 + }, + { + "epoch": 0.36, + "learning_rate": 1.412306134306739e-05, + "loss": 0.6115, + "step": 10533 + }, + { + "epoch": 0.36, + "learning_rate": 1.412206931342269e-05, + "loss": 0.6092, + "step": 10534 + }, + { + "epoch": 0.37, + "learning_rate": 1.4121077234905643e-05, + "loss": 0.6598, + "step": 10535 + }, + { + "epoch": 0.37, + "learning_rate": 1.4120085107528012e-05, + "loss": 0.6603, + "step": 10536 + }, + { + "epoch": 0.37, + "learning_rate": 1.4119092931301563e-05, + "loss": 0.6415, + "step": 10537 + }, + { + "epoch": 0.37, + "learning_rate": 1.4118100706238051e-05, + "loss": 0.673, + "step": 10538 + }, + { + "epoch": 0.37, + "learning_rate": 1.411710843234925e-05, + "loss": 0.6301, + "step": 10539 + }, + { + "epoch": 0.37, + "learning_rate": 1.411611610964692e-05, + "loss": 0.657, + "step": 10540 + }, + { + "epoch": 0.37, + "learning_rate": 1.4115123738142826e-05, + "loss": 0.6369, + "step": 10541 + }, + { + "epoch": 0.37, + "learning_rate": 1.4114131317848733e-05, + "loss": 0.6049, + "step": 10542 + }, + { + "epoch": 0.37, + "learning_rate": 1.4113138848776413e-05, + "loss": 0.6514, + "step": 10543 + }, + { + "epoch": 0.37, + "learning_rate": 1.4112146330937627e-05, + "loss": 0.6383, + "step": 10544 + }, + { + "epoch": 0.37, + "learning_rate": 1.411115376434414e-05, + "loss": 0.6643, + "step": 10545 + }, + { + "epoch": 0.37, + "learning_rate": 1.4110161149007731e-05, + "loss": 0.5871, + "step": 10546 + }, + { + "epoch": 0.37, + "learning_rate": 1.4109168484940157e-05, + "loss": 0.6488, + "step": 10547 + }, + { + "epoch": 0.37, + "learning_rate": 1.4108175772153195e-05, + "loss": 0.6158, + "step": 10548 + }, + { + "epoch": 0.37, + "learning_rate": 1.4107183010658612e-05, + "loss": 0.6425, + "step": 10549 + }, + { + "epoch": 0.37, + "learning_rate": 1.4106190200468177e-05, + "loss": 0.6286, + "step": 10550 + }, + { + "epoch": 0.37, + "learning_rate": 1.4105197341593666e-05, + "loss": 0.5698, + "step": 10551 + }, + { + "epoch": 0.37, + "learning_rate": 1.4104204434046847e-05, + "loss": 0.6476, + "step": 10552 + }, + { + "epoch": 0.37, + "learning_rate": 1.4103211477839491e-05, + "loss": 0.6236, + "step": 10553 + }, + { + "epoch": 0.37, + "learning_rate": 1.4102218472983372e-05, + "loss": 0.637, + "step": 10554 + }, + { + "epoch": 0.37, + "learning_rate": 1.4101225419490265e-05, + "loss": 0.5853, + "step": 10555 + }, + { + "epoch": 0.37, + "learning_rate": 1.4100232317371943e-05, + "loss": 0.6633, + "step": 10556 + }, + { + "epoch": 0.37, + "learning_rate": 1.4099239166640177e-05, + "loss": 0.6037, + "step": 10557 + }, + { + "epoch": 0.37, + "learning_rate": 1.409824596730675e-05, + "loss": 0.5872, + "step": 10558 + }, + { + "epoch": 0.37, + "learning_rate": 1.409725271938343e-05, + "loss": 0.6128, + "step": 10559 + }, + { + "epoch": 0.37, + "learning_rate": 1.4096259422881992e-05, + "loss": 0.6356, + "step": 10560 + }, + { + "epoch": 0.37, + "learning_rate": 1.4095266077814224e-05, + "loss": 0.6709, + "step": 10561 + }, + { + "epoch": 0.37, + "learning_rate": 1.4094272684191891e-05, + "loss": 0.5922, + "step": 10562 + }, + { + "epoch": 0.37, + "learning_rate": 1.4093279242026778e-05, + "loss": 0.6726, + "step": 10563 + }, + { + "epoch": 0.37, + "learning_rate": 1.4092285751330663e-05, + "loss": 0.6256, + "step": 10564 + }, + { + "epoch": 0.37, + "learning_rate": 1.4091292212115322e-05, + "loss": 0.6301, + "step": 10565 + }, + { + "epoch": 0.37, + "learning_rate": 1.4090298624392538e-05, + "loss": 0.5409, + "step": 10566 + }, + { + "epoch": 0.37, + "learning_rate": 1.4089304988174086e-05, + "loss": 0.6865, + "step": 10567 + }, + { + "epoch": 0.37, + "learning_rate": 1.4088311303471751e-05, + "loss": 0.5843, + "step": 10568 + }, + { + "epoch": 0.37, + "learning_rate": 1.4087317570297319e-05, + "loss": 0.6176, + "step": 10569 + }, + { + "epoch": 0.37, + "learning_rate": 1.408632378866256e-05, + "loss": 0.6183, + "step": 10570 + }, + { + "epoch": 0.37, + "learning_rate": 1.4085329958579266e-05, + "loss": 0.608, + "step": 10571 + }, + { + "epoch": 0.37, + "learning_rate": 1.408433608005922e-05, + "loss": 0.6016, + "step": 10572 + }, + { + "epoch": 0.37, + "learning_rate": 1.40833421531142e-05, + "loss": 0.6069, + "step": 10573 + }, + { + "epoch": 0.37, + "learning_rate": 1.4082348177755992e-05, + "loss": 0.6427, + "step": 10574 + }, + { + "epoch": 0.37, + "learning_rate": 1.4081354153996385e-05, + "loss": 0.6425, + "step": 10575 + }, + { + "epoch": 0.37, + "learning_rate": 1.408036008184716e-05, + "loss": 0.6472, + "step": 10576 + }, + { + "epoch": 0.37, + "learning_rate": 1.4079365961320105e-05, + "loss": 0.6319, + "step": 10577 + }, + { + "epoch": 0.37, + "learning_rate": 1.4078371792427008e-05, + "loss": 0.6475, + "step": 10578 + }, + { + "epoch": 0.37, + "learning_rate": 1.4077377575179651e-05, + "loss": 0.6302, + "step": 10579 + }, + { + "epoch": 0.37, + "learning_rate": 1.4076383309589825e-05, + "loss": 0.6499, + "step": 10580 + }, + { + "epoch": 0.37, + "learning_rate": 1.4075388995669321e-05, + "loss": 0.58, + "step": 10581 + }, + { + "epoch": 0.37, + "learning_rate": 1.4074394633429924e-05, + "loss": 0.6367, + "step": 10582 + }, + { + "epoch": 0.37, + "learning_rate": 1.4073400222883425e-05, + "loss": 0.6459, + "step": 10583 + }, + { + "epoch": 0.37, + "learning_rate": 1.4072405764041612e-05, + "loss": 0.6553, + "step": 10584 + }, + { + "epoch": 0.37, + "learning_rate": 1.4071411256916276e-05, + "loss": 0.6229, + "step": 10585 + }, + { + "epoch": 0.37, + "learning_rate": 1.4070416701519211e-05, + "loss": 0.6811, + "step": 10586 + }, + { + "epoch": 0.37, + "learning_rate": 1.4069422097862209e-05, + "loss": 0.5607, + "step": 10587 + }, + { + "epoch": 0.37, + "learning_rate": 1.4068427445957058e-05, + "loss": 0.6911, + "step": 10588 + }, + { + "epoch": 0.37, + "learning_rate": 1.406743274581555e-05, + "loss": 0.6348, + "step": 10589 + }, + { + "epoch": 0.37, + "learning_rate": 1.4066437997449488e-05, + "loss": 0.6213, + "step": 10590 + }, + { + "epoch": 0.37, + "learning_rate": 1.4065443200870655e-05, + "loss": 0.6005, + "step": 10591 + }, + { + "epoch": 0.37, + "learning_rate": 1.406444835609085e-05, + "loss": 0.6762, + "step": 10592 + }, + { + "epoch": 0.37, + "learning_rate": 1.406345346312187e-05, + "loss": 0.6445, + "step": 10593 + }, + { + "epoch": 0.37, + "learning_rate": 1.4062458521975507e-05, + "loss": 0.6112, + "step": 10594 + }, + { + "epoch": 0.37, + "learning_rate": 1.406146353266356e-05, + "loss": 0.6223, + "step": 10595 + }, + { + "epoch": 0.37, + "learning_rate": 1.4060468495197825e-05, + "loss": 0.6131, + "step": 10596 + }, + { + "epoch": 0.37, + "learning_rate": 1.4059473409590103e-05, + "loss": 0.6326, + "step": 10597 + }, + { + "epoch": 0.37, + "learning_rate": 1.4058478275852184e-05, + "loss": 0.6503, + "step": 10598 + }, + { + "epoch": 0.37, + "learning_rate": 1.4057483093995872e-05, + "loss": 0.6453, + "step": 10599 + }, + { + "epoch": 0.37, + "learning_rate": 1.4056487864032966e-05, + "loss": 0.6197, + "step": 10600 + }, + { + "epoch": 0.37, + "learning_rate": 1.4055492585975263e-05, + "loss": 0.6673, + "step": 10601 + }, + { + "epoch": 0.37, + "learning_rate": 1.4054497259834567e-05, + "loss": 0.6669, + "step": 10602 + }, + { + "epoch": 0.37, + "learning_rate": 1.4053501885622679e-05, + "loss": 0.5629, + "step": 10603 + }, + { + "epoch": 0.37, + "learning_rate": 1.4052506463351392e-05, + "loss": 0.5705, + "step": 10604 + }, + { + "epoch": 0.37, + "learning_rate": 1.405151099303252e-05, + "loss": 0.6158, + "step": 10605 + }, + { + "epoch": 0.37, + "learning_rate": 1.405051547467786e-05, + "loss": 0.6093, + "step": 10606 + }, + { + "epoch": 0.37, + "learning_rate": 1.404951990829921e-05, + "loss": 0.6201, + "step": 10607 + }, + { + "epoch": 0.37, + "learning_rate": 1.4048524293908383e-05, + "loss": 0.7032, + "step": 10608 + }, + { + "epoch": 0.37, + "learning_rate": 1.404752863151718e-05, + "loss": 0.6484, + "step": 10609 + }, + { + "epoch": 0.37, + "learning_rate": 1.4046532921137401e-05, + "loss": 0.6452, + "step": 10610 + }, + { + "epoch": 0.37, + "learning_rate": 1.4045537162780858e-05, + "loss": 0.6984, + "step": 10611 + }, + { + "epoch": 0.37, + "learning_rate": 1.4044541356459357e-05, + "loss": 0.6622, + "step": 10612 + }, + { + "epoch": 0.37, + "learning_rate": 1.4043545502184696e-05, + "loss": 0.5997, + "step": 10613 + }, + { + "epoch": 0.37, + "learning_rate": 1.404254959996869e-05, + "loss": 0.5988, + "step": 10614 + }, + { + "epoch": 0.37, + "learning_rate": 1.404155364982315e-05, + "loss": 0.6128, + "step": 10615 + }, + { + "epoch": 0.37, + "learning_rate": 1.404055765175987e-05, + "loss": 0.6578, + "step": 10616 + }, + { + "epoch": 0.37, + "learning_rate": 1.4039561605790673e-05, + "loss": 0.6177, + "step": 10617 + }, + { + "epoch": 0.37, + "learning_rate": 1.4038565511927364e-05, + "loss": 0.7078, + "step": 10618 + }, + { + "epoch": 0.37, + "learning_rate": 1.4037569370181748e-05, + "loss": 0.6363, + "step": 10619 + }, + { + "epoch": 0.37, + "learning_rate": 1.4036573180565642e-05, + "loss": 0.6118, + "step": 10620 + }, + { + "epoch": 0.37, + "learning_rate": 1.4035576943090857e-05, + "loss": 0.6402, + "step": 10621 + }, + { + "epoch": 0.37, + "learning_rate": 1.4034580657769196e-05, + "loss": 0.654, + "step": 10622 + }, + { + "epoch": 0.37, + "learning_rate": 1.4033584324612482e-05, + "loss": 0.6573, + "step": 10623 + }, + { + "epoch": 0.37, + "learning_rate": 1.4032587943632523e-05, + "loss": 0.6249, + "step": 10624 + }, + { + "epoch": 0.37, + "learning_rate": 1.403159151484113e-05, + "loss": 0.6003, + "step": 10625 + }, + { + "epoch": 0.37, + "learning_rate": 1.4030595038250123e-05, + "loss": 0.6259, + "step": 10626 + }, + { + "epoch": 0.37, + "learning_rate": 1.4029598513871314e-05, + "loss": 0.6736, + "step": 10627 + }, + { + "epoch": 0.37, + "learning_rate": 1.4028601941716514e-05, + "loss": 0.5895, + "step": 10628 + }, + { + "epoch": 0.37, + "learning_rate": 1.4027605321797542e-05, + "loss": 0.6445, + "step": 10629 + }, + { + "epoch": 0.37, + "learning_rate": 1.4026608654126217e-05, + "loss": 0.5936, + "step": 10630 + }, + { + "epoch": 0.37, + "learning_rate": 1.402561193871435e-05, + "loss": 0.6007, + "step": 10631 + }, + { + "epoch": 0.37, + "learning_rate": 1.4024615175573759e-05, + "loss": 0.6652, + "step": 10632 + }, + { + "epoch": 0.37, + "learning_rate": 1.402361836471627e-05, + "loss": 0.5859, + "step": 10633 + }, + { + "epoch": 0.37, + "learning_rate": 1.402262150615369e-05, + "loss": 0.5791, + "step": 10634 + }, + { + "epoch": 0.37, + "learning_rate": 1.4021624599897844e-05, + "loss": 0.5734, + "step": 10635 + }, + { + "epoch": 0.37, + "learning_rate": 1.4020627645960554e-05, + "loss": 0.6606, + "step": 10636 + }, + { + "epoch": 0.37, + "learning_rate": 1.4019630644353634e-05, + "loss": 0.6261, + "step": 10637 + }, + { + "epoch": 0.37, + "learning_rate": 1.4018633595088908e-05, + "loss": 0.6567, + "step": 10638 + }, + { + "epoch": 0.37, + "learning_rate": 1.4017636498178199e-05, + "loss": 0.5598, + "step": 10639 + }, + { + "epoch": 0.37, + "learning_rate": 1.4016639353633327e-05, + "loss": 0.6117, + "step": 10640 + }, + { + "epoch": 0.37, + "learning_rate": 1.4015642161466115e-05, + "loss": 0.7032, + "step": 10641 + }, + { + "epoch": 0.37, + "learning_rate": 1.4014644921688385e-05, + "loss": 0.6668, + "step": 10642 + }, + { + "epoch": 0.37, + "learning_rate": 1.4013647634311957e-05, + "loss": 0.6348, + "step": 10643 + }, + { + "epoch": 0.37, + "learning_rate": 1.4012650299348662e-05, + "loss": 0.6152, + "step": 10644 + }, + { + "epoch": 0.37, + "learning_rate": 1.4011652916810322e-05, + "loss": 0.6232, + "step": 10645 + }, + { + "epoch": 0.37, + "learning_rate": 1.4010655486708762e-05, + "loss": 0.6099, + "step": 10646 + }, + { + "epoch": 0.37, + "learning_rate": 1.4009658009055806e-05, + "loss": 0.6179, + "step": 10647 + }, + { + "epoch": 0.37, + "learning_rate": 1.4008660483863286e-05, + "loss": 0.6227, + "step": 10648 + }, + { + "epoch": 0.37, + "learning_rate": 1.400766291114302e-05, + "loss": 0.6693, + "step": 10649 + }, + { + "epoch": 0.37, + "learning_rate": 1.4006665290906844e-05, + "loss": 0.6273, + "step": 10650 + }, + { + "epoch": 0.37, + "learning_rate": 1.4005667623166583e-05, + "loss": 0.6809, + "step": 10651 + }, + { + "epoch": 0.37, + "learning_rate": 1.4004669907934062e-05, + "loss": 0.6431, + "step": 10652 + }, + { + "epoch": 0.37, + "learning_rate": 1.4003672145221115e-05, + "loss": 0.6497, + "step": 10653 + }, + { + "epoch": 0.37, + "learning_rate": 1.400267433503957e-05, + "loss": 0.6235, + "step": 10654 + }, + { + "epoch": 0.37, + "learning_rate": 1.4001676477401257e-05, + "loss": 0.6452, + "step": 10655 + }, + { + "epoch": 0.37, + "learning_rate": 1.4000678572318007e-05, + "loss": 0.5731, + "step": 10656 + }, + { + "epoch": 0.37, + "learning_rate": 1.3999680619801652e-05, + "loss": 0.588, + "step": 10657 + }, + { + "epoch": 0.37, + "learning_rate": 1.3998682619864023e-05, + "loss": 0.6634, + "step": 10658 + }, + { + "epoch": 0.37, + "learning_rate": 1.3997684572516956e-05, + "loss": 0.6303, + "step": 10659 + }, + { + "epoch": 0.37, + "learning_rate": 1.3996686477772277e-05, + "loss": 0.6322, + "step": 10660 + }, + { + "epoch": 0.37, + "learning_rate": 1.3995688335641826e-05, + "loss": 0.6251, + "step": 10661 + }, + { + "epoch": 0.37, + "learning_rate": 1.3994690146137437e-05, + "loss": 0.7022, + "step": 10662 + }, + { + "epoch": 0.37, + "learning_rate": 1.3993691909270941e-05, + "loss": 0.6436, + "step": 10663 + }, + { + "epoch": 0.37, + "learning_rate": 1.3992693625054175e-05, + "loss": 0.7223, + "step": 10664 + }, + { + "epoch": 0.37, + "learning_rate": 1.3991695293498976e-05, + "loss": 0.6075, + "step": 10665 + }, + { + "epoch": 0.37, + "learning_rate": 1.399069691461718e-05, + "loss": 0.6113, + "step": 10666 + }, + { + "epoch": 0.37, + "learning_rate": 1.3989698488420623e-05, + "loss": 0.6464, + "step": 10667 + }, + { + "epoch": 0.37, + "learning_rate": 1.3988700014921146e-05, + "loss": 0.63, + "step": 10668 + }, + { + "epoch": 0.37, + "learning_rate": 1.398770149413058e-05, + "loss": 0.6375, + "step": 10669 + }, + { + "epoch": 0.37, + "learning_rate": 1.398670292606077e-05, + "loss": 0.6954, + "step": 10670 + }, + { + "epoch": 0.37, + "learning_rate": 1.3985704310723555e-05, + "loss": 0.6518, + "step": 10671 + }, + { + "epoch": 0.37, + "learning_rate": 1.3984705648130774e-05, + "loss": 0.6637, + "step": 10672 + }, + { + "epoch": 0.37, + "learning_rate": 1.3983706938294263e-05, + "loss": 0.6569, + "step": 10673 + }, + { + "epoch": 0.37, + "learning_rate": 1.3982708181225873e-05, + "loss": 0.6683, + "step": 10674 + }, + { + "epoch": 0.37, + "learning_rate": 1.3981709376937436e-05, + "loss": 0.632, + "step": 10675 + }, + { + "epoch": 0.37, + "learning_rate": 1.3980710525440797e-05, + "loss": 0.6527, + "step": 10676 + }, + { + "epoch": 0.37, + "learning_rate": 1.39797116267478e-05, + "loss": 0.7086, + "step": 10677 + }, + { + "epoch": 0.37, + "learning_rate": 1.3978712680870286e-05, + "loss": 0.6101, + "step": 10678 + }, + { + "epoch": 0.37, + "learning_rate": 1.39777136878201e-05, + "loss": 0.6303, + "step": 10679 + }, + { + "epoch": 0.37, + "learning_rate": 1.3976714647609089e-05, + "loss": 0.6416, + "step": 10680 + }, + { + "epoch": 0.37, + "learning_rate": 1.3975715560249092e-05, + "loss": 0.6425, + "step": 10681 + }, + { + "epoch": 0.37, + "learning_rate": 1.397471642575196e-05, + "loss": 0.6406, + "step": 10682 + }, + { + "epoch": 0.37, + "learning_rate": 1.3973717244129537e-05, + "loss": 0.5999, + "step": 10683 + }, + { + "epoch": 0.37, + "learning_rate": 1.3972718015393667e-05, + "loss": 0.6219, + "step": 10684 + }, + { + "epoch": 0.37, + "learning_rate": 1.39717187395562e-05, + "loss": 0.6644, + "step": 10685 + }, + { + "epoch": 0.37, + "learning_rate": 1.3970719416628985e-05, + "loss": 0.6203, + "step": 10686 + }, + { + "epoch": 0.37, + "learning_rate": 1.3969720046623867e-05, + "loss": 0.6873, + "step": 10687 + }, + { + "epoch": 0.37, + "learning_rate": 1.3968720629552697e-05, + "loss": 0.6118, + "step": 10688 + }, + { + "epoch": 0.37, + "learning_rate": 1.3967721165427324e-05, + "loss": 0.6198, + "step": 10689 + }, + { + "epoch": 0.37, + "learning_rate": 1.3966721654259596e-05, + "loss": 0.5749, + "step": 10690 + }, + { + "epoch": 0.37, + "learning_rate": 1.3965722096061362e-05, + "loss": 0.6331, + "step": 10691 + }, + { + "epoch": 0.37, + "learning_rate": 1.396472249084448e-05, + "loss": 0.6021, + "step": 10692 + }, + { + "epoch": 0.37, + "learning_rate": 1.3963722838620797e-05, + "loss": 0.5921, + "step": 10693 + }, + { + "epoch": 0.37, + "learning_rate": 1.3962723139402164e-05, + "loss": 0.6337, + "step": 10694 + }, + { + "epoch": 0.37, + "learning_rate": 1.3961723393200438e-05, + "loss": 0.6762, + "step": 10695 + }, + { + "epoch": 0.37, + "learning_rate": 1.3960723600027469e-05, + "loss": 0.5917, + "step": 10696 + }, + { + "epoch": 0.37, + "learning_rate": 1.3959723759895108e-05, + "loss": 0.6377, + "step": 10697 + }, + { + "epoch": 0.37, + "learning_rate": 1.3958723872815214e-05, + "loss": 0.5656, + "step": 10698 + }, + { + "epoch": 0.37, + "learning_rate": 1.3957723938799643e-05, + "loss": 0.5877, + "step": 10699 + }, + { + "epoch": 0.37, + "learning_rate": 1.3956723957860245e-05, + "loss": 0.5981, + "step": 10700 + }, + { + "epoch": 0.37, + "learning_rate": 1.3955723930008881e-05, + "loss": 0.6549, + "step": 10701 + }, + { + "epoch": 0.37, + "learning_rate": 1.3954723855257408e-05, + "loss": 0.6955, + "step": 10702 + }, + { + "epoch": 0.37, + "learning_rate": 1.3953723733617676e-05, + "loss": 0.6556, + "step": 10703 + }, + { + "epoch": 0.37, + "learning_rate": 1.3952723565101552e-05, + "loss": 0.6519, + "step": 10704 + }, + { + "epoch": 0.37, + "learning_rate": 1.395172334972089e-05, + "loss": 0.6524, + "step": 10705 + }, + { + "epoch": 0.37, + "learning_rate": 1.3950723087487546e-05, + "loss": 0.6283, + "step": 10706 + }, + { + "epoch": 0.37, + "learning_rate": 1.3949722778413383e-05, + "loss": 0.6338, + "step": 10707 + }, + { + "epoch": 0.37, + "learning_rate": 1.3948722422510262e-05, + "loss": 0.639, + "step": 10708 + }, + { + "epoch": 0.37, + "learning_rate": 1.3947722019790036e-05, + "loss": 0.6602, + "step": 10709 + }, + { + "epoch": 0.37, + "learning_rate": 1.3946721570264577e-05, + "loss": 0.6613, + "step": 10710 + }, + { + "epoch": 0.37, + "learning_rate": 1.3945721073945741e-05, + "loss": 0.6336, + "step": 10711 + }, + { + "epoch": 0.37, + "learning_rate": 1.3944720530845386e-05, + "loss": 0.5937, + "step": 10712 + }, + { + "epoch": 0.37, + "learning_rate": 1.3943719940975381e-05, + "loss": 0.6996, + "step": 10713 + }, + { + "epoch": 0.37, + "learning_rate": 1.3942719304347591e-05, + "loss": 0.6301, + "step": 10714 + }, + { + "epoch": 0.37, + "learning_rate": 1.394171862097387e-05, + "loss": 0.6067, + "step": 10715 + }, + { + "epoch": 0.37, + "learning_rate": 1.3940717890866093e-05, + "loss": 0.6232, + "step": 10716 + }, + { + "epoch": 0.37, + "learning_rate": 1.3939717114036121e-05, + "loss": 0.643, + "step": 10717 + }, + { + "epoch": 0.37, + "learning_rate": 1.3938716290495812e-05, + "loss": 0.6514, + "step": 10718 + }, + { + "epoch": 0.37, + "learning_rate": 1.3937715420257048e-05, + "loss": 0.6648, + "step": 10719 + }, + { + "epoch": 0.37, + "learning_rate": 1.3936714503331683e-05, + "loss": 0.6986, + "step": 10720 + }, + { + "epoch": 0.37, + "learning_rate": 1.3935713539731586e-05, + "loss": 0.5827, + "step": 10721 + }, + { + "epoch": 0.37, + "learning_rate": 1.3934712529468627e-05, + "loss": 0.6449, + "step": 10722 + }, + { + "epoch": 0.37, + "learning_rate": 1.3933711472554674e-05, + "loss": 0.607, + "step": 10723 + }, + { + "epoch": 0.37, + "learning_rate": 1.3932710369001594e-05, + "loss": 0.6478, + "step": 10724 + }, + { + "epoch": 0.37, + "learning_rate": 1.3931709218821259e-05, + "loss": 0.6469, + "step": 10725 + }, + { + "epoch": 0.37, + "learning_rate": 1.3930708022025537e-05, + "loss": 0.6241, + "step": 10726 + }, + { + "epoch": 0.37, + "learning_rate": 1.3929706778626297e-05, + "loss": 0.6815, + "step": 10727 + }, + { + "epoch": 0.37, + "learning_rate": 1.3928705488635414e-05, + "loss": 0.6639, + "step": 10728 + }, + { + "epoch": 0.37, + "learning_rate": 1.392770415206476e-05, + "loss": 0.6217, + "step": 10729 + }, + { + "epoch": 0.37, + "learning_rate": 1.3926702768926202e-05, + "loss": 0.6222, + "step": 10730 + }, + { + "epoch": 0.37, + "learning_rate": 1.3925701339231614e-05, + "loss": 0.6145, + "step": 10731 + }, + { + "epoch": 0.37, + "learning_rate": 1.3924699862992874e-05, + "loss": 0.6528, + "step": 10732 + }, + { + "epoch": 0.37, + "learning_rate": 1.3923698340221852e-05, + "loss": 0.6294, + "step": 10733 + }, + { + "epoch": 0.37, + "learning_rate": 1.3922696770930419e-05, + "loss": 0.6184, + "step": 10734 + }, + { + "epoch": 0.37, + "learning_rate": 1.3921695155130456e-05, + "loss": 0.673, + "step": 10735 + }, + { + "epoch": 0.37, + "learning_rate": 1.3920693492833836e-05, + "loss": 0.6196, + "step": 10736 + }, + { + "epoch": 0.37, + "learning_rate": 1.3919691784052436e-05, + "loss": 0.6464, + "step": 10737 + }, + { + "epoch": 0.37, + "learning_rate": 1.391869002879813e-05, + "loss": 0.6325, + "step": 10738 + }, + { + "epoch": 0.37, + "learning_rate": 1.3917688227082797e-05, + "loss": 0.6321, + "step": 10739 + }, + { + "epoch": 0.37, + "learning_rate": 1.3916686378918314e-05, + "loss": 0.6758, + "step": 10740 + }, + { + "epoch": 0.37, + "learning_rate": 1.3915684484316559e-05, + "loss": 0.5876, + "step": 10741 + }, + { + "epoch": 0.37, + "learning_rate": 1.391468254328941e-05, + "loss": 0.6766, + "step": 10742 + }, + { + "epoch": 0.37, + "learning_rate": 1.391368055584875e-05, + "loss": 0.6057, + "step": 10743 + }, + { + "epoch": 0.37, + "learning_rate": 1.3912678522006456e-05, + "loss": 0.6097, + "step": 10744 + }, + { + "epoch": 0.37, + "learning_rate": 1.3911676441774406e-05, + "loss": 0.6257, + "step": 10745 + }, + { + "epoch": 0.37, + "learning_rate": 1.3910674315164486e-05, + "loss": 0.6204, + "step": 10746 + }, + { + "epoch": 0.37, + "learning_rate": 1.3909672142188575e-05, + "loss": 0.6241, + "step": 10747 + }, + { + "epoch": 0.37, + "learning_rate": 1.3908669922858554e-05, + "loss": 0.6588, + "step": 10748 + }, + { + "epoch": 0.37, + "learning_rate": 1.3907667657186306e-05, + "loss": 0.631, + "step": 10749 + }, + { + "epoch": 0.37, + "learning_rate": 1.3906665345183715e-05, + "loss": 0.6801, + "step": 10750 + }, + { + "epoch": 0.37, + "learning_rate": 1.3905662986862665e-05, + "loss": 0.6643, + "step": 10751 + }, + { + "epoch": 0.37, + "learning_rate": 1.3904660582235039e-05, + "loss": 0.6662, + "step": 10752 + }, + { + "epoch": 0.37, + "learning_rate": 1.3903658131312723e-05, + "loss": 0.649, + "step": 10753 + }, + { + "epoch": 0.37, + "learning_rate": 1.39026556341076e-05, + "loss": 0.6426, + "step": 10754 + }, + { + "epoch": 0.37, + "learning_rate": 1.3901653090631562e-05, + "loss": 0.6142, + "step": 10755 + }, + { + "epoch": 0.37, + "learning_rate": 1.3900650500896485e-05, + "loss": 0.6513, + "step": 10756 + }, + { + "epoch": 0.37, + "learning_rate": 1.3899647864914265e-05, + "loss": 0.5645, + "step": 10757 + }, + { + "epoch": 0.37, + "learning_rate": 1.3898645182696786e-05, + "loss": 0.6302, + "step": 10758 + }, + { + "epoch": 0.37, + "learning_rate": 1.3897642454255937e-05, + "loss": 0.6431, + "step": 10759 + }, + { + "epoch": 0.37, + "learning_rate": 1.3896639679603606e-05, + "loss": 0.6087, + "step": 10760 + }, + { + "epoch": 0.37, + "learning_rate": 1.3895636858751682e-05, + "loss": 0.7021, + "step": 10761 + }, + { + "epoch": 0.37, + "learning_rate": 1.3894633991712056e-05, + "loss": 0.6343, + "step": 10762 + }, + { + "epoch": 0.37, + "learning_rate": 1.3893631078496617e-05, + "loss": 0.6328, + "step": 10763 + }, + { + "epoch": 0.37, + "learning_rate": 1.3892628119117255e-05, + "loss": 0.6611, + "step": 10764 + }, + { + "epoch": 0.37, + "learning_rate": 1.3891625113585866e-05, + "loss": 0.6407, + "step": 10765 + }, + { + "epoch": 0.37, + "learning_rate": 1.3890622061914331e-05, + "loss": 0.6211, + "step": 10766 + }, + { + "epoch": 0.37, + "learning_rate": 1.3889618964114557e-05, + "loss": 0.6401, + "step": 10767 + }, + { + "epoch": 0.37, + "learning_rate": 1.3888615820198426e-05, + "loss": 0.6156, + "step": 10768 + }, + { + "epoch": 0.37, + "learning_rate": 1.3887612630177836e-05, + "loss": 0.6239, + "step": 10769 + }, + { + "epoch": 0.37, + "learning_rate": 1.3886609394064682e-05, + "loss": 0.619, + "step": 10770 + }, + { + "epoch": 0.37, + "learning_rate": 1.3885606111870854e-05, + "loss": 0.6031, + "step": 10771 + }, + { + "epoch": 0.37, + "learning_rate": 1.3884602783608255e-05, + "loss": 0.6644, + "step": 10772 + }, + { + "epoch": 0.37, + "learning_rate": 1.3883599409288772e-05, + "loss": 0.6124, + "step": 10773 + }, + { + "epoch": 0.37, + "learning_rate": 1.3882595988924306e-05, + "loss": 0.6318, + "step": 10774 + }, + { + "epoch": 0.37, + "learning_rate": 1.3881592522526752e-05, + "loss": 0.6727, + "step": 10775 + }, + { + "epoch": 0.37, + "learning_rate": 1.3880589010108012e-05, + "loss": 0.6701, + "step": 10776 + }, + { + "epoch": 0.37, + "learning_rate": 1.3879585451679978e-05, + "loss": 0.6366, + "step": 10777 + }, + { + "epoch": 0.37, + "learning_rate": 1.387858184725455e-05, + "loss": 0.6118, + "step": 10778 + }, + { + "epoch": 0.37, + "learning_rate": 1.3877578196843629e-05, + "loss": 0.5655, + "step": 10779 + }, + { + "epoch": 0.37, + "learning_rate": 1.3876574500459113e-05, + "loss": 0.6884, + "step": 10780 + }, + { + "epoch": 0.37, + "learning_rate": 1.3875570758112902e-05, + "loss": 0.6235, + "step": 10781 + }, + { + "epoch": 0.37, + "learning_rate": 1.3874566969816898e-05, + "loss": 0.625, + "step": 10782 + }, + { + "epoch": 0.37, + "learning_rate": 1.3873563135583e-05, + "loss": 0.6225, + "step": 10783 + }, + { + "epoch": 0.37, + "learning_rate": 1.387255925542311e-05, + "loss": 0.6257, + "step": 10784 + }, + { + "epoch": 0.37, + "learning_rate": 1.3871555329349135e-05, + "loss": 0.5832, + "step": 10785 + }, + { + "epoch": 0.37, + "learning_rate": 1.3870551357372972e-05, + "loss": 0.6088, + "step": 10786 + }, + { + "epoch": 0.37, + "learning_rate": 1.3869547339506526e-05, + "loss": 0.5867, + "step": 10787 + }, + { + "epoch": 0.37, + "learning_rate": 1.3868543275761702e-05, + "loss": 0.6246, + "step": 10788 + }, + { + "epoch": 0.37, + "learning_rate": 1.38675391661504e-05, + "loss": 0.6541, + "step": 10789 + }, + { + "epoch": 0.37, + "learning_rate": 1.3866535010684534e-05, + "loss": 0.6076, + "step": 10790 + }, + { + "epoch": 0.37, + "learning_rate": 1.3865530809376002e-05, + "loss": 0.6169, + "step": 10791 + }, + { + "epoch": 0.37, + "learning_rate": 1.3864526562236713e-05, + "loss": 0.6415, + "step": 10792 + }, + { + "epoch": 0.37, + "learning_rate": 1.3863522269278571e-05, + "loss": 0.6598, + "step": 10793 + }, + { + "epoch": 0.37, + "learning_rate": 1.3862517930513489e-05, + "loss": 0.6274, + "step": 10794 + }, + { + "epoch": 0.37, + "learning_rate": 1.3861513545953367e-05, + "loss": 0.6615, + "step": 10795 + }, + { + "epoch": 0.37, + "learning_rate": 1.3860509115610116e-05, + "loss": 0.5709, + "step": 10796 + }, + { + "epoch": 0.37, + "learning_rate": 1.3859504639495651e-05, + "loss": 0.6785, + "step": 10797 + }, + { + "epoch": 0.37, + "learning_rate": 1.3858500117621873e-05, + "loss": 0.6217, + "step": 10798 + }, + { + "epoch": 0.37, + "learning_rate": 1.3857495550000695e-05, + "loss": 0.6292, + "step": 10799 + }, + { + "epoch": 0.37, + "learning_rate": 1.385649093664403e-05, + "loss": 0.6719, + "step": 10800 + }, + { + "epoch": 0.37, + "learning_rate": 1.3855486277563784e-05, + "loss": 0.5342, + "step": 10801 + }, + { + "epoch": 0.37, + "learning_rate": 1.3854481572771872e-05, + "loss": 0.6522, + "step": 10802 + }, + { + "epoch": 0.37, + "learning_rate": 1.3853476822280205e-05, + "loss": 0.6748, + "step": 10803 + }, + { + "epoch": 0.37, + "learning_rate": 1.3852472026100693e-05, + "loss": 0.6603, + "step": 10804 + }, + { + "epoch": 0.37, + "learning_rate": 1.3851467184245256e-05, + "loss": 0.6021, + "step": 10805 + }, + { + "epoch": 0.37, + "learning_rate": 1.3850462296725802e-05, + "loss": 0.6222, + "step": 10806 + }, + { + "epoch": 0.37, + "learning_rate": 1.3849457363554245e-05, + "loss": 0.6407, + "step": 10807 + }, + { + "epoch": 0.37, + "learning_rate": 1.3848452384742502e-05, + "loss": 0.6371, + "step": 10808 + }, + { + "epoch": 0.37, + "learning_rate": 1.3847447360302489e-05, + "loss": 0.6532, + "step": 10809 + }, + { + "epoch": 0.37, + "learning_rate": 1.3846442290246119e-05, + "loss": 0.6602, + "step": 10810 + }, + { + "epoch": 0.37, + "learning_rate": 1.3845437174585307e-05, + "loss": 0.6224, + "step": 10811 + }, + { + "epoch": 0.37, + "learning_rate": 1.3844432013331978e-05, + "loss": 0.6329, + "step": 10812 + }, + { + "epoch": 0.37, + "learning_rate": 1.3843426806498041e-05, + "loss": 0.6421, + "step": 10813 + }, + { + "epoch": 0.37, + "learning_rate": 1.3842421554095422e-05, + "loss": 0.6732, + "step": 10814 + }, + { + "epoch": 0.37, + "learning_rate": 1.3841416256136029e-05, + "loss": 0.6372, + "step": 10815 + }, + { + "epoch": 0.37, + "learning_rate": 1.384041091263179e-05, + "loss": 0.5767, + "step": 10816 + }, + { + "epoch": 0.37, + "learning_rate": 1.3839405523594623e-05, + "loss": 0.6327, + "step": 10817 + }, + { + "epoch": 0.37, + "learning_rate": 1.3838400089036444e-05, + "loss": 0.6352, + "step": 10818 + }, + { + "epoch": 0.37, + "learning_rate": 1.3837394608969175e-05, + "loss": 0.6257, + "step": 10819 + }, + { + "epoch": 0.37, + "learning_rate": 1.3836389083404739e-05, + "loss": 0.6446, + "step": 10820 + }, + { + "epoch": 0.37, + "learning_rate": 1.3835383512355058e-05, + "loss": 0.6431, + "step": 10821 + }, + { + "epoch": 0.37, + "learning_rate": 1.3834377895832055e-05, + "loss": 0.5698, + "step": 10822 + }, + { + "epoch": 0.37, + "learning_rate": 1.3833372233847652e-05, + "loss": 0.6509, + "step": 10823 + }, + { + "epoch": 0.38, + "learning_rate": 1.3832366526413772e-05, + "loss": 0.5905, + "step": 10824 + }, + { + "epoch": 0.38, + "learning_rate": 1.3831360773542334e-05, + "loss": 0.6146, + "step": 10825 + }, + { + "epoch": 0.38, + "learning_rate": 1.3830354975245275e-05, + "loss": 0.5626, + "step": 10826 + }, + { + "epoch": 0.38, + "learning_rate": 1.3829349131534507e-05, + "loss": 0.639, + "step": 10827 + }, + { + "epoch": 0.38, + "learning_rate": 1.3828343242421961e-05, + "loss": 0.6106, + "step": 10828 + }, + { + "epoch": 0.38, + "learning_rate": 1.3827337307919567e-05, + "loss": 0.6243, + "step": 10829 + }, + { + "epoch": 0.38, + "learning_rate": 1.3826331328039242e-05, + "loss": 0.6616, + "step": 10830 + }, + { + "epoch": 0.38, + "learning_rate": 1.3825325302792925e-05, + "loss": 0.6218, + "step": 10831 + }, + { + "epoch": 0.38, + "learning_rate": 1.3824319232192532e-05, + "loss": 0.6324, + "step": 10832 + }, + { + "epoch": 0.38, + "learning_rate": 1.382331311625e-05, + "loss": 0.6092, + "step": 10833 + }, + { + "epoch": 0.38, + "learning_rate": 1.3822306954977252e-05, + "loss": 0.6658, + "step": 10834 + }, + { + "epoch": 0.38, + "learning_rate": 1.3821300748386222e-05, + "loss": 0.6255, + "step": 10835 + }, + { + "epoch": 0.38, + "learning_rate": 1.3820294496488835e-05, + "loss": 0.6067, + "step": 10836 + }, + { + "epoch": 0.38, + "learning_rate": 1.3819288199297027e-05, + "loss": 0.6495, + "step": 10837 + }, + { + "epoch": 0.38, + "learning_rate": 1.3818281856822725e-05, + "loss": 0.5935, + "step": 10838 + }, + { + "epoch": 0.38, + "learning_rate": 1.381727546907786e-05, + "loss": 0.6663, + "step": 10839 + }, + { + "epoch": 0.38, + "learning_rate": 1.3816269036074368e-05, + "loss": 0.6682, + "step": 10840 + }, + { + "epoch": 0.38, + "learning_rate": 1.3815262557824177e-05, + "loss": 0.5754, + "step": 10841 + }, + { + "epoch": 0.38, + "learning_rate": 1.3814256034339221e-05, + "loss": 0.633, + "step": 10842 + }, + { + "epoch": 0.38, + "learning_rate": 1.3813249465631437e-05, + "loss": 0.656, + "step": 10843 + }, + { + "epoch": 0.38, + "learning_rate": 1.3812242851712756e-05, + "loss": 0.6144, + "step": 10844 + }, + { + "epoch": 0.38, + "learning_rate": 1.3811236192595115e-05, + "loss": 0.622, + "step": 10845 + }, + { + "epoch": 0.38, + "learning_rate": 1.3810229488290445e-05, + "loss": 0.6086, + "step": 10846 + }, + { + "epoch": 0.38, + "learning_rate": 1.3809222738810685e-05, + "loss": 0.5857, + "step": 10847 + }, + { + "epoch": 0.38, + "learning_rate": 1.3808215944167774e-05, + "loss": 0.6119, + "step": 10848 + }, + { + "epoch": 0.38, + "learning_rate": 1.3807209104373643e-05, + "loss": 0.6826, + "step": 10849 + }, + { + "epoch": 0.38, + "learning_rate": 1.380620221944023e-05, + "loss": 0.6125, + "step": 10850 + }, + { + "epoch": 0.38, + "learning_rate": 1.3805195289379478e-05, + "loss": 0.6653, + "step": 10851 + }, + { + "epoch": 0.38, + "learning_rate": 1.3804188314203319e-05, + "loss": 0.6394, + "step": 10852 + }, + { + "epoch": 0.38, + "learning_rate": 1.3803181293923697e-05, + "loss": 0.6372, + "step": 10853 + }, + { + "epoch": 0.38, + "learning_rate": 1.3802174228552552e-05, + "loss": 0.6248, + "step": 10854 + }, + { + "epoch": 0.38, + "learning_rate": 1.380116711810182e-05, + "loss": 0.7018, + "step": 10855 + }, + { + "epoch": 0.38, + "learning_rate": 1.3800159962583442e-05, + "loss": 0.6406, + "step": 10856 + }, + { + "epoch": 0.38, + "learning_rate": 1.3799152762009363e-05, + "loss": 0.6479, + "step": 10857 + }, + { + "epoch": 0.38, + "learning_rate": 1.379814551639152e-05, + "loss": 0.6541, + "step": 10858 + }, + { + "epoch": 0.38, + "learning_rate": 1.3797138225741856e-05, + "loss": 0.6637, + "step": 10859 + }, + { + "epoch": 0.38, + "learning_rate": 1.379613089007232e-05, + "loss": 0.6274, + "step": 10860 + }, + { + "epoch": 0.38, + "learning_rate": 1.3795123509394843e-05, + "loss": 0.6858, + "step": 10861 + }, + { + "epoch": 0.38, + "learning_rate": 1.3794116083721381e-05, + "loss": 0.6335, + "step": 10862 + }, + { + "epoch": 0.38, + "learning_rate": 1.3793108613063872e-05, + "loss": 0.6073, + "step": 10863 + }, + { + "epoch": 0.38, + "learning_rate": 1.379210109743426e-05, + "loss": 0.6604, + "step": 10864 + }, + { + "epoch": 0.38, + "learning_rate": 1.3791093536844495e-05, + "loss": 0.6481, + "step": 10865 + }, + { + "epoch": 0.38, + "learning_rate": 1.3790085931306521e-05, + "loss": 0.66, + "step": 10866 + }, + { + "epoch": 0.38, + "learning_rate": 1.3789078280832283e-05, + "loss": 0.6529, + "step": 10867 + }, + { + "epoch": 0.38, + "learning_rate": 1.3788070585433729e-05, + "loss": 0.5969, + "step": 10868 + }, + { + "epoch": 0.38, + "learning_rate": 1.3787062845122805e-05, + "loss": 0.6111, + "step": 10869 + }, + { + "epoch": 0.38, + "learning_rate": 1.378605505991146e-05, + "loss": 0.5514, + "step": 10870 + }, + { + "epoch": 0.38, + "learning_rate": 1.3785047229811644e-05, + "loss": 0.597, + "step": 10871 + }, + { + "epoch": 0.38, + "learning_rate": 1.3784039354835306e-05, + "loss": 0.6354, + "step": 10872 + }, + { + "epoch": 0.38, + "learning_rate": 1.3783031434994393e-05, + "loss": 0.6438, + "step": 10873 + }, + { + "epoch": 0.38, + "learning_rate": 1.3782023470300855e-05, + "loss": 0.6749, + "step": 10874 + }, + { + "epoch": 0.38, + "learning_rate": 1.3781015460766648e-05, + "loss": 0.6647, + "step": 10875 + }, + { + "epoch": 0.38, + "learning_rate": 1.3780007406403719e-05, + "loss": 0.6705, + "step": 10876 + }, + { + "epoch": 0.38, + "learning_rate": 1.3778999307224019e-05, + "loss": 0.6322, + "step": 10877 + }, + { + "epoch": 0.38, + "learning_rate": 1.3777991163239506e-05, + "loss": 0.5414, + "step": 10878 + }, + { + "epoch": 0.38, + "learning_rate": 1.3776982974462123e-05, + "loss": 0.6058, + "step": 10879 + }, + { + "epoch": 0.38, + "learning_rate": 1.3775974740903831e-05, + "loss": 0.65, + "step": 10880 + }, + { + "epoch": 0.38, + "learning_rate": 1.3774966462576585e-05, + "loss": 0.5934, + "step": 10881 + }, + { + "epoch": 0.38, + "learning_rate": 1.3773958139492329e-05, + "loss": 0.6231, + "step": 10882 + }, + { + "epoch": 0.38, + "learning_rate": 1.3772949771663031e-05, + "loss": 0.6942, + "step": 10883 + }, + { + "epoch": 0.38, + "learning_rate": 1.377194135910064e-05, + "loss": 0.6671, + "step": 10884 + }, + { + "epoch": 0.38, + "learning_rate": 1.3770932901817112e-05, + "loss": 0.6739, + "step": 10885 + }, + { + "epoch": 0.38, + "learning_rate": 1.3769924399824402e-05, + "loss": 0.5587, + "step": 10886 + }, + { + "epoch": 0.38, + "learning_rate": 1.3768915853134472e-05, + "loss": 0.6185, + "step": 10887 + }, + { + "epoch": 0.38, + "learning_rate": 1.3767907261759276e-05, + "loss": 0.6458, + "step": 10888 + }, + { + "epoch": 0.38, + "learning_rate": 1.3766898625710771e-05, + "loss": 0.6399, + "step": 10889 + }, + { + "epoch": 0.38, + "learning_rate": 1.3765889945000922e-05, + "loss": 0.6712, + "step": 10890 + }, + { + "epoch": 0.38, + "learning_rate": 1.3764881219641682e-05, + "loss": 0.6243, + "step": 10891 + }, + { + "epoch": 0.38, + "learning_rate": 1.376387244964501e-05, + "loss": 0.6308, + "step": 10892 + }, + { + "epoch": 0.38, + "learning_rate": 1.3762863635022871e-05, + "loss": 0.6202, + "step": 10893 + }, + { + "epoch": 0.38, + "learning_rate": 1.3761854775787224e-05, + "loss": 0.6175, + "step": 10894 + }, + { + "epoch": 0.38, + "learning_rate": 1.3760845871950028e-05, + "loss": 0.581, + "step": 10895 + }, + { + "epoch": 0.38, + "learning_rate": 1.3759836923523251e-05, + "loss": 0.5653, + "step": 10896 + }, + { + "epoch": 0.38, + "learning_rate": 1.3758827930518846e-05, + "loss": 0.6297, + "step": 10897 + }, + { + "epoch": 0.38, + "learning_rate": 1.3757818892948782e-05, + "loss": 0.6204, + "step": 10898 + }, + { + "epoch": 0.38, + "learning_rate": 1.3756809810825024e-05, + "loss": 0.6246, + "step": 10899 + }, + { + "epoch": 0.38, + "learning_rate": 1.3755800684159531e-05, + "loss": 0.6514, + "step": 10900 + }, + { + "epoch": 0.38, + "learning_rate": 1.3754791512964269e-05, + "loss": 0.6434, + "step": 10901 + }, + { + "epoch": 0.38, + "learning_rate": 1.3753782297251206e-05, + "loss": 0.6093, + "step": 10902 + }, + { + "epoch": 0.38, + "learning_rate": 1.3752773037032303e-05, + "loss": 0.6106, + "step": 10903 + }, + { + "epoch": 0.38, + "learning_rate": 1.3751763732319529e-05, + "loss": 0.6399, + "step": 10904 + }, + { + "epoch": 0.38, + "learning_rate": 1.3750754383124853e-05, + "loss": 0.6204, + "step": 10905 + }, + { + "epoch": 0.38, + "learning_rate": 1.3749744989460236e-05, + "loss": 0.6971, + "step": 10906 + }, + { + "epoch": 0.38, + "learning_rate": 1.3748735551337649e-05, + "loss": 0.6708, + "step": 10907 + }, + { + "epoch": 0.38, + "learning_rate": 1.3747726068769063e-05, + "loss": 0.6145, + "step": 10908 + }, + { + "epoch": 0.38, + "learning_rate": 1.3746716541766438e-05, + "loss": 0.6419, + "step": 10909 + }, + { + "epoch": 0.38, + "learning_rate": 1.3745706970341755e-05, + "loss": 0.6306, + "step": 10910 + }, + { + "epoch": 0.38, + "learning_rate": 1.3744697354506972e-05, + "loss": 0.6429, + "step": 10911 + }, + { + "epoch": 0.38, + "learning_rate": 1.3743687694274068e-05, + "loss": 0.593, + "step": 10912 + }, + { + "epoch": 0.38, + "learning_rate": 1.3742677989655012e-05, + "loss": 0.6274, + "step": 10913 + }, + { + "epoch": 0.38, + "learning_rate": 1.3741668240661769e-05, + "loss": 0.6789, + "step": 10914 + }, + { + "epoch": 0.38, + "learning_rate": 1.3740658447306316e-05, + "loss": 0.6102, + "step": 10915 + }, + { + "epoch": 0.38, + "learning_rate": 1.3739648609600631e-05, + "loss": 0.6118, + "step": 10916 + }, + { + "epoch": 0.38, + "learning_rate": 1.3738638727556676e-05, + "loss": 0.7153, + "step": 10917 + }, + { + "epoch": 0.38, + "learning_rate": 1.373762880118643e-05, + "loss": 0.6634, + "step": 10918 + }, + { + "epoch": 0.38, + "learning_rate": 1.3736618830501869e-05, + "loss": 0.6387, + "step": 10919 + }, + { + "epoch": 0.38, + "learning_rate": 1.3735608815514963e-05, + "loss": 0.6053, + "step": 10920 + }, + { + "epoch": 0.38, + "learning_rate": 1.3734598756237687e-05, + "loss": 0.5979, + "step": 10921 + }, + { + "epoch": 0.38, + "learning_rate": 1.3733588652682024e-05, + "loss": 0.6026, + "step": 10922 + }, + { + "epoch": 0.38, + "learning_rate": 1.3732578504859939e-05, + "loss": 0.6293, + "step": 10923 + }, + { + "epoch": 0.38, + "learning_rate": 1.3731568312783416e-05, + "loss": 0.6104, + "step": 10924 + }, + { + "epoch": 0.38, + "learning_rate": 1.3730558076464433e-05, + "loss": 0.711, + "step": 10925 + }, + { + "epoch": 0.38, + "learning_rate": 1.3729547795914961e-05, + "loss": 0.6878, + "step": 10926 + }, + { + "epoch": 0.38, + "learning_rate": 1.3728537471146983e-05, + "loss": 0.5558, + "step": 10927 + }, + { + "epoch": 0.38, + "learning_rate": 1.3727527102172478e-05, + "loss": 0.6408, + "step": 10928 + }, + { + "epoch": 0.38, + "learning_rate": 1.3726516689003422e-05, + "loss": 0.6857, + "step": 10929 + }, + { + "epoch": 0.38, + "learning_rate": 1.3725506231651797e-05, + "loss": 0.6788, + "step": 10930 + }, + { + "epoch": 0.38, + "learning_rate": 1.3724495730129585e-05, + "loss": 0.6266, + "step": 10931 + }, + { + "epoch": 0.38, + "learning_rate": 1.3723485184448762e-05, + "loss": 0.621, + "step": 10932 + }, + { + "epoch": 0.38, + "learning_rate": 1.3722474594621312e-05, + "loss": 0.5708, + "step": 10933 + }, + { + "epoch": 0.38, + "learning_rate": 1.3721463960659218e-05, + "loss": 0.6046, + "step": 10934 + }, + { + "epoch": 0.38, + "learning_rate": 1.372045328257446e-05, + "loss": 0.6151, + "step": 10935 + }, + { + "epoch": 0.38, + "learning_rate": 1.3719442560379022e-05, + "loss": 0.6058, + "step": 10936 + }, + { + "epoch": 0.38, + "learning_rate": 1.371843179408489e-05, + "loss": 0.6278, + "step": 10937 + }, + { + "epoch": 0.38, + "learning_rate": 1.3717420983704042e-05, + "loss": 0.6083, + "step": 10938 + }, + { + "epoch": 0.38, + "learning_rate": 1.3716410129248465e-05, + "loss": 0.6449, + "step": 10939 + }, + { + "epoch": 0.38, + "learning_rate": 1.3715399230730148e-05, + "loss": 0.6582, + "step": 10940 + }, + { + "epoch": 0.38, + "learning_rate": 1.3714388288161074e-05, + "loss": 0.6113, + "step": 10941 + }, + { + "epoch": 0.38, + "learning_rate": 1.3713377301553221e-05, + "loss": 0.6721, + "step": 10942 + }, + { + "epoch": 0.38, + "learning_rate": 1.3712366270918589e-05, + "loss": 0.6192, + "step": 10943 + }, + { + "epoch": 0.38, + "learning_rate": 1.3711355196269158e-05, + "loss": 0.6192, + "step": 10944 + }, + { + "epoch": 0.38, + "learning_rate": 1.3710344077616912e-05, + "loss": 0.6734, + "step": 10945 + }, + { + "epoch": 0.38, + "learning_rate": 1.370933291497385e-05, + "loss": 0.5825, + "step": 10946 + }, + { + "epoch": 0.38, + "learning_rate": 1.370832170835195e-05, + "loss": 0.6348, + "step": 10947 + }, + { + "epoch": 0.38, + "learning_rate": 1.3707310457763204e-05, + "loss": 0.6139, + "step": 10948 + }, + { + "epoch": 0.38, + "learning_rate": 1.3706299163219605e-05, + "loss": 0.6421, + "step": 10949 + }, + { + "epoch": 0.38, + "learning_rate": 1.3705287824733142e-05, + "loss": 0.6681, + "step": 10950 + }, + { + "epoch": 0.38, + "learning_rate": 1.37042764423158e-05, + "loss": 0.6274, + "step": 10951 + }, + { + "epoch": 0.38, + "learning_rate": 1.3703265015979579e-05, + "loss": 0.6561, + "step": 10952 + }, + { + "epoch": 0.38, + "learning_rate": 1.3702253545736466e-05, + "loss": 0.6197, + "step": 10953 + }, + { + "epoch": 0.38, + "learning_rate": 1.3701242031598452e-05, + "loss": 0.6618, + "step": 10954 + }, + { + "epoch": 0.38, + "learning_rate": 1.3700230473577534e-05, + "loss": 0.5926, + "step": 10955 + }, + { + "epoch": 0.38, + "learning_rate": 1.3699218871685702e-05, + "loss": 0.611, + "step": 10956 + }, + { + "epoch": 0.38, + "learning_rate": 1.3698207225934947e-05, + "loss": 0.6388, + "step": 10957 + }, + { + "epoch": 0.38, + "learning_rate": 1.3697195536337274e-05, + "loss": 0.6137, + "step": 10958 + }, + { + "epoch": 0.38, + "learning_rate": 1.3696183802904668e-05, + "loss": 0.6335, + "step": 10959 + }, + { + "epoch": 0.38, + "learning_rate": 1.3695172025649124e-05, + "loss": 0.6222, + "step": 10960 + }, + { + "epoch": 0.38, + "learning_rate": 1.3694160204582645e-05, + "loss": 0.649, + "step": 10961 + }, + { + "epoch": 0.38, + "learning_rate": 1.3693148339717223e-05, + "loss": 0.6256, + "step": 10962 + }, + { + "epoch": 0.38, + "learning_rate": 1.3692136431064853e-05, + "loss": 0.6404, + "step": 10963 + }, + { + "epoch": 0.38, + "learning_rate": 1.3691124478637538e-05, + "loss": 0.612, + "step": 10964 + }, + { + "epoch": 0.38, + "learning_rate": 1.3690112482447276e-05, + "loss": 0.5746, + "step": 10965 + }, + { + "epoch": 0.38, + "learning_rate": 1.3689100442506055e-05, + "loss": 0.5571, + "step": 10966 + }, + { + "epoch": 0.38, + "learning_rate": 1.3688088358825887e-05, + "loss": 0.5486, + "step": 10967 + }, + { + "epoch": 0.38, + "learning_rate": 1.3687076231418765e-05, + "loss": 0.6103, + "step": 10968 + }, + { + "epoch": 0.38, + "learning_rate": 1.3686064060296687e-05, + "loss": 0.6193, + "step": 10969 + }, + { + "epoch": 0.38, + "learning_rate": 1.368505184547166e-05, + "loss": 0.6186, + "step": 10970 + }, + { + "epoch": 0.38, + "learning_rate": 1.3684039586955682e-05, + "loss": 0.5786, + "step": 10971 + }, + { + "epoch": 0.38, + "learning_rate": 1.3683027284760752e-05, + "loss": 0.6378, + "step": 10972 + }, + { + "epoch": 0.38, + "learning_rate": 1.3682014938898875e-05, + "loss": 0.6396, + "step": 10973 + }, + { + "epoch": 0.38, + "learning_rate": 1.3681002549382057e-05, + "loss": 0.637, + "step": 10974 + }, + { + "epoch": 0.38, + "learning_rate": 1.3679990116222292e-05, + "loss": 0.6643, + "step": 10975 + }, + { + "epoch": 0.38, + "learning_rate": 1.3678977639431592e-05, + "loss": 0.681, + "step": 10976 + }, + { + "epoch": 0.38, + "learning_rate": 1.3677965119021957e-05, + "loss": 0.618, + "step": 10977 + }, + { + "epoch": 0.38, + "learning_rate": 1.3676952555005394e-05, + "loss": 0.6945, + "step": 10978 + }, + { + "epoch": 0.38, + "learning_rate": 1.3675939947393904e-05, + "loss": 0.649, + "step": 10979 + }, + { + "epoch": 0.38, + "learning_rate": 1.3674927296199501e-05, + "loss": 0.6671, + "step": 10980 + }, + { + "epoch": 0.38, + "learning_rate": 1.3673914601434182e-05, + "loss": 0.6112, + "step": 10981 + }, + { + "epoch": 0.38, + "learning_rate": 1.3672901863109958e-05, + "loss": 0.5933, + "step": 10982 + }, + { + "epoch": 0.38, + "learning_rate": 1.3671889081238839e-05, + "loss": 0.6189, + "step": 10983 + }, + { + "epoch": 0.38, + "learning_rate": 1.3670876255832826e-05, + "loss": 0.6718, + "step": 10984 + }, + { + "epoch": 0.38, + "learning_rate": 1.3669863386903935e-05, + "loss": 0.6265, + "step": 10985 + }, + { + "epoch": 0.38, + "learning_rate": 1.3668850474464171e-05, + "loss": 0.6458, + "step": 10986 + }, + { + "epoch": 0.38, + "learning_rate": 1.366783751852554e-05, + "loss": 0.6235, + "step": 10987 + }, + { + "epoch": 0.38, + "learning_rate": 1.3666824519100057e-05, + "loss": 0.5818, + "step": 10988 + }, + { + "epoch": 0.38, + "learning_rate": 1.3665811476199733e-05, + "loss": 0.6525, + "step": 10989 + }, + { + "epoch": 0.38, + "learning_rate": 1.3664798389836573e-05, + "loss": 0.6264, + "step": 10990 + }, + { + "epoch": 0.38, + "learning_rate": 1.3663785260022593e-05, + "loss": 0.6525, + "step": 10991 + }, + { + "epoch": 0.38, + "learning_rate": 1.3662772086769807e-05, + "loss": 0.6633, + "step": 10992 + }, + { + "epoch": 0.38, + "learning_rate": 1.3661758870090221e-05, + "loss": 0.5786, + "step": 10993 + }, + { + "epoch": 0.38, + "learning_rate": 1.3660745609995853e-05, + "loss": 0.6299, + "step": 10994 + }, + { + "epoch": 0.38, + "learning_rate": 1.3659732306498716e-05, + "loss": 0.6739, + "step": 10995 + }, + { + "epoch": 0.38, + "learning_rate": 1.3658718959610822e-05, + "loss": 0.6526, + "step": 10996 + }, + { + "epoch": 0.38, + "learning_rate": 1.3657705569344183e-05, + "loss": 0.6369, + "step": 10997 + }, + { + "epoch": 0.38, + "learning_rate": 1.3656692135710823e-05, + "loss": 0.6775, + "step": 10998 + }, + { + "epoch": 0.38, + "learning_rate": 1.365567865872275e-05, + "loss": 0.6233, + "step": 10999 + }, + { + "epoch": 0.38, + "learning_rate": 1.3654665138391981e-05, + "loss": 0.5965, + "step": 11000 + }, + { + "epoch": 0.38, + "learning_rate": 1.3653651574730536e-05, + "loss": 0.5826, + "step": 11001 + }, + { + "epoch": 0.38, + "learning_rate": 1.3652637967750426e-05, + "loss": 0.6339, + "step": 11002 + }, + { + "epoch": 0.38, + "learning_rate": 1.3651624317463677e-05, + "loss": 0.6067, + "step": 11003 + }, + { + "epoch": 0.38, + "learning_rate": 1.3650610623882299e-05, + "loss": 0.6483, + "step": 11004 + }, + { + "epoch": 0.38, + "learning_rate": 1.3649596887018313e-05, + "loss": 0.5611, + "step": 11005 + }, + { + "epoch": 0.38, + "learning_rate": 1.3648583106883742e-05, + "loss": 0.6991, + "step": 11006 + }, + { + "epoch": 0.38, + "learning_rate": 1.3647569283490602e-05, + "loss": 0.6125, + "step": 11007 + }, + { + "epoch": 0.38, + "learning_rate": 1.3646555416850913e-05, + "loss": 0.6989, + "step": 11008 + }, + { + "epoch": 0.38, + "learning_rate": 1.3645541506976699e-05, + "loss": 0.6056, + "step": 11009 + }, + { + "epoch": 0.38, + "learning_rate": 1.3644527553879976e-05, + "loss": 0.6276, + "step": 11010 + }, + { + "epoch": 0.38, + "learning_rate": 1.3643513557572768e-05, + "loss": 0.6756, + "step": 11011 + }, + { + "epoch": 0.38, + "learning_rate": 1.36424995180671e-05, + "loss": 0.6402, + "step": 11012 + }, + { + "epoch": 0.38, + "learning_rate": 1.3641485435374993e-05, + "loss": 0.6173, + "step": 11013 + }, + { + "epoch": 0.38, + "learning_rate": 1.3640471309508465e-05, + "loss": 0.6617, + "step": 11014 + }, + { + "epoch": 0.38, + "learning_rate": 1.363945714047955e-05, + "loss": 0.7219, + "step": 11015 + }, + { + "epoch": 0.38, + "learning_rate": 1.3638442928300264e-05, + "loss": 0.6295, + "step": 11016 + }, + { + "epoch": 0.38, + "learning_rate": 1.3637428672982633e-05, + "loss": 0.6489, + "step": 11017 + }, + { + "epoch": 0.38, + "learning_rate": 1.3636414374538686e-05, + "loss": 0.6164, + "step": 11018 + }, + { + "epoch": 0.38, + "learning_rate": 1.3635400032980446e-05, + "loss": 0.6132, + "step": 11019 + }, + { + "epoch": 0.38, + "learning_rate": 1.3634385648319941e-05, + "loss": 0.6231, + "step": 11020 + }, + { + "epoch": 0.38, + "learning_rate": 1.3633371220569195e-05, + "loss": 0.6588, + "step": 11021 + }, + { + "epoch": 0.38, + "learning_rate": 1.3632356749740239e-05, + "loss": 0.6483, + "step": 11022 + }, + { + "epoch": 0.38, + "learning_rate": 1.3631342235845095e-05, + "loss": 0.582, + "step": 11023 + }, + { + "epoch": 0.38, + "learning_rate": 1.3630327678895799e-05, + "loss": 0.696, + "step": 11024 + }, + { + "epoch": 0.38, + "learning_rate": 1.3629313078904374e-05, + "loss": 0.6234, + "step": 11025 + }, + { + "epoch": 0.38, + "learning_rate": 1.3628298435882849e-05, + "loss": 0.6563, + "step": 11026 + }, + { + "epoch": 0.38, + "learning_rate": 1.3627283749843261e-05, + "loss": 0.6424, + "step": 11027 + }, + { + "epoch": 0.38, + "learning_rate": 1.3626269020797634e-05, + "loss": 0.6621, + "step": 11028 + }, + { + "epoch": 0.38, + "learning_rate": 1.3625254248757997e-05, + "loss": 0.6023, + "step": 11029 + }, + { + "epoch": 0.38, + "learning_rate": 1.3624239433736391e-05, + "loss": 0.6616, + "step": 11030 + }, + { + "epoch": 0.38, + "learning_rate": 1.3623224575744838e-05, + "loss": 0.6121, + "step": 11031 + }, + { + "epoch": 0.38, + "learning_rate": 1.3622209674795373e-05, + "loss": 0.6671, + "step": 11032 + }, + { + "epoch": 0.38, + "learning_rate": 1.3621194730900034e-05, + "loss": 0.6843, + "step": 11033 + }, + { + "epoch": 0.38, + "learning_rate": 1.3620179744070849e-05, + "loss": 0.6141, + "step": 11034 + }, + { + "epoch": 0.38, + "learning_rate": 1.361916471431985e-05, + "loss": 0.6506, + "step": 11035 + }, + { + "epoch": 0.38, + "learning_rate": 1.3618149641659079e-05, + "loss": 0.6086, + "step": 11036 + }, + { + "epoch": 0.38, + "learning_rate": 1.3617134526100571e-05, + "loss": 0.6528, + "step": 11037 + }, + { + "epoch": 0.38, + "learning_rate": 1.3616119367656348e-05, + "loss": 0.6436, + "step": 11038 + }, + { + "epoch": 0.38, + "learning_rate": 1.3615104166338462e-05, + "loss": 0.6904, + "step": 11039 + }, + { + "epoch": 0.38, + "learning_rate": 1.3614088922158943e-05, + "loss": 0.6683, + "step": 11040 + }, + { + "epoch": 0.38, + "learning_rate": 1.3613073635129823e-05, + "loss": 0.6589, + "step": 11041 + }, + { + "epoch": 0.38, + "learning_rate": 1.3612058305263149e-05, + "loss": 0.6508, + "step": 11042 + }, + { + "epoch": 0.38, + "learning_rate": 1.3611042932570956e-05, + "loss": 0.6442, + "step": 11043 + }, + { + "epoch": 0.38, + "learning_rate": 1.3610027517065275e-05, + "loss": 0.6615, + "step": 11044 + }, + { + "epoch": 0.38, + "learning_rate": 1.3609012058758155e-05, + "loss": 0.6077, + "step": 11045 + }, + { + "epoch": 0.38, + "learning_rate": 1.3607996557661634e-05, + "loss": 0.578, + "step": 11046 + }, + { + "epoch": 0.38, + "learning_rate": 1.3606981013787743e-05, + "loss": 0.5797, + "step": 11047 + }, + { + "epoch": 0.38, + "learning_rate": 1.3605965427148535e-05, + "loss": 0.6638, + "step": 11048 + }, + { + "epoch": 0.38, + "learning_rate": 1.3604949797756045e-05, + "loss": 0.6418, + "step": 11049 + }, + { + "epoch": 0.38, + "learning_rate": 1.360393412562231e-05, + "loss": 0.6487, + "step": 11050 + }, + { + "epoch": 0.38, + "learning_rate": 1.360291841075938e-05, + "loss": 0.5816, + "step": 11051 + }, + { + "epoch": 0.38, + "learning_rate": 1.3601902653179298e-05, + "loss": 0.6514, + "step": 11052 + }, + { + "epoch": 0.38, + "learning_rate": 1.3600886852894096e-05, + "loss": 0.6408, + "step": 11053 + }, + { + "epoch": 0.38, + "learning_rate": 1.3599871009915831e-05, + "loss": 0.5893, + "step": 11054 + }, + { + "epoch": 0.38, + "learning_rate": 1.359885512425654e-05, + "loss": 0.6125, + "step": 11055 + }, + { + "epoch": 0.38, + "learning_rate": 1.3597839195928266e-05, + "loss": 0.5929, + "step": 11056 + }, + { + "epoch": 0.38, + "learning_rate": 1.3596823224943063e-05, + "loss": 0.6055, + "step": 11057 + }, + { + "epoch": 0.38, + "learning_rate": 1.3595807211312967e-05, + "loss": 0.6133, + "step": 11058 + }, + { + "epoch": 0.38, + "learning_rate": 1.3594791155050028e-05, + "loss": 0.666, + "step": 11059 + }, + { + "epoch": 0.38, + "learning_rate": 1.3593775056166292e-05, + "loss": 0.587, + "step": 11060 + }, + { + "epoch": 0.38, + "learning_rate": 1.3592758914673807e-05, + "loss": 0.6117, + "step": 11061 + }, + { + "epoch": 0.38, + "learning_rate": 1.3591742730584618e-05, + "loss": 0.5922, + "step": 11062 + }, + { + "epoch": 0.38, + "learning_rate": 1.3590726503910781e-05, + "loss": 0.6135, + "step": 11063 + }, + { + "epoch": 0.38, + "learning_rate": 1.3589710234664337e-05, + "loss": 0.6598, + "step": 11064 + }, + { + "epoch": 0.38, + "learning_rate": 1.3588693922857334e-05, + "loss": 0.688, + "step": 11065 + }, + { + "epoch": 0.38, + "learning_rate": 1.3587677568501825e-05, + "loss": 0.6404, + "step": 11066 + }, + { + "epoch": 0.38, + "learning_rate": 1.3586661171609863e-05, + "loss": 0.6757, + "step": 11067 + }, + { + "epoch": 0.38, + "learning_rate": 1.3585644732193495e-05, + "loss": 0.6632, + "step": 11068 + }, + { + "epoch": 0.38, + "learning_rate": 1.3584628250264772e-05, + "loss": 0.627, + "step": 11069 + }, + { + "epoch": 0.38, + "learning_rate": 1.3583611725835746e-05, + "loss": 0.6489, + "step": 11070 + }, + { + "epoch": 0.38, + "learning_rate": 1.358259515891847e-05, + "loss": 0.6988, + "step": 11071 + }, + { + "epoch": 0.38, + "learning_rate": 1.3581578549524997e-05, + "loss": 0.5893, + "step": 11072 + }, + { + "epoch": 0.38, + "learning_rate": 1.358056189766738e-05, + "loss": 0.5825, + "step": 11073 + }, + { + "epoch": 0.38, + "learning_rate": 1.3579545203357671e-05, + "loss": 0.6617, + "step": 11074 + }, + { + "epoch": 0.38, + "learning_rate": 1.3578528466607925e-05, + "loss": 0.6242, + "step": 11075 + }, + { + "epoch": 0.38, + "learning_rate": 1.35775116874302e-05, + "loss": 0.5905, + "step": 11076 + }, + { + "epoch": 0.38, + "learning_rate": 1.3576494865836547e-05, + "loss": 0.5773, + "step": 11077 + }, + { + "epoch": 0.38, + "learning_rate": 1.3575478001839023e-05, + "loss": 0.6165, + "step": 11078 + }, + { + "epoch": 0.38, + "learning_rate": 1.3574461095449683e-05, + "loss": 0.6661, + "step": 11079 + }, + { + "epoch": 0.38, + "learning_rate": 1.3573444146680585e-05, + "loss": 0.6196, + "step": 11080 + }, + { + "epoch": 0.38, + "learning_rate": 1.3572427155543789e-05, + "loss": 0.6138, + "step": 11081 + }, + { + "epoch": 0.38, + "learning_rate": 1.3571410122051347e-05, + "loss": 0.6305, + "step": 11082 + }, + { + "epoch": 0.38, + "learning_rate": 1.357039304621532e-05, + "loss": 0.6037, + "step": 11083 + }, + { + "epoch": 0.38, + "learning_rate": 1.3569375928047768e-05, + "loss": 0.6315, + "step": 11084 + }, + { + "epoch": 0.38, + "learning_rate": 1.3568358767560752e-05, + "loss": 0.6293, + "step": 11085 + }, + { + "epoch": 0.38, + "learning_rate": 1.3567341564766326e-05, + "loss": 0.5708, + "step": 11086 + }, + { + "epoch": 0.38, + "learning_rate": 1.356632431967655e-05, + "loss": 0.602, + "step": 11087 + }, + { + "epoch": 0.38, + "learning_rate": 1.3565307032303492e-05, + "loss": 0.6163, + "step": 11088 + }, + { + "epoch": 0.38, + "learning_rate": 1.3564289702659208e-05, + "loss": 0.6406, + "step": 11089 + }, + { + "epoch": 0.38, + "learning_rate": 1.3563272330755759e-05, + "loss": 0.6047, + "step": 11090 + }, + { + "epoch": 0.38, + "learning_rate": 1.3562254916605211e-05, + "loss": 0.7117, + "step": 11091 + }, + { + "epoch": 0.38, + "learning_rate": 1.3561237460219625e-05, + "loss": 0.6143, + "step": 11092 + }, + { + "epoch": 0.38, + "learning_rate": 1.3560219961611063e-05, + "loss": 0.6567, + "step": 11093 + }, + { + "epoch": 0.38, + "learning_rate": 1.355920242079159e-05, + "loss": 0.6228, + "step": 11094 + }, + { + "epoch": 0.38, + "learning_rate": 1.3558184837773269e-05, + "loss": 0.6192, + "step": 11095 + }, + { + "epoch": 0.38, + "learning_rate": 1.3557167212568167e-05, + "loss": 0.6456, + "step": 11096 + }, + { + "epoch": 0.38, + "learning_rate": 1.3556149545188346e-05, + "loss": 0.6265, + "step": 11097 + }, + { + "epoch": 0.38, + "learning_rate": 1.3555131835645873e-05, + "loss": 0.6376, + "step": 11098 + }, + { + "epoch": 0.38, + "learning_rate": 1.3554114083952821e-05, + "loss": 0.5352, + "step": 11099 + }, + { + "epoch": 0.38, + "learning_rate": 1.3553096290121244e-05, + "loss": 0.5879, + "step": 11100 + }, + { + "epoch": 0.38, + "learning_rate": 1.3552078454163218e-05, + "loss": 0.6404, + "step": 11101 + }, + { + "epoch": 0.38, + "learning_rate": 1.355106057609081e-05, + "loss": 0.622, + "step": 11102 + }, + { + "epoch": 0.38, + "learning_rate": 1.3550042655916084e-05, + "loss": 0.6338, + "step": 11103 + }, + { + "epoch": 0.38, + "learning_rate": 1.3549024693651112e-05, + "loss": 0.6509, + "step": 11104 + }, + { + "epoch": 0.38, + "learning_rate": 1.3548006689307965e-05, + "loss": 0.674, + "step": 11105 + }, + { + "epoch": 0.38, + "learning_rate": 1.3546988642898708e-05, + "loss": 0.6208, + "step": 11106 + }, + { + "epoch": 0.38, + "learning_rate": 1.3545970554435412e-05, + "loss": 0.6477, + "step": 11107 + }, + { + "epoch": 0.38, + "learning_rate": 1.3544952423930156e-05, + "loss": 0.5933, + "step": 11108 + }, + { + "epoch": 0.38, + "learning_rate": 1.3543934251394997e-05, + "loss": 0.5918, + "step": 11109 + }, + { + "epoch": 0.38, + "learning_rate": 1.3542916036842017e-05, + "loss": 0.5649, + "step": 11110 + }, + { + "epoch": 0.38, + "learning_rate": 1.3541897780283288e-05, + "loss": 0.6496, + "step": 11111 + }, + { + "epoch": 0.39, + "learning_rate": 1.354087948173088e-05, + "loss": 0.6608, + "step": 11112 + }, + { + "epoch": 0.39, + "learning_rate": 1.3539861141196864e-05, + "loss": 0.6169, + "step": 11113 + }, + { + "epoch": 0.39, + "learning_rate": 1.3538842758693318e-05, + "loss": 0.6564, + "step": 11114 + }, + { + "epoch": 0.39, + "learning_rate": 1.3537824334232315e-05, + "loss": 0.5601, + "step": 11115 + }, + { + "epoch": 0.39, + "learning_rate": 1.3536805867825927e-05, + "loss": 0.612, + "step": 11116 + }, + { + "epoch": 0.39, + "learning_rate": 1.3535787359486232e-05, + "loss": 0.6263, + "step": 11117 + }, + { + "epoch": 0.39, + "learning_rate": 1.3534768809225305e-05, + "loss": 0.6496, + "step": 11118 + }, + { + "epoch": 0.39, + "learning_rate": 1.353375021705522e-05, + "loss": 0.6431, + "step": 11119 + }, + { + "epoch": 0.39, + "learning_rate": 1.3532731582988061e-05, + "loss": 0.6754, + "step": 11120 + }, + { + "epoch": 0.39, + "learning_rate": 1.3531712907035898e-05, + "loss": 0.6683, + "step": 11121 + }, + { + "epoch": 0.39, + "learning_rate": 1.3530694189210812e-05, + "loss": 0.6277, + "step": 11122 + }, + { + "epoch": 0.39, + "learning_rate": 1.3529675429524878e-05, + "loss": 0.6191, + "step": 11123 + }, + { + "epoch": 0.39, + "learning_rate": 1.3528656627990176e-05, + "loss": 0.6678, + "step": 11124 + }, + { + "epoch": 0.39, + "learning_rate": 1.3527637784618788e-05, + "loss": 0.6053, + "step": 11125 + }, + { + "epoch": 0.39, + "learning_rate": 1.3526618899422792e-05, + "loss": 0.6792, + "step": 11126 + }, + { + "epoch": 0.39, + "learning_rate": 1.3525599972414264e-05, + "loss": 0.6418, + "step": 11127 + }, + { + "epoch": 0.39, + "learning_rate": 1.3524581003605293e-05, + "loss": 0.6242, + "step": 11128 + }, + { + "epoch": 0.39, + "learning_rate": 1.3523561993007955e-05, + "loss": 0.6122, + "step": 11129 + }, + { + "epoch": 0.39, + "learning_rate": 1.352254294063433e-05, + "loss": 0.5922, + "step": 11130 + }, + { + "epoch": 0.39, + "learning_rate": 1.3521523846496503e-05, + "loss": 0.5908, + "step": 11131 + }, + { + "epoch": 0.39, + "learning_rate": 1.3520504710606556e-05, + "loss": 0.6297, + "step": 11132 + }, + { + "epoch": 0.39, + "learning_rate": 1.3519485532976573e-05, + "loss": 0.6831, + "step": 11133 + }, + { + "epoch": 0.39, + "learning_rate": 1.3518466313618634e-05, + "loss": 0.6316, + "step": 11134 + }, + { + "epoch": 0.39, + "learning_rate": 1.351744705254483e-05, + "loss": 0.6703, + "step": 11135 + }, + { + "epoch": 0.39, + "learning_rate": 1.351642774976724e-05, + "loss": 0.6124, + "step": 11136 + }, + { + "epoch": 0.39, + "learning_rate": 1.351540840529795e-05, + "loss": 0.654, + "step": 11137 + }, + { + "epoch": 0.39, + "learning_rate": 1.3514389019149047e-05, + "loss": 0.6176, + "step": 11138 + }, + { + "epoch": 0.39, + "learning_rate": 1.3513369591332617e-05, + "loss": 0.6678, + "step": 11139 + }, + { + "epoch": 0.39, + "learning_rate": 1.3512350121860744e-05, + "loss": 0.6494, + "step": 11140 + }, + { + "epoch": 0.39, + "learning_rate": 1.3511330610745522e-05, + "loss": 0.6016, + "step": 11141 + }, + { + "epoch": 0.39, + "learning_rate": 1.3510311057999028e-05, + "loss": 0.656, + "step": 11142 + }, + { + "epoch": 0.39, + "learning_rate": 1.3509291463633358e-05, + "loss": 0.6139, + "step": 11143 + }, + { + "epoch": 0.39, + "learning_rate": 1.3508271827660599e-05, + "loss": 0.671, + "step": 11144 + }, + { + "epoch": 0.39, + "learning_rate": 1.350725215009284e-05, + "loss": 0.6736, + "step": 11145 + }, + { + "epoch": 0.39, + "learning_rate": 1.3506232430942168e-05, + "loss": 0.6423, + "step": 11146 + }, + { + "epoch": 0.39, + "learning_rate": 1.3505212670220678e-05, + "loss": 0.6472, + "step": 11147 + }, + { + "epoch": 0.39, + "learning_rate": 1.3504192867940455e-05, + "loss": 0.6846, + "step": 11148 + }, + { + "epoch": 0.39, + "learning_rate": 1.3503173024113592e-05, + "loss": 0.6131, + "step": 11149 + }, + { + "epoch": 0.39, + "learning_rate": 1.3502153138752185e-05, + "loss": 0.6471, + "step": 11150 + }, + { + "epoch": 0.39, + "learning_rate": 1.3501133211868321e-05, + "loss": 0.6575, + "step": 11151 + }, + { + "epoch": 0.39, + "learning_rate": 1.3500113243474092e-05, + "loss": 0.6212, + "step": 11152 + }, + { + "epoch": 0.39, + "learning_rate": 1.3499093233581595e-05, + "loss": 0.6561, + "step": 11153 + }, + { + "epoch": 0.39, + "learning_rate": 1.349807318220292e-05, + "loss": 0.6614, + "step": 11154 + }, + { + "epoch": 0.39, + "learning_rate": 1.3497053089350161e-05, + "loss": 0.6461, + "step": 11155 + }, + { + "epoch": 0.39, + "learning_rate": 1.3496032955035416e-05, + "loss": 0.6117, + "step": 11156 + }, + { + "epoch": 0.39, + "learning_rate": 1.3495012779270777e-05, + "loss": 0.6271, + "step": 11157 + }, + { + "epoch": 0.39, + "learning_rate": 1.3493992562068343e-05, + "loss": 0.5667, + "step": 11158 + }, + { + "epoch": 0.39, + "learning_rate": 1.3492972303440203e-05, + "loss": 0.6125, + "step": 11159 + }, + { + "epoch": 0.39, + "learning_rate": 1.3491952003398461e-05, + "loss": 0.6069, + "step": 11160 + }, + { + "epoch": 0.39, + "learning_rate": 1.349093166195521e-05, + "loss": 0.6409, + "step": 11161 + }, + { + "epoch": 0.39, + "learning_rate": 1.3489911279122545e-05, + "loss": 0.6305, + "step": 11162 + }, + { + "epoch": 0.39, + "learning_rate": 1.348889085491257e-05, + "loss": 0.6332, + "step": 11163 + }, + { + "epoch": 0.39, + "learning_rate": 1.3487870389337381e-05, + "loss": 0.6497, + "step": 11164 + }, + { + "epoch": 0.39, + "learning_rate": 1.3486849882409075e-05, + "loss": 0.6584, + "step": 11165 + }, + { + "epoch": 0.39, + "learning_rate": 1.348582933413975e-05, + "loss": 0.6934, + "step": 11166 + }, + { + "epoch": 0.39, + "learning_rate": 1.3484808744541514e-05, + "loss": 0.6464, + "step": 11167 + }, + { + "epoch": 0.39, + "learning_rate": 1.348378811362646e-05, + "loss": 0.6311, + "step": 11168 + }, + { + "epoch": 0.39, + "learning_rate": 1.3482767441406687e-05, + "loss": 0.6134, + "step": 11169 + }, + { + "epoch": 0.39, + "learning_rate": 1.3481746727894307e-05, + "loss": 0.6181, + "step": 11170 + }, + { + "epoch": 0.39, + "learning_rate": 1.3480725973101412e-05, + "loss": 0.6184, + "step": 11171 + }, + { + "epoch": 0.39, + "learning_rate": 1.3479705177040106e-05, + "loss": 0.604, + "step": 11172 + }, + { + "epoch": 0.39, + "learning_rate": 1.3478684339722494e-05, + "loss": 0.6457, + "step": 11173 + }, + { + "epoch": 0.39, + "learning_rate": 1.347766346116068e-05, + "loss": 0.6027, + "step": 11174 + }, + { + "epoch": 0.39, + "learning_rate": 1.3476642541366765e-05, + "loss": 0.6657, + "step": 11175 + }, + { + "epoch": 0.39, + "learning_rate": 1.3475621580352856e-05, + "loss": 0.6447, + "step": 11176 + }, + { + "epoch": 0.39, + "learning_rate": 1.3474600578131054e-05, + "loss": 0.628, + "step": 11177 + }, + { + "epoch": 0.39, + "learning_rate": 1.3473579534713468e-05, + "loss": 0.662, + "step": 11178 + }, + { + "epoch": 0.39, + "learning_rate": 1.3472558450112206e-05, + "loss": 0.6648, + "step": 11179 + }, + { + "epoch": 0.39, + "learning_rate": 1.3471537324339365e-05, + "loss": 0.6155, + "step": 11180 + }, + { + "epoch": 0.39, + "learning_rate": 1.3470516157407061e-05, + "loss": 0.6406, + "step": 11181 + }, + { + "epoch": 0.39, + "learning_rate": 1.3469494949327397e-05, + "loss": 0.7016, + "step": 11182 + }, + { + "epoch": 0.39, + "learning_rate": 1.3468473700112482e-05, + "loss": 0.6038, + "step": 11183 + }, + { + "epoch": 0.39, + "learning_rate": 1.3467452409774423e-05, + "loss": 0.5973, + "step": 11184 + }, + { + "epoch": 0.39, + "learning_rate": 1.346643107832533e-05, + "loss": 0.6474, + "step": 11185 + }, + { + "epoch": 0.39, + "learning_rate": 1.3465409705777311e-05, + "loss": 0.6042, + "step": 11186 + }, + { + "epoch": 0.39, + "learning_rate": 1.3464388292142475e-05, + "loss": 0.5799, + "step": 11187 + }, + { + "epoch": 0.39, + "learning_rate": 1.3463366837432936e-05, + "loss": 0.6212, + "step": 11188 + }, + { + "epoch": 0.39, + "learning_rate": 1.34623453416608e-05, + "loss": 0.6441, + "step": 11189 + }, + { + "epoch": 0.39, + "learning_rate": 1.3461323804838178e-05, + "loss": 0.6392, + "step": 11190 + }, + { + "epoch": 0.39, + "learning_rate": 1.3460302226977189e-05, + "loss": 0.6072, + "step": 11191 + }, + { + "epoch": 0.39, + "learning_rate": 1.3459280608089937e-05, + "loss": 0.6765, + "step": 11192 + }, + { + "epoch": 0.39, + "learning_rate": 1.3458258948188534e-05, + "loss": 0.6188, + "step": 11193 + }, + { + "epoch": 0.39, + "learning_rate": 1.3457237247285103e-05, + "loss": 0.6643, + "step": 11194 + }, + { + "epoch": 0.39, + "learning_rate": 1.3456215505391748e-05, + "loss": 0.6702, + "step": 11195 + }, + { + "epoch": 0.39, + "learning_rate": 1.3455193722520585e-05, + "loss": 0.6217, + "step": 11196 + }, + { + "epoch": 0.39, + "learning_rate": 1.345417189868373e-05, + "loss": 0.6177, + "step": 11197 + }, + { + "epoch": 0.39, + "learning_rate": 1.3453150033893298e-05, + "loss": 0.6293, + "step": 11198 + }, + { + "epoch": 0.39, + "learning_rate": 1.3452128128161404e-05, + "loss": 0.6536, + "step": 11199 + }, + { + "epoch": 0.39, + "learning_rate": 1.3451106181500164e-05, + "loss": 0.6236, + "step": 11200 + }, + { + "epoch": 0.39, + "learning_rate": 1.3450084193921695e-05, + "loss": 0.6064, + "step": 11201 + }, + { + "epoch": 0.39, + "learning_rate": 1.3449062165438114e-05, + "loss": 0.6051, + "step": 11202 + }, + { + "epoch": 0.39, + "learning_rate": 1.3448040096061536e-05, + "loss": 0.6466, + "step": 11203 + }, + { + "epoch": 0.39, + "learning_rate": 1.3447017985804083e-05, + "loss": 0.5877, + "step": 11204 + }, + { + "epoch": 0.39, + "learning_rate": 1.344599583467787e-05, + "loss": 0.6935, + "step": 11205 + }, + { + "epoch": 0.39, + "learning_rate": 1.3444973642695016e-05, + "loss": 0.6431, + "step": 11206 + }, + { + "epoch": 0.39, + "learning_rate": 1.3443951409867645e-05, + "loss": 0.6, + "step": 11207 + }, + { + "epoch": 0.39, + "learning_rate": 1.3442929136207869e-05, + "loss": 0.6776, + "step": 11208 + }, + { + "epoch": 0.39, + "learning_rate": 1.3441906821727817e-05, + "loss": 0.6274, + "step": 11209 + }, + { + "epoch": 0.39, + "learning_rate": 1.3440884466439604e-05, + "loss": 0.64, + "step": 11210 + }, + { + "epoch": 0.39, + "learning_rate": 1.3439862070355352e-05, + "loss": 0.6659, + "step": 11211 + }, + { + "epoch": 0.39, + "learning_rate": 1.3438839633487184e-05, + "loss": 0.6973, + "step": 11212 + }, + { + "epoch": 0.39, + "learning_rate": 1.3437817155847224e-05, + "loss": 0.61, + "step": 11213 + }, + { + "epoch": 0.39, + "learning_rate": 1.343679463744759e-05, + "loss": 0.6441, + "step": 11214 + }, + { + "epoch": 0.39, + "learning_rate": 1.343577207830041e-05, + "loss": 0.6334, + "step": 11215 + }, + { + "epoch": 0.39, + "learning_rate": 1.3434749478417806e-05, + "loss": 0.6332, + "step": 11216 + }, + { + "epoch": 0.39, + "learning_rate": 1.34337268378119e-05, + "loss": 0.6654, + "step": 11217 + }, + { + "epoch": 0.39, + "learning_rate": 1.3432704156494818e-05, + "loss": 0.6117, + "step": 11218 + }, + { + "epoch": 0.39, + "learning_rate": 1.3431681434478688e-05, + "loss": 0.6261, + "step": 11219 + }, + { + "epoch": 0.39, + "learning_rate": 1.3430658671775634e-05, + "loss": 0.6564, + "step": 11220 + }, + { + "epoch": 0.39, + "learning_rate": 1.342963586839778e-05, + "loss": 0.6835, + "step": 11221 + }, + { + "epoch": 0.39, + "learning_rate": 1.3428613024357255e-05, + "loss": 0.6453, + "step": 11222 + }, + { + "epoch": 0.39, + "learning_rate": 1.3427590139666185e-05, + "loss": 0.6464, + "step": 11223 + }, + { + "epoch": 0.39, + "learning_rate": 1.3426567214336696e-05, + "loss": 0.6413, + "step": 11224 + }, + { + "epoch": 0.39, + "learning_rate": 1.3425544248380922e-05, + "loss": 0.613, + "step": 11225 + }, + { + "epoch": 0.39, + "learning_rate": 1.3424521241810983e-05, + "loss": 0.7016, + "step": 11226 + }, + { + "epoch": 0.39, + "learning_rate": 1.3423498194639017e-05, + "loss": 0.6152, + "step": 11227 + }, + { + "epoch": 0.39, + "learning_rate": 1.3422475106877149e-05, + "loss": 0.6529, + "step": 11228 + }, + { + "epoch": 0.39, + "learning_rate": 1.3421451978537507e-05, + "loss": 0.6916, + "step": 11229 + }, + { + "epoch": 0.39, + "learning_rate": 1.3420428809632222e-05, + "loss": 0.7086, + "step": 11230 + }, + { + "epoch": 0.39, + "learning_rate": 1.3419405600173429e-05, + "loss": 0.649, + "step": 11231 + }, + { + "epoch": 0.39, + "learning_rate": 1.3418382350173259e-05, + "loss": 0.646, + "step": 11232 + }, + { + "epoch": 0.39, + "learning_rate": 1.341735905964384e-05, + "loss": 0.6866, + "step": 11233 + }, + { + "epoch": 0.39, + "learning_rate": 1.3416335728597307e-05, + "loss": 0.6267, + "step": 11234 + }, + { + "epoch": 0.39, + "learning_rate": 1.3415312357045788e-05, + "loss": 0.6698, + "step": 11235 + }, + { + "epoch": 0.39, + "learning_rate": 1.3414288945001425e-05, + "loss": 0.6171, + "step": 11236 + }, + { + "epoch": 0.39, + "learning_rate": 1.3413265492476348e-05, + "loss": 0.638, + "step": 11237 + }, + { + "epoch": 0.39, + "learning_rate": 1.341224199948269e-05, + "loss": 0.5913, + "step": 11238 + }, + { + "epoch": 0.39, + "learning_rate": 1.3411218466032585e-05, + "loss": 0.6145, + "step": 11239 + }, + { + "epoch": 0.39, + "learning_rate": 1.3410194892138171e-05, + "loss": 0.6223, + "step": 11240 + }, + { + "epoch": 0.39, + "learning_rate": 1.3409171277811581e-05, + "loss": 0.6075, + "step": 11241 + }, + { + "epoch": 0.39, + "learning_rate": 1.3408147623064954e-05, + "loss": 0.6731, + "step": 11242 + }, + { + "epoch": 0.39, + "learning_rate": 1.3407123927910428e-05, + "loss": 0.6663, + "step": 11243 + }, + { + "epoch": 0.39, + "learning_rate": 1.3406100192360134e-05, + "loss": 0.6284, + "step": 11244 + }, + { + "epoch": 0.39, + "learning_rate": 1.3405076416426214e-05, + "loss": 0.6565, + "step": 11245 + }, + { + "epoch": 0.39, + "learning_rate": 1.340405260012081e-05, + "loss": 0.677, + "step": 11246 + }, + { + "epoch": 0.39, + "learning_rate": 1.3403028743456053e-05, + "loss": 0.6238, + "step": 11247 + }, + { + "epoch": 0.39, + "learning_rate": 1.3402004846444084e-05, + "loss": 0.668, + "step": 11248 + }, + { + "epoch": 0.39, + "learning_rate": 1.3400980909097045e-05, + "loss": 0.6019, + "step": 11249 + }, + { + "epoch": 0.39, + "learning_rate": 1.3399956931427077e-05, + "loss": 0.6775, + "step": 11250 + }, + { + "epoch": 0.39, + "learning_rate": 1.339893291344632e-05, + "loss": 0.6208, + "step": 11251 + }, + { + "epoch": 0.39, + "learning_rate": 1.3397908855166908e-05, + "loss": 0.6602, + "step": 11252 + }, + { + "epoch": 0.39, + "learning_rate": 1.3396884756600993e-05, + "loss": 0.6197, + "step": 11253 + }, + { + "epoch": 0.39, + "learning_rate": 1.3395860617760709e-05, + "loss": 0.6116, + "step": 11254 + }, + { + "epoch": 0.39, + "learning_rate": 1.3394836438658203e-05, + "loss": 0.5582, + "step": 11255 + }, + { + "epoch": 0.39, + "learning_rate": 1.3393812219305615e-05, + "loss": 0.619, + "step": 11256 + }, + { + "epoch": 0.39, + "learning_rate": 1.3392787959715091e-05, + "loss": 0.6143, + "step": 11257 + }, + { + "epoch": 0.39, + "learning_rate": 1.3391763659898773e-05, + "loss": 0.6857, + "step": 11258 + }, + { + "epoch": 0.39, + "learning_rate": 1.3390739319868808e-05, + "loss": 0.619, + "step": 11259 + }, + { + "epoch": 0.39, + "learning_rate": 1.338971493963734e-05, + "loss": 0.6637, + "step": 11260 + }, + { + "epoch": 0.39, + "learning_rate": 1.338869051921651e-05, + "loss": 0.6036, + "step": 11261 + }, + { + "epoch": 0.39, + "learning_rate": 1.3387666058618469e-05, + "loss": 0.6297, + "step": 11262 + }, + { + "epoch": 0.39, + "learning_rate": 1.3386641557855362e-05, + "loss": 0.6454, + "step": 11263 + }, + { + "epoch": 0.39, + "learning_rate": 1.3385617016939333e-05, + "loss": 0.6144, + "step": 11264 + }, + { + "epoch": 0.39, + "learning_rate": 1.3384592435882533e-05, + "loss": 0.6963, + "step": 11265 + }, + { + "epoch": 0.39, + "learning_rate": 1.3383567814697109e-05, + "loss": 0.6184, + "step": 11266 + }, + { + "epoch": 0.39, + "learning_rate": 1.3382543153395207e-05, + "loss": 0.6503, + "step": 11267 + }, + { + "epoch": 0.39, + "learning_rate": 1.3381518451988978e-05, + "loss": 0.5793, + "step": 11268 + }, + { + "epoch": 0.39, + "learning_rate": 1.338049371049057e-05, + "loss": 0.6147, + "step": 11269 + }, + { + "epoch": 0.39, + "learning_rate": 1.3379468928912131e-05, + "loss": 0.6134, + "step": 11270 + }, + { + "epoch": 0.39, + "learning_rate": 1.3378444107265814e-05, + "loss": 0.6318, + "step": 11271 + }, + { + "epoch": 0.39, + "learning_rate": 1.337741924556377e-05, + "loss": 0.617, + "step": 11272 + }, + { + "epoch": 0.39, + "learning_rate": 1.3376394343818144e-05, + "loss": 0.603, + "step": 11273 + }, + { + "epoch": 0.39, + "learning_rate": 1.3375369402041094e-05, + "loss": 0.555, + "step": 11274 + }, + { + "epoch": 0.39, + "learning_rate": 1.3374344420244774e-05, + "loss": 0.6296, + "step": 11275 + }, + { + "epoch": 0.39, + "learning_rate": 1.3373319398441327e-05, + "loss": 0.6127, + "step": 11276 + }, + { + "epoch": 0.39, + "learning_rate": 1.3372294336642912e-05, + "loss": 0.6456, + "step": 11277 + }, + { + "epoch": 0.39, + "learning_rate": 1.3371269234861686e-05, + "loss": 0.6798, + "step": 11278 + }, + { + "epoch": 0.39, + "learning_rate": 1.3370244093109795e-05, + "loss": 0.5968, + "step": 11279 + }, + { + "epoch": 0.39, + "learning_rate": 1.3369218911399396e-05, + "loss": 0.6387, + "step": 11280 + }, + { + "epoch": 0.39, + "learning_rate": 1.3368193689742645e-05, + "loss": 0.6207, + "step": 11281 + }, + { + "epoch": 0.39, + "learning_rate": 1.33671684281517e-05, + "loss": 0.6618, + "step": 11282 + }, + { + "epoch": 0.39, + "learning_rate": 1.3366143126638708e-05, + "loss": 0.6253, + "step": 11283 + }, + { + "epoch": 0.39, + "learning_rate": 1.3365117785215837e-05, + "loss": 0.6123, + "step": 11284 + }, + { + "epoch": 0.39, + "learning_rate": 1.3364092403895236e-05, + "loss": 0.6574, + "step": 11285 + }, + { + "epoch": 0.39, + "learning_rate": 1.3363066982689061e-05, + "loss": 0.6148, + "step": 11286 + }, + { + "epoch": 0.39, + "learning_rate": 1.3362041521609476e-05, + "loss": 0.6415, + "step": 11287 + }, + { + "epoch": 0.39, + "learning_rate": 1.3361016020668637e-05, + "loss": 0.6753, + "step": 11288 + }, + { + "epoch": 0.39, + "learning_rate": 1.3359990479878697e-05, + "loss": 0.6262, + "step": 11289 + }, + { + "epoch": 0.39, + "learning_rate": 1.3358964899251822e-05, + "loss": 0.706, + "step": 11290 + }, + { + "epoch": 0.39, + "learning_rate": 1.3357939278800171e-05, + "loss": 0.6456, + "step": 11291 + }, + { + "epoch": 0.39, + "learning_rate": 1.3356913618535896e-05, + "loss": 0.6582, + "step": 11292 + }, + { + "epoch": 0.39, + "learning_rate": 1.3355887918471169e-05, + "loss": 0.6125, + "step": 11293 + }, + { + "epoch": 0.39, + "learning_rate": 1.3354862178618145e-05, + "loss": 0.6294, + "step": 11294 + }, + { + "epoch": 0.39, + "learning_rate": 1.3353836398988982e-05, + "loss": 0.6103, + "step": 11295 + }, + { + "epoch": 0.39, + "learning_rate": 1.335281057959585e-05, + "loss": 0.588, + "step": 11296 + }, + { + "epoch": 0.39, + "learning_rate": 1.3351784720450906e-05, + "loss": 0.6517, + "step": 11297 + }, + { + "epoch": 0.39, + "learning_rate": 1.3350758821566312e-05, + "loss": 0.6764, + "step": 11298 + }, + { + "epoch": 0.39, + "learning_rate": 1.3349732882954238e-05, + "loss": 0.6808, + "step": 11299 + }, + { + "epoch": 0.39, + "learning_rate": 1.334870690462684e-05, + "loss": 0.6254, + "step": 11300 + }, + { + "epoch": 0.39, + "learning_rate": 1.3347680886596285e-05, + "loss": 0.5986, + "step": 11301 + }, + { + "epoch": 0.39, + "learning_rate": 1.334665482887474e-05, + "loss": 0.6869, + "step": 11302 + }, + { + "epoch": 0.39, + "learning_rate": 1.334562873147437e-05, + "loss": 0.6411, + "step": 11303 + }, + { + "epoch": 0.39, + "learning_rate": 1.3344602594407334e-05, + "loss": 0.655, + "step": 11304 + }, + { + "epoch": 0.39, + "learning_rate": 1.3343576417685809e-05, + "loss": 0.652, + "step": 11305 + }, + { + "epoch": 0.39, + "learning_rate": 1.3342550201321954e-05, + "loss": 0.6362, + "step": 11306 + }, + { + "epoch": 0.39, + "learning_rate": 1.3341523945327931e-05, + "loss": 0.596, + "step": 11307 + }, + { + "epoch": 0.39, + "learning_rate": 1.3340497649715925e-05, + "loss": 0.5683, + "step": 11308 + }, + { + "epoch": 0.39, + "learning_rate": 1.333947131449809e-05, + "loss": 0.6343, + "step": 11309 + }, + { + "epoch": 0.39, + "learning_rate": 1.3338444939686594e-05, + "loss": 0.6244, + "step": 11310 + }, + { + "epoch": 0.39, + "learning_rate": 1.3337418525293618e-05, + "loss": 0.6315, + "step": 11311 + }, + { + "epoch": 0.39, + "learning_rate": 1.3336392071331319e-05, + "loss": 0.6143, + "step": 11312 + }, + { + "epoch": 0.39, + "learning_rate": 1.3335365577811872e-05, + "loss": 0.604, + "step": 11313 + }, + { + "epoch": 0.39, + "learning_rate": 1.3334339044747445e-05, + "loss": 0.6577, + "step": 11314 + }, + { + "epoch": 0.39, + "learning_rate": 1.3333312472150213e-05, + "loss": 0.6433, + "step": 11315 + }, + { + "epoch": 0.39, + "learning_rate": 1.3332285860032343e-05, + "loss": 0.6073, + "step": 11316 + }, + { + "epoch": 0.39, + "learning_rate": 1.3331259208406009e-05, + "loss": 0.6856, + "step": 11317 + }, + { + "epoch": 0.39, + "learning_rate": 1.3330232517283386e-05, + "loss": 0.6049, + "step": 11318 + }, + { + "epoch": 0.39, + "learning_rate": 1.332920578667664e-05, + "loss": 0.591, + "step": 11319 + }, + { + "epoch": 0.39, + "learning_rate": 1.332817901659795e-05, + "loss": 0.6345, + "step": 11320 + }, + { + "epoch": 0.39, + "learning_rate": 1.3327152207059486e-05, + "loss": 0.631, + "step": 11321 + }, + { + "epoch": 0.39, + "learning_rate": 1.3326125358073425e-05, + "loss": 0.6174, + "step": 11322 + }, + { + "epoch": 0.39, + "learning_rate": 1.3325098469651941e-05, + "loss": 0.6442, + "step": 11323 + }, + { + "epoch": 0.39, + "learning_rate": 1.3324071541807207e-05, + "loss": 0.596, + "step": 11324 + }, + { + "epoch": 0.39, + "learning_rate": 1.3323044574551401e-05, + "loss": 0.6835, + "step": 11325 + }, + { + "epoch": 0.39, + "learning_rate": 1.3322017567896697e-05, + "loss": 0.6419, + "step": 11326 + }, + { + "epoch": 0.39, + "learning_rate": 1.3320990521855272e-05, + "loss": 0.609, + "step": 11327 + }, + { + "epoch": 0.39, + "learning_rate": 1.3319963436439305e-05, + "loss": 0.5858, + "step": 11328 + }, + { + "epoch": 0.39, + "learning_rate": 1.3318936311660968e-05, + "loss": 0.5993, + "step": 11329 + }, + { + "epoch": 0.39, + "learning_rate": 1.3317909147532446e-05, + "loss": 0.6797, + "step": 11330 + }, + { + "epoch": 0.39, + "learning_rate": 1.3316881944065914e-05, + "loss": 0.6164, + "step": 11331 + }, + { + "epoch": 0.39, + "learning_rate": 1.3315854701273549e-05, + "loss": 0.5826, + "step": 11332 + }, + { + "epoch": 0.39, + "learning_rate": 1.3314827419167533e-05, + "loss": 0.6714, + "step": 11333 + }, + { + "epoch": 0.39, + "learning_rate": 1.3313800097760043e-05, + "loss": 0.5963, + "step": 11334 + }, + { + "epoch": 0.39, + "learning_rate": 1.3312772737063262e-05, + "loss": 0.6441, + "step": 11335 + }, + { + "epoch": 0.39, + "learning_rate": 1.3311745337089372e-05, + "loss": 0.6359, + "step": 11336 + }, + { + "epoch": 0.39, + "learning_rate": 1.331071789785055e-05, + "loss": 0.6779, + "step": 11337 + }, + { + "epoch": 0.39, + "learning_rate": 1.3309690419358977e-05, + "loss": 0.6799, + "step": 11338 + }, + { + "epoch": 0.39, + "learning_rate": 1.330866290162684e-05, + "loss": 0.7005, + "step": 11339 + }, + { + "epoch": 0.39, + "learning_rate": 1.3307635344666316e-05, + "loss": 0.6287, + "step": 11340 + }, + { + "epoch": 0.39, + "learning_rate": 1.3306607748489593e-05, + "loss": 0.6558, + "step": 11341 + }, + { + "epoch": 0.39, + "learning_rate": 1.3305580113108852e-05, + "loss": 0.5958, + "step": 11342 + }, + { + "epoch": 0.39, + "learning_rate": 1.3304552438536275e-05, + "loss": 0.6805, + "step": 11343 + }, + { + "epoch": 0.39, + "learning_rate": 1.3303524724784054e-05, + "loss": 0.638, + "step": 11344 + }, + { + "epoch": 0.39, + "learning_rate": 1.3302496971864364e-05, + "loss": 0.6342, + "step": 11345 + }, + { + "epoch": 0.39, + "learning_rate": 1.3301469179789395e-05, + "loss": 0.6498, + "step": 11346 + }, + { + "epoch": 0.39, + "learning_rate": 1.3300441348571333e-05, + "loss": 0.6878, + "step": 11347 + }, + { + "epoch": 0.39, + "learning_rate": 1.3299413478222363e-05, + "loss": 0.6226, + "step": 11348 + }, + { + "epoch": 0.39, + "learning_rate": 1.3298385568754672e-05, + "loss": 0.6279, + "step": 11349 + }, + { + "epoch": 0.39, + "learning_rate": 1.3297357620180451e-05, + "loss": 0.6199, + "step": 11350 + }, + { + "epoch": 0.39, + "learning_rate": 1.3296329632511881e-05, + "loss": 0.6083, + "step": 11351 + }, + { + "epoch": 0.39, + "learning_rate": 1.3295301605761156e-05, + "loss": 0.6223, + "step": 11352 + }, + { + "epoch": 0.39, + "learning_rate": 1.3294273539940461e-05, + "loss": 0.6415, + "step": 11353 + }, + { + "epoch": 0.39, + "learning_rate": 1.3293245435061985e-05, + "loss": 0.6634, + "step": 11354 + }, + { + "epoch": 0.39, + "learning_rate": 1.3292217291137917e-05, + "loss": 0.6449, + "step": 11355 + }, + { + "epoch": 0.39, + "learning_rate": 1.3291189108180452e-05, + "loss": 0.6425, + "step": 11356 + }, + { + "epoch": 0.39, + "learning_rate": 1.3290160886201773e-05, + "loss": 0.6779, + "step": 11357 + }, + { + "epoch": 0.39, + "learning_rate": 1.3289132625214077e-05, + "loss": 0.6878, + "step": 11358 + }, + { + "epoch": 0.39, + "learning_rate": 1.3288104325229552e-05, + "loss": 0.6138, + "step": 11359 + }, + { + "epoch": 0.39, + "learning_rate": 1.3287075986260392e-05, + "loss": 0.6144, + "step": 11360 + }, + { + "epoch": 0.39, + "learning_rate": 1.3286047608318786e-05, + "loss": 0.6378, + "step": 11361 + }, + { + "epoch": 0.39, + "learning_rate": 1.328501919141693e-05, + "loss": 0.6362, + "step": 11362 + }, + { + "epoch": 0.39, + "learning_rate": 1.3283990735567016e-05, + "loss": 0.6001, + "step": 11363 + }, + { + "epoch": 0.39, + "learning_rate": 1.3282962240781237e-05, + "loss": 0.6031, + "step": 11364 + }, + { + "epoch": 0.39, + "learning_rate": 1.3281933707071787e-05, + "loss": 0.6765, + "step": 11365 + }, + { + "epoch": 0.39, + "learning_rate": 1.3280905134450863e-05, + "loss": 0.5949, + "step": 11366 + }, + { + "epoch": 0.39, + "learning_rate": 1.3279876522930658e-05, + "loss": 0.6337, + "step": 11367 + }, + { + "epoch": 0.39, + "learning_rate": 1.3278847872523368e-05, + "loss": 0.6214, + "step": 11368 + }, + { + "epoch": 0.39, + "learning_rate": 1.3277819183241186e-05, + "loss": 0.6437, + "step": 11369 + }, + { + "epoch": 0.39, + "learning_rate": 1.3276790455096314e-05, + "loss": 0.6653, + "step": 11370 + }, + { + "epoch": 0.39, + "learning_rate": 1.3275761688100946e-05, + "loss": 0.6002, + "step": 11371 + }, + { + "epoch": 0.39, + "learning_rate": 1.3274732882267276e-05, + "loss": 0.5815, + "step": 11372 + }, + { + "epoch": 0.39, + "learning_rate": 1.327370403760751e-05, + "loss": 0.6288, + "step": 11373 + }, + { + "epoch": 0.39, + "learning_rate": 1.3272675154133839e-05, + "loss": 0.6304, + "step": 11374 + }, + { + "epoch": 0.39, + "learning_rate": 1.3271646231858462e-05, + "loss": 0.6107, + "step": 11375 + }, + { + "epoch": 0.39, + "learning_rate": 1.3270617270793582e-05, + "loss": 0.6474, + "step": 11376 + }, + { + "epoch": 0.39, + "learning_rate": 1.32695882709514e-05, + "loss": 0.6129, + "step": 11377 + }, + { + "epoch": 0.39, + "learning_rate": 1.3268559232344107e-05, + "loss": 0.6774, + "step": 11378 + }, + { + "epoch": 0.39, + "learning_rate": 1.3267530154983912e-05, + "loss": 0.6059, + "step": 11379 + }, + { + "epoch": 0.39, + "learning_rate": 1.3266501038883015e-05, + "loss": 0.6154, + "step": 11380 + }, + { + "epoch": 0.39, + "learning_rate": 1.3265471884053616e-05, + "loss": 0.6439, + "step": 11381 + }, + { + "epoch": 0.39, + "learning_rate": 1.3264442690507914e-05, + "loss": 0.6858, + "step": 11382 + }, + { + "epoch": 0.39, + "learning_rate": 1.3263413458258119e-05, + "loss": 0.6211, + "step": 11383 + }, + { + "epoch": 0.39, + "learning_rate": 1.3262384187316427e-05, + "loss": 0.6672, + "step": 11384 + }, + { + "epoch": 0.39, + "learning_rate": 1.326135487769504e-05, + "loss": 0.6564, + "step": 11385 + }, + { + "epoch": 0.39, + "learning_rate": 1.326032552940617e-05, + "loss": 0.5673, + "step": 11386 + }, + { + "epoch": 0.39, + "learning_rate": 1.3259296142462015e-05, + "loss": 0.5876, + "step": 11387 + }, + { + "epoch": 0.39, + "learning_rate": 1.3258266716874781e-05, + "loss": 0.6094, + "step": 11388 + }, + { + "epoch": 0.39, + "learning_rate": 1.3257237252656676e-05, + "loss": 0.6523, + "step": 11389 + }, + { + "epoch": 0.39, + "learning_rate": 1.32562077498199e-05, + "loss": 0.6462, + "step": 11390 + }, + { + "epoch": 0.39, + "learning_rate": 1.325517820837666e-05, + "loss": 0.6058, + "step": 11391 + }, + { + "epoch": 0.39, + "learning_rate": 1.325414862833917e-05, + "loss": 0.6136, + "step": 11392 + }, + { + "epoch": 0.39, + "learning_rate": 1.325311900971963e-05, + "loss": 0.6251, + "step": 11393 + }, + { + "epoch": 0.39, + "learning_rate": 1.3252089352530244e-05, + "loss": 0.6147, + "step": 11394 + }, + { + "epoch": 0.39, + "learning_rate": 1.3251059656783229e-05, + "loss": 0.6485, + "step": 11395 + }, + { + "epoch": 0.39, + "learning_rate": 1.325002992249079e-05, + "loss": 0.6622, + "step": 11396 + }, + { + "epoch": 0.39, + "learning_rate": 1.3249000149665133e-05, + "loss": 0.6596, + "step": 11397 + }, + { + "epoch": 0.39, + "learning_rate": 1.324797033831847e-05, + "loss": 0.6307, + "step": 11398 + }, + { + "epoch": 0.39, + "learning_rate": 1.324694048846301e-05, + "loss": 0.6501, + "step": 11399 + }, + { + "epoch": 0.39, + "learning_rate": 1.3245910600110961e-05, + "loss": 0.6134, + "step": 11400 + }, + { + "epoch": 0.4, + "learning_rate": 1.3244880673274537e-05, + "loss": 0.6033, + "step": 11401 + }, + { + "epoch": 0.4, + "learning_rate": 1.324385070796595e-05, + "loss": 0.6246, + "step": 11402 + }, + { + "epoch": 0.4, + "learning_rate": 1.3242820704197406e-05, + "loss": 0.6445, + "step": 11403 + }, + { + "epoch": 0.4, + "learning_rate": 1.3241790661981124e-05, + "loss": 0.6333, + "step": 11404 + }, + { + "epoch": 0.4, + "learning_rate": 1.3240760581329312e-05, + "loss": 0.6512, + "step": 11405 + }, + { + "epoch": 0.4, + "learning_rate": 1.323973046225418e-05, + "loss": 0.6994, + "step": 11406 + }, + { + "epoch": 0.4, + "learning_rate": 1.3238700304767949e-05, + "loss": 0.6595, + "step": 11407 + }, + { + "epoch": 0.4, + "learning_rate": 1.323767010888283e-05, + "loss": 0.6444, + "step": 11408 + }, + { + "epoch": 0.4, + "learning_rate": 1.323663987461103e-05, + "loss": 0.654, + "step": 11409 + }, + { + "epoch": 0.4, + "learning_rate": 1.3235609601964774e-05, + "loss": 0.6434, + "step": 11410 + }, + { + "epoch": 0.4, + "learning_rate": 1.3234579290956276e-05, + "loss": 0.5951, + "step": 11411 + }, + { + "epoch": 0.4, + "learning_rate": 1.3233548941597743e-05, + "loss": 0.6076, + "step": 11412 + }, + { + "epoch": 0.4, + "learning_rate": 1.3232518553901399e-05, + "loss": 0.6331, + "step": 11413 + }, + { + "epoch": 0.4, + "learning_rate": 1.323148812787946e-05, + "loss": 0.6535, + "step": 11414 + }, + { + "epoch": 0.4, + "learning_rate": 1.3230457663544139e-05, + "loss": 0.6386, + "step": 11415 + }, + { + "epoch": 0.4, + "learning_rate": 1.3229427160907657e-05, + "loss": 0.641, + "step": 11416 + }, + { + "epoch": 0.4, + "learning_rate": 1.3228396619982231e-05, + "loss": 0.622, + "step": 11417 + }, + { + "epoch": 0.4, + "learning_rate": 1.3227366040780078e-05, + "loss": 0.6307, + "step": 11418 + }, + { + "epoch": 0.4, + "learning_rate": 1.322633542331342e-05, + "loss": 0.6273, + "step": 11419 + }, + { + "epoch": 0.4, + "learning_rate": 1.3225304767594473e-05, + "loss": 0.5944, + "step": 11420 + }, + { + "epoch": 0.4, + "learning_rate": 1.3224274073635458e-05, + "loss": 0.626, + "step": 11421 + }, + { + "epoch": 0.4, + "learning_rate": 1.3223243341448595e-05, + "loss": 0.6669, + "step": 11422 + }, + { + "epoch": 0.4, + "learning_rate": 1.3222212571046104e-05, + "loss": 0.6413, + "step": 11423 + }, + { + "epoch": 0.4, + "learning_rate": 1.322118176244021e-05, + "loss": 0.5855, + "step": 11424 + }, + { + "epoch": 0.4, + "learning_rate": 1.3220150915643127e-05, + "loss": 0.6438, + "step": 11425 + }, + { + "epoch": 0.4, + "learning_rate": 1.3219120030667085e-05, + "loss": 0.6484, + "step": 11426 + }, + { + "epoch": 0.4, + "learning_rate": 1.3218089107524298e-05, + "loss": 0.6567, + "step": 11427 + }, + { + "epoch": 0.4, + "learning_rate": 1.3217058146226997e-05, + "loss": 0.6907, + "step": 11428 + }, + { + "epoch": 0.4, + "learning_rate": 1.3216027146787405e-05, + "loss": 0.6269, + "step": 11429 + }, + { + "epoch": 0.4, + "learning_rate": 1.321499610921774e-05, + "loss": 0.6967, + "step": 11430 + }, + { + "epoch": 0.4, + "learning_rate": 1.3213965033530228e-05, + "loss": 0.6553, + "step": 11431 + }, + { + "epoch": 0.4, + "learning_rate": 1.3212933919737096e-05, + "loss": 0.6144, + "step": 11432 + }, + { + "epoch": 0.4, + "learning_rate": 1.3211902767850568e-05, + "loss": 0.6044, + "step": 11433 + }, + { + "epoch": 0.4, + "learning_rate": 1.3210871577882868e-05, + "loss": 0.6318, + "step": 11434 + }, + { + "epoch": 0.4, + "learning_rate": 1.3209840349846228e-05, + "loss": 0.6339, + "step": 11435 + }, + { + "epoch": 0.4, + "learning_rate": 1.3208809083752867e-05, + "loss": 0.6713, + "step": 11436 + }, + { + "epoch": 0.4, + "learning_rate": 1.3207777779615016e-05, + "loss": 0.6084, + "step": 11437 + }, + { + "epoch": 0.4, + "learning_rate": 1.3206746437444901e-05, + "loss": 0.6245, + "step": 11438 + }, + { + "epoch": 0.4, + "learning_rate": 1.3205715057254749e-05, + "loss": 0.68, + "step": 11439 + }, + { + "epoch": 0.4, + "learning_rate": 1.3204683639056795e-05, + "loss": 0.6471, + "step": 11440 + }, + { + "epoch": 0.4, + "learning_rate": 1.3203652182863255e-05, + "loss": 0.6221, + "step": 11441 + }, + { + "epoch": 0.4, + "learning_rate": 1.320262068868637e-05, + "loss": 0.6118, + "step": 11442 + }, + { + "epoch": 0.4, + "learning_rate": 1.3201589156538366e-05, + "loss": 0.6396, + "step": 11443 + }, + { + "epoch": 0.4, + "learning_rate": 1.3200557586431471e-05, + "loss": 0.6025, + "step": 11444 + }, + { + "epoch": 0.4, + "learning_rate": 1.3199525978377916e-05, + "loss": 0.6378, + "step": 11445 + }, + { + "epoch": 0.4, + "learning_rate": 1.3198494332389938e-05, + "loss": 0.6318, + "step": 11446 + }, + { + "epoch": 0.4, + "learning_rate": 1.3197462648479759e-05, + "loss": 0.6632, + "step": 11447 + }, + { + "epoch": 0.4, + "learning_rate": 1.3196430926659616e-05, + "loss": 0.6188, + "step": 11448 + }, + { + "epoch": 0.4, + "learning_rate": 1.3195399166941742e-05, + "loss": 0.6508, + "step": 11449 + }, + { + "epoch": 0.4, + "learning_rate": 1.3194367369338368e-05, + "loss": 0.6007, + "step": 11450 + }, + { + "epoch": 0.4, + "learning_rate": 1.319333553386173e-05, + "loss": 0.6306, + "step": 11451 + }, + { + "epoch": 0.4, + "learning_rate": 1.3192303660524057e-05, + "loss": 0.6485, + "step": 11452 + }, + { + "epoch": 0.4, + "learning_rate": 1.3191271749337586e-05, + "loss": 0.6652, + "step": 11453 + }, + { + "epoch": 0.4, + "learning_rate": 1.3190239800314553e-05, + "loss": 0.6828, + "step": 11454 + }, + { + "epoch": 0.4, + "learning_rate": 1.3189207813467191e-05, + "loss": 0.6741, + "step": 11455 + }, + { + "epoch": 0.4, + "learning_rate": 1.3188175788807733e-05, + "loss": 0.6357, + "step": 11456 + }, + { + "epoch": 0.4, + "learning_rate": 1.3187143726348422e-05, + "loss": 0.6065, + "step": 11457 + }, + { + "epoch": 0.4, + "learning_rate": 1.318611162610149e-05, + "loss": 0.6274, + "step": 11458 + }, + { + "epoch": 0.4, + "learning_rate": 1.318507948807917e-05, + "loss": 0.6101, + "step": 11459 + }, + { + "epoch": 0.4, + "learning_rate": 1.3184047312293709e-05, + "loss": 0.6269, + "step": 11460 + }, + { + "epoch": 0.4, + "learning_rate": 1.3183015098757337e-05, + "loss": 0.669, + "step": 11461 + }, + { + "epoch": 0.4, + "learning_rate": 1.3181982847482292e-05, + "loss": 0.5392, + "step": 11462 + }, + { + "epoch": 0.4, + "learning_rate": 1.318095055848082e-05, + "loss": 0.631, + "step": 11463 + }, + { + "epoch": 0.4, + "learning_rate": 1.3179918231765152e-05, + "loss": 0.6117, + "step": 11464 + }, + { + "epoch": 0.4, + "learning_rate": 1.3178885867347532e-05, + "loss": 0.6474, + "step": 11465 + }, + { + "epoch": 0.4, + "learning_rate": 1.3177853465240196e-05, + "loss": 0.5907, + "step": 11466 + }, + { + "epoch": 0.4, + "learning_rate": 1.3176821025455393e-05, + "loss": 0.638, + "step": 11467 + }, + { + "epoch": 0.4, + "learning_rate": 1.3175788548005352e-05, + "loss": 0.6304, + "step": 11468 + }, + { + "epoch": 0.4, + "learning_rate": 1.3174756032902323e-05, + "loss": 0.6351, + "step": 11469 + }, + { + "epoch": 0.4, + "learning_rate": 1.3173723480158546e-05, + "loss": 0.6295, + "step": 11470 + }, + { + "epoch": 0.4, + "learning_rate": 1.3172690889786259e-05, + "loss": 0.6532, + "step": 11471 + }, + { + "epoch": 0.4, + "learning_rate": 1.317165826179771e-05, + "loss": 0.6296, + "step": 11472 + }, + { + "epoch": 0.4, + "learning_rate": 1.3170625596205142e-05, + "loss": 0.6169, + "step": 11473 + }, + { + "epoch": 0.4, + "learning_rate": 1.3169592893020795e-05, + "loss": 0.6607, + "step": 11474 + }, + { + "epoch": 0.4, + "learning_rate": 1.3168560152256915e-05, + "loss": 0.6775, + "step": 11475 + }, + { + "epoch": 0.4, + "learning_rate": 1.3167527373925748e-05, + "loss": 0.6404, + "step": 11476 + }, + { + "epoch": 0.4, + "learning_rate": 1.3166494558039533e-05, + "loss": 0.5484, + "step": 11477 + }, + { + "epoch": 0.4, + "learning_rate": 1.316546170461052e-05, + "loss": 0.5863, + "step": 11478 + }, + { + "epoch": 0.4, + "learning_rate": 1.3164428813650957e-05, + "loss": 0.6493, + "step": 11479 + }, + { + "epoch": 0.4, + "learning_rate": 1.3163395885173086e-05, + "loss": 0.6341, + "step": 11480 + }, + { + "epoch": 0.4, + "learning_rate": 1.3162362919189154e-05, + "loss": 0.6561, + "step": 11481 + }, + { + "epoch": 0.4, + "learning_rate": 1.3161329915711412e-05, + "loss": 0.653, + "step": 11482 + }, + { + "epoch": 0.4, + "learning_rate": 1.3160296874752101e-05, + "loss": 0.6417, + "step": 11483 + }, + { + "epoch": 0.4, + "learning_rate": 1.3159263796323477e-05, + "loss": 0.5965, + "step": 11484 + }, + { + "epoch": 0.4, + "learning_rate": 1.3158230680437783e-05, + "loss": 0.6734, + "step": 11485 + }, + { + "epoch": 0.4, + "learning_rate": 1.3157197527107267e-05, + "loss": 0.6462, + "step": 11486 + }, + { + "epoch": 0.4, + "learning_rate": 1.3156164336344179e-05, + "loss": 0.624, + "step": 11487 + }, + { + "epoch": 0.4, + "learning_rate": 1.3155131108160775e-05, + "loss": 0.6053, + "step": 11488 + }, + { + "epoch": 0.4, + "learning_rate": 1.3154097842569297e-05, + "loss": 0.6055, + "step": 11489 + }, + { + "epoch": 0.4, + "learning_rate": 1.3153064539582e-05, + "loss": 0.6615, + "step": 11490 + }, + { + "epoch": 0.4, + "learning_rate": 1.3152031199211135e-05, + "loss": 0.6677, + "step": 11491 + }, + { + "epoch": 0.4, + "learning_rate": 1.3150997821468951e-05, + "loss": 0.6168, + "step": 11492 + }, + { + "epoch": 0.4, + "learning_rate": 1.3149964406367703e-05, + "loss": 0.6023, + "step": 11493 + }, + { + "epoch": 0.4, + "learning_rate": 1.3148930953919643e-05, + "loss": 0.6487, + "step": 11494 + }, + { + "epoch": 0.4, + "learning_rate": 1.3147897464137023e-05, + "loss": 0.6029, + "step": 11495 + }, + { + "epoch": 0.4, + "learning_rate": 1.3146863937032095e-05, + "loss": 0.6258, + "step": 11496 + }, + { + "epoch": 0.4, + "learning_rate": 1.3145830372617116e-05, + "loss": 0.6423, + "step": 11497 + }, + { + "epoch": 0.4, + "learning_rate": 1.3144796770904337e-05, + "loss": 0.6578, + "step": 11498 + }, + { + "epoch": 0.4, + "learning_rate": 1.3143763131906018e-05, + "loss": 0.5901, + "step": 11499 + }, + { + "epoch": 0.4, + "learning_rate": 1.3142729455634404e-05, + "loss": 0.6407, + "step": 11500 + }, + { + "epoch": 0.4, + "learning_rate": 1.3141695742101758e-05, + "loss": 0.5907, + "step": 11501 + }, + { + "epoch": 0.4, + "learning_rate": 1.314066199132034e-05, + "loss": 0.6077, + "step": 11502 + }, + { + "epoch": 0.4, + "learning_rate": 1.3139628203302395e-05, + "loss": 0.6238, + "step": 11503 + }, + { + "epoch": 0.4, + "learning_rate": 1.3138594378060188e-05, + "loss": 0.6149, + "step": 11504 + }, + { + "epoch": 0.4, + "learning_rate": 1.3137560515605975e-05, + "loss": 0.6299, + "step": 11505 + }, + { + "epoch": 0.4, + "learning_rate": 1.3136526615952015e-05, + "loss": 0.6056, + "step": 11506 + }, + { + "epoch": 0.4, + "learning_rate": 1.3135492679110559e-05, + "loss": 0.6135, + "step": 11507 + }, + { + "epoch": 0.4, + "learning_rate": 1.3134458705093876e-05, + "loss": 0.6058, + "step": 11508 + }, + { + "epoch": 0.4, + "learning_rate": 1.3133424693914218e-05, + "loss": 0.6409, + "step": 11509 + }, + { + "epoch": 0.4, + "learning_rate": 1.3132390645583844e-05, + "loss": 0.5969, + "step": 11510 + }, + { + "epoch": 0.4, + "learning_rate": 1.3131356560115021e-05, + "loss": 0.6855, + "step": 11511 + }, + { + "epoch": 0.4, + "learning_rate": 1.3130322437520002e-05, + "loss": 0.5766, + "step": 11512 + }, + { + "epoch": 0.4, + "learning_rate": 1.312928827781105e-05, + "loss": 0.6755, + "step": 11513 + }, + { + "epoch": 0.4, + "learning_rate": 1.312825408100043e-05, + "loss": 0.6023, + "step": 11514 + }, + { + "epoch": 0.4, + "learning_rate": 1.3127219847100397e-05, + "loss": 0.5994, + "step": 11515 + }, + { + "epoch": 0.4, + "learning_rate": 1.3126185576123219e-05, + "loss": 0.6314, + "step": 11516 + }, + { + "epoch": 0.4, + "learning_rate": 1.3125151268081156e-05, + "loss": 0.6975, + "step": 11517 + }, + { + "epoch": 0.4, + "learning_rate": 1.312411692298647e-05, + "loss": 0.605, + "step": 11518 + }, + { + "epoch": 0.4, + "learning_rate": 1.3123082540851427e-05, + "loss": 0.5787, + "step": 11519 + }, + { + "epoch": 0.4, + "learning_rate": 1.312204812168829e-05, + "loss": 0.621, + "step": 11520 + }, + { + "epoch": 0.4, + "learning_rate": 1.3121013665509324e-05, + "loss": 0.631, + "step": 11521 + }, + { + "epoch": 0.4, + "learning_rate": 1.311997917232679e-05, + "loss": 0.6259, + "step": 11522 + }, + { + "epoch": 0.4, + "learning_rate": 1.3118944642152958e-05, + "loss": 0.657, + "step": 11523 + }, + { + "epoch": 0.4, + "learning_rate": 1.3117910075000091e-05, + "loss": 0.6539, + "step": 11524 + }, + { + "epoch": 0.4, + "learning_rate": 1.3116875470880457e-05, + "loss": 0.5853, + "step": 11525 + }, + { + "epoch": 0.4, + "learning_rate": 1.3115840829806322e-05, + "loss": 0.6192, + "step": 11526 + }, + { + "epoch": 0.4, + "learning_rate": 1.3114806151789949e-05, + "loss": 0.6189, + "step": 11527 + }, + { + "epoch": 0.4, + "learning_rate": 1.3113771436843612e-05, + "loss": 0.5707, + "step": 11528 + }, + { + "epoch": 0.4, + "learning_rate": 1.3112736684979577e-05, + "loss": 0.6167, + "step": 11529 + }, + { + "epoch": 0.4, + "learning_rate": 1.311170189621011e-05, + "loss": 0.6128, + "step": 11530 + }, + { + "epoch": 0.4, + "learning_rate": 1.3110667070547476e-05, + "loss": 0.6206, + "step": 11531 + }, + { + "epoch": 0.4, + "learning_rate": 1.3109632208003953e-05, + "loss": 0.6994, + "step": 11532 + }, + { + "epoch": 0.4, + "learning_rate": 1.3108597308591808e-05, + "loss": 0.6337, + "step": 11533 + }, + { + "epoch": 0.4, + "learning_rate": 1.3107562372323304e-05, + "loss": 0.6142, + "step": 11534 + }, + { + "epoch": 0.4, + "learning_rate": 1.3106527399210722e-05, + "loss": 0.6335, + "step": 11535 + }, + { + "epoch": 0.4, + "learning_rate": 1.3105492389266327e-05, + "loss": 0.6239, + "step": 11536 + }, + { + "epoch": 0.4, + "learning_rate": 1.3104457342502387e-05, + "loss": 0.6375, + "step": 11537 + }, + { + "epoch": 0.4, + "learning_rate": 1.3103422258931185e-05, + "loss": 0.6374, + "step": 11538 + }, + { + "epoch": 0.4, + "learning_rate": 1.3102387138564983e-05, + "loss": 0.6138, + "step": 11539 + }, + { + "epoch": 0.4, + "learning_rate": 1.3101351981416053e-05, + "loss": 0.5834, + "step": 11540 + }, + { + "epoch": 0.4, + "learning_rate": 1.3100316787496678e-05, + "loss": 0.644, + "step": 11541 + }, + { + "epoch": 0.4, + "learning_rate": 1.3099281556819125e-05, + "loss": 0.6651, + "step": 11542 + }, + { + "epoch": 0.4, + "learning_rate": 1.3098246289395664e-05, + "loss": 0.6324, + "step": 11543 + }, + { + "epoch": 0.4, + "learning_rate": 1.3097210985238578e-05, + "loss": 0.6033, + "step": 11544 + }, + { + "epoch": 0.4, + "eval_loss": 0.5762600302696228, + "eval_runtime": 4922.6934, + "eval_samples_per_second": 112.061, + "eval_steps_per_second": 37.354, + "step": 11544 + }, + { + "epoch": 0.4, + "learning_rate": 1.3096175644360138e-05, + "loss": 0.662, + "step": 11545 + }, + { + "epoch": 0.4, + "learning_rate": 1.3095140266772614e-05, + "loss": 0.6567, + "step": 11546 + }, + { + "epoch": 0.4, + "learning_rate": 1.3094104852488292e-05, + "loss": 0.6154, + "step": 11547 + }, + { + "epoch": 0.4, + "learning_rate": 1.3093069401519443e-05, + "loss": 0.7427, + "step": 11548 + }, + { + "epoch": 0.4, + "learning_rate": 1.3092033913878339e-05, + "loss": 0.5697, + "step": 11549 + }, + { + "epoch": 0.4, + "learning_rate": 1.3090998389577264e-05, + "loss": 0.6315, + "step": 11550 + }, + { + "epoch": 0.4, + "learning_rate": 1.3089962828628498e-05, + "loss": 0.5809, + "step": 11551 + }, + { + "epoch": 0.4, + "learning_rate": 1.3088927231044304e-05, + "loss": 0.668, + "step": 11552 + }, + { + "epoch": 0.4, + "learning_rate": 1.3087891596836976e-05, + "loss": 0.6504, + "step": 11553 + }, + { + "epoch": 0.4, + "learning_rate": 1.3086855926018788e-05, + "loss": 0.6427, + "step": 11554 + }, + { + "epoch": 0.4, + "learning_rate": 1.3085820218602015e-05, + "loss": 0.6349, + "step": 11555 + }, + { + "epoch": 0.4, + "learning_rate": 1.3084784474598942e-05, + "loss": 0.6717, + "step": 11556 + }, + { + "epoch": 0.4, + "learning_rate": 1.3083748694021847e-05, + "loss": 0.6583, + "step": 11557 + }, + { + "epoch": 0.4, + "learning_rate": 1.3082712876883005e-05, + "loss": 0.616, + "step": 11558 + }, + { + "epoch": 0.4, + "learning_rate": 1.3081677023194707e-05, + "loss": 0.6281, + "step": 11559 + }, + { + "epoch": 0.4, + "learning_rate": 1.3080641132969231e-05, + "loss": 0.6229, + "step": 11560 + }, + { + "epoch": 0.4, + "learning_rate": 1.3079605206218854e-05, + "loss": 0.594, + "step": 11561 + }, + { + "epoch": 0.4, + "learning_rate": 1.3078569242955864e-05, + "loss": 0.6541, + "step": 11562 + }, + { + "epoch": 0.4, + "learning_rate": 1.3077533243192541e-05, + "loss": 0.6036, + "step": 11563 + }, + { + "epoch": 0.4, + "learning_rate": 1.3076497206941165e-05, + "loss": 0.6025, + "step": 11564 + }, + { + "epoch": 0.4, + "learning_rate": 1.3075461134214024e-05, + "loss": 0.5859, + "step": 11565 + }, + { + "epoch": 0.4, + "learning_rate": 1.3074425025023405e-05, + "loss": 0.6884, + "step": 11566 + }, + { + "epoch": 0.4, + "learning_rate": 1.3073388879381582e-05, + "loss": 0.6299, + "step": 11567 + }, + { + "epoch": 0.4, + "learning_rate": 1.307235269730085e-05, + "loss": 0.6414, + "step": 11568 + }, + { + "epoch": 0.4, + "learning_rate": 1.307131647879349e-05, + "loss": 0.6114, + "step": 11569 + }, + { + "epoch": 0.4, + "learning_rate": 1.3070280223871787e-05, + "loss": 0.6416, + "step": 11570 + }, + { + "epoch": 0.4, + "learning_rate": 1.3069243932548026e-05, + "loss": 0.6549, + "step": 11571 + }, + { + "epoch": 0.4, + "learning_rate": 1.30682076048345e-05, + "loss": 0.5729, + "step": 11572 + }, + { + "epoch": 0.4, + "learning_rate": 1.3067171240743487e-05, + "loss": 0.6443, + "step": 11573 + }, + { + "epoch": 0.4, + "learning_rate": 1.3066134840287282e-05, + "loss": 0.6223, + "step": 11574 + }, + { + "epoch": 0.4, + "learning_rate": 1.3065098403478169e-05, + "loss": 0.6039, + "step": 11575 + }, + { + "epoch": 0.4, + "learning_rate": 1.3064061930328438e-05, + "loss": 0.6499, + "step": 11576 + }, + { + "epoch": 0.4, + "learning_rate": 1.3063025420850375e-05, + "loss": 0.6371, + "step": 11577 + }, + { + "epoch": 0.4, + "learning_rate": 1.3061988875056274e-05, + "loss": 0.6174, + "step": 11578 + }, + { + "epoch": 0.4, + "learning_rate": 1.3060952292958418e-05, + "loss": 0.6105, + "step": 11579 + }, + { + "epoch": 0.4, + "learning_rate": 1.3059915674569099e-05, + "loss": 0.5876, + "step": 11580 + }, + { + "epoch": 0.4, + "learning_rate": 1.3058879019900614e-05, + "loss": 0.6341, + "step": 11581 + }, + { + "epoch": 0.4, + "learning_rate": 1.3057842328965244e-05, + "loss": 0.6575, + "step": 11582 + }, + { + "epoch": 0.4, + "learning_rate": 1.3056805601775286e-05, + "loss": 0.6011, + "step": 11583 + }, + { + "epoch": 0.4, + "learning_rate": 1.3055768838343035e-05, + "loss": 0.6456, + "step": 11584 + }, + { + "epoch": 0.4, + "learning_rate": 1.3054732038680776e-05, + "loss": 0.6678, + "step": 11585 + }, + { + "epoch": 0.4, + "learning_rate": 1.3053695202800802e-05, + "loss": 0.6379, + "step": 11586 + }, + { + "epoch": 0.4, + "learning_rate": 1.3052658330715411e-05, + "loss": 0.6255, + "step": 11587 + }, + { + "epoch": 0.4, + "learning_rate": 1.3051621422436892e-05, + "loss": 0.6705, + "step": 11588 + }, + { + "epoch": 0.4, + "learning_rate": 1.3050584477977544e-05, + "loss": 0.6223, + "step": 11589 + }, + { + "epoch": 0.4, + "learning_rate": 1.3049547497349657e-05, + "loss": 0.6235, + "step": 11590 + }, + { + "epoch": 0.4, + "learning_rate": 1.3048510480565525e-05, + "loss": 0.6306, + "step": 11591 + }, + { + "epoch": 0.4, + "learning_rate": 1.3047473427637448e-05, + "loss": 0.659, + "step": 11592 + }, + { + "epoch": 0.4, + "learning_rate": 1.3046436338577713e-05, + "loss": 0.6334, + "step": 11593 + }, + { + "epoch": 0.4, + "learning_rate": 1.3045399213398624e-05, + "loss": 0.6441, + "step": 11594 + }, + { + "epoch": 0.4, + "learning_rate": 1.3044362052112478e-05, + "loss": 0.5832, + "step": 11595 + }, + { + "epoch": 0.4, + "learning_rate": 1.3043324854731565e-05, + "loss": 0.6516, + "step": 11596 + }, + { + "epoch": 0.4, + "learning_rate": 1.3042287621268185e-05, + "loss": 0.6603, + "step": 11597 + }, + { + "epoch": 0.4, + "learning_rate": 1.3041250351734643e-05, + "loss": 0.6068, + "step": 11598 + }, + { + "epoch": 0.4, + "learning_rate": 1.3040213046143224e-05, + "loss": 0.6282, + "step": 11599 + }, + { + "epoch": 0.4, + "learning_rate": 1.3039175704506237e-05, + "loss": 0.6688, + "step": 11600 + }, + { + "epoch": 0.4, + "learning_rate": 1.303813832683598e-05, + "loss": 0.5768, + "step": 11601 + }, + { + "epoch": 0.4, + "learning_rate": 1.3037100913144744e-05, + "loss": 0.6134, + "step": 11602 + }, + { + "epoch": 0.4, + "learning_rate": 1.3036063463444837e-05, + "loss": 0.6444, + "step": 11603 + }, + { + "epoch": 0.4, + "learning_rate": 1.3035025977748559e-05, + "loss": 0.6491, + "step": 11604 + }, + { + "epoch": 0.4, + "learning_rate": 1.3033988456068205e-05, + "loss": 0.5782, + "step": 11605 + }, + { + "epoch": 0.4, + "learning_rate": 1.3032950898416082e-05, + "loss": 0.6592, + "step": 11606 + }, + { + "epoch": 0.4, + "learning_rate": 1.303191330480449e-05, + "loss": 0.6457, + "step": 11607 + }, + { + "epoch": 0.4, + "learning_rate": 1.3030875675245728e-05, + "loss": 0.6522, + "step": 11608 + }, + { + "epoch": 0.4, + "learning_rate": 1.3029838009752103e-05, + "loss": 0.6413, + "step": 11609 + }, + { + "epoch": 0.4, + "learning_rate": 1.3028800308335917e-05, + "loss": 0.5872, + "step": 11610 + }, + { + "epoch": 0.4, + "learning_rate": 1.3027762571009467e-05, + "loss": 0.6316, + "step": 11611 + }, + { + "epoch": 0.4, + "learning_rate": 1.3026724797785063e-05, + "loss": 0.6285, + "step": 11612 + }, + { + "epoch": 0.4, + "learning_rate": 1.3025686988675013e-05, + "loss": 0.6206, + "step": 11613 + }, + { + "epoch": 0.4, + "learning_rate": 1.302464914369161e-05, + "loss": 0.638, + "step": 11614 + }, + { + "epoch": 0.4, + "learning_rate": 1.3023611262847168e-05, + "loss": 0.6602, + "step": 11615 + }, + { + "epoch": 0.4, + "learning_rate": 1.302257334615399e-05, + "loss": 0.6329, + "step": 11616 + }, + { + "epoch": 0.4, + "learning_rate": 1.302153539362438e-05, + "loss": 0.6314, + "step": 11617 + }, + { + "epoch": 0.4, + "learning_rate": 1.3020497405270647e-05, + "loss": 0.645, + "step": 11618 + }, + { + "epoch": 0.4, + "learning_rate": 1.3019459381105098e-05, + "loss": 0.6271, + "step": 11619 + }, + { + "epoch": 0.4, + "learning_rate": 1.3018421321140033e-05, + "loss": 0.6122, + "step": 11620 + }, + { + "epoch": 0.4, + "learning_rate": 1.3017383225387768e-05, + "loss": 0.6368, + "step": 11621 + }, + { + "epoch": 0.4, + "learning_rate": 1.301634509386061e-05, + "loss": 0.6538, + "step": 11622 + }, + { + "epoch": 0.4, + "learning_rate": 1.3015306926570863e-05, + "loss": 0.6039, + "step": 11623 + }, + { + "epoch": 0.4, + "learning_rate": 1.3014268723530837e-05, + "loss": 0.634, + "step": 11624 + }, + { + "epoch": 0.4, + "learning_rate": 1.3013230484752844e-05, + "loss": 0.6561, + "step": 11625 + }, + { + "epoch": 0.4, + "learning_rate": 1.301219221024919e-05, + "loss": 0.6333, + "step": 11626 + }, + { + "epoch": 0.4, + "learning_rate": 1.3011153900032188e-05, + "loss": 0.6076, + "step": 11627 + }, + { + "epoch": 0.4, + "learning_rate": 1.3010115554114147e-05, + "loss": 0.6804, + "step": 11628 + }, + { + "epoch": 0.4, + "learning_rate": 1.300907717250738e-05, + "loss": 0.6117, + "step": 11629 + }, + { + "epoch": 0.4, + "learning_rate": 1.3008038755224193e-05, + "loss": 0.6682, + "step": 11630 + }, + { + "epoch": 0.4, + "learning_rate": 1.3007000302276905e-05, + "loss": 0.6513, + "step": 11631 + }, + { + "epoch": 0.4, + "learning_rate": 1.3005961813677824e-05, + "loss": 0.6561, + "step": 11632 + }, + { + "epoch": 0.4, + "learning_rate": 1.300492328943926e-05, + "loss": 0.6379, + "step": 11633 + }, + { + "epoch": 0.4, + "learning_rate": 1.3003884729573532e-05, + "loss": 0.6216, + "step": 11634 + }, + { + "epoch": 0.4, + "learning_rate": 1.3002846134092952e-05, + "loss": 0.632, + "step": 11635 + }, + { + "epoch": 0.4, + "learning_rate": 1.3001807503009829e-05, + "loss": 0.6923, + "step": 11636 + }, + { + "epoch": 0.4, + "learning_rate": 1.3000768836336483e-05, + "loss": 0.6048, + "step": 11637 + }, + { + "epoch": 0.4, + "learning_rate": 1.2999730134085226e-05, + "loss": 0.6215, + "step": 11638 + }, + { + "epoch": 0.4, + "learning_rate": 1.299869139626837e-05, + "loss": 0.667, + "step": 11639 + }, + { + "epoch": 0.4, + "learning_rate": 1.299765262289824e-05, + "loss": 0.594, + "step": 11640 + }, + { + "epoch": 0.4, + "learning_rate": 1.2996613813987145e-05, + "loss": 0.6872, + "step": 11641 + }, + { + "epoch": 0.4, + "learning_rate": 1.2995574969547398e-05, + "loss": 0.6531, + "step": 11642 + }, + { + "epoch": 0.4, + "learning_rate": 1.2994536089591324e-05, + "loss": 0.5986, + "step": 11643 + }, + { + "epoch": 0.4, + "learning_rate": 1.2993497174131238e-05, + "loss": 0.6453, + "step": 11644 + }, + { + "epoch": 0.4, + "learning_rate": 1.2992458223179451e-05, + "loss": 0.6342, + "step": 11645 + }, + { + "epoch": 0.4, + "learning_rate": 1.299141923674829e-05, + "loss": 0.5949, + "step": 11646 + }, + { + "epoch": 0.4, + "learning_rate": 1.2990380214850072e-05, + "loss": 0.627, + "step": 11647 + }, + { + "epoch": 0.4, + "learning_rate": 1.2989341157497108e-05, + "loss": 0.6639, + "step": 11648 + }, + { + "epoch": 0.4, + "learning_rate": 1.2988302064701728e-05, + "loss": 0.6603, + "step": 11649 + }, + { + "epoch": 0.4, + "learning_rate": 1.2987262936476246e-05, + "loss": 0.6471, + "step": 11650 + }, + { + "epoch": 0.4, + "learning_rate": 1.2986223772832977e-05, + "loss": 0.6289, + "step": 11651 + }, + { + "epoch": 0.4, + "learning_rate": 1.2985184573784256e-05, + "loss": 0.7017, + "step": 11652 + }, + { + "epoch": 0.4, + "learning_rate": 1.2984145339342393e-05, + "loss": 0.6367, + "step": 11653 + }, + { + "epoch": 0.4, + "learning_rate": 1.2983106069519708e-05, + "loss": 0.6439, + "step": 11654 + }, + { + "epoch": 0.4, + "learning_rate": 1.298206676432853e-05, + "loss": 0.6715, + "step": 11655 + }, + { + "epoch": 0.4, + "learning_rate": 1.2981027423781179e-05, + "loss": 0.6626, + "step": 11656 + }, + { + "epoch": 0.4, + "learning_rate": 1.2979988047889976e-05, + "loss": 0.6015, + "step": 11657 + }, + { + "epoch": 0.4, + "learning_rate": 1.2978948636667243e-05, + "loss": 0.6134, + "step": 11658 + }, + { + "epoch": 0.4, + "learning_rate": 1.2977909190125311e-05, + "loss": 0.5886, + "step": 11659 + }, + { + "epoch": 0.4, + "learning_rate": 1.2976869708276492e-05, + "loss": 0.6172, + "step": 11660 + }, + { + "epoch": 0.4, + "learning_rate": 1.2975830191133119e-05, + "loss": 0.6073, + "step": 11661 + }, + { + "epoch": 0.4, + "learning_rate": 1.2974790638707517e-05, + "loss": 0.6445, + "step": 11662 + }, + { + "epoch": 0.4, + "learning_rate": 1.2973751051012007e-05, + "loss": 0.6397, + "step": 11663 + }, + { + "epoch": 0.4, + "learning_rate": 1.2972711428058915e-05, + "loss": 0.6362, + "step": 11664 + }, + { + "epoch": 0.4, + "learning_rate": 1.2971671769860572e-05, + "loss": 0.6573, + "step": 11665 + }, + { + "epoch": 0.4, + "learning_rate": 1.2970632076429299e-05, + "loss": 0.5928, + "step": 11666 + }, + { + "epoch": 0.4, + "learning_rate": 1.2969592347777424e-05, + "loss": 0.6853, + "step": 11667 + }, + { + "epoch": 0.4, + "learning_rate": 1.2968552583917279e-05, + "loss": 0.681, + "step": 11668 + }, + { + "epoch": 0.4, + "learning_rate": 1.2967512784861183e-05, + "loss": 0.6349, + "step": 11669 + }, + { + "epoch": 0.4, + "learning_rate": 1.2966472950621469e-05, + "loss": 0.5678, + "step": 11670 + }, + { + "epoch": 0.4, + "learning_rate": 1.296543308121047e-05, + "loss": 0.6649, + "step": 11671 + }, + { + "epoch": 0.4, + "learning_rate": 1.2964393176640508e-05, + "loss": 0.6165, + "step": 11672 + }, + { + "epoch": 0.4, + "learning_rate": 1.2963353236923914e-05, + "loss": 0.5998, + "step": 11673 + }, + { + "epoch": 0.4, + "learning_rate": 1.2962313262073022e-05, + "loss": 0.6044, + "step": 11674 + }, + { + "epoch": 0.4, + "learning_rate": 1.2961273252100155e-05, + "loss": 0.6804, + "step": 11675 + }, + { + "epoch": 0.4, + "learning_rate": 1.296023320701765e-05, + "loss": 0.6257, + "step": 11676 + }, + { + "epoch": 0.4, + "learning_rate": 1.2959193126837834e-05, + "loss": 0.6319, + "step": 11677 + }, + { + "epoch": 0.4, + "learning_rate": 1.2958153011573042e-05, + "loss": 0.6167, + "step": 11678 + }, + { + "epoch": 0.4, + "learning_rate": 1.2957112861235604e-05, + "loss": 0.5979, + "step": 11679 + }, + { + "epoch": 0.4, + "learning_rate": 1.2956072675837849e-05, + "loss": 0.6092, + "step": 11680 + }, + { + "epoch": 0.4, + "learning_rate": 1.2955032455392115e-05, + "loss": 0.6428, + "step": 11681 + }, + { + "epoch": 0.4, + "learning_rate": 1.2953992199910734e-05, + "loss": 0.6451, + "step": 11682 + }, + { + "epoch": 0.4, + "learning_rate": 1.295295190940604e-05, + "loss": 0.6561, + "step": 11683 + }, + { + "epoch": 0.4, + "learning_rate": 1.2951911583890362e-05, + "loss": 0.6482, + "step": 11684 + }, + { + "epoch": 0.4, + "learning_rate": 1.295087122337604e-05, + "loss": 0.6619, + "step": 11685 + }, + { + "epoch": 0.4, + "learning_rate": 1.2949830827875406e-05, + "loss": 0.6586, + "step": 11686 + }, + { + "epoch": 0.4, + "learning_rate": 1.2948790397400796e-05, + "loss": 0.6436, + "step": 11687 + }, + { + "epoch": 0.4, + "learning_rate": 1.2947749931964548e-05, + "loss": 0.5652, + "step": 11688 + }, + { + "epoch": 0.4, + "learning_rate": 1.2946709431578993e-05, + "loss": 0.6562, + "step": 11689 + }, + { + "epoch": 0.41, + "learning_rate": 1.2945668896256469e-05, + "loss": 0.6139, + "step": 11690 + }, + { + "epoch": 0.41, + "learning_rate": 1.2944628326009317e-05, + "loss": 0.6095, + "step": 11691 + }, + { + "epoch": 0.41, + "learning_rate": 1.294358772084987e-05, + "loss": 0.6238, + "step": 11692 + }, + { + "epoch": 0.41, + "learning_rate": 1.2942547080790467e-05, + "loss": 0.6166, + "step": 11693 + }, + { + "epoch": 0.41, + "learning_rate": 1.2941506405843444e-05, + "loss": 0.6793, + "step": 11694 + }, + { + "epoch": 0.41, + "learning_rate": 1.2940465696021142e-05, + "loss": 0.6755, + "step": 11695 + }, + { + "epoch": 0.41, + "learning_rate": 1.29394249513359e-05, + "loss": 0.6327, + "step": 11696 + }, + { + "epoch": 0.41, + "learning_rate": 1.293838417180006e-05, + "loss": 0.5996, + "step": 11697 + }, + { + "epoch": 0.41, + "learning_rate": 1.2937343357425955e-05, + "loss": 0.685, + "step": 11698 + }, + { + "epoch": 0.41, + "learning_rate": 1.293630250822593e-05, + "loss": 0.6123, + "step": 11699 + }, + { + "epoch": 0.41, + "learning_rate": 1.2935261624212326e-05, + "loss": 0.6636, + "step": 11700 + }, + { + "epoch": 0.41, + "learning_rate": 1.293422070539748e-05, + "loss": 0.6659, + "step": 11701 + }, + { + "epoch": 0.41, + "learning_rate": 1.2933179751793734e-05, + "loss": 0.6292, + "step": 11702 + }, + { + "epoch": 0.41, + "learning_rate": 1.2932138763413438e-05, + "loss": 0.6269, + "step": 11703 + }, + { + "epoch": 0.41, + "learning_rate": 1.293109774026892e-05, + "loss": 0.6308, + "step": 11704 + }, + { + "epoch": 0.41, + "learning_rate": 1.2930056682372534e-05, + "loss": 0.6003, + "step": 11705 + }, + { + "epoch": 0.41, + "learning_rate": 1.2929015589736622e-05, + "loss": 0.5863, + "step": 11706 + }, + { + "epoch": 0.41, + "learning_rate": 1.292797446237352e-05, + "loss": 0.623, + "step": 11707 + }, + { + "epoch": 0.41, + "learning_rate": 1.2926933300295579e-05, + "loss": 0.6669, + "step": 11708 + }, + { + "epoch": 0.41, + "learning_rate": 1.2925892103515143e-05, + "loss": 0.6463, + "step": 11709 + }, + { + "epoch": 0.41, + "learning_rate": 1.2924850872044552e-05, + "loss": 0.6057, + "step": 11710 + }, + { + "epoch": 0.41, + "learning_rate": 1.2923809605896156e-05, + "loss": 0.6458, + "step": 11711 + }, + { + "epoch": 0.41, + "learning_rate": 1.2922768305082298e-05, + "loss": 0.6402, + "step": 11712 + }, + { + "epoch": 0.41, + "learning_rate": 1.2921726969615325e-05, + "loss": 0.6155, + "step": 11713 + }, + { + "epoch": 0.41, + "learning_rate": 1.292068559950758e-05, + "loss": 0.6006, + "step": 11714 + }, + { + "epoch": 0.41, + "learning_rate": 1.2919644194771417e-05, + "loss": 0.6395, + "step": 11715 + }, + { + "epoch": 0.41, + "learning_rate": 1.2918602755419174e-05, + "loss": 0.6041, + "step": 11716 + }, + { + "epoch": 0.41, + "learning_rate": 1.2917561281463205e-05, + "loss": 0.622, + "step": 11717 + }, + { + "epoch": 0.41, + "learning_rate": 1.291651977291586e-05, + "loss": 0.6658, + "step": 11718 + }, + { + "epoch": 0.41, + "learning_rate": 1.2915478229789478e-05, + "loss": 0.6388, + "step": 11719 + }, + { + "epoch": 0.41, + "learning_rate": 1.2914436652096413e-05, + "loss": 0.6487, + "step": 11720 + }, + { + "epoch": 0.41, + "learning_rate": 1.2913395039849021e-05, + "loss": 0.6619, + "step": 11721 + }, + { + "epoch": 0.41, + "learning_rate": 1.291235339305964e-05, + "loss": 0.6253, + "step": 11722 + }, + { + "epoch": 0.41, + "learning_rate": 1.2911311711740626e-05, + "loss": 0.5713, + "step": 11723 + }, + { + "epoch": 0.41, + "learning_rate": 1.2910269995904332e-05, + "loss": 0.6197, + "step": 11724 + }, + { + "epoch": 0.41, + "learning_rate": 1.2909228245563103e-05, + "loss": 0.6425, + "step": 11725 + }, + { + "epoch": 0.41, + "learning_rate": 1.2908186460729294e-05, + "loss": 0.5766, + "step": 11726 + }, + { + "epoch": 0.41, + "learning_rate": 1.2907144641415256e-05, + "loss": 0.6258, + "step": 11727 + }, + { + "epoch": 0.41, + "learning_rate": 1.290610278763334e-05, + "loss": 0.6755, + "step": 11728 + }, + { + "epoch": 0.41, + "learning_rate": 1.2905060899395897e-05, + "loss": 0.6255, + "step": 11729 + }, + { + "epoch": 0.41, + "learning_rate": 1.2904018976715287e-05, + "loss": 0.6511, + "step": 11730 + }, + { + "epoch": 0.41, + "learning_rate": 1.2902977019603855e-05, + "loss": 0.633, + "step": 11731 + }, + { + "epoch": 0.41, + "learning_rate": 1.2901935028073957e-05, + "loss": 0.6165, + "step": 11732 + }, + { + "epoch": 0.41, + "learning_rate": 1.2900893002137953e-05, + "loss": 0.5828, + "step": 11733 + }, + { + "epoch": 0.41, + "learning_rate": 1.289985094180819e-05, + "loss": 0.6591, + "step": 11734 + }, + { + "epoch": 0.41, + "learning_rate": 1.2898808847097025e-05, + "loss": 0.5781, + "step": 11735 + }, + { + "epoch": 0.41, + "learning_rate": 1.2897766718016815e-05, + "loss": 0.6462, + "step": 11736 + }, + { + "epoch": 0.41, + "learning_rate": 1.2896724554579916e-05, + "loss": 0.6387, + "step": 11737 + }, + { + "epoch": 0.41, + "learning_rate": 1.289568235679868e-05, + "loss": 0.6461, + "step": 11738 + }, + { + "epoch": 0.41, + "learning_rate": 1.2894640124685469e-05, + "loss": 0.6447, + "step": 11739 + }, + { + "epoch": 0.41, + "learning_rate": 1.2893597858252637e-05, + "loss": 0.6014, + "step": 11740 + }, + { + "epoch": 0.41, + "learning_rate": 1.2892555557512544e-05, + "loss": 0.6021, + "step": 11741 + }, + { + "epoch": 0.41, + "learning_rate": 1.2891513222477543e-05, + "loss": 0.6364, + "step": 11742 + }, + { + "epoch": 0.41, + "learning_rate": 1.2890470853159995e-05, + "loss": 0.6596, + "step": 11743 + }, + { + "epoch": 0.41, + "learning_rate": 1.2889428449572258e-05, + "loss": 0.5865, + "step": 11744 + }, + { + "epoch": 0.41, + "learning_rate": 1.2888386011726695e-05, + "loss": 0.5962, + "step": 11745 + }, + { + "epoch": 0.41, + "learning_rate": 1.288734353963566e-05, + "loss": 0.6969, + "step": 11746 + }, + { + "epoch": 0.41, + "learning_rate": 1.2886301033311515e-05, + "loss": 0.6304, + "step": 11747 + }, + { + "epoch": 0.41, + "learning_rate": 1.288525849276662e-05, + "loss": 0.6261, + "step": 11748 + }, + { + "epoch": 0.41, + "learning_rate": 1.2884215918013335e-05, + "loss": 0.5893, + "step": 11749 + }, + { + "epoch": 0.41, + "learning_rate": 1.2883173309064022e-05, + "loss": 0.6418, + "step": 11750 + }, + { + "epoch": 0.41, + "learning_rate": 1.2882130665931044e-05, + "loss": 0.6183, + "step": 11751 + }, + { + "epoch": 0.41, + "learning_rate": 1.2881087988626756e-05, + "loss": 0.6507, + "step": 11752 + }, + { + "epoch": 0.41, + "learning_rate": 1.2880045277163531e-05, + "loss": 0.6118, + "step": 11753 + }, + { + "epoch": 0.41, + "learning_rate": 1.2879002531553724e-05, + "loss": 0.6316, + "step": 11754 + }, + { + "epoch": 0.41, + "learning_rate": 1.2877959751809699e-05, + "loss": 0.6159, + "step": 11755 + }, + { + "epoch": 0.41, + "learning_rate": 1.2876916937943822e-05, + "loss": 0.6541, + "step": 11756 + }, + { + "epoch": 0.41, + "learning_rate": 1.2875874089968452e-05, + "loss": 0.6414, + "step": 11757 + }, + { + "epoch": 0.41, + "learning_rate": 1.2874831207895962e-05, + "loss": 0.597, + "step": 11758 + }, + { + "epoch": 0.41, + "learning_rate": 1.2873788291738707e-05, + "loss": 0.6786, + "step": 11759 + }, + { + "epoch": 0.41, + "learning_rate": 1.2872745341509059e-05, + "loss": 0.6358, + "step": 11760 + }, + { + "epoch": 0.41, + "learning_rate": 1.287170235721938e-05, + "loss": 0.6547, + "step": 11761 + }, + { + "epoch": 0.41, + "learning_rate": 1.2870659338882037e-05, + "loss": 0.6543, + "step": 11762 + }, + { + "epoch": 0.41, + "learning_rate": 1.2869616286509394e-05, + "loss": 0.6043, + "step": 11763 + }, + { + "epoch": 0.41, + "learning_rate": 1.2868573200113823e-05, + "loss": 0.6794, + "step": 11764 + }, + { + "epoch": 0.41, + "learning_rate": 1.2867530079707686e-05, + "loss": 0.6508, + "step": 11765 + }, + { + "epoch": 0.41, + "learning_rate": 1.2866486925303355e-05, + "loss": 0.585, + "step": 11766 + }, + { + "epoch": 0.41, + "learning_rate": 1.2865443736913194e-05, + "loss": 0.6419, + "step": 11767 + }, + { + "epoch": 0.41, + "learning_rate": 1.2864400514549571e-05, + "loss": 0.6185, + "step": 11768 + }, + { + "epoch": 0.41, + "learning_rate": 1.2863357258224855e-05, + "loss": 0.702, + "step": 11769 + }, + { + "epoch": 0.41, + "learning_rate": 1.2862313967951423e-05, + "loss": 0.6028, + "step": 11770 + }, + { + "epoch": 0.41, + "learning_rate": 1.2861270643741633e-05, + "loss": 0.5854, + "step": 11771 + }, + { + "epoch": 0.41, + "learning_rate": 1.286022728560786e-05, + "loss": 0.6297, + "step": 11772 + }, + { + "epoch": 0.41, + "learning_rate": 1.2859183893562479e-05, + "loss": 0.6441, + "step": 11773 + }, + { + "epoch": 0.41, + "learning_rate": 1.285814046761785e-05, + "loss": 0.6251, + "step": 11774 + }, + { + "epoch": 0.41, + "learning_rate": 1.2857097007786351e-05, + "loss": 0.6314, + "step": 11775 + }, + { + "epoch": 0.41, + "learning_rate": 1.2856053514080357e-05, + "loss": 0.6889, + "step": 11776 + }, + { + "epoch": 0.41, + "learning_rate": 1.2855009986512234e-05, + "loss": 0.6164, + "step": 11777 + }, + { + "epoch": 0.41, + "learning_rate": 1.2853966425094355e-05, + "loss": 0.6779, + "step": 11778 + }, + { + "epoch": 0.41, + "learning_rate": 1.2852922829839094e-05, + "loss": 0.7002, + "step": 11779 + }, + { + "epoch": 0.41, + "learning_rate": 1.2851879200758823e-05, + "loss": 0.646, + "step": 11780 + }, + { + "epoch": 0.41, + "learning_rate": 1.285083553786592e-05, + "loss": 0.6573, + "step": 11781 + }, + { + "epoch": 0.41, + "learning_rate": 1.2849791841172752e-05, + "loss": 0.6158, + "step": 11782 + }, + { + "epoch": 0.41, + "learning_rate": 1.2848748110691696e-05, + "loss": 0.62, + "step": 11783 + }, + { + "epoch": 0.41, + "learning_rate": 1.284770434643513e-05, + "loss": 0.578, + "step": 11784 + }, + { + "epoch": 0.41, + "learning_rate": 1.2846660548415426e-05, + "loss": 0.574, + "step": 11785 + }, + { + "epoch": 0.41, + "learning_rate": 1.2845616716644958e-05, + "loss": 0.6502, + "step": 11786 + }, + { + "epoch": 0.41, + "learning_rate": 1.2844572851136108e-05, + "loss": 0.6563, + "step": 11787 + }, + { + "epoch": 0.41, + "learning_rate": 1.2843528951901245e-05, + "loss": 0.6478, + "step": 11788 + }, + { + "epoch": 0.41, + "learning_rate": 1.2842485018952749e-05, + "loss": 0.5999, + "step": 11789 + }, + { + "epoch": 0.41, + "learning_rate": 1.2841441052303001e-05, + "loss": 0.6947, + "step": 11790 + }, + { + "epoch": 0.41, + "learning_rate": 1.284039705196437e-05, + "loss": 0.6663, + "step": 11791 + }, + { + "epoch": 0.41, + "learning_rate": 1.283935301794924e-05, + "loss": 0.6595, + "step": 11792 + }, + { + "epoch": 0.41, + "learning_rate": 1.2838308950269993e-05, + "loss": 0.6273, + "step": 11793 + }, + { + "epoch": 0.41, + "learning_rate": 1.2837264848939e-05, + "loss": 0.6173, + "step": 11794 + }, + { + "epoch": 0.41, + "learning_rate": 1.2836220713968639e-05, + "loss": 0.6468, + "step": 11795 + }, + { + "epoch": 0.41, + "learning_rate": 1.2835176545371299e-05, + "loss": 0.6583, + "step": 11796 + }, + { + "epoch": 0.41, + "learning_rate": 1.2834132343159353e-05, + "loss": 0.6092, + "step": 11797 + }, + { + "epoch": 0.41, + "learning_rate": 1.2833088107345181e-05, + "loss": 0.6711, + "step": 11798 + }, + { + "epoch": 0.41, + "learning_rate": 1.2832043837941168e-05, + "loss": 0.5535, + "step": 11799 + }, + { + "epoch": 0.41, + "learning_rate": 1.2830999534959692e-05, + "loss": 0.6278, + "step": 11800 + }, + { + "epoch": 0.41, + "learning_rate": 1.2829955198413136e-05, + "loss": 0.6406, + "step": 11801 + }, + { + "epoch": 0.41, + "learning_rate": 1.282891082831388e-05, + "loss": 0.6265, + "step": 11802 + }, + { + "epoch": 0.41, + "learning_rate": 1.2827866424674307e-05, + "loss": 0.6646, + "step": 11803 + }, + { + "epoch": 0.41, + "learning_rate": 1.2826821987506802e-05, + "loss": 0.6351, + "step": 11804 + }, + { + "epoch": 0.41, + "learning_rate": 1.2825777516823745e-05, + "loss": 0.6403, + "step": 11805 + }, + { + "epoch": 0.41, + "learning_rate": 1.2824733012637523e-05, + "loss": 0.6291, + "step": 11806 + }, + { + "epoch": 0.41, + "learning_rate": 1.2823688474960514e-05, + "loss": 0.6516, + "step": 11807 + }, + { + "epoch": 0.41, + "learning_rate": 1.2822643903805113e-05, + "loss": 0.6368, + "step": 11808 + }, + { + "epoch": 0.41, + "learning_rate": 1.2821599299183692e-05, + "loss": 0.6445, + "step": 11809 + }, + { + "epoch": 0.41, + "learning_rate": 1.2820554661108639e-05, + "loss": 0.6193, + "step": 11810 + }, + { + "epoch": 0.41, + "learning_rate": 1.2819509989592351e-05, + "loss": 0.5917, + "step": 11811 + }, + { + "epoch": 0.41, + "learning_rate": 1.28184652846472e-05, + "loss": 0.6594, + "step": 11812 + }, + { + "epoch": 0.41, + "learning_rate": 1.2817420546285576e-05, + "loss": 0.6318, + "step": 11813 + }, + { + "epoch": 0.41, + "learning_rate": 1.2816375774519874e-05, + "loss": 0.636, + "step": 11814 + }, + { + "epoch": 0.41, + "learning_rate": 1.281533096936247e-05, + "loss": 0.6827, + "step": 11815 + }, + { + "epoch": 0.41, + "learning_rate": 1.2814286130825755e-05, + "loss": 0.6577, + "step": 11816 + }, + { + "epoch": 0.41, + "learning_rate": 1.281324125892212e-05, + "loss": 0.6207, + "step": 11817 + }, + { + "epoch": 0.41, + "learning_rate": 1.281219635366395e-05, + "loss": 0.6206, + "step": 11818 + }, + { + "epoch": 0.41, + "learning_rate": 1.2811151415063633e-05, + "loss": 0.6548, + "step": 11819 + }, + { + "epoch": 0.41, + "learning_rate": 1.2810106443133565e-05, + "loss": 0.6766, + "step": 11820 + }, + { + "epoch": 0.41, + "learning_rate": 1.2809061437886127e-05, + "loss": 0.6309, + "step": 11821 + }, + { + "epoch": 0.41, + "learning_rate": 1.2808016399333712e-05, + "loss": 0.5911, + "step": 11822 + }, + { + "epoch": 0.41, + "learning_rate": 1.2806971327488713e-05, + "loss": 0.6217, + "step": 11823 + }, + { + "epoch": 0.41, + "learning_rate": 1.2805926222363516e-05, + "loss": 0.6376, + "step": 11824 + }, + { + "epoch": 0.41, + "learning_rate": 1.2804881083970513e-05, + "loss": 0.6343, + "step": 11825 + }, + { + "epoch": 0.41, + "learning_rate": 1.28038359123221e-05, + "loss": 0.6556, + "step": 11826 + }, + { + "epoch": 0.41, + "learning_rate": 1.2802790707430662e-05, + "loss": 0.6182, + "step": 11827 + }, + { + "epoch": 0.41, + "learning_rate": 1.2801745469308596e-05, + "loss": 0.6836, + "step": 11828 + }, + { + "epoch": 0.41, + "learning_rate": 1.2800700197968294e-05, + "loss": 0.6449, + "step": 11829 + }, + { + "epoch": 0.41, + "learning_rate": 1.2799654893422146e-05, + "loss": 0.6428, + "step": 11830 + }, + { + "epoch": 0.41, + "learning_rate": 1.2798609555682549e-05, + "loss": 0.621, + "step": 11831 + }, + { + "epoch": 0.41, + "learning_rate": 1.2797564184761897e-05, + "loss": 0.6654, + "step": 11832 + }, + { + "epoch": 0.41, + "learning_rate": 1.279651878067258e-05, + "loss": 0.5915, + "step": 11833 + }, + { + "epoch": 0.41, + "learning_rate": 1.2795473343426994e-05, + "loss": 0.602, + "step": 11834 + }, + { + "epoch": 0.41, + "learning_rate": 1.2794427873037541e-05, + "loss": 0.6715, + "step": 11835 + }, + { + "epoch": 0.41, + "learning_rate": 1.2793382369516606e-05, + "loss": 0.6285, + "step": 11836 + }, + { + "epoch": 0.41, + "learning_rate": 1.279233683287659e-05, + "loss": 0.5942, + "step": 11837 + }, + { + "epoch": 0.41, + "learning_rate": 1.279129126312989e-05, + "loss": 0.6349, + "step": 11838 + }, + { + "epoch": 0.41, + "learning_rate": 1.2790245660288898e-05, + "loss": 0.6021, + "step": 11839 + }, + { + "epoch": 0.41, + "learning_rate": 1.278920002436602e-05, + "loss": 0.5839, + "step": 11840 + }, + { + "epoch": 0.41, + "learning_rate": 1.278815435537364e-05, + "loss": 0.5869, + "step": 11841 + }, + { + "epoch": 0.41, + "learning_rate": 1.2787108653324168e-05, + "loss": 0.6652, + "step": 11842 + }, + { + "epoch": 0.41, + "learning_rate": 1.2786062918229996e-05, + "loss": 0.5825, + "step": 11843 + }, + { + "epoch": 0.41, + "learning_rate": 1.2785017150103522e-05, + "loss": 0.5937, + "step": 11844 + }, + { + "epoch": 0.41, + "learning_rate": 1.278397134895715e-05, + "loss": 0.6321, + "step": 11845 + }, + { + "epoch": 0.41, + "learning_rate": 1.2782925514803275e-05, + "loss": 0.6052, + "step": 11846 + }, + { + "epoch": 0.41, + "learning_rate": 1.2781879647654293e-05, + "loss": 0.657, + "step": 11847 + }, + { + "epoch": 0.41, + "learning_rate": 1.2780833747522614e-05, + "loss": 0.6195, + "step": 11848 + }, + { + "epoch": 0.41, + "learning_rate": 1.2779787814420632e-05, + "loss": 0.6846, + "step": 11849 + }, + { + "epoch": 0.41, + "learning_rate": 1.2778741848360747e-05, + "loss": 0.6231, + "step": 11850 + }, + { + "epoch": 0.41, + "learning_rate": 1.2777695849355365e-05, + "loss": 0.6157, + "step": 11851 + }, + { + "epoch": 0.41, + "learning_rate": 1.2776649817416884e-05, + "loss": 0.6495, + "step": 11852 + }, + { + "epoch": 0.41, + "learning_rate": 1.2775603752557706e-05, + "loss": 0.6412, + "step": 11853 + }, + { + "epoch": 0.41, + "learning_rate": 1.2774557654790235e-05, + "loss": 0.6245, + "step": 11854 + }, + { + "epoch": 0.41, + "learning_rate": 1.2773511524126873e-05, + "loss": 0.5888, + "step": 11855 + }, + { + "epoch": 0.41, + "learning_rate": 1.2772465360580024e-05, + "loss": 0.6322, + "step": 11856 + }, + { + "epoch": 0.41, + "learning_rate": 1.2771419164162088e-05, + "loss": 0.5741, + "step": 11857 + }, + { + "epoch": 0.41, + "learning_rate": 1.2770372934885477e-05, + "loss": 0.6675, + "step": 11858 + }, + { + "epoch": 0.41, + "learning_rate": 1.2769326672762587e-05, + "loss": 0.6646, + "step": 11859 + }, + { + "epoch": 0.41, + "learning_rate": 1.2768280377805827e-05, + "loss": 0.6796, + "step": 11860 + }, + { + "epoch": 0.41, + "learning_rate": 1.2767234050027602e-05, + "loss": 0.6545, + "step": 11861 + }, + { + "epoch": 0.41, + "learning_rate": 1.2766187689440315e-05, + "loss": 0.6305, + "step": 11862 + }, + { + "epoch": 0.41, + "learning_rate": 1.2765141296056373e-05, + "loss": 0.6526, + "step": 11863 + }, + { + "epoch": 0.41, + "learning_rate": 1.2764094869888185e-05, + "loss": 0.6807, + "step": 11864 + }, + { + "epoch": 0.41, + "learning_rate": 1.2763048410948156e-05, + "loss": 0.6601, + "step": 11865 + }, + { + "epoch": 0.41, + "learning_rate": 1.2762001919248693e-05, + "loss": 0.6946, + "step": 11866 + }, + { + "epoch": 0.41, + "learning_rate": 1.2760955394802201e-05, + "loss": 0.6262, + "step": 11867 + }, + { + "epoch": 0.41, + "learning_rate": 1.2759908837621091e-05, + "loss": 0.6233, + "step": 11868 + }, + { + "epoch": 0.41, + "learning_rate": 1.2758862247717772e-05, + "loss": 0.6521, + "step": 11869 + }, + { + "epoch": 0.41, + "learning_rate": 1.275781562510465e-05, + "loss": 0.5662, + "step": 11870 + }, + { + "epoch": 0.41, + "learning_rate": 1.2756768969794134e-05, + "loss": 0.6021, + "step": 11871 + }, + { + "epoch": 0.41, + "learning_rate": 1.2755722281798635e-05, + "loss": 0.6774, + "step": 11872 + }, + { + "epoch": 0.41, + "learning_rate": 1.2754675561130566e-05, + "loss": 0.6452, + "step": 11873 + }, + { + "epoch": 0.41, + "learning_rate": 1.2753628807802333e-05, + "loss": 0.6454, + "step": 11874 + }, + { + "epoch": 0.41, + "learning_rate": 1.2752582021826338e-05, + "loss": 0.6288, + "step": 11875 + }, + { + "epoch": 0.41, + "learning_rate": 1.275153520321501e-05, + "loss": 0.649, + "step": 11876 + }, + { + "epoch": 0.41, + "learning_rate": 1.2750488351980751e-05, + "loss": 0.6409, + "step": 11877 + }, + { + "epoch": 0.41, + "learning_rate": 1.2749441468135968e-05, + "loss": 0.6205, + "step": 11878 + }, + { + "epoch": 0.41, + "learning_rate": 1.2748394551693084e-05, + "loss": 0.6285, + "step": 11879 + }, + { + "epoch": 0.41, + "learning_rate": 1.2747347602664504e-05, + "loss": 0.6819, + "step": 11880 + }, + { + "epoch": 0.41, + "learning_rate": 1.274630062106264e-05, + "loss": 0.6775, + "step": 11881 + }, + { + "epoch": 0.41, + "learning_rate": 1.2745253606899913e-05, + "loss": 0.6228, + "step": 11882 + }, + { + "epoch": 0.41, + "learning_rate": 1.274420656018873e-05, + "loss": 0.6235, + "step": 11883 + }, + { + "epoch": 0.41, + "learning_rate": 1.2743159480941502e-05, + "loss": 0.6745, + "step": 11884 + }, + { + "epoch": 0.41, + "learning_rate": 1.2742112369170654e-05, + "loss": 0.6305, + "step": 11885 + }, + { + "epoch": 0.41, + "learning_rate": 1.2741065224888596e-05, + "loss": 0.6367, + "step": 11886 + }, + { + "epoch": 0.41, + "learning_rate": 1.2740018048107734e-05, + "loss": 0.6495, + "step": 11887 + }, + { + "epoch": 0.41, + "learning_rate": 1.2738970838840498e-05, + "loss": 0.5928, + "step": 11888 + }, + { + "epoch": 0.41, + "learning_rate": 1.2737923597099301e-05, + "loss": 0.667, + "step": 11889 + }, + { + "epoch": 0.41, + "learning_rate": 1.273687632289655e-05, + "loss": 0.6198, + "step": 11890 + }, + { + "epoch": 0.41, + "learning_rate": 1.2735829016244673e-05, + "loss": 0.5857, + "step": 11891 + }, + { + "epoch": 0.41, + "learning_rate": 1.273478167715608e-05, + "loss": 0.673, + "step": 11892 + }, + { + "epoch": 0.41, + "learning_rate": 1.2733734305643189e-05, + "loss": 0.6235, + "step": 11893 + }, + { + "epoch": 0.41, + "learning_rate": 1.273268690171842e-05, + "loss": 0.6102, + "step": 11894 + }, + { + "epoch": 0.41, + "learning_rate": 1.2731639465394194e-05, + "loss": 0.641, + "step": 11895 + }, + { + "epoch": 0.41, + "learning_rate": 1.2730591996682922e-05, + "loss": 0.5735, + "step": 11896 + }, + { + "epoch": 0.41, + "learning_rate": 1.2729544495597032e-05, + "loss": 0.6216, + "step": 11897 + }, + { + "epoch": 0.41, + "learning_rate": 1.2728496962148937e-05, + "loss": 0.5745, + "step": 11898 + }, + { + "epoch": 0.41, + "learning_rate": 1.2727449396351057e-05, + "loss": 0.6524, + "step": 11899 + }, + { + "epoch": 0.41, + "learning_rate": 1.2726401798215818e-05, + "loss": 0.6615, + "step": 11900 + }, + { + "epoch": 0.41, + "learning_rate": 1.2725354167755637e-05, + "loss": 0.6541, + "step": 11901 + }, + { + "epoch": 0.41, + "learning_rate": 1.2724306504982931e-05, + "loss": 0.6308, + "step": 11902 + }, + { + "epoch": 0.41, + "learning_rate": 1.2723258809910128e-05, + "loss": 0.6195, + "step": 11903 + }, + { + "epoch": 0.41, + "learning_rate": 1.2722211082549647e-05, + "loss": 0.6444, + "step": 11904 + }, + { + "epoch": 0.41, + "learning_rate": 1.2721163322913908e-05, + "loss": 0.6061, + "step": 11905 + }, + { + "epoch": 0.41, + "learning_rate": 1.2720115531015336e-05, + "loss": 0.6176, + "step": 11906 + }, + { + "epoch": 0.41, + "learning_rate": 1.2719067706866355e-05, + "loss": 0.6656, + "step": 11907 + }, + { + "epoch": 0.41, + "learning_rate": 1.2718019850479383e-05, + "loss": 0.6555, + "step": 11908 + }, + { + "epoch": 0.41, + "learning_rate": 1.2716971961866852e-05, + "loss": 0.6285, + "step": 11909 + }, + { + "epoch": 0.41, + "learning_rate": 1.271592404104118e-05, + "loss": 0.7077, + "step": 11910 + }, + { + "epoch": 0.41, + "learning_rate": 1.2714876088014792e-05, + "loss": 0.6303, + "step": 11911 + }, + { + "epoch": 0.41, + "learning_rate": 1.2713828102800111e-05, + "loss": 0.6183, + "step": 11912 + }, + { + "epoch": 0.41, + "learning_rate": 1.2712780085409571e-05, + "loss": 0.608, + "step": 11913 + }, + { + "epoch": 0.41, + "learning_rate": 1.2711732035855589e-05, + "loss": 0.6418, + "step": 11914 + }, + { + "epoch": 0.41, + "learning_rate": 1.271068395415059e-05, + "loss": 0.6206, + "step": 11915 + }, + { + "epoch": 0.41, + "learning_rate": 1.2709635840307008e-05, + "loss": 0.7225, + "step": 11916 + }, + { + "epoch": 0.41, + "learning_rate": 1.2708587694337262e-05, + "loss": 0.641, + "step": 11917 + }, + { + "epoch": 0.41, + "learning_rate": 1.2707539516253784e-05, + "loss": 0.6347, + "step": 11918 + }, + { + "epoch": 0.41, + "learning_rate": 1.2706491306069003e-05, + "loss": 0.6292, + "step": 11919 + }, + { + "epoch": 0.41, + "learning_rate": 1.2705443063795338e-05, + "loss": 0.623, + "step": 11920 + }, + { + "epoch": 0.41, + "learning_rate": 1.2704394789445225e-05, + "loss": 0.6173, + "step": 11921 + }, + { + "epoch": 0.41, + "learning_rate": 1.2703346483031094e-05, + "loss": 0.66, + "step": 11922 + }, + { + "epoch": 0.41, + "learning_rate": 1.2702298144565366e-05, + "loss": 0.6021, + "step": 11923 + }, + { + "epoch": 0.41, + "learning_rate": 1.2701249774060478e-05, + "loss": 0.6635, + "step": 11924 + }, + { + "epoch": 0.41, + "learning_rate": 1.2700201371528858e-05, + "loss": 0.6615, + "step": 11925 + }, + { + "epoch": 0.41, + "learning_rate": 1.269915293698293e-05, + "loss": 0.623, + "step": 11926 + }, + { + "epoch": 0.41, + "learning_rate": 1.2698104470435133e-05, + "loss": 0.6438, + "step": 11927 + }, + { + "epoch": 0.41, + "learning_rate": 1.2697055971897895e-05, + "loss": 0.6791, + "step": 11928 + }, + { + "epoch": 0.41, + "learning_rate": 1.2696007441383644e-05, + "loss": 0.6225, + "step": 11929 + }, + { + "epoch": 0.41, + "learning_rate": 1.2694958878904818e-05, + "loss": 0.5513, + "step": 11930 + }, + { + "epoch": 0.41, + "learning_rate": 1.2693910284473843e-05, + "loss": 0.6199, + "step": 11931 + }, + { + "epoch": 0.41, + "learning_rate": 1.2692861658103155e-05, + "loss": 0.6527, + "step": 11932 + }, + { + "epoch": 0.41, + "learning_rate": 1.2691812999805184e-05, + "loss": 0.6866, + "step": 11933 + }, + { + "epoch": 0.41, + "learning_rate": 1.2690764309592365e-05, + "loss": 0.572, + "step": 11934 + }, + { + "epoch": 0.41, + "learning_rate": 1.2689715587477132e-05, + "loss": 0.6729, + "step": 11935 + }, + { + "epoch": 0.41, + "learning_rate": 1.2688666833471919e-05, + "loss": 0.6806, + "step": 11936 + }, + { + "epoch": 0.41, + "learning_rate": 1.2687618047589157e-05, + "loss": 0.6906, + "step": 11937 + }, + { + "epoch": 0.41, + "learning_rate": 1.2686569229841284e-05, + "loss": 0.6503, + "step": 11938 + }, + { + "epoch": 0.41, + "learning_rate": 1.2685520380240738e-05, + "loss": 0.6499, + "step": 11939 + }, + { + "epoch": 0.41, + "learning_rate": 1.2684471498799946e-05, + "loss": 0.6173, + "step": 11940 + }, + { + "epoch": 0.41, + "learning_rate": 1.2683422585531348e-05, + "loss": 0.6257, + "step": 11941 + }, + { + "epoch": 0.41, + "learning_rate": 1.2682373640447385e-05, + "loss": 0.6634, + "step": 11942 + }, + { + "epoch": 0.41, + "learning_rate": 1.2681324663560485e-05, + "loss": 0.6615, + "step": 11943 + }, + { + "epoch": 0.41, + "learning_rate": 1.2680275654883092e-05, + "loss": 0.6638, + "step": 11944 + }, + { + "epoch": 0.41, + "learning_rate": 1.2679226614427642e-05, + "loss": 0.6138, + "step": 11945 + }, + { + "epoch": 0.41, + "learning_rate": 1.2678177542206566e-05, + "loss": 0.63, + "step": 11946 + }, + { + "epoch": 0.41, + "learning_rate": 1.2677128438232312e-05, + "loss": 0.6126, + "step": 11947 + }, + { + "epoch": 0.41, + "learning_rate": 1.2676079302517312e-05, + "loss": 0.6154, + "step": 11948 + }, + { + "epoch": 0.41, + "learning_rate": 1.2675030135074006e-05, + "loss": 0.6408, + "step": 11949 + }, + { + "epoch": 0.41, + "learning_rate": 1.2673980935914833e-05, + "loss": 0.662, + "step": 11950 + }, + { + "epoch": 0.41, + "learning_rate": 1.2672931705052238e-05, + "loss": 0.6209, + "step": 11951 + }, + { + "epoch": 0.41, + "learning_rate": 1.2671882442498654e-05, + "loss": 0.6286, + "step": 11952 + }, + { + "epoch": 0.41, + "learning_rate": 1.267083314826652e-05, + "loss": 0.6548, + "step": 11953 + }, + { + "epoch": 0.41, + "learning_rate": 1.2669783822368285e-05, + "loss": 0.6473, + "step": 11954 + }, + { + "epoch": 0.41, + "learning_rate": 1.2668734464816383e-05, + "loss": 0.648, + "step": 11955 + }, + { + "epoch": 0.41, + "learning_rate": 1.2667685075623259e-05, + "loss": 0.6055, + "step": 11956 + }, + { + "epoch": 0.41, + "learning_rate": 1.2666635654801357e-05, + "loss": 0.5884, + "step": 11957 + }, + { + "epoch": 0.41, + "learning_rate": 1.266558620236311e-05, + "loss": 0.6116, + "step": 11958 + }, + { + "epoch": 0.41, + "learning_rate": 1.2664536718320967e-05, + "loss": 0.62, + "step": 11959 + }, + { + "epoch": 0.41, + "learning_rate": 1.2663487202687374e-05, + "loss": 0.6028, + "step": 11960 + }, + { + "epoch": 0.41, + "learning_rate": 1.2662437655474771e-05, + "loss": 0.6314, + "step": 11961 + }, + { + "epoch": 0.41, + "learning_rate": 1.26613880766956e-05, + "loss": 0.6582, + "step": 11962 + }, + { + "epoch": 0.41, + "learning_rate": 1.2660338466362307e-05, + "loss": 0.6002, + "step": 11963 + }, + { + "epoch": 0.41, + "learning_rate": 1.2659288824487334e-05, + "loss": 0.5731, + "step": 11964 + }, + { + "epoch": 0.41, + "learning_rate": 1.265823915108313e-05, + "loss": 0.5678, + "step": 11965 + }, + { + "epoch": 0.41, + "learning_rate": 1.265718944616214e-05, + "loss": 0.5807, + "step": 11966 + }, + { + "epoch": 0.41, + "learning_rate": 1.2656139709736808e-05, + "loss": 0.6444, + "step": 11967 + }, + { + "epoch": 0.41, + "learning_rate": 1.2655089941819575e-05, + "loss": 0.6808, + "step": 11968 + }, + { + "epoch": 0.41, + "learning_rate": 1.2654040142422897e-05, + "loss": 0.6703, + "step": 11969 + }, + { + "epoch": 0.41, + "learning_rate": 1.2652990311559213e-05, + "loss": 0.6675, + "step": 11970 + }, + { + "epoch": 0.41, + "learning_rate": 1.2651940449240972e-05, + "loss": 0.63, + "step": 11971 + }, + { + "epoch": 0.41, + "learning_rate": 1.2650890555480624e-05, + "loss": 0.6159, + "step": 11972 + }, + { + "epoch": 0.41, + "learning_rate": 1.2649840630290616e-05, + "loss": 0.6411, + "step": 11973 + }, + { + "epoch": 0.41, + "learning_rate": 1.2648790673683392e-05, + "loss": 0.643, + "step": 11974 + }, + { + "epoch": 0.41, + "learning_rate": 1.2647740685671406e-05, + "loss": 0.6262, + "step": 11975 + }, + { + "epoch": 0.41, + "learning_rate": 1.2646690666267105e-05, + "loss": 0.5891, + "step": 11976 + }, + { + "epoch": 0.41, + "learning_rate": 1.2645640615482934e-05, + "loss": 0.6016, + "step": 11977 + }, + { + "epoch": 0.42, + "learning_rate": 1.2644590533331353e-05, + "loss": 0.6542, + "step": 11978 + }, + { + "epoch": 0.42, + "learning_rate": 1.2643540419824805e-05, + "loss": 0.5919, + "step": 11979 + }, + { + "epoch": 0.42, + "learning_rate": 1.2642490274975737e-05, + "loss": 0.6353, + "step": 11980 + }, + { + "epoch": 0.42, + "learning_rate": 1.2641440098796607e-05, + "loss": 0.5982, + "step": 11981 + }, + { + "epoch": 0.42, + "learning_rate": 1.2640389891299863e-05, + "loss": 0.6446, + "step": 11982 + }, + { + "epoch": 0.42, + "learning_rate": 1.2639339652497954e-05, + "loss": 0.6476, + "step": 11983 + }, + { + "epoch": 0.42, + "learning_rate": 1.2638289382403336e-05, + "loss": 0.635, + "step": 11984 + }, + { + "epoch": 0.42, + "learning_rate": 1.2637239081028466e-05, + "loss": 0.5707, + "step": 11985 + }, + { + "epoch": 0.42, + "learning_rate": 1.263618874838578e-05, + "loss": 0.6599, + "step": 11986 + }, + { + "epoch": 0.42, + "learning_rate": 1.2635138384487748e-05, + "loss": 0.6502, + "step": 11987 + }, + { + "epoch": 0.42, + "learning_rate": 1.2634087989346818e-05, + "loss": 0.6034, + "step": 11988 + }, + { + "epoch": 0.42, + "learning_rate": 1.263303756297544e-05, + "loss": 0.6271, + "step": 11989 + }, + { + "epoch": 0.42, + "learning_rate": 1.2631987105386072e-05, + "loss": 0.6609, + "step": 11990 + }, + { + "epoch": 0.42, + "learning_rate": 1.2630936616591167e-05, + "loss": 0.5422, + "step": 11991 + }, + { + "epoch": 0.42, + "learning_rate": 1.2629886096603178e-05, + "loss": 0.5951, + "step": 11992 + }, + { + "epoch": 0.42, + "learning_rate": 1.2628835545434565e-05, + "loss": 0.664, + "step": 11993 + }, + { + "epoch": 0.42, + "learning_rate": 1.2627784963097782e-05, + "loss": 0.5848, + "step": 11994 + }, + { + "epoch": 0.42, + "learning_rate": 1.262673434960528e-05, + "loss": 0.6124, + "step": 11995 + }, + { + "epoch": 0.42, + "learning_rate": 1.2625683704969525e-05, + "loss": 0.6053, + "step": 11996 + }, + { + "epoch": 0.42, + "learning_rate": 1.2624633029202967e-05, + "loss": 0.6927, + "step": 11997 + }, + { + "epoch": 0.42, + "learning_rate": 1.2623582322318062e-05, + "loss": 0.6251, + "step": 11998 + }, + { + "epoch": 0.42, + "learning_rate": 1.2622531584327269e-05, + "loss": 0.6119, + "step": 11999 + }, + { + "epoch": 0.42, + "learning_rate": 1.262148081524305e-05, + "loss": 0.6875, + "step": 12000 + }, + { + "epoch": 0.42, + "learning_rate": 1.2620430015077858e-05, + "loss": 0.6582, + "step": 12001 + }, + { + "epoch": 0.42, + "learning_rate": 1.2619379183844152e-05, + "loss": 0.6218, + "step": 12002 + }, + { + "epoch": 0.42, + "learning_rate": 1.2618328321554394e-05, + "loss": 0.6661, + "step": 12003 + }, + { + "epoch": 0.42, + "learning_rate": 1.261727742822104e-05, + "loss": 0.6616, + "step": 12004 + }, + { + "epoch": 0.42, + "learning_rate": 1.2616226503856552e-05, + "loss": 0.6252, + "step": 12005 + }, + { + "epoch": 0.42, + "learning_rate": 1.261517554847339e-05, + "loss": 0.6658, + "step": 12006 + }, + { + "epoch": 0.42, + "learning_rate": 1.2614124562084014e-05, + "loss": 0.6617, + "step": 12007 + }, + { + "epoch": 0.42, + "learning_rate": 1.2613073544700882e-05, + "loss": 0.6358, + "step": 12008 + }, + { + "epoch": 0.42, + "learning_rate": 1.2612022496336461e-05, + "loss": 0.5801, + "step": 12009 + }, + { + "epoch": 0.42, + "learning_rate": 1.2610971417003206e-05, + "loss": 0.6359, + "step": 12010 + }, + { + "epoch": 0.42, + "learning_rate": 1.260992030671358e-05, + "loss": 0.7121, + "step": 12011 + }, + { + "epoch": 0.42, + "learning_rate": 1.2608869165480054e-05, + "loss": 0.6491, + "step": 12012 + }, + { + "epoch": 0.42, + "learning_rate": 1.260781799331508e-05, + "loss": 0.6104, + "step": 12013 + }, + { + "epoch": 0.42, + "learning_rate": 1.2606766790231122e-05, + "loss": 0.6526, + "step": 12014 + }, + { + "epoch": 0.42, + "learning_rate": 1.2605715556240653e-05, + "loss": 0.661, + "step": 12015 + }, + { + "epoch": 0.42, + "learning_rate": 1.2604664291356123e-05, + "loss": 0.6072, + "step": 12016 + }, + { + "epoch": 0.42, + "learning_rate": 1.2603612995590004e-05, + "loss": 0.6028, + "step": 12017 + }, + { + "epoch": 0.42, + "learning_rate": 1.2602561668954762e-05, + "loss": 0.6294, + "step": 12018 + }, + { + "epoch": 0.42, + "learning_rate": 1.260151031146286e-05, + "loss": 0.6005, + "step": 12019 + }, + { + "epoch": 0.42, + "learning_rate": 1.260045892312676e-05, + "loss": 0.6817, + "step": 12020 + }, + { + "epoch": 0.42, + "learning_rate": 1.2599407503958931e-05, + "loss": 0.5866, + "step": 12021 + }, + { + "epoch": 0.42, + "learning_rate": 1.2598356053971836e-05, + "loss": 0.6354, + "step": 12022 + }, + { + "epoch": 0.42, + "learning_rate": 1.2597304573177944e-05, + "loss": 0.5778, + "step": 12023 + }, + { + "epoch": 0.42, + "learning_rate": 1.2596253061589722e-05, + "loss": 0.6374, + "step": 12024 + }, + { + "epoch": 0.42, + "learning_rate": 1.2595201519219633e-05, + "loss": 0.5986, + "step": 12025 + }, + { + "epoch": 0.42, + "learning_rate": 1.2594149946080148e-05, + "loss": 0.6128, + "step": 12026 + }, + { + "epoch": 0.42, + "learning_rate": 1.2593098342183736e-05, + "loss": 0.624, + "step": 12027 + }, + { + "epoch": 0.42, + "learning_rate": 1.259204670754286e-05, + "loss": 0.6458, + "step": 12028 + }, + { + "epoch": 0.42, + "learning_rate": 1.2590995042169996e-05, + "loss": 0.6434, + "step": 12029 + }, + { + "epoch": 0.42, + "learning_rate": 1.2589943346077602e-05, + "loss": 0.678, + "step": 12030 + }, + { + "epoch": 0.42, + "learning_rate": 1.2588891619278156e-05, + "loss": 0.6706, + "step": 12031 + }, + { + "epoch": 0.42, + "learning_rate": 1.2587839861784126e-05, + "loss": 0.637, + "step": 12032 + }, + { + "epoch": 0.42, + "learning_rate": 1.2586788073607981e-05, + "loss": 0.6214, + "step": 12033 + }, + { + "epoch": 0.42, + "learning_rate": 1.2585736254762188e-05, + "loss": 0.667, + "step": 12034 + }, + { + "epoch": 0.42, + "learning_rate": 1.2584684405259223e-05, + "loss": 0.6364, + "step": 12035 + }, + { + "epoch": 0.42, + "learning_rate": 1.2583632525111555e-05, + "loss": 0.6142, + "step": 12036 + }, + { + "epoch": 0.42, + "learning_rate": 1.2582580614331654e-05, + "loss": 0.6136, + "step": 12037 + }, + { + "epoch": 0.42, + "learning_rate": 1.2581528672931996e-05, + "loss": 0.6176, + "step": 12038 + }, + { + "epoch": 0.42, + "learning_rate": 1.2580476700925045e-05, + "loss": 0.6357, + "step": 12039 + }, + { + "epoch": 0.42, + "learning_rate": 1.257942469832328e-05, + "loss": 0.6274, + "step": 12040 + }, + { + "epoch": 0.42, + "learning_rate": 1.2578372665139174e-05, + "loss": 0.6293, + "step": 12041 + }, + { + "epoch": 0.42, + "learning_rate": 1.2577320601385197e-05, + "loss": 0.6523, + "step": 12042 + }, + { + "epoch": 0.42, + "learning_rate": 1.2576268507073822e-05, + "loss": 0.6445, + "step": 12043 + }, + { + "epoch": 0.42, + "learning_rate": 1.257521638221753e-05, + "loss": 0.6114, + "step": 12044 + }, + { + "epoch": 0.42, + "learning_rate": 1.2574164226828785e-05, + "loss": 0.6372, + "step": 12045 + }, + { + "epoch": 0.42, + "learning_rate": 1.2573112040920068e-05, + "loss": 0.6347, + "step": 12046 + }, + { + "epoch": 0.42, + "learning_rate": 1.2572059824503855e-05, + "loss": 0.6091, + "step": 12047 + }, + { + "epoch": 0.42, + "learning_rate": 1.2571007577592618e-05, + "loss": 0.6587, + "step": 12048 + }, + { + "epoch": 0.42, + "learning_rate": 1.2569955300198833e-05, + "loss": 0.609, + "step": 12049 + }, + { + "epoch": 0.42, + "learning_rate": 1.256890299233498e-05, + "loss": 0.6242, + "step": 12050 + }, + { + "epoch": 0.42, + "learning_rate": 1.2567850654013527e-05, + "loss": 0.5633, + "step": 12051 + }, + { + "epoch": 0.42, + "learning_rate": 1.2566798285246957e-05, + "loss": 0.5836, + "step": 12052 + }, + { + "epoch": 0.42, + "learning_rate": 1.2565745886047751e-05, + "loss": 0.6156, + "step": 12053 + }, + { + "epoch": 0.42, + "learning_rate": 1.2564693456428379e-05, + "loss": 0.6241, + "step": 12054 + }, + { + "epoch": 0.42, + "learning_rate": 1.2563640996401321e-05, + "loss": 0.6531, + "step": 12055 + }, + { + "epoch": 0.42, + "learning_rate": 1.2562588505979059e-05, + "loss": 0.674, + "step": 12056 + }, + { + "epoch": 0.42, + "learning_rate": 1.2561535985174066e-05, + "loss": 0.5882, + "step": 12057 + }, + { + "epoch": 0.42, + "learning_rate": 1.2560483433998823e-05, + "loss": 0.671, + "step": 12058 + }, + { + "epoch": 0.42, + "learning_rate": 1.255943085246581e-05, + "loss": 0.6189, + "step": 12059 + }, + { + "epoch": 0.42, + "learning_rate": 1.2558378240587508e-05, + "loss": 0.5531, + "step": 12060 + }, + { + "epoch": 0.42, + "learning_rate": 1.2557325598376393e-05, + "loss": 0.6633, + "step": 12061 + }, + { + "epoch": 0.42, + "learning_rate": 1.2556272925844952e-05, + "loss": 0.6434, + "step": 12062 + }, + { + "epoch": 0.42, + "learning_rate": 1.255522022300566e-05, + "loss": 0.6112, + "step": 12063 + }, + { + "epoch": 0.42, + "learning_rate": 1.2554167489870999e-05, + "loss": 0.5965, + "step": 12064 + }, + { + "epoch": 0.42, + "learning_rate": 1.255311472645345e-05, + "loss": 0.6308, + "step": 12065 + }, + { + "epoch": 0.42, + "learning_rate": 1.2552061932765498e-05, + "loss": 0.6215, + "step": 12066 + }, + { + "epoch": 0.42, + "learning_rate": 1.2551009108819626e-05, + "loss": 0.5968, + "step": 12067 + }, + { + "epoch": 0.42, + "learning_rate": 1.254995625462831e-05, + "loss": 0.5998, + "step": 12068 + }, + { + "epoch": 0.42, + "learning_rate": 1.2548903370204038e-05, + "loss": 0.6188, + "step": 12069 + }, + { + "epoch": 0.42, + "learning_rate": 1.2547850455559292e-05, + "loss": 0.6615, + "step": 12070 + }, + { + "epoch": 0.42, + "learning_rate": 1.2546797510706559e-05, + "loss": 0.6478, + "step": 12071 + }, + { + "epoch": 0.42, + "learning_rate": 1.2545744535658316e-05, + "loss": 0.6617, + "step": 12072 + }, + { + "epoch": 0.42, + "learning_rate": 1.2544691530427052e-05, + "loss": 0.6658, + "step": 12073 + }, + { + "epoch": 0.42, + "learning_rate": 1.2543638495025252e-05, + "loss": 0.6031, + "step": 12074 + }, + { + "epoch": 0.42, + "learning_rate": 1.2542585429465398e-05, + "loss": 0.6657, + "step": 12075 + }, + { + "epoch": 0.42, + "learning_rate": 1.2541532333759978e-05, + "loss": 0.6226, + "step": 12076 + }, + { + "epoch": 0.42, + "learning_rate": 1.2540479207921478e-05, + "loss": 0.6292, + "step": 12077 + }, + { + "epoch": 0.42, + "learning_rate": 1.2539426051962383e-05, + "loss": 0.6425, + "step": 12078 + }, + { + "epoch": 0.42, + "learning_rate": 1.2538372865895179e-05, + "loss": 0.6334, + "step": 12079 + }, + { + "epoch": 0.42, + "learning_rate": 1.2537319649732356e-05, + "loss": 0.6184, + "step": 12080 + }, + { + "epoch": 0.42, + "learning_rate": 1.2536266403486395e-05, + "loss": 0.6615, + "step": 12081 + }, + { + "epoch": 0.42, + "learning_rate": 1.253521312716979e-05, + "loss": 0.6809, + "step": 12082 + }, + { + "epoch": 0.42, + "learning_rate": 1.2534159820795027e-05, + "loss": 0.6615, + "step": 12083 + }, + { + "epoch": 0.42, + "learning_rate": 1.2533106484374592e-05, + "loss": 0.6223, + "step": 12084 + }, + { + "epoch": 0.42, + "learning_rate": 1.2532053117920975e-05, + "loss": 0.6146, + "step": 12085 + }, + { + "epoch": 0.42, + "learning_rate": 1.2530999721446667e-05, + "loss": 0.6612, + "step": 12086 + }, + { + "epoch": 0.42, + "learning_rate": 1.2529946294964153e-05, + "loss": 0.6337, + "step": 12087 + }, + { + "epoch": 0.42, + "learning_rate": 1.2528892838485925e-05, + "loss": 0.6302, + "step": 12088 + }, + { + "epoch": 0.42, + "learning_rate": 1.2527839352024476e-05, + "loss": 0.6754, + "step": 12089 + }, + { + "epoch": 0.42, + "learning_rate": 1.2526785835592292e-05, + "loss": 0.6016, + "step": 12090 + }, + { + "epoch": 0.42, + "learning_rate": 1.2525732289201868e-05, + "loss": 0.6102, + "step": 12091 + }, + { + "epoch": 0.42, + "learning_rate": 1.252467871286569e-05, + "loss": 0.6833, + "step": 12092 + }, + { + "epoch": 0.42, + "learning_rate": 1.2523625106596254e-05, + "loss": 0.6276, + "step": 12093 + }, + { + "epoch": 0.42, + "learning_rate": 1.252257147040605e-05, + "loss": 0.6095, + "step": 12094 + }, + { + "epoch": 0.42, + "learning_rate": 1.2521517804307569e-05, + "loss": 0.6116, + "step": 12095 + }, + { + "epoch": 0.42, + "learning_rate": 1.2520464108313301e-05, + "loss": 0.6423, + "step": 12096 + }, + { + "epoch": 0.42, + "learning_rate": 1.251941038243575e-05, + "loss": 0.6469, + "step": 12097 + }, + { + "epoch": 0.42, + "learning_rate": 1.2518356626687397e-05, + "loss": 0.6447, + "step": 12098 + }, + { + "epoch": 0.42, + "learning_rate": 1.251730284108074e-05, + "loss": 0.6662, + "step": 12099 + }, + { + "epoch": 0.42, + "learning_rate": 1.2516249025628277e-05, + "loss": 0.624, + "step": 12100 + }, + { + "epoch": 0.42, + "learning_rate": 1.2515195180342496e-05, + "loss": 0.6376, + "step": 12101 + }, + { + "epoch": 0.42, + "learning_rate": 1.2514141305235893e-05, + "loss": 0.618, + "step": 12102 + }, + { + "epoch": 0.42, + "learning_rate": 1.251308740032097e-05, + "loss": 0.6191, + "step": 12103 + }, + { + "epoch": 0.42, + "learning_rate": 1.2512033465610211e-05, + "loss": 0.6774, + "step": 12104 + }, + { + "epoch": 0.42, + "learning_rate": 1.251097950111612e-05, + "loss": 0.6078, + "step": 12105 + }, + { + "epoch": 0.42, + "learning_rate": 1.2509925506851192e-05, + "loss": 0.6407, + "step": 12106 + }, + { + "epoch": 0.42, + "learning_rate": 1.250887148282792e-05, + "loss": 0.678, + "step": 12107 + }, + { + "epoch": 0.42, + "learning_rate": 1.2507817429058804e-05, + "loss": 0.6598, + "step": 12108 + }, + { + "epoch": 0.42, + "learning_rate": 1.2506763345556341e-05, + "loss": 0.6309, + "step": 12109 + }, + { + "epoch": 0.42, + "learning_rate": 1.2505709232333025e-05, + "loss": 0.6805, + "step": 12110 + }, + { + "epoch": 0.42, + "learning_rate": 1.2504655089401355e-05, + "loss": 0.6521, + "step": 12111 + }, + { + "epoch": 0.42, + "learning_rate": 1.2503600916773835e-05, + "loss": 0.567, + "step": 12112 + }, + { + "epoch": 0.42, + "learning_rate": 1.2502546714462955e-05, + "loss": 0.6558, + "step": 12113 + }, + { + "epoch": 0.42, + "learning_rate": 1.250149248248122e-05, + "loss": 0.6203, + "step": 12114 + }, + { + "epoch": 0.42, + "learning_rate": 1.2500438220841129e-05, + "loss": 0.6358, + "step": 12115 + }, + { + "epoch": 0.42, + "learning_rate": 1.2499383929555177e-05, + "loss": 0.6728, + "step": 12116 + }, + { + "epoch": 0.42, + "learning_rate": 1.2498329608635866e-05, + "loss": 0.6371, + "step": 12117 + }, + { + "epoch": 0.42, + "learning_rate": 1.24972752580957e-05, + "loss": 0.5915, + "step": 12118 + }, + { + "epoch": 0.42, + "learning_rate": 1.2496220877947174e-05, + "loss": 0.7062, + "step": 12119 + }, + { + "epoch": 0.42, + "learning_rate": 1.2495166468202793e-05, + "loss": 0.6686, + "step": 12120 + }, + { + "epoch": 0.42, + "learning_rate": 1.2494112028875059e-05, + "loss": 0.6482, + "step": 12121 + }, + { + "epoch": 0.42, + "learning_rate": 1.2493057559976471e-05, + "loss": 0.6178, + "step": 12122 + }, + { + "epoch": 0.42, + "learning_rate": 1.249200306151953e-05, + "loss": 0.686, + "step": 12123 + }, + { + "epoch": 0.42, + "learning_rate": 1.2490948533516742e-05, + "loss": 0.6352, + "step": 12124 + }, + { + "epoch": 0.42, + "learning_rate": 1.2489893975980608e-05, + "loss": 0.6035, + "step": 12125 + }, + { + "epoch": 0.42, + "learning_rate": 1.2488839388923631e-05, + "loss": 0.6175, + "step": 12126 + }, + { + "epoch": 0.42, + "learning_rate": 1.2487784772358313e-05, + "loss": 0.644, + "step": 12127 + }, + { + "epoch": 0.42, + "learning_rate": 1.2486730126297162e-05, + "loss": 0.5991, + "step": 12128 + }, + { + "epoch": 0.42, + "learning_rate": 1.2485675450752677e-05, + "loss": 0.598, + "step": 12129 + }, + { + "epoch": 0.42, + "learning_rate": 1.2484620745737365e-05, + "loss": 0.6522, + "step": 12130 + }, + { + "epoch": 0.42, + "learning_rate": 1.2483566011263735e-05, + "loss": 0.6943, + "step": 12131 + }, + { + "epoch": 0.42, + "learning_rate": 1.2482511247344284e-05, + "loss": 0.6212, + "step": 12132 + }, + { + "epoch": 0.42, + "learning_rate": 1.2481456453991523e-05, + "loss": 0.561, + "step": 12133 + }, + { + "epoch": 0.42, + "learning_rate": 1.2480401631217957e-05, + "loss": 0.6157, + "step": 12134 + }, + { + "epoch": 0.42, + "learning_rate": 1.2479346779036092e-05, + "loss": 0.606, + "step": 12135 + }, + { + "epoch": 0.42, + "learning_rate": 1.2478291897458434e-05, + "loss": 0.5476, + "step": 12136 + }, + { + "epoch": 0.42, + "learning_rate": 1.2477236986497494e-05, + "loss": 0.6337, + "step": 12137 + }, + { + "epoch": 0.42, + "learning_rate": 1.2476182046165772e-05, + "loss": 0.5823, + "step": 12138 + }, + { + "epoch": 0.42, + "learning_rate": 1.247512707647578e-05, + "loss": 0.656, + "step": 12139 + }, + { + "epoch": 0.42, + "learning_rate": 1.2474072077440024e-05, + "loss": 0.6325, + "step": 12140 + }, + { + "epoch": 0.42, + "learning_rate": 1.2473017049071016e-05, + "loss": 0.6555, + "step": 12141 + }, + { + "epoch": 0.42, + "learning_rate": 1.2471961991381263e-05, + "loss": 0.649, + "step": 12142 + }, + { + "epoch": 0.42, + "learning_rate": 1.2470906904383274e-05, + "loss": 0.6277, + "step": 12143 + }, + { + "epoch": 0.42, + "learning_rate": 1.2469851788089556e-05, + "loss": 0.591, + "step": 12144 + }, + { + "epoch": 0.42, + "learning_rate": 1.246879664251262e-05, + "loss": 0.6563, + "step": 12145 + }, + { + "epoch": 0.42, + "learning_rate": 1.2467741467664979e-05, + "loss": 0.5781, + "step": 12146 + }, + { + "epoch": 0.42, + "learning_rate": 1.246668626355914e-05, + "loss": 0.611, + "step": 12147 + }, + { + "epoch": 0.42, + "learning_rate": 1.2465631030207615e-05, + "loss": 0.6461, + "step": 12148 + }, + { + "epoch": 0.42, + "learning_rate": 1.2464575767622915e-05, + "loss": 0.612, + "step": 12149 + }, + { + "epoch": 0.42, + "learning_rate": 1.2463520475817553e-05, + "loss": 0.7178, + "step": 12150 + }, + { + "epoch": 0.42, + "learning_rate": 1.2462465154804035e-05, + "loss": 0.6439, + "step": 12151 + }, + { + "epoch": 0.42, + "learning_rate": 1.2461409804594884e-05, + "loss": 0.6987, + "step": 12152 + }, + { + "epoch": 0.42, + "learning_rate": 1.24603544252026e-05, + "loss": 0.5058, + "step": 12153 + }, + { + "epoch": 0.42, + "learning_rate": 1.2459299016639705e-05, + "loss": 0.6741, + "step": 12154 + }, + { + "epoch": 0.42, + "learning_rate": 1.245824357891871e-05, + "loss": 0.6432, + "step": 12155 + }, + { + "epoch": 0.42, + "learning_rate": 1.2457188112052126e-05, + "loss": 0.6283, + "step": 12156 + }, + { + "epoch": 0.42, + "learning_rate": 1.245613261605247e-05, + "loss": 0.5668, + "step": 12157 + }, + { + "epoch": 0.42, + "learning_rate": 1.2455077090932256e-05, + "loss": 0.635, + "step": 12158 + }, + { + "epoch": 0.42, + "learning_rate": 1.2454021536703993e-05, + "loss": 0.6168, + "step": 12159 + }, + { + "epoch": 0.42, + "learning_rate": 1.24529659533802e-05, + "loss": 0.6612, + "step": 12160 + }, + { + "epoch": 0.42, + "learning_rate": 1.2451910340973398e-05, + "loss": 0.6312, + "step": 12161 + }, + { + "epoch": 0.42, + "learning_rate": 1.2450854699496093e-05, + "loss": 0.5652, + "step": 12162 + }, + { + "epoch": 0.42, + "learning_rate": 1.2449799028960806e-05, + "loss": 0.6759, + "step": 12163 + }, + { + "epoch": 0.42, + "learning_rate": 1.2448743329380055e-05, + "loss": 0.6692, + "step": 12164 + }, + { + "epoch": 0.42, + "learning_rate": 1.2447687600766352e-05, + "loss": 0.572, + "step": 12165 + }, + { + "epoch": 0.42, + "learning_rate": 1.2446631843132215e-05, + "loss": 0.6181, + "step": 12166 + }, + { + "epoch": 0.42, + "learning_rate": 1.2445576056490168e-05, + "loss": 0.6539, + "step": 12167 + }, + { + "epoch": 0.42, + "learning_rate": 1.2444520240852716e-05, + "loss": 0.5925, + "step": 12168 + }, + { + "epoch": 0.42, + "learning_rate": 1.2443464396232387e-05, + "loss": 0.5918, + "step": 12169 + }, + { + "epoch": 0.42, + "learning_rate": 1.2442408522641698e-05, + "loss": 0.6459, + "step": 12170 + }, + { + "epoch": 0.42, + "learning_rate": 1.2441352620093166e-05, + "loss": 0.6119, + "step": 12171 + }, + { + "epoch": 0.42, + "learning_rate": 1.244029668859931e-05, + "loss": 0.6828, + "step": 12172 + }, + { + "epoch": 0.42, + "learning_rate": 1.243924072817265e-05, + "loss": 0.6543, + "step": 12173 + }, + { + "epoch": 0.42, + "learning_rate": 1.2438184738825703e-05, + "loss": 0.6157, + "step": 12174 + }, + { + "epoch": 0.42, + "learning_rate": 1.2437128720570992e-05, + "loss": 0.6783, + "step": 12175 + }, + { + "epoch": 0.42, + "learning_rate": 1.243607267342104e-05, + "loss": 0.6331, + "step": 12176 + }, + { + "epoch": 0.42, + "learning_rate": 1.2435016597388362e-05, + "loss": 0.634, + "step": 12177 + }, + { + "epoch": 0.42, + "learning_rate": 1.2433960492485485e-05, + "loss": 0.6329, + "step": 12178 + }, + { + "epoch": 0.42, + "learning_rate": 1.2432904358724926e-05, + "loss": 0.545, + "step": 12179 + }, + { + "epoch": 0.42, + "learning_rate": 1.2431848196119208e-05, + "loss": 0.6074, + "step": 12180 + }, + { + "epoch": 0.42, + "learning_rate": 1.2430792004680851e-05, + "loss": 0.6627, + "step": 12181 + }, + { + "epoch": 0.42, + "learning_rate": 1.2429735784422384e-05, + "loss": 0.6496, + "step": 12182 + }, + { + "epoch": 0.42, + "learning_rate": 1.2428679535356323e-05, + "loss": 0.6198, + "step": 12183 + }, + { + "epoch": 0.42, + "learning_rate": 1.2427623257495196e-05, + "loss": 0.5881, + "step": 12184 + }, + { + "epoch": 0.42, + "learning_rate": 1.2426566950851522e-05, + "loss": 0.6862, + "step": 12185 + }, + { + "epoch": 0.42, + "learning_rate": 1.2425510615437828e-05, + "loss": 0.6652, + "step": 12186 + }, + { + "epoch": 0.42, + "learning_rate": 1.2424454251266637e-05, + "loss": 0.6216, + "step": 12187 + }, + { + "epoch": 0.42, + "learning_rate": 1.2423397858350475e-05, + "loss": 0.6247, + "step": 12188 + }, + { + "epoch": 0.42, + "learning_rate": 1.2422341436701863e-05, + "loss": 0.6774, + "step": 12189 + }, + { + "epoch": 0.42, + "learning_rate": 1.2421284986333333e-05, + "loss": 0.6166, + "step": 12190 + }, + { + "epoch": 0.42, + "learning_rate": 1.2420228507257403e-05, + "loss": 0.6231, + "step": 12191 + }, + { + "epoch": 0.42, + "learning_rate": 1.2419171999486603e-05, + "loss": 0.6409, + "step": 12192 + }, + { + "epoch": 0.42, + "learning_rate": 1.2418115463033462e-05, + "loss": 0.5985, + "step": 12193 + }, + { + "epoch": 0.42, + "learning_rate": 1.2417058897910498e-05, + "loss": 0.6276, + "step": 12194 + }, + { + "epoch": 0.42, + "learning_rate": 1.2416002304130248e-05, + "loss": 0.6413, + "step": 12195 + }, + { + "epoch": 0.42, + "learning_rate": 1.2414945681705233e-05, + "loss": 0.5814, + "step": 12196 + }, + { + "epoch": 0.42, + "learning_rate": 1.2413889030647981e-05, + "loss": 0.6048, + "step": 12197 + }, + { + "epoch": 0.42, + "learning_rate": 1.241283235097102e-05, + "loss": 0.6404, + "step": 12198 + }, + { + "epoch": 0.42, + "learning_rate": 1.2411775642686883e-05, + "loss": 0.6282, + "step": 12199 + }, + { + "epoch": 0.42, + "learning_rate": 1.2410718905808093e-05, + "loss": 0.6084, + "step": 12200 + }, + { + "epoch": 0.42, + "learning_rate": 1.2409662140347178e-05, + "loss": 0.6341, + "step": 12201 + }, + { + "epoch": 0.42, + "learning_rate": 1.2408605346316673e-05, + "loss": 0.6786, + "step": 12202 + }, + { + "epoch": 0.42, + "learning_rate": 1.2407548523729105e-05, + "loss": 0.6336, + "step": 12203 + }, + { + "epoch": 0.42, + "learning_rate": 1.2406491672597e-05, + "loss": 0.6341, + "step": 12204 + }, + { + "epoch": 0.42, + "learning_rate": 1.2405434792932898e-05, + "loss": 0.617, + "step": 12205 + }, + { + "epoch": 0.42, + "learning_rate": 1.2404377884749318e-05, + "loss": 0.6502, + "step": 12206 + }, + { + "epoch": 0.42, + "learning_rate": 1.2403320948058799e-05, + "loss": 0.6488, + "step": 12207 + }, + { + "epoch": 0.42, + "learning_rate": 1.2402263982873873e-05, + "loss": 0.6438, + "step": 12208 + }, + { + "epoch": 0.42, + "learning_rate": 1.2401206989207064e-05, + "loss": 0.6379, + "step": 12209 + }, + { + "epoch": 0.42, + "learning_rate": 1.240014996707091e-05, + "loss": 0.6239, + "step": 12210 + }, + { + "epoch": 0.42, + "learning_rate": 1.2399092916477944e-05, + "loss": 0.6578, + "step": 12211 + }, + { + "epoch": 0.42, + "learning_rate": 1.2398035837440693e-05, + "loss": 0.6387, + "step": 12212 + }, + { + "epoch": 0.42, + "learning_rate": 1.2396978729971696e-05, + "loss": 0.6515, + "step": 12213 + }, + { + "epoch": 0.42, + "learning_rate": 1.2395921594083485e-05, + "loss": 0.6241, + "step": 12214 + }, + { + "epoch": 0.42, + "learning_rate": 1.239486442978859e-05, + "loss": 0.6594, + "step": 12215 + }, + { + "epoch": 0.42, + "learning_rate": 1.2393807237099547e-05, + "loss": 0.5963, + "step": 12216 + }, + { + "epoch": 0.42, + "learning_rate": 1.2392750016028893e-05, + "loss": 0.6324, + "step": 12217 + }, + { + "epoch": 0.42, + "learning_rate": 1.2391692766589163e-05, + "loss": 0.6508, + "step": 12218 + }, + { + "epoch": 0.42, + "learning_rate": 1.2390635488792883e-05, + "loss": 0.6476, + "step": 12219 + }, + { + "epoch": 0.42, + "learning_rate": 1.2389578182652601e-05, + "loss": 0.6893, + "step": 12220 + }, + { + "epoch": 0.42, + "learning_rate": 1.2388520848180848e-05, + "loss": 0.5969, + "step": 12221 + }, + { + "epoch": 0.42, + "learning_rate": 1.2387463485390152e-05, + "loss": 0.6893, + "step": 12222 + }, + { + "epoch": 0.42, + "learning_rate": 1.2386406094293062e-05, + "loss": 0.6315, + "step": 12223 + }, + { + "epoch": 0.42, + "learning_rate": 1.238534867490211e-05, + "loss": 0.6589, + "step": 12224 + }, + { + "epoch": 0.42, + "learning_rate": 1.2384291227229825e-05, + "loss": 0.6472, + "step": 12225 + }, + { + "epoch": 0.42, + "learning_rate": 1.2383233751288757e-05, + "loss": 0.5981, + "step": 12226 + }, + { + "epoch": 0.42, + "learning_rate": 1.2382176247091438e-05, + "loss": 0.5929, + "step": 12227 + }, + { + "epoch": 0.42, + "learning_rate": 1.2381118714650402e-05, + "loss": 0.5563, + "step": 12228 + }, + { + "epoch": 0.42, + "learning_rate": 1.2380061153978193e-05, + "loss": 0.598, + "step": 12229 + }, + { + "epoch": 0.42, + "learning_rate": 1.2379003565087352e-05, + "loss": 0.5917, + "step": 12230 + }, + { + "epoch": 0.42, + "learning_rate": 1.2377945947990408e-05, + "loss": 0.6445, + "step": 12231 + }, + { + "epoch": 0.42, + "learning_rate": 1.2376888302699913e-05, + "loss": 0.6779, + "step": 12232 + }, + { + "epoch": 0.42, + "learning_rate": 1.2375830629228398e-05, + "loss": 0.624, + "step": 12233 + }, + { + "epoch": 0.42, + "learning_rate": 1.2374772927588404e-05, + "loss": 0.6621, + "step": 12234 + }, + { + "epoch": 0.42, + "learning_rate": 1.2373715197792475e-05, + "loss": 0.6125, + "step": 12235 + }, + { + "epoch": 0.42, + "learning_rate": 1.237265743985315e-05, + "loss": 0.6283, + "step": 12236 + }, + { + "epoch": 0.42, + "learning_rate": 1.2371599653782964e-05, + "loss": 0.6729, + "step": 12237 + }, + { + "epoch": 0.42, + "learning_rate": 1.237054183959447e-05, + "loss": 0.6291, + "step": 12238 + }, + { + "epoch": 0.42, + "learning_rate": 1.2369483997300205e-05, + "loss": 0.6862, + "step": 12239 + }, + { + "epoch": 0.42, + "learning_rate": 1.2368426126912703e-05, + "loss": 0.6315, + "step": 12240 + }, + { + "epoch": 0.42, + "learning_rate": 1.2367368228444519e-05, + "loss": 0.647, + "step": 12241 + }, + { + "epoch": 0.42, + "learning_rate": 1.2366310301908188e-05, + "loss": 0.6044, + "step": 12242 + }, + { + "epoch": 0.42, + "learning_rate": 1.2365252347316252e-05, + "loss": 0.6245, + "step": 12243 + }, + { + "epoch": 0.42, + "learning_rate": 1.2364194364681261e-05, + "loss": 0.66, + "step": 12244 + }, + { + "epoch": 0.42, + "learning_rate": 1.2363136354015757e-05, + "loss": 0.6179, + "step": 12245 + }, + { + "epoch": 0.42, + "learning_rate": 1.2362078315332278e-05, + "loss": 0.6039, + "step": 12246 + }, + { + "epoch": 0.42, + "learning_rate": 1.2361020248643375e-05, + "loss": 0.6148, + "step": 12247 + }, + { + "epoch": 0.42, + "learning_rate": 1.2359962153961589e-05, + "loss": 0.6658, + "step": 12248 + }, + { + "epoch": 0.42, + "learning_rate": 1.2358904031299465e-05, + "loss": 0.6039, + "step": 12249 + }, + { + "epoch": 0.42, + "learning_rate": 1.235784588066955e-05, + "loss": 0.6582, + "step": 12250 + }, + { + "epoch": 0.42, + "learning_rate": 1.2356787702084391e-05, + "loss": 0.6251, + "step": 12251 + }, + { + "epoch": 0.42, + "learning_rate": 1.2355729495556533e-05, + "loss": 0.6502, + "step": 12252 + }, + { + "epoch": 0.42, + "learning_rate": 1.235467126109852e-05, + "loss": 0.6279, + "step": 12253 + }, + { + "epoch": 0.42, + "learning_rate": 1.2353612998722903e-05, + "loss": 0.6411, + "step": 12254 + }, + { + "epoch": 0.42, + "learning_rate": 1.2352554708442223e-05, + "loss": 0.6332, + "step": 12255 + }, + { + "epoch": 0.42, + "learning_rate": 1.2351496390269034e-05, + "loss": 0.6682, + "step": 12256 + }, + { + "epoch": 0.42, + "learning_rate": 1.235043804421588e-05, + "loss": 0.6139, + "step": 12257 + }, + { + "epoch": 0.42, + "learning_rate": 1.2349379670295308e-05, + "loss": 0.6324, + "step": 12258 + }, + { + "epoch": 0.42, + "learning_rate": 1.2348321268519869e-05, + "loss": 0.5844, + "step": 12259 + }, + { + "epoch": 0.42, + "learning_rate": 1.2347262838902113e-05, + "loss": 0.6301, + "step": 12260 + }, + { + "epoch": 0.42, + "learning_rate": 1.2346204381454582e-05, + "loss": 0.6645, + "step": 12261 + }, + { + "epoch": 0.42, + "learning_rate": 1.2345145896189831e-05, + "loss": 0.5927, + "step": 12262 + }, + { + "epoch": 0.42, + "learning_rate": 1.2344087383120414e-05, + "loss": 0.6365, + "step": 12263 + }, + { + "epoch": 0.42, + "learning_rate": 1.234302884225887e-05, + "loss": 0.6792, + "step": 12264 + }, + { + "epoch": 0.42, + "learning_rate": 1.2341970273617759e-05, + "loss": 0.6505, + "step": 12265 + }, + { + "epoch": 0.42, + "learning_rate": 1.2340911677209625e-05, + "loss": 0.6822, + "step": 12266 + }, + { + "epoch": 0.43, + "learning_rate": 1.2339853053047024e-05, + "loss": 0.6174, + "step": 12267 + }, + { + "epoch": 0.43, + "learning_rate": 1.2338794401142501e-05, + "loss": 0.6704, + "step": 12268 + }, + { + "epoch": 0.43, + "learning_rate": 1.2337735721508619e-05, + "loss": 0.6253, + "step": 12269 + }, + { + "epoch": 0.43, + "learning_rate": 1.2336677014157916e-05, + "loss": 0.6455, + "step": 12270 + }, + { + "epoch": 0.43, + "learning_rate": 1.2335618279102955e-05, + "loss": 0.644, + "step": 12271 + }, + { + "epoch": 0.43, + "learning_rate": 1.2334559516356284e-05, + "loss": 0.6063, + "step": 12272 + }, + { + "epoch": 0.43, + "learning_rate": 1.2333500725930456e-05, + "loss": 0.6483, + "step": 12273 + }, + { + "epoch": 0.43, + "learning_rate": 1.2332441907838023e-05, + "loss": 0.6238, + "step": 12274 + }, + { + "epoch": 0.43, + "learning_rate": 1.2331383062091544e-05, + "loss": 0.625, + "step": 12275 + }, + { + "epoch": 0.43, + "learning_rate": 1.2330324188703569e-05, + "loss": 0.5965, + "step": 12276 + }, + { + "epoch": 0.43, + "learning_rate": 1.2329265287686653e-05, + "loss": 0.634, + "step": 12277 + }, + { + "epoch": 0.43, + "learning_rate": 1.232820635905335e-05, + "loss": 0.6173, + "step": 12278 + }, + { + "epoch": 0.43, + "learning_rate": 1.2327147402816213e-05, + "loss": 0.6554, + "step": 12279 + }, + { + "epoch": 0.43, + "learning_rate": 1.2326088418987804e-05, + "loss": 0.6247, + "step": 12280 + }, + { + "epoch": 0.43, + "learning_rate": 1.2325029407580671e-05, + "loss": 0.6381, + "step": 12281 + }, + { + "epoch": 0.43, + "learning_rate": 1.2323970368607374e-05, + "loss": 0.6408, + "step": 12282 + }, + { + "epoch": 0.43, + "learning_rate": 1.232291130208047e-05, + "loss": 0.6209, + "step": 12283 + }, + { + "epoch": 0.43, + "learning_rate": 1.2321852208012513e-05, + "loss": 0.5895, + "step": 12284 + }, + { + "epoch": 0.43, + "learning_rate": 1.2320793086416058e-05, + "loss": 0.6582, + "step": 12285 + }, + { + "epoch": 0.43, + "learning_rate": 1.2319733937303671e-05, + "loss": 0.5961, + "step": 12286 + }, + { + "epoch": 0.43, + "learning_rate": 1.23186747606879e-05, + "loss": 0.6508, + "step": 12287 + }, + { + "epoch": 0.43, + "learning_rate": 1.2317615556581306e-05, + "loss": 0.6607, + "step": 12288 + }, + { + "epoch": 0.43, + "learning_rate": 1.231655632499645e-05, + "loss": 0.6647, + "step": 12289 + }, + { + "epoch": 0.43, + "learning_rate": 1.2315497065945887e-05, + "loss": 0.6718, + "step": 12290 + }, + { + "epoch": 0.43, + "learning_rate": 1.2314437779442176e-05, + "loss": 0.5943, + "step": 12291 + }, + { + "epoch": 0.43, + "learning_rate": 1.231337846549788e-05, + "loss": 0.6463, + "step": 12292 + }, + { + "epoch": 0.43, + "learning_rate": 1.2312319124125554e-05, + "loss": 0.5895, + "step": 12293 + }, + { + "epoch": 0.43, + "learning_rate": 1.231125975533776e-05, + "loss": 0.6473, + "step": 12294 + }, + { + "epoch": 0.43, + "learning_rate": 1.231020035914706e-05, + "loss": 0.6423, + "step": 12295 + }, + { + "epoch": 0.43, + "learning_rate": 1.2309140935566008e-05, + "loss": 0.6768, + "step": 12296 + }, + { + "epoch": 0.43, + "learning_rate": 1.2308081484607171e-05, + "loss": 0.6304, + "step": 12297 + }, + { + "epoch": 0.43, + "learning_rate": 1.2307022006283109e-05, + "loss": 0.6424, + "step": 12298 + }, + { + "epoch": 0.43, + "learning_rate": 1.2305962500606384e-05, + "loss": 0.6223, + "step": 12299 + }, + { + "epoch": 0.43, + "learning_rate": 1.2304902967589554e-05, + "loss": 0.6195, + "step": 12300 + }, + { + "epoch": 0.43, + "learning_rate": 1.2303843407245186e-05, + "loss": 0.6531, + "step": 12301 + }, + { + "epoch": 0.43, + "learning_rate": 1.2302783819585838e-05, + "loss": 0.5924, + "step": 12302 + }, + { + "epoch": 0.43, + "learning_rate": 1.2301724204624075e-05, + "loss": 0.6594, + "step": 12303 + }, + { + "epoch": 0.43, + "learning_rate": 1.2300664562372462e-05, + "loss": 0.6832, + "step": 12304 + }, + { + "epoch": 0.43, + "learning_rate": 1.2299604892843555e-05, + "loss": 0.6227, + "step": 12305 + }, + { + "epoch": 0.43, + "learning_rate": 1.2298545196049927e-05, + "loss": 0.6847, + "step": 12306 + }, + { + "epoch": 0.43, + "learning_rate": 1.2297485472004139e-05, + "loss": 0.6335, + "step": 12307 + }, + { + "epoch": 0.43, + "learning_rate": 1.2296425720718752e-05, + "loss": 0.6472, + "step": 12308 + }, + { + "epoch": 0.43, + "learning_rate": 1.2295365942206335e-05, + "loss": 0.6287, + "step": 12309 + }, + { + "epoch": 0.43, + "learning_rate": 1.229430613647945e-05, + "loss": 0.61, + "step": 12310 + }, + { + "epoch": 0.43, + "learning_rate": 1.2293246303550664e-05, + "loss": 0.6117, + "step": 12311 + }, + { + "epoch": 0.43, + "learning_rate": 1.2292186443432538e-05, + "loss": 0.6681, + "step": 12312 + }, + { + "epoch": 0.43, + "learning_rate": 1.229112655613765e-05, + "loss": 0.6618, + "step": 12313 + }, + { + "epoch": 0.43, + "learning_rate": 1.2290066641678554e-05, + "loss": 0.6469, + "step": 12314 + }, + { + "epoch": 0.43, + "learning_rate": 1.2289006700067818e-05, + "loss": 0.635, + "step": 12315 + }, + { + "epoch": 0.43, + "learning_rate": 1.2287946731318017e-05, + "loss": 0.6534, + "step": 12316 + }, + { + "epoch": 0.43, + "learning_rate": 1.2286886735441712e-05, + "loss": 0.5996, + "step": 12317 + }, + { + "epoch": 0.43, + "learning_rate": 1.228582671245147e-05, + "loss": 0.5855, + "step": 12318 + }, + { + "epoch": 0.43, + "learning_rate": 1.2284766662359861e-05, + "loss": 0.652, + "step": 12319 + }, + { + "epoch": 0.43, + "learning_rate": 1.2283706585179458e-05, + "loss": 0.6206, + "step": 12320 + }, + { + "epoch": 0.43, + "learning_rate": 1.2282646480922814e-05, + "loss": 0.7107, + "step": 12321 + }, + { + "epoch": 0.43, + "learning_rate": 1.228158634960252e-05, + "loss": 0.5949, + "step": 12322 + }, + { + "epoch": 0.43, + "learning_rate": 1.2280526191231128e-05, + "loss": 0.6002, + "step": 12323 + }, + { + "epoch": 0.43, + "learning_rate": 1.2279466005821212e-05, + "loss": 0.6046, + "step": 12324 + }, + { + "epoch": 0.43, + "learning_rate": 1.2278405793385346e-05, + "loss": 0.6437, + "step": 12325 + }, + { + "epoch": 0.43, + "learning_rate": 1.2277345553936095e-05, + "loss": 0.6517, + "step": 12326 + }, + { + "epoch": 0.43, + "learning_rate": 1.227628528748603e-05, + "loss": 0.6402, + "step": 12327 + }, + { + "epoch": 0.43, + "learning_rate": 1.2275224994047727e-05, + "loss": 0.6364, + "step": 12328 + }, + { + "epoch": 0.43, + "learning_rate": 1.2274164673633755e-05, + "loss": 0.5786, + "step": 12329 + }, + { + "epoch": 0.43, + "learning_rate": 1.2273104326256678e-05, + "loss": 0.6569, + "step": 12330 + }, + { + "epoch": 0.43, + "learning_rate": 1.2272043951929079e-05, + "loss": 0.7115, + "step": 12331 + }, + { + "epoch": 0.43, + "learning_rate": 1.2270983550663522e-05, + "loss": 0.6018, + "step": 12332 + }, + { + "epoch": 0.43, + "learning_rate": 1.226992312247258e-05, + "loss": 0.5841, + "step": 12333 + }, + { + "epoch": 0.43, + "learning_rate": 1.2268862667368833e-05, + "loss": 0.7047, + "step": 12334 + }, + { + "epoch": 0.43, + "learning_rate": 1.2267802185364848e-05, + "loss": 0.6713, + "step": 12335 + }, + { + "epoch": 0.43, + "learning_rate": 1.2266741676473195e-05, + "loss": 0.6621, + "step": 12336 + }, + { + "epoch": 0.43, + "learning_rate": 1.2265681140706455e-05, + "loss": 0.6275, + "step": 12337 + }, + { + "epoch": 0.43, + "learning_rate": 1.2264620578077202e-05, + "loss": 0.6528, + "step": 12338 + }, + { + "epoch": 0.43, + "learning_rate": 1.2263559988598004e-05, + "loss": 0.6086, + "step": 12339 + }, + { + "epoch": 0.43, + "learning_rate": 1.2262499372281438e-05, + "loss": 0.6547, + "step": 12340 + }, + { + "epoch": 0.43, + "learning_rate": 1.2261438729140083e-05, + "loss": 0.642, + "step": 12341 + }, + { + "epoch": 0.43, + "learning_rate": 1.2260378059186507e-05, + "loss": 0.6277, + "step": 12342 + }, + { + "epoch": 0.43, + "learning_rate": 1.2259317362433292e-05, + "loss": 0.6898, + "step": 12343 + }, + { + "epoch": 0.43, + "learning_rate": 1.2258256638893012e-05, + "loss": 0.6253, + "step": 12344 + }, + { + "epoch": 0.43, + "learning_rate": 1.2257195888578241e-05, + "loss": 0.6226, + "step": 12345 + }, + { + "epoch": 0.43, + "learning_rate": 1.2256135111501559e-05, + "loss": 0.6332, + "step": 12346 + }, + { + "epoch": 0.43, + "learning_rate": 1.2255074307675543e-05, + "loss": 0.6378, + "step": 12347 + }, + { + "epoch": 0.43, + "learning_rate": 1.2254013477112765e-05, + "loss": 0.6684, + "step": 12348 + }, + { + "epoch": 0.43, + "learning_rate": 1.2252952619825807e-05, + "loss": 0.6281, + "step": 12349 + }, + { + "epoch": 0.43, + "learning_rate": 1.2251891735827246e-05, + "loss": 0.6346, + "step": 12350 + }, + { + "epoch": 0.43, + "learning_rate": 1.225083082512966e-05, + "loss": 0.6409, + "step": 12351 + }, + { + "epoch": 0.43, + "learning_rate": 1.2249769887745626e-05, + "loss": 0.6108, + "step": 12352 + }, + { + "epoch": 0.43, + "learning_rate": 1.2248708923687727e-05, + "loss": 0.6384, + "step": 12353 + }, + { + "epoch": 0.43, + "learning_rate": 1.2247647932968536e-05, + "loss": 0.6524, + "step": 12354 + }, + { + "epoch": 0.43, + "learning_rate": 1.2246586915600636e-05, + "loss": 0.5898, + "step": 12355 + }, + { + "epoch": 0.43, + "learning_rate": 1.2245525871596606e-05, + "loss": 0.6734, + "step": 12356 + }, + { + "epoch": 0.43, + "learning_rate": 1.2244464800969026e-05, + "loss": 0.6042, + "step": 12357 + }, + { + "epoch": 0.43, + "learning_rate": 1.2243403703730479e-05, + "loss": 0.5873, + "step": 12358 + }, + { + "epoch": 0.43, + "learning_rate": 1.2242342579893543e-05, + "loss": 0.6386, + "step": 12359 + }, + { + "epoch": 0.43, + "learning_rate": 1.2241281429470796e-05, + "loss": 0.6482, + "step": 12360 + }, + { + "epoch": 0.43, + "learning_rate": 1.2240220252474824e-05, + "loss": 0.6335, + "step": 12361 + }, + { + "epoch": 0.43, + "learning_rate": 1.2239159048918208e-05, + "loss": 0.6069, + "step": 12362 + }, + { + "epoch": 0.43, + "learning_rate": 1.2238097818813529e-05, + "loss": 0.633, + "step": 12363 + }, + { + "epoch": 0.43, + "learning_rate": 1.2237036562173365e-05, + "loss": 0.6432, + "step": 12364 + }, + { + "epoch": 0.43, + "learning_rate": 1.2235975279010308e-05, + "loss": 0.5738, + "step": 12365 + }, + { + "epoch": 0.43, + "learning_rate": 1.2234913969336932e-05, + "loss": 0.681, + "step": 12366 + }, + { + "epoch": 0.43, + "learning_rate": 1.2233852633165826e-05, + "loss": 0.6669, + "step": 12367 + }, + { + "epoch": 0.43, + "learning_rate": 1.2232791270509572e-05, + "loss": 0.6509, + "step": 12368 + }, + { + "epoch": 0.43, + "learning_rate": 1.223172988138075e-05, + "loss": 0.6331, + "step": 12369 + }, + { + "epoch": 0.43, + "learning_rate": 1.2230668465791948e-05, + "loss": 0.7068, + "step": 12370 + }, + { + "epoch": 0.43, + "learning_rate": 1.222960702375575e-05, + "loss": 0.6557, + "step": 12371 + }, + { + "epoch": 0.43, + "learning_rate": 1.2228545555284739e-05, + "loss": 0.644, + "step": 12372 + }, + { + "epoch": 0.43, + "learning_rate": 1.2227484060391505e-05, + "loss": 0.5907, + "step": 12373 + }, + { + "epoch": 0.43, + "learning_rate": 1.2226422539088628e-05, + "loss": 0.5993, + "step": 12374 + }, + { + "epoch": 0.43, + "learning_rate": 1.2225360991388694e-05, + "loss": 0.616, + "step": 12375 + }, + { + "epoch": 0.43, + "learning_rate": 1.2224299417304291e-05, + "loss": 0.5881, + "step": 12376 + }, + { + "epoch": 0.43, + "learning_rate": 1.2223237816848003e-05, + "loss": 0.6058, + "step": 12377 + }, + { + "epoch": 0.43, + "learning_rate": 1.222217619003242e-05, + "loss": 0.583, + "step": 12378 + }, + { + "epoch": 0.43, + "learning_rate": 1.2221114536870128e-05, + "loss": 0.6362, + "step": 12379 + }, + { + "epoch": 0.43, + "learning_rate": 1.2220052857373712e-05, + "loss": 0.599, + "step": 12380 + }, + { + "epoch": 0.43, + "learning_rate": 1.2218991151555761e-05, + "loss": 0.6883, + "step": 12381 + }, + { + "epoch": 0.43, + "learning_rate": 1.2217929419428865e-05, + "loss": 0.6221, + "step": 12382 + }, + { + "epoch": 0.43, + "learning_rate": 1.2216867661005608e-05, + "loss": 0.6056, + "step": 12383 + }, + { + "epoch": 0.43, + "learning_rate": 1.2215805876298579e-05, + "loss": 0.5876, + "step": 12384 + }, + { + "epoch": 0.43, + "learning_rate": 1.2214744065320373e-05, + "loss": 0.6774, + "step": 12385 + }, + { + "epoch": 0.43, + "learning_rate": 1.2213682228083569e-05, + "loss": 0.5628, + "step": 12386 + }, + { + "epoch": 0.43, + "learning_rate": 1.2212620364600765e-05, + "loss": 0.6386, + "step": 12387 + }, + { + "epoch": 0.43, + "learning_rate": 1.2211558474884548e-05, + "loss": 0.6475, + "step": 12388 + }, + { + "epoch": 0.43, + "learning_rate": 1.2210496558947506e-05, + "loss": 0.5916, + "step": 12389 + }, + { + "epoch": 0.43, + "learning_rate": 1.2209434616802231e-05, + "loss": 0.5946, + "step": 12390 + }, + { + "epoch": 0.43, + "learning_rate": 1.2208372648461318e-05, + "loss": 0.6063, + "step": 12391 + }, + { + "epoch": 0.43, + "learning_rate": 1.2207310653937348e-05, + "loss": 0.6688, + "step": 12392 + }, + { + "epoch": 0.43, + "learning_rate": 1.2206248633242919e-05, + "loss": 0.6337, + "step": 12393 + }, + { + "epoch": 0.43, + "learning_rate": 1.2205186586390623e-05, + "loss": 0.6551, + "step": 12394 + }, + { + "epoch": 0.43, + "learning_rate": 1.220412451339305e-05, + "loss": 0.6222, + "step": 12395 + }, + { + "epoch": 0.43, + "learning_rate": 1.2203062414262792e-05, + "loss": 0.6431, + "step": 12396 + }, + { + "epoch": 0.43, + "learning_rate": 1.2202000289012444e-05, + "loss": 0.6325, + "step": 12397 + }, + { + "epoch": 0.43, + "learning_rate": 1.2200938137654596e-05, + "loss": 0.6826, + "step": 12398 + }, + { + "epoch": 0.43, + "learning_rate": 1.2199875960201841e-05, + "loss": 0.6641, + "step": 12399 + }, + { + "epoch": 0.43, + "learning_rate": 1.2198813756666776e-05, + "loss": 0.5924, + "step": 12400 + }, + { + "epoch": 0.43, + "learning_rate": 1.2197751527061992e-05, + "loss": 0.5875, + "step": 12401 + }, + { + "epoch": 0.43, + "learning_rate": 1.219668927140008e-05, + "loss": 0.627, + "step": 12402 + }, + { + "epoch": 0.43, + "learning_rate": 1.2195626989693643e-05, + "loss": 0.6674, + "step": 12403 + }, + { + "epoch": 0.43, + "learning_rate": 1.2194564681955265e-05, + "loss": 0.5876, + "step": 12404 + }, + { + "epoch": 0.43, + "learning_rate": 1.219350234819755e-05, + "loss": 0.6092, + "step": 12405 + }, + { + "epoch": 0.43, + "learning_rate": 1.219243998843309e-05, + "loss": 0.663, + "step": 12406 + }, + { + "epoch": 0.43, + "learning_rate": 1.2191377602674481e-05, + "loss": 0.6325, + "step": 12407 + }, + { + "epoch": 0.43, + "learning_rate": 1.2190315190934317e-05, + "loss": 0.616, + "step": 12408 + }, + { + "epoch": 0.43, + "learning_rate": 1.2189252753225196e-05, + "loss": 0.6257, + "step": 12409 + }, + { + "epoch": 0.43, + "learning_rate": 1.2188190289559713e-05, + "loss": 0.5655, + "step": 12410 + }, + { + "epoch": 0.43, + "learning_rate": 1.2187127799950466e-05, + "loss": 0.6458, + "step": 12411 + }, + { + "epoch": 0.43, + "learning_rate": 1.2186065284410056e-05, + "loss": 0.616, + "step": 12412 + }, + { + "epoch": 0.43, + "learning_rate": 1.2185002742951073e-05, + "loss": 0.6164, + "step": 12413 + }, + { + "epoch": 0.43, + "learning_rate": 1.218394017558612e-05, + "loss": 0.6779, + "step": 12414 + }, + { + "epoch": 0.43, + "learning_rate": 1.2182877582327794e-05, + "loss": 0.6123, + "step": 12415 + }, + { + "epoch": 0.43, + "learning_rate": 1.2181814963188692e-05, + "loss": 0.6524, + "step": 12416 + }, + { + "epoch": 0.43, + "learning_rate": 1.2180752318181412e-05, + "loss": 0.657, + "step": 12417 + }, + { + "epoch": 0.43, + "learning_rate": 1.2179689647318558e-05, + "loss": 0.6229, + "step": 12418 + }, + { + "epoch": 0.43, + "learning_rate": 1.2178626950612722e-05, + "loss": 0.6851, + "step": 12419 + }, + { + "epoch": 0.43, + "learning_rate": 1.2177564228076508e-05, + "loss": 0.6361, + "step": 12420 + }, + { + "epoch": 0.43, + "learning_rate": 1.217650147972252e-05, + "loss": 0.6537, + "step": 12421 + }, + { + "epoch": 0.43, + "learning_rate": 1.217543870556335e-05, + "loss": 0.6626, + "step": 12422 + }, + { + "epoch": 0.43, + "learning_rate": 1.2174375905611601e-05, + "loss": 0.6793, + "step": 12423 + }, + { + "epoch": 0.43, + "learning_rate": 1.217331307987988e-05, + "loss": 0.6006, + "step": 12424 + }, + { + "epoch": 0.43, + "learning_rate": 1.217225022838078e-05, + "loss": 0.6369, + "step": 12425 + }, + { + "epoch": 0.43, + "learning_rate": 1.2171187351126902e-05, + "loss": 0.6287, + "step": 12426 + }, + { + "epoch": 0.43, + "learning_rate": 1.2170124448130858e-05, + "loss": 0.6221, + "step": 12427 + }, + { + "epoch": 0.43, + "learning_rate": 1.216906151940524e-05, + "loss": 0.631, + "step": 12428 + }, + { + "epoch": 0.43, + "learning_rate": 1.2167998564962653e-05, + "loss": 0.6445, + "step": 12429 + }, + { + "epoch": 0.43, + "learning_rate": 1.2166935584815705e-05, + "loss": 0.6152, + "step": 12430 + }, + { + "epoch": 0.43, + "learning_rate": 1.2165872578976989e-05, + "loss": 0.6574, + "step": 12431 + }, + { + "epoch": 0.43, + "learning_rate": 1.2164809547459117e-05, + "loss": 0.6178, + "step": 12432 + }, + { + "epoch": 0.43, + "learning_rate": 1.2163746490274689e-05, + "loss": 0.6603, + "step": 12433 + }, + { + "epoch": 0.43, + "learning_rate": 1.2162683407436308e-05, + "loss": 0.6618, + "step": 12434 + }, + { + "epoch": 0.43, + "learning_rate": 1.2161620298956583e-05, + "loss": 0.64, + "step": 12435 + }, + { + "epoch": 0.43, + "learning_rate": 1.216055716484811e-05, + "loss": 0.6079, + "step": 12436 + }, + { + "epoch": 0.43, + "learning_rate": 1.21594940051235e-05, + "loss": 0.6686, + "step": 12437 + }, + { + "epoch": 0.43, + "learning_rate": 1.2158430819795357e-05, + "loss": 0.5726, + "step": 12438 + }, + { + "epoch": 0.43, + "learning_rate": 1.2157367608876288e-05, + "loss": 0.6712, + "step": 12439 + }, + { + "epoch": 0.43, + "learning_rate": 1.2156304372378892e-05, + "loss": 0.5716, + "step": 12440 + }, + { + "epoch": 0.43, + "learning_rate": 1.2155241110315784e-05, + "loss": 0.6307, + "step": 12441 + }, + { + "epoch": 0.43, + "learning_rate": 1.2154177822699566e-05, + "loss": 0.6387, + "step": 12442 + }, + { + "epoch": 0.43, + "learning_rate": 1.2153114509542845e-05, + "loss": 0.6067, + "step": 12443 + }, + { + "epoch": 0.43, + "learning_rate": 1.2152051170858227e-05, + "loss": 0.6397, + "step": 12444 + }, + { + "epoch": 0.43, + "learning_rate": 1.2150987806658321e-05, + "loss": 0.581, + "step": 12445 + }, + { + "epoch": 0.43, + "learning_rate": 1.2149924416955732e-05, + "loss": 0.6316, + "step": 12446 + }, + { + "epoch": 0.43, + "learning_rate": 1.2148861001763072e-05, + "loss": 0.6368, + "step": 12447 + }, + { + "epoch": 0.43, + "learning_rate": 1.2147797561092945e-05, + "loss": 0.5999, + "step": 12448 + }, + { + "epoch": 0.43, + "learning_rate": 1.214673409495796e-05, + "loss": 0.6573, + "step": 12449 + }, + { + "epoch": 0.43, + "learning_rate": 1.2145670603370727e-05, + "loss": 0.6066, + "step": 12450 + }, + { + "epoch": 0.43, + "learning_rate": 1.2144607086343853e-05, + "loss": 0.6622, + "step": 12451 + }, + { + "epoch": 0.43, + "learning_rate": 1.2143543543889953e-05, + "loss": 0.6017, + "step": 12452 + }, + { + "epoch": 0.43, + "learning_rate": 1.214247997602163e-05, + "loss": 0.6889, + "step": 12453 + }, + { + "epoch": 0.43, + "learning_rate": 1.21414163827515e-05, + "loss": 0.5907, + "step": 12454 + }, + { + "epoch": 0.43, + "learning_rate": 1.2140352764092164e-05, + "loss": 0.6209, + "step": 12455 + }, + { + "epoch": 0.43, + "learning_rate": 1.2139289120056243e-05, + "loss": 0.6526, + "step": 12456 + }, + { + "epoch": 0.43, + "learning_rate": 1.2138225450656343e-05, + "loss": 0.6629, + "step": 12457 + }, + { + "epoch": 0.43, + "learning_rate": 1.2137161755905073e-05, + "loss": 0.6228, + "step": 12458 + }, + { + "epoch": 0.43, + "learning_rate": 1.2136098035815048e-05, + "loss": 0.6258, + "step": 12459 + }, + { + "epoch": 0.43, + "learning_rate": 1.213503429039888e-05, + "loss": 0.6289, + "step": 12460 + }, + { + "epoch": 0.43, + "learning_rate": 1.2133970519669176e-05, + "loss": 0.6202, + "step": 12461 + }, + { + "epoch": 0.43, + "learning_rate": 1.2132906723638558e-05, + "loss": 0.5917, + "step": 12462 + }, + { + "epoch": 0.43, + "learning_rate": 1.2131842902319631e-05, + "loss": 0.6072, + "step": 12463 + }, + { + "epoch": 0.43, + "learning_rate": 1.2130779055725003e-05, + "loss": 0.658, + "step": 12464 + }, + { + "epoch": 0.43, + "learning_rate": 1.2129715183867301e-05, + "loss": 0.6292, + "step": 12465 + }, + { + "epoch": 0.43, + "learning_rate": 1.212865128675913e-05, + "loss": 0.6454, + "step": 12466 + }, + { + "epoch": 0.43, + "learning_rate": 1.21275873644131e-05, + "loss": 0.6504, + "step": 12467 + }, + { + "epoch": 0.43, + "learning_rate": 1.2126523416841838e-05, + "loss": 0.6619, + "step": 12468 + }, + { + "epoch": 0.43, + "learning_rate": 1.2125459444057948e-05, + "loss": 0.6357, + "step": 12469 + }, + { + "epoch": 0.43, + "learning_rate": 1.2124395446074044e-05, + "loss": 0.6244, + "step": 12470 + }, + { + "epoch": 0.43, + "learning_rate": 1.2123331422902749e-05, + "loss": 0.5957, + "step": 12471 + }, + { + "epoch": 0.43, + "learning_rate": 1.2122267374556676e-05, + "loss": 0.612, + "step": 12472 + }, + { + "epoch": 0.43, + "learning_rate": 1.212120330104843e-05, + "loss": 0.6665, + "step": 12473 + }, + { + "epoch": 0.43, + "learning_rate": 1.2120139202390641e-05, + "loss": 0.5995, + "step": 12474 + }, + { + "epoch": 0.43, + "learning_rate": 1.2119075078595923e-05, + "loss": 0.612, + "step": 12475 + }, + { + "epoch": 0.43, + "learning_rate": 1.2118010929676882e-05, + "loss": 0.6767, + "step": 12476 + }, + { + "epoch": 0.43, + "learning_rate": 1.211694675564615e-05, + "loss": 0.669, + "step": 12477 + }, + { + "epoch": 0.43, + "learning_rate": 1.2115882556516331e-05, + "loss": 0.6447, + "step": 12478 + }, + { + "epoch": 0.43, + "learning_rate": 1.2114818332300047e-05, + "loss": 0.6006, + "step": 12479 + }, + { + "epoch": 0.43, + "learning_rate": 1.2113754083009918e-05, + "loss": 0.6479, + "step": 12480 + }, + { + "epoch": 0.43, + "learning_rate": 1.2112689808658562e-05, + "loss": 0.6225, + "step": 12481 + }, + { + "epoch": 0.43, + "learning_rate": 1.2111625509258593e-05, + "loss": 0.5769, + "step": 12482 + }, + { + "epoch": 0.43, + "learning_rate": 1.2110561184822635e-05, + "loss": 0.6168, + "step": 12483 + }, + { + "epoch": 0.43, + "learning_rate": 1.2109496835363304e-05, + "loss": 0.5834, + "step": 12484 + }, + { + "epoch": 0.43, + "learning_rate": 1.2108432460893215e-05, + "loss": 0.5912, + "step": 12485 + }, + { + "epoch": 0.43, + "learning_rate": 1.2107368061424997e-05, + "loss": 0.6648, + "step": 12486 + }, + { + "epoch": 0.43, + "learning_rate": 1.2106303636971266e-05, + "loss": 0.6185, + "step": 12487 + }, + { + "epoch": 0.43, + "learning_rate": 1.2105239187544637e-05, + "loss": 0.6463, + "step": 12488 + }, + { + "epoch": 0.43, + "learning_rate": 1.2104174713157735e-05, + "loss": 0.5882, + "step": 12489 + }, + { + "epoch": 0.43, + "learning_rate": 1.2103110213823181e-05, + "loss": 0.6367, + "step": 12490 + }, + { + "epoch": 0.43, + "learning_rate": 1.2102045689553595e-05, + "loss": 0.6445, + "step": 12491 + }, + { + "epoch": 0.43, + "learning_rate": 1.2100981140361595e-05, + "loss": 0.6644, + "step": 12492 + }, + { + "epoch": 0.43, + "learning_rate": 1.2099916566259812e-05, + "loss": 0.6485, + "step": 12493 + }, + { + "epoch": 0.43, + "learning_rate": 1.2098851967260856e-05, + "loss": 0.6162, + "step": 12494 + }, + { + "epoch": 0.43, + "learning_rate": 1.2097787343377359e-05, + "loss": 0.6561, + "step": 12495 + }, + { + "epoch": 0.43, + "learning_rate": 1.2096722694621939e-05, + "loss": 0.6449, + "step": 12496 + }, + { + "epoch": 0.43, + "learning_rate": 1.2095658021007215e-05, + "loss": 0.6697, + "step": 12497 + }, + { + "epoch": 0.43, + "learning_rate": 1.2094593322545815e-05, + "loss": 0.6856, + "step": 12498 + }, + { + "epoch": 0.43, + "learning_rate": 1.2093528599250366e-05, + "loss": 0.6774, + "step": 12499 + }, + { + "epoch": 0.43, + "learning_rate": 1.2092463851133483e-05, + "loss": 0.5839, + "step": 12500 + }, + { + "epoch": 0.43, + "learning_rate": 1.2091399078207795e-05, + "loss": 0.6057, + "step": 12501 + }, + { + "epoch": 0.43, + "learning_rate": 1.2090334280485927e-05, + "loss": 0.6208, + "step": 12502 + }, + { + "epoch": 0.43, + "learning_rate": 1.20892694579805e-05, + "loss": 0.6477, + "step": 12503 + }, + { + "epoch": 0.43, + "learning_rate": 1.208820461070414e-05, + "loss": 0.6095, + "step": 12504 + }, + { + "epoch": 0.43, + "learning_rate": 1.2087139738669476e-05, + "loss": 0.6419, + "step": 12505 + }, + { + "epoch": 0.43, + "learning_rate": 1.2086074841889126e-05, + "loss": 0.626, + "step": 12506 + }, + { + "epoch": 0.43, + "learning_rate": 1.208500992037572e-05, + "loss": 0.5913, + "step": 12507 + }, + { + "epoch": 0.43, + "learning_rate": 1.2083944974141888e-05, + "loss": 0.6286, + "step": 12508 + }, + { + "epoch": 0.43, + "learning_rate": 1.208288000320025e-05, + "loss": 0.6541, + "step": 12509 + }, + { + "epoch": 0.43, + "learning_rate": 1.2081815007563433e-05, + "loss": 0.616, + "step": 12510 + }, + { + "epoch": 0.43, + "learning_rate": 1.208074998724407e-05, + "loss": 0.6218, + "step": 12511 + }, + { + "epoch": 0.43, + "learning_rate": 1.2079684942254779e-05, + "loss": 0.6568, + "step": 12512 + }, + { + "epoch": 0.43, + "learning_rate": 1.2078619872608194e-05, + "loss": 0.6392, + "step": 12513 + }, + { + "epoch": 0.43, + "learning_rate": 1.2077554778316942e-05, + "loss": 0.6055, + "step": 12514 + }, + { + "epoch": 0.43, + "learning_rate": 1.2076489659393649e-05, + "loss": 0.5993, + "step": 12515 + }, + { + "epoch": 0.43, + "learning_rate": 1.2075424515850944e-05, + "loss": 0.6349, + "step": 12516 + }, + { + "epoch": 0.43, + "learning_rate": 1.2074359347701457e-05, + "loss": 0.6177, + "step": 12517 + }, + { + "epoch": 0.43, + "learning_rate": 1.2073294154957815e-05, + "loss": 0.6057, + "step": 12518 + }, + { + "epoch": 0.43, + "learning_rate": 1.2072228937632646e-05, + "loss": 0.6585, + "step": 12519 + }, + { + "epoch": 0.43, + "learning_rate": 1.2071163695738586e-05, + "loss": 0.5935, + "step": 12520 + }, + { + "epoch": 0.43, + "learning_rate": 1.2070098429288257e-05, + "loss": 0.6437, + "step": 12521 + }, + { + "epoch": 0.43, + "learning_rate": 1.2069033138294293e-05, + "loss": 0.6464, + "step": 12522 + }, + { + "epoch": 0.43, + "learning_rate": 1.2067967822769326e-05, + "loss": 0.6202, + "step": 12523 + }, + { + "epoch": 0.43, + "learning_rate": 1.2066902482725983e-05, + "loss": 0.6316, + "step": 12524 + }, + { + "epoch": 0.43, + "learning_rate": 1.2065837118176895e-05, + "loss": 0.6336, + "step": 12525 + }, + { + "epoch": 0.43, + "learning_rate": 1.2064771729134696e-05, + "loss": 0.6096, + "step": 12526 + }, + { + "epoch": 0.43, + "learning_rate": 1.2063706315612016e-05, + "loss": 0.6139, + "step": 12527 + }, + { + "epoch": 0.43, + "learning_rate": 1.2062640877621487e-05, + "loss": 0.6533, + "step": 12528 + }, + { + "epoch": 0.43, + "learning_rate": 1.2061575415175742e-05, + "loss": 0.6362, + "step": 12529 + }, + { + "epoch": 0.43, + "learning_rate": 1.2060509928287412e-05, + "loss": 0.6271, + "step": 12530 + }, + { + "epoch": 0.43, + "learning_rate": 1.205944441696913e-05, + "loss": 0.618, + "step": 12531 + }, + { + "epoch": 0.43, + "learning_rate": 1.2058378881233528e-05, + "loss": 0.641, + "step": 12532 + }, + { + "epoch": 0.43, + "learning_rate": 1.2057313321093242e-05, + "loss": 0.5907, + "step": 12533 + }, + { + "epoch": 0.43, + "learning_rate": 1.2056247736560905e-05, + "loss": 0.634, + "step": 12534 + }, + { + "epoch": 0.43, + "learning_rate": 1.2055182127649148e-05, + "loss": 0.6343, + "step": 12535 + }, + { + "epoch": 0.43, + "learning_rate": 1.2054116494370608e-05, + "loss": 0.682, + "step": 12536 + }, + { + "epoch": 0.43, + "learning_rate": 1.2053050836737919e-05, + "loss": 0.595, + "step": 12537 + }, + { + "epoch": 0.43, + "learning_rate": 1.2051985154763712e-05, + "loss": 0.7031, + "step": 12538 + }, + { + "epoch": 0.43, + "learning_rate": 1.2050919448460627e-05, + "loss": 0.6338, + "step": 12539 + }, + { + "epoch": 0.43, + "learning_rate": 1.20498537178413e-05, + "loss": 0.649, + "step": 12540 + }, + { + "epoch": 0.43, + "learning_rate": 1.2048787962918362e-05, + "loss": 0.6066, + "step": 12541 + }, + { + "epoch": 0.43, + "learning_rate": 1.2047722183704451e-05, + "loss": 0.6351, + "step": 12542 + }, + { + "epoch": 0.43, + "learning_rate": 1.2046656380212205e-05, + "loss": 0.5854, + "step": 12543 + }, + { + "epoch": 0.43, + "learning_rate": 1.2045590552454256e-05, + "loss": 0.6418, + "step": 12544 + }, + { + "epoch": 0.43, + "learning_rate": 1.2044524700443244e-05, + "loss": 0.638, + "step": 12545 + }, + { + "epoch": 0.43, + "learning_rate": 1.2043458824191807e-05, + "loss": 0.5957, + "step": 12546 + }, + { + "epoch": 0.43, + "learning_rate": 1.2042392923712578e-05, + "loss": 0.65, + "step": 12547 + }, + { + "epoch": 0.43, + "learning_rate": 1.2041326999018197e-05, + "loss": 0.6112, + "step": 12548 + }, + { + "epoch": 0.43, + "learning_rate": 1.2040261050121307e-05, + "loss": 0.6233, + "step": 12549 + }, + { + "epoch": 0.43, + "learning_rate": 1.2039195077034536e-05, + "loss": 0.6537, + "step": 12550 + }, + { + "epoch": 0.43, + "learning_rate": 1.2038129079770529e-05, + "loss": 0.6329, + "step": 12551 + }, + { + "epoch": 0.43, + "learning_rate": 1.2037063058341926e-05, + "loss": 0.67, + "step": 12552 + }, + { + "epoch": 0.43, + "learning_rate": 1.2035997012761361e-05, + "loss": 0.5886, + "step": 12553 + }, + { + "epoch": 0.43, + "learning_rate": 1.2034930943041477e-05, + "loss": 0.6083, + "step": 12554 + }, + { + "epoch": 0.43, + "learning_rate": 1.2033864849194912e-05, + "loss": 0.6487, + "step": 12555 + }, + { + "epoch": 0.44, + "learning_rate": 1.2032798731234308e-05, + "loss": 0.6312, + "step": 12556 + }, + { + "epoch": 0.44, + "learning_rate": 1.20317325891723e-05, + "loss": 0.6452, + "step": 12557 + }, + { + "epoch": 0.44, + "learning_rate": 1.2030666423021536e-05, + "loss": 0.6501, + "step": 12558 + }, + { + "epoch": 0.44, + "learning_rate": 1.2029600232794652e-05, + "loss": 0.6429, + "step": 12559 + }, + { + "epoch": 0.44, + "learning_rate": 1.2028534018504285e-05, + "loss": 0.6527, + "step": 12560 + }, + { + "epoch": 0.44, + "learning_rate": 1.2027467780163087e-05, + "loss": 0.6628, + "step": 12561 + }, + { + "epoch": 0.44, + "learning_rate": 1.2026401517783692e-05, + "loss": 0.6326, + "step": 12562 + }, + { + "epoch": 0.44, + "learning_rate": 1.2025335231378741e-05, + "loss": 0.6601, + "step": 12563 + }, + { + "epoch": 0.44, + "learning_rate": 1.2024268920960882e-05, + "loss": 0.5929, + "step": 12564 + }, + { + "epoch": 0.44, + "learning_rate": 1.2023202586542753e-05, + "loss": 0.6225, + "step": 12565 + }, + { + "epoch": 0.44, + "learning_rate": 1.2022136228136996e-05, + "loss": 0.6663, + "step": 12566 + }, + { + "epoch": 0.44, + "learning_rate": 1.202106984575626e-05, + "loss": 0.6412, + "step": 12567 + }, + { + "epoch": 0.44, + "learning_rate": 1.2020003439413181e-05, + "loss": 0.6557, + "step": 12568 + }, + { + "epoch": 0.44, + "learning_rate": 1.2018937009120406e-05, + "loss": 0.669, + "step": 12569 + }, + { + "epoch": 0.44, + "learning_rate": 1.2017870554890581e-05, + "loss": 0.6428, + "step": 12570 + }, + { + "epoch": 0.44, + "learning_rate": 1.2016804076736348e-05, + "loss": 0.6298, + "step": 12571 + }, + { + "epoch": 0.44, + "learning_rate": 1.2015737574670347e-05, + "loss": 0.6124, + "step": 12572 + }, + { + "epoch": 0.44, + "learning_rate": 1.2014671048705232e-05, + "loss": 0.6354, + "step": 12573 + }, + { + "epoch": 0.44, + "learning_rate": 1.2013604498853645e-05, + "loss": 0.5723, + "step": 12574 + }, + { + "epoch": 0.44, + "learning_rate": 1.2012537925128223e-05, + "loss": 0.6029, + "step": 12575 + }, + { + "epoch": 0.44, + "learning_rate": 1.2011471327541622e-05, + "loss": 0.6367, + "step": 12576 + }, + { + "epoch": 0.44, + "learning_rate": 1.2010404706106484e-05, + "loss": 0.6363, + "step": 12577 + }, + { + "epoch": 0.44, + "learning_rate": 1.2009338060835452e-05, + "loss": 0.6331, + "step": 12578 + }, + { + "epoch": 0.44, + "learning_rate": 1.2008271391741178e-05, + "loss": 0.651, + "step": 12579 + }, + { + "epoch": 0.44, + "learning_rate": 1.2007204698836305e-05, + "loss": 0.6465, + "step": 12580 + }, + { + "epoch": 0.44, + "learning_rate": 1.200613798213348e-05, + "loss": 0.6459, + "step": 12581 + }, + { + "epoch": 0.44, + "learning_rate": 1.2005071241645354e-05, + "loss": 0.6751, + "step": 12582 + }, + { + "epoch": 0.44, + "learning_rate": 1.2004004477384574e-05, + "loss": 0.5774, + "step": 12583 + }, + { + "epoch": 0.44, + "learning_rate": 1.2002937689363781e-05, + "loss": 0.6259, + "step": 12584 + }, + { + "epoch": 0.44, + "learning_rate": 1.200187087759563e-05, + "loss": 0.6164, + "step": 12585 + }, + { + "epoch": 0.44, + "learning_rate": 1.2000804042092768e-05, + "loss": 0.6496, + "step": 12586 + }, + { + "epoch": 0.44, + "learning_rate": 1.1999737182867843e-05, + "loss": 0.6226, + "step": 12587 + }, + { + "epoch": 0.44, + "learning_rate": 1.1998670299933503e-05, + "loss": 0.5615, + "step": 12588 + }, + { + "epoch": 0.44, + "learning_rate": 1.19976033933024e-05, + "loss": 0.665, + "step": 12589 + }, + { + "epoch": 0.44, + "learning_rate": 1.1996536462987179e-05, + "loss": 0.6256, + "step": 12590 + }, + { + "epoch": 0.44, + "learning_rate": 1.1995469509000493e-05, + "loss": 0.6356, + "step": 12591 + }, + { + "epoch": 0.44, + "learning_rate": 1.1994402531354993e-05, + "loss": 0.6204, + "step": 12592 + }, + { + "epoch": 0.44, + "learning_rate": 1.1993335530063328e-05, + "loss": 0.5809, + "step": 12593 + }, + { + "epoch": 0.44, + "learning_rate": 1.199226850513815e-05, + "loss": 0.6236, + "step": 12594 + }, + { + "epoch": 0.44, + "learning_rate": 1.1991201456592108e-05, + "loss": 0.6363, + "step": 12595 + }, + { + "epoch": 0.44, + "learning_rate": 1.1990134384437853e-05, + "loss": 0.6434, + "step": 12596 + }, + { + "epoch": 0.44, + "learning_rate": 1.1989067288688037e-05, + "loss": 0.6244, + "step": 12597 + }, + { + "epoch": 0.44, + "learning_rate": 1.1988000169355311e-05, + "loss": 0.6103, + "step": 12598 + }, + { + "epoch": 0.44, + "learning_rate": 1.198693302645233e-05, + "loss": 0.6208, + "step": 12599 + }, + { + "epoch": 0.44, + "learning_rate": 1.1985865859991742e-05, + "loss": 0.6299, + "step": 12600 + }, + { + "epoch": 0.44, + "learning_rate": 1.1984798669986209e-05, + "loss": 0.6651, + "step": 12601 + }, + { + "epoch": 0.44, + "learning_rate": 1.198373145644837e-05, + "loss": 0.6806, + "step": 12602 + }, + { + "epoch": 0.44, + "learning_rate": 1.1982664219390887e-05, + "loss": 0.6291, + "step": 12603 + }, + { + "epoch": 0.44, + "learning_rate": 1.1981596958826414e-05, + "loss": 0.6457, + "step": 12604 + }, + { + "epoch": 0.44, + "learning_rate": 1.1980529674767599e-05, + "loss": 0.6588, + "step": 12605 + }, + { + "epoch": 0.44, + "learning_rate": 1.19794623672271e-05, + "loss": 0.6166, + "step": 12606 + }, + { + "epoch": 0.44, + "learning_rate": 1.1978395036217572e-05, + "loss": 0.6155, + "step": 12607 + }, + { + "epoch": 0.44, + "learning_rate": 1.1977327681751668e-05, + "loss": 0.663, + "step": 12608 + }, + { + "epoch": 0.44, + "learning_rate": 1.197626030384204e-05, + "loss": 0.6535, + "step": 12609 + }, + { + "epoch": 0.44, + "learning_rate": 1.1975192902501349e-05, + "loss": 0.6021, + "step": 12610 + }, + { + "epoch": 0.44, + "learning_rate": 1.1974125477742247e-05, + "loss": 0.5813, + "step": 12611 + }, + { + "epoch": 0.44, + "learning_rate": 1.1973058029577388e-05, + "loss": 0.6916, + "step": 12612 + }, + { + "epoch": 0.44, + "learning_rate": 1.1971990558019435e-05, + "loss": 0.6338, + "step": 12613 + }, + { + "epoch": 0.44, + "learning_rate": 1.1970923063081038e-05, + "loss": 0.61, + "step": 12614 + }, + { + "epoch": 0.44, + "learning_rate": 1.1969855544774851e-05, + "loss": 0.6133, + "step": 12615 + }, + { + "epoch": 0.44, + "learning_rate": 1.1968788003113539e-05, + "loss": 0.6184, + "step": 12616 + }, + { + "epoch": 0.44, + "learning_rate": 1.196772043810975e-05, + "loss": 0.6692, + "step": 12617 + }, + { + "epoch": 0.44, + "learning_rate": 1.1966652849776152e-05, + "loss": 0.6262, + "step": 12618 + }, + { + "epoch": 0.44, + "learning_rate": 1.1965585238125392e-05, + "loss": 0.5753, + "step": 12619 + }, + { + "epoch": 0.44, + "learning_rate": 1.1964517603170134e-05, + "loss": 0.6067, + "step": 12620 + }, + { + "epoch": 0.44, + "learning_rate": 1.1963449944923036e-05, + "loss": 0.6148, + "step": 12621 + }, + { + "epoch": 0.44, + "learning_rate": 1.1962382263396752e-05, + "loss": 0.5804, + "step": 12622 + }, + { + "epoch": 0.44, + "learning_rate": 1.1961314558603946e-05, + "loss": 0.6628, + "step": 12623 + }, + { + "epoch": 0.44, + "learning_rate": 1.1960246830557276e-05, + "loss": 0.6711, + "step": 12624 + }, + { + "epoch": 0.44, + "learning_rate": 1.1959179079269399e-05, + "loss": 0.6151, + "step": 12625 + }, + { + "epoch": 0.44, + "learning_rate": 1.1958111304752973e-05, + "loss": 0.656, + "step": 12626 + }, + { + "epoch": 0.44, + "learning_rate": 1.1957043507020665e-05, + "loss": 0.6393, + "step": 12627 + }, + { + "epoch": 0.44, + "learning_rate": 1.1955975686085129e-05, + "loss": 0.6423, + "step": 12628 + }, + { + "epoch": 0.44, + "learning_rate": 1.1954907841959026e-05, + "loss": 0.6265, + "step": 12629 + }, + { + "epoch": 0.44, + "learning_rate": 1.1953839974655018e-05, + "loss": 0.5778, + "step": 12630 + }, + { + "epoch": 0.44, + "learning_rate": 1.1952772084185765e-05, + "loss": 0.6244, + "step": 12631 + }, + { + "epoch": 0.44, + "learning_rate": 1.1951704170563927e-05, + "loss": 0.6063, + "step": 12632 + }, + { + "epoch": 0.44, + "learning_rate": 1.1950636233802172e-05, + "loss": 0.5795, + "step": 12633 + }, + { + "epoch": 0.44, + "learning_rate": 1.1949568273913153e-05, + "loss": 0.6208, + "step": 12634 + }, + { + "epoch": 0.44, + "learning_rate": 1.1948500290909535e-05, + "loss": 0.6288, + "step": 12635 + }, + { + "epoch": 0.44, + "learning_rate": 1.1947432284803984e-05, + "loss": 0.6394, + "step": 12636 + }, + { + "epoch": 0.44, + "learning_rate": 1.1946364255609157e-05, + "loss": 0.6421, + "step": 12637 + }, + { + "epoch": 0.44, + "learning_rate": 1.1945296203337721e-05, + "loss": 0.6537, + "step": 12638 + }, + { + "epoch": 0.44, + "learning_rate": 1.194422812800234e-05, + "loss": 0.6441, + "step": 12639 + }, + { + "epoch": 0.44, + "learning_rate": 1.1943160029615672e-05, + "loss": 0.5801, + "step": 12640 + }, + { + "epoch": 0.44, + "learning_rate": 1.1942091908190385e-05, + "loss": 0.6717, + "step": 12641 + }, + { + "epoch": 0.44, + "learning_rate": 1.1941023763739143e-05, + "loss": 0.551, + "step": 12642 + }, + { + "epoch": 0.44, + "learning_rate": 1.1939955596274606e-05, + "loss": 0.6687, + "step": 12643 + }, + { + "epoch": 0.44, + "learning_rate": 1.1938887405809443e-05, + "loss": 0.638, + "step": 12644 + }, + { + "epoch": 0.44, + "learning_rate": 1.1937819192356317e-05, + "loss": 0.671, + "step": 12645 + }, + { + "epoch": 0.44, + "learning_rate": 1.1936750955927891e-05, + "loss": 0.644, + "step": 12646 + }, + { + "epoch": 0.44, + "learning_rate": 1.1935682696536835e-05, + "loss": 0.6247, + "step": 12647 + }, + { + "epoch": 0.44, + "learning_rate": 1.1934614414195814e-05, + "loss": 0.5936, + "step": 12648 + }, + { + "epoch": 0.44, + "learning_rate": 1.193354610891749e-05, + "loss": 0.6279, + "step": 12649 + }, + { + "epoch": 0.44, + "learning_rate": 1.1932477780714526e-05, + "loss": 0.628, + "step": 12650 + }, + { + "epoch": 0.44, + "learning_rate": 1.19314094295996e-05, + "loss": 0.6129, + "step": 12651 + }, + { + "epoch": 0.44, + "learning_rate": 1.1930341055585369e-05, + "loss": 0.6277, + "step": 12652 + }, + { + "epoch": 0.44, + "learning_rate": 1.1929272658684502e-05, + "loss": 0.6551, + "step": 12653 + }, + { + "epoch": 0.44, + "learning_rate": 1.1928204238909671e-05, + "loss": 0.6629, + "step": 12654 + }, + { + "epoch": 0.44, + "learning_rate": 1.1927135796273534e-05, + "loss": 0.6592, + "step": 12655 + }, + { + "epoch": 0.44, + "learning_rate": 1.1926067330788769e-05, + "loss": 0.6123, + "step": 12656 + }, + { + "epoch": 0.44, + "learning_rate": 1.1924998842468039e-05, + "loss": 0.6082, + "step": 12657 + }, + { + "epoch": 0.44, + "learning_rate": 1.192393033132401e-05, + "loss": 0.6154, + "step": 12658 + }, + { + "epoch": 0.44, + "learning_rate": 1.1922861797369351e-05, + "loss": 0.6284, + "step": 12659 + }, + { + "epoch": 0.44, + "learning_rate": 1.192179324061674e-05, + "loss": 0.6903, + "step": 12660 + }, + { + "epoch": 0.44, + "learning_rate": 1.1920724661078832e-05, + "loss": 0.5583, + "step": 12661 + }, + { + "epoch": 0.44, + "learning_rate": 1.1919656058768308e-05, + "loss": 0.666, + "step": 12662 + }, + { + "epoch": 0.44, + "learning_rate": 1.1918587433697832e-05, + "loss": 0.6793, + "step": 12663 + }, + { + "epoch": 0.44, + "learning_rate": 1.1917518785880075e-05, + "loss": 0.5583, + "step": 12664 + }, + { + "epoch": 0.44, + "learning_rate": 1.1916450115327707e-05, + "loss": 0.615, + "step": 12665 + }, + { + "epoch": 0.44, + "learning_rate": 1.1915381422053398e-05, + "loss": 0.6252, + "step": 12666 + }, + { + "epoch": 0.44, + "learning_rate": 1.1914312706069819e-05, + "loss": 0.6427, + "step": 12667 + }, + { + "epoch": 0.44, + "learning_rate": 1.1913243967389643e-05, + "loss": 0.6572, + "step": 12668 + }, + { + "epoch": 0.44, + "learning_rate": 1.1912175206025537e-05, + "loss": 0.5851, + "step": 12669 + }, + { + "epoch": 0.44, + "learning_rate": 1.1911106421990178e-05, + "loss": 0.6841, + "step": 12670 + }, + { + "epoch": 0.44, + "learning_rate": 1.1910037615296233e-05, + "loss": 0.6328, + "step": 12671 + }, + { + "epoch": 0.44, + "learning_rate": 1.1908968785956376e-05, + "loss": 0.6006, + "step": 12672 + }, + { + "epoch": 0.44, + "learning_rate": 1.1907899933983279e-05, + "loss": 0.6728, + "step": 12673 + }, + { + "epoch": 0.44, + "learning_rate": 1.1906831059389614e-05, + "loss": 0.6277, + "step": 12674 + }, + { + "epoch": 0.44, + "learning_rate": 1.1905762162188058e-05, + "loss": 0.6296, + "step": 12675 + }, + { + "epoch": 0.44, + "learning_rate": 1.1904693242391277e-05, + "loss": 0.6412, + "step": 12676 + }, + { + "epoch": 0.44, + "learning_rate": 1.190362430001195e-05, + "loss": 0.6124, + "step": 12677 + }, + { + "epoch": 0.44, + "learning_rate": 1.190255533506275e-05, + "loss": 0.5927, + "step": 12678 + }, + { + "epoch": 0.44, + "learning_rate": 1.1901486347556346e-05, + "loss": 0.663, + "step": 12679 + }, + { + "epoch": 0.44, + "learning_rate": 1.190041733750542e-05, + "loss": 0.6271, + "step": 12680 + }, + { + "epoch": 0.44, + "learning_rate": 1.189934830492264e-05, + "loss": 0.6393, + "step": 12681 + }, + { + "epoch": 0.44, + "learning_rate": 1.1898279249820684e-05, + "loss": 0.6577, + "step": 12682 + }, + { + "epoch": 0.44, + "learning_rate": 1.1897210172212226e-05, + "loss": 0.6092, + "step": 12683 + }, + { + "epoch": 0.44, + "learning_rate": 1.189614107210994e-05, + "loss": 0.6671, + "step": 12684 + }, + { + "epoch": 0.44, + "learning_rate": 1.1895071949526507e-05, + "loss": 0.6303, + "step": 12685 + }, + { + "epoch": 0.44, + "learning_rate": 1.1894002804474594e-05, + "loss": 0.6412, + "step": 12686 + }, + { + "epoch": 0.44, + "learning_rate": 1.1892933636966884e-05, + "loss": 0.6027, + "step": 12687 + }, + { + "epoch": 0.44, + "learning_rate": 1.1891864447016053e-05, + "loss": 0.6395, + "step": 12688 + }, + { + "epoch": 0.44, + "learning_rate": 1.1890795234634772e-05, + "loss": 0.6234, + "step": 12689 + }, + { + "epoch": 0.44, + "learning_rate": 1.1889725999835721e-05, + "loss": 0.6093, + "step": 12690 + }, + { + "epoch": 0.44, + "learning_rate": 1.1888656742631583e-05, + "loss": 0.6951, + "step": 12691 + }, + { + "epoch": 0.44, + "learning_rate": 1.1887587463035027e-05, + "loss": 0.6803, + "step": 12692 + }, + { + "epoch": 0.44, + "learning_rate": 1.1886518161058734e-05, + "loss": 0.5904, + "step": 12693 + }, + { + "epoch": 0.44, + "learning_rate": 1.188544883671538e-05, + "loss": 0.6457, + "step": 12694 + }, + { + "epoch": 0.44, + "learning_rate": 1.1884379490017647e-05, + "loss": 0.5845, + "step": 12695 + }, + { + "epoch": 0.44, + "learning_rate": 1.1883310120978212e-05, + "loss": 0.6141, + "step": 12696 + }, + { + "epoch": 0.44, + "learning_rate": 1.1882240729609753e-05, + "loss": 0.6106, + "step": 12697 + }, + { + "epoch": 0.44, + "learning_rate": 1.1881171315924949e-05, + "loss": 0.6241, + "step": 12698 + }, + { + "epoch": 0.44, + "learning_rate": 1.1880101879936477e-05, + "loss": 0.6347, + "step": 12699 + }, + { + "epoch": 0.44, + "learning_rate": 1.1879032421657021e-05, + "loss": 0.6591, + "step": 12700 + }, + { + "epoch": 0.44, + "learning_rate": 1.187796294109926e-05, + "loss": 0.5801, + "step": 12701 + }, + { + "epoch": 0.44, + "learning_rate": 1.187689343827587e-05, + "loss": 0.6208, + "step": 12702 + }, + { + "epoch": 0.44, + "learning_rate": 1.1875823913199536e-05, + "loss": 0.653, + "step": 12703 + }, + { + "epoch": 0.44, + "learning_rate": 1.1874754365882935e-05, + "loss": 0.6249, + "step": 12704 + }, + { + "epoch": 0.44, + "learning_rate": 1.1873684796338746e-05, + "loss": 0.6585, + "step": 12705 + }, + { + "epoch": 0.44, + "learning_rate": 1.1872615204579661e-05, + "loss": 0.6751, + "step": 12706 + }, + { + "epoch": 0.44, + "learning_rate": 1.187154559061835e-05, + "loss": 0.6403, + "step": 12707 + }, + { + "epoch": 0.44, + "learning_rate": 1.1870475954467497e-05, + "loss": 0.6297, + "step": 12708 + }, + { + "epoch": 0.44, + "learning_rate": 1.186940629613979e-05, + "loss": 0.6718, + "step": 12709 + }, + { + "epoch": 0.44, + "learning_rate": 1.1868336615647901e-05, + "loss": 0.66, + "step": 12710 + }, + { + "epoch": 0.44, + "learning_rate": 1.1867266913004523e-05, + "loss": 0.6264, + "step": 12711 + }, + { + "epoch": 0.44, + "learning_rate": 1.1866197188222332e-05, + "loss": 0.5979, + "step": 12712 + }, + { + "epoch": 0.44, + "learning_rate": 1.1865127441314011e-05, + "loss": 0.666, + "step": 12713 + }, + { + "epoch": 0.44, + "learning_rate": 1.1864057672292247e-05, + "loss": 0.5936, + "step": 12714 + }, + { + "epoch": 0.44, + "learning_rate": 1.186298788116972e-05, + "loss": 0.6099, + "step": 12715 + }, + { + "epoch": 0.44, + "learning_rate": 1.1861918067959113e-05, + "loss": 0.6355, + "step": 12716 + }, + { + "epoch": 0.44, + "learning_rate": 1.1860848232673116e-05, + "loss": 0.617, + "step": 12717 + }, + { + "epoch": 0.44, + "learning_rate": 1.1859778375324406e-05, + "loss": 0.6489, + "step": 12718 + }, + { + "epoch": 0.44, + "learning_rate": 1.1858708495925672e-05, + "loss": 0.6423, + "step": 12719 + }, + { + "epoch": 0.44, + "learning_rate": 1.1857638594489598e-05, + "loss": 0.6393, + "step": 12720 + }, + { + "epoch": 0.44, + "learning_rate": 1.1856568671028867e-05, + "loss": 0.5983, + "step": 12721 + }, + { + "epoch": 0.44, + "learning_rate": 1.1855498725556168e-05, + "loss": 0.654, + "step": 12722 + }, + { + "epoch": 0.44, + "learning_rate": 1.1854428758084184e-05, + "loss": 0.6328, + "step": 12723 + }, + { + "epoch": 0.44, + "learning_rate": 1.1853358768625598e-05, + "loss": 0.6081, + "step": 12724 + }, + { + "epoch": 0.44, + "learning_rate": 1.1852288757193103e-05, + "loss": 0.6682, + "step": 12725 + }, + { + "epoch": 0.44, + "learning_rate": 1.1851218723799381e-05, + "loss": 0.6353, + "step": 12726 + }, + { + "epoch": 0.44, + "learning_rate": 1.1850148668457118e-05, + "loss": 0.6684, + "step": 12727 + }, + { + "epoch": 0.44, + "learning_rate": 1.1849078591179001e-05, + "loss": 0.653, + "step": 12728 + }, + { + "epoch": 0.44, + "learning_rate": 1.1848008491977723e-05, + "loss": 0.6375, + "step": 12729 + }, + { + "epoch": 0.44, + "learning_rate": 1.1846938370865962e-05, + "loss": 0.5974, + "step": 12730 + }, + { + "epoch": 0.44, + "learning_rate": 1.184586822785641e-05, + "loss": 0.647, + "step": 12731 + }, + { + "epoch": 0.44, + "learning_rate": 1.1844798062961758e-05, + "loss": 0.6253, + "step": 12732 + }, + { + "epoch": 0.44, + "learning_rate": 1.1843727876194691e-05, + "loss": 0.6054, + "step": 12733 + }, + { + "epoch": 0.44, + "learning_rate": 1.1842657667567896e-05, + "loss": 0.661, + "step": 12734 + }, + { + "epoch": 0.44, + "learning_rate": 1.1841587437094064e-05, + "loss": 0.5955, + "step": 12735 + }, + { + "epoch": 0.44, + "learning_rate": 1.1840517184785883e-05, + "loss": 0.6415, + "step": 12736 + }, + { + "epoch": 0.44, + "learning_rate": 1.1839446910656043e-05, + "loss": 0.6603, + "step": 12737 + }, + { + "epoch": 0.44, + "learning_rate": 1.1838376614717234e-05, + "loss": 0.6977, + "step": 12738 + }, + { + "epoch": 0.44, + "learning_rate": 1.1837306296982142e-05, + "loss": 0.6252, + "step": 12739 + }, + { + "epoch": 0.44, + "learning_rate": 1.183623595746346e-05, + "loss": 0.6178, + "step": 12740 + }, + { + "epoch": 0.44, + "learning_rate": 1.1835165596173881e-05, + "loss": 0.6512, + "step": 12741 + }, + { + "epoch": 0.44, + "learning_rate": 1.183409521312609e-05, + "loss": 0.561, + "step": 12742 + }, + { + "epoch": 0.44, + "learning_rate": 1.183302480833278e-05, + "loss": 0.696, + "step": 12743 + }, + { + "epoch": 0.44, + "learning_rate": 1.1831954381806646e-05, + "loss": 0.7045, + "step": 12744 + }, + { + "epoch": 0.44, + "learning_rate": 1.1830883933560369e-05, + "loss": 0.5989, + "step": 12745 + }, + { + "epoch": 0.44, + "learning_rate": 1.182981346360665e-05, + "loss": 0.5945, + "step": 12746 + }, + { + "epoch": 0.44, + "learning_rate": 1.1828742971958178e-05, + "loss": 0.6287, + "step": 12747 + }, + { + "epoch": 0.44, + "learning_rate": 1.1827672458627643e-05, + "loss": 0.6408, + "step": 12748 + }, + { + "epoch": 0.44, + "learning_rate": 1.182660192362774e-05, + "loss": 0.6803, + "step": 12749 + }, + { + "epoch": 0.44, + "learning_rate": 1.1825531366971163e-05, + "loss": 0.5672, + "step": 12750 + }, + { + "epoch": 0.44, + "learning_rate": 1.1824460788670599e-05, + "loss": 0.6248, + "step": 12751 + }, + { + "epoch": 0.44, + "learning_rate": 1.1823390188738746e-05, + "loss": 0.5567, + "step": 12752 + }, + { + "epoch": 0.44, + "learning_rate": 1.1822319567188297e-05, + "loss": 0.6272, + "step": 12753 + }, + { + "epoch": 0.44, + "learning_rate": 1.1821248924031941e-05, + "loss": 0.6639, + "step": 12754 + }, + { + "epoch": 0.44, + "learning_rate": 1.1820178259282376e-05, + "loss": 0.6313, + "step": 12755 + }, + { + "epoch": 0.44, + "learning_rate": 1.1819107572952297e-05, + "loss": 0.6659, + "step": 12756 + }, + { + "epoch": 0.44, + "learning_rate": 1.1818036865054394e-05, + "loss": 0.5762, + "step": 12757 + }, + { + "epoch": 0.44, + "learning_rate": 1.1816966135601366e-05, + "loss": 0.6055, + "step": 12758 + }, + { + "epoch": 0.44, + "learning_rate": 1.1815895384605907e-05, + "loss": 0.6459, + "step": 12759 + }, + { + "epoch": 0.44, + "learning_rate": 1.1814824612080709e-05, + "loss": 0.5751, + "step": 12760 + }, + { + "epoch": 0.44, + "learning_rate": 1.1813753818038469e-05, + "loss": 0.6589, + "step": 12761 + }, + { + "epoch": 0.44, + "learning_rate": 1.1812683002491884e-05, + "loss": 0.6052, + "step": 12762 + }, + { + "epoch": 0.44, + "learning_rate": 1.181161216545365e-05, + "loss": 0.6245, + "step": 12763 + }, + { + "epoch": 0.44, + "learning_rate": 1.181054130693646e-05, + "loss": 0.582, + "step": 12764 + }, + { + "epoch": 0.44, + "learning_rate": 1.1809470426953016e-05, + "loss": 0.6584, + "step": 12765 + }, + { + "epoch": 0.44, + "learning_rate": 1.1808399525516008e-05, + "loss": 0.6141, + "step": 12766 + }, + { + "epoch": 0.44, + "learning_rate": 1.1807328602638136e-05, + "loss": 0.6582, + "step": 12767 + }, + { + "epoch": 0.44, + "learning_rate": 1.1806257658332099e-05, + "loss": 0.6801, + "step": 12768 + }, + { + "epoch": 0.44, + "learning_rate": 1.1805186692610591e-05, + "loss": 0.66, + "step": 12769 + }, + { + "epoch": 0.44, + "learning_rate": 1.180411570548631e-05, + "loss": 0.6439, + "step": 12770 + }, + { + "epoch": 0.44, + "learning_rate": 1.1803044696971957e-05, + "loss": 0.6388, + "step": 12771 + }, + { + "epoch": 0.44, + "learning_rate": 1.180197366708023e-05, + "loss": 0.5949, + "step": 12772 + }, + { + "epoch": 0.44, + "learning_rate": 1.1800902615823823e-05, + "loss": 0.5963, + "step": 12773 + }, + { + "epoch": 0.44, + "learning_rate": 1.1799831543215436e-05, + "loss": 0.6743, + "step": 12774 + }, + { + "epoch": 0.44, + "learning_rate": 1.1798760449267771e-05, + "loss": 0.6653, + "step": 12775 + }, + { + "epoch": 0.44, + "learning_rate": 1.1797689333993528e-05, + "loss": 0.6467, + "step": 12776 + }, + { + "epoch": 0.44, + "learning_rate": 1.17966181974054e-05, + "loss": 0.5774, + "step": 12777 + }, + { + "epoch": 0.44, + "learning_rate": 1.179554703951609e-05, + "loss": 0.6411, + "step": 12778 + }, + { + "epoch": 0.44, + "learning_rate": 1.1794475860338304e-05, + "loss": 0.6009, + "step": 12779 + }, + { + "epoch": 0.44, + "learning_rate": 1.1793404659884732e-05, + "loss": 0.659, + "step": 12780 + }, + { + "epoch": 0.44, + "learning_rate": 1.179233343816808e-05, + "loss": 0.6113, + "step": 12781 + }, + { + "epoch": 0.44, + "learning_rate": 1.179126219520105e-05, + "loss": 0.6872, + "step": 12782 + }, + { + "epoch": 0.44, + "learning_rate": 1.1790190930996337e-05, + "loss": 0.6328, + "step": 12783 + }, + { + "epoch": 0.44, + "learning_rate": 1.1789119645566648e-05, + "loss": 0.567, + "step": 12784 + }, + { + "epoch": 0.44, + "learning_rate": 1.1788048338924683e-05, + "loss": 0.5578, + "step": 12785 + }, + { + "epoch": 0.44, + "learning_rate": 1.1786977011083141e-05, + "loss": 0.6145, + "step": 12786 + }, + { + "epoch": 0.44, + "learning_rate": 1.1785905662054726e-05, + "loss": 0.6104, + "step": 12787 + }, + { + "epoch": 0.44, + "learning_rate": 1.1784834291852143e-05, + "loss": 0.6008, + "step": 12788 + }, + { + "epoch": 0.44, + "learning_rate": 1.1783762900488087e-05, + "loss": 0.6401, + "step": 12789 + }, + { + "epoch": 0.44, + "learning_rate": 1.1782691487975268e-05, + "loss": 0.6346, + "step": 12790 + }, + { + "epoch": 0.44, + "learning_rate": 1.1781620054326388e-05, + "loss": 0.6142, + "step": 12791 + }, + { + "epoch": 0.44, + "learning_rate": 1.1780548599554147e-05, + "loss": 0.6132, + "step": 12792 + }, + { + "epoch": 0.44, + "learning_rate": 1.177947712367125e-05, + "loss": 0.575, + "step": 12793 + }, + { + "epoch": 0.44, + "learning_rate": 1.1778405626690402e-05, + "loss": 0.6869, + "step": 12794 + }, + { + "epoch": 0.44, + "learning_rate": 1.1777334108624303e-05, + "loss": 0.6506, + "step": 12795 + }, + { + "epoch": 0.44, + "learning_rate": 1.1776262569485658e-05, + "loss": 0.5887, + "step": 12796 + }, + { + "epoch": 0.44, + "learning_rate": 1.1775191009287178e-05, + "loss": 0.6164, + "step": 12797 + }, + { + "epoch": 0.44, + "learning_rate": 1.1774119428041562e-05, + "loss": 0.6667, + "step": 12798 + }, + { + "epoch": 0.44, + "learning_rate": 1.1773047825761515e-05, + "loss": 0.6498, + "step": 12799 + }, + { + "epoch": 0.44, + "learning_rate": 1.1771976202459742e-05, + "loss": 0.6027, + "step": 12800 + }, + { + "epoch": 0.44, + "learning_rate": 1.1770904558148952e-05, + "loss": 0.5909, + "step": 12801 + }, + { + "epoch": 0.44, + "learning_rate": 1.1769832892841846e-05, + "loss": 0.6085, + "step": 12802 + }, + { + "epoch": 0.44, + "learning_rate": 1.1768761206551136e-05, + "loss": 0.6451, + "step": 12803 + }, + { + "epoch": 0.44, + "learning_rate": 1.1767689499289521e-05, + "loss": 0.6753, + "step": 12804 + }, + { + "epoch": 0.44, + "learning_rate": 1.1766617771069711e-05, + "loss": 0.6221, + "step": 12805 + }, + { + "epoch": 0.44, + "learning_rate": 1.1765546021904413e-05, + "loss": 0.6081, + "step": 12806 + }, + { + "epoch": 0.44, + "learning_rate": 1.1764474251806335e-05, + "loss": 0.6608, + "step": 12807 + }, + { + "epoch": 0.44, + "learning_rate": 1.1763402460788178e-05, + "loss": 0.6415, + "step": 12808 + }, + { + "epoch": 0.44, + "learning_rate": 1.1762330648862658e-05, + "loss": 0.5866, + "step": 12809 + }, + { + "epoch": 0.44, + "learning_rate": 1.176125881604248e-05, + "loss": 0.6573, + "step": 12810 + }, + { + "epoch": 0.44, + "learning_rate": 1.1760186962340345e-05, + "loss": 0.6003, + "step": 12811 + }, + { + "epoch": 0.44, + "learning_rate": 1.1759115087768973e-05, + "loss": 0.628, + "step": 12812 + }, + { + "epoch": 0.44, + "learning_rate": 1.1758043192341066e-05, + "loss": 0.6342, + "step": 12813 + }, + { + "epoch": 0.44, + "learning_rate": 1.1756971276069329e-05, + "loss": 0.6288, + "step": 12814 + }, + { + "epoch": 0.44, + "learning_rate": 1.1755899338966476e-05, + "loss": 0.6403, + "step": 12815 + }, + { + "epoch": 0.44, + "learning_rate": 1.175482738104522e-05, + "loss": 0.5832, + "step": 12816 + }, + { + "epoch": 0.44, + "learning_rate": 1.1753755402318259e-05, + "loss": 0.622, + "step": 12817 + }, + { + "epoch": 0.44, + "learning_rate": 1.1752683402798312e-05, + "loss": 0.6286, + "step": 12818 + }, + { + "epoch": 0.44, + "learning_rate": 1.1751611382498088e-05, + "loss": 0.631, + "step": 12819 + }, + { + "epoch": 0.44, + "learning_rate": 1.175053934143029e-05, + "loss": 0.6502, + "step": 12820 + }, + { + "epoch": 0.44, + "learning_rate": 1.1749467279607639e-05, + "loss": 0.6853, + "step": 12821 + }, + { + "epoch": 0.44, + "learning_rate": 1.1748395197042839e-05, + "loss": 0.5904, + "step": 12822 + }, + { + "epoch": 0.44, + "learning_rate": 1.1747323093748597e-05, + "loss": 0.6268, + "step": 12823 + }, + { + "epoch": 0.44, + "learning_rate": 1.1746250969737636e-05, + "loss": 0.6401, + "step": 12824 + }, + { + "epoch": 0.44, + "learning_rate": 1.1745178825022661e-05, + "loss": 0.6781, + "step": 12825 + }, + { + "epoch": 0.44, + "learning_rate": 1.1744106659616377e-05, + "loss": 0.6067, + "step": 12826 + }, + { + "epoch": 0.44, + "learning_rate": 1.1743034473531506e-05, + "loss": 0.596, + "step": 12827 + }, + { + "epoch": 0.44, + "learning_rate": 1.174196226678076e-05, + "loss": 0.6341, + "step": 12828 + }, + { + "epoch": 0.44, + "learning_rate": 1.174089003937684e-05, + "loss": 0.6678, + "step": 12829 + }, + { + "epoch": 0.44, + "learning_rate": 1.1739817791332473e-05, + "loss": 0.6333, + "step": 12830 + }, + { + "epoch": 0.44, + "learning_rate": 1.1738745522660364e-05, + "loss": 0.6204, + "step": 12831 + }, + { + "epoch": 0.44, + "learning_rate": 1.1737673233373224e-05, + "loss": 0.653, + "step": 12832 + }, + { + "epoch": 0.44, + "learning_rate": 1.1736600923483771e-05, + "loss": 0.6683, + "step": 12833 + }, + { + "epoch": 0.44, + "learning_rate": 1.1735528593004722e-05, + "loss": 0.6676, + "step": 12834 + }, + { + "epoch": 0.44, + "learning_rate": 1.173445624194878e-05, + "loss": 0.6093, + "step": 12835 + }, + { + "epoch": 0.44, + "learning_rate": 1.1733383870328668e-05, + "loss": 0.6074, + "step": 12836 + }, + { + "epoch": 0.44, + "learning_rate": 1.1732311478157096e-05, + "loss": 0.5753, + "step": 12837 + }, + { + "epoch": 0.44, + "learning_rate": 1.173123906544678e-05, + "loss": 0.6033, + "step": 12838 + }, + { + "epoch": 0.44, + "learning_rate": 1.1730166632210435e-05, + "loss": 0.6675, + "step": 12839 + }, + { + "epoch": 0.44, + "learning_rate": 1.1729094178460778e-05, + "loss": 0.6254, + "step": 12840 + }, + { + "epoch": 0.44, + "learning_rate": 1.172802170421052e-05, + "loss": 0.5923, + "step": 12841 + }, + { + "epoch": 0.44, + "learning_rate": 1.1726949209472378e-05, + "loss": 0.6103, + "step": 12842 + }, + { + "epoch": 0.44, + "learning_rate": 1.1725876694259073e-05, + "loss": 0.6022, + "step": 12843 + }, + { + "epoch": 0.45, + "learning_rate": 1.1724804158583312e-05, + "loss": 0.6015, + "step": 12844 + }, + { + "epoch": 0.45, + "learning_rate": 1.1723731602457817e-05, + "loss": 0.5921, + "step": 12845 + }, + { + "epoch": 0.45, + "learning_rate": 1.1722659025895305e-05, + "loss": 0.6109, + "step": 12846 + }, + { + "epoch": 0.45, + "learning_rate": 1.1721586428908489e-05, + "loss": 0.6589, + "step": 12847 + }, + { + "epoch": 0.45, + "learning_rate": 1.1720513811510088e-05, + "loss": 0.6083, + "step": 12848 + }, + { + "epoch": 0.45, + "learning_rate": 1.171944117371282e-05, + "loss": 0.6356, + "step": 12849 + }, + { + "epoch": 0.45, + "learning_rate": 1.1718368515529402e-05, + "loss": 0.6761, + "step": 12850 + }, + { + "epoch": 0.45, + "learning_rate": 1.171729583697255e-05, + "loss": 0.5828, + "step": 12851 + }, + { + "epoch": 0.45, + "learning_rate": 1.1716223138054987e-05, + "loss": 0.6625, + "step": 12852 + }, + { + "epoch": 0.45, + "learning_rate": 1.1715150418789424e-05, + "loss": 0.5551, + "step": 12853 + }, + { + "epoch": 0.45, + "learning_rate": 1.1714077679188585e-05, + "loss": 0.6082, + "step": 12854 + }, + { + "epoch": 0.45, + "learning_rate": 1.1713004919265187e-05, + "loss": 0.6137, + "step": 12855 + }, + { + "epoch": 0.45, + "learning_rate": 1.1711932139031947e-05, + "loss": 0.6121, + "step": 12856 + }, + { + "epoch": 0.45, + "learning_rate": 1.1710859338501585e-05, + "loss": 0.6852, + "step": 12857 + }, + { + "epoch": 0.45, + "learning_rate": 1.1709786517686825e-05, + "loss": 0.6034, + "step": 12858 + }, + { + "epoch": 0.45, + "learning_rate": 1.170871367660038e-05, + "loss": 0.5904, + "step": 12859 + }, + { + "epoch": 0.45, + "learning_rate": 1.1707640815254975e-05, + "loss": 0.5917, + "step": 12860 + }, + { + "epoch": 0.45, + "learning_rate": 1.1706567933663329e-05, + "loss": 0.6627, + "step": 12861 + }, + { + "epoch": 0.45, + "learning_rate": 1.1705495031838159e-05, + "loss": 0.6481, + "step": 12862 + }, + { + "epoch": 0.45, + "learning_rate": 1.1704422109792186e-05, + "loss": 0.6013, + "step": 12863 + }, + { + "epoch": 0.45, + "learning_rate": 1.1703349167538136e-05, + "loss": 0.6952, + "step": 12864 + }, + { + "epoch": 0.45, + "learning_rate": 1.1702276205088726e-05, + "loss": 0.588, + "step": 12865 + }, + { + "epoch": 0.45, + "learning_rate": 1.1701203222456679e-05, + "loss": 0.6356, + "step": 12866 + }, + { + "epoch": 0.45, + "learning_rate": 1.1700130219654715e-05, + "loss": 0.6685, + "step": 12867 + }, + { + "epoch": 0.45, + "learning_rate": 1.1699057196695555e-05, + "loss": 0.6197, + "step": 12868 + }, + { + "epoch": 0.45, + "learning_rate": 1.1697984153591925e-05, + "loss": 0.6586, + "step": 12869 + }, + { + "epoch": 0.45, + "learning_rate": 1.1696911090356545e-05, + "loss": 0.5921, + "step": 12870 + }, + { + "epoch": 0.45, + "learning_rate": 1.1695838007002133e-05, + "loss": 0.666, + "step": 12871 + }, + { + "epoch": 0.45, + "learning_rate": 1.1694764903541422e-05, + "loss": 0.6341, + "step": 12872 + }, + { + "epoch": 0.45, + "learning_rate": 1.1693691779987127e-05, + "loss": 0.6945, + "step": 12873 + }, + { + "epoch": 0.45, + "learning_rate": 1.1692618636351972e-05, + "loss": 0.6396, + "step": 12874 + }, + { + "epoch": 0.45, + "learning_rate": 1.1691545472648684e-05, + "loss": 0.5988, + "step": 12875 + }, + { + "epoch": 0.45, + "learning_rate": 1.1690472288889983e-05, + "loss": 0.6288, + "step": 12876 + }, + { + "epoch": 0.45, + "learning_rate": 1.1689399085088596e-05, + "loss": 0.639, + "step": 12877 + }, + { + "epoch": 0.45, + "learning_rate": 1.1688325861257246e-05, + "loss": 0.6437, + "step": 12878 + }, + { + "epoch": 0.45, + "learning_rate": 1.1687252617408654e-05, + "loss": 0.6187, + "step": 12879 + }, + { + "epoch": 0.45, + "learning_rate": 1.168617935355555e-05, + "loss": 0.6187, + "step": 12880 + }, + { + "epoch": 0.45, + "learning_rate": 1.1685106069710656e-05, + "loss": 0.6498, + "step": 12881 + }, + { + "epoch": 0.45, + "learning_rate": 1.1684032765886699e-05, + "loss": 0.6549, + "step": 12882 + }, + { + "epoch": 0.45, + "learning_rate": 1.1682959442096401e-05, + "loss": 0.5568, + "step": 12883 + }, + { + "epoch": 0.45, + "learning_rate": 1.1681886098352495e-05, + "loss": 0.6136, + "step": 12884 + }, + { + "epoch": 0.45, + "learning_rate": 1.1680812734667697e-05, + "loss": 0.5994, + "step": 12885 + }, + { + "epoch": 0.45, + "learning_rate": 1.1679739351054739e-05, + "loss": 0.6493, + "step": 12886 + }, + { + "epoch": 0.45, + "learning_rate": 1.1678665947526347e-05, + "loss": 0.6695, + "step": 12887 + }, + { + "epoch": 0.45, + "learning_rate": 1.1677592524095244e-05, + "loss": 0.662, + "step": 12888 + }, + { + "epoch": 0.45, + "learning_rate": 1.1676519080774162e-05, + "loss": 0.6363, + "step": 12889 + }, + { + "epoch": 0.45, + "learning_rate": 1.1675445617575826e-05, + "loss": 0.6173, + "step": 12890 + }, + { + "epoch": 0.45, + "learning_rate": 1.1674372134512962e-05, + "loss": 0.6291, + "step": 12891 + }, + { + "epoch": 0.45, + "learning_rate": 1.1673298631598296e-05, + "loss": 0.6235, + "step": 12892 + }, + { + "epoch": 0.45, + "learning_rate": 1.1672225108844562e-05, + "loss": 0.6264, + "step": 12893 + }, + { + "epoch": 0.45, + "learning_rate": 1.167115156626448e-05, + "loss": 0.622, + "step": 12894 + }, + { + "epoch": 0.45, + "learning_rate": 1.1670078003870783e-05, + "loss": 0.6081, + "step": 12895 + }, + { + "epoch": 0.45, + "learning_rate": 1.1669004421676202e-05, + "loss": 0.6006, + "step": 12896 + }, + { + "epoch": 0.45, + "learning_rate": 1.1667930819693459e-05, + "loss": 0.6155, + "step": 12897 + }, + { + "epoch": 0.45, + "learning_rate": 1.1666857197935287e-05, + "loss": 0.6629, + "step": 12898 + }, + { + "epoch": 0.45, + "learning_rate": 1.1665783556414416e-05, + "loss": 0.5829, + "step": 12899 + }, + { + "epoch": 0.45, + "learning_rate": 1.1664709895143573e-05, + "loss": 0.729, + "step": 12900 + }, + { + "epoch": 0.45, + "learning_rate": 1.1663636214135485e-05, + "loss": 0.6168, + "step": 12901 + }, + { + "epoch": 0.45, + "learning_rate": 1.1662562513402888e-05, + "loss": 0.6493, + "step": 12902 + }, + { + "epoch": 0.45, + "learning_rate": 1.166148879295851e-05, + "loss": 0.6308, + "step": 12903 + }, + { + "epoch": 0.45, + "learning_rate": 1.1660415052815078e-05, + "loss": 0.6472, + "step": 12904 + }, + { + "epoch": 0.45, + "learning_rate": 1.1659341292985326e-05, + "loss": 0.6644, + "step": 12905 + }, + { + "epoch": 0.45, + "learning_rate": 1.1658267513481987e-05, + "loss": 0.6264, + "step": 12906 + }, + { + "epoch": 0.45, + "learning_rate": 1.1657193714317782e-05, + "loss": 0.6778, + "step": 12907 + }, + { + "epoch": 0.45, + "learning_rate": 1.1656119895505455e-05, + "loss": 0.6332, + "step": 12908 + }, + { + "epoch": 0.45, + "learning_rate": 1.1655046057057734e-05, + "loss": 0.613, + "step": 12909 + }, + { + "epoch": 0.45, + "learning_rate": 1.165397219898734e-05, + "loss": 0.599, + "step": 12910 + }, + { + "epoch": 0.45, + "learning_rate": 1.165289832130702e-05, + "loss": 0.6266, + "step": 12911 + }, + { + "epoch": 0.45, + "learning_rate": 1.16518244240295e-05, + "loss": 0.6392, + "step": 12912 + }, + { + "epoch": 0.45, + "learning_rate": 1.1650750507167505e-05, + "loss": 0.6259, + "step": 12913 + }, + { + "epoch": 0.45, + "learning_rate": 1.1649676570733779e-05, + "loss": 0.5986, + "step": 12914 + }, + { + "epoch": 0.45, + "learning_rate": 1.164860261474105e-05, + "loss": 0.6175, + "step": 12915 + }, + { + "epoch": 0.45, + "learning_rate": 1.164752863920205e-05, + "loss": 0.6397, + "step": 12916 + }, + { + "epoch": 0.45, + "learning_rate": 1.1646454644129519e-05, + "loss": 0.6328, + "step": 12917 + }, + { + "epoch": 0.45, + "learning_rate": 1.1645380629536183e-05, + "loss": 0.6566, + "step": 12918 + }, + { + "epoch": 0.45, + "learning_rate": 1.1644306595434773e-05, + "loss": 0.6488, + "step": 12919 + }, + { + "epoch": 0.45, + "learning_rate": 1.1643232541838035e-05, + "loss": 0.6387, + "step": 12920 + }, + { + "epoch": 0.45, + "learning_rate": 1.1642158468758696e-05, + "loss": 0.6428, + "step": 12921 + }, + { + "epoch": 0.45, + "learning_rate": 1.1641084376209484e-05, + "loss": 0.6656, + "step": 12922 + }, + { + "epoch": 0.45, + "learning_rate": 1.1640010264203147e-05, + "loss": 0.604, + "step": 12923 + }, + { + "epoch": 0.45, + "learning_rate": 1.1638936132752414e-05, + "loss": 0.6107, + "step": 12924 + }, + { + "epoch": 0.45, + "learning_rate": 1.1637861981870016e-05, + "loss": 0.6045, + "step": 12925 + }, + { + "epoch": 0.45, + "learning_rate": 1.1636787811568695e-05, + "loss": 0.6154, + "step": 12926 + }, + { + "epoch": 0.45, + "learning_rate": 1.1635713621861185e-05, + "loss": 0.688, + "step": 12927 + }, + { + "epoch": 0.45, + "learning_rate": 1.1634639412760216e-05, + "loss": 0.6213, + "step": 12928 + }, + { + "epoch": 0.45, + "learning_rate": 1.1633565184278534e-05, + "loss": 0.5819, + "step": 12929 + }, + { + "epoch": 0.45, + "learning_rate": 1.1632490936428869e-05, + "loss": 0.6162, + "step": 12930 + }, + { + "epoch": 0.45, + "learning_rate": 1.1631416669223958e-05, + "loss": 0.6074, + "step": 12931 + }, + { + "epoch": 0.45, + "learning_rate": 1.1630342382676539e-05, + "loss": 0.5821, + "step": 12932 + }, + { + "epoch": 0.45, + "learning_rate": 1.1629268076799349e-05, + "loss": 0.6511, + "step": 12933 + }, + { + "epoch": 0.45, + "learning_rate": 1.1628193751605124e-05, + "loss": 0.6594, + "step": 12934 + }, + { + "epoch": 0.45, + "learning_rate": 1.1627119407106602e-05, + "loss": 0.6412, + "step": 12935 + }, + { + "epoch": 0.45, + "learning_rate": 1.1626045043316523e-05, + "loss": 0.6453, + "step": 12936 + }, + { + "epoch": 0.45, + "learning_rate": 1.1624970660247621e-05, + "loss": 0.6491, + "step": 12937 + }, + { + "epoch": 0.45, + "learning_rate": 1.1623896257912637e-05, + "loss": 0.6291, + "step": 12938 + }, + { + "epoch": 0.45, + "learning_rate": 1.162282183632431e-05, + "loss": 0.5734, + "step": 12939 + }, + { + "epoch": 0.45, + "learning_rate": 1.1621747395495375e-05, + "loss": 0.6188, + "step": 12940 + }, + { + "epoch": 0.45, + "learning_rate": 1.1620672935438574e-05, + "loss": 0.6703, + "step": 12941 + }, + { + "epoch": 0.45, + "learning_rate": 1.1619598456166647e-05, + "loss": 0.6109, + "step": 12942 + }, + { + "epoch": 0.45, + "learning_rate": 1.1618523957692329e-05, + "loss": 0.5653, + "step": 12943 + }, + { + "epoch": 0.45, + "learning_rate": 1.1617449440028363e-05, + "loss": 0.6472, + "step": 12944 + }, + { + "epoch": 0.45, + "learning_rate": 1.1616374903187488e-05, + "loss": 0.642, + "step": 12945 + }, + { + "epoch": 0.45, + "learning_rate": 1.1615300347182443e-05, + "loss": 0.6332, + "step": 12946 + }, + { + "epoch": 0.45, + "learning_rate": 1.1614225772025969e-05, + "loss": 0.6386, + "step": 12947 + }, + { + "epoch": 0.45, + "learning_rate": 1.1613151177730808e-05, + "loss": 0.6173, + "step": 12948 + }, + { + "epoch": 0.45, + "learning_rate": 1.1612076564309698e-05, + "loss": 0.6881, + "step": 12949 + }, + { + "epoch": 0.45, + "learning_rate": 1.161100193177538e-05, + "loss": 0.6512, + "step": 12950 + }, + { + "epoch": 0.45, + "learning_rate": 1.16099272801406e-05, + "loss": 0.6447, + "step": 12951 + }, + { + "epoch": 0.45, + "learning_rate": 1.1608852609418092e-05, + "loss": 0.6362, + "step": 12952 + }, + { + "epoch": 0.45, + "learning_rate": 1.1607777919620603e-05, + "loss": 0.6278, + "step": 12953 + }, + { + "epoch": 0.45, + "learning_rate": 1.1606703210760873e-05, + "loss": 0.6183, + "step": 12954 + }, + { + "epoch": 0.45, + "learning_rate": 1.1605628482851641e-05, + "loss": 0.5996, + "step": 12955 + }, + { + "epoch": 0.45, + "learning_rate": 1.1604553735905652e-05, + "loss": 0.6555, + "step": 12956 + }, + { + "epoch": 0.45, + "learning_rate": 1.1603478969935654e-05, + "loss": 0.6738, + "step": 12957 + }, + { + "epoch": 0.45, + "learning_rate": 1.1602404184954379e-05, + "loss": 0.6897, + "step": 12958 + }, + { + "epoch": 0.45, + "learning_rate": 1.1601329380974577e-05, + "loss": 0.6417, + "step": 12959 + }, + { + "epoch": 0.45, + "learning_rate": 1.1600254558008992e-05, + "loss": 0.6541, + "step": 12960 + }, + { + "epoch": 0.45, + "learning_rate": 1.1599179716070364e-05, + "loss": 0.5951, + "step": 12961 + }, + { + "epoch": 0.45, + "learning_rate": 1.1598104855171437e-05, + "loss": 0.6871, + "step": 12962 + }, + { + "epoch": 0.45, + "learning_rate": 1.1597029975324954e-05, + "loss": 0.6106, + "step": 12963 + }, + { + "epoch": 0.45, + "learning_rate": 1.159595507654366e-05, + "loss": 0.6503, + "step": 12964 + }, + { + "epoch": 0.45, + "learning_rate": 1.1594880158840302e-05, + "loss": 0.5702, + "step": 12965 + }, + { + "epoch": 0.45, + "learning_rate": 1.1593805222227621e-05, + "loss": 0.6176, + "step": 12966 + }, + { + "epoch": 0.45, + "learning_rate": 1.1592730266718361e-05, + "loss": 0.6347, + "step": 12967 + }, + { + "epoch": 0.45, + "learning_rate": 1.1591655292325273e-05, + "loss": 0.647, + "step": 12968 + }, + { + "epoch": 0.45, + "learning_rate": 1.1590580299061093e-05, + "loss": 0.6381, + "step": 12969 + }, + { + "epoch": 0.45, + "learning_rate": 1.1589505286938576e-05, + "loss": 0.6294, + "step": 12970 + }, + { + "epoch": 0.45, + "learning_rate": 1.1588430255970463e-05, + "loss": 0.5892, + "step": 12971 + }, + { + "epoch": 0.45, + "learning_rate": 1.1587355206169497e-05, + "loss": 0.6004, + "step": 12972 + }, + { + "epoch": 0.45, + "learning_rate": 1.1586280137548426e-05, + "loss": 0.6176, + "step": 12973 + }, + { + "epoch": 0.45, + "learning_rate": 1.158520505012e-05, + "loss": 0.6785, + "step": 12974 + }, + { + "epoch": 0.45, + "learning_rate": 1.1584129943896964e-05, + "loss": 0.675, + "step": 12975 + }, + { + "epoch": 0.45, + "learning_rate": 1.1583054818892062e-05, + "loss": 0.6408, + "step": 12976 + }, + { + "epoch": 0.45, + "learning_rate": 1.1581979675118042e-05, + "loss": 0.6678, + "step": 12977 + }, + { + "epoch": 0.45, + "learning_rate": 1.1580904512587652e-05, + "loss": 0.6258, + "step": 12978 + }, + { + "epoch": 0.45, + "learning_rate": 1.1579829331313639e-05, + "loss": 0.6432, + "step": 12979 + }, + { + "epoch": 0.45, + "learning_rate": 1.1578754131308754e-05, + "loss": 0.5698, + "step": 12980 + }, + { + "epoch": 0.45, + "learning_rate": 1.1577678912585738e-05, + "loss": 0.6507, + "step": 12981 + }, + { + "epoch": 0.45, + "learning_rate": 1.1576603675157343e-05, + "loss": 0.6556, + "step": 12982 + }, + { + "epoch": 0.45, + "learning_rate": 1.1575528419036318e-05, + "loss": 0.6211, + "step": 12983 + }, + { + "epoch": 0.45, + "learning_rate": 1.1574453144235408e-05, + "loss": 0.6693, + "step": 12984 + }, + { + "epoch": 0.45, + "learning_rate": 1.1573377850767367e-05, + "loss": 0.6788, + "step": 12985 + }, + { + "epoch": 0.45, + "learning_rate": 1.1572302538644941e-05, + "loss": 0.5973, + "step": 12986 + }, + { + "epoch": 0.45, + "learning_rate": 1.157122720788088e-05, + "loss": 0.6511, + "step": 12987 + }, + { + "epoch": 0.45, + "learning_rate": 1.157015185848793e-05, + "loss": 0.6675, + "step": 12988 + }, + { + "epoch": 0.45, + "learning_rate": 1.1569076490478848e-05, + "loss": 0.6209, + "step": 12989 + }, + { + "epoch": 0.45, + "learning_rate": 1.1568001103866376e-05, + "loss": 0.6125, + "step": 12990 + }, + { + "epoch": 0.45, + "learning_rate": 1.1566925698663267e-05, + "loss": 0.6608, + "step": 12991 + }, + { + "epoch": 0.45, + "learning_rate": 1.1565850274882275e-05, + "loss": 0.7055, + "step": 12992 + }, + { + "epoch": 0.45, + "learning_rate": 1.1564774832536143e-05, + "loss": 0.6081, + "step": 12993 + }, + { + "epoch": 0.45, + "learning_rate": 1.1563699371637628e-05, + "loss": 0.7101, + "step": 12994 + }, + { + "epoch": 0.45, + "learning_rate": 1.1562623892199481e-05, + "loss": 0.6328, + "step": 12995 + }, + { + "epoch": 0.45, + "learning_rate": 1.1561548394234447e-05, + "loss": 0.6602, + "step": 12996 + }, + { + "epoch": 0.45, + "learning_rate": 1.1560472877755282e-05, + "loss": 0.6755, + "step": 12997 + }, + { + "epoch": 0.45, + "learning_rate": 1.155939734277474e-05, + "loss": 0.6179, + "step": 12998 + }, + { + "epoch": 0.45, + "learning_rate": 1.1558321789305568e-05, + "loss": 0.6628, + "step": 12999 + }, + { + "epoch": 0.45, + "learning_rate": 1.1557246217360519e-05, + "loss": 0.6616, + "step": 13000 + }, + { + "epoch": 0.45, + "learning_rate": 1.1556170626952348e-05, + "loss": 0.6493, + "step": 13001 + }, + { + "epoch": 0.45, + "learning_rate": 1.1555095018093805e-05, + "loss": 0.6138, + "step": 13002 + }, + { + "epoch": 0.45, + "learning_rate": 1.155401939079764e-05, + "loss": 0.6162, + "step": 13003 + }, + { + "epoch": 0.45, + "learning_rate": 1.1552943745076616e-05, + "loss": 0.6046, + "step": 13004 + }, + { + "epoch": 0.45, + "learning_rate": 1.1551868080943476e-05, + "loss": 0.5994, + "step": 13005 + }, + { + "epoch": 0.45, + "learning_rate": 1.1550792398410975e-05, + "loss": 0.6387, + "step": 13006 + }, + { + "epoch": 0.45, + "learning_rate": 1.154971669749187e-05, + "loss": 0.6179, + "step": 13007 + }, + { + "epoch": 0.45, + "learning_rate": 1.1548640978198912e-05, + "loss": 0.6032, + "step": 13008 + }, + { + "epoch": 0.45, + "learning_rate": 1.1547565240544858e-05, + "loss": 0.6375, + "step": 13009 + }, + { + "epoch": 0.45, + "learning_rate": 1.1546489484542462e-05, + "loss": 0.5921, + "step": 13010 + }, + { + "epoch": 0.45, + "learning_rate": 1.1545413710204473e-05, + "loss": 0.6358, + "step": 13011 + }, + { + "epoch": 0.45, + "learning_rate": 1.1544337917543651e-05, + "loss": 0.598, + "step": 13012 + }, + { + "epoch": 0.45, + "learning_rate": 1.154326210657275e-05, + "loss": 0.6083, + "step": 13013 + }, + { + "epoch": 0.45, + "learning_rate": 1.1542186277304524e-05, + "loss": 0.5891, + "step": 13014 + }, + { + "epoch": 0.45, + "learning_rate": 1.1541110429751728e-05, + "loss": 0.6261, + "step": 13015 + }, + { + "epoch": 0.45, + "learning_rate": 1.154003456392712e-05, + "loss": 0.6869, + "step": 13016 + }, + { + "epoch": 0.45, + "learning_rate": 1.1538958679843452e-05, + "loss": 0.6418, + "step": 13017 + }, + { + "epoch": 0.45, + "learning_rate": 1.1537882777513483e-05, + "loss": 0.6378, + "step": 13018 + }, + { + "epoch": 0.45, + "learning_rate": 1.153680685694997e-05, + "loss": 0.7034, + "step": 13019 + }, + { + "epoch": 0.45, + "learning_rate": 1.1535730918165667e-05, + "loss": 0.6104, + "step": 13020 + }, + { + "epoch": 0.45, + "learning_rate": 1.1534654961173328e-05, + "loss": 0.6699, + "step": 13021 + }, + { + "epoch": 0.45, + "learning_rate": 1.1533578985985716e-05, + "loss": 0.6209, + "step": 13022 + }, + { + "epoch": 0.45, + "learning_rate": 1.1532502992615584e-05, + "loss": 0.5928, + "step": 13023 + }, + { + "epoch": 0.45, + "learning_rate": 1.1531426981075693e-05, + "loss": 0.5855, + "step": 13024 + }, + { + "epoch": 0.45, + "learning_rate": 1.1530350951378794e-05, + "loss": 0.6426, + "step": 13025 + }, + { + "epoch": 0.45, + "learning_rate": 1.152927490353765e-05, + "loss": 0.6921, + "step": 13026 + }, + { + "epoch": 0.45, + "learning_rate": 1.1528198837565018e-05, + "loss": 0.6438, + "step": 13027 + }, + { + "epoch": 0.45, + "learning_rate": 1.1527122753473656e-05, + "loss": 0.6427, + "step": 13028 + }, + { + "epoch": 0.45, + "learning_rate": 1.1526046651276322e-05, + "loss": 0.6499, + "step": 13029 + }, + { + "epoch": 0.45, + "learning_rate": 1.1524970530985775e-05, + "loss": 0.6142, + "step": 13030 + }, + { + "epoch": 0.45, + "learning_rate": 1.1523894392614772e-05, + "loss": 0.6444, + "step": 13031 + }, + { + "epoch": 0.45, + "learning_rate": 1.1522818236176072e-05, + "loss": 0.6271, + "step": 13032 + }, + { + "epoch": 0.45, + "learning_rate": 1.1521742061682437e-05, + "loss": 0.6067, + "step": 13033 + }, + { + "epoch": 0.45, + "learning_rate": 1.1520665869146625e-05, + "loss": 0.6128, + "step": 13034 + }, + { + "epoch": 0.45, + "learning_rate": 1.1519589658581393e-05, + "loss": 0.6637, + "step": 13035 + }, + { + "epoch": 0.45, + "learning_rate": 1.151851342999951e-05, + "loss": 0.6564, + "step": 13036 + }, + { + "epoch": 0.45, + "learning_rate": 1.1517437183413723e-05, + "loss": 0.6257, + "step": 13037 + }, + { + "epoch": 0.45, + "learning_rate": 1.15163609188368e-05, + "loss": 0.6536, + "step": 13038 + }, + { + "epoch": 0.45, + "learning_rate": 1.1515284636281502e-05, + "loss": 0.6317, + "step": 13039 + }, + { + "epoch": 0.45, + "learning_rate": 1.1514208335760583e-05, + "loss": 0.6449, + "step": 13040 + }, + { + "epoch": 0.45, + "learning_rate": 1.1513132017286812e-05, + "loss": 0.6126, + "step": 13041 + }, + { + "epoch": 0.45, + "learning_rate": 1.1512055680872948e-05, + "loss": 0.6538, + "step": 13042 + }, + { + "epoch": 0.45, + "learning_rate": 1.151097932653175e-05, + "loss": 0.6403, + "step": 13043 + }, + { + "epoch": 0.45, + "learning_rate": 1.150990295427598e-05, + "loss": 0.6502, + "step": 13044 + }, + { + "epoch": 0.45, + "learning_rate": 1.1508826564118403e-05, + "loss": 0.5929, + "step": 13045 + }, + { + "epoch": 0.45, + "learning_rate": 1.1507750156071775e-05, + "loss": 0.6156, + "step": 13046 + }, + { + "epoch": 0.45, + "learning_rate": 1.1506673730148862e-05, + "loss": 0.6015, + "step": 13047 + }, + { + "epoch": 0.45, + "learning_rate": 1.150559728636243e-05, + "loss": 0.6062, + "step": 13048 + }, + { + "epoch": 0.45, + "learning_rate": 1.1504520824725235e-05, + "loss": 0.6341, + "step": 13049 + }, + { + "epoch": 0.45, + "learning_rate": 1.150344434525004e-05, + "loss": 0.625, + "step": 13050 + }, + { + "epoch": 0.45, + "learning_rate": 1.1502367847949613e-05, + "loss": 0.7137, + "step": 13051 + }, + { + "epoch": 0.45, + "learning_rate": 1.1501291332836714e-05, + "loss": 0.5527, + "step": 13052 + }, + { + "epoch": 0.45, + "learning_rate": 1.150021479992411e-05, + "loss": 0.6766, + "step": 13053 + }, + { + "epoch": 0.45, + "learning_rate": 1.1499138249224558e-05, + "loss": 0.5826, + "step": 13054 + }, + { + "epoch": 0.45, + "learning_rate": 1.1498061680750828e-05, + "loss": 0.637, + "step": 13055 + }, + { + "epoch": 0.45, + "learning_rate": 1.1496985094515678e-05, + "loss": 0.6409, + "step": 13056 + }, + { + "epoch": 0.45, + "learning_rate": 1.1495908490531877e-05, + "loss": 0.6557, + "step": 13057 + }, + { + "epoch": 0.45, + "learning_rate": 1.1494831868812192e-05, + "loss": 0.5936, + "step": 13058 + }, + { + "epoch": 0.45, + "learning_rate": 1.1493755229369384e-05, + "loss": 0.6825, + "step": 13059 + }, + { + "epoch": 0.45, + "learning_rate": 1.1492678572216213e-05, + "loss": 0.6786, + "step": 13060 + }, + { + "epoch": 0.45, + "learning_rate": 1.1491601897365454e-05, + "loss": 0.6247, + "step": 13061 + }, + { + "epoch": 0.45, + "learning_rate": 1.1490525204829866e-05, + "loss": 0.6072, + "step": 13062 + }, + { + "epoch": 0.45, + "learning_rate": 1.1489448494622215e-05, + "loss": 0.6115, + "step": 13063 + }, + { + "epoch": 0.45, + "learning_rate": 1.1488371766755272e-05, + "loss": 0.6102, + "step": 13064 + }, + { + "epoch": 0.45, + "learning_rate": 1.1487295021241796e-05, + "loss": 0.644, + "step": 13065 + }, + { + "epoch": 0.45, + "learning_rate": 1.1486218258094555e-05, + "loss": 0.5936, + "step": 13066 + }, + { + "epoch": 0.45, + "learning_rate": 1.1485141477326319e-05, + "loss": 0.6576, + "step": 13067 + }, + { + "epoch": 0.45, + "learning_rate": 1.1484064678949849e-05, + "loss": 0.6626, + "step": 13068 + }, + { + "epoch": 0.45, + "learning_rate": 1.1482987862977917e-05, + "loss": 0.6341, + "step": 13069 + }, + { + "epoch": 0.45, + "learning_rate": 1.1481911029423288e-05, + "loss": 0.6949, + "step": 13070 + }, + { + "epoch": 0.45, + "learning_rate": 1.1480834178298728e-05, + "loss": 0.5923, + "step": 13071 + }, + { + "epoch": 0.45, + "learning_rate": 1.1479757309617006e-05, + "loss": 0.6019, + "step": 13072 + }, + { + "epoch": 0.45, + "learning_rate": 1.1478680423390892e-05, + "loss": 0.6622, + "step": 13073 + }, + { + "epoch": 0.45, + "learning_rate": 1.1477603519633148e-05, + "loss": 0.6176, + "step": 13074 + }, + { + "epoch": 0.45, + "learning_rate": 1.1476526598356543e-05, + "loss": 0.6665, + "step": 13075 + }, + { + "epoch": 0.45, + "learning_rate": 1.1475449659573852e-05, + "loss": 0.618, + "step": 13076 + }, + { + "epoch": 0.45, + "learning_rate": 1.1474372703297836e-05, + "loss": 0.6221, + "step": 13077 + }, + { + "epoch": 0.45, + "learning_rate": 1.1473295729541265e-05, + "loss": 0.6467, + "step": 13078 + }, + { + "epoch": 0.45, + "learning_rate": 1.1472218738316913e-05, + "loss": 0.6755, + "step": 13079 + }, + { + "epoch": 0.45, + "learning_rate": 1.1471141729637545e-05, + "loss": 0.6494, + "step": 13080 + }, + { + "epoch": 0.45, + "learning_rate": 1.1470064703515929e-05, + "loss": 0.5903, + "step": 13081 + }, + { + "epoch": 0.45, + "learning_rate": 1.146898765996484e-05, + "loss": 0.5929, + "step": 13082 + }, + { + "epoch": 0.45, + "learning_rate": 1.1467910598997038e-05, + "loss": 0.6594, + "step": 13083 + }, + { + "epoch": 0.45, + "learning_rate": 1.1466833520625303e-05, + "loss": 0.6237, + "step": 13084 + }, + { + "epoch": 0.45, + "learning_rate": 1.1465756424862401e-05, + "loss": 0.5918, + "step": 13085 + }, + { + "epoch": 0.45, + "learning_rate": 1.1464679311721101e-05, + "loss": 0.6577, + "step": 13086 + }, + { + "epoch": 0.45, + "learning_rate": 1.1463602181214175e-05, + "loss": 0.596, + "step": 13087 + }, + { + "epoch": 0.45, + "learning_rate": 1.1462525033354395e-05, + "loss": 0.5822, + "step": 13088 + }, + { + "epoch": 0.45, + "learning_rate": 1.1461447868154529e-05, + "loss": 0.6419, + "step": 13089 + }, + { + "epoch": 0.45, + "learning_rate": 1.146037068562735e-05, + "loss": 0.6466, + "step": 13090 + }, + { + "epoch": 0.45, + "learning_rate": 1.1459293485785631e-05, + "loss": 0.5851, + "step": 13091 + }, + { + "epoch": 0.45, + "learning_rate": 1.1458216268642142e-05, + "loss": 0.6455, + "step": 13092 + }, + { + "epoch": 0.45, + "learning_rate": 1.145713903420965e-05, + "loss": 0.655, + "step": 13093 + }, + { + "epoch": 0.45, + "learning_rate": 1.1456061782500936e-05, + "loss": 0.6087, + "step": 13094 + }, + { + "epoch": 0.45, + "learning_rate": 1.1454984513528767e-05, + "loss": 0.6339, + "step": 13095 + }, + { + "epoch": 0.45, + "learning_rate": 1.1453907227305914e-05, + "loss": 0.6711, + "step": 13096 + }, + { + "epoch": 0.45, + "learning_rate": 1.1452829923845155e-05, + "loss": 0.6196, + "step": 13097 + }, + { + "epoch": 0.45, + "learning_rate": 1.1451752603159254e-05, + "loss": 0.6838, + "step": 13098 + }, + { + "epoch": 0.45, + "learning_rate": 1.1450675265260994e-05, + "loss": 0.6299, + "step": 13099 + }, + { + "epoch": 0.45, + "learning_rate": 1.1449597910163141e-05, + "loss": 0.6129, + "step": 13100 + }, + { + "epoch": 0.45, + "learning_rate": 1.1448520537878473e-05, + "loss": 0.6491, + "step": 13101 + }, + { + "epoch": 0.45, + "learning_rate": 1.1447443148419758e-05, + "loss": 0.6566, + "step": 13102 + }, + { + "epoch": 0.45, + "learning_rate": 1.1446365741799778e-05, + "loss": 0.6578, + "step": 13103 + }, + { + "epoch": 0.45, + "learning_rate": 1.1445288318031303e-05, + "loss": 0.5964, + "step": 13104 + }, + { + "epoch": 0.45, + "learning_rate": 1.1444210877127102e-05, + "loss": 0.6652, + "step": 13105 + }, + { + "epoch": 0.45, + "learning_rate": 1.1443133419099958e-05, + "loss": 0.6903, + "step": 13106 + }, + { + "epoch": 0.45, + "learning_rate": 1.144205594396264e-05, + "loss": 0.6278, + "step": 13107 + }, + { + "epoch": 0.45, + "learning_rate": 1.1440978451727925e-05, + "loss": 0.6549, + "step": 13108 + }, + { + "epoch": 0.45, + "learning_rate": 1.1439900942408588e-05, + "loss": 0.6469, + "step": 13109 + }, + { + "epoch": 0.45, + "learning_rate": 1.1438823416017402e-05, + "loss": 0.6562, + "step": 13110 + }, + { + "epoch": 0.45, + "learning_rate": 1.1437745872567145e-05, + "loss": 0.6548, + "step": 13111 + }, + { + "epoch": 0.45, + "learning_rate": 1.1436668312070593e-05, + "loss": 0.6375, + "step": 13112 + }, + { + "epoch": 0.45, + "learning_rate": 1.143559073454052e-05, + "loss": 0.6003, + "step": 13113 + }, + { + "epoch": 0.45, + "learning_rate": 1.1434513139989702e-05, + "loss": 0.6561, + "step": 13114 + }, + { + "epoch": 0.45, + "learning_rate": 1.143343552843092e-05, + "loss": 0.6298, + "step": 13115 + }, + { + "epoch": 0.45, + "learning_rate": 1.1432357899876942e-05, + "loss": 0.6948, + "step": 13116 + }, + { + "epoch": 0.45, + "learning_rate": 1.1431280254340554e-05, + "loss": 0.612, + "step": 13117 + }, + { + "epoch": 0.45, + "learning_rate": 1.1430202591834522e-05, + "loss": 0.6371, + "step": 13118 + }, + { + "epoch": 0.45, + "learning_rate": 1.1429124912371632e-05, + "loss": 0.6164, + "step": 13119 + }, + { + "epoch": 0.45, + "learning_rate": 1.142804721596466e-05, + "loss": 0.6021, + "step": 13120 + }, + { + "epoch": 0.45, + "learning_rate": 1.1426969502626379e-05, + "loss": 0.67, + "step": 13121 + }, + { + "epoch": 0.45, + "learning_rate": 1.142589177236957e-05, + "loss": 0.6808, + "step": 13122 + }, + { + "epoch": 0.45, + "learning_rate": 1.1424814025207012e-05, + "loss": 0.6564, + "step": 13123 + }, + { + "epoch": 0.45, + "learning_rate": 1.142373626115148e-05, + "loss": 0.6448, + "step": 13124 + }, + { + "epoch": 0.45, + "learning_rate": 1.1422658480215751e-05, + "loss": 0.5703, + "step": 13125 + }, + { + "epoch": 0.45, + "learning_rate": 1.1421580682412612e-05, + "loss": 0.6348, + "step": 13126 + }, + { + "epoch": 0.45, + "learning_rate": 1.142050286775483e-05, + "loss": 0.6857, + "step": 13127 + }, + { + "epoch": 0.45, + "learning_rate": 1.1419425036255192e-05, + "loss": 0.6425, + "step": 13128 + }, + { + "epoch": 0.45, + "learning_rate": 1.1418347187926476e-05, + "loss": 0.5895, + "step": 13129 + }, + { + "epoch": 0.45, + "learning_rate": 1.1417269322781458e-05, + "loss": 0.6195, + "step": 13130 + }, + { + "epoch": 0.45, + "learning_rate": 1.1416191440832918e-05, + "loss": 0.662, + "step": 13131 + }, + { + "epoch": 0.45, + "learning_rate": 1.1415113542093642e-05, + "loss": 0.623, + "step": 13132 + }, + { + "epoch": 0.46, + "learning_rate": 1.1414035626576399e-05, + "loss": 0.6554, + "step": 13133 + }, + { + "epoch": 0.46, + "learning_rate": 1.1412957694293975e-05, + "loss": 0.6277, + "step": 13134 + }, + { + "epoch": 0.46, + "learning_rate": 1.1411879745259156e-05, + "loss": 0.6253, + "step": 13135 + }, + { + "epoch": 0.46, + "learning_rate": 1.1410801779484713e-05, + "loss": 0.6904, + "step": 13136 + }, + { + "epoch": 0.46, + "learning_rate": 1.140972379698343e-05, + "loss": 0.6533, + "step": 13137 + }, + { + "epoch": 0.46, + "learning_rate": 1.1408645797768087e-05, + "loss": 0.5695, + "step": 13138 + }, + { + "epoch": 0.46, + "learning_rate": 1.1407567781851467e-05, + "loss": 0.5957, + "step": 13139 + }, + { + "epoch": 0.46, + "learning_rate": 1.1406489749246353e-05, + "loss": 0.6271, + "step": 13140 + }, + { + "epoch": 0.46, + "learning_rate": 1.1405411699965521e-05, + "loss": 0.6013, + "step": 13141 + }, + { + "epoch": 0.46, + "learning_rate": 1.1404333634021756e-05, + "loss": 0.5898, + "step": 13142 + }, + { + "epoch": 0.46, + "learning_rate": 1.1403255551427839e-05, + "loss": 0.6373, + "step": 13143 + }, + { + "epoch": 0.46, + "learning_rate": 1.1402177452196555e-05, + "loss": 0.6224, + "step": 13144 + }, + { + "epoch": 0.46, + "learning_rate": 1.140109933634068e-05, + "loss": 0.6604, + "step": 13145 + }, + { + "epoch": 0.46, + "learning_rate": 1.1400021203872999e-05, + "loss": 0.5739, + "step": 13146 + }, + { + "epoch": 0.46, + "learning_rate": 1.1398943054806299e-05, + "loss": 0.6708, + "step": 13147 + }, + { + "epoch": 0.46, + "learning_rate": 1.1397864889153361e-05, + "loss": 0.6634, + "step": 13148 + }, + { + "epoch": 0.46, + "learning_rate": 1.1396786706926961e-05, + "loss": 0.6084, + "step": 13149 + }, + { + "epoch": 0.46, + "learning_rate": 1.1395708508139892e-05, + "loss": 0.6234, + "step": 13150 + }, + { + "epoch": 0.46, + "learning_rate": 1.139463029280493e-05, + "loss": 0.6006, + "step": 13151 + }, + { + "epoch": 0.46, + "learning_rate": 1.1393552060934863e-05, + "loss": 0.6156, + "step": 13152 + }, + { + "epoch": 0.46, + "learning_rate": 1.1392473812542475e-05, + "loss": 0.5976, + "step": 13153 + }, + { + "epoch": 0.46, + "learning_rate": 1.1391395547640547e-05, + "loss": 0.6317, + "step": 13154 + }, + { + "epoch": 0.46, + "learning_rate": 1.139031726624186e-05, + "loss": 0.5952, + "step": 13155 + }, + { + "epoch": 0.46, + "learning_rate": 1.138923896835921e-05, + "loss": 0.6457, + "step": 13156 + }, + { + "epoch": 0.46, + "learning_rate": 1.1388160654005376e-05, + "loss": 0.5793, + "step": 13157 + }, + { + "epoch": 0.46, + "learning_rate": 1.1387082323193135e-05, + "loss": 0.6277, + "step": 13158 + }, + { + "epoch": 0.46, + "learning_rate": 1.1386003975935282e-05, + "loss": 0.6624, + "step": 13159 + }, + { + "epoch": 0.46, + "learning_rate": 1.1384925612244598e-05, + "loss": 0.65, + "step": 13160 + }, + { + "epoch": 0.46, + "learning_rate": 1.1383847232133866e-05, + "loss": 0.5923, + "step": 13161 + }, + { + "epoch": 0.46, + "learning_rate": 1.1382768835615878e-05, + "loss": 0.6291, + "step": 13162 + }, + { + "epoch": 0.46, + "learning_rate": 1.1381690422703418e-05, + "loss": 0.5727, + "step": 13163 + }, + { + "epoch": 0.46, + "learning_rate": 1.1380611993409266e-05, + "loss": 0.6193, + "step": 13164 + }, + { + "epoch": 0.46, + "learning_rate": 1.1379533547746214e-05, + "loss": 0.6492, + "step": 13165 + }, + { + "epoch": 0.46, + "learning_rate": 1.1378455085727047e-05, + "loss": 0.5734, + "step": 13166 + }, + { + "epoch": 0.46, + "learning_rate": 1.1377376607364548e-05, + "loss": 0.6696, + "step": 13167 + }, + { + "epoch": 0.46, + "learning_rate": 1.137629811267151e-05, + "loss": 0.5564, + "step": 13168 + }, + { + "epoch": 0.46, + "learning_rate": 1.1375219601660719e-05, + "loss": 0.5858, + "step": 13169 + }, + { + "epoch": 0.46, + "learning_rate": 1.1374141074344955e-05, + "loss": 0.5866, + "step": 13170 + }, + { + "epoch": 0.46, + "learning_rate": 1.1373062530737013e-05, + "loss": 0.6675, + "step": 13171 + }, + { + "epoch": 0.46, + "learning_rate": 1.137198397084968e-05, + "loss": 0.6616, + "step": 13172 + }, + { + "epoch": 0.46, + "learning_rate": 1.1370905394695736e-05, + "loss": 0.6376, + "step": 13173 + }, + { + "epoch": 0.46, + "learning_rate": 1.1369826802287978e-05, + "loss": 0.6633, + "step": 13174 + }, + { + "epoch": 0.46, + "learning_rate": 1.1368748193639192e-05, + "loss": 0.6265, + "step": 13175 + }, + { + "epoch": 0.46, + "learning_rate": 1.1367669568762158e-05, + "loss": 0.6522, + "step": 13176 + }, + { + "epoch": 0.46, + "learning_rate": 1.1366590927669679e-05, + "loss": 0.6426, + "step": 13177 + }, + { + "epoch": 0.46, + "learning_rate": 1.1365512270374532e-05, + "loss": 0.6338, + "step": 13178 + }, + { + "epoch": 0.46, + "learning_rate": 1.1364433596889511e-05, + "loss": 0.5951, + "step": 13179 + }, + { + "epoch": 0.46, + "learning_rate": 1.1363354907227402e-05, + "loss": 0.6111, + "step": 13180 + }, + { + "epoch": 0.46, + "learning_rate": 1.1362276201400996e-05, + "loss": 0.599, + "step": 13181 + }, + { + "epoch": 0.46, + "learning_rate": 1.1361197479423083e-05, + "loss": 0.6808, + "step": 13182 + }, + { + "epoch": 0.46, + "learning_rate": 1.1360118741306451e-05, + "loss": 0.6512, + "step": 13183 + }, + { + "epoch": 0.46, + "learning_rate": 1.1359039987063893e-05, + "loss": 0.6187, + "step": 13184 + }, + { + "epoch": 0.46, + "learning_rate": 1.1357961216708196e-05, + "loss": 0.6537, + "step": 13185 + }, + { + "epoch": 0.46, + "learning_rate": 1.135688243025215e-05, + "loss": 0.6476, + "step": 13186 + }, + { + "epoch": 0.46, + "learning_rate": 1.1355803627708548e-05, + "loss": 0.6289, + "step": 13187 + }, + { + "epoch": 0.46, + "learning_rate": 1.1354724809090176e-05, + "loss": 0.65, + "step": 13188 + }, + { + "epoch": 0.46, + "learning_rate": 1.1353645974409829e-05, + "loss": 0.6298, + "step": 13189 + }, + { + "epoch": 0.46, + "learning_rate": 1.1352567123680299e-05, + "loss": 0.6241, + "step": 13190 + }, + { + "epoch": 0.46, + "learning_rate": 1.1351488256914371e-05, + "loss": 0.6574, + "step": 13191 + }, + { + "epoch": 0.46, + "learning_rate": 1.135040937412484e-05, + "loss": 0.5514, + "step": 13192 + }, + { + "epoch": 0.46, + "learning_rate": 1.1349330475324502e-05, + "loss": 0.671, + "step": 13193 + }, + { + "epoch": 0.46, + "learning_rate": 1.134825156052614e-05, + "loss": 0.6575, + "step": 13194 + }, + { + "epoch": 0.46, + "learning_rate": 1.134717262974255e-05, + "loss": 0.6427, + "step": 13195 + }, + { + "epoch": 0.46, + "learning_rate": 1.1346093682986527e-05, + "loss": 0.6085, + "step": 13196 + }, + { + "epoch": 0.46, + "learning_rate": 1.1345014720270862e-05, + "loss": 0.6315, + "step": 13197 + }, + { + "epoch": 0.46, + "learning_rate": 1.1343935741608342e-05, + "loss": 0.6312, + "step": 13198 + }, + { + "epoch": 0.46, + "learning_rate": 1.1342856747011765e-05, + "loss": 0.5741, + "step": 13199 + }, + { + "epoch": 0.46, + "learning_rate": 1.1341777736493924e-05, + "loss": 0.6088, + "step": 13200 + }, + { + "epoch": 0.46, + "learning_rate": 1.1340698710067609e-05, + "loss": 0.6708, + "step": 13201 + }, + { + "epoch": 0.46, + "learning_rate": 1.1339619667745616e-05, + "loss": 0.6282, + "step": 13202 + }, + { + "epoch": 0.46, + "learning_rate": 1.1338540609540736e-05, + "loss": 0.6778, + "step": 13203 + }, + { + "epoch": 0.46, + "learning_rate": 1.1337461535465763e-05, + "loss": 0.6098, + "step": 13204 + }, + { + "epoch": 0.46, + "learning_rate": 1.1336382445533495e-05, + "loss": 0.6112, + "step": 13205 + }, + { + "epoch": 0.46, + "learning_rate": 1.133530333975672e-05, + "loss": 0.6805, + "step": 13206 + }, + { + "epoch": 0.46, + "learning_rate": 1.1334224218148233e-05, + "loss": 0.6583, + "step": 13207 + }, + { + "epoch": 0.46, + "learning_rate": 1.1333145080720835e-05, + "loss": 0.6162, + "step": 13208 + }, + { + "epoch": 0.46, + "learning_rate": 1.1332065927487312e-05, + "loss": 0.5984, + "step": 13209 + }, + { + "epoch": 0.46, + "learning_rate": 1.1330986758460464e-05, + "loss": 0.6759, + "step": 13210 + }, + { + "epoch": 0.46, + "learning_rate": 1.1329907573653083e-05, + "loss": 0.7285, + "step": 13211 + }, + { + "epoch": 0.46, + "learning_rate": 1.1328828373077964e-05, + "loss": 0.6233, + "step": 13212 + }, + { + "epoch": 0.46, + "learning_rate": 1.132774915674791e-05, + "loss": 0.6319, + "step": 13213 + }, + { + "epoch": 0.46, + "learning_rate": 1.1326669924675704e-05, + "loss": 0.6233, + "step": 13214 + }, + { + "epoch": 0.46, + "learning_rate": 1.132559067687415e-05, + "loss": 0.6435, + "step": 13215 + }, + { + "epoch": 0.46, + "learning_rate": 1.132451141335604e-05, + "loss": 0.6544, + "step": 13216 + }, + { + "epoch": 0.46, + "learning_rate": 1.1323432134134174e-05, + "loss": 0.5866, + "step": 13217 + }, + { + "epoch": 0.46, + "learning_rate": 1.1322352839221344e-05, + "loss": 0.6521, + "step": 13218 + }, + { + "epoch": 0.46, + "learning_rate": 1.132127352863035e-05, + "loss": 0.616, + "step": 13219 + }, + { + "epoch": 0.46, + "learning_rate": 1.1320194202373985e-05, + "loss": 0.6287, + "step": 13220 + }, + { + "epoch": 0.46, + "learning_rate": 1.1319114860465048e-05, + "loss": 0.6454, + "step": 13221 + }, + { + "epoch": 0.46, + "learning_rate": 1.1318035502916337e-05, + "loss": 0.6453, + "step": 13222 + }, + { + "epoch": 0.46, + "learning_rate": 1.1316956129740646e-05, + "loss": 0.6483, + "step": 13223 + }, + { + "epoch": 0.46, + "learning_rate": 1.1315876740950775e-05, + "loss": 0.6902, + "step": 13224 + }, + { + "epoch": 0.46, + "learning_rate": 1.1314797336559521e-05, + "loss": 0.6569, + "step": 13225 + }, + { + "epoch": 0.46, + "learning_rate": 1.1313717916579683e-05, + "loss": 0.6156, + "step": 13226 + }, + { + "epoch": 0.46, + "learning_rate": 1.1312638481024054e-05, + "loss": 0.6566, + "step": 13227 + }, + { + "epoch": 0.46, + "learning_rate": 1.1311559029905438e-05, + "loss": 0.6681, + "step": 13228 + }, + { + "epoch": 0.46, + "learning_rate": 1.1310479563236629e-05, + "loss": 0.6003, + "step": 13229 + }, + { + "epoch": 0.46, + "learning_rate": 1.1309400081030427e-05, + "loss": 0.6174, + "step": 13230 + }, + { + "epoch": 0.46, + "learning_rate": 1.1308320583299632e-05, + "loss": 0.6384, + "step": 13231 + }, + { + "epoch": 0.46, + "learning_rate": 1.130724107005704e-05, + "loss": 0.6581, + "step": 13232 + }, + { + "epoch": 0.46, + "learning_rate": 1.130616154131545e-05, + "loss": 0.6031, + "step": 13233 + }, + { + "epoch": 0.46, + "learning_rate": 1.1305081997087666e-05, + "loss": 0.6315, + "step": 13234 + }, + { + "epoch": 0.46, + "learning_rate": 1.1304002437386483e-05, + "loss": 0.6541, + "step": 13235 + }, + { + "epoch": 0.46, + "learning_rate": 1.1302922862224698e-05, + "loss": 0.6425, + "step": 13236 + }, + { + "epoch": 0.46, + "learning_rate": 1.1301843271615121e-05, + "loss": 0.6593, + "step": 13237 + }, + { + "epoch": 0.46, + "learning_rate": 1.130076366557054e-05, + "loss": 0.6484, + "step": 13238 + }, + { + "epoch": 0.46, + "learning_rate": 1.129968404410376e-05, + "loss": 0.6111, + "step": 13239 + }, + { + "epoch": 0.46, + "learning_rate": 1.1298604407227588e-05, + "loss": 0.5867, + "step": 13240 + }, + { + "epoch": 0.46, + "learning_rate": 1.1297524754954812e-05, + "loss": 0.6487, + "step": 13241 + }, + { + "epoch": 0.46, + "learning_rate": 1.1296445087298238e-05, + "loss": 0.636, + "step": 13242 + }, + { + "epoch": 0.46, + "learning_rate": 1.129536540427067e-05, + "loss": 0.6219, + "step": 13243 + }, + { + "epoch": 0.46, + "learning_rate": 1.1294285705884907e-05, + "loss": 0.5666, + "step": 13244 + }, + { + "epoch": 0.46, + "learning_rate": 1.1293205992153746e-05, + "loss": 0.6162, + "step": 13245 + }, + { + "epoch": 0.46, + "learning_rate": 1.1292126263089995e-05, + "loss": 0.6349, + "step": 13246 + }, + { + "epoch": 0.46, + "learning_rate": 1.1291046518706455e-05, + "loss": 0.631, + "step": 13247 + }, + { + "epoch": 0.46, + "learning_rate": 1.128996675901592e-05, + "loss": 0.6319, + "step": 13248 + }, + { + "epoch": 0.46, + "learning_rate": 1.12888869840312e-05, + "loss": 0.6505, + "step": 13249 + }, + { + "epoch": 0.46, + "learning_rate": 1.1287807193765097e-05, + "loss": 0.5727, + "step": 13250 + }, + { + "epoch": 0.46, + "learning_rate": 1.1286727388230405e-05, + "loss": 0.611, + "step": 13251 + }, + { + "epoch": 0.46, + "learning_rate": 1.1285647567439934e-05, + "loss": 0.6258, + "step": 13252 + }, + { + "epoch": 0.46, + "learning_rate": 1.1284567731406489e-05, + "loss": 0.6552, + "step": 13253 + }, + { + "epoch": 0.46, + "learning_rate": 1.1283487880142863e-05, + "loss": 0.6148, + "step": 13254 + }, + { + "epoch": 0.46, + "learning_rate": 1.1282408013661868e-05, + "loss": 0.6329, + "step": 13255 + }, + { + "epoch": 0.46, + "learning_rate": 1.1281328131976303e-05, + "loss": 0.6737, + "step": 13256 + }, + { + "epoch": 0.46, + "learning_rate": 1.1280248235098969e-05, + "loss": 0.613, + "step": 13257 + }, + { + "epoch": 0.46, + "learning_rate": 1.1279168323042677e-05, + "loss": 0.6191, + "step": 13258 + }, + { + "epoch": 0.46, + "learning_rate": 1.1278088395820226e-05, + "loss": 0.6693, + "step": 13259 + }, + { + "epoch": 0.46, + "learning_rate": 1.1277008453444415e-05, + "loss": 0.6527, + "step": 13260 + }, + { + "epoch": 0.46, + "learning_rate": 1.127592849592806e-05, + "loss": 0.6802, + "step": 13261 + }, + { + "epoch": 0.46, + "learning_rate": 1.1274848523283957e-05, + "loss": 0.6435, + "step": 13262 + }, + { + "epoch": 0.46, + "learning_rate": 1.1273768535524907e-05, + "loss": 0.6619, + "step": 13263 + }, + { + "epoch": 0.46, + "learning_rate": 1.1272688532663725e-05, + "loss": 0.6368, + "step": 13264 + }, + { + "epoch": 0.46, + "learning_rate": 1.127160851471321e-05, + "loss": 0.5697, + "step": 13265 + }, + { + "epoch": 0.46, + "learning_rate": 1.1270528481686165e-05, + "loss": 0.6688, + "step": 13266 + }, + { + "epoch": 0.46, + "learning_rate": 1.12694484335954e-05, + "loss": 0.6685, + "step": 13267 + }, + { + "epoch": 0.46, + "learning_rate": 1.126836837045372e-05, + "loss": 0.5905, + "step": 13268 + }, + { + "epoch": 0.46, + "learning_rate": 1.1267288292273921e-05, + "loss": 0.6665, + "step": 13269 + }, + { + "epoch": 0.46, + "learning_rate": 1.1266208199068822e-05, + "loss": 0.5939, + "step": 13270 + }, + { + "epoch": 0.46, + "learning_rate": 1.1265128090851226e-05, + "loss": 0.6612, + "step": 13271 + }, + { + "epoch": 0.46, + "learning_rate": 1.1264047967633928e-05, + "loss": 0.656, + "step": 13272 + }, + { + "epoch": 0.46, + "learning_rate": 1.1262967829429748e-05, + "loss": 0.6426, + "step": 13273 + }, + { + "epoch": 0.46, + "learning_rate": 1.1261887676251487e-05, + "loss": 0.6045, + "step": 13274 + }, + { + "epoch": 0.46, + "learning_rate": 1.1260807508111946e-05, + "loss": 0.6366, + "step": 13275 + }, + { + "epoch": 0.46, + "learning_rate": 1.1259727325023942e-05, + "loss": 0.6422, + "step": 13276 + }, + { + "epoch": 0.46, + "learning_rate": 1.1258647127000276e-05, + "loss": 0.6398, + "step": 13277 + }, + { + "epoch": 0.46, + "learning_rate": 1.1257566914053754e-05, + "loss": 0.6694, + "step": 13278 + }, + { + "epoch": 0.46, + "learning_rate": 1.1256486686197186e-05, + "loss": 0.646, + "step": 13279 + }, + { + "epoch": 0.46, + "learning_rate": 1.1255406443443382e-05, + "loss": 0.6429, + "step": 13280 + }, + { + "epoch": 0.46, + "learning_rate": 1.1254326185805142e-05, + "loss": 0.6641, + "step": 13281 + }, + { + "epoch": 0.46, + "learning_rate": 1.1253245913295282e-05, + "loss": 0.7042, + "step": 13282 + }, + { + "epoch": 0.46, + "learning_rate": 1.1252165625926606e-05, + "loss": 0.6653, + "step": 13283 + }, + { + "epoch": 0.46, + "learning_rate": 1.1251085323711918e-05, + "loss": 0.6324, + "step": 13284 + }, + { + "epoch": 0.46, + "learning_rate": 1.1250005006664036e-05, + "loss": 0.6568, + "step": 13285 + }, + { + "epoch": 0.46, + "learning_rate": 1.1248924674795762e-05, + "loss": 0.64, + "step": 13286 + }, + { + "epoch": 0.46, + "learning_rate": 1.1247844328119906e-05, + "loss": 0.6848, + "step": 13287 + }, + { + "epoch": 0.46, + "learning_rate": 1.1246763966649274e-05, + "loss": 0.6165, + "step": 13288 + }, + { + "epoch": 0.46, + "learning_rate": 1.1245683590396684e-05, + "loss": 0.662, + "step": 13289 + }, + { + "epoch": 0.46, + "learning_rate": 1.1244603199374934e-05, + "loss": 0.6206, + "step": 13290 + }, + { + "epoch": 0.46, + "learning_rate": 1.1243522793596839e-05, + "loss": 0.6686, + "step": 13291 + }, + { + "epoch": 0.46, + "learning_rate": 1.1242442373075214e-05, + "loss": 0.6635, + "step": 13292 + }, + { + "epoch": 0.46, + "learning_rate": 1.1241361937822857e-05, + "loss": 0.6173, + "step": 13293 + }, + { + "epoch": 0.46, + "learning_rate": 1.1240281487852584e-05, + "loss": 0.5893, + "step": 13294 + }, + { + "epoch": 0.46, + "learning_rate": 1.1239201023177209e-05, + "loss": 0.6682, + "step": 13295 + }, + { + "epoch": 0.46, + "learning_rate": 1.1238120543809534e-05, + "loss": 0.596, + "step": 13296 + }, + { + "epoch": 0.46, + "learning_rate": 1.1237040049762376e-05, + "loss": 0.6511, + "step": 13297 + }, + { + "epoch": 0.46, + "learning_rate": 1.1235959541048544e-05, + "loss": 0.5979, + "step": 13298 + }, + { + "epoch": 0.46, + "learning_rate": 1.1234879017680846e-05, + "loss": 0.6006, + "step": 13299 + }, + { + "epoch": 0.46, + "learning_rate": 1.1233798479672095e-05, + "loss": 0.5825, + "step": 13300 + }, + { + "epoch": 0.46, + "learning_rate": 1.1232717927035106e-05, + "loss": 0.6306, + "step": 13301 + }, + { + "epoch": 0.46, + "learning_rate": 1.1231637359782683e-05, + "loss": 0.6777, + "step": 13302 + }, + { + "epoch": 0.46, + "learning_rate": 1.1230556777927644e-05, + "loss": 0.6191, + "step": 13303 + }, + { + "epoch": 0.46, + "learning_rate": 1.1229476181482795e-05, + "loss": 0.6585, + "step": 13304 + }, + { + "epoch": 0.46, + "learning_rate": 1.122839557046095e-05, + "loss": 0.5725, + "step": 13305 + }, + { + "epoch": 0.46, + "learning_rate": 1.1227314944874926e-05, + "loss": 0.61, + "step": 13306 + }, + { + "epoch": 0.46, + "learning_rate": 1.1226234304737527e-05, + "loss": 0.6451, + "step": 13307 + }, + { + "epoch": 0.46, + "learning_rate": 1.1225153650061568e-05, + "loss": 0.6504, + "step": 13308 + }, + { + "epoch": 0.46, + "learning_rate": 1.1224072980859865e-05, + "loss": 0.5982, + "step": 13309 + }, + { + "epoch": 0.46, + "learning_rate": 1.122299229714523e-05, + "loss": 0.6157, + "step": 13310 + }, + { + "epoch": 0.46, + "learning_rate": 1.122191159893047e-05, + "loss": 0.6165, + "step": 13311 + }, + { + "epoch": 0.46, + "learning_rate": 1.1220830886228407e-05, + "loss": 0.6552, + "step": 13312 + }, + { + "epoch": 0.46, + "learning_rate": 1.1219750159051846e-05, + "loss": 0.6172, + "step": 13313 + }, + { + "epoch": 0.46, + "learning_rate": 1.1218669417413603e-05, + "loss": 0.6216, + "step": 13314 + }, + { + "epoch": 0.46, + "learning_rate": 1.1217588661326496e-05, + "loss": 0.6406, + "step": 13315 + }, + { + "epoch": 0.46, + "learning_rate": 1.1216507890803332e-05, + "loss": 0.6238, + "step": 13316 + }, + { + "epoch": 0.46, + "learning_rate": 1.121542710585693e-05, + "loss": 0.6233, + "step": 13317 + }, + { + "epoch": 0.46, + "learning_rate": 1.1214346306500103e-05, + "loss": 0.6325, + "step": 13318 + }, + { + "epoch": 0.46, + "learning_rate": 1.1213265492745661e-05, + "loss": 0.6657, + "step": 13319 + }, + { + "epoch": 0.46, + "learning_rate": 1.1212184664606425e-05, + "loss": 0.5888, + "step": 13320 + }, + { + "epoch": 0.46, + "learning_rate": 1.1211103822095206e-05, + "loss": 0.6301, + "step": 13321 + }, + { + "epoch": 0.46, + "learning_rate": 1.1210022965224816e-05, + "loss": 0.6319, + "step": 13322 + }, + { + "epoch": 0.46, + "learning_rate": 1.1208942094008076e-05, + "loss": 0.6164, + "step": 13323 + }, + { + "epoch": 0.46, + "learning_rate": 1.1207861208457798e-05, + "loss": 0.6642, + "step": 13324 + }, + { + "epoch": 0.46, + "learning_rate": 1.1206780308586796e-05, + "loss": 0.6516, + "step": 13325 + }, + { + "epoch": 0.46, + "learning_rate": 1.1205699394407887e-05, + "loss": 0.5835, + "step": 13326 + }, + { + "epoch": 0.46, + "learning_rate": 1.120461846593389e-05, + "loss": 0.6635, + "step": 13327 + }, + { + "epoch": 0.46, + "learning_rate": 1.1203537523177613e-05, + "loss": 0.6369, + "step": 13328 + }, + { + "epoch": 0.46, + "learning_rate": 1.1202456566151878e-05, + "loss": 0.5877, + "step": 13329 + }, + { + "epoch": 0.46, + "learning_rate": 1.12013755948695e-05, + "loss": 0.6441, + "step": 13330 + }, + { + "epoch": 0.46, + "learning_rate": 1.1200294609343292e-05, + "loss": 0.5891, + "step": 13331 + }, + { + "epoch": 0.46, + "learning_rate": 1.1199213609586075e-05, + "loss": 0.585, + "step": 13332 + }, + { + "epoch": 0.46, + "learning_rate": 1.1198132595610663e-05, + "loss": 0.6114, + "step": 13333 + }, + { + "epoch": 0.46, + "learning_rate": 1.1197051567429873e-05, + "loss": 0.652, + "step": 13334 + }, + { + "epoch": 0.46, + "learning_rate": 1.1195970525056524e-05, + "loss": 0.6484, + "step": 13335 + }, + { + "epoch": 0.46, + "learning_rate": 1.1194889468503432e-05, + "loss": 0.6657, + "step": 13336 + }, + { + "epoch": 0.46, + "learning_rate": 1.119380839778341e-05, + "loss": 0.6688, + "step": 13337 + }, + { + "epoch": 0.46, + "learning_rate": 1.1192727312909281e-05, + "loss": 0.7251, + "step": 13338 + }, + { + "epoch": 0.46, + "learning_rate": 1.1191646213893863e-05, + "loss": 0.6908, + "step": 13339 + }, + { + "epoch": 0.46, + "learning_rate": 1.119056510074997e-05, + "loss": 0.6306, + "step": 13340 + }, + { + "epoch": 0.46, + "learning_rate": 1.118948397349042e-05, + "loss": 0.6725, + "step": 13341 + }, + { + "epoch": 0.46, + "learning_rate": 1.1188402832128035e-05, + "loss": 0.6115, + "step": 13342 + }, + { + "epoch": 0.46, + "learning_rate": 1.118732167667563e-05, + "loss": 0.6239, + "step": 13343 + }, + { + "epoch": 0.46, + "learning_rate": 1.1186240507146026e-05, + "loss": 0.6119, + "step": 13344 + }, + { + "epoch": 0.46, + "learning_rate": 1.1185159323552041e-05, + "loss": 0.6771, + "step": 13345 + }, + { + "epoch": 0.46, + "learning_rate": 1.118407812590649e-05, + "loss": 0.6511, + "step": 13346 + }, + { + "epoch": 0.46, + "learning_rate": 1.1182996914222198e-05, + "loss": 0.6454, + "step": 13347 + }, + { + "epoch": 0.46, + "learning_rate": 1.118191568851198e-05, + "loss": 0.5955, + "step": 13348 + }, + { + "epoch": 0.46, + "learning_rate": 1.1180834448788655e-05, + "loss": 0.6283, + "step": 13349 + }, + { + "epoch": 0.46, + "learning_rate": 1.1179753195065044e-05, + "loss": 0.5808, + "step": 13350 + }, + { + "epoch": 0.46, + "learning_rate": 1.1178671927353967e-05, + "loss": 0.6028, + "step": 13351 + }, + { + "epoch": 0.46, + "learning_rate": 1.1177590645668244e-05, + "loss": 0.6145, + "step": 13352 + }, + { + "epoch": 0.46, + "learning_rate": 1.1176509350020692e-05, + "loss": 0.67, + "step": 13353 + }, + { + "epoch": 0.46, + "learning_rate": 1.1175428040424137e-05, + "loss": 0.6748, + "step": 13354 + }, + { + "epoch": 0.46, + "learning_rate": 1.1174346716891393e-05, + "loss": 0.6493, + "step": 13355 + }, + { + "epoch": 0.46, + "learning_rate": 1.1173265379435283e-05, + "loss": 0.5574, + "step": 13356 + }, + { + "epoch": 0.46, + "learning_rate": 1.1172184028068631e-05, + "loss": 0.6672, + "step": 13357 + }, + { + "epoch": 0.46, + "learning_rate": 1.1171102662804251e-05, + "loss": 0.665, + "step": 13358 + }, + { + "epoch": 0.46, + "learning_rate": 1.1170021283654968e-05, + "loss": 0.6815, + "step": 13359 + }, + { + "epoch": 0.46, + "learning_rate": 1.1168939890633603e-05, + "loss": 0.6366, + "step": 13360 + }, + { + "epoch": 0.46, + "learning_rate": 1.1167858483752978e-05, + "loss": 0.5672, + "step": 13361 + }, + { + "epoch": 0.46, + "learning_rate": 1.116677706302591e-05, + "loss": 0.6351, + "step": 13362 + }, + { + "epoch": 0.46, + "learning_rate": 1.116569562846523e-05, + "loss": 0.6258, + "step": 13363 + }, + { + "epoch": 0.46, + "learning_rate": 1.1164614180083748e-05, + "loss": 0.6354, + "step": 13364 + }, + { + "epoch": 0.46, + "learning_rate": 1.1163532717894297e-05, + "loss": 0.699, + "step": 13365 + }, + { + "epoch": 0.46, + "learning_rate": 1.1162451241909689e-05, + "loss": 0.7008, + "step": 13366 + }, + { + "epoch": 0.46, + "learning_rate": 1.116136975214275e-05, + "loss": 0.6794, + "step": 13367 + }, + { + "epoch": 0.46, + "learning_rate": 1.1160288248606307e-05, + "loss": 0.6721, + "step": 13368 + }, + { + "epoch": 0.46, + "learning_rate": 1.115920673131318e-05, + "loss": 0.6116, + "step": 13369 + }, + { + "epoch": 0.46, + "learning_rate": 1.1158125200276186e-05, + "loss": 0.6026, + "step": 13370 + }, + { + "epoch": 0.46, + "learning_rate": 1.1157043655508157e-05, + "loss": 0.6497, + "step": 13371 + }, + { + "epoch": 0.46, + "learning_rate": 1.115596209702191e-05, + "loss": 0.6383, + "step": 13372 + }, + { + "epoch": 0.46, + "learning_rate": 1.115488052483027e-05, + "loss": 0.6307, + "step": 13373 + }, + { + "epoch": 0.46, + "learning_rate": 1.115379893894606e-05, + "loss": 0.6296, + "step": 13374 + }, + { + "epoch": 0.46, + "learning_rate": 1.1152717339382106e-05, + "loss": 0.6631, + "step": 13375 + }, + { + "epoch": 0.46, + "learning_rate": 1.1151635726151228e-05, + "loss": 0.5982, + "step": 13376 + }, + { + "epoch": 0.46, + "learning_rate": 1.1150554099266253e-05, + "loss": 0.5995, + "step": 13377 + }, + { + "epoch": 0.46, + "learning_rate": 1.1149472458740002e-05, + "loss": 0.6356, + "step": 13378 + }, + { + "epoch": 0.46, + "learning_rate": 1.1148390804585301e-05, + "loss": 0.6093, + "step": 13379 + }, + { + "epoch": 0.46, + "learning_rate": 1.1147309136814976e-05, + "loss": 0.6579, + "step": 13380 + }, + { + "epoch": 0.46, + "learning_rate": 1.1146227455441849e-05, + "loss": 0.6217, + "step": 13381 + }, + { + "epoch": 0.46, + "learning_rate": 1.1145145760478744e-05, + "loss": 0.6709, + "step": 13382 + }, + { + "epoch": 0.46, + "learning_rate": 1.114406405193849e-05, + "loss": 0.5822, + "step": 13383 + }, + { + "epoch": 0.46, + "learning_rate": 1.1142982329833909e-05, + "loss": 0.6246, + "step": 13384 + }, + { + "epoch": 0.46, + "learning_rate": 1.1141900594177823e-05, + "loss": 0.6284, + "step": 13385 + }, + { + "epoch": 0.46, + "learning_rate": 1.1140818844983066e-05, + "loss": 0.6262, + "step": 13386 + }, + { + "epoch": 0.46, + "learning_rate": 1.1139737082262456e-05, + "loss": 0.6381, + "step": 13387 + }, + { + "epoch": 0.46, + "learning_rate": 1.113865530602882e-05, + "loss": 0.5982, + "step": 13388 + }, + { + "epoch": 0.46, + "learning_rate": 1.1137573516294988e-05, + "loss": 0.6574, + "step": 13389 + }, + { + "epoch": 0.46, + "learning_rate": 1.113649171307378e-05, + "loss": 0.6212, + "step": 13390 + }, + { + "epoch": 0.46, + "learning_rate": 1.1135409896378027e-05, + "loss": 0.6171, + "step": 13391 + }, + { + "epoch": 0.46, + "learning_rate": 1.1134328066220554e-05, + "loss": 0.5767, + "step": 13392 + }, + { + "epoch": 0.46, + "learning_rate": 1.1133246222614185e-05, + "loss": 0.6559, + "step": 13393 + }, + { + "epoch": 0.46, + "learning_rate": 1.1132164365571747e-05, + "loss": 0.6503, + "step": 13394 + }, + { + "epoch": 0.46, + "learning_rate": 1.1131082495106072e-05, + "loss": 0.6388, + "step": 13395 + }, + { + "epoch": 0.46, + "learning_rate": 1.1130000611229983e-05, + "loss": 0.6009, + "step": 13396 + }, + { + "epoch": 0.46, + "learning_rate": 1.1128918713956303e-05, + "loss": 0.6135, + "step": 13397 + }, + { + "epoch": 0.46, + "learning_rate": 1.1127836803297867e-05, + "loss": 0.6378, + "step": 13398 + }, + { + "epoch": 0.46, + "learning_rate": 1.11267548792675e-05, + "loss": 0.6526, + "step": 13399 + }, + { + "epoch": 0.46, + "learning_rate": 1.1125672941878023e-05, + "loss": 0.6657, + "step": 13400 + }, + { + "epoch": 0.46, + "learning_rate": 1.1124590991142274e-05, + "loss": 0.628, + "step": 13401 + }, + { + "epoch": 0.46, + "learning_rate": 1.1123509027073078e-05, + "loss": 0.6265, + "step": 13402 + }, + { + "epoch": 0.46, + "learning_rate": 1.1122427049683256e-05, + "loss": 0.6982, + "step": 13403 + }, + { + "epoch": 0.46, + "learning_rate": 1.1121345058985644e-05, + "loss": 0.654, + "step": 13404 + }, + { + "epoch": 0.46, + "learning_rate": 1.112026305499307e-05, + "loss": 0.5654, + "step": 13405 + }, + { + "epoch": 0.46, + "learning_rate": 1.1119181037718353e-05, + "loss": 0.666, + "step": 13406 + }, + { + "epoch": 0.46, + "learning_rate": 1.1118099007174337e-05, + "loss": 0.6496, + "step": 13407 + }, + { + "epoch": 0.46, + "learning_rate": 1.1117016963373842e-05, + "loss": 0.578, + "step": 13408 + }, + { + "epoch": 0.46, + "learning_rate": 1.1115934906329693e-05, + "loss": 0.6948, + "step": 13409 + }, + { + "epoch": 0.46, + "learning_rate": 1.1114852836054727e-05, + "loss": 0.6593, + "step": 13410 + }, + { + "epoch": 0.46, + "learning_rate": 1.1113770752561772e-05, + "loss": 0.578, + "step": 13411 + }, + { + "epoch": 0.46, + "learning_rate": 1.1112688655863652e-05, + "loss": 0.6307, + "step": 13412 + }, + { + "epoch": 0.46, + "learning_rate": 1.1111606545973204e-05, + "loss": 0.6356, + "step": 13413 + }, + { + "epoch": 0.46, + "learning_rate": 1.1110524422903254e-05, + "loss": 0.655, + "step": 13414 + }, + { + "epoch": 0.46, + "learning_rate": 1.110944228666663e-05, + "loss": 0.605, + "step": 13415 + }, + { + "epoch": 0.46, + "learning_rate": 1.1108360137276164e-05, + "loss": 0.6202, + "step": 13416 + }, + { + "epoch": 0.46, + "learning_rate": 1.110727797474469e-05, + "loss": 0.6215, + "step": 13417 + }, + { + "epoch": 0.46, + "learning_rate": 1.1106195799085031e-05, + "loss": 0.6105, + "step": 13418 + }, + { + "epoch": 0.46, + "learning_rate": 1.1105113610310024e-05, + "loss": 0.614, + "step": 13419 + }, + { + "epoch": 0.46, + "learning_rate": 1.1104031408432496e-05, + "loss": 0.5971, + "step": 13420 + }, + { + "epoch": 0.47, + "learning_rate": 1.1102949193465277e-05, + "loss": 0.6273, + "step": 13421 + }, + { + "epoch": 0.47, + "learning_rate": 1.1101866965421202e-05, + "loss": 0.6172, + "step": 13422 + }, + { + "epoch": 0.47, + "learning_rate": 1.1100784724313103e-05, + "loss": 0.5756, + "step": 13423 + }, + { + "epoch": 0.47, + "learning_rate": 1.1099702470153803e-05, + "loss": 0.6384, + "step": 13424 + }, + { + "epoch": 0.47, + "learning_rate": 1.1098620202956144e-05, + "loss": 0.6153, + "step": 13425 + }, + { + "epoch": 0.47, + "learning_rate": 1.109753792273295e-05, + "loss": 0.6046, + "step": 13426 + }, + { + "epoch": 0.47, + "learning_rate": 1.1096455629497056e-05, + "loss": 0.6075, + "step": 13427 + }, + { + "epoch": 0.47, + "learning_rate": 1.1095373323261293e-05, + "loss": 0.6233, + "step": 13428 + }, + { + "epoch": 0.47, + "learning_rate": 1.1094291004038497e-05, + "loss": 0.6435, + "step": 13429 + }, + { + "epoch": 0.47, + "learning_rate": 1.1093208671841493e-05, + "loss": 0.6423, + "step": 13430 + }, + { + "epoch": 0.47, + "learning_rate": 1.109212632668312e-05, + "loss": 0.6118, + "step": 13431 + }, + { + "epoch": 0.47, + "learning_rate": 1.1091043968576206e-05, + "loss": 0.6157, + "step": 13432 + }, + { + "epoch": 0.47, + "learning_rate": 1.1089961597533584e-05, + "loss": 0.5838, + "step": 13433 + }, + { + "epoch": 0.47, + "learning_rate": 1.1088879213568091e-05, + "loss": 0.665, + "step": 13434 + }, + { + "epoch": 0.47, + "learning_rate": 1.1087796816692557e-05, + "loss": 0.627, + "step": 13435 + }, + { + "epoch": 0.47, + "learning_rate": 1.1086714406919817e-05, + "loss": 0.6029, + "step": 13436 + }, + { + "epoch": 0.47, + "learning_rate": 1.1085631984262699e-05, + "loss": 0.6158, + "step": 13437 + }, + { + "epoch": 0.47, + "learning_rate": 1.1084549548734045e-05, + "loss": 0.6376, + "step": 13438 + }, + { + "epoch": 0.47, + "learning_rate": 1.1083467100346683e-05, + "loss": 0.6452, + "step": 13439 + }, + { + "epoch": 0.47, + "learning_rate": 1.1082384639113446e-05, + "loss": 0.6334, + "step": 13440 + }, + { + "epoch": 0.47, + "learning_rate": 1.1081302165047172e-05, + "loss": 0.6732, + "step": 13441 + }, + { + "epoch": 0.47, + "learning_rate": 1.1080219678160691e-05, + "loss": 0.6803, + "step": 13442 + }, + { + "epoch": 0.47, + "learning_rate": 1.1079137178466838e-05, + "loss": 0.6201, + "step": 13443 + }, + { + "epoch": 0.47, + "learning_rate": 1.1078054665978454e-05, + "loss": 0.5896, + "step": 13444 + }, + { + "epoch": 0.47, + "learning_rate": 1.1076972140708364e-05, + "loss": 0.5944, + "step": 13445 + }, + { + "epoch": 0.47, + "learning_rate": 1.1075889602669407e-05, + "loss": 0.6492, + "step": 13446 + }, + { + "epoch": 0.47, + "learning_rate": 1.107480705187442e-05, + "loss": 0.621, + "step": 13447 + }, + { + "epoch": 0.47, + "learning_rate": 1.1073724488336235e-05, + "loss": 0.6463, + "step": 13448 + }, + { + "epoch": 0.47, + "learning_rate": 1.1072641912067688e-05, + "loss": 0.6578, + "step": 13449 + }, + { + "epoch": 0.47, + "learning_rate": 1.1071559323081612e-05, + "loss": 0.621, + "step": 13450 + }, + { + "epoch": 0.47, + "learning_rate": 1.1070476721390849e-05, + "loss": 0.658, + "step": 13451 + }, + { + "epoch": 0.47, + "learning_rate": 1.1069394107008225e-05, + "loss": 0.6043, + "step": 13452 + }, + { + "epoch": 0.47, + "learning_rate": 1.1068311479946585e-05, + "loss": 0.6731, + "step": 13453 + }, + { + "epoch": 0.47, + "learning_rate": 1.106722884021876e-05, + "loss": 0.6485, + "step": 13454 + }, + { + "epoch": 0.47, + "learning_rate": 1.1066146187837586e-05, + "loss": 0.6677, + "step": 13455 + }, + { + "epoch": 0.47, + "learning_rate": 1.1065063522815902e-05, + "loss": 0.6203, + "step": 13456 + }, + { + "epoch": 0.47, + "learning_rate": 1.1063980845166542e-05, + "loss": 0.702, + "step": 13457 + }, + { + "epoch": 0.47, + "learning_rate": 1.1062898154902344e-05, + "loss": 0.6448, + "step": 13458 + }, + { + "epoch": 0.47, + "learning_rate": 1.1061815452036141e-05, + "loss": 0.6103, + "step": 13459 + }, + { + "epoch": 0.47, + "learning_rate": 1.1060732736580772e-05, + "loss": 0.6517, + "step": 13460 + }, + { + "epoch": 0.47, + "learning_rate": 1.1059650008549078e-05, + "loss": 0.6433, + "step": 13461 + }, + { + "epoch": 0.47, + "learning_rate": 1.1058567267953893e-05, + "loss": 0.6374, + "step": 13462 + }, + { + "epoch": 0.47, + "learning_rate": 1.105748451480805e-05, + "loss": 0.6511, + "step": 13463 + }, + { + "epoch": 0.47, + "learning_rate": 1.1056401749124394e-05, + "loss": 0.6729, + "step": 13464 + }, + { + "epoch": 0.47, + "learning_rate": 1.1055318970915758e-05, + "loss": 0.6558, + "step": 13465 + }, + { + "epoch": 0.47, + "learning_rate": 1.1054236180194979e-05, + "loss": 0.6079, + "step": 13466 + }, + { + "epoch": 0.47, + "learning_rate": 1.10531533769749e-05, + "loss": 0.6028, + "step": 13467 + }, + { + "epoch": 0.47, + "learning_rate": 1.1052070561268353e-05, + "loss": 0.6026, + "step": 13468 + }, + { + "epoch": 0.47, + "learning_rate": 1.1050987733088177e-05, + "loss": 0.6434, + "step": 13469 + }, + { + "epoch": 0.47, + "learning_rate": 1.1049904892447217e-05, + "loss": 0.6521, + "step": 13470 + }, + { + "epoch": 0.47, + "learning_rate": 1.1048822039358301e-05, + "loss": 0.6863, + "step": 13471 + }, + { + "epoch": 0.47, + "learning_rate": 1.1047739173834276e-05, + "loss": 0.6523, + "step": 13472 + }, + { + "epoch": 0.47, + "learning_rate": 1.1046656295887977e-05, + "loss": 0.6159, + "step": 13473 + }, + { + "epoch": 0.47, + "learning_rate": 1.1045573405532242e-05, + "loss": 0.6457, + "step": 13474 + }, + { + "epoch": 0.47, + "learning_rate": 1.1044490502779913e-05, + "loss": 0.6399, + "step": 13475 + }, + { + "epoch": 0.47, + "learning_rate": 1.1043407587643828e-05, + "loss": 0.6124, + "step": 13476 + }, + { + "epoch": 0.47, + "learning_rate": 1.1042324660136825e-05, + "loss": 0.6302, + "step": 13477 + }, + { + "epoch": 0.47, + "learning_rate": 1.1041241720271745e-05, + "loss": 0.6324, + "step": 13478 + }, + { + "epoch": 0.47, + "learning_rate": 1.1040158768061431e-05, + "loss": 0.687, + "step": 13479 + }, + { + "epoch": 0.47, + "learning_rate": 1.1039075803518716e-05, + "loss": 0.6366, + "step": 13480 + }, + { + "epoch": 0.47, + "learning_rate": 1.1037992826656441e-05, + "loss": 0.6483, + "step": 13481 + }, + { + "epoch": 0.47, + "learning_rate": 1.103690983748745e-05, + "loss": 0.6692, + "step": 13482 + }, + { + "epoch": 0.47, + "learning_rate": 1.103582683602458e-05, + "loss": 0.6248, + "step": 13483 + }, + { + "epoch": 0.47, + "learning_rate": 1.1034743822280673e-05, + "loss": 0.6048, + "step": 13484 + }, + { + "epoch": 0.47, + "learning_rate": 1.103366079626857e-05, + "loss": 0.6387, + "step": 13485 + }, + { + "epoch": 0.47, + "learning_rate": 1.1032577758001111e-05, + "loss": 0.6153, + "step": 13486 + }, + { + "epoch": 0.47, + "learning_rate": 1.1031494707491133e-05, + "loss": 0.6356, + "step": 13487 + }, + { + "epoch": 0.47, + "learning_rate": 1.1030411644751485e-05, + "loss": 0.6511, + "step": 13488 + }, + { + "epoch": 0.47, + "learning_rate": 1.1029328569795004e-05, + "loss": 0.6372, + "step": 13489 + }, + { + "epoch": 0.47, + "learning_rate": 1.1028245482634524e-05, + "loss": 0.6225, + "step": 13490 + }, + { + "epoch": 0.47, + "learning_rate": 1.10271623832829e-05, + "loss": 0.6485, + "step": 13491 + }, + { + "epoch": 0.47, + "learning_rate": 1.1026079271752962e-05, + "loss": 0.613, + "step": 13492 + }, + { + "epoch": 0.47, + "learning_rate": 1.1024996148057557e-05, + "loss": 0.5794, + "step": 13493 + }, + { + "epoch": 0.47, + "learning_rate": 1.1023913012209528e-05, + "loss": 0.6058, + "step": 13494 + }, + { + "epoch": 0.47, + "learning_rate": 1.1022829864221716e-05, + "loss": 0.6873, + "step": 13495 + }, + { + "epoch": 0.47, + "learning_rate": 1.1021746704106956e-05, + "loss": 0.6295, + "step": 13496 + }, + { + "epoch": 0.47, + "learning_rate": 1.1020663531878101e-05, + "loss": 0.5953, + "step": 13497 + }, + { + "epoch": 0.47, + "learning_rate": 1.1019580347547992e-05, + "loss": 0.6116, + "step": 13498 + }, + { + "epoch": 0.47, + "learning_rate": 1.101849715112946e-05, + "loss": 0.6132, + "step": 13499 + }, + { + "epoch": 0.47, + "learning_rate": 1.1017413942635362e-05, + "loss": 0.6396, + "step": 13500 + }, + { + "epoch": 0.47, + "learning_rate": 1.1016330722078534e-05, + "loss": 0.6318, + "step": 13501 + }, + { + "epoch": 0.47, + "learning_rate": 1.1015247489471817e-05, + "loss": 0.5908, + "step": 13502 + }, + { + "epoch": 0.47, + "learning_rate": 1.1014164244828058e-05, + "loss": 0.6126, + "step": 13503 + }, + { + "epoch": 0.47, + "learning_rate": 1.1013080988160102e-05, + "loss": 0.6527, + "step": 13504 + }, + { + "epoch": 0.47, + "learning_rate": 1.1011997719480782e-05, + "loss": 0.6413, + "step": 13505 + }, + { + "epoch": 0.47, + "learning_rate": 1.1010914438802955e-05, + "loss": 0.5822, + "step": 13506 + }, + { + "epoch": 0.47, + "learning_rate": 1.1009831146139457e-05, + "loss": 0.5845, + "step": 13507 + }, + { + "epoch": 0.47, + "learning_rate": 1.1008747841503132e-05, + "loss": 0.5952, + "step": 13508 + }, + { + "epoch": 0.47, + "learning_rate": 1.1007664524906827e-05, + "loss": 0.6347, + "step": 13509 + }, + { + "epoch": 0.47, + "learning_rate": 1.1006581196363385e-05, + "loss": 0.6655, + "step": 13510 + }, + { + "epoch": 0.47, + "learning_rate": 1.1005497855885644e-05, + "loss": 0.6096, + "step": 13511 + }, + { + "epoch": 0.47, + "learning_rate": 1.1004414503486461e-05, + "loss": 0.6523, + "step": 13512 + }, + { + "epoch": 0.47, + "learning_rate": 1.1003331139178672e-05, + "loss": 0.6417, + "step": 13513 + }, + { + "epoch": 0.47, + "learning_rate": 1.100224776297512e-05, + "loss": 0.6017, + "step": 13514 + }, + { + "epoch": 0.47, + "learning_rate": 1.1001164374888655e-05, + "loss": 0.6331, + "step": 13515 + }, + { + "epoch": 0.47, + "learning_rate": 1.100008097493212e-05, + "loss": 0.6117, + "step": 13516 + }, + { + "epoch": 0.47, + "learning_rate": 1.0998997563118358e-05, + "loss": 0.6577, + "step": 13517 + }, + { + "epoch": 0.47, + "learning_rate": 1.099791413946022e-05, + "loss": 0.6294, + "step": 13518 + }, + { + "epoch": 0.47, + "learning_rate": 1.0996830703970546e-05, + "loss": 0.6329, + "step": 13519 + }, + { + "epoch": 0.47, + "learning_rate": 1.0995747256662181e-05, + "loss": 0.6664, + "step": 13520 + }, + { + "epoch": 0.47, + "learning_rate": 1.0994663797547973e-05, + "loss": 0.645, + "step": 13521 + }, + { + "epoch": 0.47, + "learning_rate": 1.0993580326640771e-05, + "loss": 0.6457, + "step": 13522 + }, + { + "epoch": 0.47, + "learning_rate": 1.0992496843953413e-05, + "loss": 0.6066, + "step": 13523 + }, + { + "epoch": 0.47, + "learning_rate": 1.099141334949875e-05, + "loss": 0.5728, + "step": 13524 + }, + { + "epoch": 0.47, + "learning_rate": 1.099032984328963e-05, + "loss": 0.6577, + "step": 13525 + }, + { + "epoch": 0.47, + "learning_rate": 1.0989246325338896e-05, + "loss": 0.6301, + "step": 13526 + }, + { + "epoch": 0.47, + "learning_rate": 1.0988162795659395e-05, + "loss": 0.6092, + "step": 13527 + }, + { + "epoch": 0.47, + "learning_rate": 1.0987079254263974e-05, + "loss": 0.7135, + "step": 13528 + }, + { + "epoch": 0.47, + "learning_rate": 1.0985995701165479e-05, + "loss": 0.648, + "step": 13529 + }, + { + "epoch": 0.47, + "learning_rate": 1.0984912136376758e-05, + "loss": 0.6105, + "step": 13530 + }, + { + "epoch": 0.47, + "learning_rate": 1.0983828559910658e-05, + "loss": 0.6361, + "step": 13531 + }, + { + "epoch": 0.47, + "learning_rate": 1.0982744971780026e-05, + "loss": 0.5803, + "step": 13532 + }, + { + "epoch": 0.47, + "learning_rate": 1.0981661371997709e-05, + "loss": 0.6186, + "step": 13533 + }, + { + "epoch": 0.47, + "learning_rate": 1.0980577760576557e-05, + "loss": 0.6317, + "step": 13534 + }, + { + "epoch": 0.47, + "learning_rate": 1.0979494137529412e-05, + "loss": 0.6621, + "step": 13535 + }, + { + "epoch": 0.47, + "learning_rate": 1.0978410502869126e-05, + "loss": 0.6183, + "step": 13536 + }, + { + "epoch": 0.47, + "learning_rate": 1.0977326856608545e-05, + "loss": 0.5791, + "step": 13537 + }, + { + "epoch": 0.47, + "learning_rate": 1.0976243198760519e-05, + "loss": 0.5823, + "step": 13538 + }, + { + "epoch": 0.47, + "learning_rate": 1.0975159529337893e-05, + "loss": 0.6013, + "step": 13539 + }, + { + "epoch": 0.47, + "learning_rate": 1.097407584835352e-05, + "loss": 0.6534, + "step": 13540 + }, + { + "epoch": 0.47, + "learning_rate": 1.0972992155820245e-05, + "loss": 0.6136, + "step": 13541 + }, + { + "epoch": 0.47, + "learning_rate": 1.0971908451750915e-05, + "loss": 0.6328, + "step": 13542 + }, + { + "epoch": 0.47, + "learning_rate": 1.0970824736158385e-05, + "loss": 0.6365, + "step": 13543 + }, + { + "epoch": 0.47, + "learning_rate": 1.0969741009055495e-05, + "loss": 0.6466, + "step": 13544 + }, + { + "epoch": 0.47, + "learning_rate": 1.09686572704551e-05, + "loss": 0.5768, + "step": 13545 + }, + { + "epoch": 0.47, + "learning_rate": 1.0967573520370049e-05, + "loss": 0.6433, + "step": 13546 + }, + { + "epoch": 0.47, + "learning_rate": 1.0966489758813191e-05, + "loss": 0.6272, + "step": 13547 + }, + { + "epoch": 0.47, + "learning_rate": 1.096540598579737e-05, + "loss": 0.6393, + "step": 13548 + }, + { + "epoch": 0.47, + "learning_rate": 1.0964322201335445e-05, + "loss": 0.6556, + "step": 13549 + }, + { + "epoch": 0.47, + "learning_rate": 1.0963238405440254e-05, + "loss": 0.6388, + "step": 13550 + }, + { + "epoch": 0.47, + "learning_rate": 1.096215459812466e-05, + "loss": 0.6536, + "step": 13551 + }, + { + "epoch": 0.47, + "learning_rate": 1.0961070779401502e-05, + "loss": 0.6474, + "step": 13552 + }, + { + "epoch": 0.47, + "learning_rate": 1.0959986949283634e-05, + "loss": 0.6377, + "step": 13553 + }, + { + "epoch": 0.47, + "learning_rate": 1.0958903107783908e-05, + "loss": 0.6266, + "step": 13554 + }, + { + "epoch": 0.47, + "learning_rate": 1.0957819254915174e-05, + "loss": 0.6152, + "step": 13555 + }, + { + "epoch": 0.47, + "learning_rate": 1.0956735390690278e-05, + "loss": 0.6471, + "step": 13556 + }, + { + "epoch": 0.47, + "learning_rate": 1.0955651515122077e-05, + "loss": 0.6229, + "step": 13557 + }, + { + "epoch": 0.47, + "learning_rate": 1.0954567628223413e-05, + "loss": 0.6415, + "step": 13558 + }, + { + "epoch": 0.47, + "learning_rate": 1.0953483730007146e-05, + "loss": 0.6609, + "step": 13559 + }, + { + "epoch": 0.47, + "learning_rate": 1.0952399820486124e-05, + "loss": 0.6318, + "step": 13560 + }, + { + "epoch": 0.47, + "learning_rate": 1.0951315899673196e-05, + "loss": 0.6379, + "step": 13561 + }, + { + "epoch": 0.47, + "learning_rate": 1.0950231967581213e-05, + "loss": 0.6786, + "step": 13562 + }, + { + "epoch": 0.47, + "learning_rate": 1.0949148024223031e-05, + "loss": 0.6356, + "step": 13563 + }, + { + "epoch": 0.47, + "learning_rate": 1.0948064069611496e-05, + "loss": 0.6631, + "step": 13564 + }, + { + "epoch": 0.47, + "learning_rate": 1.0946980103759463e-05, + "loss": 0.5814, + "step": 13565 + }, + { + "epoch": 0.47, + "learning_rate": 1.0945896126679785e-05, + "loss": 0.6885, + "step": 13566 + }, + { + "epoch": 0.47, + "learning_rate": 1.094481213838531e-05, + "loss": 0.6504, + "step": 13567 + }, + { + "epoch": 0.47, + "learning_rate": 1.094372813888889e-05, + "loss": 0.6231, + "step": 13568 + }, + { + "epoch": 0.47, + "learning_rate": 1.0942644128203383e-05, + "loss": 0.6024, + "step": 13569 + }, + { + "epoch": 0.47, + "learning_rate": 1.0941560106341635e-05, + "loss": 0.6192, + "step": 13570 + }, + { + "epoch": 0.47, + "learning_rate": 1.09404760733165e-05, + "loss": 0.6582, + "step": 13571 + }, + { + "epoch": 0.47, + "learning_rate": 1.0939392029140834e-05, + "loss": 0.6151, + "step": 13572 + }, + { + "epoch": 0.47, + "learning_rate": 1.0938307973827485e-05, + "loss": 0.603, + "step": 13573 + }, + { + "epoch": 0.47, + "learning_rate": 1.0937223907389309e-05, + "loss": 0.6809, + "step": 13574 + }, + { + "epoch": 0.47, + "learning_rate": 1.0936139829839158e-05, + "loss": 0.6087, + "step": 13575 + }, + { + "epoch": 0.47, + "learning_rate": 1.0935055741189884e-05, + "loss": 0.6146, + "step": 13576 + }, + { + "epoch": 0.47, + "learning_rate": 1.0933971641454342e-05, + "loss": 0.6162, + "step": 13577 + }, + { + "epoch": 0.47, + "learning_rate": 1.0932887530645387e-05, + "loss": 0.6149, + "step": 13578 + }, + { + "epoch": 0.47, + "learning_rate": 1.0931803408775867e-05, + "loss": 0.6643, + "step": 13579 + }, + { + "epoch": 0.47, + "learning_rate": 1.0930719275858638e-05, + "loss": 0.6261, + "step": 13580 + }, + { + "epoch": 0.47, + "learning_rate": 1.0929635131906559e-05, + "loss": 0.6894, + "step": 13581 + }, + { + "epoch": 0.47, + "learning_rate": 1.0928550976932477e-05, + "loss": 0.6291, + "step": 13582 + }, + { + "epoch": 0.47, + "learning_rate": 1.0927466810949247e-05, + "loss": 0.6386, + "step": 13583 + }, + { + "epoch": 0.47, + "learning_rate": 1.092638263396973e-05, + "loss": 0.6213, + "step": 13584 + }, + { + "epoch": 0.47, + "learning_rate": 1.0925298446006769e-05, + "loss": 0.6935, + "step": 13585 + }, + { + "epoch": 0.47, + "learning_rate": 1.0924214247073229e-05, + "loss": 0.607, + "step": 13586 + }, + { + "epoch": 0.47, + "learning_rate": 1.0923130037181957e-05, + "loss": 0.6277, + "step": 13587 + }, + { + "epoch": 0.47, + "learning_rate": 1.0922045816345812e-05, + "loss": 0.6176, + "step": 13588 + }, + { + "epoch": 0.47, + "learning_rate": 1.0920961584577645e-05, + "loss": 0.649, + "step": 13589 + }, + { + "epoch": 0.47, + "learning_rate": 1.0919877341890316e-05, + "loss": 0.5653, + "step": 13590 + }, + { + "epoch": 0.47, + "learning_rate": 1.0918793088296678e-05, + "loss": 0.6616, + "step": 13591 + }, + { + "epoch": 0.47, + "learning_rate": 1.0917708823809583e-05, + "loss": 0.6312, + "step": 13592 + }, + { + "epoch": 0.47, + "learning_rate": 1.0916624548441892e-05, + "loss": 0.639, + "step": 13593 + }, + { + "epoch": 0.47, + "learning_rate": 1.0915540262206454e-05, + "loss": 0.5957, + "step": 13594 + }, + { + "epoch": 0.47, + "learning_rate": 1.091445596511613e-05, + "loss": 0.6272, + "step": 13595 + }, + { + "epoch": 0.47, + "learning_rate": 1.0913371657183775e-05, + "loss": 0.6703, + "step": 13596 + }, + { + "epoch": 0.47, + "learning_rate": 1.0912287338422243e-05, + "loss": 0.6591, + "step": 13597 + }, + { + "epoch": 0.47, + "learning_rate": 1.0911203008844389e-05, + "loss": 0.6365, + "step": 13598 + }, + { + "epoch": 0.47, + "learning_rate": 1.0910118668463072e-05, + "loss": 0.6201, + "step": 13599 + }, + { + "epoch": 0.47, + "learning_rate": 1.0909034317291145e-05, + "loss": 0.6201, + "step": 13600 + }, + { + "epoch": 0.47, + "learning_rate": 1.0907949955341468e-05, + "loss": 0.6035, + "step": 13601 + }, + { + "epoch": 0.47, + "learning_rate": 1.0906865582626895e-05, + "loss": 0.6452, + "step": 13602 + }, + { + "epoch": 0.47, + "learning_rate": 1.0905781199160283e-05, + "loss": 0.6198, + "step": 13603 + }, + { + "epoch": 0.47, + "learning_rate": 1.0904696804954488e-05, + "loss": 0.6601, + "step": 13604 + }, + { + "epoch": 0.47, + "learning_rate": 1.0903612400022371e-05, + "loss": 0.6323, + "step": 13605 + }, + { + "epoch": 0.47, + "learning_rate": 1.0902527984376785e-05, + "loss": 0.6398, + "step": 13606 + }, + { + "epoch": 0.47, + "learning_rate": 1.0901443558030587e-05, + "loss": 0.6019, + "step": 13607 + }, + { + "epoch": 0.47, + "learning_rate": 1.0900359120996638e-05, + "loss": 0.5718, + "step": 13608 + }, + { + "epoch": 0.47, + "learning_rate": 1.0899274673287792e-05, + "loss": 0.6008, + "step": 13609 + }, + { + "epoch": 0.47, + "learning_rate": 1.0898190214916902e-05, + "loss": 0.5941, + "step": 13610 + }, + { + "epoch": 0.47, + "learning_rate": 1.0897105745896837e-05, + "loss": 0.6257, + "step": 13611 + }, + { + "epoch": 0.47, + "learning_rate": 1.0896021266240446e-05, + "loss": 0.687, + "step": 13612 + }, + { + "epoch": 0.47, + "learning_rate": 1.089493677596059e-05, + "loss": 0.6308, + "step": 13613 + }, + { + "epoch": 0.47, + "learning_rate": 1.0893852275070124e-05, + "loss": 0.5766, + "step": 13614 + }, + { + "epoch": 0.47, + "learning_rate": 1.0892767763581913e-05, + "loss": 0.6333, + "step": 13615 + }, + { + "epoch": 0.47, + "learning_rate": 1.0891683241508807e-05, + "loss": 0.6281, + "step": 13616 + }, + { + "epoch": 0.47, + "learning_rate": 1.0890598708863669e-05, + "loss": 0.6674, + "step": 13617 + }, + { + "epoch": 0.47, + "learning_rate": 1.0889514165659358e-05, + "loss": 0.6336, + "step": 13618 + }, + { + "epoch": 0.47, + "learning_rate": 1.0888429611908729e-05, + "loss": 0.6164, + "step": 13619 + }, + { + "epoch": 0.47, + "learning_rate": 1.0887345047624644e-05, + "loss": 0.6734, + "step": 13620 + }, + { + "epoch": 0.47, + "learning_rate": 1.0886260472819963e-05, + "loss": 0.6222, + "step": 13621 + }, + { + "epoch": 0.47, + "learning_rate": 1.088517588750754e-05, + "loss": 0.6875, + "step": 13622 + }, + { + "epoch": 0.47, + "learning_rate": 1.0884091291700239e-05, + "loss": 0.6059, + "step": 13623 + }, + { + "epoch": 0.47, + "learning_rate": 1.0883006685410918e-05, + "loss": 0.6396, + "step": 13624 + }, + { + "epoch": 0.47, + "learning_rate": 1.0881922068652432e-05, + "loss": 0.6449, + "step": 13625 + }, + { + "epoch": 0.47, + "learning_rate": 1.0880837441437648e-05, + "loss": 0.5635, + "step": 13626 + }, + { + "epoch": 0.47, + "learning_rate": 1.0879752803779422e-05, + "loss": 0.609, + "step": 13627 + }, + { + "epoch": 0.47, + "learning_rate": 1.0878668155690611e-05, + "loss": 0.6364, + "step": 13628 + }, + { + "epoch": 0.47, + "learning_rate": 1.0877583497184078e-05, + "loss": 0.6692, + "step": 13629 + }, + { + "epoch": 0.47, + "learning_rate": 1.0876498828272687e-05, + "loss": 0.5993, + "step": 13630 + }, + { + "epoch": 0.47, + "learning_rate": 1.0875414148969288e-05, + "loss": 0.6342, + "step": 13631 + }, + { + "epoch": 0.47, + "learning_rate": 1.0874329459286747e-05, + "loss": 0.6792, + "step": 13632 + }, + { + "epoch": 0.47, + "learning_rate": 1.0873244759237928e-05, + "loss": 0.6223, + "step": 13633 + }, + { + "epoch": 0.47, + "learning_rate": 1.0872160048835684e-05, + "loss": 0.5986, + "step": 13634 + }, + { + "epoch": 0.47, + "learning_rate": 1.087107532809288e-05, + "loss": 0.6698, + "step": 13635 + }, + { + "epoch": 0.47, + "learning_rate": 1.086999059702238e-05, + "loss": 0.6659, + "step": 13636 + }, + { + "epoch": 0.47, + "learning_rate": 1.0868905855637037e-05, + "loss": 0.6679, + "step": 13637 + }, + { + "epoch": 0.47, + "learning_rate": 1.0867821103949717e-05, + "loss": 0.6639, + "step": 13638 + }, + { + "epoch": 0.47, + "learning_rate": 1.0866736341973282e-05, + "loss": 0.624, + "step": 13639 + }, + { + "epoch": 0.47, + "learning_rate": 1.0865651569720587e-05, + "loss": 0.5748, + "step": 13640 + }, + { + "epoch": 0.47, + "learning_rate": 1.0864566787204498e-05, + "loss": 0.5586, + "step": 13641 + }, + { + "epoch": 0.47, + "learning_rate": 1.0863481994437881e-05, + "loss": 0.6231, + "step": 13642 + }, + { + "epoch": 0.47, + "learning_rate": 1.086239719143359e-05, + "loss": 0.608, + "step": 13643 + }, + { + "epoch": 0.47, + "learning_rate": 1.086131237820449e-05, + "loss": 0.6599, + "step": 13644 + }, + { + "epoch": 0.47, + "learning_rate": 1.0860227554763438e-05, + "loss": 0.6618, + "step": 13645 + }, + { + "epoch": 0.47, + "learning_rate": 1.0859142721123303e-05, + "loss": 0.6475, + "step": 13646 + }, + { + "epoch": 0.47, + "learning_rate": 1.0858057877296946e-05, + "loss": 0.6225, + "step": 13647 + }, + { + "epoch": 0.47, + "learning_rate": 1.0856973023297225e-05, + "loss": 0.5563, + "step": 13648 + }, + { + "epoch": 0.47, + "learning_rate": 1.0855888159137006e-05, + "loss": 0.5632, + "step": 13649 + }, + { + "epoch": 0.47, + "learning_rate": 1.085480328482915e-05, + "loss": 0.6418, + "step": 13650 + }, + { + "epoch": 0.47, + "learning_rate": 1.085371840038652e-05, + "loss": 0.6205, + "step": 13651 + }, + { + "epoch": 0.47, + "learning_rate": 1.0852633505821976e-05, + "loss": 0.5486, + "step": 13652 + }, + { + "epoch": 0.47, + "learning_rate": 1.0851548601148387e-05, + "loss": 0.6044, + "step": 13653 + }, + { + "epoch": 0.47, + "learning_rate": 1.085046368637861e-05, + "loss": 0.5538, + "step": 13654 + }, + { + "epoch": 0.47, + "learning_rate": 1.0849378761525508e-05, + "loss": 0.613, + "step": 13655 + }, + { + "epoch": 0.47, + "learning_rate": 1.084829382660195e-05, + "loss": 0.6527, + "step": 13656 + }, + { + "epoch": 0.47, + "learning_rate": 1.0847208881620794e-05, + "loss": 0.653, + "step": 13657 + }, + { + "epoch": 0.47, + "learning_rate": 1.0846123926594905e-05, + "loss": 0.6282, + "step": 13658 + }, + { + "epoch": 0.47, + "learning_rate": 1.0845038961537147e-05, + "loss": 0.6093, + "step": 13659 + }, + { + "epoch": 0.47, + "learning_rate": 1.0843953986460382e-05, + "loss": 0.6504, + "step": 13660 + }, + { + "epoch": 0.47, + "learning_rate": 1.0842869001377477e-05, + "loss": 0.6177, + "step": 13661 + }, + { + "epoch": 0.47, + "learning_rate": 1.0841784006301293e-05, + "loss": 0.6766, + "step": 13662 + }, + { + "epoch": 0.47, + "learning_rate": 1.0840699001244693e-05, + "loss": 0.5841, + "step": 13663 + }, + { + "epoch": 0.47, + "learning_rate": 1.0839613986220543e-05, + "loss": 0.7012, + "step": 13664 + }, + { + "epoch": 0.47, + "learning_rate": 1.083852896124171e-05, + "loss": 0.6078, + "step": 13665 + }, + { + "epoch": 0.47, + "learning_rate": 1.0837443926321054e-05, + "loss": 0.676, + "step": 13666 + }, + { + "epoch": 0.47, + "learning_rate": 1.0836358881471439e-05, + "loss": 0.6235, + "step": 13667 + }, + { + "epoch": 0.47, + "learning_rate": 1.0835273826705734e-05, + "loss": 0.5992, + "step": 13668 + }, + { + "epoch": 0.47, + "learning_rate": 1.0834188762036799e-05, + "loss": 0.6664, + "step": 13669 + }, + { + "epoch": 0.47, + "learning_rate": 1.0833103687477501e-05, + "loss": 0.6269, + "step": 13670 + }, + { + "epoch": 0.47, + "learning_rate": 1.0832018603040709e-05, + "loss": 0.6622, + "step": 13671 + }, + { + "epoch": 0.47, + "learning_rate": 1.083093350873928e-05, + "loss": 0.6403, + "step": 13672 + }, + { + "epoch": 0.47, + "learning_rate": 1.0829848404586082e-05, + "loss": 0.6557, + "step": 13673 + }, + { + "epoch": 0.47, + "learning_rate": 1.0828763290593984e-05, + "loss": 0.6163, + "step": 13674 + }, + { + "epoch": 0.47, + "learning_rate": 1.0827678166775849e-05, + "loss": 0.6183, + "step": 13675 + }, + { + "epoch": 0.47, + "learning_rate": 1.0826593033144541e-05, + "loss": 0.626, + "step": 13676 + }, + { + "epoch": 0.47, + "learning_rate": 1.0825507889712929e-05, + "loss": 0.5759, + "step": 13677 + }, + { + "epoch": 0.47, + "learning_rate": 1.0824422736493873e-05, + "loss": 0.6598, + "step": 13678 + }, + { + "epoch": 0.47, + "learning_rate": 1.0823337573500245e-05, + "loss": 0.611, + "step": 13679 + }, + { + "epoch": 0.47, + "learning_rate": 1.0822252400744911e-05, + "loss": 0.5606, + "step": 13680 + }, + { + "epoch": 0.47, + "learning_rate": 1.082116721824073e-05, + "loss": 0.6334, + "step": 13681 + }, + { + "epoch": 0.47, + "learning_rate": 1.0820082026000573e-05, + "loss": 0.5907, + "step": 13682 + }, + { + "epoch": 0.47, + "learning_rate": 1.081899682403731e-05, + "loss": 0.6175, + "step": 13683 + }, + { + "epoch": 0.47, + "learning_rate": 1.0817911612363801e-05, + "loss": 0.6544, + "step": 13684 + }, + { + "epoch": 0.47, + "learning_rate": 1.0816826390992915e-05, + "loss": 0.6716, + "step": 13685 + }, + { + "epoch": 0.47, + "learning_rate": 1.0815741159937521e-05, + "loss": 0.6086, + "step": 13686 + }, + { + "epoch": 0.47, + "learning_rate": 1.0814655919210482e-05, + "loss": 0.6719, + "step": 13687 + }, + { + "epoch": 0.47, + "learning_rate": 1.0813570668824665e-05, + "loss": 0.6006, + "step": 13688 + }, + { + "epoch": 0.47, + "learning_rate": 1.0812485408792943e-05, + "loss": 0.6162, + "step": 13689 + }, + { + "epoch": 0.47, + "learning_rate": 1.0811400139128175e-05, + "loss": 0.61, + "step": 13690 + }, + { + "epoch": 0.47, + "learning_rate": 1.0810314859843232e-05, + "loss": 0.6058, + "step": 13691 + }, + { + "epoch": 0.47, + "learning_rate": 1.0809229570950983e-05, + "loss": 0.6704, + "step": 13692 + }, + { + "epoch": 0.47, + "learning_rate": 1.0808144272464291e-05, + "loss": 0.6011, + "step": 13693 + }, + { + "epoch": 0.47, + "learning_rate": 1.0807058964396029e-05, + "loss": 0.6394, + "step": 13694 + }, + { + "epoch": 0.47, + "learning_rate": 1.0805973646759063e-05, + "loss": 0.6172, + "step": 13695 + }, + { + "epoch": 0.47, + "learning_rate": 1.0804888319566259e-05, + "loss": 0.6503, + "step": 13696 + }, + { + "epoch": 0.47, + "learning_rate": 1.0803802982830483e-05, + "loss": 0.6216, + "step": 13697 + }, + { + "epoch": 0.47, + "learning_rate": 1.0802717636564608e-05, + "loss": 0.6013, + "step": 13698 + }, + { + "epoch": 0.47, + "learning_rate": 1.0801632280781499e-05, + "loss": 0.6931, + "step": 13699 + }, + { + "epoch": 0.47, + "learning_rate": 1.0800546915494026e-05, + "loss": 0.6324, + "step": 13700 + }, + { + "epoch": 0.47, + "learning_rate": 1.0799461540715058e-05, + "loss": 0.6826, + "step": 13701 + }, + { + "epoch": 0.47, + "learning_rate": 1.0798376156457459e-05, + "loss": 0.5789, + "step": 13702 + }, + { + "epoch": 0.47, + "learning_rate": 1.0797290762734102e-05, + "loss": 0.6286, + "step": 13703 + }, + { + "epoch": 0.47, + "learning_rate": 1.0796205359557856e-05, + "loss": 0.6081, + "step": 13704 + }, + { + "epoch": 0.47, + "learning_rate": 1.0795119946941586e-05, + "loss": 0.6074, + "step": 13705 + }, + { + "epoch": 0.47, + "learning_rate": 1.0794034524898167e-05, + "loss": 0.6286, + "step": 13706 + }, + { + "epoch": 0.47, + "learning_rate": 1.0792949093440459e-05, + "loss": 0.6333, + "step": 13707 + }, + { + "epoch": 0.47, + "learning_rate": 1.079186365258134e-05, + "loss": 0.6463, + "step": 13708 + }, + { + "epoch": 0.47, + "learning_rate": 1.0790778202333676e-05, + "loss": 0.6011, + "step": 13709 + }, + { + "epoch": 0.48, + "learning_rate": 1.0789692742710334e-05, + "loss": 0.6302, + "step": 13710 + }, + { + "epoch": 0.48, + "learning_rate": 1.0788607273724185e-05, + "loss": 0.6638, + "step": 13711 + }, + { + "epoch": 0.48, + "learning_rate": 1.0787521795388102e-05, + "loss": 0.6042, + "step": 13712 + }, + { + "epoch": 0.48, + "learning_rate": 1.078643630771495e-05, + "loss": 0.6976, + "step": 13713 + }, + { + "epoch": 0.48, + "learning_rate": 1.07853508107176e-05, + "loss": 0.6206, + "step": 13714 + }, + { + "epoch": 0.48, + "learning_rate": 1.0784265304408925e-05, + "loss": 0.5983, + "step": 13715 + }, + { + "epoch": 0.48, + "learning_rate": 1.078317978880179e-05, + "loss": 0.6225, + "step": 13716 + }, + { + "epoch": 0.48, + "learning_rate": 1.078209426390907e-05, + "loss": 0.639, + "step": 13717 + }, + { + "epoch": 0.48, + "learning_rate": 1.0781008729743634e-05, + "loss": 0.6492, + "step": 13718 + }, + { + "epoch": 0.48, + "learning_rate": 1.0779923186318349e-05, + "loss": 0.6418, + "step": 13719 + }, + { + "epoch": 0.48, + "learning_rate": 1.0778837633646088e-05, + "loss": 0.6445, + "step": 13720 + }, + { + "epoch": 0.48, + "learning_rate": 1.0777752071739724e-05, + "loss": 0.6005, + "step": 13721 + }, + { + "epoch": 0.48, + "learning_rate": 1.0776666500612123e-05, + "loss": 0.6229, + "step": 13722 + }, + { + "epoch": 0.48, + "learning_rate": 1.0775580920276158e-05, + "loss": 0.6234, + "step": 13723 + }, + { + "epoch": 0.48, + "learning_rate": 1.0774495330744703e-05, + "loss": 0.6195, + "step": 13724 + }, + { + "epoch": 0.48, + "learning_rate": 1.0773409732030624e-05, + "loss": 0.6139, + "step": 13725 + }, + { + "epoch": 0.48, + "learning_rate": 1.0772324124146794e-05, + "loss": 0.6141, + "step": 13726 + }, + { + "epoch": 0.48, + "learning_rate": 1.0771238507106086e-05, + "loss": 0.6703, + "step": 13727 + }, + { + "epoch": 0.48, + "learning_rate": 1.0770152880921368e-05, + "loss": 0.5913, + "step": 13728 + }, + { + "epoch": 0.48, + "learning_rate": 1.0769067245605514e-05, + "loss": 0.619, + "step": 13729 + }, + { + "epoch": 0.48, + "learning_rate": 1.0767981601171398e-05, + "loss": 0.6056, + "step": 13730 + }, + { + "epoch": 0.48, + "learning_rate": 1.0766895947631884e-05, + "loss": 0.6577, + "step": 13731 + }, + { + "epoch": 0.48, + "learning_rate": 1.076581028499985e-05, + "loss": 0.6094, + "step": 13732 + }, + { + "epoch": 0.48, + "learning_rate": 1.0764724613288167e-05, + "loss": 0.623, + "step": 13733 + }, + { + "epoch": 0.48, + "learning_rate": 1.0763638932509705e-05, + "loss": 0.6423, + "step": 13734 + }, + { + "epoch": 0.48, + "learning_rate": 1.0762553242677339e-05, + "loss": 0.6375, + "step": 13735 + }, + { + "epoch": 0.48, + "learning_rate": 1.076146754380394e-05, + "loss": 0.6379, + "step": 13736 + }, + { + "epoch": 0.48, + "learning_rate": 1.076038183590238e-05, + "loss": 0.588, + "step": 13737 + }, + { + "epoch": 0.48, + "learning_rate": 1.0759296118985526e-05, + "loss": 0.6493, + "step": 13738 + }, + { + "epoch": 0.48, + "learning_rate": 1.0758210393066265e-05, + "loss": 0.5952, + "step": 13739 + }, + { + "epoch": 0.48, + "learning_rate": 1.0757124658157456e-05, + "loss": 0.6306, + "step": 13740 + }, + { + "epoch": 0.48, + "learning_rate": 1.0756038914271973e-05, + "loss": 0.6152, + "step": 13741 + }, + { + "epoch": 0.48, + "learning_rate": 1.0754953161422698e-05, + "loss": 0.6593, + "step": 13742 + }, + { + "epoch": 0.48, + "learning_rate": 1.0753867399622498e-05, + "loss": 0.607, + "step": 13743 + }, + { + "epoch": 0.48, + "learning_rate": 1.0752781628884241e-05, + "loss": 0.6708, + "step": 13744 + }, + { + "epoch": 0.48, + "learning_rate": 1.0751695849220812e-05, + "loss": 0.6384, + "step": 13745 + }, + { + "epoch": 0.48, + "learning_rate": 1.0750610060645075e-05, + "loss": 0.6276, + "step": 13746 + }, + { + "epoch": 0.48, + "learning_rate": 1.0749524263169901e-05, + "loss": 0.6732, + "step": 13747 + }, + { + "epoch": 0.48, + "learning_rate": 1.0748438456808176e-05, + "loss": 0.6404, + "step": 13748 + }, + { + "epoch": 0.48, + "learning_rate": 1.0747352641572766e-05, + "loss": 0.6047, + "step": 13749 + }, + { + "epoch": 0.48, + "learning_rate": 1.074626681747654e-05, + "loss": 0.5643, + "step": 13750 + }, + { + "epoch": 0.48, + "learning_rate": 1.0745180984532382e-05, + "loss": 0.6933, + "step": 13751 + }, + { + "epoch": 0.48, + "learning_rate": 1.0744095142753159e-05, + "loss": 0.6465, + "step": 13752 + }, + { + "epoch": 0.48, + "learning_rate": 1.0743009292151743e-05, + "loss": 0.6201, + "step": 13753 + }, + { + "epoch": 0.48, + "learning_rate": 1.0741923432741017e-05, + "loss": 0.6157, + "step": 13754 + }, + { + "epoch": 0.48, + "learning_rate": 1.0740837564533851e-05, + "loss": 0.6369, + "step": 13755 + }, + { + "epoch": 0.48, + "learning_rate": 1.0739751687543112e-05, + "loss": 0.6125, + "step": 13756 + }, + { + "epoch": 0.48, + "learning_rate": 1.0738665801781686e-05, + "loss": 0.6647, + "step": 13757 + }, + { + "epoch": 0.48, + "learning_rate": 1.0737579907262443e-05, + "loss": 0.616, + "step": 13758 + }, + { + "epoch": 0.48, + "learning_rate": 1.0736494003998253e-05, + "loss": 0.5979, + "step": 13759 + }, + { + "epoch": 0.48, + "learning_rate": 1.0735408092002e-05, + "loss": 0.6407, + "step": 13760 + }, + { + "epoch": 0.48, + "learning_rate": 1.0734322171286554e-05, + "loss": 0.6271, + "step": 13761 + }, + { + "epoch": 0.48, + "learning_rate": 1.0733236241864782e-05, + "loss": 0.6332, + "step": 13762 + }, + { + "epoch": 0.48, + "learning_rate": 1.0732150303749573e-05, + "loss": 0.576, + "step": 13763 + }, + { + "epoch": 0.48, + "learning_rate": 1.0731064356953797e-05, + "loss": 0.6187, + "step": 13764 + }, + { + "epoch": 0.48, + "learning_rate": 1.0729978401490322e-05, + "loss": 0.6511, + "step": 13765 + }, + { + "epoch": 0.48, + "learning_rate": 1.0728892437372037e-05, + "loss": 0.6247, + "step": 13766 + }, + { + "epoch": 0.48, + "learning_rate": 1.0727806464611807e-05, + "loss": 0.6172, + "step": 13767 + }, + { + "epoch": 0.48, + "learning_rate": 1.072672048322251e-05, + "loss": 0.7048, + "step": 13768 + }, + { + "epoch": 0.48, + "learning_rate": 1.0725634493217023e-05, + "loss": 0.617, + "step": 13769 + }, + { + "epoch": 0.48, + "learning_rate": 1.0724548494608222e-05, + "loss": 0.6033, + "step": 13770 + }, + { + "epoch": 0.48, + "learning_rate": 1.072346248740898e-05, + "loss": 0.6395, + "step": 13771 + }, + { + "epoch": 0.48, + "learning_rate": 1.0722376471632174e-05, + "loss": 0.6665, + "step": 13772 + }, + { + "epoch": 0.48, + "learning_rate": 1.0721290447290687e-05, + "loss": 0.6857, + "step": 13773 + }, + { + "epoch": 0.48, + "learning_rate": 1.0720204414397383e-05, + "loss": 0.6243, + "step": 13774 + }, + { + "epoch": 0.48, + "learning_rate": 1.0719118372965147e-05, + "loss": 0.6708, + "step": 13775 + }, + { + "epoch": 0.48, + "learning_rate": 1.0718032323006855e-05, + "loss": 0.5741, + "step": 13776 + }, + { + "epoch": 0.48, + "learning_rate": 1.0716946264535377e-05, + "loss": 0.6192, + "step": 13777 + }, + { + "epoch": 0.48, + "learning_rate": 1.0715860197563597e-05, + "loss": 0.5971, + "step": 13778 + }, + { + "epoch": 0.48, + "learning_rate": 1.071477412210439e-05, + "loss": 0.6243, + "step": 13779 + }, + { + "epoch": 0.48, + "learning_rate": 1.071368803817063e-05, + "loss": 0.6443, + "step": 13780 + }, + { + "epoch": 0.48, + "learning_rate": 1.0712601945775194e-05, + "loss": 0.6257, + "step": 13781 + }, + { + "epoch": 0.48, + "learning_rate": 1.0711515844930964e-05, + "loss": 0.7077, + "step": 13782 + }, + { + "epoch": 0.48, + "learning_rate": 1.071042973565081e-05, + "loss": 0.6194, + "step": 13783 + }, + { + "epoch": 0.48, + "learning_rate": 1.0709343617947613e-05, + "loss": 0.6184, + "step": 13784 + }, + { + "epoch": 0.48, + "learning_rate": 1.0708257491834253e-05, + "loss": 0.6046, + "step": 13785 + }, + { + "epoch": 0.48, + "learning_rate": 1.0707171357323602e-05, + "loss": 0.6557, + "step": 13786 + }, + { + "epoch": 0.48, + "learning_rate": 1.0706085214428542e-05, + "loss": 0.6072, + "step": 13787 + }, + { + "epoch": 0.48, + "learning_rate": 1.0704999063161946e-05, + "loss": 0.6108, + "step": 13788 + }, + { + "epoch": 0.48, + "learning_rate": 1.0703912903536698e-05, + "loss": 0.6211, + "step": 13789 + }, + { + "epoch": 0.48, + "learning_rate": 1.0702826735565668e-05, + "loss": 0.5851, + "step": 13790 + }, + { + "epoch": 0.48, + "learning_rate": 1.0701740559261742e-05, + "loss": 0.624, + "step": 13791 + }, + { + "epoch": 0.48, + "learning_rate": 1.0700654374637792e-05, + "loss": 0.6727, + "step": 13792 + }, + { + "epoch": 0.48, + "learning_rate": 1.0699568181706696e-05, + "loss": 0.6211, + "step": 13793 + }, + { + "epoch": 0.48, + "learning_rate": 1.0698481980481337e-05, + "loss": 0.5634, + "step": 13794 + }, + { + "epoch": 0.48, + "learning_rate": 1.069739577097459e-05, + "loss": 0.6225, + "step": 13795 + }, + { + "epoch": 0.48, + "learning_rate": 1.0696309553199331e-05, + "loss": 0.6687, + "step": 13796 + }, + { + "epoch": 0.48, + "learning_rate": 1.0695223327168446e-05, + "loss": 0.6384, + "step": 13797 + }, + { + "epoch": 0.48, + "learning_rate": 1.0694137092894807e-05, + "loss": 0.6717, + "step": 13798 + }, + { + "epoch": 0.48, + "learning_rate": 1.0693050850391295e-05, + "loss": 0.6998, + "step": 13799 + }, + { + "epoch": 0.48, + "learning_rate": 1.0691964599670787e-05, + "loss": 0.6244, + "step": 13800 + }, + { + "epoch": 0.48, + "learning_rate": 1.0690878340746165e-05, + "loss": 0.6552, + "step": 13801 + }, + { + "epoch": 0.48, + "learning_rate": 1.0689792073630308e-05, + "loss": 0.5736, + "step": 13802 + }, + { + "epoch": 0.48, + "learning_rate": 1.068870579833609e-05, + "loss": 0.6635, + "step": 13803 + }, + { + "epoch": 0.48, + "learning_rate": 1.0687619514876393e-05, + "loss": 0.675, + "step": 13804 + }, + { + "epoch": 0.48, + "learning_rate": 1.0686533223264099e-05, + "loss": 0.6444, + "step": 13805 + }, + { + "epoch": 0.48, + "learning_rate": 1.0685446923512084e-05, + "loss": 0.6044, + "step": 13806 + }, + { + "epoch": 0.48, + "learning_rate": 1.0684360615633229e-05, + "loss": 0.6029, + "step": 13807 + }, + { + "epoch": 0.48, + "learning_rate": 1.0683274299640416e-05, + "loss": 0.6321, + "step": 13808 + }, + { + "epoch": 0.48, + "learning_rate": 1.068218797554652e-05, + "loss": 0.5886, + "step": 13809 + }, + { + "epoch": 0.48, + "learning_rate": 1.068110164336442e-05, + "loss": 0.6916, + "step": 13810 + }, + { + "epoch": 0.48, + "learning_rate": 1.0680015303107e-05, + "loss": 0.5769, + "step": 13811 + }, + { + "epoch": 0.48, + "learning_rate": 1.0678928954787138e-05, + "loss": 0.6613, + "step": 13812 + }, + { + "epoch": 0.48, + "learning_rate": 1.0677842598417713e-05, + "loss": 0.6298, + "step": 13813 + }, + { + "epoch": 0.48, + "learning_rate": 1.0676756234011612e-05, + "loss": 0.6517, + "step": 13814 + }, + { + "epoch": 0.48, + "learning_rate": 1.0675669861581706e-05, + "loss": 0.6257, + "step": 13815 + }, + { + "epoch": 0.48, + "learning_rate": 1.0674583481140878e-05, + "loss": 0.6033, + "step": 13816 + }, + { + "epoch": 0.48, + "learning_rate": 1.0673497092702012e-05, + "loss": 0.599, + "step": 13817 + }, + { + "epoch": 0.48, + "learning_rate": 1.0672410696277985e-05, + "loss": 0.6549, + "step": 13818 + }, + { + "epoch": 0.48, + "learning_rate": 1.0671324291881677e-05, + "loss": 0.6364, + "step": 13819 + }, + { + "epoch": 0.48, + "learning_rate": 1.0670237879525973e-05, + "loss": 0.6866, + "step": 13820 + }, + { + "epoch": 0.48, + "learning_rate": 1.066915145922375e-05, + "loss": 0.6314, + "step": 13821 + }, + { + "epoch": 0.48, + "learning_rate": 1.0668065030987889e-05, + "loss": 0.6491, + "step": 13822 + }, + { + "epoch": 0.48, + "learning_rate": 1.0666978594831274e-05, + "loss": 0.6658, + "step": 13823 + }, + { + "epoch": 0.48, + "learning_rate": 1.0665892150766781e-05, + "loss": 0.6675, + "step": 13824 + }, + { + "epoch": 0.48, + "learning_rate": 1.0664805698807294e-05, + "loss": 0.6646, + "step": 13825 + }, + { + "epoch": 0.48, + "learning_rate": 1.06637192389657e-05, + "loss": 0.6205, + "step": 13826 + }, + { + "epoch": 0.48, + "learning_rate": 1.066263277125487e-05, + "loss": 0.6333, + "step": 13827 + }, + { + "epoch": 0.48, + "learning_rate": 1.0661546295687691e-05, + "loss": 0.627, + "step": 13828 + }, + { + "epoch": 0.48, + "learning_rate": 1.0660459812277044e-05, + "loss": 0.6256, + "step": 13829 + }, + { + "epoch": 0.48, + "learning_rate": 1.0659373321035813e-05, + "loss": 0.6283, + "step": 13830 + }, + { + "epoch": 0.48, + "learning_rate": 1.0658286821976872e-05, + "loss": 0.6493, + "step": 13831 + }, + { + "epoch": 0.48, + "learning_rate": 1.0657200315113113e-05, + "loss": 0.6936, + "step": 13832 + }, + { + "epoch": 0.48, + "learning_rate": 1.0656113800457413e-05, + "loss": 0.614, + "step": 13833 + }, + { + "epoch": 0.48, + "learning_rate": 1.0655027278022647e-05, + "loss": 0.6534, + "step": 13834 + }, + { + "epoch": 0.48, + "learning_rate": 1.0653940747821712e-05, + "loss": 0.6572, + "step": 13835 + }, + { + "epoch": 0.48, + "learning_rate": 1.0652854209867478e-05, + "loss": 0.5895, + "step": 13836 + }, + { + "epoch": 0.48, + "learning_rate": 1.065176766417283e-05, + "loss": 0.6788, + "step": 13837 + }, + { + "epoch": 0.48, + "learning_rate": 1.0650681110750657e-05, + "loss": 0.6705, + "step": 13838 + }, + { + "epoch": 0.48, + "learning_rate": 1.0649594549613834e-05, + "loss": 0.5674, + "step": 13839 + }, + { + "epoch": 0.48, + "learning_rate": 1.0648507980775242e-05, + "loss": 0.6304, + "step": 13840 + }, + { + "epoch": 0.48, + "learning_rate": 1.0647421404247773e-05, + "loss": 0.5926, + "step": 13841 + }, + { + "epoch": 0.48, + "learning_rate": 1.0646334820044304e-05, + "loss": 0.6278, + "step": 13842 + }, + { + "epoch": 0.48, + "learning_rate": 1.0645248228177712e-05, + "loss": 0.6666, + "step": 13843 + }, + { + "epoch": 0.48, + "learning_rate": 1.0644161628660891e-05, + "loss": 0.6459, + "step": 13844 + }, + { + "epoch": 0.48, + "learning_rate": 1.0643075021506722e-05, + "loss": 0.6491, + "step": 13845 + }, + { + "epoch": 0.48, + "learning_rate": 1.0641988406728077e-05, + "loss": 0.6616, + "step": 13846 + }, + { + "epoch": 0.48, + "learning_rate": 1.0640901784337853e-05, + "loss": 0.7036, + "step": 13847 + }, + { + "epoch": 0.48, + "learning_rate": 1.063981515434893e-05, + "loss": 0.6163, + "step": 13848 + }, + { + "epoch": 0.48, + "learning_rate": 1.0638728516774181e-05, + "loss": 0.6349, + "step": 13849 + }, + { + "epoch": 0.48, + "learning_rate": 1.0637641871626503e-05, + "loss": 0.6101, + "step": 13850 + }, + { + "epoch": 0.48, + "learning_rate": 1.0636555218918773e-05, + "loss": 0.5951, + "step": 13851 + }, + { + "epoch": 0.48, + "learning_rate": 1.0635468558663873e-05, + "loss": 0.6266, + "step": 13852 + }, + { + "epoch": 0.48, + "learning_rate": 1.0634381890874694e-05, + "loss": 0.582, + "step": 13853 + }, + { + "epoch": 0.48, + "learning_rate": 1.0633295215564115e-05, + "loss": 0.6255, + "step": 13854 + }, + { + "epoch": 0.48, + "learning_rate": 1.0632208532745014e-05, + "loss": 0.6454, + "step": 13855 + }, + { + "epoch": 0.48, + "learning_rate": 1.0631121842430287e-05, + "loss": 0.6879, + "step": 13856 + }, + { + "epoch": 0.48, + "learning_rate": 1.0630035144632811e-05, + "loss": 0.6097, + "step": 13857 + }, + { + "epoch": 0.48, + "learning_rate": 1.0628948439365467e-05, + "loss": 0.6104, + "step": 13858 + }, + { + "epoch": 0.48, + "learning_rate": 1.0627861726641151e-05, + "loss": 0.5824, + "step": 13859 + }, + { + "epoch": 0.48, + "learning_rate": 1.0626775006472736e-05, + "loss": 0.6894, + "step": 13860 + }, + { + "epoch": 0.48, + "learning_rate": 1.062568827887311e-05, + "loss": 0.6125, + "step": 13861 + }, + { + "epoch": 0.48, + "learning_rate": 1.0624601543855157e-05, + "loss": 0.6032, + "step": 13862 + }, + { + "epoch": 0.48, + "learning_rate": 1.0623514801431767e-05, + "loss": 0.6361, + "step": 13863 + }, + { + "epoch": 0.48, + "learning_rate": 1.0622428051615816e-05, + "loss": 0.6877, + "step": 13864 + }, + { + "epoch": 0.48, + "learning_rate": 1.0621341294420196e-05, + "loss": 0.5843, + "step": 13865 + }, + { + "epoch": 0.48, + "learning_rate": 1.0620254529857787e-05, + "loss": 0.6027, + "step": 13866 + }, + { + "epoch": 0.48, + "learning_rate": 1.0619167757941476e-05, + "loss": 0.6263, + "step": 13867 + }, + { + "epoch": 0.48, + "learning_rate": 1.0618080978684149e-05, + "loss": 0.6729, + "step": 13868 + }, + { + "epoch": 0.48, + "learning_rate": 1.061699419209869e-05, + "loss": 0.6673, + "step": 13869 + }, + { + "epoch": 0.48, + "learning_rate": 1.0615907398197981e-05, + "loss": 0.6506, + "step": 13870 + }, + { + "epoch": 0.48, + "learning_rate": 1.0614820596994915e-05, + "loss": 0.5879, + "step": 13871 + }, + { + "epoch": 0.48, + "learning_rate": 1.0613733788502374e-05, + "loss": 0.6295, + "step": 13872 + }, + { + "epoch": 0.48, + "learning_rate": 1.0612646972733238e-05, + "loss": 0.6023, + "step": 13873 + }, + { + "epoch": 0.48, + "learning_rate": 1.06115601497004e-05, + "loss": 0.6267, + "step": 13874 + }, + { + "epoch": 0.48, + "learning_rate": 1.0610473319416743e-05, + "loss": 0.6084, + "step": 13875 + }, + { + "epoch": 0.48, + "learning_rate": 1.060938648189515e-05, + "loss": 0.6343, + "step": 13876 + }, + { + "epoch": 0.48, + "learning_rate": 1.0608299637148512e-05, + "loss": 0.6458, + "step": 13877 + }, + { + "epoch": 0.48, + "learning_rate": 1.0607212785189712e-05, + "loss": 0.6455, + "step": 13878 + }, + { + "epoch": 0.48, + "learning_rate": 1.0606125926031634e-05, + "loss": 0.6393, + "step": 13879 + }, + { + "epoch": 0.48, + "learning_rate": 1.0605039059687167e-05, + "loss": 0.633, + "step": 13880 + }, + { + "epoch": 0.48, + "learning_rate": 1.06039521861692e-05, + "loss": 0.5964, + "step": 13881 + }, + { + "epoch": 0.48, + "learning_rate": 1.0602865305490612e-05, + "loss": 0.5854, + "step": 13882 + }, + { + "epoch": 0.48, + "learning_rate": 1.0601778417664295e-05, + "loss": 0.5932, + "step": 13883 + }, + { + "epoch": 0.48, + "learning_rate": 1.0600691522703134e-05, + "loss": 0.6716, + "step": 13884 + }, + { + "epoch": 0.48, + "learning_rate": 1.0599604620620014e-05, + "loss": 0.6719, + "step": 13885 + }, + { + "epoch": 0.48, + "learning_rate": 1.0598517711427823e-05, + "loss": 0.6288, + "step": 13886 + }, + { + "epoch": 0.48, + "learning_rate": 1.0597430795139447e-05, + "loss": 0.6817, + "step": 13887 + }, + { + "epoch": 0.48, + "learning_rate": 1.0596343871767773e-05, + "loss": 0.6289, + "step": 13888 + }, + { + "epoch": 0.48, + "learning_rate": 1.059525694132569e-05, + "loss": 0.6298, + "step": 13889 + }, + { + "epoch": 0.48, + "learning_rate": 1.059417000382608e-05, + "loss": 0.6272, + "step": 13890 + }, + { + "epoch": 0.48, + "learning_rate": 1.0593083059281837e-05, + "loss": 0.616, + "step": 13891 + }, + { + "epoch": 0.48, + "learning_rate": 1.0591996107705842e-05, + "loss": 0.6127, + "step": 13892 + }, + { + "epoch": 0.48, + "learning_rate": 1.0590909149110984e-05, + "loss": 0.621, + "step": 13893 + }, + { + "epoch": 0.48, + "learning_rate": 1.0589822183510147e-05, + "loss": 0.635, + "step": 13894 + }, + { + "epoch": 0.48, + "learning_rate": 1.0588735210916228e-05, + "loss": 0.6053, + "step": 13895 + }, + { + "epoch": 0.48, + "learning_rate": 1.0587648231342104e-05, + "loss": 0.6302, + "step": 13896 + }, + { + "epoch": 0.48, + "learning_rate": 1.0586561244800668e-05, + "loss": 0.6513, + "step": 13897 + }, + { + "epoch": 0.48, + "learning_rate": 1.058547425130481e-05, + "loss": 0.6041, + "step": 13898 + }, + { + "epoch": 0.48, + "learning_rate": 1.0584387250867409e-05, + "loss": 0.6887, + "step": 13899 + }, + { + "epoch": 0.48, + "learning_rate": 1.058330024350136e-05, + "loss": 0.6141, + "step": 13900 + }, + { + "epoch": 0.48, + "learning_rate": 1.058221322921955e-05, + "loss": 0.6403, + "step": 13901 + }, + { + "epoch": 0.48, + "learning_rate": 1.0581126208034863e-05, + "loss": 0.6178, + "step": 13902 + }, + { + "epoch": 0.48, + "learning_rate": 1.0580039179960192e-05, + "loss": 0.5864, + "step": 13903 + }, + { + "epoch": 0.48, + "learning_rate": 1.0578952145008424e-05, + "loss": 0.6189, + "step": 13904 + }, + { + "epoch": 0.48, + "learning_rate": 1.0577865103192442e-05, + "loss": 0.6888, + "step": 13905 + }, + { + "epoch": 0.48, + "learning_rate": 1.0576778054525139e-05, + "loss": 0.6514, + "step": 13906 + }, + { + "epoch": 0.48, + "learning_rate": 1.0575690999019405e-05, + "loss": 0.6053, + "step": 13907 + }, + { + "epoch": 0.48, + "learning_rate": 1.0574603936688124e-05, + "loss": 0.6343, + "step": 13908 + }, + { + "epoch": 0.48, + "learning_rate": 1.0573516867544184e-05, + "loss": 0.5559, + "step": 13909 + }, + { + "epoch": 0.48, + "learning_rate": 1.0572429791600482e-05, + "loss": 0.6391, + "step": 13910 + }, + { + "epoch": 0.48, + "learning_rate": 1.0571342708869896e-05, + "loss": 0.6493, + "step": 13911 + }, + { + "epoch": 0.48, + "learning_rate": 1.0570255619365322e-05, + "loss": 0.636, + "step": 13912 + }, + { + "epoch": 0.48, + "learning_rate": 1.0569168523099646e-05, + "loss": 0.6449, + "step": 13913 + }, + { + "epoch": 0.48, + "learning_rate": 1.0568081420085756e-05, + "loss": 0.5966, + "step": 13914 + }, + { + "epoch": 0.48, + "learning_rate": 1.056699431033654e-05, + "loss": 0.6349, + "step": 13915 + }, + { + "epoch": 0.48, + "learning_rate": 1.0565907193864895e-05, + "loss": 0.6282, + "step": 13916 + }, + { + "epoch": 0.48, + "learning_rate": 1.0564820070683699e-05, + "loss": 0.5425, + "step": 13917 + }, + { + "epoch": 0.48, + "learning_rate": 1.0563732940805848e-05, + "loss": 0.6126, + "step": 13918 + }, + { + "epoch": 0.48, + "learning_rate": 1.0562645804244234e-05, + "loss": 0.5584, + "step": 13919 + }, + { + "epoch": 0.48, + "learning_rate": 1.0561558661011738e-05, + "loss": 0.6429, + "step": 13920 + }, + { + "epoch": 0.48, + "learning_rate": 1.0560471511121253e-05, + "loss": 0.6413, + "step": 13921 + }, + { + "epoch": 0.48, + "learning_rate": 1.0559384354585671e-05, + "loss": 0.6106, + "step": 13922 + }, + { + "epoch": 0.48, + "learning_rate": 1.055829719141788e-05, + "loss": 0.6315, + "step": 13923 + }, + { + "epoch": 0.48, + "learning_rate": 1.0557210021630769e-05, + "loss": 0.6053, + "step": 13924 + }, + { + "epoch": 0.48, + "learning_rate": 1.055612284523723e-05, + "loss": 0.5879, + "step": 13925 + }, + { + "epoch": 0.48, + "learning_rate": 1.0555035662250149e-05, + "loss": 0.6246, + "step": 13926 + }, + { + "epoch": 0.48, + "learning_rate": 1.0553948472682417e-05, + "loss": 0.6332, + "step": 13927 + }, + { + "epoch": 0.48, + "learning_rate": 1.0552861276546928e-05, + "loss": 0.5793, + "step": 13928 + }, + { + "epoch": 0.48, + "learning_rate": 1.0551774073856567e-05, + "loss": 0.6267, + "step": 13929 + }, + { + "epoch": 0.48, + "learning_rate": 1.0550686864624226e-05, + "loss": 0.6593, + "step": 13930 + }, + { + "epoch": 0.48, + "learning_rate": 1.0549599648862798e-05, + "loss": 0.6902, + "step": 13931 + }, + { + "epoch": 0.48, + "learning_rate": 1.0548512426585171e-05, + "loss": 0.6531, + "step": 13932 + }, + { + "epoch": 0.48, + "learning_rate": 1.0547425197804233e-05, + "loss": 0.639, + "step": 13933 + }, + { + "epoch": 0.48, + "learning_rate": 1.054633796253288e-05, + "loss": 0.6337, + "step": 13934 + }, + { + "epoch": 0.48, + "learning_rate": 1.0545250720783995e-05, + "loss": 0.6622, + "step": 13935 + }, + { + "epoch": 0.48, + "learning_rate": 1.0544163472570474e-05, + "loss": 0.626, + "step": 13936 + }, + { + "epoch": 0.48, + "learning_rate": 1.0543076217905211e-05, + "loss": 0.6425, + "step": 13937 + }, + { + "epoch": 0.48, + "learning_rate": 1.0541988956801088e-05, + "loss": 0.6417, + "step": 13938 + }, + { + "epoch": 0.48, + "learning_rate": 1.0540901689271001e-05, + "loss": 0.5841, + "step": 13939 + }, + { + "epoch": 0.48, + "learning_rate": 1.0539814415327842e-05, + "loss": 0.7055, + "step": 13940 + }, + { + "epoch": 0.48, + "learning_rate": 1.0538727134984499e-05, + "loss": 0.6202, + "step": 13941 + }, + { + "epoch": 0.48, + "learning_rate": 1.0537639848253865e-05, + "loss": 0.6659, + "step": 13942 + }, + { + "epoch": 0.48, + "learning_rate": 1.0536552555148831e-05, + "loss": 0.6353, + "step": 13943 + }, + { + "epoch": 0.48, + "learning_rate": 1.0535465255682284e-05, + "loss": 0.5997, + "step": 13944 + }, + { + "epoch": 0.48, + "learning_rate": 1.0534377949867124e-05, + "loss": 0.577, + "step": 13945 + }, + { + "epoch": 0.48, + "learning_rate": 1.0533290637716234e-05, + "loss": 0.6096, + "step": 13946 + }, + { + "epoch": 0.48, + "learning_rate": 1.0532203319242509e-05, + "loss": 0.6309, + "step": 13947 + }, + { + "epoch": 0.48, + "learning_rate": 1.0531115994458843e-05, + "loss": 0.6551, + "step": 13948 + }, + { + "epoch": 0.48, + "learning_rate": 1.0530028663378124e-05, + "loss": 0.6861, + "step": 13949 + }, + { + "epoch": 0.48, + "learning_rate": 1.0528941326013243e-05, + "loss": 0.6093, + "step": 13950 + }, + { + "epoch": 0.48, + "learning_rate": 1.0527853982377094e-05, + "loss": 0.6115, + "step": 13951 + }, + { + "epoch": 0.48, + "learning_rate": 1.052676663248257e-05, + "loss": 0.6123, + "step": 13952 + }, + { + "epoch": 0.48, + "learning_rate": 1.052567927634256e-05, + "loss": 0.6617, + "step": 13953 + }, + { + "epoch": 0.48, + "learning_rate": 1.0524591913969954e-05, + "loss": 0.5918, + "step": 13954 + }, + { + "epoch": 0.48, + "learning_rate": 1.0523504545377655e-05, + "loss": 0.6221, + "step": 13955 + }, + { + "epoch": 0.48, + "learning_rate": 1.052241717057854e-05, + "loss": 0.6424, + "step": 13956 + }, + { + "epoch": 0.48, + "learning_rate": 1.0521329789585516e-05, + "loss": 0.6211, + "step": 13957 + }, + { + "epoch": 0.48, + "learning_rate": 1.052024240241146e-05, + "loss": 0.6422, + "step": 13958 + }, + { + "epoch": 0.48, + "learning_rate": 1.0519155009069274e-05, + "loss": 0.6488, + "step": 13959 + }, + { + "epoch": 0.48, + "learning_rate": 1.0518067609571853e-05, + "loss": 0.6533, + "step": 13960 + }, + { + "epoch": 0.48, + "learning_rate": 1.051698020393208e-05, + "loss": 0.5822, + "step": 13961 + }, + { + "epoch": 0.48, + "learning_rate": 1.0515892792162856e-05, + "loss": 0.6646, + "step": 13962 + }, + { + "epoch": 0.48, + "learning_rate": 1.0514805374277071e-05, + "loss": 0.68, + "step": 13963 + }, + { + "epoch": 0.48, + "learning_rate": 1.0513717950287614e-05, + "loss": 0.6392, + "step": 13964 + }, + { + "epoch": 0.48, + "learning_rate": 1.051263052020738e-05, + "loss": 0.6402, + "step": 13965 + }, + { + "epoch": 0.48, + "learning_rate": 1.0511543084049267e-05, + "loss": 0.6755, + "step": 13966 + }, + { + "epoch": 0.48, + "learning_rate": 1.0510455641826162e-05, + "loss": 0.6227, + "step": 13967 + }, + { + "epoch": 0.48, + "learning_rate": 1.050936819355096e-05, + "loss": 0.6829, + "step": 13968 + }, + { + "epoch": 0.48, + "learning_rate": 1.0508280739236554e-05, + "loss": 0.6318, + "step": 13969 + }, + { + "epoch": 0.48, + "learning_rate": 1.0507193278895833e-05, + "loss": 0.6704, + "step": 13970 + }, + { + "epoch": 0.48, + "learning_rate": 1.0506105812541696e-05, + "loss": 0.6498, + "step": 13971 + }, + { + "epoch": 0.48, + "learning_rate": 1.0505018340187039e-05, + "loss": 0.5643, + "step": 13972 + }, + { + "epoch": 0.48, + "learning_rate": 1.0503930861844745e-05, + "loss": 0.643, + "step": 13973 + }, + { + "epoch": 0.48, + "learning_rate": 1.0502843377527716e-05, + "loss": 0.617, + "step": 13974 + }, + { + "epoch": 0.48, + "learning_rate": 1.0501755887248842e-05, + "loss": 0.6641, + "step": 13975 + }, + { + "epoch": 0.48, + "learning_rate": 1.0500668391021017e-05, + "loss": 0.6636, + "step": 13976 + }, + { + "epoch": 0.48, + "learning_rate": 1.0499580888857134e-05, + "loss": 0.607, + "step": 13977 + }, + { + "epoch": 0.48, + "learning_rate": 1.0498493380770089e-05, + "loss": 0.6238, + "step": 13978 + }, + { + "epoch": 0.48, + "learning_rate": 1.0497405866772775e-05, + "loss": 0.6386, + "step": 13979 + }, + { + "epoch": 0.48, + "learning_rate": 1.0496318346878084e-05, + "loss": 0.6604, + "step": 13980 + }, + { + "epoch": 0.48, + "learning_rate": 1.049523082109891e-05, + "loss": 0.6662, + "step": 13981 + }, + { + "epoch": 0.48, + "learning_rate": 1.0494143289448149e-05, + "loss": 0.6236, + "step": 13982 + }, + { + "epoch": 0.48, + "learning_rate": 1.0493055751938696e-05, + "loss": 0.7105, + "step": 13983 + }, + { + "epoch": 0.48, + "learning_rate": 1.049196820858344e-05, + "loss": 0.6131, + "step": 13984 + }, + { + "epoch": 0.48, + "learning_rate": 1.049088065939528e-05, + "loss": 0.6403, + "step": 13985 + }, + { + "epoch": 0.48, + "learning_rate": 1.0489793104387112e-05, + "loss": 0.5793, + "step": 13986 + }, + { + "epoch": 0.48, + "learning_rate": 1.0488705543571822e-05, + "loss": 0.6318, + "step": 13987 + }, + { + "epoch": 0.48, + "learning_rate": 1.0487617976962315e-05, + "loss": 0.6126, + "step": 13988 + }, + { + "epoch": 0.48, + "learning_rate": 1.0486530404571476e-05, + "loss": 0.5748, + "step": 13989 + }, + { + "epoch": 0.48, + "learning_rate": 1.0485442826412204e-05, + "loss": 0.6016, + "step": 13990 + }, + { + "epoch": 0.48, + "learning_rate": 1.0484355242497396e-05, + "loss": 0.6169, + "step": 13991 + }, + { + "epoch": 0.48, + "learning_rate": 1.0483267652839939e-05, + "loss": 0.6131, + "step": 13992 + }, + { + "epoch": 0.48, + "learning_rate": 1.0482180057452735e-05, + "loss": 0.6196, + "step": 13993 + }, + { + "epoch": 0.48, + "learning_rate": 1.0481092456348679e-05, + "loss": 0.5654, + "step": 13994 + }, + { + "epoch": 0.48, + "learning_rate": 1.048000484954066e-05, + "loss": 0.6098, + "step": 13995 + }, + { + "epoch": 0.48, + "learning_rate": 1.0478917237041578e-05, + "loss": 0.5889, + "step": 13996 + }, + { + "epoch": 0.48, + "learning_rate": 1.0477829618864325e-05, + "loss": 0.6379, + "step": 13997 + }, + { + "epoch": 0.48, + "learning_rate": 1.04767419950218e-05, + "loss": 0.6097, + "step": 13998 + }, + { + "epoch": 0.49, + "learning_rate": 1.0475654365526893e-05, + "loss": 0.6435, + "step": 13999 + }, + { + "epoch": 0.49, + "learning_rate": 1.0474566730392504e-05, + "loss": 0.6362, + "step": 14000 + }, + { + "epoch": 0.49, + "learning_rate": 1.0473479089631522e-05, + "loss": 0.6563, + "step": 14001 + }, + { + "epoch": 0.49, + "learning_rate": 1.0472391443256848e-05, + "loss": 0.6142, + "step": 14002 + }, + { + "epoch": 0.49, + "learning_rate": 1.047130379128138e-05, + "loss": 0.6879, + "step": 14003 + }, + { + "epoch": 0.49, + "learning_rate": 1.0470216133718005e-05, + "loss": 0.6213, + "step": 14004 + }, + { + "epoch": 0.49, + "learning_rate": 1.0469128470579624e-05, + "loss": 0.6758, + "step": 14005 + }, + { + "epoch": 0.49, + "learning_rate": 1.0468040801879133e-05, + "loss": 0.5881, + "step": 14006 + }, + { + "epoch": 0.49, + "learning_rate": 1.0466953127629425e-05, + "loss": 0.6658, + "step": 14007 + }, + { + "epoch": 0.49, + "learning_rate": 1.0465865447843396e-05, + "loss": 0.6333, + "step": 14008 + }, + { + "epoch": 0.49, + "learning_rate": 1.0464777762533944e-05, + "loss": 0.6361, + "step": 14009 + }, + { + "epoch": 0.49, + "learning_rate": 1.0463690071713964e-05, + "loss": 0.6493, + "step": 14010 + }, + { + "epoch": 0.49, + "learning_rate": 1.046260237539635e-05, + "loss": 0.6919, + "step": 14011 + }, + { + "epoch": 0.49, + "learning_rate": 1.0461514673594003e-05, + "loss": 0.6091, + "step": 14012 + }, + { + "epoch": 0.49, + "learning_rate": 1.046042696631981e-05, + "loss": 0.6685, + "step": 14013 + }, + { + "epoch": 0.49, + "learning_rate": 1.0459339253586675e-05, + "loss": 0.5884, + "step": 14014 + }, + { + "epoch": 0.49, + "learning_rate": 1.0458251535407495e-05, + "loss": 0.6356, + "step": 14015 + }, + { + "epoch": 0.49, + "learning_rate": 1.0457163811795161e-05, + "loss": 0.5936, + "step": 14016 + }, + { + "epoch": 0.49, + "learning_rate": 1.0456076082762572e-05, + "loss": 0.6481, + "step": 14017 + }, + { + "epoch": 0.49, + "learning_rate": 1.0454988348322628e-05, + "loss": 0.6016, + "step": 14018 + }, + { + "epoch": 0.49, + "learning_rate": 1.0453900608488217e-05, + "loss": 0.606, + "step": 14019 + }, + { + "epoch": 0.49, + "learning_rate": 1.045281286327224e-05, + "loss": 0.6241, + "step": 14020 + }, + { + "epoch": 0.49, + "learning_rate": 1.0451725112687597e-05, + "loss": 0.6739, + "step": 14021 + }, + { + "epoch": 0.49, + "learning_rate": 1.0450637356747178e-05, + "loss": 0.625, + "step": 14022 + }, + { + "epoch": 0.49, + "learning_rate": 1.0449549595463884e-05, + "loss": 0.6411, + "step": 14023 + }, + { + "epoch": 0.49, + "learning_rate": 1.044846182885061e-05, + "loss": 0.6123, + "step": 14024 + }, + { + "epoch": 0.49, + "learning_rate": 1.0447374056920256e-05, + "loss": 0.6183, + "step": 14025 + }, + { + "epoch": 0.49, + "learning_rate": 1.0446286279685714e-05, + "loss": 0.6426, + "step": 14026 + }, + { + "epoch": 0.49, + "learning_rate": 1.0445198497159887e-05, + "loss": 0.6252, + "step": 14027 + }, + { + "epoch": 0.49, + "learning_rate": 1.0444110709355666e-05, + "loss": 0.5421, + "step": 14028 + }, + { + "epoch": 0.49, + "learning_rate": 1.044302291628595e-05, + "loss": 0.693, + "step": 14029 + }, + { + "epoch": 0.49, + "learning_rate": 1.0441935117963639e-05, + "loss": 0.6667, + "step": 14030 + }, + { + "epoch": 0.49, + "learning_rate": 1.0440847314401627e-05, + "loss": 0.6173, + "step": 14031 + }, + { + "epoch": 0.49, + "learning_rate": 1.0439759505612813e-05, + "loss": 0.6596, + "step": 14032 + }, + { + "epoch": 0.49, + "learning_rate": 1.0438671691610095e-05, + "loss": 0.5867, + "step": 14033 + }, + { + "epoch": 0.49, + "learning_rate": 1.0437583872406366e-05, + "loss": 0.6569, + "step": 14034 + }, + { + "epoch": 0.49, + "learning_rate": 1.0436496048014528e-05, + "loss": 0.5929, + "step": 14035 + }, + { + "epoch": 0.49, + "learning_rate": 1.043540821844748e-05, + "loss": 0.6524, + "step": 14036 + }, + { + "epoch": 0.49, + "learning_rate": 1.0434320383718113e-05, + "loss": 0.6087, + "step": 14037 + }, + { + "epoch": 0.49, + "learning_rate": 1.0433232543839331e-05, + "loss": 0.678, + "step": 14038 + }, + { + "epoch": 0.49, + "learning_rate": 1.043214469882403e-05, + "loss": 0.6358, + "step": 14039 + }, + { + "epoch": 0.49, + "learning_rate": 1.0431056848685102e-05, + "loss": 0.6403, + "step": 14040 + }, + { + "epoch": 0.49, + "learning_rate": 1.0429968993435453e-05, + "loss": 0.6263, + "step": 14041 + }, + { + "epoch": 0.49, + "learning_rate": 1.0428881133087977e-05, + "loss": 0.6511, + "step": 14042 + }, + { + "epoch": 0.49, + "learning_rate": 1.0427793267655575e-05, + "loss": 0.6118, + "step": 14043 + }, + { + "epoch": 0.49, + "learning_rate": 1.0426705397151138e-05, + "loss": 0.6433, + "step": 14044 + }, + { + "epoch": 0.49, + "learning_rate": 1.0425617521587575e-05, + "loss": 0.6182, + "step": 14045 + }, + { + "epoch": 0.49, + "learning_rate": 1.0424529640977772e-05, + "loss": 0.5992, + "step": 14046 + }, + { + "epoch": 0.49, + "learning_rate": 1.0423441755334636e-05, + "loss": 0.6416, + "step": 14047 + }, + { + "epoch": 0.49, + "learning_rate": 1.0422353864671062e-05, + "loss": 0.6547, + "step": 14048 + }, + { + "epoch": 0.49, + "learning_rate": 1.0421265968999948e-05, + "loss": 0.5908, + "step": 14049 + }, + { + "epoch": 0.49, + "learning_rate": 1.0420178068334195e-05, + "loss": 0.6374, + "step": 14050 + }, + { + "epoch": 0.49, + "learning_rate": 1.0419090162686695e-05, + "loss": 0.6463, + "step": 14051 + }, + { + "epoch": 0.49, + "learning_rate": 1.0418002252070354e-05, + "loss": 0.6529, + "step": 14052 + }, + { + "epoch": 0.49, + "learning_rate": 1.041691433649807e-05, + "loss": 0.6237, + "step": 14053 + }, + { + "epoch": 0.49, + "learning_rate": 1.0415826415982734e-05, + "loss": 0.6287, + "step": 14054 + }, + { + "epoch": 0.49, + "learning_rate": 1.0414738490537254e-05, + "loss": 0.5682, + "step": 14055 + }, + { + "epoch": 0.49, + "learning_rate": 1.0413650560174521e-05, + "loss": 0.5872, + "step": 14056 + }, + { + "epoch": 0.49, + "learning_rate": 1.041256262490744e-05, + "loss": 0.6776, + "step": 14057 + }, + { + "epoch": 0.49, + "learning_rate": 1.0411474684748906e-05, + "loss": 0.65, + "step": 14058 + }, + { + "epoch": 0.49, + "learning_rate": 1.0410386739711823e-05, + "loss": 0.6386, + "step": 14059 + }, + { + "epoch": 0.49, + "learning_rate": 1.0409298789809078e-05, + "loss": 0.6705, + "step": 14060 + }, + { + "epoch": 0.49, + "learning_rate": 1.0408210835053583e-05, + "loss": 0.6189, + "step": 14061 + }, + { + "epoch": 0.49, + "learning_rate": 1.0407122875458234e-05, + "loss": 0.6253, + "step": 14062 + }, + { + "epoch": 0.49, + "learning_rate": 1.0406034911035925e-05, + "loss": 0.6037, + "step": 14063 + }, + { + "epoch": 0.49, + "learning_rate": 1.040494694179956e-05, + "loss": 0.6142, + "step": 14064 + }, + { + "epoch": 0.49, + "learning_rate": 1.0403858967762038e-05, + "loss": 0.618, + "step": 14065 + }, + { + "epoch": 0.49, + "learning_rate": 1.0402770988936253e-05, + "loss": 0.6268, + "step": 14066 + }, + { + "epoch": 0.49, + "learning_rate": 1.040168300533511e-05, + "loss": 0.6632, + "step": 14067 + }, + { + "epoch": 0.49, + "learning_rate": 1.040059501697151e-05, + "loss": 0.6256, + "step": 14068 + }, + { + "epoch": 0.49, + "learning_rate": 1.0399507023858347e-05, + "loss": 0.6857, + "step": 14069 + }, + { + "epoch": 0.49, + "learning_rate": 1.039841902600852e-05, + "loss": 0.6355, + "step": 14070 + }, + { + "epoch": 0.49, + "learning_rate": 1.0397331023434936e-05, + "loss": 0.6196, + "step": 14071 + }, + { + "epoch": 0.49, + "learning_rate": 1.0396243016150487e-05, + "loss": 0.655, + "step": 14072 + }, + { + "epoch": 0.49, + "learning_rate": 1.0395155004168078e-05, + "loss": 0.6175, + "step": 14073 + }, + { + "epoch": 0.49, + "learning_rate": 1.0394066987500607e-05, + "loss": 0.6075, + "step": 14074 + }, + { + "epoch": 0.49, + "learning_rate": 1.0392978966160972e-05, + "loss": 0.669, + "step": 14075 + }, + { + "epoch": 0.49, + "learning_rate": 1.0391890940162072e-05, + "loss": 0.6226, + "step": 14076 + }, + { + "epoch": 0.49, + "learning_rate": 1.0390802909516812e-05, + "loss": 0.6474, + "step": 14077 + }, + { + "epoch": 0.49, + "learning_rate": 1.0389714874238088e-05, + "loss": 0.5774, + "step": 14078 + }, + { + "epoch": 0.49, + "learning_rate": 1.0388626834338802e-05, + "loss": 0.5968, + "step": 14079 + }, + { + "epoch": 0.49, + "learning_rate": 1.0387538789831854e-05, + "loss": 0.6932, + "step": 14080 + }, + { + "epoch": 0.49, + "learning_rate": 1.0386450740730142e-05, + "loss": 0.6165, + "step": 14081 + }, + { + "epoch": 0.49, + "learning_rate": 1.0385362687046567e-05, + "loss": 0.6284, + "step": 14082 + }, + { + "epoch": 0.49, + "learning_rate": 1.0384274628794033e-05, + "loss": 0.6323, + "step": 14083 + }, + { + "epoch": 0.49, + "learning_rate": 1.0383186565985438e-05, + "loss": 0.5797, + "step": 14084 + }, + { + "epoch": 0.49, + "learning_rate": 1.0382098498633672e-05, + "loss": 0.6452, + "step": 14085 + }, + { + "epoch": 0.49, + "learning_rate": 1.0381010426751655e-05, + "loss": 0.6507, + "step": 14086 + }, + { + "epoch": 0.49, + "learning_rate": 1.0379922350352274e-05, + "loss": 0.6613, + "step": 14087 + }, + { + "epoch": 0.49, + "learning_rate": 1.037883426944843e-05, + "loss": 0.6444, + "step": 14088 + }, + { + "epoch": 0.49, + "learning_rate": 1.0377746184053032e-05, + "loss": 0.6317, + "step": 14089 + }, + { + "epoch": 0.49, + "learning_rate": 1.0376658094178973e-05, + "loss": 0.5835, + "step": 14090 + }, + { + "epoch": 0.49, + "learning_rate": 1.0375569999839153e-05, + "loss": 0.6118, + "step": 14091 + }, + { + "epoch": 0.49, + "learning_rate": 1.037448190104648e-05, + "loss": 0.5663, + "step": 14092 + }, + { + "epoch": 0.49, + "learning_rate": 1.0373393797813849e-05, + "loss": 0.6112, + "step": 14093 + }, + { + "epoch": 0.49, + "learning_rate": 1.0372305690154159e-05, + "loss": 0.6616, + "step": 14094 + }, + { + "epoch": 0.49, + "learning_rate": 1.0371217578080316e-05, + "loss": 0.6521, + "step": 14095 + }, + { + "epoch": 0.49, + "learning_rate": 1.0370129461605223e-05, + "loss": 0.6408, + "step": 14096 + }, + { + "epoch": 0.49, + "learning_rate": 1.036904134074177e-05, + "loss": 0.7004, + "step": 14097 + }, + { + "epoch": 0.49, + "learning_rate": 1.036795321550287e-05, + "loss": 0.6609, + "step": 14098 + }, + { + "epoch": 0.49, + "learning_rate": 1.036686508590142e-05, + "loss": 0.6985, + "step": 14099 + }, + { + "epoch": 0.49, + "learning_rate": 1.0365776951950315e-05, + "loss": 0.6153, + "step": 14100 + }, + { + "epoch": 0.49, + "learning_rate": 1.0364688813662464e-05, + "loss": 0.6448, + "step": 14101 + }, + { + "epoch": 0.49, + "learning_rate": 1.0363600671050768e-05, + "loss": 0.6472, + "step": 14102 + }, + { + "epoch": 0.49, + "learning_rate": 1.0362512524128123e-05, + "loss": 0.6471, + "step": 14103 + }, + { + "epoch": 0.49, + "learning_rate": 1.0361424372907435e-05, + "loss": 0.567, + "step": 14104 + }, + { + "epoch": 0.49, + "learning_rate": 1.0360336217401606e-05, + "loss": 0.6206, + "step": 14105 + }, + { + "epoch": 0.49, + "learning_rate": 1.035924805762353e-05, + "loss": 0.5929, + "step": 14106 + }, + { + "epoch": 0.49, + "learning_rate": 1.035815989358612e-05, + "loss": 0.6364, + "step": 14107 + }, + { + "epoch": 0.49, + "learning_rate": 1.0357071725302268e-05, + "loss": 0.6043, + "step": 14108 + }, + { + "epoch": 0.49, + "learning_rate": 1.0355983552784876e-05, + "loss": 0.6118, + "step": 14109 + }, + { + "epoch": 0.49, + "learning_rate": 1.0354895376046854e-05, + "loss": 0.6908, + "step": 14110 + }, + { + "epoch": 0.49, + "learning_rate": 1.0353807195101098e-05, + "loss": 0.5775, + "step": 14111 + }, + { + "epoch": 0.49, + "learning_rate": 1.0352719009960508e-05, + "loss": 0.6707, + "step": 14112 + }, + { + "epoch": 0.49, + "learning_rate": 1.0351630820637987e-05, + "loss": 0.643, + "step": 14113 + }, + { + "epoch": 0.49, + "learning_rate": 1.035054262714644e-05, + "loss": 0.6315, + "step": 14114 + }, + { + "epoch": 0.49, + "learning_rate": 1.0349454429498766e-05, + "loss": 0.6064, + "step": 14115 + }, + { + "epoch": 0.49, + "learning_rate": 1.0348366227707867e-05, + "loss": 0.6262, + "step": 14116 + }, + { + "epoch": 0.49, + "learning_rate": 1.0347278021786646e-05, + "loss": 0.6346, + "step": 14117 + }, + { + "epoch": 0.49, + "learning_rate": 1.0346189811748007e-05, + "loss": 0.6543, + "step": 14118 + }, + { + "epoch": 0.49, + "learning_rate": 1.0345101597604846e-05, + "loss": 0.6004, + "step": 14119 + }, + { + "epoch": 0.49, + "learning_rate": 1.0344013379370072e-05, + "loss": 0.6166, + "step": 14120 + }, + { + "epoch": 0.49, + "learning_rate": 1.0342925157056582e-05, + "loss": 0.6356, + "step": 14121 + }, + { + "epoch": 0.49, + "learning_rate": 1.034183693067728e-05, + "loss": 0.6298, + "step": 14122 + }, + { + "epoch": 0.49, + "learning_rate": 1.0340748700245074e-05, + "loss": 0.685, + "step": 14123 + }, + { + "epoch": 0.49, + "learning_rate": 1.0339660465772856e-05, + "loss": 0.6713, + "step": 14124 + }, + { + "epoch": 0.49, + "learning_rate": 1.0338572227273534e-05, + "loss": 0.6424, + "step": 14125 + }, + { + "epoch": 0.49, + "learning_rate": 1.0337483984760012e-05, + "loss": 0.662, + "step": 14126 + }, + { + "epoch": 0.49, + "learning_rate": 1.0336395738245188e-05, + "loss": 0.6023, + "step": 14127 + }, + { + "epoch": 0.49, + "learning_rate": 1.0335307487741968e-05, + "loss": 0.6508, + "step": 14128 + }, + { + "epoch": 0.49, + "learning_rate": 1.0334219233263257e-05, + "loss": 0.608, + "step": 14129 + }, + { + "epoch": 0.49, + "learning_rate": 1.0333130974821948e-05, + "loss": 0.6381, + "step": 14130 + }, + { + "epoch": 0.49, + "learning_rate": 1.0332042712430952e-05, + "loss": 0.6287, + "step": 14131 + }, + { + "epoch": 0.49, + "learning_rate": 1.0330954446103172e-05, + "loss": 0.6146, + "step": 14132 + }, + { + "epoch": 0.49, + "learning_rate": 1.0329866175851507e-05, + "loss": 0.7095, + "step": 14133 + }, + { + "epoch": 0.49, + "learning_rate": 1.032877790168886e-05, + "loss": 0.5877, + "step": 14134 + }, + { + "epoch": 0.49, + "learning_rate": 1.0327689623628139e-05, + "loss": 0.6407, + "step": 14135 + }, + { + "epoch": 0.49, + "learning_rate": 1.0326601341682238e-05, + "loss": 0.5947, + "step": 14136 + }, + { + "epoch": 0.49, + "learning_rate": 1.0325513055864068e-05, + "loss": 0.6704, + "step": 14137 + }, + { + "epoch": 0.49, + "learning_rate": 1.0324424766186527e-05, + "loss": 0.5956, + "step": 14138 + }, + { + "epoch": 0.49, + "learning_rate": 1.0323336472662521e-05, + "loss": 0.674, + "step": 14139 + }, + { + "epoch": 0.49, + "learning_rate": 1.0322248175304951e-05, + "loss": 0.6373, + "step": 14140 + }, + { + "epoch": 0.49, + "learning_rate": 1.0321159874126726e-05, + "loss": 0.6505, + "step": 14141 + }, + { + "epoch": 0.49, + "learning_rate": 1.032007156914074e-05, + "loss": 0.6687, + "step": 14142 + }, + { + "epoch": 0.49, + "learning_rate": 1.0318983260359902e-05, + "loss": 0.6339, + "step": 14143 + }, + { + "epoch": 0.49, + "learning_rate": 1.0317894947797113e-05, + "loss": 0.6528, + "step": 14144 + }, + { + "epoch": 0.49, + "learning_rate": 1.0316806631465277e-05, + "loss": 0.594, + "step": 14145 + }, + { + "epoch": 0.49, + "learning_rate": 1.0315718311377298e-05, + "loss": 0.6113, + "step": 14146 + }, + { + "epoch": 0.49, + "learning_rate": 1.031462998754608e-05, + "loss": 0.6321, + "step": 14147 + }, + { + "epoch": 0.49, + "learning_rate": 1.0313541659984523e-05, + "loss": 0.6829, + "step": 14148 + }, + { + "epoch": 0.49, + "learning_rate": 1.0312453328705536e-05, + "loss": 0.5906, + "step": 14149 + }, + { + "epoch": 0.49, + "learning_rate": 1.0311364993722019e-05, + "loss": 0.6104, + "step": 14150 + }, + { + "epoch": 0.49, + "learning_rate": 1.0310276655046873e-05, + "loss": 0.6161, + "step": 14151 + }, + { + "epoch": 0.49, + "learning_rate": 1.030918831269301e-05, + "loss": 0.6145, + "step": 14152 + }, + { + "epoch": 0.49, + "learning_rate": 1.0308099966673323e-05, + "loss": 0.6475, + "step": 14153 + }, + { + "epoch": 0.49, + "learning_rate": 1.0307011617000723e-05, + "loss": 0.684, + "step": 14154 + }, + { + "epoch": 0.49, + "learning_rate": 1.0305923263688116e-05, + "loss": 0.6269, + "step": 14155 + }, + { + "epoch": 0.49, + "learning_rate": 1.0304834906748397e-05, + "loss": 0.6442, + "step": 14156 + }, + { + "epoch": 0.49, + "learning_rate": 1.0303746546194475e-05, + "loss": 0.6646, + "step": 14157 + }, + { + "epoch": 0.49, + "learning_rate": 1.0302658182039256e-05, + "loss": 0.6239, + "step": 14158 + }, + { + "epoch": 0.49, + "learning_rate": 1.030156981429564e-05, + "loss": 0.5904, + "step": 14159 + }, + { + "epoch": 0.49, + "learning_rate": 1.0300481442976531e-05, + "loss": 0.6186, + "step": 14160 + }, + { + "epoch": 0.49, + "learning_rate": 1.0299393068094836e-05, + "loss": 0.6213, + "step": 14161 + }, + { + "epoch": 0.49, + "learning_rate": 1.0298304689663457e-05, + "loss": 0.5326, + "step": 14162 + }, + { + "epoch": 0.49, + "learning_rate": 1.0297216307695297e-05, + "loss": 0.6033, + "step": 14163 + }, + { + "epoch": 0.49, + "learning_rate": 1.0296127922203266e-05, + "loss": 0.6596, + "step": 14164 + }, + { + "epoch": 0.49, + "learning_rate": 1.029503953320026e-05, + "loss": 0.6443, + "step": 14165 + }, + { + "epoch": 0.49, + "learning_rate": 1.0293951140699187e-05, + "loss": 0.617, + "step": 14166 + }, + { + "epoch": 0.49, + "learning_rate": 1.0292862744712955e-05, + "loss": 0.6583, + "step": 14167 + }, + { + "epoch": 0.49, + "learning_rate": 1.0291774345254462e-05, + "loss": 0.5442, + "step": 14168 + }, + { + "epoch": 0.49, + "learning_rate": 1.0290685942336614e-05, + "loss": 0.6071, + "step": 14169 + }, + { + "epoch": 0.49, + "learning_rate": 1.0289597535972317e-05, + "loss": 0.6174, + "step": 14170 + }, + { + "epoch": 0.49, + "learning_rate": 1.0288509126174478e-05, + "loss": 0.6008, + "step": 14171 + }, + { + "epoch": 0.49, + "learning_rate": 1.0287420712955994e-05, + "loss": 0.6568, + "step": 14172 + }, + { + "epoch": 0.49, + "learning_rate": 1.0286332296329777e-05, + "loss": 0.5977, + "step": 14173 + }, + { + "epoch": 0.49, + "learning_rate": 1.0285243876308729e-05, + "loss": 0.6735, + "step": 14174 + }, + { + "epoch": 0.49, + "learning_rate": 1.0284155452905748e-05, + "loss": 0.6427, + "step": 14175 + }, + { + "epoch": 0.49, + "learning_rate": 1.0283067026133751e-05, + "loss": 0.6732, + "step": 14176 + }, + { + "epoch": 0.49, + "learning_rate": 1.0281978596005635e-05, + "loss": 0.6386, + "step": 14177 + }, + { + "epoch": 0.49, + "learning_rate": 1.0280890162534302e-05, + "loss": 0.6206, + "step": 14178 + }, + { + "epoch": 0.49, + "learning_rate": 1.0279801725732668e-05, + "loss": 0.6374, + "step": 14179 + }, + { + "epoch": 0.49, + "learning_rate": 1.0278713285613626e-05, + "loss": 0.6468, + "step": 14180 + }, + { + "epoch": 0.49, + "learning_rate": 1.0277624842190084e-05, + "loss": 0.6149, + "step": 14181 + }, + { + "epoch": 0.49, + "learning_rate": 1.0276536395474952e-05, + "loss": 0.617, + "step": 14182 + }, + { + "epoch": 0.49, + "learning_rate": 1.0275447945481132e-05, + "loss": 0.6007, + "step": 14183 + }, + { + "epoch": 0.49, + "learning_rate": 1.0274359492221522e-05, + "loss": 0.588, + "step": 14184 + }, + { + "epoch": 0.49, + "learning_rate": 1.0273271035709038e-05, + "loss": 0.5834, + "step": 14185 + }, + { + "epoch": 0.49, + "learning_rate": 1.027218257595658e-05, + "loss": 0.6129, + "step": 14186 + }, + { + "epoch": 0.49, + "learning_rate": 1.0271094112977049e-05, + "loss": 0.5998, + "step": 14187 + }, + { + "epoch": 0.49, + "learning_rate": 1.0270005646783361e-05, + "loss": 0.6228, + "step": 14188 + }, + { + "epoch": 0.49, + "learning_rate": 1.026891717738841e-05, + "loss": 0.6286, + "step": 14189 + }, + { + "epoch": 0.49, + "learning_rate": 1.0267828704805106e-05, + "loss": 0.6805, + "step": 14190 + }, + { + "epoch": 0.49, + "learning_rate": 1.0266740229046354e-05, + "loss": 0.6399, + "step": 14191 + }, + { + "epoch": 0.49, + "learning_rate": 1.0265651750125063e-05, + "loss": 0.5576, + "step": 14192 + }, + { + "epoch": 0.49, + "learning_rate": 1.0264563268054129e-05, + "loss": 0.6188, + "step": 14193 + }, + { + "epoch": 0.49, + "learning_rate": 1.0263474782846466e-05, + "loss": 0.6553, + "step": 14194 + }, + { + "epoch": 0.49, + "learning_rate": 1.0262386294514977e-05, + "loss": 0.6794, + "step": 14195 + }, + { + "epoch": 0.49, + "learning_rate": 1.026129780307256e-05, + "loss": 0.6024, + "step": 14196 + }, + { + "epoch": 0.49, + "learning_rate": 1.0260209308532134e-05, + "loss": 0.6641, + "step": 14197 + }, + { + "epoch": 0.49, + "learning_rate": 1.0259120810906597e-05, + "loss": 0.6601, + "step": 14198 + }, + { + "epoch": 0.49, + "learning_rate": 1.0258032310208852e-05, + "loss": 0.6242, + "step": 14199 + }, + { + "epoch": 0.49, + "learning_rate": 1.025694380645181e-05, + "loss": 0.6437, + "step": 14200 + }, + { + "epoch": 0.49, + "learning_rate": 1.0255855299648374e-05, + "loss": 0.6112, + "step": 14201 + }, + { + "epoch": 0.49, + "learning_rate": 1.0254766789811446e-05, + "loss": 0.6684, + "step": 14202 + }, + { + "epoch": 0.49, + "learning_rate": 1.025367827695394e-05, + "loss": 0.6396, + "step": 14203 + }, + { + "epoch": 0.49, + "learning_rate": 1.0252589761088757e-05, + "loss": 0.6494, + "step": 14204 + }, + { + "epoch": 0.49, + "learning_rate": 1.0251501242228801e-05, + "loss": 0.6465, + "step": 14205 + }, + { + "epoch": 0.49, + "learning_rate": 1.0250412720386977e-05, + "loss": 0.6368, + "step": 14206 + }, + { + "epoch": 0.49, + "learning_rate": 1.0249324195576198e-05, + "loss": 0.6628, + "step": 14207 + }, + { + "epoch": 0.49, + "learning_rate": 1.0248235667809363e-05, + "loss": 0.6429, + "step": 14208 + }, + { + "epoch": 0.49, + "learning_rate": 1.024714713709938e-05, + "loss": 0.5724, + "step": 14209 + }, + { + "epoch": 0.49, + "learning_rate": 1.0246058603459157e-05, + "loss": 0.6376, + "step": 14210 + }, + { + "epoch": 0.49, + "learning_rate": 1.0244970066901597e-05, + "loss": 0.6494, + "step": 14211 + }, + { + "epoch": 0.49, + "learning_rate": 1.0243881527439605e-05, + "loss": 0.6358, + "step": 14212 + }, + { + "epoch": 0.49, + "learning_rate": 1.0242792985086091e-05, + "loss": 0.6258, + "step": 14213 + }, + { + "epoch": 0.49, + "learning_rate": 1.0241704439853959e-05, + "loss": 0.6759, + "step": 14214 + }, + { + "epoch": 0.49, + "learning_rate": 1.0240615891756113e-05, + "loss": 0.6443, + "step": 14215 + }, + { + "epoch": 0.49, + "learning_rate": 1.0239527340805466e-05, + "loss": 0.6298, + "step": 14216 + }, + { + "epoch": 0.49, + "learning_rate": 1.0238438787014916e-05, + "loss": 0.6055, + "step": 14217 + }, + { + "epoch": 0.49, + "learning_rate": 1.023735023039737e-05, + "loss": 0.6967, + "step": 14218 + }, + { + "epoch": 0.49, + "learning_rate": 1.0236261670965742e-05, + "loss": 0.6275, + "step": 14219 + }, + { + "epoch": 0.49, + "learning_rate": 1.023517310873293e-05, + "loss": 0.614, + "step": 14220 + }, + { + "epoch": 0.49, + "learning_rate": 1.0234084543711843e-05, + "loss": 0.654, + "step": 14221 + }, + { + "epoch": 0.49, + "learning_rate": 1.023299597591539e-05, + "loss": 0.6679, + "step": 14222 + }, + { + "epoch": 0.49, + "learning_rate": 1.0231907405356474e-05, + "loss": 0.6493, + "step": 14223 + }, + { + "epoch": 0.49, + "learning_rate": 1.0230818832047999e-05, + "loss": 0.6303, + "step": 14224 + }, + { + "epoch": 0.49, + "learning_rate": 1.0229730256002881e-05, + "loss": 0.6201, + "step": 14225 + }, + { + "epoch": 0.49, + "learning_rate": 1.0228641677234015e-05, + "loss": 0.6403, + "step": 14226 + }, + { + "epoch": 0.49, + "learning_rate": 1.0227553095754315e-05, + "loss": 0.5952, + "step": 14227 + }, + { + "epoch": 0.49, + "learning_rate": 1.0226464511576686e-05, + "loss": 0.6579, + "step": 14228 + }, + { + "epoch": 0.49, + "learning_rate": 1.0225375924714031e-05, + "loss": 0.6448, + "step": 14229 + }, + { + "epoch": 0.49, + "learning_rate": 1.0224287335179261e-05, + "loss": 0.6036, + "step": 14230 + }, + { + "epoch": 0.49, + "learning_rate": 1.022319874298528e-05, + "loss": 0.6498, + "step": 14231 + }, + { + "epoch": 0.49, + "learning_rate": 1.0222110148144998e-05, + "loss": 0.6534, + "step": 14232 + }, + { + "epoch": 0.49, + "learning_rate": 1.0221021550671315e-05, + "loss": 0.6513, + "step": 14233 + }, + { + "epoch": 0.49, + "learning_rate": 1.0219932950577148e-05, + "loss": 0.643, + "step": 14234 + }, + { + "epoch": 0.49, + "learning_rate": 1.0218844347875391e-05, + "loss": 0.6684, + "step": 14235 + }, + { + "epoch": 0.49, + "learning_rate": 1.0217755742578963e-05, + "loss": 0.6158, + "step": 14236 + }, + { + "epoch": 0.49, + "learning_rate": 1.0216667134700763e-05, + "loss": 0.605, + "step": 14237 + }, + { + "epoch": 0.49, + "learning_rate": 1.0215578524253698e-05, + "loss": 0.6328, + "step": 14238 + }, + { + "epoch": 0.49, + "learning_rate": 1.021448991125068e-05, + "loss": 0.6793, + "step": 14239 + }, + { + "epoch": 0.49, + "learning_rate": 1.021340129570461e-05, + "loss": 0.6477, + "step": 14240 + }, + { + "epoch": 0.49, + "learning_rate": 1.0212312677628399e-05, + "loss": 0.6496, + "step": 14241 + }, + { + "epoch": 0.49, + "learning_rate": 1.0211224057034954e-05, + "loss": 0.6061, + "step": 14242 + }, + { + "epoch": 0.49, + "learning_rate": 1.0210135433937178e-05, + "loss": 0.6116, + "step": 14243 + }, + { + "epoch": 0.49, + "learning_rate": 1.0209046808347983e-05, + "loss": 0.6327, + "step": 14244 + }, + { + "epoch": 0.49, + "learning_rate": 1.0207958180280273e-05, + "loss": 0.629, + "step": 14245 + }, + { + "epoch": 0.49, + "learning_rate": 1.0206869549746953e-05, + "loss": 0.6181, + "step": 14246 + }, + { + "epoch": 0.49, + "learning_rate": 1.0205780916760937e-05, + "loss": 0.6604, + "step": 14247 + }, + { + "epoch": 0.49, + "learning_rate": 1.0204692281335126e-05, + "loss": 0.6095, + "step": 14248 + }, + { + "epoch": 0.49, + "learning_rate": 1.0203603643482429e-05, + "loss": 0.606, + "step": 14249 + }, + { + "epoch": 0.49, + "learning_rate": 1.020251500321575e-05, + "loss": 0.5874, + "step": 14250 + }, + { + "epoch": 0.49, + "learning_rate": 1.0201426360548005e-05, + "loss": 0.6236, + "step": 14251 + }, + { + "epoch": 0.49, + "learning_rate": 1.0200337715492094e-05, + "loss": 0.6173, + "step": 14252 + }, + { + "epoch": 0.49, + "learning_rate": 1.0199249068060923e-05, + "loss": 0.6142, + "step": 14253 + }, + { + "epoch": 0.49, + "learning_rate": 1.019816041826741e-05, + "loss": 0.6341, + "step": 14254 + }, + { + "epoch": 0.49, + "learning_rate": 1.0197071766124447e-05, + "loss": 0.6715, + "step": 14255 + }, + { + "epoch": 0.49, + "learning_rate": 1.019598311164495e-05, + "loss": 0.6577, + "step": 14256 + }, + { + "epoch": 0.49, + "learning_rate": 1.0194894454841829e-05, + "loss": 0.6367, + "step": 14257 + }, + { + "epoch": 0.49, + "learning_rate": 1.0193805795727983e-05, + "loss": 0.6122, + "step": 14258 + }, + { + "epoch": 0.49, + "learning_rate": 1.0192717134316325e-05, + "loss": 0.6568, + "step": 14259 + }, + { + "epoch": 0.49, + "learning_rate": 1.0191628470619765e-05, + "loss": 0.6435, + "step": 14260 + }, + { + "epoch": 0.49, + "learning_rate": 1.0190539804651203e-05, + "loss": 0.671, + "step": 14261 + }, + { + "epoch": 0.49, + "learning_rate": 1.0189451136423552e-05, + "loss": 0.6483, + "step": 14262 + }, + { + "epoch": 0.49, + "learning_rate": 1.0188362465949719e-05, + "loss": 0.6661, + "step": 14263 + }, + { + "epoch": 0.49, + "learning_rate": 1.018727379324261e-05, + "loss": 0.5965, + "step": 14264 + }, + { + "epoch": 0.49, + "learning_rate": 1.0186185118315132e-05, + "loss": 0.6336, + "step": 14265 + }, + { + "epoch": 0.49, + "learning_rate": 1.0185096441180198e-05, + "loss": 0.6746, + "step": 14266 + }, + { + "epoch": 0.49, + "learning_rate": 1.018400776185071e-05, + "loss": 0.633, + "step": 14267 + }, + { + "epoch": 0.49, + "learning_rate": 1.0182919080339575e-05, + "loss": 0.6058, + "step": 14268 + }, + { + "epoch": 0.49, + "learning_rate": 1.0181830396659705e-05, + "loss": 0.6331, + "step": 14269 + }, + { + "epoch": 0.49, + "learning_rate": 1.0180741710824004e-05, + "loss": 0.5502, + "step": 14270 + }, + { + "epoch": 0.49, + "learning_rate": 1.0179653022845381e-05, + "loss": 0.6438, + "step": 14271 + }, + { + "epoch": 0.49, + "learning_rate": 1.0178564332736747e-05, + "loss": 0.5867, + "step": 14272 + }, + { + "epoch": 0.49, + "learning_rate": 1.0177475640511006e-05, + "loss": 0.6337, + "step": 14273 + }, + { + "epoch": 0.49, + "learning_rate": 1.0176386946181062e-05, + "loss": 0.6395, + "step": 14274 + }, + { + "epoch": 0.49, + "learning_rate": 1.0175298249759835e-05, + "loss": 0.649, + "step": 14275 + }, + { + "epoch": 0.49, + "learning_rate": 1.017420955126022e-05, + "loss": 0.616, + "step": 14276 + }, + { + "epoch": 0.49, + "learning_rate": 1.0173120850695132e-05, + "loss": 0.594, + "step": 14277 + }, + { + "epoch": 0.49, + "learning_rate": 1.017203214807748e-05, + "loss": 0.6655, + "step": 14278 + }, + { + "epoch": 0.49, + "learning_rate": 1.0170943443420168e-05, + "loss": 0.5961, + "step": 14279 + }, + { + "epoch": 0.49, + "learning_rate": 1.0169854736736103e-05, + "loss": 0.5546, + "step": 14280 + }, + { + "epoch": 0.49, + "learning_rate": 1.0168766028038197e-05, + "loss": 0.6158, + "step": 14281 + }, + { + "epoch": 0.49, + "learning_rate": 1.0167677317339355e-05, + "loss": 0.6491, + "step": 14282 + }, + { + "epoch": 0.49, + "learning_rate": 1.0166588604652488e-05, + "loss": 0.631, + "step": 14283 + }, + { + "epoch": 0.49, + "learning_rate": 1.0165499889990503e-05, + "loss": 0.5973, + "step": 14284 + }, + { + "epoch": 0.49, + "learning_rate": 1.0164411173366305e-05, + "loss": 0.6228, + "step": 14285 + }, + { + "epoch": 0.49, + "learning_rate": 1.0163322454792803e-05, + "loss": 0.6392, + "step": 14286 + }, + { + "epoch": 0.5, + "learning_rate": 1.0162233734282912e-05, + "loss": 0.6721, + "step": 14287 + }, + { + "epoch": 0.5, + "learning_rate": 1.016114501184953e-05, + "loss": 0.6023, + "step": 14288 + }, + { + "epoch": 0.5, + "learning_rate": 1.016005628750557e-05, + "loss": 0.6532, + "step": 14289 + }, + { + "epoch": 0.5, + "learning_rate": 1.0158967561263946e-05, + "loss": 0.6428, + "step": 14290 + }, + { + "epoch": 0.5, + "learning_rate": 1.0157878833137556e-05, + "loss": 0.5904, + "step": 14291 + }, + { + "epoch": 0.5, + "learning_rate": 1.015679010313931e-05, + "loss": 0.6743, + "step": 14292 + }, + { + "epoch": 0.5, + "learning_rate": 1.0155701371282125e-05, + "loss": 0.594, + "step": 14293 + }, + { + "epoch": 0.5, + "learning_rate": 1.01546126375789e-05, + "loss": 0.6725, + "step": 14294 + }, + { + "epoch": 0.5, + "learning_rate": 1.0153523902042548e-05, + "loss": 0.6545, + "step": 14295 + }, + { + "epoch": 0.5, + "learning_rate": 1.0152435164685977e-05, + "loss": 0.6466, + "step": 14296 + }, + { + "epoch": 0.5, + "learning_rate": 1.015134642552209e-05, + "loss": 0.6234, + "step": 14297 + }, + { + "epoch": 0.5, + "learning_rate": 1.0150257684563804e-05, + "loss": 0.5935, + "step": 14298 + }, + { + "epoch": 0.5, + "learning_rate": 1.0149168941824022e-05, + "loss": 0.6225, + "step": 14299 + }, + { + "epoch": 0.5, + "learning_rate": 1.0148080197315651e-05, + "loss": 0.6116, + "step": 14300 + }, + { + "epoch": 0.5, + "learning_rate": 1.0146991451051604e-05, + "loss": 0.6247, + "step": 14301 + }, + { + "epoch": 0.5, + "learning_rate": 1.0145902703044788e-05, + "loss": 0.6081, + "step": 14302 + }, + { + "epoch": 0.5, + "learning_rate": 1.0144813953308108e-05, + "loss": 0.6317, + "step": 14303 + }, + { + "epoch": 0.5, + "learning_rate": 1.014372520185448e-05, + "loss": 0.6771, + "step": 14304 + }, + { + "epoch": 0.5, + "learning_rate": 1.0142636448696803e-05, + "loss": 0.6132, + "step": 14305 + }, + { + "epoch": 0.5, + "learning_rate": 1.0141547693847992e-05, + "loss": 0.6341, + "step": 14306 + }, + { + "epoch": 0.5, + "learning_rate": 1.0140458937320958e-05, + "loss": 0.6659, + "step": 14307 + }, + { + "epoch": 0.5, + "learning_rate": 1.0139370179128601e-05, + "loss": 0.6558, + "step": 14308 + }, + { + "epoch": 0.5, + "learning_rate": 1.0138281419283835e-05, + "loss": 0.5942, + "step": 14309 + }, + { + "epoch": 0.5, + "learning_rate": 1.0137192657799571e-05, + "loss": 0.6049, + "step": 14310 + }, + { + "epoch": 0.5, + "learning_rate": 1.0136103894688709e-05, + "loss": 0.6065, + "step": 14311 + }, + { + "epoch": 0.5, + "learning_rate": 1.0135015129964168e-05, + "loss": 0.6078, + "step": 14312 + }, + { + "epoch": 0.5, + "learning_rate": 1.0133926363638851e-05, + "loss": 0.6473, + "step": 14313 + }, + { + "epoch": 0.5, + "learning_rate": 1.0132837595725665e-05, + "loss": 0.6344, + "step": 14314 + }, + { + "epoch": 0.5, + "learning_rate": 1.0131748826237522e-05, + "loss": 0.6871, + "step": 14315 + }, + { + "epoch": 0.5, + "learning_rate": 1.013066005518733e-05, + "loss": 0.6406, + "step": 14316 + }, + { + "epoch": 0.5, + "learning_rate": 1.0129571282588e-05, + "loss": 0.6617, + "step": 14317 + }, + { + "epoch": 0.5, + "learning_rate": 1.0128482508452435e-05, + "loss": 0.6405, + "step": 14318 + }, + { + "epoch": 0.5, + "learning_rate": 1.012739373279355e-05, + "loss": 0.6599, + "step": 14319 + }, + { + "epoch": 0.5, + "learning_rate": 1.012630495562425e-05, + "loss": 0.6301, + "step": 14320 + }, + { + "epoch": 0.5, + "learning_rate": 1.0125216176957446e-05, + "loss": 0.5889, + "step": 14321 + }, + { + "epoch": 0.5, + "learning_rate": 1.0124127396806048e-05, + "loss": 0.6571, + "step": 14322 + }, + { + "epoch": 0.5, + "learning_rate": 1.0123038615182959e-05, + "loss": 0.6243, + "step": 14323 + }, + { + "epoch": 0.5, + "learning_rate": 1.0121949832101092e-05, + "loss": 0.6351, + "step": 14324 + }, + { + "epoch": 0.5, + "learning_rate": 1.0120861047573358e-05, + "loss": 0.704, + "step": 14325 + }, + { + "epoch": 0.5, + "learning_rate": 1.0119772261612659e-05, + "loss": 0.6067, + "step": 14326 + }, + { + "epoch": 0.5, + "learning_rate": 1.0118683474231911e-05, + "loss": 0.6304, + "step": 14327 + }, + { + "epoch": 0.5, + "learning_rate": 1.0117594685444021e-05, + "loss": 0.6418, + "step": 14328 + }, + { + "epoch": 0.5, + "learning_rate": 1.01165058952619e-05, + "loss": 0.6265, + "step": 14329 + }, + { + "epoch": 0.5, + "learning_rate": 1.0115417103698447e-05, + "loss": 0.6492, + "step": 14330 + }, + { + "epoch": 0.5, + "learning_rate": 1.0114328310766582e-05, + "loss": 0.5989, + "step": 14331 + }, + { + "epoch": 0.5, + "learning_rate": 1.0113239516479212e-05, + "loss": 0.5833, + "step": 14332 + }, + { + "epoch": 0.5, + "learning_rate": 1.0112150720849239e-05, + "loss": 0.6569, + "step": 14333 + }, + { + "epoch": 0.5, + "learning_rate": 1.0111061923889582e-05, + "loss": 0.6336, + "step": 14334 + }, + { + "epoch": 0.5, + "learning_rate": 1.0109973125613146e-05, + "loss": 0.6327, + "step": 14335 + }, + { + "epoch": 0.5, + "learning_rate": 1.0108884326032834e-05, + "loss": 0.617, + "step": 14336 + }, + { + "epoch": 0.5, + "learning_rate": 1.0107795525161565e-05, + "loss": 0.6322, + "step": 14337 + }, + { + "epoch": 0.5, + "learning_rate": 1.0106706723012246e-05, + "loss": 0.6144, + "step": 14338 + }, + { + "epoch": 0.5, + "learning_rate": 1.0105617919597777e-05, + "loss": 0.6724, + "step": 14339 + }, + { + "epoch": 0.5, + "learning_rate": 1.0104529114931079e-05, + "loss": 0.6715, + "step": 14340 + }, + { + "epoch": 0.5, + "learning_rate": 1.0103440309025056e-05, + "loss": 0.6476, + "step": 14341 + }, + { + "epoch": 0.5, + "learning_rate": 1.0102351501892616e-05, + "loss": 0.694, + "step": 14342 + }, + { + "epoch": 0.5, + "learning_rate": 1.0101262693546668e-05, + "loss": 0.5982, + "step": 14343 + }, + { + "epoch": 0.5, + "learning_rate": 1.0100173884000126e-05, + "loss": 0.6505, + "step": 14344 + }, + { + "epoch": 0.5, + "learning_rate": 1.0099085073265894e-05, + "loss": 0.6528, + "step": 14345 + }, + { + "epoch": 0.5, + "learning_rate": 1.009799626135688e-05, + "loss": 0.6333, + "step": 14346 + }, + { + "epoch": 0.5, + "learning_rate": 1.0096907448286001e-05, + "loss": 0.6289, + "step": 14347 + }, + { + "epoch": 0.5, + "learning_rate": 1.009581863406616e-05, + "loss": 0.5271, + "step": 14348 + }, + { + "epoch": 0.5, + "learning_rate": 1.0094729818710267e-05, + "loss": 0.6871, + "step": 14349 + }, + { + "epoch": 0.5, + "learning_rate": 1.0093641002231235e-05, + "loss": 0.6226, + "step": 14350 + }, + { + "epoch": 0.5, + "learning_rate": 1.0092552184641969e-05, + "loss": 0.6057, + "step": 14351 + }, + { + "epoch": 0.5, + "learning_rate": 1.0091463365955378e-05, + "loss": 0.6424, + "step": 14352 + }, + { + "epoch": 0.5, + "learning_rate": 1.0090374546184376e-05, + "loss": 0.6524, + "step": 14353 + }, + { + "epoch": 0.5, + "learning_rate": 1.0089285725341866e-05, + "loss": 0.6352, + "step": 14354 + }, + { + "epoch": 0.5, + "learning_rate": 1.0088196903440763e-05, + "loss": 0.5802, + "step": 14355 + }, + { + "epoch": 0.5, + "learning_rate": 1.0087108080493975e-05, + "loss": 0.6602, + "step": 14356 + }, + { + "epoch": 0.5, + "learning_rate": 1.0086019256514407e-05, + "loss": 0.6205, + "step": 14357 + }, + { + "epoch": 0.5, + "learning_rate": 1.0084930431514975e-05, + "loss": 0.6405, + "step": 14358 + }, + { + "epoch": 0.5, + "learning_rate": 1.0083841605508586e-05, + "loss": 0.6411, + "step": 14359 + }, + { + "epoch": 0.5, + "learning_rate": 1.0082752778508148e-05, + "loss": 0.6281, + "step": 14360 + }, + { + "epoch": 0.5, + "learning_rate": 1.0081663950526568e-05, + "loss": 0.6148, + "step": 14361 + }, + { + "epoch": 0.5, + "learning_rate": 1.0080575121576761e-05, + "loss": 0.617, + "step": 14362 + }, + { + "epoch": 0.5, + "learning_rate": 1.0079486291671634e-05, + "loss": 0.6497, + "step": 14363 + }, + { + "epoch": 0.5, + "learning_rate": 1.0078397460824096e-05, + "loss": 0.6476, + "step": 14364 + }, + { + "epoch": 0.5, + "learning_rate": 1.0077308629047058e-05, + "loss": 0.6297, + "step": 14365 + }, + { + "epoch": 0.5, + "learning_rate": 1.0076219796353428e-05, + "loss": 0.6908, + "step": 14366 + }, + { + "epoch": 0.5, + "learning_rate": 1.0075130962756115e-05, + "loss": 0.5614, + "step": 14367 + }, + { + "epoch": 0.5, + "learning_rate": 1.007404212826803e-05, + "loss": 0.6123, + "step": 14368 + }, + { + "epoch": 0.5, + "learning_rate": 1.0072953292902082e-05, + "loss": 0.6676, + "step": 14369 + }, + { + "epoch": 0.5, + "learning_rate": 1.0071864456671179e-05, + "loss": 0.5812, + "step": 14370 + }, + { + "epoch": 0.5, + "learning_rate": 1.0070775619588236e-05, + "loss": 0.6192, + "step": 14371 + }, + { + "epoch": 0.5, + "learning_rate": 1.0069686781666156e-05, + "loss": 0.5759, + "step": 14372 + }, + { + "epoch": 0.5, + "learning_rate": 1.0068597942917848e-05, + "loss": 0.6694, + "step": 14373 + }, + { + "epoch": 0.5, + "learning_rate": 1.006750910335623e-05, + "loss": 0.6671, + "step": 14374 + }, + { + "epoch": 0.5, + "learning_rate": 1.0066420262994203e-05, + "loss": 0.6339, + "step": 14375 + }, + { + "epoch": 0.5, + "learning_rate": 1.006533142184468e-05, + "loss": 0.5978, + "step": 14376 + }, + { + "epoch": 0.5, + "learning_rate": 1.0064242579920571e-05, + "loss": 0.6054, + "step": 14377 + }, + { + "epoch": 0.5, + "learning_rate": 1.0063153737234784e-05, + "loss": 0.6203, + "step": 14378 + }, + { + "epoch": 0.5, + "learning_rate": 1.006206489380023e-05, + "loss": 0.6096, + "step": 14379 + }, + { + "epoch": 0.5, + "learning_rate": 1.006097604962982e-05, + "loss": 0.583, + "step": 14380 + }, + { + "epoch": 0.5, + "learning_rate": 1.0059887204736458e-05, + "loss": 0.6662, + "step": 14381 + }, + { + "epoch": 0.5, + "learning_rate": 1.005879835913306e-05, + "loss": 0.6413, + "step": 14382 + }, + { + "epoch": 0.5, + "learning_rate": 1.0057709512832533e-05, + "loss": 0.6244, + "step": 14383 + }, + { + "epoch": 0.5, + "learning_rate": 1.0056620665847788e-05, + "loss": 0.7072, + "step": 14384 + }, + { + "epoch": 0.5, + "learning_rate": 1.005553181819173e-05, + "loss": 0.6486, + "step": 14385 + }, + { + "epoch": 0.5, + "learning_rate": 1.0054442969877276e-05, + "loss": 0.6265, + "step": 14386 + }, + { + "epoch": 0.5, + "learning_rate": 1.0053354120917326e-05, + "loss": 0.6269, + "step": 14387 + }, + { + "epoch": 0.5, + "learning_rate": 1.00522652713248e-05, + "loss": 0.5966, + "step": 14388 + }, + { + "epoch": 0.5, + "learning_rate": 1.0051176421112603e-05, + "loss": 0.6834, + "step": 14389 + }, + { + "epoch": 0.5, + "learning_rate": 1.0050087570293643e-05, + "loss": 0.6106, + "step": 14390 + }, + { + "epoch": 0.5, + "learning_rate": 1.0048998718880834e-05, + "loss": 0.677, + "step": 14391 + }, + { + "epoch": 0.5, + "learning_rate": 1.0047909866887081e-05, + "loss": 0.5819, + "step": 14392 + }, + { + "epoch": 0.5, + "learning_rate": 1.0046821014325297e-05, + "loss": 0.6472, + "step": 14393 + }, + { + "epoch": 0.5, + "learning_rate": 1.004573216120839e-05, + "loss": 0.5778, + "step": 14394 + }, + { + "epoch": 0.5, + "learning_rate": 1.004464330754927e-05, + "loss": 0.5917, + "step": 14395 + }, + { + "epoch": 0.5, + "learning_rate": 1.0043554453360847e-05, + "loss": 0.68, + "step": 14396 + }, + { + "epoch": 0.5, + "learning_rate": 1.0042465598656033e-05, + "loss": 0.6033, + "step": 14397 + }, + { + "epoch": 0.5, + "learning_rate": 1.0041376743447732e-05, + "loss": 0.6473, + "step": 14398 + }, + { + "epoch": 0.5, + "learning_rate": 1.0040287887748861e-05, + "loss": 0.668, + "step": 14399 + }, + { + "epoch": 0.5, + "learning_rate": 1.0039199031572326e-05, + "loss": 0.6483, + "step": 14400 + }, + { + "epoch": 0.5, + "learning_rate": 1.0038110174931035e-05, + "loss": 0.5752, + "step": 14401 + }, + { + "epoch": 0.5, + "learning_rate": 1.0037021317837898e-05, + "loss": 0.5742, + "step": 14402 + }, + { + "epoch": 0.5, + "learning_rate": 1.0035932460305831e-05, + "loss": 0.6958, + "step": 14403 + }, + { + "epoch": 0.5, + "learning_rate": 1.0034843602347735e-05, + "loss": 0.5937, + "step": 14404 + }, + { + "epoch": 0.5, + "learning_rate": 1.0033754743976525e-05, + "loss": 0.6463, + "step": 14405 + }, + { + "epoch": 0.5, + "learning_rate": 1.0032665885205113e-05, + "loss": 0.5964, + "step": 14406 + }, + { + "epoch": 0.5, + "learning_rate": 1.0031577026046401e-05, + "loss": 0.6406, + "step": 14407 + }, + { + "epoch": 0.5, + "learning_rate": 1.0030488166513307e-05, + "loss": 0.6369, + "step": 14408 + }, + { + "epoch": 0.5, + "learning_rate": 1.0029399306618737e-05, + "loss": 0.6658, + "step": 14409 + }, + { + "epoch": 0.5, + "learning_rate": 1.0028310446375598e-05, + "loss": 0.6818, + "step": 14410 + }, + { + "epoch": 0.5, + "learning_rate": 1.0027221585796804e-05, + "loss": 0.6566, + "step": 14411 + }, + { + "epoch": 0.5, + "learning_rate": 1.0026132724895265e-05, + "loss": 0.6225, + "step": 14412 + }, + { + "epoch": 0.5, + "learning_rate": 1.002504386368389e-05, + "loss": 0.6283, + "step": 14413 + }, + { + "epoch": 0.5, + "learning_rate": 1.0023955002175587e-05, + "loss": 0.6394, + "step": 14414 + }, + { + "epoch": 0.5, + "learning_rate": 1.0022866140383267e-05, + "loss": 0.6216, + "step": 14415 + }, + { + "epoch": 0.5, + "learning_rate": 1.0021777278319839e-05, + "loss": 0.7218, + "step": 14416 + }, + { + "epoch": 0.5, + "learning_rate": 1.0020688415998217e-05, + "loss": 0.6324, + "step": 14417 + }, + { + "epoch": 0.5, + "learning_rate": 1.0019599553431308e-05, + "loss": 0.6472, + "step": 14418 + }, + { + "epoch": 0.5, + "learning_rate": 1.0018510690632017e-05, + "loss": 0.6632, + "step": 14419 + }, + { + "epoch": 0.5, + "learning_rate": 1.001742182761326e-05, + "loss": 0.6385, + "step": 14420 + }, + { + "epoch": 0.5, + "learning_rate": 1.0016332964387948e-05, + "loss": 0.6636, + "step": 14421 + }, + { + "epoch": 0.5, + "learning_rate": 1.0015244100968986e-05, + "loss": 0.6804, + "step": 14422 + }, + { + "epoch": 0.5, + "learning_rate": 1.0014155237369283e-05, + "loss": 0.6259, + "step": 14423 + }, + { + "epoch": 0.5, + "learning_rate": 1.0013066373601757e-05, + "loss": 0.6352, + "step": 14424 + }, + { + "epoch": 0.5, + "learning_rate": 1.0011977509679312e-05, + "loss": 0.5801, + "step": 14425 + }, + { + "epoch": 0.5, + "learning_rate": 1.0010888645614853e-05, + "loss": 0.6359, + "step": 14426 + }, + { + "epoch": 0.5, + "learning_rate": 1.0009799781421302e-05, + "loss": 0.6629, + "step": 14427 + }, + { + "epoch": 0.5, + "learning_rate": 1.000871091711156e-05, + "loss": 0.5948, + "step": 14428 + }, + { + "epoch": 0.5, + "learning_rate": 1.0007622052698533e-05, + "loss": 0.673, + "step": 14429 + }, + { + "epoch": 0.5, + "learning_rate": 1.0006533188195144e-05, + "loss": 0.6555, + "step": 14430 + }, + { + "epoch": 0.5, + "learning_rate": 1.0005444323614295e-05, + "loss": 0.6262, + "step": 14431 + }, + { + "epoch": 0.5, + "learning_rate": 1.0004355458968892e-05, + "loss": 0.5915, + "step": 14432 + }, + { + "epoch": 0.5, + "learning_rate": 1.0003266594271856e-05, + "loss": 0.5959, + "step": 14433 + }, + { + "epoch": 0.5, + "learning_rate": 1.0002177729536089e-05, + "loss": 0.6094, + "step": 14434 + }, + { + "epoch": 0.5, + "learning_rate": 1.0001088864774498e-05, + "loss": 0.6435, + "step": 14435 + }, + { + "epoch": 0.5, + "learning_rate": 1e-05, + "loss": 0.5964, + "step": 14436 + }, + { + "epoch": 0.5, + "learning_rate": 9.998911135225503e-06, + "loss": 0.6196, + "step": 14437 + }, + { + "epoch": 0.5, + "learning_rate": 9.997822270463916e-06, + "loss": 0.6596, + "step": 14438 + }, + { + "epoch": 0.5, + "learning_rate": 9.996733405728145e-06, + "loss": 0.6125, + "step": 14439 + }, + { + "epoch": 0.5, + "learning_rate": 9.995644541031106e-06, + "loss": 0.6454, + "step": 14440 + }, + { + "epoch": 0.5, + "learning_rate": 9.994555676385708e-06, + "loss": 0.5861, + "step": 14441 + }, + { + "epoch": 0.5, + "learning_rate": 9.993466811804858e-06, + "loss": 0.6523, + "step": 14442 + }, + { + "epoch": 0.5, + "learning_rate": 9.992377947301467e-06, + "loss": 0.6652, + "step": 14443 + }, + { + "epoch": 0.5, + "learning_rate": 9.991289082888447e-06, + "loss": 0.6316, + "step": 14444 + }, + { + "epoch": 0.5, + "learning_rate": 9.990200218578703e-06, + "loss": 0.6482, + "step": 14445 + }, + { + "epoch": 0.5, + "learning_rate": 9.989111354385149e-06, + "loss": 0.6018, + "step": 14446 + }, + { + "epoch": 0.5, + "learning_rate": 9.988022490320695e-06, + "loss": 0.6747, + "step": 14447 + }, + { + "epoch": 0.5, + "learning_rate": 9.986933626398247e-06, + "loss": 0.6602, + "step": 14448 + }, + { + "epoch": 0.5, + "learning_rate": 9.985844762630717e-06, + "loss": 0.5925, + "step": 14449 + }, + { + "epoch": 0.5, + "learning_rate": 9.984755899031019e-06, + "loss": 0.5598, + "step": 14450 + }, + { + "epoch": 0.5, + "learning_rate": 9.983667035612056e-06, + "loss": 0.6174, + "step": 14451 + }, + { + "epoch": 0.5, + "learning_rate": 9.98257817238674e-06, + "loss": 0.674, + "step": 14452 + }, + { + "epoch": 0.5, + "learning_rate": 9.981489309367987e-06, + "loss": 0.6325, + "step": 14453 + }, + { + "epoch": 0.5, + "learning_rate": 9.980400446568696e-06, + "loss": 0.6354, + "step": 14454 + }, + { + "epoch": 0.5, + "learning_rate": 9.979311584001785e-06, + "loss": 0.6064, + "step": 14455 + }, + { + "epoch": 0.5, + "learning_rate": 9.978222721680163e-06, + "loss": 0.6084, + "step": 14456 + }, + { + "epoch": 0.5, + "learning_rate": 9.977133859616735e-06, + "loss": 0.6178, + "step": 14457 + }, + { + "epoch": 0.5, + "learning_rate": 9.976044997824415e-06, + "loss": 0.5926, + "step": 14458 + }, + { + "epoch": 0.5, + "learning_rate": 9.974956136316112e-06, + "loss": 0.6833, + "step": 14459 + }, + { + "epoch": 0.5, + "learning_rate": 9.973867275104737e-06, + "loss": 0.5931, + "step": 14460 + }, + { + "epoch": 0.5, + "learning_rate": 9.972778414203196e-06, + "loss": 0.6011, + "step": 14461 + }, + { + "epoch": 0.5, + "learning_rate": 9.971689553624403e-06, + "loss": 0.6079, + "step": 14462 + }, + { + "epoch": 0.5, + "learning_rate": 9.970600693381266e-06, + "loss": 0.6535, + "step": 14463 + }, + { + "epoch": 0.5, + "learning_rate": 9.969511833486695e-06, + "loss": 0.663, + "step": 14464 + }, + { + "epoch": 0.5, + "learning_rate": 9.9684229739536e-06, + "loss": 0.6005, + "step": 14465 + }, + { + "epoch": 0.5, + "learning_rate": 9.96733411479489e-06, + "loss": 0.668, + "step": 14466 + }, + { + "epoch": 0.5, + "learning_rate": 9.966245256023475e-06, + "loss": 0.6567, + "step": 14467 + }, + { + "epoch": 0.5, + "learning_rate": 9.965156397652267e-06, + "loss": 0.6447, + "step": 14468 + }, + { + "epoch": 0.5, + "learning_rate": 9.964067539694172e-06, + "loss": 0.6386, + "step": 14469 + }, + { + "epoch": 0.5, + "learning_rate": 9.962978682162105e-06, + "loss": 0.663, + "step": 14470 + }, + { + "epoch": 0.5, + "learning_rate": 9.961889825068968e-06, + "loss": 0.6387, + "step": 14471 + }, + { + "epoch": 0.5, + "learning_rate": 9.960800968427678e-06, + "loss": 0.6515, + "step": 14472 + }, + { + "epoch": 0.5, + "learning_rate": 9.959712112251142e-06, + "loss": 0.6732, + "step": 14473 + }, + { + "epoch": 0.5, + "learning_rate": 9.95862325655227e-06, + "loss": 0.6081, + "step": 14474 + }, + { + "epoch": 0.5, + "learning_rate": 9.95753440134397e-06, + "loss": 0.6725, + "step": 14475 + }, + { + "epoch": 0.5, + "learning_rate": 9.956445546639155e-06, + "loss": 0.6721, + "step": 14476 + }, + { + "epoch": 0.5, + "learning_rate": 9.955356692450733e-06, + "loss": 0.599, + "step": 14477 + }, + { + "epoch": 0.5, + "learning_rate": 9.954267838791612e-06, + "loss": 0.6345, + "step": 14478 + }, + { + "epoch": 0.5, + "learning_rate": 9.953178985674707e-06, + "loss": 0.6217, + "step": 14479 + }, + { + "epoch": 0.5, + "learning_rate": 9.952090133112922e-06, + "loss": 0.6304, + "step": 14480 + }, + { + "epoch": 0.5, + "learning_rate": 9.951001281119167e-06, + "loss": 0.6613, + "step": 14481 + }, + { + "epoch": 0.5, + "learning_rate": 9.949912429706359e-06, + "loss": 0.6128, + "step": 14482 + }, + { + "epoch": 0.5, + "learning_rate": 9.948823578887398e-06, + "loss": 0.5912, + "step": 14483 + }, + { + "epoch": 0.5, + "learning_rate": 9.9477347286752e-06, + "loss": 0.6151, + "step": 14484 + }, + { + "epoch": 0.5, + "learning_rate": 9.946645879082675e-06, + "loss": 0.64, + "step": 14485 + }, + { + "epoch": 0.5, + "learning_rate": 9.945557030122729e-06, + "loss": 0.6723, + "step": 14486 + }, + { + "epoch": 0.5, + "learning_rate": 9.944468181808272e-06, + "loss": 0.625, + "step": 14487 + }, + { + "epoch": 0.5, + "learning_rate": 9.943379334152217e-06, + "loss": 0.5778, + "step": 14488 + }, + { + "epoch": 0.5, + "learning_rate": 9.942290487167468e-06, + "loss": 0.6405, + "step": 14489 + }, + { + "epoch": 0.5, + "learning_rate": 9.94120164086694e-06, + "loss": 0.6057, + "step": 14490 + }, + { + "epoch": 0.5, + "learning_rate": 9.940112795263543e-06, + "loss": 0.6302, + "step": 14491 + }, + { + "epoch": 0.5, + "learning_rate": 9.939023950370183e-06, + "loss": 0.5888, + "step": 14492 + }, + { + "epoch": 0.5, + "learning_rate": 9.93793510619977e-06, + "loss": 0.6217, + "step": 14493 + }, + { + "epoch": 0.5, + "learning_rate": 9.936846262765218e-06, + "loss": 0.6609, + "step": 14494 + }, + { + "epoch": 0.5, + "learning_rate": 9.935757420079432e-06, + "loss": 0.6587, + "step": 14495 + }, + { + "epoch": 0.5, + "learning_rate": 9.934668578155322e-06, + "loss": 0.6141, + "step": 14496 + }, + { + "epoch": 0.5, + "learning_rate": 9.9335797370058e-06, + "loss": 0.5736, + "step": 14497 + }, + { + "epoch": 0.5, + "learning_rate": 9.932490896643773e-06, + "loss": 0.6504, + "step": 14498 + }, + { + "epoch": 0.5, + "learning_rate": 9.931402057082152e-06, + "loss": 0.6797, + "step": 14499 + }, + { + "epoch": 0.5, + "learning_rate": 9.930313218333848e-06, + "loss": 0.635, + "step": 14500 + }, + { + "epoch": 0.5, + "learning_rate": 9.929224380411767e-06, + "loss": 0.6465, + "step": 14501 + }, + { + "epoch": 0.5, + "learning_rate": 9.928135543328821e-06, + "loss": 0.5917, + "step": 14502 + }, + { + "epoch": 0.5, + "learning_rate": 9.92704670709792e-06, + "loss": 0.6649, + "step": 14503 + }, + { + "epoch": 0.5, + "learning_rate": 9.92595787173197e-06, + "loss": 0.648, + "step": 14504 + }, + { + "epoch": 0.5, + "learning_rate": 9.924869037243887e-06, + "loss": 0.6347, + "step": 14505 + }, + { + "epoch": 0.5, + "learning_rate": 9.923780203646575e-06, + "loss": 0.597, + "step": 14506 + }, + { + "epoch": 0.5, + "learning_rate": 9.922691370952944e-06, + "loss": 0.6365, + "step": 14507 + }, + { + "epoch": 0.5, + "learning_rate": 9.921602539175906e-06, + "loss": 0.5844, + "step": 14508 + }, + { + "epoch": 0.5, + "learning_rate": 9.920513708328368e-06, + "loss": 0.6469, + "step": 14509 + }, + { + "epoch": 0.5, + "learning_rate": 9.91942487842324e-06, + "loss": 0.6118, + "step": 14510 + }, + { + "epoch": 0.5, + "learning_rate": 9.918336049473432e-06, + "loss": 0.5715, + "step": 14511 + }, + { + "epoch": 0.5, + "learning_rate": 9.917247221491857e-06, + "loss": 0.6116, + "step": 14512 + }, + { + "epoch": 0.5, + "learning_rate": 9.916158394491418e-06, + "loss": 0.5763, + "step": 14513 + }, + { + "epoch": 0.5, + "learning_rate": 9.915069568485027e-06, + "loss": 0.6082, + "step": 14514 + }, + { + "epoch": 0.5, + "learning_rate": 9.913980743485594e-06, + "loss": 0.602, + "step": 14515 + }, + { + "epoch": 0.5, + "learning_rate": 9.912891919506028e-06, + "loss": 0.5904, + "step": 14516 + }, + { + "epoch": 0.5, + "learning_rate": 9.911803096559239e-06, + "loss": 0.6552, + "step": 14517 + }, + { + "epoch": 0.5, + "learning_rate": 9.910714274658136e-06, + "loss": 0.6089, + "step": 14518 + }, + { + "epoch": 0.5, + "learning_rate": 9.909625453815627e-06, + "loss": 0.6539, + "step": 14519 + }, + { + "epoch": 0.5, + "learning_rate": 9.908536634044624e-06, + "loss": 0.5691, + "step": 14520 + }, + { + "epoch": 0.5, + "learning_rate": 9.907447815358035e-06, + "loss": 0.6198, + "step": 14521 + }, + { + "epoch": 0.5, + "learning_rate": 9.906358997768768e-06, + "loss": 0.6596, + "step": 14522 + }, + { + "epoch": 0.5, + "learning_rate": 9.905270181289733e-06, + "loss": 0.6031, + "step": 14523 + }, + { + "epoch": 0.5, + "learning_rate": 9.904181365933843e-06, + "loss": 0.6013, + "step": 14524 + }, + { + "epoch": 0.5, + "learning_rate": 9.903092551714e-06, + "loss": 0.629, + "step": 14525 + }, + { + "epoch": 0.5, + "learning_rate": 9.90200373864312e-06, + "loss": 0.6538, + "step": 14526 + }, + { + "epoch": 0.5, + "learning_rate": 9.90091492673411e-06, + "loss": 0.6503, + "step": 14527 + }, + { + "epoch": 0.5, + "learning_rate": 9.899826115999877e-06, + "loss": 0.6162, + "step": 14528 + }, + { + "epoch": 0.5, + "learning_rate": 9.898737306453334e-06, + "loss": 0.6299, + "step": 14529 + }, + { + "epoch": 0.5, + "learning_rate": 9.897648498107387e-06, + "loss": 0.6852, + "step": 14530 + }, + { + "epoch": 0.5, + "learning_rate": 9.896559690974947e-06, + "loss": 0.6092, + "step": 14531 + }, + { + "epoch": 0.5, + "learning_rate": 9.895470885068926e-06, + "loss": 0.5865, + "step": 14532 + }, + { + "epoch": 0.5, + "learning_rate": 9.894382080402226e-06, + "loss": 0.6395, + "step": 14533 + }, + { + "epoch": 0.5, + "learning_rate": 9.893293276987758e-06, + "loss": 0.5891, + "step": 14534 + }, + { + "epoch": 0.5, + "learning_rate": 9.89220447483844e-06, + "loss": 0.6695, + "step": 14535 + }, + { + "epoch": 0.5, + "learning_rate": 9.891115673967169e-06, + "loss": 0.6624, + "step": 14536 + }, + { + "epoch": 0.5, + "learning_rate": 9.890026874386856e-06, + "loss": 0.577, + "step": 14537 + }, + { + "epoch": 0.5, + "learning_rate": 9.888938076110423e-06, + "loss": 0.661, + "step": 14538 + }, + { + "epoch": 0.5, + "learning_rate": 9.887849279150764e-06, + "loss": 0.5913, + "step": 14539 + }, + { + "epoch": 0.5, + "learning_rate": 9.886760483520791e-06, + "loss": 0.6459, + "step": 14540 + }, + { + "epoch": 0.5, + "learning_rate": 9.885671689233423e-06, + "loss": 0.6933, + "step": 14541 + }, + { + "epoch": 0.5, + "learning_rate": 9.884582896301556e-06, + "loss": 0.6602, + "step": 14542 + }, + { + "epoch": 0.5, + "learning_rate": 9.883494104738105e-06, + "loss": 0.6041, + "step": 14543 + }, + { + "epoch": 0.5, + "learning_rate": 9.882405314555984e-06, + "loss": 0.6398, + "step": 14544 + }, + { + "epoch": 0.5, + "learning_rate": 9.881316525768092e-06, + "loss": 0.6133, + "step": 14545 + }, + { + "epoch": 0.5, + "learning_rate": 9.880227738387341e-06, + "loss": 0.6455, + "step": 14546 + }, + { + "epoch": 0.5, + "learning_rate": 9.879138952426649e-06, + "loss": 0.6153, + "step": 14547 + }, + { + "epoch": 0.5, + "learning_rate": 9.878050167898911e-06, + "loss": 0.6437, + "step": 14548 + }, + { + "epoch": 0.5, + "learning_rate": 9.876961384817041e-06, + "loss": 0.6763, + "step": 14549 + }, + { + "epoch": 0.5, + "learning_rate": 9.875872603193957e-06, + "loss": 0.6521, + "step": 14550 + }, + { + "epoch": 0.5, + "learning_rate": 9.874783823042556e-06, + "loss": 0.565, + "step": 14551 + }, + { + "epoch": 0.5, + "learning_rate": 9.873695044375749e-06, + "loss": 0.6458, + "step": 14552 + }, + { + "epoch": 0.5, + "learning_rate": 9.872606267206453e-06, + "loss": 0.6755, + "step": 14553 + }, + { + "epoch": 0.5, + "learning_rate": 9.871517491547566e-06, + "loss": 0.6366, + "step": 14554 + }, + { + "epoch": 0.5, + "learning_rate": 9.870428717412001e-06, + "loss": 0.5852, + "step": 14555 + }, + { + "epoch": 0.5, + "learning_rate": 9.869339944812673e-06, + "loss": 0.6154, + "step": 14556 + }, + { + "epoch": 0.5, + "learning_rate": 9.868251173762481e-06, + "loss": 0.61, + "step": 14557 + }, + { + "epoch": 0.5, + "learning_rate": 9.867162404274337e-06, + "loss": 0.6795, + "step": 14558 + }, + { + "epoch": 0.5, + "learning_rate": 9.866073636361155e-06, + "loss": 0.6026, + "step": 14559 + }, + { + "epoch": 0.5, + "learning_rate": 9.864984870035837e-06, + "loss": 0.6724, + "step": 14560 + }, + { + "epoch": 0.5, + "learning_rate": 9.86389610531129e-06, + "loss": 0.6225, + "step": 14561 + }, + { + "epoch": 0.5, + "learning_rate": 9.862807342200436e-06, + "loss": 0.6769, + "step": 14562 + }, + { + "epoch": 0.5, + "learning_rate": 9.861718580716168e-06, + "loss": 0.611, + "step": 14563 + }, + { + "epoch": 0.5, + "learning_rate": 9.860629820871399e-06, + "loss": 0.6158, + "step": 14564 + }, + { + "epoch": 0.5, + "learning_rate": 9.859541062679047e-06, + "loss": 0.6637, + "step": 14565 + }, + { + "epoch": 0.5, + "learning_rate": 9.85845230615201e-06, + "loss": 0.6854, + "step": 14566 + }, + { + "epoch": 0.5, + "learning_rate": 9.857363551303197e-06, + "loss": 0.6237, + "step": 14567 + }, + { + "epoch": 0.5, + "learning_rate": 9.856274798145526e-06, + "loss": 0.6432, + "step": 14568 + }, + { + "epoch": 0.5, + "learning_rate": 9.855186046691895e-06, + "loss": 0.67, + "step": 14569 + }, + { + "epoch": 0.5, + "learning_rate": 9.854097296955212e-06, + "loss": 0.6384, + "step": 14570 + }, + { + "epoch": 0.5, + "learning_rate": 9.8530085489484e-06, + "loss": 0.6221, + "step": 14571 + }, + { + "epoch": 0.5, + "learning_rate": 9.851919802684352e-06, + "loss": 0.6629, + "step": 14572 + }, + { + "epoch": 0.5, + "learning_rate": 9.85083105817598e-06, + "loss": 0.6443, + "step": 14573 + }, + { + "epoch": 0.5, + "learning_rate": 9.849742315436201e-06, + "loss": 0.6317, + "step": 14574 + }, + { + "epoch": 0.5, + "learning_rate": 9.848653574477912e-06, + "loss": 0.6129, + "step": 14575 + }, + { + "epoch": 0.51, + "learning_rate": 9.847564835314025e-06, + "loss": 0.6149, + "step": 14576 + }, + { + "epoch": 0.51, + "learning_rate": 9.846476097957455e-06, + "loss": 0.6387, + "step": 14577 + }, + { + "epoch": 0.51, + "learning_rate": 9.845387362421102e-06, + "loss": 0.6517, + "step": 14578 + }, + { + "epoch": 0.51, + "learning_rate": 9.844298628717875e-06, + "loss": 0.6128, + "step": 14579 + }, + { + "epoch": 0.51, + "learning_rate": 9.843209896860691e-06, + "loss": 0.6061, + "step": 14580 + }, + { + "epoch": 0.51, + "learning_rate": 9.842121166862449e-06, + "loss": 0.685, + "step": 14581 + }, + { + "epoch": 0.51, + "learning_rate": 9.841032438736055e-06, + "loss": 0.585, + "step": 14582 + }, + { + "epoch": 0.51, + "learning_rate": 9.839943712494432e-06, + "loss": 0.6597, + "step": 14583 + }, + { + "epoch": 0.51, + "learning_rate": 9.838854988150472e-06, + "loss": 0.6667, + "step": 14584 + }, + { + "epoch": 0.51, + "learning_rate": 9.83776626571709e-06, + "loss": 0.6645, + "step": 14585 + }, + { + "epoch": 0.51, + "learning_rate": 9.836677545207199e-06, + "loss": 0.6191, + "step": 14586 + }, + { + "epoch": 0.51, + "learning_rate": 9.8355888266337e-06, + "loss": 0.622, + "step": 14587 + }, + { + "epoch": 0.51, + "learning_rate": 9.834500110009499e-06, + "loss": 0.6157, + "step": 14588 + }, + { + "epoch": 0.51, + "learning_rate": 9.833411395347517e-06, + "loss": 0.659, + "step": 14589 + }, + { + "epoch": 0.51, + "learning_rate": 9.832322682660648e-06, + "loss": 0.6266, + "step": 14590 + }, + { + "epoch": 0.51, + "learning_rate": 9.831233971961803e-06, + "loss": 0.6417, + "step": 14591 + }, + { + "epoch": 0.51, + "learning_rate": 9.8301452632639e-06, + "loss": 0.6175, + "step": 14592 + }, + { + "epoch": 0.51, + "learning_rate": 9.829056556579837e-06, + "loss": 0.6736, + "step": 14593 + }, + { + "epoch": 0.51, + "learning_rate": 9.827967851922526e-06, + "loss": 0.639, + "step": 14594 + }, + { + "epoch": 0.51, + "learning_rate": 9.82687914930487e-06, + "loss": 0.5941, + "step": 14595 + }, + { + "epoch": 0.51, + "learning_rate": 9.825790448739781e-06, + "loss": 0.6258, + "step": 14596 + }, + { + "epoch": 0.51, + "learning_rate": 9.82470175024017e-06, + "loss": 0.6018, + "step": 14597 + }, + { + "epoch": 0.51, + "learning_rate": 9.82361305381894e-06, + "loss": 0.5657, + "step": 14598 + }, + { + "epoch": 0.51, + "learning_rate": 9.822524359489e-06, + "loss": 0.6397, + "step": 14599 + }, + { + "epoch": 0.51, + "learning_rate": 9.821435667263258e-06, + "loss": 0.6593, + "step": 14600 + }, + { + "epoch": 0.51, + "learning_rate": 9.820346977154622e-06, + "loss": 0.6024, + "step": 14601 + }, + { + "epoch": 0.51, + "learning_rate": 9.819258289175999e-06, + "loss": 0.6571, + "step": 14602 + }, + { + "epoch": 0.51, + "learning_rate": 9.8181696033403e-06, + "loss": 0.6387, + "step": 14603 + }, + { + "epoch": 0.51, + "learning_rate": 9.817080919660429e-06, + "loss": 0.6102, + "step": 14604 + }, + { + "epoch": 0.51, + "learning_rate": 9.815992238149295e-06, + "loss": 0.6266, + "step": 14605 + }, + { + "epoch": 0.51, + "learning_rate": 9.814903558819805e-06, + "loss": 0.649, + "step": 14606 + }, + { + "epoch": 0.51, + "learning_rate": 9.81381488168487e-06, + "loss": 0.6409, + "step": 14607 + }, + { + "epoch": 0.51, + "learning_rate": 9.812726206757393e-06, + "loss": 0.6208, + "step": 14608 + }, + { + "epoch": 0.51, + "learning_rate": 9.811637534050284e-06, + "loss": 0.6322, + "step": 14609 + }, + { + "epoch": 0.51, + "learning_rate": 9.81054886357645e-06, + "loss": 0.6205, + "step": 14610 + }, + { + "epoch": 0.51, + "learning_rate": 9.809460195348798e-06, + "loss": 0.6741, + "step": 14611 + }, + { + "epoch": 0.51, + "learning_rate": 9.80837152938024e-06, + "loss": 0.6011, + "step": 14612 + }, + { + "epoch": 0.51, + "learning_rate": 9.807282865683677e-06, + "loss": 0.6691, + "step": 14613 + }, + { + "epoch": 0.51, + "learning_rate": 9.80619420427202e-06, + "loss": 0.6331, + "step": 14614 + }, + { + "epoch": 0.51, + "learning_rate": 9.805105545158178e-06, + "loss": 0.6311, + "step": 14615 + }, + { + "epoch": 0.51, + "learning_rate": 9.804016888355053e-06, + "loss": 0.6648, + "step": 14616 + }, + { + "epoch": 0.51, + "learning_rate": 9.802928233875557e-06, + "loss": 0.6106, + "step": 14617 + }, + { + "epoch": 0.51, + "learning_rate": 9.801839581732597e-06, + "loss": 0.6252, + "step": 14618 + }, + { + "epoch": 0.51, + "learning_rate": 9.800750931939079e-06, + "loss": 0.6165, + "step": 14619 + }, + { + "epoch": 0.51, + "learning_rate": 9.79966228450791e-06, + "loss": 0.6671, + "step": 14620 + }, + { + "epoch": 0.51, + "learning_rate": 9.798573639452e-06, + "loss": 0.6481, + "step": 14621 + }, + { + "epoch": 0.51, + "learning_rate": 9.797484996784251e-06, + "loss": 0.6656, + "step": 14622 + }, + { + "epoch": 0.51, + "learning_rate": 9.796396356517574e-06, + "loss": 0.5814, + "step": 14623 + }, + { + "epoch": 0.51, + "learning_rate": 9.795307718664879e-06, + "loss": 0.6701, + "step": 14624 + }, + { + "epoch": 0.51, + "learning_rate": 9.794219083239067e-06, + "loss": 0.6142, + "step": 14625 + }, + { + "epoch": 0.51, + "learning_rate": 9.793130450253048e-06, + "loss": 0.6327, + "step": 14626 + }, + { + "epoch": 0.51, + "learning_rate": 9.792041819719732e-06, + "loss": 0.6063, + "step": 14627 + }, + { + "epoch": 0.51, + "learning_rate": 9.79095319165202e-06, + "loss": 0.6405, + "step": 14628 + }, + { + "epoch": 0.51, + "learning_rate": 9.789864566062824e-06, + "loss": 0.6929, + "step": 14629 + }, + { + "epoch": 0.51, + "learning_rate": 9.788775942965051e-06, + "loss": 0.6551, + "step": 14630 + }, + { + "epoch": 0.51, + "learning_rate": 9.787687322371604e-06, + "loss": 0.6485, + "step": 14631 + }, + { + "epoch": 0.51, + "learning_rate": 9.786598704295392e-06, + "loss": 0.5886, + "step": 14632 + }, + { + "epoch": 0.51, + "learning_rate": 9.785510088749324e-06, + "loss": 0.6315, + "step": 14633 + }, + { + "epoch": 0.51, + "learning_rate": 9.784421475746305e-06, + "loss": 0.6886, + "step": 14634 + }, + { + "epoch": 0.51, + "learning_rate": 9.78333286529924e-06, + "loss": 0.636, + "step": 14635 + }, + { + "epoch": 0.51, + "learning_rate": 9.782244257421042e-06, + "loss": 0.6388, + "step": 14636 + }, + { + "epoch": 0.51, + "learning_rate": 9.78115565212461e-06, + "loss": 0.5824, + "step": 14637 + }, + { + "epoch": 0.51, + "learning_rate": 9.780067049422856e-06, + "loss": 0.603, + "step": 14638 + }, + { + "epoch": 0.51, + "learning_rate": 9.778978449328687e-06, + "loss": 0.6087, + "step": 14639 + }, + { + "epoch": 0.51, + "learning_rate": 9.777889851855006e-06, + "loss": 0.5591, + "step": 14640 + }, + { + "epoch": 0.51, + "learning_rate": 9.776801257014721e-06, + "loss": 0.6743, + "step": 14641 + }, + { + "epoch": 0.51, + "learning_rate": 9.775712664820742e-06, + "loss": 0.6898, + "step": 14642 + }, + { + "epoch": 0.51, + "learning_rate": 9.77462407528597e-06, + "loss": 0.6795, + "step": 14643 + }, + { + "epoch": 0.51, + "learning_rate": 9.773535488423317e-06, + "loss": 0.6879, + "step": 14644 + }, + { + "epoch": 0.51, + "learning_rate": 9.772446904245688e-06, + "loss": 0.6423, + "step": 14645 + }, + { + "epoch": 0.51, + "learning_rate": 9.771358322765987e-06, + "loss": 0.6055, + "step": 14646 + }, + { + "epoch": 0.51, + "learning_rate": 9.770269743997122e-06, + "loss": 0.6475, + "step": 14647 + }, + { + "epoch": 0.51, + "learning_rate": 9.769181167952003e-06, + "loss": 0.6273, + "step": 14648 + }, + { + "epoch": 0.51, + "learning_rate": 9.76809259464353e-06, + "loss": 0.6295, + "step": 14649 + }, + { + "epoch": 0.51, + "learning_rate": 9.767004024084612e-06, + "loss": 0.659, + "step": 14650 + }, + { + "epoch": 0.51, + "learning_rate": 9.76591545628816e-06, + "loss": 0.6461, + "step": 14651 + }, + { + "epoch": 0.51, + "learning_rate": 9.764826891267072e-06, + "loss": 0.6297, + "step": 14652 + }, + { + "epoch": 0.51, + "learning_rate": 9.76373832903426e-06, + "loss": 0.6196, + "step": 14653 + }, + { + "epoch": 0.51, + "learning_rate": 9.76264976960263e-06, + "loss": 0.6212, + "step": 14654 + }, + { + "epoch": 0.51, + "learning_rate": 9.761561212985088e-06, + "loss": 0.7113, + "step": 14655 + }, + { + "epoch": 0.51, + "learning_rate": 9.76047265919454e-06, + "loss": 0.6363, + "step": 14656 + }, + { + "epoch": 0.51, + "learning_rate": 9.759384108243888e-06, + "loss": 0.7063, + "step": 14657 + }, + { + "epoch": 0.51, + "learning_rate": 9.758295560146043e-06, + "loss": 0.5932, + "step": 14658 + }, + { + "epoch": 0.51, + "learning_rate": 9.757207014913914e-06, + "loss": 0.6946, + "step": 14659 + }, + { + "epoch": 0.51, + "learning_rate": 9.756118472560397e-06, + "loss": 0.6272, + "step": 14660 + }, + { + "epoch": 0.51, + "learning_rate": 9.755029933098406e-06, + "loss": 0.6346, + "step": 14661 + }, + { + "epoch": 0.51, + "learning_rate": 9.753941396540848e-06, + "loss": 0.6384, + "step": 14662 + }, + { + "epoch": 0.51, + "learning_rate": 9.752852862900622e-06, + "loss": 0.6941, + "step": 14663 + }, + { + "epoch": 0.51, + "learning_rate": 9.75176433219064e-06, + "loss": 0.6138, + "step": 14664 + }, + { + "epoch": 0.51, + "learning_rate": 9.750675804423807e-06, + "loss": 0.6552, + "step": 14665 + }, + { + "epoch": 0.51, + "learning_rate": 9.749587279613025e-06, + "loss": 0.6726, + "step": 14666 + }, + { + "epoch": 0.51, + "learning_rate": 9.748498757771204e-06, + "loss": 0.5734, + "step": 14667 + }, + { + "epoch": 0.51, + "learning_rate": 9.747410238911248e-06, + "loss": 0.6662, + "step": 14668 + }, + { + "epoch": 0.51, + "learning_rate": 9.746321723046065e-06, + "loss": 0.619, + "step": 14669 + }, + { + "epoch": 0.51, + "learning_rate": 9.745233210188556e-06, + "loss": 0.6619, + "step": 14670 + }, + { + "epoch": 0.51, + "learning_rate": 9.744144700351631e-06, + "loss": 0.6019, + "step": 14671 + }, + { + "epoch": 0.51, + "learning_rate": 9.743056193548194e-06, + "loss": 0.6445, + "step": 14672 + }, + { + "epoch": 0.51, + "learning_rate": 9.74196768979115e-06, + "loss": 0.6211, + "step": 14673 + }, + { + "epoch": 0.51, + "learning_rate": 9.740879189093407e-06, + "loss": 0.6269, + "step": 14674 + }, + { + "epoch": 0.51, + "learning_rate": 9.739790691467868e-06, + "loss": 0.6688, + "step": 14675 + }, + { + "epoch": 0.51, + "learning_rate": 9.738702196927438e-06, + "loss": 0.6497, + "step": 14676 + }, + { + "epoch": 0.51, + "learning_rate": 9.737613705485028e-06, + "loss": 0.6703, + "step": 14677 + }, + { + "epoch": 0.51, + "learning_rate": 9.736525217153538e-06, + "loss": 0.702, + "step": 14678 + }, + { + "epoch": 0.51, + "learning_rate": 9.735436731945873e-06, + "loss": 0.5889, + "step": 14679 + }, + { + "epoch": 0.51, + "learning_rate": 9.734348249874942e-06, + "loss": 0.6538, + "step": 14680 + }, + { + "epoch": 0.51, + "learning_rate": 9.733259770953647e-06, + "loss": 0.656, + "step": 14681 + }, + { + "epoch": 0.51, + "learning_rate": 9.732171295194896e-06, + "loss": 0.6302, + "step": 14682 + }, + { + "epoch": 0.51, + "learning_rate": 9.731082822611595e-06, + "loss": 0.6782, + "step": 14683 + }, + { + "epoch": 0.51, + "learning_rate": 9.729994353216642e-06, + "loss": 0.6403, + "step": 14684 + }, + { + "epoch": 0.51, + "learning_rate": 9.728905887022951e-06, + "loss": 0.6689, + "step": 14685 + }, + { + "epoch": 0.51, + "learning_rate": 9.727817424043425e-06, + "loss": 0.5857, + "step": 14686 + }, + { + "epoch": 0.51, + "learning_rate": 9.726728964290965e-06, + "loss": 0.6475, + "step": 14687 + }, + { + "epoch": 0.51, + "learning_rate": 9.72564050777848e-06, + "loss": 0.6117, + "step": 14688 + }, + { + "epoch": 0.51, + "learning_rate": 9.724552054518875e-06, + "loss": 0.5994, + "step": 14689 + }, + { + "epoch": 0.51, + "learning_rate": 9.723463604525051e-06, + "loss": 0.6295, + "step": 14690 + }, + { + "epoch": 0.51, + "learning_rate": 9.722375157809918e-06, + "loss": 0.5951, + "step": 14691 + }, + { + "epoch": 0.51, + "learning_rate": 9.72128671438638e-06, + "loss": 0.65, + "step": 14692 + }, + { + "epoch": 0.51, + "learning_rate": 9.720198274267335e-06, + "loss": 0.622, + "step": 14693 + }, + { + "epoch": 0.51, + "learning_rate": 9.719109837465698e-06, + "loss": 0.6435, + "step": 14694 + }, + { + "epoch": 0.51, + "learning_rate": 9.718021403994368e-06, + "loss": 0.6224, + "step": 14695 + }, + { + "epoch": 0.51, + "learning_rate": 9.71693297386625e-06, + "loss": 0.6418, + "step": 14696 + }, + { + "epoch": 0.51, + "learning_rate": 9.715844547094252e-06, + "loss": 0.6183, + "step": 14697 + }, + { + "epoch": 0.51, + "learning_rate": 9.714756123691276e-06, + "loss": 0.6598, + "step": 14698 + }, + { + "epoch": 0.51, + "learning_rate": 9.713667703670225e-06, + "loss": 0.6544, + "step": 14699 + }, + { + "epoch": 0.51, + "learning_rate": 9.712579287044008e-06, + "loss": 0.5403, + "step": 14700 + }, + { + "epoch": 0.51, + "learning_rate": 9.711490873825527e-06, + "loss": 0.6384, + "step": 14701 + }, + { + "epoch": 0.51, + "learning_rate": 9.710402464027684e-06, + "loss": 0.6541, + "step": 14702 + }, + { + "epoch": 0.51, + "learning_rate": 9.709314057663388e-06, + "loss": 0.663, + "step": 14703 + }, + { + "epoch": 0.51, + "learning_rate": 9.708225654745543e-06, + "loss": 0.6576, + "step": 14704 + }, + { + "epoch": 0.51, + "learning_rate": 9.707137255287048e-06, + "loss": 0.6134, + "step": 14705 + }, + { + "epoch": 0.51, + "learning_rate": 9.706048859300813e-06, + "loss": 0.6992, + "step": 14706 + }, + { + "epoch": 0.51, + "learning_rate": 9.704960466799744e-06, + "loss": 0.6695, + "step": 14707 + }, + { + "epoch": 0.51, + "learning_rate": 9.703872077796738e-06, + "loss": 0.6668, + "step": 14708 + }, + { + "epoch": 0.51, + "learning_rate": 9.702783692304702e-06, + "loss": 0.6516, + "step": 14709 + }, + { + "epoch": 0.51, + "learning_rate": 9.701695310336545e-06, + "loss": 0.6339, + "step": 14710 + }, + { + "epoch": 0.51, + "learning_rate": 9.700606931905165e-06, + "loss": 0.6413, + "step": 14711 + }, + { + "epoch": 0.51, + "learning_rate": 9.699518557023469e-06, + "loss": 0.66, + "step": 14712 + }, + { + "epoch": 0.51, + "learning_rate": 9.698430185704365e-06, + "loss": 0.6512, + "step": 14713 + }, + { + "epoch": 0.51, + "learning_rate": 9.697341817960745e-06, + "loss": 0.6733, + "step": 14714 + }, + { + "epoch": 0.51, + "learning_rate": 9.696253453805525e-06, + "loss": 0.6065, + "step": 14715 + }, + { + "epoch": 0.51, + "learning_rate": 9.695165093251605e-06, + "loss": 0.6262, + "step": 14716 + }, + { + "epoch": 0.51, + "learning_rate": 9.694076736311887e-06, + "loss": 0.6666, + "step": 14717 + }, + { + "epoch": 0.51, + "learning_rate": 9.692988382999278e-06, + "loss": 0.645, + "step": 14718 + }, + { + "epoch": 0.51, + "learning_rate": 9.691900033326679e-06, + "loss": 0.645, + "step": 14719 + }, + { + "epoch": 0.51, + "learning_rate": 9.690811687306993e-06, + "loss": 0.618, + "step": 14720 + }, + { + "epoch": 0.51, + "learning_rate": 9.689723344953129e-06, + "loss": 0.6263, + "step": 14721 + }, + { + "epoch": 0.51, + "learning_rate": 9.688635006277984e-06, + "loss": 0.611, + "step": 14722 + }, + { + "epoch": 0.51, + "learning_rate": 9.687546671294465e-06, + "loss": 0.5928, + "step": 14723 + }, + { + "epoch": 0.51, + "learning_rate": 9.686458340015479e-06, + "loss": 0.6181, + "step": 14724 + }, + { + "epoch": 0.51, + "learning_rate": 9.685370012453922e-06, + "loss": 0.6287, + "step": 14725 + }, + { + "epoch": 0.51, + "learning_rate": 9.684281688622705e-06, + "loss": 0.6137, + "step": 14726 + }, + { + "epoch": 0.51, + "learning_rate": 9.68319336853473e-06, + "loss": 0.6363, + "step": 14727 + }, + { + "epoch": 0.51, + "learning_rate": 9.68210505220289e-06, + "loss": 0.5927, + "step": 14728 + }, + { + "epoch": 0.51, + "learning_rate": 9.681016739640101e-06, + "loss": 0.6603, + "step": 14729 + }, + { + "epoch": 0.51, + "learning_rate": 9.679928430859267e-06, + "loss": 0.63, + "step": 14730 + }, + { + "epoch": 0.51, + "learning_rate": 9.678840125873278e-06, + "loss": 0.6509, + "step": 14731 + }, + { + "epoch": 0.51, + "learning_rate": 9.677751824695049e-06, + "loss": 0.6565, + "step": 14732 + }, + { + "epoch": 0.51, + "learning_rate": 9.676663527337484e-06, + "loss": 0.6327, + "step": 14733 + }, + { + "epoch": 0.51, + "learning_rate": 9.675575233813475e-06, + "loss": 0.6069, + "step": 14734 + }, + { + "epoch": 0.51, + "learning_rate": 9.674486944135934e-06, + "loss": 0.616, + "step": 14735 + }, + { + "epoch": 0.51, + "learning_rate": 9.673398658317767e-06, + "loss": 0.679, + "step": 14736 + }, + { + "epoch": 0.51, + "learning_rate": 9.672310376371864e-06, + "loss": 0.6205, + "step": 14737 + }, + { + "epoch": 0.51, + "learning_rate": 9.67122209831114e-06, + "loss": 0.6213, + "step": 14738 + }, + { + "epoch": 0.51, + "learning_rate": 9.670133824148498e-06, + "loss": 0.6688, + "step": 14739 + }, + { + "epoch": 0.51, + "learning_rate": 9.66904555389683e-06, + "loss": 0.6048, + "step": 14740 + }, + { + "epoch": 0.51, + "learning_rate": 9.667957287569048e-06, + "loss": 0.6012, + "step": 14741 + }, + { + "epoch": 0.51, + "learning_rate": 9.666869025178057e-06, + "loss": 0.6662, + "step": 14742 + }, + { + "epoch": 0.51, + "learning_rate": 9.665780766736748e-06, + "loss": 0.6301, + "step": 14743 + }, + { + "epoch": 0.51, + "learning_rate": 9.664692512258032e-06, + "loss": 0.6211, + "step": 14744 + }, + { + "epoch": 0.51, + "learning_rate": 9.663604261754817e-06, + "loss": 0.6781, + "step": 14745 + }, + { + "epoch": 0.51, + "learning_rate": 9.662516015239991e-06, + "loss": 0.6432, + "step": 14746 + }, + { + "epoch": 0.51, + "learning_rate": 9.661427772726468e-06, + "loss": 0.6354, + "step": 14747 + }, + { + "epoch": 0.51, + "learning_rate": 9.66033953422715e-06, + "loss": 0.6279, + "step": 14748 + }, + { + "epoch": 0.51, + "learning_rate": 9.65925129975493e-06, + "loss": 0.7499, + "step": 14749 + }, + { + "epoch": 0.51, + "learning_rate": 9.658163069322719e-06, + "loss": 0.621, + "step": 14750 + }, + { + "epoch": 0.51, + "learning_rate": 9.657074842943423e-06, + "loss": 0.6323, + "step": 14751 + }, + { + "epoch": 0.51, + "learning_rate": 9.655986620629931e-06, + "loss": 0.5504, + "step": 14752 + }, + { + "epoch": 0.51, + "learning_rate": 9.654898402395156e-06, + "loss": 0.6585, + "step": 14753 + }, + { + "epoch": 0.51, + "learning_rate": 9.653810188252e-06, + "loss": 0.6097, + "step": 14754 + }, + { + "epoch": 0.51, + "learning_rate": 9.652721978213356e-06, + "loss": 0.6675, + "step": 14755 + }, + { + "epoch": 0.51, + "learning_rate": 9.651633772292133e-06, + "loss": 0.654, + "step": 14756 + }, + { + "epoch": 0.51, + "learning_rate": 9.65054557050124e-06, + "loss": 0.6111, + "step": 14757 + }, + { + "epoch": 0.51, + "learning_rate": 9.649457372853562e-06, + "loss": 0.6188, + "step": 14758 + }, + { + "epoch": 0.51, + "learning_rate": 9.648369179362014e-06, + "loss": 0.6271, + "step": 14759 + }, + { + "epoch": 0.51, + "learning_rate": 9.647280990039499e-06, + "loss": 0.6378, + "step": 14760 + }, + { + "epoch": 0.51, + "learning_rate": 9.646192804898905e-06, + "loss": 0.6642, + "step": 14761 + }, + { + "epoch": 0.51, + "learning_rate": 9.645104623953147e-06, + "loss": 0.6246, + "step": 14762 + }, + { + "epoch": 0.51, + "learning_rate": 9.644016447215127e-06, + "loss": 0.6539, + "step": 14763 + }, + { + "epoch": 0.51, + "learning_rate": 9.642928274697735e-06, + "loss": 0.6239, + "step": 14764 + }, + { + "epoch": 0.51, + "learning_rate": 9.641840106413882e-06, + "loss": 0.6315, + "step": 14765 + }, + { + "epoch": 0.51, + "learning_rate": 9.640751942376474e-06, + "loss": 0.5964, + "step": 14766 + }, + { + "epoch": 0.51, + "learning_rate": 9.639663782598398e-06, + "loss": 0.6681, + "step": 14767 + }, + { + "epoch": 0.51, + "learning_rate": 9.638575627092565e-06, + "loss": 0.6615, + "step": 14768 + }, + { + "epoch": 0.51, + "learning_rate": 9.63748747587188e-06, + "loss": 0.6569, + "step": 14769 + }, + { + "epoch": 0.51, + "learning_rate": 9.636399328949235e-06, + "loss": 0.6536, + "step": 14770 + }, + { + "epoch": 0.51, + "learning_rate": 9.635311186337535e-06, + "loss": 0.6164, + "step": 14771 + }, + { + "epoch": 0.51, + "learning_rate": 9.634223048049688e-06, + "loss": 0.6199, + "step": 14772 + }, + { + "epoch": 0.51, + "learning_rate": 9.633134914098584e-06, + "loss": 0.6165, + "step": 14773 + }, + { + "epoch": 0.51, + "learning_rate": 9.632046784497131e-06, + "loss": 0.5698, + "step": 14774 + }, + { + "epoch": 0.51, + "learning_rate": 9.630958659258233e-06, + "loss": 0.647, + "step": 14775 + }, + { + "epoch": 0.51, + "learning_rate": 9.62987053839478e-06, + "loss": 0.6432, + "step": 14776 + }, + { + "epoch": 0.51, + "learning_rate": 9.628782421919683e-06, + "loss": 0.6597, + "step": 14777 + }, + { + "epoch": 0.51, + "learning_rate": 9.627694309845844e-06, + "loss": 0.6257, + "step": 14778 + }, + { + "epoch": 0.51, + "learning_rate": 9.626606202186155e-06, + "loss": 0.6414, + "step": 14779 + }, + { + "epoch": 0.51, + "learning_rate": 9.625518098953525e-06, + "loss": 0.6715, + "step": 14780 + }, + { + "epoch": 0.51, + "learning_rate": 9.62443000016085e-06, + "loss": 0.6182, + "step": 14781 + }, + { + "epoch": 0.51, + "learning_rate": 9.62334190582103e-06, + "loss": 0.6305, + "step": 14782 + }, + { + "epoch": 0.51, + "learning_rate": 9.622253815946974e-06, + "loss": 0.6659, + "step": 14783 + }, + { + "epoch": 0.51, + "learning_rate": 9.621165730551571e-06, + "loss": 0.6019, + "step": 14784 + }, + { + "epoch": 0.51, + "learning_rate": 9.620077649647728e-06, + "loss": 0.6715, + "step": 14785 + }, + { + "epoch": 0.51, + "learning_rate": 9.61898957324835e-06, + "loss": 0.6827, + "step": 14786 + }, + { + "epoch": 0.51, + "learning_rate": 9.617901501366329e-06, + "loss": 0.6267, + "step": 14787 + }, + { + "epoch": 0.51, + "learning_rate": 9.616813434014567e-06, + "loss": 0.6514, + "step": 14788 + }, + { + "epoch": 0.51, + "learning_rate": 9.615725371205972e-06, + "loss": 0.6904, + "step": 14789 + }, + { + "epoch": 0.51, + "learning_rate": 9.614637312953435e-06, + "loss": 0.6222, + "step": 14790 + }, + { + "epoch": 0.51, + "learning_rate": 9.61354925926986e-06, + "loss": 0.6448, + "step": 14791 + }, + { + "epoch": 0.51, + "learning_rate": 9.61246121016815e-06, + "loss": 0.5713, + "step": 14792 + }, + { + "epoch": 0.51, + "learning_rate": 9.611373165661201e-06, + "loss": 0.5277, + "step": 14793 + }, + { + "epoch": 0.51, + "learning_rate": 9.610285125761911e-06, + "loss": 0.6271, + "step": 14794 + }, + { + "epoch": 0.51, + "learning_rate": 9.609197090483193e-06, + "loss": 0.6609, + "step": 14795 + }, + { + "epoch": 0.51, + "learning_rate": 9.608109059837931e-06, + "loss": 0.6346, + "step": 14796 + }, + { + "epoch": 0.51, + "learning_rate": 9.60702103383903e-06, + "loss": 0.6351, + "step": 14797 + }, + { + "epoch": 0.51, + "learning_rate": 9.605933012499398e-06, + "loss": 0.6518, + "step": 14798 + }, + { + "epoch": 0.51, + "learning_rate": 9.604844995831925e-06, + "loss": 0.6238, + "step": 14799 + }, + { + "epoch": 0.51, + "learning_rate": 9.603756983849513e-06, + "loss": 0.6296, + "step": 14800 + }, + { + "epoch": 0.51, + "learning_rate": 9.602668976565069e-06, + "loss": 0.683, + "step": 14801 + }, + { + "epoch": 0.51, + "learning_rate": 9.601580973991482e-06, + "loss": 0.6815, + "step": 14802 + }, + { + "epoch": 0.51, + "learning_rate": 9.600492976141655e-06, + "loss": 0.6441, + "step": 14803 + }, + { + "epoch": 0.51, + "learning_rate": 9.599404983028496e-06, + "loss": 0.6384, + "step": 14804 + }, + { + "epoch": 0.51, + "learning_rate": 9.598316994664893e-06, + "loss": 0.6328, + "step": 14805 + }, + { + "epoch": 0.51, + "learning_rate": 9.597229011063747e-06, + "loss": 0.6581, + "step": 14806 + }, + { + "epoch": 0.51, + "learning_rate": 9.596141032237969e-06, + "loss": 0.6856, + "step": 14807 + }, + { + "epoch": 0.51, + "learning_rate": 9.595053058200444e-06, + "loss": 0.6334, + "step": 14808 + }, + { + "epoch": 0.51, + "learning_rate": 9.593965088964076e-06, + "loss": 0.5781, + "step": 14809 + }, + { + "epoch": 0.51, + "learning_rate": 9.592877124541771e-06, + "loss": 0.6416, + "step": 14810 + }, + { + "epoch": 0.51, + "learning_rate": 9.591789164946419e-06, + "loss": 0.6827, + "step": 14811 + }, + { + "epoch": 0.51, + "learning_rate": 9.590701210190922e-06, + "loss": 0.6743, + "step": 14812 + }, + { + "epoch": 0.51, + "learning_rate": 9.589613260288184e-06, + "loss": 0.6292, + "step": 14813 + }, + { + "epoch": 0.51, + "learning_rate": 9.588525315251097e-06, + "loss": 0.6116, + "step": 14814 + }, + { + "epoch": 0.51, + "learning_rate": 9.58743737509256e-06, + "loss": 0.6558, + "step": 14815 + }, + { + "epoch": 0.51, + "learning_rate": 9.586349439825482e-06, + "loss": 0.6751, + "step": 14816 + }, + { + "epoch": 0.51, + "learning_rate": 9.58526150946275e-06, + "loss": 0.6484, + "step": 14817 + }, + { + "epoch": 0.51, + "learning_rate": 9.584173584017265e-06, + "loss": 0.5941, + "step": 14818 + }, + { + "epoch": 0.51, + "learning_rate": 9.583085663501935e-06, + "loss": 0.5996, + "step": 14819 + }, + { + "epoch": 0.51, + "learning_rate": 9.58199774792965e-06, + "loss": 0.5826, + "step": 14820 + }, + { + "epoch": 0.51, + "learning_rate": 9.580909837313305e-06, + "loss": 0.594, + "step": 14821 + }, + { + "epoch": 0.51, + "learning_rate": 9.57982193166581e-06, + "loss": 0.6444, + "step": 14822 + }, + { + "epoch": 0.51, + "learning_rate": 9.578734031000056e-06, + "loss": 0.6181, + "step": 14823 + }, + { + "epoch": 0.51, + "learning_rate": 9.577646135328938e-06, + "loss": 0.5792, + "step": 14824 + }, + { + "epoch": 0.51, + "learning_rate": 9.576558244665368e-06, + "loss": 0.6334, + "step": 14825 + }, + { + "epoch": 0.51, + "learning_rate": 9.575470359022231e-06, + "loss": 0.6446, + "step": 14826 + }, + { + "epoch": 0.51, + "learning_rate": 9.574382478412427e-06, + "loss": 0.5876, + "step": 14827 + }, + { + "epoch": 0.51, + "learning_rate": 9.573294602848863e-06, + "loss": 0.6486, + "step": 14828 + }, + { + "epoch": 0.51, + "learning_rate": 9.57220673234443e-06, + "loss": 0.7033, + "step": 14829 + }, + { + "epoch": 0.51, + "learning_rate": 9.571118866912023e-06, + "loss": 0.6477, + "step": 14830 + }, + { + "epoch": 0.51, + "learning_rate": 9.570031006564549e-06, + "loss": 0.6406, + "step": 14831 + }, + { + "epoch": 0.51, + "learning_rate": 9.5689431513149e-06, + "loss": 0.6861, + "step": 14832 + }, + { + "epoch": 0.51, + "learning_rate": 9.567855301175972e-06, + "loss": 0.6367, + "step": 14833 + }, + { + "epoch": 0.51, + "learning_rate": 9.566767456160672e-06, + "loss": 0.6114, + "step": 14834 + }, + { + "epoch": 0.51, + "learning_rate": 9.565679616281889e-06, + "loss": 0.6637, + "step": 14835 + }, + { + "epoch": 0.51, + "learning_rate": 9.56459178155252e-06, + "loss": 0.6698, + "step": 14836 + }, + { + "epoch": 0.51, + "learning_rate": 9.563503951985473e-06, + "loss": 0.6353, + "step": 14837 + }, + { + "epoch": 0.51, + "learning_rate": 9.562416127593635e-06, + "loss": 0.6059, + "step": 14838 + }, + { + "epoch": 0.51, + "learning_rate": 9.561328308389906e-06, + "loss": 0.6374, + "step": 14839 + }, + { + "epoch": 0.51, + "learning_rate": 9.56024049438719e-06, + "loss": 0.5979, + "step": 14840 + }, + { + "epoch": 0.51, + "learning_rate": 9.559152685598375e-06, + "loss": 0.6532, + "step": 14841 + }, + { + "epoch": 0.51, + "learning_rate": 9.558064882036366e-06, + "loss": 0.6308, + "step": 14842 + }, + { + "epoch": 0.51, + "learning_rate": 9.556977083714052e-06, + "loss": 0.6521, + "step": 14843 + }, + { + "epoch": 0.51, + "learning_rate": 9.555889290644337e-06, + "loss": 0.6192, + "step": 14844 + }, + { + "epoch": 0.51, + "learning_rate": 9.554801502840118e-06, + "loss": 0.6273, + "step": 14845 + }, + { + "epoch": 0.51, + "learning_rate": 9.553713720314288e-06, + "loss": 0.5594, + "step": 14846 + }, + { + "epoch": 0.51, + "learning_rate": 9.552625943079747e-06, + "loss": 0.6173, + "step": 14847 + }, + { + "epoch": 0.51, + "learning_rate": 9.551538171149394e-06, + "loss": 0.6583, + "step": 14848 + }, + { + "epoch": 0.51, + "learning_rate": 9.55045040453612e-06, + "loss": 0.6784, + "step": 14849 + }, + { + "epoch": 0.51, + "learning_rate": 9.549362643252825e-06, + "loss": 0.5996, + "step": 14850 + }, + { + "epoch": 0.51, + "learning_rate": 9.54827488731241e-06, + "loss": 0.5794, + "step": 14851 + }, + { + "epoch": 0.51, + "learning_rate": 9.547187136727764e-06, + "loss": 0.6288, + "step": 14852 + }, + { + "epoch": 0.51, + "learning_rate": 9.546099391511787e-06, + "loss": 0.5801, + "step": 14853 + }, + { + "epoch": 0.51, + "learning_rate": 9.545011651677379e-06, + "loss": 0.6564, + "step": 14854 + }, + { + "epoch": 0.51, + "learning_rate": 9.54392391723743e-06, + "loss": 0.6251, + "step": 14855 + }, + { + "epoch": 0.51, + "learning_rate": 9.54283618820484e-06, + "loss": 0.6109, + "step": 14856 + }, + { + "epoch": 0.51, + "learning_rate": 9.541748464592508e-06, + "loss": 0.6153, + "step": 14857 + }, + { + "epoch": 0.51, + "learning_rate": 9.540660746413326e-06, + "loss": 0.6239, + "step": 14858 + }, + { + "epoch": 0.51, + "learning_rate": 9.539573033680192e-06, + "loss": 0.6303, + "step": 14859 + }, + { + "epoch": 0.51, + "learning_rate": 9.538485326406004e-06, + "loss": 0.6767, + "step": 14860 + }, + { + "epoch": 0.51, + "learning_rate": 9.537397624603653e-06, + "loss": 0.659, + "step": 14861 + }, + { + "epoch": 0.51, + "learning_rate": 9.53630992828604e-06, + "loss": 0.6791, + "step": 14862 + }, + { + "epoch": 0.51, + "learning_rate": 9.535222237466061e-06, + "loss": 0.6056, + "step": 14863 + }, + { + "epoch": 0.51, + "learning_rate": 9.534134552156608e-06, + "loss": 0.6752, + "step": 14864 + }, + { + "epoch": 0.52, + "learning_rate": 9.53304687237058e-06, + "loss": 0.5812, + "step": 14865 + }, + { + "epoch": 0.52, + "learning_rate": 9.531959198120873e-06, + "loss": 0.6399, + "step": 14866 + }, + { + "epoch": 0.52, + "learning_rate": 9.530871529420379e-06, + "loss": 0.6038, + "step": 14867 + }, + { + "epoch": 0.52, + "learning_rate": 9.529783866281998e-06, + "loss": 0.6259, + "step": 14868 + }, + { + "epoch": 0.52, + "learning_rate": 9.528696208718627e-06, + "loss": 0.6321, + "step": 14869 + }, + { + "epoch": 0.52, + "learning_rate": 9.527608556743154e-06, + "loss": 0.6649, + "step": 14870 + }, + { + "epoch": 0.52, + "learning_rate": 9.52652091036848e-06, + "loss": 0.6529, + "step": 14871 + }, + { + "epoch": 0.52, + "learning_rate": 9.525433269607503e-06, + "loss": 0.6187, + "step": 14872 + }, + { + "epoch": 0.52, + "learning_rate": 9.524345634473112e-06, + "loss": 0.6715, + "step": 14873 + }, + { + "epoch": 0.52, + "learning_rate": 9.523258004978205e-06, + "loss": 0.6667, + "step": 14874 + }, + { + "epoch": 0.52, + "learning_rate": 9.52217038113568e-06, + "loss": 0.6181, + "step": 14875 + }, + { + "epoch": 0.52, + "learning_rate": 9.521082762958426e-06, + "loss": 0.6275, + "step": 14876 + }, + { + "epoch": 0.52, + "learning_rate": 9.519995150459342e-06, + "loss": 0.6031, + "step": 14877 + }, + { + "epoch": 0.52, + "learning_rate": 9.518907543651326e-06, + "loss": 0.6156, + "step": 14878 + }, + { + "epoch": 0.52, + "learning_rate": 9.517819942547267e-06, + "loss": 0.5958, + "step": 14879 + }, + { + "epoch": 0.52, + "learning_rate": 9.516732347160063e-06, + "loss": 0.6437, + "step": 14880 + }, + { + "epoch": 0.52, + "learning_rate": 9.51564475750261e-06, + "loss": 0.5937, + "step": 14881 + }, + { + "epoch": 0.52, + "learning_rate": 9.5145571735878e-06, + "loss": 0.6385, + "step": 14882 + }, + { + "epoch": 0.52, + "learning_rate": 9.513469595428527e-06, + "loss": 0.6138, + "step": 14883 + }, + { + "epoch": 0.52, + "learning_rate": 9.51238202303769e-06, + "loss": 0.6594, + "step": 14884 + }, + { + "epoch": 0.52, + "learning_rate": 9.51129445642818e-06, + "loss": 0.6227, + "step": 14885 + }, + { + "epoch": 0.52, + "learning_rate": 9.510206895612891e-06, + "loss": 0.6561, + "step": 14886 + }, + { + "epoch": 0.52, + "learning_rate": 9.509119340604722e-06, + "loss": 0.635, + "step": 14887 + }, + { + "epoch": 0.52, + "learning_rate": 9.508031791416562e-06, + "loss": 0.6101, + "step": 14888 + }, + { + "epoch": 0.52, + "learning_rate": 9.506944248061307e-06, + "loss": 0.6492, + "step": 14889 + }, + { + "epoch": 0.52, + "learning_rate": 9.505856710551854e-06, + "loss": 0.6411, + "step": 14890 + }, + { + "epoch": 0.52, + "learning_rate": 9.504769178901093e-06, + "loss": 0.6841, + "step": 14891 + }, + { + "epoch": 0.52, + "learning_rate": 9.503681653121918e-06, + "loss": 0.5888, + "step": 14892 + }, + { + "epoch": 0.52, + "learning_rate": 9.50259413322723e-06, + "loss": 0.6564, + "step": 14893 + }, + { + "epoch": 0.52, + "learning_rate": 9.501506619229914e-06, + "loss": 0.6485, + "step": 14894 + }, + { + "epoch": 0.52, + "learning_rate": 9.500419111142867e-06, + "loss": 0.6504, + "step": 14895 + }, + { + "epoch": 0.52, + "learning_rate": 9.499331608978986e-06, + "loss": 0.624, + "step": 14896 + }, + { + "epoch": 0.52, + "learning_rate": 9.498244112751161e-06, + "loss": 0.6401, + "step": 14897 + }, + { + "epoch": 0.52, + "learning_rate": 9.497156622472286e-06, + "loss": 0.6248, + "step": 14898 + }, + { + "epoch": 0.52, + "learning_rate": 9.496069138155259e-06, + "loss": 0.6508, + "step": 14899 + }, + { + "epoch": 0.52, + "learning_rate": 9.494981659812965e-06, + "loss": 0.5966, + "step": 14900 + }, + { + "epoch": 0.52, + "learning_rate": 9.493894187458304e-06, + "loss": 0.6268, + "step": 14901 + }, + { + "epoch": 0.52, + "learning_rate": 9.492806721104169e-06, + "loss": 0.7078, + "step": 14902 + }, + { + "epoch": 0.52, + "learning_rate": 9.49171926076345e-06, + "loss": 0.6654, + "step": 14903 + }, + { + "epoch": 0.52, + "learning_rate": 9.490631806449044e-06, + "loss": 0.5936, + "step": 14904 + }, + { + "epoch": 0.52, + "learning_rate": 9.489544358173841e-06, + "loss": 0.6486, + "step": 14905 + }, + { + "epoch": 0.52, + "learning_rate": 9.488456915950735e-06, + "loss": 0.5852, + "step": 14906 + }, + { + "epoch": 0.52, + "learning_rate": 9.487369479792621e-06, + "loss": 0.6001, + "step": 14907 + }, + { + "epoch": 0.52, + "learning_rate": 9.486282049712389e-06, + "loss": 0.6642, + "step": 14908 + }, + { + "epoch": 0.52, + "learning_rate": 9.485194625722932e-06, + "loss": 0.5982, + "step": 14909 + }, + { + "epoch": 0.52, + "learning_rate": 9.484107207837147e-06, + "loss": 0.6498, + "step": 14910 + }, + { + "epoch": 0.52, + "learning_rate": 9.483019796067921e-06, + "loss": 0.6405, + "step": 14911 + }, + { + "epoch": 0.52, + "learning_rate": 9.48193239042815e-06, + "loss": 0.6288, + "step": 14912 + }, + { + "epoch": 0.52, + "learning_rate": 9.480844990930727e-06, + "loss": 0.6431, + "step": 14913 + }, + { + "epoch": 0.52, + "learning_rate": 9.479757597588542e-06, + "loss": 0.6262, + "step": 14914 + }, + { + "epoch": 0.52, + "learning_rate": 9.47867021041449e-06, + "loss": 0.6226, + "step": 14915 + }, + { + "epoch": 0.52, + "learning_rate": 9.477582829421462e-06, + "loss": 0.6372, + "step": 14916 + }, + { + "epoch": 0.52, + "learning_rate": 9.476495454622349e-06, + "loss": 0.6028, + "step": 14917 + }, + { + "epoch": 0.52, + "learning_rate": 9.475408086030044e-06, + "loss": 0.6114, + "step": 14918 + }, + { + "epoch": 0.52, + "learning_rate": 9.474320723657445e-06, + "loss": 0.6049, + "step": 14919 + }, + { + "epoch": 0.52, + "learning_rate": 9.473233367517433e-06, + "loss": 0.6994, + "step": 14920 + }, + { + "epoch": 0.52, + "learning_rate": 9.472146017622908e-06, + "loss": 0.6398, + "step": 14921 + }, + { + "epoch": 0.52, + "learning_rate": 9.47105867398676e-06, + "loss": 0.5931, + "step": 14922 + }, + { + "epoch": 0.52, + "learning_rate": 9.469971336621879e-06, + "loss": 0.5744, + "step": 14923 + }, + { + "epoch": 0.52, + "learning_rate": 9.468884005541159e-06, + "loss": 0.6483, + "step": 14924 + }, + { + "epoch": 0.52, + "learning_rate": 9.467796680757493e-06, + "loss": 0.6245, + "step": 14925 + }, + { + "epoch": 0.52, + "learning_rate": 9.466709362283767e-06, + "loss": 0.5654, + "step": 14926 + }, + { + "epoch": 0.52, + "learning_rate": 9.465622050132878e-06, + "loss": 0.649, + "step": 14927 + }, + { + "epoch": 0.52, + "learning_rate": 9.464534744317717e-06, + "loss": 0.6065, + "step": 14928 + }, + { + "epoch": 0.52, + "learning_rate": 9.463447444851172e-06, + "loss": 0.6108, + "step": 14929 + }, + { + "epoch": 0.52, + "learning_rate": 9.462360151746137e-06, + "loss": 0.6411, + "step": 14930 + }, + { + "epoch": 0.52, + "learning_rate": 9.461272865015505e-06, + "loss": 0.6565, + "step": 14931 + }, + { + "epoch": 0.52, + "learning_rate": 9.46018558467216e-06, + "loss": 0.6474, + "step": 14932 + }, + { + "epoch": 0.52, + "learning_rate": 9.459098310728999e-06, + "loss": 0.6706, + "step": 14933 + }, + { + "epoch": 0.52, + "learning_rate": 9.458011043198914e-06, + "loss": 0.6259, + "step": 14934 + }, + { + "epoch": 0.52, + "learning_rate": 9.456923782094792e-06, + "loss": 0.6659, + "step": 14935 + }, + { + "epoch": 0.52, + "learning_rate": 9.455836527429526e-06, + "loss": 0.5808, + "step": 14936 + }, + { + "epoch": 0.52, + "learning_rate": 9.454749279216007e-06, + "loss": 0.6076, + "step": 14937 + }, + { + "epoch": 0.52, + "learning_rate": 9.453662037467123e-06, + "loss": 0.6439, + "step": 14938 + }, + { + "epoch": 0.52, + "learning_rate": 9.452574802195767e-06, + "loss": 0.602, + "step": 14939 + }, + { + "epoch": 0.52, + "learning_rate": 9.451487573414832e-06, + "loss": 0.5997, + "step": 14940 + }, + { + "epoch": 0.52, + "learning_rate": 9.450400351137204e-06, + "loss": 0.6262, + "step": 14941 + }, + { + "epoch": 0.52, + "learning_rate": 9.449313135375774e-06, + "loss": 0.662, + "step": 14942 + }, + { + "epoch": 0.52, + "learning_rate": 9.448225926143435e-06, + "loss": 0.573, + "step": 14943 + }, + { + "epoch": 0.52, + "learning_rate": 9.447138723453075e-06, + "loss": 0.6086, + "step": 14944 + }, + { + "epoch": 0.52, + "learning_rate": 9.446051527317583e-06, + "loss": 0.6579, + "step": 14945 + }, + { + "epoch": 0.52, + "learning_rate": 9.444964337749856e-06, + "loss": 0.6191, + "step": 14946 + }, + { + "epoch": 0.52, + "learning_rate": 9.443877154762774e-06, + "loss": 0.6044, + "step": 14947 + }, + { + "epoch": 0.52, + "learning_rate": 9.442789978369233e-06, + "loss": 0.606, + "step": 14948 + }, + { + "epoch": 0.52, + "learning_rate": 9.441702808582122e-06, + "loss": 0.5633, + "step": 14949 + }, + { + "epoch": 0.52, + "learning_rate": 9.44061564541433e-06, + "loss": 0.5971, + "step": 14950 + }, + { + "epoch": 0.52, + "learning_rate": 9.439528488878747e-06, + "loss": 0.6317, + "step": 14951 + }, + { + "epoch": 0.52, + "learning_rate": 9.438441338988265e-06, + "loss": 0.6512, + "step": 14952 + }, + { + "epoch": 0.52, + "learning_rate": 9.43735419575577e-06, + "loss": 0.6329, + "step": 14953 + }, + { + "epoch": 0.52, + "learning_rate": 9.436267059194152e-06, + "loss": 0.5846, + "step": 14954 + }, + { + "epoch": 0.52, + "learning_rate": 9.435179929316303e-06, + "loss": 0.6539, + "step": 14955 + }, + { + "epoch": 0.52, + "learning_rate": 9.434092806135108e-06, + "loss": 0.6338, + "step": 14956 + }, + { + "epoch": 0.52, + "learning_rate": 9.43300568966346e-06, + "loss": 0.6563, + "step": 14957 + }, + { + "epoch": 0.52, + "learning_rate": 9.431918579914248e-06, + "loss": 0.5685, + "step": 14958 + }, + { + "epoch": 0.52, + "learning_rate": 9.430831476900357e-06, + "loss": 0.6547, + "step": 14959 + }, + { + "epoch": 0.52, + "learning_rate": 9.42974438063468e-06, + "loss": 0.6413, + "step": 14960 + }, + { + "epoch": 0.52, + "learning_rate": 9.428657291130107e-06, + "loss": 0.6138, + "step": 14961 + }, + { + "epoch": 0.52, + "learning_rate": 9.427570208399521e-06, + "loss": 0.6521, + "step": 14962 + }, + { + "epoch": 0.52, + "learning_rate": 9.426483132455814e-06, + "loss": 0.6622, + "step": 14963 + }, + { + "epoch": 0.52, + "learning_rate": 9.42539606331188e-06, + "loss": 0.6101, + "step": 14964 + }, + { + "epoch": 0.52, + "learning_rate": 9.424309000980598e-06, + "loss": 0.5879, + "step": 14965 + }, + { + "epoch": 0.52, + "learning_rate": 9.423221945474866e-06, + "loss": 0.612, + "step": 14966 + }, + { + "epoch": 0.52, + "learning_rate": 9.422134896807562e-06, + "loss": 0.6374, + "step": 14967 + }, + { + "epoch": 0.52, + "learning_rate": 9.421047854991581e-06, + "loss": 0.6765, + "step": 14968 + }, + { + "epoch": 0.52, + "learning_rate": 9.419960820039813e-06, + "loss": 0.5899, + "step": 14969 + }, + { + "epoch": 0.52, + "learning_rate": 9.418873791965138e-06, + "loss": 0.6482, + "step": 14970 + }, + { + "epoch": 0.52, + "learning_rate": 9.417786770780453e-06, + "loss": 0.6297, + "step": 14971 + }, + { + "epoch": 0.52, + "learning_rate": 9.416699756498645e-06, + "loss": 0.6217, + "step": 14972 + }, + { + "epoch": 0.52, + "learning_rate": 9.415612749132593e-06, + "loss": 0.6808, + "step": 14973 + }, + { + "epoch": 0.52, + "learning_rate": 9.414525748695193e-06, + "loss": 0.6329, + "step": 14974 + }, + { + "epoch": 0.52, + "learning_rate": 9.413438755199335e-06, + "loss": 0.5937, + "step": 14975 + }, + { + "epoch": 0.52, + "learning_rate": 9.412351768657898e-06, + "loss": 0.6437, + "step": 14976 + }, + { + "epoch": 0.52, + "learning_rate": 9.411264789083773e-06, + "loss": 0.6308, + "step": 14977 + }, + { + "epoch": 0.52, + "learning_rate": 9.410177816489856e-06, + "loss": 0.6052, + "step": 14978 + }, + { + "epoch": 0.52, + "learning_rate": 9.40909085088902e-06, + "loss": 0.6237, + "step": 14979 + }, + { + "epoch": 0.52, + "learning_rate": 9.408003892294162e-06, + "loss": 0.6225, + "step": 14980 + }, + { + "epoch": 0.52, + "learning_rate": 9.40691694071817e-06, + "loss": 0.6195, + "step": 14981 + }, + { + "epoch": 0.52, + "learning_rate": 9.405829996173921e-06, + "loss": 0.6443, + "step": 14982 + }, + { + "epoch": 0.52, + "learning_rate": 9.404743058674312e-06, + "loss": 0.5896, + "step": 14983 + }, + { + "epoch": 0.52, + "learning_rate": 9.40365612823223e-06, + "loss": 0.64, + "step": 14984 + }, + { + "epoch": 0.52, + "learning_rate": 9.402569204860555e-06, + "loss": 0.6309, + "step": 14985 + }, + { + "epoch": 0.52, + "learning_rate": 9.401482288572179e-06, + "loss": 0.599, + "step": 14986 + }, + { + "epoch": 0.52, + "learning_rate": 9.400395379379993e-06, + "loss": 0.6727, + "step": 14987 + }, + { + "epoch": 0.52, + "learning_rate": 9.399308477296869e-06, + "loss": 0.607, + "step": 14988 + }, + { + "epoch": 0.52, + "learning_rate": 9.398221582335705e-06, + "loss": 0.5919, + "step": 14989 + }, + { + "epoch": 0.52, + "learning_rate": 9.397134694509393e-06, + "loss": 0.6538, + "step": 14990 + }, + { + "epoch": 0.52, + "learning_rate": 9.396047813830804e-06, + "loss": 0.6296, + "step": 14991 + }, + { + "epoch": 0.52, + "learning_rate": 9.394960940312833e-06, + "loss": 0.6214, + "step": 14992 + }, + { + "epoch": 0.52, + "learning_rate": 9.39387407396837e-06, + "loss": 0.6238, + "step": 14993 + }, + { + "epoch": 0.52, + "learning_rate": 9.392787214810292e-06, + "loss": 0.5973, + "step": 14994 + }, + { + "epoch": 0.52, + "learning_rate": 9.39170036285149e-06, + "loss": 0.6029, + "step": 14995 + }, + { + "epoch": 0.52, + "learning_rate": 9.390613518104855e-06, + "loss": 0.6498, + "step": 14996 + }, + { + "epoch": 0.52, + "learning_rate": 9.38952668058326e-06, + "loss": 0.6421, + "step": 14997 + }, + { + "epoch": 0.52, + "learning_rate": 9.388439850299602e-06, + "loss": 0.6153, + "step": 14998 + }, + { + "epoch": 0.52, + "learning_rate": 9.387353027266767e-06, + "loss": 0.5939, + "step": 14999 + }, + { + "epoch": 0.52, + "learning_rate": 9.38626621149763e-06, + "loss": 0.6051, + "step": 15000 + }, + { + "epoch": 0.52, + "learning_rate": 9.385179403005085e-06, + "loss": 0.6587, + "step": 15001 + }, + { + "epoch": 0.52, + "learning_rate": 9.384092601802022e-06, + "loss": 0.6316, + "step": 15002 + }, + { + "epoch": 0.52, + "learning_rate": 9.383005807901313e-06, + "loss": 0.6879, + "step": 15003 + }, + { + "epoch": 0.52, + "learning_rate": 9.381919021315853e-06, + "loss": 0.6424, + "step": 15004 + }, + { + "epoch": 0.52, + "learning_rate": 9.380832242058529e-06, + "loss": 0.6424, + "step": 15005 + }, + { + "epoch": 0.52, + "learning_rate": 9.379745470142214e-06, + "loss": 0.624, + "step": 15006 + }, + { + "epoch": 0.52, + "learning_rate": 9.378658705579806e-06, + "loss": 0.7022, + "step": 15007 + }, + { + "epoch": 0.52, + "learning_rate": 9.377571948384189e-06, + "loss": 0.6527, + "step": 15008 + }, + { + "epoch": 0.52, + "learning_rate": 9.376485198568236e-06, + "loss": 0.6471, + "step": 15009 + }, + { + "epoch": 0.52, + "learning_rate": 9.375398456144841e-06, + "loss": 0.6621, + "step": 15010 + }, + { + "epoch": 0.52, + "learning_rate": 9.374311721126895e-06, + "loss": 0.6266, + "step": 15011 + }, + { + "epoch": 0.52, + "learning_rate": 9.373224993527266e-06, + "loss": 0.6688, + "step": 15012 + }, + { + "epoch": 0.52, + "learning_rate": 9.37213827335885e-06, + "loss": 0.6491, + "step": 15013 + }, + { + "epoch": 0.52, + "learning_rate": 9.371051560634535e-06, + "loss": 0.6735, + "step": 15014 + }, + { + "epoch": 0.52, + "learning_rate": 9.369964855367192e-06, + "loss": 0.6487, + "step": 15015 + }, + { + "epoch": 0.52, + "learning_rate": 9.368878157569715e-06, + "loss": 0.6352, + "step": 15016 + }, + { + "epoch": 0.52, + "learning_rate": 9.367791467254989e-06, + "loss": 0.624, + "step": 15017 + }, + { + "epoch": 0.52, + "learning_rate": 9.36670478443589e-06, + "loss": 0.5881, + "step": 15018 + }, + { + "epoch": 0.52, + "learning_rate": 9.365618109125308e-06, + "loss": 0.582, + "step": 15019 + }, + { + "epoch": 0.52, + "learning_rate": 9.364531441336129e-06, + "loss": 0.6688, + "step": 15020 + }, + { + "epoch": 0.52, + "learning_rate": 9.363444781081228e-06, + "loss": 0.6131, + "step": 15021 + }, + { + "epoch": 0.52, + "learning_rate": 9.362358128373498e-06, + "loss": 0.6148, + "step": 15022 + }, + { + "epoch": 0.52, + "learning_rate": 9.361271483225822e-06, + "loss": 0.6608, + "step": 15023 + }, + { + "epoch": 0.52, + "learning_rate": 9.360184845651074e-06, + "loss": 0.5763, + "step": 15024 + }, + { + "epoch": 0.52, + "learning_rate": 9.359098215662147e-06, + "loss": 0.6597, + "step": 15025 + }, + { + "epoch": 0.52, + "learning_rate": 9.358011593271925e-06, + "loss": 0.5868, + "step": 15026 + }, + { + "epoch": 0.52, + "learning_rate": 9.356924978493283e-06, + "loss": 0.6589, + "step": 15027 + }, + { + "epoch": 0.52, + "learning_rate": 9.355838371339114e-06, + "loss": 0.7261, + "step": 15028 + }, + { + "epoch": 0.52, + "learning_rate": 9.35475177182229e-06, + "loss": 0.6176, + "step": 15029 + }, + { + "epoch": 0.52, + "learning_rate": 9.3536651799557e-06, + "loss": 0.614, + "step": 15030 + }, + { + "epoch": 0.52, + "learning_rate": 9.352578595752233e-06, + "loss": 0.6413, + "step": 15031 + }, + { + "epoch": 0.52, + "learning_rate": 9.351492019224761e-06, + "loss": 0.649, + "step": 15032 + }, + { + "epoch": 0.52, + "learning_rate": 9.350405450386168e-06, + "loss": 0.5996, + "step": 15033 + }, + { + "epoch": 0.52, + "learning_rate": 9.349318889249349e-06, + "loss": 0.65, + "step": 15034 + }, + { + "epoch": 0.52, + "learning_rate": 9.348232335827173e-06, + "loss": 0.6628, + "step": 15035 + }, + { + "epoch": 0.52, + "learning_rate": 9.347145790132524e-06, + "loss": 0.6519, + "step": 15036 + }, + { + "epoch": 0.52, + "learning_rate": 9.346059252178295e-06, + "loss": 0.6246, + "step": 15037 + }, + { + "epoch": 0.52, + "learning_rate": 9.344972721977355e-06, + "loss": 0.6101, + "step": 15038 + }, + { + "epoch": 0.52, + "learning_rate": 9.34388619954259e-06, + "loss": 0.5932, + "step": 15039 + }, + { + "epoch": 0.52, + "learning_rate": 9.342799684886892e-06, + "loss": 0.6617, + "step": 15040 + }, + { + "epoch": 0.52, + "learning_rate": 9.34171317802313e-06, + "loss": 0.6454, + "step": 15041 + }, + { + "epoch": 0.52, + "learning_rate": 9.34062667896419e-06, + "loss": 0.6358, + "step": 15042 + }, + { + "epoch": 0.52, + "learning_rate": 9.339540187722959e-06, + "loss": 0.6418, + "step": 15043 + }, + { + "epoch": 0.52, + "learning_rate": 9.338453704312312e-06, + "loss": 0.6438, + "step": 15044 + }, + { + "epoch": 0.52, + "learning_rate": 9.337367228745131e-06, + "loss": 0.6495, + "step": 15045 + }, + { + "epoch": 0.52, + "learning_rate": 9.336280761034306e-06, + "loss": 0.597, + "step": 15046 + }, + { + "epoch": 0.52, + "learning_rate": 9.335194301192707e-06, + "loss": 0.622, + "step": 15047 + }, + { + "epoch": 0.52, + "learning_rate": 9.334107849233219e-06, + "loss": 0.6069, + "step": 15048 + }, + { + "epoch": 0.52, + "learning_rate": 9.333021405168731e-06, + "loss": 0.5994, + "step": 15049 + }, + { + "epoch": 0.52, + "learning_rate": 9.331934969012115e-06, + "loss": 0.6712, + "step": 15050 + }, + { + "epoch": 0.52, + "learning_rate": 9.330848540776252e-06, + "loss": 0.5952, + "step": 15051 + }, + { + "epoch": 0.52, + "learning_rate": 9.329762120474032e-06, + "loss": 0.6624, + "step": 15052 + }, + { + "epoch": 0.52, + "learning_rate": 9.328675708118327e-06, + "loss": 0.6075, + "step": 15053 + }, + { + "epoch": 0.52, + "learning_rate": 9.327589303722017e-06, + "loss": 0.6166, + "step": 15054 + }, + { + "epoch": 0.52, + "learning_rate": 9.326502907297993e-06, + "loss": 0.6167, + "step": 15055 + }, + { + "epoch": 0.52, + "learning_rate": 9.325416518859125e-06, + "loss": 0.7058, + "step": 15056 + }, + { + "epoch": 0.52, + "learning_rate": 9.324330138418294e-06, + "loss": 0.6052, + "step": 15057 + }, + { + "epoch": 0.52, + "learning_rate": 9.323243765988393e-06, + "loss": 0.609, + "step": 15058 + }, + { + "epoch": 0.52, + "learning_rate": 9.322157401582289e-06, + "loss": 0.6096, + "step": 15059 + }, + { + "epoch": 0.52, + "learning_rate": 9.321071045212862e-06, + "loss": 0.6551, + "step": 15060 + }, + { + "epoch": 0.52, + "learning_rate": 9.319984696893005e-06, + "loss": 0.6294, + "step": 15061 + }, + { + "epoch": 0.52, + "learning_rate": 9.318898356635583e-06, + "loss": 0.6294, + "step": 15062 + }, + { + "epoch": 0.52, + "learning_rate": 9.317812024453482e-06, + "loss": 0.6051, + "step": 15063 + }, + { + "epoch": 0.52, + "learning_rate": 9.31672570035959e-06, + "loss": 0.6294, + "step": 15064 + }, + { + "epoch": 0.52, + "learning_rate": 9.315639384366773e-06, + "loss": 0.6413, + "step": 15065 + }, + { + "epoch": 0.52, + "learning_rate": 9.314553076487916e-06, + "loss": 0.6043, + "step": 15066 + }, + { + "epoch": 0.52, + "learning_rate": 9.313466776735906e-06, + "loss": 0.6656, + "step": 15067 + }, + { + "epoch": 0.52, + "learning_rate": 9.31238048512361e-06, + "loss": 0.6296, + "step": 15068 + }, + { + "epoch": 0.52, + "learning_rate": 9.311294201663912e-06, + "loss": 0.6349, + "step": 15069 + }, + { + "epoch": 0.52, + "learning_rate": 9.310207926369699e-06, + "loss": 0.602, + "step": 15070 + }, + { + "epoch": 0.52, + "learning_rate": 9.309121659253838e-06, + "loss": 0.6289, + "step": 15071 + }, + { + "epoch": 0.52, + "learning_rate": 9.308035400329213e-06, + "loss": 0.6521, + "step": 15072 + }, + { + "epoch": 0.52, + "learning_rate": 9.30694914960871e-06, + "loss": 0.5987, + "step": 15073 + }, + { + "epoch": 0.52, + "learning_rate": 9.305862907105196e-06, + "loss": 0.6208, + "step": 15074 + }, + { + "epoch": 0.52, + "learning_rate": 9.304776672831557e-06, + "loss": 0.6328, + "step": 15075 + }, + { + "epoch": 0.52, + "learning_rate": 9.30369044680067e-06, + "loss": 0.6236, + "step": 15076 + }, + { + "epoch": 0.52, + "learning_rate": 9.302604229025414e-06, + "loss": 0.604, + "step": 15077 + }, + { + "epoch": 0.52, + "learning_rate": 9.301518019518666e-06, + "loss": 0.6154, + "step": 15078 + }, + { + "epoch": 0.52, + "learning_rate": 9.300431818293307e-06, + "loss": 0.6412, + "step": 15079 + }, + { + "epoch": 0.52, + "learning_rate": 9.299345625362213e-06, + "loss": 0.629, + "step": 15080 + }, + { + "epoch": 0.52, + "learning_rate": 9.298259440738263e-06, + "loss": 0.6422, + "step": 15081 + }, + { + "epoch": 0.52, + "learning_rate": 9.297173264434334e-06, + "loss": 0.6138, + "step": 15082 + }, + { + "epoch": 0.52, + "learning_rate": 9.296087096463305e-06, + "loss": 0.6829, + "step": 15083 + }, + { + "epoch": 0.52, + "learning_rate": 9.295000936838055e-06, + "loss": 0.6444, + "step": 15084 + }, + { + "epoch": 0.52, + "learning_rate": 9.293914785571462e-06, + "loss": 0.586, + "step": 15085 + }, + { + "epoch": 0.52, + "learning_rate": 9.2928286426764e-06, + "loss": 0.6064, + "step": 15086 + }, + { + "epoch": 0.52, + "learning_rate": 9.291742508165749e-06, + "loss": 0.6323, + "step": 15087 + }, + { + "epoch": 0.52, + "learning_rate": 9.290656382052388e-06, + "loss": 0.6689, + "step": 15088 + }, + { + "epoch": 0.52, + "learning_rate": 9.289570264349192e-06, + "loss": 0.6109, + "step": 15089 + }, + { + "epoch": 0.52, + "learning_rate": 9.288484155069041e-06, + "loss": 0.6462, + "step": 15090 + }, + { + "epoch": 0.52, + "learning_rate": 9.28739805422481e-06, + "loss": 0.5916, + "step": 15091 + }, + { + "epoch": 0.52, + "learning_rate": 9.286311961829374e-06, + "loss": 0.6417, + "step": 15092 + }, + { + "epoch": 0.52, + "learning_rate": 9.285225877895615e-06, + "loss": 0.633, + "step": 15093 + }, + { + "epoch": 0.52, + "learning_rate": 9.284139802436407e-06, + "loss": 0.6589, + "step": 15094 + }, + { + "epoch": 0.52, + "learning_rate": 9.283053735464624e-06, + "loss": 0.644, + "step": 15095 + }, + { + "epoch": 0.52, + "learning_rate": 9.281967676993152e-06, + "loss": 0.5839, + "step": 15096 + }, + { + "epoch": 0.52, + "learning_rate": 9.280881627034856e-06, + "loss": 0.6912, + "step": 15097 + }, + { + "epoch": 0.52, + "learning_rate": 9.27979558560262e-06, + "loss": 0.6841, + "step": 15098 + }, + { + "epoch": 0.52, + "learning_rate": 9.27870955270932e-06, + "loss": 0.604, + "step": 15099 + }, + { + "epoch": 0.52, + "learning_rate": 9.277623528367828e-06, + "loss": 0.6198, + "step": 15100 + }, + { + "epoch": 0.52, + "learning_rate": 9.276537512591022e-06, + "loss": 0.5535, + "step": 15101 + }, + { + "epoch": 0.52, + "learning_rate": 9.275451505391783e-06, + "loss": 0.6636, + "step": 15102 + }, + { + "epoch": 0.52, + "learning_rate": 9.27436550678298e-06, + "loss": 0.6461, + "step": 15103 + }, + { + "epoch": 0.52, + "learning_rate": 9.273279516777494e-06, + "loss": 0.6287, + "step": 15104 + }, + { + "epoch": 0.52, + "learning_rate": 9.272193535388198e-06, + "loss": 0.6432, + "step": 15105 + }, + { + "epoch": 0.52, + "learning_rate": 9.271107562627967e-06, + "loss": 0.6356, + "step": 15106 + }, + { + "epoch": 0.52, + "learning_rate": 9.270021598509677e-06, + "loss": 0.6085, + "step": 15107 + }, + { + "epoch": 0.52, + "learning_rate": 9.268935643046208e-06, + "loss": 0.6442, + "step": 15108 + }, + { + "epoch": 0.52, + "learning_rate": 9.267849696250429e-06, + "loss": 0.6168, + "step": 15109 + }, + { + "epoch": 0.52, + "learning_rate": 9.26676375813522e-06, + "loss": 0.6542, + "step": 15110 + }, + { + "epoch": 0.52, + "learning_rate": 9.265677828713453e-06, + "loss": 0.603, + "step": 15111 + }, + { + "epoch": 0.52, + "learning_rate": 9.264591907998004e-06, + "loss": 0.6499, + "step": 15112 + }, + { + "epoch": 0.52, + "learning_rate": 9.263505996001747e-06, + "loss": 0.6191, + "step": 15113 + }, + { + "epoch": 0.52, + "learning_rate": 9.262420092737562e-06, + "loss": 0.6771, + "step": 15114 + }, + { + "epoch": 0.52, + "learning_rate": 9.261334198218315e-06, + "loss": 0.6284, + "step": 15115 + }, + { + "epoch": 0.52, + "learning_rate": 9.26024831245689e-06, + "loss": 0.6286, + "step": 15116 + }, + { + "epoch": 0.52, + "learning_rate": 9.259162435466154e-06, + "loss": 0.6647, + "step": 15117 + }, + { + "epoch": 0.52, + "learning_rate": 9.258076567258986e-06, + "loss": 0.6555, + "step": 15118 + }, + { + "epoch": 0.52, + "learning_rate": 9.256990707848257e-06, + "loss": 0.6474, + "step": 15119 + }, + { + "epoch": 0.52, + "learning_rate": 9.255904857246846e-06, + "loss": 0.6723, + "step": 15120 + }, + { + "epoch": 0.52, + "learning_rate": 9.254819015467621e-06, + "loss": 0.61, + "step": 15121 + }, + { + "epoch": 0.52, + "learning_rate": 9.253733182523462e-06, + "loss": 0.6129, + "step": 15122 + }, + { + "epoch": 0.52, + "learning_rate": 9.252647358427239e-06, + "loss": 0.6526, + "step": 15123 + }, + { + "epoch": 0.52, + "learning_rate": 9.251561543191825e-06, + "loss": 0.5749, + "step": 15124 + }, + { + "epoch": 0.52, + "learning_rate": 9.250475736830097e-06, + "loss": 0.6076, + "step": 15125 + }, + { + "epoch": 0.52, + "learning_rate": 9.24938993935493e-06, + "loss": 0.6543, + "step": 15126 + }, + { + "epoch": 0.52, + "learning_rate": 9.248304150779193e-06, + "loss": 0.611, + "step": 15127 + }, + { + "epoch": 0.52, + "learning_rate": 9.24721837111576e-06, + "loss": 0.6483, + "step": 15128 + }, + { + "epoch": 0.52, + "learning_rate": 9.246132600377507e-06, + "loss": 0.6158, + "step": 15129 + }, + { + "epoch": 0.52, + "learning_rate": 9.245046838577305e-06, + "loss": 0.6318, + "step": 15130 + }, + { + "epoch": 0.52, + "learning_rate": 9.243961085728027e-06, + "loss": 0.6582, + "step": 15131 + }, + { + "epoch": 0.52, + "learning_rate": 9.242875341842549e-06, + "loss": 0.5546, + "step": 15132 + }, + { + "epoch": 0.52, + "learning_rate": 9.24178960693374e-06, + "loss": 0.626, + "step": 15133 + }, + { + "epoch": 0.52, + "learning_rate": 9.240703881014474e-06, + "loss": 0.6366, + "step": 15134 + }, + { + "epoch": 0.52, + "learning_rate": 9.239618164097624e-06, + "loss": 0.5975, + "step": 15135 + }, + { + "epoch": 0.52, + "learning_rate": 9.238532456196062e-06, + "loss": 0.6332, + "step": 15136 + }, + { + "epoch": 0.52, + "learning_rate": 9.237446757322663e-06, + "loss": 0.6079, + "step": 15137 + }, + { + "epoch": 0.52, + "learning_rate": 9.236361067490296e-06, + "loss": 0.5868, + "step": 15138 + }, + { + "epoch": 0.52, + "learning_rate": 9.235275386711834e-06, + "loss": 0.6525, + "step": 15139 + }, + { + "epoch": 0.52, + "learning_rate": 9.234189715000152e-06, + "loss": 0.6697, + "step": 15140 + }, + { + "epoch": 0.52, + "learning_rate": 9.23310405236812e-06, + "loss": 0.6151, + "step": 15141 + }, + { + "epoch": 0.52, + "learning_rate": 9.232018398828606e-06, + "loss": 0.6294, + "step": 15142 + }, + { + "epoch": 0.52, + "learning_rate": 9.230932754394488e-06, + "loss": 0.6626, + "step": 15143 + }, + { + "epoch": 0.52, + "learning_rate": 9.229847119078634e-06, + "loss": 0.6523, + "step": 15144 + }, + { + "epoch": 0.52, + "learning_rate": 9.228761492893916e-06, + "loss": 0.5719, + "step": 15145 + }, + { + "epoch": 0.52, + "learning_rate": 9.227675875853207e-06, + "loss": 0.6027, + "step": 15146 + }, + { + "epoch": 0.52, + "learning_rate": 9.226590267969378e-06, + "loss": 0.5914, + "step": 15147 + }, + { + "epoch": 0.52, + "learning_rate": 9.2255046692553e-06, + "loss": 0.6164, + "step": 15148 + }, + { + "epoch": 0.52, + "learning_rate": 9.224419079723842e-06, + "loss": 0.5621, + "step": 15149 + }, + { + "epoch": 0.52, + "learning_rate": 9.22333349938788e-06, + "loss": 0.6095, + "step": 15150 + }, + { + "epoch": 0.52, + "learning_rate": 9.22224792826028e-06, + "loss": 0.6436, + "step": 15151 + }, + { + "epoch": 0.52, + "learning_rate": 9.221162366353915e-06, + "loss": 0.6611, + "step": 15152 + }, + { + "epoch": 0.53, + "learning_rate": 9.220076813681655e-06, + "loss": 0.5903, + "step": 15153 + }, + { + "epoch": 0.53, + "learning_rate": 9.21899127025637e-06, + "loss": 0.5882, + "step": 15154 + }, + { + "epoch": 0.53, + "learning_rate": 9.217905736090932e-06, + "loss": 0.6175, + "step": 15155 + }, + { + "epoch": 0.53, + "learning_rate": 9.216820211198212e-06, + "loss": 0.6613, + "step": 15156 + }, + { + "epoch": 0.53, + "learning_rate": 9.215734695591078e-06, + "loss": 0.5931, + "step": 15157 + }, + { + "epoch": 0.53, + "learning_rate": 9.214649189282403e-06, + "loss": 0.643, + "step": 15158 + }, + { + "epoch": 0.53, + "learning_rate": 9.213563692285054e-06, + "loss": 0.6606, + "step": 15159 + }, + { + "epoch": 0.53, + "learning_rate": 9.212478204611901e-06, + "loss": 0.6722, + "step": 15160 + }, + { + "epoch": 0.53, + "learning_rate": 9.211392726275818e-06, + "loss": 0.6461, + "step": 15161 + }, + { + "epoch": 0.53, + "learning_rate": 9.21030725728967e-06, + "loss": 0.6539, + "step": 15162 + }, + { + "epoch": 0.53, + "learning_rate": 9.209221797666328e-06, + "loss": 0.5857, + "step": 15163 + }, + { + "epoch": 0.53, + "learning_rate": 9.208136347418664e-06, + "loss": 0.6551, + "step": 15164 + }, + { + "epoch": 0.53, + "learning_rate": 9.207050906559543e-06, + "loss": 0.6405, + "step": 15165 + }, + { + "epoch": 0.53, + "learning_rate": 9.205965475101836e-06, + "loss": 0.5674, + "step": 15166 + }, + { + "epoch": 0.53, + "learning_rate": 9.204880053058416e-06, + "loss": 0.6813, + "step": 15167 + }, + { + "epoch": 0.53, + "learning_rate": 9.203794640442147e-06, + "loss": 0.5786, + "step": 15168 + }, + { + "epoch": 0.53, + "learning_rate": 9.2027092372659e-06, + "loss": 0.6674, + "step": 15169 + }, + { + "epoch": 0.53, + "learning_rate": 9.201623843542543e-06, + "loss": 0.6438, + "step": 15170 + }, + { + "epoch": 0.53, + "learning_rate": 9.200538459284945e-06, + "loss": 0.6084, + "step": 15171 + }, + { + "epoch": 0.53, + "learning_rate": 9.199453084505975e-06, + "loss": 0.5994, + "step": 15172 + }, + { + "epoch": 0.53, + "learning_rate": 9.198367719218504e-06, + "loss": 0.673, + "step": 15173 + }, + { + "epoch": 0.53, + "learning_rate": 9.197282363435395e-06, + "loss": 0.6551, + "step": 15174 + }, + { + "epoch": 0.53, + "learning_rate": 9.196197017169519e-06, + "loss": 0.6167, + "step": 15175 + }, + { + "epoch": 0.53, + "learning_rate": 9.195111680433746e-06, + "loss": 0.6244, + "step": 15176 + }, + { + "epoch": 0.53, + "learning_rate": 9.19402635324094e-06, + "loss": 0.6489, + "step": 15177 + }, + { + "epoch": 0.53, + "learning_rate": 9.192941035603971e-06, + "loss": 0.6932, + "step": 15178 + }, + { + "epoch": 0.53, + "learning_rate": 9.191855727535712e-06, + "loss": 0.6511, + "step": 15179 + }, + { + "epoch": 0.53, + "learning_rate": 9.19077042904902e-06, + "loss": 0.6462, + "step": 15180 + }, + { + "epoch": 0.53, + "learning_rate": 9.189685140156768e-06, + "loss": 0.6056, + "step": 15181 + }, + { + "epoch": 0.53, + "learning_rate": 9.188599860871828e-06, + "loss": 0.5765, + "step": 15182 + }, + { + "epoch": 0.53, + "learning_rate": 9.18751459120706e-06, + "loss": 0.6698, + "step": 15183 + }, + { + "epoch": 0.53, + "learning_rate": 9.186429331175335e-06, + "loss": 0.5973, + "step": 15184 + }, + { + "epoch": 0.53, + "learning_rate": 9.185344080789522e-06, + "loss": 0.6599, + "step": 15185 + }, + { + "epoch": 0.53, + "learning_rate": 9.184258840062482e-06, + "loss": 0.651, + "step": 15186 + }, + { + "epoch": 0.53, + "learning_rate": 9.183173609007085e-06, + "loss": 0.5947, + "step": 15187 + }, + { + "epoch": 0.53, + "learning_rate": 9.182088387636202e-06, + "loss": 0.6601, + "step": 15188 + }, + { + "epoch": 0.53, + "learning_rate": 9.181003175962693e-06, + "loss": 0.6376, + "step": 15189 + }, + { + "epoch": 0.53, + "learning_rate": 9.179917973999427e-06, + "loss": 0.6686, + "step": 15190 + }, + { + "epoch": 0.53, + "learning_rate": 9.178832781759272e-06, + "loss": 0.659, + "step": 15191 + }, + { + "epoch": 0.53, + "learning_rate": 9.177747599255094e-06, + "loss": 0.6268, + "step": 15192 + }, + { + "epoch": 0.53, + "learning_rate": 9.176662426499757e-06, + "loss": 0.6315, + "step": 15193 + }, + { + "epoch": 0.53, + "learning_rate": 9.175577263506129e-06, + "loss": 0.6701, + "step": 15194 + }, + { + "epoch": 0.53, + "learning_rate": 9.174492110287074e-06, + "loss": 0.615, + "step": 15195 + }, + { + "epoch": 0.53, + "learning_rate": 9.17340696685546e-06, + "loss": 0.6114, + "step": 15196 + }, + { + "epoch": 0.53, + "learning_rate": 9.172321833224153e-06, + "loss": 0.6404, + "step": 15197 + }, + { + "epoch": 0.53, + "learning_rate": 9.171236709406017e-06, + "loss": 0.5947, + "step": 15198 + }, + { + "epoch": 0.53, + "learning_rate": 9.17015159541392e-06, + "loss": 0.5986, + "step": 15199 + }, + { + "epoch": 0.53, + "learning_rate": 9.169066491260724e-06, + "loss": 0.6469, + "step": 15200 + }, + { + "epoch": 0.53, + "learning_rate": 9.167981396959294e-06, + "loss": 0.6466, + "step": 15201 + }, + { + "epoch": 0.53, + "learning_rate": 9.166896312522499e-06, + "loss": 0.6043, + "step": 15202 + }, + { + "epoch": 0.53, + "learning_rate": 9.165811237963203e-06, + "loss": 0.6457, + "step": 15203 + }, + { + "epoch": 0.53, + "learning_rate": 9.164726173294269e-06, + "loss": 0.6134, + "step": 15204 + }, + { + "epoch": 0.53, + "learning_rate": 9.163641118528563e-06, + "loss": 0.609, + "step": 15205 + }, + { + "epoch": 0.53, + "learning_rate": 9.16255607367895e-06, + "loss": 0.6316, + "step": 15206 + }, + { + "epoch": 0.53, + "learning_rate": 9.161471038758292e-06, + "loss": 0.612, + "step": 15207 + }, + { + "epoch": 0.53, + "learning_rate": 9.160386013779457e-06, + "loss": 0.6672, + "step": 15208 + }, + { + "epoch": 0.53, + "learning_rate": 9.159300998755309e-06, + "loss": 0.619, + "step": 15209 + }, + { + "epoch": 0.53, + "learning_rate": 9.15821599369871e-06, + "loss": 0.7012, + "step": 15210 + }, + { + "epoch": 0.53, + "learning_rate": 9.157130998622525e-06, + "loss": 0.6108, + "step": 15211 + }, + { + "epoch": 0.53, + "learning_rate": 9.15604601353962e-06, + "loss": 0.6274, + "step": 15212 + }, + { + "epoch": 0.53, + "learning_rate": 9.154961038462854e-06, + "loss": 0.6791, + "step": 15213 + }, + { + "epoch": 0.53, + "learning_rate": 9.1538760734051e-06, + "loss": 0.6391, + "step": 15214 + }, + { + "epoch": 0.53, + "learning_rate": 9.152791118379209e-06, + "loss": 0.6766, + "step": 15215 + }, + { + "epoch": 0.53, + "learning_rate": 9.151706173398053e-06, + "loss": 0.6807, + "step": 15216 + }, + { + "epoch": 0.53, + "learning_rate": 9.150621238474497e-06, + "loss": 0.5966, + "step": 15217 + }, + { + "epoch": 0.53, + "learning_rate": 9.149536313621394e-06, + "loss": 0.6922, + "step": 15218 + }, + { + "epoch": 0.53, + "learning_rate": 9.148451398851616e-06, + "loss": 0.6279, + "step": 15219 + }, + { + "epoch": 0.53, + "learning_rate": 9.147366494178029e-06, + "loss": 0.6662, + "step": 15220 + }, + { + "epoch": 0.53, + "learning_rate": 9.146281599613484e-06, + "loss": 0.5877, + "step": 15221 + }, + { + "epoch": 0.53, + "learning_rate": 9.145196715170853e-06, + "loss": 0.6046, + "step": 15222 + }, + { + "epoch": 0.53, + "learning_rate": 9.144111840863e-06, + "loss": 0.6208, + "step": 15223 + }, + { + "epoch": 0.53, + "learning_rate": 9.143026976702778e-06, + "loss": 0.6714, + "step": 15224 + }, + { + "epoch": 0.53, + "learning_rate": 9.141942122703057e-06, + "loss": 0.643, + "step": 15225 + }, + { + "epoch": 0.53, + "learning_rate": 9.140857278876702e-06, + "loss": 0.6048, + "step": 15226 + }, + { + "epoch": 0.53, + "learning_rate": 9.139772445236564e-06, + "loss": 0.6686, + "step": 15227 + }, + { + "epoch": 0.53, + "learning_rate": 9.138687621795515e-06, + "loss": 0.6344, + "step": 15228 + }, + { + "epoch": 0.53, + "learning_rate": 9.137602808566417e-06, + "loss": 0.6198, + "step": 15229 + }, + { + "epoch": 0.53, + "learning_rate": 9.136518005562122e-06, + "loss": 0.6149, + "step": 15230 + }, + { + "epoch": 0.53, + "learning_rate": 9.1354332127955e-06, + "loss": 0.6538, + "step": 15231 + }, + { + "epoch": 0.53, + "learning_rate": 9.134348430279418e-06, + "loss": 0.6279, + "step": 15232 + }, + { + "epoch": 0.53, + "learning_rate": 9.133263658026722e-06, + "loss": 0.6588, + "step": 15233 + }, + { + "epoch": 0.53, + "learning_rate": 9.132178896050285e-06, + "loss": 0.6424, + "step": 15234 + }, + { + "epoch": 0.53, + "learning_rate": 9.13109414436297e-06, + "loss": 0.5943, + "step": 15235 + }, + { + "epoch": 0.53, + "learning_rate": 9.130009402977622e-06, + "loss": 0.6001, + "step": 15236 + }, + { + "epoch": 0.53, + "learning_rate": 9.12892467190712e-06, + "loss": 0.5578, + "step": 15237 + }, + { + "epoch": 0.53, + "learning_rate": 9.127839951164321e-06, + "loss": 0.6642, + "step": 15238 + }, + { + "epoch": 0.53, + "learning_rate": 9.126755240762075e-06, + "loss": 0.6447, + "step": 15239 + }, + { + "epoch": 0.53, + "learning_rate": 9.125670540713253e-06, + "loss": 0.5916, + "step": 15240 + }, + { + "epoch": 0.53, + "learning_rate": 9.124585851030719e-06, + "loss": 0.6483, + "step": 15241 + }, + { + "epoch": 0.53, + "learning_rate": 9.123501171727318e-06, + "loss": 0.6345, + "step": 15242 + }, + { + "epoch": 0.53, + "learning_rate": 9.122416502815923e-06, + "loss": 0.6138, + "step": 15243 + }, + { + "epoch": 0.53, + "learning_rate": 9.121331844309394e-06, + "loss": 0.6374, + "step": 15244 + }, + { + "epoch": 0.53, + "learning_rate": 9.120247196220581e-06, + "loss": 0.683, + "step": 15245 + }, + { + "epoch": 0.53, + "learning_rate": 9.119162558562353e-06, + "loss": 0.6589, + "step": 15246 + }, + { + "epoch": 0.53, + "learning_rate": 9.118077931347571e-06, + "loss": 0.5562, + "step": 15247 + }, + { + "epoch": 0.53, + "learning_rate": 9.116993314589085e-06, + "loss": 0.6954, + "step": 15248 + }, + { + "epoch": 0.53, + "learning_rate": 9.115908708299762e-06, + "loss": 0.5741, + "step": 15249 + }, + { + "epoch": 0.53, + "learning_rate": 9.114824112492464e-06, + "loss": 0.6855, + "step": 15250 + }, + { + "epoch": 0.53, + "learning_rate": 9.11373952718004e-06, + "loss": 0.6381, + "step": 15251 + }, + { + "epoch": 0.53, + "learning_rate": 9.112654952375358e-06, + "loss": 0.6546, + "step": 15252 + }, + { + "epoch": 0.53, + "learning_rate": 9.111570388091276e-06, + "loss": 0.6518, + "step": 15253 + }, + { + "epoch": 0.53, + "learning_rate": 9.110485834340646e-06, + "loss": 0.5756, + "step": 15254 + }, + { + "epoch": 0.53, + "learning_rate": 9.109401291136333e-06, + "loss": 0.6336, + "step": 15255 + }, + { + "epoch": 0.53, + "learning_rate": 9.108316758491198e-06, + "loss": 0.643, + "step": 15256 + }, + { + "epoch": 0.53, + "learning_rate": 9.10723223641809e-06, + "loss": 0.6306, + "step": 15257 + }, + { + "epoch": 0.53, + "learning_rate": 9.106147724929878e-06, + "loss": 0.6248, + "step": 15258 + }, + { + "epoch": 0.53, + "learning_rate": 9.105063224039416e-06, + "loss": 0.6698, + "step": 15259 + }, + { + "epoch": 0.53, + "learning_rate": 9.103978733759556e-06, + "loss": 0.6328, + "step": 15260 + }, + { + "epoch": 0.53, + "learning_rate": 9.102894254103165e-06, + "loss": 0.6287, + "step": 15261 + }, + { + "epoch": 0.53, + "learning_rate": 9.1018097850831e-06, + "loss": 0.6377, + "step": 15262 + }, + { + "epoch": 0.53, + "learning_rate": 9.100725326712211e-06, + "loss": 0.6712, + "step": 15263 + }, + { + "epoch": 0.53, + "learning_rate": 9.099640879003363e-06, + "loss": 0.6812, + "step": 15264 + }, + { + "epoch": 0.53, + "learning_rate": 9.098556441969414e-06, + "loss": 0.6583, + "step": 15265 + }, + { + "epoch": 0.53, + "learning_rate": 9.097472015623218e-06, + "loss": 0.6226, + "step": 15266 + }, + { + "epoch": 0.53, + "learning_rate": 9.096387599977627e-06, + "loss": 0.5932, + "step": 15267 + }, + { + "epoch": 0.53, + "learning_rate": 9.095303195045513e-06, + "loss": 0.6344, + "step": 15268 + }, + { + "epoch": 0.53, + "learning_rate": 9.094218800839719e-06, + "loss": 0.6336, + "step": 15269 + }, + { + "epoch": 0.53, + "learning_rate": 9.093134417373105e-06, + "loss": 0.6219, + "step": 15270 + }, + { + "epoch": 0.53, + "learning_rate": 9.092050044658535e-06, + "loss": 0.658, + "step": 15271 + }, + { + "epoch": 0.53, + "learning_rate": 9.090965682708858e-06, + "loss": 0.5875, + "step": 15272 + }, + { + "epoch": 0.53, + "learning_rate": 9.08988133153693e-06, + "loss": 0.6308, + "step": 15273 + }, + { + "epoch": 0.53, + "learning_rate": 9.088796991155614e-06, + "loss": 0.6476, + "step": 15274 + }, + { + "epoch": 0.53, + "learning_rate": 9.08771266157776e-06, + "loss": 0.6019, + "step": 15275 + }, + { + "epoch": 0.53, + "learning_rate": 9.08662834281623e-06, + "loss": 0.6411, + "step": 15276 + }, + { + "epoch": 0.53, + "learning_rate": 9.085544034883873e-06, + "loss": 0.6228, + "step": 15277 + }, + { + "epoch": 0.53, + "learning_rate": 9.084459737793548e-06, + "loss": 0.67, + "step": 15278 + }, + { + "epoch": 0.53, + "learning_rate": 9.083375451558113e-06, + "loss": 0.6171, + "step": 15279 + }, + { + "epoch": 0.53, + "learning_rate": 9.08229117619042e-06, + "loss": 0.5955, + "step": 15280 + }, + { + "epoch": 0.53, + "learning_rate": 9.081206911703325e-06, + "loss": 0.6443, + "step": 15281 + }, + { + "epoch": 0.53, + "learning_rate": 9.080122658109689e-06, + "loss": 0.6671, + "step": 15282 + }, + { + "epoch": 0.53, + "learning_rate": 9.079038415422357e-06, + "loss": 0.6563, + "step": 15283 + }, + { + "epoch": 0.53, + "learning_rate": 9.077954183654191e-06, + "loss": 0.6091, + "step": 15284 + }, + { + "epoch": 0.53, + "learning_rate": 9.076869962818048e-06, + "loss": 0.6616, + "step": 15285 + }, + { + "epoch": 0.53, + "learning_rate": 9.075785752926776e-06, + "loss": 0.6327, + "step": 15286 + }, + { + "epoch": 0.53, + "learning_rate": 9.074701553993233e-06, + "loss": 0.6694, + "step": 15287 + }, + { + "epoch": 0.53, + "learning_rate": 9.073617366030276e-06, + "loss": 0.6034, + "step": 15288 + }, + { + "epoch": 0.53, + "learning_rate": 9.072533189050754e-06, + "loss": 0.6384, + "step": 15289 + }, + { + "epoch": 0.53, + "learning_rate": 9.071449023067526e-06, + "loss": 0.6448, + "step": 15290 + }, + { + "epoch": 0.53, + "learning_rate": 9.070364868093446e-06, + "loss": 0.606, + "step": 15291 + }, + { + "epoch": 0.53, + "learning_rate": 9.069280724141364e-06, + "loss": 0.6146, + "step": 15292 + }, + { + "epoch": 0.53, + "learning_rate": 9.068196591224135e-06, + "loss": 0.6686, + "step": 15293 + }, + { + "epoch": 0.53, + "learning_rate": 9.067112469354618e-06, + "loss": 0.6855, + "step": 15294 + }, + { + "epoch": 0.53, + "learning_rate": 9.06602835854566e-06, + "loss": 0.6301, + "step": 15295 + }, + { + "epoch": 0.53, + "learning_rate": 9.064944258810118e-06, + "loss": 0.6358, + "step": 15296 + }, + { + "epoch": 0.53, + "learning_rate": 9.063860170160847e-06, + "loss": 0.5933, + "step": 15297 + }, + { + "epoch": 0.53, + "learning_rate": 9.062776092610695e-06, + "loss": 0.6437, + "step": 15298 + }, + { + "epoch": 0.53, + "learning_rate": 9.061692026172517e-06, + "loss": 0.6004, + "step": 15299 + }, + { + "epoch": 0.53, + "learning_rate": 9.060607970859171e-06, + "loss": 0.6553, + "step": 15300 + }, + { + "epoch": 0.53, + "learning_rate": 9.059523926683504e-06, + "loss": 0.6246, + "step": 15301 + }, + { + "epoch": 0.53, + "learning_rate": 9.058439893658368e-06, + "loss": 0.6347, + "step": 15302 + }, + { + "epoch": 0.53, + "learning_rate": 9.057355871796622e-06, + "loss": 0.5601, + "step": 15303 + }, + { + "epoch": 0.53, + "learning_rate": 9.056271861111112e-06, + "loss": 0.6398, + "step": 15304 + }, + { + "epoch": 0.53, + "learning_rate": 9.055187861614694e-06, + "loss": 0.6053, + "step": 15305 + }, + { + "epoch": 0.53, + "learning_rate": 9.05410387332022e-06, + "loss": 0.6093, + "step": 15306 + }, + { + "epoch": 0.53, + "learning_rate": 9.05301989624054e-06, + "loss": 0.6038, + "step": 15307 + }, + { + "epoch": 0.53, + "learning_rate": 9.051935930388505e-06, + "loss": 0.6216, + "step": 15308 + }, + { + "epoch": 0.53, + "learning_rate": 9.050851975776974e-06, + "loss": 0.6264, + "step": 15309 + }, + { + "epoch": 0.53, + "learning_rate": 9.04976803241879e-06, + "loss": 0.6111, + "step": 15310 + }, + { + "epoch": 0.53, + "learning_rate": 9.048684100326807e-06, + "loss": 0.6115, + "step": 15311 + }, + { + "epoch": 0.53, + "learning_rate": 9.04760017951388e-06, + "loss": 0.5825, + "step": 15312 + }, + { + "epoch": 0.53, + "learning_rate": 9.046516269992856e-06, + "loss": 0.6246, + "step": 15313 + }, + { + "epoch": 0.53, + "learning_rate": 9.045432371776588e-06, + "loss": 0.6647, + "step": 15314 + }, + { + "epoch": 0.53, + "learning_rate": 9.04434848487793e-06, + "loss": 0.6266, + "step": 15315 + }, + { + "epoch": 0.53, + "learning_rate": 9.043264609309725e-06, + "loss": 0.6508, + "step": 15316 + }, + { + "epoch": 0.53, + "learning_rate": 9.042180745084829e-06, + "loss": 0.6313, + "step": 15317 + }, + { + "epoch": 0.53, + "learning_rate": 9.041096892216095e-06, + "loss": 0.6503, + "step": 15318 + }, + { + "epoch": 0.53, + "learning_rate": 9.04001305071637e-06, + "loss": 0.6051, + "step": 15319 + }, + { + "epoch": 0.53, + "learning_rate": 9.0389292205985e-06, + "loss": 0.6323, + "step": 15320 + }, + { + "epoch": 0.53, + "learning_rate": 9.037845401875344e-06, + "loss": 0.618, + "step": 15321 + }, + { + "epoch": 0.53, + "learning_rate": 9.036761594559747e-06, + "loss": 0.6328, + "step": 15322 + }, + { + "epoch": 0.53, + "learning_rate": 9.03567779866456e-06, + "loss": 0.6471, + "step": 15323 + }, + { + "epoch": 0.53, + "learning_rate": 9.034594014202634e-06, + "loss": 0.6947, + "step": 15324 + }, + { + "epoch": 0.53, + "learning_rate": 9.033510241186814e-06, + "loss": 0.6369, + "step": 15325 + }, + { + "epoch": 0.53, + "learning_rate": 9.032426479629953e-06, + "loss": 0.6208, + "step": 15326 + }, + { + "epoch": 0.53, + "learning_rate": 9.031342729544903e-06, + "loss": 0.612, + "step": 15327 + }, + { + "epoch": 0.53, + "learning_rate": 9.030258990944506e-06, + "loss": 0.6023, + "step": 15328 + }, + { + "epoch": 0.53, + "learning_rate": 9.029175263841618e-06, + "loss": 0.6194, + "step": 15329 + }, + { + "epoch": 0.53, + "learning_rate": 9.028091548249086e-06, + "loss": 0.5634, + "step": 15330 + }, + { + "epoch": 0.53, + "learning_rate": 9.027007844179758e-06, + "loss": 0.6433, + "step": 15331 + }, + { + "epoch": 0.53, + "learning_rate": 9.025924151646482e-06, + "loss": 0.5847, + "step": 15332 + }, + { + "epoch": 0.53, + "learning_rate": 9.024840470662109e-06, + "loss": 0.6398, + "step": 15333 + }, + { + "epoch": 0.53, + "learning_rate": 9.023756801239484e-06, + "loss": 0.6121, + "step": 15334 + }, + { + "epoch": 0.53, + "learning_rate": 9.022673143391457e-06, + "loss": 0.6553, + "step": 15335 + }, + { + "epoch": 0.53, + "learning_rate": 9.021589497130879e-06, + "loss": 0.6194, + "step": 15336 + }, + { + "epoch": 0.53, + "learning_rate": 9.020505862470592e-06, + "loss": 0.5737, + "step": 15337 + }, + { + "epoch": 0.53, + "learning_rate": 9.019422239423448e-06, + "loss": 0.641, + "step": 15338 + }, + { + "epoch": 0.53, + "learning_rate": 9.018338628002293e-06, + "loss": 0.6431, + "step": 15339 + }, + { + "epoch": 0.53, + "learning_rate": 9.017255028219976e-06, + "loss": 0.6718, + "step": 15340 + }, + { + "epoch": 0.53, + "learning_rate": 9.016171440089345e-06, + "loss": 0.6694, + "step": 15341 + }, + { + "epoch": 0.53, + "learning_rate": 9.015087863623245e-06, + "loss": 0.5901, + "step": 15342 + }, + { + "epoch": 0.53, + "learning_rate": 9.014004298834523e-06, + "loss": 0.6643, + "step": 15343 + }, + { + "epoch": 0.53, + "learning_rate": 9.012920745736031e-06, + "loss": 0.6222, + "step": 15344 + }, + { + "epoch": 0.53, + "learning_rate": 9.011837204340609e-06, + "loss": 0.6434, + "step": 15345 + }, + { + "epoch": 0.53, + "learning_rate": 9.010753674661107e-06, + "loss": 0.5609, + "step": 15346 + }, + { + "epoch": 0.53, + "learning_rate": 9.009670156710374e-06, + "loss": 0.6292, + "step": 15347 + }, + { + "epoch": 0.53, + "learning_rate": 9.008586650501251e-06, + "loss": 0.6305, + "step": 15348 + }, + { + "epoch": 0.53, + "learning_rate": 9.007503156046589e-06, + "loss": 0.6056, + "step": 15349 + }, + { + "epoch": 0.53, + "learning_rate": 9.006419673359234e-06, + "loss": 0.6867, + "step": 15350 + }, + { + "epoch": 0.53, + "learning_rate": 9.00533620245203e-06, + "loss": 0.6548, + "step": 15351 + }, + { + "epoch": 0.53, + "learning_rate": 9.004252743337822e-06, + "loss": 0.6314, + "step": 15352 + }, + { + "epoch": 0.53, + "learning_rate": 9.003169296029459e-06, + "loss": 0.6701, + "step": 15353 + }, + { + "epoch": 0.53, + "learning_rate": 9.002085860539782e-06, + "loss": 0.6231, + "step": 15354 + }, + { + "epoch": 0.53, + "learning_rate": 9.001002436881643e-06, + "loss": 0.6338, + "step": 15355 + }, + { + "epoch": 0.53, + "learning_rate": 8.999919025067883e-06, + "loss": 0.6378, + "step": 15356 + }, + { + "epoch": 0.53, + "learning_rate": 8.998835625111347e-06, + "loss": 0.6105, + "step": 15357 + }, + { + "epoch": 0.53, + "learning_rate": 8.997752237024882e-06, + "loss": 0.5909, + "step": 15358 + }, + { + "epoch": 0.53, + "learning_rate": 8.996668860821333e-06, + "loss": 0.6494, + "step": 15359 + }, + { + "epoch": 0.53, + "learning_rate": 8.99558549651354e-06, + "loss": 0.6103, + "step": 15360 + }, + { + "epoch": 0.53, + "learning_rate": 8.994502144114356e-06, + "loss": 0.6183, + "step": 15361 + }, + { + "epoch": 0.53, + "learning_rate": 8.99341880363662e-06, + "loss": 0.6801, + "step": 15362 + }, + { + "epoch": 0.53, + "learning_rate": 8.992335475093176e-06, + "loss": 0.5923, + "step": 15363 + }, + { + "epoch": 0.53, + "learning_rate": 8.99125215849687e-06, + "loss": 0.6284, + "step": 15364 + }, + { + "epoch": 0.53, + "learning_rate": 8.990168853860548e-06, + "loss": 0.6361, + "step": 15365 + }, + { + "epoch": 0.53, + "learning_rate": 8.989085561197048e-06, + "loss": 0.5774, + "step": 15366 + }, + { + "epoch": 0.53, + "learning_rate": 8.98800228051922e-06, + "loss": 0.5968, + "step": 15367 + }, + { + "epoch": 0.53, + "learning_rate": 8.986919011839903e-06, + "loss": 0.6179, + "step": 15368 + }, + { + "epoch": 0.53, + "learning_rate": 8.985835755171945e-06, + "loss": 0.6429, + "step": 15369 + }, + { + "epoch": 0.53, + "learning_rate": 8.984752510528185e-06, + "loss": 0.6472, + "step": 15370 + }, + { + "epoch": 0.53, + "learning_rate": 8.983669277921471e-06, + "loss": 0.6247, + "step": 15371 + }, + { + "epoch": 0.53, + "learning_rate": 8.982586057364642e-06, + "loss": 0.6443, + "step": 15372 + }, + { + "epoch": 0.53, + "learning_rate": 8.98150284887054e-06, + "loss": 0.6061, + "step": 15373 + }, + { + "epoch": 0.53, + "learning_rate": 8.980419652452013e-06, + "loss": 0.6396, + "step": 15374 + }, + { + "epoch": 0.53, + "learning_rate": 8.9793364681219e-06, + "loss": 0.6241, + "step": 15375 + }, + { + "epoch": 0.53, + "learning_rate": 8.978253295893045e-06, + "loss": 0.5908, + "step": 15376 + }, + { + "epoch": 0.53, + "learning_rate": 8.97717013577829e-06, + "loss": 0.6134, + "step": 15377 + }, + { + "epoch": 0.53, + "learning_rate": 8.976086987790474e-06, + "loss": 0.6224, + "step": 15378 + }, + { + "epoch": 0.53, + "learning_rate": 8.975003851942445e-06, + "loss": 0.6466, + "step": 15379 + }, + { + "epoch": 0.53, + "learning_rate": 8.973920728247041e-06, + "loss": 0.6273, + "step": 15380 + }, + { + "epoch": 0.53, + "learning_rate": 8.972837616717106e-06, + "loss": 0.6261, + "step": 15381 + }, + { + "epoch": 0.53, + "learning_rate": 8.971754517365476e-06, + "loss": 0.6788, + "step": 15382 + }, + { + "epoch": 0.53, + "learning_rate": 8.970671430205003e-06, + "loss": 0.5891, + "step": 15383 + }, + { + "epoch": 0.53, + "learning_rate": 8.969588355248517e-06, + "loss": 0.6602, + "step": 15384 + }, + { + "epoch": 0.53, + "learning_rate": 8.968505292508867e-06, + "loss": 0.633, + "step": 15385 + }, + { + "epoch": 0.53, + "learning_rate": 8.967422241998894e-06, + "loss": 0.6791, + "step": 15386 + }, + { + "epoch": 0.53, + "learning_rate": 8.966339203731432e-06, + "loss": 0.6922, + "step": 15387 + }, + { + "epoch": 0.53, + "learning_rate": 8.965256177719328e-06, + "loss": 0.6028, + "step": 15388 + }, + { + "epoch": 0.53, + "learning_rate": 8.964173163975422e-06, + "loss": 0.612, + "step": 15389 + }, + { + "epoch": 0.53, + "learning_rate": 8.963090162512553e-06, + "loss": 0.6519, + "step": 15390 + }, + { + "epoch": 0.53, + "learning_rate": 8.96200717334356e-06, + "loss": 0.6538, + "step": 15391 + }, + { + "epoch": 0.53, + "learning_rate": 8.96092419648129e-06, + "loss": 0.6388, + "step": 15392 + }, + { + "epoch": 0.53, + "learning_rate": 8.959841231938574e-06, + "loss": 0.6433, + "step": 15393 + }, + { + "epoch": 0.53, + "learning_rate": 8.958758279728255e-06, + "loss": 0.6312, + "step": 15394 + }, + { + "epoch": 0.53, + "learning_rate": 8.957675339863177e-06, + "loss": 0.602, + "step": 15395 + }, + { + "epoch": 0.53, + "learning_rate": 8.956592412356174e-06, + "loss": 0.6522, + "step": 15396 + }, + { + "epoch": 0.53, + "learning_rate": 8.955509497220089e-06, + "loss": 0.6247, + "step": 15397 + }, + { + "epoch": 0.53, + "learning_rate": 8.95442659446776e-06, + "loss": 0.6027, + "step": 15398 + }, + { + "epoch": 0.53, + "learning_rate": 8.953343704112026e-06, + "loss": 0.619, + "step": 15399 + }, + { + "epoch": 0.53, + "learning_rate": 8.952260826165728e-06, + "loss": 0.6302, + "step": 15400 + }, + { + "epoch": 0.53, + "learning_rate": 8.9511779606417e-06, + "loss": 0.6249, + "step": 15401 + }, + { + "epoch": 0.53, + "learning_rate": 8.950095107552788e-06, + "loss": 0.6345, + "step": 15402 + }, + { + "epoch": 0.53, + "learning_rate": 8.949012266911825e-06, + "loss": 0.5572, + "step": 15403 + }, + { + "epoch": 0.53, + "learning_rate": 8.94792943873165e-06, + "loss": 0.6535, + "step": 15404 + }, + { + "epoch": 0.53, + "learning_rate": 8.946846623025103e-06, + "loss": 0.6541, + "step": 15405 + }, + { + "epoch": 0.53, + "learning_rate": 8.945763819805023e-06, + "loss": 0.5769, + "step": 15406 + }, + { + "epoch": 0.53, + "learning_rate": 8.944681029084244e-06, + "loss": 0.6007, + "step": 15407 + }, + { + "epoch": 0.53, + "learning_rate": 8.943598250875607e-06, + "loss": 0.6088, + "step": 15408 + }, + { + "epoch": 0.53, + "learning_rate": 8.942515485191952e-06, + "loss": 0.6371, + "step": 15409 + }, + { + "epoch": 0.53, + "learning_rate": 8.94143273204611e-06, + "loss": 0.6156, + "step": 15410 + }, + { + "epoch": 0.53, + "learning_rate": 8.940349991450923e-06, + "loss": 0.6685, + "step": 15411 + }, + { + "epoch": 0.53, + "learning_rate": 8.93926726341923e-06, + "loss": 0.6311, + "step": 15412 + }, + { + "epoch": 0.53, + "learning_rate": 8.938184547963862e-06, + "loss": 0.6995, + "step": 15413 + }, + { + "epoch": 0.53, + "learning_rate": 8.93710184509766e-06, + "loss": 0.5842, + "step": 15414 + }, + { + "epoch": 0.53, + "learning_rate": 8.936019154833461e-06, + "loss": 0.672, + "step": 15415 + }, + { + "epoch": 0.53, + "learning_rate": 8.9349364771841e-06, + "loss": 0.6925, + "step": 15416 + }, + { + "epoch": 0.53, + "learning_rate": 8.933853812162416e-06, + "loss": 0.6428, + "step": 15417 + }, + { + "epoch": 0.53, + "learning_rate": 8.932771159781243e-06, + "loss": 0.6419, + "step": 15418 + }, + { + "epoch": 0.53, + "learning_rate": 8.931688520053418e-06, + "loss": 0.6367, + "step": 15419 + }, + { + "epoch": 0.53, + "learning_rate": 8.930605892991775e-06, + "loss": 0.6153, + "step": 15420 + }, + { + "epoch": 0.53, + "learning_rate": 8.929523278609156e-06, + "loss": 0.7123, + "step": 15421 + }, + { + "epoch": 0.53, + "learning_rate": 8.92844067691839e-06, + "loss": 0.6983, + "step": 15422 + }, + { + "epoch": 0.53, + "learning_rate": 8.927358087932313e-06, + "loss": 0.6168, + "step": 15423 + }, + { + "epoch": 0.53, + "learning_rate": 8.926275511663768e-06, + "loss": 0.655, + "step": 15424 + }, + { + "epoch": 0.53, + "learning_rate": 8.925192948125581e-06, + "loss": 0.5992, + "step": 15425 + }, + { + "epoch": 0.53, + "learning_rate": 8.924110397330591e-06, + "loss": 0.6032, + "step": 15426 + }, + { + "epoch": 0.53, + "learning_rate": 8.923027859291638e-06, + "loss": 0.6102, + "step": 15427 + }, + { + "epoch": 0.53, + "learning_rate": 8.921945334021549e-06, + "loss": 0.6638, + "step": 15428 + }, + { + "epoch": 0.53, + "learning_rate": 8.92086282153316e-06, + "loss": 0.6656, + "step": 15429 + }, + { + "epoch": 0.53, + "learning_rate": 8.91978032183931e-06, + "loss": 0.647, + "step": 15430 + }, + { + "epoch": 0.53, + "learning_rate": 8.918697834952831e-06, + "loss": 0.6058, + "step": 15431 + }, + { + "epoch": 0.53, + "learning_rate": 8.917615360886554e-06, + "loss": 0.6469, + "step": 15432 + }, + { + "epoch": 0.53, + "learning_rate": 8.91653289965332e-06, + "loss": 0.6501, + "step": 15433 + }, + { + "epoch": 0.53, + "learning_rate": 8.915450451265957e-06, + "loss": 0.6073, + "step": 15434 + }, + { + "epoch": 0.53, + "learning_rate": 8.914368015737301e-06, + "loss": 0.582, + "step": 15435 + }, + { + "epoch": 0.53, + "learning_rate": 8.913285593080186e-06, + "loss": 0.6556, + "step": 15436 + }, + { + "epoch": 0.53, + "learning_rate": 8.912203183307444e-06, + "loss": 0.6219, + "step": 15437 + }, + { + "epoch": 0.53, + "learning_rate": 8.911120786431909e-06, + "loss": 0.6437, + "step": 15438 + }, + { + "epoch": 0.53, + "learning_rate": 8.910038402466417e-06, + "loss": 0.6135, + "step": 15439 + }, + { + "epoch": 0.53, + "learning_rate": 8.908956031423796e-06, + "loss": 0.6879, + "step": 15440 + }, + { + "epoch": 0.53, + "learning_rate": 8.907873673316882e-06, + "loss": 0.6935, + "step": 15441 + }, + { + "epoch": 0.54, + "learning_rate": 8.90679132815851e-06, + "loss": 0.6241, + "step": 15442 + }, + { + "epoch": 0.54, + "learning_rate": 8.905708995961506e-06, + "loss": 0.6311, + "step": 15443 + }, + { + "epoch": 0.54, + "learning_rate": 8.904626676738707e-06, + "loss": 0.6006, + "step": 15444 + }, + { + "epoch": 0.54, + "learning_rate": 8.903544370502945e-06, + "loss": 0.5973, + "step": 15445 + }, + { + "epoch": 0.54, + "learning_rate": 8.902462077267051e-06, + "loss": 0.695, + "step": 15446 + }, + { + "epoch": 0.54, + "learning_rate": 8.901379797043858e-06, + "loss": 0.6492, + "step": 15447 + }, + { + "epoch": 0.54, + "learning_rate": 8.900297529846199e-06, + "loss": 0.6438, + "step": 15448 + }, + { + "epoch": 0.54, + "learning_rate": 8.8992152756869e-06, + "loss": 0.6312, + "step": 15449 + }, + { + "epoch": 0.54, + "learning_rate": 8.8981330345788e-06, + "loss": 0.6297, + "step": 15450 + }, + { + "epoch": 0.54, + "learning_rate": 8.897050806534725e-06, + "loss": 0.6497, + "step": 15451 + }, + { + "epoch": 0.54, + "learning_rate": 8.895968591567507e-06, + "loss": 0.628, + "step": 15452 + }, + { + "epoch": 0.54, + "learning_rate": 8.894886389689978e-06, + "loss": 0.6482, + "step": 15453 + }, + { + "epoch": 0.54, + "learning_rate": 8.893804200914972e-06, + "loss": 0.6254, + "step": 15454 + }, + { + "epoch": 0.54, + "learning_rate": 8.892722025255315e-06, + "loss": 0.6059, + "step": 15455 + }, + { + "epoch": 0.54, + "learning_rate": 8.891639862723836e-06, + "loss": 0.6199, + "step": 15456 + }, + { + "epoch": 0.54, + "learning_rate": 8.890557713333374e-06, + "loss": 0.6587, + "step": 15457 + }, + { + "epoch": 0.54, + "learning_rate": 8.889475577096749e-06, + "loss": 0.6111, + "step": 15458 + }, + { + "epoch": 0.54, + "learning_rate": 8.888393454026797e-06, + "loss": 0.6671, + "step": 15459 + }, + { + "epoch": 0.54, + "learning_rate": 8.887311344136351e-06, + "loss": 0.5976, + "step": 15460 + }, + { + "epoch": 0.54, + "learning_rate": 8.88622924743823e-06, + "loss": 0.6454, + "step": 15461 + }, + { + "epoch": 0.54, + "learning_rate": 8.885147163945278e-06, + "loss": 0.6168, + "step": 15462 + }, + { + "epoch": 0.54, + "learning_rate": 8.88406509367031e-06, + "loss": 0.6503, + "step": 15463 + }, + { + "epoch": 0.54, + "learning_rate": 8.88298303662616e-06, + "loss": 0.6239, + "step": 15464 + }, + { + "epoch": 0.54, + "learning_rate": 8.881900992825666e-06, + "loss": 0.6188, + "step": 15465 + }, + { + "epoch": 0.54, + "learning_rate": 8.880818962281648e-06, + "loss": 0.661, + "step": 15466 + }, + { + "epoch": 0.54, + "learning_rate": 8.879736945006933e-06, + "loss": 0.6735, + "step": 15467 + }, + { + "epoch": 0.54, + "learning_rate": 8.87865494101436e-06, + "loss": 0.6144, + "step": 15468 + }, + { + "epoch": 0.54, + "learning_rate": 8.877572950316748e-06, + "loss": 0.6628, + "step": 15469 + }, + { + "epoch": 0.54, + "learning_rate": 8.876490972926925e-06, + "loss": 0.6396, + "step": 15470 + }, + { + "epoch": 0.54, + "learning_rate": 8.87540900885773e-06, + "loss": 0.6278, + "step": 15471 + }, + { + "epoch": 0.54, + "learning_rate": 8.874327058121979e-06, + "loss": 0.6256, + "step": 15472 + }, + { + "epoch": 0.54, + "learning_rate": 8.873245120732503e-06, + "loss": 0.6062, + "step": 15473 + }, + { + "epoch": 0.54, + "learning_rate": 8.872163196702138e-06, + "loss": 0.6361, + "step": 15474 + }, + { + "epoch": 0.54, + "learning_rate": 8.8710812860437e-06, + "loss": 0.6851, + "step": 15475 + }, + { + "epoch": 0.54, + "learning_rate": 8.86999938877002e-06, + "loss": 0.609, + "step": 15476 + }, + { + "epoch": 0.54, + "learning_rate": 8.868917504893933e-06, + "loss": 0.5786, + "step": 15477 + }, + { + "epoch": 0.54, + "learning_rate": 8.867835634428256e-06, + "loss": 0.6109, + "step": 15478 + }, + { + "epoch": 0.54, + "learning_rate": 8.866753777385817e-06, + "loss": 0.639, + "step": 15479 + }, + { + "epoch": 0.54, + "learning_rate": 8.865671933779451e-06, + "loss": 0.6635, + "step": 15480 + }, + { + "epoch": 0.54, + "learning_rate": 8.864590103621978e-06, + "loss": 0.6577, + "step": 15481 + }, + { + "epoch": 0.54, + "learning_rate": 8.86350828692622e-06, + "loss": 0.6773, + "step": 15482 + }, + { + "epoch": 0.54, + "learning_rate": 8.862426483705017e-06, + "loss": 0.6384, + "step": 15483 + }, + { + "epoch": 0.54, + "learning_rate": 8.861344693971183e-06, + "loss": 0.6307, + "step": 15484 + }, + { + "epoch": 0.54, + "learning_rate": 8.860262917737544e-06, + "loss": 0.6849, + "step": 15485 + }, + { + "epoch": 0.54, + "learning_rate": 8.859181155016937e-06, + "loss": 0.6583, + "step": 15486 + }, + { + "epoch": 0.54, + "learning_rate": 8.858099405822179e-06, + "loss": 0.6323, + "step": 15487 + }, + { + "epoch": 0.54, + "learning_rate": 8.857017670166093e-06, + "loss": 0.6567, + "step": 15488 + }, + { + "epoch": 0.54, + "learning_rate": 8.855935948061513e-06, + "loss": 0.7013, + "step": 15489 + }, + { + "epoch": 0.54, + "learning_rate": 8.854854239521258e-06, + "loss": 0.6186, + "step": 15490 + }, + { + "epoch": 0.54, + "learning_rate": 8.853772544558153e-06, + "loss": 0.6125, + "step": 15491 + }, + { + "epoch": 0.54, + "learning_rate": 8.852690863185029e-06, + "loss": 0.6037, + "step": 15492 + }, + { + "epoch": 0.54, + "learning_rate": 8.851609195414702e-06, + "loss": 0.5744, + "step": 15493 + }, + { + "epoch": 0.54, + "learning_rate": 8.85052754126e-06, + "loss": 0.6525, + "step": 15494 + }, + { + "epoch": 0.54, + "learning_rate": 8.849445900733752e-06, + "loss": 0.63, + "step": 15495 + }, + { + "epoch": 0.54, + "learning_rate": 8.848364273848775e-06, + "loss": 0.6385, + "step": 15496 + }, + { + "epoch": 0.54, + "learning_rate": 8.847282660617895e-06, + "loss": 0.6516, + "step": 15497 + }, + { + "epoch": 0.54, + "learning_rate": 8.846201061053943e-06, + "loss": 0.599, + "step": 15498 + }, + { + "epoch": 0.54, + "learning_rate": 8.845119475169733e-06, + "loss": 0.6232, + "step": 15499 + }, + { + "epoch": 0.54, + "learning_rate": 8.844037902978091e-06, + "loss": 0.6556, + "step": 15500 + }, + { + "epoch": 0.54, + "learning_rate": 8.842956344491848e-06, + "loss": 0.6273, + "step": 15501 + }, + { + "epoch": 0.54, + "learning_rate": 8.841874799723816e-06, + "loss": 0.622, + "step": 15502 + }, + { + "epoch": 0.54, + "learning_rate": 8.840793268686822e-06, + "loss": 0.6295, + "step": 15503 + }, + { + "epoch": 0.54, + "learning_rate": 8.839711751393698e-06, + "loss": 0.603, + "step": 15504 + }, + { + "epoch": 0.54, + "learning_rate": 8.838630247857252e-06, + "loss": 0.597, + "step": 15505 + }, + { + "epoch": 0.54, + "learning_rate": 8.837548758090311e-06, + "loss": 0.6222, + "step": 15506 + }, + { + "epoch": 0.54, + "learning_rate": 8.83646728210571e-06, + "loss": 0.6117, + "step": 15507 + }, + { + "epoch": 0.54, + "learning_rate": 8.835385819916254e-06, + "loss": 0.623, + "step": 15508 + }, + { + "epoch": 0.54, + "learning_rate": 8.834304371534772e-06, + "loss": 0.6333, + "step": 15509 + }, + { + "epoch": 0.54, + "learning_rate": 8.833222936974091e-06, + "loss": 0.6381, + "step": 15510 + }, + { + "epoch": 0.54, + "learning_rate": 8.832141516247025e-06, + "loss": 0.5541, + "step": 15511 + }, + { + "epoch": 0.54, + "learning_rate": 8.831060109366397e-06, + "loss": 0.6512, + "step": 15512 + }, + { + "epoch": 0.54, + "learning_rate": 8.829978716345035e-06, + "loss": 0.633, + "step": 15513 + }, + { + "epoch": 0.54, + "learning_rate": 8.828897337195752e-06, + "loss": 0.6432, + "step": 15514 + }, + { + "epoch": 0.54, + "learning_rate": 8.82781597193137e-06, + "loss": 0.6365, + "step": 15515 + }, + { + "epoch": 0.54, + "learning_rate": 8.826734620564719e-06, + "loss": 0.6715, + "step": 15516 + }, + { + "epoch": 0.54, + "learning_rate": 8.82565328310861e-06, + "loss": 0.6399, + "step": 15517 + }, + { + "epoch": 0.54, + "learning_rate": 8.824571959575863e-06, + "loss": 0.608, + "step": 15518 + }, + { + "epoch": 0.54, + "learning_rate": 8.82349064997931e-06, + "loss": 0.6137, + "step": 15519 + }, + { + "epoch": 0.54, + "learning_rate": 8.82240935433176e-06, + "loss": 0.6201, + "step": 15520 + }, + { + "epoch": 0.54, + "learning_rate": 8.821328072646033e-06, + "loss": 0.6376, + "step": 15521 + }, + { + "epoch": 0.54, + "learning_rate": 8.820246804934959e-06, + "loss": 0.635, + "step": 15522 + }, + { + "epoch": 0.54, + "learning_rate": 8.819165551211349e-06, + "loss": 0.6351, + "step": 15523 + }, + { + "epoch": 0.54, + "learning_rate": 8.81808431148802e-06, + "loss": 0.6581, + "step": 15524 + }, + { + "epoch": 0.54, + "learning_rate": 8.817003085777807e-06, + "loss": 0.6331, + "step": 15525 + }, + { + "epoch": 0.54, + "learning_rate": 8.81592187409351e-06, + "loss": 0.6412, + "step": 15526 + }, + { + "epoch": 0.54, + "learning_rate": 8.814840676447964e-06, + "loss": 0.5772, + "step": 15527 + }, + { + "epoch": 0.54, + "learning_rate": 8.813759492853977e-06, + "loss": 0.6578, + "step": 15528 + }, + { + "epoch": 0.54, + "learning_rate": 8.812678323324371e-06, + "loss": 0.6269, + "step": 15529 + }, + { + "epoch": 0.54, + "learning_rate": 8.811597167871968e-06, + "loss": 0.6469, + "step": 15530 + }, + { + "epoch": 0.54, + "learning_rate": 8.810516026509582e-06, + "loss": 0.6241, + "step": 15531 + }, + { + "epoch": 0.54, + "learning_rate": 8.809434899250033e-06, + "loss": 0.6124, + "step": 15532 + }, + { + "epoch": 0.54, + "learning_rate": 8.808353786106142e-06, + "loss": 0.605, + "step": 15533 + }, + { + "epoch": 0.54, + "learning_rate": 8.807272687090722e-06, + "loss": 0.6254, + "step": 15534 + }, + { + "epoch": 0.54, + "learning_rate": 8.806191602216593e-06, + "loss": 0.602, + "step": 15535 + }, + { + "epoch": 0.54, + "learning_rate": 8.805110531496575e-06, + "loss": 0.6102, + "step": 15536 + }, + { + "epoch": 0.54, + "learning_rate": 8.804029474943481e-06, + "loss": 0.6566, + "step": 15537 + }, + { + "epoch": 0.54, + "learning_rate": 8.802948432570129e-06, + "loss": 0.6274, + "step": 15538 + }, + { + "epoch": 0.54, + "learning_rate": 8.80186740438934e-06, + "loss": 0.6492, + "step": 15539 + }, + { + "epoch": 0.54, + "learning_rate": 8.800786390413929e-06, + "loss": 0.6156, + "step": 15540 + }, + { + "epoch": 0.54, + "learning_rate": 8.799705390656711e-06, + "loss": 0.6948, + "step": 15541 + }, + { + "epoch": 0.54, + "learning_rate": 8.798624405130505e-06, + "loss": 0.6209, + "step": 15542 + }, + { + "epoch": 0.54, + "learning_rate": 8.797543433848125e-06, + "loss": 0.6697, + "step": 15543 + }, + { + "epoch": 0.54, + "learning_rate": 8.796462476822389e-06, + "loss": 0.5758, + "step": 15544 + }, + { + "epoch": 0.54, + "learning_rate": 8.795381534066117e-06, + "loss": 0.7098, + "step": 15545 + }, + { + "epoch": 0.54, + "learning_rate": 8.794300605592116e-06, + "loss": 0.6235, + "step": 15546 + }, + { + "epoch": 0.54, + "learning_rate": 8.793219691413206e-06, + "loss": 0.5821, + "step": 15547 + }, + { + "epoch": 0.54, + "learning_rate": 8.792138791542207e-06, + "loss": 0.6348, + "step": 15548 + }, + { + "epoch": 0.54, + "learning_rate": 8.791057905991928e-06, + "loss": 0.67, + "step": 15549 + }, + { + "epoch": 0.54, + "learning_rate": 8.789977034775186e-06, + "loss": 0.6272, + "step": 15550 + }, + { + "epoch": 0.54, + "learning_rate": 8.7888961779048e-06, + "loss": 0.6442, + "step": 15551 + }, + { + "epoch": 0.54, + "learning_rate": 8.787815335393578e-06, + "loss": 0.6569, + "step": 15552 + }, + { + "epoch": 0.54, + "learning_rate": 8.78673450725434e-06, + "loss": 0.6676, + "step": 15553 + }, + { + "epoch": 0.54, + "learning_rate": 8.785653693499902e-06, + "loss": 0.6672, + "step": 15554 + }, + { + "epoch": 0.54, + "learning_rate": 8.784572894143072e-06, + "loss": 0.5729, + "step": 15555 + }, + { + "epoch": 0.54, + "learning_rate": 8.78349210919667e-06, + "loss": 0.6646, + "step": 15556 + }, + { + "epoch": 0.54, + "learning_rate": 8.78241133867351e-06, + "loss": 0.6473, + "step": 15557 + }, + { + "epoch": 0.54, + "learning_rate": 8.781330582586399e-06, + "loss": 0.6444, + "step": 15558 + }, + { + "epoch": 0.54, + "learning_rate": 8.780249840948157e-06, + "loss": 0.6693, + "step": 15559 + }, + { + "epoch": 0.54, + "learning_rate": 8.7791691137716e-06, + "loss": 0.6201, + "step": 15560 + }, + { + "epoch": 0.54, + "learning_rate": 8.778088401069532e-06, + "loss": 0.6117, + "step": 15561 + }, + { + "epoch": 0.54, + "learning_rate": 8.777007702854773e-06, + "loss": 0.6222, + "step": 15562 + }, + { + "epoch": 0.54, + "learning_rate": 8.775927019140138e-06, + "loss": 0.6674, + "step": 15563 + }, + { + "epoch": 0.54, + "learning_rate": 8.774846349938433e-06, + "loss": 0.5967, + "step": 15564 + }, + { + "epoch": 0.54, + "learning_rate": 8.773765695262476e-06, + "loss": 0.6043, + "step": 15565 + }, + { + "epoch": 0.54, + "learning_rate": 8.77268505512508e-06, + "loss": 0.6439, + "step": 15566 + }, + { + "epoch": 0.54, + "learning_rate": 8.771604429539052e-06, + "loss": 0.611, + "step": 15567 + }, + { + "epoch": 0.54, + "learning_rate": 8.770523818517208e-06, + "loss": 0.5959, + "step": 15568 + }, + { + "epoch": 0.54, + "learning_rate": 8.769443222072361e-06, + "loss": 0.6297, + "step": 15569 + }, + { + "epoch": 0.54, + "learning_rate": 8.768362640217319e-06, + "loss": 0.6458, + "step": 15570 + }, + { + "epoch": 0.54, + "learning_rate": 8.767282072964896e-06, + "loss": 0.6917, + "step": 15571 + }, + { + "epoch": 0.54, + "learning_rate": 8.766201520327906e-06, + "loss": 0.6541, + "step": 15572 + }, + { + "epoch": 0.54, + "learning_rate": 8.765120982319155e-06, + "loss": 0.6698, + "step": 15573 + }, + { + "epoch": 0.54, + "learning_rate": 8.764040458951459e-06, + "loss": 0.6149, + "step": 15574 + }, + { + "epoch": 0.54, + "learning_rate": 8.762959950237627e-06, + "loss": 0.6609, + "step": 15575 + }, + { + "epoch": 0.54, + "learning_rate": 8.761879456190469e-06, + "loss": 0.6502, + "step": 15576 + }, + { + "epoch": 0.54, + "learning_rate": 8.760798976822795e-06, + "loss": 0.6498, + "step": 15577 + }, + { + "epoch": 0.54, + "learning_rate": 8.759718512147419e-06, + "loss": 0.6356, + "step": 15578 + }, + { + "epoch": 0.54, + "learning_rate": 8.758638062177146e-06, + "loss": 0.5795, + "step": 15579 + }, + { + "epoch": 0.54, + "learning_rate": 8.757557626924791e-06, + "loss": 0.6373, + "step": 15580 + }, + { + "epoch": 0.54, + "learning_rate": 8.756477206403163e-06, + "loss": 0.5713, + "step": 15581 + }, + { + "epoch": 0.54, + "learning_rate": 8.755396800625069e-06, + "loss": 0.5928, + "step": 15582 + }, + { + "epoch": 0.54, + "learning_rate": 8.75431640960332e-06, + "loss": 0.6188, + "step": 15583 + }, + { + "epoch": 0.54, + "learning_rate": 8.753236033350728e-06, + "loss": 0.5659, + "step": 15584 + }, + { + "epoch": 0.54, + "learning_rate": 8.752155671880097e-06, + "loss": 0.668, + "step": 15585 + }, + { + "epoch": 0.54, + "learning_rate": 8.751075325204241e-06, + "loss": 0.537, + "step": 15586 + }, + { + "epoch": 0.54, + "learning_rate": 8.749994993335969e-06, + "loss": 0.6796, + "step": 15587 + }, + { + "epoch": 0.54, + "learning_rate": 8.748914676288083e-06, + "loss": 0.6361, + "step": 15588 + }, + { + "epoch": 0.54, + "learning_rate": 8.747834374073401e-06, + "loss": 0.6252, + "step": 15589 + }, + { + "epoch": 0.54, + "learning_rate": 8.746754086704723e-06, + "loss": 0.6413, + "step": 15590 + }, + { + "epoch": 0.54, + "learning_rate": 8.74567381419486e-06, + "loss": 0.6617, + "step": 15591 + }, + { + "epoch": 0.54, + "learning_rate": 8.744593556556623e-06, + "loss": 0.6401, + "step": 15592 + }, + { + "epoch": 0.54, + "learning_rate": 8.743513313802818e-06, + "loss": 0.6155, + "step": 15593 + }, + { + "epoch": 0.54, + "learning_rate": 8.74243308594625e-06, + "loss": 0.6601, + "step": 15594 + }, + { + "epoch": 0.54, + "learning_rate": 8.74135287299973e-06, + "loss": 0.6114, + "step": 15595 + }, + { + "epoch": 0.54, + "learning_rate": 8.740272674976063e-06, + "loss": 0.6516, + "step": 15596 + }, + { + "epoch": 0.54, + "learning_rate": 8.739192491888056e-06, + "loss": 0.6603, + "step": 15597 + }, + { + "epoch": 0.54, + "learning_rate": 8.73811232374852e-06, + "loss": 0.639, + "step": 15598 + }, + { + "epoch": 0.54, + "learning_rate": 8.737032170570257e-06, + "loss": 0.6427, + "step": 15599 + }, + { + "epoch": 0.54, + "learning_rate": 8.735952032366074e-06, + "loss": 0.6691, + "step": 15600 + }, + { + "epoch": 0.54, + "learning_rate": 8.734871909148781e-06, + "loss": 0.6238, + "step": 15601 + }, + { + "epoch": 0.54, + "learning_rate": 8.73379180093118e-06, + "loss": 0.6004, + "step": 15602 + }, + { + "epoch": 0.54, + "learning_rate": 8.732711707726079e-06, + "loss": 0.6707, + "step": 15603 + }, + { + "epoch": 0.54, + "learning_rate": 8.731631629546287e-06, + "loss": 0.6348, + "step": 15604 + }, + { + "epoch": 0.54, + "learning_rate": 8.730551566404603e-06, + "loss": 0.6652, + "step": 15605 + }, + { + "epoch": 0.54, + "learning_rate": 8.729471518313835e-06, + "loss": 0.6212, + "step": 15606 + }, + { + "epoch": 0.54, + "learning_rate": 8.728391485286793e-06, + "loss": 0.6028, + "step": 15607 + }, + { + "epoch": 0.54, + "learning_rate": 8.727311467336277e-06, + "loss": 0.6347, + "step": 15608 + }, + { + "epoch": 0.54, + "learning_rate": 8.726231464475093e-06, + "loss": 0.6248, + "step": 15609 + }, + { + "epoch": 0.54, + "learning_rate": 8.725151476716048e-06, + "loss": 0.6426, + "step": 15610 + }, + { + "epoch": 0.54, + "learning_rate": 8.724071504071944e-06, + "loss": 0.645, + "step": 15611 + }, + { + "epoch": 0.54, + "learning_rate": 8.722991546555586e-06, + "loss": 0.6255, + "step": 15612 + }, + { + "epoch": 0.54, + "learning_rate": 8.72191160417978e-06, + "loss": 0.6277, + "step": 15613 + }, + { + "epoch": 0.54, + "learning_rate": 8.720831676957327e-06, + "loss": 0.6209, + "step": 15614 + }, + { + "epoch": 0.54, + "learning_rate": 8.719751764901033e-06, + "loss": 0.6597, + "step": 15615 + }, + { + "epoch": 0.54, + "learning_rate": 8.718671868023702e-06, + "loss": 0.6283, + "step": 15616 + }, + { + "epoch": 0.54, + "learning_rate": 8.717591986338137e-06, + "loss": 0.6005, + "step": 15617 + }, + { + "epoch": 0.54, + "learning_rate": 8.716512119857139e-06, + "loss": 0.6283, + "step": 15618 + }, + { + "epoch": 0.54, + "learning_rate": 8.715432268593516e-06, + "loss": 0.6166, + "step": 15619 + }, + { + "epoch": 0.54, + "learning_rate": 8.714352432560068e-06, + "loss": 0.6054, + "step": 15620 + }, + { + "epoch": 0.54, + "learning_rate": 8.713272611769597e-06, + "loss": 0.6574, + "step": 15621 + }, + { + "epoch": 0.54, + "learning_rate": 8.71219280623491e-06, + "loss": 0.6767, + "step": 15622 + }, + { + "epoch": 0.54, + "learning_rate": 8.711113015968801e-06, + "loss": 0.644, + "step": 15623 + }, + { + "epoch": 0.54, + "learning_rate": 8.710033240984082e-06, + "loss": 0.5871, + "step": 15624 + }, + { + "epoch": 0.54, + "learning_rate": 8.70895348129355e-06, + "loss": 0.6122, + "step": 15625 + }, + { + "epoch": 0.54, + "learning_rate": 8.707873736910007e-06, + "loss": 0.6601, + "step": 15626 + }, + { + "epoch": 0.54, + "learning_rate": 8.706794007846254e-06, + "loss": 0.6234, + "step": 15627 + }, + { + "epoch": 0.54, + "learning_rate": 8.705714294115098e-06, + "loss": 0.641, + "step": 15628 + }, + { + "epoch": 0.54, + "learning_rate": 8.704634595729333e-06, + "loss": 0.641, + "step": 15629 + }, + { + "epoch": 0.54, + "learning_rate": 8.703554912701763e-06, + "loss": 0.6203, + "step": 15630 + }, + { + "epoch": 0.54, + "learning_rate": 8.702475245045192e-06, + "loss": 0.6256, + "step": 15631 + }, + { + "epoch": 0.54, + "learning_rate": 8.701395592772417e-06, + "loss": 0.6474, + "step": 15632 + }, + { + "epoch": 0.54, + "learning_rate": 8.700315955896239e-06, + "loss": 0.6457, + "step": 15633 + }, + { + "epoch": 0.54, + "learning_rate": 8.699236334429463e-06, + "loss": 0.6453, + "step": 15634 + }, + { + "epoch": 0.54, + "learning_rate": 8.698156728384882e-06, + "loss": 0.6573, + "step": 15635 + }, + { + "epoch": 0.54, + "learning_rate": 8.6970771377753e-06, + "loss": 0.6261, + "step": 15636 + }, + { + "epoch": 0.54, + "learning_rate": 8.69599756261352e-06, + "loss": 0.5837, + "step": 15637 + }, + { + "epoch": 0.54, + "learning_rate": 8.694918002912336e-06, + "loss": 0.6068, + "step": 15638 + }, + { + "epoch": 0.54, + "learning_rate": 8.69383845868455e-06, + "loss": 0.6792, + "step": 15639 + }, + { + "epoch": 0.54, + "learning_rate": 8.692758929942964e-06, + "loss": 0.602, + "step": 15640 + }, + { + "epoch": 0.54, + "learning_rate": 8.691679416700372e-06, + "loss": 0.6159, + "step": 15641 + }, + { + "epoch": 0.54, + "learning_rate": 8.690599918969575e-06, + "loss": 0.642, + "step": 15642 + }, + { + "epoch": 0.54, + "learning_rate": 8.689520436763374e-06, + "loss": 0.6154, + "step": 15643 + }, + { + "epoch": 0.54, + "learning_rate": 8.688440970094565e-06, + "loss": 0.5988, + "step": 15644 + }, + { + "epoch": 0.54, + "learning_rate": 8.687361518975946e-06, + "loss": 0.6663, + "step": 15645 + }, + { + "epoch": 0.54, + "learning_rate": 8.68628208342032e-06, + "loss": 0.6037, + "step": 15646 + }, + { + "epoch": 0.54, + "learning_rate": 8.68520266344048e-06, + "loss": 0.6091, + "step": 15647 + }, + { + "epoch": 0.54, + "learning_rate": 8.684123259049225e-06, + "loss": 0.6516, + "step": 15648 + }, + { + "epoch": 0.54, + "learning_rate": 8.683043870259355e-06, + "loss": 0.6017, + "step": 15649 + }, + { + "epoch": 0.54, + "learning_rate": 8.681964497083664e-06, + "loss": 0.6163, + "step": 15650 + }, + { + "epoch": 0.54, + "learning_rate": 8.680885139534955e-06, + "loss": 0.6484, + "step": 15651 + }, + { + "epoch": 0.54, + "learning_rate": 8.679805797626017e-06, + "loss": 0.6376, + "step": 15652 + }, + { + "epoch": 0.54, + "learning_rate": 8.678726471369652e-06, + "loss": 0.6579, + "step": 15653 + }, + { + "epoch": 0.54, + "learning_rate": 8.677647160778661e-06, + "loss": 0.6515, + "step": 15654 + }, + { + "epoch": 0.54, + "learning_rate": 8.67656786586583e-06, + "loss": 0.6063, + "step": 15655 + }, + { + "epoch": 0.54, + "learning_rate": 8.675488586643961e-06, + "loss": 0.6476, + "step": 15656 + }, + { + "epoch": 0.54, + "learning_rate": 8.674409323125857e-06, + "loss": 0.6503, + "step": 15657 + }, + { + "epoch": 0.54, + "learning_rate": 8.6733300753243e-06, + "loss": 0.6663, + "step": 15658 + }, + { + "epoch": 0.54, + "learning_rate": 8.672250843252095e-06, + "loss": 0.6344, + "step": 15659 + }, + { + "epoch": 0.54, + "learning_rate": 8.671171626922039e-06, + "loss": 0.6377, + "step": 15660 + }, + { + "epoch": 0.54, + "learning_rate": 8.670092426346919e-06, + "loss": 0.6213, + "step": 15661 + }, + { + "epoch": 0.54, + "learning_rate": 8.669013241539538e-06, + "loss": 0.5963, + "step": 15662 + }, + { + "epoch": 0.54, + "learning_rate": 8.667934072512693e-06, + "loss": 0.6286, + "step": 15663 + }, + { + "epoch": 0.54, + "learning_rate": 8.666854919279168e-06, + "loss": 0.5959, + "step": 15664 + }, + { + "epoch": 0.54, + "learning_rate": 8.665775781851766e-06, + "loss": 0.5732, + "step": 15665 + }, + { + "epoch": 0.54, + "learning_rate": 8.664696660243286e-06, + "loss": 0.6336, + "step": 15666 + }, + { + "epoch": 0.54, + "learning_rate": 8.663617554466508e-06, + "loss": 0.638, + "step": 15667 + }, + { + "epoch": 0.54, + "learning_rate": 8.662538464534237e-06, + "loss": 0.6072, + "step": 15668 + }, + { + "epoch": 0.54, + "learning_rate": 8.66145939045927e-06, + "loss": 0.6638, + "step": 15669 + }, + { + "epoch": 0.54, + "learning_rate": 8.660380332254387e-06, + "loss": 0.5753, + "step": 15670 + }, + { + "epoch": 0.54, + "learning_rate": 8.659301289932393e-06, + "loss": 0.6247, + "step": 15671 + }, + { + "epoch": 0.54, + "learning_rate": 8.658222263506081e-06, + "loss": 0.6027, + "step": 15672 + }, + { + "epoch": 0.54, + "learning_rate": 8.657143252988236e-06, + "loss": 0.6444, + "step": 15673 + }, + { + "epoch": 0.54, + "learning_rate": 8.65606425839166e-06, + "loss": 0.5666, + "step": 15674 + }, + { + "epoch": 0.54, + "learning_rate": 8.654985279729144e-06, + "loss": 0.6273, + "step": 15675 + }, + { + "epoch": 0.54, + "learning_rate": 8.653906317013475e-06, + "loss": 0.6246, + "step": 15676 + }, + { + "epoch": 0.54, + "learning_rate": 8.65282737025745e-06, + "loss": 0.6605, + "step": 15677 + }, + { + "epoch": 0.54, + "learning_rate": 8.651748439473865e-06, + "loss": 0.6256, + "step": 15678 + }, + { + "epoch": 0.54, + "learning_rate": 8.650669524675501e-06, + "loss": 0.6191, + "step": 15679 + }, + { + "epoch": 0.54, + "learning_rate": 8.649590625875159e-06, + "loss": 0.5964, + "step": 15680 + }, + { + "epoch": 0.54, + "learning_rate": 8.648511743085635e-06, + "loss": 0.634, + "step": 15681 + }, + { + "epoch": 0.54, + "learning_rate": 8.647432876319705e-06, + "loss": 0.6548, + "step": 15682 + }, + { + "epoch": 0.54, + "learning_rate": 8.646354025590173e-06, + "loss": 0.5876, + "step": 15683 + }, + { + "epoch": 0.54, + "learning_rate": 8.645275190909829e-06, + "loss": 0.6172, + "step": 15684 + }, + { + "epoch": 0.54, + "learning_rate": 8.644196372291455e-06, + "loss": 0.6657, + "step": 15685 + }, + { + "epoch": 0.54, + "learning_rate": 8.643117569747852e-06, + "loss": 0.6644, + "step": 15686 + }, + { + "epoch": 0.54, + "learning_rate": 8.642038783291809e-06, + "loss": 0.6204, + "step": 15687 + }, + { + "epoch": 0.54, + "learning_rate": 8.640960012936109e-06, + "loss": 0.673, + "step": 15688 + }, + { + "epoch": 0.54, + "learning_rate": 8.639881258693549e-06, + "loss": 0.6547, + "step": 15689 + }, + { + "epoch": 0.54, + "learning_rate": 8.638802520576922e-06, + "loss": 0.6377, + "step": 15690 + }, + { + "epoch": 0.54, + "learning_rate": 8.637723798599005e-06, + "loss": 0.6608, + "step": 15691 + }, + { + "epoch": 0.54, + "learning_rate": 8.6366450927726e-06, + "loss": 0.5818, + "step": 15692 + }, + { + "epoch": 0.54, + "learning_rate": 8.635566403110494e-06, + "loss": 0.6213, + "step": 15693 + }, + { + "epoch": 0.54, + "learning_rate": 8.634487729625471e-06, + "loss": 0.6766, + "step": 15694 + }, + { + "epoch": 0.54, + "learning_rate": 8.633409072330323e-06, + "loss": 0.6245, + "step": 15695 + }, + { + "epoch": 0.54, + "learning_rate": 8.632330431237844e-06, + "loss": 0.6588, + "step": 15696 + }, + { + "epoch": 0.54, + "learning_rate": 8.631251806360811e-06, + "loss": 0.6711, + "step": 15697 + }, + { + "epoch": 0.54, + "learning_rate": 8.630173197712022e-06, + "loss": 0.6036, + "step": 15698 + }, + { + "epoch": 0.54, + "learning_rate": 8.629094605304266e-06, + "loss": 0.6432, + "step": 15699 + }, + { + "epoch": 0.54, + "learning_rate": 8.628016029150324e-06, + "loss": 0.6396, + "step": 15700 + }, + { + "epoch": 0.54, + "learning_rate": 8.626937469262987e-06, + "loss": 0.6006, + "step": 15701 + }, + { + "epoch": 0.54, + "learning_rate": 8.625858925655049e-06, + "loss": 0.6151, + "step": 15702 + }, + { + "epoch": 0.54, + "learning_rate": 8.624780398339284e-06, + "loss": 0.6058, + "step": 15703 + }, + { + "epoch": 0.54, + "learning_rate": 8.62370188732849e-06, + "loss": 0.6721, + "step": 15704 + }, + { + "epoch": 0.54, + "learning_rate": 8.622623392635456e-06, + "loss": 0.6449, + "step": 15705 + }, + { + "epoch": 0.54, + "learning_rate": 8.621544914272956e-06, + "loss": 0.7221, + "step": 15706 + }, + { + "epoch": 0.54, + "learning_rate": 8.620466452253788e-06, + "loss": 0.6216, + "step": 15707 + }, + { + "epoch": 0.54, + "learning_rate": 8.61938800659074e-06, + "loss": 0.625, + "step": 15708 + }, + { + "epoch": 0.54, + "learning_rate": 8.618309577296586e-06, + "loss": 0.6085, + "step": 15709 + }, + { + "epoch": 0.54, + "learning_rate": 8.617231164384122e-06, + "loss": 0.6431, + "step": 15710 + }, + { + "epoch": 0.54, + "learning_rate": 8.616152767866137e-06, + "loss": 0.5791, + "step": 15711 + }, + { + "epoch": 0.54, + "learning_rate": 8.615074387755404e-06, + "loss": 0.6237, + "step": 15712 + }, + { + "epoch": 0.54, + "learning_rate": 8.613996024064724e-06, + "loss": 0.6466, + "step": 15713 + }, + { + "epoch": 0.54, + "learning_rate": 8.612917676806869e-06, + "loss": 0.5954, + "step": 15714 + }, + { + "epoch": 0.54, + "learning_rate": 8.611839345994629e-06, + "loss": 0.6751, + "step": 15715 + }, + { + "epoch": 0.54, + "learning_rate": 8.610761031640794e-06, + "loss": 0.6463, + "step": 15716 + }, + { + "epoch": 0.54, + "learning_rate": 8.609682733758141e-06, + "loss": 0.6346, + "step": 15717 + }, + { + "epoch": 0.54, + "learning_rate": 8.608604452359455e-06, + "loss": 0.6062, + "step": 15718 + }, + { + "epoch": 0.54, + "learning_rate": 8.60752618745753e-06, + "loss": 0.6283, + "step": 15719 + }, + { + "epoch": 0.54, + "learning_rate": 8.606447939065142e-06, + "loss": 0.5451, + "step": 15720 + }, + { + "epoch": 0.54, + "learning_rate": 8.605369707195071e-06, + "loss": 0.6871, + "step": 15721 + }, + { + "epoch": 0.54, + "learning_rate": 8.604291491860113e-06, + "loss": 0.643, + "step": 15722 + }, + { + "epoch": 0.54, + "learning_rate": 8.603213293073042e-06, + "loss": 0.6363, + "step": 15723 + }, + { + "epoch": 0.54, + "learning_rate": 8.602135110846642e-06, + "loss": 0.6239, + "step": 15724 + }, + { + "epoch": 0.54, + "learning_rate": 8.601056945193706e-06, + "loss": 0.6266, + "step": 15725 + }, + { + "epoch": 0.54, + "learning_rate": 8.599978796127003e-06, + "loss": 0.664, + "step": 15726 + }, + { + "epoch": 0.54, + "learning_rate": 8.598900663659321e-06, + "loss": 0.6396, + "step": 15727 + }, + { + "epoch": 0.54, + "learning_rate": 8.597822547803452e-06, + "loss": 0.6182, + "step": 15728 + }, + { + "epoch": 0.54, + "learning_rate": 8.596744448572164e-06, + "loss": 0.6661, + "step": 15729 + }, + { + "epoch": 0.55, + "learning_rate": 8.595666365978244e-06, + "loss": 0.6473, + "step": 15730 + }, + { + "epoch": 0.55, + "learning_rate": 8.594588300034484e-06, + "loss": 0.6596, + "step": 15731 + }, + { + "epoch": 0.55, + "learning_rate": 8.593510250753652e-06, + "loss": 0.5922, + "step": 15732 + }, + { + "epoch": 0.55, + "learning_rate": 8.592432218148531e-06, + "loss": 0.5765, + "step": 15733 + }, + { + "epoch": 0.55, + "learning_rate": 8.591354202231916e-06, + "loss": 0.6367, + "step": 15734 + }, + { + "epoch": 0.55, + "learning_rate": 8.590276203016575e-06, + "loss": 0.6733, + "step": 15735 + }, + { + "epoch": 0.55, + "learning_rate": 8.589198220515289e-06, + "loss": 0.6588, + "step": 15736 + }, + { + "epoch": 0.55, + "learning_rate": 8.588120254740849e-06, + "loss": 0.6834, + "step": 15737 + }, + { + "epoch": 0.55, + "learning_rate": 8.587042305706026e-06, + "loss": 0.625, + "step": 15738 + }, + { + "epoch": 0.55, + "learning_rate": 8.585964373423601e-06, + "loss": 0.6367, + "step": 15739 + }, + { + "epoch": 0.55, + "learning_rate": 8.584886457906365e-06, + "loss": 0.6979, + "step": 15740 + }, + { + "epoch": 0.55, + "learning_rate": 8.583808559167085e-06, + "loss": 0.5661, + "step": 15741 + }, + { + "epoch": 0.55, + "learning_rate": 8.582730677218544e-06, + "loss": 0.6691, + "step": 15742 + }, + { + "epoch": 0.55, + "learning_rate": 8.581652812073529e-06, + "loss": 0.6268, + "step": 15743 + }, + { + "epoch": 0.55, + "learning_rate": 8.580574963744812e-06, + "loss": 0.6453, + "step": 15744 + }, + { + "epoch": 0.55, + "learning_rate": 8.57949713224517e-06, + "loss": 0.5716, + "step": 15745 + }, + { + "epoch": 0.55, + "learning_rate": 8.578419317587395e-06, + "loss": 0.6082, + "step": 15746 + }, + { + "epoch": 0.55, + "learning_rate": 8.577341519784252e-06, + "loss": 0.6472, + "step": 15747 + }, + { + "epoch": 0.55, + "learning_rate": 8.576263738848522e-06, + "loss": 0.6141, + "step": 15748 + }, + { + "epoch": 0.55, + "learning_rate": 8.575185974792993e-06, + "loss": 0.6638, + "step": 15749 + }, + { + "epoch": 0.55, + "learning_rate": 8.574108227630433e-06, + "loss": 0.5777, + "step": 15750 + }, + { + "epoch": 0.55, + "learning_rate": 8.573030497373623e-06, + "loss": 0.6617, + "step": 15751 + }, + { + "epoch": 0.55, + "learning_rate": 8.571952784035345e-06, + "loss": 0.6612, + "step": 15752 + }, + { + "epoch": 0.55, + "learning_rate": 8.57087508762837e-06, + "loss": 0.6321, + "step": 15753 + }, + { + "epoch": 0.55, + "learning_rate": 8.569797408165478e-06, + "loss": 0.6374, + "step": 15754 + }, + { + "epoch": 0.55, + "learning_rate": 8.568719745659451e-06, + "loss": 0.6129, + "step": 15755 + }, + { + "epoch": 0.55, + "learning_rate": 8.567642100123061e-06, + "loss": 0.561, + "step": 15756 + }, + { + "epoch": 0.55, + "learning_rate": 8.566564471569081e-06, + "loss": 0.6191, + "step": 15757 + }, + { + "epoch": 0.55, + "learning_rate": 8.5654868600103e-06, + "loss": 0.6621, + "step": 15758 + }, + { + "epoch": 0.55, + "learning_rate": 8.564409265459482e-06, + "loss": 0.6083, + "step": 15759 + }, + { + "epoch": 0.55, + "learning_rate": 8.563331687929405e-06, + "loss": 0.6476, + "step": 15760 + }, + { + "epoch": 0.55, + "learning_rate": 8.562254127432858e-06, + "loss": 0.6526, + "step": 15761 + }, + { + "epoch": 0.55, + "learning_rate": 8.5611765839826e-06, + "loss": 0.6219, + "step": 15762 + }, + { + "epoch": 0.55, + "learning_rate": 8.560099057591414e-06, + "loss": 0.6449, + "step": 15763 + }, + { + "epoch": 0.55, + "learning_rate": 8.55902154827208e-06, + "loss": 0.6518, + "step": 15764 + }, + { + "epoch": 0.55, + "learning_rate": 8.557944056037362e-06, + "loss": 0.577, + "step": 15765 + }, + { + "epoch": 0.55, + "learning_rate": 8.556866580900043e-06, + "loss": 0.6697, + "step": 15766 + }, + { + "epoch": 0.55, + "learning_rate": 8.5557891228729e-06, + "loss": 0.6264, + "step": 15767 + }, + { + "epoch": 0.55, + "learning_rate": 8.5547116819687e-06, + "loss": 0.6008, + "step": 15768 + }, + { + "epoch": 0.55, + "learning_rate": 8.55363425820022e-06, + "loss": 0.6045, + "step": 15769 + }, + { + "epoch": 0.55, + "learning_rate": 8.552556851580243e-06, + "loss": 0.6219, + "step": 15770 + }, + { + "epoch": 0.55, + "learning_rate": 8.55147946212153e-06, + "loss": 0.6259, + "step": 15771 + }, + { + "epoch": 0.55, + "learning_rate": 8.550402089836857e-06, + "loss": 0.6619, + "step": 15772 + }, + { + "epoch": 0.55, + "learning_rate": 8.549324734739011e-06, + "loss": 0.653, + "step": 15773 + }, + { + "epoch": 0.55, + "learning_rate": 8.548247396840747e-06, + "loss": 0.6315, + "step": 15774 + }, + { + "epoch": 0.55, + "learning_rate": 8.547170076154852e-06, + "loss": 0.6329, + "step": 15775 + }, + { + "epoch": 0.55, + "learning_rate": 8.54609277269409e-06, + "loss": 0.6899, + "step": 15776 + }, + { + "epoch": 0.55, + "learning_rate": 8.545015486471238e-06, + "loss": 0.6467, + "step": 15777 + }, + { + "epoch": 0.55, + "learning_rate": 8.543938217499069e-06, + "loss": 0.6104, + "step": 15778 + }, + { + "epoch": 0.55, + "learning_rate": 8.542860965790351e-06, + "loss": 0.671, + "step": 15779 + }, + { + "epoch": 0.55, + "learning_rate": 8.541783731357863e-06, + "loss": 0.6216, + "step": 15780 + }, + { + "epoch": 0.55, + "learning_rate": 8.540706514214374e-06, + "loss": 0.627, + "step": 15781 + }, + { + "epoch": 0.55, + "learning_rate": 8.539629314372653e-06, + "loss": 0.622, + "step": 15782 + }, + { + "epoch": 0.55, + "learning_rate": 8.538552131845473e-06, + "loss": 0.6355, + "step": 15783 + }, + { + "epoch": 0.55, + "learning_rate": 8.537474966645609e-06, + "loss": 0.6662, + "step": 15784 + }, + { + "epoch": 0.55, + "learning_rate": 8.536397818785829e-06, + "loss": 0.6795, + "step": 15785 + }, + { + "epoch": 0.55, + "learning_rate": 8.535320688278902e-06, + "loss": 0.6578, + "step": 15786 + }, + { + "epoch": 0.55, + "learning_rate": 8.534243575137604e-06, + "loss": 0.6532, + "step": 15787 + }, + { + "epoch": 0.55, + "learning_rate": 8.5331664793747e-06, + "loss": 0.6729, + "step": 15788 + }, + { + "epoch": 0.55, + "learning_rate": 8.532089401002964e-06, + "loss": 0.6336, + "step": 15789 + }, + { + "epoch": 0.55, + "learning_rate": 8.531012340035166e-06, + "loss": 0.6393, + "step": 15790 + }, + { + "epoch": 0.55, + "learning_rate": 8.529935296484075e-06, + "loss": 0.5994, + "step": 15791 + }, + { + "epoch": 0.55, + "learning_rate": 8.528858270362458e-06, + "loss": 0.6631, + "step": 15792 + }, + { + "epoch": 0.55, + "learning_rate": 8.527781261683092e-06, + "loss": 0.6126, + "step": 15793 + }, + { + "epoch": 0.55, + "learning_rate": 8.526704270458737e-06, + "loss": 0.6838, + "step": 15794 + }, + { + "epoch": 0.55, + "learning_rate": 8.525627296702168e-06, + "loss": 0.6731, + "step": 15795 + }, + { + "epoch": 0.55, + "learning_rate": 8.524550340426154e-06, + "loss": 0.6304, + "step": 15796 + }, + { + "epoch": 0.55, + "learning_rate": 8.523473401643459e-06, + "loss": 0.5694, + "step": 15797 + }, + { + "epoch": 0.55, + "learning_rate": 8.522396480366857e-06, + "loss": 0.6113, + "step": 15798 + }, + { + "epoch": 0.55, + "learning_rate": 8.521319576609115e-06, + "loss": 0.6927, + "step": 15799 + }, + { + "epoch": 0.55, + "learning_rate": 8.520242690382998e-06, + "loss": 0.6473, + "step": 15800 + }, + { + "epoch": 0.55, + "learning_rate": 8.519165821701274e-06, + "loss": 0.6611, + "step": 15801 + }, + { + "epoch": 0.55, + "learning_rate": 8.518088970576717e-06, + "loss": 0.6794, + "step": 15802 + }, + { + "epoch": 0.55, + "learning_rate": 8.517012137022087e-06, + "loss": 0.6254, + "step": 15803 + }, + { + "epoch": 0.55, + "learning_rate": 8.515935321050154e-06, + "loss": 0.6101, + "step": 15804 + }, + { + "epoch": 0.55, + "learning_rate": 8.514858522673686e-06, + "loss": 0.612, + "step": 15805 + }, + { + "epoch": 0.55, + "learning_rate": 8.51378174190545e-06, + "loss": 0.6594, + "step": 15806 + }, + { + "epoch": 0.55, + "learning_rate": 8.512704978758209e-06, + "loss": 0.5907, + "step": 15807 + }, + { + "epoch": 0.55, + "learning_rate": 8.511628233244733e-06, + "loss": 0.6827, + "step": 15808 + }, + { + "epoch": 0.55, + "learning_rate": 8.510551505377787e-06, + "loss": 0.6486, + "step": 15809 + }, + { + "epoch": 0.55, + "learning_rate": 8.509474795170136e-06, + "loss": 0.5388, + "step": 15810 + }, + { + "epoch": 0.55, + "learning_rate": 8.508398102634551e-06, + "loss": 0.6365, + "step": 15811 + }, + { + "epoch": 0.55, + "learning_rate": 8.50732142778379e-06, + "loss": 0.6526, + "step": 15812 + }, + { + "epoch": 0.55, + "learning_rate": 8.50624477063062e-06, + "loss": 0.63, + "step": 15813 + }, + { + "epoch": 0.55, + "learning_rate": 8.505168131187813e-06, + "loss": 0.6436, + "step": 15814 + }, + { + "epoch": 0.55, + "learning_rate": 8.504091509468125e-06, + "loss": 0.6645, + "step": 15815 + }, + { + "epoch": 0.55, + "learning_rate": 8.503014905484324e-06, + "loss": 0.5861, + "step": 15816 + }, + { + "epoch": 0.55, + "learning_rate": 8.501938319249177e-06, + "loss": 0.6387, + "step": 15817 + }, + { + "epoch": 0.55, + "learning_rate": 8.500861750775446e-06, + "loss": 0.6538, + "step": 15818 + }, + { + "epoch": 0.55, + "learning_rate": 8.499785200075894e-06, + "loss": 0.5885, + "step": 15819 + }, + { + "epoch": 0.55, + "learning_rate": 8.498708667163289e-06, + "loss": 0.6387, + "step": 15820 + }, + { + "epoch": 0.55, + "learning_rate": 8.497632152050389e-06, + "loss": 0.6498, + "step": 15821 + }, + { + "epoch": 0.55, + "learning_rate": 8.49655565474996e-06, + "loss": 0.6868, + "step": 15822 + }, + { + "epoch": 0.55, + "learning_rate": 8.495479175274769e-06, + "loss": 0.64, + "step": 15823 + }, + { + "epoch": 0.55, + "learning_rate": 8.494402713637572e-06, + "loss": 0.6602, + "step": 15824 + }, + { + "epoch": 0.55, + "learning_rate": 8.493326269851138e-06, + "loss": 0.6231, + "step": 15825 + }, + { + "epoch": 0.55, + "learning_rate": 8.492249843928228e-06, + "loss": 0.7122, + "step": 15826 + }, + { + "epoch": 0.55, + "learning_rate": 8.4911734358816e-06, + "loss": 0.6656, + "step": 15827 + }, + { + "epoch": 0.55, + "learning_rate": 8.490097045724021e-06, + "loss": 0.6266, + "step": 15828 + }, + { + "epoch": 0.55, + "learning_rate": 8.489020673468252e-06, + "loss": 0.587, + "step": 15829 + }, + { + "epoch": 0.55, + "learning_rate": 8.487944319127053e-06, + "loss": 0.6208, + "step": 15830 + }, + { + "epoch": 0.55, + "learning_rate": 8.486867982713187e-06, + "loss": 0.591, + "step": 15831 + }, + { + "epoch": 0.55, + "learning_rate": 8.485791664239418e-06, + "loss": 0.6869, + "step": 15832 + }, + { + "epoch": 0.55, + "learning_rate": 8.484715363718502e-06, + "loss": 0.6482, + "step": 15833 + }, + { + "epoch": 0.55, + "learning_rate": 8.483639081163201e-06, + "loss": 0.6031, + "step": 15834 + }, + { + "epoch": 0.55, + "learning_rate": 8.48256281658628e-06, + "loss": 0.677, + "step": 15835 + }, + { + "epoch": 0.55, + "learning_rate": 8.481486570000495e-06, + "loss": 0.6722, + "step": 15836 + }, + { + "epoch": 0.55, + "learning_rate": 8.480410341418608e-06, + "loss": 0.6004, + "step": 15837 + }, + { + "epoch": 0.55, + "learning_rate": 8.479334130853378e-06, + "loss": 0.6116, + "step": 15838 + }, + { + "epoch": 0.55, + "learning_rate": 8.478257938317565e-06, + "loss": 0.6488, + "step": 15839 + }, + { + "epoch": 0.55, + "learning_rate": 8.477181763823931e-06, + "loss": 0.6708, + "step": 15840 + }, + { + "epoch": 0.55, + "learning_rate": 8.476105607385233e-06, + "loss": 0.5877, + "step": 15841 + }, + { + "epoch": 0.55, + "learning_rate": 8.475029469014229e-06, + "loss": 0.6267, + "step": 15842 + }, + { + "epoch": 0.55, + "learning_rate": 8.473953348723682e-06, + "loss": 0.639, + "step": 15843 + }, + { + "epoch": 0.55, + "learning_rate": 8.472877246526346e-06, + "loss": 0.6632, + "step": 15844 + }, + { + "epoch": 0.55, + "learning_rate": 8.471801162434983e-06, + "loss": 0.6795, + "step": 15845 + }, + { + "epoch": 0.55, + "learning_rate": 8.470725096462352e-06, + "loss": 0.6667, + "step": 15846 + }, + { + "epoch": 0.55, + "learning_rate": 8.469649048621207e-06, + "loss": 0.6775, + "step": 15847 + }, + { + "epoch": 0.55, + "learning_rate": 8.46857301892431e-06, + "loss": 0.6389, + "step": 15848 + }, + { + "epoch": 0.55, + "learning_rate": 8.467497007384418e-06, + "loss": 0.6527, + "step": 15849 + }, + { + "epoch": 0.55, + "learning_rate": 8.466421014014285e-06, + "loss": 0.6187, + "step": 15850 + }, + { + "epoch": 0.55, + "learning_rate": 8.465345038826674e-06, + "loss": 0.6733, + "step": 15851 + }, + { + "epoch": 0.55, + "learning_rate": 8.464269081834338e-06, + "loss": 0.616, + "step": 15852 + }, + { + "epoch": 0.55, + "learning_rate": 8.463193143050032e-06, + "loss": 0.6146, + "step": 15853 + }, + { + "epoch": 0.55, + "learning_rate": 8.462117222486519e-06, + "loss": 0.6763, + "step": 15854 + }, + { + "epoch": 0.55, + "learning_rate": 8.46104132015655e-06, + "loss": 0.6907, + "step": 15855 + }, + { + "epoch": 0.55, + "learning_rate": 8.459965436072883e-06, + "loss": 0.6599, + "step": 15856 + }, + { + "epoch": 0.55, + "learning_rate": 8.458889570248273e-06, + "loss": 0.624, + "step": 15857 + }, + { + "epoch": 0.55, + "learning_rate": 8.45781372269548e-06, + "loss": 0.6506, + "step": 15858 + }, + { + "epoch": 0.55, + "learning_rate": 8.456737893427252e-06, + "loss": 0.6315, + "step": 15859 + }, + { + "epoch": 0.55, + "learning_rate": 8.45566208245635e-06, + "loss": 0.6149, + "step": 15860 + }, + { + "epoch": 0.55, + "learning_rate": 8.45458628979553e-06, + "loss": 0.6394, + "step": 15861 + }, + { + "epoch": 0.55, + "learning_rate": 8.453510515457542e-06, + "loss": 0.621, + "step": 15862 + }, + { + "epoch": 0.55, + "learning_rate": 8.452434759455143e-06, + "loss": 0.6496, + "step": 15863 + }, + { + "epoch": 0.55, + "learning_rate": 8.45135902180109e-06, + "loss": 0.5886, + "step": 15864 + }, + { + "epoch": 0.55, + "learning_rate": 8.450283302508132e-06, + "loss": 0.6263, + "step": 15865 + }, + { + "epoch": 0.55, + "learning_rate": 8.449207601589026e-06, + "loss": 0.6391, + "step": 15866 + }, + { + "epoch": 0.55, + "learning_rate": 8.448131919056527e-06, + "loss": 0.6383, + "step": 15867 + }, + { + "epoch": 0.55, + "learning_rate": 8.447056254923387e-06, + "loss": 0.6051, + "step": 15868 + }, + { + "epoch": 0.55, + "learning_rate": 8.445980609202359e-06, + "loss": 0.6034, + "step": 15869 + }, + { + "epoch": 0.55, + "learning_rate": 8.444904981906199e-06, + "loss": 0.5929, + "step": 15870 + }, + { + "epoch": 0.55, + "learning_rate": 8.443829373047653e-06, + "loss": 0.6378, + "step": 15871 + }, + { + "epoch": 0.55, + "learning_rate": 8.442753782639481e-06, + "loss": 0.6822, + "step": 15872 + }, + { + "epoch": 0.55, + "learning_rate": 8.441678210694435e-06, + "loss": 0.6443, + "step": 15873 + }, + { + "epoch": 0.55, + "learning_rate": 8.440602657225263e-06, + "loss": 0.611, + "step": 15874 + }, + { + "epoch": 0.55, + "learning_rate": 8.439527122244716e-06, + "loss": 0.6417, + "step": 15875 + }, + { + "epoch": 0.55, + "learning_rate": 8.438451605765555e-06, + "loss": 0.5969, + "step": 15876 + }, + { + "epoch": 0.55, + "learning_rate": 8.437376107800522e-06, + "loss": 0.621, + "step": 15877 + }, + { + "epoch": 0.55, + "learning_rate": 8.436300628362374e-06, + "loss": 0.6406, + "step": 15878 + }, + { + "epoch": 0.55, + "learning_rate": 8.435225167463859e-06, + "loss": 0.6461, + "step": 15879 + }, + { + "epoch": 0.55, + "learning_rate": 8.434149725117728e-06, + "loss": 0.6212, + "step": 15880 + }, + { + "epoch": 0.55, + "learning_rate": 8.433074301336732e-06, + "loss": 0.6502, + "step": 15881 + }, + { + "epoch": 0.55, + "learning_rate": 8.431998896133626e-06, + "loss": 0.6007, + "step": 15882 + }, + { + "epoch": 0.55, + "learning_rate": 8.430923509521155e-06, + "loss": 0.6513, + "step": 15883 + }, + { + "epoch": 0.55, + "learning_rate": 8.42984814151207e-06, + "loss": 0.5828, + "step": 15884 + }, + { + "epoch": 0.55, + "learning_rate": 8.428772792119123e-06, + "loss": 0.6651, + "step": 15885 + }, + { + "epoch": 0.55, + "learning_rate": 8.42769746135506e-06, + "loss": 0.6231, + "step": 15886 + }, + { + "epoch": 0.55, + "learning_rate": 8.426622149232633e-06, + "loss": 0.628, + "step": 15887 + }, + { + "epoch": 0.55, + "learning_rate": 8.425546855764593e-06, + "loss": 0.6443, + "step": 15888 + }, + { + "epoch": 0.55, + "learning_rate": 8.424471580963684e-06, + "loss": 0.5774, + "step": 15889 + }, + { + "epoch": 0.55, + "learning_rate": 8.423396324842658e-06, + "loss": 0.6123, + "step": 15890 + }, + { + "epoch": 0.55, + "learning_rate": 8.422321087414266e-06, + "loss": 0.6148, + "step": 15891 + }, + { + "epoch": 0.55, + "learning_rate": 8.42124586869125e-06, + "loss": 0.6827, + "step": 15892 + }, + { + "epoch": 0.55, + "learning_rate": 8.420170668686361e-06, + "loss": 0.6238, + "step": 15893 + }, + { + "epoch": 0.55, + "learning_rate": 8.41909548741235e-06, + "loss": 0.6401, + "step": 15894 + }, + { + "epoch": 0.55, + "learning_rate": 8.41802032488196e-06, + "loss": 0.6241, + "step": 15895 + }, + { + "epoch": 0.55, + "learning_rate": 8.41694518110794e-06, + "loss": 0.645, + "step": 15896 + }, + { + "epoch": 0.55, + "learning_rate": 8.415870056103039e-06, + "loss": 0.5522, + "step": 15897 + }, + { + "epoch": 0.55, + "learning_rate": 8.41479494988e-06, + "loss": 0.5968, + "step": 15898 + }, + { + "epoch": 0.55, + "learning_rate": 8.413719862451579e-06, + "loss": 0.6363, + "step": 15899 + }, + { + "epoch": 0.55, + "learning_rate": 8.412644793830506e-06, + "loss": 0.6316, + "step": 15900 + }, + { + "epoch": 0.55, + "learning_rate": 8.41156974402954e-06, + "loss": 0.6144, + "step": 15901 + }, + { + "epoch": 0.55, + "learning_rate": 8.41049471306143e-06, + "loss": 0.6119, + "step": 15902 + }, + { + "epoch": 0.55, + "learning_rate": 8.409419700938908e-06, + "loss": 0.6391, + "step": 15903 + }, + { + "epoch": 0.55, + "learning_rate": 8.40834470767473e-06, + "loss": 0.6575, + "step": 15904 + }, + { + "epoch": 0.55, + "learning_rate": 8.407269733281644e-06, + "loss": 0.6259, + "step": 15905 + }, + { + "epoch": 0.55, + "learning_rate": 8.406194777772382e-06, + "loss": 0.6205, + "step": 15906 + }, + { + "epoch": 0.55, + "learning_rate": 8.405119841159701e-06, + "loss": 0.596, + "step": 15907 + }, + { + "epoch": 0.55, + "learning_rate": 8.404044923456346e-06, + "loss": 0.6377, + "step": 15908 + }, + { + "epoch": 0.55, + "learning_rate": 8.402970024675051e-06, + "loss": 0.6009, + "step": 15909 + }, + { + "epoch": 0.55, + "learning_rate": 8.401895144828566e-06, + "loss": 0.6416, + "step": 15910 + }, + { + "epoch": 0.55, + "learning_rate": 8.400820283929642e-06, + "loss": 0.6816, + "step": 15911 + }, + { + "epoch": 0.55, + "learning_rate": 8.399745441991011e-06, + "loss": 0.6945, + "step": 15912 + }, + { + "epoch": 0.55, + "learning_rate": 8.398670619025423e-06, + "loss": 0.7075, + "step": 15913 + }, + { + "epoch": 0.55, + "learning_rate": 8.397595815045624e-06, + "loss": 0.6292, + "step": 15914 + }, + { + "epoch": 0.55, + "learning_rate": 8.39652103006435e-06, + "loss": 0.6116, + "step": 15915 + }, + { + "epoch": 0.55, + "learning_rate": 8.395446264094346e-06, + "loss": 0.6145, + "step": 15916 + }, + { + "epoch": 0.55, + "learning_rate": 8.394371517148364e-06, + "loss": 0.6521, + "step": 15917 + }, + { + "epoch": 0.55, + "learning_rate": 8.39329678923913e-06, + "loss": 0.6437, + "step": 15918 + }, + { + "epoch": 0.55, + "learning_rate": 8.392222080379399e-06, + "loss": 0.6439, + "step": 15919 + }, + { + "epoch": 0.55, + "learning_rate": 8.391147390581914e-06, + "loss": 0.6211, + "step": 15920 + }, + { + "epoch": 0.55, + "learning_rate": 8.390072719859403e-06, + "loss": 0.6467, + "step": 15921 + }, + { + "epoch": 0.55, + "learning_rate": 8.38899806822462e-06, + "loss": 0.6532, + "step": 15922 + }, + { + "epoch": 0.55, + "learning_rate": 8.387923435690307e-06, + "loss": 0.6378, + "step": 15923 + }, + { + "epoch": 0.55, + "learning_rate": 8.386848822269194e-06, + "loss": 0.6793, + "step": 15924 + }, + { + "epoch": 0.55, + "learning_rate": 8.385774227974031e-06, + "loss": 0.6021, + "step": 15925 + }, + { + "epoch": 0.55, + "learning_rate": 8.38469965281756e-06, + "loss": 0.6557, + "step": 15926 + }, + { + "epoch": 0.55, + "learning_rate": 8.383625096812514e-06, + "loss": 0.612, + "step": 15927 + }, + { + "epoch": 0.55, + "learning_rate": 8.382550559971638e-06, + "loss": 0.5951, + "step": 15928 + }, + { + "epoch": 0.55, + "learning_rate": 8.381476042307677e-06, + "loss": 0.6479, + "step": 15929 + }, + { + "epoch": 0.55, + "learning_rate": 8.380401543833355e-06, + "loss": 0.6312, + "step": 15930 + }, + { + "epoch": 0.55, + "learning_rate": 8.379327064561427e-06, + "loss": 0.5972, + "step": 15931 + }, + { + "epoch": 0.55, + "learning_rate": 8.378252604504629e-06, + "loss": 0.558, + "step": 15932 + }, + { + "epoch": 0.55, + "learning_rate": 8.377178163675691e-06, + "loss": 0.6214, + "step": 15933 + }, + { + "epoch": 0.55, + "learning_rate": 8.376103742087363e-06, + "loss": 0.5856, + "step": 15934 + }, + { + "epoch": 0.55, + "learning_rate": 8.375029339752382e-06, + "loss": 0.6308, + "step": 15935 + }, + { + "epoch": 0.55, + "learning_rate": 8.373954956683479e-06, + "loss": 0.6608, + "step": 15936 + }, + { + "epoch": 0.55, + "learning_rate": 8.3728805928934e-06, + "loss": 0.5926, + "step": 15937 + }, + { + "epoch": 0.55, + "learning_rate": 8.371806248394882e-06, + "loss": 0.6344, + "step": 15938 + }, + { + "epoch": 0.55, + "learning_rate": 8.370731923200653e-06, + "loss": 0.5892, + "step": 15939 + }, + { + "epoch": 0.55, + "learning_rate": 8.369657617323463e-06, + "loss": 0.6765, + "step": 15940 + }, + { + "epoch": 0.55, + "learning_rate": 8.368583330776047e-06, + "loss": 0.6044, + "step": 15941 + }, + { + "epoch": 0.55, + "learning_rate": 8.367509063571133e-06, + "loss": 0.6431, + "step": 15942 + }, + { + "epoch": 0.55, + "learning_rate": 8.366434815721468e-06, + "loss": 0.6296, + "step": 15943 + }, + { + "epoch": 0.55, + "learning_rate": 8.365360587239787e-06, + "loss": 0.6366, + "step": 15944 + }, + { + "epoch": 0.55, + "learning_rate": 8.364286378138819e-06, + "loss": 0.6565, + "step": 15945 + }, + { + "epoch": 0.55, + "learning_rate": 8.363212188431306e-06, + "loss": 0.6141, + "step": 15946 + }, + { + "epoch": 0.55, + "learning_rate": 8.362138018129988e-06, + "loss": 0.6519, + "step": 15947 + }, + { + "epoch": 0.55, + "learning_rate": 8.36106386724759e-06, + "loss": 0.6446, + "step": 15948 + }, + { + "epoch": 0.55, + "learning_rate": 8.359989735796855e-06, + "loss": 0.6267, + "step": 15949 + }, + { + "epoch": 0.55, + "learning_rate": 8.358915623790519e-06, + "loss": 0.6187, + "step": 15950 + }, + { + "epoch": 0.55, + "learning_rate": 8.35784153124131e-06, + "loss": 0.6135, + "step": 15951 + }, + { + "epoch": 0.55, + "learning_rate": 8.356767458161967e-06, + "loss": 0.6262, + "step": 15952 + }, + { + "epoch": 0.55, + "learning_rate": 8.355693404565229e-06, + "loss": 0.6099, + "step": 15953 + }, + { + "epoch": 0.55, + "learning_rate": 8.354619370463822e-06, + "loss": 0.6406, + "step": 15954 + }, + { + "epoch": 0.55, + "learning_rate": 8.353545355870483e-06, + "loss": 0.5869, + "step": 15955 + }, + { + "epoch": 0.55, + "learning_rate": 8.352471360797952e-06, + "loss": 0.602, + "step": 15956 + }, + { + "epoch": 0.55, + "learning_rate": 8.351397385258951e-06, + "loss": 0.6008, + "step": 15957 + }, + { + "epoch": 0.55, + "learning_rate": 8.350323429266221e-06, + "loss": 0.6297, + "step": 15958 + }, + { + "epoch": 0.55, + "learning_rate": 8.349249492832499e-06, + "loss": 0.5861, + "step": 15959 + }, + { + "epoch": 0.55, + "learning_rate": 8.348175575970504e-06, + "loss": 0.6269, + "step": 15960 + }, + { + "epoch": 0.55, + "learning_rate": 8.347101678692985e-06, + "loss": 0.6461, + "step": 15961 + }, + { + "epoch": 0.55, + "learning_rate": 8.346027801012661e-06, + "loss": 0.6479, + "step": 15962 + }, + { + "epoch": 0.55, + "learning_rate": 8.34495394294227e-06, + "loss": 0.613, + "step": 15963 + }, + { + "epoch": 0.55, + "learning_rate": 8.343880104494548e-06, + "loss": 0.6238, + "step": 15964 + }, + { + "epoch": 0.55, + "learning_rate": 8.34280628568222e-06, + "loss": 0.6095, + "step": 15965 + }, + { + "epoch": 0.55, + "learning_rate": 8.341732486518016e-06, + "loss": 0.6475, + "step": 15966 + }, + { + "epoch": 0.55, + "learning_rate": 8.340658707014677e-06, + "loss": 0.6012, + "step": 15967 + }, + { + "epoch": 0.55, + "learning_rate": 8.339584947184925e-06, + "loss": 0.616, + "step": 15968 + }, + { + "epoch": 0.55, + "learning_rate": 8.338511207041491e-06, + "loss": 0.6296, + "step": 15969 + }, + { + "epoch": 0.55, + "learning_rate": 8.337437486597117e-06, + "loss": 0.584, + "step": 15970 + }, + { + "epoch": 0.55, + "learning_rate": 8.336363785864518e-06, + "loss": 0.6468, + "step": 15971 + }, + { + "epoch": 0.55, + "learning_rate": 8.33529010485643e-06, + "loss": 0.639, + "step": 15972 + }, + { + "epoch": 0.55, + "learning_rate": 8.33421644358559e-06, + "loss": 0.62, + "step": 15973 + }, + { + "epoch": 0.55, + "learning_rate": 8.333142802064717e-06, + "loss": 0.6378, + "step": 15974 + }, + { + "epoch": 0.55, + "learning_rate": 8.332069180306541e-06, + "loss": 0.6866, + "step": 15975 + }, + { + "epoch": 0.55, + "learning_rate": 8.330995578323803e-06, + "loss": 0.666, + "step": 15976 + }, + { + "epoch": 0.55, + "learning_rate": 8.329921996129219e-06, + "loss": 0.6148, + "step": 15977 + }, + { + "epoch": 0.55, + "learning_rate": 8.32884843373552e-06, + "loss": 0.641, + "step": 15978 + }, + { + "epoch": 0.55, + "learning_rate": 8.327774891155443e-06, + "loss": 0.6619, + "step": 15979 + }, + { + "epoch": 0.55, + "learning_rate": 8.326701368401706e-06, + "loss": 0.6351, + "step": 15980 + }, + { + "epoch": 0.55, + "learning_rate": 8.32562786548704e-06, + "loss": 0.6452, + "step": 15981 + }, + { + "epoch": 0.55, + "learning_rate": 8.324554382424179e-06, + "loss": 0.6608, + "step": 15982 + }, + { + "epoch": 0.55, + "learning_rate": 8.323480919225841e-06, + "loss": 0.6763, + "step": 15983 + }, + { + "epoch": 0.55, + "learning_rate": 8.322407475904754e-06, + "loss": 0.6136, + "step": 15984 + }, + { + "epoch": 0.55, + "learning_rate": 8.321334052473658e-06, + "loss": 0.6196, + "step": 15985 + }, + { + "epoch": 0.55, + "learning_rate": 8.320260648945264e-06, + "loss": 0.59, + "step": 15986 + }, + { + "epoch": 0.55, + "learning_rate": 8.319187265332304e-06, + "loss": 0.6217, + "step": 15987 + }, + { + "epoch": 0.55, + "learning_rate": 8.31811390164751e-06, + "loss": 0.6002, + "step": 15988 + }, + { + "epoch": 0.55, + "learning_rate": 8.3170405579036e-06, + "loss": 0.5791, + "step": 15989 + }, + { + "epoch": 0.55, + "learning_rate": 8.3159672341133e-06, + "loss": 0.5553, + "step": 15990 + }, + { + "epoch": 0.55, + "learning_rate": 8.314893930289347e-06, + "loss": 0.6886, + "step": 15991 + }, + { + "epoch": 0.55, + "learning_rate": 8.313820646444454e-06, + "loss": 0.6047, + "step": 15992 + }, + { + "epoch": 0.55, + "learning_rate": 8.312747382591346e-06, + "loss": 0.6964, + "step": 15993 + }, + { + "epoch": 0.55, + "learning_rate": 8.31167413874276e-06, + "loss": 0.6396, + "step": 15994 + }, + { + "epoch": 0.55, + "learning_rate": 8.31060091491141e-06, + "loss": 0.6077, + "step": 15995 + }, + { + "epoch": 0.55, + "learning_rate": 8.309527711110017e-06, + "loss": 0.6124, + "step": 15996 + }, + { + "epoch": 0.55, + "learning_rate": 8.308454527351321e-06, + "loss": 0.6438, + "step": 15997 + }, + { + "epoch": 0.55, + "learning_rate": 8.30738136364803e-06, + "loss": 0.6348, + "step": 15998 + }, + { + "epoch": 0.55, + "learning_rate": 8.306308220012877e-06, + "loss": 0.656, + "step": 15999 + }, + { + "epoch": 0.55, + "learning_rate": 8.305235096458583e-06, + "loss": 0.6023, + "step": 16000 + }, + { + "epoch": 0.55, + "learning_rate": 8.304161992997869e-06, + "loss": 0.606, + "step": 16001 + }, + { + "epoch": 0.55, + "learning_rate": 8.303088909643458e-06, + "loss": 0.6243, + "step": 16002 + }, + { + "epoch": 0.55, + "learning_rate": 8.30201584640808e-06, + "loss": 0.6446, + "step": 16003 + }, + { + "epoch": 0.55, + "learning_rate": 8.300942803304448e-06, + "loss": 0.6267, + "step": 16004 + }, + { + "epoch": 0.55, + "learning_rate": 8.29986978034529e-06, + "loss": 0.6406, + "step": 16005 + }, + { + "epoch": 0.55, + "learning_rate": 8.298796777543325e-06, + "loss": 0.6834, + "step": 16006 + }, + { + "epoch": 0.55, + "learning_rate": 8.297723794911276e-06, + "loss": 0.6936, + "step": 16007 + }, + { + "epoch": 0.55, + "learning_rate": 8.296650832461866e-06, + "loss": 0.6098, + "step": 16008 + }, + { + "epoch": 0.55, + "learning_rate": 8.295577890207817e-06, + "loss": 0.6341, + "step": 16009 + }, + { + "epoch": 0.55, + "learning_rate": 8.294504968161844e-06, + "loss": 0.631, + "step": 16010 + }, + { + "epoch": 0.55, + "learning_rate": 8.293432066336675e-06, + "loss": 0.6008, + "step": 16011 + }, + { + "epoch": 0.55, + "learning_rate": 8.292359184745028e-06, + "loss": 0.6289, + "step": 16012 + }, + { + "epoch": 0.55, + "learning_rate": 8.291286323399622e-06, + "loss": 0.6357, + "step": 16013 + }, + { + "epoch": 0.55, + "learning_rate": 8.290213482313177e-06, + "loss": 0.6316, + "step": 16014 + }, + { + "epoch": 0.55, + "learning_rate": 8.289140661498416e-06, + "loss": 0.5915, + "step": 16015 + }, + { + "epoch": 0.55, + "learning_rate": 8.288067860968055e-06, + "loss": 0.5847, + "step": 16016 + }, + { + "epoch": 0.55, + "learning_rate": 8.286995080734817e-06, + "loss": 0.7003, + "step": 16017 + }, + { + "epoch": 0.55, + "learning_rate": 8.28592232081142e-06, + "loss": 0.6289, + "step": 16018 + }, + { + "epoch": 0.56, + "learning_rate": 8.28484958121058e-06, + "loss": 0.667, + "step": 16019 + }, + { + "epoch": 0.56, + "learning_rate": 8.283776861945016e-06, + "loss": 0.6516, + "step": 16020 + }, + { + "epoch": 0.56, + "learning_rate": 8.282704163027453e-06, + "loss": 0.6496, + "step": 16021 + }, + { + "epoch": 0.56, + "learning_rate": 8.2816314844706e-06, + "loss": 0.6157, + "step": 16022 + }, + { + "epoch": 0.56, + "learning_rate": 8.280558826287184e-06, + "loss": 0.6098, + "step": 16023 + }, + { + "epoch": 0.56, + "learning_rate": 8.279486188489916e-06, + "loss": 0.6017, + "step": 16024 + }, + { + "epoch": 0.56, + "learning_rate": 8.278413571091515e-06, + "loss": 0.622, + "step": 16025 + }, + { + "epoch": 0.56, + "learning_rate": 8.2773409741047e-06, + "loss": 0.593, + "step": 16026 + }, + { + "epoch": 0.56, + "learning_rate": 8.276268397542186e-06, + "loss": 0.6061, + "step": 16027 + }, + { + "epoch": 0.56, + "learning_rate": 8.275195841416692e-06, + "loss": 0.5843, + "step": 16028 + }, + { + "epoch": 0.56, + "learning_rate": 8.274123305740934e-06, + "loss": 0.5989, + "step": 16029 + }, + { + "epoch": 0.56, + "learning_rate": 8.273050790527624e-06, + "loss": 0.6095, + "step": 16030 + }, + { + "epoch": 0.56, + "learning_rate": 8.271978295789482e-06, + "loss": 0.6377, + "step": 16031 + }, + { + "epoch": 0.56, + "learning_rate": 8.270905821539227e-06, + "loss": 0.6519, + "step": 16032 + }, + { + "epoch": 0.56, + "learning_rate": 8.269833367789566e-06, + "loss": 0.66, + "step": 16033 + }, + { + "epoch": 0.56, + "learning_rate": 8.268760934553221e-06, + "loss": 0.5921, + "step": 16034 + }, + { + "epoch": 0.56, + "learning_rate": 8.267688521842909e-06, + "loss": 0.6414, + "step": 16035 + }, + { + "epoch": 0.56, + "learning_rate": 8.266616129671337e-06, + "loss": 0.6318, + "step": 16036 + }, + { + "epoch": 0.56, + "learning_rate": 8.265543758051221e-06, + "loss": 0.6414, + "step": 16037 + }, + { + "epoch": 0.56, + "learning_rate": 8.264471406995285e-06, + "loss": 0.6676, + "step": 16038 + }, + { + "epoch": 0.56, + "learning_rate": 8.26339907651623e-06, + "loss": 0.6371, + "step": 16039 + }, + { + "epoch": 0.56, + "learning_rate": 8.262326766626778e-06, + "loss": 0.6064, + "step": 16040 + }, + { + "epoch": 0.56, + "learning_rate": 8.261254477339642e-06, + "loss": 0.6559, + "step": 16041 + }, + { + "epoch": 0.56, + "learning_rate": 8.26018220866753e-06, + "loss": 0.6175, + "step": 16042 + }, + { + "epoch": 0.56, + "learning_rate": 8.259109960623159e-06, + "loss": 0.648, + "step": 16043 + }, + { + "epoch": 0.56, + "learning_rate": 8.258037733219245e-06, + "loss": 0.6477, + "step": 16044 + }, + { + "epoch": 0.56, + "learning_rate": 8.256965526468495e-06, + "loss": 0.5611, + "step": 16045 + }, + { + "epoch": 0.56, + "learning_rate": 8.255893340383623e-06, + "loss": 0.5739, + "step": 16046 + }, + { + "epoch": 0.56, + "learning_rate": 8.254821174977344e-06, + "loss": 0.6173, + "step": 16047 + }, + { + "epoch": 0.56, + "learning_rate": 8.253749030262366e-06, + "loss": 0.6672, + "step": 16048 + }, + { + "epoch": 0.56, + "learning_rate": 8.252676906251402e-06, + "loss": 0.6431, + "step": 16049 + }, + { + "epoch": 0.56, + "learning_rate": 8.251604802957166e-06, + "loss": 0.6154, + "step": 16050 + }, + { + "epoch": 0.56, + "learning_rate": 8.250532720392364e-06, + "loss": 0.5979, + "step": 16051 + }, + { + "epoch": 0.56, + "learning_rate": 8.24946065856971e-06, + "loss": 0.7005, + "step": 16052 + }, + { + "epoch": 0.56, + "learning_rate": 8.248388617501917e-06, + "loss": 0.6006, + "step": 16053 + }, + { + "epoch": 0.56, + "learning_rate": 8.247316597201691e-06, + "loss": 0.6, + "step": 16054 + }, + { + "epoch": 0.56, + "learning_rate": 8.246244597681743e-06, + "loss": 0.6235, + "step": 16055 + }, + { + "epoch": 0.56, + "learning_rate": 8.245172618954786e-06, + "loss": 0.6438, + "step": 16056 + }, + { + "epoch": 0.56, + "learning_rate": 8.244100661033526e-06, + "loss": 0.6333, + "step": 16057 + }, + { + "epoch": 0.56, + "learning_rate": 8.243028723930673e-06, + "loss": 0.635, + "step": 16058 + }, + { + "epoch": 0.56, + "learning_rate": 8.241956807658939e-06, + "loss": 0.6223, + "step": 16059 + }, + { + "epoch": 0.56, + "learning_rate": 8.24088491223103e-06, + "loss": 0.5888, + "step": 16060 + }, + { + "epoch": 0.56, + "learning_rate": 8.239813037659655e-06, + "loss": 0.6142, + "step": 16061 + }, + { + "epoch": 0.56, + "learning_rate": 8.238741183957525e-06, + "loss": 0.6352, + "step": 16062 + }, + { + "epoch": 0.56, + "learning_rate": 8.237669351137343e-06, + "loss": 0.6082, + "step": 16063 + }, + { + "epoch": 0.56, + "learning_rate": 8.236597539211823e-06, + "loss": 0.648, + "step": 16064 + }, + { + "epoch": 0.56, + "learning_rate": 8.23552574819367e-06, + "loss": 0.599, + "step": 16065 + }, + { + "epoch": 0.56, + "learning_rate": 8.23445397809559e-06, + "loss": 0.661, + "step": 16066 + }, + { + "epoch": 0.56, + "learning_rate": 8.23338222893029e-06, + "loss": 0.5972, + "step": 16067 + }, + { + "epoch": 0.56, + "learning_rate": 8.232310500710482e-06, + "loss": 0.5544, + "step": 16068 + }, + { + "epoch": 0.56, + "learning_rate": 8.231238793448868e-06, + "loss": 0.6713, + "step": 16069 + }, + { + "epoch": 0.56, + "learning_rate": 8.230167107158154e-06, + "loss": 0.6246, + "step": 16070 + }, + { + "epoch": 0.56, + "learning_rate": 8.22909544185105e-06, + "loss": 0.6547, + "step": 16071 + }, + { + "epoch": 0.56, + "learning_rate": 8.22802379754026e-06, + "loss": 0.6382, + "step": 16072 + }, + { + "epoch": 0.56, + "learning_rate": 8.226952174238487e-06, + "loss": 0.5706, + "step": 16073 + }, + { + "epoch": 0.56, + "learning_rate": 8.225880571958441e-06, + "loss": 0.6091, + "step": 16074 + }, + { + "epoch": 0.56, + "learning_rate": 8.224808990712823e-06, + "loss": 0.6164, + "step": 16075 + }, + { + "epoch": 0.56, + "learning_rate": 8.22373743051434e-06, + "loss": 0.6524, + "step": 16076 + }, + { + "epoch": 0.56, + "learning_rate": 8.2226658913757e-06, + "loss": 0.6246, + "step": 16077 + }, + { + "epoch": 0.56, + "learning_rate": 8.221594373309602e-06, + "loss": 0.616, + "step": 16078 + }, + { + "epoch": 0.56, + "learning_rate": 8.220522876328751e-06, + "loss": 0.5527, + "step": 16079 + }, + { + "epoch": 0.56, + "learning_rate": 8.219451400445857e-06, + "loss": 0.6284, + "step": 16080 + }, + { + "epoch": 0.56, + "learning_rate": 8.218379945673613e-06, + "loss": 0.6334, + "step": 16081 + }, + { + "epoch": 0.56, + "learning_rate": 8.217308512024732e-06, + "loss": 0.631, + "step": 16082 + }, + { + "epoch": 0.56, + "learning_rate": 8.216237099511915e-06, + "loss": 0.6122, + "step": 16083 + }, + { + "epoch": 0.56, + "learning_rate": 8.21516570814786e-06, + "loss": 0.6206, + "step": 16084 + }, + { + "epoch": 0.56, + "learning_rate": 8.214094337945277e-06, + "loss": 0.6795, + "step": 16085 + }, + { + "epoch": 0.56, + "learning_rate": 8.213022988916862e-06, + "loss": 0.6296, + "step": 16086 + }, + { + "epoch": 0.56, + "learning_rate": 8.211951661075322e-06, + "loss": 0.6439, + "step": 16087 + }, + { + "epoch": 0.56, + "learning_rate": 8.210880354433356e-06, + "loss": 0.6588, + "step": 16088 + }, + { + "epoch": 0.56, + "learning_rate": 8.209809069003666e-06, + "loss": 0.592, + "step": 16089 + }, + { + "epoch": 0.56, + "learning_rate": 8.208737804798954e-06, + "loss": 0.6018, + "step": 16090 + }, + { + "epoch": 0.56, + "learning_rate": 8.207666561831924e-06, + "loss": 0.6516, + "step": 16091 + }, + { + "epoch": 0.56, + "learning_rate": 8.20659534011527e-06, + "loss": 0.658, + "step": 16092 + }, + { + "epoch": 0.56, + "learning_rate": 8.2055241396617e-06, + "loss": 0.6664, + "step": 16093 + }, + { + "epoch": 0.56, + "learning_rate": 8.204452960483911e-06, + "loss": 0.6111, + "step": 16094 + }, + { + "epoch": 0.56, + "learning_rate": 8.203381802594602e-06, + "loss": 0.6254, + "step": 16095 + }, + { + "epoch": 0.56, + "learning_rate": 8.202310666006475e-06, + "loss": 0.6335, + "step": 16096 + }, + { + "epoch": 0.56, + "learning_rate": 8.201239550732232e-06, + "loss": 0.5991, + "step": 16097 + }, + { + "epoch": 0.56, + "learning_rate": 8.200168456784566e-06, + "loss": 0.5647, + "step": 16098 + }, + { + "epoch": 0.56, + "learning_rate": 8.19909738417618e-06, + "loss": 0.653, + "step": 16099 + }, + { + "epoch": 0.56, + "learning_rate": 8.198026332919776e-06, + "loss": 0.6257, + "step": 16100 + }, + { + "epoch": 0.56, + "learning_rate": 8.196955303028044e-06, + "loss": 0.6135, + "step": 16101 + }, + { + "epoch": 0.56, + "learning_rate": 8.195884294513691e-06, + "loss": 0.6582, + "step": 16102 + }, + { + "epoch": 0.56, + "learning_rate": 8.194813307389412e-06, + "loss": 0.6441, + "step": 16103 + }, + { + "epoch": 0.56, + "learning_rate": 8.193742341667906e-06, + "loss": 0.6418, + "step": 16104 + }, + { + "epoch": 0.56, + "learning_rate": 8.192671397361866e-06, + "loss": 0.628, + "step": 16105 + }, + { + "epoch": 0.56, + "learning_rate": 8.191600474483996e-06, + "loss": 0.6289, + "step": 16106 + }, + { + "epoch": 0.56, + "learning_rate": 8.190529573046988e-06, + "loss": 0.6397, + "step": 16107 + }, + { + "epoch": 0.56, + "learning_rate": 8.189458693063542e-06, + "loss": 0.5768, + "step": 16108 + }, + { + "epoch": 0.56, + "learning_rate": 8.188387834546352e-06, + "loss": 0.6278, + "step": 16109 + }, + { + "epoch": 0.56, + "learning_rate": 8.187316997508117e-06, + "loss": 0.6272, + "step": 16110 + }, + { + "epoch": 0.56, + "learning_rate": 8.186246181961533e-06, + "loss": 0.5775, + "step": 16111 + }, + { + "epoch": 0.56, + "learning_rate": 8.185175387919295e-06, + "loss": 0.6359, + "step": 16112 + }, + { + "epoch": 0.56, + "learning_rate": 8.184104615394096e-06, + "loss": 0.6186, + "step": 16113 + }, + { + "epoch": 0.56, + "learning_rate": 8.183033864398635e-06, + "loss": 0.6593, + "step": 16114 + }, + { + "epoch": 0.56, + "learning_rate": 8.181963134945609e-06, + "loss": 0.6414, + "step": 16115 + }, + { + "epoch": 0.56, + "learning_rate": 8.180892427047706e-06, + "loss": 0.6862, + "step": 16116 + }, + { + "epoch": 0.56, + "learning_rate": 8.179821740717625e-06, + "loss": 0.571, + "step": 16117 + }, + { + "epoch": 0.56, + "learning_rate": 8.178751075968062e-06, + "loss": 0.5926, + "step": 16118 + }, + { + "epoch": 0.56, + "learning_rate": 8.177680432811706e-06, + "loss": 0.6377, + "step": 16119 + }, + { + "epoch": 0.56, + "learning_rate": 8.176609811261255e-06, + "loss": 0.6679, + "step": 16120 + }, + { + "epoch": 0.56, + "learning_rate": 8.175539211329403e-06, + "loss": 0.6573, + "step": 16121 + }, + { + "epoch": 0.56, + "learning_rate": 8.17446863302884e-06, + "loss": 0.6244, + "step": 16122 + }, + { + "epoch": 0.56, + "learning_rate": 8.17339807637226e-06, + "loss": 0.6355, + "step": 16123 + }, + { + "epoch": 0.56, + "learning_rate": 8.172327541372359e-06, + "loss": 0.6316, + "step": 16124 + }, + { + "epoch": 0.56, + "learning_rate": 8.171257028041824e-06, + "loss": 0.6, + "step": 16125 + }, + { + "epoch": 0.56, + "learning_rate": 8.170186536393352e-06, + "loss": 0.632, + "step": 16126 + }, + { + "epoch": 0.56, + "learning_rate": 8.169116066439633e-06, + "loss": 0.675, + "step": 16127 + }, + { + "epoch": 0.56, + "learning_rate": 8.16804561819336e-06, + "loss": 0.6468, + "step": 16128 + }, + { + "epoch": 0.56, + "learning_rate": 8.16697519166722e-06, + "loss": 0.6696, + "step": 16129 + }, + { + "epoch": 0.56, + "learning_rate": 8.165904786873913e-06, + "loss": 0.6415, + "step": 16130 + }, + { + "epoch": 0.56, + "learning_rate": 8.16483440382612e-06, + "loss": 0.5946, + "step": 16131 + }, + { + "epoch": 0.56, + "learning_rate": 8.163764042536539e-06, + "loss": 0.6012, + "step": 16132 + }, + { + "epoch": 0.56, + "learning_rate": 8.16269370301786e-06, + "loss": 0.6395, + "step": 16133 + }, + { + "epoch": 0.56, + "learning_rate": 8.161623385282768e-06, + "loss": 0.6408, + "step": 16134 + }, + { + "epoch": 0.56, + "learning_rate": 8.160553089343959e-06, + "loss": 0.6101, + "step": 16135 + }, + { + "epoch": 0.56, + "learning_rate": 8.159482815214118e-06, + "loss": 0.6463, + "step": 16136 + }, + { + "epoch": 0.56, + "learning_rate": 8.158412562905939e-06, + "loss": 0.6316, + "step": 16137 + }, + { + "epoch": 0.56, + "learning_rate": 8.157342332432106e-06, + "loss": 0.6105, + "step": 16138 + }, + { + "epoch": 0.56, + "learning_rate": 8.156272123805314e-06, + "loss": 0.5959, + "step": 16139 + }, + { + "epoch": 0.56, + "learning_rate": 8.155201937038244e-06, + "loss": 0.5968, + "step": 16140 + }, + { + "epoch": 0.56, + "learning_rate": 8.15413177214359e-06, + "loss": 0.6655, + "step": 16141 + }, + { + "epoch": 0.56, + "learning_rate": 8.153061629134042e-06, + "loss": 0.5845, + "step": 16142 + }, + { + "epoch": 0.56, + "learning_rate": 8.15199150802228e-06, + "loss": 0.6192, + "step": 16143 + }, + { + "epoch": 0.56, + "learning_rate": 8.150921408820998e-06, + "loss": 0.631, + "step": 16144 + }, + { + "epoch": 0.56, + "learning_rate": 8.149851331542886e-06, + "loss": 0.6561, + "step": 16145 + }, + { + "epoch": 0.56, + "learning_rate": 8.14878127620062e-06, + "loss": 0.6287, + "step": 16146 + }, + { + "epoch": 0.56, + "learning_rate": 8.147711242806902e-06, + "loss": 0.6151, + "step": 16147 + }, + { + "epoch": 0.56, + "learning_rate": 8.146641231374403e-06, + "loss": 0.5951, + "step": 16148 + }, + { + "epoch": 0.56, + "learning_rate": 8.14557124191582e-06, + "loss": 0.6946, + "step": 16149 + }, + { + "epoch": 0.56, + "learning_rate": 8.144501274443838e-06, + "loss": 0.6447, + "step": 16150 + }, + { + "epoch": 0.56, + "learning_rate": 8.143431328971136e-06, + "loss": 0.6163, + "step": 16151 + }, + { + "epoch": 0.56, + "learning_rate": 8.142361405510403e-06, + "loss": 0.5746, + "step": 16152 + }, + { + "epoch": 0.56, + "learning_rate": 8.141291504074333e-06, + "loss": 0.6929, + "step": 16153 + }, + { + "epoch": 0.56, + "learning_rate": 8.140221624675595e-06, + "loss": 0.5798, + "step": 16154 + }, + { + "epoch": 0.56, + "learning_rate": 8.139151767326887e-06, + "loss": 0.6721, + "step": 16155 + }, + { + "epoch": 0.56, + "learning_rate": 8.138081932040892e-06, + "loss": 0.5891, + "step": 16156 + }, + { + "epoch": 0.56, + "learning_rate": 8.137012118830282e-06, + "loss": 0.5941, + "step": 16157 + }, + { + "epoch": 0.56, + "learning_rate": 8.135942327707755e-06, + "loss": 0.6498, + "step": 16158 + }, + { + "epoch": 0.56, + "learning_rate": 8.134872558685994e-06, + "loss": 0.6388, + "step": 16159 + }, + { + "epoch": 0.56, + "learning_rate": 8.133802811777671e-06, + "loss": 0.6422, + "step": 16160 + }, + { + "epoch": 0.56, + "learning_rate": 8.132733086995479e-06, + "loss": 0.5906, + "step": 16161 + }, + { + "epoch": 0.56, + "learning_rate": 8.131663384352102e-06, + "loss": 0.5965, + "step": 16162 + }, + { + "epoch": 0.56, + "learning_rate": 8.130593703860214e-06, + "loss": 0.6307, + "step": 16163 + }, + { + "epoch": 0.56, + "learning_rate": 8.129524045532503e-06, + "loss": 0.6424, + "step": 16164 + }, + { + "epoch": 0.56, + "learning_rate": 8.128454409381655e-06, + "loss": 0.6388, + "step": 16165 + }, + { + "epoch": 0.56, + "learning_rate": 8.127384795420342e-06, + "loss": 0.667, + "step": 16166 + }, + { + "epoch": 0.56, + "learning_rate": 8.126315203661252e-06, + "loss": 0.6603, + "step": 16167 + }, + { + "epoch": 0.56, + "learning_rate": 8.125245634117072e-06, + "loss": 0.6196, + "step": 16168 + }, + { + "epoch": 0.56, + "learning_rate": 8.124176086800469e-06, + "loss": 0.6552, + "step": 16169 + }, + { + "epoch": 0.56, + "learning_rate": 8.123106561724132e-06, + "loss": 0.6184, + "step": 16170 + }, + { + "epoch": 0.56, + "learning_rate": 8.122037058900747e-06, + "loss": 0.6389, + "step": 16171 + }, + { + "epoch": 0.56, + "learning_rate": 8.12096757834298e-06, + "loss": 0.6286, + "step": 16172 + }, + { + "epoch": 0.56, + "learning_rate": 8.119898120063525e-06, + "loss": 0.5879, + "step": 16173 + }, + { + "epoch": 0.56, + "learning_rate": 8.118828684075058e-06, + "loss": 0.6226, + "step": 16174 + }, + { + "epoch": 0.56, + "learning_rate": 8.11775927039025e-06, + "loss": 0.6648, + "step": 16175 + }, + { + "epoch": 0.56, + "learning_rate": 8.11668987902179e-06, + "loss": 0.6537, + "step": 16176 + }, + { + "epoch": 0.56, + "learning_rate": 8.115620509982356e-06, + "loss": 0.6503, + "step": 16177 + }, + { + "epoch": 0.56, + "learning_rate": 8.114551163284621e-06, + "loss": 0.6175, + "step": 16178 + }, + { + "epoch": 0.56, + "learning_rate": 8.113481838941268e-06, + "loss": 0.6474, + "step": 16179 + }, + { + "epoch": 0.56, + "learning_rate": 8.112412536964978e-06, + "loss": 0.5978, + "step": 16180 + }, + { + "epoch": 0.56, + "learning_rate": 8.11134325736842e-06, + "loss": 0.669, + "step": 16181 + }, + { + "epoch": 0.56, + "learning_rate": 8.110274000164278e-06, + "loss": 0.6331, + "step": 16182 + }, + { + "epoch": 0.56, + "learning_rate": 8.109204765365233e-06, + "loss": 0.6207, + "step": 16183 + }, + { + "epoch": 0.56, + "learning_rate": 8.10813555298395e-06, + "loss": 0.6633, + "step": 16184 + }, + { + "epoch": 0.56, + "learning_rate": 8.107066363033118e-06, + "loss": 0.618, + "step": 16185 + }, + { + "epoch": 0.56, + "learning_rate": 8.105997195525411e-06, + "loss": 0.6218, + "step": 16186 + }, + { + "epoch": 0.56, + "learning_rate": 8.104928050473497e-06, + "loss": 0.615, + "step": 16187 + }, + { + "epoch": 0.56, + "learning_rate": 8.10385892789006e-06, + "loss": 0.6746, + "step": 16188 + }, + { + "epoch": 0.56, + "learning_rate": 8.102789827787779e-06, + "loss": 0.5992, + "step": 16189 + }, + { + "epoch": 0.56, + "learning_rate": 8.101720750179318e-06, + "loss": 0.6116, + "step": 16190 + }, + { + "epoch": 0.56, + "learning_rate": 8.100651695077362e-06, + "loss": 0.5912, + "step": 16191 + }, + { + "epoch": 0.56, + "learning_rate": 8.099582662494585e-06, + "loss": 0.5646, + "step": 16192 + }, + { + "epoch": 0.56, + "learning_rate": 8.098513652443658e-06, + "loss": 0.6445, + "step": 16193 + }, + { + "epoch": 0.56, + "learning_rate": 8.097444664937252e-06, + "loss": 0.6469, + "step": 16194 + }, + { + "epoch": 0.56, + "learning_rate": 8.096375699988056e-06, + "loss": 0.6156, + "step": 16195 + }, + { + "epoch": 0.56, + "learning_rate": 8.095306757608726e-06, + "loss": 0.6128, + "step": 16196 + }, + { + "epoch": 0.56, + "learning_rate": 8.094237837811944e-06, + "loss": 0.6448, + "step": 16197 + }, + { + "epoch": 0.56, + "learning_rate": 8.09316894061039e-06, + "loss": 0.6132, + "step": 16198 + }, + { + "epoch": 0.56, + "learning_rate": 8.092100066016723e-06, + "loss": 0.644, + "step": 16199 + }, + { + "epoch": 0.56, + "learning_rate": 8.091031214043624e-06, + "loss": 0.6296, + "step": 16200 + }, + { + "epoch": 0.56, + "learning_rate": 8.08996238470377e-06, + "loss": 0.6581, + "step": 16201 + }, + { + "epoch": 0.56, + "learning_rate": 8.088893578009826e-06, + "loss": 0.6227, + "step": 16202 + }, + { + "epoch": 0.56, + "learning_rate": 8.087824793974463e-06, + "loss": 0.6604, + "step": 16203 + }, + { + "epoch": 0.56, + "learning_rate": 8.086756032610362e-06, + "loss": 0.6616, + "step": 16204 + }, + { + "epoch": 0.56, + "learning_rate": 8.085687293930183e-06, + "loss": 0.6263, + "step": 16205 + }, + { + "epoch": 0.56, + "learning_rate": 8.084618577946602e-06, + "loss": 0.6647, + "step": 16206 + }, + { + "epoch": 0.56, + "learning_rate": 8.083549884672297e-06, + "loss": 0.6087, + "step": 16207 + }, + { + "epoch": 0.56, + "learning_rate": 8.082481214119928e-06, + "loss": 0.6031, + "step": 16208 + }, + { + "epoch": 0.56, + "learning_rate": 8.081412566302173e-06, + "loss": 0.689, + "step": 16209 + }, + { + "epoch": 0.56, + "learning_rate": 8.080343941231695e-06, + "loss": 0.6248, + "step": 16210 + }, + { + "epoch": 0.56, + "learning_rate": 8.07927533892117e-06, + "loss": 0.6581, + "step": 16211 + }, + { + "epoch": 0.56, + "learning_rate": 8.078206759383265e-06, + "loss": 0.6246, + "step": 16212 + }, + { + "epoch": 0.56, + "learning_rate": 8.07713820263065e-06, + "loss": 0.6441, + "step": 16213 + }, + { + "epoch": 0.56, + "learning_rate": 8.076069668675995e-06, + "loss": 0.6661, + "step": 16214 + }, + { + "epoch": 0.56, + "learning_rate": 8.075001157531968e-06, + "loss": 0.6619, + "step": 16215 + }, + { + "epoch": 0.56, + "learning_rate": 8.073932669211234e-06, + "loss": 0.6361, + "step": 16216 + }, + { + "epoch": 0.56, + "learning_rate": 8.072864203726467e-06, + "loss": 0.6101, + "step": 16217 + }, + { + "epoch": 0.56, + "learning_rate": 8.071795761090336e-06, + "loss": 0.618, + "step": 16218 + }, + { + "epoch": 0.56, + "learning_rate": 8.0707273413155e-06, + "loss": 0.6136, + "step": 16219 + }, + { + "epoch": 0.56, + "learning_rate": 8.069658944414635e-06, + "loss": 0.6268, + "step": 16220 + }, + { + "epoch": 0.56, + "learning_rate": 8.068590570400405e-06, + "loss": 0.6074, + "step": 16221 + }, + { + "epoch": 0.56, + "learning_rate": 8.067522219285475e-06, + "loss": 0.6554, + "step": 16222 + }, + { + "epoch": 0.56, + "learning_rate": 8.066453891082516e-06, + "loss": 0.6587, + "step": 16223 + }, + { + "epoch": 0.56, + "learning_rate": 8.065385585804191e-06, + "loss": 0.6381, + "step": 16224 + }, + { + "epoch": 0.56, + "learning_rate": 8.064317303463167e-06, + "loss": 0.5806, + "step": 16225 + }, + { + "epoch": 0.56, + "learning_rate": 8.06324904407211e-06, + "loss": 0.6356, + "step": 16226 + }, + { + "epoch": 0.56, + "learning_rate": 8.062180807643687e-06, + "loss": 0.6665, + "step": 16227 + }, + { + "epoch": 0.56, + "learning_rate": 8.06111259419056e-06, + "loss": 0.6393, + "step": 16228 + }, + { + "epoch": 0.56, + "learning_rate": 8.060044403725397e-06, + "loss": 0.7185, + "step": 16229 + }, + { + "epoch": 0.56, + "learning_rate": 8.058976236260863e-06, + "loss": 0.6395, + "step": 16230 + }, + { + "epoch": 0.56, + "learning_rate": 8.057908091809618e-06, + "loss": 0.6693, + "step": 16231 + }, + { + "epoch": 0.56, + "learning_rate": 8.05683997038433e-06, + "loss": 0.6204, + "step": 16232 + }, + { + "epoch": 0.56, + "learning_rate": 8.055771871997665e-06, + "loss": 0.6652, + "step": 16233 + }, + { + "epoch": 0.56, + "learning_rate": 8.05470379666228e-06, + "loss": 0.6441, + "step": 16234 + }, + { + "epoch": 0.56, + "learning_rate": 8.053635744390844e-06, + "loss": 0.6546, + "step": 16235 + }, + { + "epoch": 0.56, + "learning_rate": 8.052567715196021e-06, + "loss": 0.6519, + "step": 16236 + }, + { + "epoch": 0.56, + "learning_rate": 8.051499709090469e-06, + "loss": 0.6498, + "step": 16237 + }, + { + "epoch": 0.56, + "learning_rate": 8.05043172608685e-06, + "loss": 0.6259, + "step": 16238 + }, + { + "epoch": 0.56, + "learning_rate": 8.049363766197835e-06, + "loss": 0.5938, + "step": 16239 + }, + { + "epoch": 0.56, + "learning_rate": 8.048295829436075e-06, + "loss": 0.6327, + "step": 16240 + }, + { + "epoch": 0.56, + "learning_rate": 8.04722791581424e-06, + "loss": 0.5804, + "step": 16241 + }, + { + "epoch": 0.56, + "learning_rate": 8.046160025344987e-06, + "loss": 0.5878, + "step": 16242 + }, + { + "epoch": 0.56, + "learning_rate": 8.04509215804098e-06, + "loss": 0.6253, + "step": 16243 + }, + { + "epoch": 0.56, + "learning_rate": 8.044024313914876e-06, + "loss": 0.6135, + "step": 16244 + }, + { + "epoch": 0.56, + "learning_rate": 8.04295649297934e-06, + "loss": 0.6665, + "step": 16245 + }, + { + "epoch": 0.56, + "learning_rate": 8.041888695247029e-06, + "loss": 0.592, + "step": 16246 + }, + { + "epoch": 0.56, + "learning_rate": 8.040820920730605e-06, + "loss": 0.6274, + "step": 16247 + }, + { + "epoch": 0.56, + "learning_rate": 8.03975316944273e-06, + "loss": 0.6246, + "step": 16248 + }, + { + "epoch": 0.56, + "learning_rate": 8.038685441396057e-06, + "loss": 0.6679, + "step": 16249 + }, + { + "epoch": 0.56, + "learning_rate": 8.03761773660325e-06, + "loss": 0.6178, + "step": 16250 + }, + { + "epoch": 0.56, + "learning_rate": 8.036550055076967e-06, + "loss": 0.628, + "step": 16251 + }, + { + "epoch": 0.56, + "learning_rate": 8.035482396829867e-06, + "loss": 0.6327, + "step": 16252 + }, + { + "epoch": 0.56, + "learning_rate": 8.03441476187461e-06, + "loss": 0.595, + "step": 16253 + }, + { + "epoch": 0.56, + "learning_rate": 8.033347150223853e-06, + "loss": 0.6323, + "step": 16254 + }, + { + "epoch": 0.56, + "learning_rate": 8.032279561890251e-06, + "loss": 0.6294, + "step": 16255 + }, + { + "epoch": 0.56, + "learning_rate": 8.031211996886464e-06, + "loss": 0.662, + "step": 16256 + }, + { + "epoch": 0.56, + "learning_rate": 8.030144455225152e-06, + "loss": 0.6098, + "step": 16257 + }, + { + "epoch": 0.56, + "learning_rate": 8.029076936918967e-06, + "loss": 0.6379, + "step": 16258 + }, + { + "epoch": 0.56, + "learning_rate": 8.028009441980568e-06, + "loss": 0.6093, + "step": 16259 + }, + { + "epoch": 0.56, + "learning_rate": 8.026941970422613e-06, + "loss": 0.6249, + "step": 16260 + }, + { + "epoch": 0.56, + "learning_rate": 8.025874522257755e-06, + "loss": 0.6168, + "step": 16261 + }, + { + "epoch": 0.56, + "learning_rate": 8.024807097498653e-06, + "loss": 0.6193, + "step": 16262 + }, + { + "epoch": 0.56, + "learning_rate": 8.023739696157962e-06, + "loss": 0.5716, + "step": 16263 + }, + { + "epoch": 0.56, + "learning_rate": 8.022672318248337e-06, + "loss": 0.6638, + "step": 16264 + }, + { + "epoch": 0.56, + "learning_rate": 8.021604963782431e-06, + "loss": 0.5949, + "step": 16265 + }, + { + "epoch": 0.56, + "learning_rate": 8.020537632772904e-06, + "loss": 0.597, + "step": 16266 + }, + { + "epoch": 0.56, + "learning_rate": 8.019470325232405e-06, + "loss": 0.6387, + "step": 16267 + }, + { + "epoch": 0.56, + "learning_rate": 8.01840304117359e-06, + "loss": 0.635, + "step": 16268 + }, + { + "epoch": 0.56, + "learning_rate": 8.017335780609118e-06, + "loss": 0.7025, + "step": 16269 + }, + { + "epoch": 0.56, + "learning_rate": 8.016268543551632e-06, + "loss": 0.6876, + "step": 16270 + }, + { + "epoch": 0.56, + "learning_rate": 8.015201330013798e-06, + "loss": 0.6964, + "step": 16271 + }, + { + "epoch": 0.56, + "learning_rate": 8.01413414000826e-06, + "loss": 0.6509, + "step": 16272 + }, + { + "epoch": 0.56, + "learning_rate": 8.013066973547674e-06, + "loss": 0.6799, + "step": 16273 + }, + { + "epoch": 0.56, + "learning_rate": 8.011999830644692e-06, + "loss": 0.612, + "step": 16274 + }, + { + "epoch": 0.56, + "learning_rate": 8.010932711311968e-06, + "loss": 0.6375, + "step": 16275 + }, + { + "epoch": 0.56, + "learning_rate": 8.009865615562152e-06, + "loss": 0.6487, + "step": 16276 + }, + { + "epoch": 0.56, + "learning_rate": 8.008798543407897e-06, + "loss": 0.5973, + "step": 16277 + }, + { + "epoch": 0.56, + "learning_rate": 8.007731494861855e-06, + "loss": 0.643, + "step": 16278 + }, + { + "epoch": 0.56, + "learning_rate": 8.006664469936673e-06, + "loss": 0.5965, + "step": 16279 + }, + { + "epoch": 0.56, + "learning_rate": 8.00559746864501e-06, + "loss": 0.6642, + "step": 16280 + }, + { + "epoch": 0.56, + "learning_rate": 8.004530490999509e-06, + "loss": 0.6122, + "step": 16281 + }, + { + "epoch": 0.56, + "learning_rate": 8.003463537012823e-06, + "loss": 0.6403, + "step": 16282 + }, + { + "epoch": 0.56, + "learning_rate": 8.002396606697605e-06, + "loss": 0.6835, + "step": 16283 + }, + { + "epoch": 0.56, + "learning_rate": 8.0013297000665e-06, + "loss": 0.6607, + "step": 16284 + }, + { + "epoch": 0.56, + "learning_rate": 8.00026281713216e-06, + "loss": 0.6264, + "step": 16285 + }, + { + "epoch": 0.56, + "learning_rate": 7.999195957907235e-06, + "loss": 0.6489, + "step": 16286 + }, + { + "epoch": 0.56, + "learning_rate": 7.998129122404372e-06, + "loss": 0.6315, + "step": 16287 + }, + { + "epoch": 0.56, + "learning_rate": 7.99706231063622e-06, + "loss": 0.6301, + "step": 16288 + }, + { + "epoch": 0.56, + "learning_rate": 7.995995522615431e-06, + "loss": 0.6187, + "step": 16289 + }, + { + "epoch": 0.56, + "learning_rate": 7.994928758354647e-06, + "loss": 0.5762, + "step": 16290 + }, + { + "epoch": 0.56, + "learning_rate": 7.993862017866521e-06, + "loss": 0.6689, + "step": 16291 + }, + { + "epoch": 0.56, + "learning_rate": 7.992795301163698e-06, + "loss": 0.6029, + "step": 16292 + }, + { + "epoch": 0.56, + "learning_rate": 7.991728608258825e-06, + "loss": 0.6551, + "step": 16293 + }, + { + "epoch": 0.56, + "learning_rate": 7.99066193916455e-06, + "loss": 0.6366, + "step": 16294 + }, + { + "epoch": 0.56, + "learning_rate": 7.989595293893521e-06, + "loss": 0.5968, + "step": 16295 + }, + { + "epoch": 0.56, + "learning_rate": 7.988528672458383e-06, + "loss": 0.6386, + "step": 16296 + }, + { + "epoch": 0.56, + "learning_rate": 7.987462074871779e-06, + "loss": 0.6902, + "step": 16297 + }, + { + "epoch": 0.56, + "learning_rate": 7.98639550114636e-06, + "loss": 0.6391, + "step": 16298 + }, + { + "epoch": 0.56, + "learning_rate": 7.985328951294771e-06, + "loss": 0.6091, + "step": 16299 + }, + { + "epoch": 0.56, + "learning_rate": 7.984262425329653e-06, + "loss": 0.6059, + "step": 16300 + }, + { + "epoch": 0.56, + "learning_rate": 7.983195923263657e-06, + "loss": 0.5954, + "step": 16301 + }, + { + "epoch": 0.56, + "learning_rate": 7.98212944510942e-06, + "loss": 0.6154, + "step": 16302 + }, + { + "epoch": 0.56, + "learning_rate": 7.981062990879596e-06, + "loss": 0.6301, + "step": 16303 + }, + { + "epoch": 0.56, + "learning_rate": 7.979996560586822e-06, + "loss": 0.5853, + "step": 16304 + }, + { + "epoch": 0.56, + "learning_rate": 7.978930154243744e-06, + "loss": 0.6106, + "step": 16305 + }, + { + "epoch": 0.56, + "learning_rate": 7.977863771863006e-06, + "loss": 0.6112, + "step": 16306 + }, + { + "epoch": 0.56, + "learning_rate": 7.97679741345725e-06, + "loss": 0.5976, + "step": 16307 + }, + { + "epoch": 0.57, + "learning_rate": 7.975731079039121e-06, + "loss": 0.629, + "step": 16308 + }, + { + "epoch": 0.57, + "learning_rate": 7.97466476862126e-06, + "loss": 0.5699, + "step": 16309 + }, + { + "epoch": 0.57, + "learning_rate": 7.973598482216313e-06, + "loss": 0.6753, + "step": 16310 + }, + { + "epoch": 0.57, + "learning_rate": 7.972532219836916e-06, + "loss": 0.6337, + "step": 16311 + }, + { + "epoch": 0.57, + "learning_rate": 7.971465981495717e-06, + "loss": 0.6245, + "step": 16312 + }, + { + "epoch": 0.57, + "learning_rate": 7.970399767205353e-06, + "loss": 0.6299, + "step": 16313 + }, + { + "epoch": 0.57, + "learning_rate": 7.969333576978468e-06, + "loss": 0.6682, + "step": 16314 + }, + { + "epoch": 0.57, + "learning_rate": 7.968267410827701e-06, + "loss": 0.6589, + "step": 16315 + }, + { + "epoch": 0.57, + "learning_rate": 7.967201268765697e-06, + "loss": 0.6341, + "step": 16316 + }, + { + "epoch": 0.57, + "learning_rate": 7.96613515080509e-06, + "loss": 0.6446, + "step": 16317 + }, + { + "epoch": 0.57, + "learning_rate": 7.965069056958525e-06, + "loss": 0.6667, + "step": 16318 + }, + { + "epoch": 0.57, + "learning_rate": 7.96400298723864e-06, + "loss": 0.674, + "step": 16319 + }, + { + "epoch": 0.57, + "learning_rate": 7.962936941658077e-06, + "loss": 0.6585, + "step": 16320 + }, + { + "epoch": 0.57, + "learning_rate": 7.961870920229471e-06, + "loss": 0.6354, + "step": 16321 + }, + { + "epoch": 0.57, + "learning_rate": 7.960804922965466e-06, + "loss": 0.632, + "step": 16322 + }, + { + "epoch": 0.57, + "learning_rate": 7.959738949878697e-06, + "loss": 0.6481, + "step": 16323 + }, + { + "epoch": 0.57, + "learning_rate": 7.958673000981803e-06, + "loss": 0.6172, + "step": 16324 + }, + { + "epoch": 0.57, + "learning_rate": 7.957607076287425e-06, + "loss": 0.5516, + "step": 16325 + }, + { + "epoch": 0.57, + "learning_rate": 7.956541175808196e-06, + "loss": 0.6273, + "step": 16326 + }, + { + "epoch": 0.57, + "learning_rate": 7.955475299556756e-06, + "loss": 0.6327, + "step": 16327 + }, + { + "epoch": 0.57, + "learning_rate": 7.954409447545747e-06, + "loss": 0.651, + "step": 16328 + }, + { + "epoch": 0.57, + "learning_rate": 7.953343619787797e-06, + "loss": 0.6474, + "step": 16329 + }, + { + "epoch": 0.57, + "learning_rate": 7.95227781629555e-06, + "loss": 0.6552, + "step": 16330 + }, + { + "epoch": 0.57, + "learning_rate": 7.951212037081641e-06, + "loss": 0.5994, + "step": 16331 + }, + { + "epoch": 0.57, + "learning_rate": 7.950146282158702e-06, + "loss": 0.6353, + "step": 16332 + }, + { + "epoch": 0.57, + "learning_rate": 7.949080551539375e-06, + "loss": 0.6027, + "step": 16333 + }, + { + "epoch": 0.57, + "learning_rate": 7.94801484523629e-06, + "loss": 0.6061, + "step": 16334 + }, + { + "epoch": 0.57, + "learning_rate": 7.946949163262085e-06, + "loss": 0.5612, + "step": 16335 + }, + { + "epoch": 0.57, + "learning_rate": 7.945883505629396e-06, + "loss": 0.5853, + "step": 16336 + }, + { + "epoch": 0.57, + "learning_rate": 7.944817872350856e-06, + "loss": 0.6532, + "step": 16337 + }, + { + "epoch": 0.57, + "learning_rate": 7.943752263439097e-06, + "loss": 0.5998, + "step": 16338 + }, + { + "epoch": 0.57, + "learning_rate": 7.942686678906761e-06, + "loss": 0.6492, + "step": 16339 + }, + { + "epoch": 0.57, + "learning_rate": 7.941621118766473e-06, + "loss": 0.6043, + "step": 16340 + }, + { + "epoch": 0.57, + "learning_rate": 7.940555583030872e-06, + "loss": 0.6436, + "step": 16341 + }, + { + "epoch": 0.57, + "learning_rate": 7.939490071712593e-06, + "loss": 0.6496, + "step": 16342 + }, + { + "epoch": 0.57, + "learning_rate": 7.938424584824262e-06, + "loss": 0.6707, + "step": 16343 + }, + { + "epoch": 0.57, + "learning_rate": 7.937359122378515e-06, + "loss": 0.6348, + "step": 16344 + }, + { + "epoch": 0.57, + "learning_rate": 7.936293684387986e-06, + "loss": 0.6165, + "step": 16345 + }, + { + "epoch": 0.57, + "learning_rate": 7.935228270865307e-06, + "loss": 0.6152, + "step": 16346 + }, + { + "epoch": 0.57, + "learning_rate": 7.934162881823107e-06, + "loss": 0.6021, + "step": 16347 + }, + { + "epoch": 0.57, + "learning_rate": 7.93309751727402e-06, + "loss": 0.6434, + "step": 16348 + }, + { + "epoch": 0.57, + "learning_rate": 7.932032177230677e-06, + "loss": 0.6506, + "step": 16349 + }, + { + "epoch": 0.57, + "learning_rate": 7.930966861705707e-06, + "loss": 0.6628, + "step": 16350 + }, + { + "epoch": 0.57, + "learning_rate": 7.929901570711746e-06, + "loss": 0.5559, + "step": 16351 + }, + { + "epoch": 0.57, + "learning_rate": 7.928836304261417e-06, + "loss": 0.6131, + "step": 16352 + }, + { + "epoch": 0.57, + "learning_rate": 7.927771062367354e-06, + "loss": 0.6201, + "step": 16353 + }, + { + "epoch": 0.57, + "learning_rate": 7.926705845042188e-06, + "loss": 0.5791, + "step": 16354 + }, + { + "epoch": 0.57, + "learning_rate": 7.925640652298547e-06, + "loss": 0.6426, + "step": 16355 + }, + { + "epoch": 0.57, + "learning_rate": 7.924575484149057e-06, + "loss": 0.5816, + "step": 16356 + }, + { + "epoch": 0.57, + "learning_rate": 7.923510340606355e-06, + "loss": 0.6238, + "step": 16357 + }, + { + "epoch": 0.57, + "learning_rate": 7.922445221683061e-06, + "loss": 0.6514, + "step": 16358 + }, + { + "epoch": 0.57, + "learning_rate": 7.921380127391807e-06, + "loss": 0.6679, + "step": 16359 + }, + { + "epoch": 0.57, + "learning_rate": 7.920315057745223e-06, + "loss": 0.6301, + "step": 16360 + }, + { + "epoch": 0.57, + "learning_rate": 7.919250012755934e-06, + "loss": 0.633, + "step": 16361 + }, + { + "epoch": 0.57, + "learning_rate": 7.918184992436565e-06, + "loss": 0.6756, + "step": 16362 + }, + { + "epoch": 0.57, + "learning_rate": 7.917119996799753e-06, + "loss": 0.5748, + "step": 16363 + }, + { + "epoch": 0.57, + "learning_rate": 7.916055025858114e-06, + "loss": 0.6991, + "step": 16364 + }, + { + "epoch": 0.57, + "learning_rate": 7.914990079624279e-06, + "loss": 0.582, + "step": 16365 + }, + { + "epoch": 0.57, + "learning_rate": 7.913925158110875e-06, + "loss": 0.6681, + "step": 16366 + }, + { + "epoch": 0.57, + "learning_rate": 7.912860261330527e-06, + "loss": 0.6346, + "step": 16367 + }, + { + "epoch": 0.57, + "learning_rate": 7.91179538929586e-06, + "loss": 0.6188, + "step": 16368 + }, + { + "epoch": 0.57, + "learning_rate": 7.910730542019502e-06, + "loss": 0.6915, + "step": 16369 + }, + { + "epoch": 0.57, + "learning_rate": 7.909665719514076e-06, + "loss": 0.6366, + "step": 16370 + }, + { + "epoch": 0.57, + "learning_rate": 7.908600921792205e-06, + "loss": 0.6166, + "step": 16371 + }, + { + "epoch": 0.57, + "learning_rate": 7.907536148866518e-06, + "loss": 0.6423, + "step": 16372 + }, + { + "epoch": 0.57, + "learning_rate": 7.906471400749636e-06, + "loss": 0.5878, + "step": 16373 + }, + { + "epoch": 0.57, + "learning_rate": 7.905406677454183e-06, + "loss": 0.6019, + "step": 16374 + }, + { + "epoch": 0.57, + "learning_rate": 7.904341978992788e-06, + "loss": 0.5727, + "step": 16375 + }, + { + "epoch": 0.57, + "learning_rate": 7.903277305378066e-06, + "loss": 0.6576, + "step": 16376 + }, + { + "epoch": 0.57, + "learning_rate": 7.902212656622643e-06, + "loss": 0.6231, + "step": 16377 + }, + { + "epoch": 0.57, + "learning_rate": 7.901148032739146e-06, + "loss": 0.6393, + "step": 16378 + }, + { + "epoch": 0.57, + "learning_rate": 7.900083433740191e-06, + "loss": 0.5992, + "step": 16379 + }, + { + "epoch": 0.57, + "learning_rate": 7.899018859638405e-06, + "loss": 0.565, + "step": 16380 + }, + { + "epoch": 0.57, + "learning_rate": 7.897954310446408e-06, + "loss": 0.6272, + "step": 16381 + }, + { + "epoch": 0.57, + "learning_rate": 7.89688978617682e-06, + "loss": 0.6056, + "step": 16382 + }, + { + "epoch": 0.57, + "learning_rate": 7.895825286842266e-06, + "loss": 0.6331, + "step": 16383 + }, + { + "epoch": 0.57, + "learning_rate": 7.894760812455365e-06, + "loss": 0.6375, + "step": 16384 + }, + { + "epoch": 0.57, + "learning_rate": 7.893696363028737e-06, + "loss": 0.652, + "step": 16385 + }, + { + "epoch": 0.57, + "learning_rate": 7.892631938575002e-06, + "loss": 0.6436, + "step": 16386 + }, + { + "epoch": 0.57, + "learning_rate": 7.891567539106786e-06, + "loss": 0.6408, + "step": 16387 + }, + { + "epoch": 0.57, + "learning_rate": 7.890503164636698e-06, + "loss": 0.6222, + "step": 16388 + }, + { + "epoch": 0.57, + "learning_rate": 7.889438815177366e-06, + "loss": 0.5626, + "step": 16389 + }, + { + "epoch": 0.57, + "learning_rate": 7.88837449074141e-06, + "loss": 0.6628, + "step": 16390 + }, + { + "epoch": 0.57, + "learning_rate": 7.88731019134144e-06, + "loss": 0.5883, + "step": 16391 + }, + { + "epoch": 0.57, + "learning_rate": 7.886245916990082e-06, + "loss": 0.6062, + "step": 16392 + }, + { + "epoch": 0.57, + "learning_rate": 7.885181667699957e-06, + "loss": 0.6703, + "step": 16393 + }, + { + "epoch": 0.57, + "learning_rate": 7.884117443483672e-06, + "loss": 0.6293, + "step": 16394 + }, + { + "epoch": 0.57, + "learning_rate": 7.883053244353858e-06, + "loss": 0.6479, + "step": 16395 + }, + { + "epoch": 0.57, + "learning_rate": 7.88198907032312e-06, + "loss": 0.6524, + "step": 16396 + }, + { + "epoch": 0.57, + "learning_rate": 7.88092492140408e-06, + "loss": 0.6394, + "step": 16397 + }, + { + "epoch": 0.57, + "learning_rate": 7.879860797609362e-06, + "loss": 0.6513, + "step": 16398 + }, + { + "epoch": 0.57, + "learning_rate": 7.878796698951572e-06, + "loss": 0.6204, + "step": 16399 + }, + { + "epoch": 0.57, + "learning_rate": 7.877732625443328e-06, + "loss": 0.656, + "step": 16400 + }, + { + "epoch": 0.57, + "learning_rate": 7.876668577097255e-06, + "loss": 0.6588, + "step": 16401 + }, + { + "epoch": 0.57, + "learning_rate": 7.875604553925958e-06, + "loss": 0.635, + "step": 16402 + }, + { + "epoch": 0.57, + "learning_rate": 7.874540555942055e-06, + "loss": 0.6512, + "step": 16403 + }, + { + "epoch": 0.57, + "learning_rate": 7.873476583158169e-06, + "loss": 0.6402, + "step": 16404 + }, + { + "epoch": 0.57, + "learning_rate": 7.872412635586902e-06, + "loss": 0.6628, + "step": 16405 + }, + { + "epoch": 0.57, + "learning_rate": 7.871348713240873e-06, + "loss": 0.5821, + "step": 16406 + }, + { + "epoch": 0.57, + "learning_rate": 7.870284816132705e-06, + "loss": 0.637, + "step": 16407 + }, + { + "epoch": 0.57, + "learning_rate": 7.869220944275e-06, + "loss": 0.6194, + "step": 16408 + }, + { + "epoch": 0.57, + "learning_rate": 7.868157097680374e-06, + "loss": 0.6324, + "step": 16409 + }, + { + "epoch": 0.57, + "learning_rate": 7.867093276361449e-06, + "loss": 0.6594, + "step": 16410 + }, + { + "epoch": 0.57, + "learning_rate": 7.866029480330826e-06, + "loss": 0.5651, + "step": 16411 + }, + { + "epoch": 0.57, + "learning_rate": 7.86496570960112e-06, + "loss": 0.6136, + "step": 16412 + }, + { + "epoch": 0.57, + "learning_rate": 7.863901964184955e-06, + "loss": 0.6592, + "step": 16413 + }, + { + "epoch": 0.57, + "learning_rate": 7.86283824409493e-06, + "loss": 0.6086, + "step": 16414 + }, + { + "epoch": 0.57, + "learning_rate": 7.861774549343659e-06, + "loss": 0.6537, + "step": 16415 + }, + { + "epoch": 0.57, + "learning_rate": 7.860710879943762e-06, + "loss": 0.6308, + "step": 16416 + }, + { + "epoch": 0.57, + "learning_rate": 7.859647235907838e-06, + "loss": 0.6277, + "step": 16417 + }, + { + "epoch": 0.57, + "learning_rate": 7.858583617248502e-06, + "loss": 0.6375, + "step": 16418 + }, + { + "epoch": 0.57, + "learning_rate": 7.857520023978373e-06, + "loss": 0.5829, + "step": 16419 + }, + { + "epoch": 0.57, + "learning_rate": 7.85645645611005e-06, + "loss": 0.6266, + "step": 16420 + }, + { + "epoch": 0.57, + "learning_rate": 7.855392913656145e-06, + "loss": 0.6366, + "step": 16421 + }, + { + "epoch": 0.57, + "learning_rate": 7.854329396629278e-06, + "loss": 0.6062, + "step": 16422 + }, + { + "epoch": 0.57, + "learning_rate": 7.853265905042045e-06, + "loss": 0.6579, + "step": 16423 + }, + { + "epoch": 0.57, + "learning_rate": 7.852202438907057e-06, + "loss": 0.6823, + "step": 16424 + }, + { + "epoch": 0.57, + "learning_rate": 7.851138998236933e-06, + "loss": 0.5903, + "step": 16425 + }, + { + "epoch": 0.57, + "learning_rate": 7.85007558304427e-06, + "loss": 0.6119, + "step": 16426 + }, + { + "epoch": 0.57, + "learning_rate": 7.849012193341679e-06, + "loss": 0.6475, + "step": 16427 + }, + { + "epoch": 0.57, + "learning_rate": 7.847948829141776e-06, + "loss": 0.6235, + "step": 16428 + }, + { + "epoch": 0.57, + "learning_rate": 7.846885490457157e-06, + "loss": 0.6354, + "step": 16429 + }, + { + "epoch": 0.57, + "learning_rate": 7.845822177300432e-06, + "loss": 0.6739, + "step": 16430 + }, + { + "epoch": 0.57, + "learning_rate": 7.844758889684219e-06, + "loss": 0.6748, + "step": 16431 + }, + { + "epoch": 0.57, + "learning_rate": 7.84369562762111e-06, + "loss": 0.6285, + "step": 16432 + }, + { + "epoch": 0.57, + "learning_rate": 7.842632391123714e-06, + "loss": 0.6066, + "step": 16433 + }, + { + "epoch": 0.57, + "learning_rate": 7.841569180204647e-06, + "loss": 0.6681, + "step": 16434 + }, + { + "epoch": 0.57, + "learning_rate": 7.840505994876505e-06, + "loss": 0.6628, + "step": 16435 + }, + { + "epoch": 0.57, + "learning_rate": 7.839442835151892e-06, + "loss": 0.5883, + "step": 16436 + }, + { + "epoch": 0.57, + "learning_rate": 7.838379701043424e-06, + "loss": 0.6511, + "step": 16437 + }, + { + "epoch": 0.57, + "learning_rate": 7.837316592563695e-06, + "loss": 0.6263, + "step": 16438 + }, + { + "epoch": 0.57, + "learning_rate": 7.836253509725311e-06, + "loss": 0.6298, + "step": 16439 + }, + { + "epoch": 0.57, + "learning_rate": 7.835190452540886e-06, + "loss": 0.6431, + "step": 16440 + }, + { + "epoch": 0.57, + "learning_rate": 7.834127421023013e-06, + "loss": 0.6519, + "step": 16441 + }, + { + "epoch": 0.57, + "learning_rate": 7.833064415184296e-06, + "loss": 0.623, + "step": 16442 + }, + { + "epoch": 0.57, + "learning_rate": 7.832001435037348e-06, + "loss": 0.6796, + "step": 16443 + }, + { + "epoch": 0.57, + "learning_rate": 7.830938480594763e-06, + "loss": 0.6511, + "step": 16444 + }, + { + "epoch": 0.57, + "learning_rate": 7.829875551869142e-06, + "loss": 0.6263, + "step": 16445 + }, + { + "epoch": 0.57, + "learning_rate": 7.8288126488731e-06, + "loss": 0.5954, + "step": 16446 + }, + { + "epoch": 0.57, + "learning_rate": 7.827749771619224e-06, + "loss": 0.6322, + "step": 16447 + }, + { + "epoch": 0.57, + "learning_rate": 7.826686920120121e-06, + "loss": 0.6214, + "step": 16448 + }, + { + "epoch": 0.57, + "learning_rate": 7.8256240943884e-06, + "loss": 0.5828, + "step": 16449 + }, + { + "epoch": 0.57, + "learning_rate": 7.824561294436651e-06, + "loss": 0.5921, + "step": 16450 + }, + { + "epoch": 0.57, + "learning_rate": 7.82349852027748e-06, + "loss": 0.6005, + "step": 16451 + }, + { + "epoch": 0.57, + "learning_rate": 7.822435771923494e-06, + "loss": 0.6073, + "step": 16452 + }, + { + "epoch": 0.57, + "learning_rate": 7.82137304938728e-06, + "loss": 0.6672, + "step": 16453 + }, + { + "epoch": 0.57, + "learning_rate": 7.820310352681444e-06, + "loss": 0.6306, + "step": 16454 + }, + { + "epoch": 0.57, + "learning_rate": 7.819247681818591e-06, + "loss": 0.6915, + "step": 16455 + }, + { + "epoch": 0.57, + "learning_rate": 7.818185036811311e-06, + "loss": 0.5854, + "step": 16456 + }, + { + "epoch": 0.57, + "learning_rate": 7.81712241767221e-06, + "loss": 0.6861, + "step": 16457 + }, + { + "epoch": 0.57, + "learning_rate": 7.816059824413884e-06, + "loss": 0.6716, + "step": 16458 + }, + { + "epoch": 0.57, + "learning_rate": 7.81499725704893e-06, + "loss": 0.6627, + "step": 16459 + }, + { + "epoch": 0.57, + "learning_rate": 7.813934715589949e-06, + "loss": 0.604, + "step": 16460 + }, + { + "epoch": 0.57, + "learning_rate": 7.812872200049535e-06, + "loss": 0.6451, + "step": 16461 + }, + { + "epoch": 0.57, + "learning_rate": 7.811809710440289e-06, + "loss": 0.6223, + "step": 16462 + }, + { + "epoch": 0.57, + "learning_rate": 7.810747246774807e-06, + "loss": 0.6672, + "step": 16463 + }, + { + "epoch": 0.57, + "learning_rate": 7.809684809065687e-06, + "loss": 0.6069, + "step": 16464 + }, + { + "epoch": 0.57, + "learning_rate": 7.808622397325522e-06, + "loss": 0.6714, + "step": 16465 + }, + { + "epoch": 0.57, + "learning_rate": 7.807560011566914e-06, + "loss": 0.6941, + "step": 16466 + }, + { + "epoch": 0.57, + "learning_rate": 7.806497651802453e-06, + "loss": 0.6293, + "step": 16467 + }, + { + "epoch": 0.57, + "learning_rate": 7.805435318044736e-06, + "loss": 0.6363, + "step": 16468 + }, + { + "epoch": 0.57, + "learning_rate": 7.804373010306364e-06, + "loss": 0.6332, + "step": 16469 + }, + { + "epoch": 0.57, + "learning_rate": 7.803310728599922e-06, + "loss": 0.6021, + "step": 16470 + }, + { + "epoch": 0.57, + "learning_rate": 7.802248472938013e-06, + "loss": 0.5834, + "step": 16471 + }, + { + "epoch": 0.57, + "learning_rate": 7.801186243333229e-06, + "loss": 0.5908, + "step": 16472 + }, + { + "epoch": 0.57, + "learning_rate": 7.800124039798162e-06, + "loss": 0.6319, + "step": 16473 + }, + { + "epoch": 0.57, + "learning_rate": 7.799061862345407e-06, + "loss": 0.6253, + "step": 16474 + }, + { + "epoch": 0.57, + "learning_rate": 7.79799971098756e-06, + "loss": 0.6312, + "step": 16475 + }, + { + "epoch": 0.57, + "learning_rate": 7.796937585737211e-06, + "loss": 0.6182, + "step": 16476 + }, + { + "epoch": 0.57, + "learning_rate": 7.795875486606951e-06, + "loss": 0.5957, + "step": 16477 + }, + { + "epoch": 0.57, + "learning_rate": 7.79481341360938e-06, + "loss": 0.6314, + "step": 16478 + }, + { + "epoch": 0.57, + "learning_rate": 7.793751366757085e-06, + "loss": 0.6549, + "step": 16479 + }, + { + "epoch": 0.57, + "learning_rate": 7.792689346062655e-06, + "loss": 0.5995, + "step": 16480 + }, + { + "epoch": 0.57, + "learning_rate": 7.791627351538689e-06, + "loss": 0.6981, + "step": 16481 + }, + { + "epoch": 0.57, + "learning_rate": 7.790565383197772e-06, + "loss": 0.6036, + "step": 16482 + }, + { + "epoch": 0.57, + "learning_rate": 7.789503441052496e-06, + "loss": 0.5908, + "step": 16483 + }, + { + "epoch": 0.57, + "learning_rate": 7.788441525115457e-06, + "loss": 0.6364, + "step": 16484 + }, + { + "epoch": 0.57, + "learning_rate": 7.787379635399238e-06, + "loss": 0.6655, + "step": 16485 + }, + { + "epoch": 0.57, + "learning_rate": 7.786317771916433e-06, + "loss": 0.6255, + "step": 16486 + }, + { + "epoch": 0.57, + "learning_rate": 7.785255934679632e-06, + "loss": 0.6307, + "step": 16487 + }, + { + "epoch": 0.57, + "learning_rate": 7.784194123701425e-06, + "loss": 0.6398, + "step": 16488 + }, + { + "epoch": 0.57, + "learning_rate": 7.783132338994396e-06, + "loss": 0.6425, + "step": 16489 + }, + { + "epoch": 0.57, + "learning_rate": 7.78207058057114e-06, + "loss": 0.6354, + "step": 16490 + }, + { + "epoch": 0.57, + "learning_rate": 7.781008848444242e-06, + "loss": 0.6596, + "step": 16491 + }, + { + "epoch": 0.57, + "learning_rate": 7.779947142626291e-06, + "loss": 0.6286, + "step": 16492 + }, + { + "epoch": 0.57, + "learning_rate": 7.778885463129877e-06, + "loss": 0.666, + "step": 16493 + }, + { + "epoch": 0.57, + "learning_rate": 7.777823809967583e-06, + "loss": 0.6295, + "step": 16494 + }, + { + "epoch": 0.57, + "learning_rate": 7.776762183151999e-06, + "loss": 0.647, + "step": 16495 + }, + { + "epoch": 0.57, + "learning_rate": 7.775700582695714e-06, + "loss": 0.6821, + "step": 16496 + }, + { + "epoch": 0.57, + "learning_rate": 7.774639008611311e-06, + "loss": 0.6772, + "step": 16497 + }, + { + "epoch": 0.57, + "learning_rate": 7.773577460911377e-06, + "loss": 0.6211, + "step": 16498 + }, + { + "epoch": 0.57, + "learning_rate": 7.7725159396085e-06, + "loss": 0.5781, + "step": 16499 + }, + { + "epoch": 0.57, + "learning_rate": 7.771454444715263e-06, + "loss": 0.5484, + "step": 16500 + }, + { + "epoch": 0.57, + "learning_rate": 7.770392976244251e-06, + "loss": 0.622, + "step": 16501 + }, + { + "epoch": 0.57, + "learning_rate": 7.769331534208056e-06, + "loss": 0.6469, + "step": 16502 + }, + { + "epoch": 0.57, + "learning_rate": 7.768270118619254e-06, + "loss": 0.6126, + "step": 16503 + }, + { + "epoch": 0.57, + "learning_rate": 7.767208729490432e-06, + "loss": 0.6687, + "step": 16504 + }, + { + "epoch": 0.57, + "learning_rate": 7.766147366834178e-06, + "loss": 0.6574, + "step": 16505 + }, + { + "epoch": 0.57, + "learning_rate": 7.76508603066307e-06, + "loss": 0.599, + "step": 16506 + }, + { + "epoch": 0.57, + "learning_rate": 7.764024720989694e-06, + "loss": 0.6047, + "step": 16507 + }, + { + "epoch": 0.57, + "learning_rate": 7.762963437826637e-06, + "loss": 0.6348, + "step": 16508 + }, + { + "epoch": 0.57, + "learning_rate": 7.761902181186476e-06, + "loss": 0.6387, + "step": 16509 + }, + { + "epoch": 0.57, + "learning_rate": 7.760840951081795e-06, + "loss": 0.585, + "step": 16510 + }, + { + "epoch": 0.57, + "learning_rate": 7.759779747525181e-06, + "loss": 0.6243, + "step": 16511 + }, + { + "epoch": 0.57, + "learning_rate": 7.758718570529206e-06, + "loss": 0.6388, + "step": 16512 + }, + { + "epoch": 0.57, + "learning_rate": 7.75765742010646e-06, + "loss": 0.6334, + "step": 16513 + }, + { + "epoch": 0.57, + "learning_rate": 7.756596296269525e-06, + "loss": 0.6227, + "step": 16514 + }, + { + "epoch": 0.57, + "learning_rate": 7.755535199030975e-06, + "loss": 0.6495, + "step": 16515 + }, + { + "epoch": 0.57, + "learning_rate": 7.754474128403395e-06, + "loss": 0.5827, + "step": 16516 + }, + { + "epoch": 0.57, + "learning_rate": 7.753413084399369e-06, + "loss": 0.6437, + "step": 16517 + }, + { + "epoch": 0.57, + "learning_rate": 7.752352067031468e-06, + "loss": 0.6462, + "step": 16518 + }, + { + "epoch": 0.57, + "learning_rate": 7.751291076312277e-06, + "loss": 0.6437, + "step": 16519 + }, + { + "epoch": 0.57, + "learning_rate": 7.750230112254377e-06, + "loss": 0.6501, + "step": 16520 + }, + { + "epoch": 0.57, + "learning_rate": 7.749169174870344e-06, + "loss": 0.5534, + "step": 16521 + }, + { + "epoch": 0.57, + "learning_rate": 7.748108264172759e-06, + "loss": 0.6195, + "step": 16522 + }, + { + "epoch": 0.57, + "learning_rate": 7.747047380174197e-06, + "loss": 0.6699, + "step": 16523 + }, + { + "epoch": 0.57, + "learning_rate": 7.745986522887238e-06, + "loss": 0.5926, + "step": 16524 + }, + { + "epoch": 0.57, + "learning_rate": 7.744925692324463e-06, + "loss": 0.6356, + "step": 16525 + }, + { + "epoch": 0.57, + "learning_rate": 7.743864888498444e-06, + "loss": 0.6318, + "step": 16526 + }, + { + "epoch": 0.57, + "learning_rate": 7.74280411142176e-06, + "loss": 0.6042, + "step": 16527 + }, + { + "epoch": 0.57, + "learning_rate": 7.741743361106993e-06, + "loss": 0.6716, + "step": 16528 + }, + { + "epoch": 0.57, + "learning_rate": 7.740682637566711e-06, + "loss": 0.6609, + "step": 16529 + }, + { + "epoch": 0.57, + "learning_rate": 7.739621940813495e-06, + "loss": 0.6368, + "step": 16530 + }, + { + "epoch": 0.57, + "learning_rate": 7.738561270859924e-06, + "loss": 0.6382, + "step": 16531 + }, + { + "epoch": 0.57, + "learning_rate": 7.737500627718567e-06, + "loss": 0.6251, + "step": 16532 + }, + { + "epoch": 0.57, + "learning_rate": 7.736440011402e-06, + "loss": 0.5992, + "step": 16533 + }, + { + "epoch": 0.57, + "learning_rate": 7.735379421922805e-06, + "loss": 0.6075, + "step": 16534 + }, + { + "epoch": 0.57, + "learning_rate": 7.734318859293547e-06, + "loss": 0.6419, + "step": 16535 + }, + { + "epoch": 0.57, + "learning_rate": 7.733258323526807e-06, + "loss": 0.6475, + "step": 16536 + }, + { + "epoch": 0.57, + "learning_rate": 7.732197814635157e-06, + "loss": 0.6029, + "step": 16537 + }, + { + "epoch": 0.57, + "learning_rate": 7.73113733263117e-06, + "loss": 0.6021, + "step": 16538 + }, + { + "epoch": 0.57, + "learning_rate": 7.730076877527421e-06, + "loss": 0.6657, + "step": 16539 + }, + { + "epoch": 0.57, + "learning_rate": 7.729016449336483e-06, + "loss": 0.6528, + "step": 16540 + }, + { + "epoch": 0.57, + "learning_rate": 7.727956048070926e-06, + "loss": 0.6374, + "step": 16541 + }, + { + "epoch": 0.57, + "learning_rate": 7.726895673743323e-06, + "loss": 0.6582, + "step": 16542 + }, + { + "epoch": 0.57, + "learning_rate": 7.72583532636625e-06, + "loss": 0.6518, + "step": 16543 + }, + { + "epoch": 0.57, + "learning_rate": 7.724775005952276e-06, + "loss": 0.6781, + "step": 16544 + }, + { + "epoch": 0.57, + "learning_rate": 7.72371471251397e-06, + "loss": 0.6796, + "step": 16545 + }, + { + "epoch": 0.57, + "learning_rate": 7.722654446063909e-06, + "loss": 0.6439, + "step": 16546 + }, + { + "epoch": 0.57, + "learning_rate": 7.721594206614657e-06, + "loss": 0.6034, + "step": 16547 + }, + { + "epoch": 0.57, + "learning_rate": 7.72053399417879e-06, + "loss": 0.5832, + "step": 16548 + }, + { + "epoch": 0.57, + "learning_rate": 7.719473808768877e-06, + "loss": 0.6628, + "step": 16549 + }, + { + "epoch": 0.57, + "learning_rate": 7.718413650397484e-06, + "loss": 0.6433, + "step": 16550 + }, + { + "epoch": 0.57, + "learning_rate": 7.717353519077184e-06, + "loss": 0.6375, + "step": 16551 + }, + { + "epoch": 0.57, + "learning_rate": 7.716293414820549e-06, + "loss": 0.6087, + "step": 16552 + }, + { + "epoch": 0.57, + "learning_rate": 7.71523333764014e-06, + "loss": 0.6436, + "step": 16553 + }, + { + "epoch": 0.57, + "learning_rate": 7.714173287548532e-06, + "loss": 0.6159, + "step": 16554 + }, + { + "epoch": 0.57, + "learning_rate": 7.713113264558291e-06, + "loss": 0.6117, + "step": 16555 + }, + { + "epoch": 0.57, + "learning_rate": 7.712053268681985e-06, + "loss": 0.6721, + "step": 16556 + }, + { + "epoch": 0.57, + "learning_rate": 7.710993299932182e-06, + "loss": 0.6502, + "step": 16557 + }, + { + "epoch": 0.57, + "learning_rate": 7.709933358321451e-06, + "loss": 0.6014, + "step": 16558 + }, + { + "epoch": 0.57, + "learning_rate": 7.708873443862354e-06, + "loss": 0.5773, + "step": 16559 + }, + { + "epoch": 0.57, + "learning_rate": 7.70781355656746e-06, + "loss": 0.6242, + "step": 16560 + }, + { + "epoch": 0.57, + "learning_rate": 7.70675369644934e-06, + "loss": 0.6918, + "step": 16561 + }, + { + "epoch": 0.57, + "learning_rate": 7.705693863520553e-06, + "loss": 0.6409, + "step": 16562 + }, + { + "epoch": 0.57, + "learning_rate": 7.704634057793667e-06, + "loss": 0.6553, + "step": 16563 + }, + { + "epoch": 0.57, + "learning_rate": 7.703574279281251e-06, + "loss": 0.6784, + "step": 16564 + }, + { + "epoch": 0.57, + "learning_rate": 7.702514527995863e-06, + "loss": 0.623, + "step": 16565 + }, + { + "epoch": 0.57, + "learning_rate": 7.701454803950073e-06, + "loss": 0.7079, + "step": 16566 + }, + { + "epoch": 0.57, + "learning_rate": 7.700395107156447e-06, + "loss": 0.6257, + "step": 16567 + }, + { + "epoch": 0.57, + "learning_rate": 7.699335437627543e-06, + "loss": 0.6623, + "step": 16568 + }, + { + "epoch": 0.57, + "learning_rate": 7.698275795375927e-06, + "loss": 0.6324, + "step": 16569 + }, + { + "epoch": 0.57, + "learning_rate": 7.697216180414166e-06, + "loss": 0.6176, + "step": 16570 + }, + { + "epoch": 0.57, + "learning_rate": 7.696156592754818e-06, + "loss": 0.6059, + "step": 16571 + }, + { + "epoch": 0.57, + "learning_rate": 7.695097032410447e-06, + "loss": 0.5999, + "step": 16572 + }, + { + "epoch": 0.57, + "learning_rate": 7.69403749939362e-06, + "loss": 0.6007, + "step": 16573 + }, + { + "epoch": 0.57, + "learning_rate": 7.692977993716893e-06, + "loss": 0.6183, + "step": 16574 + }, + { + "epoch": 0.57, + "learning_rate": 7.691918515392829e-06, + "loss": 0.6434, + "step": 16575 + }, + { + "epoch": 0.57, + "learning_rate": 7.690859064433994e-06, + "loss": 0.6969, + "step": 16576 + }, + { + "epoch": 0.57, + "learning_rate": 7.689799640852944e-06, + "loss": 0.6713, + "step": 16577 + }, + { + "epoch": 0.57, + "learning_rate": 7.688740244662242e-06, + "loss": 0.6068, + "step": 16578 + }, + { + "epoch": 0.57, + "learning_rate": 7.68768087587445e-06, + "loss": 0.6422, + "step": 16579 + }, + { + "epoch": 0.57, + "learning_rate": 7.686621534502123e-06, + "loss": 0.58, + "step": 16580 + }, + { + "epoch": 0.57, + "learning_rate": 7.685562220557826e-06, + "loss": 0.608, + "step": 16581 + }, + { + "epoch": 0.57, + "learning_rate": 7.684502934054117e-06, + "loss": 0.605, + "step": 16582 + }, + { + "epoch": 0.57, + "learning_rate": 7.683443675003552e-06, + "loss": 0.6217, + "step": 16583 + }, + { + "epoch": 0.57, + "learning_rate": 7.6823844434187e-06, + "loss": 0.631, + "step": 16584 + }, + { + "epoch": 0.57, + "learning_rate": 7.681325239312102e-06, + "loss": 0.6846, + "step": 16585 + }, + { + "epoch": 0.57, + "learning_rate": 7.680266062696332e-06, + "loss": 0.5832, + "step": 16586 + }, + { + "epoch": 0.57, + "learning_rate": 7.679206913583945e-06, + "loss": 0.6305, + "step": 16587 + }, + { + "epoch": 0.57, + "learning_rate": 7.67814779198749e-06, + "loss": 0.6514, + "step": 16588 + }, + { + "epoch": 0.57, + "learning_rate": 7.677088697919533e-06, + "loss": 0.6143, + "step": 16589 + }, + { + "epoch": 0.57, + "learning_rate": 7.676029631392631e-06, + "loss": 0.6219, + "step": 16590 + }, + { + "epoch": 0.57, + "learning_rate": 7.67497059241933e-06, + "loss": 0.6631, + "step": 16591 + }, + { + "epoch": 0.57, + "learning_rate": 7.673911581012199e-06, + "loss": 0.62, + "step": 16592 + }, + { + "epoch": 0.57, + "learning_rate": 7.67285259718379e-06, + "loss": 0.6714, + "step": 16593 + }, + { + "epoch": 0.57, + "learning_rate": 7.671793640946654e-06, + "loss": 0.6439, + "step": 16594 + }, + { + "epoch": 0.57, + "learning_rate": 7.670734712313349e-06, + "loss": 0.6802, + "step": 16595 + }, + { + "epoch": 0.58, + "learning_rate": 7.669675811296436e-06, + "loss": 0.6347, + "step": 16596 + }, + { + "epoch": 0.58, + "learning_rate": 7.668616937908458e-06, + "loss": 0.616, + "step": 16597 + }, + { + "epoch": 0.58, + "learning_rate": 7.667558092161978e-06, + "loss": 0.6659, + "step": 16598 + }, + { + "epoch": 0.58, + "learning_rate": 7.66649927406955e-06, + "loss": 0.6359, + "step": 16599 + }, + { + "epoch": 0.58, + "learning_rate": 7.66544048364372e-06, + "loss": 0.6619, + "step": 16600 + }, + { + "epoch": 0.58, + "learning_rate": 7.664381720897046e-06, + "loss": 0.6438, + "step": 16601 + }, + { + "epoch": 0.58, + "learning_rate": 7.663322985842088e-06, + "loss": 0.6461, + "step": 16602 + }, + { + "epoch": 0.58, + "learning_rate": 7.662264278491385e-06, + "loss": 0.6417, + "step": 16603 + }, + { + "epoch": 0.58, + "learning_rate": 7.661205598857497e-06, + "loss": 0.6051, + "step": 16604 + }, + { + "epoch": 0.58, + "learning_rate": 7.660146946952983e-06, + "loss": 0.6461, + "step": 16605 + }, + { + "epoch": 0.58, + "learning_rate": 7.659088322790376e-06, + "loss": 0.6082, + "step": 16606 + }, + { + "epoch": 0.58, + "learning_rate": 7.658029726382243e-06, + "loss": 0.6083, + "step": 16607 + }, + { + "epoch": 0.58, + "learning_rate": 7.656971157741134e-06, + "loss": 0.6646, + "step": 16608 + }, + { + "epoch": 0.58, + "learning_rate": 7.65591261687959e-06, + "loss": 0.6136, + "step": 16609 + }, + { + "epoch": 0.58, + "learning_rate": 7.654854103810167e-06, + "loss": 0.6288, + "step": 16610 + }, + { + "epoch": 0.58, + "learning_rate": 7.653795618545423e-06, + "loss": 0.6355, + "step": 16611 + }, + { + "epoch": 0.58, + "learning_rate": 7.65273716109789e-06, + "loss": 0.6241, + "step": 16612 + }, + { + "epoch": 0.58, + "learning_rate": 7.651678731480133e-06, + "loss": 0.6377, + "step": 16613 + }, + { + "epoch": 0.58, + "learning_rate": 7.650620329704697e-06, + "loss": 0.5676, + "step": 16614 + }, + { + "epoch": 0.58, + "learning_rate": 7.649561955784123e-06, + "loss": 0.5978, + "step": 16615 + }, + { + "epoch": 0.58, + "learning_rate": 7.648503609730968e-06, + "loss": 0.6266, + "step": 16616 + }, + { + "epoch": 0.58, + "learning_rate": 7.64744529155778e-06, + "loss": 0.6689, + "step": 16617 + }, + { + "epoch": 0.58, + "learning_rate": 7.6463870012771e-06, + "loss": 0.6316, + "step": 16618 + }, + { + "epoch": 0.58, + "learning_rate": 7.645328738901481e-06, + "loss": 0.6407, + "step": 16619 + }, + { + "epoch": 0.58, + "learning_rate": 7.644270504443472e-06, + "loss": 0.6395, + "step": 16620 + }, + { + "epoch": 0.58, + "learning_rate": 7.64321229791561e-06, + "loss": 0.6163, + "step": 16621 + }, + { + "epoch": 0.58, + "learning_rate": 7.642154119330449e-06, + "loss": 0.626, + "step": 16622 + }, + { + "epoch": 0.58, + "learning_rate": 7.64109596870054e-06, + "loss": 0.6072, + "step": 16623 + }, + { + "epoch": 0.58, + "learning_rate": 7.640037846038415e-06, + "loss": 0.6237, + "step": 16624 + }, + { + "epoch": 0.58, + "learning_rate": 7.638979751356627e-06, + "loss": 0.6877, + "step": 16625 + }, + { + "epoch": 0.58, + "learning_rate": 7.637921684667727e-06, + "loss": 0.6504, + "step": 16626 + }, + { + "epoch": 0.58, + "learning_rate": 7.636863645984248e-06, + "loss": 0.6038, + "step": 16627 + }, + { + "epoch": 0.58, + "learning_rate": 7.635805635318739e-06, + "loss": 0.6293, + "step": 16628 + }, + { + "epoch": 0.58, + "learning_rate": 7.63474765268375e-06, + "loss": 0.5988, + "step": 16629 + }, + { + "epoch": 0.58, + "learning_rate": 7.633689698091815e-06, + "loss": 0.6225, + "step": 16630 + }, + { + "epoch": 0.58, + "learning_rate": 7.632631771555483e-06, + "loss": 0.6363, + "step": 16631 + }, + { + "epoch": 0.58, + "learning_rate": 7.6315738730873e-06, + "loss": 0.6723, + "step": 16632 + }, + { + "epoch": 0.58, + "learning_rate": 7.630516002699799e-06, + "loss": 0.6383, + "step": 16633 + }, + { + "epoch": 0.58, + "learning_rate": 7.62945816040553e-06, + "loss": 0.6274, + "step": 16634 + }, + { + "epoch": 0.58, + "learning_rate": 7.628400346217038e-06, + "loss": 0.6458, + "step": 16635 + }, + { + "epoch": 0.58, + "learning_rate": 7.6273425601468535e-06, + "loss": 0.6049, + "step": 16636 + }, + { + "epoch": 0.58, + "learning_rate": 7.626284802207526e-06, + "loss": 0.6462, + "step": 16637 + }, + { + "epoch": 0.58, + "learning_rate": 7.6252270724116e-06, + "loss": 0.66, + "step": 16638 + }, + { + "epoch": 0.58, + "learning_rate": 7.624169370771603e-06, + "loss": 0.6806, + "step": 16639 + }, + { + "epoch": 0.58, + "learning_rate": 7.623111697300087e-06, + "loss": 0.6631, + "step": 16640 + }, + { + "epoch": 0.58, + "learning_rate": 7.6220540520095935e-06, + "loss": 0.6163, + "step": 16641 + }, + { + "epoch": 0.58, + "learning_rate": 7.620996434912651e-06, + "loss": 0.622, + "step": 16642 + }, + { + "epoch": 0.58, + "learning_rate": 7.619938846021806e-06, + "loss": 0.6957, + "step": 16643 + }, + { + "epoch": 0.58, + "learning_rate": 7.618881285349602e-06, + "loss": 0.6042, + "step": 16644 + }, + { + "epoch": 0.58, + "learning_rate": 7.6178237529085656e-06, + "loss": 0.6015, + "step": 16645 + }, + { + "epoch": 0.58, + "learning_rate": 7.6167662487112485e-06, + "loss": 0.7127, + "step": 16646 + }, + { + "epoch": 0.58, + "learning_rate": 7.615708772770178e-06, + "loss": 0.6317, + "step": 16647 + }, + { + "epoch": 0.58, + "learning_rate": 7.614651325097895e-06, + "loss": 0.6222, + "step": 16648 + }, + { + "epoch": 0.58, + "learning_rate": 7.613593905706943e-06, + "loss": 0.6592, + "step": 16649 + }, + { + "epoch": 0.58, + "learning_rate": 7.612536514609851e-06, + "loss": 0.6389, + "step": 16650 + }, + { + "epoch": 0.58, + "learning_rate": 7.6114791518191556e-06, + "loss": 0.6507, + "step": 16651 + }, + { + "epoch": 0.58, + "learning_rate": 7.610421817347403e-06, + "loss": 0.5809, + "step": 16652 + }, + { + "epoch": 0.58, + "learning_rate": 7.609364511207118e-06, + "loss": 0.636, + "step": 16653 + }, + { + "epoch": 0.58, + "learning_rate": 7.60830723341084e-06, + "loss": 0.6505, + "step": 16654 + }, + { + "epoch": 0.58, + "learning_rate": 7.607249983971111e-06, + "loss": 0.6319, + "step": 16655 + }, + { + "epoch": 0.58, + "learning_rate": 7.606192762900456e-06, + "loss": 0.6449, + "step": 16656 + }, + { + "epoch": 0.58, + "learning_rate": 7.605135570211411e-06, + "loss": 0.6384, + "step": 16657 + }, + { + "epoch": 0.58, + "learning_rate": 7.604078405916521e-06, + "loss": 0.6755, + "step": 16658 + }, + { + "epoch": 0.58, + "learning_rate": 7.603021270028308e-06, + "loss": 0.6456, + "step": 16659 + }, + { + "epoch": 0.58, + "learning_rate": 7.601964162559307e-06, + "loss": 0.615, + "step": 16660 + }, + { + "epoch": 0.58, + "learning_rate": 7.600907083522062e-06, + "loss": 0.6033, + "step": 16661 + }, + { + "epoch": 0.58, + "learning_rate": 7.5998500329290925e-06, + "loss": 0.6004, + "step": 16662 + }, + { + "epoch": 0.58, + "learning_rate": 7.598793010792936e-06, + "loss": 0.5714, + "step": 16663 + }, + { + "epoch": 0.58, + "learning_rate": 7.597736017126132e-06, + "loss": 0.6072, + "step": 16664 + }, + { + "epoch": 0.58, + "learning_rate": 7.596679051941203e-06, + "loss": 0.5976, + "step": 16665 + }, + { + "epoch": 0.58, + "learning_rate": 7.595622115250681e-06, + "loss": 0.6679, + "step": 16666 + }, + { + "epoch": 0.58, + "learning_rate": 7.594565207067107e-06, + "loss": 0.6319, + "step": 16667 + }, + { + "epoch": 0.58, + "learning_rate": 7.593508327403001e-06, + "loss": 0.6424, + "step": 16668 + }, + { + "epoch": 0.58, + "learning_rate": 7.592451476270897e-06, + "loss": 0.57, + "step": 16669 + }, + { + "epoch": 0.58, + "learning_rate": 7.59139465368333e-06, + "loss": 0.6582, + "step": 16670 + }, + { + "epoch": 0.58, + "learning_rate": 7.590337859652825e-06, + "loss": 0.622, + "step": 16671 + }, + { + "epoch": 0.58, + "learning_rate": 7.5892810941919094e-06, + "loss": 0.627, + "step": 16672 + }, + { + "epoch": 0.58, + "learning_rate": 7.588224357313122e-06, + "loss": 0.6154, + "step": 16673 + }, + { + "epoch": 0.58, + "learning_rate": 7.587167649028981e-06, + "loss": 0.6289, + "step": 16674 + }, + { + "epoch": 0.58, + "learning_rate": 7.58611096935202e-06, + "loss": 0.6161, + "step": 16675 + }, + { + "epoch": 0.58, + "learning_rate": 7.585054318294771e-06, + "loss": 0.5702, + "step": 16676 + }, + { + "epoch": 0.58, + "learning_rate": 7.583997695869756e-06, + "loss": 0.6753, + "step": 16677 + }, + { + "epoch": 0.58, + "learning_rate": 7.5829411020895e-06, + "loss": 0.6157, + "step": 16678 + }, + { + "epoch": 0.58, + "learning_rate": 7.5818845369665425e-06, + "loss": 0.6274, + "step": 16679 + }, + { + "epoch": 0.58, + "learning_rate": 7.580828000513398e-06, + "loss": 0.6218, + "step": 16680 + }, + { + "epoch": 0.58, + "learning_rate": 7.579771492742597e-06, + "loss": 0.6182, + "step": 16681 + }, + { + "epoch": 0.58, + "learning_rate": 7.578715013666672e-06, + "loss": 0.6482, + "step": 16682 + }, + { + "epoch": 0.58, + "learning_rate": 7.5776585632981395e-06, + "loss": 0.6266, + "step": 16683 + }, + { + "epoch": 0.58, + "learning_rate": 7.5766021416495265e-06, + "loss": 0.6446, + "step": 16684 + }, + { + "epoch": 0.58, + "learning_rate": 7.575545748733367e-06, + "loss": 0.6733, + "step": 16685 + }, + { + "epoch": 0.58, + "learning_rate": 7.5744893845621754e-06, + "loss": 0.6322, + "step": 16686 + }, + { + "epoch": 0.58, + "learning_rate": 7.573433049148479e-06, + "loss": 0.6498, + "step": 16687 + }, + { + "epoch": 0.58, + "learning_rate": 7.572376742504809e-06, + "loss": 0.6482, + "step": 16688 + }, + { + "epoch": 0.58, + "learning_rate": 7.57132046464368e-06, + "loss": 0.6391, + "step": 16689 + }, + { + "epoch": 0.58, + "learning_rate": 7.570264215577616e-06, + "loss": 0.6531, + "step": 16690 + }, + { + "epoch": 0.58, + "learning_rate": 7.569207995319151e-06, + "loss": 0.635, + "step": 16691 + }, + { + "epoch": 0.58, + "learning_rate": 7.568151803880795e-06, + "loss": 0.6368, + "step": 16692 + }, + { + "epoch": 0.58, + "learning_rate": 7.567095641275075e-06, + "loss": 0.6575, + "step": 16693 + }, + { + "epoch": 0.58, + "learning_rate": 7.566039507514519e-06, + "loss": 0.6432, + "step": 16694 + }, + { + "epoch": 0.58, + "learning_rate": 7.56498340261164e-06, + "loss": 0.6395, + "step": 16695 + }, + { + "epoch": 0.58, + "learning_rate": 7.563927326578959e-06, + "loss": 0.6004, + "step": 16696 + }, + { + "epoch": 0.58, + "learning_rate": 7.562871279429009e-06, + "loss": 0.5941, + "step": 16697 + }, + { + "epoch": 0.58, + "learning_rate": 7.5618152611743e-06, + "loss": 0.6693, + "step": 16698 + }, + { + "epoch": 0.58, + "learning_rate": 7.560759271827351e-06, + "loss": 0.6199, + "step": 16699 + }, + { + "epoch": 0.58, + "learning_rate": 7.5597033114006945e-06, + "loss": 0.6307, + "step": 16700 + }, + { + "epoch": 0.58, + "learning_rate": 7.558647379906837e-06, + "loss": 0.6246, + "step": 16701 + }, + { + "epoch": 0.58, + "learning_rate": 7.5575914773583015e-06, + "loss": 0.6172, + "step": 16702 + }, + { + "epoch": 0.58, + "learning_rate": 7.556535603767615e-06, + "loss": 0.6586, + "step": 16703 + }, + { + "epoch": 0.58, + "learning_rate": 7.555479759147286e-06, + "loss": 0.6447, + "step": 16704 + }, + { + "epoch": 0.58, + "learning_rate": 7.554423943509834e-06, + "loss": 0.6286, + "step": 16705 + }, + { + "epoch": 0.58, + "learning_rate": 7.553368156867787e-06, + "loss": 0.6091, + "step": 16706 + }, + { + "epoch": 0.58, + "learning_rate": 7.55231239923365e-06, + "loss": 0.632, + "step": 16707 + }, + { + "epoch": 0.58, + "learning_rate": 7.55125667061995e-06, + "loss": 0.6203, + "step": 16708 + }, + { + "epoch": 0.58, + "learning_rate": 7.550200971039195e-06, + "loss": 0.6688, + "step": 16709 + }, + { + "epoch": 0.58, + "learning_rate": 7.549145300503908e-06, + "loss": 0.6429, + "step": 16710 + }, + { + "epoch": 0.58, + "learning_rate": 7.5480896590266075e-06, + "loss": 0.6791, + "step": 16711 + }, + { + "epoch": 0.58, + "learning_rate": 7.547034046619801e-06, + "loss": 0.6851, + "step": 16712 + }, + { + "epoch": 0.58, + "learning_rate": 7.54597846329601e-06, + "loss": 0.5796, + "step": 16713 + }, + { + "epoch": 0.58, + "learning_rate": 7.544922909067751e-06, + "loss": 0.6243, + "step": 16714 + }, + { + "epoch": 0.58, + "learning_rate": 7.543867383947534e-06, + "loss": 0.5869, + "step": 16715 + }, + { + "epoch": 0.58, + "learning_rate": 7.542811887947876e-06, + "loss": 0.591, + "step": 16716 + }, + { + "epoch": 0.58, + "learning_rate": 7.5417564210812946e-06, + "loss": 0.6421, + "step": 16717 + }, + { + "epoch": 0.58, + "learning_rate": 7.540700983360298e-06, + "loss": 0.6261, + "step": 16718 + }, + { + "epoch": 0.58, + "learning_rate": 7.539645574797402e-06, + "loss": 0.6227, + "step": 16719 + }, + { + "epoch": 0.58, + "learning_rate": 7.5385901954051225e-06, + "loss": 0.6485, + "step": 16720 + }, + { + "epoch": 0.58, + "learning_rate": 7.5375348451959665e-06, + "loss": 0.6386, + "step": 16721 + }, + { + "epoch": 0.58, + "learning_rate": 7.536479524182452e-06, + "loss": 0.6041, + "step": 16722 + }, + { + "epoch": 0.58, + "learning_rate": 7.5354242323770894e-06, + "loss": 0.6005, + "step": 16723 + }, + { + "epoch": 0.58, + "learning_rate": 7.53436896979239e-06, + "loss": 0.6163, + "step": 16724 + }, + { + "epoch": 0.58, + "learning_rate": 7.533313736440864e-06, + "loss": 0.6036, + "step": 16725 + }, + { + "epoch": 0.58, + "learning_rate": 7.532258532335026e-06, + "loss": 0.6347, + "step": 16726 + }, + { + "epoch": 0.58, + "learning_rate": 7.531203357487383e-06, + "loss": 0.6584, + "step": 16727 + }, + { + "epoch": 0.58, + "learning_rate": 7.5301482119104475e-06, + "loss": 0.6299, + "step": 16728 + }, + { + "epoch": 0.58, + "learning_rate": 7.529093095616732e-06, + "loss": 0.6332, + "step": 16729 + }, + { + "epoch": 0.58, + "learning_rate": 7.528038008618741e-06, + "loss": 0.6158, + "step": 16730 + }, + { + "epoch": 0.58, + "learning_rate": 7.526982950928986e-06, + "loss": 0.6597, + "step": 16731 + }, + { + "epoch": 0.58, + "learning_rate": 7.525927922559979e-06, + "loss": 0.6103, + "step": 16732 + }, + { + "epoch": 0.58, + "learning_rate": 7.524872923524224e-06, + "loss": 0.5963, + "step": 16733 + }, + { + "epoch": 0.58, + "learning_rate": 7.523817953834232e-06, + "loss": 0.6305, + "step": 16734 + }, + { + "epoch": 0.58, + "learning_rate": 7.522763013502512e-06, + "loss": 0.5799, + "step": 16735 + }, + { + "epoch": 0.58, + "learning_rate": 7.521708102541569e-06, + "loss": 0.6496, + "step": 16736 + }, + { + "epoch": 0.58, + "learning_rate": 7.520653220963909e-06, + "loss": 0.7029, + "step": 16737 + }, + { + "epoch": 0.58, + "learning_rate": 7.519598368782046e-06, + "loss": 0.6218, + "step": 16738 + }, + { + "epoch": 0.58, + "learning_rate": 7.51854354600848e-06, + "loss": 0.6285, + "step": 16739 + }, + { + "epoch": 0.58, + "learning_rate": 7.517488752655718e-06, + "loss": 0.6589, + "step": 16740 + }, + { + "epoch": 0.58, + "learning_rate": 7.5164339887362705e-06, + "loss": 0.6358, + "step": 16741 + }, + { + "epoch": 0.58, + "learning_rate": 7.5153792542626365e-06, + "loss": 0.6942, + "step": 16742 + }, + { + "epoch": 0.58, + "learning_rate": 7.514324549247326e-06, + "loss": 0.539, + "step": 16743 + }, + { + "epoch": 0.58, + "learning_rate": 7.513269873702843e-06, + "loss": 0.6304, + "step": 16744 + }, + { + "epoch": 0.58, + "learning_rate": 7.51221522764169e-06, + "loss": 0.628, + "step": 16745 + }, + { + "epoch": 0.58, + "learning_rate": 7.5111606110763724e-06, + "loss": 0.6404, + "step": 16746 + }, + { + "epoch": 0.58, + "learning_rate": 7.510106024019397e-06, + "loss": 0.6228, + "step": 16747 + }, + { + "epoch": 0.58, + "learning_rate": 7.509051466483262e-06, + "loss": 0.6762, + "step": 16748 + }, + { + "epoch": 0.58, + "learning_rate": 7.5079969384804715e-06, + "loss": 0.6216, + "step": 16749 + }, + { + "epoch": 0.58, + "learning_rate": 7.506942440023534e-06, + "loss": 0.7054, + "step": 16750 + }, + { + "epoch": 0.58, + "learning_rate": 7.505887971124943e-06, + "loss": 0.6458, + "step": 16751 + }, + { + "epoch": 0.58, + "learning_rate": 7.5048335317972066e-06, + "loss": 0.6157, + "step": 16752 + }, + { + "epoch": 0.58, + "learning_rate": 7.503779122052828e-06, + "loss": 0.624, + "step": 16753 + }, + { + "epoch": 0.58, + "learning_rate": 7.5027247419043026e-06, + "loss": 0.5743, + "step": 16754 + }, + { + "epoch": 0.58, + "learning_rate": 7.501670391364134e-06, + "loss": 0.5938, + "step": 16755 + }, + { + "epoch": 0.58, + "learning_rate": 7.500616070444826e-06, + "loss": 0.6067, + "step": 16756 + }, + { + "epoch": 0.58, + "learning_rate": 7.499561779158875e-06, + "loss": 0.6231, + "step": 16757 + }, + { + "epoch": 0.58, + "learning_rate": 7.49850751751878e-06, + "loss": 0.6162, + "step": 16758 + }, + { + "epoch": 0.58, + "learning_rate": 7.4974532855370465e-06, + "loss": 0.5941, + "step": 16759 + }, + { + "epoch": 0.58, + "learning_rate": 7.496399083226168e-06, + "loss": 0.555, + "step": 16760 + }, + { + "epoch": 0.58, + "learning_rate": 7.495344910598645e-06, + "loss": 0.6572, + "step": 16761 + }, + { + "epoch": 0.58, + "learning_rate": 7.494290767666979e-06, + "loss": 0.6235, + "step": 16762 + }, + { + "epoch": 0.58, + "learning_rate": 7.493236654443663e-06, + "loss": 0.6754, + "step": 16763 + }, + { + "epoch": 0.58, + "learning_rate": 7.492182570941198e-06, + "loss": 0.6837, + "step": 16764 + }, + { + "epoch": 0.58, + "learning_rate": 7.491128517172082e-06, + "loss": 0.6087, + "step": 16765 + }, + { + "epoch": 0.58, + "learning_rate": 7.49007449314881e-06, + "loss": 0.6411, + "step": 16766 + }, + { + "epoch": 0.58, + "learning_rate": 7.48902049888388e-06, + "loss": 0.6117, + "step": 16767 + }, + { + "epoch": 0.58, + "learning_rate": 7.48796653438979e-06, + "loss": 0.6515, + "step": 16768 + }, + { + "epoch": 0.58, + "learning_rate": 7.486912599679032e-06, + "loss": 0.6156, + "step": 16769 + }, + { + "epoch": 0.58, + "learning_rate": 7.485858694764108e-06, + "loss": 0.6565, + "step": 16770 + }, + { + "epoch": 0.58, + "learning_rate": 7.4848048196575065e-06, + "loss": 0.6706, + "step": 16771 + }, + { + "epoch": 0.58, + "learning_rate": 7.483750974371726e-06, + "loss": 0.6483, + "step": 16772 + }, + { + "epoch": 0.58, + "learning_rate": 7.4826971589192624e-06, + "loss": 0.6373, + "step": 16773 + }, + { + "epoch": 0.58, + "learning_rate": 7.481643373312606e-06, + "loss": 0.6568, + "step": 16774 + }, + { + "epoch": 0.58, + "learning_rate": 7.4805896175642535e-06, + "loss": 0.6296, + "step": 16775 + }, + { + "epoch": 0.58, + "learning_rate": 7.4795358916867e-06, + "loss": 0.6305, + "step": 16776 + }, + { + "epoch": 0.58, + "learning_rate": 7.478482195692435e-06, + "loss": 0.6645, + "step": 16777 + }, + { + "epoch": 0.58, + "learning_rate": 7.477428529593953e-06, + "loss": 0.6354, + "step": 16778 + }, + { + "epoch": 0.58, + "learning_rate": 7.4763748934037505e-06, + "loss": 0.6212, + "step": 16779 + }, + { + "epoch": 0.58, + "learning_rate": 7.4753212871343115e-06, + "loss": 0.6476, + "step": 16780 + }, + { + "epoch": 0.58, + "learning_rate": 7.474267710798135e-06, + "loss": 0.6302, + "step": 16781 + }, + { + "epoch": 0.58, + "learning_rate": 7.473214164407709e-06, + "loss": 0.6161, + "step": 16782 + }, + { + "epoch": 0.58, + "learning_rate": 7.472160647975526e-06, + "loss": 0.6514, + "step": 16783 + }, + { + "epoch": 0.58, + "learning_rate": 7.471107161514075e-06, + "loss": 0.6198, + "step": 16784 + }, + { + "epoch": 0.58, + "learning_rate": 7.4700537050358515e-06, + "loss": 0.6262, + "step": 16785 + }, + { + "epoch": 0.58, + "learning_rate": 7.469000278553338e-06, + "loss": 0.5988, + "step": 16786 + }, + { + "epoch": 0.58, + "learning_rate": 7.467946882079027e-06, + "loss": 0.6324, + "step": 16787 + }, + { + "epoch": 0.58, + "learning_rate": 7.466893515625412e-06, + "loss": 0.6099, + "step": 16788 + }, + { + "epoch": 0.58, + "learning_rate": 7.465840179204978e-06, + "loss": 0.5932, + "step": 16789 + }, + { + "epoch": 0.58, + "learning_rate": 7.464786872830212e-06, + "loss": 0.6281, + "step": 16790 + }, + { + "epoch": 0.58, + "learning_rate": 7.4637335965136074e-06, + "loss": 0.6572, + "step": 16791 + }, + { + "epoch": 0.58, + "learning_rate": 7.462680350267648e-06, + "loss": 0.6264, + "step": 16792 + }, + { + "epoch": 0.58, + "learning_rate": 7.461627134104823e-06, + "loss": 0.6113, + "step": 16793 + }, + { + "epoch": 0.58, + "learning_rate": 7.46057394803762e-06, + "loss": 0.6708, + "step": 16794 + }, + { + "epoch": 0.58, + "learning_rate": 7.459520792078525e-06, + "loss": 0.6225, + "step": 16795 + }, + { + "epoch": 0.58, + "learning_rate": 7.458467666240024e-06, + "loss": 0.7009, + "step": 16796 + }, + { + "epoch": 0.58, + "learning_rate": 7.457414570534605e-06, + "loss": 0.6247, + "step": 16797 + }, + { + "epoch": 0.58, + "learning_rate": 7.4563615049747515e-06, + "loss": 0.5782, + "step": 16798 + }, + { + "epoch": 0.58, + "learning_rate": 7.455308469572951e-06, + "loss": 0.6442, + "step": 16799 + }, + { + "epoch": 0.58, + "learning_rate": 7.454255464341687e-06, + "loss": 0.6455, + "step": 16800 + }, + { + "epoch": 0.58, + "learning_rate": 7.453202489293445e-06, + "loss": 0.6534, + "step": 16801 + }, + { + "epoch": 0.58, + "learning_rate": 7.452149544440707e-06, + "loss": 0.6626, + "step": 16802 + }, + { + "epoch": 0.58, + "learning_rate": 7.4510966297959645e-06, + "loss": 0.6471, + "step": 16803 + }, + { + "epoch": 0.58, + "learning_rate": 7.450043745371692e-06, + "loss": 0.6061, + "step": 16804 + }, + { + "epoch": 0.58, + "learning_rate": 7.448990891180377e-06, + "loss": 0.6105, + "step": 16805 + }, + { + "epoch": 0.58, + "learning_rate": 7.447938067234504e-06, + "loss": 0.6549, + "step": 16806 + }, + { + "epoch": 0.58, + "learning_rate": 7.4468852735465515e-06, + "loss": 0.5996, + "step": 16807 + }, + { + "epoch": 0.58, + "learning_rate": 7.445832510129003e-06, + "loss": 0.6601, + "step": 16808 + }, + { + "epoch": 0.58, + "learning_rate": 7.4447797769943444e-06, + "loss": 0.7043, + "step": 16809 + }, + { + "epoch": 0.58, + "learning_rate": 7.443727074155051e-06, + "loss": 0.6465, + "step": 16810 + }, + { + "epoch": 0.58, + "learning_rate": 7.442674401623607e-06, + "loss": 0.6098, + "step": 16811 + }, + { + "epoch": 0.58, + "learning_rate": 7.4416217594124965e-06, + "loss": 0.6114, + "step": 16812 + }, + { + "epoch": 0.58, + "learning_rate": 7.440569147534193e-06, + "loss": 0.6211, + "step": 16813 + }, + { + "epoch": 0.58, + "learning_rate": 7.439516566001179e-06, + "loss": 0.6895, + "step": 16814 + }, + { + "epoch": 0.58, + "learning_rate": 7.438464014825939e-06, + "loss": 0.6096, + "step": 16815 + }, + { + "epoch": 0.58, + "learning_rate": 7.437411494020945e-06, + "loss": 0.6051, + "step": 16816 + }, + { + "epoch": 0.58, + "learning_rate": 7.436359003598681e-06, + "loss": 0.6457, + "step": 16817 + }, + { + "epoch": 0.58, + "learning_rate": 7.435306543571624e-06, + "loss": 0.5923, + "step": 16818 + }, + { + "epoch": 0.58, + "learning_rate": 7.434254113952251e-06, + "loss": 0.6119, + "step": 16819 + }, + { + "epoch": 0.58, + "learning_rate": 7.433201714753042e-06, + "loss": 0.6478, + "step": 16820 + }, + { + "epoch": 0.58, + "learning_rate": 7.432149345986476e-06, + "loss": 0.6463, + "step": 16821 + }, + { + "epoch": 0.58, + "learning_rate": 7.431097007665025e-06, + "loss": 0.6554, + "step": 16822 + }, + { + "epoch": 0.58, + "learning_rate": 7.430044699801169e-06, + "loss": 0.5864, + "step": 16823 + }, + { + "epoch": 0.58, + "learning_rate": 7.428992422407386e-06, + "loss": 0.6253, + "step": 16824 + }, + { + "epoch": 0.58, + "learning_rate": 7.427940175496146e-06, + "loss": 0.6222, + "step": 16825 + }, + { + "epoch": 0.58, + "learning_rate": 7.426887959079933e-06, + "loss": 0.6131, + "step": 16826 + }, + { + "epoch": 0.58, + "learning_rate": 7.425835773171217e-06, + "loss": 0.6142, + "step": 16827 + }, + { + "epoch": 0.58, + "learning_rate": 7.424783617782474e-06, + "loss": 0.626, + "step": 16828 + }, + { + "epoch": 0.58, + "learning_rate": 7.423731492926178e-06, + "loss": 0.6085, + "step": 16829 + }, + { + "epoch": 0.58, + "learning_rate": 7.422679398614807e-06, + "loss": 0.581, + "step": 16830 + }, + { + "epoch": 0.58, + "learning_rate": 7.421627334860829e-06, + "loss": 0.6278, + "step": 16831 + }, + { + "epoch": 0.58, + "learning_rate": 7.420575301676726e-06, + "loss": 0.6273, + "step": 16832 + }, + { + "epoch": 0.58, + "learning_rate": 7.419523299074958e-06, + "loss": 0.6932, + "step": 16833 + }, + { + "epoch": 0.58, + "learning_rate": 7.418471327068008e-06, + "loss": 0.6745, + "step": 16834 + }, + { + "epoch": 0.58, + "learning_rate": 7.417419385668352e-06, + "loss": 0.6282, + "step": 16835 + }, + { + "epoch": 0.58, + "learning_rate": 7.416367474888449e-06, + "loss": 0.6108, + "step": 16836 + }, + { + "epoch": 0.58, + "learning_rate": 7.415315594740778e-06, + "loss": 0.6249, + "step": 16837 + }, + { + "epoch": 0.58, + "learning_rate": 7.414263745237818e-06, + "loss": 0.6168, + "step": 16838 + }, + { + "epoch": 0.58, + "learning_rate": 7.413211926392024e-06, + "loss": 0.622, + "step": 16839 + }, + { + "epoch": 0.58, + "learning_rate": 7.412160138215876e-06, + "loss": 0.5797, + "step": 16840 + }, + { + "epoch": 0.58, + "learning_rate": 7.411108380721849e-06, + "loss": 0.6383, + "step": 16841 + }, + { + "epoch": 0.58, + "learning_rate": 7.410056653922399e-06, + "loss": 0.6231, + "step": 16842 + }, + { + "epoch": 0.58, + "learning_rate": 7.409004957830008e-06, + "loss": 0.6967, + "step": 16843 + }, + { + "epoch": 0.58, + "learning_rate": 7.407953292457144e-06, + "loss": 0.6584, + "step": 16844 + }, + { + "epoch": 0.58, + "learning_rate": 7.406901657816266e-06, + "loss": 0.6105, + "step": 16845 + }, + { + "epoch": 0.58, + "learning_rate": 7.405850053919852e-06, + "loss": 0.6745, + "step": 16846 + }, + { + "epoch": 0.58, + "learning_rate": 7.404798480780371e-06, + "loss": 0.6835, + "step": 16847 + }, + { + "epoch": 0.58, + "learning_rate": 7.403746938410281e-06, + "loss": 0.6105, + "step": 16848 + }, + { + "epoch": 0.58, + "learning_rate": 7.402695426822058e-06, + "loss": 0.6181, + "step": 16849 + }, + { + "epoch": 0.58, + "learning_rate": 7.4016439460281685e-06, + "loss": 0.651, + "step": 16850 + }, + { + "epoch": 0.58, + "learning_rate": 7.4005924960410724e-06, + "loss": 0.6827, + "step": 16851 + }, + { + "epoch": 0.58, + "learning_rate": 7.399541076873242e-06, + "loss": 0.6268, + "step": 16852 + }, + { + "epoch": 0.58, + "learning_rate": 7.398489688537146e-06, + "loss": 0.6309, + "step": 16853 + }, + { + "epoch": 0.58, + "learning_rate": 7.397438331045239e-06, + "loss": 0.7056, + "step": 16854 + }, + { + "epoch": 0.58, + "learning_rate": 7.396387004409995e-06, + "loss": 0.6223, + "step": 16855 + }, + { + "epoch": 0.58, + "learning_rate": 7.395335708643882e-06, + "loss": 0.6462, + "step": 16856 + }, + { + "epoch": 0.58, + "learning_rate": 7.3942844437593516e-06, + "loss": 0.634, + "step": 16857 + }, + { + "epoch": 0.58, + "learning_rate": 7.3932332097688775e-06, + "loss": 0.6185, + "step": 16858 + }, + { + "epoch": 0.58, + "learning_rate": 7.392182006684927e-06, + "loss": 0.6337, + "step": 16859 + }, + { + "epoch": 0.58, + "learning_rate": 7.39113083451995e-06, + "loss": 0.6533, + "step": 16860 + }, + { + "epoch": 0.58, + "learning_rate": 7.390079693286418e-06, + "loss": 0.6223, + "step": 16861 + }, + { + "epoch": 0.58, + "learning_rate": 7.3890285829968e-06, + "loss": 0.6101, + "step": 16862 + }, + { + "epoch": 0.58, + "learning_rate": 7.387977503663544e-06, + "loss": 0.6834, + "step": 16863 + }, + { + "epoch": 0.58, + "learning_rate": 7.386926455299119e-06, + "loss": 0.5818, + "step": 16864 + }, + { + "epoch": 0.58, + "learning_rate": 7.385875437915993e-06, + "loss": 0.6276, + "step": 16865 + }, + { + "epoch": 0.58, + "learning_rate": 7.384824451526612e-06, + "loss": 0.6083, + "step": 16866 + }, + { + "epoch": 0.58, + "learning_rate": 7.383773496143449e-06, + "loss": 0.6021, + "step": 16867 + }, + { + "epoch": 0.58, + "learning_rate": 7.382722571778964e-06, + "loss": 0.655, + "step": 16868 + }, + { + "epoch": 0.58, + "learning_rate": 7.381671678445609e-06, + "loss": 0.6445, + "step": 16869 + }, + { + "epoch": 0.58, + "learning_rate": 7.380620816155849e-06, + "loss": 0.6254, + "step": 16870 + }, + { + "epoch": 0.58, + "learning_rate": 7.379569984922148e-06, + "loss": 0.6333, + "step": 16871 + }, + { + "epoch": 0.58, + "learning_rate": 7.3785191847569526e-06, + "loss": 0.624, + "step": 16872 + }, + { + "epoch": 0.58, + "learning_rate": 7.377468415672731e-06, + "loss": 0.66, + "step": 16873 + }, + { + "epoch": 0.58, + "learning_rate": 7.376417677681943e-06, + "loss": 0.6173, + "step": 16874 + }, + { + "epoch": 0.58, + "learning_rate": 7.375366970797035e-06, + "loss": 0.5939, + "step": 16875 + }, + { + "epoch": 0.58, + "learning_rate": 7.374316295030476e-06, + "loss": 0.6419, + "step": 16876 + }, + { + "epoch": 0.58, + "learning_rate": 7.373265650394722e-06, + "loss": 0.6181, + "step": 16877 + }, + { + "epoch": 0.58, + "learning_rate": 7.372215036902219e-06, + "loss": 0.6637, + "step": 16878 + }, + { + "epoch": 0.58, + "learning_rate": 7.371164454565435e-06, + "loss": 0.6313, + "step": 16879 + }, + { + "epoch": 0.58, + "learning_rate": 7.370113903396825e-06, + "loss": 0.5598, + "step": 16880 + }, + { + "epoch": 0.58, + "learning_rate": 7.369063383408836e-06, + "loss": 0.6078, + "step": 16881 + }, + { + "epoch": 0.58, + "learning_rate": 7.3680128946139295e-06, + "loss": 0.6392, + "step": 16882 + }, + { + "epoch": 0.58, + "learning_rate": 7.366962437024565e-06, + "loss": 0.6357, + "step": 16883 + }, + { + "epoch": 0.58, + "learning_rate": 7.365912010653185e-06, + "loss": 0.591, + "step": 16884 + }, + { + "epoch": 0.59, + "learning_rate": 7.3648616155122506e-06, + "loss": 0.6119, + "step": 16885 + }, + { + "epoch": 0.59, + "learning_rate": 7.3638112516142225e-06, + "loss": 0.6401, + "step": 16886 + }, + { + "epoch": 0.59, + "learning_rate": 7.362760918971539e-06, + "loss": 0.6224, + "step": 16887 + }, + { + "epoch": 0.59, + "learning_rate": 7.361710617596663e-06, + "loss": 0.6451, + "step": 16888 + }, + { + "epoch": 0.59, + "learning_rate": 7.360660347502049e-06, + "loss": 0.629, + "step": 16889 + }, + { + "epoch": 0.59, + "learning_rate": 7.359610108700139e-06, + "loss": 0.6023, + "step": 16890 + }, + { + "epoch": 0.59, + "learning_rate": 7.358559901203395e-06, + "loss": 0.619, + "step": 16891 + }, + { + "epoch": 0.59, + "learning_rate": 7.357509725024267e-06, + "loss": 0.6251, + "step": 16892 + }, + { + "epoch": 0.59, + "learning_rate": 7.3564595801751996e-06, + "loss": 0.631, + "step": 16893 + }, + { + "epoch": 0.59, + "learning_rate": 7.355409466668653e-06, + "loss": 0.6091, + "step": 16894 + }, + { + "epoch": 0.59, + "learning_rate": 7.3543593845170665e-06, + "loss": 0.6303, + "step": 16895 + }, + { + "epoch": 0.59, + "learning_rate": 7.353309333732896e-06, + "loss": 0.6646, + "step": 16896 + }, + { + "epoch": 0.59, + "learning_rate": 7.352259314328599e-06, + "loss": 0.6254, + "step": 16897 + }, + { + "epoch": 0.59, + "learning_rate": 7.351209326316613e-06, + "loss": 0.5657, + "step": 16898 + }, + { + "epoch": 0.59, + "learning_rate": 7.3501593697093865e-06, + "loss": 0.5906, + "step": 16899 + }, + { + "epoch": 0.59, + "learning_rate": 7.349109444519381e-06, + "loss": 0.6737, + "step": 16900 + }, + { + "epoch": 0.59, + "learning_rate": 7.348059550759032e-06, + "loss": 0.6234, + "step": 16901 + }, + { + "epoch": 0.59, + "learning_rate": 7.34700968844079e-06, + "loss": 0.6379, + "step": 16902 + }, + { + "epoch": 0.59, + "learning_rate": 7.34595985757711e-06, + "loss": 0.6373, + "step": 16903 + }, + { + "epoch": 0.59, + "learning_rate": 7.344910058180428e-06, + "loss": 0.6344, + "step": 16904 + }, + { + "epoch": 0.59, + "learning_rate": 7.343860290263195e-06, + "loss": 0.6407, + "step": 16905 + }, + { + "epoch": 0.59, + "learning_rate": 7.3428105538378645e-06, + "loss": 0.6106, + "step": 16906 + }, + { + "epoch": 0.59, + "learning_rate": 7.3417608489168725e-06, + "loss": 0.6344, + "step": 16907 + }, + { + "epoch": 0.59, + "learning_rate": 7.3407111755126644e-06, + "loss": 0.6698, + "step": 16908 + }, + { + "epoch": 0.59, + "learning_rate": 7.339661533637698e-06, + "loss": 0.6364, + "step": 16909 + }, + { + "epoch": 0.59, + "learning_rate": 7.338611923304404e-06, + "loss": 0.6044, + "step": 16910 + }, + { + "epoch": 0.59, + "learning_rate": 7.337562344525231e-06, + "loss": 0.5599, + "step": 16911 + }, + { + "epoch": 0.59, + "learning_rate": 7.336512797312629e-06, + "loss": 0.6746, + "step": 16912 + }, + { + "epoch": 0.59, + "learning_rate": 7.335463281679035e-06, + "loss": 0.6469, + "step": 16913 + }, + { + "epoch": 0.59, + "learning_rate": 7.334413797636891e-06, + "loss": 0.6794, + "step": 16914 + }, + { + "epoch": 0.59, + "learning_rate": 7.33336434519865e-06, + "loss": 0.6147, + "step": 16915 + }, + { + "epoch": 0.59, + "learning_rate": 7.332314924376745e-06, + "loss": 0.649, + "step": 16916 + }, + { + "epoch": 0.59, + "learning_rate": 7.331265535183617e-06, + "loss": 0.6791, + "step": 16917 + }, + { + "epoch": 0.59, + "learning_rate": 7.330216177631719e-06, + "loss": 0.5869, + "step": 16918 + }, + { + "epoch": 0.59, + "learning_rate": 7.3291668517334825e-06, + "loss": 0.6027, + "step": 16919 + }, + { + "epoch": 0.59, + "learning_rate": 7.328117557501349e-06, + "loss": 0.6506, + "step": 16920 + }, + { + "epoch": 0.59, + "learning_rate": 7.327068294947768e-06, + "loss": 0.6591, + "step": 16921 + }, + { + "epoch": 0.59, + "learning_rate": 7.326019064085168e-06, + "loss": 0.6932, + "step": 16922 + }, + { + "epoch": 0.59, + "learning_rate": 7.324969864925995e-06, + "loss": 0.6263, + "step": 16923 + }, + { + "epoch": 0.59, + "learning_rate": 7.323920697482693e-06, + "loss": 0.6386, + "step": 16924 + }, + { + "epoch": 0.59, + "learning_rate": 7.3228715617676925e-06, + "loss": 0.6878, + "step": 16925 + }, + { + "epoch": 0.59, + "learning_rate": 7.321822457793435e-06, + "loss": 0.6369, + "step": 16926 + }, + { + "epoch": 0.59, + "learning_rate": 7.320773385572364e-06, + "loss": 0.6816, + "step": 16927 + }, + { + "epoch": 0.59, + "learning_rate": 7.319724345116911e-06, + "loss": 0.6238, + "step": 16928 + }, + { + "epoch": 0.59, + "learning_rate": 7.3186753364395155e-06, + "loss": 0.6375, + "step": 16929 + }, + { + "epoch": 0.59, + "learning_rate": 7.31762635955262e-06, + "loss": 0.6014, + "step": 16930 + }, + { + "epoch": 0.59, + "learning_rate": 7.316577414468654e-06, + "loss": 0.6732, + "step": 16931 + }, + { + "epoch": 0.59, + "learning_rate": 7.315528501200058e-06, + "loss": 0.6281, + "step": 16932 + }, + { + "epoch": 0.59, + "learning_rate": 7.314479619759268e-06, + "loss": 0.629, + "step": 16933 + }, + { + "epoch": 0.59, + "learning_rate": 7.3134307701587185e-06, + "loss": 0.6285, + "step": 16934 + }, + { + "epoch": 0.59, + "learning_rate": 7.312381952410845e-06, + "loss": 0.6702, + "step": 16935 + }, + { + "epoch": 0.59, + "learning_rate": 7.311333166528085e-06, + "loss": 0.6052, + "step": 16936 + }, + { + "epoch": 0.59, + "learning_rate": 7.310284412522871e-06, + "loss": 0.6789, + "step": 16937 + }, + { + "epoch": 0.59, + "learning_rate": 7.309235690407637e-06, + "loss": 0.6112, + "step": 16938 + }, + { + "epoch": 0.59, + "learning_rate": 7.308187000194819e-06, + "loss": 0.5996, + "step": 16939 + }, + { + "epoch": 0.59, + "learning_rate": 7.307138341896849e-06, + "loss": 0.6128, + "step": 16940 + }, + { + "epoch": 0.59, + "learning_rate": 7.306089715526159e-06, + "loss": 0.5784, + "step": 16941 + }, + { + "epoch": 0.59, + "learning_rate": 7.305041121095187e-06, + "loss": 0.6456, + "step": 16942 + }, + { + "epoch": 0.59, + "learning_rate": 7.303992558616357e-06, + "loss": 0.6176, + "step": 16943 + }, + { + "epoch": 0.59, + "learning_rate": 7.302944028102107e-06, + "loss": 0.6503, + "step": 16944 + }, + { + "epoch": 0.59, + "learning_rate": 7.30189552956487e-06, + "loss": 0.6651, + "step": 16945 + }, + { + "epoch": 0.59, + "learning_rate": 7.300847063017072e-06, + "loss": 0.654, + "step": 16946 + }, + { + "epoch": 0.59, + "learning_rate": 7.2997986284711465e-06, + "loss": 0.6297, + "step": 16947 + }, + { + "epoch": 0.59, + "learning_rate": 7.298750225939526e-06, + "loss": 0.6254, + "step": 16948 + }, + { + "epoch": 0.59, + "learning_rate": 7.2977018554346356e-06, + "loss": 0.6382, + "step": 16949 + }, + { + "epoch": 0.59, + "learning_rate": 7.29665351696891e-06, + "loss": 0.5727, + "step": 16950 + }, + { + "epoch": 0.59, + "learning_rate": 7.295605210554777e-06, + "loss": 0.6204, + "step": 16951 + }, + { + "epoch": 0.59, + "learning_rate": 7.294556936204664e-06, + "loss": 0.6512, + "step": 16952 + }, + { + "epoch": 0.59, + "learning_rate": 7.293508693931002e-06, + "loss": 0.6151, + "step": 16953 + }, + { + "epoch": 0.59, + "learning_rate": 7.29246048374622e-06, + "loss": 0.6123, + "step": 16954 + }, + { + "epoch": 0.59, + "learning_rate": 7.291412305662741e-06, + "loss": 0.6372, + "step": 16955 + }, + { + "epoch": 0.59, + "learning_rate": 7.290364159692997e-06, + "loss": 0.6619, + "step": 16956 + }, + { + "epoch": 0.59, + "learning_rate": 7.289316045849413e-06, + "loss": 0.6563, + "step": 16957 + }, + { + "epoch": 0.59, + "learning_rate": 7.288267964144415e-06, + "loss": 0.683, + "step": 16958 + }, + { + "epoch": 0.59, + "learning_rate": 7.287219914590434e-06, + "loss": 0.604, + "step": 16959 + }, + { + "epoch": 0.59, + "learning_rate": 7.2861718971998894e-06, + "loss": 0.6273, + "step": 16960 + }, + { + "epoch": 0.59, + "learning_rate": 7.285123911985211e-06, + "loss": 0.6935, + "step": 16961 + }, + { + "epoch": 0.59, + "learning_rate": 7.284075958958825e-06, + "loss": 0.6557, + "step": 16962 + }, + { + "epoch": 0.59, + "learning_rate": 7.283028038133151e-06, + "loss": 0.6347, + "step": 16963 + }, + { + "epoch": 0.59, + "learning_rate": 7.281980149520618e-06, + "loss": 0.6645, + "step": 16964 + }, + { + "epoch": 0.59, + "learning_rate": 7.280932293133649e-06, + "loss": 0.6468, + "step": 16965 + }, + { + "epoch": 0.59, + "learning_rate": 7.279884468984667e-06, + "loss": 0.6216, + "step": 16966 + }, + { + "epoch": 0.59, + "learning_rate": 7.278836677086094e-06, + "loss": 0.6182, + "step": 16967 + }, + { + "epoch": 0.59, + "learning_rate": 7.277788917450358e-06, + "loss": 0.5817, + "step": 16968 + }, + { + "epoch": 0.59, + "learning_rate": 7.276741190089875e-06, + "loss": 0.6421, + "step": 16969 + }, + { + "epoch": 0.59, + "learning_rate": 7.275693495017071e-06, + "loss": 0.645, + "step": 16970 + }, + { + "epoch": 0.59, + "learning_rate": 7.274645832244368e-06, + "loss": 0.6557, + "step": 16971 + }, + { + "epoch": 0.59, + "learning_rate": 7.273598201784185e-06, + "loss": 0.6341, + "step": 16972 + }, + { + "epoch": 0.59, + "learning_rate": 7.2725506036489425e-06, + "loss": 0.6427, + "step": 16973 + }, + { + "epoch": 0.59, + "learning_rate": 7.271503037851066e-06, + "loss": 0.653, + "step": 16974 + }, + { + "epoch": 0.59, + "learning_rate": 7.270455504402971e-06, + "loss": 0.6342, + "step": 16975 + }, + { + "epoch": 0.59, + "learning_rate": 7.269408003317079e-06, + "loss": 0.6369, + "step": 16976 + }, + { + "epoch": 0.59, + "learning_rate": 7.2683605346058114e-06, + "loss": 0.6373, + "step": 16977 + }, + { + "epoch": 0.59, + "learning_rate": 7.267313098281582e-06, + "loss": 0.6544, + "step": 16978 + }, + { + "epoch": 0.59, + "learning_rate": 7.266265694356813e-06, + "loss": 0.6373, + "step": 16979 + }, + { + "epoch": 0.59, + "learning_rate": 7.265218322843926e-06, + "loss": 0.5853, + "step": 16980 + }, + { + "epoch": 0.59, + "learning_rate": 7.264170983755332e-06, + "loss": 0.6599, + "step": 16981 + }, + { + "epoch": 0.59, + "learning_rate": 7.263123677103452e-06, + "loss": 0.6192, + "step": 16982 + }, + { + "epoch": 0.59, + "learning_rate": 7.262076402900704e-06, + "loss": 0.6411, + "step": 16983 + }, + { + "epoch": 0.59, + "learning_rate": 7.261029161159503e-06, + "loss": 0.5934, + "step": 16984 + }, + { + "epoch": 0.59, + "learning_rate": 7.259981951892266e-06, + "loss": 0.6259, + "step": 16985 + }, + { + "epoch": 0.59, + "learning_rate": 7.25893477511141e-06, + "loss": 0.5919, + "step": 16986 + }, + { + "epoch": 0.59, + "learning_rate": 7.257887630829349e-06, + "loss": 0.5626, + "step": 16987 + }, + { + "epoch": 0.59, + "learning_rate": 7.256840519058499e-06, + "loss": 0.5241, + "step": 16988 + }, + { + "epoch": 0.59, + "learning_rate": 7.255793439811276e-06, + "loss": 0.6775, + "step": 16989 + }, + { + "epoch": 0.59, + "learning_rate": 7.2547463931000916e-06, + "loss": 0.6178, + "step": 16990 + }, + { + "epoch": 0.59, + "learning_rate": 7.25369937893736e-06, + "loss": 0.6495, + "step": 16991 + }, + { + "epoch": 0.59, + "learning_rate": 7.2526523973355005e-06, + "loss": 0.6155, + "step": 16992 + }, + { + "epoch": 0.59, + "learning_rate": 7.2516054483069194e-06, + "loss": 0.6063, + "step": 16993 + }, + { + "epoch": 0.59, + "learning_rate": 7.250558531864031e-06, + "loss": 0.6316, + "step": 16994 + }, + { + "epoch": 0.59, + "learning_rate": 7.249511648019254e-06, + "loss": 0.6102, + "step": 16995 + }, + { + "epoch": 0.59, + "learning_rate": 7.248464796784993e-06, + "loss": 0.6309, + "step": 16996 + }, + { + "epoch": 0.59, + "learning_rate": 7.247417978173661e-06, + "loss": 0.5975, + "step": 16997 + }, + { + "epoch": 0.59, + "learning_rate": 7.246371192197674e-06, + "loss": 0.6437, + "step": 16998 + }, + { + "epoch": 0.59, + "learning_rate": 7.2453244388694385e-06, + "loss": 0.5876, + "step": 16999 + }, + { + "epoch": 0.59, + "learning_rate": 7.244277718201364e-06, + "loss": 0.6177, + "step": 17000 + }, + { + "epoch": 0.59, + "learning_rate": 7.2432310302058685e-06, + "loss": 0.5962, + "step": 17001 + }, + { + "epoch": 0.59, + "learning_rate": 7.242184374895354e-06, + "loss": 0.616, + "step": 17002 + }, + { + "epoch": 0.59, + "learning_rate": 7.24113775228223e-06, + "loss": 0.6472, + "step": 17003 + }, + { + "epoch": 0.59, + "learning_rate": 7.24009116237891e-06, + "loss": 0.6221, + "step": 17004 + }, + { + "epoch": 0.59, + "learning_rate": 7.2390446051978e-06, + "loss": 0.6257, + "step": 17005 + }, + { + "epoch": 0.59, + "learning_rate": 7.2379980807513096e-06, + "loss": 0.6324, + "step": 17006 + }, + { + "epoch": 0.59, + "learning_rate": 7.236951589051847e-06, + "loss": 0.669, + "step": 17007 + }, + { + "epoch": 0.59, + "learning_rate": 7.235905130111816e-06, + "loss": 0.6292, + "step": 17008 + }, + { + "epoch": 0.59, + "learning_rate": 7.234858703943628e-06, + "loss": 0.6084, + "step": 17009 + }, + { + "epoch": 0.59, + "learning_rate": 7.233812310559688e-06, + "loss": 0.5943, + "step": 17010 + }, + { + "epoch": 0.59, + "learning_rate": 7.232765949972401e-06, + "loss": 0.6301, + "step": 17011 + }, + { + "epoch": 0.59, + "learning_rate": 7.231719622194175e-06, + "loss": 0.6138, + "step": 17012 + }, + { + "epoch": 0.59, + "learning_rate": 7.230673327237416e-06, + "loss": 0.6331, + "step": 17013 + }, + { + "epoch": 0.59, + "learning_rate": 7.229627065114526e-06, + "loss": 0.6329, + "step": 17014 + }, + { + "epoch": 0.59, + "learning_rate": 7.228580835837911e-06, + "loss": 0.6013, + "step": 17015 + }, + { + "epoch": 0.59, + "learning_rate": 7.22753463941998e-06, + "loss": 0.6875, + "step": 17016 + }, + { + "epoch": 0.59, + "learning_rate": 7.226488475873129e-06, + "loss": 0.6435, + "step": 17017 + }, + { + "epoch": 0.59, + "learning_rate": 7.225442345209768e-06, + "loss": 0.6069, + "step": 17018 + }, + { + "epoch": 0.59, + "learning_rate": 7.2243962474422955e-06, + "loss": 0.6209, + "step": 17019 + }, + { + "epoch": 0.59, + "learning_rate": 7.223350182583118e-06, + "loss": 0.5896, + "step": 17020 + }, + { + "epoch": 0.59, + "learning_rate": 7.222304150644639e-06, + "loss": 0.6002, + "step": 17021 + }, + { + "epoch": 0.59, + "learning_rate": 7.221258151639254e-06, + "loss": 0.674, + "step": 17022 + }, + { + "epoch": 0.59, + "learning_rate": 7.220212185579369e-06, + "loss": 0.6539, + "step": 17023 + }, + { + "epoch": 0.59, + "learning_rate": 7.21916625247739e-06, + "loss": 0.6568, + "step": 17024 + }, + { + "epoch": 0.59, + "learning_rate": 7.218120352345708e-06, + "loss": 0.6647, + "step": 17025 + }, + { + "epoch": 0.59, + "learning_rate": 7.217074485196729e-06, + "loss": 0.6297, + "step": 17026 + }, + { + "epoch": 0.59, + "learning_rate": 7.216028651042855e-06, + "loss": 0.617, + "step": 17027 + }, + { + "epoch": 0.59, + "learning_rate": 7.214982849896479e-06, + "loss": 0.6368, + "step": 17028 + }, + { + "epoch": 0.59, + "learning_rate": 7.213937081770006e-06, + "loss": 0.6239, + "step": 17029 + }, + { + "epoch": 0.59, + "learning_rate": 7.2128913466758355e-06, + "loss": 0.6353, + "step": 17030 + }, + { + "epoch": 0.59, + "learning_rate": 7.211845644626361e-06, + "loss": 0.6097, + "step": 17031 + }, + { + "epoch": 0.59, + "learning_rate": 7.210799975633984e-06, + "loss": 0.5661, + "step": 17032 + }, + { + "epoch": 0.59, + "learning_rate": 7.209754339711103e-06, + "loss": 0.6078, + "step": 17033 + }, + { + "epoch": 0.59, + "learning_rate": 7.208708736870113e-06, + "loss": 0.6533, + "step": 17034 + }, + { + "epoch": 0.59, + "learning_rate": 7.207663167123411e-06, + "loss": 0.6576, + "step": 17035 + }, + { + "epoch": 0.59, + "learning_rate": 7.206617630483397e-06, + "loss": 0.6497, + "step": 17036 + }, + { + "epoch": 0.59, + "learning_rate": 7.205572126962462e-06, + "loss": 0.662, + "step": 17037 + }, + { + "epoch": 0.59, + "learning_rate": 7.2045266565730054e-06, + "loss": 0.5739, + "step": 17038 + }, + { + "epoch": 0.59, + "learning_rate": 7.203481219327424e-06, + "loss": 0.5715, + "step": 17039 + }, + { + "epoch": 0.59, + "learning_rate": 7.202435815238107e-06, + "loss": 0.6349, + "step": 17040 + }, + { + "epoch": 0.59, + "learning_rate": 7.201390444317452e-06, + "loss": 0.6516, + "step": 17041 + }, + { + "epoch": 0.59, + "learning_rate": 7.200345106577857e-06, + "loss": 0.6712, + "step": 17042 + }, + { + "epoch": 0.59, + "learning_rate": 7.199299802031709e-06, + "loss": 0.5989, + "step": 17043 + }, + { + "epoch": 0.59, + "learning_rate": 7.198254530691405e-06, + "loss": 0.6193, + "step": 17044 + }, + { + "epoch": 0.59, + "learning_rate": 7.1972092925693405e-06, + "loss": 0.6232, + "step": 17045 + }, + { + "epoch": 0.59, + "learning_rate": 7.196164087677904e-06, + "loss": 0.5917, + "step": 17046 + }, + { + "epoch": 0.59, + "learning_rate": 7.195118916029487e-06, + "loss": 0.6527, + "step": 17047 + }, + { + "epoch": 0.59, + "learning_rate": 7.194073777636488e-06, + "loss": 0.6665, + "step": 17048 + }, + { + "epoch": 0.59, + "learning_rate": 7.19302867251129e-06, + "loss": 0.6361, + "step": 17049 + }, + { + "epoch": 0.59, + "learning_rate": 7.191983600666288e-06, + "loss": 0.6514, + "step": 17050 + }, + { + "epoch": 0.59, + "learning_rate": 7.190938562113875e-06, + "loss": 0.5436, + "step": 17051 + }, + { + "epoch": 0.59, + "learning_rate": 7.189893556866436e-06, + "loss": 0.6262, + "step": 17052 + }, + { + "epoch": 0.59, + "learning_rate": 7.188848584936365e-06, + "loss": 0.6409, + "step": 17053 + }, + { + "epoch": 0.59, + "learning_rate": 7.187803646336051e-06, + "loss": 0.6126, + "step": 17054 + }, + { + "epoch": 0.59, + "learning_rate": 7.186758741077882e-06, + "loss": 0.6209, + "step": 17055 + }, + { + "epoch": 0.59, + "learning_rate": 7.1857138691742456e-06, + "loss": 0.6438, + "step": 17056 + }, + { + "epoch": 0.59, + "learning_rate": 7.184669030637534e-06, + "loss": 0.582, + "step": 17057 + }, + { + "epoch": 0.59, + "learning_rate": 7.18362422548013e-06, + "loss": 0.6622, + "step": 17058 + }, + { + "epoch": 0.59, + "learning_rate": 7.182579453714422e-06, + "loss": 0.6702, + "step": 17059 + }, + { + "epoch": 0.59, + "learning_rate": 7.181534715352802e-06, + "loss": 0.6122, + "step": 17060 + }, + { + "epoch": 0.59, + "learning_rate": 7.1804900104076525e-06, + "loss": 0.5699, + "step": 17061 + }, + { + "epoch": 0.59, + "learning_rate": 7.17944533889136e-06, + "loss": 0.6446, + "step": 17062 + }, + { + "epoch": 0.59, + "learning_rate": 7.178400700816313e-06, + "loss": 0.6861, + "step": 17063 + }, + { + "epoch": 0.59, + "learning_rate": 7.177356096194892e-06, + "loss": 0.648, + "step": 17064 + }, + { + "epoch": 0.59, + "learning_rate": 7.176311525039486e-06, + "loss": 0.6653, + "step": 17065 + }, + { + "epoch": 0.59, + "learning_rate": 7.175266987362481e-06, + "loss": 0.6795, + "step": 17066 + }, + { + "epoch": 0.59, + "learning_rate": 7.174222483176257e-06, + "loss": 0.6564, + "step": 17067 + }, + { + "epoch": 0.59, + "learning_rate": 7.173178012493199e-06, + "loss": 0.6493, + "step": 17068 + }, + { + "epoch": 0.59, + "learning_rate": 7.172133575325695e-06, + "loss": 0.6497, + "step": 17069 + }, + { + "epoch": 0.59, + "learning_rate": 7.171089171686123e-06, + "loss": 0.6016, + "step": 17070 + }, + { + "epoch": 0.59, + "learning_rate": 7.170044801586866e-06, + "loss": 0.6143, + "step": 17071 + }, + { + "epoch": 0.59, + "learning_rate": 7.16900046504031e-06, + "loss": 0.6587, + "step": 17072 + }, + { + "epoch": 0.59, + "learning_rate": 7.167956162058833e-06, + "loss": 0.6633, + "step": 17073 + }, + { + "epoch": 0.59, + "learning_rate": 7.1669118926548195e-06, + "loss": 0.6591, + "step": 17074 + }, + { + "epoch": 0.59, + "learning_rate": 7.16586765684065e-06, + "loss": 0.6887, + "step": 17075 + }, + { + "epoch": 0.59, + "learning_rate": 7.164823454628704e-06, + "loss": 0.6506, + "step": 17076 + }, + { + "epoch": 0.59, + "learning_rate": 7.16377928603136e-06, + "loss": 0.6307, + "step": 17077 + }, + { + "epoch": 0.59, + "learning_rate": 7.162735151061004e-06, + "loss": 0.6493, + "step": 17078 + }, + { + "epoch": 0.59, + "learning_rate": 7.161691049730011e-06, + "loss": 0.585, + "step": 17079 + }, + { + "epoch": 0.59, + "learning_rate": 7.160646982050763e-06, + "loss": 0.6511, + "step": 17080 + }, + { + "epoch": 0.59, + "learning_rate": 7.159602948035632e-06, + "loss": 0.5743, + "step": 17081 + }, + { + "epoch": 0.59, + "learning_rate": 7.158558947697003e-06, + "loss": 0.6342, + "step": 17082 + }, + { + "epoch": 0.59, + "learning_rate": 7.157514981047256e-06, + "loss": 0.624, + "step": 17083 + }, + { + "epoch": 0.59, + "learning_rate": 7.156471048098759e-06, + "loss": 0.6007, + "step": 17084 + }, + { + "epoch": 0.59, + "learning_rate": 7.155427148863896e-06, + "loss": 0.6484, + "step": 17085 + }, + { + "epoch": 0.59, + "learning_rate": 7.1543832833550475e-06, + "loss": 0.6546, + "step": 17086 + }, + { + "epoch": 0.59, + "learning_rate": 7.153339451584578e-06, + "loss": 0.648, + "step": 17087 + }, + { + "epoch": 0.59, + "learning_rate": 7.152295653564874e-06, + "loss": 0.6133, + "step": 17088 + }, + { + "epoch": 0.59, + "learning_rate": 7.15125188930831e-06, + "loss": 0.6623, + "step": 17089 + }, + { + "epoch": 0.59, + "learning_rate": 7.150208158827252e-06, + "loss": 0.6435, + "step": 17090 + }, + { + "epoch": 0.59, + "learning_rate": 7.149164462134084e-06, + "loss": 0.6288, + "step": 17091 + }, + { + "epoch": 0.59, + "learning_rate": 7.148120799241182e-06, + "loss": 0.6664, + "step": 17092 + }, + { + "epoch": 0.59, + "learning_rate": 7.147077170160909e-06, + "loss": 0.6192, + "step": 17093 + }, + { + "epoch": 0.59, + "learning_rate": 7.146033574905647e-06, + "loss": 0.645, + "step": 17094 + }, + { + "epoch": 0.59, + "learning_rate": 7.144990013487772e-06, + "loss": 0.6552, + "step": 17095 + }, + { + "epoch": 0.59, + "learning_rate": 7.143946485919645e-06, + "loss": 0.6339, + "step": 17096 + }, + { + "epoch": 0.59, + "learning_rate": 7.142902992213648e-06, + "loss": 0.669, + "step": 17097 + }, + { + "epoch": 0.59, + "learning_rate": 7.141859532382154e-06, + "loss": 0.6252, + "step": 17098 + }, + { + "epoch": 0.59, + "learning_rate": 7.140816106437525e-06, + "loss": 0.5985, + "step": 17099 + }, + { + "epoch": 0.59, + "learning_rate": 7.13977271439214e-06, + "loss": 0.5871, + "step": 17100 + }, + { + "epoch": 0.59, + "learning_rate": 7.1387293562583714e-06, + "loss": 0.5765, + "step": 17101 + }, + { + "epoch": 0.59, + "learning_rate": 7.137686032048581e-06, + "loss": 0.6366, + "step": 17102 + }, + { + "epoch": 0.59, + "learning_rate": 7.136642741775144e-06, + "loss": 0.6523, + "step": 17103 + }, + { + "epoch": 0.59, + "learning_rate": 7.135599485450434e-06, + "loss": 0.6152, + "step": 17104 + }, + { + "epoch": 0.59, + "learning_rate": 7.1345562630868096e-06, + "loss": 0.6182, + "step": 17105 + }, + { + "epoch": 0.59, + "learning_rate": 7.1335130746966475e-06, + "loss": 0.6111, + "step": 17106 + }, + { + "epoch": 0.59, + "learning_rate": 7.132469920292318e-06, + "loss": 0.5838, + "step": 17107 + }, + { + "epoch": 0.59, + "learning_rate": 7.131426799886179e-06, + "loss": 0.6281, + "step": 17108 + }, + { + "epoch": 0.59, + "learning_rate": 7.130383713490607e-06, + "loss": 0.6659, + "step": 17109 + }, + { + "epoch": 0.59, + "learning_rate": 7.1293406611179685e-06, + "loss": 0.6288, + "step": 17110 + }, + { + "epoch": 0.59, + "learning_rate": 7.128297642780622e-06, + "loss": 0.6738, + "step": 17111 + }, + { + "epoch": 0.59, + "learning_rate": 7.127254658490943e-06, + "loss": 0.6178, + "step": 17112 + }, + { + "epoch": 0.59, + "learning_rate": 7.126211708261297e-06, + "loss": 0.6593, + "step": 17113 + }, + { + "epoch": 0.59, + "learning_rate": 7.125168792104041e-06, + "loss": 0.676, + "step": 17114 + }, + { + "epoch": 0.59, + "learning_rate": 7.124125910031547e-06, + "loss": 0.6834, + "step": 17115 + }, + { + "epoch": 0.59, + "learning_rate": 7.123083062056184e-06, + "loss": 0.6319, + "step": 17116 + }, + { + "epoch": 0.59, + "learning_rate": 7.122040248190305e-06, + "loss": 0.6275, + "step": 17117 + }, + { + "epoch": 0.59, + "learning_rate": 7.120997468446278e-06, + "loss": 0.627, + "step": 17118 + }, + { + "epoch": 0.59, + "learning_rate": 7.119954722836474e-06, + "loss": 0.6148, + "step": 17119 + }, + { + "epoch": 0.59, + "learning_rate": 7.118912011373247e-06, + "loss": 0.6421, + "step": 17120 + }, + { + "epoch": 0.59, + "learning_rate": 7.117869334068959e-06, + "loss": 0.5998, + "step": 17121 + }, + { + "epoch": 0.59, + "learning_rate": 7.116826690935983e-06, + "loss": 0.5802, + "step": 17122 + }, + { + "epoch": 0.59, + "learning_rate": 7.11578408198667e-06, + "loss": 0.6102, + "step": 17123 + }, + { + "epoch": 0.59, + "learning_rate": 7.114741507233383e-06, + "loss": 0.5927, + "step": 17124 + }, + { + "epoch": 0.59, + "learning_rate": 7.1136989666884904e-06, + "loss": 0.6644, + "step": 17125 + }, + { + "epoch": 0.59, + "learning_rate": 7.112656460364344e-06, + "loss": 0.5892, + "step": 17126 + }, + { + "epoch": 0.59, + "learning_rate": 7.111613988273306e-06, + "loss": 0.5768, + "step": 17127 + }, + { + "epoch": 0.59, + "learning_rate": 7.110571550427745e-06, + "loss": 0.6252, + "step": 17128 + }, + { + "epoch": 0.59, + "learning_rate": 7.1095291468400084e-06, + "loss": 0.6567, + "step": 17129 + }, + { + "epoch": 0.59, + "learning_rate": 7.108486777522459e-06, + "loss": 0.6312, + "step": 17130 + }, + { + "epoch": 0.59, + "learning_rate": 7.1074444424874615e-06, + "loss": 0.6211, + "step": 17131 + }, + { + "epoch": 0.59, + "learning_rate": 7.106402141747366e-06, + "loss": 0.6178, + "step": 17132 + }, + { + "epoch": 0.59, + "learning_rate": 7.1053598753145304e-06, + "loss": 0.6414, + "step": 17133 + }, + { + "epoch": 0.59, + "learning_rate": 7.104317643201322e-06, + "loss": 0.6708, + "step": 17134 + }, + { + "epoch": 0.59, + "learning_rate": 7.103275445420088e-06, + "loss": 0.6191, + "step": 17135 + }, + { + "epoch": 0.59, + "learning_rate": 7.1022332819831845e-06, + "loss": 0.6219, + "step": 17136 + }, + { + "epoch": 0.59, + "learning_rate": 7.101191152902978e-06, + "loss": 0.576, + "step": 17137 + }, + { + "epoch": 0.59, + "learning_rate": 7.100149058191813e-06, + "loss": 0.6445, + "step": 17138 + }, + { + "epoch": 0.59, + "learning_rate": 7.099106997862048e-06, + "loss": 0.6548, + "step": 17139 + }, + { + "epoch": 0.59, + "learning_rate": 7.098064971926044e-06, + "loss": 0.6602, + "step": 17140 + }, + { + "epoch": 0.59, + "learning_rate": 7.097022980396148e-06, + "loss": 0.6225, + "step": 17141 + }, + { + "epoch": 0.59, + "learning_rate": 7.095981023284717e-06, + "loss": 0.5852, + "step": 17142 + }, + { + "epoch": 0.59, + "learning_rate": 7.094939100604104e-06, + "loss": 0.638, + "step": 17143 + }, + { + "epoch": 0.59, + "learning_rate": 7.093897212366662e-06, + "loss": 0.6842, + "step": 17144 + }, + { + "epoch": 0.59, + "learning_rate": 7.0928553585847496e-06, + "loss": 0.6031, + "step": 17145 + }, + { + "epoch": 0.59, + "learning_rate": 7.091813539270709e-06, + "loss": 0.6531, + "step": 17146 + }, + { + "epoch": 0.59, + "learning_rate": 7.090771754436899e-06, + "loss": 0.6572, + "step": 17147 + }, + { + "epoch": 0.59, + "learning_rate": 7.089730004095672e-06, + "loss": 0.6212, + "step": 17148 + }, + { + "epoch": 0.59, + "learning_rate": 7.088688288259375e-06, + "loss": 0.648, + "step": 17149 + }, + { + "epoch": 0.59, + "learning_rate": 7.087646606940361e-06, + "loss": 0.5691, + "step": 17150 + }, + { + "epoch": 0.59, + "learning_rate": 7.086604960150985e-06, + "loss": 0.6707, + "step": 17151 + }, + { + "epoch": 0.59, + "learning_rate": 7.085563347903588e-06, + "loss": 0.6356, + "step": 17152 + }, + { + "epoch": 0.59, + "learning_rate": 7.0845217702105255e-06, + "loss": 0.6131, + "step": 17153 + }, + { + "epoch": 0.59, + "learning_rate": 7.083480227084147e-06, + "loss": 0.6169, + "step": 17154 + }, + { + "epoch": 0.59, + "learning_rate": 7.082438718536798e-06, + "loss": 0.6576, + "step": 17155 + }, + { + "epoch": 0.59, + "learning_rate": 7.0813972445808285e-06, + "loss": 0.6906, + "step": 17156 + }, + { + "epoch": 0.59, + "learning_rate": 7.080355805228589e-06, + "loss": 0.6384, + "step": 17157 + }, + { + "epoch": 0.59, + "learning_rate": 7.079314400492423e-06, + "loss": 0.6916, + "step": 17158 + }, + { + "epoch": 0.59, + "learning_rate": 7.0782730303846794e-06, + "loss": 0.6564, + "step": 17159 + }, + { + "epoch": 0.59, + "learning_rate": 7.077231694917707e-06, + "loss": 0.651, + "step": 17160 + }, + { + "epoch": 0.59, + "learning_rate": 7.076190394103848e-06, + "loss": 0.6077, + "step": 17161 + }, + { + "epoch": 0.59, + "learning_rate": 7.07514912795545e-06, + "loss": 0.6881, + "step": 17162 + }, + { + "epoch": 0.59, + "learning_rate": 7.074107896484861e-06, + "loss": 0.6655, + "step": 17163 + }, + { + "epoch": 0.59, + "learning_rate": 7.073066699704423e-06, + "loss": 0.6216, + "step": 17164 + }, + { + "epoch": 0.59, + "learning_rate": 7.072025537626482e-06, + "loss": 0.6369, + "step": 17165 + }, + { + "epoch": 0.59, + "learning_rate": 7.070984410263384e-06, + "loss": 0.6524, + "step": 17166 + }, + { + "epoch": 0.59, + "learning_rate": 7.069943317627468e-06, + "loss": 0.6267, + "step": 17167 + }, + { + "epoch": 0.59, + "learning_rate": 7.068902259731082e-06, + "loss": 0.6333, + "step": 17168 + }, + { + "epoch": 0.59, + "learning_rate": 7.067861236586569e-06, + "loss": 0.659, + "step": 17169 + }, + { + "epoch": 0.59, + "learning_rate": 7.066820248206267e-06, + "loss": 0.672, + "step": 17170 + }, + { + "epoch": 0.59, + "learning_rate": 7.065779294602524e-06, + "loss": 0.613, + "step": 17171 + }, + { + "epoch": 0.59, + "learning_rate": 7.064738375787678e-06, + "loss": 0.6424, + "step": 17172 + }, + { + "epoch": 0.59, + "learning_rate": 7.063697491774073e-06, + "loss": 0.6335, + "step": 17173 + }, + { + "epoch": 0.6, + "learning_rate": 7.062656642574046e-06, + "loss": 0.6138, + "step": 17174 + }, + { + "epoch": 0.6, + "learning_rate": 7.0616158281999435e-06, + "loss": 0.6752, + "step": 17175 + }, + { + "epoch": 0.6, + "learning_rate": 7.060575048664101e-06, + "loss": 0.6305, + "step": 17176 + }, + { + "epoch": 0.6, + "learning_rate": 7.059534303978859e-06, + "loss": 0.6168, + "step": 17177 + }, + { + "epoch": 0.6, + "learning_rate": 7.058493594156559e-06, + "loss": 0.6592, + "step": 17178 + }, + { + "epoch": 0.6, + "learning_rate": 7.057452919209538e-06, + "loss": 0.6007, + "step": 17179 + }, + { + "epoch": 0.6, + "learning_rate": 7.056412279150133e-06, + "loss": 0.5947, + "step": 17180 + }, + { + "epoch": 0.6, + "learning_rate": 7.0553716739906875e-06, + "loss": 0.6876, + "step": 17181 + }, + { + "epoch": 0.6, + "learning_rate": 7.054331103743533e-06, + "loss": 0.6322, + "step": 17182 + }, + { + "epoch": 0.6, + "learning_rate": 7.0532905684210105e-06, + "loss": 0.6088, + "step": 17183 + }, + { + "epoch": 0.6, + "learning_rate": 7.052250068035458e-06, + "loss": 0.6112, + "step": 17184 + }, + { + "epoch": 0.6, + "learning_rate": 7.0512096025992074e-06, + "loss": 0.6347, + "step": 17185 + }, + { + "epoch": 0.6, + "learning_rate": 7.050169172124597e-06, + "loss": 0.6078, + "step": 17186 + }, + { + "epoch": 0.6, + "learning_rate": 7.049128776623964e-06, + "loss": 0.6314, + "step": 17187 + }, + { + "epoch": 0.6, + "learning_rate": 7.048088416109641e-06, + "loss": 0.6074, + "step": 17188 + }, + { + "epoch": 0.6, + "learning_rate": 7.047048090593964e-06, + "loss": 0.6331, + "step": 17189 + }, + { + "epoch": 0.6, + "learning_rate": 7.04600780008927e-06, + "loss": 0.6293, + "step": 17190 + }, + { + "epoch": 0.6, + "learning_rate": 7.044967544607885e-06, + "loss": 0.7025, + "step": 17191 + }, + { + "epoch": 0.6, + "learning_rate": 7.043927324162152e-06, + "loss": 0.6068, + "step": 17192 + }, + { + "epoch": 0.6, + "learning_rate": 7.0428871387644e-06, + "loss": 0.6318, + "step": 17193 + }, + { + "epoch": 0.6, + "learning_rate": 7.041846988426961e-06, + "loss": 0.6723, + "step": 17194 + }, + { + "epoch": 0.6, + "learning_rate": 7.040806873162167e-06, + "loss": 0.6528, + "step": 17195 + }, + { + "epoch": 0.6, + "learning_rate": 7.039766792982355e-06, + "loss": 0.6677, + "step": 17196 + }, + { + "epoch": 0.6, + "learning_rate": 7.038726747899847e-06, + "loss": 0.6836, + "step": 17197 + }, + { + "epoch": 0.6, + "learning_rate": 7.037686737926981e-06, + "loss": 0.6596, + "step": 17198 + }, + { + "epoch": 0.6, + "learning_rate": 7.036646763076088e-06, + "loss": 0.6303, + "step": 17199 + }, + { + "epoch": 0.6, + "learning_rate": 7.035606823359495e-06, + "loss": 0.6526, + "step": 17200 + }, + { + "epoch": 0.6, + "learning_rate": 7.034566918789531e-06, + "loss": 0.6783, + "step": 17201 + }, + { + "epoch": 0.6, + "learning_rate": 7.033527049378532e-06, + "loss": 0.6338, + "step": 17202 + }, + { + "epoch": 0.6, + "learning_rate": 7.032487215138819e-06, + "loss": 0.6658, + "step": 17203 + }, + { + "epoch": 0.6, + "learning_rate": 7.031447416082727e-06, + "loss": 0.6316, + "step": 17204 + }, + { + "epoch": 0.6, + "learning_rate": 7.030407652222578e-06, + "loss": 0.6385, + "step": 17205 + }, + { + "epoch": 0.6, + "learning_rate": 7.029367923570704e-06, + "loss": 0.6539, + "step": 17206 + }, + { + "epoch": 0.6, + "learning_rate": 7.028328230139432e-06, + "loss": 0.6896, + "step": 17207 + }, + { + "epoch": 0.6, + "learning_rate": 7.027288571941086e-06, + "loss": 0.6489, + "step": 17208 + }, + { + "epoch": 0.6, + "learning_rate": 7.026248948987996e-06, + "loss": 0.6526, + "step": 17209 + }, + { + "epoch": 0.6, + "learning_rate": 7.025209361292487e-06, + "loss": 0.6694, + "step": 17210 + }, + { + "epoch": 0.6, + "learning_rate": 7.024169808866883e-06, + "loss": 0.6159, + "step": 17211 + }, + { + "epoch": 0.6, + "learning_rate": 7.02313029172351e-06, + "loss": 0.5899, + "step": 17212 + }, + { + "epoch": 0.6, + "learning_rate": 7.0220908098746954e-06, + "loss": 0.6615, + "step": 17213 + }, + { + "epoch": 0.6, + "learning_rate": 7.021051363332758e-06, + "loss": 0.6166, + "step": 17214 + }, + { + "epoch": 0.6, + "learning_rate": 7.020011952110026e-06, + "loss": 0.6104, + "step": 17215 + }, + { + "epoch": 0.6, + "learning_rate": 7.0189725762188256e-06, + "loss": 0.6314, + "step": 17216 + }, + { + "epoch": 0.6, + "learning_rate": 7.017933235671472e-06, + "loss": 0.5998, + "step": 17217 + }, + { + "epoch": 0.6, + "learning_rate": 7.016893930480293e-06, + "loss": 0.6651, + "step": 17218 + }, + { + "epoch": 0.6, + "learning_rate": 7.015854660657613e-06, + "loss": 0.625, + "step": 17219 + }, + { + "epoch": 0.6, + "learning_rate": 7.014815426215749e-06, + "loss": 0.5964, + "step": 17220 + }, + { + "epoch": 0.6, + "learning_rate": 7.013776227167022e-06, + "loss": 0.6501, + "step": 17221 + }, + { + "epoch": 0.6, + "learning_rate": 7.01273706352376e-06, + "loss": 0.6155, + "step": 17222 + }, + { + "epoch": 0.6, + "learning_rate": 7.011697935298276e-06, + "loss": 0.5903, + "step": 17223 + }, + { + "epoch": 0.6, + "learning_rate": 7.010658842502893e-06, + "loss": 0.6482, + "step": 17224 + }, + { + "epoch": 0.6, + "learning_rate": 7.009619785149932e-06, + "loss": 0.6404, + "step": 17225 + }, + { + "epoch": 0.6, + "learning_rate": 7.008580763251711e-06, + "loss": 0.6418, + "step": 17226 + }, + { + "epoch": 0.6, + "learning_rate": 7.00754177682055e-06, + "loss": 0.6114, + "step": 17227 + }, + { + "epoch": 0.6, + "learning_rate": 7.006502825868766e-06, + "loss": 0.6081, + "step": 17228 + }, + { + "epoch": 0.6, + "learning_rate": 7.005463910408679e-06, + "loss": 0.5921, + "step": 17229 + }, + { + "epoch": 0.6, + "learning_rate": 7.004425030452602e-06, + "loss": 0.6708, + "step": 17230 + }, + { + "epoch": 0.6, + "learning_rate": 7.003386186012859e-06, + "loss": 0.621, + "step": 17231 + }, + { + "epoch": 0.6, + "learning_rate": 7.0023473771017635e-06, + "loss": 0.6855, + "step": 17232 + }, + { + "epoch": 0.6, + "learning_rate": 7.001308603731629e-06, + "loss": 0.6292, + "step": 17233 + }, + { + "epoch": 0.6, + "learning_rate": 7.000269865914779e-06, + "loss": 0.6106, + "step": 17234 + }, + { + "epoch": 0.6, + "learning_rate": 6.99923116366352e-06, + "loss": 0.6212, + "step": 17235 + }, + { + "epoch": 0.6, + "learning_rate": 6.998192496990172e-06, + "loss": 0.6022, + "step": 17236 + }, + { + "epoch": 0.6, + "learning_rate": 6.997153865907052e-06, + "loss": 0.6598, + "step": 17237 + }, + { + "epoch": 0.6, + "learning_rate": 6.9961152704264704e-06, + "loss": 0.6018, + "step": 17238 + }, + { + "epoch": 0.6, + "learning_rate": 6.995076710560741e-06, + "loss": 0.5991, + "step": 17239 + }, + { + "epoch": 0.6, + "learning_rate": 6.9940381863221805e-06, + "loss": 0.6972, + "step": 17240 + }, + { + "epoch": 0.6, + "learning_rate": 6.9929996977230975e-06, + "loss": 0.6948, + "step": 17241 + }, + { + "epoch": 0.6, + "learning_rate": 6.991961244775808e-06, + "loss": 0.6309, + "step": 17242 + }, + { + "epoch": 0.6, + "learning_rate": 6.990922827492624e-06, + "loss": 0.6478, + "step": 17243 + }, + { + "epoch": 0.6, + "learning_rate": 6.989884445885855e-06, + "loss": 0.6248, + "step": 17244 + }, + { + "epoch": 0.6, + "learning_rate": 6.988846099967814e-06, + "loss": 0.6119, + "step": 17245 + }, + { + "epoch": 0.6, + "learning_rate": 6.987807789750814e-06, + "loss": 0.63, + "step": 17246 + }, + { + "epoch": 0.6, + "learning_rate": 6.98676951524716e-06, + "loss": 0.608, + "step": 17247 + }, + { + "epoch": 0.6, + "learning_rate": 6.985731276469165e-06, + "loss": 0.6182, + "step": 17248 + }, + { + "epoch": 0.6, + "learning_rate": 6.984693073429141e-06, + "loss": 0.6462, + "step": 17249 + }, + { + "epoch": 0.6, + "learning_rate": 6.983654906139394e-06, + "loss": 0.6508, + "step": 17250 + }, + { + "epoch": 0.6, + "learning_rate": 6.982616774612233e-06, + "loss": 0.6153, + "step": 17251 + }, + { + "epoch": 0.6, + "learning_rate": 6.981578678859969e-06, + "loss": 0.6264, + "step": 17252 + }, + { + "epoch": 0.6, + "learning_rate": 6.9805406188949065e-06, + "loss": 0.6635, + "step": 17253 + }, + { + "epoch": 0.6, + "learning_rate": 6.979502594729355e-06, + "loss": 0.5959, + "step": 17254 + }, + { + "epoch": 0.6, + "learning_rate": 6.978464606375623e-06, + "loss": 0.6475, + "step": 17255 + }, + { + "epoch": 0.6, + "learning_rate": 6.977426653846011e-06, + "loss": 0.5892, + "step": 17256 + }, + { + "epoch": 0.6, + "learning_rate": 6.976388737152833e-06, + "loss": 0.5915, + "step": 17257 + }, + { + "epoch": 0.6, + "learning_rate": 6.975350856308392e-06, + "loss": 0.6169, + "step": 17258 + }, + { + "epoch": 0.6, + "learning_rate": 6.97431301132499e-06, + "loss": 0.5932, + "step": 17259 + }, + { + "epoch": 0.6, + "learning_rate": 6.973275202214935e-06, + "loss": 0.5905, + "step": 17260 + }, + { + "epoch": 0.6, + "learning_rate": 6.9722374289905345e-06, + "loss": 0.6494, + "step": 17261 + }, + { + "epoch": 0.6, + "learning_rate": 6.971199691664087e-06, + "loss": 0.6792, + "step": 17262 + }, + { + "epoch": 0.6, + "learning_rate": 6.970161990247899e-06, + "loss": 0.6621, + "step": 17263 + }, + { + "epoch": 0.6, + "learning_rate": 6.969124324754274e-06, + "loss": 0.661, + "step": 17264 + }, + { + "epoch": 0.6, + "learning_rate": 6.968086695195513e-06, + "loss": 0.6315, + "step": 17265 + }, + { + "epoch": 0.6, + "learning_rate": 6.967049101583921e-06, + "loss": 0.6702, + "step": 17266 + }, + { + "epoch": 0.6, + "learning_rate": 6.966011543931798e-06, + "loss": 0.6218, + "step": 17267 + }, + { + "epoch": 0.6, + "learning_rate": 6.964974022251445e-06, + "loss": 0.6007, + "step": 17268 + }, + { + "epoch": 0.6, + "learning_rate": 6.963936536555167e-06, + "loss": 0.6464, + "step": 17269 + }, + { + "epoch": 0.6, + "learning_rate": 6.9628990868552595e-06, + "loss": 0.6684, + "step": 17270 + }, + { + "epoch": 0.6, + "learning_rate": 6.961861673164026e-06, + "loss": 0.5905, + "step": 17271 + }, + { + "epoch": 0.6, + "learning_rate": 6.960824295493767e-06, + "loss": 0.6386, + "step": 17272 + }, + { + "epoch": 0.6, + "learning_rate": 6.9597869538567775e-06, + "loss": 0.6503, + "step": 17273 + }, + { + "epoch": 0.6, + "learning_rate": 6.9587496482653615e-06, + "loss": 0.6054, + "step": 17274 + }, + { + "epoch": 0.6, + "learning_rate": 6.957712378731815e-06, + "loss": 0.5945, + "step": 17275 + }, + { + "epoch": 0.6, + "learning_rate": 6.956675145268438e-06, + "loss": 0.6992, + "step": 17276 + }, + { + "epoch": 0.6, + "learning_rate": 6.955637947887526e-06, + "loss": 0.6224, + "step": 17277 + }, + { + "epoch": 0.6, + "learning_rate": 6.954600786601378e-06, + "loss": 0.5706, + "step": 17278 + }, + { + "epoch": 0.6, + "learning_rate": 6.953563661422289e-06, + "loss": 0.6653, + "step": 17279 + }, + { + "epoch": 0.6, + "learning_rate": 6.9525265723625565e-06, + "loss": 0.6452, + "step": 17280 + }, + { + "epoch": 0.6, + "learning_rate": 6.951489519434478e-06, + "loss": 0.5959, + "step": 17281 + }, + { + "epoch": 0.6, + "learning_rate": 6.9504525026503465e-06, + "loss": 0.6994, + "step": 17282 + }, + { + "epoch": 0.6, + "learning_rate": 6.949415522022458e-06, + "loss": 0.6225, + "step": 17283 + }, + { + "epoch": 0.6, + "learning_rate": 6.948378577563108e-06, + "loss": 0.6815, + "step": 17284 + }, + { + "epoch": 0.6, + "learning_rate": 6.947341669284591e-06, + "loss": 0.6674, + "step": 17285 + }, + { + "epoch": 0.6, + "learning_rate": 6.9463047971991995e-06, + "loss": 0.5994, + "step": 17286 + }, + { + "epoch": 0.6, + "learning_rate": 6.9452679613192285e-06, + "loss": 0.65, + "step": 17287 + }, + { + "epoch": 0.6, + "learning_rate": 6.944231161656968e-06, + "loss": 0.6278, + "step": 17288 + }, + { + "epoch": 0.6, + "learning_rate": 6.943194398224713e-06, + "loss": 0.5739, + "step": 17289 + }, + { + "epoch": 0.6, + "learning_rate": 6.942157671034757e-06, + "loss": 0.6031, + "step": 17290 + }, + { + "epoch": 0.6, + "learning_rate": 6.94112098009939e-06, + "loss": 0.6196, + "step": 17291 + }, + { + "epoch": 0.6, + "learning_rate": 6.9400843254309005e-06, + "loss": 0.5708, + "step": 17292 + }, + { + "epoch": 0.6, + "learning_rate": 6.939047707041586e-06, + "loss": 0.6373, + "step": 17293 + }, + { + "epoch": 0.6, + "learning_rate": 6.938011124943731e-06, + "loss": 0.6204, + "step": 17294 + }, + { + "epoch": 0.6, + "learning_rate": 6.936974579149627e-06, + "loss": 0.6595, + "step": 17295 + }, + { + "epoch": 0.6, + "learning_rate": 6.935938069671565e-06, + "loss": 0.6513, + "step": 17296 + }, + { + "epoch": 0.6, + "learning_rate": 6.934901596521832e-06, + "loss": 0.6394, + "step": 17297 + }, + { + "epoch": 0.6, + "learning_rate": 6.933865159712718e-06, + "loss": 0.6416, + "step": 17298 + }, + { + "epoch": 0.6, + "learning_rate": 6.9328287592565135e-06, + "loss": 0.5924, + "step": 17299 + }, + { + "epoch": 0.6, + "learning_rate": 6.931792395165502e-06, + "loss": 0.6929, + "step": 17300 + }, + { + "epoch": 0.6, + "learning_rate": 6.930756067451974e-06, + "loss": 0.6585, + "step": 17301 + }, + { + "epoch": 0.6, + "learning_rate": 6.929719776128217e-06, + "loss": 0.6617, + "step": 17302 + }, + { + "epoch": 0.6, + "learning_rate": 6.928683521206512e-06, + "loss": 0.6293, + "step": 17303 + }, + { + "epoch": 0.6, + "learning_rate": 6.9276473026991505e-06, + "loss": 0.5743, + "step": 17304 + }, + { + "epoch": 0.6, + "learning_rate": 6.926611120618419e-06, + "loss": 0.6305, + "step": 17305 + }, + { + "epoch": 0.6, + "learning_rate": 6.925574974976599e-06, + "loss": 0.6715, + "step": 17306 + }, + { + "epoch": 0.6, + "learning_rate": 6.924538865785976e-06, + "loss": 0.646, + "step": 17307 + }, + { + "epoch": 0.6, + "learning_rate": 6.923502793058836e-06, + "loss": 0.6078, + "step": 17308 + }, + { + "epoch": 0.6, + "learning_rate": 6.9224667568074624e-06, + "loss": 0.6378, + "step": 17309 + }, + { + "epoch": 0.6, + "learning_rate": 6.921430757044137e-06, + "loss": 0.6543, + "step": 17310 + }, + { + "epoch": 0.6, + "learning_rate": 6.92039479378115e-06, + "loss": 0.6207, + "step": 17311 + }, + { + "epoch": 0.6, + "learning_rate": 6.919358867030771e-06, + "loss": 0.6427, + "step": 17312 + }, + { + "epoch": 0.6, + "learning_rate": 6.918322976805292e-06, + "loss": 0.6299, + "step": 17313 + }, + { + "epoch": 0.6, + "learning_rate": 6.917287123116997e-06, + "loss": 0.6497, + "step": 17314 + }, + { + "epoch": 0.6, + "learning_rate": 6.916251305978156e-06, + "loss": 0.5954, + "step": 17315 + }, + { + "epoch": 0.6, + "learning_rate": 6.915215525401059e-06, + "loss": 0.6281, + "step": 17316 + }, + { + "epoch": 0.6, + "eval_loss": 0.5753005146980286, + "eval_runtime": 4931.9747, + "eval_samples_per_second": 111.85, + "eval_steps_per_second": 37.283, + "step": 17316 + }, + { + "epoch": 0.6, + "learning_rate": 6.914179781397989e-06, + "loss": 0.6366, + "step": 17317 + }, + { + "epoch": 0.6, + "learning_rate": 6.913144073981214e-06, + "loss": 0.6408, + "step": 17318 + }, + { + "epoch": 0.6, + "learning_rate": 6.912108403163024e-06, + "loss": 0.6058, + "step": 17319 + }, + { + "epoch": 0.6, + "learning_rate": 6.911072768955698e-06, + "loss": 0.5771, + "step": 17320 + }, + { + "epoch": 0.6, + "learning_rate": 6.910037171371506e-06, + "loss": 0.5992, + "step": 17321 + }, + { + "epoch": 0.6, + "learning_rate": 6.909001610422735e-06, + "loss": 0.6282, + "step": 17322 + }, + { + "epoch": 0.6, + "learning_rate": 6.907966086121663e-06, + "loss": 0.6064, + "step": 17323 + }, + { + "epoch": 0.6, + "learning_rate": 6.906930598480559e-06, + "loss": 0.6187, + "step": 17324 + }, + { + "epoch": 0.6, + "learning_rate": 6.9058951475117075e-06, + "loss": 0.6173, + "step": 17325 + }, + { + "epoch": 0.6, + "learning_rate": 6.904859733227388e-06, + "loss": 0.6615, + "step": 17326 + }, + { + "epoch": 0.6, + "learning_rate": 6.903824355639865e-06, + "loss": 0.6239, + "step": 17327 + }, + { + "epoch": 0.6, + "learning_rate": 6.902789014761426e-06, + "loss": 0.6735, + "step": 17328 + }, + { + "epoch": 0.6, + "learning_rate": 6.90175371060434e-06, + "loss": 0.6182, + "step": 17329 + }, + { + "epoch": 0.6, + "learning_rate": 6.900718443180878e-06, + "loss": 0.694, + "step": 17330 + }, + { + "epoch": 0.6, + "learning_rate": 6.899683212503327e-06, + "loss": 0.6443, + "step": 17331 + }, + { + "epoch": 0.6, + "learning_rate": 6.8986480185839486e-06, + "loss": 0.6039, + "step": 17332 + }, + { + "epoch": 0.6, + "learning_rate": 6.897612861435019e-06, + "loss": 0.6139, + "step": 17333 + }, + { + "epoch": 0.6, + "learning_rate": 6.896577741068822e-06, + "loss": 0.6422, + "step": 17334 + }, + { + "epoch": 0.6, + "learning_rate": 6.895542657497614e-06, + "loss": 0.6709, + "step": 17335 + }, + { + "epoch": 0.6, + "learning_rate": 6.894507610733676e-06, + "loss": 0.64, + "step": 17336 + }, + { + "epoch": 0.6, + "learning_rate": 6.893472600789284e-06, + "loss": 0.6255, + "step": 17337 + }, + { + "epoch": 0.6, + "learning_rate": 6.892437627676698e-06, + "loss": 0.6559, + "step": 17338 + }, + { + "epoch": 0.6, + "learning_rate": 6.891402691408196e-06, + "loss": 0.6344, + "step": 17339 + }, + { + "epoch": 0.6, + "learning_rate": 6.890367791996051e-06, + "loss": 0.5857, + "step": 17340 + }, + { + "epoch": 0.6, + "learning_rate": 6.889332929452527e-06, + "loss": 0.5676, + "step": 17341 + }, + { + "epoch": 0.6, + "learning_rate": 6.888298103789894e-06, + "loss": 0.6266, + "step": 17342 + }, + { + "epoch": 0.6, + "learning_rate": 6.88726331502043e-06, + "loss": 0.6919, + "step": 17343 + }, + { + "epoch": 0.6, + "learning_rate": 6.886228563156391e-06, + "loss": 0.6636, + "step": 17344 + }, + { + "epoch": 0.6, + "learning_rate": 6.88519384821005e-06, + "loss": 0.6084, + "step": 17345 + }, + { + "epoch": 0.6, + "learning_rate": 6.8841591701936826e-06, + "loss": 0.599, + "step": 17346 + }, + { + "epoch": 0.6, + "learning_rate": 6.8831245291195466e-06, + "loss": 0.6275, + "step": 17347 + }, + { + "epoch": 0.6, + "learning_rate": 6.882089924999909e-06, + "loss": 0.6216, + "step": 17348 + }, + { + "epoch": 0.6, + "learning_rate": 6.881055357847046e-06, + "loss": 0.6447, + "step": 17349 + }, + { + "epoch": 0.6, + "learning_rate": 6.880020827673213e-06, + "loss": 0.594, + "step": 17350 + }, + { + "epoch": 0.6, + "learning_rate": 6.878986334490678e-06, + "loss": 0.632, + "step": 17351 + }, + { + "epoch": 0.6, + "learning_rate": 6.877951878311715e-06, + "loss": 0.6086, + "step": 17352 + }, + { + "epoch": 0.6, + "learning_rate": 6.876917459148576e-06, + "loss": 0.6538, + "step": 17353 + }, + { + "epoch": 0.6, + "learning_rate": 6.87588307701353e-06, + "loss": 0.6549, + "step": 17354 + }, + { + "epoch": 0.6, + "learning_rate": 6.874848731918848e-06, + "loss": 0.6416, + "step": 17355 + }, + { + "epoch": 0.6, + "learning_rate": 6.8738144238767855e-06, + "loss": 0.6793, + "step": 17356 + }, + { + "epoch": 0.6, + "learning_rate": 6.872780152899603e-06, + "loss": 0.6852, + "step": 17357 + }, + { + "epoch": 0.6, + "learning_rate": 6.871745918999575e-06, + "loss": 0.6034, + "step": 17358 + }, + { + "epoch": 0.6, + "learning_rate": 6.870711722188953e-06, + "loss": 0.6415, + "step": 17359 + }, + { + "epoch": 0.6, + "learning_rate": 6.869677562479999e-06, + "loss": 0.6733, + "step": 17360 + }, + { + "epoch": 0.6, + "learning_rate": 6.868643439884983e-06, + "loss": 0.6851, + "step": 17361 + }, + { + "epoch": 0.6, + "learning_rate": 6.867609354416158e-06, + "loss": 0.6481, + "step": 17362 + }, + { + "epoch": 0.6, + "learning_rate": 6.866575306085783e-06, + "loss": 0.6428, + "step": 17363 + }, + { + "epoch": 0.6, + "learning_rate": 6.8655412949061286e-06, + "loss": 0.6216, + "step": 17364 + }, + { + "epoch": 0.6, + "learning_rate": 6.8645073208894434e-06, + "loss": 0.6659, + "step": 17365 + }, + { + "epoch": 0.6, + "learning_rate": 6.863473384047987e-06, + "loss": 0.6617, + "step": 17366 + }, + { + "epoch": 0.6, + "learning_rate": 6.862439484394028e-06, + "loss": 0.6306, + "step": 17367 + }, + { + "epoch": 0.6, + "learning_rate": 6.8614056219398136e-06, + "loss": 0.6407, + "step": 17368 + }, + { + "epoch": 0.6, + "learning_rate": 6.860371796697605e-06, + "loss": 0.6566, + "step": 17369 + }, + { + "epoch": 0.6, + "learning_rate": 6.8593380086796655e-06, + "loss": 0.6577, + "step": 17370 + }, + { + "epoch": 0.6, + "learning_rate": 6.858304257898243e-06, + "loss": 0.6003, + "step": 17371 + }, + { + "epoch": 0.6, + "learning_rate": 6.857270544365597e-06, + "loss": 0.5939, + "step": 17372 + }, + { + "epoch": 0.6, + "learning_rate": 6.8562368680939885e-06, + "loss": 0.5741, + "step": 17373 + }, + { + "epoch": 0.6, + "learning_rate": 6.855203229095666e-06, + "loss": 0.6332, + "step": 17374 + }, + { + "epoch": 0.6, + "learning_rate": 6.854169627382884e-06, + "loss": 0.6276, + "step": 17375 + }, + { + "epoch": 0.6, + "learning_rate": 6.853136062967908e-06, + "loss": 0.6045, + "step": 17376 + }, + { + "epoch": 0.6, + "learning_rate": 6.85210253586298e-06, + "loss": 0.604, + "step": 17377 + }, + { + "epoch": 0.6, + "learning_rate": 6.851069046080356e-06, + "loss": 0.611, + "step": 17378 + }, + { + "epoch": 0.6, + "learning_rate": 6.850035593632299e-06, + "loss": 0.6683, + "step": 17379 + }, + { + "epoch": 0.6, + "learning_rate": 6.84900217853105e-06, + "loss": 0.6329, + "step": 17380 + }, + { + "epoch": 0.6, + "learning_rate": 6.8479688007888645e-06, + "loss": 0.6667, + "step": 17381 + }, + { + "epoch": 0.6, + "learning_rate": 6.846935460418003e-06, + "loss": 0.627, + "step": 17382 + }, + { + "epoch": 0.6, + "learning_rate": 6.845902157430706e-06, + "loss": 0.6366, + "step": 17383 + }, + { + "epoch": 0.6, + "learning_rate": 6.844868891839226e-06, + "loss": 0.5724, + "step": 17384 + }, + { + "epoch": 0.6, + "learning_rate": 6.843835663655824e-06, + "loss": 0.5909, + "step": 17385 + }, + { + "epoch": 0.6, + "learning_rate": 6.842802472892737e-06, + "loss": 0.645, + "step": 17386 + }, + { + "epoch": 0.6, + "learning_rate": 6.8417693195622195e-06, + "loss": 0.6295, + "step": 17387 + }, + { + "epoch": 0.6, + "learning_rate": 6.840736203676528e-06, + "loss": 0.5996, + "step": 17388 + }, + { + "epoch": 0.6, + "learning_rate": 6.8397031252479004e-06, + "loss": 0.6485, + "step": 17389 + }, + { + "epoch": 0.6, + "learning_rate": 6.838670084288592e-06, + "loss": 0.6567, + "step": 17390 + }, + { + "epoch": 0.6, + "learning_rate": 6.837637080810848e-06, + "loss": 0.5989, + "step": 17391 + }, + { + "epoch": 0.6, + "learning_rate": 6.836604114826917e-06, + "loss": 0.6137, + "step": 17392 + }, + { + "epoch": 0.6, + "learning_rate": 6.835571186349047e-06, + "loss": 0.6729, + "step": 17393 + }, + { + "epoch": 0.6, + "learning_rate": 6.834538295389481e-06, + "loss": 0.5682, + "step": 17394 + }, + { + "epoch": 0.6, + "learning_rate": 6.83350544196047e-06, + "loss": 0.6401, + "step": 17395 + }, + { + "epoch": 0.6, + "learning_rate": 6.832472626074258e-06, + "loss": 0.643, + "step": 17396 + }, + { + "epoch": 0.6, + "learning_rate": 6.831439847743089e-06, + "loss": 0.6723, + "step": 17397 + }, + { + "epoch": 0.6, + "learning_rate": 6.830407106979207e-06, + "loss": 0.6446, + "step": 17398 + }, + { + "epoch": 0.6, + "learning_rate": 6.8293744037948614e-06, + "loss": 0.6194, + "step": 17399 + }, + { + "epoch": 0.6, + "learning_rate": 6.828341738202291e-06, + "loss": 0.6328, + "step": 17400 + }, + { + "epoch": 0.6, + "learning_rate": 6.827309110213742e-06, + "loss": 0.6083, + "step": 17401 + }, + { + "epoch": 0.6, + "learning_rate": 6.82627651984146e-06, + "loss": 0.5512, + "step": 17402 + }, + { + "epoch": 0.6, + "learning_rate": 6.82524396709768e-06, + "loss": 0.6647, + "step": 17403 + }, + { + "epoch": 0.6, + "learning_rate": 6.82421145199465e-06, + "loss": 0.5857, + "step": 17404 + }, + { + "epoch": 0.6, + "learning_rate": 6.823178974544613e-06, + "loss": 0.5913, + "step": 17405 + }, + { + "epoch": 0.6, + "learning_rate": 6.822146534759806e-06, + "loss": 0.6046, + "step": 17406 + }, + { + "epoch": 0.6, + "learning_rate": 6.821114132652471e-06, + "loss": 0.6593, + "step": 17407 + }, + { + "epoch": 0.6, + "learning_rate": 6.820081768234852e-06, + "loss": 0.6317, + "step": 17408 + }, + { + "epoch": 0.6, + "learning_rate": 6.819049441519184e-06, + "loss": 0.6545, + "step": 17409 + }, + { + "epoch": 0.6, + "learning_rate": 6.818017152517708e-06, + "loss": 0.6305, + "step": 17410 + }, + { + "epoch": 0.6, + "learning_rate": 6.816984901242667e-06, + "loss": 0.5646, + "step": 17411 + }, + { + "epoch": 0.6, + "learning_rate": 6.8159526877062955e-06, + "loss": 0.6531, + "step": 17412 + }, + { + "epoch": 0.6, + "learning_rate": 6.814920511920831e-06, + "loss": 0.6498, + "step": 17413 + }, + { + "epoch": 0.6, + "learning_rate": 6.813888373898517e-06, + "loss": 0.6435, + "step": 17414 + }, + { + "epoch": 0.6, + "learning_rate": 6.812856273651582e-06, + "loss": 0.6479, + "step": 17415 + }, + { + "epoch": 0.6, + "learning_rate": 6.8118242111922684e-06, + "loss": 0.6321, + "step": 17416 + }, + { + "epoch": 0.6, + "learning_rate": 6.810792186532815e-06, + "loss": 0.5938, + "step": 17417 + }, + { + "epoch": 0.6, + "learning_rate": 6.809760199685451e-06, + "loss": 0.6284, + "step": 17418 + }, + { + "epoch": 0.6, + "learning_rate": 6.808728250662417e-06, + "loss": 0.6504, + "step": 17419 + }, + { + "epoch": 0.6, + "learning_rate": 6.807696339475949e-06, + "loss": 0.6288, + "step": 17420 + }, + { + "epoch": 0.6, + "learning_rate": 6.806664466138276e-06, + "loss": 0.6487, + "step": 17421 + }, + { + "epoch": 0.6, + "learning_rate": 6.805632630661634e-06, + "loss": 0.6733, + "step": 17422 + }, + { + "epoch": 0.6, + "learning_rate": 6.804600833058262e-06, + "loss": 0.6077, + "step": 17423 + }, + { + "epoch": 0.6, + "learning_rate": 6.803569073340387e-06, + "loss": 0.6316, + "step": 17424 + }, + { + "epoch": 0.6, + "learning_rate": 6.802537351520244e-06, + "loss": 0.6459, + "step": 17425 + }, + { + "epoch": 0.6, + "learning_rate": 6.801505667610067e-06, + "loss": 0.5881, + "step": 17426 + }, + { + "epoch": 0.6, + "learning_rate": 6.800474021622086e-06, + "loss": 0.6438, + "step": 17427 + }, + { + "epoch": 0.6, + "learning_rate": 6.799442413568531e-06, + "loss": 0.5765, + "step": 17428 + }, + { + "epoch": 0.6, + "learning_rate": 6.798410843461638e-06, + "loss": 0.6457, + "step": 17429 + }, + { + "epoch": 0.6, + "learning_rate": 6.797379311313632e-06, + "loss": 0.6167, + "step": 17430 + }, + { + "epoch": 0.6, + "learning_rate": 6.796347817136746e-06, + "loss": 0.6505, + "step": 17431 + }, + { + "epoch": 0.6, + "learning_rate": 6.795316360943212e-06, + "loss": 0.6464, + "step": 17432 + }, + { + "epoch": 0.6, + "learning_rate": 6.794284942745253e-06, + "loss": 0.6334, + "step": 17433 + }, + { + "epoch": 0.6, + "learning_rate": 6.793253562555102e-06, + "loss": 0.6035, + "step": 17434 + }, + { + "epoch": 0.6, + "learning_rate": 6.792222220384989e-06, + "loss": 0.6119, + "step": 17435 + }, + { + "epoch": 0.6, + "learning_rate": 6.791190916247137e-06, + "loss": 0.6153, + "step": 17436 + }, + { + "epoch": 0.6, + "learning_rate": 6.790159650153776e-06, + "loss": 0.5794, + "step": 17437 + }, + { + "epoch": 0.6, + "learning_rate": 6.7891284221171336e-06, + "loss": 0.5851, + "step": 17438 + }, + { + "epoch": 0.6, + "learning_rate": 6.788097232149436e-06, + "loss": 0.6214, + "step": 17439 + }, + { + "epoch": 0.6, + "learning_rate": 6.787066080262905e-06, + "loss": 0.6875, + "step": 17440 + }, + { + "epoch": 0.6, + "learning_rate": 6.786034966469775e-06, + "loss": 0.6156, + "step": 17441 + }, + { + "epoch": 0.6, + "learning_rate": 6.7850038907822635e-06, + "loss": 0.6196, + "step": 17442 + }, + { + "epoch": 0.6, + "learning_rate": 6.783972853212598e-06, + "loss": 0.6214, + "step": 17443 + }, + { + "epoch": 0.6, + "learning_rate": 6.782941853773004e-06, + "loss": 0.6379, + "step": 17444 + }, + { + "epoch": 0.6, + "learning_rate": 6.7819108924757025e-06, + "loss": 0.6493, + "step": 17445 + }, + { + "epoch": 0.6, + "learning_rate": 6.780879969332919e-06, + "loss": 0.6068, + "step": 17446 + }, + { + "epoch": 0.6, + "learning_rate": 6.779849084356877e-06, + "loss": 0.6096, + "step": 17447 + }, + { + "epoch": 0.6, + "learning_rate": 6.778818237559794e-06, + "loss": 0.6243, + "step": 17448 + }, + { + "epoch": 0.6, + "learning_rate": 6.777787428953897e-06, + "loss": 0.6653, + "step": 17449 + }, + { + "epoch": 0.6, + "learning_rate": 6.7767566585514085e-06, + "loss": 0.6407, + "step": 17450 + }, + { + "epoch": 0.6, + "learning_rate": 6.775725926364545e-06, + "loss": 0.5867, + "step": 17451 + }, + { + "epoch": 0.6, + "learning_rate": 6.774695232405532e-06, + "loss": 0.6794, + "step": 17452 + }, + { + "epoch": 0.6, + "learning_rate": 6.773664576686584e-06, + "loss": 0.6282, + "step": 17453 + }, + { + "epoch": 0.6, + "learning_rate": 6.772633959219924e-06, + "loss": 0.6085, + "step": 17454 + }, + { + "epoch": 0.6, + "learning_rate": 6.771603380017773e-06, + "loss": 0.6651, + "step": 17455 + }, + { + "epoch": 0.6, + "learning_rate": 6.770572839092346e-06, + "loss": 0.6759, + "step": 17456 + }, + { + "epoch": 0.6, + "learning_rate": 6.769542336455863e-06, + "loss": 0.637, + "step": 17457 + }, + { + "epoch": 0.6, + "learning_rate": 6.768511872120544e-06, + "loss": 0.6422, + "step": 17458 + }, + { + "epoch": 0.6, + "learning_rate": 6.767481446098604e-06, + "loss": 0.5852, + "step": 17459 + }, + { + "epoch": 0.6, + "learning_rate": 6.766451058402259e-06, + "loss": 0.6128, + "step": 17460 + }, + { + "epoch": 0.6, + "learning_rate": 6.765420709043731e-06, + "loss": 0.6354, + "step": 17461 + }, + { + "epoch": 0.61, + "learning_rate": 6.764390398035229e-06, + "loss": 0.6459, + "step": 17462 + }, + { + "epoch": 0.61, + "learning_rate": 6.7633601253889715e-06, + "loss": 0.6205, + "step": 17463 + }, + { + "epoch": 0.61, + "learning_rate": 6.7623298911171766e-06, + "loss": 0.6271, + "step": 17464 + }, + { + "epoch": 0.61, + "learning_rate": 6.761299695232054e-06, + "loss": 0.6428, + "step": 17465 + }, + { + "epoch": 0.61, + "learning_rate": 6.760269537745821e-06, + "loss": 0.6482, + "step": 17466 + }, + { + "epoch": 0.61, + "learning_rate": 6.7592394186706935e-06, + "loss": 0.6259, + "step": 17467 + }, + { + "epoch": 0.61, + "learning_rate": 6.758209338018879e-06, + "loss": 0.6069, + "step": 17468 + }, + { + "epoch": 0.61, + "learning_rate": 6.757179295802594e-06, + "loss": 0.5661, + "step": 17469 + }, + { + "epoch": 0.61, + "learning_rate": 6.756149292034053e-06, + "loss": 0.6214, + "step": 17470 + }, + { + "epoch": 0.61, + "learning_rate": 6.755119326725464e-06, + "loss": 0.6246, + "step": 17471 + }, + { + "epoch": 0.61, + "learning_rate": 6.75408939988904e-06, + "loss": 0.6616, + "step": 17472 + }, + { + "epoch": 0.61, + "learning_rate": 6.753059511536994e-06, + "loss": 0.6642, + "step": 17473 + }, + { + "epoch": 0.61, + "learning_rate": 6.752029661681533e-06, + "loss": 0.6424, + "step": 17474 + }, + { + "epoch": 0.61, + "learning_rate": 6.75099985033487e-06, + "loss": 0.5834, + "step": 17475 + }, + { + "epoch": 0.61, + "learning_rate": 6.749970077509214e-06, + "loss": 0.6235, + "step": 17476 + }, + { + "epoch": 0.61, + "learning_rate": 6.748940343216772e-06, + "loss": 0.6032, + "step": 17477 + }, + { + "epoch": 0.61, + "learning_rate": 6.747910647469756e-06, + "loss": 0.6163, + "step": 17478 + }, + { + "epoch": 0.61, + "learning_rate": 6.746880990280376e-06, + "loss": 0.6845, + "step": 17479 + }, + { + "epoch": 0.61, + "learning_rate": 6.745851371660833e-06, + "loss": 0.6096, + "step": 17480 + }, + { + "epoch": 0.61, + "learning_rate": 6.744821791623339e-06, + "loss": 0.6021, + "step": 17481 + }, + { + "epoch": 0.61, + "learning_rate": 6.743792250180103e-06, + "loss": 0.6343, + "step": 17482 + }, + { + "epoch": 0.61, + "learning_rate": 6.7427627473433276e-06, + "loss": 0.652, + "step": 17483 + }, + { + "epoch": 0.61, + "learning_rate": 6.741733283125219e-06, + "loss": 0.5946, + "step": 17484 + }, + { + "epoch": 0.61, + "learning_rate": 6.740703857537987e-06, + "loss": 0.5993, + "step": 17485 + }, + { + "epoch": 0.61, + "learning_rate": 6.739674470593831e-06, + "loss": 0.659, + "step": 17486 + }, + { + "epoch": 0.61, + "learning_rate": 6.738645122304959e-06, + "loss": 0.634, + "step": 17487 + }, + { + "epoch": 0.61, + "learning_rate": 6.7376158126835775e-06, + "loss": 0.6155, + "step": 17488 + }, + { + "epoch": 0.61, + "learning_rate": 6.736586541741884e-06, + "loss": 0.6274, + "step": 17489 + }, + { + "epoch": 0.61, + "learning_rate": 6.735557309492087e-06, + "loss": 0.6061, + "step": 17490 + }, + { + "epoch": 0.61, + "learning_rate": 6.734528115946388e-06, + "loss": 0.6894, + "step": 17491 + }, + { + "epoch": 0.61, + "learning_rate": 6.733498961116986e-06, + "loss": 0.6645, + "step": 17492 + }, + { + "epoch": 0.61, + "learning_rate": 6.732469845016089e-06, + "loss": 0.698, + "step": 17493 + }, + { + "epoch": 0.61, + "learning_rate": 6.7314407676558955e-06, + "loss": 0.6315, + "step": 17494 + }, + { + "epoch": 0.61, + "learning_rate": 6.730411729048605e-06, + "loss": 0.6778, + "step": 17495 + }, + { + "epoch": 0.61, + "learning_rate": 6.729382729206419e-06, + "loss": 0.6722, + "step": 17496 + }, + { + "epoch": 0.61, + "learning_rate": 6.7283537681415416e-06, + "loss": 0.6518, + "step": 17497 + }, + { + "epoch": 0.61, + "learning_rate": 6.727324845866166e-06, + "loss": 0.605, + "step": 17498 + }, + { + "epoch": 0.61, + "learning_rate": 6.726295962392493e-06, + "loss": 0.6284, + "step": 17499 + }, + { + "epoch": 0.61, + "learning_rate": 6.725267117732726e-06, + "loss": 0.645, + "step": 17500 + }, + { + "epoch": 0.61, + "learning_rate": 6.724238311899058e-06, + "loss": 0.6187, + "step": 17501 + }, + { + "epoch": 0.61, + "learning_rate": 6.723209544903689e-06, + "loss": 0.6381, + "step": 17502 + }, + { + "epoch": 0.61, + "learning_rate": 6.722180816758817e-06, + "loss": 0.6317, + "step": 17503 + }, + { + "epoch": 0.61, + "learning_rate": 6.721152127476635e-06, + "loss": 0.6458, + "step": 17504 + }, + { + "epoch": 0.61, + "learning_rate": 6.720123477069345e-06, + "loss": 0.6263, + "step": 17505 + }, + { + "epoch": 0.61, + "learning_rate": 6.719094865549141e-06, + "loss": 0.6118, + "step": 17506 + }, + { + "epoch": 0.61, + "learning_rate": 6.718066292928214e-06, + "loss": 0.6431, + "step": 17507 + }, + { + "epoch": 0.61, + "learning_rate": 6.717037759218765e-06, + "loss": 0.5734, + "step": 17508 + }, + { + "epoch": 0.61, + "learning_rate": 6.7160092644329875e-06, + "loss": 0.5988, + "step": 17509 + }, + { + "epoch": 0.61, + "learning_rate": 6.714980808583071e-06, + "loss": 0.6262, + "step": 17510 + }, + { + "epoch": 0.61, + "learning_rate": 6.7139523916812154e-06, + "loss": 0.6057, + "step": 17511 + }, + { + "epoch": 0.61, + "learning_rate": 6.7129240137396125e-06, + "loss": 0.6198, + "step": 17512 + }, + { + "epoch": 0.61, + "learning_rate": 6.71189567477045e-06, + "loss": 0.6532, + "step": 17513 + }, + { + "epoch": 0.61, + "learning_rate": 6.710867374785929e-06, + "loss": 0.6365, + "step": 17514 + }, + { + "epoch": 0.61, + "learning_rate": 6.709839113798229e-06, + "loss": 0.6877, + "step": 17515 + }, + { + "epoch": 0.61, + "learning_rate": 6.708810891819551e-06, + "loss": 0.6188, + "step": 17516 + }, + { + "epoch": 0.61, + "learning_rate": 6.707782708862087e-06, + "loss": 0.5743, + "step": 17517 + }, + { + "epoch": 0.61, + "learning_rate": 6.7067545649380185e-06, + "loss": 0.6271, + "step": 17518 + }, + { + "epoch": 0.61, + "learning_rate": 6.705726460059543e-06, + "loss": 0.6757, + "step": 17519 + }, + { + "epoch": 0.61, + "learning_rate": 6.70469839423885e-06, + "loss": 0.6265, + "step": 17520 + }, + { + "epoch": 0.61, + "learning_rate": 6.70367036748812e-06, + "loss": 0.6115, + "step": 17521 + }, + { + "epoch": 0.61, + "learning_rate": 6.702642379819551e-06, + "loss": 0.6588, + "step": 17522 + }, + { + "epoch": 0.61, + "learning_rate": 6.701614431245331e-06, + "loss": 0.6608, + "step": 17523 + }, + { + "epoch": 0.61, + "learning_rate": 6.700586521777639e-06, + "loss": 0.6151, + "step": 17524 + }, + { + "epoch": 0.61, + "learning_rate": 6.699558651428668e-06, + "loss": 0.5909, + "step": 17525 + }, + { + "epoch": 0.61, + "learning_rate": 6.69853082021061e-06, + "loss": 0.6779, + "step": 17526 + }, + { + "epoch": 0.61, + "learning_rate": 6.697503028135639e-06, + "loss": 0.6585, + "step": 17527 + }, + { + "epoch": 0.61, + "learning_rate": 6.69647527521595e-06, + "loss": 0.6502, + "step": 17528 + }, + { + "epoch": 0.61, + "learning_rate": 6.695447561463728e-06, + "loss": 0.612, + "step": 17529 + }, + { + "epoch": 0.61, + "learning_rate": 6.69441988689115e-06, + "loss": 0.6242, + "step": 17530 + }, + { + "epoch": 0.61, + "learning_rate": 6.693392251510409e-06, + "loss": 0.6951, + "step": 17531 + }, + { + "epoch": 0.61, + "learning_rate": 6.6923646553336885e-06, + "loss": 0.6559, + "step": 17532 + }, + { + "epoch": 0.61, + "learning_rate": 6.691337098373163e-06, + "loss": 0.6274, + "step": 17533 + }, + { + "epoch": 0.61, + "learning_rate": 6.690309580641025e-06, + "loss": 0.605, + "step": 17534 + }, + { + "epoch": 0.61, + "learning_rate": 6.6892821021494566e-06, + "loss": 0.5955, + "step": 17535 + }, + { + "epoch": 0.61, + "learning_rate": 6.688254662910632e-06, + "loss": 0.6372, + "step": 17536 + }, + { + "epoch": 0.61, + "learning_rate": 6.687227262936739e-06, + "loss": 0.5825, + "step": 17537 + }, + { + "epoch": 0.61, + "learning_rate": 6.6861999022399605e-06, + "loss": 0.6076, + "step": 17538 + }, + { + "epoch": 0.61, + "learning_rate": 6.685172580832468e-06, + "loss": 0.6765, + "step": 17539 + }, + { + "epoch": 0.61, + "learning_rate": 6.684145298726452e-06, + "loss": 0.6394, + "step": 17540 + }, + { + "epoch": 0.61, + "learning_rate": 6.683118055934091e-06, + "loss": 0.6417, + "step": 17541 + }, + { + "epoch": 0.61, + "learning_rate": 6.682090852467556e-06, + "loss": 0.639, + "step": 17542 + }, + { + "epoch": 0.61, + "learning_rate": 6.681063688339032e-06, + "loss": 0.5924, + "step": 17543 + }, + { + "epoch": 0.61, + "learning_rate": 6.680036563560701e-06, + "loss": 0.6012, + "step": 17544 + }, + { + "epoch": 0.61, + "learning_rate": 6.67900947814473e-06, + "loss": 0.5833, + "step": 17545 + }, + { + "epoch": 0.61, + "learning_rate": 6.677982432103305e-06, + "loss": 0.6109, + "step": 17546 + }, + { + "epoch": 0.61, + "learning_rate": 6.676955425448605e-06, + "loss": 0.5765, + "step": 17547 + }, + { + "epoch": 0.61, + "learning_rate": 6.675928458192795e-06, + "loss": 0.601, + "step": 17548 + }, + { + "epoch": 0.61, + "learning_rate": 6.674901530348062e-06, + "loss": 0.6092, + "step": 17549 + }, + { + "epoch": 0.61, + "learning_rate": 6.67387464192658e-06, + "loss": 0.6449, + "step": 17550 + }, + { + "epoch": 0.61, + "learning_rate": 6.672847792940515e-06, + "loss": 0.6457, + "step": 17551 + }, + { + "epoch": 0.61, + "learning_rate": 6.671820983402052e-06, + "loss": 0.6622, + "step": 17552 + }, + { + "epoch": 0.61, + "learning_rate": 6.670794213323365e-06, + "loss": 0.6035, + "step": 17553 + }, + { + "epoch": 0.61, + "learning_rate": 6.669767482716618e-06, + "loss": 0.6371, + "step": 17554 + }, + { + "epoch": 0.61, + "learning_rate": 6.668740791593992e-06, + "loss": 0.6042, + "step": 17555 + }, + { + "epoch": 0.61, + "learning_rate": 6.6677141399676626e-06, + "loss": 0.5917, + "step": 17556 + }, + { + "epoch": 0.61, + "learning_rate": 6.666687527849791e-06, + "loss": 0.6698, + "step": 17557 + }, + { + "epoch": 0.61, + "learning_rate": 6.665660955252557e-06, + "loss": 0.6151, + "step": 17558 + }, + { + "epoch": 0.61, + "learning_rate": 6.664634422188134e-06, + "loss": 0.644, + "step": 17559 + }, + { + "epoch": 0.61, + "learning_rate": 6.663607928668685e-06, + "loss": 0.6264, + "step": 17560 + }, + { + "epoch": 0.61, + "learning_rate": 6.662581474706385e-06, + "loss": 0.6872, + "step": 17561 + }, + { + "epoch": 0.61, + "learning_rate": 6.661555060313407e-06, + "loss": 0.62, + "step": 17562 + }, + { + "epoch": 0.61, + "learning_rate": 6.6605286855019125e-06, + "loss": 0.6473, + "step": 17563 + }, + { + "epoch": 0.61, + "learning_rate": 6.659502350284076e-06, + "loss": 0.6489, + "step": 17564 + }, + { + "epoch": 0.61, + "learning_rate": 6.6584760546720694e-06, + "loss": 0.6034, + "step": 17565 + }, + { + "epoch": 0.61, + "learning_rate": 6.6574497986780495e-06, + "loss": 0.6373, + "step": 17566 + }, + { + "epoch": 0.61, + "learning_rate": 6.656423582314193e-06, + "loss": 0.6377, + "step": 17567 + }, + { + "epoch": 0.61, + "learning_rate": 6.6553974055926694e-06, + "loss": 0.6393, + "step": 17568 + }, + { + "epoch": 0.61, + "learning_rate": 6.654371268525632e-06, + "loss": 0.6006, + "step": 17569 + }, + { + "epoch": 0.61, + "learning_rate": 6.653345171125261e-06, + "loss": 0.6113, + "step": 17570 + }, + { + "epoch": 0.61, + "learning_rate": 6.652319113403718e-06, + "loss": 0.6262, + "step": 17571 + }, + { + "epoch": 0.61, + "learning_rate": 6.6512930953731614e-06, + "loss": 0.6687, + "step": 17572 + }, + { + "epoch": 0.61, + "learning_rate": 6.650267117045763e-06, + "loss": 0.6622, + "step": 17573 + }, + { + "epoch": 0.61, + "learning_rate": 6.64924117843369e-06, + "loss": 0.6826, + "step": 17574 + }, + { + "epoch": 0.61, + "learning_rate": 6.648215279549095e-06, + "loss": 0.5894, + "step": 17575 + }, + { + "epoch": 0.61, + "learning_rate": 6.64718942040415e-06, + "loss": 0.6357, + "step": 17576 + }, + { + "epoch": 0.61, + "learning_rate": 6.6461636010110195e-06, + "loss": 0.6043, + "step": 17577 + }, + { + "epoch": 0.61, + "learning_rate": 6.645137821381858e-06, + "loss": 0.6767, + "step": 17578 + }, + { + "epoch": 0.61, + "learning_rate": 6.6441120815288354e-06, + "loss": 0.6269, + "step": 17579 + }, + { + "epoch": 0.61, + "learning_rate": 6.643086381464106e-06, + "loss": 0.6174, + "step": 17580 + }, + { + "epoch": 0.61, + "learning_rate": 6.6420607211998325e-06, + "loss": 0.633, + "step": 17581 + }, + { + "epoch": 0.61, + "learning_rate": 6.641035100748182e-06, + "loss": 0.5701, + "step": 17582 + }, + { + "epoch": 0.61, + "learning_rate": 6.640009520121307e-06, + "loss": 0.6379, + "step": 17583 + }, + { + "epoch": 0.61, + "learning_rate": 6.638983979331366e-06, + "loss": 0.6118, + "step": 17584 + }, + { + "epoch": 0.61, + "learning_rate": 6.637958478390527e-06, + "loss": 0.6438, + "step": 17585 + }, + { + "epoch": 0.61, + "learning_rate": 6.6369330173109405e-06, + "loss": 0.6707, + "step": 17586 + }, + { + "epoch": 0.61, + "learning_rate": 6.635907596104766e-06, + "loss": 0.6208, + "step": 17587 + }, + { + "epoch": 0.61, + "learning_rate": 6.6348822147841686e-06, + "loss": 0.6147, + "step": 17588 + }, + { + "epoch": 0.61, + "learning_rate": 6.633856873361293e-06, + "loss": 0.6357, + "step": 17589 + }, + { + "epoch": 0.61, + "learning_rate": 6.632831571848302e-06, + "loss": 0.6676, + "step": 17590 + }, + { + "epoch": 0.61, + "learning_rate": 6.631806310257358e-06, + "loss": 0.5974, + "step": 17591 + }, + { + "epoch": 0.61, + "learning_rate": 6.630781088600608e-06, + "loss": 0.6069, + "step": 17592 + }, + { + "epoch": 0.61, + "learning_rate": 6.6297559068902074e-06, + "loss": 0.6333, + "step": 17593 + }, + { + "epoch": 0.61, + "learning_rate": 6.628730765138321e-06, + "loss": 0.6293, + "step": 17594 + }, + { + "epoch": 0.61, + "learning_rate": 6.6277056633570904e-06, + "loss": 0.684, + "step": 17595 + }, + { + "epoch": 0.61, + "learning_rate": 6.626680601558674e-06, + "loss": 0.6147, + "step": 17596 + }, + { + "epoch": 0.61, + "learning_rate": 6.625655579755232e-06, + "loss": 0.6885, + "step": 17597 + }, + { + "epoch": 0.61, + "learning_rate": 6.624630597958907e-06, + "loss": 0.7076, + "step": 17598 + }, + { + "epoch": 0.61, + "learning_rate": 6.623605656181855e-06, + "loss": 0.684, + "step": 17599 + }, + { + "epoch": 0.61, + "learning_rate": 6.6225807544362366e-06, + "loss": 0.5813, + "step": 17600 + }, + { + "epoch": 0.61, + "learning_rate": 6.6215558927341895e-06, + "loss": 0.6182, + "step": 17601 + }, + { + "epoch": 0.61, + "learning_rate": 6.6205310710878705e-06, + "loss": 0.6254, + "step": 17602 + }, + { + "epoch": 0.61, + "learning_rate": 6.619506289509435e-06, + "loss": 0.6521, + "step": 17603 + }, + { + "epoch": 0.61, + "learning_rate": 6.6184815480110265e-06, + "loss": 0.6675, + "step": 17604 + }, + { + "epoch": 0.61, + "learning_rate": 6.617456846604793e-06, + "loss": 0.6017, + "step": 17605 + }, + { + "epoch": 0.61, + "learning_rate": 6.616432185302895e-06, + "loss": 0.6236, + "step": 17606 + }, + { + "epoch": 0.61, + "learning_rate": 6.61540756411747e-06, + "loss": 0.6182, + "step": 17607 + }, + { + "epoch": 0.61, + "learning_rate": 6.614382983060667e-06, + "loss": 0.6288, + "step": 17608 + }, + { + "epoch": 0.61, + "learning_rate": 6.613358442144643e-06, + "loss": 0.666, + "step": 17609 + }, + { + "epoch": 0.61, + "learning_rate": 6.6123339413815345e-06, + "loss": 0.6447, + "step": 17610 + }, + { + "epoch": 0.61, + "learning_rate": 6.61130948078349e-06, + "loss": 0.6459, + "step": 17611 + }, + { + "epoch": 0.61, + "learning_rate": 6.610285060362665e-06, + "loss": 0.6545, + "step": 17612 + }, + { + "epoch": 0.61, + "learning_rate": 6.609260680131195e-06, + "loss": 0.6215, + "step": 17613 + }, + { + "epoch": 0.61, + "learning_rate": 6.608236340101226e-06, + "loss": 0.6501, + "step": 17614 + }, + { + "epoch": 0.61, + "learning_rate": 6.607212040284913e-06, + "loss": 0.6556, + "step": 17615 + }, + { + "epoch": 0.61, + "learning_rate": 6.606187780694389e-06, + "loss": 0.6412, + "step": 17616 + }, + { + "epoch": 0.61, + "learning_rate": 6.605163561341798e-06, + "loss": 0.6339, + "step": 17617 + }, + { + "epoch": 0.61, + "learning_rate": 6.604139382239296e-06, + "loss": 0.6383, + "step": 17618 + }, + { + "epoch": 0.61, + "learning_rate": 6.603115243399012e-06, + "loss": 0.6344, + "step": 17619 + }, + { + "epoch": 0.61, + "learning_rate": 6.602091144833092e-06, + "loss": 0.5936, + "step": 17620 + }, + { + "epoch": 0.61, + "learning_rate": 6.601067086553687e-06, + "loss": 0.605, + "step": 17621 + }, + { + "epoch": 0.61, + "learning_rate": 6.600043068572926e-06, + "loss": 0.633, + "step": 17622 + }, + { + "epoch": 0.61, + "learning_rate": 6.5990190909029535e-06, + "loss": 0.6525, + "step": 17623 + }, + { + "epoch": 0.61, + "learning_rate": 6.597995153555919e-06, + "loss": 0.662, + "step": 17624 + }, + { + "epoch": 0.61, + "learning_rate": 6.5969712565439515e-06, + "loss": 0.6407, + "step": 17625 + }, + { + "epoch": 0.61, + "learning_rate": 6.595947399879191e-06, + "loss": 0.6498, + "step": 17626 + }, + { + "epoch": 0.61, + "learning_rate": 6.594923583573787e-06, + "loss": 0.6659, + "step": 17627 + }, + { + "epoch": 0.61, + "learning_rate": 6.593899807639868e-06, + "loss": 0.6472, + "step": 17628 + }, + { + "epoch": 0.61, + "learning_rate": 6.592876072089573e-06, + "loss": 0.6446, + "step": 17629 + }, + { + "epoch": 0.61, + "learning_rate": 6.5918523769350485e-06, + "loss": 0.6653, + "step": 17630 + }, + { + "epoch": 0.61, + "learning_rate": 6.59082872218842e-06, + "loss": 0.6583, + "step": 17631 + }, + { + "epoch": 0.61, + "learning_rate": 6.58980510786183e-06, + "loss": 0.6212, + "step": 17632 + }, + { + "epoch": 0.61, + "learning_rate": 6.5887815339674185e-06, + "loss": 0.6651, + "step": 17633 + }, + { + "epoch": 0.61, + "learning_rate": 6.587758000517314e-06, + "loss": 0.6514, + "step": 17634 + }, + { + "epoch": 0.61, + "learning_rate": 6.5867345075236534e-06, + "loss": 0.6734, + "step": 17635 + }, + { + "epoch": 0.61, + "learning_rate": 6.585711054998578e-06, + "loss": 0.6312, + "step": 17636 + }, + { + "epoch": 0.61, + "learning_rate": 6.584687642954213e-06, + "loss": 0.6094, + "step": 17637 + }, + { + "epoch": 0.61, + "learning_rate": 6.5836642714026946e-06, + "loss": 0.6127, + "step": 17638 + }, + { + "epoch": 0.61, + "learning_rate": 6.582640940356164e-06, + "loss": 0.6393, + "step": 17639 + }, + { + "epoch": 0.61, + "learning_rate": 6.581617649826745e-06, + "loss": 0.6672, + "step": 17640 + }, + { + "epoch": 0.61, + "learning_rate": 6.580594399826574e-06, + "loss": 0.6234, + "step": 17641 + }, + { + "epoch": 0.61, + "learning_rate": 6.5795711903677796e-06, + "loss": 0.6508, + "step": 17642 + }, + { + "epoch": 0.61, + "learning_rate": 6.578548021462496e-06, + "loss": 0.6432, + "step": 17643 + }, + { + "epoch": 0.61, + "learning_rate": 6.577524893122858e-06, + "loss": 0.63, + "step": 17644 + }, + { + "epoch": 0.61, + "learning_rate": 6.576501805360986e-06, + "loss": 0.7267, + "step": 17645 + }, + { + "epoch": 0.61, + "learning_rate": 6.575478758189018e-06, + "loss": 0.6641, + "step": 17646 + }, + { + "epoch": 0.61, + "learning_rate": 6.574455751619083e-06, + "loss": 0.6049, + "step": 17647 + }, + { + "epoch": 0.61, + "learning_rate": 6.5734327856633075e-06, + "loss": 0.5648, + "step": 17648 + }, + { + "epoch": 0.61, + "learning_rate": 6.57240986033382e-06, + "loss": 0.6157, + "step": 17649 + }, + { + "epoch": 0.61, + "learning_rate": 6.571386975642751e-06, + "loss": 0.6743, + "step": 17650 + }, + { + "epoch": 0.61, + "learning_rate": 6.5703641316022246e-06, + "loss": 0.655, + "step": 17651 + }, + { + "epoch": 0.61, + "learning_rate": 6.5693413282243705e-06, + "loss": 0.6255, + "step": 17652 + }, + { + "epoch": 0.61, + "learning_rate": 6.568318565521316e-06, + "loss": 0.6258, + "step": 17653 + }, + { + "epoch": 0.61, + "learning_rate": 6.567295843505185e-06, + "loss": 0.6265, + "step": 17654 + }, + { + "epoch": 0.61, + "learning_rate": 6.566273162188104e-06, + "loss": 0.62, + "step": 17655 + }, + { + "epoch": 0.61, + "learning_rate": 6.5652505215822005e-06, + "loss": 0.6515, + "step": 17656 + }, + { + "epoch": 0.61, + "learning_rate": 6.564227921699594e-06, + "loss": 0.5967, + "step": 17657 + }, + { + "epoch": 0.61, + "learning_rate": 6.563205362552413e-06, + "loss": 0.6054, + "step": 17658 + }, + { + "epoch": 0.61, + "learning_rate": 6.5621828441527815e-06, + "loss": 0.6272, + "step": 17659 + }, + { + "epoch": 0.61, + "learning_rate": 6.561160366512819e-06, + "loss": 0.6804, + "step": 17660 + }, + { + "epoch": 0.61, + "learning_rate": 6.56013792964465e-06, + "loss": 0.6934, + "step": 17661 + }, + { + "epoch": 0.61, + "learning_rate": 6.5591155335604e-06, + "loss": 0.6376, + "step": 17662 + }, + { + "epoch": 0.61, + "learning_rate": 6.558093178272187e-06, + "loss": 0.6384, + "step": 17663 + }, + { + "epoch": 0.61, + "learning_rate": 6.557070863792132e-06, + "loss": 0.6584, + "step": 17664 + }, + { + "epoch": 0.61, + "learning_rate": 6.55604859013236e-06, + "loss": 0.5966, + "step": 17665 + }, + { + "epoch": 0.61, + "learning_rate": 6.555026357304986e-06, + "loss": 0.6708, + "step": 17666 + }, + { + "epoch": 0.61, + "learning_rate": 6.5540041653221334e-06, + "loss": 0.6222, + "step": 17667 + }, + { + "epoch": 0.61, + "learning_rate": 6.552982014195921e-06, + "loss": 0.6003, + "step": 17668 + }, + { + "epoch": 0.61, + "learning_rate": 6.551959903938468e-06, + "loss": 0.6305, + "step": 17669 + }, + { + "epoch": 0.61, + "learning_rate": 6.550937834561889e-06, + "loss": 0.6479, + "step": 17670 + }, + { + "epoch": 0.61, + "learning_rate": 6.549915806078309e-06, + "loss": 0.6365, + "step": 17671 + }, + { + "epoch": 0.61, + "learning_rate": 6.548893818499839e-06, + "loss": 0.6118, + "step": 17672 + }, + { + "epoch": 0.61, + "learning_rate": 6.547871871838598e-06, + "loss": 0.6171, + "step": 17673 + }, + { + "epoch": 0.61, + "learning_rate": 6.546849966106705e-06, + "loss": 0.5966, + "step": 17674 + }, + { + "epoch": 0.61, + "learning_rate": 6.545828101316273e-06, + "loss": 0.7067, + "step": 17675 + }, + { + "epoch": 0.61, + "learning_rate": 6.5448062774794175e-06, + "loss": 0.61, + "step": 17676 + }, + { + "epoch": 0.61, + "learning_rate": 6.543784494608256e-06, + "loss": 0.6273, + "step": 17677 + }, + { + "epoch": 0.61, + "learning_rate": 6.542762752714901e-06, + "loss": 0.6237, + "step": 17678 + }, + { + "epoch": 0.61, + "learning_rate": 6.5417410518114655e-06, + "loss": 0.5987, + "step": 17679 + }, + { + "epoch": 0.61, + "learning_rate": 6.540719391910068e-06, + "loss": 0.6584, + "step": 17680 + }, + { + "epoch": 0.61, + "learning_rate": 6.539697773022815e-06, + "loss": 0.604, + "step": 17681 + }, + { + "epoch": 0.61, + "learning_rate": 6.538676195161821e-06, + "loss": 0.6601, + "step": 17682 + }, + { + "epoch": 0.61, + "learning_rate": 6.537654658339204e-06, + "loss": 0.5864, + "step": 17683 + }, + { + "epoch": 0.61, + "learning_rate": 6.536633162567067e-06, + "loss": 0.626, + "step": 17684 + }, + { + "epoch": 0.61, + "learning_rate": 6.535611707857527e-06, + "loss": 0.6325, + "step": 17685 + }, + { + "epoch": 0.61, + "learning_rate": 6.534590294222693e-06, + "loss": 0.6233, + "step": 17686 + }, + { + "epoch": 0.61, + "learning_rate": 6.533568921674673e-06, + "loss": 0.6599, + "step": 17687 + }, + { + "epoch": 0.61, + "learning_rate": 6.532547590225578e-06, + "loss": 0.6194, + "step": 17688 + }, + { + "epoch": 0.61, + "learning_rate": 6.531526299887521e-06, + "loss": 0.6645, + "step": 17689 + }, + { + "epoch": 0.61, + "learning_rate": 6.530505050672604e-06, + "loss": 0.6437, + "step": 17690 + }, + { + "epoch": 0.61, + "learning_rate": 6.52948384259294e-06, + "loss": 0.6236, + "step": 17691 + }, + { + "epoch": 0.61, + "learning_rate": 6.528462675660636e-06, + "loss": 0.6278, + "step": 17692 + }, + { + "epoch": 0.61, + "learning_rate": 6.5274415498877975e-06, + "loss": 0.67, + "step": 17693 + }, + { + "epoch": 0.61, + "learning_rate": 6.526420465286532e-06, + "loss": 0.6417, + "step": 17694 + }, + { + "epoch": 0.61, + "learning_rate": 6.525399421868948e-06, + "loss": 0.6168, + "step": 17695 + }, + { + "epoch": 0.61, + "learning_rate": 6.524378419647146e-06, + "loss": 0.6358, + "step": 17696 + }, + { + "epoch": 0.61, + "learning_rate": 6.523357458633237e-06, + "loss": 0.6456, + "step": 17697 + }, + { + "epoch": 0.61, + "learning_rate": 6.522336538839324e-06, + "loss": 0.6466, + "step": 17698 + }, + { + "epoch": 0.61, + "learning_rate": 6.521315660277508e-06, + "loss": 0.5973, + "step": 17699 + }, + { + "epoch": 0.61, + "learning_rate": 6.520294822959896e-06, + "loss": 0.6708, + "step": 17700 + }, + { + "epoch": 0.61, + "learning_rate": 6.519274026898592e-06, + "loss": 0.6263, + "step": 17701 + }, + { + "epoch": 0.61, + "learning_rate": 6.518253272105697e-06, + "loss": 0.6553, + "step": 17702 + }, + { + "epoch": 0.61, + "learning_rate": 6.517232558593314e-06, + "loss": 0.6244, + "step": 17703 + }, + { + "epoch": 0.61, + "learning_rate": 6.516211886373545e-06, + "loss": 0.687, + "step": 17704 + }, + { + "epoch": 0.61, + "learning_rate": 6.515191255458489e-06, + "loss": 0.6059, + "step": 17705 + }, + { + "epoch": 0.61, + "learning_rate": 6.514170665860251e-06, + "loss": 0.6115, + "step": 17706 + }, + { + "epoch": 0.61, + "learning_rate": 6.513150117590929e-06, + "loss": 0.6498, + "step": 17707 + }, + { + "epoch": 0.61, + "learning_rate": 6.512129610662623e-06, + "loss": 0.645, + "step": 17708 + }, + { + "epoch": 0.61, + "learning_rate": 6.511109145087433e-06, + "loss": 0.6419, + "step": 17709 + }, + { + "epoch": 0.61, + "learning_rate": 6.510088720877457e-06, + "loss": 0.6881, + "step": 17710 + }, + { + "epoch": 0.61, + "learning_rate": 6.509068338044794e-06, + "loss": 0.6866, + "step": 17711 + }, + { + "epoch": 0.61, + "learning_rate": 6.508047996601543e-06, + "loss": 0.5954, + "step": 17712 + }, + { + "epoch": 0.61, + "learning_rate": 6.507027696559799e-06, + "loss": 0.6581, + "step": 17713 + }, + { + "epoch": 0.61, + "learning_rate": 6.506007437931661e-06, + "loss": 0.6275, + "step": 17714 + }, + { + "epoch": 0.61, + "learning_rate": 6.504987220729225e-06, + "loss": 0.6208, + "step": 17715 + }, + { + "epoch": 0.61, + "learning_rate": 6.503967044964585e-06, + "loss": 0.6264, + "step": 17716 + }, + { + "epoch": 0.61, + "learning_rate": 6.502946910649839e-06, + "loss": 0.6423, + "step": 17717 + }, + { + "epoch": 0.61, + "learning_rate": 6.501926817797084e-06, + "loss": 0.6142, + "step": 17718 + }, + { + "epoch": 0.61, + "learning_rate": 6.500906766418408e-06, + "loss": 0.6744, + "step": 17719 + }, + { + "epoch": 0.61, + "learning_rate": 6.499886756525909e-06, + "loss": 0.7066, + "step": 17720 + }, + { + "epoch": 0.61, + "learning_rate": 6.498866788131684e-06, + "loss": 0.6359, + "step": 17721 + }, + { + "epoch": 0.61, + "learning_rate": 6.497846861247818e-06, + "loss": 0.6071, + "step": 17722 + }, + { + "epoch": 0.61, + "learning_rate": 6.496826975886408e-06, + "loss": 0.5949, + "step": 17723 + }, + { + "epoch": 0.61, + "learning_rate": 6.495807132059549e-06, + "loss": 0.6795, + "step": 17724 + }, + { + "epoch": 0.61, + "learning_rate": 6.4947873297793255e-06, + "loss": 0.6223, + "step": 17725 + }, + { + "epoch": 0.61, + "learning_rate": 6.493767569057833e-06, + "loss": 0.5776, + "step": 17726 + }, + { + "epoch": 0.61, + "learning_rate": 6.492747849907164e-06, + "loss": 0.6408, + "step": 17727 + }, + { + "epoch": 0.61, + "learning_rate": 6.491728172339402e-06, + "loss": 0.583, + "step": 17728 + }, + { + "epoch": 0.61, + "learning_rate": 6.490708536366643e-06, + "loss": 0.6322, + "step": 17729 + }, + { + "epoch": 0.61, + "learning_rate": 6.489688942000975e-06, + "loss": 0.6473, + "step": 17730 + }, + { + "epoch": 0.61, + "learning_rate": 6.488669389254483e-06, + "loss": 0.608, + "step": 17731 + }, + { + "epoch": 0.61, + "learning_rate": 6.487649878139256e-06, + "loss": 0.6452, + "step": 17732 + }, + { + "epoch": 0.61, + "learning_rate": 6.486630408667386e-06, + "loss": 0.6567, + "step": 17733 + }, + { + "epoch": 0.61, + "learning_rate": 6.4856109808509545e-06, + "loss": 0.6912, + "step": 17734 + }, + { + "epoch": 0.61, + "learning_rate": 6.484591594702051e-06, + "loss": 0.669, + "step": 17735 + }, + { + "epoch": 0.61, + "learning_rate": 6.483572250232764e-06, + "loss": 0.6363, + "step": 17736 + }, + { + "epoch": 0.61, + "learning_rate": 6.482552947455172e-06, + "loss": 0.6089, + "step": 17737 + }, + { + "epoch": 0.61, + "learning_rate": 6.481533686381366e-06, + "loss": 0.6559, + "step": 17738 + }, + { + "epoch": 0.61, + "learning_rate": 6.480514467023431e-06, + "loss": 0.5954, + "step": 17739 + }, + { + "epoch": 0.61, + "learning_rate": 6.479495289393447e-06, + "loss": 0.602, + "step": 17740 + }, + { + "epoch": 0.61, + "learning_rate": 6.478476153503499e-06, + "loss": 0.625, + "step": 17741 + }, + { + "epoch": 0.61, + "learning_rate": 6.477457059365674e-06, + "loss": 0.5956, + "step": 17742 + }, + { + "epoch": 0.61, + "learning_rate": 6.47643800699205e-06, + "loss": 0.6198, + "step": 17743 + }, + { + "epoch": 0.61, + "learning_rate": 6.475418996394709e-06, + "loss": 0.6095, + "step": 17744 + }, + { + "epoch": 0.61, + "learning_rate": 6.474400027585736e-06, + "loss": 0.5854, + "step": 17745 + }, + { + "epoch": 0.61, + "learning_rate": 6.473381100577212e-06, + "loss": 0.6284, + "step": 17746 + }, + { + "epoch": 0.61, + "learning_rate": 6.472362215381214e-06, + "loss": 0.6503, + "step": 17747 + }, + { + "epoch": 0.61, + "learning_rate": 6.471343372009826e-06, + "loss": 0.6056, + "step": 17748 + }, + { + "epoch": 0.61, + "learning_rate": 6.470324570475124e-06, + "loss": 0.6414, + "step": 17749 + }, + { + "epoch": 0.61, + "learning_rate": 6.4693058107891905e-06, + "loss": 0.6234, + "step": 17750 + }, + { + "epoch": 0.62, + "learning_rate": 6.468287092964105e-06, + "loss": 0.5816, + "step": 17751 + }, + { + "epoch": 0.62, + "learning_rate": 6.467268417011941e-06, + "loss": 0.6531, + "step": 17752 + }, + { + "epoch": 0.62, + "learning_rate": 6.4662497829447776e-06, + "loss": 0.6344, + "step": 17753 + }, + { + "epoch": 0.62, + "learning_rate": 6.465231190774698e-06, + "loss": 0.6364, + "step": 17754 + }, + { + "epoch": 0.62, + "learning_rate": 6.46421264051377e-06, + "loss": 0.6527, + "step": 17755 + }, + { + "epoch": 0.62, + "learning_rate": 6.463194132174075e-06, + "loss": 0.6515, + "step": 17756 + }, + { + "epoch": 0.62, + "learning_rate": 6.4621756657676895e-06, + "loss": 0.637, + "step": 17757 + }, + { + "epoch": 0.62, + "learning_rate": 6.461157241306685e-06, + "loss": 0.6179, + "step": 17758 + }, + { + "epoch": 0.62, + "learning_rate": 6.4601388588031375e-06, + "loss": 0.6542, + "step": 17759 + }, + { + "epoch": 0.62, + "learning_rate": 6.459120518269124e-06, + "loss": 0.5916, + "step": 17760 + }, + { + "epoch": 0.62, + "learning_rate": 6.458102219716713e-06, + "loss": 0.6721, + "step": 17761 + }, + { + "epoch": 0.62, + "learning_rate": 6.457083963157982e-06, + "loss": 0.6035, + "step": 17762 + }, + { + "epoch": 0.62, + "learning_rate": 6.456065748605005e-06, + "loss": 0.6379, + "step": 17763 + }, + { + "epoch": 0.62, + "learning_rate": 6.455047576069849e-06, + "loss": 0.6374, + "step": 17764 + }, + { + "epoch": 0.62, + "learning_rate": 6.454029445564591e-06, + "loss": 0.5721, + "step": 17765 + }, + { + "epoch": 0.62, + "learning_rate": 6.453011357101295e-06, + "loss": 0.6202, + "step": 17766 + }, + { + "epoch": 0.62, + "learning_rate": 6.4519933106920385e-06, + "loss": 0.6332, + "step": 17767 + }, + { + "epoch": 0.62, + "learning_rate": 6.4509753063488934e-06, + "loss": 0.6507, + "step": 17768 + }, + { + "epoch": 0.62, + "learning_rate": 6.449957344083919e-06, + "loss": 0.5545, + "step": 17769 + }, + { + "epoch": 0.62, + "learning_rate": 6.448939423909193e-06, + "loss": 0.6396, + "step": 17770 + }, + { + "epoch": 0.62, + "learning_rate": 6.447921545836788e-06, + "loss": 0.6553, + "step": 17771 + }, + { + "epoch": 0.62, + "learning_rate": 6.4469037098787576e-06, + "loss": 0.6258, + "step": 17772 + }, + { + "epoch": 0.62, + "learning_rate": 6.445885916047183e-06, + "loss": 0.6077, + "step": 17773 + }, + { + "epoch": 0.62, + "learning_rate": 6.44486816435413e-06, + "loss": 0.6488, + "step": 17774 + }, + { + "epoch": 0.62, + "learning_rate": 6.443850454811655e-06, + "loss": 0.6115, + "step": 17775 + }, + { + "epoch": 0.62, + "learning_rate": 6.442832787431835e-06, + "loss": 0.6814, + "step": 17776 + }, + { + "epoch": 0.62, + "learning_rate": 6.441815162226737e-06, + "loss": 0.5696, + "step": 17777 + }, + { + "epoch": 0.62, + "learning_rate": 6.440797579208413e-06, + "loss": 0.6594, + "step": 17778 + }, + { + "epoch": 0.62, + "learning_rate": 6.4397800383889384e-06, + "loss": 0.6622, + "step": 17779 + }, + { + "epoch": 0.62, + "learning_rate": 6.438762539780381e-06, + "loss": 0.63, + "step": 17780 + }, + { + "epoch": 0.62, + "learning_rate": 6.437745083394791e-06, + "loss": 0.6695, + "step": 17781 + }, + { + "epoch": 0.62, + "learning_rate": 6.436727669244241e-06, + "loss": 0.6653, + "step": 17782 + }, + { + "epoch": 0.62, + "learning_rate": 6.435710297340798e-06, + "loss": 0.6671, + "step": 17783 + }, + { + "epoch": 0.62, + "learning_rate": 6.43469296769651e-06, + "loss": 0.6332, + "step": 17784 + }, + { + "epoch": 0.62, + "learning_rate": 6.43367568032345e-06, + "loss": 0.5894, + "step": 17785 + }, + { + "epoch": 0.62, + "learning_rate": 6.432658435233681e-06, + "loss": 0.6141, + "step": 17786 + }, + { + "epoch": 0.62, + "learning_rate": 6.431641232439252e-06, + "loss": 0.5973, + "step": 17787 + }, + { + "epoch": 0.62, + "learning_rate": 6.4306240719522315e-06, + "loss": 0.6262, + "step": 17788 + }, + { + "epoch": 0.62, + "learning_rate": 6.429606953784684e-06, + "loss": 0.6737, + "step": 17789 + }, + { + "epoch": 0.62, + "learning_rate": 6.428589877948656e-06, + "loss": 0.6762, + "step": 17790 + }, + { + "epoch": 0.62, + "learning_rate": 6.427572844456214e-06, + "loss": 0.6054, + "step": 17791 + }, + { + "epoch": 0.62, + "learning_rate": 6.42655585331942e-06, + "loss": 0.562, + "step": 17792 + }, + { + "epoch": 0.62, + "learning_rate": 6.425538904550319e-06, + "loss": 0.659, + "step": 17793 + }, + { + "epoch": 0.62, + "learning_rate": 6.42452199816098e-06, + "loss": 0.6595, + "step": 17794 + }, + { + "epoch": 0.62, + "learning_rate": 6.423505134163459e-06, + "loss": 0.6599, + "step": 17795 + }, + { + "epoch": 0.62, + "learning_rate": 6.422488312569803e-06, + "loss": 0.6463, + "step": 17796 + }, + { + "epoch": 0.62, + "learning_rate": 6.421471533392075e-06, + "loss": 0.5992, + "step": 17797 + }, + { + "epoch": 0.62, + "learning_rate": 6.4204547966423336e-06, + "loss": 0.5774, + "step": 17798 + }, + { + "epoch": 0.62, + "learning_rate": 6.4194381023326225e-06, + "loss": 0.6253, + "step": 17799 + }, + { + "epoch": 0.62, + "learning_rate": 6.418421450475004e-06, + "loss": 0.6, + "step": 17800 + }, + { + "epoch": 0.62, + "learning_rate": 6.4174048410815335e-06, + "loss": 0.627, + "step": 17801 + }, + { + "epoch": 0.62, + "learning_rate": 6.4163882741642555e-06, + "loss": 0.6128, + "step": 17802 + }, + { + "epoch": 0.62, + "learning_rate": 6.41537174973523e-06, + "loss": 0.604, + "step": 17803 + }, + { + "epoch": 0.62, + "learning_rate": 6.4143552678065105e-06, + "loss": 0.638, + "step": 17804 + }, + { + "epoch": 0.62, + "learning_rate": 6.413338828390139e-06, + "loss": 0.6172, + "step": 17805 + }, + { + "epoch": 0.62, + "learning_rate": 6.412322431498175e-06, + "loss": 0.6139, + "step": 17806 + }, + { + "epoch": 0.62, + "learning_rate": 6.4113060771426715e-06, + "loss": 0.5956, + "step": 17807 + }, + { + "epoch": 0.62, + "learning_rate": 6.410289765335667e-06, + "loss": 0.6071, + "step": 17808 + }, + { + "epoch": 0.62, + "learning_rate": 6.409273496089221e-06, + "loss": 0.6889, + "step": 17809 + }, + { + "epoch": 0.62, + "learning_rate": 6.408257269415383e-06, + "loss": 0.6666, + "step": 17810 + }, + { + "epoch": 0.62, + "learning_rate": 6.407241085326194e-06, + "loss": 0.6175, + "step": 17811 + }, + { + "epoch": 0.62, + "learning_rate": 6.406224943833708e-06, + "loss": 0.6797, + "step": 17812 + }, + { + "epoch": 0.62, + "learning_rate": 6.4052088449499775e-06, + "loss": 0.5861, + "step": 17813 + }, + { + "epoch": 0.62, + "learning_rate": 6.404192788687036e-06, + "loss": 0.6242, + "step": 17814 + }, + { + "epoch": 0.62, + "learning_rate": 6.4031767750569385e-06, + "loss": 0.6271, + "step": 17815 + }, + { + "epoch": 0.62, + "learning_rate": 6.402160804071735e-06, + "loss": 0.6414, + "step": 17816 + }, + { + "epoch": 0.62, + "learning_rate": 6.401144875743461e-06, + "loss": 0.7015, + "step": 17817 + }, + { + "epoch": 0.62, + "learning_rate": 6.400128990084169e-06, + "loss": 0.6642, + "step": 17818 + }, + { + "epoch": 0.62, + "learning_rate": 6.399113147105907e-06, + "loss": 0.6282, + "step": 17819 + }, + { + "epoch": 0.62, + "learning_rate": 6.398097346820706e-06, + "loss": 0.5933, + "step": 17820 + }, + { + "epoch": 0.62, + "learning_rate": 6.397081589240619e-06, + "loss": 0.6421, + "step": 17821 + }, + { + "epoch": 0.62, + "learning_rate": 6.396065874377693e-06, + "loss": 0.601, + "step": 17822 + }, + { + "epoch": 0.62, + "learning_rate": 6.395050202243959e-06, + "loss": 0.6699, + "step": 17823 + }, + { + "epoch": 0.62, + "learning_rate": 6.394034572851466e-06, + "loss": 0.6109, + "step": 17824 + }, + { + "epoch": 0.62, + "learning_rate": 6.393018986212259e-06, + "loss": 0.6555, + "step": 17825 + }, + { + "epoch": 0.62, + "learning_rate": 6.392003442338369e-06, + "loss": 0.6266, + "step": 17826 + }, + { + "epoch": 0.62, + "learning_rate": 6.390987941241849e-06, + "loss": 0.6542, + "step": 17827 + }, + { + "epoch": 0.62, + "learning_rate": 6.389972482934728e-06, + "loss": 0.599, + "step": 17828 + }, + { + "epoch": 0.62, + "learning_rate": 6.388957067429047e-06, + "loss": 0.6618, + "step": 17829 + }, + { + "epoch": 0.62, + "learning_rate": 6.387941694736854e-06, + "loss": 0.6309, + "step": 17830 + }, + { + "epoch": 0.62, + "learning_rate": 6.386926364870178e-06, + "loss": 0.6269, + "step": 17831 + }, + { + "epoch": 0.62, + "learning_rate": 6.385911077841059e-06, + "loss": 0.6502, + "step": 17832 + }, + { + "epoch": 0.62, + "learning_rate": 6.384895833661542e-06, + "loss": 0.5487, + "step": 17833 + }, + { + "epoch": 0.62, + "learning_rate": 6.383880632343653e-06, + "loss": 0.6177, + "step": 17834 + }, + { + "epoch": 0.62, + "learning_rate": 6.382865473899434e-06, + "loss": 0.6528, + "step": 17835 + }, + { + "epoch": 0.62, + "learning_rate": 6.381850358340924e-06, + "loss": 0.6709, + "step": 17836 + }, + { + "epoch": 0.62, + "learning_rate": 6.380835285680151e-06, + "loss": 0.674, + "step": 17837 + }, + { + "epoch": 0.62, + "learning_rate": 6.3798202559291526e-06, + "loss": 0.5911, + "step": 17838 + }, + { + "epoch": 0.62, + "learning_rate": 6.378805269099971e-06, + "loss": 0.6359, + "step": 17839 + }, + { + "epoch": 0.62, + "learning_rate": 6.377790325204629e-06, + "loss": 0.6054, + "step": 17840 + }, + { + "epoch": 0.62, + "learning_rate": 6.376775424255164e-06, + "loss": 0.6234, + "step": 17841 + }, + { + "epoch": 0.62, + "learning_rate": 6.375760566263615e-06, + "loss": 0.6442, + "step": 17842 + }, + { + "epoch": 0.62, + "learning_rate": 6.374745751242004e-06, + "loss": 0.6487, + "step": 17843 + }, + { + "epoch": 0.62, + "learning_rate": 6.373730979202368e-06, + "loss": 0.5905, + "step": 17844 + }, + { + "epoch": 0.62, + "learning_rate": 6.372716250156743e-06, + "loss": 0.6326, + "step": 17845 + }, + { + "epoch": 0.62, + "learning_rate": 6.371701564117152e-06, + "loss": 0.6497, + "step": 17846 + }, + { + "epoch": 0.62, + "learning_rate": 6.370686921095628e-06, + "loss": 0.6278, + "step": 17847 + }, + { + "epoch": 0.62, + "learning_rate": 6.3696723211042054e-06, + "loss": 0.632, + "step": 17848 + }, + { + "epoch": 0.62, + "learning_rate": 6.368657764154908e-06, + "loss": 0.6359, + "step": 17849 + }, + { + "epoch": 0.62, + "learning_rate": 6.367643250259765e-06, + "loss": 0.6147, + "step": 17850 + }, + { + "epoch": 0.62, + "learning_rate": 6.366628779430809e-06, + "loss": 0.6725, + "step": 17851 + }, + { + "epoch": 0.62, + "learning_rate": 6.365614351680063e-06, + "loss": 0.6396, + "step": 17852 + }, + { + "epoch": 0.62, + "learning_rate": 6.364599967019556e-06, + "loss": 0.5996, + "step": 17853 + }, + { + "epoch": 0.62, + "learning_rate": 6.363585625461317e-06, + "loss": 0.6297, + "step": 17854 + }, + { + "epoch": 0.62, + "learning_rate": 6.362571327017368e-06, + "loss": 0.6834, + "step": 17855 + }, + { + "epoch": 0.62, + "learning_rate": 6.361557071699739e-06, + "loss": 0.645, + "step": 17856 + }, + { + "epoch": 0.62, + "learning_rate": 6.360542859520455e-06, + "loss": 0.6271, + "step": 17857 + }, + { + "epoch": 0.62, + "learning_rate": 6.359528690491536e-06, + "loss": 0.6628, + "step": 17858 + }, + { + "epoch": 0.62, + "learning_rate": 6.358514564625011e-06, + "loss": 0.6592, + "step": 17859 + }, + { + "epoch": 0.62, + "learning_rate": 6.357500481932904e-06, + "loss": 0.6691, + "step": 17860 + }, + { + "epoch": 0.62, + "learning_rate": 6.356486442427235e-06, + "loss": 0.6546, + "step": 17861 + }, + { + "epoch": 0.62, + "learning_rate": 6.355472446120028e-06, + "loss": 0.6415, + "step": 17862 + }, + { + "epoch": 0.62, + "learning_rate": 6.354458493023307e-06, + "loss": 0.6094, + "step": 17863 + }, + { + "epoch": 0.62, + "learning_rate": 6.353444583149091e-06, + "loss": 0.5785, + "step": 17864 + }, + { + "epoch": 0.62, + "learning_rate": 6.352430716509401e-06, + "loss": 0.6565, + "step": 17865 + }, + { + "epoch": 0.62, + "learning_rate": 6.351416893116262e-06, + "loss": 0.6251, + "step": 17866 + }, + { + "epoch": 0.62, + "learning_rate": 6.350403112981689e-06, + "loss": 0.6573, + "step": 17867 + }, + { + "epoch": 0.62, + "learning_rate": 6.349389376117705e-06, + "loss": 0.6033, + "step": 17868 + }, + { + "epoch": 0.62, + "learning_rate": 6.348375682536328e-06, + "loss": 0.63, + "step": 17869 + }, + { + "epoch": 0.62, + "learning_rate": 6.347362032249576e-06, + "loss": 0.6451, + "step": 17870 + }, + { + "epoch": 0.62, + "learning_rate": 6.346348425269468e-06, + "loss": 0.614, + "step": 17871 + }, + { + "epoch": 0.62, + "learning_rate": 6.345334861608022e-06, + "loss": 0.6384, + "step": 17872 + }, + { + "epoch": 0.62, + "learning_rate": 6.344321341277253e-06, + "loss": 0.6093, + "step": 17873 + }, + { + "epoch": 0.62, + "learning_rate": 6.343307864289178e-06, + "loss": 0.5925, + "step": 17874 + }, + { + "epoch": 0.62, + "learning_rate": 6.3422944306558175e-06, + "loss": 0.637, + "step": 17875 + }, + { + "epoch": 0.62, + "learning_rate": 6.341281040389182e-06, + "loss": 0.6255, + "step": 17876 + }, + { + "epoch": 0.62, + "learning_rate": 6.340267693501287e-06, + "loss": 0.7493, + "step": 17877 + }, + { + "epoch": 0.62, + "learning_rate": 6.33925439000415e-06, + "loss": 0.618, + "step": 17878 + }, + { + "epoch": 0.62, + "learning_rate": 6.338241129909781e-06, + "loss": 0.6267, + "step": 17879 + }, + { + "epoch": 0.62, + "learning_rate": 6.3372279132301965e-06, + "loss": 0.6391, + "step": 17880 + }, + { + "epoch": 0.62, + "learning_rate": 6.336214739977409e-06, + "loss": 0.6535, + "step": 17881 + }, + { + "epoch": 0.62, + "learning_rate": 6.3352016101634295e-06, + "loss": 0.6384, + "step": 17882 + }, + { + "epoch": 0.62, + "learning_rate": 6.334188523800271e-06, + "loss": 0.625, + "step": 17883 + }, + { + "epoch": 0.62, + "learning_rate": 6.333175480899947e-06, + "loss": 0.6549, + "step": 17884 + }, + { + "epoch": 0.62, + "learning_rate": 6.332162481474463e-06, + "loss": 0.581, + "step": 17885 + }, + { + "epoch": 0.62, + "learning_rate": 6.331149525535833e-06, + "loss": 0.6407, + "step": 17886 + }, + { + "epoch": 0.62, + "learning_rate": 6.330136613096069e-06, + "loss": 0.6189, + "step": 17887 + }, + { + "epoch": 0.62, + "learning_rate": 6.329123744167176e-06, + "loss": 0.674, + "step": 17888 + }, + { + "epoch": 0.62, + "learning_rate": 6.328110918761166e-06, + "loss": 0.6662, + "step": 17889 + }, + { + "epoch": 0.62, + "learning_rate": 6.327098136890045e-06, + "loss": 0.5915, + "step": 17890 + }, + { + "epoch": 0.62, + "learning_rate": 6.326085398565822e-06, + "loss": 0.5704, + "step": 17891 + }, + { + "epoch": 0.62, + "learning_rate": 6.325072703800506e-06, + "loss": 0.673, + "step": 17892 + }, + { + "epoch": 0.62, + "learning_rate": 6.324060052606098e-06, + "loss": 0.6333, + "step": 17893 + }, + { + "epoch": 0.62, + "learning_rate": 6.32304744499461e-06, + "loss": 0.6579, + "step": 17894 + }, + { + "epoch": 0.62, + "learning_rate": 6.322034880978047e-06, + "loss": 0.6574, + "step": 17895 + }, + { + "epoch": 0.62, + "learning_rate": 6.3210223605684115e-06, + "loss": 0.672, + "step": 17896 + }, + { + "epoch": 0.62, + "learning_rate": 6.32000988377771e-06, + "loss": 0.6264, + "step": 17897 + }, + { + "epoch": 0.62, + "learning_rate": 6.3189974506179485e-06, + "loss": 0.6344, + "step": 17898 + }, + { + "epoch": 0.62, + "learning_rate": 6.317985061101126e-06, + "loss": 0.6462, + "step": 17899 + }, + { + "epoch": 0.62, + "learning_rate": 6.316972715239249e-06, + "loss": 0.6013, + "step": 17900 + }, + { + "epoch": 0.62, + "learning_rate": 6.315960413044322e-06, + "loss": 0.652, + "step": 17901 + }, + { + "epoch": 0.62, + "learning_rate": 6.314948154528342e-06, + "loss": 0.6363, + "step": 17902 + }, + { + "epoch": 0.62, + "learning_rate": 6.313935939703314e-06, + "loss": 0.6764, + "step": 17903 + }, + { + "epoch": 0.62, + "learning_rate": 6.312923768581239e-06, + "loss": 0.6359, + "step": 17904 + }, + { + "epoch": 0.62, + "learning_rate": 6.311911641174115e-06, + "loss": 0.6737, + "step": 17905 + }, + { + "epoch": 0.62, + "learning_rate": 6.3108995574939456e-06, + "loss": 0.6028, + "step": 17906 + }, + { + "epoch": 0.62, + "learning_rate": 6.30988751755273e-06, + "loss": 0.6362, + "step": 17907 + }, + { + "epoch": 0.62, + "learning_rate": 6.308875521362463e-06, + "loss": 0.6595, + "step": 17908 + }, + { + "epoch": 0.62, + "learning_rate": 6.307863568935147e-06, + "loss": 0.6665, + "step": 17909 + }, + { + "epoch": 0.62, + "learning_rate": 6.30685166028278e-06, + "loss": 0.6124, + "step": 17910 + }, + { + "epoch": 0.62, + "learning_rate": 6.305839795417358e-06, + "loss": 0.6746, + "step": 17911 + }, + { + "epoch": 0.62, + "learning_rate": 6.304827974350877e-06, + "loss": 0.6305, + "step": 17912 + }, + { + "epoch": 0.62, + "learning_rate": 6.303816197095337e-06, + "loss": 0.6634, + "step": 17913 + }, + { + "epoch": 0.62, + "learning_rate": 6.302804463662729e-06, + "loss": 0.6668, + "step": 17914 + }, + { + "epoch": 0.62, + "learning_rate": 6.301792774065052e-06, + "loss": 0.6454, + "step": 17915 + }, + { + "epoch": 0.62, + "learning_rate": 6.300781128314302e-06, + "loss": 0.6378, + "step": 17916 + }, + { + "epoch": 0.62, + "learning_rate": 6.29976952642247e-06, + "loss": 0.6705, + "step": 17917 + }, + { + "epoch": 0.62, + "learning_rate": 6.29875796840155e-06, + "loss": 0.6186, + "step": 17918 + }, + { + "epoch": 0.62, + "learning_rate": 6.297746454263538e-06, + "loss": 0.6445, + "step": 17919 + }, + { + "epoch": 0.62, + "learning_rate": 6.296734984020423e-06, + "loss": 0.5933, + "step": 17920 + }, + { + "epoch": 0.62, + "learning_rate": 6.295723557684201e-06, + "loss": 0.6272, + "step": 17921 + }, + { + "epoch": 0.62, + "learning_rate": 6.294712175266863e-06, + "loss": 0.6214, + "step": 17922 + }, + { + "epoch": 0.62, + "learning_rate": 6.293700836780397e-06, + "loss": 0.7059, + "step": 17923 + }, + { + "epoch": 0.62, + "learning_rate": 6.292689542236796e-06, + "loss": 0.6113, + "step": 17924 + }, + { + "epoch": 0.62, + "learning_rate": 6.2916782916480534e-06, + "loss": 0.6026, + "step": 17925 + }, + { + "epoch": 0.62, + "learning_rate": 6.290667085026154e-06, + "loss": 0.6733, + "step": 17926 + }, + { + "epoch": 0.62, + "learning_rate": 6.289655922383088e-06, + "loss": 0.6509, + "step": 17927 + }, + { + "epoch": 0.62, + "learning_rate": 6.288644803730846e-06, + "loss": 0.6586, + "step": 17928 + }, + { + "epoch": 0.62, + "learning_rate": 6.287633729081413e-06, + "loss": 0.6652, + "step": 17929 + }, + { + "epoch": 0.62, + "learning_rate": 6.286622698446779e-06, + "loss": 0.6557, + "step": 17930 + }, + { + "epoch": 0.62, + "learning_rate": 6.285611711838933e-06, + "loss": 0.6372, + "step": 17931 + }, + { + "epoch": 0.62, + "learning_rate": 6.284600769269855e-06, + "loss": 0.59, + "step": 17932 + }, + { + "epoch": 0.62, + "learning_rate": 6.283589870751535e-06, + "loss": 0.6253, + "step": 17933 + }, + { + "epoch": 0.62, + "learning_rate": 6.2825790162959625e-06, + "loss": 0.5909, + "step": 17934 + }, + { + "epoch": 0.62, + "learning_rate": 6.281568205915114e-06, + "loss": 0.5736, + "step": 17935 + }, + { + "epoch": 0.62, + "learning_rate": 6.280557439620979e-06, + "loss": 0.6336, + "step": 17936 + }, + { + "epoch": 0.62, + "learning_rate": 6.279546717425542e-06, + "loss": 0.529, + "step": 17937 + }, + { + "epoch": 0.62, + "learning_rate": 6.278536039340784e-06, + "loss": 0.6202, + "step": 17938 + }, + { + "epoch": 0.62, + "learning_rate": 6.277525405378689e-06, + "loss": 0.6133, + "step": 17939 + }, + { + "epoch": 0.62, + "learning_rate": 6.2765148155512414e-06, + "loss": 0.6054, + "step": 17940 + }, + { + "epoch": 0.62, + "learning_rate": 6.275504269870418e-06, + "loss": 0.6264, + "step": 17941 + }, + { + "epoch": 0.62, + "learning_rate": 6.274493768348204e-06, + "loss": 0.6574, + "step": 17942 + }, + { + "epoch": 0.62, + "learning_rate": 6.273483310996581e-06, + "loss": 0.6116, + "step": 17943 + }, + { + "epoch": 0.62, + "learning_rate": 6.272472897827524e-06, + "loss": 0.577, + "step": 17944 + }, + { + "epoch": 0.62, + "learning_rate": 6.2714625288530185e-06, + "loss": 0.624, + "step": 17945 + }, + { + "epoch": 0.62, + "learning_rate": 6.270452204085042e-06, + "loss": 0.6414, + "step": 17946 + }, + { + "epoch": 0.62, + "learning_rate": 6.269441923535571e-06, + "loss": 0.615, + "step": 17947 + }, + { + "epoch": 0.62, + "learning_rate": 6.268431687216584e-06, + "loss": 0.6544, + "step": 17948 + }, + { + "epoch": 0.62, + "learning_rate": 6.267421495140063e-06, + "loss": 0.6038, + "step": 17949 + }, + { + "epoch": 0.62, + "learning_rate": 6.26641134731798e-06, + "loss": 0.6387, + "step": 17950 + }, + { + "epoch": 0.62, + "learning_rate": 6.265401243762315e-06, + "loss": 0.6532, + "step": 17951 + }, + { + "epoch": 0.62, + "learning_rate": 6.264391184485039e-06, + "loss": 0.687, + "step": 17952 + }, + { + "epoch": 0.62, + "learning_rate": 6.263381169498133e-06, + "loss": 0.5828, + "step": 17953 + }, + { + "epoch": 0.62, + "learning_rate": 6.262371198813573e-06, + "loss": 0.6184, + "step": 17954 + }, + { + "epoch": 0.62, + "learning_rate": 6.261361272443327e-06, + "loss": 0.6643, + "step": 17955 + }, + { + "epoch": 0.62, + "learning_rate": 6.260351390399373e-06, + "loss": 0.6505, + "step": 17956 + }, + { + "epoch": 0.62, + "learning_rate": 6.259341552693685e-06, + "loss": 0.6111, + "step": 17957 + }, + { + "epoch": 0.62, + "learning_rate": 6.258331759338234e-06, + "loss": 0.6412, + "step": 17958 + }, + { + "epoch": 0.62, + "learning_rate": 6.2573220103449925e-06, + "loss": 0.6912, + "step": 17959 + }, + { + "epoch": 0.62, + "learning_rate": 6.256312305725936e-06, + "loss": 0.6243, + "step": 17960 + }, + { + "epoch": 0.62, + "learning_rate": 6.25530264549303e-06, + "loss": 0.6231, + "step": 17961 + }, + { + "epoch": 0.62, + "learning_rate": 6.254293029658248e-06, + "loss": 0.5785, + "step": 17962 + }, + { + "epoch": 0.62, + "learning_rate": 6.253283458233563e-06, + "loss": 0.6496, + "step": 17963 + }, + { + "epoch": 0.62, + "learning_rate": 6.252273931230941e-06, + "loss": 0.6622, + "step": 17964 + }, + { + "epoch": 0.62, + "learning_rate": 6.2512644486623505e-06, + "loss": 0.6321, + "step": 17965 + }, + { + "epoch": 0.62, + "learning_rate": 6.250255010539766e-06, + "loss": 0.6664, + "step": 17966 + }, + { + "epoch": 0.62, + "learning_rate": 6.249245616875149e-06, + "loss": 0.6455, + "step": 17967 + }, + { + "epoch": 0.62, + "learning_rate": 6.24823626768047e-06, + "loss": 0.5916, + "step": 17968 + }, + { + "epoch": 0.62, + "learning_rate": 6.247226962967698e-06, + "loss": 0.6227, + "step": 17969 + }, + { + "epoch": 0.62, + "learning_rate": 6.246217702748795e-06, + "loss": 0.6125, + "step": 17970 + }, + { + "epoch": 0.62, + "learning_rate": 6.245208487035732e-06, + "loss": 0.6613, + "step": 17971 + }, + { + "epoch": 0.62, + "learning_rate": 6.244199315840472e-06, + "loss": 0.6407, + "step": 17972 + }, + { + "epoch": 0.62, + "learning_rate": 6.243190189174979e-06, + "loss": 0.577, + "step": 17973 + }, + { + "epoch": 0.62, + "learning_rate": 6.2421811070512196e-06, + "loss": 0.6448, + "step": 17974 + }, + { + "epoch": 0.62, + "learning_rate": 6.241172069481156e-06, + "loss": 0.5768, + "step": 17975 + }, + { + "epoch": 0.62, + "learning_rate": 6.240163076476753e-06, + "loss": 0.6799, + "step": 17976 + }, + { + "epoch": 0.62, + "learning_rate": 6.239154128049972e-06, + "loss": 0.6763, + "step": 17977 + }, + { + "epoch": 0.62, + "learning_rate": 6.238145224212779e-06, + "loss": 0.6446, + "step": 17978 + }, + { + "epoch": 0.62, + "learning_rate": 6.23713636497713e-06, + "loss": 0.636, + "step": 17979 + }, + { + "epoch": 0.62, + "learning_rate": 6.236127550354991e-06, + "loss": 0.6582, + "step": 17980 + }, + { + "epoch": 0.62, + "learning_rate": 6.235118780358323e-06, + "loss": 0.6533, + "step": 17981 + }, + { + "epoch": 0.62, + "learning_rate": 6.234110054999081e-06, + "loss": 0.6372, + "step": 17982 + }, + { + "epoch": 0.62, + "learning_rate": 6.2331013742892285e-06, + "loss": 0.6689, + "step": 17983 + }, + { + "epoch": 0.62, + "learning_rate": 6.232092738240727e-06, + "loss": 0.6555, + "step": 17984 + }, + { + "epoch": 0.62, + "learning_rate": 6.231084146865531e-06, + "loss": 0.6305, + "step": 17985 + }, + { + "epoch": 0.62, + "learning_rate": 6.230075600175599e-06, + "loss": 0.5996, + "step": 17986 + }, + { + "epoch": 0.62, + "learning_rate": 6.229067098182892e-06, + "loss": 0.6622, + "step": 17987 + }, + { + "epoch": 0.62, + "learning_rate": 6.228058640899364e-06, + "loss": 0.6141, + "step": 17988 + }, + { + "epoch": 0.62, + "learning_rate": 6.22705022833697e-06, + "loss": 0.6645, + "step": 17989 + }, + { + "epoch": 0.62, + "learning_rate": 6.226041860507673e-06, + "loss": 0.6248, + "step": 17990 + }, + { + "epoch": 0.62, + "learning_rate": 6.22503353742342e-06, + "loss": 0.6586, + "step": 17991 + }, + { + "epoch": 0.62, + "learning_rate": 6.22402525909617e-06, + "loss": 0.6733, + "step": 17992 + }, + { + "epoch": 0.62, + "learning_rate": 6.223017025537879e-06, + "loss": 0.656, + "step": 17993 + }, + { + "epoch": 0.62, + "learning_rate": 6.222008836760498e-06, + "loss": 0.637, + "step": 17994 + }, + { + "epoch": 0.62, + "learning_rate": 6.22100069277598e-06, + "loss": 0.6647, + "step": 17995 + }, + { + "epoch": 0.62, + "learning_rate": 6.2199925935962835e-06, + "loss": 0.6516, + "step": 17996 + }, + { + "epoch": 0.62, + "learning_rate": 6.2189845392333525e-06, + "loss": 0.6815, + "step": 17997 + }, + { + "epoch": 0.62, + "learning_rate": 6.217976529699144e-06, + "loss": 0.5854, + "step": 17998 + }, + { + "epoch": 0.62, + "learning_rate": 6.21696856500561e-06, + "loss": 0.6183, + "step": 17999 + }, + { + "epoch": 0.62, + "learning_rate": 6.215960645164696e-06, + "loss": 0.603, + "step": 18000 + }, + { + "epoch": 0.62, + "learning_rate": 6.214952770188356e-06, + "loss": 0.6306, + "step": 18001 + }, + { + "epoch": 0.62, + "learning_rate": 6.213944940088542e-06, + "loss": 0.5969, + "step": 18002 + }, + { + "epoch": 0.62, + "learning_rate": 6.212937154877197e-06, + "loss": 0.6443, + "step": 18003 + }, + { + "epoch": 0.62, + "learning_rate": 6.211929414566274e-06, + "loss": 0.6358, + "step": 18004 + }, + { + "epoch": 0.62, + "learning_rate": 6.21092171916772e-06, + "loss": 0.7036, + "step": 18005 + }, + { + "epoch": 0.62, + "learning_rate": 6.209914068693481e-06, + "loss": 0.6406, + "step": 18006 + }, + { + "epoch": 0.62, + "learning_rate": 6.208906463155505e-06, + "loss": 0.6385, + "step": 18007 + }, + { + "epoch": 0.62, + "learning_rate": 6.207898902565741e-06, + "loss": 0.5996, + "step": 18008 + }, + { + "epoch": 0.62, + "learning_rate": 6.20689138693613e-06, + "loss": 0.6447, + "step": 18009 + }, + { + "epoch": 0.62, + "learning_rate": 6.205883916278621e-06, + "loss": 0.5805, + "step": 18010 + }, + { + "epoch": 0.62, + "learning_rate": 6.204876490605158e-06, + "loss": 0.6088, + "step": 18011 + }, + { + "epoch": 0.62, + "learning_rate": 6.2038691099276845e-06, + "loss": 0.6437, + "step": 18012 + }, + { + "epoch": 0.62, + "learning_rate": 6.2028617742581485e-06, + "loss": 0.6246, + "step": 18013 + }, + { + "epoch": 0.62, + "learning_rate": 6.201854483608484e-06, + "loss": 0.6326, + "step": 18014 + }, + { + "epoch": 0.62, + "learning_rate": 6.200847237990641e-06, + "loss": 0.6693, + "step": 18015 + }, + { + "epoch": 0.62, + "learning_rate": 6.199840037416564e-06, + "loss": 0.6339, + "step": 18016 + }, + { + "epoch": 0.62, + "learning_rate": 6.1988328818981836e-06, + "loss": 0.6834, + "step": 18017 + }, + { + "epoch": 0.62, + "learning_rate": 6.19782577144745e-06, + "loss": 0.6489, + "step": 18018 + }, + { + "epoch": 0.62, + "learning_rate": 6.196818706076306e-06, + "loss": 0.6384, + "step": 18019 + }, + { + "epoch": 0.62, + "learning_rate": 6.195811685796682e-06, + "loss": 0.6686, + "step": 18020 + }, + { + "epoch": 0.62, + "learning_rate": 6.194804710620524e-06, + "loss": 0.647, + "step": 18021 + }, + { + "epoch": 0.62, + "learning_rate": 6.193797780559775e-06, + "loss": 0.6296, + "step": 18022 + }, + { + "epoch": 0.62, + "learning_rate": 6.192790895626361e-06, + "loss": 0.6705, + "step": 18023 + }, + { + "epoch": 0.62, + "learning_rate": 6.1917840558322285e-06, + "loss": 0.6598, + "step": 18024 + }, + { + "epoch": 0.62, + "learning_rate": 6.190777261189319e-06, + "loss": 0.6242, + "step": 18025 + }, + { + "epoch": 0.62, + "learning_rate": 6.189770511709556e-06, + "loss": 0.613, + "step": 18026 + }, + { + "epoch": 0.62, + "learning_rate": 6.188763807404887e-06, + "loss": 0.6254, + "step": 18027 + }, + { + "epoch": 0.62, + "learning_rate": 6.187757148287248e-06, + "loss": 0.6813, + "step": 18028 + }, + { + "epoch": 0.62, + "learning_rate": 6.1867505343685645e-06, + "loss": 0.6395, + "step": 18029 + }, + { + "epoch": 0.62, + "learning_rate": 6.18574396566078e-06, + "loss": 0.6311, + "step": 18030 + }, + { + "epoch": 0.62, + "learning_rate": 6.1847374421758274e-06, + "loss": 0.6158, + "step": 18031 + }, + { + "epoch": 0.62, + "learning_rate": 6.183730963925636e-06, + "loss": 0.6245, + "step": 18032 + }, + { + "epoch": 0.62, + "learning_rate": 6.182724530922142e-06, + "loss": 0.6044, + "step": 18033 + }, + { + "epoch": 0.62, + "learning_rate": 6.181718143177281e-06, + "loss": 0.6772, + "step": 18034 + }, + { + "epoch": 0.62, + "learning_rate": 6.180711800702977e-06, + "loss": 0.6521, + "step": 18035 + }, + { + "epoch": 0.62, + "learning_rate": 6.179705503511166e-06, + "loss": 0.6794, + "step": 18036 + }, + { + "epoch": 0.62, + "learning_rate": 6.178699251613784e-06, + "loss": 0.614, + "step": 18037 + }, + { + "epoch": 0.62, + "learning_rate": 6.17769304502275e-06, + "loss": 0.6678, + "step": 18038 + }, + { + "epoch": 0.63, + "learning_rate": 6.176686883750002e-06, + "loss": 0.6217, + "step": 18039 + }, + { + "epoch": 0.63, + "learning_rate": 6.1756807678074725e-06, + "loss": 0.6745, + "step": 18040 + }, + { + "epoch": 0.63, + "learning_rate": 6.17467469720708e-06, + "loss": 0.599, + "step": 18041 + }, + { + "epoch": 0.63, + "learning_rate": 6.1736686719607575e-06, + "loss": 0.6503, + "step": 18042 + }, + { + "epoch": 0.63, + "learning_rate": 6.17266269208044e-06, + "loss": 0.6165, + "step": 18043 + }, + { + "epoch": 0.63, + "learning_rate": 6.171656757578042e-06, + "loss": 0.6387, + "step": 18044 + }, + { + "epoch": 0.63, + "learning_rate": 6.170650868465494e-06, + "loss": 0.6063, + "step": 18045 + }, + { + "epoch": 0.63, + "learning_rate": 6.169645024754731e-06, + "loss": 0.6307, + "step": 18046 + }, + { + "epoch": 0.63, + "learning_rate": 6.168639226457667e-06, + "loss": 0.6102, + "step": 18047 + }, + { + "epoch": 0.63, + "learning_rate": 6.16763347358623e-06, + "loss": 0.6656, + "step": 18048 + }, + { + "epoch": 0.63, + "learning_rate": 6.166627766152352e-06, + "loss": 0.6442, + "step": 18049 + }, + { + "epoch": 0.63, + "learning_rate": 6.165622104167948e-06, + "loss": 0.5778, + "step": 18050 + }, + { + "epoch": 0.63, + "learning_rate": 6.164616487644941e-06, + "loss": 0.6218, + "step": 18051 + }, + { + "epoch": 0.63, + "learning_rate": 6.163610916595264e-06, + "loss": 0.6363, + "step": 18052 + }, + { + "epoch": 0.63, + "learning_rate": 6.162605391030829e-06, + "loss": 0.6506, + "step": 18053 + }, + { + "epoch": 0.63, + "learning_rate": 6.161599910963558e-06, + "loss": 0.6188, + "step": 18054 + }, + { + "epoch": 0.63, + "learning_rate": 6.160594476405384e-06, + "loss": 0.6676, + "step": 18055 + }, + { + "epoch": 0.63, + "learning_rate": 6.159589087368214e-06, + "loss": 0.68, + "step": 18056 + }, + { + "epoch": 0.63, + "learning_rate": 6.158583743863971e-06, + "loss": 0.6255, + "step": 18057 + }, + { + "epoch": 0.63, + "learning_rate": 6.157578445904584e-06, + "loss": 0.6454, + "step": 18058 + }, + { + "epoch": 0.63, + "learning_rate": 6.15657319350196e-06, + "loss": 0.6324, + "step": 18059 + }, + { + "epoch": 0.63, + "learning_rate": 6.155567986668023e-06, + "loss": 0.5761, + "step": 18060 + }, + { + "epoch": 0.63, + "learning_rate": 6.154562825414695e-06, + "loss": 0.6104, + "step": 18061 + }, + { + "epoch": 0.63, + "learning_rate": 6.153557709753886e-06, + "loss": 0.5507, + "step": 18062 + }, + { + "epoch": 0.63, + "learning_rate": 6.152552639697513e-06, + "loss": 0.6177, + "step": 18063 + }, + { + "epoch": 0.63, + "learning_rate": 6.151547615257503e-06, + "loss": 0.637, + "step": 18064 + }, + { + "epoch": 0.63, + "learning_rate": 6.150542636445759e-06, + "loss": 0.6696, + "step": 18065 + }, + { + "epoch": 0.63, + "learning_rate": 6.1495377032742e-06, + "loss": 0.6415, + "step": 18066 + }, + { + "epoch": 0.63, + "learning_rate": 6.1485328157547485e-06, + "loss": 0.5698, + "step": 18067 + }, + { + "epoch": 0.63, + "learning_rate": 6.147527973899309e-06, + "loss": 0.5807, + "step": 18068 + }, + { + "epoch": 0.63, + "learning_rate": 6.146523177719797e-06, + "loss": 0.652, + "step": 18069 + }, + { + "epoch": 0.63, + "learning_rate": 6.145518427228132e-06, + "loss": 0.6685, + "step": 18070 + }, + { + "epoch": 0.63, + "learning_rate": 6.144513722436218e-06, + "loss": 0.609, + "step": 18071 + }, + { + "epoch": 0.63, + "learning_rate": 6.14350906335597e-06, + "loss": 0.6277, + "step": 18072 + }, + { + "epoch": 0.63, + "learning_rate": 6.142504449999307e-06, + "loss": 0.6466, + "step": 18073 + }, + { + "epoch": 0.63, + "learning_rate": 6.141499882378129e-06, + "loss": 0.5837, + "step": 18074 + }, + { + "epoch": 0.63, + "learning_rate": 6.140495360504353e-06, + "loss": 0.6675, + "step": 18075 + }, + { + "epoch": 0.63, + "learning_rate": 6.139490884389885e-06, + "loss": 0.6592, + "step": 18076 + }, + { + "epoch": 0.63, + "learning_rate": 6.138486454046635e-06, + "loss": 0.6735, + "step": 18077 + }, + { + "epoch": 0.63, + "learning_rate": 6.1374820694865156e-06, + "loss": 0.6221, + "step": 18078 + }, + { + "epoch": 0.63, + "learning_rate": 6.136477730721431e-06, + "loss": 0.6259, + "step": 18079 + }, + { + "epoch": 0.63, + "learning_rate": 6.135473437763291e-06, + "loss": 0.6189, + "step": 18080 + }, + { + "epoch": 0.63, + "learning_rate": 6.134469190624002e-06, + "loss": 0.6539, + "step": 18081 + }, + { + "epoch": 0.63, + "learning_rate": 6.1334649893154696e-06, + "loss": 0.6294, + "step": 18082 + }, + { + "epoch": 0.63, + "learning_rate": 6.1324608338496e-06, + "loss": 0.6591, + "step": 18083 + }, + { + "epoch": 0.63, + "learning_rate": 6.131456724238302e-06, + "loss": 0.606, + "step": 18084 + }, + { + "epoch": 0.63, + "learning_rate": 6.130452660493478e-06, + "loss": 0.6044, + "step": 18085 + }, + { + "epoch": 0.63, + "learning_rate": 6.1294486426270316e-06, + "loss": 0.6143, + "step": 18086 + }, + { + "epoch": 0.63, + "learning_rate": 6.1284446706508695e-06, + "loss": 0.6528, + "step": 18087 + }, + { + "epoch": 0.63, + "learning_rate": 6.127440744576892e-06, + "loss": 0.6051, + "step": 18088 + }, + { + "epoch": 0.63, + "learning_rate": 6.126436864417002e-06, + "loss": 0.5845, + "step": 18089 + }, + { + "epoch": 0.63, + "learning_rate": 6.125433030183107e-06, + "loss": 0.6575, + "step": 18090 + }, + { + "epoch": 0.63, + "learning_rate": 6.124429241887101e-06, + "loss": 0.5894, + "step": 18091 + }, + { + "epoch": 0.63, + "learning_rate": 6.123425499540889e-06, + "loss": 0.6479, + "step": 18092 + }, + { + "epoch": 0.63, + "learning_rate": 6.1224218031563754e-06, + "loss": 0.6402, + "step": 18093 + }, + { + "epoch": 0.63, + "learning_rate": 6.121418152745453e-06, + "loss": 0.6002, + "step": 18094 + }, + { + "epoch": 0.63, + "learning_rate": 6.120414548320025e-06, + "loss": 0.6433, + "step": 18095 + }, + { + "epoch": 0.63, + "learning_rate": 6.119410989891992e-06, + "loss": 0.6165, + "step": 18096 + }, + { + "epoch": 0.63, + "learning_rate": 6.11840747747325e-06, + "loss": 0.5903, + "step": 18097 + }, + { + "epoch": 0.63, + "learning_rate": 6.117404011075696e-06, + "loss": 0.6395, + "step": 18098 + }, + { + "epoch": 0.63, + "learning_rate": 6.116400590711233e-06, + "loss": 0.6388, + "step": 18099 + }, + { + "epoch": 0.63, + "learning_rate": 6.115397216391749e-06, + "loss": 0.6669, + "step": 18100 + }, + { + "epoch": 0.63, + "learning_rate": 6.114393888129146e-06, + "loss": 0.6123, + "step": 18101 + }, + { + "epoch": 0.63, + "learning_rate": 6.113390605935322e-06, + "loss": 0.6921, + "step": 18102 + }, + { + "epoch": 0.63, + "learning_rate": 6.112387369822166e-06, + "loss": 0.6836, + "step": 18103 + }, + { + "epoch": 0.63, + "learning_rate": 6.111384179801576e-06, + "loss": 0.5878, + "step": 18104 + }, + { + "epoch": 0.63, + "learning_rate": 6.1103810358854475e-06, + "loss": 0.5786, + "step": 18105 + }, + { + "epoch": 0.63, + "learning_rate": 6.10937793808567e-06, + "loss": 0.6354, + "step": 18106 + }, + { + "epoch": 0.63, + "learning_rate": 6.108374886414139e-06, + "loss": 0.6053, + "step": 18107 + }, + { + "epoch": 0.63, + "learning_rate": 6.107371880882749e-06, + "loss": 0.6448, + "step": 18108 + }, + { + "epoch": 0.63, + "learning_rate": 6.106368921503387e-06, + "loss": 0.6614, + "step": 18109 + }, + { + "epoch": 0.63, + "learning_rate": 6.1053660082879475e-06, + "loss": 0.6245, + "step": 18110 + }, + { + "epoch": 0.63, + "learning_rate": 6.104363141248322e-06, + "loss": 0.6614, + "step": 18111 + }, + { + "epoch": 0.63, + "learning_rate": 6.103360320396396e-06, + "loss": 0.6434, + "step": 18112 + }, + { + "epoch": 0.63, + "learning_rate": 6.102357545744066e-06, + "loss": 0.6441, + "step": 18113 + }, + { + "epoch": 0.63, + "learning_rate": 6.101354817303218e-06, + "loss": 0.6419, + "step": 18114 + }, + { + "epoch": 0.63, + "learning_rate": 6.100352135085739e-06, + "loss": 0.609, + "step": 18115 + }, + { + "epoch": 0.63, + "learning_rate": 6.099349499103517e-06, + "loss": 0.614, + "step": 18116 + }, + { + "epoch": 0.63, + "learning_rate": 6.0983469093684444e-06, + "loss": 0.6056, + "step": 18117 + }, + { + "epoch": 0.63, + "learning_rate": 6.0973443658924025e-06, + "loss": 0.6263, + "step": 18118 + }, + { + "epoch": 0.63, + "learning_rate": 6.096341868687281e-06, + "loss": 0.6534, + "step": 18119 + }, + { + "epoch": 0.63, + "learning_rate": 6.095339417764965e-06, + "loss": 0.6897, + "step": 18120 + }, + { + "epoch": 0.63, + "learning_rate": 6.094337013137339e-06, + "loss": 0.651, + "step": 18121 + }, + { + "epoch": 0.63, + "learning_rate": 6.093334654816288e-06, + "loss": 0.6012, + "step": 18122 + }, + { + "epoch": 0.63, + "learning_rate": 6.092332342813698e-06, + "loss": 0.6359, + "step": 18123 + }, + { + "epoch": 0.63, + "learning_rate": 6.0913300771414504e-06, + "loss": 0.6822, + "step": 18124 + }, + { + "epoch": 0.63, + "learning_rate": 6.090327857811429e-06, + "loss": 0.6156, + "step": 18125 + }, + { + "epoch": 0.63, + "learning_rate": 6.089325684835517e-06, + "loss": 0.6342, + "step": 18126 + }, + { + "epoch": 0.63, + "learning_rate": 6.088323558225596e-06, + "loss": 0.6487, + "step": 18127 + }, + { + "epoch": 0.63, + "learning_rate": 6.087321477993546e-06, + "loss": 0.6425, + "step": 18128 + }, + { + "epoch": 0.63, + "learning_rate": 6.086319444151253e-06, + "loss": 0.6104, + "step": 18129 + }, + { + "epoch": 0.63, + "learning_rate": 6.085317456710591e-06, + "loss": 0.6176, + "step": 18130 + }, + { + "epoch": 0.63, + "learning_rate": 6.084315515683443e-06, + "loss": 0.6861, + "step": 18131 + }, + { + "epoch": 0.63, + "learning_rate": 6.08331362108169e-06, + "loss": 0.627, + "step": 18132 + }, + { + "epoch": 0.63, + "learning_rate": 6.082311772917206e-06, + "loss": 0.6312, + "step": 18133 + }, + { + "epoch": 0.63, + "learning_rate": 6.081309971201872e-06, + "loss": 0.635, + "step": 18134 + }, + { + "epoch": 0.63, + "learning_rate": 6.080308215947568e-06, + "loss": 0.6295, + "step": 18135 + }, + { + "epoch": 0.63, + "learning_rate": 6.079306507166166e-06, + "loss": 0.6589, + "step": 18136 + }, + { + "epoch": 0.63, + "learning_rate": 6.078304844869547e-06, + "loss": 0.61, + "step": 18137 + }, + { + "epoch": 0.63, + "learning_rate": 6.077303229069585e-06, + "loss": 0.6811, + "step": 18138 + }, + { + "epoch": 0.63, + "learning_rate": 6.076301659778152e-06, + "loss": 0.6076, + "step": 18139 + }, + { + "epoch": 0.63, + "learning_rate": 6.07530013700713e-06, + "loss": 0.6468, + "step": 18140 + }, + { + "epoch": 0.63, + "learning_rate": 6.074298660768387e-06, + "loss": 0.6246, + "step": 18141 + }, + { + "epoch": 0.63, + "learning_rate": 6.073297231073802e-06, + "loss": 0.6055, + "step": 18142 + }, + { + "epoch": 0.63, + "learning_rate": 6.072295847935246e-06, + "loss": 0.6478, + "step": 18143 + }, + { + "epoch": 0.63, + "learning_rate": 6.071294511364588e-06, + "loss": 0.6629, + "step": 18144 + }, + { + "epoch": 0.63, + "learning_rate": 6.070293221373704e-06, + "loss": 0.6556, + "step": 18145 + }, + { + "epoch": 0.63, + "learning_rate": 6.069291977974468e-06, + "loss": 0.6003, + "step": 18146 + }, + { + "epoch": 0.63, + "learning_rate": 6.0682907811787455e-06, + "loss": 0.6237, + "step": 18147 + }, + { + "epoch": 0.63, + "learning_rate": 6.06728963099841e-06, + "loss": 0.6454, + "step": 18148 + }, + { + "epoch": 0.63, + "learning_rate": 6.066288527445332e-06, + "loss": 0.5898, + "step": 18149 + }, + { + "epoch": 0.63, + "learning_rate": 6.065287470531377e-06, + "loss": 0.6638, + "step": 18150 + }, + { + "epoch": 0.63, + "learning_rate": 6.064286460268418e-06, + "loss": 0.6608, + "step": 18151 + }, + { + "epoch": 0.63, + "learning_rate": 6.063285496668323e-06, + "loss": 0.6669, + "step": 18152 + }, + { + "epoch": 0.63, + "learning_rate": 6.062284579742957e-06, + "loss": 0.655, + "step": 18153 + }, + { + "epoch": 0.63, + "learning_rate": 6.061283709504186e-06, + "loss": 0.5978, + "step": 18154 + }, + { + "epoch": 0.63, + "learning_rate": 6.060282885963884e-06, + "loss": 0.6726, + "step": 18155 + }, + { + "epoch": 0.63, + "learning_rate": 6.059282109133908e-06, + "loss": 0.5884, + "step": 18156 + }, + { + "epoch": 0.63, + "learning_rate": 6.05828137902613e-06, + "loss": 0.6042, + "step": 18157 + }, + { + "epoch": 0.63, + "learning_rate": 6.057280695652413e-06, + "loss": 0.5931, + "step": 18158 + }, + { + "epoch": 0.63, + "learning_rate": 6.0562800590246196e-06, + "loss": 0.629, + "step": 18159 + }, + { + "epoch": 0.63, + "learning_rate": 6.055279469154614e-06, + "loss": 0.6273, + "step": 18160 + }, + { + "epoch": 0.63, + "learning_rate": 6.054278926054264e-06, + "loss": 0.6688, + "step": 18161 + }, + { + "epoch": 0.63, + "learning_rate": 6.053278429735425e-06, + "loss": 0.6449, + "step": 18162 + }, + { + "epoch": 0.63, + "learning_rate": 6.052277980209964e-06, + "loss": 0.5741, + "step": 18163 + }, + { + "epoch": 0.63, + "learning_rate": 6.051277577489743e-06, + "loss": 0.6348, + "step": 18164 + }, + { + "epoch": 0.63, + "learning_rate": 6.05027722158662e-06, + "loss": 0.6258, + "step": 18165 + }, + { + "epoch": 0.63, + "learning_rate": 6.0492769125124566e-06, + "loss": 0.6693, + "step": 18166 + }, + { + "epoch": 0.63, + "learning_rate": 6.048276650279114e-06, + "loss": 0.5892, + "step": 18167 + }, + { + "epoch": 0.63, + "learning_rate": 6.04727643489845e-06, + "loss": 0.6178, + "step": 18168 + }, + { + "epoch": 0.63, + "learning_rate": 6.046276266382324e-06, + "loss": 0.6226, + "step": 18169 + }, + { + "epoch": 0.63, + "learning_rate": 6.045276144742596e-06, + "loss": 0.6292, + "step": 18170 + }, + { + "epoch": 0.63, + "learning_rate": 6.044276069991119e-06, + "loss": 0.6258, + "step": 18171 + }, + { + "epoch": 0.63, + "learning_rate": 6.0432760421397566e-06, + "loss": 0.6924, + "step": 18172 + }, + { + "epoch": 0.63, + "learning_rate": 6.042276061200361e-06, + "loss": 0.6175, + "step": 18173 + }, + { + "epoch": 0.63, + "learning_rate": 6.041276127184787e-06, + "loss": 0.6054, + "step": 18174 + }, + { + "epoch": 0.63, + "learning_rate": 6.040276240104894e-06, + "loss": 0.6571, + "step": 18175 + }, + { + "epoch": 0.63, + "learning_rate": 6.0392763999725365e-06, + "loss": 0.6526, + "step": 18176 + }, + { + "epoch": 0.63, + "learning_rate": 6.0382766067995656e-06, + "loss": 0.6498, + "step": 18177 + }, + { + "epoch": 0.63, + "learning_rate": 6.037276860597837e-06, + "loss": 0.6756, + "step": 18178 + }, + { + "epoch": 0.63, + "learning_rate": 6.036277161379207e-06, + "loss": 0.6287, + "step": 18179 + }, + { + "epoch": 0.63, + "learning_rate": 6.035277509155521e-06, + "loss": 0.6342, + "step": 18180 + }, + { + "epoch": 0.63, + "learning_rate": 6.034277903938639e-06, + "loss": 0.5902, + "step": 18181 + }, + { + "epoch": 0.63, + "learning_rate": 6.0332783457404085e-06, + "loss": 0.6792, + "step": 18182 + }, + { + "epoch": 0.63, + "learning_rate": 6.03227883457268e-06, + "loss": 0.6685, + "step": 18183 + }, + { + "epoch": 0.63, + "learning_rate": 6.031279370447305e-06, + "loss": 0.5822, + "step": 18184 + }, + { + "epoch": 0.63, + "learning_rate": 6.030279953376136e-06, + "loss": 0.6476, + "step": 18185 + }, + { + "epoch": 0.63, + "learning_rate": 6.029280583371018e-06, + "loss": 0.6241, + "step": 18186 + }, + { + "epoch": 0.63, + "learning_rate": 6.0282812604438e-06, + "loss": 0.6184, + "step": 18187 + }, + { + "epoch": 0.63, + "learning_rate": 6.0272819846063356e-06, + "loss": 0.6224, + "step": 18188 + }, + { + "epoch": 0.63, + "learning_rate": 6.0262827558704666e-06, + "loss": 0.6439, + "step": 18189 + }, + { + "epoch": 0.63, + "learning_rate": 6.025283574248042e-06, + "loss": 0.6301, + "step": 18190 + }, + { + "epoch": 0.63, + "learning_rate": 6.02428443975091e-06, + "loss": 0.6372, + "step": 18191 + }, + { + "epoch": 0.63, + "learning_rate": 6.023285352390914e-06, + "loss": 0.6242, + "step": 18192 + }, + { + "epoch": 0.63, + "learning_rate": 6.0222863121799016e-06, + "loss": 0.6297, + "step": 18193 + }, + { + "epoch": 0.63, + "learning_rate": 6.021287319129717e-06, + "loss": 0.6423, + "step": 18194 + }, + { + "epoch": 0.63, + "learning_rate": 6.020288373252203e-06, + "loss": 0.5896, + "step": 18195 + }, + { + "epoch": 0.63, + "learning_rate": 6.019289474559204e-06, + "loss": 0.7093, + "step": 18196 + }, + { + "epoch": 0.63, + "learning_rate": 6.018290623062568e-06, + "loss": 0.6622, + "step": 18197 + }, + { + "epoch": 0.63, + "learning_rate": 6.017291818774129e-06, + "loss": 0.6436, + "step": 18198 + }, + { + "epoch": 0.63, + "learning_rate": 6.016293061705738e-06, + "loss": 0.6276, + "step": 18199 + }, + { + "epoch": 0.63, + "learning_rate": 6.01529435186923e-06, + "loss": 0.5899, + "step": 18200 + }, + { + "epoch": 0.63, + "learning_rate": 6.014295689276446e-06, + "loss": 0.6606, + "step": 18201 + }, + { + "epoch": 0.63, + "learning_rate": 6.013297073939233e-06, + "loss": 0.6471, + "step": 18202 + }, + { + "epoch": 0.63, + "learning_rate": 6.0122985058694226e-06, + "loss": 0.6415, + "step": 18203 + }, + { + "epoch": 0.63, + "learning_rate": 6.011299985078858e-06, + "loss": 0.6312, + "step": 18204 + }, + { + "epoch": 0.63, + "learning_rate": 6.010301511579381e-06, + "loss": 0.6584, + "step": 18205 + }, + { + "epoch": 0.63, + "learning_rate": 6.009303085382823e-06, + "loss": 0.6691, + "step": 18206 + }, + { + "epoch": 0.63, + "learning_rate": 6.008304706501027e-06, + "loss": 0.6144, + "step": 18207 + }, + { + "epoch": 0.63, + "learning_rate": 6.007306374945828e-06, + "loss": 0.6536, + "step": 18208 + }, + { + "epoch": 0.63, + "learning_rate": 6.006308090729062e-06, + "loss": 0.6308, + "step": 18209 + }, + { + "epoch": 0.63, + "learning_rate": 6.005309853862567e-06, + "loss": 0.6185, + "step": 18210 + }, + { + "epoch": 0.63, + "learning_rate": 6.0043116643581766e-06, + "loss": 0.6129, + "step": 18211 + }, + { + "epoch": 0.63, + "learning_rate": 6.003313522227725e-06, + "loss": 0.6309, + "step": 18212 + }, + { + "epoch": 0.63, + "learning_rate": 6.002315427483048e-06, + "loss": 0.6286, + "step": 18213 + }, + { + "epoch": 0.63, + "learning_rate": 6.0013173801359805e-06, + "loss": 0.6094, + "step": 18214 + }, + { + "epoch": 0.63, + "learning_rate": 6.000319380198351e-06, + "loss": 0.6329, + "step": 18215 + }, + { + "epoch": 0.63, + "learning_rate": 5.999321427681995e-06, + "loss": 0.6219, + "step": 18216 + }, + { + "epoch": 0.63, + "learning_rate": 5.998323522598746e-06, + "loss": 0.5722, + "step": 18217 + }, + { + "epoch": 0.63, + "learning_rate": 5.997325664960433e-06, + "loss": 0.668, + "step": 18218 + }, + { + "epoch": 0.63, + "learning_rate": 5.9963278547788876e-06, + "loss": 0.6038, + "step": 18219 + }, + { + "epoch": 0.63, + "learning_rate": 5.995330092065941e-06, + "loss": 0.5847, + "step": 18220 + }, + { + "epoch": 0.63, + "learning_rate": 5.99433237683342e-06, + "loss": 0.6037, + "step": 18221 + }, + { + "epoch": 0.63, + "learning_rate": 5.993334709093157e-06, + "loss": 0.6617, + "step": 18222 + }, + { + "epoch": 0.63, + "learning_rate": 5.9923370888569806e-06, + "loss": 0.6272, + "step": 18223 + }, + { + "epoch": 0.63, + "learning_rate": 5.991339516136717e-06, + "loss": 0.6504, + "step": 18224 + }, + { + "epoch": 0.63, + "learning_rate": 5.990341990944193e-06, + "loss": 0.6622, + "step": 18225 + }, + { + "epoch": 0.63, + "learning_rate": 5.98934451329124e-06, + "loss": 0.6406, + "step": 18226 + }, + { + "epoch": 0.63, + "learning_rate": 5.988347083189678e-06, + "loss": 0.6013, + "step": 18227 + }, + { + "epoch": 0.63, + "learning_rate": 5.987349700651338e-06, + "loss": 0.6548, + "step": 18228 + }, + { + "epoch": 0.63, + "learning_rate": 5.986352365688044e-06, + "loss": 0.6912, + "step": 18229 + }, + { + "epoch": 0.63, + "learning_rate": 5.9853550783116186e-06, + "loss": 0.64, + "step": 18230 + }, + { + "epoch": 0.63, + "learning_rate": 5.984357838533888e-06, + "loss": 0.6673, + "step": 18231 + }, + { + "epoch": 0.63, + "learning_rate": 5.9833606463666746e-06, + "loss": 0.6724, + "step": 18232 + }, + { + "epoch": 0.63, + "learning_rate": 5.982363501821802e-06, + "loss": 0.5916, + "step": 18233 + }, + { + "epoch": 0.63, + "learning_rate": 5.981366404911091e-06, + "loss": 0.6193, + "step": 18234 + }, + { + "epoch": 0.63, + "learning_rate": 5.980369355646367e-06, + "loss": 0.6355, + "step": 18235 + }, + { + "epoch": 0.63, + "learning_rate": 5.979372354039449e-06, + "loss": 0.6055, + "step": 18236 + }, + { + "epoch": 0.63, + "learning_rate": 5.978375400102156e-06, + "loss": 0.6479, + "step": 18237 + }, + { + "epoch": 0.63, + "learning_rate": 5.977378493846315e-06, + "loss": 0.5804, + "step": 18238 + }, + { + "epoch": 0.63, + "learning_rate": 5.9763816352837345e-06, + "loss": 0.6029, + "step": 18239 + }, + { + "epoch": 0.63, + "learning_rate": 5.97538482442624e-06, + "loss": 0.6583, + "step": 18240 + }, + { + "epoch": 0.63, + "learning_rate": 5.974388061285656e-06, + "loss": 0.6467, + "step": 18241 + }, + { + "epoch": 0.63, + "learning_rate": 5.973391345873787e-06, + "loss": 0.618, + "step": 18242 + }, + { + "epoch": 0.63, + "learning_rate": 5.972394678202458e-06, + "loss": 0.663, + "step": 18243 + }, + { + "epoch": 0.63, + "learning_rate": 5.9713980582834906e-06, + "loss": 0.6129, + "step": 18244 + }, + { + "epoch": 0.63, + "learning_rate": 5.97040148612869e-06, + "loss": 0.6375, + "step": 18245 + }, + { + "epoch": 0.63, + "learning_rate": 5.969404961749877e-06, + "loss": 0.6063, + "step": 18246 + }, + { + "epoch": 0.63, + "learning_rate": 5.968408485158872e-06, + "loss": 0.6026, + "step": 18247 + }, + { + "epoch": 0.63, + "learning_rate": 5.967412056367479e-06, + "loss": 0.6062, + "step": 18248 + }, + { + "epoch": 0.63, + "learning_rate": 5.966415675387518e-06, + "loss": 0.6742, + "step": 18249 + }, + { + "epoch": 0.63, + "learning_rate": 5.965419342230807e-06, + "loss": 0.7021, + "step": 18250 + }, + { + "epoch": 0.63, + "learning_rate": 5.964423056909147e-06, + "loss": 0.6768, + "step": 18251 + }, + { + "epoch": 0.63, + "learning_rate": 5.963426819434359e-06, + "loss": 0.6258, + "step": 18252 + }, + { + "epoch": 0.63, + "learning_rate": 5.962430629818256e-06, + "loss": 0.6729, + "step": 18253 + }, + { + "epoch": 0.63, + "learning_rate": 5.961434488072639e-06, + "loss": 0.591, + "step": 18254 + }, + { + "epoch": 0.63, + "learning_rate": 5.960438394209327e-06, + "loss": 0.6835, + "step": 18255 + }, + { + "epoch": 0.63, + "learning_rate": 5.959442348240132e-06, + "loss": 0.654, + "step": 18256 + }, + { + "epoch": 0.63, + "learning_rate": 5.958446350176854e-06, + "loss": 0.6501, + "step": 18257 + }, + { + "epoch": 0.63, + "learning_rate": 5.9574504000313095e-06, + "loss": 0.6574, + "step": 18258 + }, + { + "epoch": 0.63, + "learning_rate": 5.956454497815307e-06, + "loss": 0.6122, + "step": 18259 + }, + { + "epoch": 0.63, + "learning_rate": 5.955458643540646e-06, + "loss": 0.679, + "step": 18260 + }, + { + "epoch": 0.63, + "learning_rate": 5.954462837219146e-06, + "loss": 0.589, + "step": 18261 + }, + { + "epoch": 0.63, + "learning_rate": 5.9534670788626015e-06, + "loss": 0.5774, + "step": 18262 + }, + { + "epoch": 0.63, + "learning_rate": 5.952471368482822e-06, + "loss": 0.6061, + "step": 18263 + }, + { + "epoch": 0.63, + "learning_rate": 5.9514757060916205e-06, + "loss": 0.6288, + "step": 18264 + }, + { + "epoch": 0.63, + "learning_rate": 5.950480091700792e-06, + "loss": 0.6403, + "step": 18265 + }, + { + "epoch": 0.63, + "learning_rate": 5.949484525322144e-06, + "loss": 0.5892, + "step": 18266 + }, + { + "epoch": 0.63, + "learning_rate": 5.948489006967485e-06, + "loss": 0.6486, + "step": 18267 + }, + { + "epoch": 0.63, + "learning_rate": 5.947493536648611e-06, + "loss": 0.6122, + "step": 18268 + }, + { + "epoch": 0.63, + "learning_rate": 5.946498114377325e-06, + "loss": 0.6412, + "step": 18269 + }, + { + "epoch": 0.63, + "learning_rate": 5.9455027401654385e-06, + "loss": 0.5987, + "step": 18270 + }, + { + "epoch": 0.63, + "learning_rate": 5.9445074140247406e-06, + "loss": 0.6529, + "step": 18271 + }, + { + "epoch": 0.63, + "learning_rate": 5.943512135967036e-06, + "loss": 0.6732, + "step": 18272 + }, + { + "epoch": 0.63, + "learning_rate": 5.942516906004133e-06, + "loss": 0.6601, + "step": 18273 + }, + { + "epoch": 0.63, + "learning_rate": 5.941521724147821e-06, + "loss": 0.6049, + "step": 18274 + }, + { + "epoch": 0.63, + "learning_rate": 5.940526590409901e-06, + "loss": 0.6322, + "step": 18275 + }, + { + "epoch": 0.63, + "learning_rate": 5.939531504802179e-06, + "loss": 0.5867, + "step": 18276 + }, + { + "epoch": 0.63, + "learning_rate": 5.938536467336443e-06, + "loss": 0.6333, + "step": 18277 + }, + { + "epoch": 0.63, + "learning_rate": 5.937541478024493e-06, + "loss": 0.6306, + "step": 18278 + }, + { + "epoch": 0.63, + "learning_rate": 5.936546536878135e-06, + "loss": 0.6743, + "step": 18279 + }, + { + "epoch": 0.63, + "learning_rate": 5.935551643909153e-06, + "loss": 0.6725, + "step": 18280 + }, + { + "epoch": 0.63, + "learning_rate": 5.9345567991293474e-06, + "loss": 0.6483, + "step": 18281 + }, + { + "epoch": 0.63, + "learning_rate": 5.933562002550518e-06, + "loss": 0.6324, + "step": 18282 + }, + { + "epoch": 0.63, + "learning_rate": 5.932567254184451e-06, + "loss": 0.6156, + "step": 18283 + }, + { + "epoch": 0.63, + "learning_rate": 5.931572554042944e-06, + "loss": 0.6523, + "step": 18284 + }, + { + "epoch": 0.63, + "learning_rate": 5.930577902137796e-06, + "loss": 0.6354, + "step": 18285 + }, + { + "epoch": 0.63, + "learning_rate": 5.929583298480791e-06, + "loss": 0.687, + "step": 18286 + }, + { + "epoch": 0.63, + "learning_rate": 5.928588743083723e-06, + "loss": 0.6783, + "step": 18287 + }, + { + "epoch": 0.63, + "learning_rate": 5.9275942359583925e-06, + "loss": 0.6054, + "step": 18288 + }, + { + "epoch": 0.63, + "learning_rate": 5.926599777116579e-06, + "loss": 0.6442, + "step": 18289 + }, + { + "epoch": 0.63, + "learning_rate": 5.925605366570078e-06, + "loss": 0.6184, + "step": 18290 + }, + { + "epoch": 0.63, + "learning_rate": 5.924611004330682e-06, + "loss": 0.5859, + "step": 18291 + }, + { + "epoch": 0.63, + "learning_rate": 5.923616690410176e-06, + "loss": 0.5711, + "step": 18292 + }, + { + "epoch": 0.63, + "learning_rate": 5.9226224248203504e-06, + "loss": 0.66, + "step": 18293 + }, + { + "epoch": 0.63, + "learning_rate": 5.921628207572998e-06, + "loss": 0.6717, + "step": 18294 + }, + { + "epoch": 0.63, + "learning_rate": 5.920634038679898e-06, + "loss": 0.6488, + "step": 18295 + }, + { + "epoch": 0.63, + "learning_rate": 5.91963991815284e-06, + "loss": 0.6368, + "step": 18296 + }, + { + "epoch": 0.63, + "learning_rate": 5.9186458460036186e-06, + "loss": 0.6677, + "step": 18297 + }, + { + "epoch": 0.63, + "learning_rate": 5.917651822244011e-06, + "loss": 0.6027, + "step": 18298 + }, + { + "epoch": 0.63, + "learning_rate": 5.916657846885802e-06, + "loss": 0.6566, + "step": 18299 + }, + { + "epoch": 0.63, + "learning_rate": 5.915663919940786e-06, + "loss": 0.6642, + "step": 18300 + }, + { + "epoch": 0.63, + "learning_rate": 5.914670041420736e-06, + "loss": 0.658, + "step": 18301 + }, + { + "epoch": 0.63, + "learning_rate": 5.91367621133744e-06, + "loss": 0.6295, + "step": 18302 + }, + { + "epoch": 0.63, + "learning_rate": 5.912682429702687e-06, + "loss": 0.5991, + "step": 18303 + }, + { + "epoch": 0.63, + "learning_rate": 5.9116886965282506e-06, + "loss": 0.5927, + "step": 18304 + }, + { + "epoch": 0.63, + "learning_rate": 5.910695011825913e-06, + "loss": 0.6295, + "step": 18305 + }, + { + "epoch": 0.63, + "learning_rate": 5.909701375607467e-06, + "loss": 0.612, + "step": 18306 + }, + { + "epoch": 0.63, + "learning_rate": 5.908707787884681e-06, + "loss": 0.6506, + "step": 18307 + }, + { + "epoch": 0.63, + "learning_rate": 5.9077142486693375e-06, + "loss": 0.6134, + "step": 18308 + }, + { + "epoch": 0.63, + "learning_rate": 5.906720757973224e-06, + "loss": 0.6715, + "step": 18309 + }, + { + "epoch": 0.63, + "learning_rate": 5.905727315808111e-06, + "loss": 0.658, + "step": 18310 + }, + { + "epoch": 0.63, + "learning_rate": 5.904733922185777e-06, + "loss": 0.651, + "step": 18311 + }, + { + "epoch": 0.63, + "learning_rate": 5.903740577118009e-06, + "loss": 0.6209, + "step": 18312 + }, + { + "epoch": 0.63, + "learning_rate": 5.902747280616575e-06, + "loss": 0.7044, + "step": 18313 + }, + { + "epoch": 0.63, + "learning_rate": 5.901754032693252e-06, + "loss": 0.6521, + "step": 18314 + }, + { + "epoch": 0.63, + "learning_rate": 5.9007608333598255e-06, + "loss": 0.5915, + "step": 18315 + }, + { + "epoch": 0.63, + "learning_rate": 5.8997676826280615e-06, + "loss": 0.6724, + "step": 18316 + }, + { + "epoch": 0.63, + "learning_rate": 5.898774580509735e-06, + "loss": 0.6321, + "step": 18317 + }, + { + "epoch": 0.63, + "learning_rate": 5.897781527016631e-06, + "loss": 0.6337, + "step": 18318 + }, + { + "epoch": 0.63, + "learning_rate": 5.896788522160512e-06, + "loss": 0.6, + "step": 18319 + }, + { + "epoch": 0.63, + "learning_rate": 5.895795565953154e-06, + "loss": 0.6386, + "step": 18320 + }, + { + "epoch": 0.63, + "learning_rate": 5.894802658406338e-06, + "loss": 0.6549, + "step": 18321 + }, + { + "epoch": 0.63, + "learning_rate": 5.893809799531825e-06, + "loss": 0.5791, + "step": 18322 + }, + { + "epoch": 0.63, + "learning_rate": 5.892816989341393e-06, + "loss": 0.6455, + "step": 18323 + }, + { + "epoch": 0.63, + "learning_rate": 5.8918242278468085e-06, + "loss": 0.6658, + "step": 18324 + }, + { + "epoch": 0.63, + "learning_rate": 5.890831515059845e-06, + "loss": 0.634, + "step": 18325 + }, + { + "epoch": 0.63, + "learning_rate": 5.889838850992275e-06, + "loss": 0.6009, + "step": 18326 + }, + { + "epoch": 0.63, + "learning_rate": 5.888846235655863e-06, + "loss": 0.71, + "step": 18327 + }, + { + "epoch": 0.64, + "learning_rate": 5.887853669062378e-06, + "loss": 0.5983, + "step": 18328 + }, + { + "epoch": 0.64, + "learning_rate": 5.886861151223593e-06, + "loss": 0.625, + "step": 18329 + }, + { + "epoch": 0.64, + "learning_rate": 5.885868682151269e-06, + "loss": 0.6372, + "step": 18330 + }, + { + "epoch": 0.64, + "learning_rate": 5.8848762618571765e-06, + "loss": 0.702, + "step": 18331 + }, + { + "epoch": 0.64, + "learning_rate": 5.8838838903530835e-06, + "loss": 0.6527, + "step": 18332 + }, + { + "epoch": 0.64, + "learning_rate": 5.882891567650752e-06, + "loss": 0.6041, + "step": 18333 + }, + { + "epoch": 0.64, + "learning_rate": 5.8818992937619504e-06, + "loss": 0.6749, + "step": 18334 + }, + { + "epoch": 0.64, + "learning_rate": 5.880907068698443e-06, + "loss": 0.6714, + "step": 18335 + }, + { + "epoch": 0.64, + "learning_rate": 5.879914892471991e-06, + "loss": 0.6645, + "step": 18336 + }, + { + "epoch": 0.64, + "learning_rate": 5.8789227650943595e-06, + "loss": 0.6411, + "step": 18337 + }, + { + "epoch": 0.64, + "learning_rate": 5.877930686577315e-06, + "loss": 0.6347, + "step": 18338 + }, + { + "epoch": 0.64, + "learning_rate": 5.876938656932614e-06, + "loss": 0.6272, + "step": 18339 + }, + { + "epoch": 0.64, + "learning_rate": 5.87594667617202e-06, + "loss": 0.6508, + "step": 18340 + }, + { + "epoch": 0.64, + "learning_rate": 5.8749547443072974e-06, + "loss": 0.6343, + "step": 18341 + }, + { + "epoch": 0.64, + "learning_rate": 5.873962861350204e-06, + "loss": 0.6393, + "step": 18342 + }, + { + "epoch": 0.64, + "learning_rate": 5.8729710273125e-06, + "loss": 0.6578, + "step": 18343 + }, + { + "epoch": 0.64, + "learning_rate": 5.871979242205945e-06, + "loss": 0.6485, + "step": 18344 + }, + { + "epoch": 0.64, + "learning_rate": 5.870987506042299e-06, + "loss": 0.6127, + "step": 18345 + }, + { + "epoch": 0.64, + "learning_rate": 5.869995818833317e-06, + "loss": 0.5931, + "step": 18346 + }, + { + "epoch": 0.64, + "learning_rate": 5.869004180590763e-06, + "loss": 0.6519, + "step": 18347 + }, + { + "epoch": 0.64, + "learning_rate": 5.868012591326386e-06, + "loss": 0.649, + "step": 18348 + }, + { + "epoch": 0.64, + "learning_rate": 5.867021051051949e-06, + "loss": 0.5766, + "step": 18349 + }, + { + "epoch": 0.64, + "learning_rate": 5.866029559779206e-06, + "loss": 0.6484, + "step": 18350 + }, + { + "epoch": 0.64, + "learning_rate": 5.86503811751991e-06, + "loss": 0.6725, + "step": 18351 + }, + { + "epoch": 0.64, + "learning_rate": 5.864046724285819e-06, + "loss": 0.5812, + "step": 18352 + }, + { + "epoch": 0.64, + "learning_rate": 5.863055380088687e-06, + "loss": 0.6391, + "step": 18353 + }, + { + "epoch": 0.64, + "learning_rate": 5.862064084940267e-06, + "loss": 0.643, + "step": 18354 + }, + { + "epoch": 0.64, + "learning_rate": 5.861072838852309e-06, + "loss": 0.5896, + "step": 18355 + }, + { + "epoch": 0.64, + "learning_rate": 5.860081641836571e-06, + "loss": 0.6033, + "step": 18356 + }, + { + "epoch": 0.64, + "learning_rate": 5.859090493904801e-06, + "loss": 0.6143, + "step": 18357 + }, + { + "epoch": 0.64, + "learning_rate": 5.8580993950687514e-06, + "loss": 0.6106, + "step": 18358 + }, + { + "epoch": 0.64, + "learning_rate": 5.857108345340175e-06, + "loss": 0.6879, + "step": 18359 + }, + { + "epoch": 0.64, + "learning_rate": 5.8561173447308174e-06, + "loss": 0.633, + "step": 18360 + }, + { + "epoch": 0.64, + "learning_rate": 5.855126393252431e-06, + "loss": 0.591, + "step": 18361 + }, + { + "epoch": 0.64, + "learning_rate": 5.854135490916766e-06, + "loss": 0.664, + "step": 18362 + }, + { + "epoch": 0.64, + "learning_rate": 5.8531446377355684e-06, + "loss": 0.6566, + "step": 18363 + }, + { + "epoch": 0.64, + "learning_rate": 5.852153833720586e-06, + "loss": 0.6321, + "step": 18364 + }, + { + "epoch": 0.64, + "learning_rate": 5.851163078883568e-06, + "loss": 0.6353, + "step": 18365 + }, + { + "epoch": 0.64, + "learning_rate": 5.85017237323626e-06, + "loss": 0.6291, + "step": 18366 + }, + { + "epoch": 0.64, + "learning_rate": 5.849181716790406e-06, + "loss": 0.6562, + "step": 18367 + }, + { + "epoch": 0.64, + "learning_rate": 5.8481911095577585e-06, + "loss": 0.7064, + "step": 18368 + }, + { + "epoch": 0.64, + "learning_rate": 5.847200551550054e-06, + "loss": 0.5965, + "step": 18369 + }, + { + "epoch": 0.64, + "learning_rate": 5.846210042779039e-06, + "loss": 0.6466, + "step": 18370 + }, + { + "epoch": 0.64, + "learning_rate": 5.845219583256462e-06, + "loss": 0.6814, + "step": 18371 + }, + { + "epoch": 0.64, + "learning_rate": 5.84422917299406e-06, + "loss": 0.6128, + "step": 18372 + }, + { + "epoch": 0.64, + "learning_rate": 5.843238812003579e-06, + "loss": 0.614, + "step": 18373 + }, + { + "epoch": 0.64, + "learning_rate": 5.842248500296761e-06, + "loss": 0.6695, + "step": 18374 + }, + { + "epoch": 0.64, + "learning_rate": 5.841258237885345e-06, + "loss": 0.6227, + "step": 18375 + }, + { + "epoch": 0.64, + "learning_rate": 5.840268024781075e-06, + "loss": 0.7205, + "step": 18376 + }, + { + "epoch": 0.64, + "learning_rate": 5.839277860995689e-06, + "loss": 0.6554, + "step": 18377 + }, + { + "epoch": 0.64, + "learning_rate": 5.838287746540927e-06, + "loss": 0.5762, + "step": 18378 + }, + { + "epoch": 0.64, + "learning_rate": 5.837297681428529e-06, + "loss": 0.5861, + "step": 18379 + }, + { + "epoch": 0.64, + "learning_rate": 5.836307665670236e-06, + "loss": 0.6945, + "step": 18380 + }, + { + "epoch": 0.64, + "learning_rate": 5.835317699277774e-06, + "loss": 0.5967, + "step": 18381 + }, + { + "epoch": 0.64, + "learning_rate": 5.834327782262894e-06, + "loss": 0.6365, + "step": 18382 + }, + { + "epoch": 0.64, + "learning_rate": 5.833337914637331e-06, + "loss": 0.6216, + "step": 18383 + }, + { + "epoch": 0.64, + "learning_rate": 5.832348096412814e-06, + "loss": 0.5834, + "step": 18384 + }, + { + "epoch": 0.64, + "learning_rate": 5.831358327601087e-06, + "loss": 0.6221, + "step": 18385 + }, + { + "epoch": 0.64, + "learning_rate": 5.830368608213876e-06, + "loss": 0.6294, + "step": 18386 + }, + { + "epoch": 0.64, + "learning_rate": 5.829378938262915e-06, + "loss": 0.6371, + "step": 18387 + }, + { + "epoch": 0.64, + "learning_rate": 5.828389317759953e-06, + "loss": 0.6047, + "step": 18388 + }, + { + "epoch": 0.64, + "learning_rate": 5.827399746716707e-06, + "loss": 0.6135, + "step": 18389 + }, + { + "epoch": 0.64, + "learning_rate": 5.8264102251449154e-06, + "loss": 0.6323, + "step": 18390 + }, + { + "epoch": 0.64, + "learning_rate": 5.8254207530563145e-06, + "loss": 0.6413, + "step": 18391 + }, + { + "epoch": 0.64, + "learning_rate": 5.824431330462626e-06, + "loss": 0.6534, + "step": 18392 + }, + { + "epoch": 0.64, + "learning_rate": 5.823441957375584e-06, + "loss": 0.6142, + "step": 18393 + }, + { + "epoch": 0.64, + "learning_rate": 5.822452633806928e-06, + "loss": 0.637, + "step": 18394 + }, + { + "epoch": 0.64, + "learning_rate": 5.821463359768378e-06, + "loss": 0.6188, + "step": 18395 + }, + { + "epoch": 0.64, + "learning_rate": 5.820474135271664e-06, + "loss": 0.5949, + "step": 18396 + }, + { + "epoch": 0.64, + "learning_rate": 5.8194849603285205e-06, + "loss": 0.6531, + "step": 18397 + }, + { + "epoch": 0.64, + "learning_rate": 5.8184958349506685e-06, + "loss": 0.618, + "step": 18398 + }, + { + "epoch": 0.64, + "learning_rate": 5.817506759149834e-06, + "loss": 0.627, + "step": 18399 + }, + { + "epoch": 0.64, + "learning_rate": 5.816517732937754e-06, + "loss": 0.63, + "step": 18400 + }, + { + "epoch": 0.64, + "learning_rate": 5.815528756326145e-06, + "loss": 0.6509, + "step": 18401 + }, + { + "epoch": 0.64, + "learning_rate": 5.814539829326737e-06, + "loss": 0.6335, + "step": 18402 + }, + { + "epoch": 0.64, + "learning_rate": 5.813550951951257e-06, + "loss": 0.5991, + "step": 18403 + }, + { + "epoch": 0.64, + "learning_rate": 5.812562124211423e-06, + "loss": 0.6797, + "step": 18404 + }, + { + "epoch": 0.64, + "learning_rate": 5.811573346118957e-06, + "loss": 0.6927, + "step": 18405 + }, + { + "epoch": 0.64, + "learning_rate": 5.810584617685597e-06, + "loss": 0.6544, + "step": 18406 + }, + { + "epoch": 0.64, + "learning_rate": 5.809595938923051e-06, + "loss": 0.5932, + "step": 18407 + }, + { + "epoch": 0.64, + "learning_rate": 5.808607309843046e-06, + "loss": 0.6231, + "step": 18408 + }, + { + "epoch": 0.64, + "learning_rate": 5.807618730457307e-06, + "loss": 0.6401, + "step": 18409 + }, + { + "epoch": 0.64, + "learning_rate": 5.80663020077755e-06, + "loss": 0.6642, + "step": 18410 + }, + { + "epoch": 0.64, + "learning_rate": 5.805641720815489e-06, + "loss": 0.6358, + "step": 18411 + }, + { + "epoch": 0.64, + "learning_rate": 5.804653290582862e-06, + "loss": 0.6258, + "step": 18412 + }, + { + "epoch": 0.64, + "learning_rate": 5.803664910091372e-06, + "loss": 0.5932, + "step": 18413 + }, + { + "epoch": 0.64, + "learning_rate": 5.802676579352744e-06, + "loss": 0.6202, + "step": 18414 + }, + { + "epoch": 0.64, + "learning_rate": 5.801688298378697e-06, + "loss": 0.601, + "step": 18415 + }, + { + "epoch": 0.64, + "learning_rate": 5.800700067180943e-06, + "loss": 0.6008, + "step": 18416 + }, + { + "epoch": 0.64, + "learning_rate": 5.799711885771198e-06, + "loss": 0.6468, + "step": 18417 + }, + { + "epoch": 0.64, + "learning_rate": 5.798723754161191e-06, + "loss": 0.6057, + "step": 18418 + }, + { + "epoch": 0.64, + "learning_rate": 5.7977356723626235e-06, + "loss": 0.6014, + "step": 18419 + }, + { + "epoch": 0.64, + "learning_rate": 5.796747640387215e-06, + "loss": 0.601, + "step": 18420 + }, + { + "epoch": 0.64, + "learning_rate": 5.795759658246684e-06, + "loss": 0.618, + "step": 18421 + }, + { + "epoch": 0.64, + "learning_rate": 5.794771725952738e-06, + "loss": 0.631, + "step": 18422 + }, + { + "epoch": 0.64, + "learning_rate": 5.793783843517089e-06, + "loss": 0.6554, + "step": 18423 + }, + { + "epoch": 0.64, + "learning_rate": 5.792796010951461e-06, + "loss": 0.6432, + "step": 18424 + }, + { + "epoch": 0.64, + "learning_rate": 5.791808228267554e-06, + "loss": 0.6487, + "step": 18425 + }, + { + "epoch": 0.64, + "learning_rate": 5.790820495477083e-06, + "loss": 0.6173, + "step": 18426 + }, + { + "epoch": 0.64, + "learning_rate": 5.789832812591764e-06, + "loss": 0.6434, + "step": 18427 + }, + { + "epoch": 0.64, + "learning_rate": 5.788845179623301e-06, + "loss": 0.5973, + "step": 18428 + }, + { + "epoch": 0.64, + "learning_rate": 5.787857596583399e-06, + "loss": 0.5873, + "step": 18429 + }, + { + "epoch": 0.64, + "learning_rate": 5.786870063483784e-06, + "loss": 0.6481, + "step": 18430 + }, + { + "epoch": 0.64, + "learning_rate": 5.785882580336148e-06, + "loss": 0.5765, + "step": 18431 + }, + { + "epoch": 0.64, + "learning_rate": 5.784895147152206e-06, + "loss": 0.6154, + "step": 18432 + }, + { + "epoch": 0.64, + "learning_rate": 5.783907763943668e-06, + "loss": 0.6633, + "step": 18433 + }, + { + "epoch": 0.64, + "learning_rate": 5.782920430722232e-06, + "loss": 0.6305, + "step": 18434 + }, + { + "epoch": 0.64, + "learning_rate": 5.781933147499605e-06, + "loss": 0.6345, + "step": 18435 + }, + { + "epoch": 0.64, + "learning_rate": 5.780945914287505e-06, + "loss": 0.6399, + "step": 18436 + }, + { + "epoch": 0.64, + "learning_rate": 5.779958731097626e-06, + "loss": 0.5914, + "step": 18437 + }, + { + "epoch": 0.64, + "learning_rate": 5.778971597941671e-06, + "loss": 0.695, + "step": 18438 + }, + { + "epoch": 0.64, + "learning_rate": 5.777984514831354e-06, + "loss": 0.6668, + "step": 18439 + }, + { + "epoch": 0.64, + "learning_rate": 5.776997481778367e-06, + "loss": 0.6328, + "step": 18440 + }, + { + "epoch": 0.64, + "learning_rate": 5.776010498794414e-06, + "loss": 0.6685, + "step": 18441 + }, + { + "epoch": 0.64, + "learning_rate": 5.7750235658912045e-06, + "loss": 0.6609, + "step": 18442 + }, + { + "epoch": 0.64, + "learning_rate": 5.774036683080435e-06, + "loss": 0.6175, + "step": 18443 + }, + { + "epoch": 0.64, + "learning_rate": 5.773049850373804e-06, + "loss": 0.655, + "step": 18444 + }, + { + "epoch": 0.64, + "learning_rate": 5.7720630677830194e-06, + "loss": 0.6347, + "step": 18445 + }, + { + "epoch": 0.64, + "learning_rate": 5.771076335319771e-06, + "loss": 0.6485, + "step": 18446 + }, + { + "epoch": 0.64, + "learning_rate": 5.770089652995763e-06, + "loss": 0.6577, + "step": 18447 + }, + { + "epoch": 0.64, + "learning_rate": 5.769103020822692e-06, + "loss": 0.6742, + "step": 18448 + }, + { + "epoch": 0.64, + "learning_rate": 5.768116438812257e-06, + "loss": 0.6585, + "step": 18449 + }, + { + "epoch": 0.64, + "learning_rate": 5.767129906976159e-06, + "loss": 0.6695, + "step": 18450 + }, + { + "epoch": 0.64, + "learning_rate": 5.766143425326087e-06, + "loss": 0.6016, + "step": 18451 + }, + { + "epoch": 0.64, + "learning_rate": 5.7651569938737395e-06, + "loss": 0.5678, + "step": 18452 + }, + { + "epoch": 0.64, + "learning_rate": 5.764170612630814e-06, + "loss": 0.6535, + "step": 18453 + }, + { + "epoch": 0.64, + "learning_rate": 5.763184281609004e-06, + "loss": 0.6216, + "step": 18454 + }, + { + "epoch": 0.64, + "learning_rate": 5.762198000820004e-06, + "loss": 0.6383, + "step": 18455 + }, + { + "epoch": 0.64, + "learning_rate": 5.761211770275512e-06, + "loss": 0.6483, + "step": 18456 + }, + { + "epoch": 0.64, + "learning_rate": 5.760225589987212e-06, + "loss": 0.6113, + "step": 18457 + }, + { + "epoch": 0.64, + "learning_rate": 5.759239459966801e-06, + "loss": 0.6571, + "step": 18458 + }, + { + "epoch": 0.64, + "learning_rate": 5.75825338022597e-06, + "loss": 0.5742, + "step": 18459 + }, + { + "epoch": 0.64, + "learning_rate": 5.757267350776412e-06, + "loss": 0.6476, + "step": 18460 + }, + { + "epoch": 0.64, + "learning_rate": 5.756281371629817e-06, + "loss": 0.6199, + "step": 18461 + }, + { + "epoch": 0.64, + "learning_rate": 5.755295442797877e-06, + "loss": 0.6304, + "step": 18462 + }, + { + "epoch": 0.64, + "learning_rate": 5.754309564292276e-06, + "loss": 0.6455, + "step": 18463 + }, + { + "epoch": 0.64, + "learning_rate": 5.753323736124707e-06, + "loss": 0.6818, + "step": 18464 + }, + { + "epoch": 0.64, + "learning_rate": 5.752337958306856e-06, + "loss": 0.672, + "step": 18465 + }, + { + "epoch": 0.64, + "learning_rate": 5.751352230850412e-06, + "loss": 0.6221, + "step": 18466 + }, + { + "epoch": 0.64, + "learning_rate": 5.750366553767061e-06, + "loss": 0.6119, + "step": 18467 + }, + { + "epoch": 0.64, + "learning_rate": 5.7493809270684965e-06, + "loss": 0.6296, + "step": 18468 + }, + { + "epoch": 0.64, + "learning_rate": 5.748395350766394e-06, + "loss": 0.6199, + "step": 18469 + }, + { + "epoch": 0.64, + "learning_rate": 5.747409824872441e-06, + "loss": 0.6244, + "step": 18470 + }, + { + "epoch": 0.64, + "learning_rate": 5.7464243493983256e-06, + "loss": 0.6685, + "step": 18471 + }, + { + "epoch": 0.64, + "learning_rate": 5.745438924355729e-06, + "loss": 0.6264, + "step": 18472 + }, + { + "epoch": 0.64, + "learning_rate": 5.744453549756337e-06, + "loss": 0.6076, + "step": 18473 + }, + { + "epoch": 0.64, + "learning_rate": 5.743468225611834e-06, + "loss": 0.6249, + "step": 18474 + }, + { + "epoch": 0.64, + "learning_rate": 5.742482951933899e-06, + "loss": 0.6141, + "step": 18475 + }, + { + "epoch": 0.64, + "learning_rate": 5.741497728734211e-06, + "loss": 0.6314, + "step": 18476 + }, + { + "epoch": 0.64, + "learning_rate": 5.740512556024455e-06, + "loss": 0.625, + "step": 18477 + }, + { + "epoch": 0.64, + "learning_rate": 5.739527433816313e-06, + "loss": 0.5982, + "step": 18478 + }, + { + "epoch": 0.64, + "learning_rate": 5.738542362121462e-06, + "loss": 0.6448, + "step": 18479 + }, + { + "epoch": 0.64, + "learning_rate": 5.737557340951585e-06, + "loss": 0.6305, + "step": 18480 + }, + { + "epoch": 0.64, + "learning_rate": 5.736572370318354e-06, + "loss": 0.5644, + "step": 18481 + }, + { + "epoch": 0.64, + "learning_rate": 5.7355874502334505e-06, + "loss": 0.649, + "step": 18482 + }, + { + "epoch": 0.64, + "learning_rate": 5.734602580708554e-06, + "loss": 0.656, + "step": 18483 + }, + { + "epoch": 0.64, + "learning_rate": 5.733617761755339e-06, + "loss": 0.6611, + "step": 18484 + }, + { + "epoch": 0.64, + "learning_rate": 5.732632993385481e-06, + "loss": 0.655, + "step": 18485 + }, + { + "epoch": 0.64, + "learning_rate": 5.731648275610663e-06, + "loss": 0.6325, + "step": 18486 + }, + { + "epoch": 0.64, + "learning_rate": 5.730663608442549e-06, + "loss": 0.628, + "step": 18487 + }, + { + "epoch": 0.64, + "learning_rate": 5.729678991892819e-06, + "loss": 0.6326, + "step": 18488 + }, + { + "epoch": 0.64, + "learning_rate": 5.728694425973147e-06, + "loss": 0.6195, + "step": 18489 + }, + { + "epoch": 0.64, + "learning_rate": 5.727709910695205e-06, + "loss": 0.6486, + "step": 18490 + }, + { + "epoch": 0.64, + "learning_rate": 5.726725446070667e-06, + "loss": 0.6689, + "step": 18491 + }, + { + "epoch": 0.64, + "learning_rate": 5.725741032111208e-06, + "loss": 0.646, + "step": 18492 + }, + { + "epoch": 0.64, + "learning_rate": 5.724756668828493e-06, + "loss": 0.6355, + "step": 18493 + }, + { + "epoch": 0.64, + "learning_rate": 5.723772356234194e-06, + "loss": 0.6673, + "step": 18494 + }, + { + "epoch": 0.64, + "learning_rate": 5.722788094339985e-06, + "loss": 0.6282, + "step": 18495 + }, + { + "epoch": 0.64, + "learning_rate": 5.721803883157533e-06, + "loss": 0.6325, + "step": 18496 + }, + { + "epoch": 0.64, + "learning_rate": 5.720819722698509e-06, + "loss": 0.6026, + "step": 18497 + }, + { + "epoch": 0.64, + "learning_rate": 5.719835612974583e-06, + "loss": 0.5965, + "step": 18498 + }, + { + "epoch": 0.64, + "learning_rate": 5.718851553997418e-06, + "loss": 0.656, + "step": 18499 + }, + { + "epoch": 0.64, + "learning_rate": 5.717867545778681e-06, + "loss": 0.5985, + "step": 18500 + }, + { + "epoch": 0.64, + "learning_rate": 5.716883588330043e-06, + "loss": 0.6137, + "step": 18501 + }, + { + "epoch": 0.64, + "learning_rate": 5.715899681663168e-06, + "loss": 0.6414, + "step": 18502 + }, + { + "epoch": 0.64, + "learning_rate": 5.714915825789722e-06, + "loss": 0.6264, + "step": 18503 + }, + { + "epoch": 0.64, + "learning_rate": 5.713932020721372e-06, + "loss": 0.6285, + "step": 18504 + }, + { + "epoch": 0.64, + "learning_rate": 5.7129482664697775e-06, + "loss": 0.6455, + "step": 18505 + }, + { + "epoch": 0.64, + "learning_rate": 5.711964563046604e-06, + "loss": 0.6454, + "step": 18506 + }, + { + "epoch": 0.64, + "learning_rate": 5.710980910463514e-06, + "loss": 0.663, + "step": 18507 + }, + { + "epoch": 0.64, + "learning_rate": 5.709997308732171e-06, + "loss": 0.5771, + "step": 18508 + }, + { + "epoch": 0.64, + "learning_rate": 5.709013757864243e-06, + "loss": 0.6843, + "step": 18509 + }, + { + "epoch": 0.64, + "learning_rate": 5.7080302578713786e-06, + "loss": 0.6139, + "step": 18510 + }, + { + "epoch": 0.64, + "learning_rate": 5.707046808765246e-06, + "loss": 0.6547, + "step": 18511 + }, + { + "epoch": 0.64, + "learning_rate": 5.706063410557503e-06, + "loss": 0.6701, + "step": 18512 + }, + { + "epoch": 0.64, + "learning_rate": 5.705080063259811e-06, + "loss": 0.6222, + "step": 18513 + }, + { + "epoch": 0.64, + "learning_rate": 5.7040967668838286e-06, + "loss": 0.6315, + "step": 18514 + }, + { + "epoch": 0.64, + "learning_rate": 5.703113521441217e-06, + "loss": 0.6334, + "step": 18515 + }, + { + "epoch": 0.64, + "learning_rate": 5.702130326943625e-06, + "loss": 0.5964, + "step": 18516 + }, + { + "epoch": 0.64, + "learning_rate": 5.701147183402715e-06, + "loss": 0.6433, + "step": 18517 + }, + { + "epoch": 0.64, + "learning_rate": 5.700164090830145e-06, + "loss": 0.6044, + "step": 18518 + }, + { + "epoch": 0.64, + "learning_rate": 5.699181049237568e-06, + "loss": 0.6298, + "step": 18519 + }, + { + "epoch": 0.64, + "learning_rate": 5.69819805863664e-06, + "loss": 0.6542, + "step": 18520 + }, + { + "epoch": 0.64, + "learning_rate": 5.69721511903902e-06, + "loss": 0.6473, + "step": 18521 + }, + { + "epoch": 0.64, + "learning_rate": 5.696232230456353e-06, + "loss": 0.6288, + "step": 18522 + }, + { + "epoch": 0.64, + "learning_rate": 5.695249392900299e-06, + "loss": 0.629, + "step": 18523 + }, + { + "epoch": 0.64, + "learning_rate": 5.694266606382508e-06, + "loss": 0.6146, + "step": 18524 + }, + { + "epoch": 0.64, + "learning_rate": 5.693283870914633e-06, + "loss": 0.6777, + "step": 18525 + }, + { + "epoch": 0.64, + "learning_rate": 5.692301186508327e-06, + "loss": 0.606, + "step": 18526 + }, + { + "epoch": 0.64, + "learning_rate": 5.6913185531752425e-06, + "loss": 0.6198, + "step": 18527 + }, + { + "epoch": 0.64, + "learning_rate": 5.690335970927022e-06, + "loss": 0.6426, + "step": 18528 + }, + { + "epoch": 0.64, + "learning_rate": 5.689353439775323e-06, + "loss": 0.6636, + "step": 18529 + }, + { + "epoch": 0.64, + "learning_rate": 5.68837095973179e-06, + "loss": 0.6337, + "step": 18530 + }, + { + "epoch": 0.64, + "learning_rate": 5.687388530808073e-06, + "loss": 0.6394, + "step": 18531 + }, + { + "epoch": 0.64, + "learning_rate": 5.686406153015822e-06, + "loss": 0.6539, + "step": 18532 + }, + { + "epoch": 0.64, + "learning_rate": 5.685423826366686e-06, + "loss": 0.6678, + "step": 18533 + }, + { + "epoch": 0.64, + "learning_rate": 5.684441550872304e-06, + "loss": 0.6449, + "step": 18534 + }, + { + "epoch": 0.64, + "learning_rate": 5.683459326544327e-06, + "loss": 0.6104, + "step": 18535 + }, + { + "epoch": 0.64, + "learning_rate": 5.682477153394401e-06, + "loss": 0.6503, + "step": 18536 + }, + { + "epoch": 0.64, + "learning_rate": 5.68149503143417e-06, + "loss": 0.6039, + "step": 18537 + }, + { + "epoch": 0.64, + "learning_rate": 5.680512960675277e-06, + "loss": 0.6505, + "step": 18538 + }, + { + "epoch": 0.64, + "learning_rate": 5.679530941129372e-06, + "loss": 0.6557, + "step": 18539 + }, + { + "epoch": 0.64, + "learning_rate": 5.678548972808089e-06, + "loss": 0.6932, + "step": 18540 + }, + { + "epoch": 0.64, + "learning_rate": 5.677567055723074e-06, + "loss": 0.6243, + "step": 18541 + }, + { + "epoch": 0.64, + "learning_rate": 5.676585189885971e-06, + "loss": 0.6445, + "step": 18542 + }, + { + "epoch": 0.64, + "learning_rate": 5.675603375308419e-06, + "loss": 0.6841, + "step": 18543 + }, + { + "epoch": 0.64, + "learning_rate": 5.674621612002059e-06, + "loss": 0.6448, + "step": 18544 + }, + { + "epoch": 0.64, + "learning_rate": 5.673639899978536e-06, + "loss": 0.6119, + "step": 18545 + }, + { + "epoch": 0.64, + "learning_rate": 5.67265823924948e-06, + "loss": 0.6367, + "step": 18546 + }, + { + "epoch": 0.64, + "learning_rate": 5.671676629826535e-06, + "loss": 0.6428, + "step": 18547 + }, + { + "epoch": 0.64, + "learning_rate": 5.670695071721339e-06, + "loss": 0.6887, + "step": 18548 + }, + { + "epoch": 0.64, + "learning_rate": 5.669713564945529e-06, + "loss": 0.7034, + "step": 18549 + }, + { + "epoch": 0.64, + "learning_rate": 5.668732109510744e-06, + "loss": 0.6404, + "step": 18550 + }, + { + "epoch": 0.64, + "learning_rate": 5.667750705428622e-06, + "loss": 0.6096, + "step": 18551 + }, + { + "epoch": 0.64, + "learning_rate": 5.666769352710791e-06, + "loss": 0.6785, + "step": 18552 + }, + { + "epoch": 0.64, + "learning_rate": 5.665788051368892e-06, + "loss": 0.6129, + "step": 18553 + }, + { + "epoch": 0.64, + "learning_rate": 5.664806801414557e-06, + "loss": 0.6169, + "step": 18554 + }, + { + "epoch": 0.64, + "learning_rate": 5.663825602859423e-06, + "loss": 0.6397, + "step": 18555 + }, + { + "epoch": 0.64, + "learning_rate": 5.662844455715122e-06, + "loss": 0.607, + "step": 18556 + }, + { + "epoch": 0.64, + "learning_rate": 5.661863359993289e-06, + "loss": 0.622, + "step": 18557 + }, + { + "epoch": 0.64, + "learning_rate": 5.660882315705551e-06, + "loss": 0.6601, + "step": 18558 + }, + { + "epoch": 0.64, + "learning_rate": 5.659901322863541e-06, + "loss": 0.627, + "step": 18559 + }, + { + "epoch": 0.64, + "learning_rate": 5.6589203814788915e-06, + "loss": 0.5909, + "step": 18560 + }, + { + "epoch": 0.64, + "learning_rate": 5.6579394915632336e-06, + "loss": 0.5948, + "step": 18561 + }, + { + "epoch": 0.64, + "learning_rate": 5.656958653128194e-06, + "loss": 0.6977, + "step": 18562 + }, + { + "epoch": 0.64, + "learning_rate": 5.655977866185408e-06, + "loss": 0.6197, + "step": 18563 + }, + { + "epoch": 0.64, + "learning_rate": 5.654997130746496e-06, + "loss": 0.6291, + "step": 18564 + }, + { + "epoch": 0.64, + "learning_rate": 5.654016446823089e-06, + "loss": 0.6803, + "step": 18565 + }, + { + "epoch": 0.64, + "learning_rate": 5.653035814426815e-06, + "loss": 0.6495, + "step": 18566 + }, + { + "epoch": 0.64, + "learning_rate": 5.6520552335693e-06, + "loss": 0.6599, + "step": 18567 + }, + { + "epoch": 0.64, + "learning_rate": 5.651074704262172e-06, + "loss": 0.6138, + "step": 18568 + }, + { + "epoch": 0.64, + "learning_rate": 5.650094226517056e-06, + "loss": 0.6902, + "step": 18569 + }, + { + "epoch": 0.64, + "learning_rate": 5.649113800345573e-06, + "loss": 0.6242, + "step": 18570 + }, + { + "epoch": 0.64, + "learning_rate": 5.64813342575935e-06, + "loss": 0.6066, + "step": 18571 + }, + { + "epoch": 0.64, + "learning_rate": 5.647153102770011e-06, + "loss": 0.6436, + "step": 18572 + }, + { + "epoch": 0.64, + "learning_rate": 5.646172831389178e-06, + "loss": 0.5881, + "step": 18573 + }, + { + "epoch": 0.64, + "learning_rate": 5.6451926116284774e-06, + "loss": 0.6671, + "step": 18574 + }, + { + "epoch": 0.64, + "learning_rate": 5.644212443499523e-06, + "loss": 0.6635, + "step": 18575 + }, + { + "epoch": 0.64, + "learning_rate": 5.643232327013941e-06, + "loss": 0.6364, + "step": 18576 + }, + { + "epoch": 0.64, + "learning_rate": 5.642252262183354e-06, + "loss": 0.6471, + "step": 18577 + }, + { + "epoch": 0.64, + "learning_rate": 5.641272249019372e-06, + "loss": 0.615, + "step": 18578 + }, + { + "epoch": 0.64, + "learning_rate": 5.6402922875336245e-06, + "loss": 0.6188, + "step": 18579 + }, + { + "epoch": 0.64, + "learning_rate": 5.639312377737731e-06, + "loss": 0.6152, + "step": 18580 + }, + { + "epoch": 0.64, + "learning_rate": 5.638332519643302e-06, + "loss": 0.6198, + "step": 18581 + }, + { + "epoch": 0.64, + "learning_rate": 5.637352713261959e-06, + "loss": 0.6897, + "step": 18582 + }, + { + "epoch": 0.64, + "learning_rate": 5.6363729586053206e-06, + "loss": 0.6419, + "step": 18583 + }, + { + "epoch": 0.64, + "learning_rate": 5.635393255684995e-06, + "loss": 0.6437, + "step": 18584 + }, + { + "epoch": 0.64, + "learning_rate": 5.634413604512605e-06, + "loss": 0.7086, + "step": 18585 + }, + { + "epoch": 0.64, + "learning_rate": 5.63343400509977e-06, + "loss": 0.6161, + "step": 18586 + }, + { + "epoch": 0.64, + "learning_rate": 5.632454457458094e-06, + "loss": 0.6126, + "step": 18587 + }, + { + "epoch": 0.64, + "learning_rate": 5.631474961599197e-06, + "loss": 0.6599, + "step": 18588 + }, + { + "epoch": 0.64, + "learning_rate": 5.630495517534693e-06, + "loss": 0.5881, + "step": 18589 + }, + { + "epoch": 0.64, + "learning_rate": 5.629516125276184e-06, + "loss": 0.6963, + "step": 18590 + }, + { + "epoch": 0.64, + "learning_rate": 5.628536784835295e-06, + "loss": 0.6453, + "step": 18591 + }, + { + "epoch": 0.64, + "learning_rate": 5.6275574962236354e-06, + "loss": 0.6465, + "step": 18592 + }, + { + "epoch": 0.64, + "learning_rate": 5.626578259452808e-06, + "loss": 0.6325, + "step": 18593 + }, + { + "epoch": 0.64, + "learning_rate": 5.62559907453443e-06, + "loss": 0.6277, + "step": 18594 + }, + { + "epoch": 0.64, + "learning_rate": 5.6246199414801115e-06, + "loss": 0.6301, + "step": 18595 + }, + { + "epoch": 0.64, + "learning_rate": 5.623640860301452e-06, + "loss": 0.6481, + "step": 18596 + }, + { + "epoch": 0.64, + "learning_rate": 5.6226618310100675e-06, + "loss": 0.6101, + "step": 18597 + }, + { + "epoch": 0.64, + "learning_rate": 5.6216828536175694e-06, + "loss": 0.6409, + "step": 18598 + }, + { + "epoch": 0.64, + "learning_rate": 5.620703928135556e-06, + "loss": 0.6581, + "step": 18599 + }, + { + "epoch": 0.64, + "learning_rate": 5.619725054575638e-06, + "loss": 0.6462, + "step": 18600 + }, + { + "epoch": 0.64, + "learning_rate": 5.618746232949423e-06, + "loss": 0.6213, + "step": 18601 + }, + { + "epoch": 0.64, + "learning_rate": 5.617767463268506e-06, + "loss": 0.6092, + "step": 18602 + }, + { + "epoch": 0.64, + "learning_rate": 5.6167887455445044e-06, + "loss": 0.6093, + "step": 18603 + }, + { + "epoch": 0.64, + "learning_rate": 5.615810079789022e-06, + "loss": 0.6661, + "step": 18604 + }, + { + "epoch": 0.64, + "learning_rate": 5.61483146601365e-06, + "loss": 0.6163, + "step": 18605 + }, + { + "epoch": 0.64, + "learning_rate": 5.613852904229999e-06, + "loss": 0.6147, + "step": 18606 + }, + { + "epoch": 0.64, + "learning_rate": 5.612874394449676e-06, + "loss": 0.6331, + "step": 18607 + }, + { + "epoch": 0.64, + "learning_rate": 5.611895936684269e-06, + "loss": 0.6213, + "step": 18608 + }, + { + "epoch": 0.64, + "learning_rate": 5.610917530945388e-06, + "loss": 0.6206, + "step": 18609 + }, + { + "epoch": 0.64, + "learning_rate": 5.609939177244639e-06, + "loss": 0.6367, + "step": 18610 + }, + { + "epoch": 0.64, + "learning_rate": 5.608960875593608e-06, + "loss": 0.6473, + "step": 18611 + }, + { + "epoch": 0.64, + "learning_rate": 5.607982626003901e-06, + "loss": 0.6446, + "step": 18612 + }, + { + "epoch": 0.64, + "learning_rate": 5.60700442848712e-06, + "loss": 0.5724, + "step": 18613 + }, + { + "epoch": 0.64, + "learning_rate": 5.606026283054852e-06, + "loss": 0.6074, + "step": 18614 + }, + { + "epoch": 0.64, + "learning_rate": 5.605048189718704e-06, + "loss": 0.6849, + "step": 18615 + }, + { + "epoch": 0.64, + "learning_rate": 5.604070148490273e-06, + "loss": 0.6634, + "step": 18616 + }, + { + "epoch": 0.65, + "learning_rate": 5.603092159381147e-06, + "loss": 0.5905, + "step": 18617 + }, + { + "epoch": 0.65, + "learning_rate": 5.602114222402925e-06, + "loss": 0.5544, + "step": 18618 + }, + { + "epoch": 0.65, + "learning_rate": 5.601136337567209e-06, + "loss": 0.6187, + "step": 18619 + }, + { + "epoch": 0.65, + "learning_rate": 5.600158504885577e-06, + "loss": 0.6261, + "step": 18620 + }, + { + "epoch": 0.65, + "learning_rate": 5.599180724369635e-06, + "loss": 0.6219, + "step": 18621 + }, + { + "epoch": 0.65, + "learning_rate": 5.598202996030977e-06, + "loss": 0.628, + "step": 18622 + }, + { + "epoch": 0.65, + "learning_rate": 5.597225319881187e-06, + "loss": 0.6022, + "step": 18623 + }, + { + "epoch": 0.65, + "learning_rate": 5.5962476959318605e-06, + "loss": 0.6413, + "step": 18624 + }, + { + "epoch": 0.65, + "learning_rate": 5.5952701241945915e-06, + "loss": 0.5863, + "step": 18625 + }, + { + "epoch": 0.65, + "learning_rate": 5.59429260468096e-06, + "loss": 0.6635, + "step": 18626 + }, + { + "epoch": 0.65, + "learning_rate": 5.5933151374025664e-06, + "loss": 0.6542, + "step": 18627 + }, + { + "epoch": 0.65, + "learning_rate": 5.592337722371e-06, + "loss": 0.6838, + "step": 18628 + }, + { + "epoch": 0.65, + "learning_rate": 5.591360359597842e-06, + "loss": 0.675, + "step": 18629 + }, + { + "epoch": 0.65, + "learning_rate": 5.590383049094683e-06, + "loss": 0.6635, + "step": 18630 + }, + { + "epoch": 0.65, + "learning_rate": 5.589405790873117e-06, + "loss": 0.6485, + "step": 18631 + }, + { + "epoch": 0.65, + "learning_rate": 5.588428584944716e-06, + "loss": 0.5744, + "step": 18632 + }, + { + "epoch": 0.65, + "learning_rate": 5.587451431321078e-06, + "loss": 0.6118, + "step": 18633 + }, + { + "epoch": 0.65, + "learning_rate": 5.586474330013791e-06, + "loss": 0.6431, + "step": 18634 + }, + { + "epoch": 0.65, + "learning_rate": 5.585497281034428e-06, + "loss": 0.6574, + "step": 18635 + }, + { + "epoch": 0.65, + "learning_rate": 5.584520284394584e-06, + "loss": 0.606, + "step": 18636 + }, + { + "epoch": 0.65, + "learning_rate": 5.583543340105835e-06, + "loss": 0.6273, + "step": 18637 + }, + { + "epoch": 0.65, + "learning_rate": 5.582566448179761e-06, + "loss": 0.5939, + "step": 18638 + }, + { + "epoch": 0.65, + "learning_rate": 5.581589608627958e-06, + "loss": 0.5921, + "step": 18639 + }, + { + "epoch": 0.65, + "learning_rate": 5.580612821461995e-06, + "loss": 0.6303, + "step": 18640 + }, + { + "epoch": 0.65, + "learning_rate": 5.579636086693459e-06, + "loss": 0.6122, + "step": 18641 + }, + { + "epoch": 0.65, + "learning_rate": 5.57865940433393e-06, + "loss": 0.663, + "step": 18642 + }, + { + "epoch": 0.65, + "learning_rate": 5.577682774394985e-06, + "loss": 0.6854, + "step": 18643 + }, + { + "epoch": 0.65, + "learning_rate": 5.576706196888202e-06, + "loss": 0.6024, + "step": 18644 + }, + { + "epoch": 0.65, + "learning_rate": 5.575729671825169e-06, + "loss": 0.6712, + "step": 18645 + }, + { + "epoch": 0.65, + "learning_rate": 5.574753199217453e-06, + "loss": 0.6662, + "step": 18646 + }, + { + "epoch": 0.65, + "learning_rate": 5.5737767790766375e-06, + "loss": 0.6502, + "step": 18647 + }, + { + "epoch": 0.65, + "learning_rate": 5.572800411414301e-06, + "loss": 0.6865, + "step": 18648 + }, + { + "epoch": 0.65, + "learning_rate": 5.571824096242011e-06, + "loss": 0.5867, + "step": 18649 + }, + { + "epoch": 0.65, + "learning_rate": 5.570847833571344e-06, + "loss": 0.6256, + "step": 18650 + }, + { + "epoch": 0.65, + "learning_rate": 5.569871623413887e-06, + "loss": 0.6101, + "step": 18651 + }, + { + "epoch": 0.65, + "learning_rate": 5.568895465781203e-06, + "loss": 0.6574, + "step": 18652 + }, + { + "epoch": 0.65, + "learning_rate": 5.567919360684868e-06, + "loss": 0.6543, + "step": 18653 + }, + { + "epoch": 0.65, + "learning_rate": 5.566943308136461e-06, + "loss": 0.6294, + "step": 18654 + }, + { + "epoch": 0.65, + "learning_rate": 5.565967308147543e-06, + "loss": 0.5899, + "step": 18655 + }, + { + "epoch": 0.65, + "learning_rate": 5.564991360729688e-06, + "loss": 0.6456, + "step": 18656 + }, + { + "epoch": 0.65, + "learning_rate": 5.564015465894479e-06, + "loss": 0.6163, + "step": 18657 + }, + { + "epoch": 0.65, + "learning_rate": 5.563039623653474e-06, + "loss": 0.6577, + "step": 18658 + }, + { + "epoch": 0.65, + "learning_rate": 5.562063834018247e-06, + "loss": 0.6126, + "step": 18659 + }, + { + "epoch": 0.65, + "learning_rate": 5.561088097000373e-06, + "loss": 0.6038, + "step": 18660 + }, + { + "epoch": 0.65, + "learning_rate": 5.56011241261141e-06, + "loss": 0.65, + "step": 18661 + }, + { + "epoch": 0.65, + "learning_rate": 5.559136780862926e-06, + "loss": 0.6834, + "step": 18662 + }, + { + "epoch": 0.65, + "learning_rate": 5.558161201766501e-06, + "loss": 0.6208, + "step": 18663 + }, + { + "epoch": 0.65, + "learning_rate": 5.557185675333689e-06, + "loss": 0.6537, + "step": 18664 + }, + { + "epoch": 0.65, + "learning_rate": 5.556210201576063e-06, + "loss": 0.6154, + "step": 18665 + }, + { + "epoch": 0.65, + "learning_rate": 5.55523478050519e-06, + "loss": 0.6564, + "step": 18666 + }, + { + "epoch": 0.65, + "learning_rate": 5.554259412132628e-06, + "loss": 0.6231, + "step": 18667 + }, + { + "epoch": 0.65, + "learning_rate": 5.5532840964699396e-06, + "loss": 0.6143, + "step": 18668 + }, + { + "epoch": 0.65, + "learning_rate": 5.552308833528701e-06, + "loss": 0.6424, + "step": 18669 + }, + { + "epoch": 0.65, + "learning_rate": 5.551333623320464e-06, + "loss": 0.6034, + "step": 18670 + }, + { + "epoch": 0.65, + "learning_rate": 5.550358465856796e-06, + "loss": 0.5745, + "step": 18671 + }, + { + "epoch": 0.65, + "learning_rate": 5.549383361149259e-06, + "loss": 0.6572, + "step": 18672 + }, + { + "epoch": 0.65, + "learning_rate": 5.548408309209409e-06, + "loss": 0.6309, + "step": 18673 + }, + { + "epoch": 0.65, + "learning_rate": 5.5474333100488056e-06, + "loss": 0.6482, + "step": 18674 + }, + { + "epoch": 0.65, + "learning_rate": 5.5464583636790214e-06, + "loss": 0.6908, + "step": 18675 + }, + { + "epoch": 0.65, + "learning_rate": 5.545483470111603e-06, + "loss": 0.6263, + "step": 18676 + }, + { + "epoch": 0.65, + "learning_rate": 5.544508629358112e-06, + "loss": 0.6475, + "step": 18677 + }, + { + "epoch": 0.65, + "learning_rate": 5.543533841430112e-06, + "loss": 0.6703, + "step": 18678 + }, + { + "epoch": 0.65, + "learning_rate": 5.542559106339152e-06, + "loss": 0.6379, + "step": 18679 + }, + { + "epoch": 0.65, + "learning_rate": 5.541584424096793e-06, + "loss": 0.5784, + "step": 18680 + }, + { + "epoch": 0.65, + "learning_rate": 5.54060979471459e-06, + "loss": 0.6447, + "step": 18681 + }, + { + "epoch": 0.65, + "learning_rate": 5.539635218204099e-06, + "loss": 0.6204, + "step": 18682 + }, + { + "epoch": 0.65, + "learning_rate": 5.538660694576875e-06, + "loss": 0.6124, + "step": 18683 + }, + { + "epoch": 0.65, + "learning_rate": 5.537686223844476e-06, + "loss": 0.5753, + "step": 18684 + }, + { + "epoch": 0.65, + "learning_rate": 5.536711806018448e-06, + "loss": 0.7029, + "step": 18685 + }, + { + "epoch": 0.65, + "learning_rate": 5.535737441110347e-06, + "loss": 0.613, + "step": 18686 + }, + { + "epoch": 0.65, + "learning_rate": 5.534763129131726e-06, + "loss": 0.6263, + "step": 18687 + }, + { + "epoch": 0.65, + "learning_rate": 5.533788870094137e-06, + "loss": 0.6055, + "step": 18688 + }, + { + "epoch": 0.65, + "learning_rate": 5.5328146640091315e-06, + "loss": 0.6021, + "step": 18689 + }, + { + "epoch": 0.65, + "learning_rate": 5.531840510888262e-06, + "loss": 0.6555, + "step": 18690 + }, + { + "epoch": 0.65, + "learning_rate": 5.530866410743072e-06, + "loss": 0.6272, + "step": 18691 + }, + { + "epoch": 0.65, + "learning_rate": 5.529892363585114e-06, + "loss": 0.64, + "step": 18692 + }, + { + "epoch": 0.65, + "learning_rate": 5.528918369425937e-06, + "loss": 0.5969, + "step": 18693 + }, + { + "epoch": 0.65, + "learning_rate": 5.527944428277088e-06, + "loss": 0.6023, + "step": 18694 + }, + { + "epoch": 0.65, + "learning_rate": 5.526970540150116e-06, + "loss": 0.6231, + "step": 18695 + }, + { + "epoch": 0.65, + "learning_rate": 5.52599670505657e-06, + "loss": 0.6478, + "step": 18696 + }, + { + "epoch": 0.65, + "learning_rate": 5.525022923007989e-06, + "loss": 0.6373, + "step": 18697 + }, + { + "epoch": 0.65, + "learning_rate": 5.524049194015921e-06, + "loss": 0.584, + "step": 18698 + }, + { + "epoch": 0.65, + "learning_rate": 5.523075518091914e-06, + "loss": 0.5929, + "step": 18699 + }, + { + "epoch": 0.65, + "learning_rate": 5.522101895247509e-06, + "loss": 0.6489, + "step": 18700 + }, + { + "epoch": 0.65, + "learning_rate": 5.521128325494254e-06, + "loss": 0.7073, + "step": 18701 + }, + { + "epoch": 0.65, + "learning_rate": 5.520154808843685e-06, + "loss": 0.62, + "step": 18702 + }, + { + "epoch": 0.65, + "learning_rate": 5.519181345307348e-06, + "loss": 0.6222, + "step": 18703 + }, + { + "epoch": 0.65, + "learning_rate": 5.518207934896784e-06, + "loss": 0.6505, + "step": 18704 + }, + { + "epoch": 0.65, + "learning_rate": 5.517234577623535e-06, + "loss": 0.6894, + "step": 18705 + }, + { + "epoch": 0.65, + "learning_rate": 5.516261273499139e-06, + "loss": 0.5831, + "step": 18706 + }, + { + "epoch": 0.65, + "learning_rate": 5.515288022535144e-06, + "loss": 0.6026, + "step": 18707 + }, + { + "epoch": 0.65, + "learning_rate": 5.514314824743078e-06, + "loss": 0.624, + "step": 18708 + }, + { + "epoch": 0.65, + "learning_rate": 5.513341680134483e-06, + "loss": 0.6011, + "step": 18709 + }, + { + "epoch": 0.65, + "learning_rate": 5.5123685887209e-06, + "loss": 0.6429, + "step": 18710 + }, + { + "epoch": 0.65, + "learning_rate": 5.511395550513863e-06, + "loss": 0.6626, + "step": 18711 + }, + { + "epoch": 0.65, + "learning_rate": 5.51042256552491e-06, + "loss": 0.6476, + "step": 18712 + }, + { + "epoch": 0.65, + "learning_rate": 5.50944963376558e-06, + "loss": 0.6487, + "step": 18713 + }, + { + "epoch": 0.65, + "learning_rate": 5.508476755247403e-06, + "loss": 0.6274, + "step": 18714 + }, + { + "epoch": 0.65, + "learning_rate": 5.507503929981914e-06, + "loss": 0.6728, + "step": 18715 + }, + { + "epoch": 0.65, + "learning_rate": 5.50653115798065e-06, + "loss": 0.6294, + "step": 18716 + }, + { + "epoch": 0.65, + "learning_rate": 5.505558439255144e-06, + "loss": 0.6568, + "step": 18717 + }, + { + "epoch": 0.65, + "learning_rate": 5.5045857738169274e-06, + "loss": 0.6457, + "step": 18718 + }, + { + "epoch": 0.65, + "learning_rate": 5.5036131616775365e-06, + "loss": 0.612, + "step": 18719 + }, + { + "epoch": 0.65, + "learning_rate": 5.502640602848497e-06, + "loss": 0.6166, + "step": 18720 + }, + { + "epoch": 0.65, + "learning_rate": 5.5016680973413416e-06, + "loss": 0.5848, + "step": 18721 + }, + { + "epoch": 0.65, + "learning_rate": 5.500695645167602e-06, + "loss": 0.6077, + "step": 18722 + }, + { + "epoch": 0.65, + "learning_rate": 5.499723246338806e-06, + "loss": 0.6225, + "step": 18723 + }, + { + "epoch": 0.65, + "learning_rate": 5.498750900866484e-06, + "loss": 0.552, + "step": 18724 + }, + { + "epoch": 0.65, + "learning_rate": 5.497778608762168e-06, + "loss": 0.6493, + "step": 18725 + }, + { + "epoch": 0.65, + "learning_rate": 5.49680637003738e-06, + "loss": 0.6355, + "step": 18726 + }, + { + "epoch": 0.65, + "learning_rate": 5.495834184703647e-06, + "loss": 0.6216, + "step": 18727 + }, + { + "epoch": 0.65, + "learning_rate": 5.494862052772498e-06, + "loss": 0.6353, + "step": 18728 + }, + { + "epoch": 0.65, + "learning_rate": 5.493889974255458e-06, + "loss": 0.6077, + "step": 18729 + }, + { + "epoch": 0.65, + "learning_rate": 5.4929179491640535e-06, + "loss": 0.627, + "step": 18730 + }, + { + "epoch": 0.65, + "learning_rate": 5.4919459775098115e-06, + "loss": 0.6438, + "step": 18731 + }, + { + "epoch": 0.65, + "learning_rate": 5.490974059304248e-06, + "loss": 0.6157, + "step": 18732 + }, + { + "epoch": 0.65, + "learning_rate": 5.490002194558892e-06, + "loss": 0.6238, + "step": 18733 + }, + { + "epoch": 0.65, + "learning_rate": 5.4890303832852655e-06, + "loss": 0.625, + "step": 18734 + }, + { + "epoch": 0.65, + "learning_rate": 5.48805862549489e-06, + "loss": 0.5963, + "step": 18735 + }, + { + "epoch": 0.65, + "learning_rate": 5.487086921199287e-06, + "loss": 0.6191, + "step": 18736 + }, + { + "epoch": 0.65, + "learning_rate": 5.4861152704099805e-06, + "loss": 0.6446, + "step": 18737 + }, + { + "epoch": 0.65, + "learning_rate": 5.4851436731384845e-06, + "loss": 0.6068, + "step": 18738 + }, + { + "epoch": 0.65, + "learning_rate": 5.484172129396322e-06, + "loss": 0.6133, + "step": 18739 + }, + { + "epoch": 0.65, + "learning_rate": 5.48320063919501e-06, + "loss": 0.6453, + "step": 18740 + }, + { + "epoch": 0.65, + "learning_rate": 5.48222920254607e-06, + "loss": 0.6771, + "step": 18741 + }, + { + "epoch": 0.65, + "learning_rate": 5.481257819461016e-06, + "loss": 0.6446, + "step": 18742 + }, + { + "epoch": 0.65, + "learning_rate": 5.480286489951372e-06, + "loss": 0.6516, + "step": 18743 + }, + { + "epoch": 0.65, + "learning_rate": 5.479315214028645e-06, + "loss": 0.6111, + "step": 18744 + }, + { + "epoch": 0.65, + "learning_rate": 5.478343991704354e-06, + "loss": 0.58, + "step": 18745 + }, + { + "epoch": 0.65, + "learning_rate": 5.477372822990016e-06, + "loss": 0.6264, + "step": 18746 + }, + { + "epoch": 0.65, + "learning_rate": 5.4764017078971436e-06, + "loss": 0.6105, + "step": 18747 + }, + { + "epoch": 0.65, + "learning_rate": 5.475430646437252e-06, + "loss": 0.6469, + "step": 18748 + }, + { + "epoch": 0.65, + "learning_rate": 5.474459638621857e-06, + "loss": 0.5758, + "step": 18749 + }, + { + "epoch": 0.65, + "learning_rate": 5.473488684462465e-06, + "loss": 0.6332, + "step": 18750 + }, + { + "epoch": 0.65, + "learning_rate": 5.47251778397059e-06, + "loss": 0.6013, + "step": 18751 + }, + { + "epoch": 0.65, + "learning_rate": 5.471546937157743e-06, + "loss": 0.6139, + "step": 18752 + }, + { + "epoch": 0.65, + "learning_rate": 5.470576144035437e-06, + "loss": 0.6841, + "step": 18753 + }, + { + "epoch": 0.65, + "learning_rate": 5.4696054046151795e-06, + "loss": 0.6233, + "step": 18754 + }, + { + "epoch": 0.65, + "learning_rate": 5.468634718908486e-06, + "loss": 0.6672, + "step": 18755 + }, + { + "epoch": 0.65, + "learning_rate": 5.4676640869268545e-06, + "loss": 0.6378, + "step": 18756 + }, + { + "epoch": 0.65, + "learning_rate": 5.4666935086818e-06, + "loss": 0.5949, + "step": 18757 + }, + { + "epoch": 0.65, + "learning_rate": 5.465722984184828e-06, + "loss": 0.6301, + "step": 18758 + }, + { + "epoch": 0.65, + "learning_rate": 5.464752513447447e-06, + "loss": 0.6329, + "step": 18759 + }, + { + "epoch": 0.65, + "learning_rate": 5.463782096481165e-06, + "loss": 0.6536, + "step": 18760 + }, + { + "epoch": 0.65, + "learning_rate": 5.46281173329748e-06, + "loss": 0.5711, + "step": 18761 + }, + { + "epoch": 0.65, + "learning_rate": 5.461841423907903e-06, + "loss": 0.6513, + "step": 18762 + }, + { + "epoch": 0.65, + "learning_rate": 5.460871168323936e-06, + "loss": 0.614, + "step": 18763 + }, + { + "epoch": 0.65, + "learning_rate": 5.459900966557084e-06, + "loss": 0.6025, + "step": 18764 + }, + { + "epoch": 0.65, + "learning_rate": 5.458930818618848e-06, + "loss": 0.6519, + "step": 18765 + }, + { + "epoch": 0.65, + "learning_rate": 5.457960724520737e-06, + "loss": 0.6151, + "step": 18766 + }, + { + "epoch": 0.65, + "learning_rate": 5.456990684274241e-06, + "loss": 0.6653, + "step": 18767 + }, + { + "epoch": 0.65, + "learning_rate": 5.456020697890869e-06, + "loss": 0.6357, + "step": 18768 + }, + { + "epoch": 0.65, + "learning_rate": 5.455050765382121e-06, + "loss": 0.6588, + "step": 18769 + }, + { + "epoch": 0.65, + "learning_rate": 5.454080886759494e-06, + "loss": 0.6052, + "step": 18770 + }, + { + "epoch": 0.65, + "learning_rate": 5.453111062034489e-06, + "loss": 0.6235, + "step": 18771 + }, + { + "epoch": 0.65, + "learning_rate": 5.452141291218609e-06, + "loss": 0.6141, + "step": 18772 + }, + { + "epoch": 0.65, + "learning_rate": 5.451171574323342e-06, + "loss": 0.6605, + "step": 18773 + }, + { + "epoch": 0.65, + "learning_rate": 5.45020191136019e-06, + "loss": 0.5592, + "step": 18774 + }, + { + "epoch": 0.65, + "learning_rate": 5.44923230234065e-06, + "loss": 0.5957, + "step": 18775 + }, + { + "epoch": 0.65, + "learning_rate": 5.448262747276219e-06, + "loss": 0.6443, + "step": 18776 + }, + { + "epoch": 0.65, + "learning_rate": 5.44729324617839e-06, + "loss": 0.6179, + "step": 18777 + }, + { + "epoch": 0.65, + "learning_rate": 5.446323799058664e-06, + "loss": 0.6301, + "step": 18778 + }, + { + "epoch": 0.65, + "learning_rate": 5.445354405928524e-06, + "loss": 0.6541, + "step": 18779 + }, + { + "epoch": 0.65, + "learning_rate": 5.444385066799471e-06, + "loss": 0.63, + "step": 18780 + }, + { + "epoch": 0.65, + "learning_rate": 5.443415781682995e-06, + "loss": 0.5873, + "step": 18781 + }, + { + "epoch": 0.65, + "learning_rate": 5.442446550590589e-06, + "loss": 0.6209, + "step": 18782 + }, + { + "epoch": 0.65, + "learning_rate": 5.441477373533744e-06, + "loss": 0.6232, + "step": 18783 + }, + { + "epoch": 0.65, + "learning_rate": 5.440508250523956e-06, + "loss": 0.5795, + "step": 18784 + }, + { + "epoch": 0.65, + "learning_rate": 5.439539181572706e-06, + "loss": 0.6263, + "step": 18785 + }, + { + "epoch": 0.65, + "learning_rate": 5.438570166691488e-06, + "loss": 0.6504, + "step": 18786 + }, + { + "epoch": 0.65, + "learning_rate": 5.437601205891791e-06, + "loss": 0.6331, + "step": 18787 + }, + { + "epoch": 0.65, + "learning_rate": 5.436632299185105e-06, + "loss": 0.5978, + "step": 18788 + }, + { + "epoch": 0.65, + "learning_rate": 5.435663446582913e-06, + "loss": 0.5912, + "step": 18789 + }, + { + "epoch": 0.65, + "learning_rate": 5.43469464809671e-06, + "loss": 0.6343, + "step": 18790 + }, + { + "epoch": 0.65, + "learning_rate": 5.433725903737974e-06, + "loss": 0.6708, + "step": 18791 + }, + { + "epoch": 0.65, + "learning_rate": 5.4327572135181915e-06, + "loss": 0.6066, + "step": 18792 + }, + { + "epoch": 0.65, + "learning_rate": 5.431788577448852e-06, + "loss": 0.661, + "step": 18793 + }, + { + "epoch": 0.65, + "learning_rate": 5.4308199955414365e-06, + "loss": 0.6266, + "step": 18794 + }, + { + "epoch": 0.65, + "learning_rate": 5.42985146780743e-06, + "loss": 0.6041, + "step": 18795 + }, + { + "epoch": 0.65, + "learning_rate": 5.42888299425832e-06, + "loss": 0.634, + "step": 18796 + }, + { + "epoch": 0.65, + "learning_rate": 5.4279145749055814e-06, + "loss": 0.6433, + "step": 18797 + }, + { + "epoch": 0.65, + "learning_rate": 5.426946209760698e-06, + "loss": 0.641, + "step": 18798 + }, + { + "epoch": 0.65, + "learning_rate": 5.425977898835153e-06, + "loss": 0.6884, + "step": 18799 + }, + { + "epoch": 0.65, + "learning_rate": 5.425009642140426e-06, + "loss": 0.6571, + "step": 18800 + }, + { + "epoch": 0.65, + "learning_rate": 5.424041439687997e-06, + "loss": 0.6164, + "step": 18801 + }, + { + "epoch": 0.65, + "learning_rate": 5.423073291489349e-06, + "loss": 0.6044, + "step": 18802 + }, + { + "epoch": 0.65, + "learning_rate": 5.422105197555954e-06, + "loss": 0.5461, + "step": 18803 + }, + { + "epoch": 0.65, + "learning_rate": 5.421137157899291e-06, + "loss": 0.6546, + "step": 18804 + }, + { + "epoch": 0.65, + "learning_rate": 5.42016917253084e-06, + "loss": 0.7119, + "step": 18805 + }, + { + "epoch": 0.65, + "learning_rate": 5.419201241462078e-06, + "loss": 0.6135, + "step": 18806 + }, + { + "epoch": 0.65, + "learning_rate": 5.418233364704479e-06, + "loss": 0.5968, + "step": 18807 + }, + { + "epoch": 0.65, + "learning_rate": 5.4172655422695246e-06, + "loss": 0.6308, + "step": 18808 + }, + { + "epoch": 0.65, + "learning_rate": 5.41629777416868e-06, + "loss": 0.6069, + "step": 18809 + }, + { + "epoch": 0.65, + "learning_rate": 5.415330060413423e-06, + "loss": 0.6512, + "step": 18810 + }, + { + "epoch": 0.65, + "learning_rate": 5.414362401015228e-06, + "loss": 0.6018, + "step": 18811 + }, + { + "epoch": 0.65, + "learning_rate": 5.413394795985567e-06, + "loss": 0.6111, + "step": 18812 + }, + { + "epoch": 0.65, + "learning_rate": 5.412427245335914e-06, + "loss": 0.6455, + "step": 18813 + }, + { + "epoch": 0.65, + "learning_rate": 5.411459749077743e-06, + "loss": 0.6587, + "step": 18814 + }, + { + "epoch": 0.65, + "learning_rate": 5.410492307222517e-06, + "loss": 0.6637, + "step": 18815 + }, + { + "epoch": 0.65, + "learning_rate": 5.4095249197817105e-06, + "loss": 0.6533, + "step": 18816 + }, + { + "epoch": 0.65, + "learning_rate": 5.408557586766794e-06, + "loss": 0.6098, + "step": 18817 + }, + { + "epoch": 0.65, + "learning_rate": 5.4075903081892345e-06, + "loss": 0.6572, + "step": 18818 + }, + { + "epoch": 0.65, + "learning_rate": 5.4066230840605005e-06, + "loss": 0.6085, + "step": 18819 + }, + { + "epoch": 0.65, + "learning_rate": 5.405655914392065e-06, + "loss": 0.6952, + "step": 18820 + }, + { + "epoch": 0.65, + "learning_rate": 5.4046887991953874e-06, + "loss": 0.6558, + "step": 18821 + }, + { + "epoch": 0.65, + "learning_rate": 5.403721738481941e-06, + "loss": 0.6022, + "step": 18822 + }, + { + "epoch": 0.65, + "learning_rate": 5.402754732263179e-06, + "loss": 0.6361, + "step": 18823 + }, + { + "epoch": 0.65, + "learning_rate": 5.4017877805505806e-06, + "loss": 0.6465, + "step": 18824 + }, + { + "epoch": 0.65, + "learning_rate": 5.400820883355606e-06, + "loss": 0.6199, + "step": 18825 + }, + { + "epoch": 0.65, + "learning_rate": 5.399854040689716e-06, + "loss": 0.6287, + "step": 18826 + }, + { + "epoch": 0.65, + "learning_rate": 5.3988872525643755e-06, + "loss": 0.6634, + "step": 18827 + }, + { + "epoch": 0.65, + "learning_rate": 5.397920518991051e-06, + "loss": 0.681, + "step": 18828 + }, + { + "epoch": 0.65, + "learning_rate": 5.396953839981191e-06, + "loss": 0.6088, + "step": 18829 + }, + { + "epoch": 0.65, + "learning_rate": 5.395987215546272e-06, + "loss": 0.6391, + "step": 18830 + }, + { + "epoch": 0.65, + "learning_rate": 5.395020645697753e-06, + "loss": 0.6673, + "step": 18831 + }, + { + "epoch": 0.65, + "learning_rate": 5.394054130447084e-06, + "loss": 0.6078, + "step": 18832 + }, + { + "epoch": 0.65, + "learning_rate": 5.39308766980573e-06, + "loss": 0.6446, + "step": 18833 + }, + { + "epoch": 0.65, + "learning_rate": 5.392121263785154e-06, + "loss": 0.6705, + "step": 18834 + }, + { + "epoch": 0.65, + "learning_rate": 5.391154912396801e-06, + "loss": 0.5928, + "step": 18835 + }, + { + "epoch": 0.65, + "learning_rate": 5.390188615652141e-06, + "loss": 0.6418, + "step": 18836 + }, + { + "epoch": 0.65, + "learning_rate": 5.38922237356263e-06, + "loss": 0.6615, + "step": 18837 + }, + { + "epoch": 0.65, + "learning_rate": 5.388256186139718e-06, + "loss": 0.6757, + "step": 18838 + }, + { + "epoch": 0.65, + "learning_rate": 5.38729005339486e-06, + "loss": 0.6844, + "step": 18839 + }, + { + "epoch": 0.65, + "learning_rate": 5.38632397533952e-06, + "loss": 0.6342, + "step": 18840 + }, + { + "epoch": 0.65, + "learning_rate": 5.385357951985137e-06, + "loss": 0.6112, + "step": 18841 + }, + { + "epoch": 0.65, + "learning_rate": 5.384391983343175e-06, + "loss": 0.6574, + "step": 18842 + }, + { + "epoch": 0.65, + "learning_rate": 5.3834260694250915e-06, + "loss": 0.6427, + "step": 18843 + }, + { + "epoch": 0.65, + "learning_rate": 5.382460210242328e-06, + "loss": 0.5852, + "step": 18844 + }, + { + "epoch": 0.65, + "learning_rate": 5.381494405806338e-06, + "loss": 0.5983, + "step": 18845 + }, + { + "epoch": 0.65, + "learning_rate": 5.38052865612858e-06, + "loss": 0.6795, + "step": 18846 + }, + { + "epoch": 0.65, + "learning_rate": 5.379562961220489e-06, + "loss": 0.6414, + "step": 18847 + }, + { + "epoch": 0.65, + "learning_rate": 5.378597321093528e-06, + "loss": 0.611, + "step": 18848 + }, + { + "epoch": 0.65, + "learning_rate": 5.377631735759148e-06, + "loss": 0.6227, + "step": 18849 + }, + { + "epoch": 0.65, + "learning_rate": 5.376666205228784e-06, + "loss": 0.6264, + "step": 18850 + }, + { + "epoch": 0.65, + "learning_rate": 5.375700729513893e-06, + "loss": 0.5987, + "step": 18851 + }, + { + "epoch": 0.65, + "learning_rate": 5.374735308625923e-06, + "loss": 0.6112, + "step": 18852 + }, + { + "epoch": 0.65, + "learning_rate": 5.373769942576308e-06, + "loss": 0.6333, + "step": 18853 + }, + { + "epoch": 0.65, + "learning_rate": 5.372804631376508e-06, + "loss": 0.6481, + "step": 18854 + }, + { + "epoch": 0.65, + "learning_rate": 5.371839375037966e-06, + "loss": 0.5923, + "step": 18855 + }, + { + "epoch": 0.65, + "learning_rate": 5.370874173572118e-06, + "loss": 0.6754, + "step": 18856 + }, + { + "epoch": 0.65, + "learning_rate": 5.369909026990414e-06, + "loss": 0.6217, + "step": 18857 + }, + { + "epoch": 0.65, + "learning_rate": 5.3689439353042985e-06, + "loss": 0.6056, + "step": 18858 + }, + { + "epoch": 0.65, + "learning_rate": 5.367978898525203e-06, + "loss": 0.6598, + "step": 18859 + }, + { + "epoch": 0.65, + "learning_rate": 5.367013916664582e-06, + "loss": 0.639, + "step": 18860 + }, + { + "epoch": 0.65, + "learning_rate": 5.366048989733875e-06, + "loss": 0.6622, + "step": 18861 + }, + { + "epoch": 0.65, + "learning_rate": 5.365084117744515e-06, + "loss": 0.655, + "step": 18862 + }, + { + "epoch": 0.65, + "learning_rate": 5.364119300707947e-06, + "loss": 0.6028, + "step": 18863 + }, + { + "epoch": 0.65, + "learning_rate": 5.363154538635613e-06, + "loss": 0.6266, + "step": 18864 + }, + { + "epoch": 0.65, + "learning_rate": 5.362189831538938e-06, + "loss": 0.6886, + "step": 18865 + }, + { + "epoch": 0.65, + "learning_rate": 5.361225179429375e-06, + "loss": 0.6604, + "step": 18866 + }, + { + "epoch": 0.65, + "learning_rate": 5.3602605823183596e-06, + "loss": 0.6141, + "step": 18867 + }, + { + "epoch": 0.65, + "learning_rate": 5.359296040217319e-06, + "loss": 0.6597, + "step": 18868 + }, + { + "epoch": 0.65, + "learning_rate": 5.358331553137696e-06, + "loss": 0.6426, + "step": 18869 + }, + { + "epoch": 0.65, + "learning_rate": 5.3573671210909275e-06, + "loss": 0.6203, + "step": 18870 + }, + { + "epoch": 0.65, + "learning_rate": 5.356402744088436e-06, + "loss": 0.6152, + "step": 18871 + }, + { + "epoch": 0.65, + "learning_rate": 5.355438422141669e-06, + "loss": 0.5862, + "step": 18872 + }, + { + "epoch": 0.65, + "learning_rate": 5.354474155262059e-06, + "loss": 0.6558, + "step": 18873 + }, + { + "epoch": 0.65, + "learning_rate": 5.3535099434610305e-06, + "loss": 0.6316, + "step": 18874 + }, + { + "epoch": 0.65, + "learning_rate": 5.352545786750019e-06, + "loss": 0.5731, + "step": 18875 + }, + { + "epoch": 0.65, + "learning_rate": 5.35158168514046e-06, + "loss": 0.6332, + "step": 18876 + }, + { + "epoch": 0.65, + "learning_rate": 5.350617638643777e-06, + "loss": 0.6569, + "step": 18877 + }, + { + "epoch": 0.65, + "learning_rate": 5.3496536472713986e-06, + "loss": 0.6348, + "step": 18878 + }, + { + "epoch": 0.65, + "learning_rate": 5.348689711034768e-06, + "loss": 0.6197, + "step": 18879 + }, + { + "epoch": 0.65, + "learning_rate": 5.347725829945301e-06, + "loss": 0.6331, + "step": 18880 + }, + { + "epoch": 0.65, + "learning_rate": 5.3467620040144275e-06, + "loss": 0.6237, + "step": 18881 + }, + { + "epoch": 0.65, + "learning_rate": 5.3457982332535826e-06, + "loss": 0.6315, + "step": 18882 + }, + { + "epoch": 0.65, + "learning_rate": 5.344834517674182e-06, + "loss": 0.6083, + "step": 18883 + }, + { + "epoch": 0.65, + "learning_rate": 5.3438708572876586e-06, + "loss": 0.5961, + "step": 18884 + }, + { + "epoch": 0.65, + "learning_rate": 5.342907252105436e-06, + "loss": 0.6464, + "step": 18885 + }, + { + "epoch": 0.65, + "learning_rate": 5.341943702138939e-06, + "loss": 0.6502, + "step": 18886 + }, + { + "epoch": 0.65, + "learning_rate": 5.340980207399594e-06, + "loss": 0.5785, + "step": 18887 + }, + { + "epoch": 0.65, + "learning_rate": 5.34001676789882e-06, + "loss": 0.5916, + "step": 18888 + }, + { + "epoch": 0.65, + "learning_rate": 5.3390533836480414e-06, + "loss": 0.6119, + "step": 18889 + }, + { + "epoch": 0.65, + "learning_rate": 5.338090054658682e-06, + "loss": 0.6071, + "step": 18890 + }, + { + "epoch": 0.65, + "learning_rate": 5.337126780942161e-06, + "loss": 0.6453, + "step": 18891 + }, + { + "epoch": 0.65, + "learning_rate": 5.3361635625099016e-06, + "loss": 0.6277, + "step": 18892 + }, + { + "epoch": 0.65, + "learning_rate": 5.3352003993733285e-06, + "loss": 0.6931, + "step": 18893 + }, + { + "epoch": 0.65, + "learning_rate": 5.334237291543849e-06, + "loss": 0.6514, + "step": 18894 + }, + { + "epoch": 0.65, + "learning_rate": 5.33327423903289e-06, + "loss": 0.6294, + "step": 18895 + }, + { + "epoch": 0.65, + "learning_rate": 5.332311241851869e-06, + "loss": 0.5796, + "step": 18896 + }, + { + "epoch": 0.65, + "learning_rate": 5.3313483000122e-06, + "loss": 0.6742, + "step": 18897 + }, + { + "epoch": 0.65, + "learning_rate": 5.3303854135253054e-06, + "loss": 0.5695, + "step": 18898 + }, + { + "epoch": 0.65, + "learning_rate": 5.329422582402602e-06, + "loss": 0.5951, + "step": 18899 + }, + { + "epoch": 0.65, + "learning_rate": 5.3284598066554985e-06, + "loss": 0.6495, + "step": 18900 + }, + { + "epoch": 0.65, + "learning_rate": 5.327497086295412e-06, + "loss": 0.6013, + "step": 18901 + }, + { + "epoch": 0.65, + "learning_rate": 5.32653442133376e-06, + "loss": 0.5737, + "step": 18902 + }, + { + "epoch": 0.65, + "learning_rate": 5.325571811781954e-06, + "loss": 0.5779, + "step": 18903 + }, + { + "epoch": 0.65, + "learning_rate": 5.324609257651407e-06, + "loss": 0.6271, + "step": 18904 + }, + { + "epoch": 0.66, + "learning_rate": 5.323646758953537e-06, + "loss": 0.5923, + "step": 18905 + }, + { + "epoch": 0.66, + "learning_rate": 5.322684315699744e-06, + "loss": 0.6211, + "step": 18906 + }, + { + "epoch": 0.66, + "learning_rate": 5.321721927901448e-06, + "loss": 0.6183, + "step": 18907 + }, + { + "epoch": 0.66, + "learning_rate": 5.320759595570055e-06, + "loss": 0.6006, + "step": 18908 + }, + { + "epoch": 0.66, + "learning_rate": 5.319797318716976e-06, + "loss": 0.6158, + "step": 18909 + }, + { + "epoch": 0.66, + "learning_rate": 5.3188350973536205e-06, + "loss": 0.6429, + "step": 18910 + }, + { + "epoch": 0.66, + "learning_rate": 5.317872931491402e-06, + "loss": 0.6683, + "step": 18911 + }, + { + "epoch": 0.66, + "learning_rate": 5.316910821141716e-06, + "loss": 0.5719, + "step": 18912 + }, + { + "epoch": 0.66, + "learning_rate": 5.315948766315978e-06, + "loss": 0.643, + "step": 18913 + }, + { + "epoch": 0.66, + "learning_rate": 5.314986767025593e-06, + "loss": 0.6013, + "step": 18914 + }, + { + "epoch": 0.66, + "learning_rate": 5.3140248232819665e-06, + "loss": 0.6021, + "step": 18915 + }, + { + "epoch": 0.66, + "learning_rate": 5.313062935096502e-06, + "loss": 0.5982, + "step": 18916 + }, + { + "epoch": 0.66, + "learning_rate": 5.312101102480611e-06, + "loss": 0.6555, + "step": 18917 + }, + { + "epoch": 0.66, + "learning_rate": 5.311139325445687e-06, + "loss": 0.6555, + "step": 18918 + }, + { + "epoch": 0.66, + "learning_rate": 5.310177604003138e-06, + "loss": 0.6999, + "step": 18919 + }, + { + "epoch": 0.66, + "learning_rate": 5.309215938164367e-06, + "loss": 0.6087, + "step": 18920 + }, + { + "epoch": 0.66, + "learning_rate": 5.308254327940774e-06, + "loss": 0.6263, + "step": 18921 + }, + { + "epoch": 0.66, + "learning_rate": 5.307292773343761e-06, + "loss": 0.6671, + "step": 18922 + }, + { + "epoch": 0.66, + "learning_rate": 5.306331274384733e-06, + "loss": 0.6593, + "step": 18923 + }, + { + "epoch": 0.66, + "learning_rate": 5.30536983107508e-06, + "loss": 0.6298, + "step": 18924 + }, + { + "epoch": 0.66, + "learning_rate": 5.304408443426208e-06, + "loss": 0.633, + "step": 18925 + }, + { + "epoch": 0.66, + "learning_rate": 5.303447111449512e-06, + "loss": 0.5582, + "step": 18926 + }, + { + "epoch": 0.66, + "learning_rate": 5.302485835156392e-06, + "loss": 0.6083, + "step": 18927 + }, + { + "epoch": 0.66, + "learning_rate": 5.301524614558247e-06, + "loss": 0.616, + "step": 18928 + }, + { + "epoch": 0.66, + "learning_rate": 5.300563449666474e-06, + "loss": 0.6465, + "step": 18929 + }, + { + "epoch": 0.66, + "learning_rate": 5.299602340492461e-06, + "loss": 0.5625, + "step": 18930 + }, + { + "epoch": 0.66, + "learning_rate": 5.29864128704761e-06, + "loss": 0.6688, + "step": 18931 + }, + { + "epoch": 0.66, + "learning_rate": 5.297680289343312e-06, + "loss": 0.6615, + "step": 18932 + }, + { + "epoch": 0.66, + "learning_rate": 5.296719347390964e-06, + "loss": 0.6228, + "step": 18933 + }, + { + "epoch": 0.66, + "learning_rate": 5.295758461201957e-06, + "loss": 0.6261, + "step": 18934 + }, + { + "epoch": 0.66, + "learning_rate": 5.294797630787689e-06, + "loss": 0.6084, + "step": 18935 + }, + { + "epoch": 0.66, + "learning_rate": 5.293836856159544e-06, + "loss": 0.6616, + "step": 18936 + }, + { + "epoch": 0.66, + "learning_rate": 5.292876137328915e-06, + "loss": 0.6259, + "step": 18937 + }, + { + "epoch": 0.66, + "learning_rate": 5.291915474307194e-06, + "loss": 0.7038, + "step": 18938 + }, + { + "epoch": 0.66, + "learning_rate": 5.290954867105771e-06, + "loss": 0.618, + "step": 18939 + }, + { + "epoch": 0.66, + "learning_rate": 5.289994315736035e-06, + "loss": 0.7054, + "step": 18940 + }, + { + "epoch": 0.66, + "learning_rate": 5.28903382020938e-06, + "loss": 0.6369, + "step": 18941 + }, + { + "epoch": 0.66, + "learning_rate": 5.288073380537182e-06, + "loss": 0.6876, + "step": 18942 + }, + { + "epoch": 0.66, + "learning_rate": 5.287112996730837e-06, + "loss": 0.6247, + "step": 18943 + }, + { + "epoch": 0.66, + "learning_rate": 5.286152668801727e-06, + "loss": 0.6239, + "step": 18944 + }, + { + "epoch": 0.66, + "learning_rate": 5.285192396761242e-06, + "loss": 0.6843, + "step": 18945 + }, + { + "epoch": 0.66, + "learning_rate": 5.284232180620769e-06, + "loss": 0.6264, + "step": 18946 + }, + { + "epoch": 0.66, + "learning_rate": 5.283272020391685e-06, + "loss": 0.6569, + "step": 18947 + }, + { + "epoch": 0.66, + "learning_rate": 5.2823119160853765e-06, + "loss": 0.5611, + "step": 18948 + }, + { + "epoch": 0.66, + "learning_rate": 5.281351867713229e-06, + "loss": 0.6034, + "step": 18949 + }, + { + "epoch": 0.66, + "learning_rate": 5.2803918752866255e-06, + "loss": 0.6552, + "step": 18950 + }, + { + "epoch": 0.66, + "learning_rate": 5.279431938816946e-06, + "loss": 0.5946, + "step": 18951 + }, + { + "epoch": 0.66, + "learning_rate": 5.278472058315576e-06, + "loss": 0.6188, + "step": 18952 + }, + { + "epoch": 0.66, + "learning_rate": 5.277512233793888e-06, + "loss": 0.6244, + "step": 18953 + }, + { + "epoch": 0.66, + "learning_rate": 5.2765524652632674e-06, + "loss": 0.6397, + "step": 18954 + }, + { + "epoch": 0.66, + "learning_rate": 5.2755927527350915e-06, + "loss": 0.6675, + "step": 18955 + }, + { + "epoch": 0.66, + "learning_rate": 5.27463309622074e-06, + "loss": 0.6575, + "step": 18956 + }, + { + "epoch": 0.66, + "learning_rate": 5.273673495731592e-06, + "loss": 0.6899, + "step": 18957 + }, + { + "epoch": 0.66, + "learning_rate": 5.272713951279027e-06, + "loss": 0.6638, + "step": 18958 + }, + { + "epoch": 0.66, + "learning_rate": 5.2717544628744136e-06, + "loss": 0.649, + "step": 18959 + }, + { + "epoch": 0.66, + "learning_rate": 5.2707950305291326e-06, + "loss": 0.6651, + "step": 18960 + }, + { + "epoch": 0.66, + "learning_rate": 5.2698356542545595e-06, + "loss": 0.6067, + "step": 18961 + }, + { + "epoch": 0.66, + "learning_rate": 5.268876334062068e-06, + "loss": 0.6348, + "step": 18962 + }, + { + "epoch": 0.66, + "learning_rate": 5.267917069963032e-06, + "loss": 0.6343, + "step": 18963 + }, + { + "epoch": 0.66, + "learning_rate": 5.266957861968829e-06, + "loss": 0.6142, + "step": 18964 + }, + { + "epoch": 0.66, + "learning_rate": 5.265998710090825e-06, + "loss": 0.5991, + "step": 18965 + }, + { + "epoch": 0.66, + "learning_rate": 5.265039614340395e-06, + "loss": 0.5973, + "step": 18966 + }, + { + "epoch": 0.66, + "learning_rate": 5.264080574728909e-06, + "loss": 0.6488, + "step": 18967 + }, + { + "epoch": 0.66, + "learning_rate": 5.263121591267739e-06, + "loss": 0.6177, + "step": 18968 + }, + { + "epoch": 0.66, + "learning_rate": 5.262162663968255e-06, + "loss": 0.6192, + "step": 18969 + }, + { + "epoch": 0.66, + "learning_rate": 5.26120379284183e-06, + "loss": 0.6106, + "step": 18970 + }, + { + "epoch": 0.66, + "learning_rate": 5.260244977899824e-06, + "loss": 0.6634, + "step": 18971 + }, + { + "epoch": 0.66, + "learning_rate": 5.259286219153612e-06, + "loss": 0.64, + "step": 18972 + }, + { + "epoch": 0.66, + "learning_rate": 5.258327516614557e-06, + "loss": 0.633, + "step": 18973 + }, + { + "epoch": 0.66, + "learning_rate": 5.257368870294027e-06, + "loss": 0.6076, + "step": 18974 + }, + { + "epoch": 0.66, + "learning_rate": 5.25641028020339e-06, + "loss": 0.5662, + "step": 18975 + }, + { + "epoch": 0.66, + "learning_rate": 5.255451746354012e-06, + "loss": 0.6377, + "step": 18976 + }, + { + "epoch": 0.66, + "learning_rate": 5.2544932687572525e-06, + "loss": 0.6791, + "step": 18977 + }, + { + "epoch": 0.66, + "learning_rate": 5.253534847424479e-06, + "loss": 0.5663, + "step": 18978 + }, + { + "epoch": 0.66, + "learning_rate": 5.252576482367054e-06, + "loss": 0.6217, + "step": 18979 + }, + { + "epoch": 0.66, + "learning_rate": 5.25161817359634e-06, + "loss": 0.6252, + "step": 18980 + }, + { + "epoch": 0.66, + "learning_rate": 5.250659921123698e-06, + "loss": 0.6355, + "step": 18981 + }, + { + "epoch": 0.66, + "learning_rate": 5.249701724960496e-06, + "loss": 0.6298, + "step": 18982 + }, + { + "epoch": 0.66, + "learning_rate": 5.248743585118086e-06, + "loss": 0.6755, + "step": 18983 + }, + { + "epoch": 0.66, + "learning_rate": 5.24778550160783e-06, + "loss": 0.6335, + "step": 18984 + }, + { + "epoch": 0.66, + "learning_rate": 5.246827474441087e-06, + "loss": 0.6033, + "step": 18985 + }, + { + "epoch": 0.66, + "learning_rate": 5.245869503629219e-06, + "loss": 0.6952, + "step": 18986 + }, + { + "epoch": 0.66, + "learning_rate": 5.2449115891835825e-06, + "loss": 0.6496, + "step": 18987 + }, + { + "epoch": 0.66, + "learning_rate": 5.243953731115536e-06, + "loss": 0.6879, + "step": 18988 + }, + { + "epoch": 0.66, + "learning_rate": 5.242995929436433e-06, + "loss": 0.6359, + "step": 18989 + }, + { + "epoch": 0.66, + "learning_rate": 5.24203818415763e-06, + "loss": 0.6451, + "step": 18990 + }, + { + "epoch": 0.66, + "learning_rate": 5.241080495290483e-06, + "loss": 0.5954, + "step": 18991 + }, + { + "epoch": 0.66, + "learning_rate": 5.240122862846346e-06, + "loss": 0.6397, + "step": 18992 + }, + { + "epoch": 0.66, + "learning_rate": 5.239165286836576e-06, + "loss": 0.632, + "step": 18993 + }, + { + "epoch": 0.66, + "learning_rate": 5.238207767272526e-06, + "loss": 0.6314, + "step": 18994 + }, + { + "epoch": 0.66, + "learning_rate": 5.237250304165543e-06, + "loss": 0.5481, + "step": 18995 + }, + { + "epoch": 0.66, + "learning_rate": 5.236292897526983e-06, + "loss": 0.6524, + "step": 18996 + }, + { + "epoch": 0.66, + "learning_rate": 5.235335547368197e-06, + "loss": 0.5878, + "step": 18997 + }, + { + "epoch": 0.66, + "learning_rate": 5.234378253700535e-06, + "loss": 0.6727, + "step": 18998 + }, + { + "epoch": 0.66, + "learning_rate": 5.2334210165353474e-06, + "loss": 0.5854, + "step": 18999 + }, + { + "epoch": 0.66, + "learning_rate": 5.232463835883988e-06, + "loss": 0.6339, + "step": 19000 + }, + { + "epoch": 0.66, + "learning_rate": 5.231506711757795e-06, + "loss": 0.6173, + "step": 19001 + }, + { + "epoch": 0.66, + "learning_rate": 5.2305496441681236e-06, + "loss": 0.5807, + "step": 19002 + }, + { + "epoch": 0.66, + "learning_rate": 5.2295926331263194e-06, + "loss": 0.6281, + "step": 19003 + }, + { + "epoch": 0.66, + "learning_rate": 5.228635678643728e-06, + "loss": 0.6259, + "step": 19004 + }, + { + "epoch": 0.66, + "learning_rate": 5.227678780731697e-06, + "loss": 0.6547, + "step": 19005 + }, + { + "epoch": 0.66, + "learning_rate": 5.226721939401575e-06, + "loss": 0.6203, + "step": 19006 + }, + { + "epoch": 0.66, + "learning_rate": 5.2257651546647e-06, + "loss": 0.6589, + "step": 19007 + }, + { + "epoch": 0.66, + "learning_rate": 5.224808426532417e-06, + "loss": 0.6365, + "step": 19008 + }, + { + "epoch": 0.66, + "learning_rate": 5.223851755016071e-06, + "loss": 0.6354, + "step": 19009 + }, + { + "epoch": 0.66, + "learning_rate": 5.222895140127007e-06, + "loss": 0.5961, + "step": 19010 + }, + { + "epoch": 0.66, + "learning_rate": 5.221938581876565e-06, + "loss": 0.5876, + "step": 19011 + }, + { + "epoch": 0.66, + "learning_rate": 5.220982080276083e-06, + "loss": 0.6239, + "step": 19012 + }, + { + "epoch": 0.66, + "learning_rate": 5.220025635336903e-06, + "loss": 0.6839, + "step": 19013 + }, + { + "epoch": 0.66, + "learning_rate": 5.219069247070365e-06, + "loss": 0.6519, + "step": 19014 + }, + { + "epoch": 0.66, + "learning_rate": 5.218112915487809e-06, + "loss": 0.6076, + "step": 19015 + }, + { + "epoch": 0.66, + "learning_rate": 5.217156640600576e-06, + "loss": 0.6254, + "step": 19016 + }, + { + "epoch": 0.66, + "learning_rate": 5.216200422420003e-06, + "loss": 0.5866, + "step": 19017 + }, + { + "epoch": 0.66, + "learning_rate": 5.215244260957423e-06, + "loss": 0.6334, + "step": 19018 + }, + { + "epoch": 0.66, + "learning_rate": 5.214288156224174e-06, + "loss": 0.6251, + "step": 19019 + }, + { + "epoch": 0.66, + "learning_rate": 5.213332108231594e-06, + "loss": 0.6264, + "step": 19020 + }, + { + "epoch": 0.66, + "learning_rate": 5.2123761169910155e-06, + "loss": 0.641, + "step": 19021 + }, + { + "epoch": 0.66, + "learning_rate": 5.211420182513776e-06, + "loss": 0.6543, + "step": 19022 + }, + { + "epoch": 0.66, + "learning_rate": 5.2104643048112115e-06, + "loss": 0.6171, + "step": 19023 + }, + { + "epoch": 0.66, + "learning_rate": 5.209508483894647e-06, + "loss": 0.6282, + "step": 19024 + }, + { + "epoch": 0.66, + "learning_rate": 5.208552719775419e-06, + "loss": 0.6074, + "step": 19025 + }, + { + "epoch": 0.66, + "learning_rate": 5.20759701246486e-06, + "loss": 0.6662, + "step": 19026 + }, + { + "epoch": 0.66, + "learning_rate": 5.2066413619743e-06, + "loss": 0.6302, + "step": 19027 + }, + { + "epoch": 0.66, + "learning_rate": 5.205685768315072e-06, + "loss": 0.6172, + "step": 19028 + }, + { + "epoch": 0.66, + "learning_rate": 5.204730231498507e-06, + "loss": 0.6472, + "step": 19029 + }, + { + "epoch": 0.66, + "learning_rate": 5.203774751535928e-06, + "loss": 0.6288, + "step": 19030 + }, + { + "epoch": 0.66, + "learning_rate": 5.202819328438667e-06, + "loss": 0.5946, + "step": 19031 + }, + { + "epoch": 0.66, + "learning_rate": 5.20186396221805e-06, + "loss": 0.672, + "step": 19032 + }, + { + "epoch": 0.66, + "learning_rate": 5.200908652885406e-06, + "loss": 0.6405, + "step": 19033 + }, + { + "epoch": 0.66, + "learning_rate": 5.19995340045206e-06, + "loss": 0.6297, + "step": 19034 + }, + { + "epoch": 0.66, + "learning_rate": 5.198998204929343e-06, + "loss": 0.6118, + "step": 19035 + }, + { + "epoch": 0.66, + "learning_rate": 5.198043066328572e-06, + "loss": 0.6573, + "step": 19036 + }, + { + "epoch": 0.66, + "learning_rate": 5.197087984661075e-06, + "loss": 0.6171, + "step": 19037 + }, + { + "epoch": 0.66, + "learning_rate": 5.196132959938175e-06, + "loss": 0.6302, + "step": 19038 + }, + { + "epoch": 0.66, + "learning_rate": 5.195177992171197e-06, + "loss": 0.6445, + "step": 19039 + }, + { + "epoch": 0.66, + "learning_rate": 5.19422308137146e-06, + "loss": 0.6094, + "step": 19040 + }, + { + "epoch": 0.66, + "learning_rate": 5.193268227550292e-06, + "loss": 0.6063, + "step": 19041 + }, + { + "epoch": 0.66, + "learning_rate": 5.192313430719007e-06, + "loss": 0.6079, + "step": 19042 + }, + { + "epoch": 0.66, + "learning_rate": 5.191358690888928e-06, + "loss": 0.6543, + "step": 19043 + }, + { + "epoch": 0.66, + "learning_rate": 5.190404008071375e-06, + "loss": 0.5577, + "step": 19044 + }, + { + "epoch": 0.66, + "learning_rate": 5.189449382277665e-06, + "loss": 0.6546, + "step": 19045 + }, + { + "epoch": 0.66, + "learning_rate": 5.188494813519118e-06, + "loss": 0.6216, + "step": 19046 + }, + { + "epoch": 0.66, + "learning_rate": 5.187540301807057e-06, + "loss": 0.6464, + "step": 19047 + }, + { + "epoch": 0.66, + "learning_rate": 5.18658584715279e-06, + "loss": 0.6533, + "step": 19048 + }, + { + "epoch": 0.66, + "learning_rate": 5.185631449567634e-06, + "loss": 0.613, + "step": 19049 + }, + { + "epoch": 0.66, + "learning_rate": 5.18467710906291e-06, + "loss": 0.6274, + "step": 19050 + }, + { + "epoch": 0.66, + "learning_rate": 5.1837228256499285e-06, + "loss": 0.6461, + "step": 19051 + }, + { + "epoch": 0.66, + "learning_rate": 5.1827685993400065e-06, + "loss": 0.6888, + "step": 19052 + }, + { + "epoch": 0.66, + "learning_rate": 5.181814430144461e-06, + "loss": 0.6296, + "step": 19053 + }, + { + "epoch": 0.66, + "learning_rate": 5.1808603180745966e-06, + "loss": 0.6505, + "step": 19054 + }, + { + "epoch": 0.66, + "learning_rate": 5.179906263141728e-06, + "loss": 0.5986, + "step": 19055 + }, + { + "epoch": 0.66, + "learning_rate": 5.178952265357169e-06, + "loss": 0.6359, + "step": 19056 + }, + { + "epoch": 0.66, + "learning_rate": 5.17799832473223e-06, + "loss": 0.6801, + "step": 19057 + }, + { + "epoch": 0.66, + "learning_rate": 5.1770444412782185e-06, + "loss": 0.6945, + "step": 19058 + }, + { + "epoch": 0.66, + "learning_rate": 5.1760906150064525e-06, + "loss": 0.6224, + "step": 19059 + }, + { + "epoch": 0.66, + "learning_rate": 5.17513684592823e-06, + "loss": 0.6724, + "step": 19060 + }, + { + "epoch": 0.66, + "learning_rate": 5.1741831340548636e-06, + "loss": 0.546, + "step": 19061 + }, + { + "epoch": 0.66, + "learning_rate": 5.173229479397661e-06, + "loss": 0.6167, + "step": 19062 + }, + { + "epoch": 0.66, + "learning_rate": 5.172275881967928e-06, + "loss": 0.6503, + "step": 19063 + }, + { + "epoch": 0.66, + "learning_rate": 5.171322341776972e-06, + "loss": 0.6213, + "step": 19064 + }, + { + "epoch": 0.66, + "learning_rate": 5.170368858836101e-06, + "loss": 0.6283, + "step": 19065 + }, + { + "epoch": 0.66, + "learning_rate": 5.169415433156615e-06, + "loss": 0.6057, + "step": 19066 + }, + { + "epoch": 0.66, + "learning_rate": 5.1684620647498175e-06, + "loss": 0.6094, + "step": 19067 + }, + { + "epoch": 0.66, + "learning_rate": 5.1675087536270195e-06, + "loss": 0.6624, + "step": 19068 + }, + { + "epoch": 0.66, + "learning_rate": 5.16655549979951e-06, + "loss": 0.6058, + "step": 19069 + }, + { + "epoch": 0.66, + "learning_rate": 5.1656023032786075e-06, + "loss": 0.6245, + "step": 19070 + }, + { + "epoch": 0.66, + "learning_rate": 5.164649164075602e-06, + "loss": 0.6774, + "step": 19071 + }, + { + "epoch": 0.66, + "learning_rate": 5.163696082201796e-06, + "loss": 0.608, + "step": 19072 + }, + { + "epoch": 0.66, + "learning_rate": 5.162743057668496e-06, + "loss": 0.6156, + "step": 19073 + }, + { + "epoch": 0.66, + "learning_rate": 5.161790090486991e-06, + "loss": 0.6478, + "step": 19074 + }, + { + "epoch": 0.66, + "learning_rate": 5.1608371806685804e-06, + "loss": 0.6416, + "step": 19075 + }, + { + "epoch": 0.66, + "learning_rate": 5.159884328224576e-06, + "loss": 0.6423, + "step": 19076 + }, + { + "epoch": 0.66, + "learning_rate": 5.158931533166262e-06, + "loss": 0.6726, + "step": 19077 + }, + { + "epoch": 0.66, + "learning_rate": 5.157978795504939e-06, + "loss": 0.6501, + "step": 19078 + }, + { + "epoch": 0.66, + "learning_rate": 5.157026115251904e-06, + "loss": 0.6029, + "step": 19079 + }, + { + "epoch": 0.66, + "learning_rate": 5.156073492418448e-06, + "loss": 0.6264, + "step": 19080 + }, + { + "epoch": 0.66, + "learning_rate": 5.155120927015867e-06, + "loss": 0.615, + "step": 19081 + }, + { + "epoch": 0.66, + "learning_rate": 5.154168419055461e-06, + "loss": 0.6187, + "step": 19082 + }, + { + "epoch": 0.66, + "learning_rate": 5.153215968548515e-06, + "loss": 0.6377, + "step": 19083 + }, + { + "epoch": 0.66, + "learning_rate": 5.1522635755063244e-06, + "loss": 0.5765, + "step": 19084 + }, + { + "epoch": 0.66, + "learning_rate": 5.151311239940186e-06, + "loss": 0.6029, + "step": 19085 + }, + { + "epoch": 0.66, + "learning_rate": 5.150358961861384e-06, + "loss": 0.6211, + "step": 19086 + }, + { + "epoch": 0.66, + "learning_rate": 5.1494067412812064e-06, + "loss": 0.6621, + "step": 19087 + }, + { + "epoch": 0.66, + "learning_rate": 5.148454578210955e-06, + "loss": 0.6454, + "step": 19088 + }, + { + "epoch": 0.66, + "learning_rate": 5.14750247266191e-06, + "loss": 0.637, + "step": 19089 + }, + { + "epoch": 0.66, + "learning_rate": 5.146550424645359e-06, + "loss": 0.5911, + "step": 19090 + }, + { + "epoch": 0.66, + "learning_rate": 5.145598434172597e-06, + "loss": 0.5839, + "step": 19091 + }, + { + "epoch": 0.66, + "learning_rate": 5.144646501254904e-06, + "loss": 0.6837, + "step": 19092 + }, + { + "epoch": 0.66, + "learning_rate": 5.143694625903564e-06, + "loss": 0.6114, + "step": 19093 + }, + { + "epoch": 0.66, + "learning_rate": 5.142742808129875e-06, + "loss": 0.613, + "step": 19094 + }, + { + "epoch": 0.66, + "learning_rate": 5.141791047945111e-06, + "loss": 0.6116, + "step": 19095 + }, + { + "epoch": 0.66, + "learning_rate": 5.140839345360557e-06, + "loss": 0.6257, + "step": 19096 + }, + { + "epoch": 0.66, + "learning_rate": 5.139887700387507e-06, + "loss": 0.5938, + "step": 19097 + }, + { + "epoch": 0.66, + "learning_rate": 5.138936113037231e-06, + "loss": 0.6904, + "step": 19098 + }, + { + "epoch": 0.66, + "learning_rate": 5.137984583321014e-06, + "loss": 0.6233, + "step": 19099 + }, + { + "epoch": 0.66, + "learning_rate": 5.137033111250147e-06, + "loss": 0.6037, + "step": 19100 + }, + { + "epoch": 0.66, + "learning_rate": 5.1360816968359e-06, + "loss": 0.6224, + "step": 19101 + }, + { + "epoch": 0.66, + "learning_rate": 5.135130340089558e-06, + "loss": 0.6169, + "step": 19102 + }, + { + "epoch": 0.66, + "learning_rate": 5.134179041022403e-06, + "loss": 0.6205, + "step": 19103 + }, + { + "epoch": 0.66, + "learning_rate": 5.133227799645707e-06, + "loss": 0.6213, + "step": 19104 + }, + { + "epoch": 0.66, + "learning_rate": 5.132276615970748e-06, + "loss": 0.5931, + "step": 19105 + }, + { + "epoch": 0.66, + "learning_rate": 5.131325490008816e-06, + "loss": 0.621, + "step": 19106 + }, + { + "epoch": 0.66, + "learning_rate": 5.130374421771175e-06, + "loss": 0.6089, + "step": 19107 + }, + { + "epoch": 0.66, + "learning_rate": 5.129423411269106e-06, + "loss": 0.711, + "step": 19108 + }, + { + "epoch": 0.66, + "learning_rate": 5.128472458513886e-06, + "loss": 0.6542, + "step": 19109 + }, + { + "epoch": 0.66, + "learning_rate": 5.127521563516784e-06, + "loss": 0.6422, + "step": 19110 + }, + { + "epoch": 0.66, + "learning_rate": 5.1265707262890755e-06, + "loss": 0.6146, + "step": 19111 + }, + { + "epoch": 0.66, + "learning_rate": 5.125619946842042e-06, + "loss": 0.6424, + "step": 19112 + }, + { + "epoch": 0.66, + "learning_rate": 5.124669225186947e-06, + "loss": 0.6761, + "step": 19113 + }, + { + "epoch": 0.66, + "learning_rate": 5.123718561335065e-06, + "loss": 0.5805, + "step": 19114 + }, + { + "epoch": 0.66, + "learning_rate": 5.122767955297671e-06, + "loss": 0.61, + "step": 19115 + }, + { + "epoch": 0.66, + "learning_rate": 5.121817407086031e-06, + "loss": 0.6069, + "step": 19116 + }, + { + "epoch": 0.66, + "learning_rate": 5.120866916711412e-06, + "loss": 0.64, + "step": 19117 + }, + { + "epoch": 0.66, + "learning_rate": 5.119916484185095e-06, + "loss": 0.6148, + "step": 19118 + }, + { + "epoch": 0.66, + "learning_rate": 5.118966109518339e-06, + "loss": 0.6542, + "step": 19119 + }, + { + "epoch": 0.66, + "learning_rate": 5.118015792722413e-06, + "loss": 0.6703, + "step": 19120 + }, + { + "epoch": 0.66, + "learning_rate": 5.117065533808589e-06, + "loss": 0.6556, + "step": 19121 + }, + { + "epoch": 0.66, + "learning_rate": 5.116115332788127e-06, + "loss": 0.5817, + "step": 19122 + }, + { + "epoch": 0.66, + "learning_rate": 5.115165189672291e-06, + "loss": 0.5933, + "step": 19123 + }, + { + "epoch": 0.66, + "learning_rate": 5.11421510447236e-06, + "loss": 0.6283, + "step": 19124 + }, + { + "epoch": 0.66, + "learning_rate": 5.113265077199585e-06, + "loss": 0.6525, + "step": 19125 + }, + { + "epoch": 0.66, + "learning_rate": 5.112315107865235e-06, + "loss": 0.6165, + "step": 19126 + }, + { + "epoch": 0.66, + "learning_rate": 5.111365196480575e-06, + "loss": 0.6092, + "step": 19127 + }, + { + "epoch": 0.66, + "learning_rate": 5.110415343056862e-06, + "loss": 0.5979, + "step": 19128 + }, + { + "epoch": 0.66, + "learning_rate": 5.109465547605355e-06, + "loss": 0.6677, + "step": 19129 + }, + { + "epoch": 0.66, + "learning_rate": 5.10851581013733e-06, + "loss": 0.6472, + "step": 19130 + }, + { + "epoch": 0.66, + "learning_rate": 5.107566130664034e-06, + "loss": 0.6982, + "step": 19131 + }, + { + "epoch": 0.66, + "learning_rate": 5.106616509196734e-06, + "loss": 0.6356, + "step": 19132 + }, + { + "epoch": 0.66, + "learning_rate": 5.10566694574668e-06, + "loss": 0.6501, + "step": 19133 + }, + { + "epoch": 0.66, + "learning_rate": 5.104717440325138e-06, + "loss": 0.5985, + "step": 19134 + }, + { + "epoch": 0.66, + "learning_rate": 5.10376799294336e-06, + "loss": 0.6496, + "step": 19135 + }, + { + "epoch": 0.66, + "learning_rate": 5.102818603612609e-06, + "loss": 0.6243, + "step": 19136 + }, + { + "epoch": 0.66, + "learning_rate": 5.101869272344137e-06, + "loss": 0.6067, + "step": 19137 + }, + { + "epoch": 0.66, + "learning_rate": 5.100919999149207e-06, + "loss": 0.6925, + "step": 19138 + }, + { + "epoch": 0.66, + "learning_rate": 5.099970784039064e-06, + "loss": 0.6578, + "step": 19139 + }, + { + "epoch": 0.66, + "learning_rate": 5.0990216270249625e-06, + "loss": 0.6039, + "step": 19140 + }, + { + "epoch": 0.66, + "learning_rate": 5.098072528118162e-06, + "loss": 0.6455, + "step": 19141 + }, + { + "epoch": 0.66, + "learning_rate": 5.097123487329912e-06, + "loss": 0.6737, + "step": 19142 + }, + { + "epoch": 0.66, + "learning_rate": 5.096174504671465e-06, + "loss": 0.5761, + "step": 19143 + }, + { + "epoch": 0.66, + "learning_rate": 5.095225580154077e-06, + "loss": 0.5588, + "step": 19144 + }, + { + "epoch": 0.66, + "learning_rate": 5.09427671378899e-06, + "loss": 0.6346, + "step": 19145 + }, + { + "epoch": 0.66, + "learning_rate": 5.093327905587459e-06, + "loss": 0.6066, + "step": 19146 + }, + { + "epoch": 0.66, + "learning_rate": 5.092379155560731e-06, + "loss": 0.6498, + "step": 19147 + }, + { + "epoch": 0.66, + "learning_rate": 5.091430463720059e-06, + "loss": 0.6168, + "step": 19148 + }, + { + "epoch": 0.66, + "learning_rate": 5.0904818300766854e-06, + "loss": 0.6242, + "step": 19149 + }, + { + "epoch": 0.66, + "learning_rate": 5.089533254641865e-06, + "loss": 0.6036, + "step": 19150 + }, + { + "epoch": 0.66, + "learning_rate": 5.088584737426837e-06, + "loss": 0.6843, + "step": 19151 + }, + { + "epoch": 0.66, + "learning_rate": 5.087636278442849e-06, + "loss": 0.6361, + "step": 19152 + }, + { + "epoch": 0.66, + "learning_rate": 5.0866878777011475e-06, + "loss": 0.6024, + "step": 19153 + }, + { + "epoch": 0.66, + "learning_rate": 5.0857395352129765e-06, + "loss": 0.6642, + "step": 19154 + }, + { + "epoch": 0.66, + "learning_rate": 5.0847912509895795e-06, + "loss": 0.6216, + "step": 19155 + }, + { + "epoch": 0.66, + "learning_rate": 5.0838430250422035e-06, + "loss": 0.5942, + "step": 19156 + }, + { + "epoch": 0.66, + "learning_rate": 5.082894857382085e-06, + "loss": 0.6165, + "step": 19157 + }, + { + "epoch": 0.66, + "learning_rate": 5.081946748020466e-06, + "loss": 0.6865, + "step": 19158 + }, + { + "epoch": 0.66, + "learning_rate": 5.080998696968591e-06, + "loss": 0.6314, + "step": 19159 + }, + { + "epoch": 0.66, + "learning_rate": 5.0800507042377e-06, + "loss": 0.659, + "step": 19160 + }, + { + "epoch": 0.66, + "learning_rate": 5.079102769839031e-06, + "loss": 0.6437, + "step": 19161 + }, + { + "epoch": 0.66, + "learning_rate": 5.078154893783826e-06, + "loss": 0.6234, + "step": 19162 + }, + { + "epoch": 0.66, + "learning_rate": 5.0772070760833185e-06, + "loss": 0.5831, + "step": 19163 + }, + { + "epoch": 0.66, + "learning_rate": 5.0762593167487486e-06, + "loss": 0.6059, + "step": 19164 + }, + { + "epoch": 0.66, + "learning_rate": 5.075311615791352e-06, + "loss": 0.6552, + "step": 19165 + }, + { + "epoch": 0.66, + "learning_rate": 5.074363973222366e-06, + "loss": 0.6213, + "step": 19166 + }, + { + "epoch": 0.66, + "learning_rate": 5.073416389053027e-06, + "loss": 0.6703, + "step": 19167 + }, + { + "epoch": 0.66, + "learning_rate": 5.072468863294572e-06, + "loss": 0.6752, + "step": 19168 + }, + { + "epoch": 0.66, + "learning_rate": 5.0715213959582275e-06, + "loss": 0.6402, + "step": 19169 + }, + { + "epoch": 0.66, + "learning_rate": 5.070573987055234e-06, + "loss": 0.6414, + "step": 19170 + }, + { + "epoch": 0.66, + "learning_rate": 5.069626636596818e-06, + "loss": 0.639, + "step": 19171 + }, + { + "epoch": 0.66, + "learning_rate": 5.068679344594218e-06, + "loss": 0.6375, + "step": 19172 + }, + { + "epoch": 0.66, + "learning_rate": 5.067732111058662e-06, + "loss": 0.5936, + "step": 19173 + }, + { + "epoch": 0.66, + "learning_rate": 5.066784936001384e-06, + "loss": 0.6423, + "step": 19174 + }, + { + "epoch": 0.66, + "learning_rate": 5.065837819433608e-06, + "loss": 0.6663, + "step": 19175 + }, + { + "epoch": 0.66, + "learning_rate": 5.064890761366567e-06, + "loss": 0.6053, + "step": 19176 + }, + { + "epoch": 0.66, + "learning_rate": 5.063943761811489e-06, + "loss": 0.583, + "step": 19177 + }, + { + "epoch": 0.66, + "learning_rate": 5.0629968207796e-06, + "loss": 0.6396, + "step": 19178 + }, + { + "epoch": 0.66, + "learning_rate": 5.062049938282129e-06, + "loss": 0.6438, + "step": 19179 + }, + { + "epoch": 0.66, + "learning_rate": 5.061103114330309e-06, + "loss": 0.6191, + "step": 19180 + }, + { + "epoch": 0.66, + "learning_rate": 5.060156348935355e-06, + "loss": 0.6302, + "step": 19181 + }, + { + "epoch": 0.66, + "learning_rate": 5.0592096421084946e-06, + "loss": 0.671, + "step": 19182 + }, + { + "epoch": 0.66, + "learning_rate": 5.058262993860955e-06, + "loss": 0.6244, + "step": 19183 + }, + { + "epoch": 0.66, + "learning_rate": 5.057316404203958e-06, + "loss": 0.6807, + "step": 19184 + }, + { + "epoch": 0.66, + "learning_rate": 5.0563698731487295e-06, + "loss": 0.6167, + "step": 19185 + }, + { + "epoch": 0.66, + "learning_rate": 5.055423400706492e-06, + "loss": 0.6523, + "step": 19186 + }, + { + "epoch": 0.66, + "learning_rate": 5.054476986888461e-06, + "loss": 0.5998, + "step": 19187 + }, + { + "epoch": 0.66, + "learning_rate": 5.053530631705863e-06, + "loss": 0.6089, + "step": 19188 + }, + { + "epoch": 0.66, + "learning_rate": 5.052584335169917e-06, + "loss": 0.6687, + "step": 19189 + }, + { + "epoch": 0.66, + "learning_rate": 5.05163809729184e-06, + "loss": 0.6538, + "step": 19190 + }, + { + "epoch": 0.66, + "learning_rate": 5.050691918082855e-06, + "loss": 0.6367, + "step": 19191 + }, + { + "epoch": 0.66, + "learning_rate": 5.049745797554181e-06, + "loss": 0.6324, + "step": 19192 + }, + { + "epoch": 0.66, + "learning_rate": 5.048799735717029e-06, + "loss": 0.6676, + "step": 19193 + }, + { + "epoch": 0.67, + "learning_rate": 5.04785373258262e-06, + "loss": 0.6514, + "step": 19194 + }, + { + "epoch": 0.67, + "learning_rate": 5.046907788162168e-06, + "loss": 0.6549, + "step": 19195 + }, + { + "epoch": 0.67, + "learning_rate": 5.045961902466892e-06, + "loss": 0.6482, + "step": 19196 + }, + { + "epoch": 0.67, + "learning_rate": 5.045016075508007e-06, + "loss": 0.6352, + "step": 19197 + }, + { + "epoch": 0.67, + "learning_rate": 5.04407030729672e-06, + "loss": 0.642, + "step": 19198 + }, + { + "epoch": 0.67, + "learning_rate": 5.04312459784425e-06, + "loss": 0.6127, + "step": 19199 + }, + { + "epoch": 0.67, + "learning_rate": 5.042178947161808e-06, + "loss": 0.6205, + "step": 19200 + }, + { + "epoch": 0.67, + "learning_rate": 5.041233355260607e-06, + "loss": 0.6248, + "step": 19201 + }, + { + "epoch": 0.67, + "learning_rate": 5.040287822151856e-06, + "loss": 0.6189, + "step": 19202 + }, + { + "epoch": 0.67, + "learning_rate": 5.039342347846772e-06, + "loss": 0.6298, + "step": 19203 + }, + { + "epoch": 0.67, + "learning_rate": 5.038396932356555e-06, + "loss": 0.6411, + "step": 19204 + }, + { + "epoch": 0.67, + "learning_rate": 5.037451575692419e-06, + "loss": 0.6134, + "step": 19205 + }, + { + "epoch": 0.67, + "learning_rate": 5.0365062778655726e-06, + "loss": 0.6618, + "step": 19206 + }, + { + "epoch": 0.67, + "learning_rate": 5.035561038887223e-06, + "loss": 0.6323, + "step": 19207 + }, + { + "epoch": 0.67, + "learning_rate": 5.034615858768578e-06, + "loss": 0.5962, + "step": 19208 + }, + { + "epoch": 0.67, + "learning_rate": 5.033670737520846e-06, + "loss": 0.5988, + "step": 19209 + }, + { + "epoch": 0.67, + "learning_rate": 5.032725675155227e-06, + "loss": 0.6799, + "step": 19210 + }, + { + "epoch": 0.67, + "learning_rate": 5.031780671682928e-06, + "loss": 0.6712, + "step": 19211 + }, + { + "epoch": 0.67, + "learning_rate": 5.030835727115153e-06, + "loss": 0.6234, + "step": 19212 + }, + { + "epoch": 0.67, + "learning_rate": 5.0298908414631085e-06, + "loss": 0.691, + "step": 19213 + }, + { + "epoch": 0.67, + "learning_rate": 5.028946014737994e-06, + "loss": 0.6253, + "step": 19214 + }, + { + "epoch": 0.67, + "learning_rate": 5.028001246951018e-06, + "loss": 0.6192, + "step": 19215 + }, + { + "epoch": 0.67, + "learning_rate": 5.027056538113372e-06, + "loss": 0.6296, + "step": 19216 + }, + { + "epoch": 0.67, + "learning_rate": 5.026111888236261e-06, + "loss": 0.6989, + "step": 19217 + }, + { + "epoch": 0.67, + "learning_rate": 5.025167297330887e-06, + "loss": 0.6401, + "step": 19218 + }, + { + "epoch": 0.67, + "learning_rate": 5.0242227654084465e-06, + "loss": 0.6598, + "step": 19219 + }, + { + "epoch": 0.67, + "learning_rate": 5.02327829248014e-06, + "loss": 0.6414, + "step": 19220 + }, + { + "epoch": 0.67, + "learning_rate": 5.022333878557169e-06, + "loss": 0.6226, + "step": 19221 + }, + { + "epoch": 0.67, + "learning_rate": 5.021389523650724e-06, + "loss": 0.6184, + "step": 19222 + }, + { + "epoch": 0.67, + "learning_rate": 5.020445227772002e-06, + "loss": 0.6273, + "step": 19223 + }, + { + "epoch": 0.67, + "learning_rate": 5.0195009909322025e-06, + "loss": 0.63, + "step": 19224 + }, + { + "epoch": 0.67, + "learning_rate": 5.018556813142519e-06, + "loss": 0.5806, + "step": 19225 + }, + { + "epoch": 0.67, + "learning_rate": 5.017612694414145e-06, + "loss": 0.6209, + "step": 19226 + }, + { + "epoch": 0.67, + "learning_rate": 5.016668634758279e-06, + "loss": 0.677, + "step": 19227 + }, + { + "epoch": 0.67, + "learning_rate": 5.015724634186108e-06, + "loss": 0.5977, + "step": 19228 + }, + { + "epoch": 0.67, + "learning_rate": 5.014780692708825e-06, + "loss": 0.6397, + "step": 19229 + }, + { + "epoch": 0.67, + "learning_rate": 5.0138368103376245e-06, + "loss": 0.625, + "step": 19230 + }, + { + "epoch": 0.67, + "learning_rate": 5.012892987083695e-06, + "loss": 0.5872, + "step": 19231 + }, + { + "epoch": 0.67, + "learning_rate": 5.011949222958229e-06, + "loss": 0.6559, + "step": 19232 + }, + { + "epoch": 0.67, + "learning_rate": 5.011005517972418e-06, + "loss": 0.6464, + "step": 19233 + }, + { + "epoch": 0.67, + "learning_rate": 5.010061872137444e-06, + "loss": 0.58, + "step": 19234 + }, + { + "epoch": 0.67, + "learning_rate": 5.009118285464498e-06, + "loss": 0.6166, + "step": 19235 + }, + { + "epoch": 0.67, + "learning_rate": 5.00817475796477e-06, + "loss": 0.6067, + "step": 19236 + }, + { + "epoch": 0.67, + "learning_rate": 5.0072312896494434e-06, + "loss": 0.68, + "step": 19237 + }, + { + "epoch": 0.67, + "learning_rate": 5.006287880529708e-06, + "loss": 0.5958, + "step": 19238 + }, + { + "epoch": 0.67, + "learning_rate": 5.005344530616748e-06, + "loss": 0.6749, + "step": 19239 + }, + { + "epoch": 0.67, + "learning_rate": 5.004401239921744e-06, + "loss": 0.5367, + "step": 19240 + }, + { + "epoch": 0.67, + "learning_rate": 5.003458008455884e-06, + "loss": 0.6413, + "step": 19241 + }, + { + "epoch": 0.67, + "learning_rate": 5.002514836230348e-06, + "loss": 0.6252, + "step": 19242 + }, + { + "epoch": 0.67, + "learning_rate": 5.001571723256321e-06, + "loss": 0.6464, + "step": 19243 + }, + { + "epoch": 0.67, + "learning_rate": 5.000628669544985e-06, + "loss": 0.6425, + "step": 19244 + }, + { + "epoch": 0.67, + "learning_rate": 4.999685675107523e-06, + "loss": 0.6155, + "step": 19245 + }, + { + "epoch": 0.67, + "learning_rate": 4.99874273995511e-06, + "loss": 0.5693, + "step": 19246 + }, + { + "epoch": 0.67, + "learning_rate": 4.997799864098928e-06, + "loss": 0.6719, + "step": 19247 + }, + { + "epoch": 0.67, + "learning_rate": 4.9968570475501565e-06, + "loss": 0.6817, + "step": 19248 + }, + { + "epoch": 0.67, + "learning_rate": 4.995914290319974e-06, + "loss": 0.6332, + "step": 19249 + }, + { + "epoch": 0.67, + "learning_rate": 4.994971592419557e-06, + "loss": 0.5901, + "step": 19250 + }, + { + "epoch": 0.67, + "learning_rate": 4.994028953860087e-06, + "loss": 0.6277, + "step": 19251 + }, + { + "epoch": 0.67, + "learning_rate": 4.993086374652733e-06, + "loss": 0.6204, + "step": 19252 + }, + { + "epoch": 0.67, + "learning_rate": 4.992143854808674e-06, + "loss": 0.6126, + "step": 19253 + }, + { + "epoch": 0.67, + "learning_rate": 4.991201394339085e-06, + "loss": 0.5891, + "step": 19254 + }, + { + "epoch": 0.67, + "learning_rate": 4.990258993255139e-06, + "loss": 0.6389, + "step": 19255 + }, + { + "epoch": 0.67, + "learning_rate": 4.989316651568014e-06, + "loss": 0.6813, + "step": 19256 + }, + { + "epoch": 0.67, + "learning_rate": 4.988374369288874e-06, + "loss": 0.6609, + "step": 19257 + }, + { + "epoch": 0.67, + "learning_rate": 4.987432146428896e-06, + "loss": 0.6399, + "step": 19258 + }, + { + "epoch": 0.67, + "learning_rate": 4.986489982999255e-06, + "loss": 0.5839, + "step": 19259 + }, + { + "epoch": 0.67, + "learning_rate": 4.98554787901111e-06, + "loss": 0.6154, + "step": 19260 + }, + { + "epoch": 0.67, + "learning_rate": 4.984605834475642e-06, + "loss": 0.6745, + "step": 19261 + }, + { + "epoch": 0.67, + "learning_rate": 4.98366384940402e-06, + "loss": 0.6782, + "step": 19262 + }, + { + "epoch": 0.67, + "learning_rate": 4.982721923807404e-06, + "loss": 0.6637, + "step": 19263 + }, + { + "epoch": 0.67, + "learning_rate": 4.981780057696968e-06, + "loss": 0.6315, + "step": 19264 + }, + { + "epoch": 0.67, + "learning_rate": 4.980838251083881e-06, + "loss": 0.6353, + "step": 19265 + }, + { + "epoch": 0.67, + "learning_rate": 4.979896503979297e-06, + "loss": 0.6373, + "step": 19266 + }, + { + "epoch": 0.67, + "learning_rate": 4.978954816394394e-06, + "loss": 0.6287, + "step": 19267 + }, + { + "epoch": 0.67, + "learning_rate": 4.978013188340339e-06, + "loss": 0.6501, + "step": 19268 + }, + { + "epoch": 0.67, + "learning_rate": 4.977071619828286e-06, + "loss": 0.641, + "step": 19269 + }, + { + "epoch": 0.67, + "learning_rate": 4.976130110869403e-06, + "loss": 0.6395, + "step": 19270 + }, + { + "epoch": 0.67, + "learning_rate": 4.975188661474856e-06, + "loss": 0.5658, + "step": 19271 + }, + { + "epoch": 0.67, + "learning_rate": 4.974247271655796e-06, + "loss": 0.6616, + "step": 19272 + }, + { + "epoch": 0.67, + "learning_rate": 4.973305941423398e-06, + "loss": 0.6532, + "step": 19273 + }, + { + "epoch": 0.67, + "learning_rate": 4.972364670788818e-06, + "loss": 0.6821, + "step": 19274 + }, + { + "epoch": 0.67, + "learning_rate": 4.971423459763213e-06, + "loss": 0.6254, + "step": 19275 + }, + { + "epoch": 0.67, + "learning_rate": 4.970482308357743e-06, + "loss": 0.6189, + "step": 19276 + }, + { + "epoch": 0.67, + "learning_rate": 4.969541216583572e-06, + "loss": 0.591, + "step": 19277 + }, + { + "epoch": 0.67, + "learning_rate": 4.968600184451845e-06, + "loss": 0.6011, + "step": 19278 + }, + { + "epoch": 0.67, + "learning_rate": 4.967659211973732e-06, + "loss": 0.5782, + "step": 19279 + }, + { + "epoch": 0.67, + "learning_rate": 4.966718299160389e-06, + "loss": 0.6399, + "step": 19280 + }, + { + "epoch": 0.67, + "learning_rate": 4.965777446022964e-06, + "loss": 0.6275, + "step": 19281 + }, + { + "epoch": 0.67, + "learning_rate": 4.964836652572615e-06, + "loss": 0.6391, + "step": 19282 + }, + { + "epoch": 0.67, + "learning_rate": 4.963895918820502e-06, + "loss": 0.6591, + "step": 19283 + }, + { + "epoch": 0.67, + "learning_rate": 4.962955244777764e-06, + "loss": 0.587, + "step": 19284 + }, + { + "epoch": 0.67, + "learning_rate": 4.962014630455568e-06, + "loss": 0.5803, + "step": 19285 + }, + { + "epoch": 0.67, + "learning_rate": 4.961074075865067e-06, + "loss": 0.6391, + "step": 19286 + }, + { + "epoch": 0.67, + "learning_rate": 4.960133581017401e-06, + "loss": 0.6147, + "step": 19287 + }, + { + "epoch": 0.67, + "learning_rate": 4.959193145923728e-06, + "loss": 0.6534, + "step": 19288 + }, + { + "epoch": 0.67, + "learning_rate": 4.958252770595201e-06, + "loss": 0.6339, + "step": 19289 + }, + { + "epoch": 0.67, + "learning_rate": 4.957312455042957e-06, + "loss": 0.6479, + "step": 19290 + }, + { + "epoch": 0.67, + "learning_rate": 4.956372199278157e-06, + "loss": 0.6513, + "step": 19291 + }, + { + "epoch": 0.67, + "learning_rate": 4.95543200331195e-06, + "loss": 0.64, + "step": 19292 + }, + { + "epoch": 0.67, + "learning_rate": 4.954491867155472e-06, + "loss": 0.6182, + "step": 19293 + }, + { + "epoch": 0.67, + "learning_rate": 4.953551790819876e-06, + "loss": 0.635, + "step": 19294 + }, + { + "epoch": 0.67, + "learning_rate": 4.952611774316311e-06, + "loss": 0.6117, + "step": 19295 + }, + { + "epoch": 0.67, + "learning_rate": 4.951671817655912e-06, + "loss": 0.6152, + "step": 19296 + }, + { + "epoch": 0.67, + "learning_rate": 4.950731920849833e-06, + "loss": 0.6099, + "step": 19297 + }, + { + "epoch": 0.67, + "learning_rate": 4.9497920839092185e-06, + "loss": 0.6175, + "step": 19298 + }, + { + "epoch": 0.67, + "learning_rate": 4.948852306845202e-06, + "loss": 0.5533, + "step": 19299 + }, + { + "epoch": 0.67, + "learning_rate": 4.947912589668933e-06, + "loss": 0.6294, + "step": 19300 + }, + { + "epoch": 0.67, + "learning_rate": 4.9469729323915536e-06, + "loss": 0.6214, + "step": 19301 + }, + { + "epoch": 0.67, + "learning_rate": 4.946033335024196e-06, + "loss": 0.6487, + "step": 19302 + }, + { + "epoch": 0.67, + "learning_rate": 4.945093797578009e-06, + "loss": 0.6442, + "step": 19303 + }, + { + "epoch": 0.67, + "learning_rate": 4.944154320064134e-06, + "loss": 0.6493, + "step": 19304 + }, + { + "epoch": 0.67, + "learning_rate": 4.943214902493701e-06, + "loss": 0.62, + "step": 19305 + }, + { + "epoch": 0.67, + "learning_rate": 4.942275544877853e-06, + "loss": 0.6142, + "step": 19306 + }, + { + "epoch": 0.67, + "learning_rate": 4.94133624722773e-06, + "loss": 0.6313, + "step": 19307 + }, + { + "epoch": 0.67, + "learning_rate": 4.940397009554457e-06, + "loss": 0.655, + "step": 19308 + }, + { + "epoch": 0.67, + "learning_rate": 4.939457831869182e-06, + "loss": 0.6531, + "step": 19309 + }, + { + "epoch": 0.67, + "learning_rate": 4.938518714183039e-06, + "loss": 0.5914, + "step": 19310 + }, + { + "epoch": 0.67, + "learning_rate": 4.9375796565071574e-06, + "loss": 0.6212, + "step": 19311 + }, + { + "epoch": 0.67, + "learning_rate": 4.936640658852672e-06, + "loss": 0.6533, + "step": 19312 + }, + { + "epoch": 0.67, + "learning_rate": 4.93570172123072e-06, + "loss": 0.6513, + "step": 19313 + }, + { + "epoch": 0.67, + "learning_rate": 4.9347628436524235e-06, + "loss": 0.5454, + "step": 19314 + }, + { + "epoch": 0.67, + "learning_rate": 4.933824026128925e-06, + "loss": 0.6414, + "step": 19315 + }, + { + "epoch": 0.67, + "learning_rate": 4.932885268671354e-06, + "loss": 0.6441, + "step": 19316 + }, + { + "epoch": 0.67, + "learning_rate": 4.931946571290835e-06, + "loss": 0.6649, + "step": 19317 + }, + { + "epoch": 0.67, + "learning_rate": 4.931007933998505e-06, + "loss": 0.5917, + "step": 19318 + }, + { + "epoch": 0.67, + "learning_rate": 4.930069356805485e-06, + "loss": 0.5911, + "step": 19319 + }, + { + "epoch": 0.67, + "learning_rate": 4.929130839722901e-06, + "loss": 0.6994, + "step": 19320 + }, + { + "epoch": 0.67, + "learning_rate": 4.928192382761894e-06, + "loss": 0.6292, + "step": 19321 + }, + { + "epoch": 0.67, + "learning_rate": 4.927253985933577e-06, + "loss": 0.6741, + "step": 19322 + }, + { + "epoch": 0.67, + "learning_rate": 4.926315649249083e-06, + "loss": 0.6793, + "step": 19323 + }, + { + "epoch": 0.67, + "learning_rate": 4.9253773727195375e-06, + "loss": 0.5943, + "step": 19324 + }, + { + "epoch": 0.67, + "learning_rate": 4.924439156356059e-06, + "loss": 0.6124, + "step": 19325 + }, + { + "epoch": 0.67, + "learning_rate": 4.923501000169772e-06, + "loss": 0.5871, + "step": 19326 + }, + { + "epoch": 0.67, + "learning_rate": 4.922562904171809e-06, + "loss": 0.6482, + "step": 19327 + }, + { + "epoch": 0.67, + "learning_rate": 4.921624868373284e-06, + "loss": 0.6606, + "step": 19328 + }, + { + "epoch": 0.67, + "learning_rate": 4.920686892785318e-06, + "loss": 0.6444, + "step": 19329 + }, + { + "epoch": 0.67, + "learning_rate": 4.919748977419039e-06, + "loss": 0.6351, + "step": 19330 + }, + { + "epoch": 0.67, + "learning_rate": 4.918811122285558e-06, + "loss": 0.5547, + "step": 19331 + }, + { + "epoch": 0.67, + "learning_rate": 4.917873327395997e-06, + "loss": 0.6513, + "step": 19332 + }, + { + "epoch": 0.67, + "learning_rate": 4.9169355927614824e-06, + "loss": 0.5924, + "step": 19333 + }, + { + "epoch": 0.67, + "learning_rate": 4.915997918393123e-06, + "loss": 0.6786, + "step": 19334 + }, + { + "epoch": 0.67, + "learning_rate": 4.91506030430204e-06, + "loss": 0.5969, + "step": 19335 + }, + { + "epoch": 0.67, + "learning_rate": 4.914122750499353e-06, + "loss": 0.6334, + "step": 19336 + }, + { + "epoch": 0.67, + "learning_rate": 4.9131852569961714e-06, + "loss": 0.6848, + "step": 19337 + }, + { + "epoch": 0.67, + "learning_rate": 4.912247823803609e-06, + "loss": 0.5924, + "step": 19338 + }, + { + "epoch": 0.67, + "learning_rate": 4.911310450932791e-06, + "loss": 0.6107, + "step": 19339 + }, + { + "epoch": 0.67, + "learning_rate": 4.910373138394823e-06, + "loss": 0.6173, + "step": 19340 + }, + { + "epoch": 0.67, + "learning_rate": 4.9094358862008196e-06, + "loss": 0.6105, + "step": 19341 + }, + { + "epoch": 0.67, + "learning_rate": 4.908498694361896e-06, + "loss": 0.6396, + "step": 19342 + }, + { + "epoch": 0.67, + "learning_rate": 4.907561562889158e-06, + "loss": 0.6631, + "step": 19343 + }, + { + "epoch": 0.67, + "learning_rate": 4.906624491793717e-06, + "loss": 0.6442, + "step": 19344 + }, + { + "epoch": 0.67, + "learning_rate": 4.905687481086691e-06, + "loss": 0.6169, + "step": 19345 + }, + { + "epoch": 0.67, + "learning_rate": 4.904750530779183e-06, + "loss": 0.6811, + "step": 19346 + }, + { + "epoch": 0.67, + "learning_rate": 4.903813640882301e-06, + "loss": 0.5898, + "step": 19347 + }, + { + "epoch": 0.67, + "learning_rate": 4.90287681140716e-06, + "loss": 0.6129, + "step": 19348 + }, + { + "epoch": 0.67, + "learning_rate": 4.9019400423648575e-06, + "loss": 0.6023, + "step": 19349 + }, + { + "epoch": 0.67, + "learning_rate": 4.901003333766502e-06, + "loss": 0.6175, + "step": 19350 + }, + { + "epoch": 0.67, + "learning_rate": 4.9000666856232105e-06, + "loss": 0.6379, + "step": 19351 + }, + { + "epoch": 0.67, + "learning_rate": 4.8991300979460744e-06, + "loss": 0.6515, + "step": 19352 + }, + { + "epoch": 0.67, + "learning_rate": 4.898193570746205e-06, + "loss": 0.6148, + "step": 19353 + }, + { + "epoch": 0.67, + "learning_rate": 4.897257104034707e-06, + "loss": 0.6397, + "step": 19354 + }, + { + "epoch": 0.67, + "learning_rate": 4.896320697822678e-06, + "loss": 0.6171, + "step": 19355 + }, + { + "epoch": 0.67, + "learning_rate": 4.8953843521212195e-06, + "loss": 0.6485, + "step": 19356 + }, + { + "epoch": 0.67, + "learning_rate": 4.8944480669414455e-06, + "loss": 0.6244, + "step": 19357 + }, + { + "epoch": 0.67, + "learning_rate": 4.893511842294442e-06, + "loss": 0.6469, + "step": 19358 + }, + { + "epoch": 0.67, + "learning_rate": 4.892575678191317e-06, + "loss": 0.6035, + "step": 19359 + }, + { + "epoch": 0.67, + "learning_rate": 4.891639574643172e-06, + "loss": 0.6654, + "step": 19360 + }, + { + "epoch": 0.67, + "learning_rate": 4.890703531661099e-06, + "loss": 0.6345, + "step": 19361 + }, + { + "epoch": 0.67, + "learning_rate": 4.889767549256194e-06, + "loss": 0.6297, + "step": 19362 + }, + { + "epoch": 0.67, + "learning_rate": 4.888831627439566e-06, + "loss": 0.5963, + "step": 19363 + }, + { + "epoch": 0.67, + "learning_rate": 4.8878957662223024e-06, + "loss": 0.6114, + "step": 19364 + }, + { + "epoch": 0.67, + "learning_rate": 4.8869599656155e-06, + "loss": 0.6116, + "step": 19365 + }, + { + "epoch": 0.67, + "learning_rate": 4.886024225630261e-06, + "loss": 0.6402, + "step": 19366 + }, + { + "epoch": 0.67, + "learning_rate": 4.885088546277667e-06, + "loss": 0.6106, + "step": 19367 + }, + { + "epoch": 0.67, + "learning_rate": 4.884152927568818e-06, + "loss": 0.5858, + "step": 19368 + }, + { + "epoch": 0.67, + "learning_rate": 4.883217369514815e-06, + "loss": 0.6748, + "step": 19369 + }, + { + "epoch": 0.67, + "learning_rate": 4.8822818721267374e-06, + "loss": 0.6087, + "step": 19370 + }, + { + "epoch": 0.67, + "learning_rate": 4.8813464354156824e-06, + "loss": 0.6264, + "step": 19371 + }, + { + "epoch": 0.67, + "learning_rate": 4.880411059392746e-06, + "loss": 0.6589, + "step": 19372 + }, + { + "epoch": 0.67, + "learning_rate": 4.879475744069007e-06, + "loss": 0.6075, + "step": 19373 + }, + { + "epoch": 0.67, + "learning_rate": 4.878540489455558e-06, + "loss": 0.6823, + "step": 19374 + }, + { + "epoch": 0.67, + "learning_rate": 4.877605295563497e-06, + "loss": 0.6425, + "step": 19375 + }, + { + "epoch": 0.67, + "learning_rate": 4.876670162403901e-06, + "loss": 0.6755, + "step": 19376 + }, + { + "epoch": 0.67, + "learning_rate": 4.875735089987863e-06, + "loss": 0.6052, + "step": 19377 + }, + { + "epoch": 0.67, + "learning_rate": 4.87480007832647e-06, + "loss": 0.6605, + "step": 19378 + }, + { + "epoch": 0.67, + "learning_rate": 4.873865127430802e-06, + "loss": 0.6251, + "step": 19379 + }, + { + "epoch": 0.67, + "learning_rate": 4.872930237311948e-06, + "loss": 0.6196, + "step": 19380 + }, + { + "epoch": 0.67, + "learning_rate": 4.871995407980991e-06, + "loss": 0.5773, + "step": 19381 + }, + { + "epoch": 0.67, + "learning_rate": 4.8710606394490154e-06, + "loss": 0.6771, + "step": 19382 + }, + { + "epoch": 0.67, + "learning_rate": 4.870125931727109e-06, + "loss": 0.6854, + "step": 19383 + }, + { + "epoch": 0.67, + "learning_rate": 4.869191284826344e-06, + "loss": 0.6306, + "step": 19384 + }, + { + "epoch": 0.67, + "learning_rate": 4.868256698757808e-06, + "loss": 0.6052, + "step": 19385 + }, + { + "epoch": 0.67, + "learning_rate": 4.867322173532579e-06, + "loss": 0.6094, + "step": 19386 + }, + { + "epoch": 0.67, + "learning_rate": 4.866387709161741e-06, + "loss": 0.6063, + "step": 19387 + }, + { + "epoch": 0.67, + "learning_rate": 4.865453305656368e-06, + "loss": 0.6035, + "step": 19388 + }, + { + "epoch": 0.67, + "learning_rate": 4.864518963027547e-06, + "loss": 0.656, + "step": 19389 + }, + { + "epoch": 0.67, + "learning_rate": 4.8635846812863455e-06, + "loss": 0.5892, + "step": 19390 + }, + { + "epoch": 0.67, + "learning_rate": 4.862650460443845e-06, + "loss": 0.6641, + "step": 19391 + }, + { + "epoch": 0.67, + "learning_rate": 4.861716300511122e-06, + "loss": 0.673, + "step": 19392 + }, + { + "epoch": 0.67, + "learning_rate": 4.8607822014992525e-06, + "loss": 0.695, + "step": 19393 + }, + { + "epoch": 0.67, + "learning_rate": 4.859848163419312e-06, + "loss": 0.6501, + "step": 19394 + }, + { + "epoch": 0.67, + "learning_rate": 4.858914186282376e-06, + "loss": 0.6556, + "step": 19395 + }, + { + "epoch": 0.67, + "learning_rate": 4.8579802700995125e-06, + "loss": 0.6273, + "step": 19396 + }, + { + "epoch": 0.67, + "learning_rate": 4.857046414881799e-06, + "loss": 0.635, + "step": 19397 + }, + { + "epoch": 0.67, + "learning_rate": 4.856112620640304e-06, + "loss": 0.6786, + "step": 19398 + }, + { + "epoch": 0.67, + "learning_rate": 4.855178887386103e-06, + "loss": 0.6283, + "step": 19399 + }, + { + "epoch": 0.67, + "learning_rate": 4.854245215130263e-06, + "loss": 0.6198, + "step": 19400 + }, + { + "epoch": 0.67, + "learning_rate": 4.85331160388386e-06, + "loss": 0.6392, + "step": 19401 + }, + { + "epoch": 0.67, + "learning_rate": 4.852378053657954e-06, + "loss": 0.6317, + "step": 19402 + }, + { + "epoch": 0.67, + "learning_rate": 4.8514445644636185e-06, + "loss": 0.6212, + "step": 19403 + }, + { + "epoch": 0.67, + "learning_rate": 4.850511136311921e-06, + "loss": 0.632, + "step": 19404 + }, + { + "epoch": 0.67, + "learning_rate": 4.849577769213928e-06, + "loss": 0.6245, + "step": 19405 + }, + { + "epoch": 0.67, + "learning_rate": 4.848644463180705e-06, + "loss": 0.5849, + "step": 19406 + }, + { + "epoch": 0.67, + "learning_rate": 4.847711218223324e-06, + "loss": 0.5918, + "step": 19407 + }, + { + "epoch": 0.67, + "learning_rate": 4.846778034352838e-06, + "loss": 0.6555, + "step": 19408 + }, + { + "epoch": 0.67, + "learning_rate": 4.845844911580319e-06, + "loss": 0.6679, + "step": 19409 + }, + { + "epoch": 0.67, + "learning_rate": 4.844911849916827e-06, + "loss": 0.6478, + "step": 19410 + }, + { + "epoch": 0.67, + "learning_rate": 4.8439788493734276e-06, + "loss": 0.6816, + "step": 19411 + }, + { + "epoch": 0.67, + "learning_rate": 4.84304590996118e-06, + "loss": 0.6188, + "step": 19412 + }, + { + "epoch": 0.67, + "learning_rate": 4.842113031691153e-06, + "loss": 0.6356, + "step": 19413 + }, + { + "epoch": 0.67, + "learning_rate": 4.841180214574395e-06, + "loss": 0.6516, + "step": 19414 + }, + { + "epoch": 0.67, + "learning_rate": 4.840247458621972e-06, + "loss": 0.6137, + "step": 19415 + }, + { + "epoch": 0.67, + "learning_rate": 4.839314763844942e-06, + "loss": 0.5905, + "step": 19416 + }, + { + "epoch": 0.67, + "learning_rate": 4.838382130254364e-06, + "loss": 0.6305, + "step": 19417 + }, + { + "epoch": 0.67, + "learning_rate": 4.837449557861296e-06, + "loss": 0.6482, + "step": 19418 + }, + { + "epoch": 0.67, + "learning_rate": 4.8365170466767975e-06, + "loss": 0.6598, + "step": 19419 + }, + { + "epoch": 0.67, + "learning_rate": 4.835584596711917e-06, + "loss": 0.6363, + "step": 19420 + }, + { + "epoch": 0.67, + "learning_rate": 4.8346522079777145e-06, + "loss": 0.6448, + "step": 19421 + }, + { + "epoch": 0.67, + "learning_rate": 4.833719880485245e-06, + "loss": 0.6331, + "step": 19422 + }, + { + "epoch": 0.67, + "learning_rate": 4.832787614245561e-06, + "loss": 0.6406, + "step": 19423 + }, + { + "epoch": 0.67, + "learning_rate": 4.831855409269717e-06, + "loss": 0.6214, + "step": 19424 + }, + { + "epoch": 0.67, + "learning_rate": 4.830923265568768e-06, + "loss": 0.6824, + "step": 19425 + }, + { + "epoch": 0.67, + "learning_rate": 4.829991183153758e-06, + "loss": 0.6461, + "step": 19426 + }, + { + "epoch": 0.67, + "learning_rate": 4.829059162035744e-06, + "loss": 0.6637, + "step": 19427 + }, + { + "epoch": 0.67, + "learning_rate": 4.828127202225774e-06, + "loss": 0.6525, + "step": 19428 + }, + { + "epoch": 0.67, + "learning_rate": 4.8271953037349e-06, + "loss": 0.6152, + "step": 19429 + }, + { + "epoch": 0.67, + "learning_rate": 4.826263466574167e-06, + "loss": 0.6346, + "step": 19430 + }, + { + "epoch": 0.67, + "learning_rate": 4.825331690754631e-06, + "loss": 0.6872, + "step": 19431 + }, + { + "epoch": 0.67, + "learning_rate": 4.8243999762873295e-06, + "loss": 0.6111, + "step": 19432 + }, + { + "epoch": 0.67, + "learning_rate": 4.823468323183313e-06, + "loss": 0.6134, + "step": 19433 + }, + { + "epoch": 0.67, + "learning_rate": 4.822536731453629e-06, + "loss": 0.6091, + "step": 19434 + }, + { + "epoch": 0.67, + "learning_rate": 4.821605201109319e-06, + "loss": 0.6001, + "step": 19435 + }, + { + "epoch": 0.67, + "learning_rate": 4.820673732161433e-06, + "loss": 0.5851, + "step": 19436 + }, + { + "epoch": 0.67, + "learning_rate": 4.819742324621014e-06, + "loss": 0.6648, + "step": 19437 + }, + { + "epoch": 0.67, + "learning_rate": 4.8188109784991e-06, + "loss": 0.6632, + "step": 19438 + }, + { + "epoch": 0.67, + "learning_rate": 4.817879693806735e-06, + "loss": 0.6638, + "step": 19439 + }, + { + "epoch": 0.67, + "learning_rate": 4.816948470554963e-06, + "loss": 0.6385, + "step": 19440 + }, + { + "epoch": 0.67, + "learning_rate": 4.816017308754822e-06, + "loss": 0.7217, + "step": 19441 + }, + { + "epoch": 0.67, + "learning_rate": 4.8150862084173575e-06, + "loss": 0.6706, + "step": 19442 + }, + { + "epoch": 0.67, + "learning_rate": 4.814155169553603e-06, + "loss": 0.6391, + "step": 19443 + }, + { + "epoch": 0.67, + "learning_rate": 4.813224192174597e-06, + "loss": 0.6848, + "step": 19444 + }, + { + "epoch": 0.67, + "learning_rate": 4.81229327629138e-06, + "loss": 0.624, + "step": 19445 + }, + { + "epoch": 0.67, + "learning_rate": 4.811362421914989e-06, + "loss": 0.6535, + "step": 19446 + }, + { + "epoch": 0.67, + "learning_rate": 4.81043162905646e-06, + "loss": 0.6122, + "step": 19447 + }, + { + "epoch": 0.67, + "learning_rate": 4.8095008977268335e-06, + "loss": 0.6486, + "step": 19448 + }, + { + "epoch": 0.67, + "learning_rate": 4.808570227937135e-06, + "loss": 0.6337, + "step": 19449 + }, + { + "epoch": 0.67, + "learning_rate": 4.807639619698404e-06, + "loss": 0.6367, + "step": 19450 + }, + { + "epoch": 0.67, + "learning_rate": 4.806709073021673e-06, + "loss": 0.6371, + "step": 19451 + }, + { + "epoch": 0.67, + "learning_rate": 4.805778587917977e-06, + "loss": 0.6276, + "step": 19452 + }, + { + "epoch": 0.67, + "learning_rate": 4.804848164398346e-06, + "loss": 0.6386, + "step": 19453 + }, + { + "epoch": 0.67, + "learning_rate": 4.803917802473816e-06, + "loss": 0.6395, + "step": 19454 + }, + { + "epoch": 0.67, + "learning_rate": 4.802987502155409e-06, + "loss": 0.6004, + "step": 19455 + }, + { + "epoch": 0.67, + "learning_rate": 4.8020572634541586e-06, + "loss": 0.6796, + "step": 19456 + }, + { + "epoch": 0.67, + "learning_rate": 4.801127086381097e-06, + "loss": 0.6424, + "step": 19457 + }, + { + "epoch": 0.67, + "learning_rate": 4.800196970947249e-06, + "loss": 0.628, + "step": 19458 + }, + { + "epoch": 0.67, + "learning_rate": 4.799266917163643e-06, + "loss": 0.6695, + "step": 19459 + }, + { + "epoch": 0.67, + "learning_rate": 4.798336925041312e-06, + "loss": 0.6071, + "step": 19460 + }, + { + "epoch": 0.67, + "learning_rate": 4.797406994591272e-06, + "loss": 0.6021, + "step": 19461 + }, + { + "epoch": 0.67, + "learning_rate": 4.796477125824553e-06, + "loss": 0.6304, + "step": 19462 + }, + { + "epoch": 0.67, + "learning_rate": 4.795547318752181e-06, + "loss": 0.6068, + "step": 19463 + }, + { + "epoch": 0.67, + "learning_rate": 4.79461757338518e-06, + "loss": 0.6089, + "step": 19464 + }, + { + "epoch": 0.67, + "learning_rate": 4.7936878897345715e-06, + "loss": 0.6877, + "step": 19465 + }, + { + "epoch": 0.67, + "learning_rate": 4.792758267811383e-06, + "loss": 0.6469, + "step": 19466 + }, + { + "epoch": 0.67, + "learning_rate": 4.791828707626629e-06, + "loss": 0.6421, + "step": 19467 + }, + { + "epoch": 0.67, + "learning_rate": 4.790899209191333e-06, + "loss": 0.6136, + "step": 19468 + }, + { + "epoch": 0.67, + "learning_rate": 4.789969772516517e-06, + "loss": 0.6362, + "step": 19469 + }, + { + "epoch": 0.67, + "learning_rate": 4.7890403976132e-06, + "loss": 0.6172, + "step": 19470 + }, + { + "epoch": 0.67, + "learning_rate": 4.788111084492401e-06, + "loss": 0.6018, + "step": 19471 + }, + { + "epoch": 0.67, + "learning_rate": 4.787181833165143e-06, + "loss": 0.6383, + "step": 19472 + }, + { + "epoch": 0.67, + "learning_rate": 4.786252643642434e-06, + "loss": 0.6389, + "step": 19473 + }, + { + "epoch": 0.67, + "learning_rate": 4.785323515935296e-06, + "loss": 0.5998, + "step": 19474 + }, + { + "epoch": 0.67, + "learning_rate": 4.784394450054743e-06, + "loss": 0.6142, + "step": 19475 + }, + { + "epoch": 0.67, + "learning_rate": 4.783465446011793e-06, + "loss": 0.5801, + "step": 19476 + }, + { + "epoch": 0.67, + "learning_rate": 4.7825365038174574e-06, + "loss": 0.6306, + "step": 19477 + }, + { + "epoch": 0.67, + "learning_rate": 4.781607623482757e-06, + "loss": 0.5811, + "step": 19478 + }, + { + "epoch": 0.67, + "learning_rate": 4.780678805018695e-06, + "loss": 0.6394, + "step": 19479 + }, + { + "epoch": 0.67, + "learning_rate": 4.779750048436288e-06, + "loss": 0.6685, + "step": 19480 + }, + { + "epoch": 0.67, + "learning_rate": 4.778821353746549e-06, + "loss": 0.6404, + "step": 19481 + }, + { + "epoch": 0.67, + "learning_rate": 4.7778927209604865e-06, + "loss": 0.6231, + "step": 19482 + }, + { + "epoch": 0.68, + "learning_rate": 4.776964150089112e-06, + "loss": 0.6183, + "step": 19483 + }, + { + "epoch": 0.68, + "learning_rate": 4.776035641143438e-06, + "loss": 0.6355, + "step": 19484 + }, + { + "epoch": 0.68, + "learning_rate": 4.775107194134467e-06, + "loss": 0.622, + "step": 19485 + }, + { + "epoch": 0.68, + "learning_rate": 4.7741788090732095e-06, + "loss": 0.6156, + "step": 19486 + }, + { + "epoch": 0.68, + "learning_rate": 4.773250485970673e-06, + "loss": 0.6826, + "step": 19487 + }, + { + "epoch": 0.68, + "learning_rate": 4.772322224837864e-06, + "loss": 0.625, + "step": 19488 + }, + { + "epoch": 0.68, + "learning_rate": 4.771394025685787e-06, + "loss": 0.6357, + "step": 19489 + }, + { + "epoch": 0.68, + "learning_rate": 4.770465888525453e-06, + "loss": 0.6216, + "step": 19490 + }, + { + "epoch": 0.68, + "learning_rate": 4.769537813367857e-06, + "loss": 0.6377, + "step": 19491 + }, + { + "epoch": 0.68, + "learning_rate": 4.768609800224007e-06, + "loss": 0.5962, + "step": 19492 + }, + { + "epoch": 0.68, + "learning_rate": 4.767681849104905e-06, + "loss": 0.5874, + "step": 19493 + }, + { + "epoch": 0.68, + "learning_rate": 4.766753960021554e-06, + "loss": 0.6322, + "step": 19494 + }, + { + "epoch": 0.68, + "learning_rate": 4.765826132984955e-06, + "loss": 0.6271, + "step": 19495 + }, + { + "epoch": 0.68, + "learning_rate": 4.764898368006112e-06, + "loss": 0.6619, + "step": 19496 + }, + { + "epoch": 0.68, + "learning_rate": 4.763970665096018e-06, + "loss": 0.6039, + "step": 19497 + }, + { + "epoch": 0.68, + "learning_rate": 4.7630430242656755e-06, + "loss": 0.66, + "step": 19498 + }, + { + "epoch": 0.68, + "learning_rate": 4.762115445526082e-06, + "loss": 0.6471, + "step": 19499 + }, + { + "epoch": 0.68, + "learning_rate": 4.761187928888236e-06, + "loss": 0.6473, + "step": 19500 + }, + { + "epoch": 0.68, + "learning_rate": 4.760260474363134e-06, + "loss": 0.6022, + "step": 19501 + }, + { + "epoch": 0.68, + "learning_rate": 4.759333081961777e-06, + "loss": 0.5932, + "step": 19502 + }, + { + "epoch": 0.68, + "learning_rate": 4.758405751695151e-06, + "loss": 0.6279, + "step": 19503 + }, + { + "epoch": 0.68, + "learning_rate": 4.75747848357426e-06, + "loss": 0.6428, + "step": 19504 + }, + { + "epoch": 0.68, + "learning_rate": 4.756551277610085e-06, + "loss": 0.6154, + "step": 19505 + }, + { + "epoch": 0.68, + "learning_rate": 4.755624133813634e-06, + "loss": 0.6223, + "step": 19506 + }, + { + "epoch": 0.68, + "learning_rate": 4.754697052195894e-06, + "loss": 0.6144, + "step": 19507 + }, + { + "epoch": 0.68, + "learning_rate": 4.753770032767853e-06, + "loss": 0.6472, + "step": 19508 + }, + { + "epoch": 0.68, + "learning_rate": 4.7528430755405046e-06, + "loss": 0.6316, + "step": 19509 + }, + { + "epoch": 0.68, + "learning_rate": 4.751916180524843e-06, + "loss": 0.5937, + "step": 19510 + }, + { + "epoch": 0.68, + "learning_rate": 4.750989347731846e-06, + "loss": 0.6516, + "step": 19511 + }, + { + "epoch": 0.68, + "learning_rate": 4.750062577172514e-06, + "loss": 0.6622, + "step": 19512 + }, + { + "epoch": 0.68, + "learning_rate": 4.749135868857836e-06, + "loss": 0.6623, + "step": 19513 + }, + { + "epoch": 0.68, + "learning_rate": 4.7482092227987905e-06, + "loss": 0.6316, + "step": 19514 + }, + { + "epoch": 0.68, + "learning_rate": 4.7472826390063685e-06, + "loss": 0.6417, + "step": 19515 + }, + { + "epoch": 0.68, + "learning_rate": 4.7463561174915586e-06, + "loss": 0.6427, + "step": 19516 + }, + { + "epoch": 0.68, + "learning_rate": 4.745429658265336e-06, + "loss": 0.6765, + "step": 19517 + }, + { + "epoch": 0.68, + "learning_rate": 4.744503261338695e-06, + "loss": 0.6019, + "step": 19518 + }, + { + "epoch": 0.68, + "learning_rate": 4.743576926722621e-06, + "loss": 0.6152, + "step": 19519 + }, + { + "epoch": 0.68, + "learning_rate": 4.742650654428087e-06, + "loss": 0.6028, + "step": 19520 + }, + { + "epoch": 0.68, + "learning_rate": 4.741724444466081e-06, + "loss": 0.6107, + "step": 19521 + }, + { + "epoch": 0.68, + "learning_rate": 4.740798296847586e-06, + "loss": 0.6307, + "step": 19522 + }, + { + "epoch": 0.68, + "learning_rate": 4.739872211583573e-06, + "loss": 0.5874, + "step": 19523 + }, + { + "epoch": 0.68, + "learning_rate": 4.738946188685033e-06, + "loss": 0.6147, + "step": 19524 + }, + { + "epoch": 0.68, + "learning_rate": 4.738020228162945e-06, + "loss": 0.6495, + "step": 19525 + }, + { + "epoch": 0.68, + "learning_rate": 4.73709433002828e-06, + "loss": 0.6137, + "step": 19526 + }, + { + "epoch": 0.68, + "learning_rate": 4.73616849429202e-06, + "loss": 0.6134, + "step": 19527 + }, + { + "epoch": 0.68, + "learning_rate": 4.735242720965144e-06, + "loss": 0.6552, + "step": 19528 + }, + { + "epoch": 0.68, + "learning_rate": 4.7343170100586174e-06, + "loss": 0.6548, + "step": 19529 + }, + { + "epoch": 0.68, + "learning_rate": 4.733391361583429e-06, + "loss": 0.6438, + "step": 19530 + }, + { + "epoch": 0.68, + "learning_rate": 4.732465775550551e-06, + "loss": 0.5927, + "step": 19531 + }, + { + "epoch": 0.68, + "learning_rate": 4.731540251970952e-06, + "loss": 0.7165, + "step": 19532 + }, + { + "epoch": 0.68, + "learning_rate": 4.730614790855606e-06, + "loss": 0.6395, + "step": 19533 + }, + { + "epoch": 0.68, + "learning_rate": 4.729689392215493e-06, + "loss": 0.6199, + "step": 19534 + }, + { + "epoch": 0.68, + "learning_rate": 4.728764056061572e-06, + "loss": 0.6587, + "step": 19535 + }, + { + "epoch": 0.68, + "learning_rate": 4.727838782404824e-06, + "loss": 0.6677, + "step": 19536 + }, + { + "epoch": 0.68, + "learning_rate": 4.7269135712562205e-06, + "loss": 0.6736, + "step": 19537 + }, + { + "epoch": 0.68, + "learning_rate": 4.725988422626724e-06, + "loss": 0.6387, + "step": 19538 + }, + { + "epoch": 0.68, + "learning_rate": 4.725063336527306e-06, + "loss": 0.6184, + "step": 19539 + }, + { + "epoch": 0.68, + "learning_rate": 4.724138312968937e-06, + "loss": 0.5866, + "step": 19540 + }, + { + "epoch": 0.68, + "learning_rate": 4.7232133519625765e-06, + "loss": 0.6974, + "step": 19541 + }, + { + "epoch": 0.68, + "learning_rate": 4.7222884535192016e-06, + "loss": 0.5929, + "step": 19542 + }, + { + "epoch": 0.68, + "learning_rate": 4.721363617649776e-06, + "loss": 0.624, + "step": 19543 + }, + { + "epoch": 0.68, + "learning_rate": 4.720438844365258e-06, + "loss": 0.6369, + "step": 19544 + }, + { + "epoch": 0.68, + "learning_rate": 4.719514133676617e-06, + "loss": 0.6119, + "step": 19545 + }, + { + "epoch": 0.68, + "learning_rate": 4.718589485594819e-06, + "loss": 0.6953, + "step": 19546 + }, + { + "epoch": 0.68, + "learning_rate": 4.7176649001308165e-06, + "loss": 0.6061, + "step": 19547 + }, + { + "epoch": 0.68, + "learning_rate": 4.716740377295582e-06, + "loss": 0.5974, + "step": 19548 + }, + { + "epoch": 0.68, + "learning_rate": 4.7158159171000785e-06, + "loss": 0.6825, + "step": 19549 + }, + { + "epoch": 0.68, + "learning_rate": 4.714891519555257e-06, + "loss": 0.5959, + "step": 19550 + }, + { + "epoch": 0.68, + "learning_rate": 4.713967184672084e-06, + "loss": 0.6327, + "step": 19551 + }, + { + "epoch": 0.68, + "learning_rate": 4.713042912461519e-06, + "loss": 0.6465, + "step": 19552 + }, + { + "epoch": 0.68, + "learning_rate": 4.712118702934511e-06, + "loss": 0.6757, + "step": 19553 + }, + { + "epoch": 0.68, + "learning_rate": 4.7111945561020286e-06, + "loss": 0.5604, + "step": 19554 + }, + { + "epoch": 0.68, + "learning_rate": 4.7102704719750295e-06, + "loss": 0.6149, + "step": 19555 + }, + { + "epoch": 0.68, + "learning_rate": 4.709346450564462e-06, + "loss": 0.6541, + "step": 19556 + }, + { + "epoch": 0.68, + "learning_rate": 4.708422491881284e-06, + "loss": 0.6501, + "step": 19557 + }, + { + "epoch": 0.68, + "learning_rate": 4.7074985959364546e-06, + "loss": 0.5633, + "step": 19558 + }, + { + "epoch": 0.68, + "learning_rate": 4.706574762740919e-06, + "loss": 0.6042, + "step": 19559 + }, + { + "epoch": 0.68, + "learning_rate": 4.705650992305637e-06, + "loss": 0.6907, + "step": 19560 + }, + { + "epoch": 0.68, + "learning_rate": 4.704727284641565e-06, + "loss": 0.6579, + "step": 19561 + }, + { + "epoch": 0.68, + "learning_rate": 4.703803639759646e-06, + "loss": 0.6295, + "step": 19562 + }, + { + "epoch": 0.68, + "learning_rate": 4.702880057670834e-06, + "loss": 0.6738, + "step": 19563 + }, + { + "epoch": 0.68, + "learning_rate": 4.701956538386084e-06, + "loss": 0.6266, + "step": 19564 + }, + { + "epoch": 0.68, + "learning_rate": 4.701033081916334e-06, + "loss": 0.6291, + "step": 19565 + }, + { + "epoch": 0.68, + "learning_rate": 4.700109688272547e-06, + "loss": 0.6434, + "step": 19566 + }, + { + "epoch": 0.68, + "learning_rate": 4.699186357465661e-06, + "loss": 0.6349, + "step": 19567 + }, + { + "epoch": 0.68, + "learning_rate": 4.698263089506625e-06, + "loss": 0.6336, + "step": 19568 + }, + { + "epoch": 0.68, + "learning_rate": 4.697339884406392e-06, + "loss": 0.6435, + "step": 19569 + }, + { + "epoch": 0.68, + "learning_rate": 4.696416742175898e-06, + "loss": 0.6314, + "step": 19570 + }, + { + "epoch": 0.68, + "learning_rate": 4.6954936628260895e-06, + "loss": 0.6825, + "step": 19571 + }, + { + "epoch": 0.68, + "learning_rate": 4.694570646367921e-06, + "loss": 0.6288, + "step": 19572 + }, + { + "epoch": 0.68, + "learning_rate": 4.693647692812324e-06, + "loss": 0.6296, + "step": 19573 + }, + { + "epoch": 0.68, + "learning_rate": 4.692724802170248e-06, + "loss": 0.6872, + "step": 19574 + }, + { + "epoch": 0.68, + "learning_rate": 4.691801974452635e-06, + "loss": 0.6296, + "step": 19575 + }, + { + "epoch": 0.68, + "learning_rate": 4.690879209670423e-06, + "loss": 0.6004, + "step": 19576 + }, + { + "epoch": 0.68, + "learning_rate": 4.689956507834548e-06, + "loss": 0.6537, + "step": 19577 + }, + { + "epoch": 0.68, + "learning_rate": 4.6890338689559656e-06, + "loss": 0.6243, + "step": 19578 + }, + { + "epoch": 0.68, + "learning_rate": 4.688111293045601e-06, + "loss": 0.6239, + "step": 19579 + }, + { + "epoch": 0.68, + "learning_rate": 4.687188780114395e-06, + "loss": 0.5997, + "step": 19580 + }, + { + "epoch": 0.68, + "learning_rate": 4.686266330173291e-06, + "loss": 0.6447, + "step": 19581 + }, + { + "epoch": 0.68, + "learning_rate": 4.685343943233219e-06, + "loss": 0.6356, + "step": 19582 + }, + { + "epoch": 0.68, + "learning_rate": 4.6844216193051124e-06, + "loss": 0.6351, + "step": 19583 + }, + { + "epoch": 0.68, + "learning_rate": 4.68349935839992e-06, + "loss": 0.6207, + "step": 19584 + }, + { + "epoch": 0.68, + "learning_rate": 4.682577160528564e-06, + "loss": 0.6562, + "step": 19585 + }, + { + "epoch": 0.68, + "learning_rate": 4.681655025701983e-06, + "loss": 0.6319, + "step": 19586 + }, + { + "epoch": 0.68, + "learning_rate": 4.680732953931113e-06, + "loss": 0.6071, + "step": 19587 + }, + { + "epoch": 0.68, + "learning_rate": 4.679810945226879e-06, + "loss": 0.6687, + "step": 19588 + }, + { + "epoch": 0.68, + "learning_rate": 4.678888999600212e-06, + "loss": 0.6415, + "step": 19589 + }, + { + "epoch": 0.68, + "learning_rate": 4.677967117062055e-06, + "loss": 0.6246, + "step": 19590 + }, + { + "epoch": 0.68, + "learning_rate": 4.677045297623327e-06, + "loss": 0.6536, + "step": 19591 + }, + { + "epoch": 0.68, + "learning_rate": 4.67612354129496e-06, + "loss": 0.6288, + "step": 19592 + }, + { + "epoch": 0.68, + "learning_rate": 4.675201848087887e-06, + "loss": 0.601, + "step": 19593 + }, + { + "epoch": 0.68, + "learning_rate": 4.674280218013028e-06, + "loss": 0.6191, + "step": 19594 + }, + { + "epoch": 0.68, + "learning_rate": 4.67335865108131e-06, + "loss": 0.6456, + "step": 19595 + }, + { + "epoch": 0.68, + "learning_rate": 4.672437147303672e-06, + "loss": 0.7093, + "step": 19596 + }, + { + "epoch": 0.68, + "learning_rate": 4.6715157066910265e-06, + "loss": 0.5736, + "step": 19597 + }, + { + "epoch": 0.68, + "learning_rate": 4.670594329254303e-06, + "loss": 0.6074, + "step": 19598 + }, + { + "epoch": 0.68, + "learning_rate": 4.669673015004429e-06, + "loss": 0.6311, + "step": 19599 + }, + { + "epoch": 0.68, + "learning_rate": 4.668751763952321e-06, + "loss": 0.6388, + "step": 19600 + }, + { + "epoch": 0.68, + "learning_rate": 4.667830576108902e-06, + "loss": 0.644, + "step": 19601 + }, + { + "epoch": 0.68, + "learning_rate": 4.666909451485102e-06, + "loss": 0.6249, + "step": 19602 + }, + { + "epoch": 0.68, + "learning_rate": 4.665988390091835e-06, + "loss": 0.6606, + "step": 19603 + }, + { + "epoch": 0.68, + "learning_rate": 4.665067391940022e-06, + "loss": 0.6468, + "step": 19604 + }, + { + "epoch": 0.68, + "learning_rate": 4.664146457040588e-06, + "loss": 0.6827, + "step": 19605 + }, + { + "epoch": 0.68, + "learning_rate": 4.663225585404445e-06, + "loss": 0.6938, + "step": 19606 + }, + { + "epoch": 0.68, + "learning_rate": 4.662304777042513e-06, + "loss": 0.632, + "step": 19607 + }, + { + "epoch": 0.68, + "learning_rate": 4.661384031965709e-06, + "loss": 0.6447, + "step": 19608 + }, + { + "epoch": 0.68, + "learning_rate": 4.660463350184951e-06, + "loss": 0.6551, + "step": 19609 + }, + { + "epoch": 0.68, + "learning_rate": 4.6595427317111554e-06, + "loss": 0.6312, + "step": 19610 + }, + { + "epoch": 0.68, + "learning_rate": 4.65862217655524e-06, + "loss": 0.6336, + "step": 19611 + }, + { + "epoch": 0.68, + "learning_rate": 4.657701684728112e-06, + "loss": 0.5983, + "step": 19612 + }, + { + "epoch": 0.68, + "learning_rate": 4.656781256240688e-06, + "loss": 0.624, + "step": 19613 + }, + { + "epoch": 0.68, + "learning_rate": 4.655860891103881e-06, + "loss": 0.6128, + "step": 19614 + }, + { + "epoch": 0.68, + "learning_rate": 4.654940589328605e-06, + "loss": 0.595, + "step": 19615 + }, + { + "epoch": 0.68, + "learning_rate": 4.654020350925769e-06, + "loss": 0.6713, + "step": 19616 + }, + { + "epoch": 0.68, + "learning_rate": 4.653100175906288e-06, + "loss": 0.6028, + "step": 19617 + }, + { + "epoch": 0.68, + "learning_rate": 4.652180064281065e-06, + "loss": 0.5821, + "step": 19618 + }, + { + "epoch": 0.68, + "learning_rate": 4.651260016061011e-06, + "loss": 0.6308, + "step": 19619 + }, + { + "epoch": 0.68, + "learning_rate": 4.650340031257037e-06, + "loss": 0.6181, + "step": 19620 + }, + { + "epoch": 0.68, + "learning_rate": 4.649420109880049e-06, + "loss": 0.6051, + "step": 19621 + }, + { + "epoch": 0.68, + "learning_rate": 4.648500251940955e-06, + "loss": 0.5843, + "step": 19622 + }, + { + "epoch": 0.68, + "learning_rate": 4.647580457450662e-06, + "loss": 0.6571, + "step": 19623 + }, + { + "epoch": 0.68, + "learning_rate": 4.6466607264200715e-06, + "loss": 0.5883, + "step": 19624 + }, + { + "epoch": 0.68, + "learning_rate": 4.645741058860089e-06, + "loss": 0.6595, + "step": 19625 + }, + { + "epoch": 0.68, + "learning_rate": 4.644821454781621e-06, + "loss": 0.6247, + "step": 19626 + }, + { + "epoch": 0.68, + "learning_rate": 4.643901914195568e-06, + "loss": 0.68, + "step": 19627 + }, + { + "epoch": 0.68, + "learning_rate": 4.642982437112833e-06, + "loss": 0.6109, + "step": 19628 + }, + { + "epoch": 0.68, + "learning_rate": 4.6420630235443205e-06, + "loss": 0.5708, + "step": 19629 + }, + { + "epoch": 0.68, + "learning_rate": 4.6411436735009275e-06, + "loss": 0.6079, + "step": 19630 + }, + { + "epoch": 0.68, + "learning_rate": 4.640224386993554e-06, + "loss": 0.6485, + "step": 19631 + }, + { + "epoch": 0.68, + "learning_rate": 4.6393051640331e-06, + "loss": 0.6567, + "step": 19632 + }, + { + "epoch": 0.68, + "learning_rate": 4.638386004630465e-06, + "loss": 0.6091, + "step": 19633 + }, + { + "epoch": 0.68, + "learning_rate": 4.6374669087965505e-06, + "loss": 0.6065, + "step": 19634 + }, + { + "epoch": 0.68, + "learning_rate": 4.636547876542246e-06, + "loss": 0.6507, + "step": 19635 + }, + { + "epoch": 0.68, + "learning_rate": 4.63562890787845e-06, + "loss": 0.6314, + "step": 19636 + }, + { + "epoch": 0.68, + "learning_rate": 4.63471000281606e-06, + "loss": 0.6383, + "step": 19637 + }, + { + "epoch": 0.68, + "learning_rate": 4.63379116136597e-06, + "loss": 0.5873, + "step": 19638 + }, + { + "epoch": 0.68, + "learning_rate": 4.632872383539074e-06, + "loss": 0.6142, + "step": 19639 + }, + { + "epoch": 0.68, + "learning_rate": 4.63195366934627e-06, + "loss": 0.6494, + "step": 19640 + }, + { + "epoch": 0.68, + "learning_rate": 4.631035018798441e-06, + "loss": 0.6485, + "step": 19641 + }, + { + "epoch": 0.68, + "learning_rate": 4.630116431906484e-06, + "loss": 0.579, + "step": 19642 + }, + { + "epoch": 0.68, + "learning_rate": 4.629197908681289e-06, + "loss": 0.6378, + "step": 19643 + }, + { + "epoch": 0.68, + "learning_rate": 4.628279449133747e-06, + "loss": 0.6416, + "step": 19644 + }, + { + "epoch": 0.68, + "learning_rate": 4.627361053274748e-06, + "loss": 0.6579, + "step": 19645 + }, + { + "epoch": 0.68, + "learning_rate": 4.626442721115184e-06, + "loss": 0.6522, + "step": 19646 + }, + { + "epoch": 0.68, + "learning_rate": 4.625524452665935e-06, + "loss": 0.6249, + "step": 19647 + }, + { + "epoch": 0.68, + "learning_rate": 4.6246062479378925e-06, + "loss": 0.6403, + "step": 19648 + }, + { + "epoch": 0.68, + "learning_rate": 4.623688106941942e-06, + "loss": 0.6015, + "step": 19649 + }, + { + "epoch": 0.68, + "learning_rate": 4.622770029688971e-06, + "loss": 0.6144, + "step": 19650 + }, + { + "epoch": 0.68, + "learning_rate": 4.621852016189864e-06, + "loss": 0.6497, + "step": 19651 + }, + { + "epoch": 0.68, + "learning_rate": 4.620934066455508e-06, + "loss": 0.6614, + "step": 19652 + }, + { + "epoch": 0.68, + "learning_rate": 4.620016180496779e-06, + "loss": 0.6747, + "step": 19653 + }, + { + "epoch": 0.68, + "learning_rate": 4.619098358324564e-06, + "loss": 0.625, + "step": 19654 + }, + { + "epoch": 0.68, + "learning_rate": 4.6181805999497456e-06, + "loss": 0.6354, + "step": 19655 + }, + { + "epoch": 0.68, + "learning_rate": 4.617262905383203e-06, + "loss": 0.6271, + "step": 19656 + }, + { + "epoch": 0.68, + "learning_rate": 4.616345274635818e-06, + "loss": 0.63, + "step": 19657 + }, + { + "epoch": 0.68, + "learning_rate": 4.615427707718475e-06, + "loss": 0.6315, + "step": 19658 + }, + { + "epoch": 0.68, + "learning_rate": 4.614510204642044e-06, + "loss": 0.6602, + "step": 19659 + }, + { + "epoch": 0.68, + "learning_rate": 4.613592765417407e-06, + "loss": 0.6869, + "step": 19660 + }, + { + "epoch": 0.68, + "learning_rate": 4.6126753900554415e-06, + "loss": 0.6451, + "step": 19661 + }, + { + "epoch": 0.68, + "learning_rate": 4.611758078567024e-06, + "loss": 0.6753, + "step": 19662 + }, + { + "epoch": 0.68, + "learning_rate": 4.610840830963032e-06, + "loss": 0.5915, + "step": 19663 + }, + { + "epoch": 0.68, + "learning_rate": 4.609923647254341e-06, + "loss": 0.7493, + "step": 19664 + }, + { + "epoch": 0.68, + "learning_rate": 4.60900652745182e-06, + "loss": 0.6328, + "step": 19665 + }, + { + "epoch": 0.68, + "learning_rate": 4.608089471566348e-06, + "loss": 0.6417, + "step": 19666 + }, + { + "epoch": 0.68, + "learning_rate": 4.607172479608794e-06, + "loss": 0.6189, + "step": 19667 + }, + { + "epoch": 0.68, + "learning_rate": 4.606255551590034e-06, + "loss": 0.5844, + "step": 19668 + }, + { + "epoch": 0.68, + "learning_rate": 4.605338687520937e-06, + "loss": 0.6639, + "step": 19669 + }, + { + "epoch": 0.68, + "learning_rate": 4.604421887412378e-06, + "loss": 0.5901, + "step": 19670 + }, + { + "epoch": 0.68, + "learning_rate": 4.6035051512752194e-06, + "loss": 0.6642, + "step": 19671 + }, + { + "epoch": 0.68, + "learning_rate": 4.602588479120334e-06, + "loss": 0.6055, + "step": 19672 + }, + { + "epoch": 0.68, + "learning_rate": 4.601671870958588e-06, + "loss": 0.602, + "step": 19673 + }, + { + "epoch": 0.68, + "learning_rate": 4.600755326800853e-06, + "loss": 0.6557, + "step": 19674 + }, + { + "epoch": 0.68, + "learning_rate": 4.599838846657994e-06, + "loss": 0.5882, + "step": 19675 + }, + { + "epoch": 0.68, + "learning_rate": 4.598922430540878e-06, + "loss": 0.6271, + "step": 19676 + }, + { + "epoch": 0.68, + "learning_rate": 4.598006078460368e-06, + "loss": 0.5891, + "step": 19677 + }, + { + "epoch": 0.68, + "learning_rate": 4.597089790427327e-06, + "loss": 0.5751, + "step": 19678 + }, + { + "epoch": 0.68, + "learning_rate": 4.596173566452623e-06, + "loss": 0.6386, + "step": 19679 + }, + { + "epoch": 0.68, + "learning_rate": 4.595257406547117e-06, + "loss": 0.6244, + "step": 19680 + }, + { + "epoch": 0.68, + "learning_rate": 4.594341310721671e-06, + "loss": 0.6189, + "step": 19681 + }, + { + "epoch": 0.68, + "learning_rate": 4.59342527898715e-06, + "loss": 0.6293, + "step": 19682 + }, + { + "epoch": 0.68, + "learning_rate": 4.59250931135441e-06, + "loss": 0.6317, + "step": 19683 + }, + { + "epoch": 0.68, + "learning_rate": 4.59159340783431e-06, + "loss": 0.6311, + "step": 19684 + }, + { + "epoch": 0.68, + "learning_rate": 4.590677568437714e-06, + "loss": 0.6653, + "step": 19685 + }, + { + "epoch": 0.68, + "learning_rate": 4.5897617931754776e-06, + "loss": 0.6377, + "step": 19686 + }, + { + "epoch": 0.68, + "learning_rate": 4.588846082058459e-06, + "loss": 0.5736, + "step": 19687 + }, + { + "epoch": 0.68, + "learning_rate": 4.58793043509752e-06, + "loss": 0.5991, + "step": 19688 + }, + { + "epoch": 0.68, + "learning_rate": 4.587014852303507e-06, + "loss": 0.6633, + "step": 19689 + }, + { + "epoch": 0.68, + "learning_rate": 4.586099333687281e-06, + "loss": 0.6367, + "step": 19690 + }, + { + "epoch": 0.68, + "learning_rate": 4.585183879259695e-06, + "loss": 0.6185, + "step": 19691 + }, + { + "epoch": 0.68, + "learning_rate": 4.584268489031604e-06, + "loss": 0.6469, + "step": 19692 + }, + { + "epoch": 0.68, + "learning_rate": 4.583353163013866e-06, + "loss": 0.6061, + "step": 19693 + }, + { + "epoch": 0.68, + "learning_rate": 4.582437901217324e-06, + "loss": 0.6695, + "step": 19694 + }, + { + "epoch": 0.68, + "learning_rate": 4.581522703652833e-06, + "loss": 0.589, + "step": 19695 + }, + { + "epoch": 0.68, + "learning_rate": 4.580607570331246e-06, + "loss": 0.6327, + "step": 19696 + }, + { + "epoch": 0.68, + "learning_rate": 4.579692501263412e-06, + "loss": 0.6323, + "step": 19697 + }, + { + "epoch": 0.68, + "learning_rate": 4.578777496460179e-06, + "loss": 0.5684, + "step": 19698 + }, + { + "epoch": 0.68, + "learning_rate": 4.577862555932401e-06, + "loss": 0.648, + "step": 19699 + }, + { + "epoch": 0.68, + "learning_rate": 4.576947679690917e-06, + "loss": 0.6761, + "step": 19700 + }, + { + "epoch": 0.68, + "learning_rate": 4.576032867746579e-06, + "loss": 0.5994, + "step": 19701 + }, + { + "epoch": 0.68, + "learning_rate": 4.575118120110234e-06, + "loss": 0.5972, + "step": 19702 + }, + { + "epoch": 0.68, + "learning_rate": 4.574203436792725e-06, + "loss": 0.607, + "step": 19703 + }, + { + "epoch": 0.68, + "learning_rate": 4.573288817804898e-06, + "loss": 0.614, + "step": 19704 + }, + { + "epoch": 0.68, + "learning_rate": 4.5723742631576e-06, + "loss": 0.652, + "step": 19705 + }, + { + "epoch": 0.68, + "learning_rate": 4.571459772861668e-06, + "loss": 0.6275, + "step": 19706 + }, + { + "epoch": 0.68, + "learning_rate": 4.570545346927947e-06, + "loss": 0.6117, + "step": 19707 + }, + { + "epoch": 0.68, + "learning_rate": 4.569630985367281e-06, + "loss": 0.6497, + "step": 19708 + }, + { + "epoch": 0.68, + "learning_rate": 4.5687166881905066e-06, + "loss": 0.6438, + "step": 19709 + }, + { + "epoch": 0.68, + "learning_rate": 4.567802455408468e-06, + "loss": 0.6383, + "step": 19710 + }, + { + "epoch": 0.68, + "learning_rate": 4.566888287032007e-06, + "loss": 0.5872, + "step": 19711 + }, + { + "epoch": 0.68, + "learning_rate": 4.565974183071953e-06, + "loss": 0.6382, + "step": 19712 + }, + { + "epoch": 0.68, + "learning_rate": 4.5650601435391505e-06, + "loss": 0.5928, + "step": 19713 + }, + { + "epoch": 0.68, + "learning_rate": 4.564146168444435e-06, + "loss": 0.6543, + "step": 19714 + }, + { + "epoch": 0.68, + "learning_rate": 4.563232257798643e-06, + "loss": 0.597, + "step": 19715 + }, + { + "epoch": 0.68, + "learning_rate": 4.562318411612609e-06, + "loss": 0.7204, + "step": 19716 + }, + { + "epoch": 0.68, + "learning_rate": 4.5614046298971746e-06, + "loss": 0.6557, + "step": 19717 + }, + { + "epoch": 0.68, + "learning_rate": 4.560490912663164e-06, + "loss": 0.5873, + "step": 19718 + }, + { + "epoch": 0.68, + "learning_rate": 4.559577259921414e-06, + "loss": 0.5665, + "step": 19719 + }, + { + "epoch": 0.68, + "learning_rate": 4.558663671682757e-06, + "loss": 0.5563, + "step": 19720 + }, + { + "epoch": 0.68, + "learning_rate": 4.557750147958027e-06, + "loss": 0.6688, + "step": 19721 + }, + { + "epoch": 0.68, + "learning_rate": 4.556836688758053e-06, + "loss": 0.6681, + "step": 19722 + }, + { + "epoch": 0.68, + "learning_rate": 4.555923294093669e-06, + "loss": 0.6284, + "step": 19723 + }, + { + "epoch": 0.68, + "learning_rate": 4.555009963975698e-06, + "loss": 0.5921, + "step": 19724 + }, + { + "epoch": 0.68, + "learning_rate": 4.5540966984149714e-06, + "loss": 0.6278, + "step": 19725 + }, + { + "epoch": 0.68, + "learning_rate": 4.5531834974223175e-06, + "loss": 0.6641, + "step": 19726 + }, + { + "epoch": 0.68, + "learning_rate": 4.552270361008564e-06, + "loss": 0.612, + "step": 19727 + }, + { + "epoch": 0.68, + "learning_rate": 4.551357289184537e-06, + "loss": 0.598, + "step": 19728 + }, + { + "epoch": 0.68, + "learning_rate": 4.550444281961065e-06, + "loss": 0.6506, + "step": 19729 + }, + { + "epoch": 0.68, + "learning_rate": 4.549531339348966e-06, + "loss": 0.6365, + "step": 19730 + }, + { + "epoch": 0.68, + "learning_rate": 4.548618461359068e-06, + "loss": 0.6369, + "step": 19731 + }, + { + "epoch": 0.68, + "learning_rate": 4.5477056480021945e-06, + "loss": 0.6181, + "step": 19732 + }, + { + "epoch": 0.68, + "learning_rate": 4.546792899289168e-06, + "loss": 0.6388, + "step": 19733 + }, + { + "epoch": 0.68, + "learning_rate": 4.545880215230809e-06, + "loss": 0.6362, + "step": 19734 + }, + { + "epoch": 0.68, + "learning_rate": 4.544967595837943e-06, + "loss": 0.6313, + "step": 19735 + }, + { + "epoch": 0.68, + "learning_rate": 4.544055041121385e-06, + "loss": 0.6584, + "step": 19736 + }, + { + "epoch": 0.68, + "learning_rate": 4.543142551091954e-06, + "loss": 0.6009, + "step": 19737 + }, + { + "epoch": 0.68, + "learning_rate": 4.542230125760473e-06, + "loss": 0.6242, + "step": 19738 + }, + { + "epoch": 0.68, + "learning_rate": 4.541317765137756e-06, + "loss": 0.6317, + "step": 19739 + }, + { + "epoch": 0.68, + "learning_rate": 4.540405469234623e-06, + "loss": 0.6022, + "step": 19740 + }, + { + "epoch": 0.68, + "learning_rate": 4.539493238061894e-06, + "loss": 0.5851, + "step": 19741 + }, + { + "epoch": 0.68, + "learning_rate": 4.538581071630377e-06, + "loss": 0.6848, + "step": 19742 + }, + { + "epoch": 0.68, + "learning_rate": 4.5376689699508895e-06, + "loss": 0.6151, + "step": 19743 + }, + { + "epoch": 0.68, + "learning_rate": 4.536756933034245e-06, + "loss": 0.6021, + "step": 19744 + }, + { + "epoch": 0.68, + "learning_rate": 4.535844960891259e-06, + "loss": 0.6208, + "step": 19745 + }, + { + "epoch": 0.68, + "learning_rate": 4.534933053532743e-06, + "loss": 0.6892, + "step": 19746 + }, + { + "epoch": 0.68, + "learning_rate": 4.534021210969514e-06, + "loss": 0.6347, + "step": 19747 + }, + { + "epoch": 0.68, + "learning_rate": 4.533109433212373e-06, + "loss": 0.6274, + "step": 19748 + }, + { + "epoch": 0.68, + "learning_rate": 4.532197720272135e-06, + "loss": 0.6221, + "step": 19749 + }, + { + "epoch": 0.68, + "learning_rate": 4.531286072159611e-06, + "loss": 0.6422, + "step": 19750 + }, + { + "epoch": 0.68, + "learning_rate": 4.530374488885607e-06, + "loss": 0.5949, + "step": 19751 + }, + { + "epoch": 0.68, + "learning_rate": 4.529462970460934e-06, + "loss": 0.6406, + "step": 19752 + }, + { + "epoch": 0.68, + "learning_rate": 4.5285515168964014e-06, + "loss": 0.6548, + "step": 19753 + }, + { + "epoch": 0.68, + "learning_rate": 4.527640128202808e-06, + "loss": 0.6333, + "step": 19754 + }, + { + "epoch": 0.68, + "learning_rate": 4.526728804390966e-06, + "loss": 0.6162, + "step": 19755 + }, + { + "epoch": 0.68, + "learning_rate": 4.525817545471672e-06, + "loss": 0.6548, + "step": 19756 + }, + { + "epoch": 0.68, + "learning_rate": 4.524906351455739e-06, + "loss": 0.633, + "step": 19757 + }, + { + "epoch": 0.68, + "learning_rate": 4.523995222353971e-06, + "loss": 0.6046, + "step": 19758 + }, + { + "epoch": 0.68, + "learning_rate": 4.523084158177163e-06, + "loss": 0.6116, + "step": 19759 + }, + { + "epoch": 0.68, + "learning_rate": 4.52217315893612e-06, + "loss": 0.631, + "step": 19760 + }, + { + "epoch": 0.68, + "learning_rate": 4.521262224641648e-06, + "loss": 0.6338, + "step": 19761 + }, + { + "epoch": 0.68, + "learning_rate": 4.520351355304536e-06, + "loss": 0.6688, + "step": 19762 + }, + { + "epoch": 0.68, + "learning_rate": 4.519440550935595e-06, + "loss": 0.7049, + "step": 19763 + }, + { + "epoch": 0.68, + "learning_rate": 4.518529811545621e-06, + "loss": 0.6203, + "step": 19764 + }, + { + "epoch": 0.68, + "learning_rate": 4.517619137145407e-06, + "loss": 0.6233, + "step": 19765 + }, + { + "epoch": 0.68, + "learning_rate": 4.516708527745754e-06, + "loss": 0.6138, + "step": 19766 + }, + { + "epoch": 0.68, + "learning_rate": 4.515797983357461e-06, + "loss": 0.6054, + "step": 19767 + }, + { + "epoch": 0.68, + "learning_rate": 4.514887503991313e-06, + "loss": 0.6319, + "step": 19768 + }, + { + "epoch": 0.68, + "learning_rate": 4.5139770896581155e-06, + "loss": 0.6627, + "step": 19769 + }, + { + "epoch": 0.68, + "learning_rate": 4.513066740368664e-06, + "loss": 0.5835, + "step": 19770 + }, + { + "epoch": 0.69, + "learning_rate": 4.512156456133744e-06, + "loss": 0.6091, + "step": 19771 + }, + { + "epoch": 0.69, + "learning_rate": 4.511246236964151e-06, + "loss": 0.6335, + "step": 19772 + }, + { + "epoch": 0.69, + "learning_rate": 4.51033608287068e-06, + "loss": 0.6108, + "step": 19773 + }, + { + "epoch": 0.69, + "learning_rate": 4.509425993864113e-06, + "loss": 0.6085, + "step": 19774 + }, + { + "epoch": 0.69, + "learning_rate": 4.50851596995525e-06, + "loss": 0.617, + "step": 19775 + }, + { + "epoch": 0.69, + "learning_rate": 4.507606011154879e-06, + "loss": 0.5889, + "step": 19776 + }, + { + "epoch": 0.69, + "learning_rate": 4.506696117473784e-06, + "loss": 0.6321, + "step": 19777 + }, + { + "epoch": 0.69, + "learning_rate": 4.505786288922756e-06, + "loss": 0.5589, + "step": 19778 + }, + { + "epoch": 0.69, + "learning_rate": 4.5048765255125855e-06, + "loss": 0.5887, + "step": 19779 + }, + { + "epoch": 0.69, + "learning_rate": 4.503966827254047e-06, + "loss": 0.6026, + "step": 19780 + }, + { + "epoch": 0.69, + "learning_rate": 4.503057194157939e-06, + "loss": 0.636, + "step": 19781 + }, + { + "epoch": 0.69, + "learning_rate": 4.502147626235045e-06, + "loss": 0.6644, + "step": 19782 + }, + { + "epoch": 0.69, + "learning_rate": 4.5012381234961425e-06, + "loss": 0.5988, + "step": 19783 + }, + { + "epoch": 0.69, + "learning_rate": 4.5003286859520164e-06, + "loss": 0.6393, + "step": 19784 + }, + { + "epoch": 0.69, + "learning_rate": 4.499419313613456e-06, + "loss": 0.6784, + "step": 19785 + }, + { + "epoch": 0.69, + "learning_rate": 4.4985100064912294e-06, + "loss": 0.6303, + "step": 19786 + }, + { + "epoch": 0.69, + "learning_rate": 4.4976007645961305e-06, + "loss": 0.6567, + "step": 19787 + }, + { + "epoch": 0.69, + "learning_rate": 4.496691587938938e-06, + "loss": 0.609, + "step": 19788 + }, + { + "epoch": 0.69, + "learning_rate": 4.495782476530426e-06, + "loss": 0.6013, + "step": 19789 + }, + { + "epoch": 0.69, + "learning_rate": 4.494873430381376e-06, + "loss": 0.6579, + "step": 19790 + }, + { + "epoch": 0.69, + "learning_rate": 4.493964449502568e-06, + "loss": 0.6451, + "step": 19791 + }, + { + "epoch": 0.69, + "learning_rate": 4.493055533904769e-06, + "loss": 0.627, + "step": 19792 + }, + { + "epoch": 0.69, + "learning_rate": 4.492146683598767e-06, + "loss": 0.6733, + "step": 19793 + }, + { + "epoch": 0.69, + "learning_rate": 4.4912378985953375e-06, + "loss": 0.6866, + "step": 19794 + }, + { + "epoch": 0.69, + "learning_rate": 4.490329178905248e-06, + "loss": 0.5703, + "step": 19795 + }, + { + "epoch": 0.69, + "learning_rate": 4.4894205245392755e-06, + "loss": 0.6543, + "step": 19796 + }, + { + "epoch": 0.69, + "learning_rate": 4.488511935508196e-06, + "loss": 0.6767, + "step": 19797 + }, + { + "epoch": 0.69, + "learning_rate": 4.487603411822777e-06, + "loss": 0.5935, + "step": 19798 + }, + { + "epoch": 0.69, + "learning_rate": 4.48669495349379e-06, + "loss": 0.6695, + "step": 19799 + }, + { + "epoch": 0.69, + "learning_rate": 4.485786560532015e-06, + "loss": 0.6105, + "step": 19800 + }, + { + "epoch": 0.69, + "learning_rate": 4.484878232948212e-06, + "loss": 0.6009, + "step": 19801 + }, + { + "epoch": 0.69, + "learning_rate": 4.4839699707531545e-06, + "loss": 0.6591, + "step": 19802 + }, + { + "epoch": 0.69, + "learning_rate": 4.483061773957615e-06, + "loss": 0.6472, + "step": 19803 + }, + { + "epoch": 0.69, + "learning_rate": 4.482153642572353e-06, + "loss": 0.6642, + "step": 19804 + }, + { + "epoch": 0.69, + "learning_rate": 4.481245576608136e-06, + "loss": 0.5677, + "step": 19805 + }, + { + "epoch": 0.69, + "learning_rate": 4.480337576075742e-06, + "loss": 0.6012, + "step": 19806 + }, + { + "epoch": 0.69, + "learning_rate": 4.479429640985924e-06, + "loss": 0.6323, + "step": 19807 + }, + { + "epoch": 0.69, + "learning_rate": 4.478521771349451e-06, + "loss": 0.6316, + "step": 19808 + }, + { + "epoch": 0.69, + "learning_rate": 4.477613967177091e-06, + "loss": 0.6226, + "step": 19809 + }, + { + "epoch": 0.69, + "learning_rate": 4.476706228479599e-06, + "loss": 0.5952, + "step": 19810 + }, + { + "epoch": 0.69, + "learning_rate": 4.47579855526774e-06, + "loss": 0.6228, + "step": 19811 + }, + { + "epoch": 0.69, + "learning_rate": 4.474890947552283e-06, + "loss": 0.5687, + "step": 19812 + }, + { + "epoch": 0.69, + "learning_rate": 4.473983405343979e-06, + "loss": 0.6593, + "step": 19813 + }, + { + "epoch": 0.69, + "learning_rate": 4.473075928653593e-06, + "loss": 0.6253, + "step": 19814 + }, + { + "epoch": 0.69, + "learning_rate": 4.4721685174918875e-06, + "loss": 0.6578, + "step": 19815 + }, + { + "epoch": 0.69, + "learning_rate": 4.471261171869612e-06, + "loss": 0.7089, + "step": 19816 + }, + { + "epoch": 0.69, + "learning_rate": 4.47035389179753e-06, + "loss": 0.6711, + "step": 19817 + }, + { + "epoch": 0.69, + "learning_rate": 4.469446677286398e-06, + "loss": 0.6306, + "step": 19818 + }, + { + "epoch": 0.69, + "learning_rate": 4.468539528346971e-06, + "loss": 0.6534, + "step": 19819 + }, + { + "epoch": 0.69, + "learning_rate": 4.46763244499001e-06, + "loss": 0.6499, + "step": 19820 + }, + { + "epoch": 0.69, + "learning_rate": 4.46672542722626e-06, + "loss": 0.6455, + "step": 19821 + }, + { + "epoch": 0.69, + "learning_rate": 4.46581847506648e-06, + "loss": 0.6298, + "step": 19822 + }, + { + "epoch": 0.69, + "learning_rate": 4.464911588521424e-06, + "loss": 0.6588, + "step": 19823 + }, + { + "epoch": 0.69, + "learning_rate": 4.4640047676018415e-06, + "loss": 0.5348, + "step": 19824 + }, + { + "epoch": 0.69, + "learning_rate": 4.463098012318487e-06, + "loss": 0.6073, + "step": 19825 + }, + { + "epoch": 0.69, + "learning_rate": 4.462191322682112e-06, + "loss": 0.606, + "step": 19826 + }, + { + "epoch": 0.69, + "learning_rate": 4.461284698703461e-06, + "loss": 0.6137, + "step": 19827 + }, + { + "epoch": 0.69, + "learning_rate": 4.460378140393286e-06, + "loss": 0.6496, + "step": 19828 + }, + { + "epoch": 0.69, + "learning_rate": 4.459471647762337e-06, + "loss": 0.6328, + "step": 19829 + }, + { + "epoch": 0.69, + "learning_rate": 4.458565220821359e-06, + "loss": 0.5947, + "step": 19830 + }, + { + "epoch": 0.69, + "learning_rate": 4.457658859581101e-06, + "loss": 0.6675, + "step": 19831 + }, + { + "epoch": 0.69, + "learning_rate": 4.4567525640523125e-06, + "loss": 0.6631, + "step": 19832 + }, + { + "epoch": 0.69, + "learning_rate": 4.4558463342457305e-06, + "loss": 0.5976, + "step": 19833 + }, + { + "epoch": 0.69, + "learning_rate": 4.454940170172103e-06, + "loss": 0.5639, + "step": 19834 + }, + { + "epoch": 0.69, + "learning_rate": 4.454034071842175e-06, + "loss": 0.6598, + "step": 19835 + }, + { + "epoch": 0.69, + "learning_rate": 4.453128039266689e-06, + "loss": 0.6205, + "step": 19836 + }, + { + "epoch": 0.69, + "learning_rate": 4.4522220724563855e-06, + "loss": 0.6143, + "step": 19837 + }, + { + "epoch": 0.69, + "learning_rate": 4.451316171422013e-06, + "loss": 0.612, + "step": 19838 + }, + { + "epoch": 0.69, + "learning_rate": 4.450410336174302e-06, + "loss": 0.6068, + "step": 19839 + }, + { + "epoch": 0.69, + "learning_rate": 4.449504566723996e-06, + "loss": 0.6202, + "step": 19840 + }, + { + "epoch": 0.69, + "learning_rate": 4.448598863081836e-06, + "loss": 0.6061, + "step": 19841 + }, + { + "epoch": 0.69, + "learning_rate": 4.447693225258557e-06, + "loss": 0.6512, + "step": 19842 + }, + { + "epoch": 0.69, + "learning_rate": 4.4467876532649e-06, + "loss": 0.5988, + "step": 19843 + }, + { + "epoch": 0.69, + "learning_rate": 4.445882147111604e-06, + "loss": 0.6862, + "step": 19844 + }, + { + "epoch": 0.69, + "learning_rate": 4.444976706809397e-06, + "loss": 0.6448, + "step": 19845 + }, + { + "epoch": 0.69, + "learning_rate": 4.4440713323690185e-06, + "loss": 0.6874, + "step": 19846 + }, + { + "epoch": 0.69, + "learning_rate": 4.443166023801203e-06, + "loss": 0.6736, + "step": 19847 + }, + { + "epoch": 0.69, + "learning_rate": 4.442260781116683e-06, + "loss": 0.5913, + "step": 19848 + }, + { + "epoch": 0.69, + "learning_rate": 4.441355604326192e-06, + "loss": 0.628, + "step": 19849 + }, + { + "epoch": 0.69, + "learning_rate": 4.4404504934404656e-06, + "loss": 0.609, + "step": 19850 + }, + { + "epoch": 0.69, + "learning_rate": 4.43954544847023e-06, + "loss": 0.6507, + "step": 19851 + }, + { + "epoch": 0.69, + "learning_rate": 4.438640469426215e-06, + "loss": 0.6445, + "step": 19852 + }, + { + "epoch": 0.69, + "learning_rate": 4.4377355563191515e-06, + "loss": 0.6468, + "step": 19853 + }, + { + "epoch": 0.69, + "learning_rate": 4.436830709159771e-06, + "loss": 0.5951, + "step": 19854 + }, + { + "epoch": 0.69, + "learning_rate": 4.4359259279588e-06, + "loss": 0.6363, + "step": 19855 + }, + { + "epoch": 0.69, + "learning_rate": 4.435021212726968e-06, + "loss": 0.5999, + "step": 19856 + }, + { + "epoch": 0.69, + "learning_rate": 4.434116563474996e-06, + "loss": 0.6603, + "step": 19857 + }, + { + "epoch": 0.69, + "learning_rate": 4.433211980213614e-06, + "loss": 0.6142, + "step": 19858 + }, + { + "epoch": 0.69, + "learning_rate": 4.432307462953546e-06, + "loss": 0.6086, + "step": 19859 + }, + { + "epoch": 0.69, + "learning_rate": 4.431403011705515e-06, + "loss": 0.5975, + "step": 19860 + }, + { + "epoch": 0.69, + "learning_rate": 4.430498626480247e-06, + "loss": 0.5835, + "step": 19861 + }, + { + "epoch": 0.69, + "learning_rate": 4.429594307288465e-06, + "loss": 0.6366, + "step": 19862 + }, + { + "epoch": 0.69, + "learning_rate": 4.428690054140886e-06, + "loss": 0.6305, + "step": 19863 + }, + { + "epoch": 0.69, + "learning_rate": 4.427785867048236e-06, + "loss": 0.6396, + "step": 19864 + }, + { + "epoch": 0.69, + "learning_rate": 4.426881746021231e-06, + "loss": 0.722, + "step": 19865 + }, + { + "epoch": 0.69, + "learning_rate": 4.425977691070594e-06, + "loss": 0.6404, + "step": 19866 + }, + { + "epoch": 0.69, + "learning_rate": 4.4250737022070435e-06, + "loss": 0.6514, + "step": 19867 + }, + { + "epoch": 0.69, + "learning_rate": 4.424169779441299e-06, + "loss": 0.6119, + "step": 19868 + }, + { + "epoch": 0.69, + "learning_rate": 4.4232659227840725e-06, + "loss": 0.615, + "step": 19869 + }, + { + "epoch": 0.69, + "learning_rate": 4.422362132246082e-06, + "loss": 0.657, + "step": 19870 + }, + { + "epoch": 0.69, + "learning_rate": 4.4214584078380454e-06, + "loss": 0.6002, + "step": 19871 + }, + { + "epoch": 0.69, + "learning_rate": 4.420554749570675e-06, + "loss": 0.5999, + "step": 19872 + }, + { + "epoch": 0.69, + "learning_rate": 4.419651157454686e-06, + "loss": 0.602, + "step": 19873 + }, + { + "epoch": 0.69, + "learning_rate": 4.4187476315007975e-06, + "loss": 0.6553, + "step": 19874 + }, + { + "epoch": 0.69, + "learning_rate": 4.417844171719711e-06, + "loss": 0.6359, + "step": 19875 + }, + { + "epoch": 0.69, + "learning_rate": 4.416940778122143e-06, + "loss": 0.6143, + "step": 19876 + }, + { + "epoch": 0.69, + "learning_rate": 4.416037450718804e-06, + "loss": 0.5992, + "step": 19877 + }, + { + "epoch": 0.69, + "learning_rate": 4.415134189520407e-06, + "loss": 0.5569, + "step": 19878 + }, + { + "epoch": 0.69, + "learning_rate": 4.414230994537661e-06, + "loss": 0.6477, + "step": 19879 + }, + { + "epoch": 0.69, + "learning_rate": 4.41332786578127e-06, + "loss": 0.6825, + "step": 19880 + }, + { + "epoch": 0.69, + "learning_rate": 4.412424803261943e-06, + "loss": 0.6733, + "step": 19881 + }, + { + "epoch": 0.69, + "learning_rate": 4.41152180699039e-06, + "loss": 0.6342, + "step": 19882 + }, + { + "epoch": 0.69, + "learning_rate": 4.410618876977314e-06, + "loss": 0.6148, + "step": 19883 + }, + { + "epoch": 0.69, + "learning_rate": 4.409716013233423e-06, + "loss": 0.581, + "step": 19884 + }, + { + "epoch": 0.69, + "learning_rate": 4.408813215769423e-06, + "loss": 0.5995, + "step": 19885 + }, + { + "epoch": 0.69, + "learning_rate": 4.407910484596012e-06, + "loss": 0.5907, + "step": 19886 + }, + { + "epoch": 0.69, + "learning_rate": 4.407007819723896e-06, + "loss": 0.6696, + "step": 19887 + }, + { + "epoch": 0.69, + "learning_rate": 4.4061052211637775e-06, + "loss": 0.5544, + "step": 19888 + }, + { + "epoch": 0.69, + "learning_rate": 4.405202688926358e-06, + "loss": 0.6297, + "step": 19889 + }, + { + "epoch": 0.69, + "learning_rate": 4.404300223022339e-06, + "loss": 0.6429, + "step": 19890 + }, + { + "epoch": 0.69, + "learning_rate": 4.403397823462422e-06, + "loss": 0.6542, + "step": 19891 + }, + { + "epoch": 0.69, + "learning_rate": 4.402495490257299e-06, + "loss": 0.6116, + "step": 19892 + }, + { + "epoch": 0.69, + "learning_rate": 4.401593223417675e-06, + "loss": 0.6255, + "step": 19893 + }, + { + "epoch": 0.69, + "learning_rate": 4.400691022954244e-06, + "loss": 0.6161, + "step": 19894 + }, + { + "epoch": 0.69, + "learning_rate": 4.399788888877704e-06, + "loss": 0.6597, + "step": 19895 + }, + { + "epoch": 0.69, + "learning_rate": 4.398886821198752e-06, + "loss": 0.6322, + "step": 19896 + }, + { + "epoch": 0.69, + "learning_rate": 4.397984819928085e-06, + "loss": 0.5931, + "step": 19897 + }, + { + "epoch": 0.69, + "learning_rate": 4.397082885076392e-06, + "loss": 0.6107, + "step": 19898 + }, + { + "epoch": 0.69, + "learning_rate": 4.396181016654367e-06, + "loss": 0.6443, + "step": 19899 + }, + { + "epoch": 0.69, + "learning_rate": 4.395279214672707e-06, + "loss": 0.6288, + "step": 19900 + }, + { + "epoch": 0.69, + "learning_rate": 4.394377479142102e-06, + "loss": 0.6382, + "step": 19901 + }, + { + "epoch": 0.69, + "learning_rate": 4.393475810073241e-06, + "loss": 0.6256, + "step": 19902 + }, + { + "epoch": 0.69, + "learning_rate": 4.392574207476822e-06, + "loss": 0.653, + "step": 19903 + }, + { + "epoch": 0.69, + "learning_rate": 4.391672671363525e-06, + "loss": 0.6464, + "step": 19904 + }, + { + "epoch": 0.69, + "learning_rate": 4.390771201744043e-06, + "loss": 0.6191, + "step": 19905 + }, + { + "epoch": 0.69, + "learning_rate": 4.389869798629064e-06, + "loss": 0.6545, + "step": 19906 + }, + { + "epoch": 0.69, + "learning_rate": 4.388968462029276e-06, + "loss": 0.6186, + "step": 19907 + }, + { + "epoch": 0.69, + "learning_rate": 4.388067191955364e-06, + "loss": 0.6437, + "step": 19908 + }, + { + "epoch": 0.69, + "learning_rate": 4.387165988418019e-06, + "loss": 0.6139, + "step": 19909 + }, + { + "epoch": 0.69, + "learning_rate": 4.386264851427917e-06, + "loss": 0.6315, + "step": 19910 + }, + { + "epoch": 0.69, + "learning_rate": 4.385363780995747e-06, + "loss": 0.6331, + "step": 19911 + }, + { + "epoch": 0.69, + "learning_rate": 4.384462777132192e-06, + "loss": 0.613, + "step": 19912 + }, + { + "epoch": 0.69, + "learning_rate": 4.383561839847935e-06, + "loss": 0.6535, + "step": 19913 + }, + { + "epoch": 0.69, + "learning_rate": 4.382660969153657e-06, + "loss": 0.6393, + "step": 19914 + }, + { + "epoch": 0.69, + "learning_rate": 4.381760165060043e-06, + "loss": 0.6598, + "step": 19915 + }, + { + "epoch": 0.69, + "learning_rate": 4.380859427577765e-06, + "loss": 0.6142, + "step": 19916 + }, + { + "epoch": 0.69, + "learning_rate": 4.3799587567175075e-06, + "loss": 0.6148, + "step": 19917 + }, + { + "epoch": 0.69, + "learning_rate": 4.379058152489947e-06, + "loss": 0.6654, + "step": 19918 + }, + { + "epoch": 0.69, + "learning_rate": 4.378157614905763e-06, + "loss": 0.6433, + "step": 19919 + }, + { + "epoch": 0.69, + "learning_rate": 4.3772571439756325e-06, + "loss": 0.6417, + "step": 19920 + }, + { + "epoch": 0.69, + "learning_rate": 4.3763567397102355e-06, + "loss": 0.6371, + "step": 19921 + }, + { + "epoch": 0.69, + "learning_rate": 4.37545640212024e-06, + "loss": 0.6661, + "step": 19922 + }, + { + "epoch": 0.69, + "learning_rate": 4.3745561312163235e-06, + "loss": 0.6725, + "step": 19923 + }, + { + "epoch": 0.69, + "learning_rate": 4.373655927009159e-06, + "loss": 0.566, + "step": 19924 + }, + { + "epoch": 0.69, + "learning_rate": 4.372755789509422e-06, + "loss": 0.5838, + "step": 19925 + }, + { + "epoch": 0.69, + "learning_rate": 4.3718557187277835e-06, + "loss": 0.6388, + "step": 19926 + }, + { + "epoch": 0.69, + "learning_rate": 4.3709557146749195e-06, + "loss": 0.6527, + "step": 19927 + }, + { + "epoch": 0.69, + "learning_rate": 4.3700557773614915e-06, + "loss": 0.6128, + "step": 19928 + }, + { + "epoch": 0.69, + "learning_rate": 4.369155906798175e-06, + "loss": 0.6458, + "step": 19929 + }, + { + "epoch": 0.69, + "learning_rate": 4.368256102995637e-06, + "loss": 0.6256, + "step": 19930 + }, + { + "epoch": 0.69, + "learning_rate": 4.367356365964548e-06, + "loss": 0.5933, + "step": 19931 + }, + { + "epoch": 0.69, + "learning_rate": 4.366456695715574e-06, + "loss": 0.7225, + "step": 19932 + }, + { + "epoch": 0.69, + "learning_rate": 4.365557092259387e-06, + "loss": 0.6562, + "step": 19933 + }, + { + "epoch": 0.69, + "learning_rate": 4.364657555606644e-06, + "loss": 0.5998, + "step": 19934 + }, + { + "epoch": 0.69, + "learning_rate": 4.363758085768015e-06, + "loss": 0.5975, + "step": 19935 + }, + { + "epoch": 0.69, + "learning_rate": 4.3628586827541634e-06, + "loss": 0.644, + "step": 19936 + }, + { + "epoch": 0.69, + "learning_rate": 4.3619593465757525e-06, + "loss": 0.6381, + "step": 19937 + }, + { + "epoch": 0.69, + "learning_rate": 4.361060077243446e-06, + "loss": 0.6314, + "step": 19938 + }, + { + "epoch": 0.69, + "learning_rate": 4.36016087476791e-06, + "loss": 0.6804, + "step": 19939 + }, + { + "epoch": 0.69, + "learning_rate": 4.359261739159797e-06, + "loss": 0.6315, + "step": 19940 + }, + { + "epoch": 0.69, + "learning_rate": 4.358362670429772e-06, + "loss": 0.6614, + "step": 19941 + }, + { + "epoch": 0.69, + "learning_rate": 4.357463668588494e-06, + "loss": 0.6031, + "step": 19942 + }, + { + "epoch": 0.69, + "learning_rate": 4.356564733646622e-06, + "loss": 0.6581, + "step": 19943 + }, + { + "epoch": 0.69, + "learning_rate": 4.355665865614818e-06, + "loss": 0.6784, + "step": 19944 + }, + { + "epoch": 0.69, + "learning_rate": 4.354767064503731e-06, + "loss": 0.6254, + "step": 19945 + }, + { + "epoch": 0.69, + "learning_rate": 4.353868330324022e-06, + "loss": 0.6424, + "step": 19946 + }, + { + "epoch": 0.69, + "learning_rate": 4.352969663086347e-06, + "loss": 0.6516, + "step": 19947 + }, + { + "epoch": 0.69, + "learning_rate": 4.35207106280136e-06, + "loss": 0.6875, + "step": 19948 + }, + { + "epoch": 0.69, + "learning_rate": 4.351172529479714e-06, + "loss": 0.6699, + "step": 19949 + }, + { + "epoch": 0.69, + "learning_rate": 4.350274063132069e-06, + "loss": 0.6773, + "step": 19950 + }, + { + "epoch": 0.69, + "learning_rate": 4.349375663769067e-06, + "loss": 0.6611, + "step": 19951 + }, + { + "epoch": 0.69, + "learning_rate": 4.348477331401364e-06, + "loss": 0.6618, + "step": 19952 + }, + { + "epoch": 0.69, + "learning_rate": 4.347579066039612e-06, + "loss": 0.6159, + "step": 19953 + }, + { + "epoch": 0.69, + "learning_rate": 4.3466808676944615e-06, + "loss": 0.6265, + "step": 19954 + }, + { + "epoch": 0.69, + "learning_rate": 4.34578273637656e-06, + "loss": 0.624, + "step": 19955 + }, + { + "epoch": 0.69, + "learning_rate": 4.34488467209656e-06, + "loss": 0.6501, + "step": 19956 + }, + { + "epoch": 0.69, + "learning_rate": 4.343986674865103e-06, + "loss": 0.6198, + "step": 19957 + }, + { + "epoch": 0.69, + "learning_rate": 4.34308874469284e-06, + "loss": 0.6423, + "step": 19958 + }, + { + "epoch": 0.69, + "learning_rate": 4.342190881590413e-06, + "loss": 0.6676, + "step": 19959 + }, + { + "epoch": 0.69, + "learning_rate": 4.341293085568472e-06, + "loss": 0.6572, + "step": 19960 + }, + { + "epoch": 0.69, + "learning_rate": 4.34039535663766e-06, + "loss": 0.6089, + "step": 19961 + }, + { + "epoch": 0.69, + "learning_rate": 4.339497694808624e-06, + "loss": 0.6366, + "step": 19962 + }, + { + "epoch": 0.69, + "learning_rate": 4.338600100092e-06, + "loss": 0.6367, + "step": 19963 + }, + { + "epoch": 0.69, + "learning_rate": 4.337702572498432e-06, + "loss": 0.6324, + "step": 19964 + }, + { + "epoch": 0.69, + "learning_rate": 4.336805112038564e-06, + "loss": 0.6507, + "step": 19965 + }, + { + "epoch": 0.69, + "learning_rate": 4.3359077187230355e-06, + "loss": 0.6318, + "step": 19966 + }, + { + "epoch": 0.69, + "learning_rate": 4.335010392562486e-06, + "loss": 0.6309, + "step": 19967 + }, + { + "epoch": 0.69, + "learning_rate": 4.334113133567559e-06, + "loss": 0.6244, + "step": 19968 + }, + { + "epoch": 0.69, + "learning_rate": 4.3332159417488826e-06, + "loss": 0.6401, + "step": 19969 + }, + { + "epoch": 0.69, + "learning_rate": 4.3323188171171014e-06, + "loss": 0.6236, + "step": 19970 + }, + { + "epoch": 0.69, + "learning_rate": 4.3314217596828504e-06, + "loss": 0.6527, + "step": 19971 + }, + { + "epoch": 0.69, + "learning_rate": 4.330524769456764e-06, + "loss": 0.5808, + "step": 19972 + }, + { + "epoch": 0.69, + "learning_rate": 4.329627846449479e-06, + "loss": 0.5816, + "step": 19973 + }, + { + "epoch": 0.69, + "learning_rate": 4.3287309906716325e-06, + "loss": 0.6395, + "step": 19974 + }, + { + "epoch": 0.69, + "learning_rate": 4.32783420213385e-06, + "loss": 0.6072, + "step": 19975 + }, + { + "epoch": 0.69, + "learning_rate": 4.326937480846769e-06, + "loss": 0.6799, + "step": 19976 + }, + { + "epoch": 0.69, + "learning_rate": 4.326040826821021e-06, + "loss": 0.5986, + "step": 19977 + }, + { + "epoch": 0.69, + "learning_rate": 4.3251442400672365e-06, + "loss": 0.5944, + "step": 19978 + }, + { + "epoch": 0.69, + "learning_rate": 4.3242477205960456e-06, + "loss": 0.6243, + "step": 19979 + }, + { + "epoch": 0.69, + "learning_rate": 4.323351268418081e-06, + "loss": 0.6498, + "step": 19980 + }, + { + "epoch": 0.69, + "learning_rate": 4.322454883543965e-06, + "loss": 0.6105, + "step": 19981 + }, + { + "epoch": 0.69, + "learning_rate": 4.321558565984328e-06, + "loss": 0.6157, + "step": 19982 + }, + { + "epoch": 0.69, + "learning_rate": 4.3206623157497976e-06, + "loss": 0.6146, + "step": 19983 + }, + { + "epoch": 0.69, + "learning_rate": 4.319766132851e-06, + "loss": 0.6309, + "step": 19984 + }, + { + "epoch": 0.69, + "learning_rate": 4.318870017298561e-06, + "loss": 0.6627, + "step": 19985 + }, + { + "epoch": 0.69, + "learning_rate": 4.3179739691031075e-06, + "loss": 0.6312, + "step": 19986 + }, + { + "epoch": 0.69, + "learning_rate": 4.317077988275257e-06, + "loss": 0.6214, + "step": 19987 + }, + { + "epoch": 0.69, + "learning_rate": 4.3161820748256355e-06, + "loss": 0.6124, + "step": 19988 + }, + { + "epoch": 0.69, + "learning_rate": 4.315286228764865e-06, + "loss": 0.6117, + "step": 19989 + }, + { + "epoch": 0.69, + "learning_rate": 4.31439045010357e-06, + "loss": 0.636, + "step": 19990 + }, + { + "epoch": 0.69, + "learning_rate": 4.313494738852366e-06, + "loss": 0.6605, + "step": 19991 + }, + { + "epoch": 0.69, + "learning_rate": 4.3125990950218795e-06, + "loss": 0.623, + "step": 19992 + }, + { + "epoch": 0.69, + "learning_rate": 4.311703518622723e-06, + "loss": 0.6486, + "step": 19993 + }, + { + "epoch": 0.69, + "learning_rate": 4.3108080096655155e-06, + "loss": 0.71, + "step": 19994 + }, + { + "epoch": 0.69, + "learning_rate": 4.309912568160881e-06, + "loss": 0.6082, + "step": 19995 + }, + { + "epoch": 0.69, + "learning_rate": 4.309017194119422e-06, + "loss": 0.6022, + "step": 19996 + }, + { + "epoch": 0.69, + "learning_rate": 4.308121887551768e-06, + "loss": 0.6257, + "step": 19997 + }, + { + "epoch": 0.69, + "learning_rate": 4.307226648468533e-06, + "loss": 0.6832, + "step": 19998 + }, + { + "epoch": 0.69, + "learning_rate": 4.306331476880323e-06, + "loss": 0.6151, + "step": 19999 + }, + { + "epoch": 0.69, + "learning_rate": 4.3054363727977565e-06, + "loss": 0.6243, + "step": 20000 + }, + { + "epoch": 0.69, + "learning_rate": 4.304541336231449e-06, + "loss": 0.5962, + "step": 20001 + }, + { + "epoch": 0.69, + "learning_rate": 4.303646367192003e-06, + "loss": 0.6466, + "step": 20002 + }, + { + "epoch": 0.69, + "learning_rate": 4.302751465690041e-06, + "loss": 0.6307, + "step": 20003 + }, + { + "epoch": 0.69, + "learning_rate": 4.301856631736163e-06, + "loss": 0.6254, + "step": 20004 + }, + { + "epoch": 0.69, + "learning_rate": 4.300961865340983e-06, + "loss": 0.6484, + "step": 20005 + }, + { + "epoch": 0.69, + "learning_rate": 4.300067166515114e-06, + "loss": 0.5931, + "step": 20006 + }, + { + "epoch": 0.69, + "learning_rate": 4.299172535269156e-06, + "loss": 0.6189, + "step": 20007 + }, + { + "epoch": 0.69, + "learning_rate": 4.298277971613715e-06, + "loss": 0.6662, + "step": 20008 + }, + { + "epoch": 0.69, + "learning_rate": 4.297383475559408e-06, + "loss": 0.6255, + "step": 20009 + }, + { + "epoch": 0.69, + "learning_rate": 4.2964890471168305e-06, + "loss": 0.6425, + "step": 20010 + }, + { + "epoch": 0.69, + "learning_rate": 4.29559468629659e-06, + "loss": 0.6592, + "step": 20011 + }, + { + "epoch": 0.69, + "learning_rate": 4.294700393109294e-06, + "loss": 0.6631, + "step": 20012 + }, + { + "epoch": 0.69, + "learning_rate": 4.29380616756554e-06, + "loss": 0.6211, + "step": 20013 + }, + { + "epoch": 0.69, + "learning_rate": 4.292912009675927e-06, + "loss": 0.6324, + "step": 20014 + }, + { + "epoch": 0.69, + "learning_rate": 4.2920179194510705e-06, + "loss": 0.6281, + "step": 20015 + }, + { + "epoch": 0.69, + "learning_rate": 4.291123896901557e-06, + "loss": 0.6117, + "step": 20016 + }, + { + "epoch": 0.69, + "learning_rate": 4.290229942037992e-06, + "loss": 0.5733, + "step": 20017 + }, + { + "epoch": 0.69, + "learning_rate": 4.289336054870978e-06, + "loss": 0.6476, + "step": 20018 + }, + { + "epoch": 0.69, + "learning_rate": 4.288442235411105e-06, + "loss": 0.6186, + "step": 20019 + }, + { + "epoch": 0.69, + "learning_rate": 4.28754848366897e-06, + "loss": 0.6595, + "step": 20020 + }, + { + "epoch": 0.69, + "learning_rate": 4.286654799655183e-06, + "loss": 0.6036, + "step": 20021 + }, + { + "epoch": 0.69, + "learning_rate": 4.285761183380327e-06, + "loss": 0.6176, + "step": 20022 + }, + { + "epoch": 0.69, + "learning_rate": 4.284867634855e-06, + "loss": 0.6143, + "step": 20023 + }, + { + "epoch": 0.69, + "learning_rate": 4.283974154089801e-06, + "loss": 0.5879, + "step": 20024 + }, + { + "epoch": 0.69, + "learning_rate": 4.283080741095315e-06, + "loss": 0.624, + "step": 20025 + }, + { + "epoch": 0.69, + "learning_rate": 4.282187395882134e-06, + "loss": 0.6304, + "step": 20026 + }, + { + "epoch": 0.69, + "learning_rate": 4.281294118460864e-06, + "loss": 0.6717, + "step": 20027 + }, + { + "epoch": 0.69, + "learning_rate": 4.280400908842082e-06, + "loss": 0.6587, + "step": 20028 + }, + { + "epoch": 0.69, + "learning_rate": 4.279507767036382e-06, + "loss": 0.5914, + "step": 20029 + }, + { + "epoch": 0.69, + "learning_rate": 4.278614693054358e-06, + "loss": 0.6571, + "step": 20030 + }, + { + "epoch": 0.69, + "learning_rate": 4.277721686906591e-06, + "loss": 0.6703, + "step": 20031 + }, + { + "epoch": 0.69, + "learning_rate": 4.276828748603668e-06, + "loss": 0.6595, + "step": 20032 + }, + { + "epoch": 0.69, + "learning_rate": 4.275935878156188e-06, + "loss": 0.6073, + "step": 20033 + }, + { + "epoch": 0.69, + "learning_rate": 4.275043075574724e-06, + "loss": 0.6336, + "step": 20034 + }, + { + "epoch": 0.69, + "learning_rate": 4.2741503408698685e-06, + "loss": 0.5774, + "step": 20035 + }, + { + "epoch": 0.69, + "learning_rate": 4.273257674052206e-06, + "loss": 0.5999, + "step": 20036 + }, + { + "epoch": 0.69, + "learning_rate": 4.272365075132315e-06, + "loss": 0.5932, + "step": 20037 + }, + { + "epoch": 0.69, + "learning_rate": 4.271472544120777e-06, + "loss": 0.6838, + "step": 20038 + }, + { + "epoch": 0.69, + "learning_rate": 4.270580081028187e-06, + "loss": 0.6093, + "step": 20039 + }, + { + "epoch": 0.69, + "learning_rate": 4.269687685865115e-06, + "loss": 0.6371, + "step": 20040 + }, + { + "epoch": 0.69, + "learning_rate": 4.2687953586421425e-06, + "loss": 0.6005, + "step": 20041 + }, + { + "epoch": 0.69, + "learning_rate": 4.267903099369856e-06, + "loss": 0.6368, + "step": 20042 + }, + { + "epoch": 0.69, + "learning_rate": 4.267010908058825e-06, + "loss": 0.6252, + "step": 20043 + }, + { + "epoch": 0.69, + "learning_rate": 4.266118784719629e-06, + "loss": 0.6332, + "step": 20044 + }, + { + "epoch": 0.69, + "learning_rate": 4.265226729362855e-06, + "loss": 0.6105, + "step": 20045 + }, + { + "epoch": 0.69, + "learning_rate": 4.264334741999069e-06, + "loss": 0.6077, + "step": 20046 + }, + { + "epoch": 0.69, + "learning_rate": 4.263442822638851e-06, + "loss": 0.6287, + "step": 20047 + }, + { + "epoch": 0.69, + "learning_rate": 4.262550971292778e-06, + "loss": 0.5856, + "step": 20048 + }, + { + "epoch": 0.69, + "learning_rate": 4.261659187971418e-06, + "loss": 0.6493, + "step": 20049 + }, + { + "epoch": 0.69, + "learning_rate": 4.260767472685343e-06, + "loss": 0.6606, + "step": 20050 + }, + { + "epoch": 0.69, + "learning_rate": 4.259875825445138e-06, + "loss": 0.636, + "step": 20051 + }, + { + "epoch": 0.69, + "learning_rate": 4.258984246261361e-06, + "loss": 0.6003, + "step": 20052 + }, + { + "epoch": 0.69, + "learning_rate": 4.25809273514459e-06, + "loss": 0.5945, + "step": 20053 + }, + { + "epoch": 0.69, + "learning_rate": 4.257201292105396e-06, + "loss": 0.6104, + "step": 20054 + }, + { + "epoch": 0.69, + "learning_rate": 4.256309917154342e-06, + "loss": 0.6139, + "step": 20055 + }, + { + "epoch": 0.69, + "learning_rate": 4.255418610301996e-06, + "loss": 0.6555, + "step": 20056 + }, + { + "epoch": 0.69, + "learning_rate": 4.2545273715589375e-06, + "loss": 0.6344, + "step": 20057 + }, + { + "epoch": 0.69, + "learning_rate": 4.25363620093572e-06, + "loss": 0.6768, + "step": 20058 + }, + { + "epoch": 0.69, + "learning_rate": 4.252745098442915e-06, + "loss": 0.6591, + "step": 20059 + }, + { + "epoch": 0.7, + "learning_rate": 4.251854064091091e-06, + "loss": 0.6253, + "step": 20060 + }, + { + "epoch": 0.7, + "learning_rate": 4.250963097890806e-06, + "loss": 0.686, + "step": 20061 + }, + { + "epoch": 0.7, + "learning_rate": 4.250072199852621e-06, + "loss": 0.6469, + "step": 20062 + }, + { + "epoch": 0.7, + "learning_rate": 4.249181369987111e-06, + "loss": 0.6914, + "step": 20063 + }, + { + "epoch": 0.7, + "learning_rate": 4.248290608304827e-06, + "loss": 0.6242, + "step": 20064 + }, + { + "epoch": 0.7, + "learning_rate": 4.247399914816338e-06, + "loss": 0.6166, + "step": 20065 + }, + { + "epoch": 0.7, + "learning_rate": 4.246509289532196e-06, + "loss": 0.6141, + "step": 20066 + }, + { + "epoch": 0.7, + "learning_rate": 4.245618732462965e-06, + "loss": 0.673, + "step": 20067 + }, + { + "epoch": 0.7, + "learning_rate": 4.2447282436192025e-06, + "loss": 0.6274, + "step": 20068 + }, + { + "epoch": 0.7, + "learning_rate": 4.2438378230114676e-06, + "loss": 0.6622, + "step": 20069 + }, + { + "epoch": 0.7, + "learning_rate": 4.242947470650317e-06, + "loss": 0.6076, + "step": 20070 + }, + { + "epoch": 0.7, + "learning_rate": 4.24205718654631e-06, + "loss": 0.6206, + "step": 20071 + }, + { + "epoch": 0.7, + "learning_rate": 4.241166970709995e-06, + "loss": 0.5725, + "step": 20072 + }, + { + "epoch": 0.7, + "learning_rate": 4.240276823151932e-06, + "loss": 0.6524, + "step": 20073 + }, + { + "epoch": 0.7, + "learning_rate": 4.239386743882673e-06, + "loss": 0.6423, + "step": 20074 + }, + { + "epoch": 0.7, + "learning_rate": 4.23849673291277e-06, + "loss": 0.6657, + "step": 20075 + }, + { + "epoch": 0.7, + "learning_rate": 4.2376067902527785e-06, + "loss": 0.5551, + "step": 20076 + }, + { + "epoch": 0.7, + "learning_rate": 4.236716915913251e-06, + "loss": 0.5939, + "step": 20077 + }, + { + "epoch": 0.7, + "learning_rate": 4.23582710990473e-06, + "loss": 0.6663, + "step": 20078 + }, + { + "epoch": 0.7, + "learning_rate": 4.234937372237772e-06, + "loss": 0.6352, + "step": 20079 + }, + { + "epoch": 0.7, + "learning_rate": 4.234047702922923e-06, + "loss": 0.6231, + "step": 20080 + }, + { + "epoch": 0.7, + "learning_rate": 4.2331581019707336e-06, + "loss": 0.6397, + "step": 20081 + }, + { + "epoch": 0.7, + "learning_rate": 4.2322685693917484e-06, + "loss": 0.605, + "step": 20082 + }, + { + "epoch": 0.7, + "learning_rate": 4.231379105196521e-06, + "loss": 0.611, + "step": 20083 + }, + { + "epoch": 0.7, + "learning_rate": 4.230489709395587e-06, + "loss": 0.6186, + "step": 20084 + }, + { + "epoch": 0.7, + "learning_rate": 4.229600381999496e-06, + "loss": 0.5823, + "step": 20085 + }, + { + "epoch": 0.7, + "learning_rate": 4.228711123018793e-06, + "loss": 0.643, + "step": 20086 + }, + { + "epoch": 0.7, + "learning_rate": 4.227821932464019e-06, + "loss": 0.6181, + "step": 20087 + }, + { + "epoch": 0.7, + "learning_rate": 4.2269328103457186e-06, + "loss": 0.6431, + "step": 20088 + }, + { + "epoch": 0.7, + "learning_rate": 4.226043756674436e-06, + "loss": 0.655, + "step": 20089 + }, + { + "epoch": 0.7, + "learning_rate": 4.225154771460706e-06, + "loss": 0.6418, + "step": 20090 + }, + { + "epoch": 0.7, + "learning_rate": 4.22426585471507e-06, + "loss": 0.687, + "step": 20091 + }, + { + "epoch": 0.7, + "learning_rate": 4.223377006448069e-06, + "loss": 0.6291, + "step": 20092 + }, + { + "epoch": 0.7, + "learning_rate": 4.222488226670242e-06, + "loss": 0.669, + "step": 20093 + }, + { + "epoch": 0.7, + "learning_rate": 4.221599515392125e-06, + "loss": 0.6537, + "step": 20094 + }, + { + "epoch": 0.7, + "learning_rate": 4.220710872624259e-06, + "loss": 0.6476, + "step": 20095 + }, + { + "epoch": 0.7, + "learning_rate": 4.219822298377173e-06, + "loss": 0.6359, + "step": 20096 + }, + { + "epoch": 0.7, + "learning_rate": 4.218933792661405e-06, + "loss": 0.6609, + "step": 20097 + }, + { + "epoch": 0.7, + "learning_rate": 4.218045355487492e-06, + "loss": 0.6429, + "step": 20098 + }, + { + "epoch": 0.7, + "learning_rate": 4.217156986865964e-06, + "loss": 0.5924, + "step": 20099 + }, + { + "epoch": 0.7, + "learning_rate": 4.216268686807354e-06, + "loss": 0.7067, + "step": 20100 + }, + { + "epoch": 0.7, + "learning_rate": 4.2153804553222e-06, + "loss": 0.629, + "step": 20101 + }, + { + "epoch": 0.7, + "learning_rate": 4.214492292421025e-06, + "loss": 0.6186, + "step": 20102 + }, + { + "epoch": 0.7, + "learning_rate": 4.213604198114363e-06, + "loss": 0.6062, + "step": 20103 + }, + { + "epoch": 0.7, + "learning_rate": 4.2127161724127415e-06, + "loss": 0.601, + "step": 20104 + }, + { + "epoch": 0.7, + "learning_rate": 4.211828215326692e-06, + "loss": 0.6598, + "step": 20105 + }, + { + "epoch": 0.7, + "learning_rate": 4.210940326866741e-06, + "loss": 0.6369, + "step": 20106 + }, + { + "epoch": 0.7, + "learning_rate": 4.210052507043418e-06, + "loss": 0.5633, + "step": 20107 + }, + { + "epoch": 0.7, + "learning_rate": 4.209164755867245e-06, + "loss": 0.6358, + "step": 20108 + }, + { + "epoch": 0.7, + "learning_rate": 4.208277073348749e-06, + "loss": 0.6504, + "step": 20109 + }, + { + "epoch": 0.7, + "learning_rate": 4.207389459498454e-06, + "loss": 0.6218, + "step": 20110 + }, + { + "epoch": 0.7, + "learning_rate": 4.206501914326885e-06, + "loss": 0.6255, + "step": 20111 + }, + { + "epoch": 0.7, + "learning_rate": 4.205614437844564e-06, + "loss": 0.6534, + "step": 20112 + }, + { + "epoch": 0.7, + "learning_rate": 4.204727030062018e-06, + "loss": 0.6683, + "step": 20113 + }, + { + "epoch": 0.7, + "learning_rate": 4.203839690989761e-06, + "loss": 0.6529, + "step": 20114 + }, + { + "epoch": 0.7, + "learning_rate": 4.2029524206383164e-06, + "loss": 0.6288, + "step": 20115 + }, + { + "epoch": 0.7, + "learning_rate": 4.202065219018203e-06, + "loss": 0.6436, + "step": 20116 + }, + { + "epoch": 0.7, + "learning_rate": 4.201178086139942e-06, + "loss": 0.6635, + "step": 20117 + }, + { + "epoch": 0.7, + "learning_rate": 4.200291022014051e-06, + "loss": 0.6514, + "step": 20118 + }, + { + "epoch": 0.7, + "learning_rate": 4.199404026651048e-06, + "loss": 0.6283, + "step": 20119 + }, + { + "epoch": 0.7, + "learning_rate": 4.198517100061447e-06, + "loss": 0.6363, + "step": 20120 + }, + { + "epoch": 0.7, + "learning_rate": 4.197630242255762e-06, + "loss": 0.6182, + "step": 20121 + }, + { + "epoch": 0.7, + "learning_rate": 4.196743453244513e-06, + "loss": 0.6016, + "step": 20122 + }, + { + "epoch": 0.7, + "learning_rate": 4.195856733038211e-06, + "loss": 0.6392, + "step": 20123 + }, + { + "epoch": 0.7, + "learning_rate": 4.1949700816473685e-06, + "loss": 0.5917, + "step": 20124 + }, + { + "epoch": 0.7, + "learning_rate": 4.194083499082503e-06, + "loss": 0.6545, + "step": 20125 + }, + { + "epoch": 0.7, + "learning_rate": 4.1931969853541185e-06, + "loss": 0.6583, + "step": 20126 + }, + { + "epoch": 0.7, + "learning_rate": 4.19231054047273e-06, + "loss": 0.6699, + "step": 20127 + }, + { + "epoch": 0.7, + "learning_rate": 4.191424164448847e-06, + "loss": 0.5973, + "step": 20128 + }, + { + "epoch": 0.7, + "learning_rate": 4.190537857292978e-06, + "loss": 0.6239, + "step": 20129 + }, + { + "epoch": 0.7, + "learning_rate": 4.189651619015635e-06, + "loss": 0.7279, + "step": 20130 + }, + { + "epoch": 0.7, + "learning_rate": 4.188765449627319e-06, + "loss": 0.6509, + "step": 20131 + }, + { + "epoch": 0.7, + "learning_rate": 4.18787934913854e-06, + "loss": 0.6468, + "step": 20132 + }, + { + "epoch": 0.7, + "learning_rate": 4.186993317559803e-06, + "loss": 0.6178, + "step": 20133 + }, + { + "epoch": 0.7, + "learning_rate": 4.186107354901615e-06, + "loss": 0.6071, + "step": 20134 + }, + { + "epoch": 0.7, + "learning_rate": 4.185221461174478e-06, + "loss": 0.6226, + "step": 20135 + }, + { + "epoch": 0.7, + "learning_rate": 4.1843356363889e-06, + "loss": 0.5877, + "step": 20136 + }, + { + "epoch": 0.7, + "learning_rate": 4.183449880555376e-06, + "loss": 0.6521, + "step": 20137 + }, + { + "epoch": 0.7, + "learning_rate": 4.1825641936844115e-06, + "loss": 0.6192, + "step": 20138 + }, + { + "epoch": 0.7, + "learning_rate": 4.181678575786508e-06, + "loss": 0.6362, + "step": 20139 + }, + { + "epoch": 0.7, + "learning_rate": 4.180793026872165e-06, + "loss": 0.6416, + "step": 20140 + }, + { + "epoch": 0.7, + "learning_rate": 4.1799075469518825e-06, + "loss": 0.6107, + "step": 20141 + }, + { + "epoch": 0.7, + "learning_rate": 4.1790221360361615e-06, + "loss": 0.6642, + "step": 20142 + }, + { + "epoch": 0.7, + "learning_rate": 4.178136794135494e-06, + "loss": 0.623, + "step": 20143 + }, + { + "epoch": 0.7, + "learning_rate": 4.177251521260379e-06, + "loss": 0.5895, + "step": 20144 + }, + { + "epoch": 0.7, + "learning_rate": 4.176366317421312e-06, + "loss": 0.6115, + "step": 20145 + }, + { + "epoch": 0.7, + "learning_rate": 4.175481182628791e-06, + "loss": 0.6077, + "step": 20146 + }, + { + "epoch": 0.7, + "learning_rate": 4.174596116893307e-06, + "loss": 0.6446, + "step": 20147 + }, + { + "epoch": 0.7, + "learning_rate": 4.17371112022536e-06, + "loss": 0.6324, + "step": 20148 + }, + { + "epoch": 0.7, + "learning_rate": 4.172826192635434e-06, + "loss": 0.6689, + "step": 20149 + }, + { + "epoch": 0.7, + "learning_rate": 4.171941334134024e-06, + "loss": 0.6062, + "step": 20150 + }, + { + "epoch": 0.7, + "learning_rate": 4.1710565447316235e-06, + "loss": 0.6205, + "step": 20151 + }, + { + "epoch": 0.7, + "learning_rate": 4.1701718244387205e-06, + "loss": 0.5958, + "step": 20152 + }, + { + "epoch": 0.7, + "learning_rate": 4.169287173265806e-06, + "loss": 0.6046, + "step": 20153 + }, + { + "epoch": 0.7, + "learning_rate": 4.168402591223371e-06, + "loss": 0.6161, + "step": 20154 + }, + { + "epoch": 0.7, + "learning_rate": 4.167518078321896e-06, + "loss": 0.6363, + "step": 20155 + }, + { + "epoch": 0.7, + "learning_rate": 4.1666336345718725e-06, + "loss": 0.6277, + "step": 20156 + }, + { + "epoch": 0.7, + "learning_rate": 4.165749259983788e-06, + "loss": 0.5815, + "step": 20157 + }, + { + "epoch": 0.7, + "learning_rate": 4.164864954568126e-06, + "loss": 0.6483, + "step": 20158 + }, + { + "epoch": 0.7, + "learning_rate": 4.16398071833537e-06, + "loss": 0.5912, + "step": 20159 + }, + { + "epoch": 0.7, + "learning_rate": 4.16309655129601e-06, + "loss": 0.6428, + "step": 20160 + }, + { + "epoch": 0.7, + "learning_rate": 4.162212453460519e-06, + "loss": 0.5807, + "step": 20161 + }, + { + "epoch": 0.7, + "learning_rate": 4.161328424839386e-06, + "loss": 0.675, + "step": 20162 + }, + { + "epoch": 0.7, + "learning_rate": 4.1604444654430896e-06, + "loss": 0.6486, + "step": 20163 + }, + { + "epoch": 0.7, + "learning_rate": 4.159560575282111e-06, + "loss": 0.6223, + "step": 20164 + }, + { + "epoch": 0.7, + "learning_rate": 4.15867675436693e-06, + "loss": 0.6412, + "step": 20165 + }, + { + "epoch": 0.7, + "learning_rate": 4.157793002708031e-06, + "loss": 0.5883, + "step": 20166 + }, + { + "epoch": 0.7, + "learning_rate": 4.1569093203158805e-06, + "loss": 0.6151, + "step": 20167 + }, + { + "epoch": 0.7, + "learning_rate": 4.156025707200961e-06, + "loss": 0.6619, + "step": 20168 + }, + { + "epoch": 0.7, + "learning_rate": 4.155142163373751e-06, + "loss": 0.5968, + "step": 20169 + }, + { + "epoch": 0.7, + "learning_rate": 4.154258688844724e-06, + "loss": 0.6171, + "step": 20170 + }, + { + "epoch": 0.7, + "learning_rate": 4.153375283624356e-06, + "loss": 0.6379, + "step": 20171 + }, + { + "epoch": 0.7, + "learning_rate": 4.1524919477231215e-06, + "loss": 0.6492, + "step": 20172 + }, + { + "epoch": 0.7, + "learning_rate": 4.15160868115149e-06, + "loss": 0.6881, + "step": 20173 + }, + { + "epoch": 0.7, + "learning_rate": 4.150725483919936e-06, + "loss": 0.6225, + "step": 20174 + }, + { + "epoch": 0.7, + "learning_rate": 4.14984235603893e-06, + "loss": 0.6301, + "step": 20175 + }, + { + "epoch": 0.7, + "learning_rate": 4.1489592975189445e-06, + "loss": 0.6057, + "step": 20176 + }, + { + "epoch": 0.7, + "learning_rate": 4.148076308370447e-06, + "loss": 0.7109, + "step": 20177 + }, + { + "epoch": 0.7, + "learning_rate": 4.147193388603912e-06, + "loss": 0.6015, + "step": 20178 + }, + { + "epoch": 0.7, + "learning_rate": 4.146310538229799e-06, + "loss": 0.7126, + "step": 20179 + }, + { + "epoch": 0.7, + "learning_rate": 4.145427757258579e-06, + "loss": 0.6539, + "step": 20180 + }, + { + "epoch": 0.7, + "learning_rate": 4.1445450457007196e-06, + "loss": 0.5999, + "step": 20181 + }, + { + "epoch": 0.7, + "learning_rate": 4.143662403566686e-06, + "loss": 0.6043, + "step": 20182 + }, + { + "epoch": 0.7, + "learning_rate": 4.142779830866943e-06, + "loss": 0.6052, + "step": 20183 + }, + { + "epoch": 0.7, + "learning_rate": 4.141897327611958e-06, + "loss": 0.65, + "step": 20184 + }, + { + "epoch": 0.7, + "learning_rate": 4.141014893812187e-06, + "loss": 0.6205, + "step": 20185 + }, + { + "epoch": 0.7, + "learning_rate": 4.140132529478097e-06, + "loss": 0.6265, + "step": 20186 + }, + { + "epoch": 0.7, + "learning_rate": 4.139250234620147e-06, + "loss": 0.6049, + "step": 20187 + }, + { + "epoch": 0.7, + "learning_rate": 4.138368009248801e-06, + "loss": 0.6517, + "step": 20188 + }, + { + "epoch": 0.7, + "learning_rate": 4.13748585337452e-06, + "loss": 0.6718, + "step": 20189 + }, + { + "epoch": 0.7, + "learning_rate": 4.136603767007756e-06, + "loss": 0.639, + "step": 20190 + }, + { + "epoch": 0.7, + "learning_rate": 4.135721750158973e-06, + "loss": 0.6072, + "step": 20191 + }, + { + "epoch": 0.7, + "learning_rate": 4.1348398028386295e-06, + "loss": 0.6301, + "step": 20192 + }, + { + "epoch": 0.7, + "learning_rate": 4.1339579250571725e-06, + "loss": 0.6376, + "step": 20193 + }, + { + "epoch": 0.7, + "learning_rate": 4.133076116825069e-06, + "loss": 0.6871, + "step": 20194 + }, + { + "epoch": 0.7, + "learning_rate": 4.132194378152774e-06, + "loss": 0.5868, + "step": 20195 + }, + { + "epoch": 0.7, + "learning_rate": 4.131312709050733e-06, + "loss": 0.6219, + "step": 20196 + }, + { + "epoch": 0.7, + "learning_rate": 4.130431109529404e-06, + "loss": 0.613, + "step": 20197 + }, + { + "epoch": 0.7, + "learning_rate": 4.129549579599242e-06, + "loss": 0.5883, + "step": 20198 + }, + { + "epoch": 0.7, + "learning_rate": 4.12866811927069e-06, + "loss": 0.5762, + "step": 20199 + }, + { + "epoch": 0.7, + "learning_rate": 4.1277867285542075e-06, + "loss": 0.64, + "step": 20200 + }, + { + "epoch": 0.7, + "learning_rate": 4.126905407460246e-06, + "loss": 0.6337, + "step": 20201 + }, + { + "epoch": 0.7, + "learning_rate": 4.126024155999246e-06, + "loss": 0.6423, + "step": 20202 + }, + { + "epoch": 0.7, + "learning_rate": 4.1251429741816605e-06, + "loss": 0.591, + "step": 20203 + }, + { + "epoch": 0.7, + "learning_rate": 4.1242618620179406e-06, + "loss": 0.6364, + "step": 20204 + }, + { + "epoch": 0.7, + "learning_rate": 4.123380819518522e-06, + "loss": 0.6657, + "step": 20205 + }, + { + "epoch": 0.7, + "learning_rate": 4.122499846693862e-06, + "loss": 0.689, + "step": 20206 + }, + { + "epoch": 0.7, + "learning_rate": 4.121618943554403e-06, + "loss": 0.7169, + "step": 20207 + }, + { + "epoch": 0.7, + "learning_rate": 4.120738110110586e-06, + "loss": 0.6643, + "step": 20208 + }, + { + "epoch": 0.7, + "learning_rate": 4.119857346372854e-06, + "loss": 0.5889, + "step": 20209 + }, + { + "epoch": 0.7, + "learning_rate": 4.118976652351657e-06, + "loss": 0.6639, + "step": 20210 + }, + { + "epoch": 0.7, + "learning_rate": 4.118096028057424e-06, + "loss": 0.6073, + "step": 20211 + }, + { + "epoch": 0.7, + "learning_rate": 4.117215473500606e-06, + "loss": 0.6284, + "step": 20212 + }, + { + "epoch": 0.7, + "learning_rate": 4.116334988691644e-06, + "loss": 0.5747, + "step": 20213 + }, + { + "epoch": 0.7, + "learning_rate": 4.11545457364097e-06, + "loss": 0.6309, + "step": 20214 + }, + { + "epoch": 0.7, + "learning_rate": 4.114574228359026e-06, + "loss": 0.5752, + "step": 20215 + }, + { + "epoch": 0.7, + "learning_rate": 4.113693952856254e-06, + "loss": 0.5602, + "step": 20216 + }, + { + "epoch": 0.7, + "learning_rate": 4.112813747143078e-06, + "loss": 0.5878, + "step": 20217 + }, + { + "epoch": 0.7, + "learning_rate": 4.111933611229948e-06, + "loss": 0.6677, + "step": 20218 + }, + { + "epoch": 0.7, + "learning_rate": 4.1110535451272945e-06, + "loss": 0.6589, + "step": 20219 + }, + { + "epoch": 0.7, + "learning_rate": 4.11017354884555e-06, + "loss": 0.6793, + "step": 20220 + }, + { + "epoch": 0.7, + "learning_rate": 4.1092936223951465e-06, + "loss": 0.6091, + "step": 20221 + }, + { + "epoch": 0.7, + "learning_rate": 4.108413765786523e-06, + "loss": 0.602, + "step": 20222 + }, + { + "epoch": 0.7, + "learning_rate": 4.107533979030101e-06, + "loss": 0.6076, + "step": 20223 + }, + { + "epoch": 0.7, + "learning_rate": 4.106654262136319e-06, + "loss": 0.6135, + "step": 20224 + }, + { + "epoch": 0.7, + "learning_rate": 4.105774615115612e-06, + "loss": 0.6192, + "step": 20225 + }, + { + "epoch": 0.7, + "learning_rate": 4.104895037978398e-06, + "loss": 0.633, + "step": 20226 + }, + { + "epoch": 0.7, + "learning_rate": 4.104015530735111e-06, + "loss": 0.639, + "step": 20227 + }, + { + "epoch": 0.7, + "learning_rate": 4.103136093396182e-06, + "loss": 0.653, + "step": 20228 + }, + { + "epoch": 0.7, + "learning_rate": 4.102256725972027e-06, + "loss": 0.627, + "step": 20229 + }, + { + "epoch": 0.7, + "learning_rate": 4.101377428473083e-06, + "loss": 0.65, + "step": 20230 + }, + { + "epoch": 0.7, + "learning_rate": 4.1004982009097746e-06, + "loss": 0.6657, + "step": 20231 + }, + { + "epoch": 0.7, + "learning_rate": 4.09961904329252e-06, + "loss": 0.5715, + "step": 20232 + }, + { + "epoch": 0.7, + "learning_rate": 4.0987399556317456e-06, + "loss": 0.6392, + "step": 20233 + }, + { + "epoch": 0.7, + "learning_rate": 4.097860937937877e-06, + "loss": 0.6097, + "step": 20234 + }, + { + "epoch": 0.7, + "learning_rate": 4.096981990221326e-06, + "loss": 0.6198, + "step": 20235 + }, + { + "epoch": 0.7, + "learning_rate": 4.096103112492526e-06, + "loss": 0.6635, + "step": 20236 + }, + { + "epoch": 0.7, + "learning_rate": 4.095224304761894e-06, + "loss": 0.6375, + "step": 20237 + }, + { + "epoch": 0.7, + "learning_rate": 4.094345567039845e-06, + "loss": 0.6475, + "step": 20238 + }, + { + "epoch": 0.7, + "learning_rate": 4.093466899336799e-06, + "loss": 0.636, + "step": 20239 + }, + { + "epoch": 0.7, + "learning_rate": 4.092588301663179e-06, + "loss": 0.6566, + "step": 20240 + }, + { + "epoch": 0.7, + "learning_rate": 4.09170977402939e-06, + "loss": 0.6342, + "step": 20241 + }, + { + "epoch": 0.7, + "learning_rate": 4.090831316445859e-06, + "loss": 0.5917, + "step": 20242 + }, + { + "epoch": 0.7, + "learning_rate": 4.089952928923001e-06, + "loss": 0.6128, + "step": 20243 + }, + { + "epoch": 0.7, + "learning_rate": 4.0890746114712255e-06, + "loss": 0.6124, + "step": 20244 + }, + { + "epoch": 0.7, + "learning_rate": 4.088196364100947e-06, + "loss": 0.6203, + "step": 20245 + }, + { + "epoch": 0.7, + "learning_rate": 4.087318186822582e-06, + "loss": 0.5698, + "step": 20246 + }, + { + "epoch": 0.7, + "learning_rate": 4.086440079646533e-06, + "loss": 0.651, + "step": 20247 + }, + { + "epoch": 0.7, + "learning_rate": 4.085562042583221e-06, + "loss": 0.6617, + "step": 20248 + }, + { + "epoch": 0.7, + "learning_rate": 4.084684075643056e-06, + "loss": 0.5998, + "step": 20249 + }, + { + "epoch": 0.7, + "learning_rate": 4.083806178836442e-06, + "loss": 0.6197, + "step": 20250 + }, + { + "epoch": 0.7, + "learning_rate": 4.0829283521737915e-06, + "loss": 0.5615, + "step": 20251 + }, + { + "epoch": 0.7, + "learning_rate": 4.082050595665508e-06, + "loss": 0.6352, + "step": 20252 + }, + { + "epoch": 0.7, + "learning_rate": 4.081172909321997e-06, + "loss": 0.6451, + "step": 20253 + }, + { + "epoch": 0.7, + "learning_rate": 4.080295293153676e-06, + "loss": 0.6742, + "step": 20254 + }, + { + "epoch": 0.7, + "learning_rate": 4.079417747170938e-06, + "loss": 0.5807, + "step": 20255 + }, + { + "epoch": 0.7, + "learning_rate": 4.078540271384194e-06, + "loss": 0.6304, + "step": 20256 + }, + { + "epoch": 0.7, + "learning_rate": 4.077662865803847e-06, + "loss": 0.6371, + "step": 20257 + }, + { + "epoch": 0.7, + "learning_rate": 4.076785530440297e-06, + "loss": 0.6007, + "step": 20258 + }, + { + "epoch": 0.7, + "learning_rate": 4.075908265303944e-06, + "loss": 0.6617, + "step": 20259 + }, + { + "epoch": 0.7, + "learning_rate": 4.075031070405199e-06, + "loss": 0.6031, + "step": 20260 + }, + { + "epoch": 0.7, + "learning_rate": 4.074153945754452e-06, + "loss": 0.6407, + "step": 20261 + }, + { + "epoch": 0.7, + "learning_rate": 4.073276891362107e-06, + "loss": 0.6678, + "step": 20262 + }, + { + "epoch": 0.7, + "learning_rate": 4.072399907238564e-06, + "loss": 0.6559, + "step": 20263 + }, + { + "epoch": 0.7, + "learning_rate": 4.071522993394216e-06, + "loss": 0.6893, + "step": 20264 + }, + { + "epoch": 0.7, + "learning_rate": 4.070646149839459e-06, + "loss": 0.6086, + "step": 20265 + }, + { + "epoch": 0.7, + "learning_rate": 4.069769376584699e-06, + "loss": 0.6401, + "step": 20266 + }, + { + "epoch": 0.7, + "learning_rate": 4.0688926736403215e-06, + "loss": 0.6915, + "step": 20267 + }, + { + "epoch": 0.7, + "learning_rate": 4.0680160410167246e-06, + "loss": 0.6093, + "step": 20268 + }, + { + "epoch": 0.7, + "learning_rate": 4.0671394787243045e-06, + "loss": 0.6157, + "step": 20269 + }, + { + "epoch": 0.7, + "learning_rate": 4.066262986773448e-06, + "loss": 0.6917, + "step": 20270 + }, + { + "epoch": 0.7, + "learning_rate": 4.065386565174546e-06, + "loss": 0.6569, + "step": 20271 + }, + { + "epoch": 0.7, + "learning_rate": 4.064510213938001e-06, + "loss": 0.6127, + "step": 20272 + }, + { + "epoch": 0.7, + "learning_rate": 4.063633933074192e-06, + "loss": 0.6197, + "step": 20273 + }, + { + "epoch": 0.7, + "learning_rate": 4.062757722593512e-06, + "loss": 0.6497, + "step": 20274 + }, + { + "epoch": 0.7, + "learning_rate": 4.061881582506354e-06, + "loss": 0.6153, + "step": 20275 + }, + { + "epoch": 0.7, + "learning_rate": 4.061005512823099e-06, + "loss": 0.6525, + "step": 20276 + }, + { + "epoch": 0.7, + "learning_rate": 4.060129513554131e-06, + "loss": 0.5962, + "step": 20277 + }, + { + "epoch": 0.7, + "learning_rate": 4.0592535847098505e-06, + "loss": 0.667, + "step": 20278 + }, + { + "epoch": 0.7, + "learning_rate": 4.058377726300629e-06, + "loss": 0.6769, + "step": 20279 + }, + { + "epoch": 0.7, + "learning_rate": 4.057501938336856e-06, + "loss": 0.6136, + "step": 20280 + }, + { + "epoch": 0.7, + "learning_rate": 4.056626220828918e-06, + "loss": 0.6123, + "step": 20281 + }, + { + "epoch": 0.7, + "learning_rate": 4.055750573787191e-06, + "loss": 0.5904, + "step": 20282 + }, + { + "epoch": 0.7, + "learning_rate": 4.054874997222058e-06, + "loss": 0.6507, + "step": 20283 + }, + { + "epoch": 0.7, + "learning_rate": 4.05399949114391e-06, + "loss": 0.6664, + "step": 20284 + }, + { + "epoch": 0.7, + "learning_rate": 4.053124055563115e-06, + "loss": 0.673, + "step": 20285 + }, + { + "epoch": 0.7, + "learning_rate": 4.052248690490057e-06, + "loss": 0.6037, + "step": 20286 + }, + { + "epoch": 0.7, + "learning_rate": 4.0513733959351185e-06, + "loss": 0.6199, + "step": 20287 + }, + { + "epoch": 0.7, + "learning_rate": 4.05049817190867e-06, + "loss": 0.6944, + "step": 20288 + }, + { + "epoch": 0.7, + "learning_rate": 4.0496230184210885e-06, + "loss": 0.6015, + "step": 20289 + }, + { + "epoch": 0.7, + "learning_rate": 4.048747935482761e-06, + "loss": 0.6396, + "step": 20290 + }, + { + "epoch": 0.7, + "learning_rate": 4.04787292310405e-06, + "loss": 0.6152, + "step": 20291 + }, + { + "epoch": 0.7, + "learning_rate": 4.046997981295336e-06, + "loss": 0.6066, + "step": 20292 + }, + { + "epoch": 0.7, + "learning_rate": 4.0461231100669955e-06, + "loss": 0.5795, + "step": 20293 + }, + { + "epoch": 0.7, + "learning_rate": 4.045248309429393e-06, + "loss": 0.64, + "step": 20294 + }, + { + "epoch": 0.7, + "learning_rate": 4.044373579392901e-06, + "loss": 0.6689, + "step": 20295 + }, + { + "epoch": 0.7, + "learning_rate": 4.043498919967901e-06, + "loss": 0.6429, + "step": 20296 + }, + { + "epoch": 0.7, + "learning_rate": 4.0426243311647525e-06, + "loss": 0.6719, + "step": 20297 + }, + { + "epoch": 0.7, + "learning_rate": 4.04174981299383e-06, + "loss": 0.6174, + "step": 20298 + }, + { + "epoch": 0.7, + "learning_rate": 4.040875365465504e-06, + "loss": 0.6399, + "step": 20299 + }, + { + "epoch": 0.7, + "learning_rate": 4.040000988590135e-06, + "loss": 0.6189, + "step": 20300 + }, + { + "epoch": 0.7, + "learning_rate": 4.039126682378089e-06, + "loss": 0.6669, + "step": 20301 + }, + { + "epoch": 0.7, + "learning_rate": 4.0382524468397455e-06, + "loss": 0.6477, + "step": 20302 + }, + { + "epoch": 0.7, + "learning_rate": 4.037378281985457e-06, + "loss": 0.6225, + "step": 20303 + }, + { + "epoch": 0.7, + "learning_rate": 4.036504187825591e-06, + "loss": 0.6406, + "step": 20304 + }, + { + "epoch": 0.7, + "learning_rate": 4.035630164370516e-06, + "loss": 0.6192, + "step": 20305 + }, + { + "epoch": 0.7, + "learning_rate": 4.034756211630586e-06, + "loss": 0.6633, + "step": 20306 + }, + { + "epoch": 0.7, + "learning_rate": 4.033882329616164e-06, + "loss": 0.6058, + "step": 20307 + }, + { + "epoch": 0.7, + "learning_rate": 4.033008518337622e-06, + "loss": 0.6195, + "step": 20308 + }, + { + "epoch": 0.7, + "learning_rate": 4.032134777805307e-06, + "loss": 0.6307, + "step": 20309 + }, + { + "epoch": 0.7, + "learning_rate": 4.031261108029586e-06, + "loss": 0.6001, + "step": 20310 + }, + { + "epoch": 0.7, + "learning_rate": 4.0303875090208166e-06, + "loss": 0.6723, + "step": 20311 + }, + { + "epoch": 0.7, + "learning_rate": 4.029513980789352e-06, + "loss": 0.6143, + "step": 20312 + }, + { + "epoch": 0.7, + "learning_rate": 4.028640523345553e-06, + "loss": 0.6388, + "step": 20313 + }, + { + "epoch": 0.7, + "learning_rate": 4.027767136699773e-06, + "loss": 0.6111, + "step": 20314 + }, + { + "epoch": 0.7, + "learning_rate": 4.026893820862369e-06, + "loss": 0.6213, + "step": 20315 + }, + { + "epoch": 0.7, + "learning_rate": 4.026020575843698e-06, + "loss": 0.6424, + "step": 20316 + }, + { + "epoch": 0.7, + "learning_rate": 4.025147401654107e-06, + "loss": 0.62, + "step": 20317 + }, + { + "epoch": 0.7, + "learning_rate": 4.024274298303952e-06, + "loss": 0.6123, + "step": 20318 + }, + { + "epoch": 0.7, + "learning_rate": 4.023401265803584e-06, + "loss": 0.6012, + "step": 20319 + }, + { + "epoch": 0.7, + "learning_rate": 4.022528304163355e-06, + "loss": 0.634, + "step": 20320 + }, + { + "epoch": 0.7, + "learning_rate": 4.0216554133936136e-06, + "loss": 0.6728, + "step": 20321 + }, + { + "epoch": 0.7, + "learning_rate": 4.020782593504714e-06, + "loss": 0.5991, + "step": 20322 + }, + { + "epoch": 0.7, + "learning_rate": 4.019909844506996e-06, + "loss": 0.628, + "step": 20323 + }, + { + "epoch": 0.7, + "learning_rate": 4.019037166410813e-06, + "loss": 0.6379, + "step": 20324 + }, + { + "epoch": 0.7, + "learning_rate": 4.018164559226509e-06, + "loss": 0.6009, + "step": 20325 + }, + { + "epoch": 0.7, + "learning_rate": 4.017292022964433e-06, + "loss": 0.6412, + "step": 20326 + }, + { + "epoch": 0.7, + "learning_rate": 4.016419557634927e-06, + "loss": 0.6276, + "step": 20327 + }, + { + "epoch": 0.7, + "learning_rate": 4.015547163248341e-06, + "loss": 0.6062, + "step": 20328 + }, + { + "epoch": 0.7, + "learning_rate": 4.014674839815009e-06, + "loss": 0.5865, + "step": 20329 + }, + { + "epoch": 0.7, + "learning_rate": 4.013802587345279e-06, + "loss": 0.6424, + "step": 20330 + }, + { + "epoch": 0.7, + "learning_rate": 4.012930405849491e-06, + "loss": 0.6567, + "step": 20331 + }, + { + "epoch": 0.7, + "learning_rate": 4.012058295337988e-06, + "loss": 0.6389, + "step": 20332 + }, + { + "epoch": 0.7, + "learning_rate": 4.011186255821108e-06, + "loss": 0.6296, + "step": 20333 + }, + { + "epoch": 0.7, + "learning_rate": 4.010314287309195e-06, + "loss": 0.6241, + "step": 20334 + }, + { + "epoch": 0.7, + "learning_rate": 4.009442389812579e-06, + "loss": 0.6863, + "step": 20335 + }, + { + "epoch": 0.7, + "learning_rate": 4.008570563341601e-06, + "loss": 0.6758, + "step": 20336 + }, + { + "epoch": 0.7, + "learning_rate": 4.007698807906599e-06, + "loss": 0.6636, + "step": 20337 + }, + { + "epoch": 0.7, + "learning_rate": 4.006827123517908e-06, + "loss": 0.5573, + "step": 20338 + }, + { + "epoch": 0.7, + "learning_rate": 4.005955510185862e-06, + "loss": 0.6598, + "step": 20339 + }, + { + "epoch": 0.7, + "learning_rate": 4.0050839679208e-06, + "loss": 0.6342, + "step": 20340 + }, + { + "epoch": 0.7, + "learning_rate": 4.004212496733048e-06, + "loss": 0.6581, + "step": 20341 + }, + { + "epoch": 0.7, + "learning_rate": 4.003341096632941e-06, + "loss": 0.6031, + "step": 20342 + }, + { + "epoch": 0.7, + "learning_rate": 4.002469767630811e-06, + "loss": 0.6335, + "step": 20343 + }, + { + "epoch": 0.7, + "learning_rate": 4.001598509736989e-06, + "loss": 0.6356, + "step": 20344 + }, + { + "epoch": 0.7, + "learning_rate": 4.0007273229618045e-06, + "loss": 0.5756, + "step": 20345 + }, + { + "epoch": 0.7, + "learning_rate": 3.9998562073155914e-06, + "loss": 0.6508, + "step": 20346 + }, + { + "epoch": 0.7, + "learning_rate": 3.998985162808669e-06, + "loss": 0.6467, + "step": 20347 + }, + { + "epoch": 0.71, + "learning_rate": 3.998114189451367e-06, + "loss": 0.6263, + "step": 20348 + }, + { + "epoch": 0.71, + "learning_rate": 3.997243287254017e-06, + "loss": 0.6459, + "step": 20349 + }, + { + "epoch": 0.71, + "learning_rate": 3.996372456226939e-06, + "loss": 0.6243, + "step": 20350 + }, + { + "epoch": 0.71, + "learning_rate": 3.9955016963804604e-06, + "loss": 0.6246, + "step": 20351 + }, + { + "epoch": 0.71, + "learning_rate": 3.99463100772491e-06, + "loss": 0.634, + "step": 20352 + }, + { + "epoch": 0.71, + "learning_rate": 3.9937603902706e-06, + "loss": 0.6437, + "step": 20353 + }, + { + "epoch": 0.71, + "learning_rate": 3.992889844027861e-06, + "loss": 0.6102, + "step": 20354 + }, + { + "epoch": 0.71, + "learning_rate": 3.9920193690070095e-06, + "loss": 0.5704, + "step": 20355 + }, + { + "epoch": 0.71, + "learning_rate": 3.99114896521837e-06, + "loss": 0.6527, + "step": 20356 + }, + { + "epoch": 0.71, + "learning_rate": 3.9902786326722605e-06, + "loss": 0.6461, + "step": 20357 + }, + { + "epoch": 0.71, + "learning_rate": 3.9894083713790035e-06, + "loss": 0.6228, + "step": 20358 + }, + { + "epoch": 0.71, + "learning_rate": 3.98853818134891e-06, + "loss": 0.6092, + "step": 20359 + }, + { + "epoch": 0.71, + "learning_rate": 3.987668062592302e-06, + "loss": 0.6553, + "step": 20360 + }, + { + "epoch": 0.71, + "learning_rate": 3.986798015119493e-06, + "loss": 0.638, + "step": 20361 + }, + { + "epoch": 0.71, + "learning_rate": 3.985928038940802e-06, + "loss": 0.6242, + "step": 20362 + }, + { + "epoch": 0.71, + "learning_rate": 3.9850581340665405e-06, + "loss": 0.6648, + "step": 20363 + }, + { + "epoch": 0.71, + "learning_rate": 3.984188300507028e-06, + "loss": 0.6687, + "step": 20364 + }, + { + "epoch": 0.71, + "learning_rate": 3.983318538272569e-06, + "loss": 0.6731, + "step": 20365 + }, + { + "epoch": 0.71, + "learning_rate": 3.9824488473734814e-06, + "loss": 0.6895, + "step": 20366 + }, + { + "epoch": 0.71, + "learning_rate": 3.981579227820074e-06, + "loss": 0.57, + "step": 20367 + }, + { + "epoch": 0.71, + "learning_rate": 3.980709679622659e-06, + "loss": 0.5959, + "step": 20368 + }, + { + "epoch": 0.71, + "learning_rate": 3.979840202791544e-06, + "loss": 0.5914, + "step": 20369 + }, + { + "epoch": 0.71, + "learning_rate": 3.978970797337043e-06, + "loss": 0.6496, + "step": 20370 + }, + { + "epoch": 0.71, + "learning_rate": 3.9781014632694556e-06, + "loss": 0.701, + "step": 20371 + }, + { + "epoch": 0.71, + "learning_rate": 3.977232200599093e-06, + "loss": 0.6576, + "step": 20372 + }, + { + "epoch": 0.71, + "learning_rate": 3.9763630093362625e-06, + "loss": 0.6981, + "step": 20373 + }, + { + "epoch": 0.71, + "learning_rate": 3.975493889491269e-06, + "loss": 0.6505, + "step": 20374 + }, + { + "epoch": 0.71, + "learning_rate": 3.974624841074419e-06, + "loss": 0.6434, + "step": 20375 + }, + { + "epoch": 0.71, + "learning_rate": 3.97375586409601e-06, + "loss": 0.6584, + "step": 20376 + }, + { + "epoch": 0.71, + "learning_rate": 3.972886958566349e-06, + "loss": 0.6432, + "step": 20377 + }, + { + "epoch": 0.71, + "learning_rate": 3.9720181244957366e-06, + "loss": 0.6022, + "step": 20378 + }, + { + "epoch": 0.71, + "learning_rate": 3.971149361894476e-06, + "loss": 0.652, + "step": 20379 + }, + { + "epoch": 0.71, + "learning_rate": 3.970280670772866e-06, + "loss": 0.598, + "step": 20380 + }, + { + "epoch": 0.71, + "learning_rate": 3.969412051141209e-06, + "loss": 0.6291, + "step": 20381 + }, + { + "epoch": 0.71, + "learning_rate": 3.968543503009798e-06, + "loss": 0.5904, + "step": 20382 + }, + { + "epoch": 0.71, + "learning_rate": 3.967675026388933e-06, + "loss": 0.6206, + "step": 20383 + }, + { + "epoch": 0.71, + "learning_rate": 3.966806621288912e-06, + "loss": 0.6366, + "step": 20384 + }, + { + "epoch": 0.71, + "learning_rate": 3.965938287720031e-06, + "loss": 0.5908, + "step": 20385 + }, + { + "epoch": 0.71, + "learning_rate": 3.965070025692584e-06, + "loss": 0.729, + "step": 20386 + }, + { + "epoch": 0.71, + "learning_rate": 3.9642018352168685e-06, + "loss": 0.5753, + "step": 20387 + }, + { + "epoch": 0.71, + "learning_rate": 3.963333716303174e-06, + "loss": 0.6851, + "step": 20388 + }, + { + "epoch": 0.71, + "learning_rate": 3.962465668961793e-06, + "loss": 0.6365, + "step": 20389 + }, + { + "epoch": 0.71, + "learning_rate": 3.9615976932030206e-06, + "loss": 0.6341, + "step": 20390 + }, + { + "epoch": 0.71, + "learning_rate": 3.960729789037145e-06, + "loss": 0.6367, + "step": 20391 + }, + { + "epoch": 0.71, + "learning_rate": 3.959861956474459e-06, + "loss": 0.6559, + "step": 20392 + }, + { + "epoch": 0.71, + "learning_rate": 3.958994195525253e-06, + "loss": 0.6312, + "step": 20393 + }, + { + "epoch": 0.71, + "learning_rate": 3.958126506199809e-06, + "loss": 0.5851, + "step": 20394 + }, + { + "epoch": 0.71, + "learning_rate": 3.957258888508418e-06, + "loss": 0.5839, + "step": 20395 + }, + { + "epoch": 0.71, + "learning_rate": 3.956391342461368e-06, + "loss": 0.6292, + "step": 20396 + }, + { + "epoch": 0.71, + "learning_rate": 3.955523868068942e-06, + "loss": 0.6164, + "step": 20397 + }, + { + "epoch": 0.71, + "learning_rate": 3.954656465341428e-06, + "loss": 0.6116, + "step": 20398 + }, + { + "epoch": 0.71, + "learning_rate": 3.9537891342891134e-06, + "loss": 0.6103, + "step": 20399 + }, + { + "epoch": 0.71, + "learning_rate": 3.9529218749222734e-06, + "loss": 0.6518, + "step": 20400 + }, + { + "epoch": 0.71, + "learning_rate": 3.952054687251193e-06, + "loss": 0.6523, + "step": 20401 + }, + { + "epoch": 0.71, + "learning_rate": 3.951187571286156e-06, + "loss": 0.6238, + "step": 20402 + }, + { + "epoch": 0.71, + "learning_rate": 3.950320527037441e-06, + "loss": 0.5679, + "step": 20403 + }, + { + "epoch": 0.71, + "learning_rate": 3.94945355451533e-06, + "loss": 0.5808, + "step": 20404 + }, + { + "epoch": 0.71, + "learning_rate": 3.948586653730105e-06, + "loss": 0.6632, + "step": 20405 + }, + { + "epoch": 0.71, + "learning_rate": 3.947719824692035e-06, + "loss": 0.7228, + "step": 20406 + }, + { + "epoch": 0.71, + "learning_rate": 3.9468530674114034e-06, + "loss": 0.6272, + "step": 20407 + }, + { + "epoch": 0.71, + "learning_rate": 3.9459863818984864e-06, + "loss": 0.6481, + "step": 20408 + }, + { + "epoch": 0.71, + "learning_rate": 3.945119768163559e-06, + "loss": 0.6804, + "step": 20409 + }, + { + "epoch": 0.71, + "learning_rate": 3.944253226216896e-06, + "loss": 0.6106, + "step": 20410 + }, + { + "epoch": 0.71, + "learning_rate": 3.943386756068776e-06, + "loss": 0.5714, + "step": 20411 + }, + { + "epoch": 0.71, + "learning_rate": 3.942520357729464e-06, + "loss": 0.6681, + "step": 20412 + }, + { + "epoch": 0.71, + "learning_rate": 3.941654031209235e-06, + "loss": 0.6467, + "step": 20413 + }, + { + "epoch": 0.71, + "learning_rate": 3.9407877765183615e-06, + "loss": 0.6729, + "step": 20414 + }, + { + "epoch": 0.71, + "learning_rate": 3.939921593667114e-06, + "loss": 0.6892, + "step": 20415 + }, + { + "epoch": 0.71, + "learning_rate": 3.939055482665762e-06, + "loss": 0.6244, + "step": 20416 + }, + { + "epoch": 0.71, + "learning_rate": 3.938189443524578e-06, + "loss": 0.6796, + "step": 20417 + }, + { + "epoch": 0.71, + "learning_rate": 3.937323476253822e-06, + "loss": 0.6434, + "step": 20418 + }, + { + "epoch": 0.71, + "learning_rate": 3.936457580863767e-06, + "loss": 0.5862, + "step": 20419 + }, + { + "epoch": 0.71, + "learning_rate": 3.935591757364677e-06, + "loss": 0.6358, + "step": 20420 + }, + { + "epoch": 0.71, + "learning_rate": 3.934726005766819e-06, + "loss": 0.623, + "step": 20421 + }, + { + "epoch": 0.71, + "learning_rate": 3.933860326080456e-06, + "loss": 0.6507, + "step": 20422 + }, + { + "epoch": 0.71, + "learning_rate": 3.932994718315857e-06, + "loss": 0.6345, + "step": 20423 + }, + { + "epoch": 0.71, + "learning_rate": 3.932129182483275e-06, + "loss": 0.627, + "step": 20424 + }, + { + "epoch": 0.71, + "learning_rate": 3.931263718592979e-06, + "loss": 0.6411, + "step": 20425 + }, + { + "epoch": 0.71, + "learning_rate": 3.930398326655228e-06, + "loss": 0.6984, + "step": 20426 + }, + { + "epoch": 0.71, + "learning_rate": 3.929533006680284e-06, + "loss": 0.6464, + "step": 20427 + }, + { + "epoch": 0.71, + "learning_rate": 3.928667758678404e-06, + "loss": 0.5991, + "step": 20428 + }, + { + "epoch": 0.71, + "learning_rate": 3.927802582659852e-06, + "loss": 0.6358, + "step": 20429 + }, + { + "epoch": 0.71, + "learning_rate": 3.926937478634879e-06, + "loss": 0.6444, + "step": 20430 + }, + { + "epoch": 0.71, + "learning_rate": 3.926072446613744e-06, + "loss": 0.6223, + "step": 20431 + }, + { + "epoch": 0.71, + "learning_rate": 3.925207486606704e-06, + "loss": 0.6461, + "step": 20432 + }, + { + "epoch": 0.71, + "learning_rate": 3.924342598624012e-06, + "loss": 0.6486, + "step": 20433 + }, + { + "epoch": 0.71, + "learning_rate": 3.923477782675926e-06, + "loss": 0.637, + "step": 20434 + }, + { + "epoch": 0.71, + "learning_rate": 3.922613038772701e-06, + "loss": 0.6618, + "step": 20435 + }, + { + "epoch": 0.71, + "learning_rate": 3.9217483669245834e-06, + "loss": 0.6277, + "step": 20436 + }, + { + "epoch": 0.71, + "learning_rate": 3.920883767141831e-06, + "loss": 0.6729, + "step": 20437 + }, + { + "epoch": 0.71, + "learning_rate": 3.920019239434684e-06, + "loss": 0.6156, + "step": 20438 + }, + { + "epoch": 0.71, + "learning_rate": 3.9191547838134046e-06, + "loss": 0.6337, + "step": 20439 + }, + { + "epoch": 0.71, + "learning_rate": 3.91829040028824e-06, + "loss": 0.64, + "step": 20440 + }, + { + "epoch": 0.71, + "learning_rate": 3.917426088869434e-06, + "loss": 0.6171, + "step": 20441 + }, + { + "epoch": 0.71, + "learning_rate": 3.916561849567235e-06, + "loss": 0.6666, + "step": 20442 + }, + { + "epoch": 0.71, + "learning_rate": 3.915697682391895e-06, + "loss": 0.5972, + "step": 20443 + }, + { + "epoch": 0.71, + "learning_rate": 3.914833587353649e-06, + "loss": 0.5728, + "step": 20444 + }, + { + "epoch": 0.71, + "learning_rate": 3.913969564462752e-06, + "loss": 0.6056, + "step": 20445 + }, + { + "epoch": 0.71, + "learning_rate": 3.913105613729448e-06, + "loss": 0.6709, + "step": 20446 + }, + { + "epoch": 0.71, + "learning_rate": 3.912241735163973e-06, + "loss": 0.6832, + "step": 20447 + }, + { + "epoch": 0.71, + "learning_rate": 3.911377928776573e-06, + "loss": 0.6663, + "step": 20448 + }, + { + "epoch": 0.71, + "learning_rate": 3.910514194577494e-06, + "loss": 0.6459, + "step": 20449 + }, + { + "epoch": 0.71, + "learning_rate": 3.9096505325769655e-06, + "loss": 0.6665, + "step": 20450 + }, + { + "epoch": 0.71, + "learning_rate": 3.908786942785237e-06, + "loss": 0.6137, + "step": 20451 + }, + { + "epoch": 0.71, + "learning_rate": 3.9079234252125486e-06, + "loss": 0.6665, + "step": 20452 + }, + { + "epoch": 0.71, + "learning_rate": 3.907059979869131e-06, + "loss": 0.6434, + "step": 20453 + }, + { + "epoch": 0.71, + "learning_rate": 3.906196606765225e-06, + "loss": 0.6642, + "step": 20454 + }, + { + "epoch": 0.71, + "learning_rate": 3.905333305911071e-06, + "loss": 0.6409, + "step": 20455 + }, + { + "epoch": 0.71, + "learning_rate": 3.904470077316893e-06, + "loss": 0.6115, + "step": 20456 + }, + { + "epoch": 0.71, + "learning_rate": 3.903606920992936e-06, + "loss": 0.6613, + "step": 20457 + }, + { + "epoch": 0.71, + "learning_rate": 3.902743836949435e-06, + "loss": 0.6464, + "step": 20458 + }, + { + "epoch": 0.71, + "learning_rate": 3.901880825196616e-06, + "loss": 0.661, + "step": 20459 + }, + { + "epoch": 0.71, + "learning_rate": 3.901017885744713e-06, + "loss": 0.6553, + "step": 20460 + }, + { + "epoch": 0.71, + "learning_rate": 3.900155018603963e-06, + "loss": 0.6234, + "step": 20461 + }, + { + "epoch": 0.71, + "learning_rate": 3.899292223784583e-06, + "loss": 0.5634, + "step": 20462 + }, + { + "epoch": 0.71, + "learning_rate": 3.898429501296816e-06, + "loss": 0.6309, + "step": 20463 + }, + { + "epoch": 0.71, + "learning_rate": 3.897566851150888e-06, + "loss": 0.6015, + "step": 20464 + }, + { + "epoch": 0.71, + "learning_rate": 3.896704273357022e-06, + "loss": 0.6276, + "step": 20465 + }, + { + "epoch": 0.71, + "learning_rate": 3.895841767925447e-06, + "loss": 0.62, + "step": 20466 + }, + { + "epoch": 0.71, + "learning_rate": 3.894979334866393e-06, + "loss": 0.6539, + "step": 20467 + }, + { + "epoch": 0.71, + "learning_rate": 3.8941169741900755e-06, + "loss": 0.6479, + "step": 20468 + }, + { + "epoch": 0.71, + "learning_rate": 3.893254685906729e-06, + "loss": 0.5766, + "step": 20469 + }, + { + "epoch": 0.71, + "learning_rate": 3.892392470026576e-06, + "loss": 0.5971, + "step": 20470 + }, + { + "epoch": 0.71, + "learning_rate": 3.891530326559833e-06, + "loss": 0.5896, + "step": 20471 + }, + { + "epoch": 0.71, + "learning_rate": 3.890668255516725e-06, + "loss": 0.6777, + "step": 20472 + }, + { + "epoch": 0.71, + "learning_rate": 3.889806256907478e-06, + "loss": 0.6099, + "step": 20473 + }, + { + "epoch": 0.71, + "learning_rate": 3.888944330742299e-06, + "loss": 0.625, + "step": 20474 + }, + { + "epoch": 0.71, + "learning_rate": 3.88808247703142e-06, + "loss": 0.6141, + "step": 20475 + }, + { + "epoch": 0.71, + "learning_rate": 3.887220695785056e-06, + "loss": 0.6374, + "step": 20476 + }, + { + "epoch": 0.71, + "learning_rate": 3.886358987013422e-06, + "loss": 0.615, + "step": 20477 + }, + { + "epoch": 0.71, + "learning_rate": 3.885497350726736e-06, + "loss": 0.6291, + "step": 20478 + }, + { + "epoch": 0.71, + "learning_rate": 3.884635786935217e-06, + "loss": 0.6826, + "step": 20479 + }, + { + "epoch": 0.71, + "learning_rate": 3.88377429564907e-06, + "loss": 0.6251, + "step": 20480 + }, + { + "epoch": 0.71, + "learning_rate": 3.882912876878518e-06, + "loss": 0.6302, + "step": 20481 + }, + { + "epoch": 0.71, + "learning_rate": 3.882051530633777e-06, + "loss": 0.615, + "step": 20482 + }, + { + "epoch": 0.71, + "learning_rate": 3.88119025692505e-06, + "loss": 0.6638, + "step": 20483 + }, + { + "epoch": 0.71, + "learning_rate": 3.880329055762552e-06, + "loss": 0.6429, + "step": 20484 + }, + { + "epoch": 0.71, + "learning_rate": 3.8794679271565004e-06, + "loss": 0.605, + "step": 20485 + }, + { + "epoch": 0.71, + "learning_rate": 3.878606871117091e-06, + "loss": 0.6562, + "step": 20486 + }, + { + "epoch": 0.71, + "learning_rate": 3.877745887654544e-06, + "loss": 0.6484, + "step": 20487 + }, + { + "epoch": 0.71, + "learning_rate": 3.876884976779068e-06, + "loss": 0.6186, + "step": 20488 + }, + { + "epoch": 0.71, + "learning_rate": 3.8760241385008615e-06, + "loss": 0.666, + "step": 20489 + }, + { + "epoch": 0.71, + "learning_rate": 3.8751633728301375e-06, + "loss": 0.5905, + "step": 20490 + }, + { + "epoch": 0.71, + "learning_rate": 3.874302679777102e-06, + "loss": 0.5989, + "step": 20491 + }, + { + "epoch": 0.71, + "learning_rate": 3.873442059351951e-06, + "loss": 0.6082, + "step": 20492 + }, + { + "epoch": 0.71, + "learning_rate": 3.872581511564897e-06, + "loss": 0.6635, + "step": 20493 + }, + { + "epoch": 0.71, + "learning_rate": 3.871721036426145e-06, + "loss": 0.5939, + "step": 20494 + }, + { + "epoch": 0.71, + "learning_rate": 3.870860633945889e-06, + "loss": 0.603, + "step": 20495 + }, + { + "epoch": 0.71, + "learning_rate": 3.870000304134332e-06, + "loss": 0.5993, + "step": 20496 + }, + { + "epoch": 0.71, + "learning_rate": 3.8691400470016806e-06, + "loss": 0.6029, + "step": 20497 + }, + { + "epoch": 0.71, + "learning_rate": 3.8682798625581234e-06, + "loss": 0.5999, + "step": 20498 + }, + { + "epoch": 0.71, + "learning_rate": 3.86741975081387e-06, + "loss": 0.62, + "step": 20499 + }, + { + "epoch": 0.71, + "learning_rate": 3.866559711779111e-06, + "loss": 0.6952, + "step": 20500 + }, + { + "epoch": 0.71, + "learning_rate": 3.865699745464046e-06, + "loss": 0.6264, + "step": 20501 + }, + { + "epoch": 0.71, + "learning_rate": 3.864839851878873e-06, + "loss": 0.6495, + "step": 20502 + }, + { + "epoch": 0.71, + "learning_rate": 3.86398003103378e-06, + "loss": 0.6258, + "step": 20503 + }, + { + "epoch": 0.71, + "learning_rate": 3.863120282938965e-06, + "loss": 0.6737, + "step": 20504 + }, + { + "epoch": 0.71, + "learning_rate": 3.8622606076046276e-06, + "loss": 0.6345, + "step": 20505 + }, + { + "epoch": 0.71, + "learning_rate": 3.861401005040951e-06, + "loss": 0.6075, + "step": 20506 + }, + { + "epoch": 0.71, + "learning_rate": 3.860541475258133e-06, + "loss": 0.6312, + "step": 20507 + }, + { + "epoch": 0.71, + "learning_rate": 3.859682018266364e-06, + "loss": 0.6184, + "step": 20508 + }, + { + "epoch": 0.71, + "learning_rate": 3.858822634075828e-06, + "loss": 0.6209, + "step": 20509 + }, + { + "epoch": 0.71, + "learning_rate": 3.857963322696716e-06, + "loss": 0.6805, + "step": 20510 + }, + { + "epoch": 0.71, + "learning_rate": 3.857104084139226e-06, + "loss": 0.6105, + "step": 20511 + }, + { + "epoch": 0.71, + "learning_rate": 3.856244918413534e-06, + "loss": 0.6128, + "step": 20512 + }, + { + "epoch": 0.71, + "learning_rate": 3.85538582552983e-06, + "loss": 0.6657, + "step": 20513 + }, + { + "epoch": 0.71, + "learning_rate": 3.854526805498304e-06, + "loss": 0.6607, + "step": 20514 + }, + { + "epoch": 0.71, + "learning_rate": 3.853667858329133e-06, + "loss": 0.6449, + "step": 20515 + }, + { + "epoch": 0.71, + "learning_rate": 3.852808984032501e-06, + "loss": 0.6525, + "step": 20516 + }, + { + "epoch": 0.71, + "learning_rate": 3.851950182618602e-06, + "loss": 0.6322, + "step": 20517 + }, + { + "epoch": 0.71, + "learning_rate": 3.851091454097608e-06, + "loss": 0.6542, + "step": 20518 + }, + { + "epoch": 0.71, + "learning_rate": 3.850232798479702e-06, + "loss": 0.6105, + "step": 20519 + }, + { + "epoch": 0.71, + "learning_rate": 3.849374215775069e-06, + "loss": 0.6855, + "step": 20520 + }, + { + "epoch": 0.71, + "learning_rate": 3.848515705993882e-06, + "loss": 0.6121, + "step": 20521 + }, + { + "epoch": 0.71, + "learning_rate": 3.847657269146321e-06, + "loss": 0.5787, + "step": 20522 + }, + { + "epoch": 0.71, + "learning_rate": 3.8467989052425715e-06, + "loss": 0.6363, + "step": 20523 + }, + { + "epoch": 0.71, + "learning_rate": 3.8459406142928015e-06, + "loss": 0.6392, + "step": 20524 + }, + { + "epoch": 0.71, + "learning_rate": 3.84508239630719e-06, + "loss": 0.5958, + "step": 20525 + }, + { + "epoch": 0.71, + "learning_rate": 3.844224251295917e-06, + "loss": 0.6715, + "step": 20526 + }, + { + "epoch": 0.71, + "learning_rate": 3.843366179269149e-06, + "loss": 0.6151, + "step": 20527 + }, + { + "epoch": 0.71, + "learning_rate": 3.8425081802370605e-06, + "loss": 0.6552, + "step": 20528 + }, + { + "epoch": 0.71, + "learning_rate": 3.841650254209832e-06, + "loss": 0.6423, + "step": 20529 + }, + { + "epoch": 0.71, + "learning_rate": 3.840792401197628e-06, + "loss": 0.6447, + "step": 20530 + }, + { + "epoch": 0.71, + "learning_rate": 3.83993462121062e-06, + "loss": 0.5952, + "step": 20531 + }, + { + "epoch": 0.71, + "learning_rate": 3.839076914258984e-06, + "loss": 0.6899, + "step": 20532 + }, + { + "epoch": 0.71, + "learning_rate": 3.838219280352882e-06, + "loss": 0.6146, + "step": 20533 + }, + { + "epoch": 0.71, + "learning_rate": 3.837361719502484e-06, + "loss": 0.6187, + "step": 20534 + }, + { + "epoch": 0.71, + "learning_rate": 3.836504231717959e-06, + "loss": 0.6139, + "step": 20535 + }, + { + "epoch": 0.71, + "learning_rate": 3.835646817009473e-06, + "loss": 0.625, + "step": 20536 + }, + { + "epoch": 0.71, + "learning_rate": 3.834789475387192e-06, + "loss": 0.6824, + "step": 20537 + }, + { + "epoch": 0.71, + "learning_rate": 3.833932206861284e-06, + "loss": 0.6383, + "step": 20538 + }, + { + "epoch": 0.71, + "learning_rate": 3.833075011441907e-06, + "loss": 0.6048, + "step": 20539 + }, + { + "epoch": 0.71, + "learning_rate": 3.832217889139226e-06, + "loss": 0.6357, + "step": 20540 + }, + { + "epoch": 0.71, + "learning_rate": 3.831360839963405e-06, + "loss": 0.6559, + "step": 20541 + }, + { + "epoch": 0.71, + "learning_rate": 3.830503863924605e-06, + "loss": 0.6193, + "step": 20542 + }, + { + "epoch": 0.71, + "learning_rate": 3.829646961032985e-06, + "loss": 0.6382, + "step": 20543 + }, + { + "epoch": 0.71, + "learning_rate": 3.82879013129871e-06, + "loss": 0.6052, + "step": 20544 + }, + { + "epoch": 0.71, + "learning_rate": 3.827933374731932e-06, + "loss": 0.637, + "step": 20545 + }, + { + "epoch": 0.71, + "learning_rate": 3.827076691342809e-06, + "loss": 0.6132, + "step": 20546 + }, + { + "epoch": 0.71, + "learning_rate": 3.826220081141503e-06, + "loss": 0.664, + "step": 20547 + }, + { + "epoch": 0.71, + "learning_rate": 3.825363544138166e-06, + "loss": 0.6092, + "step": 20548 + }, + { + "epoch": 0.71, + "learning_rate": 3.8245070803429575e-06, + "loss": 0.6166, + "step": 20549 + }, + { + "epoch": 0.71, + "learning_rate": 3.823650689766031e-06, + "loss": 0.6211, + "step": 20550 + }, + { + "epoch": 0.71, + "learning_rate": 3.822794372417537e-06, + "loss": 0.6383, + "step": 20551 + }, + { + "epoch": 0.71, + "learning_rate": 3.821938128307629e-06, + "loss": 0.6437, + "step": 20552 + }, + { + "epoch": 0.71, + "learning_rate": 3.821081957446459e-06, + "loss": 0.6748, + "step": 20553 + }, + { + "epoch": 0.71, + "learning_rate": 3.820225859844179e-06, + "loss": 0.6312, + "step": 20554 + }, + { + "epoch": 0.71, + "learning_rate": 3.819369835510939e-06, + "loss": 0.621, + "step": 20555 + }, + { + "epoch": 0.71, + "learning_rate": 3.818513884456893e-06, + "loss": 0.6102, + "step": 20556 + }, + { + "epoch": 0.71, + "learning_rate": 3.817658006692179e-06, + "loss": 0.6626, + "step": 20557 + }, + { + "epoch": 0.71, + "learning_rate": 3.816802202226951e-06, + "loss": 0.6857, + "step": 20558 + }, + { + "epoch": 0.71, + "learning_rate": 3.815946471071355e-06, + "loss": 0.6637, + "step": 20559 + }, + { + "epoch": 0.71, + "learning_rate": 3.815090813235536e-06, + "loss": 0.6397, + "step": 20560 + }, + { + "epoch": 0.71, + "learning_rate": 3.8142352287296424e-06, + "loss": 0.6202, + "step": 20561 + }, + { + "epoch": 0.71, + "learning_rate": 3.8133797175638133e-06, + "loss": 0.6742, + "step": 20562 + }, + { + "epoch": 0.71, + "learning_rate": 3.8125242797481923e-06, + "loss": 0.6231, + "step": 20563 + }, + { + "epoch": 0.71, + "learning_rate": 3.8116689152929233e-06, + "loss": 0.6346, + "step": 20564 + }, + { + "epoch": 0.71, + "learning_rate": 3.8108136242081485e-06, + "loss": 0.6823, + "step": 20565 + }, + { + "epoch": 0.71, + "learning_rate": 3.8099584065040062e-06, + "loss": 0.6098, + "step": 20566 + }, + { + "epoch": 0.71, + "learning_rate": 3.809103262190642e-06, + "loss": 0.6414, + "step": 20567 + }, + { + "epoch": 0.71, + "learning_rate": 3.8082481912781866e-06, + "loss": 0.6136, + "step": 20568 + }, + { + "epoch": 0.71, + "learning_rate": 3.8073931937767804e-06, + "loss": 0.6407, + "step": 20569 + }, + { + "epoch": 0.71, + "learning_rate": 3.8065382696965623e-06, + "loss": 0.6084, + "step": 20570 + }, + { + "epoch": 0.71, + "learning_rate": 3.8056834190476676e-06, + "loss": 0.648, + "step": 20571 + }, + { + "epoch": 0.71, + "learning_rate": 3.8048286418402325e-06, + "loss": 0.616, + "step": 20572 + }, + { + "epoch": 0.71, + "learning_rate": 3.803973938084394e-06, + "loss": 0.6017, + "step": 20573 + }, + { + "epoch": 0.71, + "learning_rate": 3.8031193077902783e-06, + "loss": 0.6433, + "step": 20574 + }, + { + "epoch": 0.71, + "learning_rate": 3.8022647509680234e-06, + "loss": 0.6379, + "step": 20575 + }, + { + "epoch": 0.71, + "learning_rate": 3.8014102676277596e-06, + "loss": 0.625, + "step": 20576 + }, + { + "epoch": 0.71, + "learning_rate": 3.800555857779619e-06, + "loss": 0.6749, + "step": 20577 + }, + { + "epoch": 0.71, + "learning_rate": 3.7997015214337297e-06, + "loss": 0.6382, + "step": 20578 + }, + { + "epoch": 0.71, + "learning_rate": 3.798847258600226e-06, + "loss": 0.6014, + "step": 20579 + }, + { + "epoch": 0.71, + "learning_rate": 3.7979930692892296e-06, + "loss": 0.666, + "step": 20580 + }, + { + "epoch": 0.71, + "learning_rate": 3.7971389535108703e-06, + "loss": 0.6245, + "step": 20581 + }, + { + "epoch": 0.71, + "learning_rate": 3.7962849112752764e-06, + "loss": 0.6209, + "step": 20582 + }, + { + "epoch": 0.71, + "learning_rate": 3.795430942592572e-06, + "loss": 0.6014, + "step": 20583 + }, + { + "epoch": 0.71, + "learning_rate": 3.7945770474728827e-06, + "loss": 0.6832, + "step": 20584 + }, + { + "epoch": 0.71, + "learning_rate": 3.7937232259263356e-06, + "loss": 0.6576, + "step": 20585 + }, + { + "epoch": 0.71, + "learning_rate": 3.792869477963047e-06, + "loss": 0.5455, + "step": 20586 + }, + { + "epoch": 0.71, + "learning_rate": 3.792015803593143e-06, + "loss": 0.616, + "step": 20587 + }, + { + "epoch": 0.71, + "learning_rate": 3.7911622028267458e-06, + "loss": 0.6536, + "step": 20588 + }, + { + "epoch": 0.71, + "learning_rate": 3.7903086756739737e-06, + "loss": 0.6512, + "step": 20589 + }, + { + "epoch": 0.71, + "learning_rate": 3.7894552221449475e-06, + "loss": 0.5535, + "step": 20590 + }, + { + "epoch": 0.71, + "learning_rate": 3.7886018422497906e-06, + "loss": 0.667, + "step": 20591 + }, + { + "epoch": 0.71, + "learning_rate": 3.787748535998612e-06, + "loss": 0.6146, + "step": 20592 + }, + { + "epoch": 0.71, + "learning_rate": 3.786895303401533e-06, + "loss": 0.6331, + "step": 20593 + }, + { + "epoch": 0.71, + "learning_rate": 3.78604214446867e-06, + "loss": 0.6339, + "step": 20594 + }, + { + "epoch": 0.71, + "learning_rate": 3.7851890592101383e-06, + "loss": 0.6578, + "step": 20595 + }, + { + "epoch": 0.71, + "learning_rate": 3.7843360476360514e-06, + "loss": 0.6689, + "step": 20596 + }, + { + "epoch": 0.71, + "learning_rate": 3.7834831097565274e-06, + "loss": 0.6334, + "step": 20597 + }, + { + "epoch": 0.71, + "learning_rate": 3.7826302455816723e-06, + "loss": 0.5645, + "step": 20598 + }, + { + "epoch": 0.71, + "learning_rate": 3.781777455121599e-06, + "loss": 0.6217, + "step": 20599 + }, + { + "epoch": 0.71, + "learning_rate": 3.7809247383864213e-06, + "loss": 0.6513, + "step": 20600 + }, + { + "epoch": 0.71, + "learning_rate": 3.780072095386248e-06, + "loss": 0.6534, + "step": 20601 + }, + { + "epoch": 0.71, + "learning_rate": 3.779219526131188e-06, + "loss": 0.5742, + "step": 20602 + }, + { + "epoch": 0.71, + "learning_rate": 3.7783670306313535e-06, + "loss": 0.6416, + "step": 20603 + }, + { + "epoch": 0.71, + "learning_rate": 3.777514608896844e-06, + "loss": 0.6096, + "step": 20604 + }, + { + "epoch": 0.71, + "learning_rate": 3.776662260937771e-06, + "loss": 0.6648, + "step": 20605 + }, + { + "epoch": 0.71, + "learning_rate": 3.7758099867642396e-06, + "loss": 0.6246, + "step": 20606 + }, + { + "epoch": 0.71, + "learning_rate": 3.774957786386354e-06, + "loss": 0.6789, + "step": 20607 + }, + { + "epoch": 0.71, + "learning_rate": 3.7741056598142188e-06, + "loss": 0.6462, + "step": 20608 + }, + { + "epoch": 0.71, + "learning_rate": 3.7732536070579408e-06, + "loss": 0.6234, + "step": 20609 + }, + { + "epoch": 0.71, + "learning_rate": 3.7724016281276145e-06, + "loss": 0.6504, + "step": 20610 + }, + { + "epoch": 0.71, + "learning_rate": 3.771549723033344e-06, + "loss": 0.6361, + "step": 20611 + }, + { + "epoch": 0.71, + "learning_rate": 3.770697891785231e-06, + "loss": 0.6277, + "step": 20612 + }, + { + "epoch": 0.71, + "learning_rate": 3.7698461343933745e-06, + "loss": 0.6387, + "step": 20613 + }, + { + "epoch": 0.71, + "learning_rate": 3.768994450867873e-06, + "loss": 0.6082, + "step": 20614 + }, + { + "epoch": 0.71, + "learning_rate": 3.768142841218829e-06, + "loss": 0.6738, + "step": 20615 + }, + { + "epoch": 0.71, + "learning_rate": 3.767291305456331e-06, + "loss": 0.6481, + "step": 20616 + }, + { + "epoch": 0.71, + "learning_rate": 3.7664398435904792e-06, + "loss": 0.6598, + "step": 20617 + }, + { + "epoch": 0.71, + "learning_rate": 3.7655884556313683e-06, + "loss": 0.6087, + "step": 20618 + }, + { + "epoch": 0.71, + "learning_rate": 3.764737141589092e-06, + "loss": 0.5652, + "step": 20619 + }, + { + "epoch": 0.71, + "learning_rate": 3.763885901473746e-06, + "loss": 0.5698, + "step": 20620 + }, + { + "epoch": 0.71, + "learning_rate": 3.763034735295423e-06, + "loss": 0.6703, + "step": 20621 + }, + { + "epoch": 0.71, + "learning_rate": 3.7621836430642113e-06, + "loss": 0.6468, + "step": 20622 + }, + { + "epoch": 0.71, + "learning_rate": 3.7613326247902026e-06, + "loss": 0.6164, + "step": 20623 + }, + { + "epoch": 0.71, + "learning_rate": 3.7604816804834875e-06, + "loss": 0.6142, + "step": 20624 + }, + { + "epoch": 0.71, + "learning_rate": 3.7596308101541555e-06, + "loss": 0.6306, + "step": 20625 + }, + { + "epoch": 0.71, + "learning_rate": 3.758780013812299e-06, + "loss": 0.6366, + "step": 20626 + }, + { + "epoch": 0.71, + "learning_rate": 3.7579292914679956e-06, + "loss": 0.6786, + "step": 20627 + }, + { + "epoch": 0.71, + "learning_rate": 3.757078643131337e-06, + "loss": 0.6219, + "step": 20628 + }, + { + "epoch": 0.71, + "learning_rate": 3.7562280688124074e-06, + "loss": 0.6284, + "step": 20629 + }, + { + "epoch": 0.71, + "learning_rate": 3.7553775685212933e-06, + "loss": 0.6596, + "step": 20630 + }, + { + "epoch": 0.71, + "learning_rate": 3.7545271422680785e-06, + "loss": 0.6557, + "step": 20631 + }, + { + "epoch": 0.71, + "learning_rate": 3.7536767900628478e-06, + "loss": 0.5962, + "step": 20632 + }, + { + "epoch": 0.71, + "learning_rate": 3.752826511915677e-06, + "loss": 0.5683, + "step": 20633 + }, + { + "epoch": 0.71, + "learning_rate": 3.75197630783665e-06, + "loss": 0.6449, + "step": 20634 + }, + { + "epoch": 0.71, + "learning_rate": 3.7511261778358487e-06, + "loss": 0.6702, + "step": 20635 + }, + { + "epoch": 0.71, + "learning_rate": 3.7502761219233506e-06, + "loss": 0.5866, + "step": 20636 + }, + { + "epoch": 0.72, + "learning_rate": 3.7494261401092346e-06, + "loss": 0.6358, + "step": 20637 + }, + { + "epoch": 0.72, + "learning_rate": 3.7485762324035834e-06, + "loss": 0.6698, + "step": 20638 + }, + { + "epoch": 0.72, + "learning_rate": 3.7477263988164648e-06, + "loss": 0.6456, + "step": 20639 + }, + { + "epoch": 0.72, + "learning_rate": 3.7468766393579592e-06, + "loss": 0.6127, + "step": 20640 + }, + { + "epoch": 0.72, + "learning_rate": 3.746026954038141e-06, + "loss": 0.6078, + "step": 20641 + }, + { + "epoch": 0.72, + "learning_rate": 3.7451773428670855e-06, + "loss": 0.6454, + "step": 20642 + }, + { + "epoch": 0.72, + "learning_rate": 3.7443278058548636e-06, + "loss": 0.6323, + "step": 20643 + }, + { + "epoch": 0.72, + "learning_rate": 3.743478343011554e-06, + "loss": 0.6553, + "step": 20644 + }, + { + "epoch": 0.72, + "learning_rate": 3.7426289543472185e-06, + "loss": 0.6369, + "step": 20645 + }, + { + "epoch": 0.72, + "learning_rate": 3.741779639871933e-06, + "loss": 0.6399, + "step": 20646 + }, + { + "epoch": 0.72, + "learning_rate": 3.7409303995957656e-06, + "loss": 0.6278, + "step": 20647 + }, + { + "epoch": 0.72, + "learning_rate": 3.7400812335287874e-06, + "loss": 0.701, + "step": 20648 + }, + { + "epoch": 0.72, + "learning_rate": 3.7392321416810638e-06, + "loss": 0.6286, + "step": 20649 + }, + { + "epoch": 0.72, + "learning_rate": 3.738383124062668e-06, + "loss": 0.6207, + "step": 20650 + }, + { + "epoch": 0.72, + "learning_rate": 3.7375341806836573e-06, + "loss": 0.647, + "step": 20651 + }, + { + "epoch": 0.72, + "learning_rate": 3.7366853115541e-06, + "loss": 0.6251, + "step": 20652 + }, + { + "epoch": 0.72, + "learning_rate": 3.7358365166840627e-06, + "loss": 0.6075, + "step": 20653 + }, + { + "epoch": 0.72, + "learning_rate": 3.734987796083607e-06, + "loss": 0.5808, + "step": 20654 + }, + { + "epoch": 0.72, + "learning_rate": 3.7341391497627955e-06, + "loss": 0.6684, + "step": 20655 + }, + { + "epoch": 0.72, + "learning_rate": 3.7332905777316954e-06, + "loss": 0.6045, + "step": 20656 + }, + { + "epoch": 0.72, + "learning_rate": 3.732442080000359e-06, + "loss": 0.602, + "step": 20657 + }, + { + "epoch": 0.72, + "learning_rate": 3.7315936565788503e-06, + "loss": 0.6225, + "step": 20658 + }, + { + "epoch": 0.72, + "learning_rate": 3.7307453074772284e-06, + "loss": 0.6789, + "step": 20659 + }, + { + "epoch": 0.72, + "learning_rate": 3.7298970327055517e-06, + "loss": 0.6451, + "step": 20660 + }, + { + "epoch": 0.72, + "learning_rate": 3.729048832273877e-06, + "loss": 0.6776, + "step": 20661 + }, + { + "epoch": 0.72, + "learning_rate": 3.7282007061922654e-06, + "loss": 0.6141, + "step": 20662 + }, + { + "epoch": 0.72, + "learning_rate": 3.727352654470764e-06, + "loss": 0.6129, + "step": 20663 + }, + { + "epoch": 0.72, + "learning_rate": 3.7265046771194322e-06, + "loss": 0.5679, + "step": 20664 + }, + { + "epoch": 0.72, + "learning_rate": 3.7256567741483242e-06, + "loss": 0.6986, + "step": 20665 + }, + { + "epoch": 0.72, + "learning_rate": 3.7248089455674905e-06, + "loss": 0.6739, + "step": 20666 + }, + { + "epoch": 0.72, + "learning_rate": 3.7239611913869867e-06, + "loss": 0.611, + "step": 20667 + }, + { + "epoch": 0.72, + "learning_rate": 3.723113511616865e-06, + "loss": 0.6951, + "step": 20668 + }, + { + "epoch": 0.72, + "learning_rate": 3.7222659062671683e-06, + "loss": 0.5668, + "step": 20669 + }, + { + "epoch": 0.72, + "learning_rate": 3.7214183753479517e-06, + "loss": 0.6469, + "step": 20670 + }, + { + "epoch": 0.72, + "learning_rate": 3.720570918869263e-06, + "loss": 0.6869, + "step": 20671 + }, + { + "epoch": 0.72, + "learning_rate": 3.719723536841149e-06, + "loss": 0.631, + "step": 20672 + }, + { + "epoch": 0.72, + "learning_rate": 3.718876229273658e-06, + "loss": 0.6355, + "step": 20673 + }, + { + "epoch": 0.72, + "learning_rate": 3.7180289961768367e-06, + "loss": 0.6257, + "step": 20674 + }, + { + "epoch": 0.72, + "learning_rate": 3.717181837560726e-06, + "loss": 0.5925, + "step": 20675 + }, + { + "epoch": 0.72, + "learning_rate": 3.7163347534353733e-06, + "loss": 0.6017, + "step": 20676 + }, + { + "epoch": 0.72, + "learning_rate": 3.7154877438108193e-06, + "loss": 0.6536, + "step": 20677 + }, + { + "epoch": 0.72, + "learning_rate": 3.7146408086971087e-06, + "loss": 0.6109, + "step": 20678 + }, + { + "epoch": 0.72, + "learning_rate": 3.713793948104283e-06, + "loss": 0.6467, + "step": 20679 + }, + { + "epoch": 0.72, + "learning_rate": 3.712947162042385e-06, + "loss": 0.5761, + "step": 20680 + }, + { + "epoch": 0.72, + "learning_rate": 3.7121004505214476e-06, + "loss": 0.6442, + "step": 20681 + }, + { + "epoch": 0.72, + "learning_rate": 3.711253813551514e-06, + "loss": 0.5838, + "step": 20682 + }, + { + "epoch": 0.72, + "learning_rate": 3.7104072511426224e-06, + "loss": 0.6643, + "step": 20683 + }, + { + "epoch": 0.72, + "learning_rate": 3.709560763304808e-06, + "loss": 0.6547, + "step": 20684 + }, + { + "epoch": 0.72, + "learning_rate": 3.7087143500481093e-06, + "loss": 0.5956, + "step": 20685 + }, + { + "epoch": 0.72, + "learning_rate": 3.707868011382564e-06, + "loss": 0.6298, + "step": 20686 + }, + { + "epoch": 0.72, + "learning_rate": 3.707021747318199e-06, + "loss": 0.5679, + "step": 20687 + }, + { + "epoch": 0.72, + "learning_rate": 3.7061755578650548e-06, + "loss": 0.5726, + "step": 20688 + }, + { + "epoch": 0.72, + "learning_rate": 3.7053294430331555e-06, + "loss": 0.62, + "step": 20689 + }, + { + "epoch": 0.72, + "learning_rate": 3.7044834028325406e-06, + "loss": 0.6394, + "step": 20690 + }, + { + "epoch": 0.72, + "learning_rate": 3.7036374372732433e-06, + "loss": 0.6273, + "step": 20691 + }, + { + "epoch": 0.72, + "learning_rate": 3.702791546365285e-06, + "loss": 0.6235, + "step": 20692 + }, + { + "epoch": 0.72, + "learning_rate": 3.701945730118699e-06, + "loss": 0.6005, + "step": 20693 + }, + { + "epoch": 0.72, + "learning_rate": 3.7010999885435173e-06, + "loss": 0.6254, + "step": 20694 + }, + { + "epoch": 0.72, + "learning_rate": 3.7002543216497553e-06, + "loss": 0.5897, + "step": 20695 + }, + { + "epoch": 0.72, + "learning_rate": 3.6994087294474523e-06, + "loss": 0.5495, + "step": 20696 + }, + { + "epoch": 0.72, + "learning_rate": 3.698563211946633e-06, + "loss": 0.6969, + "step": 20697 + }, + { + "epoch": 0.72, + "learning_rate": 3.697717769157313e-06, + "loss": 0.6544, + "step": 20698 + }, + { + "epoch": 0.72, + "learning_rate": 3.6968724010895228e-06, + "loss": 0.6, + "step": 20699 + }, + { + "epoch": 0.72, + "learning_rate": 3.696027107753286e-06, + "loss": 0.6105, + "step": 20700 + }, + { + "epoch": 0.72, + "learning_rate": 3.6951818891586167e-06, + "loss": 0.6446, + "step": 20701 + }, + { + "epoch": 0.72, + "learning_rate": 3.6943367453155445e-06, + "loss": 0.6542, + "step": 20702 + }, + { + "epoch": 0.72, + "learning_rate": 3.69349167623409e-06, + "loss": 0.6015, + "step": 20703 + }, + { + "epoch": 0.72, + "learning_rate": 3.692646681924267e-06, + "loss": 0.6279, + "step": 20704 + }, + { + "epoch": 0.72, + "learning_rate": 3.6918017623960957e-06, + "loss": 0.6277, + "step": 20705 + }, + { + "epoch": 0.72, + "learning_rate": 3.6909569176595983e-06, + "loss": 0.6664, + "step": 20706 + }, + { + "epoch": 0.72, + "learning_rate": 3.6901121477247804e-06, + "loss": 0.63, + "step": 20707 + }, + { + "epoch": 0.72, + "learning_rate": 3.689267452601668e-06, + "loss": 0.5869, + "step": 20708 + }, + { + "epoch": 0.72, + "learning_rate": 3.688422832300277e-06, + "loss": 0.6229, + "step": 20709 + }, + { + "epoch": 0.72, + "learning_rate": 3.6875782868306143e-06, + "loss": 0.6493, + "step": 20710 + }, + { + "epoch": 0.72, + "learning_rate": 3.6867338162026967e-06, + "loss": 0.659, + "step": 20711 + }, + { + "epoch": 0.72, + "learning_rate": 3.685889420426538e-06, + "loss": 0.6437, + "step": 20712 + }, + { + "epoch": 0.72, + "learning_rate": 3.6850450995121425e-06, + "loss": 0.6081, + "step": 20713 + }, + { + "epoch": 0.72, + "learning_rate": 3.6842008534695284e-06, + "loss": 0.6203, + "step": 20714 + }, + { + "epoch": 0.72, + "learning_rate": 3.6833566823087053e-06, + "loss": 0.6515, + "step": 20715 + }, + { + "epoch": 0.72, + "learning_rate": 3.682512586039677e-06, + "loss": 0.6258, + "step": 20716 + }, + { + "epoch": 0.72, + "learning_rate": 3.6816685646724537e-06, + "loss": 0.6297, + "step": 20717 + }, + { + "epoch": 0.72, + "learning_rate": 3.6808246182170447e-06, + "loss": 0.5795, + "step": 20718 + }, + { + "epoch": 0.72, + "learning_rate": 3.679980746683448e-06, + "loss": 0.6687, + "step": 20719 + }, + { + "epoch": 0.72, + "learning_rate": 3.6791369500816765e-06, + "loss": 0.6415, + "step": 20720 + }, + { + "epoch": 0.72, + "learning_rate": 3.6782932284217377e-06, + "loss": 0.6525, + "step": 20721 + }, + { + "epoch": 0.72, + "learning_rate": 3.6774495817136247e-06, + "loss": 0.6312, + "step": 20722 + }, + { + "epoch": 0.72, + "learning_rate": 3.6766060099673453e-06, + "loss": 0.6837, + "step": 20723 + }, + { + "epoch": 0.72, + "learning_rate": 3.675762513192904e-06, + "loss": 0.6368, + "step": 20724 + }, + { + "epoch": 0.72, + "learning_rate": 3.674919091400295e-06, + "loss": 0.6263, + "step": 20725 + }, + { + "epoch": 0.72, + "learning_rate": 3.674075744599519e-06, + "loss": 0.6552, + "step": 20726 + }, + { + "epoch": 0.72, + "learning_rate": 3.6732324728005832e-06, + "loss": 0.5961, + "step": 20727 + }, + { + "epoch": 0.72, + "learning_rate": 3.672389276013477e-06, + "loss": 0.6062, + "step": 20728 + }, + { + "epoch": 0.72, + "learning_rate": 3.6715461542482e-06, + "loss": 0.7072, + "step": 20729 + }, + { + "epoch": 0.72, + "learning_rate": 3.6707031075147527e-06, + "loss": 0.6043, + "step": 20730 + }, + { + "epoch": 0.72, + "learning_rate": 3.669860135823122e-06, + "loss": 0.6562, + "step": 20731 + }, + { + "epoch": 0.72, + "learning_rate": 3.6690172391833055e-06, + "loss": 0.6242, + "step": 20732 + }, + { + "epoch": 0.72, + "learning_rate": 3.6681744176053034e-06, + "loss": 0.6555, + "step": 20733 + }, + { + "epoch": 0.72, + "learning_rate": 3.6673316710991014e-06, + "loss": 0.6676, + "step": 20734 + }, + { + "epoch": 0.72, + "learning_rate": 3.6664889996746935e-06, + "loss": 0.6353, + "step": 20735 + }, + { + "epoch": 0.72, + "learning_rate": 3.6656464033420725e-06, + "loss": 0.6459, + "step": 20736 + }, + { + "epoch": 0.72, + "learning_rate": 3.664803882111223e-06, + "loss": 0.6683, + "step": 20737 + }, + { + "epoch": 0.72, + "learning_rate": 3.6639614359921347e-06, + "loss": 0.5954, + "step": 20738 + }, + { + "epoch": 0.72, + "learning_rate": 3.6631190649948057e-06, + "loss": 0.63, + "step": 20739 + }, + { + "epoch": 0.72, + "learning_rate": 3.6622767691292127e-06, + "loss": 0.6512, + "step": 20740 + }, + { + "epoch": 0.72, + "learning_rate": 3.661434548405346e-06, + "loss": 0.5671, + "step": 20741 + }, + { + "epoch": 0.72, + "learning_rate": 3.6605924028331953e-06, + "loss": 0.6426, + "step": 20742 + }, + { + "epoch": 0.72, + "learning_rate": 3.6597503324227367e-06, + "loss": 0.63, + "step": 20743 + }, + { + "epoch": 0.72, + "learning_rate": 3.658908337183955e-06, + "loss": 0.6708, + "step": 20744 + }, + { + "epoch": 0.72, + "learning_rate": 3.658066417126843e-06, + "loss": 0.6509, + "step": 20745 + }, + { + "epoch": 0.72, + "learning_rate": 3.657224572261373e-06, + "loss": 0.6453, + "step": 20746 + }, + { + "epoch": 0.72, + "learning_rate": 3.65638280259753e-06, + "loss": 0.6041, + "step": 20747 + }, + { + "epoch": 0.72, + "learning_rate": 3.6555411081452962e-06, + "loss": 0.6253, + "step": 20748 + }, + { + "epoch": 0.72, + "learning_rate": 3.6546994889146446e-06, + "loss": 0.6494, + "step": 20749 + }, + { + "epoch": 0.72, + "learning_rate": 3.6538579449155585e-06, + "loss": 0.6439, + "step": 20750 + }, + { + "epoch": 0.72, + "learning_rate": 3.6530164761580145e-06, + "loss": 0.6541, + "step": 20751 + }, + { + "epoch": 0.72, + "learning_rate": 3.6521750826519888e-06, + "loss": 0.6348, + "step": 20752 + }, + { + "epoch": 0.72, + "learning_rate": 3.65133376440746e-06, + "loss": 0.6516, + "step": 20753 + }, + { + "epoch": 0.72, + "learning_rate": 3.6504925214343978e-06, + "loss": 0.6217, + "step": 20754 + }, + { + "epoch": 0.72, + "learning_rate": 3.6496513537427793e-06, + "loss": 0.5805, + "step": 20755 + }, + { + "epoch": 0.72, + "learning_rate": 3.648810261342577e-06, + "loss": 0.6438, + "step": 20756 + }, + { + "epoch": 0.72, + "learning_rate": 3.6479692442437632e-06, + "loss": 0.6216, + "step": 20757 + }, + { + "epoch": 0.72, + "learning_rate": 3.6471283024563087e-06, + "loss": 0.643, + "step": 20758 + }, + { + "epoch": 0.72, + "learning_rate": 3.646287435990189e-06, + "loss": 0.6638, + "step": 20759 + }, + { + "epoch": 0.72, + "learning_rate": 3.645446644855366e-06, + "loss": 0.6363, + "step": 20760 + }, + { + "epoch": 0.72, + "learning_rate": 3.6446059290618106e-06, + "loss": 0.6721, + "step": 20761 + }, + { + "epoch": 0.72, + "learning_rate": 3.643765288619492e-06, + "loss": 0.6167, + "step": 20762 + }, + { + "epoch": 0.72, + "learning_rate": 3.642924723538377e-06, + "loss": 0.6718, + "step": 20763 + }, + { + "epoch": 0.72, + "learning_rate": 3.6420842338284314e-06, + "loss": 0.6365, + "step": 20764 + }, + { + "epoch": 0.72, + "learning_rate": 3.6412438194996226e-06, + "loss": 0.6761, + "step": 20765 + }, + { + "epoch": 0.72, + "learning_rate": 3.6404034805619084e-06, + "loss": 0.6364, + "step": 20766 + }, + { + "epoch": 0.72, + "learning_rate": 3.639563217025257e-06, + "loss": 0.5906, + "step": 20767 + }, + { + "epoch": 0.72, + "learning_rate": 3.638723028899629e-06, + "loss": 0.658, + "step": 20768 + }, + { + "epoch": 0.72, + "learning_rate": 3.637882916194986e-06, + "loss": 0.634, + "step": 20769 + }, + { + "epoch": 0.72, + "learning_rate": 3.6370428789212898e-06, + "loss": 0.5941, + "step": 20770 + }, + { + "epoch": 0.72, + "learning_rate": 3.6362029170885026e-06, + "loss": 0.6109, + "step": 20771 + }, + { + "epoch": 0.72, + "learning_rate": 3.635363030706578e-06, + "loss": 0.6319, + "step": 20772 + }, + { + "epoch": 0.72, + "learning_rate": 3.634523219785474e-06, + "loss": 0.6472, + "step": 20773 + }, + { + "epoch": 0.72, + "learning_rate": 3.633683484335151e-06, + "loss": 0.6768, + "step": 20774 + }, + { + "epoch": 0.72, + "learning_rate": 3.632843824365563e-06, + "loss": 0.6537, + "step": 20775 + }, + { + "epoch": 0.72, + "learning_rate": 3.632004239886666e-06, + "loss": 0.6233, + "step": 20776 + }, + { + "epoch": 0.72, + "learning_rate": 3.6311647309084185e-06, + "loss": 0.6725, + "step": 20777 + }, + { + "epoch": 0.72, + "learning_rate": 3.6303252974407654e-06, + "loss": 0.6597, + "step": 20778 + }, + { + "epoch": 0.72, + "learning_rate": 3.6294859394936644e-06, + "loss": 0.646, + "step": 20779 + }, + { + "epoch": 0.72, + "learning_rate": 3.628646657077065e-06, + "loss": 0.6354, + "step": 20780 + }, + { + "epoch": 0.72, + "learning_rate": 3.627807450200921e-06, + "loss": 0.6589, + "step": 20781 + }, + { + "epoch": 0.72, + "learning_rate": 3.6269683188751792e-06, + "loss": 0.654, + "step": 20782 + }, + { + "epoch": 0.72, + "learning_rate": 3.626129263109793e-06, + "loss": 0.6976, + "step": 20783 + }, + { + "epoch": 0.72, + "learning_rate": 3.6252902829147053e-06, + "loss": 0.6707, + "step": 20784 + }, + { + "epoch": 0.72, + "learning_rate": 3.6244513782998647e-06, + "loss": 0.6266, + "step": 20785 + }, + { + "epoch": 0.72, + "learning_rate": 3.6236125492752184e-06, + "loss": 0.6716, + "step": 20786 + }, + { + "epoch": 0.72, + "learning_rate": 3.6227737958507114e-06, + "loss": 0.7103, + "step": 20787 + }, + { + "epoch": 0.72, + "learning_rate": 3.6219351180362883e-06, + "loss": 0.647, + "step": 20788 + }, + { + "epoch": 0.72, + "learning_rate": 3.6210965158418954e-06, + "loss": 0.5422, + "step": 20789 + }, + { + "epoch": 0.72, + "learning_rate": 3.6202579892774705e-06, + "loss": 0.6374, + "step": 20790 + }, + { + "epoch": 0.72, + "learning_rate": 3.619419538352956e-06, + "loss": 0.6493, + "step": 20791 + }, + { + "epoch": 0.72, + "learning_rate": 3.6185811630782954e-06, + "loss": 0.5806, + "step": 20792 + }, + { + "epoch": 0.72, + "learning_rate": 3.6177428634634272e-06, + "loss": 0.6508, + "step": 20793 + }, + { + "epoch": 0.72, + "learning_rate": 3.6169046395182915e-06, + "loss": 0.6459, + "step": 20794 + }, + { + "epoch": 0.72, + "learning_rate": 3.616066491252829e-06, + "loss": 0.6773, + "step": 20795 + }, + { + "epoch": 0.72, + "learning_rate": 3.6152284186769704e-06, + "loss": 0.6056, + "step": 20796 + }, + { + "epoch": 0.72, + "learning_rate": 3.6143904218006566e-06, + "loss": 0.6327, + "step": 20797 + }, + { + "epoch": 0.72, + "learning_rate": 3.6135525006338213e-06, + "loss": 0.6706, + "step": 20798 + }, + { + "epoch": 0.72, + "learning_rate": 3.6127146551864002e-06, + "loss": 0.7101, + "step": 20799 + }, + { + "epoch": 0.72, + "learning_rate": 3.611876885468326e-06, + "loss": 0.6538, + "step": 20800 + }, + { + "epoch": 0.72, + "learning_rate": 3.611039191489537e-06, + "loss": 0.6212, + "step": 20801 + }, + { + "epoch": 0.72, + "learning_rate": 3.6102015732599572e-06, + "loss": 0.6076, + "step": 20802 + }, + { + "epoch": 0.72, + "learning_rate": 3.6093640307895193e-06, + "loss": 0.6286, + "step": 20803 + }, + { + "epoch": 0.72, + "learning_rate": 3.6085265640881563e-06, + "loss": 0.6062, + "step": 20804 + }, + { + "epoch": 0.72, + "learning_rate": 3.607689173165796e-06, + "loss": 0.6194, + "step": 20805 + }, + { + "epoch": 0.72, + "learning_rate": 3.606851858032366e-06, + "loss": 0.6258, + "step": 20806 + }, + { + "epoch": 0.72, + "learning_rate": 3.6060146186977995e-06, + "loss": 0.6138, + "step": 20807 + }, + { + "epoch": 0.72, + "learning_rate": 3.605177455172014e-06, + "loss": 0.6555, + "step": 20808 + }, + { + "epoch": 0.72, + "learning_rate": 3.6043403674649393e-06, + "loss": 0.5723, + "step": 20809 + }, + { + "epoch": 0.72, + "learning_rate": 3.6035033555864995e-06, + "loss": 0.6193, + "step": 20810 + }, + { + "epoch": 0.72, + "learning_rate": 3.6026664195466197e-06, + "loss": 0.6677, + "step": 20811 + }, + { + "epoch": 0.72, + "learning_rate": 3.6018295593552254e-06, + "loss": 0.6283, + "step": 20812 + }, + { + "epoch": 0.72, + "learning_rate": 3.6009927750222317e-06, + "loss": 0.6123, + "step": 20813 + }, + { + "epoch": 0.72, + "learning_rate": 3.600156066557564e-06, + "loss": 0.6244, + "step": 20814 + }, + { + "epoch": 0.72, + "learning_rate": 3.5993194339711424e-06, + "loss": 0.6198, + "step": 20815 + }, + { + "epoch": 0.72, + "learning_rate": 3.5984828772728843e-06, + "loss": 0.5868, + "step": 20816 + }, + { + "epoch": 0.72, + "learning_rate": 3.5976463964727103e-06, + "loss": 0.6174, + "step": 20817 + }, + { + "epoch": 0.72, + "learning_rate": 3.596809991580541e-06, + "loss": 0.6208, + "step": 20818 + }, + { + "epoch": 0.72, + "learning_rate": 3.5959736626062858e-06, + "loss": 0.6065, + "step": 20819 + }, + { + "epoch": 0.72, + "learning_rate": 3.5951374095598644e-06, + "loss": 0.6414, + "step": 20820 + }, + { + "epoch": 0.72, + "learning_rate": 3.5943012324511906e-06, + "loss": 0.6406, + "step": 20821 + }, + { + "epoch": 0.72, + "learning_rate": 3.5934651312901793e-06, + "loss": 0.6241, + "step": 20822 + }, + { + "epoch": 0.72, + "learning_rate": 3.5926291060867426e-06, + "loss": 0.6888, + "step": 20823 + }, + { + "epoch": 0.72, + "learning_rate": 3.591793156850797e-06, + "loss": 0.7121, + "step": 20824 + }, + { + "epoch": 0.72, + "learning_rate": 3.590957283592247e-06, + "loss": 0.6442, + "step": 20825 + }, + { + "epoch": 0.72, + "learning_rate": 3.5901214863210055e-06, + "loss": 0.628, + "step": 20826 + }, + { + "epoch": 0.72, + "learning_rate": 3.5892857650469815e-06, + "loss": 0.6258, + "step": 20827 + }, + { + "epoch": 0.72, + "learning_rate": 3.588450119780086e-06, + "loss": 0.6565, + "step": 20828 + }, + { + "epoch": 0.72, + "learning_rate": 3.587614550530224e-06, + "loss": 0.6766, + "step": 20829 + }, + { + "epoch": 0.72, + "learning_rate": 3.586779057307306e-06, + "loss": 0.5911, + "step": 20830 + }, + { + "epoch": 0.72, + "learning_rate": 3.585943640121232e-06, + "loss": 0.6574, + "step": 20831 + }, + { + "epoch": 0.72, + "learning_rate": 3.5851082989819107e-06, + "loss": 0.6495, + "step": 20832 + }, + { + "epoch": 0.72, + "learning_rate": 3.584273033899245e-06, + "loss": 0.6516, + "step": 20833 + }, + { + "epoch": 0.72, + "learning_rate": 3.5834378448831385e-06, + "loss": 0.5959, + "step": 20834 + }, + { + "epoch": 0.72, + "learning_rate": 3.582602731943493e-06, + "loss": 0.6606, + "step": 20835 + }, + { + "epoch": 0.72, + "learning_rate": 3.5817676950902136e-06, + "loss": 0.6715, + "step": 20836 + }, + { + "epoch": 0.72, + "learning_rate": 3.5809327343331946e-06, + "loss": 0.6242, + "step": 20837 + }, + { + "epoch": 0.72, + "learning_rate": 3.580097849682338e-06, + "loss": 0.6091, + "step": 20838 + }, + { + "epoch": 0.72, + "learning_rate": 3.5792630411475415e-06, + "loss": 0.5857, + "step": 20839 + }, + { + "epoch": 0.72, + "learning_rate": 3.578428308738705e-06, + "loss": 0.597, + "step": 20840 + }, + { + "epoch": 0.72, + "learning_rate": 3.577593652465724e-06, + "loss": 0.5746, + "step": 20841 + }, + { + "epoch": 0.72, + "learning_rate": 3.576759072338498e-06, + "loss": 0.6058, + "step": 20842 + }, + { + "epoch": 0.72, + "learning_rate": 3.5759245683669153e-06, + "loss": 0.6668, + "step": 20843 + }, + { + "epoch": 0.72, + "learning_rate": 3.5750901405608727e-06, + "loss": 0.6669, + "step": 20844 + }, + { + "epoch": 0.72, + "learning_rate": 3.5742557889302653e-06, + "loss": 0.6398, + "step": 20845 + }, + { + "epoch": 0.72, + "learning_rate": 3.5734215134849835e-06, + "loss": 0.6647, + "step": 20846 + }, + { + "epoch": 0.72, + "learning_rate": 3.572587314234919e-06, + "loss": 0.6204, + "step": 20847 + }, + { + "epoch": 0.72, + "learning_rate": 3.571753191189966e-06, + "loss": 0.6528, + "step": 20848 + }, + { + "epoch": 0.72, + "learning_rate": 3.5709191443600076e-06, + "loss": 0.6533, + "step": 20849 + }, + { + "epoch": 0.72, + "learning_rate": 3.5700851737549357e-06, + "loss": 0.6056, + "step": 20850 + }, + { + "epoch": 0.72, + "learning_rate": 3.569251279384638e-06, + "loss": 0.6634, + "step": 20851 + }, + { + "epoch": 0.72, + "learning_rate": 3.5684174612590016e-06, + "loss": 0.6339, + "step": 20852 + }, + { + "epoch": 0.72, + "learning_rate": 3.5675837193879113e-06, + "loss": 0.6751, + "step": 20853 + }, + { + "epoch": 0.72, + "learning_rate": 3.5667500537812573e-06, + "loss": 0.6296, + "step": 20854 + }, + { + "epoch": 0.72, + "learning_rate": 3.5659164644489152e-06, + "loss": 0.6264, + "step": 20855 + }, + { + "epoch": 0.72, + "learning_rate": 3.5650829514007733e-06, + "loss": 0.6315, + "step": 20856 + }, + { + "epoch": 0.72, + "learning_rate": 3.5642495146467126e-06, + "loss": 0.6512, + "step": 20857 + }, + { + "epoch": 0.72, + "learning_rate": 3.5634161541966162e-06, + "loss": 0.6136, + "step": 20858 + }, + { + "epoch": 0.72, + "learning_rate": 3.5625828700603624e-06, + "loss": 0.5859, + "step": 20859 + }, + { + "epoch": 0.72, + "learning_rate": 3.5617496622478364e-06, + "loss": 0.6635, + "step": 20860 + }, + { + "epoch": 0.72, + "learning_rate": 3.5609165307689087e-06, + "loss": 0.6427, + "step": 20861 + }, + { + "epoch": 0.72, + "learning_rate": 3.560083475633461e-06, + "loss": 0.6175, + "step": 20862 + }, + { + "epoch": 0.72, + "learning_rate": 3.5592504968513697e-06, + "loss": 0.6133, + "step": 20863 + }, + { + "epoch": 0.72, + "learning_rate": 3.5584175944325126e-06, + "loss": 0.6585, + "step": 20864 + }, + { + "epoch": 0.72, + "learning_rate": 3.5575847683867627e-06, + "loss": 0.6255, + "step": 20865 + }, + { + "epoch": 0.72, + "learning_rate": 3.556752018723999e-06, + "loss": 0.6699, + "step": 20866 + }, + { + "epoch": 0.72, + "learning_rate": 3.5559193454540875e-06, + "loss": 0.6461, + "step": 20867 + }, + { + "epoch": 0.72, + "learning_rate": 3.5550867485869035e-06, + "loss": 0.6633, + "step": 20868 + }, + { + "epoch": 0.72, + "learning_rate": 3.554254228132319e-06, + "loss": 0.6454, + "step": 20869 + }, + { + "epoch": 0.72, + "learning_rate": 3.553421784100204e-06, + "loss": 0.6743, + "step": 20870 + }, + { + "epoch": 0.72, + "learning_rate": 3.5525894165004294e-06, + "loss": 0.5712, + "step": 20871 + }, + { + "epoch": 0.72, + "learning_rate": 3.5517571253428673e-06, + "loss": 0.6674, + "step": 20872 + }, + { + "epoch": 0.72, + "learning_rate": 3.5509249106373767e-06, + "loss": 0.6283, + "step": 20873 + }, + { + "epoch": 0.72, + "learning_rate": 3.5500927723938307e-06, + "loss": 0.6106, + "step": 20874 + }, + { + "epoch": 0.72, + "learning_rate": 3.5492607106220932e-06, + "loss": 0.6244, + "step": 20875 + }, + { + "epoch": 0.72, + "learning_rate": 3.5484287253320302e-06, + "loss": 0.6214, + "step": 20876 + }, + { + "epoch": 0.72, + "learning_rate": 3.5475968165335105e-06, + "loss": 0.6637, + "step": 20877 + }, + { + "epoch": 0.72, + "learning_rate": 3.5467649842363884e-06, + "loss": 0.6225, + "step": 20878 + }, + { + "epoch": 0.72, + "learning_rate": 3.545933228450531e-06, + "loss": 0.6314, + "step": 20879 + }, + { + "epoch": 0.72, + "learning_rate": 3.5451015491858e-06, + "loss": 0.5946, + "step": 20880 + }, + { + "epoch": 0.72, + "learning_rate": 3.544269946452055e-06, + "loss": 0.6595, + "step": 20881 + }, + { + "epoch": 0.72, + "learning_rate": 3.5434384202591564e-06, + "loss": 0.5778, + "step": 20882 + }, + { + "epoch": 0.72, + "learning_rate": 3.5426069706169664e-06, + "loss": 0.6451, + "step": 20883 + }, + { + "epoch": 0.72, + "learning_rate": 3.5417755975353363e-06, + "loss": 0.6584, + "step": 20884 + }, + { + "epoch": 0.72, + "learning_rate": 3.5409443010241264e-06, + "loss": 0.6458, + "step": 20885 + }, + { + "epoch": 0.72, + "learning_rate": 3.5401130810931915e-06, + "loss": 0.5892, + "step": 20886 + }, + { + "epoch": 0.72, + "learning_rate": 3.539281937752389e-06, + "loss": 0.6541, + "step": 20887 + }, + { + "epoch": 0.72, + "learning_rate": 3.5384508710115716e-06, + "loss": 0.6152, + "step": 20888 + }, + { + "epoch": 0.72, + "learning_rate": 3.537619880880596e-06, + "loss": 0.6332, + "step": 20889 + }, + { + "epoch": 0.72, + "learning_rate": 3.536788967369309e-06, + "loss": 0.6065, + "step": 20890 + }, + { + "epoch": 0.72, + "learning_rate": 3.5359581304875645e-06, + "loss": 0.6082, + "step": 20891 + }, + { + "epoch": 0.72, + "learning_rate": 3.535127370245213e-06, + "loss": 0.6029, + "step": 20892 + }, + { + "epoch": 0.72, + "learning_rate": 3.5342966866521047e-06, + "loss": 0.6599, + "step": 20893 + }, + { + "epoch": 0.72, + "learning_rate": 3.5334660797180887e-06, + "loss": 0.6432, + "step": 20894 + }, + { + "epoch": 0.72, + "learning_rate": 3.532635549453016e-06, + "loss": 0.643, + "step": 20895 + }, + { + "epoch": 0.72, + "learning_rate": 3.5318050958667262e-06, + "loss": 0.5579, + "step": 20896 + }, + { + "epoch": 0.72, + "learning_rate": 3.53097471896907e-06, + "loss": 0.6006, + "step": 20897 + }, + { + "epoch": 0.72, + "learning_rate": 3.530144418769892e-06, + "loss": 0.6545, + "step": 20898 + }, + { + "epoch": 0.72, + "learning_rate": 3.5293141952790357e-06, + "loss": 0.6338, + "step": 20899 + }, + { + "epoch": 0.72, + "learning_rate": 3.5284840485063444e-06, + "loss": 0.6859, + "step": 20900 + }, + { + "epoch": 0.72, + "learning_rate": 3.527653978461666e-06, + "loss": 0.6268, + "step": 20901 + }, + { + "epoch": 0.72, + "learning_rate": 3.5268239851548325e-06, + "loss": 0.6295, + "step": 20902 + }, + { + "epoch": 0.72, + "learning_rate": 3.5259940685956906e-06, + "loss": 0.653, + "step": 20903 + }, + { + "epoch": 0.72, + "learning_rate": 3.525164228794078e-06, + "loss": 0.6463, + "step": 20904 + }, + { + "epoch": 0.72, + "learning_rate": 3.5243344657598346e-06, + "loss": 0.6549, + "step": 20905 + }, + { + "epoch": 0.72, + "learning_rate": 3.523504779502798e-06, + "loss": 0.625, + "step": 20906 + }, + { + "epoch": 0.72, + "learning_rate": 3.522675170032808e-06, + "loss": 0.6337, + "step": 20907 + }, + { + "epoch": 0.72, + "learning_rate": 3.521845637359693e-06, + "loss": 0.6454, + "step": 20908 + }, + { + "epoch": 0.72, + "learning_rate": 3.521016181493294e-06, + "loss": 0.7001, + "step": 20909 + }, + { + "epoch": 0.72, + "learning_rate": 3.520186802443445e-06, + "loss": 0.6096, + "step": 20910 + }, + { + "epoch": 0.72, + "learning_rate": 3.5193575002199775e-06, + "loss": 0.5981, + "step": 20911 + }, + { + "epoch": 0.72, + "learning_rate": 3.5185282748327254e-06, + "loss": 0.6525, + "step": 20912 + }, + { + "epoch": 0.72, + "learning_rate": 3.5176991262915227e-06, + "loss": 0.6234, + "step": 20913 + }, + { + "epoch": 0.72, + "learning_rate": 3.516870054606194e-06, + "loss": 0.6288, + "step": 20914 + }, + { + "epoch": 0.72, + "learning_rate": 3.516041059786571e-06, + "loss": 0.6291, + "step": 20915 + }, + { + "epoch": 0.72, + "learning_rate": 3.5152121418424845e-06, + "loss": 0.6348, + "step": 20916 + }, + { + "epoch": 0.72, + "learning_rate": 3.5143833007837614e-06, + "loss": 0.6235, + "step": 20917 + }, + { + "epoch": 0.72, + "learning_rate": 3.5135545366202284e-06, + "loss": 0.6564, + "step": 20918 + }, + { + "epoch": 0.72, + "learning_rate": 3.5127258493617156e-06, + "loss": 0.629, + "step": 20919 + }, + { + "epoch": 0.72, + "learning_rate": 3.5118972390180406e-06, + "loss": 0.6215, + "step": 20920 + }, + { + "epoch": 0.72, + "learning_rate": 3.511068705599031e-06, + "loss": 0.6135, + "step": 20921 + }, + { + "epoch": 0.72, + "learning_rate": 3.510240249114514e-06, + "loss": 0.6465, + "step": 20922 + }, + { + "epoch": 0.72, + "learning_rate": 3.5094118695743006e-06, + "loss": 0.6921, + "step": 20923 + }, + { + "epoch": 0.72, + "learning_rate": 3.508583566988225e-06, + "loss": 0.5994, + "step": 20924 + }, + { + "epoch": 0.72, + "learning_rate": 3.5077553413661056e-06, + "loss": 0.682, + "step": 20925 + }, + { + "epoch": 0.73, + "learning_rate": 3.506927192717756e-06, + "loss": 0.618, + "step": 20926 + }, + { + "epoch": 0.73, + "learning_rate": 3.506099121052999e-06, + "loss": 0.6019, + "step": 20927 + }, + { + "epoch": 0.73, + "learning_rate": 3.505271126381654e-06, + "loss": 0.6289, + "step": 20928 + }, + { + "epoch": 0.73, + "learning_rate": 3.5044432087135307e-06, + "loss": 0.6175, + "step": 20929 + }, + { + "epoch": 0.73, + "learning_rate": 3.5036153680584517e-06, + "loss": 0.6344, + "step": 20930 + }, + { + "epoch": 0.73, + "learning_rate": 3.5027876044262343e-06, + "loss": 0.556, + "step": 20931 + }, + { + "epoch": 0.73, + "learning_rate": 3.5019599178266862e-06, + "loss": 0.6376, + "step": 20932 + }, + { + "epoch": 0.73, + "learning_rate": 3.5011323082696226e-06, + "loss": 0.588, + "step": 20933 + }, + { + "epoch": 0.73, + "learning_rate": 3.50030477576486e-06, + "loss": 0.6534, + "step": 20934 + }, + { + "epoch": 0.73, + "learning_rate": 3.4994773203222e-06, + "loss": 0.6496, + "step": 20935 + }, + { + "epoch": 0.73, + "learning_rate": 3.4986499419514662e-06, + "loss": 0.6067, + "step": 20936 + }, + { + "epoch": 0.73, + "learning_rate": 3.4978226406624583e-06, + "loss": 0.6042, + "step": 20937 + }, + { + "epoch": 0.73, + "learning_rate": 3.4969954164649877e-06, + "loss": 0.6376, + "step": 20938 + }, + { + "epoch": 0.73, + "learning_rate": 3.496168269368867e-06, + "loss": 0.6256, + "step": 20939 + }, + { + "epoch": 0.73, + "learning_rate": 3.4953411993838947e-06, + "loss": 0.6635, + "step": 20940 + }, + { + "epoch": 0.73, + "learning_rate": 3.4945142065198777e-06, + "loss": 0.5964, + "step": 20941 + }, + { + "epoch": 0.73, + "learning_rate": 3.4936872907866314e-06, + "loss": 0.6396, + "step": 20942 + }, + { + "epoch": 0.73, + "learning_rate": 3.492860452193949e-06, + "loss": 0.5995, + "step": 20943 + }, + { + "epoch": 0.73, + "learning_rate": 3.492033690751638e-06, + "loss": 0.6863, + "step": 20944 + }, + { + "epoch": 0.73, + "learning_rate": 3.4912070064695035e-06, + "loss": 0.6543, + "step": 20945 + }, + { + "epoch": 0.73, + "learning_rate": 3.4903803993573406e-06, + "loss": 0.6199, + "step": 20946 + }, + { + "epoch": 0.73, + "learning_rate": 3.4895538694249487e-06, + "loss": 0.5736, + "step": 20947 + }, + { + "epoch": 0.73, + "learning_rate": 3.488727416682138e-06, + "loss": 0.591, + "step": 20948 + }, + { + "epoch": 0.73, + "learning_rate": 3.4879010411386982e-06, + "loss": 0.5662, + "step": 20949 + }, + { + "epoch": 0.73, + "learning_rate": 3.487074742804428e-06, + "loss": 0.6311, + "step": 20950 + }, + { + "epoch": 0.73, + "learning_rate": 3.4862485216891307e-06, + "loss": 0.6268, + "step": 20951 + }, + { + "epoch": 0.73, + "learning_rate": 3.4854223778025932e-06, + "loss": 0.6394, + "step": 20952 + }, + { + "epoch": 0.73, + "learning_rate": 3.48459631115461e-06, + "loss": 0.6324, + "step": 20953 + }, + { + "epoch": 0.73, + "learning_rate": 3.483770321754987e-06, + "loss": 0.6367, + "step": 20954 + }, + { + "epoch": 0.73, + "learning_rate": 3.4829444096135066e-06, + "loss": 0.5973, + "step": 20955 + }, + { + "epoch": 0.73, + "learning_rate": 3.4821185747399645e-06, + "loss": 0.6208, + "step": 20956 + }, + { + "epoch": 0.73, + "learning_rate": 3.481292817144155e-06, + "loss": 0.686, + "step": 20957 + }, + { + "epoch": 0.73, + "learning_rate": 3.480467136835861e-06, + "loss": 0.5632, + "step": 20958 + }, + { + "epoch": 0.73, + "learning_rate": 3.4796415338248745e-06, + "loss": 0.6085, + "step": 20959 + }, + { + "epoch": 0.73, + "learning_rate": 3.478816008120992e-06, + "loss": 0.6272, + "step": 20960 + }, + { + "epoch": 0.73, + "learning_rate": 3.4779905597339923e-06, + "loss": 0.6508, + "step": 20961 + }, + { + "epoch": 0.73, + "learning_rate": 3.4771651886736646e-06, + "loss": 0.6812, + "step": 20962 + }, + { + "epoch": 0.73, + "learning_rate": 3.4763398949497973e-06, + "loss": 0.6225, + "step": 20963 + }, + { + "epoch": 0.73, + "learning_rate": 3.4755146785721704e-06, + "loss": 0.5988, + "step": 20964 + }, + { + "epoch": 0.73, + "learning_rate": 3.4746895395505674e-06, + "loss": 0.5872, + "step": 20965 + }, + { + "epoch": 0.73, + "learning_rate": 3.4738644778947816e-06, + "loss": 0.6183, + "step": 20966 + }, + { + "epoch": 0.73, + "learning_rate": 3.473039493614584e-06, + "loss": 0.6309, + "step": 20967 + }, + { + "epoch": 0.73, + "learning_rate": 3.47221458671976e-06, + "loss": 0.6427, + "step": 20968 + }, + { + "epoch": 0.73, + "learning_rate": 3.4713897572200925e-06, + "loss": 0.6172, + "step": 20969 + }, + { + "epoch": 0.73, + "learning_rate": 3.470565005125356e-06, + "loss": 0.6031, + "step": 20970 + }, + { + "epoch": 0.73, + "learning_rate": 3.469740330445327e-06, + "loss": 0.6029, + "step": 20971 + }, + { + "epoch": 0.73, + "learning_rate": 3.468915733189794e-06, + "loss": 0.6077, + "step": 20972 + }, + { + "epoch": 0.73, + "learning_rate": 3.4680912133685242e-06, + "loss": 0.59, + "step": 20973 + }, + { + "epoch": 0.73, + "learning_rate": 3.4672667709912956e-06, + "loss": 0.6506, + "step": 20974 + }, + { + "epoch": 0.73, + "learning_rate": 3.4664424060678857e-06, + "loss": 0.63, + "step": 20975 + }, + { + "epoch": 0.73, + "learning_rate": 3.465618118608064e-06, + "loss": 0.629, + "step": 20976 + }, + { + "epoch": 0.73, + "learning_rate": 3.464793908621601e-06, + "loss": 0.6481, + "step": 20977 + }, + { + "epoch": 0.73, + "learning_rate": 3.4639697761182812e-06, + "loss": 0.6585, + "step": 20978 + }, + { + "epoch": 0.73, + "learning_rate": 3.4631457211078634e-06, + "loss": 0.6935, + "step": 20979 + }, + { + "epoch": 0.73, + "learning_rate": 3.4623217436001233e-06, + "loss": 0.6588, + "step": 20980 + }, + { + "epoch": 0.73, + "learning_rate": 3.461497843604832e-06, + "loss": 0.5883, + "step": 20981 + }, + { + "epoch": 0.73, + "learning_rate": 3.460674021131751e-06, + "loss": 0.6173, + "step": 20982 + }, + { + "epoch": 0.73, + "learning_rate": 3.4598502761906495e-06, + "loss": 0.6479, + "step": 20983 + }, + { + "epoch": 0.73, + "learning_rate": 3.4590266087913026e-06, + "loss": 0.5968, + "step": 20984 + }, + { + "epoch": 0.73, + "learning_rate": 3.4582030189434667e-06, + "loss": 0.6281, + "step": 20985 + }, + { + "epoch": 0.73, + "learning_rate": 3.4573795066569093e-06, + "loss": 0.6702, + "step": 20986 + }, + { + "epoch": 0.73, + "learning_rate": 3.456556071941397e-06, + "loss": 0.6566, + "step": 20987 + }, + { + "epoch": 0.73, + "learning_rate": 3.4557327148066867e-06, + "loss": 0.6775, + "step": 20988 + }, + { + "epoch": 0.73, + "learning_rate": 3.454909435262541e-06, + "loss": 0.6379, + "step": 20989 + }, + { + "epoch": 0.73, + "learning_rate": 3.4540862333187296e-06, + "loss": 0.6691, + "step": 20990 + }, + { + "epoch": 0.73, + "learning_rate": 3.4532631089850032e-06, + "loss": 0.7043, + "step": 20991 + }, + { + "epoch": 0.73, + "learning_rate": 3.452440062271124e-06, + "loss": 0.5889, + "step": 20992 + }, + { + "epoch": 0.73, + "learning_rate": 3.4516170931868544e-06, + "loss": 0.6125, + "step": 20993 + }, + { + "epoch": 0.73, + "learning_rate": 3.450794201741945e-06, + "loss": 0.5912, + "step": 20994 + }, + { + "epoch": 0.73, + "learning_rate": 3.4499713879461515e-06, + "loss": 0.6395, + "step": 20995 + }, + { + "epoch": 0.73, + "learning_rate": 3.449148651809239e-06, + "loss": 0.6385, + "step": 20996 + }, + { + "epoch": 0.73, + "learning_rate": 3.448325993340953e-06, + "loss": 0.6869, + "step": 20997 + }, + { + "epoch": 0.73, + "learning_rate": 3.4475034125510543e-06, + "loss": 0.6297, + "step": 20998 + }, + { + "epoch": 0.73, + "learning_rate": 3.446680909449288e-06, + "loss": 0.6424, + "step": 20999 + }, + { + "epoch": 0.73, + "learning_rate": 3.445858484045409e-06, + "loss": 0.6202, + "step": 21000 + }, + { + "epoch": 0.73, + "learning_rate": 3.4450361363491693e-06, + "loss": 0.6632, + "step": 21001 + }, + { + "epoch": 0.73, + "learning_rate": 3.4442138663703182e-06, + "loss": 0.6325, + "step": 21002 + }, + { + "epoch": 0.73, + "learning_rate": 3.4433916741186045e-06, + "loss": 0.6657, + "step": 21003 + }, + { + "epoch": 0.73, + "learning_rate": 3.44256955960378e-06, + "loss": 0.6445, + "step": 21004 + }, + { + "epoch": 0.73, + "learning_rate": 3.4417475228355855e-06, + "loss": 0.6093, + "step": 21005 + }, + { + "epoch": 0.73, + "learning_rate": 3.4409255638237705e-06, + "loss": 0.5848, + "step": 21006 + }, + { + "epoch": 0.73, + "learning_rate": 3.44010368257808e-06, + "loss": 0.6372, + "step": 21007 + }, + { + "epoch": 0.73, + "learning_rate": 3.4392818791082583e-06, + "loss": 0.6058, + "step": 21008 + }, + { + "epoch": 0.73, + "learning_rate": 3.4384601534240492e-06, + "loss": 0.6252, + "step": 21009 + }, + { + "epoch": 0.73, + "learning_rate": 3.437638505535199e-06, + "loss": 0.637, + "step": 21010 + }, + { + "epoch": 0.73, + "learning_rate": 3.4368169354514423e-06, + "loss": 0.6714, + "step": 21011 + }, + { + "epoch": 0.73, + "learning_rate": 3.4359954431825236e-06, + "loss": 0.6114, + "step": 21012 + }, + { + "epoch": 0.73, + "learning_rate": 3.435174028738183e-06, + "loss": 0.6583, + "step": 21013 + }, + { + "epoch": 0.73, + "learning_rate": 3.434352692128158e-06, + "loss": 0.6107, + "step": 21014 + }, + { + "epoch": 0.73, + "learning_rate": 3.4335314333621873e-06, + "loss": 0.6517, + "step": 21015 + }, + { + "epoch": 0.73, + "learning_rate": 3.432710252450012e-06, + "loss": 0.6533, + "step": 21016 + }, + { + "epoch": 0.73, + "learning_rate": 3.4318891494013607e-06, + "loss": 0.6315, + "step": 21017 + }, + { + "epoch": 0.73, + "learning_rate": 3.4310681242259715e-06, + "loss": 0.6275, + "step": 21018 + }, + { + "epoch": 0.73, + "learning_rate": 3.430247176933581e-06, + "loss": 0.6433, + "step": 21019 + }, + { + "epoch": 0.73, + "learning_rate": 3.4294263075339196e-06, + "loss": 0.6223, + "step": 21020 + }, + { + "epoch": 0.73, + "learning_rate": 3.4286055160367216e-06, + "loss": 0.6111, + "step": 21021 + }, + { + "epoch": 0.73, + "learning_rate": 3.427784802451721e-06, + "loss": 0.6745, + "step": 21022 + }, + { + "epoch": 0.73, + "learning_rate": 3.4269641667886434e-06, + "loss": 0.5814, + "step": 21023 + }, + { + "epoch": 0.73, + "learning_rate": 3.42614360905722e-06, + "loss": 0.6146, + "step": 21024 + }, + { + "epoch": 0.73, + "learning_rate": 3.4253231292671796e-06, + "loss": 0.6074, + "step": 21025 + }, + { + "epoch": 0.73, + "learning_rate": 3.4245027274282504e-06, + "loss": 0.5834, + "step": 21026 + }, + { + "epoch": 0.73, + "learning_rate": 3.4236824035501603e-06, + "loss": 0.6873, + "step": 21027 + }, + { + "epoch": 0.73, + "learning_rate": 3.422862157642637e-06, + "loss": 0.614, + "step": 21028 + }, + { + "epoch": 0.73, + "learning_rate": 3.4220419897154e-06, + "loss": 0.685, + "step": 21029 + }, + { + "epoch": 0.73, + "learning_rate": 3.4212218997781754e-06, + "loss": 0.7026, + "step": 21030 + }, + { + "epoch": 0.73, + "learning_rate": 3.4204018878406887e-06, + "loss": 0.6307, + "step": 21031 + }, + { + "epoch": 0.73, + "learning_rate": 3.4195819539126597e-06, + "loss": 0.6366, + "step": 21032 + }, + { + "epoch": 0.73, + "learning_rate": 3.418762098003812e-06, + "loss": 0.6129, + "step": 21033 + }, + { + "epoch": 0.73, + "learning_rate": 3.4179423201238673e-06, + "loss": 0.6098, + "step": 21034 + }, + { + "epoch": 0.73, + "learning_rate": 3.4171226202825403e-06, + "loss": 0.5856, + "step": 21035 + }, + { + "epoch": 0.73, + "learning_rate": 3.4163029984895515e-06, + "loss": 0.5976, + "step": 21036 + }, + { + "epoch": 0.73, + "learning_rate": 3.4154834547546188e-06, + "loss": 0.615, + "step": 21037 + }, + { + "epoch": 0.73, + "learning_rate": 3.41466398908746e-06, + "loss": 0.6631, + "step": 21038 + }, + { + "epoch": 0.73, + "learning_rate": 3.41384460149779e-06, + "loss": 0.6341, + "step": 21039 + }, + { + "epoch": 0.73, + "learning_rate": 3.4130252919953265e-06, + "loss": 0.6062, + "step": 21040 + }, + { + "epoch": 0.73, + "learning_rate": 3.4122060605897777e-06, + "loss": 0.6433, + "step": 21041 + }, + { + "epoch": 0.73, + "learning_rate": 3.411386907290859e-06, + "loss": 0.6264, + "step": 21042 + }, + { + "epoch": 0.73, + "learning_rate": 3.4105678321082845e-06, + "loss": 0.6046, + "step": 21043 + }, + { + "epoch": 0.73, + "learning_rate": 3.4097488350517626e-06, + "loss": 0.6333, + "step": 21044 + }, + { + "epoch": 0.73, + "learning_rate": 3.408929916131006e-06, + "loss": 0.6127, + "step": 21045 + }, + { + "epoch": 0.73, + "learning_rate": 3.408111075355727e-06, + "loss": 0.6635, + "step": 21046 + }, + { + "epoch": 0.73, + "learning_rate": 3.407292312735625e-06, + "loss": 0.6262, + "step": 21047 + }, + { + "epoch": 0.73, + "learning_rate": 3.406473628280413e-06, + "loss": 0.6045, + "step": 21048 + }, + { + "epoch": 0.73, + "learning_rate": 3.4056550219997975e-06, + "loss": 0.6702, + "step": 21049 + }, + { + "epoch": 0.73, + "learning_rate": 3.4048364939034827e-06, + "loss": 0.6251, + "step": 21050 + }, + { + "epoch": 0.73, + "learning_rate": 3.404018044001175e-06, + "loss": 0.6025, + "step": 21051 + }, + { + "epoch": 0.73, + "learning_rate": 3.4031996723025805e-06, + "loss": 0.6607, + "step": 21052 + }, + { + "epoch": 0.73, + "learning_rate": 3.4023813788173955e-06, + "loss": 0.694, + "step": 21053 + }, + { + "epoch": 0.73, + "learning_rate": 3.4015631635553246e-06, + "loss": 0.6282, + "step": 21054 + }, + { + "epoch": 0.73, + "learning_rate": 3.40074502652607e-06, + "loss": 0.6411, + "step": 21055 + }, + { + "epoch": 0.73, + "learning_rate": 3.3999269677393322e-06, + "loss": 0.6583, + "step": 21056 + }, + { + "epoch": 0.73, + "learning_rate": 3.3991089872048078e-06, + "loss": 0.6292, + "step": 21057 + }, + { + "epoch": 0.73, + "learning_rate": 3.3982910849322004e-06, + "loss": 0.6472, + "step": 21058 + }, + { + "epoch": 0.73, + "learning_rate": 3.3974732609312e-06, + "loss": 0.631, + "step": 21059 + }, + { + "epoch": 0.73, + "learning_rate": 3.3966555152115068e-06, + "loss": 0.6798, + "step": 21060 + }, + { + "epoch": 0.73, + "learning_rate": 3.395837847782816e-06, + "loss": 0.6576, + "step": 21061 + }, + { + "epoch": 0.73, + "learning_rate": 3.395020258654821e-06, + "loss": 0.6522, + "step": 21062 + }, + { + "epoch": 0.73, + "learning_rate": 3.3942027478372196e-06, + "loss": 0.6703, + "step": 21063 + }, + { + "epoch": 0.73, + "learning_rate": 3.3933853153396977e-06, + "loss": 0.6894, + "step": 21064 + }, + { + "epoch": 0.73, + "learning_rate": 3.39256796117195e-06, + "loss": 0.6674, + "step": 21065 + }, + { + "epoch": 0.73, + "learning_rate": 3.3917506853436675e-06, + "loss": 0.634, + "step": 21066 + }, + { + "epoch": 0.73, + "learning_rate": 3.3909334878645416e-06, + "loss": 0.6179, + "step": 21067 + }, + { + "epoch": 0.73, + "learning_rate": 3.3901163687442582e-06, + "loss": 0.6921, + "step": 21068 + }, + { + "epoch": 0.73, + "learning_rate": 3.38929932799251e-06, + "loss": 0.6414, + "step": 21069 + }, + { + "epoch": 0.73, + "learning_rate": 3.388482365618979e-06, + "loss": 0.6258, + "step": 21070 + }, + { + "epoch": 0.73, + "learning_rate": 3.387665481633352e-06, + "loss": 0.6191, + "step": 21071 + }, + { + "epoch": 0.73, + "learning_rate": 3.3868486760453157e-06, + "loss": 0.648, + "step": 21072 + }, + { + "epoch": 0.73, + "learning_rate": 3.3860319488645544e-06, + "loss": 0.636, + "step": 21073 + }, + { + "epoch": 0.73, + "learning_rate": 3.3852153001007506e-06, + "loss": 0.6217, + "step": 21074 + }, + { + "epoch": 0.73, + "learning_rate": 3.3843987297635906e-06, + "loss": 0.6255, + "step": 21075 + }, + { + "epoch": 0.73, + "learning_rate": 3.383582237862749e-06, + "loss": 0.6491, + "step": 21076 + }, + { + "epoch": 0.73, + "learning_rate": 3.3827658244079096e-06, + "loss": 0.6288, + "step": 21077 + }, + { + "epoch": 0.73, + "learning_rate": 3.3819494894087523e-06, + "loss": 0.6631, + "step": 21078 + }, + { + "epoch": 0.73, + "learning_rate": 3.3811332328749558e-06, + "loss": 0.5884, + "step": 21079 + }, + { + "epoch": 0.73, + "learning_rate": 3.380317054816198e-06, + "loss": 0.6004, + "step": 21080 + }, + { + "epoch": 0.73, + "learning_rate": 3.379500955242159e-06, + "loss": 0.5747, + "step": 21081 + }, + { + "epoch": 0.73, + "learning_rate": 3.3786849341625072e-06, + "loss": 0.6494, + "step": 21082 + }, + { + "epoch": 0.73, + "learning_rate": 3.377868991586921e-06, + "loss": 0.6475, + "step": 21083 + }, + { + "epoch": 0.73, + "learning_rate": 3.3770531275250763e-06, + "loss": 0.6205, + "step": 21084 + }, + { + "epoch": 0.73, + "learning_rate": 3.3762373419866432e-06, + "loss": 0.6017, + "step": 21085 + }, + { + "epoch": 0.73, + "learning_rate": 3.3754216349812972e-06, + "loss": 0.6281, + "step": 21086 + }, + { + "epoch": 0.73, + "learning_rate": 3.37460600651871e-06, + "loss": 0.6445, + "step": 21087 + }, + { + "epoch": 0.73, + "learning_rate": 3.3737904566085465e-06, + "loss": 0.5806, + "step": 21088 + }, + { + "epoch": 0.73, + "learning_rate": 3.37297498526048e-06, + "loss": 0.6361, + "step": 21089 + }, + { + "epoch": 0.73, + "learning_rate": 3.372159592484179e-06, + "loss": 0.6655, + "step": 21090 + }, + { + "epoch": 0.73, + "learning_rate": 3.3713442782893093e-06, + "loss": 0.6049, + "step": 21091 + }, + { + "epoch": 0.73, + "learning_rate": 3.3705290426855375e-06, + "loss": 0.6346, + "step": 21092 + }, + { + "epoch": 0.73, + "learning_rate": 3.3697138856825353e-06, + "loss": 0.6307, + "step": 21093 + }, + { + "epoch": 0.73, + "learning_rate": 3.3688988072899577e-06, + "loss": 0.6525, + "step": 21094 + }, + { + "epoch": 0.73, + "learning_rate": 3.368083807517474e-06, + "loss": 0.6617, + "step": 21095 + }, + { + "epoch": 0.73, + "learning_rate": 3.367268886374745e-06, + "loss": 0.7749, + "step": 21096 + }, + { + "epoch": 0.73, + "learning_rate": 3.3664540438714357e-06, + "loss": 0.6352, + "step": 21097 + }, + { + "epoch": 0.73, + "learning_rate": 3.3656392800172034e-06, + "loss": 0.6077, + "step": 21098 + }, + { + "epoch": 0.73, + "learning_rate": 3.364824594821714e-06, + "loss": 0.6434, + "step": 21099 + }, + { + "epoch": 0.73, + "learning_rate": 3.3640099882946198e-06, + "loss": 0.6095, + "step": 21100 + }, + { + "epoch": 0.73, + "learning_rate": 3.3631954604455807e-06, + "loss": 0.5617, + "step": 21101 + }, + { + "epoch": 0.73, + "learning_rate": 3.362381011284256e-06, + "loss": 0.6207, + "step": 21102 + }, + { + "epoch": 0.73, + "learning_rate": 3.3615666408202996e-06, + "loss": 0.6282, + "step": 21103 + }, + { + "epoch": 0.73, + "learning_rate": 3.36075234906337e-06, + "loss": 0.6914, + "step": 21104 + }, + { + "epoch": 0.73, + "learning_rate": 3.359938136023122e-06, + "loss": 0.6372, + "step": 21105 + }, + { + "epoch": 0.73, + "learning_rate": 3.3591240017092053e-06, + "loss": 0.6638, + "step": 21106 + }, + { + "epoch": 0.73, + "learning_rate": 3.358309946131273e-06, + "loss": 0.6629, + "step": 21107 + }, + { + "epoch": 0.73, + "learning_rate": 3.357495969298978e-06, + "loss": 0.6839, + "step": 21108 + }, + { + "epoch": 0.73, + "learning_rate": 3.3566820712219716e-06, + "loss": 0.6501, + "step": 21109 + }, + { + "epoch": 0.73, + "learning_rate": 3.355868251909904e-06, + "loss": 0.6119, + "step": 21110 + }, + { + "epoch": 0.73, + "learning_rate": 3.3550545113724253e-06, + "loss": 0.63, + "step": 21111 + }, + { + "epoch": 0.73, + "learning_rate": 3.354240849619178e-06, + "loss": 0.5963, + "step": 21112 + }, + { + "epoch": 0.73, + "learning_rate": 3.3534272666598124e-06, + "loss": 0.6537, + "step": 21113 + }, + { + "epoch": 0.73, + "learning_rate": 3.3526137625039745e-06, + "loss": 0.651, + "step": 21114 + }, + { + "epoch": 0.73, + "learning_rate": 3.3518003371613095e-06, + "loss": 0.5845, + "step": 21115 + }, + { + "epoch": 0.73, + "learning_rate": 3.3509869906414617e-06, + "loss": 0.6451, + "step": 21116 + }, + { + "epoch": 0.73, + "learning_rate": 3.3501737229540775e-06, + "loss": 0.6833, + "step": 21117 + }, + { + "epoch": 0.73, + "learning_rate": 3.349360534108792e-06, + "loss": 0.607, + "step": 21118 + }, + { + "epoch": 0.73, + "learning_rate": 3.3485474241152514e-06, + "loss": 0.6596, + "step": 21119 + }, + { + "epoch": 0.73, + "learning_rate": 3.347734392983095e-06, + "loss": 0.5705, + "step": 21120 + }, + { + "epoch": 0.73, + "learning_rate": 3.3469214407219617e-06, + "loss": 0.5733, + "step": 21121 + }, + { + "epoch": 0.73, + "learning_rate": 3.346108567341495e-06, + "loss": 0.6313, + "step": 21122 + }, + { + "epoch": 0.73, + "learning_rate": 3.3452957728513247e-06, + "loss": 0.6234, + "step": 21123 + }, + { + "epoch": 0.73, + "learning_rate": 3.344483057261092e-06, + "loss": 0.6469, + "step": 21124 + }, + { + "epoch": 0.73, + "learning_rate": 3.343670420580435e-06, + "loss": 0.7004, + "step": 21125 + }, + { + "epoch": 0.73, + "learning_rate": 3.342857862818978e-06, + "loss": 0.6452, + "step": 21126 + }, + { + "epoch": 0.73, + "learning_rate": 3.3420453839863664e-06, + "loss": 0.6409, + "step": 21127 + }, + { + "epoch": 0.73, + "learning_rate": 3.341232984092232e-06, + "loss": 0.7064, + "step": 21128 + }, + { + "epoch": 0.73, + "learning_rate": 3.340420663146201e-06, + "loss": 0.5995, + "step": 21129 + }, + { + "epoch": 0.73, + "learning_rate": 3.339608421157907e-06, + "loss": 0.617, + "step": 21130 + }, + { + "epoch": 0.73, + "learning_rate": 3.338796258136985e-06, + "loss": 0.6628, + "step": 21131 + }, + { + "epoch": 0.73, + "learning_rate": 3.337984174093053e-06, + "loss": 0.691, + "step": 21132 + }, + { + "epoch": 0.73, + "learning_rate": 3.3371721690357483e-06, + "loss": 0.6374, + "step": 21133 + }, + { + "epoch": 0.73, + "learning_rate": 3.3363602429747e-06, + "loss": 0.6774, + "step": 21134 + }, + { + "epoch": 0.73, + "learning_rate": 3.335548395919528e-06, + "loss": 0.6046, + "step": 21135 + }, + { + "epoch": 0.73, + "learning_rate": 3.334736627879859e-06, + "loss": 0.6633, + "step": 21136 + }, + { + "epoch": 0.73, + "learning_rate": 3.333924938865323e-06, + "loss": 0.62, + "step": 21137 + }, + { + "epoch": 0.73, + "learning_rate": 3.3331133288855323e-06, + "loss": 0.6253, + "step": 21138 + }, + { + "epoch": 0.73, + "learning_rate": 3.3323017979501206e-06, + "loss": 0.626, + "step": 21139 + }, + { + "epoch": 0.73, + "learning_rate": 3.331490346068709e-06, + "loss": 0.641, + "step": 21140 + }, + { + "epoch": 0.73, + "learning_rate": 3.3306789732509115e-06, + "loss": 0.6273, + "step": 21141 + }, + { + "epoch": 0.73, + "learning_rate": 3.329867679506351e-06, + "loss": 0.6706, + "step": 21142 + }, + { + "epoch": 0.73, + "learning_rate": 3.329056464844651e-06, + "loss": 0.6555, + "step": 21143 + }, + { + "epoch": 0.73, + "learning_rate": 3.3282453292754193e-06, + "loss": 0.6277, + "step": 21144 + }, + { + "epoch": 0.73, + "learning_rate": 3.327434272808281e-06, + "loss": 0.6529, + "step": 21145 + }, + { + "epoch": 0.73, + "learning_rate": 3.3266232954528543e-06, + "loss": 0.6656, + "step": 21146 + }, + { + "epoch": 0.73, + "learning_rate": 3.325812397218747e-06, + "loss": 0.6044, + "step": 21147 + }, + { + "epoch": 0.73, + "learning_rate": 3.3250015781155763e-06, + "loss": 0.6334, + "step": 21148 + }, + { + "epoch": 0.73, + "learning_rate": 3.3241908381529596e-06, + "loss": 0.6546, + "step": 21149 + }, + { + "epoch": 0.73, + "learning_rate": 3.323380177340498e-06, + "loss": 0.6283, + "step": 21150 + }, + { + "epoch": 0.73, + "learning_rate": 3.322569595687816e-06, + "loss": 0.6421, + "step": 21151 + }, + { + "epoch": 0.73, + "learning_rate": 3.3217590932045198e-06, + "loss": 0.5841, + "step": 21152 + }, + { + "epoch": 0.73, + "learning_rate": 3.3209486699002136e-06, + "loss": 0.6304, + "step": 21153 + }, + { + "epoch": 0.73, + "learning_rate": 3.320138325784511e-06, + "loss": 0.6412, + "step": 21154 + }, + { + "epoch": 0.73, + "learning_rate": 3.319328060867022e-06, + "loss": 0.5764, + "step": 21155 + }, + { + "epoch": 0.73, + "learning_rate": 3.3185178751573434e-06, + "loss": 0.6458, + "step": 21156 + }, + { + "epoch": 0.73, + "learning_rate": 3.3177077686650905e-06, + "loss": 0.5925, + "step": 21157 + }, + { + "epoch": 0.73, + "learning_rate": 3.3168977413998683e-06, + "loss": 0.6653, + "step": 21158 + }, + { + "epoch": 0.73, + "learning_rate": 3.3160877933712744e-06, + "loss": 0.6542, + "step": 21159 + }, + { + "epoch": 0.73, + "learning_rate": 3.3152779245889143e-06, + "loss": 0.6249, + "step": 21160 + }, + { + "epoch": 0.73, + "learning_rate": 3.314468135062394e-06, + "loss": 0.5904, + "step": 21161 + }, + { + "epoch": 0.73, + "learning_rate": 3.313658424801306e-06, + "loss": 0.5965, + "step": 21162 + }, + { + "epoch": 0.73, + "learning_rate": 3.3128487938152575e-06, + "loss": 0.6198, + "step": 21163 + }, + { + "epoch": 0.73, + "learning_rate": 3.31203924211385e-06, + "loss": 0.6716, + "step": 21164 + }, + { + "epoch": 0.73, + "learning_rate": 3.311229769706674e-06, + "loss": 0.5978, + "step": 21165 + }, + { + "epoch": 0.73, + "learning_rate": 3.3104203766033305e-06, + "loss": 0.6434, + "step": 21166 + }, + { + "epoch": 0.73, + "learning_rate": 3.3096110628134194e-06, + "loss": 0.6108, + "step": 21167 + }, + { + "epoch": 0.73, + "learning_rate": 3.3088018283465253e-06, + "loss": 0.627, + "step": 21168 + }, + { + "epoch": 0.73, + "learning_rate": 3.3079926732122537e-06, + "loss": 0.5663, + "step": 21169 + }, + { + "epoch": 0.73, + "learning_rate": 3.307183597420197e-06, + "loss": 0.6704, + "step": 21170 + }, + { + "epoch": 0.73, + "learning_rate": 3.3063746009799426e-06, + "loss": 0.6554, + "step": 21171 + }, + { + "epoch": 0.73, + "learning_rate": 3.305565683901084e-06, + "loss": 0.6457, + "step": 21172 + }, + { + "epoch": 0.73, + "learning_rate": 3.3047568461932167e-06, + "loss": 0.6356, + "step": 21173 + }, + { + "epoch": 0.73, + "learning_rate": 3.3039480878659204e-06, + "loss": 0.644, + "step": 21174 + }, + { + "epoch": 0.73, + "learning_rate": 3.303139408928793e-06, + "loss": 0.6568, + "step": 21175 + }, + { + "epoch": 0.73, + "learning_rate": 3.302330809391422e-06, + "loss": 0.6041, + "step": 21176 + }, + { + "epoch": 0.73, + "learning_rate": 3.301522289263389e-06, + "loss": 0.5992, + "step": 21177 + }, + { + "epoch": 0.73, + "learning_rate": 3.3007138485542834e-06, + "loss": 0.6211, + "step": 21178 + }, + { + "epoch": 0.73, + "learning_rate": 3.2999054872736925e-06, + "loss": 0.6679, + "step": 21179 + }, + { + "epoch": 0.73, + "learning_rate": 3.299097205431191e-06, + "loss": 0.6732, + "step": 21180 + }, + { + "epoch": 0.73, + "learning_rate": 3.2982890030363723e-06, + "loss": 0.6329, + "step": 21181 + }, + { + "epoch": 0.73, + "learning_rate": 3.297480880098819e-06, + "loss": 0.6155, + "step": 21182 + }, + { + "epoch": 0.73, + "learning_rate": 3.2966728366281044e-06, + "loss": 0.6378, + "step": 21183 + }, + { + "epoch": 0.73, + "learning_rate": 3.295864872633817e-06, + "loss": 0.6636, + "step": 21184 + }, + { + "epoch": 0.73, + "learning_rate": 3.295056988125529e-06, + "loss": 0.6227, + "step": 21185 + }, + { + "epoch": 0.73, + "learning_rate": 3.294249183112819e-06, + "loss": 0.6163, + "step": 21186 + }, + { + "epoch": 0.73, + "learning_rate": 3.2934414576052733e-06, + "loss": 0.613, + "step": 21187 + }, + { + "epoch": 0.73, + "learning_rate": 3.292633811612461e-06, + "loss": 0.618, + "step": 21188 + }, + { + "epoch": 0.73, + "learning_rate": 3.2918262451439585e-06, + "loss": 0.6731, + "step": 21189 + }, + { + "epoch": 0.73, + "learning_rate": 3.2910187582093454e-06, + "loss": 0.6525, + "step": 21190 + }, + { + "epoch": 0.73, + "learning_rate": 3.29021135081819e-06, + "loss": 0.679, + "step": 21191 + }, + { + "epoch": 0.73, + "learning_rate": 3.2894040229800618e-06, + "loss": 0.679, + "step": 21192 + }, + { + "epoch": 0.73, + "learning_rate": 3.2885967747045456e-06, + "loss": 0.6148, + "step": 21193 + }, + { + "epoch": 0.73, + "learning_rate": 3.2877896060012005e-06, + "loss": 0.565, + "step": 21194 + }, + { + "epoch": 0.73, + "learning_rate": 3.286982516879601e-06, + "loss": 0.637, + "step": 21195 + }, + { + "epoch": 0.73, + "learning_rate": 3.2861755073493195e-06, + "loss": 0.6294, + "step": 21196 + }, + { + "epoch": 0.73, + "learning_rate": 3.2853685774199163e-06, + "loss": 0.6385, + "step": 21197 + }, + { + "epoch": 0.73, + "learning_rate": 3.28456172710096e-06, + "loss": 0.6469, + "step": 21198 + }, + { + "epoch": 0.73, + "learning_rate": 3.2837549564020254e-06, + "loss": 0.64, + "step": 21199 + }, + { + "epoch": 0.73, + "learning_rate": 3.2829482653326692e-06, + "loss": 0.6538, + "step": 21200 + }, + { + "epoch": 0.73, + "learning_rate": 3.2821416539024586e-06, + "loss": 0.5938, + "step": 21201 + }, + { + "epoch": 0.73, + "learning_rate": 3.281335122120959e-06, + "loss": 0.6845, + "step": 21202 + }, + { + "epoch": 0.73, + "learning_rate": 3.280528669997729e-06, + "loss": 0.677, + "step": 21203 + }, + { + "epoch": 0.73, + "learning_rate": 3.2797222975423273e-06, + "loss": 0.6419, + "step": 21204 + }, + { + "epoch": 0.73, + "learning_rate": 3.2789160047643254e-06, + "loss": 0.5889, + "step": 21205 + }, + { + "epoch": 0.73, + "learning_rate": 3.278109791673274e-06, + "loss": 0.6634, + "step": 21206 + }, + { + "epoch": 0.73, + "learning_rate": 3.2773036582787343e-06, + "loss": 0.5935, + "step": 21207 + }, + { + "epoch": 0.73, + "learning_rate": 3.2764976045902664e-06, + "loss": 0.6382, + "step": 21208 + }, + { + "epoch": 0.73, + "learning_rate": 3.2756916306174224e-06, + "loss": 0.5961, + "step": 21209 + }, + { + "epoch": 0.73, + "learning_rate": 3.2748857363697563e-06, + "loss": 0.7141, + "step": 21210 + }, + { + "epoch": 0.73, + "learning_rate": 3.2740799218568344e-06, + "loss": 0.6008, + "step": 21211 + }, + { + "epoch": 0.73, + "learning_rate": 3.273274187088199e-06, + "loss": 0.5838, + "step": 21212 + }, + { + "epoch": 0.73, + "learning_rate": 3.2724685320734083e-06, + "loss": 0.5717, + "step": 21213 + }, + { + "epoch": 0.74, + "learning_rate": 3.271662956822017e-06, + "loss": 0.6485, + "step": 21214 + }, + { + "epoch": 0.74, + "learning_rate": 3.2708574613435685e-06, + "loss": 0.6238, + "step": 21215 + }, + { + "epoch": 0.74, + "learning_rate": 3.270052045647615e-06, + "loss": 0.6264, + "step": 21216 + }, + { + "epoch": 0.74, + "learning_rate": 3.2692467097437143e-06, + "loss": 0.6244, + "step": 21217 + }, + { + "epoch": 0.74, + "learning_rate": 3.2684414536414045e-06, + "loss": 0.6362, + "step": 21218 + }, + { + "epoch": 0.74, + "learning_rate": 3.2676362773502367e-06, + "loss": 0.6449, + "step": 21219 + }, + { + "epoch": 0.74, + "learning_rate": 3.2668311808797604e-06, + "loss": 0.6251, + "step": 21220 + }, + { + "epoch": 0.74, + "learning_rate": 3.2660261642395153e-06, + "loss": 0.6043, + "step": 21221 + }, + { + "epoch": 0.74, + "learning_rate": 3.265221227439045e-06, + "loss": 0.6122, + "step": 21222 + }, + { + "epoch": 0.74, + "learning_rate": 3.264416370487904e-06, + "loss": 0.694, + "step": 21223 + }, + { + "epoch": 0.74, + "learning_rate": 3.2636115933956224e-06, + "loss": 0.6239, + "step": 21224 + }, + { + "epoch": 0.74, + "learning_rate": 3.2628068961717486e-06, + "loss": 0.6398, + "step": 21225 + }, + { + "epoch": 0.74, + "learning_rate": 3.2620022788258244e-06, + "loss": 0.6387, + "step": 21226 + }, + { + "epoch": 0.74, + "learning_rate": 3.2611977413673836e-06, + "loss": 0.6182, + "step": 21227 + }, + { + "epoch": 0.74, + "learning_rate": 3.260393283805965e-06, + "loss": 0.623, + "step": 21228 + }, + { + "epoch": 0.74, + "learning_rate": 3.2595889061511156e-06, + "loss": 0.6074, + "step": 21229 + }, + { + "epoch": 0.74, + "learning_rate": 3.2587846084123633e-06, + "loss": 0.6569, + "step": 21230 + }, + { + "epoch": 0.74, + "learning_rate": 3.257980390599247e-06, + "loss": 0.5722, + "step": 21231 + }, + { + "epoch": 0.74, + "learning_rate": 3.257176252721306e-06, + "loss": 0.6447, + "step": 21232 + }, + { + "epoch": 0.74, + "learning_rate": 3.2563721947880667e-06, + "loss": 0.6122, + "step": 21233 + }, + { + "epoch": 0.74, + "learning_rate": 3.255568216809062e-06, + "loss": 0.6564, + "step": 21234 + }, + { + "epoch": 0.74, + "learning_rate": 3.254764318793834e-06, + "loss": 0.6879, + "step": 21235 + }, + { + "epoch": 0.74, + "learning_rate": 3.2539605007519048e-06, + "loss": 0.601, + "step": 21236 + }, + { + "epoch": 0.74, + "learning_rate": 3.2531567626928083e-06, + "loss": 0.6094, + "step": 21237 + }, + { + "epoch": 0.74, + "learning_rate": 3.252353104626076e-06, + "loss": 0.6361, + "step": 21238 + }, + { + "epoch": 0.74, + "learning_rate": 3.2515495265612305e-06, + "loss": 0.5882, + "step": 21239 + }, + { + "epoch": 0.74, + "learning_rate": 3.2507460285077985e-06, + "loss": 0.6124, + "step": 21240 + }, + { + "epoch": 0.74, + "learning_rate": 3.2499426104753174e-06, + "loss": 0.5776, + "step": 21241 + }, + { + "epoch": 0.74, + "learning_rate": 3.2491392724733018e-06, + "loss": 0.6332, + "step": 21242 + }, + { + "epoch": 0.74, + "learning_rate": 3.2483360145112795e-06, + "loss": 0.6032, + "step": 21243 + }, + { + "epoch": 0.74, + "learning_rate": 3.247532836598779e-06, + "loss": 0.5747, + "step": 21244 + }, + { + "epoch": 0.74, + "learning_rate": 3.2467297387453143e-06, + "loss": 0.6444, + "step": 21245 + }, + { + "epoch": 0.74, + "learning_rate": 3.2459267209604118e-06, + "loss": 0.6695, + "step": 21246 + }, + { + "epoch": 0.74, + "learning_rate": 3.2451237832535932e-06, + "loss": 0.67, + "step": 21247 + }, + { + "epoch": 0.74, + "learning_rate": 3.2443209256343756e-06, + "loss": 0.7109, + "step": 21248 + }, + { + "epoch": 0.74, + "learning_rate": 3.2435181481122837e-06, + "loss": 0.5949, + "step": 21249 + }, + { + "epoch": 0.74, + "learning_rate": 3.2427154506968263e-06, + "loss": 0.6263, + "step": 21250 + }, + { + "epoch": 0.74, + "learning_rate": 3.241912833397527e-06, + "loss": 0.6851, + "step": 21251 + }, + { + "epoch": 0.74, + "learning_rate": 3.241110296223898e-06, + "loss": 0.5782, + "step": 21252 + }, + { + "epoch": 0.74, + "learning_rate": 3.240307839185458e-06, + "loss": 0.592, + "step": 21253 + }, + { + "epoch": 0.74, + "learning_rate": 3.23950546229172e-06, + "loss": 0.7001, + "step": 21254 + }, + { + "epoch": 0.74, + "learning_rate": 3.2387031655521994e-06, + "loss": 0.6343, + "step": 21255 + }, + { + "epoch": 0.74, + "learning_rate": 3.2379009489764024e-06, + "loss": 0.6413, + "step": 21256 + }, + { + "epoch": 0.74, + "learning_rate": 3.2370988125738443e-06, + "loss": 0.6507, + "step": 21257 + }, + { + "epoch": 0.74, + "learning_rate": 3.2362967563540347e-06, + "loss": 0.5638, + "step": 21258 + }, + { + "epoch": 0.74, + "learning_rate": 3.2354947803264837e-06, + "loss": 0.6065, + "step": 21259 + }, + { + "epoch": 0.74, + "learning_rate": 3.2346928845006987e-06, + "loss": 0.6425, + "step": 21260 + }, + { + "epoch": 0.74, + "learning_rate": 3.2338910688861903e-06, + "loss": 0.6632, + "step": 21261 + }, + { + "epoch": 0.74, + "learning_rate": 3.2330893334924596e-06, + "loss": 0.6167, + "step": 21262 + }, + { + "epoch": 0.74, + "learning_rate": 3.232287678329016e-06, + "loss": 0.6422, + "step": 21263 + }, + { + "epoch": 0.74, + "learning_rate": 3.2314861034053624e-06, + "loss": 0.5571, + "step": 21264 + }, + { + "epoch": 0.74, + "learning_rate": 3.230684608731003e-06, + "loss": 0.6397, + "step": 21265 + }, + { + "epoch": 0.74, + "learning_rate": 3.2298831943154406e-06, + "loss": 0.6619, + "step": 21266 + }, + { + "epoch": 0.74, + "learning_rate": 3.2290818601681818e-06, + "loss": 0.6022, + "step": 21267 + }, + { + "epoch": 0.74, + "learning_rate": 3.2282806062987183e-06, + "loss": 0.6641, + "step": 21268 + }, + { + "epoch": 0.74, + "learning_rate": 3.2274794327165547e-06, + "loss": 0.66, + "step": 21269 + }, + { + "epoch": 0.74, + "learning_rate": 3.2266783394311896e-06, + "loss": 0.6218, + "step": 21270 + }, + { + "epoch": 0.74, + "learning_rate": 3.2258773264521216e-06, + "loss": 0.5942, + "step": 21271 + }, + { + "epoch": 0.74, + "learning_rate": 3.225076393788846e-06, + "loss": 0.6226, + "step": 21272 + }, + { + "epoch": 0.74, + "learning_rate": 3.2242755414508654e-06, + "loss": 0.6757, + "step": 21273 + }, + { + "epoch": 0.74, + "learning_rate": 3.2234747694476654e-06, + "loss": 0.6157, + "step": 21274 + }, + { + "epoch": 0.74, + "learning_rate": 3.2226740777887435e-06, + "loss": 0.6645, + "step": 21275 + }, + { + "epoch": 0.74, + "learning_rate": 3.221873466483595e-06, + "loss": 0.6432, + "step": 21276 + }, + { + "epoch": 0.74, + "learning_rate": 3.2210729355417103e-06, + "loss": 0.635, + "step": 21277 + }, + { + "epoch": 0.74, + "learning_rate": 3.2202724849725806e-06, + "loss": 0.6533, + "step": 21278 + }, + { + "epoch": 0.74, + "learning_rate": 3.219472114785701e-06, + "loss": 0.6256, + "step": 21279 + }, + { + "epoch": 0.74, + "learning_rate": 3.2186718249905534e-06, + "loss": 0.6221, + "step": 21280 + }, + { + "epoch": 0.74, + "learning_rate": 3.2178716155966307e-06, + "loss": 0.6517, + "step": 21281 + }, + { + "epoch": 0.74, + "learning_rate": 3.217071486613419e-06, + "loss": 0.6636, + "step": 21282 + }, + { + "epoch": 0.74, + "learning_rate": 3.2162714380504044e-06, + "loss": 0.6313, + "step": 21283 + }, + { + "epoch": 0.74, + "learning_rate": 3.2154714699170742e-06, + "loss": 0.6693, + "step": 21284 + }, + { + "epoch": 0.74, + "learning_rate": 3.2146715822229157e-06, + "loss": 0.6388, + "step": 21285 + }, + { + "epoch": 0.74, + "learning_rate": 3.213871774977405e-06, + "loss": 0.6868, + "step": 21286 + }, + { + "epoch": 0.74, + "learning_rate": 3.213072048190029e-06, + "loss": 0.6459, + "step": 21287 + }, + { + "epoch": 0.74, + "learning_rate": 3.21227240187027e-06, + "loss": 0.6406, + "step": 21288 + }, + { + "epoch": 0.74, + "learning_rate": 3.211472836027608e-06, + "loss": 0.6556, + "step": 21289 + }, + { + "epoch": 0.74, + "learning_rate": 3.2106733506715228e-06, + "loss": 0.6083, + "step": 21290 + }, + { + "epoch": 0.74, + "learning_rate": 3.2098739458114967e-06, + "loss": 0.6301, + "step": 21291 + }, + { + "epoch": 0.74, + "learning_rate": 3.209074621457001e-06, + "loss": 0.5846, + "step": 21292 + }, + { + "epoch": 0.74, + "learning_rate": 3.208275377617517e-06, + "loss": 0.6225, + "step": 21293 + }, + { + "epoch": 0.74, + "learning_rate": 3.2074762143025196e-06, + "loss": 0.6166, + "step": 21294 + }, + { + "epoch": 0.74, + "learning_rate": 3.206677131521485e-06, + "loss": 0.5802, + "step": 21295 + }, + { + "epoch": 0.74, + "learning_rate": 3.205878129283886e-06, + "loss": 0.6555, + "step": 21296 + }, + { + "epoch": 0.74, + "learning_rate": 3.205079207599199e-06, + "loss": 0.559, + "step": 21297 + }, + { + "epoch": 0.74, + "learning_rate": 3.2042803664768907e-06, + "loss": 0.6519, + "step": 21298 + }, + { + "epoch": 0.74, + "learning_rate": 3.2034816059264363e-06, + "loss": 0.6301, + "step": 21299 + }, + { + "epoch": 0.74, + "learning_rate": 3.2026829259573044e-06, + "loss": 0.6509, + "step": 21300 + }, + { + "epoch": 0.74, + "learning_rate": 3.2018843265789647e-06, + "loss": 0.6827, + "step": 21301 + }, + { + "epoch": 0.74, + "learning_rate": 3.2010858078008866e-06, + "loss": 0.6468, + "step": 21302 + }, + { + "epoch": 0.74, + "learning_rate": 3.20028736963254e-06, + "loss": 0.6231, + "step": 21303 + }, + { + "epoch": 0.74, + "learning_rate": 3.1994890120833844e-06, + "loss": 0.6524, + "step": 21304 + }, + { + "epoch": 0.74, + "learning_rate": 3.1986907351628894e-06, + "loss": 0.6079, + "step": 21305 + }, + { + "epoch": 0.74, + "learning_rate": 3.1978925388805206e-06, + "loss": 0.6281, + "step": 21306 + }, + { + "epoch": 0.74, + "learning_rate": 3.197094423245739e-06, + "loss": 0.5978, + "step": 21307 + }, + { + "epoch": 0.74, + "learning_rate": 3.1962963882680133e-06, + "loss": 0.6377, + "step": 21308 + }, + { + "epoch": 0.74, + "learning_rate": 3.1954984339567964e-06, + "loss": 0.6378, + "step": 21309 + }, + { + "epoch": 0.74, + "learning_rate": 3.194700560321554e-06, + "loss": 0.6439, + "step": 21310 + }, + { + "epoch": 0.74, + "learning_rate": 3.193902767371745e-06, + "loss": 0.5908, + "step": 21311 + }, + { + "epoch": 0.74, + "learning_rate": 3.1931050551168276e-06, + "loss": 0.6331, + "step": 21312 + }, + { + "epoch": 0.74, + "learning_rate": 3.192307423566261e-06, + "loss": 0.6624, + "step": 21313 + }, + { + "epoch": 0.74, + "learning_rate": 3.191509872729506e-06, + "loss": 0.6111, + "step": 21314 + }, + { + "epoch": 0.74, + "learning_rate": 3.1907124026160095e-06, + "loss": 0.6433, + "step": 21315 + }, + { + "epoch": 0.74, + "learning_rate": 3.189915013235232e-06, + "loss": 0.6253, + "step": 21316 + }, + { + "epoch": 0.74, + "learning_rate": 3.189117704596627e-06, + "loss": 0.5823, + "step": 21317 + }, + { + "epoch": 0.74, + "learning_rate": 3.1883204767096478e-06, + "loss": 0.6254, + "step": 21318 + }, + { + "epoch": 0.74, + "learning_rate": 3.187523329583745e-06, + "loss": 0.6394, + "step": 21319 + }, + { + "epoch": 0.74, + "learning_rate": 3.1867262632283745e-06, + "loss": 0.5975, + "step": 21320 + }, + { + "epoch": 0.74, + "learning_rate": 3.1859292776529803e-06, + "loss": 0.6697, + "step": 21321 + }, + { + "epoch": 0.74, + "learning_rate": 3.1851323728670135e-06, + "loss": 0.6553, + "step": 21322 + }, + { + "epoch": 0.74, + "learning_rate": 3.1843355488799244e-06, + "loss": 0.6856, + "step": 21323 + }, + { + "epoch": 0.74, + "learning_rate": 3.1835388057011584e-06, + "loss": 0.6893, + "step": 21324 + }, + { + "epoch": 0.74, + "learning_rate": 3.182742143340163e-06, + "loss": 0.5886, + "step": 21325 + }, + { + "epoch": 0.74, + "learning_rate": 3.1819455618063868e-06, + "loss": 0.6352, + "step": 21326 + }, + { + "epoch": 0.74, + "learning_rate": 3.1811490611092667e-06, + "loss": 0.6207, + "step": 21327 + }, + { + "epoch": 0.74, + "learning_rate": 3.1803526412582507e-06, + "loss": 0.5792, + "step": 21328 + }, + { + "epoch": 0.74, + "learning_rate": 3.179556302262782e-06, + "loss": 0.5904, + "step": 21329 + }, + { + "epoch": 0.74, + "learning_rate": 3.178760044132301e-06, + "loss": 0.6308, + "step": 21330 + }, + { + "epoch": 0.74, + "learning_rate": 3.177963866876248e-06, + "loss": 0.6048, + "step": 21331 + }, + { + "epoch": 0.74, + "learning_rate": 3.1771677705040672e-06, + "loss": 0.6585, + "step": 21332 + }, + { + "epoch": 0.74, + "learning_rate": 3.1763717550251894e-06, + "loss": 0.5941, + "step": 21333 + }, + { + "epoch": 0.74, + "learning_rate": 3.1755758204490563e-06, + "loss": 0.6609, + "step": 21334 + }, + { + "epoch": 0.74, + "learning_rate": 3.1747799667851056e-06, + "loss": 0.6442, + "step": 21335 + }, + { + "epoch": 0.74, + "learning_rate": 3.173984194042772e-06, + "loss": 0.634, + "step": 21336 + }, + { + "epoch": 0.74, + "learning_rate": 3.1731885022314903e-06, + "loss": 0.6253, + "step": 21337 + }, + { + "epoch": 0.74, + "learning_rate": 3.1723928913606984e-06, + "loss": 0.5963, + "step": 21338 + }, + { + "epoch": 0.74, + "learning_rate": 3.171597361439822e-06, + "loss": 0.6093, + "step": 21339 + }, + { + "epoch": 0.74, + "learning_rate": 3.1708019124782974e-06, + "loss": 0.6338, + "step": 21340 + }, + { + "epoch": 0.74, + "learning_rate": 3.1700065444855554e-06, + "loss": 0.5978, + "step": 21341 + }, + { + "epoch": 0.74, + "learning_rate": 3.1692112574710254e-06, + "loss": 0.6314, + "step": 21342 + }, + { + "epoch": 0.74, + "learning_rate": 3.1684160514441374e-06, + "loss": 0.6126, + "step": 21343 + }, + { + "epoch": 0.74, + "learning_rate": 3.167620926414322e-06, + "loss": 0.668, + "step": 21344 + }, + { + "epoch": 0.74, + "learning_rate": 3.166825882391e-06, + "loss": 0.6087, + "step": 21345 + }, + { + "epoch": 0.74, + "learning_rate": 3.1660309193836016e-06, + "loss": 0.6541, + "step": 21346 + }, + { + "epoch": 0.74, + "learning_rate": 3.165236037401551e-06, + "loss": 0.6487, + "step": 21347 + }, + { + "epoch": 0.74, + "learning_rate": 3.164441236454274e-06, + "loss": 0.5822, + "step": 21348 + }, + { + "epoch": 0.74, + "learning_rate": 3.163646516551193e-06, + "loss": 0.6264, + "step": 21349 + }, + { + "epoch": 0.74, + "learning_rate": 3.162851877701734e-06, + "loss": 0.648, + "step": 21350 + }, + { + "epoch": 0.74, + "learning_rate": 3.1620573199153115e-06, + "loss": 0.6139, + "step": 21351 + }, + { + "epoch": 0.74, + "learning_rate": 3.161262843201349e-06, + "loss": 0.6464, + "step": 21352 + }, + { + "epoch": 0.74, + "learning_rate": 3.160468447569267e-06, + "loss": 0.6308, + "step": 21353 + }, + { + "epoch": 0.74, + "learning_rate": 3.159674133028484e-06, + "loss": 0.5582, + "step": 21354 + }, + { + "epoch": 0.74, + "learning_rate": 3.1588798995884172e-06, + "loss": 0.68, + "step": 21355 + }, + { + "epoch": 0.74, + "learning_rate": 3.1580857472584856e-06, + "loss": 0.6386, + "step": 21356 + }, + { + "epoch": 0.74, + "learning_rate": 3.1572916760480997e-06, + "loss": 0.6057, + "step": 21357 + }, + { + "epoch": 0.74, + "learning_rate": 3.1564976859666774e-06, + "loss": 0.6132, + "step": 21358 + }, + { + "epoch": 0.74, + "learning_rate": 3.155703777023632e-06, + "loss": 0.6686, + "step": 21359 + }, + { + "epoch": 0.74, + "learning_rate": 3.1549099492283762e-06, + "loss": 0.6081, + "step": 21360 + }, + { + "epoch": 0.74, + "learning_rate": 3.154116202590323e-06, + "loss": 0.653, + "step": 21361 + }, + { + "epoch": 0.74, + "learning_rate": 3.1533225371188847e-06, + "loss": 0.6475, + "step": 21362 + }, + { + "epoch": 0.74, + "learning_rate": 3.152528952823465e-06, + "loss": 0.6309, + "step": 21363 + }, + { + "epoch": 0.74, + "learning_rate": 3.151735449713478e-06, + "loss": 0.6385, + "step": 21364 + }, + { + "epoch": 0.74, + "learning_rate": 3.1509420277983293e-06, + "loss": 0.5848, + "step": 21365 + }, + { + "epoch": 0.74, + "learning_rate": 3.1501486870874263e-06, + "loss": 0.6125, + "step": 21366 + }, + { + "epoch": 0.74, + "learning_rate": 3.149355427590177e-06, + "loss": 0.6552, + "step": 21367 + }, + { + "epoch": 0.74, + "learning_rate": 3.1485622493159886e-06, + "loss": 0.6849, + "step": 21368 + }, + { + "epoch": 0.74, + "learning_rate": 3.1477691522742583e-06, + "loss": 0.66, + "step": 21369 + }, + { + "epoch": 0.74, + "learning_rate": 3.1469761364743956e-06, + "loss": 0.638, + "step": 21370 + }, + { + "epoch": 0.74, + "learning_rate": 3.146183201925793e-06, + "loss": 0.6501, + "step": 21371 + }, + { + "epoch": 0.74, + "learning_rate": 3.1453903486378634e-06, + "loss": 0.6443, + "step": 21372 + }, + { + "epoch": 0.74, + "learning_rate": 3.1445975766200044e-06, + "loss": 0.6143, + "step": 21373 + }, + { + "epoch": 0.74, + "learning_rate": 3.1438048858816106e-06, + "loss": 0.6498, + "step": 21374 + }, + { + "epoch": 0.74, + "learning_rate": 3.1430122764320824e-06, + "loss": 0.6268, + "step": 21375 + }, + { + "epoch": 0.74, + "learning_rate": 3.1422197482808226e-06, + "loss": 0.5967, + "step": 21376 + }, + { + "epoch": 0.74, + "learning_rate": 3.141427301437214e-06, + "loss": 0.641, + "step": 21377 + }, + { + "epoch": 0.74, + "learning_rate": 3.1406349359106657e-06, + "loss": 0.6037, + "step": 21378 + }, + { + "epoch": 0.74, + "learning_rate": 3.1398426517105707e-06, + "loss": 0.6617, + "step": 21379 + }, + { + "epoch": 0.74, + "learning_rate": 3.139050448846316e-06, + "loss": 0.6279, + "step": 21380 + }, + { + "epoch": 0.74, + "learning_rate": 3.138258327327296e-06, + "loss": 0.6454, + "step": 21381 + }, + { + "epoch": 0.74, + "learning_rate": 3.137466287162908e-06, + "loss": 0.595, + "step": 21382 + }, + { + "epoch": 0.74, + "learning_rate": 3.1366743283625322e-06, + "loss": 0.5761, + "step": 21383 + }, + { + "epoch": 0.74, + "learning_rate": 3.135882450935567e-06, + "loss": 0.6551, + "step": 21384 + }, + { + "epoch": 0.74, + "learning_rate": 3.135090654891402e-06, + "loss": 0.5782, + "step": 21385 + }, + { + "epoch": 0.74, + "learning_rate": 3.1342989402394174e-06, + "loss": 0.6619, + "step": 21386 + }, + { + "epoch": 0.74, + "learning_rate": 3.1335073069890043e-06, + "loss": 0.677, + "step": 21387 + }, + { + "epoch": 0.74, + "learning_rate": 3.1327157551495523e-06, + "loss": 0.6317, + "step": 21388 + }, + { + "epoch": 0.74, + "learning_rate": 3.1319242847304355e-06, + "loss": 0.643, + "step": 21389 + }, + { + "epoch": 0.74, + "learning_rate": 3.131132895741047e-06, + "loss": 0.6398, + "step": 21390 + }, + { + "epoch": 0.74, + "learning_rate": 3.1303415881907705e-06, + "loss": 0.6385, + "step": 21391 + }, + { + "epoch": 0.74, + "learning_rate": 3.1295503620889823e-06, + "loss": 0.6117, + "step": 21392 + }, + { + "epoch": 0.74, + "learning_rate": 3.128759217445065e-06, + "loss": 0.6272, + "step": 21393 + }, + { + "epoch": 0.74, + "learning_rate": 3.1279681542684026e-06, + "loss": 0.6728, + "step": 21394 + }, + { + "epoch": 0.74, + "learning_rate": 3.127177172568365e-06, + "loss": 0.6149, + "step": 21395 + }, + { + "epoch": 0.74, + "learning_rate": 3.1263862723543393e-06, + "loss": 0.6179, + "step": 21396 + }, + { + "epoch": 0.74, + "learning_rate": 3.1255954536357013e-06, + "loss": 0.5668, + "step": 21397 + }, + { + "epoch": 0.74, + "learning_rate": 3.1248047164218244e-06, + "loss": 0.6797, + "step": 21398 + }, + { + "epoch": 0.74, + "learning_rate": 3.1240140607220827e-06, + "loss": 0.6235, + "step": 21399 + }, + { + "epoch": 0.74, + "learning_rate": 3.1232234865458567e-06, + "loss": 0.6669, + "step": 21400 + }, + { + "epoch": 0.74, + "learning_rate": 3.122432993902509e-06, + "loss": 0.5861, + "step": 21401 + }, + { + "epoch": 0.74, + "learning_rate": 3.121642582801422e-06, + "loss": 0.6447, + "step": 21402 + }, + { + "epoch": 0.74, + "learning_rate": 3.120852253251966e-06, + "loss": 0.6308, + "step": 21403 + }, + { + "epoch": 0.74, + "learning_rate": 3.1200620052635057e-06, + "loss": 0.5996, + "step": 21404 + }, + { + "epoch": 0.74, + "learning_rate": 3.119271838845412e-06, + "loss": 0.6469, + "step": 21405 + }, + { + "epoch": 0.74, + "learning_rate": 3.11848175400706e-06, + "loss": 0.6424, + "step": 21406 + }, + { + "epoch": 0.74, + "learning_rate": 3.1176917507578054e-06, + "loss": 0.6463, + "step": 21407 + }, + { + "epoch": 0.74, + "learning_rate": 3.1169018291070242e-06, + "loss": 0.692, + "step": 21408 + }, + { + "epoch": 0.74, + "learning_rate": 3.1161119890640813e-06, + "loss": 0.6517, + "step": 21409 + }, + { + "epoch": 0.74, + "learning_rate": 3.1153222306383368e-06, + "loss": 0.5749, + "step": 21410 + }, + { + "epoch": 0.74, + "learning_rate": 3.1145325538391558e-06, + "loss": 0.6134, + "step": 21411 + }, + { + "epoch": 0.74, + "learning_rate": 3.113742958675905e-06, + "loss": 0.6499, + "step": 21412 + }, + { + "epoch": 0.74, + "learning_rate": 3.1129534451579357e-06, + "loss": 0.6252, + "step": 21413 + }, + { + "epoch": 0.74, + "learning_rate": 3.1121640132946195e-06, + "loss": 0.6517, + "step": 21414 + }, + { + "epoch": 0.74, + "learning_rate": 3.1113746630953146e-06, + "loss": 0.6327, + "step": 21415 + }, + { + "epoch": 0.74, + "learning_rate": 3.1105853945693744e-06, + "loss": 0.6257, + "step": 21416 + }, + { + "epoch": 0.74, + "learning_rate": 3.109796207726159e-06, + "loss": 0.6019, + "step": 21417 + }, + { + "epoch": 0.74, + "learning_rate": 3.109007102575029e-06, + "loss": 0.5746, + "step": 21418 + }, + { + "epoch": 0.74, + "learning_rate": 3.1082180791253314e-06, + "loss": 0.5588, + "step": 21419 + }, + { + "epoch": 0.74, + "learning_rate": 3.10742913738643e-06, + "loss": 0.5703, + "step": 21420 + }, + { + "epoch": 0.74, + "learning_rate": 3.1066402773676774e-06, + "loss": 0.65, + "step": 21421 + }, + { + "epoch": 0.74, + "learning_rate": 3.105851499078422e-06, + "loss": 0.6245, + "step": 21422 + }, + { + "epoch": 0.74, + "learning_rate": 3.105062802528017e-06, + "loss": 0.6297, + "step": 21423 + }, + { + "epoch": 0.74, + "learning_rate": 3.104274187725819e-06, + "loss": 0.7053, + "step": 21424 + }, + { + "epoch": 0.74, + "learning_rate": 3.1034856546811664e-06, + "loss": 0.615, + "step": 21425 + }, + { + "epoch": 0.74, + "learning_rate": 3.10269720340342e-06, + "loss": 0.6359, + "step": 21426 + }, + { + "epoch": 0.74, + "learning_rate": 3.1019088339019254e-06, + "loss": 0.6013, + "step": 21427 + }, + { + "epoch": 0.74, + "learning_rate": 3.101120546186025e-06, + "loss": 0.6778, + "step": 21428 + }, + { + "epoch": 0.74, + "learning_rate": 3.1003323402650677e-06, + "loss": 0.5834, + "step": 21429 + }, + { + "epoch": 0.74, + "learning_rate": 3.0995442161484015e-06, + "loss": 0.5976, + "step": 21430 + }, + { + "epoch": 0.74, + "learning_rate": 3.0987561738453618e-06, + "loss": 0.6521, + "step": 21431 + }, + { + "epoch": 0.74, + "learning_rate": 3.0979682133653033e-06, + "loss": 0.7011, + "step": 21432 + }, + { + "epoch": 0.74, + "learning_rate": 3.09718033471756e-06, + "loss": 0.5645, + "step": 21433 + }, + { + "epoch": 0.74, + "learning_rate": 3.096392537911477e-06, + "loss": 0.6231, + "step": 21434 + }, + { + "epoch": 0.74, + "learning_rate": 3.095604822956395e-06, + "loss": 0.7076, + "step": 21435 + }, + { + "epoch": 0.74, + "learning_rate": 3.0948171898616498e-06, + "loss": 0.6242, + "step": 21436 + }, + { + "epoch": 0.74, + "learning_rate": 3.094029638636579e-06, + "loss": 0.6659, + "step": 21437 + }, + { + "epoch": 0.74, + "learning_rate": 3.093242169290529e-06, + "loss": 0.6773, + "step": 21438 + }, + { + "epoch": 0.74, + "learning_rate": 3.0924547818328267e-06, + "loss": 0.6873, + "step": 21439 + }, + { + "epoch": 0.74, + "learning_rate": 3.0916674762728104e-06, + "loss": 0.5973, + "step": 21440 + }, + { + "epoch": 0.74, + "learning_rate": 3.09088025261982e-06, + "loss": 0.6734, + "step": 21441 + }, + { + "epoch": 0.74, + "learning_rate": 3.09009311088318e-06, + "loss": 0.6327, + "step": 21442 + }, + { + "epoch": 0.74, + "learning_rate": 3.089306051072225e-06, + "loss": 0.6257, + "step": 21443 + }, + { + "epoch": 0.74, + "learning_rate": 3.0885190731962946e-06, + "loss": 0.6167, + "step": 21444 + }, + { + "epoch": 0.74, + "learning_rate": 3.0877321772647095e-06, + "loss": 0.6495, + "step": 21445 + }, + { + "epoch": 0.74, + "learning_rate": 3.0869453632868053e-06, + "loss": 0.6885, + "step": 21446 + }, + { + "epoch": 0.74, + "learning_rate": 3.0861586312719104e-06, + "loss": 0.612, + "step": 21447 + }, + { + "epoch": 0.74, + "learning_rate": 3.085371981229349e-06, + "loss": 0.5931, + "step": 21448 + }, + { + "epoch": 0.74, + "learning_rate": 3.084585413168446e-06, + "loss": 0.5685, + "step": 21449 + }, + { + "epoch": 0.74, + "learning_rate": 3.083798927098538e-06, + "loss": 0.6605, + "step": 21450 + }, + { + "epoch": 0.74, + "learning_rate": 3.0830125230289386e-06, + "loss": 0.6766, + "step": 21451 + }, + { + "epoch": 0.74, + "learning_rate": 3.0822262009689774e-06, + "loss": 0.6488, + "step": 21452 + }, + { + "epoch": 0.74, + "learning_rate": 3.081439960927978e-06, + "loss": 0.5966, + "step": 21453 + }, + { + "epoch": 0.74, + "learning_rate": 3.0806538029152554e-06, + "loss": 0.6156, + "step": 21454 + }, + { + "epoch": 0.74, + "learning_rate": 3.0798677269401333e-06, + "loss": 0.5969, + "step": 21455 + }, + { + "epoch": 0.74, + "learning_rate": 3.0790817330119394e-06, + "loss": 0.6158, + "step": 21456 + }, + { + "epoch": 0.74, + "learning_rate": 3.0782958211399826e-06, + "loss": 0.6626, + "step": 21457 + }, + { + "epoch": 0.74, + "learning_rate": 3.077509991333586e-06, + "loss": 0.6361, + "step": 21458 + }, + { + "epoch": 0.74, + "learning_rate": 3.076724243602068e-06, + "loss": 0.6706, + "step": 21459 + }, + { + "epoch": 0.74, + "learning_rate": 3.0759385779547392e-06, + "loss": 0.6509, + "step": 21460 + }, + { + "epoch": 0.74, + "learning_rate": 3.0751529944009174e-06, + "loss": 0.6479, + "step": 21461 + }, + { + "epoch": 0.74, + "learning_rate": 3.074367492949917e-06, + "loss": 0.6072, + "step": 21462 + }, + { + "epoch": 0.74, + "learning_rate": 3.07358207361105e-06, + "loss": 0.5998, + "step": 21463 + }, + { + "epoch": 0.74, + "learning_rate": 3.0727967363936307e-06, + "loss": 0.6015, + "step": 21464 + }, + { + "epoch": 0.74, + "learning_rate": 3.072011481306971e-06, + "loss": 0.6376, + "step": 21465 + }, + { + "epoch": 0.74, + "learning_rate": 3.0712263083603766e-06, + "loss": 0.6313, + "step": 21466 + }, + { + "epoch": 0.74, + "learning_rate": 3.0704412175631594e-06, + "loss": 0.6563, + "step": 21467 + }, + { + "epoch": 0.74, + "learning_rate": 3.0696562089246275e-06, + "loss": 0.6479, + "step": 21468 + }, + { + "epoch": 0.74, + "learning_rate": 3.0688712824540878e-06, + "loss": 0.6432, + "step": 21469 + }, + { + "epoch": 0.74, + "learning_rate": 3.0680864381608478e-06, + "loss": 0.6625, + "step": 21470 + }, + { + "epoch": 0.74, + "learning_rate": 3.067301676054215e-06, + "loss": 0.6272, + "step": 21471 + }, + { + "epoch": 0.74, + "learning_rate": 3.066516996143487e-06, + "loss": 0.6303, + "step": 21472 + }, + { + "epoch": 0.74, + "learning_rate": 3.0657323984379704e-06, + "loss": 0.6855, + "step": 21473 + }, + { + "epoch": 0.74, + "learning_rate": 3.064947882946969e-06, + "loss": 0.5726, + "step": 21474 + }, + { + "epoch": 0.74, + "learning_rate": 3.0641634496797834e-06, + "loss": 0.6615, + "step": 21475 + }, + { + "epoch": 0.74, + "learning_rate": 3.0633790986457135e-06, + "loss": 0.6922, + "step": 21476 + }, + { + "epoch": 0.74, + "learning_rate": 3.0625948298540632e-06, + "loss": 0.6562, + "step": 21477 + }, + { + "epoch": 0.74, + "learning_rate": 3.0618106433141237e-06, + "loss": 0.6502, + "step": 21478 + }, + { + "epoch": 0.74, + "learning_rate": 3.0610265390351945e-06, + "loss": 0.5785, + "step": 21479 + }, + { + "epoch": 0.74, + "learning_rate": 3.0602425170265747e-06, + "loss": 0.5755, + "step": 21480 + }, + { + "epoch": 0.74, + "learning_rate": 3.0594585772975594e-06, + "loss": 0.616, + "step": 21481 + }, + { + "epoch": 0.74, + "learning_rate": 3.0586747198574408e-06, + "loss": 0.6377, + "step": 21482 + }, + { + "epoch": 0.74, + "learning_rate": 3.057890944715519e-06, + "loss": 0.5852, + "step": 21483 + }, + { + "epoch": 0.74, + "learning_rate": 3.0571072518810774e-06, + "loss": 0.6959, + "step": 21484 + }, + { + "epoch": 0.74, + "learning_rate": 3.0563236413634135e-06, + "loss": 0.5992, + "step": 21485 + }, + { + "epoch": 0.74, + "learning_rate": 3.0555401131718155e-06, + "loss": 0.6737, + "step": 21486 + }, + { + "epoch": 0.74, + "learning_rate": 3.0547566673155736e-06, + "loss": 0.6878, + "step": 21487 + }, + { + "epoch": 0.74, + "learning_rate": 3.053973303803979e-06, + "loss": 0.6162, + "step": 21488 + }, + { + "epoch": 0.74, + "learning_rate": 3.0531900226463194e-06, + "loss": 0.6316, + "step": 21489 + }, + { + "epoch": 0.74, + "learning_rate": 3.0524068238518776e-06, + "loss": 0.6127, + "step": 21490 + }, + { + "epoch": 0.74, + "learning_rate": 3.0516237074299415e-06, + "loss": 0.6791, + "step": 21491 + }, + { + "epoch": 0.74, + "learning_rate": 3.0508406733897954e-06, + "loss": 0.6497, + "step": 21492 + }, + { + "epoch": 0.74, + "learning_rate": 3.0500577217407245e-06, + "loss": 0.6486, + "step": 21493 + }, + { + "epoch": 0.74, + "learning_rate": 3.0492748524920148e-06, + "loss": 0.6441, + "step": 21494 + }, + { + "epoch": 0.74, + "learning_rate": 3.048492065652939e-06, + "loss": 0.6416, + "step": 21495 + }, + { + "epoch": 0.74, + "learning_rate": 3.047709361232786e-06, + "loss": 0.6215, + "step": 21496 + }, + { + "epoch": 0.74, + "learning_rate": 3.046926739240832e-06, + "loss": 0.657, + "step": 21497 + }, + { + "epoch": 0.74, + "learning_rate": 3.046144199686357e-06, + "loss": 0.6425, + "step": 21498 + }, + { + "epoch": 0.74, + "learning_rate": 3.0453617425786396e-06, + "loss": 0.6164, + "step": 21499 + }, + { + "epoch": 0.74, + "learning_rate": 3.0445793679269597e-06, + "loss": 0.6619, + "step": 21500 + }, + { + "epoch": 0.74, + "learning_rate": 3.0437970757405864e-06, + "loss": 0.6391, + "step": 21501 + }, + { + "epoch": 0.74, + "learning_rate": 3.0430148660287994e-06, + "loss": 0.617, + "step": 21502 + }, + { + "epoch": 0.75, + "learning_rate": 3.042232738800871e-06, + "loss": 0.6588, + "step": 21503 + }, + { + "epoch": 0.75, + "learning_rate": 3.041450694066075e-06, + "loss": 0.6553, + "step": 21504 + }, + { + "epoch": 0.75, + "learning_rate": 3.0406687318336834e-06, + "loss": 0.6872, + "step": 21505 + }, + { + "epoch": 0.75, + "learning_rate": 3.0398868521129722e-06, + "loss": 0.7102, + "step": 21506 + }, + { + "epoch": 0.75, + "learning_rate": 3.0391050549132016e-06, + "loss": 0.6461, + "step": 21507 + }, + { + "epoch": 0.75, + "learning_rate": 3.0383233402436475e-06, + "loss": 0.6723, + "step": 21508 + }, + { + "epoch": 0.75, + "learning_rate": 3.037541708113577e-06, + "loss": 0.6424, + "step": 21509 + }, + { + "epoch": 0.75, + "learning_rate": 3.036760158532257e-06, + "loss": 0.6104, + "step": 21510 + }, + { + "epoch": 0.75, + "learning_rate": 3.035978691508953e-06, + "loss": 0.6199, + "step": 21511 + }, + { + "epoch": 0.75, + "learning_rate": 3.035197307052935e-06, + "loss": 0.631, + "step": 21512 + }, + { + "epoch": 0.75, + "learning_rate": 3.0344160051734605e-06, + "loss": 0.5743, + "step": 21513 + }, + { + "epoch": 0.75, + "learning_rate": 3.0336347858797953e-06, + "loss": 0.684, + "step": 21514 + }, + { + "epoch": 0.75, + "learning_rate": 3.032853649181202e-06, + "loss": 0.6426, + "step": 21515 + }, + { + "epoch": 0.75, + "learning_rate": 3.0320725950869424e-06, + "loss": 0.6566, + "step": 21516 + }, + { + "epoch": 0.75, + "learning_rate": 3.0312916236062773e-06, + "loss": 0.5873, + "step": 21517 + }, + { + "epoch": 0.75, + "learning_rate": 3.0305107347484673e-06, + "loss": 0.6252, + "step": 21518 + }, + { + "epoch": 0.75, + "learning_rate": 3.0297299285227677e-06, + "loss": 0.6283, + "step": 21519 + }, + { + "epoch": 0.75, + "learning_rate": 3.028949204938436e-06, + "loss": 0.6258, + "step": 21520 + }, + { + "epoch": 0.75, + "learning_rate": 3.02816856400473e-06, + "loss": 0.6362, + "step": 21521 + }, + { + "epoch": 0.75, + "learning_rate": 3.0273880057309048e-06, + "loss": 0.6568, + "step": 21522 + }, + { + "epoch": 0.75, + "learning_rate": 3.0266075301262155e-06, + "loss": 0.5914, + "step": 21523 + }, + { + "epoch": 0.75, + "learning_rate": 3.0258271371999192e-06, + "loss": 0.6814, + "step": 21524 + }, + { + "epoch": 0.75, + "learning_rate": 3.0250468269612597e-06, + "loss": 0.629, + "step": 21525 + }, + { + "epoch": 0.75, + "learning_rate": 3.0242665994194953e-06, + "loss": 0.6155, + "step": 21526 + }, + { + "epoch": 0.75, + "learning_rate": 3.023486454583874e-06, + "loss": 0.6814, + "step": 21527 + }, + { + "epoch": 0.75, + "learning_rate": 3.0227063924636457e-06, + "loss": 0.6576, + "step": 21528 + }, + { + "epoch": 0.75, + "learning_rate": 3.0219264130680593e-06, + "loss": 0.615, + "step": 21529 + }, + { + "epoch": 0.75, + "learning_rate": 3.021146516406367e-06, + "loss": 0.5995, + "step": 21530 + }, + { + "epoch": 0.75, + "learning_rate": 3.0203667024878067e-06, + "loss": 0.6103, + "step": 21531 + }, + { + "epoch": 0.75, + "learning_rate": 3.0195869713216287e-06, + "loss": 0.612, + "step": 21532 + }, + { + "epoch": 0.75, + "learning_rate": 3.018807322917078e-06, + "loss": 0.6239, + "step": 21533 + }, + { + "epoch": 0.75, + "learning_rate": 3.018027757283396e-06, + "loss": 0.6128, + "step": 21534 + }, + { + "epoch": 0.75, + "learning_rate": 3.017248274429829e-06, + "loss": 0.5824, + "step": 21535 + }, + { + "epoch": 0.75, + "learning_rate": 3.016468874365619e-06, + "loss": 0.6339, + "step": 21536 + }, + { + "epoch": 0.75, + "learning_rate": 3.0156895571000023e-06, + "loss": 0.6466, + "step": 21537 + }, + { + "epoch": 0.75, + "learning_rate": 3.0149103226422217e-06, + "loss": 0.6318, + "step": 21538 + }, + { + "epoch": 0.75, + "learning_rate": 3.0141311710015142e-06, + "loss": 0.6454, + "step": 21539 + }, + { + "epoch": 0.75, + "learning_rate": 3.0133521021871192e-06, + "loss": 0.713, + "step": 21540 + }, + { + "epoch": 0.75, + "learning_rate": 3.0125731162082728e-06, + "loss": 0.6554, + "step": 21541 + }, + { + "epoch": 0.75, + "learning_rate": 3.011794213074215e-06, + "loss": 0.6785, + "step": 21542 + }, + { + "epoch": 0.75, + "learning_rate": 3.0110153927941734e-06, + "loss": 0.6288, + "step": 21543 + }, + { + "epoch": 0.75, + "learning_rate": 3.0102366553773854e-06, + "loss": 0.6511, + "step": 21544 + }, + { + "epoch": 0.75, + "learning_rate": 3.0094580008330843e-06, + "loss": 0.6449, + "step": 21545 + }, + { + "epoch": 0.75, + "learning_rate": 3.0086794291705013e-06, + "loss": 0.653, + "step": 21546 + }, + { + "epoch": 0.75, + "learning_rate": 3.007900940398868e-06, + "loss": 0.6052, + "step": 21547 + }, + { + "epoch": 0.75, + "learning_rate": 3.007122534527418e-06, + "loss": 0.6352, + "step": 21548 + }, + { + "epoch": 0.75, + "learning_rate": 3.006344211565372e-06, + "loss": 0.5958, + "step": 21549 + }, + { + "epoch": 0.75, + "learning_rate": 3.0055659715219633e-06, + "loss": 0.6397, + "step": 21550 + }, + { + "epoch": 0.75, + "learning_rate": 3.004787814406417e-06, + "loss": 0.6049, + "step": 21551 + }, + { + "epoch": 0.75, + "learning_rate": 3.0040097402279613e-06, + "loss": 0.6338, + "step": 21552 + }, + { + "epoch": 0.75, + "learning_rate": 3.0032317489958184e-06, + "loss": 0.6112, + "step": 21553 + }, + { + "epoch": 0.75, + "learning_rate": 3.0024538407192194e-06, + "loss": 0.6079, + "step": 21554 + }, + { + "epoch": 0.75, + "learning_rate": 3.0016760154073774e-06, + "loss": 0.6521, + "step": 21555 + }, + { + "epoch": 0.75, + "learning_rate": 3.0008982730695193e-06, + "loss": 0.6813, + "step": 21556 + }, + { + "epoch": 0.75, + "learning_rate": 3.0001206137148666e-06, + "loss": 0.6422, + "step": 21557 + }, + { + "epoch": 0.75, + "learning_rate": 2.999343037352639e-06, + "loss": 0.6094, + "step": 21558 + }, + { + "epoch": 0.75, + "learning_rate": 2.998565543992058e-06, + "loss": 0.6493, + "step": 21559 + }, + { + "epoch": 0.75, + "learning_rate": 2.9977881336423364e-06, + "loss": 0.604, + "step": 21560 + }, + { + "epoch": 0.75, + "learning_rate": 2.997010806312695e-06, + "loss": 0.6139, + "step": 21561 + }, + { + "epoch": 0.75, + "learning_rate": 2.9962335620123482e-06, + "loss": 0.6306, + "step": 21562 + }, + { + "epoch": 0.75, + "learning_rate": 2.9954564007505137e-06, + "loss": 0.6443, + "step": 21563 + }, + { + "epoch": 0.75, + "learning_rate": 2.9946793225364036e-06, + "loss": 0.6525, + "step": 21564 + }, + { + "epoch": 0.75, + "learning_rate": 2.9939023273792343e-06, + "loss": 0.6061, + "step": 21565 + }, + { + "epoch": 0.75, + "learning_rate": 2.9931254152882137e-06, + "loss": 0.623, + "step": 21566 + }, + { + "epoch": 0.75, + "learning_rate": 2.9923485862725553e-06, + "loss": 0.6417, + "step": 21567 + }, + { + "epoch": 0.75, + "learning_rate": 2.9915718403414684e-06, + "loss": 0.5821, + "step": 21568 + }, + { + "epoch": 0.75, + "learning_rate": 2.9907951775041633e-06, + "loss": 0.6571, + "step": 21569 + }, + { + "epoch": 0.75, + "learning_rate": 2.990018597769847e-06, + "loss": 0.6204, + "step": 21570 + }, + { + "epoch": 0.75, + "learning_rate": 2.9892421011477325e-06, + "loss": 0.5625, + "step": 21571 + }, + { + "epoch": 0.75, + "learning_rate": 2.9884656876470175e-06, + "loss": 0.5875, + "step": 21572 + }, + { + "epoch": 0.75, + "learning_rate": 2.9876893572769116e-06, + "loss": 0.6008, + "step": 21573 + }, + { + "epoch": 0.75, + "learning_rate": 2.98691311004662e-06, + "loss": 0.5848, + "step": 21574 + }, + { + "epoch": 0.75, + "learning_rate": 2.9861369459653433e-06, + "loss": 0.6531, + "step": 21575 + }, + { + "epoch": 0.75, + "learning_rate": 2.9853608650422873e-06, + "loss": 0.6342, + "step": 21576 + }, + { + "epoch": 0.75, + "learning_rate": 2.9845848672866538e-06, + "loss": 0.6312, + "step": 21577 + }, + { + "epoch": 0.75, + "learning_rate": 2.9838089527076384e-06, + "loss": 0.6762, + "step": 21578 + }, + { + "epoch": 0.75, + "learning_rate": 2.983033121314444e-06, + "loss": 0.6407, + "step": 21579 + }, + { + "epoch": 0.75, + "learning_rate": 2.982257373116267e-06, + "loss": 0.5472, + "step": 21580 + }, + { + "epoch": 0.75, + "learning_rate": 2.981481708122308e-06, + "loss": 0.6594, + "step": 21581 + }, + { + "epoch": 0.75, + "learning_rate": 2.9807061263417614e-06, + "loss": 0.6647, + "step": 21582 + }, + { + "epoch": 0.75, + "learning_rate": 2.979930627783826e-06, + "loss": 0.6717, + "step": 21583 + }, + { + "epoch": 0.75, + "learning_rate": 2.9791552124576904e-06, + "loss": 0.6381, + "step": 21584 + }, + { + "epoch": 0.75, + "learning_rate": 2.9783798803725518e-06, + "loss": 0.6298, + "step": 21585 + }, + { + "epoch": 0.75, + "learning_rate": 2.9776046315376004e-06, + "loss": 0.6384, + "step": 21586 + }, + { + "epoch": 0.75, + "learning_rate": 2.9768294659620313e-06, + "loss": 0.6284, + "step": 21587 + }, + { + "epoch": 0.75, + "learning_rate": 2.9760543836550313e-06, + "loss": 0.6106, + "step": 21588 + }, + { + "epoch": 0.75, + "learning_rate": 2.9752793846257967e-06, + "loss": 0.6097, + "step": 21589 + }, + { + "epoch": 0.75, + "learning_rate": 2.974504468883508e-06, + "loss": 0.6164, + "step": 21590 + }, + { + "epoch": 0.75, + "learning_rate": 2.9737296364373557e-06, + "loss": 0.5859, + "step": 21591 + }, + { + "epoch": 0.75, + "learning_rate": 2.9729548872965264e-06, + "loss": 0.6187, + "step": 21592 + }, + { + "epoch": 0.75, + "learning_rate": 2.972180221470207e-06, + "loss": 0.6544, + "step": 21593 + }, + { + "epoch": 0.75, + "learning_rate": 2.9714056389675818e-06, + "loss": 0.6673, + "step": 21594 + }, + { + "epoch": 0.75, + "learning_rate": 2.970631139797836e-06, + "loss": 0.5674, + "step": 21595 + }, + { + "epoch": 0.75, + "learning_rate": 2.969856723970147e-06, + "loss": 0.6384, + "step": 21596 + }, + { + "epoch": 0.75, + "learning_rate": 2.9690823914937006e-06, + "loss": 0.5961, + "step": 21597 + }, + { + "epoch": 0.75, + "learning_rate": 2.968308142377676e-06, + "loss": 0.5907, + "step": 21598 + }, + { + "epoch": 0.75, + "learning_rate": 2.967533976631253e-06, + "loss": 0.7038, + "step": 21599 + }, + { + "epoch": 0.75, + "learning_rate": 2.966759894263612e-06, + "loss": 0.6215, + "step": 21600 + }, + { + "epoch": 0.75, + "learning_rate": 2.9659858952839316e-06, + "loss": 0.6525, + "step": 21601 + }, + { + "epoch": 0.75, + "learning_rate": 2.9652119797013847e-06, + "loss": 0.5964, + "step": 21602 + }, + { + "epoch": 0.75, + "learning_rate": 2.9644381475251472e-06, + "loss": 0.6213, + "step": 21603 + }, + { + "epoch": 0.75, + "learning_rate": 2.9636643987643963e-06, + "loss": 0.5474, + "step": 21604 + }, + { + "epoch": 0.75, + "learning_rate": 2.9628907334283054e-06, + "loss": 0.5759, + "step": 21605 + }, + { + "epoch": 0.75, + "learning_rate": 2.962117151526046e-06, + "loss": 0.6507, + "step": 21606 + }, + { + "epoch": 0.75, + "learning_rate": 2.961343653066795e-06, + "loss": 0.6395, + "step": 21607 + }, + { + "epoch": 0.75, + "learning_rate": 2.9605702380597145e-06, + "loss": 0.5989, + "step": 21608 + }, + { + "epoch": 0.75, + "learning_rate": 2.9597969065139796e-06, + "loss": 0.6226, + "step": 21609 + }, + { + "epoch": 0.75, + "learning_rate": 2.9590236584387576e-06, + "loss": 0.5785, + "step": 21610 + }, + { + "epoch": 0.75, + "learning_rate": 2.958250493843218e-06, + "loss": 0.6317, + "step": 21611 + }, + { + "epoch": 0.75, + "learning_rate": 2.957477412736526e-06, + "loss": 0.6644, + "step": 21612 + }, + { + "epoch": 0.75, + "learning_rate": 2.956704415127851e-06, + "loss": 0.6165, + "step": 21613 + }, + { + "epoch": 0.75, + "learning_rate": 2.9559315010263522e-06, + "loss": 0.6302, + "step": 21614 + }, + { + "epoch": 0.75, + "learning_rate": 2.955158670441196e-06, + "loss": 0.6018, + "step": 21615 + }, + { + "epoch": 0.75, + "learning_rate": 2.9543859233815463e-06, + "loss": 0.6527, + "step": 21616 + }, + { + "epoch": 0.75, + "learning_rate": 2.9536132598565637e-06, + "loss": 0.6219, + "step": 21617 + }, + { + "epoch": 0.75, + "learning_rate": 2.952840679875413e-06, + "loss": 0.657, + "step": 21618 + }, + { + "epoch": 0.75, + "learning_rate": 2.9520681834472478e-06, + "loss": 0.5633, + "step": 21619 + }, + { + "epoch": 0.75, + "learning_rate": 2.951295770581228e-06, + "loss": 0.67, + "step": 21620 + }, + { + "epoch": 0.75, + "learning_rate": 2.9505234412865192e-06, + "loss": 0.6471, + "step": 21621 + }, + { + "epoch": 0.75, + "learning_rate": 2.9497511955722646e-06, + "loss": 0.6659, + "step": 21622 + }, + { + "epoch": 0.75, + "learning_rate": 2.948979033447632e-06, + "loss": 0.6429, + "step": 21623 + }, + { + "epoch": 0.75, + "learning_rate": 2.9482069549217764e-06, + "loss": 0.6138, + "step": 21624 + }, + { + "epoch": 0.75, + "learning_rate": 2.9474349600038444e-06, + "loss": 0.65, + "step": 21625 + }, + { + "epoch": 0.75, + "learning_rate": 2.946663048702991e-06, + "loss": 0.6164, + "step": 21626 + }, + { + "epoch": 0.75, + "learning_rate": 2.945891221028375e-06, + "loss": 0.6456, + "step": 21627 + }, + { + "epoch": 0.75, + "learning_rate": 2.9451194769891345e-06, + "loss": 0.6415, + "step": 21628 + }, + { + "epoch": 0.75, + "learning_rate": 2.9443478165944305e-06, + "loss": 0.6965, + "step": 21629 + }, + { + "epoch": 0.75, + "learning_rate": 2.943576239853412e-06, + "loss": 0.5243, + "step": 21630 + }, + { + "epoch": 0.75, + "learning_rate": 2.9428047467752195e-06, + "loss": 0.6466, + "step": 21631 + }, + { + "epoch": 0.75, + "learning_rate": 2.9420333373690057e-06, + "loss": 0.6715, + "step": 21632 + }, + { + "epoch": 0.75, + "learning_rate": 2.941262011643917e-06, + "loss": 0.6415, + "step": 21633 + }, + { + "epoch": 0.75, + "learning_rate": 2.94049076960909e-06, + "loss": 0.6217, + "step": 21634 + }, + { + "epoch": 0.75, + "learning_rate": 2.9397196112736794e-06, + "loss": 0.6909, + "step": 21635 + }, + { + "epoch": 0.75, + "learning_rate": 2.9389485366468264e-06, + "loss": 0.573, + "step": 21636 + }, + { + "epoch": 0.75, + "learning_rate": 2.938177545737668e-06, + "loss": 0.6477, + "step": 21637 + }, + { + "epoch": 0.75, + "learning_rate": 2.937406638555348e-06, + "loss": 0.6573, + "step": 21638 + }, + { + "epoch": 0.75, + "learning_rate": 2.93663581510901e-06, + "loss": 0.6117, + "step": 21639 + }, + { + "epoch": 0.75, + "learning_rate": 2.9358650754077834e-06, + "loss": 0.6328, + "step": 21640 + }, + { + "epoch": 0.75, + "learning_rate": 2.9350944194608154e-06, + "loss": 0.6438, + "step": 21641 + }, + { + "epoch": 0.75, + "learning_rate": 2.934323847277243e-06, + "loss": 0.5984, + "step": 21642 + }, + { + "epoch": 0.75, + "learning_rate": 2.933553358866197e-06, + "loss": 0.6339, + "step": 21643 + }, + { + "epoch": 0.75, + "learning_rate": 2.9327829542368146e-06, + "loss": 0.619, + "step": 21644 + }, + { + "epoch": 0.75, + "learning_rate": 2.9320126333982334e-06, + "loss": 0.5829, + "step": 21645 + }, + { + "epoch": 0.75, + "learning_rate": 2.931242396359577e-06, + "loss": 0.6154, + "step": 21646 + }, + { + "epoch": 0.75, + "learning_rate": 2.930472243129988e-06, + "loss": 0.6723, + "step": 21647 + }, + { + "epoch": 0.75, + "learning_rate": 2.929702173718596e-06, + "loss": 0.6651, + "step": 21648 + }, + { + "epoch": 0.75, + "learning_rate": 2.9289321881345257e-06, + "loss": 0.6364, + "step": 21649 + }, + { + "epoch": 0.75, + "learning_rate": 2.92816228638691e-06, + "loss": 0.6707, + "step": 21650 + }, + { + "epoch": 0.75, + "learning_rate": 2.9273924684848776e-06, + "loss": 0.5969, + "step": 21651 + }, + { + "epoch": 0.75, + "learning_rate": 2.9266227344375532e-06, + "loss": 0.6419, + "step": 21652 + }, + { + "epoch": 0.75, + "learning_rate": 2.92585308425406e-06, + "loss": 0.6218, + "step": 21653 + }, + { + "epoch": 0.75, + "learning_rate": 2.9250835179435333e-06, + "loss": 0.5953, + "step": 21654 + }, + { + "epoch": 0.75, + "learning_rate": 2.924314035515089e-06, + "loss": 0.6907, + "step": 21655 + }, + { + "epoch": 0.75, + "learning_rate": 2.923544636977853e-06, + "loss": 0.6209, + "step": 21656 + }, + { + "epoch": 0.75, + "learning_rate": 2.9227753223409492e-06, + "loss": 0.6355, + "step": 21657 + }, + { + "epoch": 0.75, + "learning_rate": 2.922006091613494e-06, + "loss": 0.6203, + "step": 21658 + }, + { + "epoch": 0.75, + "learning_rate": 2.9212369448046075e-06, + "loss": 0.6055, + "step": 21659 + }, + { + "epoch": 0.75, + "learning_rate": 2.9204678819234168e-06, + "loss": 0.6003, + "step": 21660 + }, + { + "epoch": 0.75, + "learning_rate": 2.9196989029790322e-06, + "loss": 0.596, + "step": 21661 + }, + { + "epoch": 0.75, + "learning_rate": 2.9189300079805747e-06, + "loss": 0.6291, + "step": 21662 + }, + { + "epoch": 0.75, + "learning_rate": 2.9181611969371625e-06, + "loss": 0.6445, + "step": 21663 + }, + { + "epoch": 0.75, + "learning_rate": 2.9173924698579037e-06, + "loss": 0.6505, + "step": 21664 + }, + { + "epoch": 0.75, + "learning_rate": 2.916623826751914e-06, + "loss": 0.6061, + "step": 21665 + }, + { + "epoch": 0.75, + "learning_rate": 2.915855267628317e-06, + "loss": 0.6502, + "step": 21666 + }, + { + "epoch": 0.75, + "learning_rate": 2.9150867924962124e-06, + "loss": 0.6534, + "step": 21667 + }, + { + "epoch": 0.75, + "learning_rate": 2.9143184013647175e-06, + "loss": 0.6793, + "step": 21668 + }, + { + "epoch": 0.75, + "learning_rate": 2.913550094242944e-06, + "loss": 0.6386, + "step": 21669 + }, + { + "epoch": 0.75, + "learning_rate": 2.9127818711399945e-06, + "loss": 0.676, + "step": 21670 + }, + { + "epoch": 0.75, + "learning_rate": 2.9120137320649798e-06, + "loss": 0.6212, + "step": 21671 + }, + { + "epoch": 0.75, + "learning_rate": 2.9112456770270137e-06, + "loss": 0.6599, + "step": 21672 + }, + { + "epoch": 0.75, + "learning_rate": 2.9104777060351952e-06, + "loss": 0.6527, + "step": 21673 + }, + { + "epoch": 0.75, + "learning_rate": 2.9097098190986306e-06, + "loss": 0.6216, + "step": 21674 + }, + { + "epoch": 0.75, + "learning_rate": 2.9089420162264294e-06, + "loss": 0.5934, + "step": 21675 + }, + { + "epoch": 0.75, + "learning_rate": 2.9081742974276883e-06, + "loss": 0.615, + "step": 21676 + }, + { + "epoch": 0.75, + "learning_rate": 2.9074066627115082e-06, + "loss": 0.6296, + "step": 21677 + }, + { + "epoch": 0.75, + "learning_rate": 2.906639112087e-06, + "loss": 0.6643, + "step": 21678 + }, + { + "epoch": 0.75, + "learning_rate": 2.905871645563256e-06, + "loss": 0.6249, + "step": 21679 + }, + { + "epoch": 0.75, + "learning_rate": 2.9051042631493775e-06, + "loss": 0.6658, + "step": 21680 + }, + { + "epoch": 0.75, + "learning_rate": 2.9043369648544662e-06, + "loss": 0.6026, + "step": 21681 + }, + { + "epoch": 0.75, + "learning_rate": 2.9035697506876127e-06, + "loss": 0.5855, + "step": 21682 + }, + { + "epoch": 0.75, + "learning_rate": 2.9028026206579173e-06, + "loss": 0.6425, + "step": 21683 + }, + { + "epoch": 0.75, + "learning_rate": 2.9020355747744744e-06, + "loss": 0.659, + "step": 21684 + }, + { + "epoch": 0.75, + "learning_rate": 2.9012686130463797e-06, + "loss": 0.6088, + "step": 21685 + }, + { + "epoch": 0.75, + "learning_rate": 2.900501735482728e-06, + "loss": 0.6608, + "step": 21686 + }, + { + "epoch": 0.75, + "learning_rate": 2.8997349420926055e-06, + "loss": 0.607, + "step": 21687 + }, + { + "epoch": 0.75, + "learning_rate": 2.8989682328851076e-06, + "loss": 0.6222, + "step": 21688 + }, + { + "epoch": 0.75, + "learning_rate": 2.8982016078693252e-06, + "loss": 0.6254, + "step": 21689 + }, + { + "epoch": 0.75, + "learning_rate": 2.897435067054345e-06, + "loss": 0.6, + "step": 21690 + }, + { + "epoch": 0.75, + "learning_rate": 2.8966686104492582e-06, + "loss": 0.7115, + "step": 21691 + }, + { + "epoch": 0.75, + "learning_rate": 2.895902238063153e-06, + "loss": 0.6327, + "step": 21692 + }, + { + "epoch": 0.75, + "learning_rate": 2.89513594990511e-06, + "loss": 0.6274, + "step": 21693 + }, + { + "epoch": 0.75, + "learning_rate": 2.894369745984219e-06, + "loss": 0.6288, + "step": 21694 + }, + { + "epoch": 0.75, + "learning_rate": 2.8936036263095625e-06, + "loss": 0.687, + "step": 21695 + }, + { + "epoch": 0.75, + "learning_rate": 2.892837590890225e-06, + "loss": 0.6305, + "step": 21696 + }, + { + "epoch": 0.75, + "learning_rate": 2.892071639735289e-06, + "loss": 0.6133, + "step": 21697 + }, + { + "epoch": 0.75, + "learning_rate": 2.8913057728538375e-06, + "loss": 0.6453, + "step": 21698 + }, + { + "epoch": 0.75, + "learning_rate": 2.8905399902549456e-06, + "loss": 0.6037, + "step": 21699 + }, + { + "epoch": 0.75, + "learning_rate": 2.8897742919476967e-06, + "loss": 0.6231, + "step": 21700 + }, + { + "epoch": 0.75, + "learning_rate": 2.8890086779411673e-06, + "loss": 0.6486, + "step": 21701 + }, + { + "epoch": 0.75, + "learning_rate": 2.888243148244435e-06, + "loss": 0.5596, + "step": 21702 + }, + { + "epoch": 0.75, + "learning_rate": 2.887477702866578e-06, + "loss": 0.6179, + "step": 21703 + }, + { + "epoch": 0.75, + "learning_rate": 2.886712341816672e-06, + "loss": 0.6638, + "step": 21704 + }, + { + "epoch": 0.75, + "learning_rate": 2.8859470651037867e-06, + "loss": 0.6654, + "step": 21705 + }, + { + "epoch": 0.75, + "learning_rate": 2.8851818727369985e-06, + "loss": 0.5784, + "step": 21706 + }, + { + "epoch": 0.75, + "learning_rate": 2.8844167647253796e-06, + "loss": 0.6409, + "step": 21707 + }, + { + "epoch": 0.75, + "learning_rate": 2.883651741078001e-06, + "loss": 0.6064, + "step": 21708 + }, + { + "epoch": 0.75, + "learning_rate": 2.8828868018039324e-06, + "loss": 0.6331, + "step": 21709 + }, + { + "epoch": 0.75, + "learning_rate": 2.8821219469122487e-06, + "loss": 0.6497, + "step": 21710 + }, + { + "epoch": 0.75, + "learning_rate": 2.8813571764120097e-06, + "loss": 0.6652, + "step": 21711 + }, + { + "epoch": 0.75, + "learning_rate": 2.8805924903122863e-06, + "loss": 0.5814, + "step": 21712 + }, + { + "epoch": 0.75, + "learning_rate": 2.8798278886221443e-06, + "loss": 0.6608, + "step": 21713 + }, + { + "epoch": 0.75, + "learning_rate": 2.879063371350651e-06, + "loss": 0.5875, + "step": 21714 + }, + { + "epoch": 0.75, + "learning_rate": 2.8782989385068694e-06, + "loss": 0.6278, + "step": 21715 + }, + { + "epoch": 0.75, + "learning_rate": 2.877534590099865e-06, + "loss": 0.6362, + "step": 21716 + }, + { + "epoch": 0.75, + "learning_rate": 2.876770326138696e-06, + "loss": 0.6604, + "step": 21717 + }, + { + "epoch": 0.75, + "learning_rate": 2.876006146632425e-06, + "loss": 0.5884, + "step": 21718 + }, + { + "epoch": 0.75, + "learning_rate": 2.8752420515901137e-06, + "loss": 0.5885, + "step": 21719 + }, + { + "epoch": 0.75, + "learning_rate": 2.8744780410208197e-06, + "loss": 0.6667, + "step": 21720 + }, + { + "epoch": 0.75, + "learning_rate": 2.8737141149336034e-06, + "loss": 0.6795, + "step": 21721 + }, + { + "epoch": 0.75, + "learning_rate": 2.8729502733375238e-06, + "loss": 0.5846, + "step": 21722 + }, + { + "epoch": 0.75, + "learning_rate": 2.8721865162416306e-06, + "loss": 0.6766, + "step": 21723 + }, + { + "epoch": 0.75, + "learning_rate": 2.871422843654984e-06, + "loss": 0.5824, + "step": 21724 + }, + { + "epoch": 0.75, + "learning_rate": 2.8706592555866364e-06, + "loss": 0.6443, + "step": 21725 + }, + { + "epoch": 0.75, + "learning_rate": 2.869895752045643e-06, + "loss": 0.6247, + "step": 21726 + }, + { + "epoch": 0.75, + "learning_rate": 2.869132333041055e-06, + "loss": 0.5822, + "step": 21727 + }, + { + "epoch": 0.75, + "learning_rate": 2.8683689985819264e-06, + "loss": 0.6178, + "step": 21728 + }, + { + "epoch": 0.75, + "learning_rate": 2.867605748677301e-06, + "loss": 0.6174, + "step": 21729 + }, + { + "epoch": 0.75, + "learning_rate": 2.8668425833362333e-06, + "loss": 0.5799, + "step": 21730 + }, + { + "epoch": 0.75, + "learning_rate": 2.86607950256777e-06, + "loss": 0.5896, + "step": 21731 + }, + { + "epoch": 0.75, + "learning_rate": 2.8653165063809584e-06, + "loss": 0.6074, + "step": 21732 + }, + { + "epoch": 0.75, + "learning_rate": 2.8645535947848456e-06, + "loss": 0.5738, + "step": 21733 + }, + { + "epoch": 0.75, + "learning_rate": 2.863790767788479e-06, + "loss": 0.6327, + "step": 21734 + }, + { + "epoch": 0.75, + "learning_rate": 2.8630280254008967e-06, + "loss": 0.6528, + "step": 21735 + }, + { + "epoch": 0.75, + "learning_rate": 2.8622653676311462e-06, + "loss": 0.6653, + "step": 21736 + }, + { + "epoch": 0.75, + "learning_rate": 2.8615027944882677e-06, + "loss": 0.6064, + "step": 21737 + }, + { + "epoch": 0.75, + "learning_rate": 2.8607403059813054e-06, + "loss": 0.5981, + "step": 21738 + }, + { + "epoch": 0.75, + "learning_rate": 2.8599779021192976e-06, + "loss": 0.6351, + "step": 21739 + }, + { + "epoch": 0.75, + "learning_rate": 2.859215582911287e-06, + "loss": 0.6694, + "step": 21740 + }, + { + "epoch": 0.75, + "learning_rate": 2.8584533483663045e-06, + "loss": 0.6764, + "step": 21741 + }, + { + "epoch": 0.75, + "learning_rate": 2.857691198493393e-06, + "loss": 0.6178, + "step": 21742 + }, + { + "epoch": 0.75, + "learning_rate": 2.8569291333015867e-06, + "loss": 0.6044, + "step": 21743 + }, + { + "epoch": 0.75, + "learning_rate": 2.8561671527999224e-06, + "loss": 0.6293, + "step": 21744 + }, + { + "epoch": 0.75, + "learning_rate": 2.8554052569974366e-06, + "loss": 0.6464, + "step": 21745 + }, + { + "epoch": 0.75, + "learning_rate": 2.8546434459031558e-06, + "loss": 0.6621, + "step": 21746 + }, + { + "epoch": 0.75, + "learning_rate": 2.853881719526116e-06, + "loss": 0.6717, + "step": 21747 + }, + { + "epoch": 0.75, + "learning_rate": 2.8531200778753477e-06, + "loss": 0.6461, + "step": 21748 + }, + { + "epoch": 0.75, + "learning_rate": 2.8523585209598826e-06, + "loss": 0.6223, + "step": 21749 + }, + { + "epoch": 0.75, + "learning_rate": 2.851597048788749e-06, + "loss": 0.6243, + "step": 21750 + }, + { + "epoch": 0.75, + "learning_rate": 2.8508356613709775e-06, + "loss": 0.6704, + "step": 21751 + }, + { + "epoch": 0.75, + "learning_rate": 2.850074358715591e-06, + "loss": 0.642, + "step": 21752 + }, + { + "epoch": 0.75, + "learning_rate": 2.8493131408316167e-06, + "loss": 0.6165, + "step": 21753 + }, + { + "epoch": 0.75, + "learning_rate": 2.8485520077280814e-06, + "loss": 0.6106, + "step": 21754 + }, + { + "epoch": 0.75, + "learning_rate": 2.8477909594140085e-06, + "loss": 0.691, + "step": 21755 + }, + { + "epoch": 0.75, + "learning_rate": 2.8470299958984204e-06, + "loss": 0.5842, + "step": 21756 + }, + { + "epoch": 0.75, + "learning_rate": 2.8462691171903447e-06, + "loss": 0.589, + "step": 21757 + }, + { + "epoch": 0.75, + "learning_rate": 2.8455083232987946e-06, + "loss": 0.6351, + "step": 21758 + }, + { + "epoch": 0.75, + "learning_rate": 2.8447476142327936e-06, + "loss": 0.5665, + "step": 21759 + }, + { + "epoch": 0.75, + "learning_rate": 2.843986990001362e-06, + "loss": 0.6417, + "step": 21760 + }, + { + "epoch": 0.75, + "learning_rate": 2.8432264506135155e-06, + "loss": 0.6096, + "step": 21761 + }, + { + "epoch": 0.75, + "learning_rate": 2.842465996078274e-06, + "loss": 0.6256, + "step": 21762 + }, + { + "epoch": 0.75, + "learning_rate": 2.841705626404655e-06, + "loss": 0.6509, + "step": 21763 + }, + { + "epoch": 0.75, + "learning_rate": 2.8409453416016685e-06, + "loss": 0.6203, + "step": 21764 + }, + { + "epoch": 0.75, + "learning_rate": 2.84018514167833e-06, + "loss": 0.6444, + "step": 21765 + }, + { + "epoch": 0.75, + "learning_rate": 2.839425026643655e-06, + "loss": 0.6724, + "step": 21766 + }, + { + "epoch": 0.75, + "learning_rate": 2.8386649965066537e-06, + "loss": 0.6237, + "step": 21767 + }, + { + "epoch": 0.75, + "learning_rate": 2.8379050512763396e-06, + "loss": 0.6642, + "step": 21768 + }, + { + "epoch": 0.75, + "learning_rate": 2.837145190961723e-06, + "loss": 0.6364, + "step": 21769 + }, + { + "epoch": 0.75, + "learning_rate": 2.8363854155718084e-06, + "loss": 0.6744, + "step": 21770 + }, + { + "epoch": 0.75, + "learning_rate": 2.835625725115606e-06, + "loss": 0.6466, + "step": 21771 + }, + { + "epoch": 0.75, + "learning_rate": 2.834866119602124e-06, + "loss": 0.6176, + "step": 21772 + }, + { + "epoch": 0.75, + "learning_rate": 2.8341065990403683e-06, + "loss": 0.6584, + "step": 21773 + }, + { + "epoch": 0.75, + "learning_rate": 2.833347163439344e-06, + "loss": 0.6527, + "step": 21774 + }, + { + "epoch": 0.75, + "learning_rate": 2.8325878128080585e-06, + "loss": 0.6153, + "step": 21775 + }, + { + "epoch": 0.75, + "learning_rate": 2.8318285471555072e-06, + "loss": 0.6685, + "step": 21776 + }, + { + "epoch": 0.75, + "learning_rate": 2.8310693664906963e-06, + "loss": 0.6452, + "step": 21777 + }, + { + "epoch": 0.75, + "learning_rate": 2.830310270822627e-06, + "loss": 0.633, + "step": 21778 + }, + { + "epoch": 0.75, + "learning_rate": 2.829551260160299e-06, + "loss": 0.6347, + "step": 21779 + }, + { + "epoch": 0.75, + "learning_rate": 2.8287923345127123e-06, + "loss": 0.6345, + "step": 21780 + }, + { + "epoch": 0.75, + "learning_rate": 2.8280334938888663e-06, + "loss": 0.6147, + "step": 21781 + }, + { + "epoch": 0.75, + "learning_rate": 2.8272747382977538e-06, + "loss": 0.6099, + "step": 21782 + }, + { + "epoch": 0.75, + "learning_rate": 2.8265160677483717e-06, + "loss": 0.6156, + "step": 21783 + }, + { + "epoch": 0.75, + "learning_rate": 2.825757482249717e-06, + "loss": 0.6276, + "step": 21784 + }, + { + "epoch": 0.75, + "learning_rate": 2.8249989818107813e-06, + "loss": 0.5926, + "step": 21785 + }, + { + "epoch": 0.75, + "learning_rate": 2.8242405664405604e-06, + "loss": 0.5767, + "step": 21786 + }, + { + "epoch": 0.75, + "learning_rate": 2.8234822361480475e-06, + "loss": 0.5937, + "step": 21787 + }, + { + "epoch": 0.75, + "learning_rate": 2.822723990942229e-06, + "loss": 0.6468, + "step": 21788 + }, + { + "epoch": 0.75, + "learning_rate": 2.8219658308320953e-06, + "loss": 0.672, + "step": 21789 + }, + { + "epoch": 0.75, + "learning_rate": 2.821207755826638e-06, + "loss": 0.6337, + "step": 21790 + }, + { + "epoch": 0.76, + "learning_rate": 2.820449765934844e-06, + "loss": 0.5829, + "step": 21791 + }, + { + "epoch": 0.76, + "learning_rate": 2.8196918611657e-06, + "loss": 0.6148, + "step": 21792 + }, + { + "epoch": 0.76, + "learning_rate": 2.8189340415281953e-06, + "loss": 0.6452, + "step": 21793 + }, + { + "epoch": 0.76, + "learning_rate": 2.8181763070313073e-06, + "loss": 0.617, + "step": 21794 + }, + { + "epoch": 0.76, + "learning_rate": 2.817418657684026e-06, + "loss": 0.6501, + "step": 21795 + }, + { + "epoch": 0.76, + "learning_rate": 2.816661093495332e-06, + "loss": 0.6343, + "step": 21796 + }, + { + "epoch": 0.76, + "learning_rate": 2.815903614474207e-06, + "loss": 0.6334, + "step": 21797 + }, + { + "epoch": 0.76, + "learning_rate": 2.8151462206296334e-06, + "loss": 0.6542, + "step": 21798 + }, + { + "epoch": 0.76, + "learning_rate": 2.8143889119705924e-06, + "loss": 0.6976, + "step": 21799 + }, + { + "epoch": 0.76, + "learning_rate": 2.8136316885060588e-06, + "loss": 0.652, + "step": 21800 + }, + { + "epoch": 0.76, + "learning_rate": 2.8128745502450115e-06, + "loss": 0.6494, + "step": 21801 + }, + { + "epoch": 0.76, + "learning_rate": 2.812117497196428e-06, + "loss": 0.6299, + "step": 21802 + }, + { + "epoch": 0.76, + "learning_rate": 2.8113605293692858e-06, + "loss": 0.6708, + "step": 21803 + }, + { + "epoch": 0.76, + "learning_rate": 2.810603646772556e-06, + "loss": 0.66, + "step": 21804 + }, + { + "epoch": 0.76, + "learning_rate": 2.80984684941522e-06, + "loss": 0.6728, + "step": 21805 + }, + { + "epoch": 0.76, + "learning_rate": 2.8090901373062406e-06, + "loss": 0.6219, + "step": 21806 + }, + { + "epoch": 0.76, + "learning_rate": 2.8083335104545938e-06, + "loss": 0.6653, + "step": 21807 + }, + { + "epoch": 0.76, + "learning_rate": 2.8075769688692522e-06, + "loss": 0.6043, + "step": 21808 + }, + { + "epoch": 0.76, + "learning_rate": 2.806820512559183e-06, + "loss": 0.6141, + "step": 21809 + }, + { + "epoch": 0.76, + "learning_rate": 2.806064141533359e-06, + "loss": 0.6045, + "step": 21810 + }, + { + "epoch": 0.76, + "learning_rate": 2.805307855800743e-06, + "loss": 0.6559, + "step": 21811 + }, + { + "epoch": 0.76, + "learning_rate": 2.8045516553703023e-06, + "loss": 0.6919, + "step": 21812 + }, + { + "epoch": 0.76, + "learning_rate": 2.803795540251005e-06, + "loss": 0.6509, + "step": 21813 + }, + { + "epoch": 0.76, + "learning_rate": 2.803039510451815e-06, + "loss": 0.6541, + "step": 21814 + }, + { + "epoch": 0.76, + "learning_rate": 2.802283565981695e-06, + "loss": 0.6359, + "step": 21815 + }, + { + "epoch": 0.76, + "learning_rate": 2.8015277068496127e-06, + "loss": 0.6435, + "step": 21816 + }, + { + "epoch": 0.76, + "learning_rate": 2.800771933064521e-06, + "loss": 0.6411, + "step": 21817 + }, + { + "epoch": 0.76, + "learning_rate": 2.8000162446353864e-06, + "loss": 0.6492, + "step": 21818 + }, + { + "epoch": 0.76, + "learning_rate": 2.7992606415711665e-06, + "loss": 0.6507, + "step": 21819 + }, + { + "epoch": 0.76, + "learning_rate": 2.7985051238808203e-06, + "loss": 0.6171, + "step": 21820 + }, + { + "epoch": 0.76, + "learning_rate": 2.797749691573307e-06, + "loss": 0.6656, + "step": 21821 + }, + { + "epoch": 0.76, + "learning_rate": 2.796994344657584e-06, + "loss": 0.6145, + "step": 21822 + }, + { + "epoch": 0.76, + "learning_rate": 2.7962390831426022e-06, + "loss": 0.663, + "step": 21823 + }, + { + "epoch": 0.76, + "learning_rate": 2.7954839070373185e-06, + "loss": 0.6629, + "step": 21824 + }, + { + "epoch": 0.76, + "learning_rate": 2.794728816350688e-06, + "loss": 0.6206, + "step": 21825 + }, + { + "epoch": 0.76, + "learning_rate": 2.7939738110916615e-06, + "loss": 0.6006, + "step": 21826 + }, + { + "epoch": 0.76, + "learning_rate": 2.7932188912691903e-06, + "loss": 0.6461, + "step": 21827 + }, + { + "epoch": 0.76, + "learning_rate": 2.79246405689223e-06, + "loss": 0.6545, + "step": 21828 + }, + { + "epoch": 0.76, + "learning_rate": 2.791709307969722e-06, + "loss": 0.6304, + "step": 21829 + }, + { + "epoch": 0.76, + "learning_rate": 2.7909546445106197e-06, + "loss": 0.6642, + "step": 21830 + }, + { + "epoch": 0.76, + "learning_rate": 2.7902000665238683e-06, + "loss": 0.6232, + "step": 21831 + }, + { + "epoch": 0.76, + "learning_rate": 2.789445574018417e-06, + "loss": 0.6203, + "step": 21832 + }, + { + "epoch": 0.76, + "learning_rate": 2.788691167003208e-06, + "loss": 0.6184, + "step": 21833 + }, + { + "epoch": 0.76, + "learning_rate": 2.7879368454871923e-06, + "loss": 0.6186, + "step": 21834 + }, + { + "epoch": 0.76, + "learning_rate": 2.7871826094793043e-06, + "loss": 0.6339, + "step": 21835 + }, + { + "epoch": 0.76, + "learning_rate": 2.7864284589884915e-06, + "loss": 0.6058, + "step": 21836 + }, + { + "epoch": 0.76, + "learning_rate": 2.785674394023694e-06, + "loss": 0.6936, + "step": 21837 + }, + { + "epoch": 0.76, + "learning_rate": 2.7849204145938535e-06, + "loss": 0.6009, + "step": 21838 + }, + { + "epoch": 0.76, + "learning_rate": 2.7841665207079083e-06, + "loss": 0.6942, + "step": 21839 + }, + { + "epoch": 0.76, + "learning_rate": 2.7834127123748e-06, + "loss": 0.7107, + "step": 21840 + }, + { + "epoch": 0.76, + "learning_rate": 2.7826589896034596e-06, + "loss": 0.6422, + "step": 21841 + }, + { + "epoch": 0.76, + "learning_rate": 2.781905352402827e-06, + "loss": 0.6029, + "step": 21842 + }, + { + "epoch": 0.76, + "learning_rate": 2.7811518007818404e-06, + "loss": 0.6356, + "step": 21843 + }, + { + "epoch": 0.76, + "learning_rate": 2.7803983347494257e-06, + "loss": 0.681, + "step": 21844 + }, + { + "epoch": 0.76, + "learning_rate": 2.7796449543145243e-06, + "loss": 0.6051, + "step": 21845 + }, + { + "epoch": 0.76, + "learning_rate": 2.7788916594860683e-06, + "loss": 0.5988, + "step": 21846 + }, + { + "epoch": 0.76, + "learning_rate": 2.778138450272985e-06, + "loss": 0.6821, + "step": 21847 + }, + { + "epoch": 0.76, + "learning_rate": 2.777385326684204e-06, + "loss": 0.6067, + "step": 21848 + }, + { + "epoch": 0.76, + "learning_rate": 2.77663228872866e-06, + "loss": 0.6236, + "step": 21849 + }, + { + "epoch": 0.76, + "learning_rate": 2.7758793364152727e-06, + "loss": 0.6785, + "step": 21850 + }, + { + "epoch": 0.76, + "learning_rate": 2.775126469752977e-06, + "loss": 0.6, + "step": 21851 + }, + { + "epoch": 0.76, + "learning_rate": 2.7743736887507e-06, + "loss": 0.5859, + "step": 21852 + }, + { + "epoch": 0.76, + "learning_rate": 2.7736209934173596e-06, + "loss": 0.6619, + "step": 21853 + }, + { + "epoch": 0.76, + "learning_rate": 2.772868383761884e-06, + "loss": 0.6338, + "step": 21854 + }, + { + "epoch": 0.76, + "learning_rate": 2.7721158597931995e-06, + "loss": 0.6282, + "step": 21855 + }, + { + "epoch": 0.76, + "learning_rate": 2.771363421520218e-06, + "loss": 0.7323, + "step": 21856 + }, + { + "epoch": 0.76, + "learning_rate": 2.7706110689518708e-06, + "loss": 0.6579, + "step": 21857 + }, + { + "epoch": 0.76, + "learning_rate": 2.7698588020970774e-06, + "loss": 0.6361, + "step": 21858 + }, + { + "epoch": 0.76, + "learning_rate": 2.769106620964752e-06, + "loss": 0.6299, + "step": 21859 + }, + { + "epoch": 0.76, + "learning_rate": 2.7683545255638132e-06, + "loss": 0.5851, + "step": 21860 + }, + { + "epoch": 0.76, + "learning_rate": 2.767602515903184e-06, + "loss": 0.663, + "step": 21861 + }, + { + "epoch": 0.76, + "learning_rate": 2.76685059199177e-06, + "loss": 0.6417, + "step": 21862 + }, + { + "epoch": 0.76, + "learning_rate": 2.766098753838494e-06, + "loss": 0.7414, + "step": 21863 + }, + { + "epoch": 0.76, + "learning_rate": 2.765347001452272e-06, + "loss": 0.5826, + "step": 21864 + }, + { + "epoch": 0.76, + "learning_rate": 2.7645953348420096e-06, + "loss": 0.6283, + "step": 21865 + }, + { + "epoch": 0.76, + "learning_rate": 2.763843754016623e-06, + "loss": 0.6971, + "step": 21866 + }, + { + "epoch": 0.76, + "learning_rate": 2.763092258985025e-06, + "loss": 0.6459, + "step": 21867 + }, + { + "epoch": 0.76, + "learning_rate": 2.7623408497561176e-06, + "loss": 0.6729, + "step": 21868 + }, + { + "epoch": 0.76, + "learning_rate": 2.7615895263388215e-06, + "loss": 0.6293, + "step": 21869 + }, + { + "epoch": 0.76, + "learning_rate": 2.7608382887420338e-06, + "loss": 0.6096, + "step": 21870 + }, + { + "epoch": 0.76, + "learning_rate": 2.7600871369746664e-06, + "loss": 0.615, + "step": 21871 + }, + { + "epoch": 0.76, + "learning_rate": 2.759336071045627e-06, + "loss": 0.6118, + "step": 21872 + }, + { + "epoch": 0.76, + "learning_rate": 2.758585090963817e-06, + "loss": 0.6553, + "step": 21873 + }, + { + "epoch": 0.76, + "learning_rate": 2.7578341967381363e-06, + "loss": 0.6273, + "step": 21874 + }, + { + "epoch": 0.76, + "learning_rate": 2.757083388377498e-06, + "loss": 0.6207, + "step": 21875 + }, + { + "epoch": 0.76, + "learning_rate": 2.7563326658907974e-06, + "loss": 0.6159, + "step": 21876 + }, + { + "epoch": 0.76, + "learning_rate": 2.7555820292869352e-06, + "loss": 0.6186, + "step": 21877 + }, + { + "epoch": 0.76, + "learning_rate": 2.7548314785748155e-06, + "loss": 0.6256, + "step": 21878 + }, + { + "epoch": 0.76, + "learning_rate": 2.7540810137633313e-06, + "loss": 0.661, + "step": 21879 + }, + { + "epoch": 0.76, + "learning_rate": 2.7533306348613786e-06, + "loss": 0.647, + "step": 21880 + }, + { + "epoch": 0.76, + "learning_rate": 2.7525803418778652e-06, + "loss": 0.6743, + "step": 21881 + }, + { + "epoch": 0.76, + "learning_rate": 2.751830134821677e-06, + "loss": 0.612, + "step": 21882 + }, + { + "epoch": 0.76, + "learning_rate": 2.7510800137017114e-06, + "loss": 0.6839, + "step": 21883 + }, + { + "epoch": 0.76, + "learning_rate": 2.7503299785268645e-06, + "loss": 0.5792, + "step": 21884 + }, + { + "epoch": 0.76, + "learning_rate": 2.7495800293060247e-06, + "loss": 0.644, + "step": 21885 + }, + { + "epoch": 0.76, + "learning_rate": 2.748830166048082e-06, + "loss": 0.6819, + "step": 21886 + }, + { + "epoch": 0.76, + "learning_rate": 2.7480803887619358e-06, + "loss": 0.5393, + "step": 21887 + }, + { + "epoch": 0.76, + "learning_rate": 2.7473306974564684e-06, + "loss": 0.592, + "step": 21888 + }, + { + "epoch": 0.76, + "learning_rate": 2.746581092140569e-06, + "loss": 0.6832, + "step": 21889 + }, + { + "epoch": 0.76, + "learning_rate": 2.74583157282313e-06, + "loss": 0.6036, + "step": 21890 + }, + { + "epoch": 0.76, + "learning_rate": 2.745082139513032e-06, + "loss": 0.6098, + "step": 21891 + }, + { + "epoch": 0.76, + "learning_rate": 2.744332792219159e-06, + "loss": 0.6452, + "step": 21892 + }, + { + "epoch": 0.76, + "learning_rate": 2.7435835309504053e-06, + "loss": 0.6473, + "step": 21893 + }, + { + "epoch": 0.76, + "learning_rate": 2.7428343557156455e-06, + "loss": 0.6037, + "step": 21894 + }, + { + "epoch": 0.76, + "learning_rate": 2.742085266523764e-06, + "loss": 0.6058, + "step": 21895 + }, + { + "epoch": 0.76, + "learning_rate": 2.741336263383647e-06, + "loss": 0.6251, + "step": 21896 + }, + { + "epoch": 0.76, + "learning_rate": 2.7405873463041675e-06, + "loss": 0.623, + "step": 21897 + }, + { + "epoch": 0.76, + "learning_rate": 2.739838515294205e-06, + "loss": 0.6723, + "step": 21898 + }, + { + "epoch": 0.76, + "learning_rate": 2.7390897703626475e-06, + "loss": 0.6298, + "step": 21899 + }, + { + "epoch": 0.76, + "learning_rate": 2.7383411115183624e-06, + "loss": 0.6138, + "step": 21900 + }, + { + "epoch": 0.76, + "learning_rate": 2.7375925387702296e-06, + "loss": 0.6356, + "step": 21901 + }, + { + "epoch": 0.76, + "learning_rate": 2.736844052127127e-06, + "loss": 0.5972, + "step": 21902 + }, + { + "epoch": 0.76, + "learning_rate": 2.736095651597923e-06, + "loss": 0.6306, + "step": 21903 + }, + { + "epoch": 0.76, + "learning_rate": 2.7353473371914917e-06, + "loss": 0.6203, + "step": 21904 + }, + { + "epoch": 0.76, + "learning_rate": 2.7345991089167135e-06, + "loss": 0.5617, + "step": 21905 + }, + { + "epoch": 0.76, + "learning_rate": 2.7338509667824496e-06, + "loss": 0.6083, + "step": 21906 + }, + { + "epoch": 0.76, + "learning_rate": 2.733102910797575e-06, + "loss": 0.7053, + "step": 21907 + }, + { + "epoch": 0.76, + "learning_rate": 2.7323549409709614e-06, + "loss": 0.6449, + "step": 21908 + }, + { + "epoch": 0.76, + "learning_rate": 2.7316070573114696e-06, + "loss": 0.5924, + "step": 21909 + }, + { + "epoch": 0.76, + "learning_rate": 2.730859259827968e-06, + "loss": 0.6052, + "step": 21910 + }, + { + "epoch": 0.76, + "learning_rate": 2.7301115485293315e-06, + "loss": 0.6073, + "step": 21911 + }, + { + "epoch": 0.76, + "learning_rate": 2.7293639234244175e-06, + "loss": 0.6102, + "step": 21912 + }, + { + "epoch": 0.76, + "learning_rate": 2.7286163845220892e-06, + "loss": 0.644, + "step": 21913 + }, + { + "epoch": 0.76, + "learning_rate": 2.727868931831217e-06, + "loss": 0.6146, + "step": 21914 + }, + { + "epoch": 0.76, + "learning_rate": 2.727121565360653e-06, + "loss": 0.5932, + "step": 21915 + }, + { + "epoch": 0.76, + "learning_rate": 2.726374285119262e-06, + "loss": 0.6636, + "step": 21916 + }, + { + "epoch": 0.76, + "learning_rate": 2.72562709111591e-06, + "loss": 0.6414, + "step": 21917 + }, + { + "epoch": 0.76, + "learning_rate": 2.7248799833594476e-06, + "loss": 0.615, + "step": 21918 + }, + { + "epoch": 0.76, + "learning_rate": 2.7241329618587363e-06, + "loss": 0.6384, + "step": 21919 + }, + { + "epoch": 0.76, + "learning_rate": 2.7233860266226365e-06, + "loss": 0.6183, + "step": 21920 + }, + { + "epoch": 0.76, + "learning_rate": 2.722639177659997e-06, + "loss": 0.5726, + "step": 21921 + }, + { + "epoch": 0.76, + "learning_rate": 2.7218924149796723e-06, + "loss": 0.6441, + "step": 21922 + }, + { + "epoch": 0.76, + "learning_rate": 2.721145738590527e-06, + "loss": 0.611, + "step": 21923 + }, + { + "epoch": 0.76, + "learning_rate": 2.7203991485014025e-06, + "loss": 0.6726, + "step": 21924 + }, + { + "epoch": 0.76, + "learning_rate": 2.719652644721156e-06, + "loss": 0.7045, + "step": 21925 + }, + { + "epoch": 0.76, + "learning_rate": 2.7189062272586396e-06, + "loss": 0.576, + "step": 21926 + }, + { + "epoch": 0.76, + "learning_rate": 2.7181598961226973e-06, + "loss": 0.618, + "step": 21927 + }, + { + "epoch": 0.76, + "learning_rate": 2.7174136513221784e-06, + "loss": 0.6386, + "step": 21928 + }, + { + "epoch": 0.76, + "learning_rate": 2.7166674928659387e-06, + "loss": 0.6264, + "step": 21929 + }, + { + "epoch": 0.76, + "learning_rate": 2.7159214207628157e-06, + "loss": 0.6123, + "step": 21930 + }, + { + "epoch": 0.76, + "learning_rate": 2.715175435021663e-06, + "loss": 0.6268, + "step": 21931 + }, + { + "epoch": 0.76, + "learning_rate": 2.7144295356513174e-06, + "loss": 0.6511, + "step": 21932 + }, + { + "epoch": 0.76, + "learning_rate": 2.713683722660626e-06, + "loss": 0.5848, + "step": 21933 + }, + { + "epoch": 0.76, + "learning_rate": 2.7129379960584314e-06, + "loss": 0.5886, + "step": 21934 + }, + { + "epoch": 0.76, + "learning_rate": 2.7121923558535745e-06, + "loss": 0.6607, + "step": 21935 + }, + { + "epoch": 0.76, + "learning_rate": 2.711446802054898e-06, + "loss": 0.6735, + "step": 21936 + }, + { + "epoch": 0.76, + "learning_rate": 2.7107013346712407e-06, + "loss": 0.6258, + "step": 21937 + }, + { + "epoch": 0.76, + "learning_rate": 2.7099559537114383e-06, + "loss": 0.6006, + "step": 21938 + }, + { + "epoch": 0.76, + "learning_rate": 2.7092106591843293e-06, + "loss": 0.6892, + "step": 21939 + }, + { + "epoch": 0.76, + "learning_rate": 2.7084654510987506e-06, + "loss": 0.5839, + "step": 21940 + }, + { + "epoch": 0.76, + "learning_rate": 2.707720329463539e-06, + "loss": 0.6516, + "step": 21941 + }, + { + "epoch": 0.76, + "learning_rate": 2.706975294287527e-06, + "loss": 0.6398, + "step": 21942 + }, + { + "epoch": 0.76, + "learning_rate": 2.7062303455795513e-06, + "loss": 0.6431, + "step": 21943 + }, + { + "epoch": 0.76, + "learning_rate": 2.705485483348439e-06, + "loss": 0.6358, + "step": 21944 + }, + { + "epoch": 0.76, + "learning_rate": 2.704740707603024e-06, + "loss": 0.6401, + "step": 21945 + }, + { + "epoch": 0.76, + "learning_rate": 2.703996018352136e-06, + "loss": 0.5911, + "step": 21946 + }, + { + "epoch": 0.76, + "learning_rate": 2.7032514156046054e-06, + "loss": 0.6392, + "step": 21947 + }, + { + "epoch": 0.76, + "learning_rate": 2.702506899369258e-06, + "loss": 0.6077, + "step": 21948 + }, + { + "epoch": 0.76, + "learning_rate": 2.701762469654927e-06, + "loss": 0.6107, + "step": 21949 + }, + { + "epoch": 0.76, + "learning_rate": 2.7010181264704315e-06, + "loss": 0.698, + "step": 21950 + }, + { + "epoch": 0.76, + "learning_rate": 2.700273869824599e-06, + "loss": 0.6423, + "step": 21951 + }, + { + "epoch": 0.76, + "learning_rate": 2.6995296997262545e-06, + "loss": 0.6294, + "step": 21952 + }, + { + "epoch": 0.76, + "learning_rate": 2.6987856161842197e-06, + "loss": 0.6172, + "step": 21953 + }, + { + "epoch": 0.76, + "learning_rate": 2.698041619207318e-06, + "loss": 0.6645, + "step": 21954 + }, + { + "epoch": 0.76, + "learning_rate": 2.6972977088043727e-06, + "loss": 0.6747, + "step": 21955 + }, + { + "epoch": 0.76, + "learning_rate": 2.696553884984198e-06, + "loss": 0.6322, + "step": 21956 + }, + { + "epoch": 0.76, + "learning_rate": 2.6958101477556167e-06, + "loss": 0.6463, + "step": 21957 + }, + { + "epoch": 0.76, + "learning_rate": 2.6950664971274443e-06, + "loss": 0.6643, + "step": 21958 + }, + { + "epoch": 0.76, + "learning_rate": 2.694322933108501e-06, + "loss": 0.6509, + "step": 21959 + }, + { + "epoch": 0.76, + "learning_rate": 2.6935794557076e-06, + "loss": 0.6139, + "step": 21960 + }, + { + "epoch": 0.76, + "learning_rate": 2.6928360649335606e-06, + "loss": 0.6807, + "step": 21961 + }, + { + "epoch": 0.76, + "learning_rate": 2.6920927607951907e-06, + "loss": 0.6545, + "step": 21962 + }, + { + "epoch": 0.76, + "learning_rate": 2.6913495433013047e-06, + "loss": 0.6044, + "step": 21963 + }, + { + "epoch": 0.76, + "learning_rate": 2.6906064124607157e-06, + "loss": 0.5934, + "step": 21964 + }, + { + "epoch": 0.76, + "learning_rate": 2.689863368282235e-06, + "loss": 0.623, + "step": 21965 + }, + { + "epoch": 0.76, + "learning_rate": 2.6891204107746704e-06, + "loss": 0.6098, + "step": 21966 + }, + { + "epoch": 0.76, + "learning_rate": 2.688377539946835e-06, + "loss": 0.6439, + "step": 21967 + }, + { + "epoch": 0.76, + "learning_rate": 2.68763475580753e-06, + "loss": 0.6289, + "step": 21968 + }, + { + "epoch": 0.76, + "learning_rate": 2.6868920583655657e-06, + "loss": 0.6769, + "step": 21969 + }, + { + "epoch": 0.76, + "learning_rate": 2.686149447629747e-06, + "loss": 0.6245, + "step": 21970 + }, + { + "epoch": 0.76, + "learning_rate": 2.6854069236088777e-06, + "loss": 0.6359, + "step": 21971 + }, + { + "epoch": 0.76, + "learning_rate": 2.684664486311763e-06, + "loss": 0.6364, + "step": 21972 + }, + { + "epoch": 0.76, + "learning_rate": 2.6839221357472078e-06, + "loss": 0.6124, + "step": 21973 + }, + { + "epoch": 0.76, + "learning_rate": 2.683179871924008e-06, + "loss": 0.6377, + "step": 21974 + }, + { + "epoch": 0.76, + "learning_rate": 2.682437694850966e-06, + "loss": 0.6264, + "step": 21975 + }, + { + "epoch": 0.76, + "learning_rate": 2.6816956045368815e-06, + "loss": 0.5735, + "step": 21976 + }, + { + "epoch": 0.76, + "learning_rate": 2.6809536009905547e-06, + "loss": 0.6032, + "step": 21977 + }, + { + "epoch": 0.76, + "learning_rate": 2.68021168422078e-06, + "loss": 0.5764, + "step": 21978 + }, + { + "epoch": 0.76, + "learning_rate": 2.6794698542363595e-06, + "loss": 0.6641, + "step": 21979 + }, + { + "epoch": 0.76, + "learning_rate": 2.6787281110460806e-06, + "loss": 0.6001, + "step": 21980 + }, + { + "epoch": 0.76, + "learning_rate": 2.677986454658742e-06, + "loss": 0.6098, + "step": 21981 + }, + { + "epoch": 0.76, + "learning_rate": 2.6772448850831368e-06, + "loss": 0.6339, + "step": 21982 + }, + { + "epoch": 0.76, + "learning_rate": 2.6765034023280554e-06, + "loss": 0.6553, + "step": 21983 + }, + { + "epoch": 0.76, + "learning_rate": 2.6757620064022914e-06, + "loss": 0.6095, + "step": 21984 + }, + { + "epoch": 0.76, + "learning_rate": 2.6750206973146374e-06, + "loss": 0.6639, + "step": 21985 + }, + { + "epoch": 0.76, + "learning_rate": 2.6742794750738754e-06, + "loss": 0.6854, + "step": 21986 + }, + { + "epoch": 0.76, + "learning_rate": 2.673538339688798e-06, + "loss": 0.5896, + "step": 21987 + }, + { + "epoch": 0.76, + "learning_rate": 2.672797291168191e-06, + "loss": 0.6153, + "step": 21988 + }, + { + "epoch": 0.76, + "learning_rate": 2.672056329520841e-06, + "loss": 0.6781, + "step": 21989 + }, + { + "epoch": 0.76, + "learning_rate": 2.6713154547555344e-06, + "loss": 0.5565, + "step": 21990 + }, + { + "epoch": 0.76, + "learning_rate": 2.670574666881055e-06, + "loss": 0.6429, + "step": 21991 + }, + { + "epoch": 0.76, + "learning_rate": 2.6698339659061835e-06, + "loss": 0.668, + "step": 21992 + }, + { + "epoch": 0.76, + "learning_rate": 2.669093351839701e-06, + "loss": 0.6494, + "step": 21993 + }, + { + "epoch": 0.76, + "learning_rate": 2.668352824690392e-06, + "loss": 0.6773, + "step": 21994 + }, + { + "epoch": 0.76, + "learning_rate": 2.667612384467034e-06, + "loss": 0.697, + "step": 21995 + }, + { + "epoch": 0.76, + "learning_rate": 2.6668720311784102e-06, + "loss": 0.6859, + "step": 21996 + }, + { + "epoch": 0.76, + "learning_rate": 2.666131764833293e-06, + "loss": 0.6381, + "step": 21997 + }, + { + "epoch": 0.76, + "learning_rate": 2.665391585440459e-06, + "loss": 0.6317, + "step": 21998 + }, + { + "epoch": 0.76, + "learning_rate": 2.6646514930086874e-06, + "loss": 0.6373, + "step": 21999 + }, + { + "epoch": 0.76, + "learning_rate": 2.6639114875467507e-06, + "loss": 0.6337, + "step": 22000 + }, + { + "epoch": 0.76, + "learning_rate": 2.6631715690634253e-06, + "loss": 0.6403, + "step": 22001 + }, + { + "epoch": 0.76, + "learning_rate": 2.6624317375674836e-06, + "loss": 0.629, + "step": 22002 + }, + { + "epoch": 0.76, + "learning_rate": 2.661691993067693e-06, + "loss": 0.6169, + "step": 22003 + }, + { + "epoch": 0.76, + "learning_rate": 2.6609523355728264e-06, + "loss": 0.6748, + "step": 22004 + }, + { + "epoch": 0.76, + "learning_rate": 2.6602127650916545e-06, + "loss": 0.6509, + "step": 22005 + }, + { + "epoch": 0.76, + "learning_rate": 2.659473281632945e-06, + "loss": 0.6212, + "step": 22006 + }, + { + "epoch": 0.76, + "learning_rate": 2.6587338852054657e-06, + "loss": 0.6639, + "step": 22007 + }, + { + "epoch": 0.76, + "learning_rate": 2.657994575817985e-06, + "loss": 0.6711, + "step": 22008 + }, + { + "epoch": 0.76, + "learning_rate": 2.6572553534792645e-06, + "loss": 0.6134, + "step": 22009 + }, + { + "epoch": 0.76, + "learning_rate": 2.65651621819807e-06, + "loss": 0.6751, + "step": 22010 + }, + { + "epoch": 0.76, + "learning_rate": 2.655777169983165e-06, + "loss": 0.6055, + "step": 22011 + }, + { + "epoch": 0.76, + "learning_rate": 2.6550382088433125e-06, + "loss": 0.6714, + "step": 22012 + }, + { + "epoch": 0.76, + "learning_rate": 2.6542993347872727e-06, + "loss": 0.62, + "step": 22013 + }, + { + "epoch": 0.76, + "learning_rate": 2.6535605478238103e-06, + "loss": 0.634, + "step": 22014 + }, + { + "epoch": 0.76, + "learning_rate": 2.6528218479616784e-06, + "loss": 0.6263, + "step": 22015 + }, + { + "epoch": 0.76, + "learning_rate": 2.652083235209637e-06, + "loss": 0.632, + "step": 22016 + }, + { + "epoch": 0.76, + "learning_rate": 2.6513447095764443e-06, + "loss": 0.6193, + "step": 22017 + }, + { + "epoch": 0.76, + "learning_rate": 2.6506062710708556e-06, + "loss": 0.6903, + "step": 22018 + }, + { + "epoch": 0.76, + "learning_rate": 2.6498679197016275e-06, + "loss": 0.6532, + "step": 22019 + }, + { + "epoch": 0.76, + "learning_rate": 2.649129655477516e-06, + "loss": 0.5941, + "step": 22020 + }, + { + "epoch": 0.76, + "learning_rate": 2.648391478407267e-06, + "loss": 0.6391, + "step": 22021 + }, + { + "epoch": 0.76, + "learning_rate": 2.647653388499638e-06, + "loss": 0.5722, + "step": 22022 + }, + { + "epoch": 0.76, + "learning_rate": 2.646915385763379e-06, + "loss": 0.638, + "step": 22023 + }, + { + "epoch": 0.76, + "learning_rate": 2.6461774702072397e-06, + "loss": 0.6777, + "step": 22024 + }, + { + "epoch": 0.76, + "learning_rate": 2.6454396418399685e-06, + "loss": 0.5726, + "step": 22025 + }, + { + "epoch": 0.76, + "learning_rate": 2.6447019006703177e-06, + "loss": 0.5959, + "step": 22026 + }, + { + "epoch": 0.76, + "learning_rate": 2.643964246707027e-06, + "loss": 0.6622, + "step": 22027 + }, + { + "epoch": 0.76, + "learning_rate": 2.643226679958846e-06, + "loss": 0.6628, + "step": 22028 + }, + { + "epoch": 0.76, + "learning_rate": 2.642489200434518e-06, + "loss": 0.6746, + "step": 22029 + }, + { + "epoch": 0.76, + "learning_rate": 2.6417518081427885e-06, + "loss": 0.6269, + "step": 22030 + }, + { + "epoch": 0.76, + "learning_rate": 2.6410145030923994e-06, + "loss": 0.6223, + "step": 22031 + }, + { + "epoch": 0.76, + "learning_rate": 2.640277285292097e-06, + "loss": 0.6722, + "step": 22032 + }, + { + "epoch": 0.76, + "learning_rate": 2.6395401547506127e-06, + "loss": 0.6415, + "step": 22033 + }, + { + "epoch": 0.76, + "learning_rate": 2.638803111476691e-06, + "loss": 0.6692, + "step": 22034 + }, + { + "epoch": 0.76, + "learning_rate": 2.6380661554790708e-06, + "loss": 0.6334, + "step": 22035 + }, + { + "epoch": 0.76, + "learning_rate": 2.637329286766489e-06, + "loss": 0.6537, + "step": 22036 + }, + { + "epoch": 0.76, + "learning_rate": 2.6365925053476826e-06, + "loss": 0.6325, + "step": 22037 + }, + { + "epoch": 0.76, + "learning_rate": 2.6358558112313903e-06, + "loss": 0.6488, + "step": 22038 + }, + { + "epoch": 0.76, + "learning_rate": 2.6351192044263385e-06, + "loss": 0.6432, + "step": 22039 + }, + { + "epoch": 0.76, + "learning_rate": 2.6343826849412666e-06, + "loss": 0.6323, + "step": 22040 + }, + { + "epoch": 0.76, + "learning_rate": 2.633646252784905e-06, + "loss": 0.6643, + "step": 22041 + }, + { + "epoch": 0.76, + "learning_rate": 2.632909907965986e-06, + "loss": 0.6164, + "step": 22042 + }, + { + "epoch": 0.76, + "learning_rate": 2.632173650493238e-06, + "loss": 0.6064, + "step": 22043 + }, + { + "epoch": 0.76, + "learning_rate": 2.631437480375396e-06, + "loss": 0.6539, + "step": 22044 + }, + { + "epoch": 0.76, + "learning_rate": 2.6307013976211813e-06, + "loss": 0.6536, + "step": 22045 + }, + { + "epoch": 0.76, + "learning_rate": 2.6299654022393227e-06, + "loss": 0.6085, + "step": 22046 + }, + { + "epoch": 0.76, + "learning_rate": 2.629229494238549e-06, + "loss": 0.6266, + "step": 22047 + }, + { + "epoch": 0.76, + "learning_rate": 2.6284936736275825e-06, + "loss": 0.6597, + "step": 22048 + }, + { + "epoch": 0.76, + "learning_rate": 2.6277579404151477e-06, + "loss": 0.6384, + "step": 22049 + }, + { + "epoch": 0.76, + "learning_rate": 2.6270222946099723e-06, + "loss": 0.6308, + "step": 22050 + }, + { + "epoch": 0.76, + "learning_rate": 2.6262867362207723e-06, + "loss": 0.6216, + "step": 22051 + }, + { + "epoch": 0.76, + "learning_rate": 2.62555126525627e-06, + "loss": 0.5933, + "step": 22052 + }, + { + "epoch": 0.76, + "learning_rate": 2.6248158817251857e-06, + "loss": 0.6255, + "step": 22053 + }, + { + "epoch": 0.76, + "learning_rate": 2.6240805856362397e-06, + "loss": 0.6429, + "step": 22054 + }, + { + "epoch": 0.76, + "learning_rate": 2.623345376998151e-06, + "loss": 0.6106, + "step": 22055 + }, + { + "epoch": 0.76, + "learning_rate": 2.622610255819632e-06, + "loss": 0.627, + "step": 22056 + }, + { + "epoch": 0.76, + "learning_rate": 2.6218752221094015e-06, + "loss": 0.6406, + "step": 22057 + }, + { + "epoch": 0.76, + "learning_rate": 2.621140275876175e-06, + "loss": 0.6443, + "step": 22058 + }, + { + "epoch": 0.76, + "learning_rate": 2.6204054171286596e-06, + "loss": 0.611, + "step": 22059 + }, + { + "epoch": 0.76, + "learning_rate": 2.6196706458755773e-06, + "loss": 0.6938, + "step": 22060 + }, + { + "epoch": 0.76, + "learning_rate": 2.6189359621256373e-06, + "loss": 0.6137, + "step": 22061 + }, + { + "epoch": 0.76, + "learning_rate": 2.618201365887546e-06, + "loss": 0.6342, + "step": 22062 + }, + { + "epoch": 0.76, + "learning_rate": 2.617466857170016e-06, + "loss": 0.6694, + "step": 22063 + }, + { + "epoch": 0.76, + "learning_rate": 2.616732435981757e-06, + "loss": 0.6134, + "step": 22064 + }, + { + "epoch": 0.76, + "learning_rate": 2.6159981023314695e-06, + "loss": 0.651, + "step": 22065 + }, + { + "epoch": 0.76, + "learning_rate": 2.6152638562278687e-06, + "loss": 0.6376, + "step": 22066 + }, + { + "epoch": 0.76, + "learning_rate": 2.61452969767966e-06, + "loss": 0.6267, + "step": 22067 + }, + { + "epoch": 0.76, + "learning_rate": 2.613795626695541e-06, + "loss": 0.6155, + "step": 22068 + }, + { + "epoch": 0.76, + "learning_rate": 2.613061643284218e-06, + "loss": 0.6183, + "step": 22069 + }, + { + "epoch": 0.76, + "learning_rate": 2.6123277474543975e-06, + "loss": 0.6506, + "step": 22070 + }, + { + "epoch": 0.76, + "learning_rate": 2.6115939392147705e-06, + "loss": 0.6299, + "step": 22071 + }, + { + "epoch": 0.76, + "learning_rate": 2.6108602185740463e-06, + "loss": 0.5991, + "step": 22072 + }, + { + "epoch": 0.76, + "learning_rate": 2.6101265855409254e-06, + "loss": 0.6362, + "step": 22073 + }, + { + "epoch": 0.76, + "learning_rate": 2.6093930401240985e-06, + "loss": 0.6242, + "step": 22074 + }, + { + "epoch": 0.76, + "learning_rate": 2.608659582332266e-06, + "loss": 0.6786, + "step": 22075 + }, + { + "epoch": 0.76, + "learning_rate": 2.607926212174128e-06, + "loss": 0.6544, + "step": 22076 + }, + { + "epoch": 0.76, + "learning_rate": 2.6071929296583698e-06, + "loss": 0.6003, + "step": 22077 + }, + { + "epoch": 0.76, + "learning_rate": 2.606459734793694e-06, + "loss": 0.7104, + "step": 22078 + }, + { + "epoch": 0.76, + "learning_rate": 2.605726627588794e-06, + "loss": 0.6048, + "step": 22079 + }, + { + "epoch": 0.77, + "learning_rate": 2.6049936080523553e-06, + "loss": 0.6275, + "step": 22080 + }, + { + "epoch": 0.77, + "learning_rate": 2.604260676193072e-06, + "loss": 0.5871, + "step": 22081 + }, + { + "epoch": 0.77, + "learning_rate": 2.603527832019638e-06, + "loss": 0.646, + "step": 22082 + }, + { + "epoch": 0.77, + "learning_rate": 2.6027950755407318e-06, + "loss": 0.6103, + "step": 22083 + }, + { + "epoch": 0.77, + "learning_rate": 2.60206240676505e-06, + "loss": 0.6029, + "step": 22084 + }, + { + "epoch": 0.77, + "learning_rate": 2.60132982570128e-06, + "loss": 0.5876, + "step": 22085 + }, + { + "epoch": 0.77, + "learning_rate": 2.600597332358101e-06, + "loss": 0.5901, + "step": 22086 + }, + { + "epoch": 0.77, + "learning_rate": 2.599864926744201e-06, + "loss": 0.5863, + "step": 22087 + }, + { + "epoch": 0.77, + "learning_rate": 2.599132608868268e-06, + "loss": 0.6224, + "step": 22088 + }, + { + "epoch": 0.77, + "learning_rate": 2.598400378738972e-06, + "loss": 0.652, + "step": 22089 + }, + { + "epoch": 0.77, + "learning_rate": 2.5976682363650065e-06, + "loss": 0.605, + "step": 22090 + }, + { + "epoch": 0.77, + "learning_rate": 2.596936181755051e-06, + "loss": 0.5973, + "step": 22091 + }, + { + "epoch": 0.77, + "learning_rate": 2.596204214917779e-06, + "loss": 0.6642, + "step": 22092 + }, + { + "epoch": 0.77, + "learning_rate": 2.5954723358618718e-06, + "loss": 0.6798, + "step": 22093 + }, + { + "epoch": 0.77, + "learning_rate": 2.5947405445960105e-06, + "loss": 0.6369, + "step": 22094 + }, + { + "epoch": 0.77, + "learning_rate": 2.594008841128861e-06, + "loss": 0.652, + "step": 22095 + }, + { + "epoch": 0.77, + "learning_rate": 2.5932772254691085e-06, + "loss": 0.6179, + "step": 22096 + }, + { + "epoch": 0.77, + "learning_rate": 2.592545697625427e-06, + "loss": 0.6831, + "step": 22097 + }, + { + "epoch": 0.77, + "learning_rate": 2.591814257606483e-06, + "loss": 0.6213, + "step": 22098 + }, + { + "epoch": 0.77, + "learning_rate": 2.591082905420954e-06, + "loss": 0.5994, + "step": 22099 + }, + { + "epoch": 0.77, + "learning_rate": 2.5903516410775107e-06, + "loss": 0.6581, + "step": 22100 + }, + { + "epoch": 0.77, + "learning_rate": 2.5896204645848177e-06, + "loss": 0.6652, + "step": 22101 + }, + { + "epoch": 0.77, + "learning_rate": 2.58888937595155e-06, + "loss": 0.6072, + "step": 22102 + }, + { + "epoch": 0.77, + "learning_rate": 2.588158375186377e-06, + "loss": 0.6394, + "step": 22103 + }, + { + "epoch": 0.77, + "learning_rate": 2.5874274622979602e-06, + "loss": 0.5562, + "step": 22104 + }, + { + "epoch": 0.77, + "learning_rate": 2.5866966372949675e-06, + "loss": 0.6228, + "step": 22105 + }, + { + "epoch": 0.77, + "learning_rate": 2.585965900186067e-06, + "loss": 0.6595, + "step": 22106 + }, + { + "epoch": 0.77, + "learning_rate": 2.585235250979913e-06, + "loss": 0.6307, + "step": 22107 + }, + { + "epoch": 0.77, + "learning_rate": 2.584504689685179e-06, + "loss": 0.6361, + "step": 22108 + }, + { + "epoch": 0.77, + "learning_rate": 2.5837742163105238e-06, + "loss": 0.6415, + "step": 22109 + }, + { + "epoch": 0.77, + "learning_rate": 2.5830438308646055e-06, + "loss": 0.6416, + "step": 22110 + }, + { + "epoch": 0.77, + "learning_rate": 2.5823135333560843e-06, + "loss": 0.6447, + "step": 22111 + }, + { + "epoch": 0.77, + "learning_rate": 2.5815833237936226e-06, + "loss": 0.5791, + "step": 22112 + }, + { + "epoch": 0.77, + "learning_rate": 2.580853202185869e-06, + "loss": 0.6584, + "step": 22113 + }, + { + "epoch": 0.77, + "learning_rate": 2.58012316854149e-06, + "loss": 0.7071, + "step": 22114 + }, + { + "epoch": 0.77, + "learning_rate": 2.579393222869139e-06, + "loss": 0.6958, + "step": 22115 + }, + { + "epoch": 0.77, + "learning_rate": 2.5786633651774652e-06, + "loss": 0.6019, + "step": 22116 + }, + { + "epoch": 0.77, + "learning_rate": 2.5779335954751282e-06, + "loss": 0.6629, + "step": 22117 + }, + { + "epoch": 0.77, + "learning_rate": 2.5772039137707748e-06, + "loss": 0.667, + "step": 22118 + }, + { + "epoch": 0.77, + "learning_rate": 2.5764743200730556e-06, + "loss": 0.6207, + "step": 22119 + }, + { + "epoch": 0.77, + "learning_rate": 2.5757448143906303e-06, + "loss": 0.6082, + "step": 22120 + }, + { + "epoch": 0.77, + "learning_rate": 2.57501539673214e-06, + "loss": 0.6415, + "step": 22121 + }, + { + "epoch": 0.77, + "learning_rate": 2.574286067106233e-06, + "loss": 0.6764, + "step": 22122 + }, + { + "epoch": 0.77, + "learning_rate": 2.5735568255215624e-06, + "loss": 0.646, + "step": 22123 + }, + { + "epoch": 0.77, + "learning_rate": 2.5728276719867674e-06, + "loss": 0.6169, + "step": 22124 + }, + { + "epoch": 0.77, + "learning_rate": 2.5720986065104912e-06, + "loss": 0.6621, + "step": 22125 + }, + { + "epoch": 0.77, + "learning_rate": 2.57136962910139e-06, + "loss": 0.6731, + "step": 22126 + }, + { + "epoch": 0.77, + "learning_rate": 2.5706407397680955e-06, + "loss": 0.6163, + "step": 22127 + }, + { + "epoch": 0.77, + "learning_rate": 2.569911938519253e-06, + "loss": 0.6258, + "step": 22128 + }, + { + "epoch": 0.77, + "learning_rate": 2.5691832253635075e-06, + "loss": 0.6877, + "step": 22129 + }, + { + "epoch": 0.77, + "learning_rate": 2.568454600309491e-06, + "loss": 0.6042, + "step": 22130 + }, + { + "epoch": 0.77, + "learning_rate": 2.567726063365843e-06, + "loss": 0.639, + "step": 22131 + }, + { + "epoch": 0.77, + "learning_rate": 2.566997614541211e-06, + "loss": 0.6961, + "step": 22132 + }, + { + "epoch": 0.77, + "learning_rate": 2.5662692538442213e-06, + "loss": 0.6335, + "step": 22133 + }, + { + "epoch": 0.77, + "learning_rate": 2.565540981283514e-06, + "loss": 0.6115, + "step": 22134 + }, + { + "epoch": 0.77, + "learning_rate": 2.564812796867726e-06, + "loss": 0.5503, + "step": 22135 + }, + { + "epoch": 0.77, + "learning_rate": 2.5640847006054847e-06, + "loss": 0.6159, + "step": 22136 + }, + { + "epoch": 0.77, + "learning_rate": 2.563356692505423e-06, + "loss": 0.6326, + "step": 22137 + }, + { + "epoch": 0.77, + "learning_rate": 2.562628772576181e-06, + "loss": 0.6019, + "step": 22138 + }, + { + "epoch": 0.77, + "learning_rate": 2.5619009408263793e-06, + "loss": 0.6334, + "step": 22139 + }, + { + "epoch": 0.77, + "learning_rate": 2.5611731972646527e-06, + "loss": 0.561, + "step": 22140 + }, + { + "epoch": 0.77, + "learning_rate": 2.56044554189963e-06, + "loss": 0.6405, + "step": 22141 + }, + { + "epoch": 0.77, + "learning_rate": 2.5597179747399337e-06, + "loss": 0.6517, + "step": 22142 + }, + { + "epoch": 0.77, + "learning_rate": 2.5589904957941903e-06, + "loss": 0.5968, + "step": 22143 + }, + { + "epoch": 0.77, + "learning_rate": 2.5582631050710326e-06, + "loss": 0.6147, + "step": 22144 + }, + { + "epoch": 0.77, + "learning_rate": 2.5575358025790776e-06, + "loss": 0.6618, + "step": 22145 + }, + { + "epoch": 0.77, + "learning_rate": 2.55680858832695e-06, + "loss": 0.6191, + "step": 22146 + }, + { + "epoch": 0.77, + "learning_rate": 2.5560814623232755e-06, + "loss": 0.6289, + "step": 22147 + }, + { + "epoch": 0.77, + "learning_rate": 2.555354424576668e-06, + "loss": 0.6733, + "step": 22148 + }, + { + "epoch": 0.77, + "learning_rate": 2.554627475095749e-06, + "loss": 0.6516, + "step": 22149 + }, + { + "epoch": 0.77, + "learning_rate": 2.5539006138891464e-06, + "loss": 0.6508, + "step": 22150 + }, + { + "epoch": 0.77, + "learning_rate": 2.553173840965467e-06, + "loss": 0.6561, + "step": 22151 + }, + { + "epoch": 0.77, + "learning_rate": 2.552447156333333e-06, + "loss": 0.6471, + "step": 22152 + }, + { + "epoch": 0.77, + "learning_rate": 2.5517205600013617e-06, + "loss": 0.6254, + "step": 22153 + }, + { + "epoch": 0.77, + "learning_rate": 2.550994051978163e-06, + "loss": 0.6445, + "step": 22154 + }, + { + "epoch": 0.77, + "learning_rate": 2.5502676322723485e-06, + "loss": 0.6552, + "step": 22155 + }, + { + "epoch": 0.77, + "learning_rate": 2.5495413008925417e-06, + "loss": 0.6205, + "step": 22156 + }, + { + "epoch": 0.77, + "learning_rate": 2.548815057847346e-06, + "loss": 0.5974, + "step": 22157 + }, + { + "epoch": 0.77, + "learning_rate": 2.5480889031453715e-06, + "loss": 0.5815, + "step": 22158 + }, + { + "epoch": 0.77, + "learning_rate": 2.547362836795234e-06, + "loss": 0.6657, + "step": 22159 + }, + { + "epoch": 0.77, + "learning_rate": 2.5466368588055347e-06, + "loss": 0.6745, + "step": 22160 + }, + { + "epoch": 0.77, + "learning_rate": 2.5459109691848805e-06, + "loss": 0.6462, + "step": 22161 + }, + { + "epoch": 0.77, + "learning_rate": 2.5451851679418882e-06, + "loss": 0.6496, + "step": 22162 + }, + { + "epoch": 0.77, + "learning_rate": 2.544459455085152e-06, + "loss": 0.6329, + "step": 22163 + }, + { + "epoch": 0.77, + "learning_rate": 2.5437338306232807e-06, + "loss": 0.6769, + "step": 22164 + }, + { + "epoch": 0.77, + "learning_rate": 2.5430082945648793e-06, + "loss": 0.669, + "step": 22165 + }, + { + "epoch": 0.77, + "learning_rate": 2.542282846918546e-06, + "loss": 0.64, + "step": 22166 + }, + { + "epoch": 0.77, + "learning_rate": 2.5415574876928806e-06, + "loss": 0.601, + "step": 22167 + }, + { + "epoch": 0.77, + "learning_rate": 2.5408322168964915e-06, + "loss": 0.6433, + "step": 22168 + }, + { + "epoch": 0.77, + "learning_rate": 2.5401070345379688e-06, + "loss": 0.5776, + "step": 22169 + }, + { + "epoch": 0.77, + "learning_rate": 2.5393819406259145e-06, + "loss": 0.6269, + "step": 22170 + }, + { + "epoch": 0.77, + "learning_rate": 2.538656935168928e-06, + "loss": 0.6538, + "step": 22171 + }, + { + "epoch": 0.77, + "learning_rate": 2.5379320181756007e-06, + "loss": 0.6658, + "step": 22172 + }, + { + "epoch": 0.77, + "learning_rate": 2.5372071896545237e-06, + "loss": 0.6787, + "step": 22173 + }, + { + "epoch": 0.77, + "learning_rate": 2.536482449614304e-06, + "loss": 0.659, + "step": 22174 + }, + { + "epoch": 0.77, + "learning_rate": 2.535757798063522e-06, + "loss": 0.578, + "step": 22175 + }, + { + "epoch": 0.77, + "learning_rate": 2.5350332350107732e-06, + "loss": 0.5711, + "step": 22176 + }, + { + "epoch": 0.77, + "learning_rate": 2.5343087604646522e-06, + "loss": 0.6263, + "step": 22177 + }, + { + "epoch": 0.77, + "learning_rate": 2.533584374433742e-06, + "loss": 0.5834, + "step": 22178 + }, + { + "epoch": 0.77, + "learning_rate": 2.532860076926634e-06, + "loss": 0.6323, + "step": 22179 + }, + { + "epoch": 0.77, + "learning_rate": 2.532135867951916e-06, + "loss": 0.6229, + "step": 22180 + }, + { + "epoch": 0.77, + "learning_rate": 2.5314117475181732e-06, + "loss": 0.6264, + "step": 22181 + }, + { + "epoch": 0.77, + "learning_rate": 2.530687715633996e-06, + "loss": 0.6463, + "step": 22182 + }, + { + "epoch": 0.77, + "learning_rate": 2.529963772307962e-06, + "loss": 0.6804, + "step": 22183 + }, + { + "epoch": 0.77, + "learning_rate": 2.529239917548656e-06, + "loss": 0.6364, + "step": 22184 + }, + { + "epoch": 0.77, + "learning_rate": 2.5285161513646615e-06, + "loss": 0.6292, + "step": 22185 + }, + { + "epoch": 0.77, + "learning_rate": 2.5277924737645598e-06, + "loss": 0.5985, + "step": 22186 + }, + { + "epoch": 0.77, + "learning_rate": 2.527068884756931e-06, + "loss": 0.598, + "step": 22187 + }, + { + "epoch": 0.77, + "learning_rate": 2.526345384350357e-06, + "loss": 0.6837, + "step": 22188 + }, + { + "epoch": 0.77, + "learning_rate": 2.525621972553409e-06, + "loss": 0.7108, + "step": 22189 + }, + { + "epoch": 0.77, + "learning_rate": 2.5248986493746688e-06, + "loss": 0.5728, + "step": 22190 + }, + { + "epoch": 0.77, + "learning_rate": 2.5241754148227103e-06, + "loss": 0.6145, + "step": 22191 + }, + { + "epoch": 0.77, + "learning_rate": 2.523452268906109e-06, + "loss": 0.6022, + "step": 22192 + }, + { + "epoch": 0.77, + "learning_rate": 2.522729211633439e-06, + "loss": 0.6757, + "step": 22193 + }, + { + "epoch": 0.77, + "learning_rate": 2.5220062430132764e-06, + "loss": 0.6272, + "step": 22194 + }, + { + "epoch": 0.77, + "learning_rate": 2.5212833630541866e-06, + "loss": 0.627, + "step": 22195 + }, + { + "epoch": 0.77, + "learning_rate": 2.520560571764743e-06, + "loss": 0.6542, + "step": 22196 + }, + { + "epoch": 0.77, + "learning_rate": 2.5198378691535154e-06, + "loss": 0.6345, + "step": 22197 + }, + { + "epoch": 0.77, + "learning_rate": 2.519115255229072e-06, + "loss": 0.638, + "step": 22198 + }, + { + "epoch": 0.77, + "learning_rate": 2.51839272999998e-06, + "loss": 0.6593, + "step": 22199 + }, + { + "epoch": 0.77, + "learning_rate": 2.517670293474811e-06, + "loss": 0.6081, + "step": 22200 + }, + { + "epoch": 0.77, + "learning_rate": 2.5169479456621216e-06, + "loss": 0.6709, + "step": 22201 + }, + { + "epoch": 0.77, + "learning_rate": 2.5162256865704813e-06, + "loss": 0.641, + "step": 22202 + }, + { + "epoch": 0.77, + "learning_rate": 2.5155035162084518e-06, + "loss": 0.6205, + "step": 22203 + }, + { + "epoch": 0.77, + "learning_rate": 2.5147814345845966e-06, + "loss": 0.6667, + "step": 22204 + }, + { + "epoch": 0.77, + "learning_rate": 2.514059441707476e-06, + "loss": 0.6335, + "step": 22205 + }, + { + "epoch": 0.77, + "learning_rate": 2.513337537585654e-06, + "loss": 0.6497, + "step": 22206 + }, + { + "epoch": 0.77, + "learning_rate": 2.5126157222276824e-06, + "loss": 0.663, + "step": 22207 + }, + { + "epoch": 0.77, + "learning_rate": 2.511893995642124e-06, + "loss": 0.6187, + "step": 22208 + }, + { + "epoch": 0.77, + "learning_rate": 2.5111723578375337e-06, + "loss": 0.6345, + "step": 22209 + }, + { + "epoch": 0.77, + "learning_rate": 2.5104508088224688e-06, + "loss": 0.5993, + "step": 22210 + }, + { + "epoch": 0.77, + "learning_rate": 2.509729348605484e-06, + "loss": 0.576, + "step": 22211 + }, + { + "epoch": 0.77, + "learning_rate": 2.5090079771951357e-06, + "loss": 0.6173, + "step": 22212 + }, + { + "epoch": 0.77, + "learning_rate": 2.5082866945999716e-06, + "loss": 0.5937, + "step": 22213 + }, + { + "epoch": 0.77, + "learning_rate": 2.507565500828546e-06, + "loss": 0.6829, + "step": 22214 + }, + { + "epoch": 0.77, + "learning_rate": 2.5068443958894097e-06, + "loss": 0.6311, + "step": 22215 + }, + { + "epoch": 0.77, + "learning_rate": 2.5061233797911112e-06, + "loss": 0.6511, + "step": 22216 + }, + { + "epoch": 0.77, + "learning_rate": 2.5054024525421995e-06, + "loss": 0.5827, + "step": 22217 + }, + { + "epoch": 0.77, + "learning_rate": 2.5046816141512254e-06, + "loss": 0.6254, + "step": 22218 + }, + { + "epoch": 0.77, + "learning_rate": 2.50396086462673e-06, + "loss": 0.5828, + "step": 22219 + }, + { + "epoch": 0.77, + "learning_rate": 2.5032402039772607e-06, + "loss": 0.6703, + "step": 22220 + }, + { + "epoch": 0.77, + "learning_rate": 2.502519632211362e-06, + "loss": 0.6561, + "step": 22221 + }, + { + "epoch": 0.77, + "learning_rate": 2.5017991493375783e-06, + "loss": 0.6167, + "step": 22222 + }, + { + "epoch": 0.77, + "learning_rate": 2.501078755364451e-06, + "loss": 0.6499, + "step": 22223 + }, + { + "epoch": 0.77, + "learning_rate": 2.500358450300523e-06, + "loss": 0.6284, + "step": 22224 + }, + { + "epoch": 0.77, + "learning_rate": 2.49963823415433e-06, + "loss": 0.6317, + "step": 22225 + }, + { + "epoch": 0.77, + "learning_rate": 2.4989181069344147e-06, + "loss": 0.6271, + "step": 22226 + }, + { + "epoch": 0.77, + "learning_rate": 2.4981980686493133e-06, + "loss": 0.6924, + "step": 22227 + }, + { + "epoch": 0.77, + "learning_rate": 2.4974781193075646e-06, + "loss": 0.6358, + "step": 22228 + }, + { + "epoch": 0.77, + "learning_rate": 2.496758258917703e-06, + "loss": 0.6202, + "step": 22229 + }, + { + "epoch": 0.77, + "learning_rate": 2.496038487488266e-06, + "loss": 0.6414, + "step": 22230 + }, + { + "epoch": 0.77, + "learning_rate": 2.495318805027783e-06, + "loss": 0.6147, + "step": 22231 + }, + { + "epoch": 0.77, + "learning_rate": 2.494599211544789e-06, + "loss": 0.6581, + "step": 22232 + }, + { + "epoch": 0.77, + "learning_rate": 2.493879707047816e-06, + "loss": 0.6476, + "step": 22233 + }, + { + "epoch": 0.77, + "learning_rate": 2.4931602915453945e-06, + "loss": 0.6637, + "step": 22234 + }, + { + "epoch": 0.77, + "learning_rate": 2.4924409650460535e-06, + "loss": 0.651, + "step": 22235 + }, + { + "epoch": 0.77, + "learning_rate": 2.491721727558325e-06, + "loss": 0.6367, + "step": 22236 + }, + { + "epoch": 0.77, + "learning_rate": 2.491002579090731e-06, + "loss": 0.6826, + "step": 22237 + }, + { + "epoch": 0.77, + "learning_rate": 2.490283519651799e-06, + "loss": 0.6173, + "step": 22238 + }, + { + "epoch": 0.77, + "learning_rate": 2.4895645492500576e-06, + "loss": 0.6433, + "step": 22239 + }, + { + "epoch": 0.77, + "learning_rate": 2.4888456678940276e-06, + "loss": 0.5853, + "step": 22240 + }, + { + "epoch": 0.77, + "learning_rate": 2.488126875592237e-06, + "loss": 0.6685, + "step": 22241 + }, + { + "epoch": 0.77, + "learning_rate": 2.4874081723532027e-06, + "loss": 0.6098, + "step": 22242 + }, + { + "epoch": 0.77, + "learning_rate": 2.4866895581854476e-06, + "loss": 0.6599, + "step": 22243 + }, + { + "epoch": 0.77, + "learning_rate": 2.485971033097493e-06, + "loss": 0.6759, + "step": 22244 + }, + { + "epoch": 0.77, + "learning_rate": 2.4852525970978556e-06, + "loss": 0.6592, + "step": 22245 + }, + { + "epoch": 0.77, + "learning_rate": 2.4845342501950565e-06, + "loss": 0.6216, + "step": 22246 + }, + { + "epoch": 0.77, + "learning_rate": 2.4838159923976123e-06, + "loss": 0.6592, + "step": 22247 + }, + { + "epoch": 0.77, + "learning_rate": 2.483097823714036e-06, + "loss": 0.6555, + "step": 22248 + }, + { + "epoch": 0.77, + "learning_rate": 2.482379744152843e-06, + "loss": 0.666, + "step": 22249 + }, + { + "epoch": 0.77, + "learning_rate": 2.4816617537225483e-06, + "loss": 0.6547, + "step": 22250 + }, + { + "epoch": 0.77, + "learning_rate": 2.480943852431664e-06, + "loss": 0.6276, + "step": 22251 + }, + { + "epoch": 0.77, + "learning_rate": 2.4802260402887023e-06, + "loss": 0.6172, + "step": 22252 + }, + { + "epoch": 0.77, + "learning_rate": 2.479508317302176e-06, + "loss": 0.6444, + "step": 22253 + }, + { + "epoch": 0.77, + "learning_rate": 2.4787906834805896e-06, + "loss": 0.6169, + "step": 22254 + }, + { + "epoch": 0.77, + "learning_rate": 2.478073138832453e-06, + "loss": 0.6547, + "step": 22255 + }, + { + "epoch": 0.77, + "learning_rate": 2.477355683366276e-06, + "loss": 0.6275, + "step": 22256 + }, + { + "epoch": 0.77, + "learning_rate": 2.4766383170905628e-06, + "loss": 0.6294, + "step": 22257 + }, + { + "epoch": 0.77, + "learning_rate": 2.47592104001382e-06, + "loss": 0.5406, + "step": 22258 + }, + { + "epoch": 0.77, + "learning_rate": 2.475203852144553e-06, + "loss": 0.5928, + "step": 22259 + }, + { + "epoch": 0.77, + "learning_rate": 2.474486753491262e-06, + "loss": 0.643, + "step": 22260 + }, + { + "epoch": 0.77, + "learning_rate": 2.47376974406245e-06, + "loss": 0.6214, + "step": 22261 + }, + { + "epoch": 0.77, + "learning_rate": 2.4730528238666174e-06, + "loss": 0.5944, + "step": 22262 + }, + { + "epoch": 0.77, + "learning_rate": 2.472335992912266e-06, + "loss": 0.6546, + "step": 22263 + }, + { + "epoch": 0.77, + "learning_rate": 2.471619251207893e-06, + "loss": 0.6554, + "step": 22264 + }, + { + "epoch": 0.77, + "learning_rate": 2.4709025987620017e-06, + "loss": 0.7192, + "step": 22265 + }, + { + "epoch": 0.77, + "learning_rate": 2.4701860355830796e-06, + "loss": 0.6985, + "step": 22266 + }, + { + "epoch": 0.77, + "learning_rate": 2.4694695616796294e-06, + "loss": 0.6416, + "step": 22267 + }, + { + "epoch": 0.77, + "learning_rate": 2.4687531770601426e-06, + "loss": 0.6014, + "step": 22268 + }, + { + "epoch": 0.77, + "learning_rate": 2.4680368817331136e-06, + "loss": 0.66, + "step": 22269 + }, + { + "epoch": 0.77, + "learning_rate": 2.4673206757070356e-06, + "loss": 0.6038, + "step": 22270 + }, + { + "epoch": 0.77, + "learning_rate": 2.466604558990403e-06, + "loss": 0.629, + "step": 22271 + }, + { + "epoch": 0.77, + "learning_rate": 2.4658885315917003e-06, + "loss": 0.6575, + "step": 22272 + }, + { + "epoch": 0.77, + "learning_rate": 2.4651725935194202e-06, + "loss": 0.6218, + "step": 22273 + }, + { + "epoch": 0.77, + "learning_rate": 2.46445674478205e-06, + "loss": 0.7432, + "step": 22274 + }, + { + "epoch": 0.77, + "learning_rate": 2.463740985388078e-06, + "loss": 0.6407, + "step": 22275 + }, + { + "epoch": 0.77, + "learning_rate": 2.4630253153459892e-06, + "loss": 0.6303, + "step": 22276 + }, + { + "epoch": 0.77, + "learning_rate": 2.4623097346642734e-06, + "loss": 0.6608, + "step": 22277 + }, + { + "epoch": 0.77, + "learning_rate": 2.461594243351407e-06, + "loss": 0.6079, + "step": 22278 + }, + { + "epoch": 0.77, + "learning_rate": 2.460878841415878e-06, + "loss": 0.6496, + "step": 22279 + }, + { + "epoch": 0.77, + "learning_rate": 2.4601635288661674e-06, + "loss": 0.6169, + "step": 22280 + }, + { + "epoch": 0.77, + "learning_rate": 2.4594483057107554e-06, + "loss": 0.6198, + "step": 22281 + }, + { + "epoch": 0.77, + "learning_rate": 2.458733171958123e-06, + "loss": 0.6657, + "step": 22282 + }, + { + "epoch": 0.77, + "learning_rate": 2.4580181276167516e-06, + "loss": 0.6354, + "step": 22283 + }, + { + "epoch": 0.77, + "learning_rate": 2.4573031726951136e-06, + "loss": 0.674, + "step": 22284 + }, + { + "epoch": 0.77, + "learning_rate": 2.456588307201687e-06, + "loss": 0.6594, + "step": 22285 + }, + { + "epoch": 0.77, + "learning_rate": 2.455873531144949e-06, + "loss": 0.623, + "step": 22286 + }, + { + "epoch": 0.77, + "learning_rate": 2.455158844533373e-06, + "loss": 0.5739, + "step": 22287 + }, + { + "epoch": 0.77, + "learning_rate": 2.4544442473754336e-06, + "loss": 0.6523, + "step": 22288 + }, + { + "epoch": 0.77, + "learning_rate": 2.4537297396796058e-06, + "loss": 0.6047, + "step": 22289 + }, + { + "epoch": 0.77, + "learning_rate": 2.453015321454355e-06, + "loss": 0.6374, + "step": 22290 + }, + { + "epoch": 0.77, + "learning_rate": 2.4523009927081556e-06, + "loss": 0.6691, + "step": 22291 + }, + { + "epoch": 0.77, + "learning_rate": 2.4515867534494743e-06, + "loss": 0.612, + "step": 22292 + }, + { + "epoch": 0.77, + "learning_rate": 2.4508726036867815e-06, + "loss": 0.7, + "step": 22293 + }, + { + "epoch": 0.77, + "learning_rate": 2.4501585434285435e-06, + "loss": 0.5909, + "step": 22294 + }, + { + "epoch": 0.77, + "learning_rate": 2.4494445726832296e-06, + "loss": 0.6007, + "step": 22295 + }, + { + "epoch": 0.77, + "learning_rate": 2.448730691459299e-06, + "loss": 0.6159, + "step": 22296 + }, + { + "epoch": 0.77, + "learning_rate": 2.4480168997652177e-06, + "loss": 0.612, + "step": 22297 + }, + { + "epoch": 0.77, + "learning_rate": 2.4473031976094507e-06, + "loss": 0.6359, + "step": 22298 + }, + { + "epoch": 0.77, + "learning_rate": 2.446589585000457e-06, + "loss": 0.6494, + "step": 22299 + }, + { + "epoch": 0.77, + "learning_rate": 2.4458760619467004e-06, + "loss": 0.6101, + "step": 22300 + }, + { + "epoch": 0.77, + "learning_rate": 2.445162628456641e-06, + "loss": 0.6674, + "step": 22301 + }, + { + "epoch": 0.77, + "learning_rate": 2.4444492845387323e-06, + "loss": 0.5484, + "step": 22302 + }, + { + "epoch": 0.77, + "learning_rate": 2.443736030201439e-06, + "loss": 0.6191, + "step": 22303 + }, + { + "epoch": 0.77, + "learning_rate": 2.4430228654532075e-06, + "loss": 0.6226, + "step": 22304 + }, + { + "epoch": 0.77, + "learning_rate": 2.4423097903025026e-06, + "loss": 0.5942, + "step": 22305 + }, + { + "epoch": 0.77, + "learning_rate": 2.441596804757779e-06, + "loss": 0.6207, + "step": 22306 + }, + { + "epoch": 0.77, + "learning_rate": 2.440883908827483e-06, + "loss": 0.6747, + "step": 22307 + }, + { + "epoch": 0.77, + "learning_rate": 2.4401711025200714e-06, + "loss": 0.6352, + "step": 22308 + }, + { + "epoch": 0.77, + "learning_rate": 2.439458385843997e-06, + "loss": 0.698, + "step": 22309 + }, + { + "epoch": 0.77, + "learning_rate": 2.438745758807701e-06, + "loss": 0.6504, + "step": 22310 + }, + { + "epoch": 0.77, + "learning_rate": 2.4380332214196433e-06, + "loss": 0.6037, + "step": 22311 + }, + { + "epoch": 0.77, + "learning_rate": 2.437320773688271e-06, + "loss": 0.6445, + "step": 22312 + }, + { + "epoch": 0.77, + "learning_rate": 2.436608415622024e-06, + "loss": 0.6752, + "step": 22313 + }, + { + "epoch": 0.77, + "learning_rate": 2.4358961472293506e-06, + "loss": 0.6456, + "step": 22314 + }, + { + "epoch": 0.77, + "learning_rate": 2.4351839685187017e-06, + "loss": 0.6458, + "step": 22315 + }, + { + "epoch": 0.77, + "learning_rate": 2.43447187949851e-06, + "loss": 0.6444, + "step": 22316 + }, + { + "epoch": 0.77, + "learning_rate": 2.4337598801772277e-06, + "loss": 0.6468, + "step": 22317 + }, + { + "epoch": 0.77, + "learning_rate": 2.433047970563297e-06, + "loss": 0.6373, + "step": 22318 + }, + { + "epoch": 0.77, + "learning_rate": 2.432336150665151e-06, + "loss": 0.669, + "step": 22319 + }, + { + "epoch": 0.77, + "learning_rate": 2.431624420491233e-06, + "loss": 0.6114, + "step": 22320 + }, + { + "epoch": 0.77, + "learning_rate": 2.4309127800499843e-06, + "loss": 0.6643, + "step": 22321 + }, + { + "epoch": 0.77, + "learning_rate": 2.4302012293498345e-06, + "loss": 0.6352, + "step": 22322 + }, + { + "epoch": 0.77, + "learning_rate": 2.429489768399228e-06, + "loss": 0.6329, + "step": 22323 + }, + { + "epoch": 0.77, + "learning_rate": 2.428778397206599e-06, + "loss": 0.6329, + "step": 22324 + }, + { + "epoch": 0.77, + "learning_rate": 2.428067115780377e-06, + "loss": 0.6533, + "step": 22325 + }, + { + "epoch": 0.77, + "learning_rate": 2.427355924128999e-06, + "loss": 0.6007, + "step": 22326 + }, + { + "epoch": 0.77, + "learning_rate": 2.4266448222608975e-06, + "loss": 0.606, + "step": 22327 + }, + { + "epoch": 0.77, + "learning_rate": 2.4259338101844965e-06, + "loss": 0.6329, + "step": 22328 + }, + { + "epoch": 0.77, + "learning_rate": 2.425222887908235e-06, + "loss": 0.6696, + "step": 22329 + }, + { + "epoch": 0.77, + "learning_rate": 2.424512055440541e-06, + "loss": 0.6765, + "step": 22330 + }, + { + "epoch": 0.77, + "learning_rate": 2.4238013127898363e-06, + "loss": 0.6144, + "step": 22331 + }, + { + "epoch": 0.77, + "learning_rate": 2.423090659964551e-06, + "loss": 0.6053, + "step": 22332 + }, + { + "epoch": 0.77, + "learning_rate": 2.422380096973114e-06, + "loss": 0.6038, + "step": 22333 + }, + { + "epoch": 0.77, + "learning_rate": 2.421669623823941e-06, + "loss": 0.6134, + "step": 22334 + }, + { + "epoch": 0.77, + "learning_rate": 2.4209592405254634e-06, + "loss": 0.6243, + "step": 22335 + }, + { + "epoch": 0.77, + "learning_rate": 2.4202489470861046e-06, + "loss": 0.7025, + "step": 22336 + }, + { + "epoch": 0.77, + "learning_rate": 2.41953874351428e-06, + "loss": 0.6126, + "step": 22337 + }, + { + "epoch": 0.77, + "learning_rate": 2.418828629818414e-06, + "loss": 0.6221, + "step": 22338 + }, + { + "epoch": 0.77, + "learning_rate": 2.418118606006927e-06, + "loss": 0.6467, + "step": 22339 + }, + { + "epoch": 0.77, + "learning_rate": 2.4174086720882295e-06, + "loss": 0.6538, + "step": 22340 + }, + { + "epoch": 0.77, + "learning_rate": 2.4166988280707472e-06, + "loss": 0.6302, + "step": 22341 + }, + { + "epoch": 0.77, + "learning_rate": 2.4159890739628955e-06, + "loss": 0.6851, + "step": 22342 + }, + { + "epoch": 0.77, + "learning_rate": 2.4152794097730846e-06, + "loss": 0.6259, + "step": 22343 + }, + { + "epoch": 0.77, + "learning_rate": 2.4145698355097314e-06, + "loss": 0.6307, + "step": 22344 + }, + { + "epoch": 0.77, + "learning_rate": 2.413860351181251e-06, + "loss": 0.6742, + "step": 22345 + }, + { + "epoch": 0.77, + "learning_rate": 2.4131509567960467e-06, + "loss": 0.6908, + "step": 22346 + }, + { + "epoch": 0.77, + "learning_rate": 2.4124416523625384e-06, + "loss": 0.6273, + "step": 22347 + }, + { + "epoch": 0.77, + "learning_rate": 2.411732437889135e-06, + "loss": 0.5989, + "step": 22348 + }, + { + "epoch": 0.77, + "learning_rate": 2.4110233133842396e-06, + "loss": 0.7009, + "step": 22349 + }, + { + "epoch": 0.77, + "learning_rate": 2.410314278856264e-06, + "loss": 0.6603, + "step": 22350 + }, + { + "epoch": 0.77, + "learning_rate": 2.409605334313616e-06, + "loss": 0.603, + "step": 22351 + }, + { + "epoch": 0.77, + "learning_rate": 2.408896479764693e-06, + "loss": 0.6201, + "step": 22352 + }, + { + "epoch": 0.77, + "learning_rate": 2.408187715217908e-06, + "loss": 0.6561, + "step": 22353 + }, + { + "epoch": 0.77, + "learning_rate": 2.4074790406816638e-06, + "loss": 0.6748, + "step": 22354 + }, + { + "epoch": 0.77, + "learning_rate": 2.406770456164357e-06, + "loss": 0.6553, + "step": 22355 + }, + { + "epoch": 0.77, + "learning_rate": 2.406061961674393e-06, + "loss": 0.616, + "step": 22356 + }, + { + "epoch": 0.77, + "learning_rate": 2.4053535572201725e-06, + "loss": 0.5571, + "step": 22357 + }, + { + "epoch": 0.77, + "learning_rate": 2.4046452428100873e-06, + "loss": 0.6028, + "step": 22358 + }, + { + "epoch": 0.77, + "learning_rate": 2.4039370184525445e-06, + "loss": 0.6004, + "step": 22359 + }, + { + "epoch": 0.77, + "learning_rate": 2.4032288841559403e-06, + "loss": 0.6854, + "step": 22360 + }, + { + "epoch": 0.77, + "learning_rate": 2.4025208399286647e-06, + "loss": 0.6048, + "step": 22361 + }, + { + "epoch": 0.77, + "learning_rate": 2.401812885779116e-06, + "loss": 0.6576, + "step": 22362 + }, + { + "epoch": 0.77, + "learning_rate": 2.4011050217156883e-06, + "loss": 0.6227, + "step": 22363 + }, + { + "epoch": 0.77, + "learning_rate": 2.4003972477467686e-06, + "loss": 0.6308, + "step": 22364 + }, + { + "epoch": 0.77, + "learning_rate": 2.3996895638807593e-06, + "loss": 0.6012, + "step": 22365 + }, + { + "epoch": 0.77, + "learning_rate": 2.398981970126041e-06, + "loss": 0.5787, + "step": 22366 + }, + { + "epoch": 0.77, + "learning_rate": 2.3982744664910075e-06, + "loss": 0.6156, + "step": 22367 + }, + { + "epoch": 0.77, + "learning_rate": 2.3975670529840478e-06, + "loss": 0.6472, + "step": 22368 + }, + { + "epoch": 0.78, + "learning_rate": 2.3968597296135464e-06, + "loss": 0.6154, + "step": 22369 + }, + { + "epoch": 0.78, + "learning_rate": 2.396152496387888e-06, + "loss": 0.6283, + "step": 22370 + }, + { + "epoch": 0.78, + "learning_rate": 2.395445353315465e-06, + "loss": 0.6232, + "step": 22371 + }, + { + "epoch": 0.78, + "learning_rate": 2.3947383004046566e-06, + "loss": 0.6244, + "step": 22372 + }, + { + "epoch": 0.78, + "learning_rate": 2.3940313376638446e-06, + "loss": 0.6263, + "step": 22373 + }, + { + "epoch": 0.78, + "learning_rate": 2.3933244651014167e-06, + "loss": 0.6374, + "step": 22374 + }, + { + "epoch": 0.78, + "learning_rate": 2.392617682725745e-06, + "loss": 0.5795, + "step": 22375 + }, + { + "epoch": 0.78, + "learning_rate": 2.3919109905452133e-06, + "loss": 0.6385, + "step": 22376 + }, + { + "epoch": 0.78, + "learning_rate": 2.3912043885682057e-06, + "loss": 0.675, + "step": 22377 + }, + { + "epoch": 0.78, + "learning_rate": 2.390497876803093e-06, + "loss": 0.6304, + "step": 22378 + }, + { + "epoch": 0.78, + "learning_rate": 2.3897914552582536e-06, + "loss": 0.6883, + "step": 22379 + }, + { + "epoch": 0.78, + "learning_rate": 2.3890851239420663e-06, + "loss": 0.6248, + "step": 22380 + }, + { + "epoch": 0.78, + "learning_rate": 2.3883788828628997e-06, + "loss": 0.6273, + "step": 22381 + }, + { + "epoch": 0.78, + "learning_rate": 2.3876727320291305e-06, + "loss": 0.6996, + "step": 22382 + }, + { + "epoch": 0.78, + "learning_rate": 2.38696667144913e-06, + "loss": 0.6274, + "step": 22383 + }, + { + "epoch": 0.78, + "learning_rate": 2.386260701131271e-06, + "loss": 0.572, + "step": 22384 + }, + { + "epoch": 0.78, + "learning_rate": 2.385554821083923e-06, + "loss": 0.6289, + "step": 22385 + }, + { + "epoch": 0.78, + "learning_rate": 2.384849031315457e-06, + "loss": 0.6222, + "step": 22386 + }, + { + "epoch": 0.78, + "learning_rate": 2.3841433318342367e-06, + "loss": 0.6211, + "step": 22387 + }, + { + "epoch": 0.78, + "learning_rate": 2.3834377226486317e-06, + "loss": 0.6407, + "step": 22388 + }, + { + "epoch": 0.78, + "learning_rate": 2.3827322037670062e-06, + "loss": 0.6635, + "step": 22389 + }, + { + "epoch": 0.78, + "learning_rate": 2.3820267751977276e-06, + "loss": 0.6431, + "step": 22390 + }, + { + "epoch": 0.78, + "learning_rate": 2.381321436949158e-06, + "loss": 0.6518, + "step": 22391 + }, + { + "epoch": 0.78, + "learning_rate": 2.380616189029663e-06, + "loss": 0.5962, + "step": 22392 + }, + { + "epoch": 0.78, + "learning_rate": 2.3799110314475982e-06, + "loss": 0.6362, + "step": 22393 + }, + { + "epoch": 0.78, + "learning_rate": 2.3792059642113284e-06, + "loss": 0.5733, + "step": 22394 + }, + { + "epoch": 0.78, + "learning_rate": 2.378500987329212e-06, + "loss": 0.6411, + "step": 22395 + }, + { + "epoch": 0.78, + "learning_rate": 2.3777961008096082e-06, + "loss": 0.6832, + "step": 22396 + }, + { + "epoch": 0.78, + "learning_rate": 2.3770913046608736e-06, + "loss": 0.6509, + "step": 22397 + }, + { + "epoch": 0.78, + "learning_rate": 2.376386598891367e-06, + "loss": 0.6189, + "step": 22398 + }, + { + "epoch": 0.78, + "learning_rate": 2.375681983509438e-06, + "loss": 0.6463, + "step": 22399 + }, + { + "epoch": 0.78, + "learning_rate": 2.3749774585234442e-06, + "loss": 0.6563, + "step": 22400 + }, + { + "epoch": 0.78, + "learning_rate": 2.374273023941739e-06, + "loss": 0.6296, + "step": 22401 + }, + { + "epoch": 0.78, + "learning_rate": 2.3735686797726732e-06, + "loss": 0.5617, + "step": 22402 + }, + { + "epoch": 0.78, + "learning_rate": 2.372864426024598e-06, + "loss": 0.6096, + "step": 22403 + }, + { + "epoch": 0.78, + "learning_rate": 2.3721602627058673e-06, + "loss": 0.652, + "step": 22404 + }, + { + "epoch": 0.78, + "learning_rate": 2.371456189824821e-06, + "loss": 0.5452, + "step": 22405 + }, + { + "epoch": 0.78, + "learning_rate": 2.3707522073898137e-06, + "loss": 0.6268, + "step": 22406 + }, + { + "epoch": 0.78, + "learning_rate": 2.370048315409189e-06, + "loss": 0.638, + "step": 22407 + }, + { + "epoch": 0.78, + "learning_rate": 2.369344513891294e-06, + "loss": 0.6758, + "step": 22408 + }, + { + "epoch": 0.78, + "learning_rate": 2.368640802844473e-06, + "loss": 0.6069, + "step": 22409 + }, + { + "epoch": 0.78, + "learning_rate": 2.3679371822770715e-06, + "loss": 0.6568, + "step": 22410 + }, + { + "epoch": 0.78, + "learning_rate": 2.367233652197426e-06, + "loss": 0.6072, + "step": 22411 + }, + { + "epoch": 0.78, + "learning_rate": 2.3665302126138812e-06, + "loss": 0.6825, + "step": 22412 + }, + { + "epoch": 0.78, + "learning_rate": 2.365826863534777e-06, + "loss": 0.6358, + "step": 22413 + }, + { + "epoch": 0.78, + "learning_rate": 2.3651236049684523e-06, + "loss": 0.6349, + "step": 22414 + }, + { + "epoch": 0.78, + "learning_rate": 2.3644204369232458e-06, + "loss": 0.612, + "step": 22415 + }, + { + "epoch": 0.78, + "learning_rate": 2.363717359407498e-06, + "loss": 0.5695, + "step": 22416 + }, + { + "epoch": 0.78, + "learning_rate": 2.363014372429536e-06, + "loss": 0.6345, + "step": 22417 + }, + { + "epoch": 0.78, + "learning_rate": 2.3623114759977015e-06, + "loss": 0.6251, + "step": 22418 + }, + { + "epoch": 0.78, + "learning_rate": 2.3616086701203243e-06, + "loss": 0.607, + "step": 22419 + }, + { + "epoch": 0.78, + "learning_rate": 2.36090595480574e-06, + "loss": 0.654, + "step": 22420 + }, + { + "epoch": 0.78, + "learning_rate": 2.3602033300622797e-06, + "loss": 0.5906, + "step": 22421 + }, + { + "epoch": 0.78, + "learning_rate": 2.359500795898275e-06, + "loss": 0.6065, + "step": 22422 + }, + { + "epoch": 0.78, + "learning_rate": 2.3587983523220514e-06, + "loss": 0.6135, + "step": 22423 + }, + { + "epoch": 0.78, + "learning_rate": 2.3580959993419395e-06, + "loss": 0.6162, + "step": 22424 + }, + { + "epoch": 0.78, + "learning_rate": 2.3573937369662658e-06, + "loss": 0.6257, + "step": 22425 + }, + { + "epoch": 0.78, + "learning_rate": 2.3566915652033582e-06, + "loss": 0.61, + "step": 22426 + }, + { + "epoch": 0.78, + "learning_rate": 2.3559894840615437e-06, + "loss": 0.6567, + "step": 22427 + }, + { + "epoch": 0.78, + "learning_rate": 2.355287493549141e-06, + "loss": 0.6127, + "step": 22428 + }, + { + "epoch": 0.78, + "learning_rate": 2.3545855936744746e-06, + "loss": 0.593, + "step": 22429 + }, + { + "epoch": 0.78, + "learning_rate": 2.3538837844458685e-06, + "loss": 0.6475, + "step": 22430 + }, + { + "epoch": 0.78, + "learning_rate": 2.353182065871642e-06, + "loss": 0.6336, + "step": 22431 + }, + { + "epoch": 0.78, + "learning_rate": 2.3524804379601152e-06, + "loss": 0.6114, + "step": 22432 + }, + { + "epoch": 0.78, + "learning_rate": 2.35177890071961e-06, + "loss": 0.6693, + "step": 22433 + }, + { + "epoch": 0.78, + "learning_rate": 2.351077454158438e-06, + "loss": 0.6743, + "step": 22434 + }, + { + "epoch": 0.78, + "learning_rate": 2.350376098284919e-06, + "loss": 0.5762, + "step": 22435 + }, + { + "epoch": 0.78, + "learning_rate": 2.3496748331073684e-06, + "loss": 0.6325, + "step": 22436 + }, + { + "epoch": 0.78, + "learning_rate": 2.3489736586341005e-06, + "loss": 0.6144, + "step": 22437 + }, + { + "epoch": 0.78, + "learning_rate": 2.348272574873428e-06, + "loss": 0.6393, + "step": 22438 + }, + { + "epoch": 0.78, + "learning_rate": 2.3475715818336663e-06, + "loss": 0.6093, + "step": 22439 + }, + { + "epoch": 0.78, + "learning_rate": 2.346870679523121e-06, + "loss": 0.6372, + "step": 22440 + }, + { + "epoch": 0.78, + "learning_rate": 2.3461698679501056e-06, + "loss": 0.6523, + "step": 22441 + }, + { + "epoch": 0.78, + "learning_rate": 2.3454691471229284e-06, + "loss": 0.6266, + "step": 22442 + }, + { + "epoch": 0.78, + "learning_rate": 2.344768517049897e-06, + "loss": 0.5784, + "step": 22443 + }, + { + "epoch": 0.78, + "learning_rate": 2.3440679777393195e-06, + "loss": 0.5868, + "step": 22444 + }, + { + "epoch": 0.78, + "learning_rate": 2.3433675291995027e-06, + "loss": 0.6074, + "step": 22445 + }, + { + "epoch": 0.78, + "learning_rate": 2.3426671714387483e-06, + "loss": 0.5582, + "step": 22446 + }, + { + "epoch": 0.78, + "learning_rate": 2.3419669044653603e-06, + "loss": 0.6158, + "step": 22447 + }, + { + "epoch": 0.78, + "learning_rate": 2.341266728287642e-06, + "loss": 0.5925, + "step": 22448 + }, + { + "epoch": 0.78, + "learning_rate": 2.340566642913895e-06, + "loss": 0.628, + "step": 22449 + }, + { + "epoch": 0.78, + "learning_rate": 2.339866648352419e-06, + "loss": 0.6457, + "step": 22450 + }, + { + "epoch": 0.78, + "learning_rate": 2.3391667446115184e-06, + "loss": 0.6062, + "step": 22451 + }, + { + "epoch": 0.78, + "learning_rate": 2.3384669316994833e-06, + "loss": 0.645, + "step": 22452 + }, + { + "epoch": 0.78, + "learning_rate": 2.337767209624614e-06, + "loss": 0.6468, + "step": 22453 + }, + { + "epoch": 0.78, + "learning_rate": 2.3370675783952077e-06, + "loss": 0.5891, + "step": 22454 + }, + { + "epoch": 0.78, + "learning_rate": 2.3363680380195598e-06, + "loss": 0.6462, + "step": 22455 + }, + { + "epoch": 0.78, + "learning_rate": 2.3356685885059628e-06, + "loss": 0.5555, + "step": 22456 + }, + { + "epoch": 0.78, + "learning_rate": 2.3349692298627125e-06, + "loss": 0.6577, + "step": 22457 + }, + { + "epoch": 0.78, + "learning_rate": 2.3342699620980957e-06, + "loss": 0.6191, + "step": 22458 + }, + { + "epoch": 0.78, + "learning_rate": 2.333570785220406e-06, + "loss": 0.658, + "step": 22459 + }, + { + "epoch": 0.78, + "learning_rate": 2.332871699237932e-06, + "loss": 0.6249, + "step": 22460 + }, + { + "epoch": 0.78, + "learning_rate": 2.3321727041589635e-06, + "loss": 0.6534, + "step": 22461 + }, + { + "epoch": 0.78, + "learning_rate": 2.331473799991788e-06, + "loss": 0.6746, + "step": 22462 + }, + { + "epoch": 0.78, + "learning_rate": 2.3307749867446926e-06, + "loss": 0.6586, + "step": 22463 + }, + { + "epoch": 0.78, + "learning_rate": 2.33007626442596e-06, + "loss": 0.5821, + "step": 22464 + }, + { + "epoch": 0.78, + "learning_rate": 2.3293776330438756e-06, + "loss": 0.6648, + "step": 22465 + }, + { + "epoch": 0.78, + "learning_rate": 2.3286790926067227e-06, + "loss": 0.632, + "step": 22466 + }, + { + "epoch": 0.78, + "learning_rate": 2.3279806431227827e-06, + "loss": 0.6245, + "step": 22467 + }, + { + "epoch": 0.78, + "learning_rate": 2.3272822846003374e-06, + "loss": 0.6457, + "step": 22468 + }, + { + "epoch": 0.78, + "learning_rate": 2.3265840170476704e-06, + "loss": 0.6222, + "step": 22469 + }, + { + "epoch": 0.78, + "learning_rate": 2.3258858404730534e-06, + "loss": 0.5989, + "step": 22470 + }, + { + "epoch": 0.78, + "learning_rate": 2.325187754884768e-06, + "loss": 0.5593, + "step": 22471 + }, + { + "epoch": 0.78, + "learning_rate": 2.3244897602910897e-06, + "loss": 0.6476, + "step": 22472 + }, + { + "epoch": 0.78, + "learning_rate": 2.323791856700295e-06, + "loss": 0.6536, + "step": 22473 + }, + { + "epoch": 0.78, + "learning_rate": 2.3230940441206584e-06, + "loss": 0.6759, + "step": 22474 + }, + { + "epoch": 0.78, + "learning_rate": 2.3223963225604563e-06, + "loss": 0.5975, + "step": 22475 + }, + { + "epoch": 0.78, + "learning_rate": 2.321698692027955e-06, + "loss": 0.6242, + "step": 22476 + }, + { + "epoch": 0.78, + "learning_rate": 2.321001152531429e-06, + "loss": 0.6408, + "step": 22477 + }, + { + "epoch": 0.78, + "learning_rate": 2.320303704079149e-06, + "loss": 0.6443, + "step": 22478 + }, + { + "epoch": 0.78, + "learning_rate": 2.3196063466793816e-06, + "loss": 0.636, + "step": 22479 + }, + { + "epoch": 0.78, + "learning_rate": 2.318909080340398e-06, + "loss": 0.648, + "step": 22480 + }, + { + "epoch": 0.78, + "learning_rate": 2.3182119050704668e-06, + "loss": 0.6003, + "step": 22481 + }, + { + "epoch": 0.78, + "learning_rate": 2.3175148208778474e-06, + "loss": 0.7212, + "step": 22482 + }, + { + "epoch": 0.78, + "learning_rate": 2.316817827770809e-06, + "loss": 0.6538, + "step": 22483 + }, + { + "epoch": 0.78, + "learning_rate": 2.3161209257576144e-06, + "loss": 0.684, + "step": 22484 + }, + { + "epoch": 0.78, + "learning_rate": 2.3154241148465263e-06, + "loss": 0.6591, + "step": 22485 + }, + { + "epoch": 0.78, + "learning_rate": 2.314727395045806e-06, + "loss": 0.6415, + "step": 22486 + }, + { + "epoch": 0.78, + "learning_rate": 2.3140307663637174e-06, + "loss": 0.6532, + "step": 22487 + }, + { + "epoch": 0.78, + "learning_rate": 2.3133342288085137e-06, + "loss": 0.6243, + "step": 22488 + }, + { + "epoch": 0.78, + "learning_rate": 2.312637782388457e-06, + "loss": 0.576, + "step": 22489 + }, + { + "epoch": 0.78, + "learning_rate": 2.3119414271118036e-06, + "loss": 0.6497, + "step": 22490 + }, + { + "epoch": 0.78, + "learning_rate": 2.311245162986809e-06, + "loss": 0.5992, + "step": 22491 + }, + { + "epoch": 0.78, + "learning_rate": 2.310548990021734e-06, + "loss": 0.6062, + "step": 22492 + }, + { + "epoch": 0.78, + "learning_rate": 2.3098529082248245e-06, + "loss": 0.6407, + "step": 22493 + }, + { + "epoch": 0.78, + "learning_rate": 2.309156917604337e-06, + "loss": 0.6226, + "step": 22494 + }, + { + "epoch": 0.78, + "learning_rate": 2.308461018168523e-06, + "loss": 0.6227, + "step": 22495 + }, + { + "epoch": 0.78, + "learning_rate": 2.307765209925633e-06, + "loss": 0.6521, + "step": 22496 + }, + { + "epoch": 0.78, + "learning_rate": 2.3070694928839176e-06, + "loss": 0.587, + "step": 22497 + }, + { + "epoch": 0.78, + "learning_rate": 2.3063738670516277e-06, + "loss": 0.6371, + "step": 22498 + }, + { + "epoch": 0.78, + "learning_rate": 2.3056783324370046e-06, + "loss": 0.6442, + "step": 22499 + }, + { + "epoch": 0.78, + "learning_rate": 2.3049828890482995e-06, + "loss": 0.5823, + "step": 22500 + }, + { + "epoch": 0.78, + "learning_rate": 2.3042875368937555e-06, + "loss": 0.6145, + "step": 22501 + }, + { + "epoch": 0.78, + "learning_rate": 2.3035922759816187e-06, + "loss": 0.6072, + "step": 22502 + }, + { + "epoch": 0.78, + "learning_rate": 2.302897106320131e-06, + "loss": 0.5834, + "step": 22503 + }, + { + "epoch": 0.78, + "learning_rate": 2.3022020279175383e-06, + "loss": 0.6202, + "step": 22504 + }, + { + "epoch": 0.78, + "learning_rate": 2.301507040782075e-06, + "loss": 0.6522, + "step": 22505 + }, + { + "epoch": 0.78, + "learning_rate": 2.3008121449219844e-06, + "loss": 0.5962, + "step": 22506 + }, + { + "epoch": 0.78, + "learning_rate": 2.3001173403455056e-06, + "loss": 0.6297, + "step": 22507 + }, + { + "epoch": 0.78, + "learning_rate": 2.2994226270608754e-06, + "loss": 0.6817, + "step": 22508 + }, + { + "epoch": 0.78, + "learning_rate": 2.2987280050763316e-06, + "loss": 0.7229, + "step": 22509 + }, + { + "epoch": 0.78, + "learning_rate": 2.2980334744001133e-06, + "loss": 0.6711, + "step": 22510 + }, + { + "epoch": 0.78, + "learning_rate": 2.2973390350404478e-06, + "loss": 0.587, + "step": 22511 + }, + { + "epoch": 0.78, + "learning_rate": 2.2966446870055715e-06, + "loss": 0.6188, + "step": 22512 + }, + { + "epoch": 0.78, + "learning_rate": 2.2959504303037173e-06, + "loss": 0.6581, + "step": 22513 + }, + { + "epoch": 0.78, + "learning_rate": 2.2952562649431166e-06, + "loss": 0.6139, + "step": 22514 + }, + { + "epoch": 0.78, + "learning_rate": 2.294562190931999e-06, + "loss": 0.6282, + "step": 22515 + }, + { + "epoch": 0.78, + "learning_rate": 2.293868208278598e-06, + "loss": 0.5986, + "step": 22516 + }, + { + "epoch": 0.78, + "learning_rate": 2.2931743169911335e-06, + "loss": 0.687, + "step": 22517 + }, + { + "epoch": 0.78, + "learning_rate": 2.2924805170778373e-06, + "loss": 0.6397, + "step": 22518 + }, + { + "epoch": 0.78, + "learning_rate": 2.2917868085469353e-06, + "loss": 0.6429, + "step": 22519 + }, + { + "epoch": 0.78, + "learning_rate": 2.2910931914066503e-06, + "loss": 0.6192, + "step": 22520 + }, + { + "epoch": 0.78, + "learning_rate": 2.2903996656652085e-06, + "loss": 0.6711, + "step": 22521 + }, + { + "epoch": 0.78, + "learning_rate": 2.289706231330834e-06, + "loss": 0.6325, + "step": 22522 + }, + { + "epoch": 0.78, + "learning_rate": 2.2890128884117425e-06, + "loss": 0.5834, + "step": 22523 + }, + { + "epoch": 0.78, + "learning_rate": 2.2883196369161574e-06, + "loss": 0.6378, + "step": 22524 + }, + { + "epoch": 0.78, + "learning_rate": 2.2876264768522983e-06, + "loss": 0.6052, + "step": 22525 + }, + { + "epoch": 0.78, + "learning_rate": 2.2869334082283844e-06, + "loss": 0.6298, + "step": 22526 + }, + { + "epoch": 0.78, + "learning_rate": 2.286240431052631e-06, + "loss": 0.6659, + "step": 22527 + }, + { + "epoch": 0.78, + "learning_rate": 2.2855475453332587e-06, + "loss": 0.6657, + "step": 22528 + }, + { + "epoch": 0.78, + "learning_rate": 2.2848547510784757e-06, + "loss": 0.607, + "step": 22529 + }, + { + "epoch": 0.78, + "learning_rate": 2.2841620482964997e-06, + "loss": 0.6376, + "step": 22530 + }, + { + "epoch": 0.78, + "learning_rate": 2.2834694369955436e-06, + "loss": 0.6043, + "step": 22531 + }, + { + "epoch": 0.78, + "learning_rate": 2.282776917183819e-06, + "loss": 0.5894, + "step": 22532 + }, + { + "epoch": 0.78, + "learning_rate": 2.282084488869536e-06, + "loss": 0.6428, + "step": 22533 + }, + { + "epoch": 0.78, + "learning_rate": 2.281392152060906e-06, + "loss": 0.6959, + "step": 22534 + }, + { + "epoch": 0.78, + "learning_rate": 2.280699906766135e-06, + "loss": 0.6152, + "step": 22535 + }, + { + "epoch": 0.78, + "learning_rate": 2.2800077529934315e-06, + "loss": 0.6421, + "step": 22536 + }, + { + "epoch": 0.78, + "learning_rate": 2.2793156907510017e-06, + "loss": 0.6081, + "step": 22537 + }, + { + "epoch": 0.78, + "learning_rate": 2.2786237200470507e-06, + "loss": 0.6493, + "step": 22538 + }, + { + "epoch": 0.78, + "learning_rate": 2.2779318408897833e-06, + "loss": 0.6287, + "step": 22539 + }, + { + "epoch": 0.78, + "learning_rate": 2.277240053287405e-06, + "loss": 0.6239, + "step": 22540 + }, + { + "epoch": 0.78, + "learning_rate": 2.276548357248113e-06, + "loss": 0.6134, + "step": 22541 + }, + { + "epoch": 0.78, + "learning_rate": 2.27585675278011e-06, + "loss": 0.6476, + "step": 22542 + }, + { + "epoch": 0.78, + "learning_rate": 2.2751652398915967e-06, + "loss": 0.655, + "step": 22543 + }, + { + "epoch": 0.78, + "learning_rate": 2.2744738185907713e-06, + "loss": 0.6126, + "step": 22544 + }, + { + "epoch": 0.78, + "learning_rate": 2.2737824888858306e-06, + "loss": 0.6313, + "step": 22545 + }, + { + "epoch": 0.78, + "learning_rate": 2.273091250784977e-06, + "loss": 0.597, + "step": 22546 + }, + { + "epoch": 0.78, + "learning_rate": 2.2724001042963963e-06, + "loss": 0.6802, + "step": 22547 + }, + { + "epoch": 0.78, + "learning_rate": 2.271709049428289e-06, + "loss": 0.705, + "step": 22548 + }, + { + "epoch": 0.78, + "learning_rate": 2.2710180861888474e-06, + "loss": 0.6118, + "step": 22549 + }, + { + "epoch": 0.78, + "learning_rate": 2.270327214586263e-06, + "loss": 0.6575, + "step": 22550 + }, + { + "epoch": 0.78, + "learning_rate": 2.26963643462873e-06, + "loss": 0.6835, + "step": 22551 + }, + { + "epoch": 0.78, + "learning_rate": 2.2689457463244345e-06, + "loss": 0.6816, + "step": 22552 + }, + { + "epoch": 0.78, + "learning_rate": 2.2682551496815665e-06, + "loss": 0.6278, + "step": 22553 + }, + { + "epoch": 0.78, + "learning_rate": 2.2675646447083167e-06, + "loss": 0.6936, + "step": 22554 + }, + { + "epoch": 0.78, + "learning_rate": 2.2668742314128643e-06, + "loss": 0.584, + "step": 22555 + }, + { + "epoch": 0.78, + "learning_rate": 2.266183909803403e-06, + "loss": 0.6392, + "step": 22556 + }, + { + "epoch": 0.78, + "learning_rate": 2.265493679888119e-06, + "loss": 0.5689, + "step": 22557 + }, + { + "epoch": 0.78, + "learning_rate": 2.264803541675187e-06, + "loss": 0.6504, + "step": 22558 + }, + { + "epoch": 0.78, + "learning_rate": 2.264113495172795e-06, + "loss": 0.6666, + "step": 22559 + }, + { + "epoch": 0.78, + "learning_rate": 2.2634235403891257e-06, + "loss": 0.6438, + "step": 22560 + }, + { + "epoch": 0.78, + "learning_rate": 2.2627336773323516e-06, + "loss": 0.6613, + "step": 22561 + }, + { + "epoch": 0.78, + "learning_rate": 2.2620439060106603e-06, + "loss": 0.6536, + "step": 22562 + }, + { + "epoch": 0.78, + "learning_rate": 2.261354226432231e-06, + "loss": 0.6182, + "step": 22563 + }, + { + "epoch": 0.78, + "learning_rate": 2.260664638605232e-06, + "loss": 0.6457, + "step": 22564 + }, + { + "epoch": 0.78, + "learning_rate": 2.259975142537846e-06, + "loss": 0.6452, + "step": 22565 + }, + { + "epoch": 0.78, + "learning_rate": 2.2592857382382473e-06, + "loss": 0.6331, + "step": 22566 + }, + { + "epoch": 0.78, + "learning_rate": 2.258596425714603e-06, + "loss": 0.6607, + "step": 22567 + }, + { + "epoch": 0.78, + "learning_rate": 2.257907204975094e-06, + "loss": 0.7404, + "step": 22568 + }, + { + "epoch": 0.78, + "learning_rate": 2.2572180760278916e-06, + "loss": 0.6321, + "step": 22569 + }, + { + "epoch": 0.78, + "learning_rate": 2.25652903888116e-06, + "loss": 0.6047, + "step": 22570 + }, + { + "epoch": 0.78, + "learning_rate": 2.2558400935430736e-06, + "loss": 0.6838, + "step": 22571 + }, + { + "epoch": 0.78, + "learning_rate": 2.255151240021801e-06, + "loss": 0.6155, + "step": 22572 + }, + { + "epoch": 0.78, + "learning_rate": 2.254462478325503e-06, + "loss": 0.6528, + "step": 22573 + }, + { + "epoch": 0.78, + "learning_rate": 2.2537738084623527e-06, + "loss": 0.6948, + "step": 22574 + }, + { + "epoch": 0.78, + "learning_rate": 2.253085230440516e-06, + "loss": 0.6611, + "step": 22575 + }, + { + "epoch": 0.78, + "learning_rate": 2.2523967442681506e-06, + "loss": 0.6374, + "step": 22576 + }, + { + "epoch": 0.78, + "learning_rate": 2.2517083499534233e-06, + "loss": 0.6336, + "step": 22577 + }, + { + "epoch": 0.78, + "learning_rate": 2.2510200475044963e-06, + "loss": 0.6053, + "step": 22578 + }, + { + "epoch": 0.78, + "learning_rate": 2.2503318369295278e-06, + "loss": 0.625, + "step": 22579 + }, + { + "epoch": 0.78, + "learning_rate": 2.249643718236676e-06, + "loss": 0.7078, + "step": 22580 + }, + { + "epoch": 0.78, + "learning_rate": 2.2489556914341072e-06, + "loss": 0.614, + "step": 22581 + }, + { + "epoch": 0.78, + "learning_rate": 2.2482677565299716e-06, + "loss": 0.6443, + "step": 22582 + }, + { + "epoch": 0.78, + "learning_rate": 2.2475799135324273e-06, + "loss": 0.6397, + "step": 22583 + }, + { + "epoch": 0.78, + "learning_rate": 2.246892162449632e-06, + "loss": 0.6497, + "step": 22584 + }, + { + "epoch": 0.78, + "learning_rate": 2.246204503289736e-06, + "loss": 0.6804, + "step": 22585 + }, + { + "epoch": 0.78, + "learning_rate": 2.245516936060892e-06, + "loss": 0.6067, + "step": 22586 + }, + { + "epoch": 0.78, + "learning_rate": 2.2448294607712585e-06, + "loss": 0.6211, + "step": 22587 + }, + { + "epoch": 0.78, + "learning_rate": 2.24414207742898e-06, + "loss": 0.6293, + "step": 22588 + }, + { + "epoch": 0.78, + "learning_rate": 2.2434547860422084e-06, + "loss": 0.6256, + "step": 22589 + }, + { + "epoch": 0.78, + "learning_rate": 2.2427675866190946e-06, + "loss": 0.6517, + "step": 22590 + }, + { + "epoch": 0.78, + "learning_rate": 2.242080479167782e-06, + "loss": 0.654, + "step": 22591 + }, + { + "epoch": 0.78, + "learning_rate": 2.2413934636964165e-06, + "loss": 0.685, + "step": 22592 + }, + { + "epoch": 0.78, + "learning_rate": 2.240706540213151e-06, + "loss": 0.5988, + "step": 22593 + }, + { + "epoch": 0.78, + "learning_rate": 2.240019708726122e-06, + "loss": 0.6056, + "step": 22594 + }, + { + "epoch": 0.78, + "learning_rate": 2.239332969243476e-06, + "loss": 0.6398, + "step": 22595 + }, + { + "epoch": 0.78, + "learning_rate": 2.238646321773359e-06, + "loss": 0.6426, + "step": 22596 + }, + { + "epoch": 0.78, + "learning_rate": 2.237959766323904e-06, + "loss": 0.6782, + "step": 22597 + }, + { + "epoch": 0.78, + "learning_rate": 2.2372733029032523e-06, + "loss": 0.575, + "step": 22598 + }, + { + "epoch": 0.78, + "learning_rate": 2.236586931519551e-06, + "loss": 0.5739, + "step": 22599 + }, + { + "epoch": 0.78, + "learning_rate": 2.23590065218093e-06, + "loss": 0.6329, + "step": 22600 + }, + { + "epoch": 0.78, + "learning_rate": 2.2352144648955287e-06, + "loss": 0.609, + "step": 22601 + }, + { + "epoch": 0.78, + "learning_rate": 2.2345283696714848e-06, + "loss": 0.5652, + "step": 22602 + }, + { + "epoch": 0.78, + "learning_rate": 2.233842366516927e-06, + "loss": 0.611, + "step": 22603 + }, + { + "epoch": 0.78, + "learning_rate": 2.2331564554399898e-06, + "loss": 0.6182, + "step": 22604 + }, + { + "epoch": 0.78, + "learning_rate": 2.232470636448815e-06, + "loss": 0.6632, + "step": 22605 + }, + { + "epoch": 0.78, + "learning_rate": 2.231784909551522e-06, + "loss": 0.6998, + "step": 22606 + }, + { + "epoch": 0.78, + "learning_rate": 2.2310992747562465e-06, + "loss": 0.6402, + "step": 22607 + }, + { + "epoch": 0.78, + "learning_rate": 2.2304137320711195e-06, + "loss": 0.6258, + "step": 22608 + }, + { + "epoch": 0.78, + "learning_rate": 2.2297282815042633e-06, + "loss": 0.6514, + "step": 22609 + }, + { + "epoch": 0.78, + "learning_rate": 2.2290429230638054e-06, + "loss": 0.6276, + "step": 22610 + }, + { + "epoch": 0.78, + "learning_rate": 2.228357656757879e-06, + "loss": 0.6052, + "step": 22611 + }, + { + "epoch": 0.78, + "learning_rate": 2.2276724825946017e-06, + "loss": 0.5977, + "step": 22612 + }, + { + "epoch": 0.78, + "learning_rate": 2.2269874005821014e-06, + "loss": 0.7034, + "step": 22613 + }, + { + "epoch": 0.78, + "learning_rate": 2.226302410728496e-06, + "loss": 0.621, + "step": 22614 + }, + { + "epoch": 0.78, + "learning_rate": 2.225617513041909e-06, + "loss": 0.5987, + "step": 22615 + }, + { + "epoch": 0.78, + "learning_rate": 2.224932707530462e-06, + "loss": 0.6061, + "step": 22616 + }, + { + "epoch": 0.78, + "learning_rate": 2.224247994202271e-06, + "loss": 0.616, + "step": 22617 + }, + { + "epoch": 0.78, + "learning_rate": 2.223563373065458e-06, + "loss": 0.687, + "step": 22618 + }, + { + "epoch": 0.78, + "learning_rate": 2.222878844128141e-06, + "loss": 0.5905, + "step": 22619 + }, + { + "epoch": 0.78, + "learning_rate": 2.2221944073984314e-06, + "loss": 0.6527, + "step": 22620 + }, + { + "epoch": 0.78, + "learning_rate": 2.2215100628844444e-06, + "loss": 0.6454, + "step": 22621 + }, + { + "epoch": 0.78, + "learning_rate": 2.220825810594297e-06, + "loss": 0.609, + "step": 22622 + }, + { + "epoch": 0.78, + "learning_rate": 2.2201416505360997e-06, + "loss": 0.6123, + "step": 22623 + }, + { + "epoch": 0.78, + "learning_rate": 2.2194575827179644e-06, + "loss": 0.6124, + "step": 22624 + }, + { + "epoch": 0.78, + "learning_rate": 2.218773607148005e-06, + "loss": 0.6449, + "step": 22625 + }, + { + "epoch": 0.78, + "learning_rate": 2.2180897238343246e-06, + "loss": 0.6915, + "step": 22626 + }, + { + "epoch": 0.78, + "learning_rate": 2.217405932785035e-06, + "loss": 0.6489, + "step": 22627 + }, + { + "epoch": 0.78, + "learning_rate": 2.216722234008244e-06, + "loss": 0.6508, + "step": 22628 + }, + { + "epoch": 0.78, + "learning_rate": 2.216038627512056e-06, + "loss": 0.6091, + "step": 22629 + }, + { + "epoch": 0.78, + "learning_rate": 2.215355113304577e-06, + "loss": 0.6623, + "step": 22630 + }, + { + "epoch": 0.78, + "learning_rate": 2.2146716913939127e-06, + "loss": 0.6099, + "step": 22631 + }, + { + "epoch": 0.78, + "learning_rate": 2.213988361788162e-06, + "loss": 0.6752, + "step": 22632 + }, + { + "epoch": 0.78, + "learning_rate": 2.2133051244954283e-06, + "loss": 0.6299, + "step": 22633 + }, + { + "epoch": 0.78, + "learning_rate": 2.2126219795238124e-06, + "loss": 0.6383, + "step": 22634 + }, + { + "epoch": 0.78, + "learning_rate": 2.211938926881415e-06, + "loss": 0.6089, + "step": 22635 + }, + { + "epoch": 0.78, + "learning_rate": 2.2112559665763323e-06, + "loss": 0.601, + "step": 22636 + }, + { + "epoch": 0.78, + "learning_rate": 2.210573098616667e-06, + "loss": 0.5806, + "step": 22637 + }, + { + "epoch": 0.78, + "learning_rate": 2.2098903230105074e-06, + "loss": 0.6341, + "step": 22638 + }, + { + "epoch": 0.78, + "learning_rate": 2.2092076397659535e-06, + "loss": 0.6058, + "step": 22639 + }, + { + "epoch": 0.78, + "learning_rate": 2.208525048891098e-06, + "loss": 0.6502, + "step": 22640 + }, + { + "epoch": 0.78, + "learning_rate": 2.2078425503940336e-06, + "loss": 0.6532, + "step": 22641 + }, + { + "epoch": 0.78, + "learning_rate": 2.207160144282854e-06, + "loss": 0.5841, + "step": 22642 + }, + { + "epoch": 0.78, + "learning_rate": 2.206477830565651e-06, + "loss": 0.6247, + "step": 22643 + }, + { + "epoch": 0.78, + "learning_rate": 2.2057956092505093e-06, + "loss": 0.6345, + "step": 22644 + }, + { + "epoch": 0.78, + "learning_rate": 2.205113480345521e-06, + "loss": 0.6477, + "step": 22645 + }, + { + "epoch": 0.78, + "learning_rate": 2.204431443858773e-06, + "loss": 0.6788, + "step": 22646 + }, + { + "epoch": 0.78, + "learning_rate": 2.2037494997983513e-06, + "loss": 0.6226, + "step": 22647 + }, + { + "epoch": 0.78, + "learning_rate": 2.2030676481723412e-06, + "loss": 0.5995, + "step": 22648 + }, + { + "epoch": 0.78, + "learning_rate": 2.2023858889888304e-06, + "loss": 0.6179, + "step": 22649 + }, + { + "epoch": 0.78, + "learning_rate": 2.201704222255897e-06, + "loss": 0.6146, + "step": 22650 + }, + { + "epoch": 0.78, + "learning_rate": 2.2010226479816242e-06, + "loss": 0.6702, + "step": 22651 + }, + { + "epoch": 0.78, + "learning_rate": 2.2003411661740936e-06, + "loss": 0.6301, + "step": 22652 + }, + { + "epoch": 0.78, + "learning_rate": 2.199659776841385e-06, + "loss": 0.6484, + "step": 22653 + }, + { + "epoch": 0.78, + "learning_rate": 2.198978479991577e-06, + "loss": 0.6922, + "step": 22654 + }, + { + "epoch": 0.78, + "learning_rate": 2.1982972756327516e-06, + "loss": 0.5962, + "step": 22655 + }, + { + "epoch": 0.78, + "learning_rate": 2.1976161637729767e-06, + "loss": 0.6359, + "step": 22656 + }, + { + "epoch": 0.79, + "learning_rate": 2.1969351444203334e-06, + "loss": 0.5991, + "step": 22657 + }, + { + "epoch": 0.79, + "learning_rate": 2.1962542175828937e-06, + "loss": 0.6816, + "step": 22658 + }, + { + "epoch": 0.79, + "learning_rate": 2.195573383268733e-06, + "loss": 0.6069, + "step": 22659 + }, + { + "epoch": 0.79, + "learning_rate": 2.1948926414859227e-06, + "loss": 0.6434, + "step": 22660 + }, + { + "epoch": 0.79, + "learning_rate": 2.1942119922425364e-06, + "loss": 0.6488, + "step": 22661 + }, + { + "epoch": 0.79, + "learning_rate": 2.1935314355466374e-06, + "loss": 0.6817, + "step": 22662 + }, + { + "epoch": 0.79, + "learning_rate": 2.1928509714062996e-06, + "loss": 0.614, + "step": 22663 + }, + { + "epoch": 0.79, + "learning_rate": 2.1921705998295893e-06, + "loss": 0.654, + "step": 22664 + }, + { + "epoch": 0.79, + "learning_rate": 2.191490320824573e-06, + "loss": 0.6447, + "step": 22665 + }, + { + "epoch": 0.79, + "learning_rate": 2.190810134399317e-06, + "loss": 0.634, + "step": 22666 + }, + { + "epoch": 0.79, + "learning_rate": 2.1901300405618888e-06, + "loss": 0.6273, + "step": 22667 + }, + { + "epoch": 0.79, + "learning_rate": 2.1894500393203454e-06, + "loss": 0.6286, + "step": 22668 + }, + { + "epoch": 0.79, + "learning_rate": 2.1887701306827526e-06, + "loss": 0.5944, + "step": 22669 + }, + { + "epoch": 0.79, + "learning_rate": 2.188090314657171e-06, + "loss": 0.6329, + "step": 22670 + }, + { + "epoch": 0.79, + "learning_rate": 2.1874105912516607e-06, + "loss": 0.6834, + "step": 22671 + }, + { + "epoch": 0.79, + "learning_rate": 2.1867309604742803e-06, + "loss": 0.6821, + "step": 22672 + }, + { + "epoch": 0.79, + "learning_rate": 2.1860514223330918e-06, + "loss": 0.6593, + "step": 22673 + }, + { + "epoch": 0.79, + "learning_rate": 2.1853719768361446e-06, + "loss": 0.6111, + "step": 22674 + }, + { + "epoch": 0.79, + "learning_rate": 2.184692623991499e-06, + "loss": 0.5988, + "step": 22675 + }, + { + "epoch": 0.79, + "learning_rate": 2.1840133638072093e-06, + "loss": 0.6024, + "step": 22676 + }, + { + "epoch": 0.79, + "learning_rate": 2.1833341962913267e-06, + "loss": 0.6528, + "step": 22677 + }, + { + "epoch": 0.79, + "learning_rate": 2.18265512145191e-06, + "loss": 0.6638, + "step": 22678 + }, + { + "epoch": 0.79, + "learning_rate": 2.181976139297002e-06, + "loss": 0.6761, + "step": 22679 + }, + { + "epoch": 0.79, + "learning_rate": 2.1812972498346564e-06, + "loss": 0.6201, + "step": 22680 + }, + { + "epoch": 0.79, + "learning_rate": 2.1806184530729234e-06, + "loss": 0.6363, + "step": 22681 + }, + { + "epoch": 0.79, + "learning_rate": 2.1799397490198504e-06, + "loss": 0.6245, + "step": 22682 + }, + { + "epoch": 0.79, + "learning_rate": 2.179261137683484e-06, + "loss": 0.6064, + "step": 22683 + }, + { + "epoch": 0.79, + "learning_rate": 2.178582619071872e-06, + "loss": 0.7355, + "step": 22684 + }, + { + "epoch": 0.79, + "learning_rate": 2.1779041931930543e-06, + "loss": 0.6671, + "step": 22685 + }, + { + "epoch": 0.79, + "learning_rate": 2.177225860055079e-06, + "loss": 0.6663, + "step": 22686 + }, + { + "epoch": 0.79, + "learning_rate": 2.176547619665985e-06, + "loss": 0.6081, + "step": 22687 + }, + { + "epoch": 0.79, + "learning_rate": 2.175869472033817e-06, + "loss": 0.6592, + "step": 22688 + }, + { + "epoch": 0.79, + "learning_rate": 2.175191417166613e-06, + "loss": 0.6247, + "step": 22689 + }, + { + "epoch": 0.79, + "learning_rate": 2.174513455072418e-06, + "loss": 0.6646, + "step": 22690 + }, + { + "epoch": 0.79, + "learning_rate": 2.173835585759261e-06, + "loss": 0.6278, + "step": 22691 + }, + { + "epoch": 0.79, + "learning_rate": 2.1731578092351825e-06, + "loss": 0.6446, + "step": 22692 + }, + { + "epoch": 0.79, + "learning_rate": 2.1724801255082208e-06, + "loss": 0.6505, + "step": 22693 + }, + { + "epoch": 0.79, + "learning_rate": 2.171802534586408e-06, + "loss": 0.6567, + "step": 22694 + }, + { + "epoch": 0.79, + "learning_rate": 2.171125036477779e-06, + "loss": 0.6592, + "step": 22695 + }, + { + "epoch": 0.79, + "learning_rate": 2.17044763119037e-06, + "loss": 0.6374, + "step": 22696 + }, + { + "epoch": 0.79, + "learning_rate": 2.169770318732205e-06, + "loss": 0.5711, + "step": 22697 + }, + { + "epoch": 0.79, + "learning_rate": 2.169093099111318e-06, + "loss": 0.5988, + "step": 22698 + }, + { + "epoch": 0.79, + "learning_rate": 2.168415972335739e-06, + "loss": 0.6257, + "step": 22699 + }, + { + "epoch": 0.79, + "learning_rate": 2.167738938413496e-06, + "loss": 0.639, + "step": 22700 + }, + { + "epoch": 0.79, + "learning_rate": 2.1670619973526152e-06, + "loss": 0.5605, + "step": 22701 + }, + { + "epoch": 0.79, + "learning_rate": 2.1663851491611255e-06, + "loss": 0.641, + "step": 22702 + }, + { + "epoch": 0.79, + "learning_rate": 2.165708393847048e-06, + "loss": 0.5762, + "step": 22703 + }, + { + "epoch": 0.79, + "learning_rate": 2.1650317314184068e-06, + "loss": 0.6266, + "step": 22704 + }, + { + "epoch": 0.79, + "learning_rate": 2.164355161883226e-06, + "loss": 0.6883, + "step": 22705 + }, + { + "epoch": 0.79, + "learning_rate": 2.1636786852495272e-06, + "loss": 0.6257, + "step": 22706 + }, + { + "epoch": 0.79, + "learning_rate": 2.16300230152533e-06, + "loss": 0.6226, + "step": 22707 + }, + { + "epoch": 0.79, + "learning_rate": 2.162326010718657e-06, + "loss": 0.643, + "step": 22708 + }, + { + "epoch": 0.79, + "learning_rate": 2.1616498128375217e-06, + "loss": 0.5938, + "step": 22709 + }, + { + "epoch": 0.79, + "learning_rate": 2.160973707889943e-06, + "loss": 0.6586, + "step": 22710 + }, + { + "epoch": 0.79, + "learning_rate": 2.1602976958839383e-06, + "loss": 0.6114, + "step": 22711 + }, + { + "epoch": 0.79, + "learning_rate": 2.1596217768275205e-06, + "loss": 0.5869, + "step": 22712 + }, + { + "epoch": 0.79, + "learning_rate": 2.1589459507287056e-06, + "loss": 0.6454, + "step": 22713 + }, + { + "epoch": 0.79, + "learning_rate": 2.1582702175955074e-06, + "loss": 0.6483, + "step": 22714 + }, + { + "epoch": 0.79, + "learning_rate": 2.157594577435934e-06, + "loss": 0.6478, + "step": 22715 + }, + { + "epoch": 0.79, + "learning_rate": 2.1569190302579968e-06, + "loss": 0.6165, + "step": 22716 + }, + { + "epoch": 0.79, + "learning_rate": 2.156243576069705e-06, + "loss": 0.6062, + "step": 22717 + }, + { + "epoch": 0.79, + "learning_rate": 2.15556821487907e-06, + "loss": 0.593, + "step": 22718 + }, + { + "epoch": 0.79, + "learning_rate": 2.154892946694096e-06, + "loss": 0.622, + "step": 22719 + }, + { + "epoch": 0.79, + "learning_rate": 2.154217771522793e-06, + "loss": 0.6471, + "step": 22720 + }, + { + "epoch": 0.79, + "learning_rate": 2.1535426893731603e-06, + "loss": 0.6191, + "step": 22721 + }, + { + "epoch": 0.79, + "learning_rate": 2.152867700253206e-06, + "loss": 0.654, + "step": 22722 + }, + { + "epoch": 0.79, + "learning_rate": 2.1521928041709305e-06, + "loss": 0.6737, + "step": 22723 + }, + { + "epoch": 0.79, + "learning_rate": 2.1515180011343373e-06, + "loss": 0.632, + "step": 22724 + }, + { + "epoch": 0.79, + "learning_rate": 2.1508432911514264e-06, + "loss": 0.6248, + "step": 22725 + }, + { + "epoch": 0.79, + "learning_rate": 2.150168674230201e-06, + "loss": 0.6328, + "step": 22726 + }, + { + "epoch": 0.79, + "learning_rate": 2.1494941503786526e-06, + "loss": 0.6435, + "step": 22727 + }, + { + "epoch": 0.79, + "learning_rate": 2.148819719604782e-06, + "loss": 0.6423, + "step": 22728 + }, + { + "epoch": 0.79, + "learning_rate": 2.1481453819165866e-06, + "loss": 0.6006, + "step": 22729 + }, + { + "epoch": 0.79, + "learning_rate": 2.1474711373220593e-06, + "loss": 0.6238, + "step": 22730 + }, + { + "epoch": 0.79, + "learning_rate": 2.1467969858291948e-06, + "loss": 0.6083, + "step": 22731 + }, + { + "epoch": 0.79, + "learning_rate": 2.1461229274459895e-06, + "loss": 0.6565, + "step": 22732 + }, + { + "epoch": 0.79, + "learning_rate": 2.1454489621804296e-06, + "loss": 0.6784, + "step": 22733 + }, + { + "epoch": 0.79, + "learning_rate": 2.1447750900405075e-06, + "loss": 0.6528, + "step": 22734 + }, + { + "epoch": 0.79, + "learning_rate": 2.1441013110342148e-06, + "loss": 0.6336, + "step": 22735 + }, + { + "epoch": 0.79, + "learning_rate": 2.1434276251695386e-06, + "loss": 0.6637, + "step": 22736 + }, + { + "epoch": 0.79, + "learning_rate": 2.142754032454466e-06, + "loss": 0.6224, + "step": 22737 + }, + { + "epoch": 0.79, + "learning_rate": 2.142080532896986e-06, + "loss": 0.6457, + "step": 22738 + }, + { + "epoch": 0.79, + "learning_rate": 2.1414071265050796e-06, + "loss": 0.6574, + "step": 22739 + }, + { + "epoch": 0.79, + "learning_rate": 2.1407338132867328e-06, + "loss": 0.6214, + "step": 22740 + }, + { + "epoch": 0.79, + "learning_rate": 2.1400605932499295e-06, + "loss": 0.6189, + "step": 22741 + }, + { + "epoch": 0.79, + "learning_rate": 2.1393874664026492e-06, + "loss": 0.5981, + "step": 22742 + }, + { + "epoch": 0.79, + "learning_rate": 2.1387144327528787e-06, + "loss": 0.6293, + "step": 22743 + }, + { + "epoch": 0.79, + "learning_rate": 2.138041492308589e-06, + "loss": 0.6111, + "step": 22744 + }, + { + "epoch": 0.79, + "learning_rate": 2.1373686450777633e-06, + "loss": 0.609, + "step": 22745 + }, + { + "epoch": 0.79, + "learning_rate": 2.1366958910683787e-06, + "loss": 0.6053, + "step": 22746 + }, + { + "epoch": 0.79, + "learning_rate": 2.136023230288411e-06, + "loss": 0.64, + "step": 22747 + }, + { + "epoch": 0.79, + "learning_rate": 2.1353506627458365e-06, + "loss": 0.6804, + "step": 22748 + }, + { + "epoch": 0.79, + "learning_rate": 2.134678188448631e-06, + "loss": 0.6335, + "step": 22749 + }, + { + "epoch": 0.79, + "learning_rate": 2.134005807404763e-06, + "loss": 0.627, + "step": 22750 + }, + { + "epoch": 0.79, + "learning_rate": 2.133333519622206e-06, + "loss": 0.6919, + "step": 22751 + }, + { + "epoch": 0.79, + "learning_rate": 2.1326613251089324e-06, + "loss": 0.6489, + "step": 22752 + }, + { + "epoch": 0.79, + "learning_rate": 2.13198922387291e-06, + "loss": 0.651, + "step": 22753 + }, + { + "epoch": 0.79, + "learning_rate": 2.1313172159221094e-06, + "loss": 0.5861, + "step": 22754 + }, + { + "epoch": 0.79, + "learning_rate": 2.130645301264499e-06, + "loss": 0.6392, + "step": 22755 + }, + { + "epoch": 0.79, + "learning_rate": 2.1299734799080417e-06, + "loss": 0.6583, + "step": 22756 + }, + { + "epoch": 0.79, + "learning_rate": 2.129301751860704e-06, + "loss": 0.6504, + "step": 22757 + }, + { + "epoch": 0.79, + "learning_rate": 2.1286301171304504e-06, + "loss": 0.6467, + "step": 22758 + }, + { + "epoch": 0.79, + "learning_rate": 2.127958575725243e-06, + "loss": 0.6023, + "step": 22759 + }, + { + "epoch": 0.79, + "learning_rate": 2.127287127653046e-06, + "loss": 0.6807, + "step": 22760 + }, + { + "epoch": 0.79, + "learning_rate": 2.126615772921822e-06, + "loss": 0.6462, + "step": 22761 + }, + { + "epoch": 0.79, + "learning_rate": 2.125944511539525e-06, + "loss": 0.6846, + "step": 22762 + }, + { + "epoch": 0.79, + "learning_rate": 2.125273343514116e-06, + "loss": 0.6341, + "step": 22763 + }, + { + "epoch": 0.79, + "learning_rate": 2.124602268853554e-06, + "loss": 0.5974, + "step": 22764 + }, + { + "epoch": 0.79, + "learning_rate": 2.1239312875657937e-06, + "loss": 0.5923, + "step": 22765 + }, + { + "epoch": 0.79, + "learning_rate": 2.123260399658792e-06, + "loss": 0.6698, + "step": 22766 + }, + { + "epoch": 0.79, + "learning_rate": 2.1225896051405047e-06, + "loss": 0.6523, + "step": 22767 + }, + { + "epoch": 0.79, + "learning_rate": 2.1219189040188803e-06, + "loss": 0.5989, + "step": 22768 + }, + { + "epoch": 0.79, + "learning_rate": 2.121248296301872e-06, + "loss": 0.6668, + "step": 22769 + }, + { + "epoch": 0.79, + "learning_rate": 2.120577781997436e-06, + "loss": 0.6073, + "step": 22770 + }, + { + "epoch": 0.79, + "learning_rate": 2.1199073611135115e-06, + "loss": 0.6436, + "step": 22771 + }, + { + "epoch": 0.79, + "learning_rate": 2.119237033658057e-06, + "loss": 0.6407, + "step": 22772 + }, + { + "epoch": 0.79, + "learning_rate": 2.1185667996390193e-06, + "loss": 0.6221, + "step": 22773 + }, + { + "epoch": 0.79, + "learning_rate": 2.117896659064339e-06, + "loss": 0.672, + "step": 22774 + }, + { + "epoch": 0.79, + "learning_rate": 2.117226611941965e-06, + "loss": 0.6155, + "step": 22775 + }, + { + "epoch": 0.79, + "learning_rate": 2.1165566582798435e-06, + "loss": 0.6678, + "step": 22776 + }, + { + "epoch": 0.79, + "learning_rate": 2.11588679808591e-06, + "loss": 0.5592, + "step": 22777 + }, + { + "epoch": 0.79, + "learning_rate": 2.115217031368115e-06, + "loss": 0.6652, + "step": 22778 + }, + { + "epoch": 0.79, + "learning_rate": 2.1145473581344e-06, + "loss": 0.5601, + "step": 22779 + }, + { + "epoch": 0.79, + "learning_rate": 2.113877778392698e-06, + "loss": 0.5952, + "step": 22780 + }, + { + "epoch": 0.79, + "learning_rate": 2.11320829215095e-06, + "loss": 0.6233, + "step": 22781 + }, + { + "epoch": 0.79, + "learning_rate": 2.112538899417098e-06, + "loss": 0.6203, + "step": 22782 + }, + { + "epoch": 0.79, + "learning_rate": 2.11186960019907e-06, + "loss": 0.7006, + "step": 22783 + }, + { + "epoch": 0.79, + "learning_rate": 2.111200394504809e-06, + "loss": 0.6187, + "step": 22784 + }, + { + "epoch": 0.79, + "learning_rate": 2.1105312823422485e-06, + "loss": 0.6642, + "step": 22785 + }, + { + "epoch": 0.79, + "learning_rate": 2.1098622637193177e-06, + "loss": 0.6234, + "step": 22786 + }, + { + "epoch": 0.79, + "learning_rate": 2.109193338643951e-06, + "loss": 0.6908, + "step": 22787 + }, + { + "epoch": 0.79, + "learning_rate": 2.1085245071240813e-06, + "loss": 0.6223, + "step": 22788 + }, + { + "epoch": 0.79, + "learning_rate": 2.1078557691676318e-06, + "loss": 0.5778, + "step": 22789 + }, + { + "epoch": 0.79, + "learning_rate": 2.1071871247825384e-06, + "loss": 0.6593, + "step": 22790 + }, + { + "epoch": 0.79, + "learning_rate": 2.106518573976728e-06, + "loss": 0.5788, + "step": 22791 + }, + { + "epoch": 0.79, + "learning_rate": 2.1058501167581236e-06, + "loss": 0.6172, + "step": 22792 + }, + { + "epoch": 0.79, + "learning_rate": 2.1051817531346507e-06, + "loss": 0.6374, + "step": 22793 + }, + { + "epoch": 0.79, + "learning_rate": 2.1045134831142387e-06, + "loss": 0.6571, + "step": 22794 + }, + { + "epoch": 0.79, + "learning_rate": 2.1038453067048025e-06, + "loss": 0.6301, + "step": 22795 + }, + { + "epoch": 0.79, + "learning_rate": 2.103177223914271e-06, + "loss": 0.6516, + "step": 22796 + }, + { + "epoch": 0.79, + "learning_rate": 2.102509234750565e-06, + "loss": 0.6809, + "step": 22797 + }, + { + "epoch": 0.79, + "learning_rate": 2.101841339221601e-06, + "loss": 0.6301, + "step": 22798 + }, + { + "epoch": 0.79, + "learning_rate": 2.1011735373352983e-06, + "loss": 0.6428, + "step": 22799 + }, + { + "epoch": 0.79, + "learning_rate": 2.1005058290995784e-06, + "loss": 0.6115, + "step": 22800 + }, + { + "epoch": 0.79, + "learning_rate": 2.0998382145223497e-06, + "loss": 0.6684, + "step": 22801 + }, + { + "epoch": 0.79, + "learning_rate": 2.0991706936115375e-06, + "loss": 0.6439, + "step": 22802 + }, + { + "epoch": 0.79, + "learning_rate": 2.098503266375048e-06, + "loss": 0.648, + "step": 22803 + }, + { + "epoch": 0.79, + "learning_rate": 2.0978359328207986e-06, + "loss": 0.6277, + "step": 22804 + }, + { + "epoch": 0.79, + "learning_rate": 2.0971686929567038e-06, + "loss": 0.6596, + "step": 22805 + }, + { + "epoch": 0.79, + "learning_rate": 2.096501546790668e-06, + "loss": 0.5724, + "step": 22806 + }, + { + "epoch": 0.79, + "learning_rate": 2.0958344943306007e-06, + "loss": 0.5898, + "step": 22807 + }, + { + "epoch": 0.79, + "learning_rate": 2.0951675355844213e-06, + "loss": 0.5769, + "step": 22808 + }, + { + "epoch": 0.79, + "learning_rate": 2.094500670560027e-06, + "loss": 0.5949, + "step": 22809 + }, + { + "epoch": 0.79, + "learning_rate": 2.093833899265327e-06, + "loss": 0.6278, + "step": 22810 + }, + { + "epoch": 0.79, + "learning_rate": 2.0931672217082323e-06, + "loss": 0.5837, + "step": 22811 + }, + { + "epoch": 0.79, + "learning_rate": 2.0925006378966373e-06, + "loss": 0.6093, + "step": 22812 + }, + { + "epoch": 0.79, + "learning_rate": 2.0918341478384486e-06, + "loss": 0.6416, + "step": 22813 + }, + { + "epoch": 0.79, + "learning_rate": 2.0911677515415763e-06, + "loss": 0.6939, + "step": 22814 + }, + { + "epoch": 0.79, + "learning_rate": 2.090501449013911e-06, + "loss": 0.6366, + "step": 22815 + }, + { + "epoch": 0.79, + "learning_rate": 2.089835240263357e-06, + "loss": 0.6195, + "step": 22816 + }, + { + "epoch": 0.79, + "learning_rate": 2.089169125297815e-06, + "loss": 0.6745, + "step": 22817 + }, + { + "epoch": 0.79, + "learning_rate": 2.088503104125178e-06, + "loss": 0.6466, + "step": 22818 + }, + { + "epoch": 0.79, + "learning_rate": 2.087837176753342e-06, + "loss": 0.6801, + "step": 22819 + }, + { + "epoch": 0.79, + "learning_rate": 2.0871713431902106e-06, + "loss": 0.6136, + "step": 22820 + }, + { + "epoch": 0.79, + "learning_rate": 2.0865056034436703e-06, + "loss": 0.554, + "step": 22821 + }, + { + "epoch": 0.79, + "learning_rate": 2.085839957521616e-06, + "loss": 0.6507, + "step": 22822 + }, + { + "epoch": 0.79, + "learning_rate": 2.0851744054319434e-06, + "loss": 0.5792, + "step": 22823 + }, + { + "epoch": 0.79, + "learning_rate": 2.0845089471825386e-06, + "loss": 0.6236, + "step": 22824 + }, + { + "epoch": 0.79, + "learning_rate": 2.08384358278129e-06, + "loss": 0.636, + "step": 22825 + }, + { + "epoch": 0.79, + "learning_rate": 2.083178312236095e-06, + "loss": 0.6807, + "step": 22826 + }, + { + "epoch": 0.79, + "learning_rate": 2.0825131355548335e-06, + "loss": 0.6064, + "step": 22827 + }, + { + "epoch": 0.79, + "learning_rate": 2.0818480527453944e-06, + "loss": 0.6339, + "step": 22828 + }, + { + "epoch": 0.79, + "learning_rate": 2.081183063815666e-06, + "loss": 0.5802, + "step": 22829 + }, + { + "epoch": 0.79, + "learning_rate": 2.0805181687735267e-06, + "loss": 0.6282, + "step": 22830 + }, + { + "epoch": 0.79, + "learning_rate": 2.079853367626861e-06, + "loss": 0.5788, + "step": 22831 + }, + { + "epoch": 0.79, + "learning_rate": 2.0791886603835563e-06, + "loss": 0.6069, + "step": 22832 + }, + { + "epoch": 0.79, + "learning_rate": 2.078524047051488e-06, + "loss": 0.6697, + "step": 22833 + }, + { + "epoch": 0.79, + "learning_rate": 2.077859527638538e-06, + "loss": 0.6236, + "step": 22834 + }, + { + "epoch": 0.79, + "learning_rate": 2.0771951021525883e-06, + "loss": 0.6027, + "step": 22835 + }, + { + "epoch": 0.79, + "learning_rate": 2.0765307706015094e-06, + "loss": 0.616, + "step": 22836 + }, + { + "epoch": 0.79, + "learning_rate": 2.0758665329931784e-06, + "loss": 0.7213, + "step": 22837 + }, + { + "epoch": 0.79, + "learning_rate": 2.07520238933548e-06, + "loss": 0.6299, + "step": 22838 + }, + { + "epoch": 0.79, + "learning_rate": 2.0745383396362793e-06, + "loss": 0.6539, + "step": 22839 + }, + { + "epoch": 0.79, + "learning_rate": 2.0738743839034526e-06, + "loss": 0.6327, + "step": 22840 + }, + { + "epoch": 0.79, + "learning_rate": 2.073210522144874e-06, + "loss": 0.62, + "step": 22841 + }, + { + "epoch": 0.79, + "learning_rate": 2.0725467543684086e-06, + "loss": 0.6382, + "step": 22842 + }, + { + "epoch": 0.79, + "learning_rate": 2.0718830805819278e-06, + "loss": 0.5574, + "step": 22843 + }, + { + "epoch": 0.79, + "learning_rate": 2.071219500793308e-06, + "loss": 0.6574, + "step": 22844 + }, + { + "epoch": 0.79, + "learning_rate": 2.0705560150104074e-06, + "loss": 0.5752, + "step": 22845 + }, + { + "epoch": 0.79, + "learning_rate": 2.0698926232410964e-06, + "loss": 0.6178, + "step": 22846 + }, + { + "epoch": 0.79, + "learning_rate": 2.069229325493244e-06, + "loss": 0.614, + "step": 22847 + }, + { + "epoch": 0.79, + "learning_rate": 2.0685661217747055e-06, + "loss": 0.6272, + "step": 22848 + }, + { + "epoch": 0.79, + "learning_rate": 2.0679030120933473e-06, + "loss": 0.6337, + "step": 22849 + }, + { + "epoch": 0.79, + "learning_rate": 2.0672399964570388e-06, + "loss": 0.6111, + "step": 22850 + }, + { + "epoch": 0.79, + "learning_rate": 2.0665770748736326e-06, + "loss": 0.6615, + "step": 22851 + }, + { + "epoch": 0.79, + "learning_rate": 2.06591424735099e-06, + "loss": 0.6102, + "step": 22852 + }, + { + "epoch": 0.79, + "learning_rate": 2.065251513896974e-06, + "loss": 0.665, + "step": 22853 + }, + { + "epoch": 0.79, + "learning_rate": 2.0645888745194355e-06, + "loss": 0.6311, + "step": 22854 + }, + { + "epoch": 0.79, + "learning_rate": 2.0639263292262323e-06, + "loss": 0.6041, + "step": 22855 + }, + { + "epoch": 0.79, + "learning_rate": 2.0632638780252266e-06, + "loss": 0.6014, + "step": 22856 + }, + { + "epoch": 0.79, + "learning_rate": 2.0626015209242654e-06, + "loss": 0.5928, + "step": 22857 + }, + { + "epoch": 0.79, + "learning_rate": 2.0619392579312036e-06, + "loss": 0.6853, + "step": 22858 + }, + { + "epoch": 0.79, + "learning_rate": 2.061277089053897e-06, + "loss": 0.6526, + "step": 22859 + }, + { + "epoch": 0.79, + "learning_rate": 2.060615014300189e-06, + "loss": 0.6347, + "step": 22860 + }, + { + "epoch": 0.79, + "learning_rate": 2.0599530336779317e-06, + "loss": 0.6556, + "step": 22861 + }, + { + "epoch": 0.79, + "learning_rate": 2.0592911471949807e-06, + "loss": 0.5625, + "step": 22862 + }, + { + "epoch": 0.79, + "learning_rate": 2.058629354859175e-06, + "loss": 0.6161, + "step": 22863 + }, + { + "epoch": 0.79, + "learning_rate": 2.057967656678368e-06, + "loss": 0.7113, + "step": 22864 + }, + { + "epoch": 0.79, + "learning_rate": 2.057306052660397e-06, + "loss": 0.5866, + "step": 22865 + }, + { + "epoch": 0.79, + "learning_rate": 2.056644542813111e-06, + "loss": 0.5768, + "step": 22866 + }, + { + "epoch": 0.79, + "learning_rate": 2.0559831271443532e-06, + "loss": 0.6832, + "step": 22867 + }, + { + "epoch": 0.79, + "learning_rate": 2.055321805661963e-06, + "loss": 0.6477, + "step": 22868 + }, + { + "epoch": 0.79, + "learning_rate": 2.0546605783737837e-06, + "loss": 0.6148, + "step": 22869 + }, + { + "epoch": 0.79, + "learning_rate": 2.0539994452876568e-06, + "loss": 0.6549, + "step": 22870 + }, + { + "epoch": 0.79, + "learning_rate": 2.053338406411416e-06, + "loss": 0.6441, + "step": 22871 + }, + { + "epoch": 0.79, + "learning_rate": 2.0526774617528998e-06, + "loss": 0.6396, + "step": 22872 + }, + { + "epoch": 0.79, + "learning_rate": 2.052016611319947e-06, + "loss": 0.6636, + "step": 22873 + }, + { + "epoch": 0.79, + "learning_rate": 2.0513558551203905e-06, + "loss": 0.6486, + "step": 22874 + }, + { + "epoch": 0.79, + "learning_rate": 2.0506951931620666e-06, + "loss": 0.6178, + "step": 22875 + }, + { + "epoch": 0.79, + "learning_rate": 2.050034625452808e-06, + "loss": 0.6434, + "step": 22876 + }, + { + "epoch": 0.79, + "learning_rate": 2.049374152000445e-06, + "loss": 0.5885, + "step": 22877 + }, + { + "epoch": 0.79, + "learning_rate": 2.048713772812808e-06, + "loss": 0.6611, + "step": 22878 + }, + { + "epoch": 0.79, + "learning_rate": 2.0480534878977277e-06, + "loss": 0.6837, + "step": 22879 + }, + { + "epoch": 0.79, + "learning_rate": 2.0473932972630328e-06, + "loss": 0.5981, + "step": 22880 + }, + { + "epoch": 0.79, + "learning_rate": 2.0467332009165498e-06, + "loss": 0.642, + "step": 22881 + }, + { + "epoch": 0.79, + "learning_rate": 2.0460731988661087e-06, + "loss": 0.6733, + "step": 22882 + }, + { + "epoch": 0.79, + "learning_rate": 2.045413291119529e-06, + "loss": 0.6863, + "step": 22883 + }, + { + "epoch": 0.79, + "learning_rate": 2.0447534776846377e-06, + "loss": 0.6017, + "step": 22884 + }, + { + "epoch": 0.79, + "learning_rate": 2.0440937585692566e-06, + "loss": 0.6359, + "step": 22885 + }, + { + "epoch": 0.79, + "learning_rate": 2.043434133781209e-06, + "loss": 0.6705, + "step": 22886 + }, + { + "epoch": 0.79, + "learning_rate": 2.0427746033283147e-06, + "loss": 0.6374, + "step": 22887 + }, + { + "epoch": 0.79, + "learning_rate": 2.042115167218396e-06, + "loss": 0.6299, + "step": 22888 + }, + { + "epoch": 0.79, + "learning_rate": 2.0414558254592655e-06, + "loss": 0.6514, + "step": 22889 + }, + { + "epoch": 0.79, + "learning_rate": 2.040796578058745e-06, + "loss": 0.6788, + "step": 22890 + }, + { + "epoch": 0.79, + "learning_rate": 2.0401374250246477e-06, + "loss": 0.6198, + "step": 22891 + }, + { + "epoch": 0.79, + "learning_rate": 2.0394783663647923e-06, + "loss": 0.6472, + "step": 22892 + }, + { + "epoch": 0.79, + "learning_rate": 2.03881940208699e-06, + "loss": 0.6104, + "step": 22893 + }, + { + "epoch": 0.79, + "learning_rate": 2.038160532199057e-06, + "loss": 0.6691, + "step": 22894 + }, + { + "epoch": 0.79, + "learning_rate": 2.0375017567088005e-06, + "loss": 0.6363, + "step": 22895 + }, + { + "epoch": 0.79, + "learning_rate": 2.0368430756240344e-06, + "loss": 0.6514, + "step": 22896 + }, + { + "epoch": 0.79, + "learning_rate": 2.036184488952566e-06, + "loss": 0.6585, + "step": 22897 + }, + { + "epoch": 0.79, + "learning_rate": 2.0355259967022044e-06, + "loss": 0.5807, + "step": 22898 + }, + { + "epoch": 0.79, + "learning_rate": 2.0348675988807578e-06, + "loss": 0.6538, + "step": 22899 + }, + { + "epoch": 0.79, + "learning_rate": 2.0342092954960347e-06, + "loss": 0.6434, + "step": 22900 + }, + { + "epoch": 0.79, + "learning_rate": 2.0335510865558337e-06, + "loss": 0.6613, + "step": 22901 + }, + { + "epoch": 0.79, + "learning_rate": 2.0328929720679625e-06, + "loss": 0.5404, + "step": 22902 + }, + { + "epoch": 0.79, + "learning_rate": 2.032234952040224e-06, + "loss": 0.6563, + "step": 22903 + }, + { + "epoch": 0.79, + "learning_rate": 2.031577026480419e-06, + "loss": 0.6443, + "step": 22904 + }, + { + "epoch": 0.79, + "learning_rate": 2.030919195396348e-06, + "loss": 0.6644, + "step": 22905 + }, + { + "epoch": 0.79, + "learning_rate": 2.0302614587958137e-06, + "loss": 0.6322, + "step": 22906 + }, + { + "epoch": 0.79, + "learning_rate": 2.0296038166866094e-06, + "loss": 0.5284, + "step": 22907 + }, + { + "epoch": 0.79, + "learning_rate": 2.0289462690765347e-06, + "loss": 0.5404, + "step": 22908 + }, + { + "epoch": 0.79, + "learning_rate": 2.0282888159733847e-06, + "loss": 0.6231, + "step": 22909 + }, + { + "epoch": 0.79, + "learning_rate": 2.0276314573849552e-06, + "loss": 0.6097, + "step": 22910 + }, + { + "epoch": 0.79, + "learning_rate": 2.02697419331904e-06, + "loss": 0.6317, + "step": 22911 + }, + { + "epoch": 0.79, + "learning_rate": 2.026317023783435e-06, + "loss": 0.6165, + "step": 22912 + }, + { + "epoch": 0.79, + "learning_rate": 2.0256599487859254e-06, + "loss": 0.617, + "step": 22913 + }, + { + "epoch": 0.79, + "learning_rate": 2.0250029683343043e-06, + "loss": 0.6551, + "step": 22914 + }, + { + "epoch": 0.79, + "learning_rate": 2.0243460824363616e-06, + "loss": 0.6679, + "step": 22915 + }, + { + "epoch": 0.79, + "learning_rate": 2.023689291099885e-06, + "loss": 0.6466, + "step": 22916 + }, + { + "epoch": 0.79, + "learning_rate": 2.0230325943326623e-06, + "loss": 0.6044, + "step": 22917 + }, + { + "epoch": 0.79, + "learning_rate": 2.0223759921424824e-06, + "loss": 0.6273, + "step": 22918 + }, + { + "epoch": 0.79, + "learning_rate": 2.0217194845371235e-06, + "loss": 0.6251, + "step": 22919 + }, + { + "epoch": 0.79, + "learning_rate": 2.0210630715243727e-06, + "loss": 0.7112, + "step": 22920 + }, + { + "epoch": 0.79, + "learning_rate": 2.020406753112012e-06, + "loss": 0.5967, + "step": 22921 + }, + { + "epoch": 0.79, + "learning_rate": 2.0197505293078246e-06, + "loss": 0.5936, + "step": 22922 + }, + { + "epoch": 0.79, + "learning_rate": 2.019094400119589e-06, + "loss": 0.5799, + "step": 22923 + }, + { + "epoch": 0.79, + "learning_rate": 2.0184383655550875e-06, + "loss": 0.6414, + "step": 22924 + }, + { + "epoch": 0.79, + "learning_rate": 2.0177824256220945e-06, + "loss": 0.5849, + "step": 22925 + }, + { + "epoch": 0.79, + "learning_rate": 2.017126580328388e-06, + "loss": 0.6021, + "step": 22926 + }, + { + "epoch": 0.79, + "learning_rate": 2.016470829681744e-06, + "loss": 0.6035, + "step": 22927 + }, + { + "epoch": 0.79, + "learning_rate": 2.0158151736899377e-06, + "loss": 0.6252, + "step": 22928 + }, + { + "epoch": 0.79, + "learning_rate": 2.0151596123607452e-06, + "loss": 0.6447, + "step": 22929 + }, + { + "epoch": 0.79, + "learning_rate": 2.0145041457019333e-06, + "loss": 0.6611, + "step": 22930 + }, + { + "epoch": 0.79, + "learning_rate": 2.0138487737212764e-06, + "loss": 0.6475, + "step": 22931 + }, + { + "epoch": 0.79, + "learning_rate": 2.0131934964265452e-06, + "loss": 0.6695, + "step": 22932 + }, + { + "epoch": 0.79, + "learning_rate": 2.0125383138255083e-06, + "loss": 0.6201, + "step": 22933 + }, + { + "epoch": 0.79, + "learning_rate": 2.0118832259259347e-06, + "loss": 0.6227, + "step": 22934 + }, + { + "epoch": 0.79, + "learning_rate": 2.0112282327355925e-06, + "loss": 0.5978, + "step": 22935 + }, + { + "epoch": 0.79, + "learning_rate": 2.0105733342622426e-06, + "loss": 0.6578, + "step": 22936 + }, + { + "epoch": 0.79, + "learning_rate": 2.0099185305136527e-06, + "loss": 0.5649, + "step": 22937 + }, + { + "epoch": 0.79, + "learning_rate": 2.0092638214975856e-06, + "loss": 0.6409, + "step": 22938 + }, + { + "epoch": 0.79, + "learning_rate": 2.0086092072218042e-06, + "loss": 0.6408, + "step": 22939 + }, + { + "epoch": 0.79, + "learning_rate": 2.0079546876940712e-06, + "loss": 0.5812, + "step": 22940 + }, + { + "epoch": 0.79, + "learning_rate": 2.007300262922147e-06, + "loss": 0.6281, + "step": 22941 + }, + { + "epoch": 0.79, + "learning_rate": 2.0066459329137865e-06, + "loss": 0.6408, + "step": 22942 + }, + { + "epoch": 0.79, + "learning_rate": 2.0059916976767503e-06, + "loss": 0.6041, + "step": 22943 + }, + { + "epoch": 0.79, + "learning_rate": 2.005337557218795e-06, + "loss": 0.6484, + "step": 22944 + }, + { + "epoch": 0.79, + "learning_rate": 2.004683511547676e-06, + "loss": 0.692, + "step": 22945 + }, + { + "epoch": 0.8, + "learning_rate": 2.004029560671148e-06, + "loss": 0.579, + "step": 22946 + }, + { + "epoch": 0.8, + "learning_rate": 2.003375704596967e-06, + "loss": 0.6532, + "step": 22947 + }, + { + "epoch": 0.8, + "learning_rate": 2.0027219433328805e-06, + "loss": 0.5985, + "step": 22948 + }, + { + "epoch": 0.8, + "learning_rate": 2.002068276886642e-06, + "loss": 0.6789, + "step": 22949 + }, + { + "epoch": 0.8, + "learning_rate": 2.0014147052660017e-06, + "loss": 0.6106, + "step": 22950 + }, + { + "epoch": 0.8, + "learning_rate": 2.0007612284787082e-06, + "loss": 0.6257, + "step": 22951 + }, + { + "epoch": 0.8, + "learning_rate": 2.0001078465325084e-06, + "loss": 0.6508, + "step": 22952 + }, + { + "epoch": 0.8, + "learning_rate": 1.9994545594351544e-06, + "loss": 0.657, + "step": 22953 + }, + { + "epoch": 0.8, + "learning_rate": 1.998801367194384e-06, + "loss": 0.5759, + "step": 22954 + }, + { + "epoch": 0.8, + "learning_rate": 1.998148269817944e-06, + "loss": 0.6212, + "step": 22955 + }, + { + "epoch": 0.8, + "learning_rate": 1.9974952673135795e-06, + "loss": 0.6099, + "step": 22956 + }, + { + "epoch": 0.8, + "learning_rate": 1.9968423596890318e-06, + "loss": 0.6274, + "step": 22957 + }, + { + "epoch": 0.8, + "learning_rate": 1.996189546952042e-06, + "loss": 0.6357, + "step": 22958 + }, + { + "epoch": 0.8, + "learning_rate": 1.9955368291103526e-06, + "loss": 0.6293, + "step": 22959 + }, + { + "epoch": 0.8, + "learning_rate": 1.9948842061716976e-06, + "loss": 0.6352, + "step": 22960 + }, + { + "epoch": 0.8, + "learning_rate": 1.9942316781438163e-06, + "loss": 0.5897, + "step": 22961 + }, + { + "epoch": 0.8, + "learning_rate": 1.993579245034446e-06, + "loss": 0.622, + "step": 22962 + }, + { + "epoch": 0.8, + "learning_rate": 1.9929269068513215e-06, + "loss": 0.6316, + "step": 22963 + }, + { + "epoch": 0.8, + "learning_rate": 1.9922746636021782e-06, + "loss": 0.5966, + "step": 22964 + }, + { + "epoch": 0.8, + "learning_rate": 1.991622515294751e-06, + "loss": 0.6686, + "step": 22965 + }, + { + "epoch": 0.8, + "learning_rate": 1.9909704619367663e-06, + "loss": 0.6557, + "step": 22966 + }, + { + "epoch": 0.8, + "learning_rate": 1.9903185035359585e-06, + "loss": 0.6487, + "step": 22967 + }, + { + "epoch": 0.8, + "learning_rate": 1.9896666401000573e-06, + "loss": 0.6762, + "step": 22968 + }, + { + "epoch": 0.8, + "learning_rate": 1.989014871636792e-06, + "loss": 0.6261, + "step": 22969 + }, + { + "epoch": 0.8, + "learning_rate": 1.9883631981538885e-06, + "loss": 0.6208, + "step": 22970 + }, + { + "epoch": 0.8, + "learning_rate": 1.9877116196590763e-06, + "loss": 0.6925, + "step": 22971 + }, + { + "epoch": 0.8, + "learning_rate": 1.987060136160076e-06, + "loss": 0.63, + "step": 22972 + }, + { + "epoch": 0.8, + "learning_rate": 1.9864087476646153e-06, + "loss": 0.6451, + "step": 22973 + }, + { + "epoch": 0.8, + "learning_rate": 1.9857574541804148e-06, + "loss": 0.5971, + "step": 22974 + }, + { + "epoch": 0.8, + "learning_rate": 1.985106255715199e-06, + "loss": 0.6423, + "step": 22975 + }, + { + "epoch": 0.8, + "learning_rate": 1.9844551522766864e-06, + "loss": 0.6539, + "step": 22976 + }, + { + "epoch": 0.8, + "learning_rate": 1.983804143872601e-06, + "loss": 0.6056, + "step": 22977 + }, + { + "epoch": 0.8, + "learning_rate": 1.983153230510655e-06, + "loss": 0.6679, + "step": 22978 + }, + { + "epoch": 0.8, + "learning_rate": 1.982502412198569e-06, + "loss": 0.6521, + "step": 22979 + }, + { + "epoch": 0.8, + "learning_rate": 1.9818516889440586e-06, + "loss": 0.6316, + "step": 22980 + }, + { + "epoch": 0.8, + "learning_rate": 1.9812010607548404e-06, + "loss": 0.6287, + "step": 22981 + }, + { + "epoch": 0.8, + "learning_rate": 1.980550527638626e-06, + "loss": 0.6374, + "step": 22982 + }, + { + "epoch": 0.8, + "learning_rate": 1.979900089603134e-06, + "loss": 0.6124, + "step": 22983 + }, + { + "epoch": 0.8, + "learning_rate": 1.979249746656068e-06, + "loss": 0.6462, + "step": 22984 + }, + { + "epoch": 0.8, + "learning_rate": 1.9785994988051426e-06, + "loss": 0.6215, + "step": 22985 + }, + { + "epoch": 0.8, + "learning_rate": 1.9779493460580677e-06, + "loss": 0.6468, + "step": 22986 + }, + { + "epoch": 0.8, + "learning_rate": 1.9772992884225518e-06, + "loss": 0.6209, + "step": 22987 + }, + { + "epoch": 0.8, + "learning_rate": 1.9766493259063036e-06, + "loss": 0.6795, + "step": 22988 + }, + { + "epoch": 0.8, + "learning_rate": 1.975999458517025e-06, + "loss": 0.6128, + "step": 22989 + }, + { + "epoch": 0.8, + "learning_rate": 1.9753496862624235e-06, + "loss": 0.5921, + "step": 22990 + }, + { + "epoch": 0.8, + "learning_rate": 1.9747000091502046e-06, + "loss": 0.6292, + "step": 22991 + }, + { + "epoch": 0.8, + "learning_rate": 1.9740504271880635e-06, + "loss": 0.6472, + "step": 22992 + }, + { + "epoch": 0.8, + "learning_rate": 1.9734009403837106e-06, + "loss": 0.5945, + "step": 22993 + }, + { + "epoch": 0.8, + "learning_rate": 1.972751548744847e-06, + "loss": 0.6408, + "step": 22994 + }, + { + "epoch": 0.8, + "learning_rate": 1.9721022522791645e-06, + "loss": 0.597, + "step": 22995 + }, + { + "epoch": 0.8, + "learning_rate": 1.9714530509943653e-06, + "loss": 0.662, + "step": 22996 + }, + { + "epoch": 0.8, + "learning_rate": 1.9708039448981486e-06, + "loss": 0.6767, + "step": 22997 + }, + { + "epoch": 0.8, + "learning_rate": 1.970154933998203e-06, + "loss": 0.6383, + "step": 22998 + }, + { + "epoch": 0.8, + "learning_rate": 1.969506018302232e-06, + "loss": 0.6632, + "step": 22999 + }, + { + "epoch": 0.8, + "learning_rate": 1.968857197817927e-06, + "loss": 0.6257, + "step": 23000 + }, + { + "epoch": 0.8, + "learning_rate": 1.9682084725529773e-06, + "loss": 0.6101, + "step": 23001 + }, + { + "epoch": 0.8, + "learning_rate": 1.9675598425150767e-06, + "loss": 0.5842, + "step": 23002 + }, + { + "epoch": 0.8, + "learning_rate": 1.9669113077119183e-06, + "loss": 0.6199, + "step": 23003 + }, + { + "epoch": 0.8, + "learning_rate": 1.966262868151182e-06, + "loss": 0.6009, + "step": 23004 + }, + { + "epoch": 0.8, + "learning_rate": 1.9656145238405656e-06, + "loss": 0.6829, + "step": 23005 + }, + { + "epoch": 0.8, + "learning_rate": 1.964966274787755e-06, + "loss": 0.6477, + "step": 23006 + }, + { + "epoch": 0.8, + "learning_rate": 1.9643181210004303e-06, + "loss": 0.6632, + "step": 23007 + }, + { + "epoch": 0.8, + "learning_rate": 1.9636700624862803e-06, + "loss": 0.6638, + "step": 23008 + }, + { + "epoch": 0.8, + "learning_rate": 1.9630220992529904e-06, + "loss": 0.6195, + "step": 23009 + }, + { + "epoch": 0.8, + "learning_rate": 1.962374231308234e-06, + "loss": 0.6599, + "step": 23010 + }, + { + "epoch": 0.8, + "learning_rate": 1.9617264586597017e-06, + "loss": 0.5401, + "step": 23011 + }, + { + "epoch": 0.8, + "learning_rate": 1.9610787813150744e-06, + "loss": 0.6137, + "step": 23012 + }, + { + "epoch": 0.8, + "learning_rate": 1.9604311992820235e-06, + "loss": 0.6278, + "step": 23013 + }, + { + "epoch": 0.8, + "learning_rate": 1.9597837125682317e-06, + "loss": 0.6463, + "step": 23014 + }, + { + "epoch": 0.8, + "learning_rate": 1.9591363211813772e-06, + "loss": 0.6843, + "step": 23015 + }, + { + "epoch": 0.8, + "learning_rate": 1.958489025129128e-06, + "loss": 0.6089, + "step": 23016 + }, + { + "epoch": 0.8, + "learning_rate": 1.9578418244191668e-06, + "loss": 0.6933, + "step": 23017 + }, + { + "epoch": 0.8, + "learning_rate": 1.9571947190591666e-06, + "loss": 0.6547, + "step": 23018 + }, + { + "epoch": 0.8, + "learning_rate": 1.9565477090567952e-06, + "loss": 0.637, + "step": 23019 + }, + { + "epoch": 0.8, + "learning_rate": 1.955900794419725e-06, + "loss": 0.6211, + "step": 23020 + }, + { + "epoch": 0.8, + "learning_rate": 1.9552539751556298e-06, + "loss": 0.6249, + "step": 23021 + }, + { + "epoch": 0.8, + "learning_rate": 1.9546072512721704e-06, + "loss": 0.5906, + "step": 23022 + }, + { + "epoch": 0.8, + "learning_rate": 1.9539606227770214e-06, + "loss": 0.5996, + "step": 23023 + }, + { + "epoch": 0.8, + "learning_rate": 1.95331408967785e-06, + "loss": 0.6245, + "step": 23024 + }, + { + "epoch": 0.8, + "learning_rate": 1.9526676519823173e-06, + "loss": 0.6416, + "step": 23025 + }, + { + "epoch": 0.8, + "learning_rate": 1.9520213096980888e-06, + "loss": 0.6888, + "step": 23026 + }, + { + "epoch": 0.8, + "learning_rate": 1.951375062832832e-06, + "loss": 0.632, + "step": 23027 + }, + { + "epoch": 0.8, + "learning_rate": 1.9507289113941996e-06, + "loss": 0.6267, + "step": 23028 + }, + { + "epoch": 0.8, + "learning_rate": 1.950082855389861e-06, + "loss": 0.6496, + "step": 23029 + }, + { + "epoch": 0.8, + "learning_rate": 1.9494368948274755e-06, + "loss": 0.6309, + "step": 23030 + }, + { + "epoch": 0.8, + "learning_rate": 1.9487910297146974e-06, + "loss": 0.6718, + "step": 23031 + }, + { + "epoch": 0.8, + "learning_rate": 1.9481452600591867e-06, + "loss": 0.659, + "step": 23032 + }, + { + "epoch": 0.8, + "learning_rate": 1.947499585868602e-06, + "loss": 0.6308, + "step": 23033 + }, + { + "epoch": 0.8, + "learning_rate": 1.9468540071505903e-06, + "loss": 0.6798, + "step": 23034 + }, + { + "epoch": 0.8, + "learning_rate": 1.946208523912816e-06, + "loss": 0.6494, + "step": 23035 + }, + { + "epoch": 0.8, + "learning_rate": 1.945563136162929e-06, + "loss": 0.6362, + "step": 23036 + }, + { + "epoch": 0.8, + "learning_rate": 1.944917843908577e-06, + "loss": 0.6237, + "step": 23037 + }, + { + "epoch": 0.8, + "learning_rate": 1.944272647157415e-06, + "loss": 0.6685, + "step": 23038 + }, + { + "epoch": 0.8, + "learning_rate": 1.943627545917093e-06, + "loss": 0.652, + "step": 23039 + }, + { + "epoch": 0.8, + "learning_rate": 1.942982540195253e-06, + "loss": 0.6012, + "step": 23040 + }, + { + "epoch": 0.8, + "learning_rate": 1.942337629999549e-06, + "loss": 0.6298, + "step": 23041 + }, + { + "epoch": 0.8, + "learning_rate": 1.941692815337628e-06, + "loss": 0.596, + "step": 23042 + }, + { + "epoch": 0.8, + "learning_rate": 1.9410480962171307e-06, + "loss": 0.6145, + "step": 23043 + }, + { + "epoch": 0.8, + "learning_rate": 1.9404034726457034e-06, + "loss": 0.6094, + "step": 23044 + }, + { + "epoch": 0.8, + "learning_rate": 1.9397589446309893e-06, + "loss": 0.6144, + "step": 23045 + }, + { + "epoch": 0.8, + "learning_rate": 1.9391145121806254e-06, + "loss": 0.6825, + "step": 23046 + }, + { + "epoch": 0.8, + "learning_rate": 1.9384701753022574e-06, + "loss": 0.6396, + "step": 23047 + }, + { + "epoch": 0.8, + "learning_rate": 1.9378259340035268e-06, + "loss": 0.6195, + "step": 23048 + }, + { + "epoch": 0.8, + "learning_rate": 1.937181788292066e-06, + "loss": 0.6067, + "step": 23049 + }, + { + "epoch": 0.8, + "learning_rate": 1.936537738175517e-06, + "loss": 0.6387, + "step": 23050 + }, + { + "epoch": 0.8, + "learning_rate": 1.93589378366151e-06, + "loss": 0.5898, + "step": 23051 + }, + { + "epoch": 0.8, + "learning_rate": 1.9352499247576815e-06, + "loss": 0.5928, + "step": 23052 + }, + { + "epoch": 0.8, + "learning_rate": 1.9346061614716727e-06, + "loss": 0.6172, + "step": 23053 + }, + { + "epoch": 0.8, + "learning_rate": 1.933962493811108e-06, + "loss": 0.5968, + "step": 23054 + }, + { + "epoch": 0.8, + "learning_rate": 1.93331892178362e-06, + "loss": 0.657, + "step": 23055 + }, + { + "epoch": 0.8, + "learning_rate": 1.9326754453968454e-06, + "loss": 0.6566, + "step": 23056 + }, + { + "epoch": 0.8, + "learning_rate": 1.9320320646584044e-06, + "loss": 0.6622, + "step": 23057 + }, + { + "epoch": 0.8, + "learning_rate": 1.931388779575927e-06, + "loss": 0.6234, + "step": 23058 + }, + { + "epoch": 0.8, + "learning_rate": 1.9307455901570484e-06, + "loss": 0.57, + "step": 23059 + }, + { + "epoch": 0.8, + "learning_rate": 1.930102496409385e-06, + "loss": 0.659, + "step": 23060 + }, + { + "epoch": 0.8, + "learning_rate": 1.929459498340566e-06, + "loss": 0.6692, + "step": 23061 + }, + { + "epoch": 0.8, + "learning_rate": 1.928816595958215e-06, + "loss": 0.6248, + "step": 23062 + }, + { + "epoch": 0.8, + "learning_rate": 1.9281737892699525e-06, + "loss": 0.6219, + "step": 23063 + }, + { + "epoch": 0.8, + "learning_rate": 1.9275310782833965e-06, + "loss": 0.6378, + "step": 23064 + }, + { + "epoch": 0.8, + "learning_rate": 1.9268884630061777e-06, + "loss": 0.6439, + "step": 23065 + }, + { + "epoch": 0.8, + "learning_rate": 1.926245943445906e-06, + "loss": 0.6284, + "step": 23066 + }, + { + "epoch": 0.8, + "learning_rate": 1.925603519610201e-06, + "loss": 0.6143, + "step": 23067 + }, + { + "epoch": 0.8, + "learning_rate": 1.9249611915066834e-06, + "loss": 0.6273, + "step": 23068 + }, + { + "epoch": 0.8, + "learning_rate": 1.9243189591429633e-06, + "loss": 0.6167, + "step": 23069 + }, + { + "epoch": 0.8, + "learning_rate": 1.9236768225266557e-06, + "loss": 0.6275, + "step": 23070 + }, + { + "epoch": 0.8, + "learning_rate": 1.9230347816653803e-06, + "loss": 0.6317, + "step": 23071 + }, + { + "epoch": 0.8, + "learning_rate": 1.9223928365667432e-06, + "loss": 0.6559, + "step": 23072 + }, + { + "epoch": 0.8, + "learning_rate": 1.9217509872383565e-06, + "loss": 0.6373, + "step": 23073 + }, + { + "epoch": 0.8, + "learning_rate": 1.9211092336878344e-06, + "loss": 0.6271, + "step": 23074 + }, + { + "epoch": 0.8, + "learning_rate": 1.9204675759227787e-06, + "loss": 0.6166, + "step": 23075 + }, + { + "epoch": 0.8, + "learning_rate": 1.9198260139507983e-06, + "loss": 0.6391, + "step": 23076 + }, + { + "epoch": 0.8, + "learning_rate": 1.919184547779508e-06, + "loss": 0.6456, + "step": 23077 + }, + { + "epoch": 0.8, + "learning_rate": 1.918543177416503e-06, + "loss": 0.596, + "step": 23078 + }, + { + "epoch": 0.8, + "learning_rate": 1.9179019028693936e-06, + "loss": 0.5997, + "step": 23079 + }, + { + "epoch": 0.8, + "learning_rate": 1.917260724145782e-06, + "loss": 0.702, + "step": 23080 + }, + { + "epoch": 0.8, + "learning_rate": 1.9166196412532667e-06, + "loss": 0.6798, + "step": 23081 + }, + { + "epoch": 0.8, + "learning_rate": 1.91597865419945e-06, + "loss": 0.6183, + "step": 23082 + }, + { + "epoch": 0.8, + "learning_rate": 1.9153377629919367e-06, + "loss": 0.5945, + "step": 23083 + }, + { + "epoch": 0.8, + "learning_rate": 1.9146969676383187e-06, + "loss": 0.6465, + "step": 23084 + }, + { + "epoch": 0.8, + "learning_rate": 1.914056268146196e-06, + "loss": 0.6401, + "step": 23085 + }, + { + "epoch": 0.8, + "learning_rate": 1.9134156645231685e-06, + "loss": 0.6037, + "step": 23086 + }, + { + "epoch": 0.8, + "learning_rate": 1.912775156776824e-06, + "loss": 0.6622, + "step": 23087 + }, + { + "epoch": 0.8, + "learning_rate": 1.912134744914759e-06, + "loss": 0.6172, + "step": 23088 + }, + { + "epoch": 0.8, + "eval_loss": 0.5751644968986511, + "eval_runtime": 4921.5874, + "eval_samples_per_second": 112.086, + "eval_steps_per_second": 37.362, + "step": 23088 + }, + { + "epoch": 0.8, + "learning_rate": 1.9114944289445725e-06, + "loss": 0.575, + "step": 23089 + }, + { + "epoch": 0.8, + "learning_rate": 1.9108542088738493e-06, + "loss": 0.5839, + "step": 23090 + }, + { + "epoch": 0.8, + "learning_rate": 1.9102140847101814e-06, + "loss": 0.7018, + "step": 23091 + }, + { + "epoch": 0.8, + "learning_rate": 1.909574056461162e-06, + "loss": 0.5891, + "step": 23092 + }, + { + "epoch": 0.8, + "learning_rate": 1.908934124134375e-06, + "loss": 0.638, + "step": 23093 + }, + { + "epoch": 0.8, + "learning_rate": 1.9082942877374054e-06, + "loss": 0.6007, + "step": 23094 + }, + { + "epoch": 0.8, + "learning_rate": 1.9076545472778496e-06, + "loss": 0.5981, + "step": 23095 + }, + { + "epoch": 0.8, + "learning_rate": 1.9070149027632823e-06, + "loss": 0.6246, + "step": 23096 + }, + { + "epoch": 0.8, + "learning_rate": 1.9063753542012909e-06, + "loss": 0.6149, + "step": 23097 + }, + { + "epoch": 0.8, + "learning_rate": 1.9057359015994614e-06, + "loss": 0.6118, + "step": 23098 + }, + { + "epoch": 0.8, + "learning_rate": 1.905096544965369e-06, + "loss": 0.6525, + "step": 23099 + }, + { + "epoch": 0.8, + "learning_rate": 1.9044572843065956e-06, + "loss": 0.6739, + "step": 23100 + }, + { + "epoch": 0.8, + "learning_rate": 1.903818119630726e-06, + "loss": 0.6662, + "step": 23101 + }, + { + "epoch": 0.8, + "learning_rate": 1.9031790509453329e-06, + "loss": 0.592, + "step": 23102 + }, + { + "epoch": 0.8, + "learning_rate": 1.9025400782579939e-06, + "loss": 0.6266, + "step": 23103 + }, + { + "epoch": 0.8, + "learning_rate": 1.9019012015762884e-06, + "loss": 0.6286, + "step": 23104 + }, + { + "epoch": 0.8, + "learning_rate": 1.9012624209077857e-06, + "loss": 0.6158, + "step": 23105 + }, + { + "epoch": 0.8, + "learning_rate": 1.9006237362600588e-06, + "loss": 0.5835, + "step": 23106 + }, + { + "epoch": 0.8, + "learning_rate": 1.8999851476406883e-06, + "loss": 0.6896, + "step": 23107 + }, + { + "epoch": 0.8, + "learning_rate": 1.8993466550572392e-06, + "loss": 0.6373, + "step": 23108 + }, + { + "epoch": 0.8, + "learning_rate": 1.8987082585172822e-06, + "loss": 0.6248, + "step": 23109 + }, + { + "epoch": 0.8, + "learning_rate": 1.898069958028389e-06, + "loss": 0.6183, + "step": 23110 + }, + { + "epoch": 0.8, + "learning_rate": 1.8974317535981236e-06, + "loss": 0.654, + "step": 23111 + }, + { + "epoch": 0.8, + "learning_rate": 1.8967936452340542e-06, + "loss": 0.6279, + "step": 23112 + }, + { + "epoch": 0.8, + "learning_rate": 1.896155632943747e-06, + "loss": 0.6721, + "step": 23113 + }, + { + "epoch": 0.8, + "learning_rate": 1.8955177167347661e-06, + "loss": 0.6495, + "step": 23114 + }, + { + "epoch": 0.8, + "learning_rate": 1.8948798966146776e-06, + "loss": 0.6775, + "step": 23115 + }, + { + "epoch": 0.8, + "learning_rate": 1.8942421725910377e-06, + "loss": 0.6432, + "step": 23116 + }, + { + "epoch": 0.8, + "learning_rate": 1.8936045446714114e-06, + "loss": 0.631, + "step": 23117 + }, + { + "epoch": 0.8, + "learning_rate": 1.8929670128633581e-06, + "loss": 0.6079, + "step": 23118 + }, + { + "epoch": 0.8, + "learning_rate": 1.8923295771744355e-06, + "loss": 0.6129, + "step": 23119 + }, + { + "epoch": 0.8, + "learning_rate": 1.8916922376122027e-06, + "loss": 0.5882, + "step": 23120 + }, + { + "epoch": 0.8, + "learning_rate": 1.8910549941842172e-06, + "loss": 0.6229, + "step": 23121 + }, + { + "epoch": 0.8, + "learning_rate": 1.8904178468980306e-06, + "loss": 0.6578, + "step": 23122 + }, + { + "epoch": 0.8, + "learning_rate": 1.889780795761199e-06, + "loss": 0.6707, + "step": 23123 + }, + { + "epoch": 0.8, + "learning_rate": 1.8891438407812757e-06, + "loss": 0.6184, + "step": 23124 + }, + { + "epoch": 0.8, + "learning_rate": 1.888506981965813e-06, + "loss": 0.6025, + "step": 23125 + }, + { + "epoch": 0.8, + "learning_rate": 1.8878702193223609e-06, + "loss": 0.6379, + "step": 23126 + }, + { + "epoch": 0.8, + "learning_rate": 1.8872335528584707e-06, + "loss": 0.6186, + "step": 23127 + }, + { + "epoch": 0.8, + "learning_rate": 1.8865969825816877e-06, + "loss": 0.6343, + "step": 23128 + }, + { + "epoch": 0.8, + "learning_rate": 1.8859605084995613e-06, + "loss": 0.6657, + "step": 23129 + }, + { + "epoch": 0.8, + "learning_rate": 1.8853241306196368e-06, + "loss": 0.6467, + "step": 23130 + }, + { + "epoch": 0.8, + "learning_rate": 1.8846878489494603e-06, + "loss": 0.6475, + "step": 23131 + }, + { + "epoch": 0.8, + "learning_rate": 1.8840516634965743e-06, + "loss": 0.631, + "step": 23132 + }, + { + "epoch": 0.8, + "learning_rate": 1.8834155742685255e-06, + "loss": 0.6341, + "step": 23133 + }, + { + "epoch": 0.8, + "learning_rate": 1.882779581272851e-06, + "loss": 0.6435, + "step": 23134 + }, + { + "epoch": 0.8, + "learning_rate": 1.8821436845170927e-06, + "loss": 0.6031, + "step": 23135 + }, + { + "epoch": 0.8, + "learning_rate": 1.8815078840087885e-06, + "loss": 0.6301, + "step": 23136 + }, + { + "epoch": 0.8, + "learning_rate": 1.8808721797554797e-06, + "loss": 0.645, + "step": 23137 + }, + { + "epoch": 0.8, + "learning_rate": 1.880236571764702e-06, + "loss": 0.625, + "step": 23138 + }, + { + "epoch": 0.8, + "learning_rate": 1.879601060043994e-06, + "loss": 0.6367, + "step": 23139 + }, + { + "epoch": 0.8, + "learning_rate": 1.8789656446008841e-06, + "loss": 0.6231, + "step": 23140 + }, + { + "epoch": 0.8, + "learning_rate": 1.8783303254429109e-06, + "loss": 0.6034, + "step": 23141 + }, + { + "epoch": 0.8, + "learning_rate": 1.8776951025776047e-06, + "loss": 0.5712, + "step": 23142 + }, + { + "epoch": 0.8, + "learning_rate": 1.8770599760124985e-06, + "loss": 0.6155, + "step": 23143 + }, + { + "epoch": 0.8, + "learning_rate": 1.876424945755122e-06, + "loss": 0.614, + "step": 23144 + }, + { + "epoch": 0.8, + "learning_rate": 1.8757900118130057e-06, + "loss": 0.6359, + "step": 23145 + }, + { + "epoch": 0.8, + "learning_rate": 1.8751551741936746e-06, + "loss": 0.6314, + "step": 23146 + }, + { + "epoch": 0.8, + "learning_rate": 1.8745204329046562e-06, + "loss": 0.5968, + "step": 23147 + }, + { + "epoch": 0.8, + "learning_rate": 1.8738857879534766e-06, + "loss": 0.6355, + "step": 23148 + }, + { + "epoch": 0.8, + "learning_rate": 1.873251239347661e-06, + "loss": 0.6153, + "step": 23149 + }, + { + "epoch": 0.8, + "learning_rate": 1.872616787094733e-06, + "loss": 0.6542, + "step": 23150 + }, + { + "epoch": 0.8, + "learning_rate": 1.8719824312022161e-06, + "loss": 0.6351, + "step": 23151 + }, + { + "epoch": 0.8, + "learning_rate": 1.871348171677626e-06, + "loss": 0.6767, + "step": 23152 + }, + { + "epoch": 0.8, + "learning_rate": 1.8707140085284869e-06, + "loss": 0.6477, + "step": 23153 + }, + { + "epoch": 0.8, + "learning_rate": 1.8700799417623172e-06, + "loss": 0.6509, + "step": 23154 + }, + { + "epoch": 0.8, + "learning_rate": 1.8694459713866342e-06, + "loss": 0.597, + "step": 23155 + }, + { + "epoch": 0.8, + "learning_rate": 1.868812097408954e-06, + "loss": 0.6483, + "step": 23156 + }, + { + "epoch": 0.8, + "learning_rate": 1.8681783198367953e-06, + "loss": 0.6453, + "step": 23157 + }, + { + "epoch": 0.8, + "learning_rate": 1.8675446386776664e-06, + "loss": 0.6227, + "step": 23158 + }, + { + "epoch": 0.8, + "learning_rate": 1.8669110539390832e-06, + "loss": 0.5857, + "step": 23159 + }, + { + "epoch": 0.8, + "learning_rate": 1.8662775656285593e-06, + "loss": 0.6729, + "step": 23160 + }, + { + "epoch": 0.8, + "learning_rate": 1.8656441737536025e-06, + "loss": 0.6427, + "step": 23161 + }, + { + "epoch": 0.8, + "learning_rate": 1.8650108783217247e-06, + "loss": 0.6564, + "step": 23162 + }, + { + "epoch": 0.8, + "learning_rate": 1.8643776793404366e-06, + "loss": 0.6156, + "step": 23163 + }, + { + "epoch": 0.8, + "learning_rate": 1.8637445768172402e-06, + "loss": 0.6143, + "step": 23164 + }, + { + "epoch": 0.8, + "learning_rate": 1.8631115707596438e-06, + "loss": 0.5633, + "step": 23165 + }, + { + "epoch": 0.8, + "learning_rate": 1.8624786611751522e-06, + "loss": 0.6073, + "step": 23166 + }, + { + "epoch": 0.8, + "learning_rate": 1.8618458480712708e-06, + "loss": 0.6178, + "step": 23167 + }, + { + "epoch": 0.8, + "learning_rate": 1.8612131314555027e-06, + "loss": 0.6522, + "step": 23168 + }, + { + "epoch": 0.8, + "learning_rate": 1.8605805113353502e-06, + "loss": 0.6333, + "step": 23169 + }, + { + "epoch": 0.8, + "learning_rate": 1.859947987718309e-06, + "loss": 0.6455, + "step": 23170 + }, + { + "epoch": 0.8, + "learning_rate": 1.8593155606118829e-06, + "loss": 0.6366, + "step": 23171 + }, + { + "epoch": 0.8, + "learning_rate": 1.858683230023568e-06, + "loss": 0.6079, + "step": 23172 + }, + { + "epoch": 0.8, + "learning_rate": 1.8580509959608617e-06, + "loss": 0.6222, + "step": 23173 + }, + { + "epoch": 0.8, + "learning_rate": 1.8574188584312647e-06, + "loss": 0.5973, + "step": 23174 + }, + { + "epoch": 0.8, + "learning_rate": 1.856786817442263e-06, + "loss": 0.6574, + "step": 23175 + }, + { + "epoch": 0.8, + "learning_rate": 1.8561548730013567e-06, + "loss": 0.6439, + "step": 23176 + }, + { + "epoch": 0.8, + "learning_rate": 1.855523025116035e-06, + "loss": 0.6629, + "step": 23177 + }, + { + "epoch": 0.8, + "learning_rate": 1.8548912737937919e-06, + "loss": 0.6485, + "step": 23178 + }, + { + "epoch": 0.8, + "learning_rate": 1.8542596190421146e-06, + "loss": 0.6637, + "step": 23179 + }, + { + "epoch": 0.8, + "learning_rate": 1.8536280608684975e-06, + "loss": 0.6523, + "step": 23180 + }, + { + "epoch": 0.8, + "learning_rate": 1.8529965992804233e-06, + "loss": 0.6262, + "step": 23181 + }, + { + "epoch": 0.8, + "learning_rate": 1.8523652342853793e-06, + "loss": 0.6224, + "step": 23182 + }, + { + "epoch": 0.8, + "learning_rate": 1.8517339658908528e-06, + "loss": 0.6833, + "step": 23183 + }, + { + "epoch": 0.8, + "learning_rate": 1.8511027941043268e-06, + "loss": 0.6441, + "step": 23184 + }, + { + "epoch": 0.8, + "learning_rate": 1.8504717189332865e-06, + "loss": 0.6645, + "step": 23185 + }, + { + "epoch": 0.8, + "learning_rate": 1.8498407403852158e-06, + "loss": 0.5672, + "step": 23186 + }, + { + "epoch": 0.8, + "learning_rate": 1.84920985846759e-06, + "loss": 0.5998, + "step": 23187 + }, + { + "epoch": 0.8, + "learning_rate": 1.8485790731878928e-06, + "loss": 0.677, + "step": 23188 + }, + { + "epoch": 0.8, + "learning_rate": 1.8479483845536018e-06, + "loss": 0.6462, + "step": 23189 + }, + { + "epoch": 0.8, + "learning_rate": 1.8473177925721951e-06, + "loss": 0.6301, + "step": 23190 + }, + { + "epoch": 0.8, + "learning_rate": 1.8466872972511485e-06, + "loss": 0.5851, + "step": 23191 + }, + { + "epoch": 0.8, + "learning_rate": 1.846056898597942e-06, + "loss": 0.6436, + "step": 23192 + }, + { + "epoch": 0.8, + "learning_rate": 1.8454265966200424e-06, + "loss": 0.6477, + "step": 23193 + }, + { + "epoch": 0.8, + "learning_rate": 1.8447963913249257e-06, + "loss": 0.6144, + "step": 23194 + }, + { + "epoch": 0.8, + "learning_rate": 1.8441662827200645e-06, + "loss": 0.6164, + "step": 23195 + }, + { + "epoch": 0.8, + "learning_rate": 1.84353627081293e-06, + "loss": 0.6376, + "step": 23196 + }, + { + "epoch": 0.8, + "learning_rate": 1.8429063556109895e-06, + "loss": 0.6677, + "step": 23197 + }, + { + "epoch": 0.8, + "learning_rate": 1.8422765371217166e-06, + "loss": 0.706, + "step": 23198 + }, + { + "epoch": 0.8, + "learning_rate": 1.8416468153525723e-06, + "loss": 0.6848, + "step": 23199 + }, + { + "epoch": 0.8, + "learning_rate": 1.8410171903110251e-06, + "loss": 0.6355, + "step": 23200 + }, + { + "epoch": 0.8, + "learning_rate": 1.8403876620045402e-06, + "loss": 0.6429, + "step": 23201 + }, + { + "epoch": 0.8, + "learning_rate": 1.8397582304405815e-06, + "loss": 0.638, + "step": 23202 + }, + { + "epoch": 0.8, + "learning_rate": 1.8391288956266119e-06, + "loss": 0.6376, + "step": 23203 + }, + { + "epoch": 0.8, + "learning_rate": 1.8384996575700953e-06, + "loss": 0.6165, + "step": 23204 + }, + { + "epoch": 0.8, + "learning_rate": 1.837870516278487e-06, + "loss": 0.6612, + "step": 23205 + }, + { + "epoch": 0.8, + "learning_rate": 1.8372414717592491e-06, + "loss": 0.6559, + "step": 23206 + }, + { + "epoch": 0.8, + "learning_rate": 1.8366125240198397e-06, + "loss": 0.6706, + "step": 23207 + }, + { + "epoch": 0.8, + "learning_rate": 1.835983673067715e-06, + "loss": 0.6166, + "step": 23208 + }, + { + "epoch": 0.8, + "learning_rate": 1.8353549189103315e-06, + "loss": 0.5958, + "step": 23209 + }, + { + "epoch": 0.8, + "learning_rate": 1.8347262615551465e-06, + "loss": 0.616, + "step": 23210 + }, + { + "epoch": 0.8, + "learning_rate": 1.8340977010096083e-06, + "loss": 0.6212, + "step": 23211 + }, + { + "epoch": 0.8, + "learning_rate": 1.8334692372811713e-06, + "loss": 0.5849, + "step": 23212 + }, + { + "epoch": 0.8, + "learning_rate": 1.8328408703772882e-06, + "loss": 0.6788, + "step": 23213 + }, + { + "epoch": 0.8, + "learning_rate": 1.8322126003054074e-06, + "loss": 0.593, + "step": 23214 + }, + { + "epoch": 0.8, + "learning_rate": 1.8315844270729788e-06, + "loss": 0.6174, + "step": 23215 + }, + { + "epoch": 0.8, + "learning_rate": 1.8309563506874517e-06, + "loss": 0.6416, + "step": 23216 + }, + { + "epoch": 0.8, + "learning_rate": 1.830328371156269e-06, + "loss": 0.6105, + "step": 23217 + }, + { + "epoch": 0.8, + "learning_rate": 1.8297004884868785e-06, + "loss": 0.6329, + "step": 23218 + }, + { + "epoch": 0.8, + "learning_rate": 1.829072702686724e-06, + "loss": 0.6071, + "step": 23219 + }, + { + "epoch": 0.8, + "learning_rate": 1.8284450137632481e-06, + "loss": 0.6456, + "step": 23220 + }, + { + "epoch": 0.8, + "learning_rate": 1.8278174217238941e-06, + "loss": 0.6465, + "step": 23221 + }, + { + "epoch": 0.8, + "learning_rate": 1.8271899265761052e-06, + "loss": 0.612, + "step": 23222 + }, + { + "epoch": 0.8, + "learning_rate": 1.8265625283273158e-06, + "loss": 0.6031, + "step": 23223 + }, + { + "epoch": 0.8, + "learning_rate": 1.8259352269849672e-06, + "loss": 0.6321, + "step": 23224 + }, + { + "epoch": 0.8, + "learning_rate": 1.8253080225564968e-06, + "loss": 0.6407, + "step": 23225 + }, + { + "epoch": 0.8, + "learning_rate": 1.8246809150493405e-06, + "loss": 0.6403, + "step": 23226 + }, + { + "epoch": 0.8, + "learning_rate": 1.8240539044709337e-06, + "loss": 0.6008, + "step": 23227 + }, + { + "epoch": 0.8, + "learning_rate": 1.8234269908287127e-06, + "loss": 0.6471, + "step": 23228 + }, + { + "epoch": 0.8, + "learning_rate": 1.822800174130106e-06, + "loss": 0.6593, + "step": 23229 + }, + { + "epoch": 0.8, + "learning_rate": 1.8221734543825476e-06, + "loss": 0.6173, + "step": 23230 + }, + { + "epoch": 0.8, + "learning_rate": 1.8215468315934681e-06, + "loss": 0.6781, + "step": 23231 + }, + { + "epoch": 0.8, + "learning_rate": 1.8209203057702963e-06, + "loss": 0.5725, + "step": 23232 + }, + { + "epoch": 0.8, + "learning_rate": 1.8202938769204614e-06, + "loss": 0.6897, + "step": 23233 + }, + { + "epoch": 0.8, + "learning_rate": 1.8196675450513923e-06, + "loss": 0.6246, + "step": 23234 + }, + { + "epoch": 0.81, + "learning_rate": 1.8190413101705096e-06, + "loss": 0.6588, + "step": 23235 + }, + { + "epoch": 0.81, + "learning_rate": 1.8184151722852439e-06, + "loss": 0.5842, + "step": 23236 + }, + { + "epoch": 0.81, + "learning_rate": 1.8177891314030116e-06, + "loss": 0.6932, + "step": 23237 + }, + { + "epoch": 0.81, + "learning_rate": 1.8171631875312412e-06, + "loss": 0.6301, + "step": 23238 + }, + { + "epoch": 0.81, + "learning_rate": 1.8165373406773558e-06, + "loss": 0.6034, + "step": 23239 + }, + { + "epoch": 0.81, + "learning_rate": 1.8159115908487702e-06, + "loss": 0.6684, + "step": 23240 + }, + { + "epoch": 0.81, + "learning_rate": 1.8152859380529042e-06, + "loss": 0.6402, + "step": 23241 + }, + { + "epoch": 0.81, + "learning_rate": 1.814660382297181e-06, + "loss": 0.6522, + "step": 23242 + }, + { + "epoch": 0.81, + "learning_rate": 1.8140349235890075e-06, + "loss": 0.5583, + "step": 23243 + }, + { + "epoch": 0.81, + "learning_rate": 1.8134095619358083e-06, + "loss": 0.6211, + "step": 23244 + }, + { + "epoch": 0.81, + "learning_rate": 1.812784297344997e-06, + "loss": 0.6539, + "step": 23245 + }, + { + "epoch": 0.81, + "learning_rate": 1.8121591298239827e-06, + "loss": 0.5549, + "step": 23246 + }, + { + "epoch": 0.81, + "learning_rate": 1.81153405938018e-06, + "loss": 0.6433, + "step": 23247 + }, + { + "epoch": 0.81, + "learning_rate": 1.810909086021001e-06, + "loss": 0.6248, + "step": 23248 + }, + { + "epoch": 0.81, + "learning_rate": 1.8102842097538498e-06, + "loss": 0.6448, + "step": 23249 + }, + { + "epoch": 0.81, + "learning_rate": 1.8096594305861415e-06, + "loss": 0.6417, + "step": 23250 + }, + { + "epoch": 0.81, + "learning_rate": 1.8090347485252835e-06, + "loss": 0.6516, + "step": 23251 + }, + { + "epoch": 0.81, + "learning_rate": 1.8084101635786788e-06, + "loss": 0.6135, + "step": 23252 + }, + { + "epoch": 0.81, + "learning_rate": 1.8077856757537326e-06, + "loss": 0.5986, + "step": 23253 + }, + { + "epoch": 0.81, + "learning_rate": 1.8071612850578546e-06, + "loss": 0.6693, + "step": 23254 + }, + { + "epoch": 0.81, + "learning_rate": 1.8065369914984376e-06, + "loss": 0.5671, + "step": 23255 + }, + { + "epoch": 0.81, + "learning_rate": 1.8059127950828914e-06, + "loss": 0.6221, + "step": 23256 + }, + { + "epoch": 0.81, + "learning_rate": 1.8052886958186178e-06, + "loss": 0.6638, + "step": 23257 + }, + { + "epoch": 0.81, + "learning_rate": 1.8046646937130097e-06, + "loss": 0.6228, + "step": 23258 + }, + { + "epoch": 0.81, + "learning_rate": 1.8040407887734702e-06, + "loss": 0.5946, + "step": 23259 + }, + { + "epoch": 0.81, + "learning_rate": 1.8034169810073965e-06, + "loss": 0.5667, + "step": 23260 + }, + { + "epoch": 0.81, + "learning_rate": 1.8027932704221784e-06, + "loss": 0.6365, + "step": 23261 + }, + { + "epoch": 0.81, + "learning_rate": 1.802169657025219e-06, + "loss": 0.5909, + "step": 23262 + }, + { + "epoch": 0.81, + "learning_rate": 1.80154614082391e-06, + "loss": 0.6387, + "step": 23263 + }, + { + "epoch": 0.81, + "learning_rate": 1.8009227218256408e-06, + "loss": 0.6461, + "step": 23264 + }, + { + "epoch": 0.81, + "learning_rate": 1.8002994000378038e-06, + "loss": 0.6372, + "step": 23265 + }, + { + "epoch": 0.81, + "learning_rate": 1.7996761754677938e-06, + "loss": 0.6627, + "step": 23266 + }, + { + "epoch": 0.81, + "learning_rate": 1.7990530481229896e-06, + "loss": 0.6538, + "step": 23267 + }, + { + "epoch": 0.81, + "learning_rate": 1.7984300180107894e-06, + "loss": 0.6603, + "step": 23268 + }, + { + "epoch": 0.81, + "learning_rate": 1.7978070851385788e-06, + "loss": 0.6365, + "step": 23269 + }, + { + "epoch": 0.81, + "learning_rate": 1.7971842495137383e-06, + "loss": 0.6192, + "step": 23270 + }, + { + "epoch": 0.81, + "learning_rate": 1.7965615111436552e-06, + "loss": 0.661, + "step": 23271 + }, + { + "epoch": 0.81, + "learning_rate": 1.795938870035715e-06, + "loss": 0.6271, + "step": 23272 + }, + { + "epoch": 0.81, + "learning_rate": 1.7953163261972938e-06, + "loss": 0.6516, + "step": 23273 + }, + { + "epoch": 0.81, + "learning_rate": 1.7946938796357781e-06, + "loss": 0.6431, + "step": 23274 + }, + { + "epoch": 0.81, + "learning_rate": 1.7940715303585488e-06, + "loss": 0.648, + "step": 23275 + }, + { + "epoch": 0.81, + "learning_rate": 1.7934492783729796e-06, + "loss": 0.6028, + "step": 23276 + }, + { + "epoch": 0.81, + "learning_rate": 1.7928271236864504e-06, + "loss": 0.6001, + "step": 23277 + }, + { + "epoch": 0.81, + "learning_rate": 1.7922050663063406e-06, + "loss": 0.6347, + "step": 23278 + }, + { + "epoch": 0.81, + "learning_rate": 1.7915831062400168e-06, + "loss": 0.6769, + "step": 23279 + }, + { + "epoch": 0.81, + "learning_rate": 1.7909612434948631e-06, + "loss": 0.6115, + "step": 23280 + }, + { + "epoch": 0.81, + "learning_rate": 1.79033947807825e-06, + "loss": 0.7098, + "step": 23281 + }, + { + "epoch": 0.81, + "learning_rate": 1.7897178099975443e-06, + "loss": 0.642, + "step": 23282 + }, + { + "epoch": 0.81, + "learning_rate": 1.7890962392601208e-06, + "loss": 0.6704, + "step": 23283 + }, + { + "epoch": 0.81, + "learning_rate": 1.7884747658733515e-06, + "loss": 0.5936, + "step": 23284 + }, + { + "epoch": 0.81, + "learning_rate": 1.7878533898445948e-06, + "loss": 0.6536, + "step": 23285 + }, + { + "epoch": 0.81, + "learning_rate": 1.7872321111812286e-06, + "loss": 0.6088, + "step": 23286 + }, + { + "epoch": 0.81, + "learning_rate": 1.7866109298906165e-06, + "loss": 0.6589, + "step": 23287 + }, + { + "epoch": 0.81, + "learning_rate": 1.7859898459801194e-06, + "loss": 0.6035, + "step": 23288 + }, + { + "epoch": 0.81, + "learning_rate": 1.785368859457104e-06, + "loss": 0.5768, + "step": 23289 + }, + { + "epoch": 0.81, + "learning_rate": 1.784747970328935e-06, + "loss": 0.602, + "step": 23290 + }, + { + "epoch": 0.81, + "learning_rate": 1.7841271786029656e-06, + "loss": 0.6629, + "step": 23291 + }, + { + "epoch": 0.81, + "learning_rate": 1.7835064842865646e-06, + "loss": 0.6659, + "step": 23292 + }, + { + "epoch": 0.81, + "learning_rate": 1.7828858873870903e-06, + "loss": 0.6292, + "step": 23293 + }, + { + "epoch": 0.81, + "learning_rate": 1.7822653879118955e-06, + "loss": 0.6255, + "step": 23294 + }, + { + "epoch": 0.81, + "learning_rate": 1.7816449858683405e-06, + "loss": 0.6441, + "step": 23295 + }, + { + "epoch": 0.81, + "learning_rate": 1.7810246812637832e-06, + "loss": 0.6109, + "step": 23296 + }, + { + "epoch": 0.81, + "learning_rate": 1.7804044741055692e-06, + "loss": 0.6249, + "step": 23297 + }, + { + "epoch": 0.81, + "learning_rate": 1.779784364401065e-06, + "loss": 0.618, + "step": 23298 + }, + { + "epoch": 0.81, + "learning_rate": 1.7791643521576118e-06, + "loss": 0.5846, + "step": 23299 + }, + { + "epoch": 0.81, + "learning_rate": 1.7785444373825645e-06, + "loss": 0.6613, + "step": 23300 + }, + { + "epoch": 0.81, + "learning_rate": 1.7779246200832768e-06, + "loss": 0.5901, + "step": 23301 + }, + { + "epoch": 0.81, + "learning_rate": 1.7773049002670906e-06, + "loss": 0.6255, + "step": 23302 + }, + { + "epoch": 0.81, + "learning_rate": 1.7766852779413534e-06, + "loss": 0.5799, + "step": 23303 + }, + { + "epoch": 0.81, + "learning_rate": 1.7760657531134207e-06, + "loss": 0.6231, + "step": 23304 + }, + { + "epoch": 0.81, + "learning_rate": 1.7754463257906284e-06, + "loss": 0.6397, + "step": 23305 + }, + { + "epoch": 0.81, + "learning_rate": 1.7748269959803256e-06, + "loss": 0.6445, + "step": 23306 + }, + { + "epoch": 0.81, + "learning_rate": 1.7742077636898547e-06, + "loss": 0.6417, + "step": 23307 + }, + { + "epoch": 0.81, + "learning_rate": 1.7735886289265546e-06, + "loss": 0.6084, + "step": 23308 + }, + { + "epoch": 0.81, + "learning_rate": 1.7729695916977675e-06, + "loss": 0.6625, + "step": 23309 + }, + { + "epoch": 0.81, + "learning_rate": 1.7723506520108337e-06, + "loss": 0.6416, + "step": 23310 + }, + { + "epoch": 0.81, + "learning_rate": 1.7717318098730896e-06, + "loss": 0.6052, + "step": 23311 + }, + { + "epoch": 0.81, + "learning_rate": 1.7711130652918752e-06, + "loss": 0.6228, + "step": 23312 + }, + { + "epoch": 0.81, + "learning_rate": 1.7704944182745265e-06, + "loss": 0.6287, + "step": 23313 + }, + { + "epoch": 0.81, + "learning_rate": 1.7698758688283746e-06, + "loss": 0.6086, + "step": 23314 + }, + { + "epoch": 0.81, + "learning_rate": 1.7692574169607556e-06, + "loss": 0.6134, + "step": 23315 + }, + { + "epoch": 0.81, + "learning_rate": 1.7686390626790019e-06, + "loss": 0.6491, + "step": 23316 + }, + { + "epoch": 0.81, + "learning_rate": 1.7680208059904448e-06, + "loss": 0.663, + "step": 23317 + }, + { + "epoch": 0.81, + "learning_rate": 1.7674026469024152e-06, + "loss": 0.6044, + "step": 23318 + }, + { + "epoch": 0.81, + "learning_rate": 1.7667845854222432e-06, + "loss": 0.6073, + "step": 23319 + }, + { + "epoch": 0.81, + "learning_rate": 1.7661666215572527e-06, + "loss": 0.7259, + "step": 23320 + }, + { + "epoch": 0.81, + "learning_rate": 1.765548755314772e-06, + "loss": 0.6087, + "step": 23321 + }, + { + "epoch": 0.81, + "learning_rate": 1.764930986702128e-06, + "loss": 0.6586, + "step": 23322 + }, + { + "epoch": 0.81, + "learning_rate": 1.7643133157266458e-06, + "loss": 0.6445, + "step": 23323 + }, + { + "epoch": 0.81, + "learning_rate": 1.7636957423956459e-06, + "loss": 0.6458, + "step": 23324 + }, + { + "epoch": 0.81, + "learning_rate": 1.7630782667164548e-06, + "loss": 0.5655, + "step": 23325 + }, + { + "epoch": 0.81, + "learning_rate": 1.7624608886963878e-06, + "loss": 0.5841, + "step": 23326 + }, + { + "epoch": 0.81, + "learning_rate": 1.7618436083427682e-06, + "loss": 0.6254, + "step": 23327 + }, + { + "epoch": 0.81, + "learning_rate": 1.761226425662914e-06, + "loss": 0.6466, + "step": 23328 + }, + { + "epoch": 0.81, + "learning_rate": 1.7606093406641422e-06, + "loss": 0.5982, + "step": 23329 + }, + { + "epoch": 0.81, + "learning_rate": 1.7599923533537699e-06, + "loss": 0.6317, + "step": 23330 + }, + { + "epoch": 0.81, + "learning_rate": 1.7593754637391136e-06, + "loss": 0.5835, + "step": 23331 + }, + { + "epoch": 0.81, + "learning_rate": 1.758758671827484e-06, + "loss": 0.6668, + "step": 23332 + }, + { + "epoch": 0.81, + "learning_rate": 1.7581419776261954e-06, + "loss": 0.6319, + "step": 23333 + }, + { + "epoch": 0.81, + "learning_rate": 1.7575253811425596e-06, + "loss": 0.6019, + "step": 23334 + }, + { + "epoch": 0.81, + "learning_rate": 1.7569088823838864e-06, + "loss": 0.6784, + "step": 23335 + }, + { + "epoch": 0.81, + "learning_rate": 1.7562924813574866e-06, + "loss": 0.608, + "step": 23336 + }, + { + "epoch": 0.81, + "learning_rate": 1.755676178070671e-06, + "loss": 0.6574, + "step": 23337 + }, + { + "epoch": 0.81, + "learning_rate": 1.7550599725307405e-06, + "loss": 0.5925, + "step": 23338 + }, + { + "epoch": 0.81, + "learning_rate": 1.7544438647450036e-06, + "loss": 0.6462, + "step": 23339 + }, + { + "epoch": 0.81, + "learning_rate": 1.7538278547207654e-06, + "loss": 0.5719, + "step": 23340 + }, + { + "epoch": 0.81, + "learning_rate": 1.7532119424653293e-06, + "loss": 0.6222, + "step": 23341 + }, + { + "epoch": 0.81, + "learning_rate": 1.7525961279859982e-06, + "loss": 0.5861, + "step": 23342 + }, + { + "epoch": 0.81, + "learning_rate": 1.7519804112900752e-06, + "loss": 0.5617, + "step": 23343 + }, + { + "epoch": 0.81, + "learning_rate": 1.7513647923848565e-06, + "loss": 0.6583, + "step": 23344 + }, + { + "epoch": 0.81, + "learning_rate": 1.7507492712776419e-06, + "loss": 0.6448, + "step": 23345 + }, + { + "epoch": 0.81, + "learning_rate": 1.7501338479757301e-06, + "loss": 0.668, + "step": 23346 + }, + { + "epoch": 0.81, + "learning_rate": 1.7495185224864186e-06, + "loss": 0.6043, + "step": 23347 + }, + { + "epoch": 0.81, + "learning_rate": 1.7489032948170003e-06, + "loss": 0.6256, + "step": 23348 + }, + { + "epoch": 0.81, + "learning_rate": 1.7482881649747752e-06, + "loss": 0.6546, + "step": 23349 + }, + { + "epoch": 0.81, + "learning_rate": 1.7476731329670293e-06, + "loss": 0.6011, + "step": 23350 + }, + { + "epoch": 0.81, + "learning_rate": 1.747058198801057e-06, + "loss": 0.6351, + "step": 23351 + }, + { + "epoch": 0.81, + "learning_rate": 1.7464433624841504e-06, + "loss": 0.6344, + "step": 23352 + }, + { + "epoch": 0.81, + "learning_rate": 1.745828624023599e-06, + "loss": 0.6312, + "step": 23353 + }, + { + "epoch": 0.81, + "learning_rate": 1.7452139834266901e-06, + "loss": 0.6453, + "step": 23354 + }, + { + "epoch": 0.81, + "learning_rate": 1.7445994407007149e-06, + "loss": 0.5574, + "step": 23355 + }, + { + "epoch": 0.81, + "learning_rate": 1.7439849958529531e-06, + "loss": 0.6322, + "step": 23356 + }, + { + "epoch": 0.81, + "learning_rate": 1.7433706488906943e-06, + "loss": 0.6044, + "step": 23357 + }, + { + "epoch": 0.81, + "learning_rate": 1.7427563998212204e-06, + "loss": 0.5791, + "step": 23358 + }, + { + "epoch": 0.81, + "learning_rate": 1.7421422486518147e-06, + "loss": 0.6384, + "step": 23359 + }, + { + "epoch": 0.81, + "learning_rate": 1.7415281953897612e-06, + "loss": 0.6664, + "step": 23360 + }, + { + "epoch": 0.81, + "learning_rate": 1.7409142400423363e-06, + "loss": 0.6031, + "step": 23361 + }, + { + "epoch": 0.81, + "learning_rate": 1.7403003826168208e-06, + "loss": 0.6032, + "step": 23362 + }, + { + "epoch": 0.81, + "learning_rate": 1.7396866231204923e-06, + "loss": 0.6293, + "step": 23363 + }, + { + "epoch": 0.81, + "learning_rate": 1.7390729615606283e-06, + "loss": 0.6128, + "step": 23364 + }, + { + "epoch": 0.81, + "learning_rate": 1.7384593979445042e-06, + "loss": 0.6705, + "step": 23365 + }, + { + "epoch": 0.81, + "learning_rate": 1.7378459322793973e-06, + "loss": 0.6572, + "step": 23366 + }, + { + "epoch": 0.81, + "learning_rate": 1.7372325645725774e-06, + "loss": 0.6662, + "step": 23367 + }, + { + "epoch": 0.81, + "learning_rate": 1.7366192948313166e-06, + "loss": 0.6207, + "step": 23368 + }, + { + "epoch": 0.81, + "learning_rate": 1.7360061230628878e-06, + "loss": 0.5252, + "step": 23369 + }, + { + "epoch": 0.81, + "learning_rate": 1.7353930492745596e-06, + "loss": 0.6652, + "step": 23370 + }, + { + "epoch": 0.81, + "learning_rate": 1.7347800734736031e-06, + "loss": 0.6275, + "step": 23371 + }, + { + "epoch": 0.81, + "learning_rate": 1.7341671956672857e-06, + "loss": 0.6706, + "step": 23372 + }, + { + "epoch": 0.81, + "learning_rate": 1.7335544158628703e-06, + "loss": 0.6545, + "step": 23373 + }, + { + "epoch": 0.81, + "learning_rate": 1.7329417340676247e-06, + "loss": 0.6509, + "step": 23374 + }, + { + "epoch": 0.81, + "learning_rate": 1.7323291502888118e-06, + "loss": 0.603, + "step": 23375 + }, + { + "epoch": 0.81, + "learning_rate": 1.731716664533697e-06, + "loss": 0.6049, + "step": 23376 + }, + { + "epoch": 0.81, + "learning_rate": 1.7311042768095398e-06, + "loss": 0.6204, + "step": 23377 + }, + { + "epoch": 0.81, + "learning_rate": 1.7304919871236037e-06, + "loss": 0.5924, + "step": 23378 + }, + { + "epoch": 0.81, + "learning_rate": 1.7298797954831436e-06, + "loss": 0.5964, + "step": 23379 + }, + { + "epoch": 0.81, + "learning_rate": 1.7292677018954207e-06, + "loss": 0.605, + "step": 23380 + }, + { + "epoch": 0.81, + "learning_rate": 1.7286557063676922e-06, + "loss": 0.656, + "step": 23381 + }, + { + "epoch": 0.81, + "learning_rate": 1.7280438089072126e-06, + "loss": 0.6411, + "step": 23382 + }, + { + "epoch": 0.81, + "learning_rate": 1.7274320095212382e-06, + "loss": 0.6964, + "step": 23383 + }, + { + "epoch": 0.81, + "learning_rate": 1.7268203082170244e-06, + "loss": 0.6209, + "step": 23384 + }, + { + "epoch": 0.81, + "learning_rate": 1.7262087050018194e-06, + "loss": 0.6025, + "step": 23385 + }, + { + "epoch": 0.81, + "learning_rate": 1.7255971998828768e-06, + "loss": 0.6098, + "step": 23386 + }, + { + "epoch": 0.81, + "learning_rate": 1.7249857928674464e-06, + "loss": 0.6386, + "step": 23387 + }, + { + "epoch": 0.81, + "learning_rate": 1.7243744839627762e-06, + "loss": 0.6204, + "step": 23388 + }, + { + "epoch": 0.81, + "learning_rate": 1.7237632731761168e-06, + "loss": 0.647, + "step": 23389 + }, + { + "epoch": 0.81, + "learning_rate": 1.723152160514715e-06, + "loss": 0.6898, + "step": 23390 + }, + { + "epoch": 0.81, + "learning_rate": 1.7225411459858122e-06, + "loss": 0.6644, + "step": 23391 + }, + { + "epoch": 0.81, + "learning_rate": 1.7219302295966556e-06, + "loss": 0.6495, + "step": 23392 + }, + { + "epoch": 0.81, + "learning_rate": 1.7213194113544873e-06, + "loss": 0.6431, + "step": 23393 + }, + { + "epoch": 0.81, + "learning_rate": 1.7207086912665504e-06, + "loss": 0.684, + "step": 23394 + }, + { + "epoch": 0.81, + "learning_rate": 1.720098069340085e-06, + "loss": 0.6598, + "step": 23395 + }, + { + "epoch": 0.81, + "learning_rate": 1.7194875455823335e-06, + "loss": 0.6487, + "step": 23396 + }, + { + "epoch": 0.81, + "learning_rate": 1.7188771200005304e-06, + "loss": 0.6655, + "step": 23397 + }, + { + "epoch": 0.81, + "learning_rate": 1.7182667926019136e-06, + "loss": 0.694, + "step": 23398 + }, + { + "epoch": 0.81, + "learning_rate": 1.7176565633937214e-06, + "loss": 0.6222, + "step": 23399 + }, + { + "epoch": 0.81, + "learning_rate": 1.717046432383187e-06, + "loss": 0.5871, + "step": 23400 + }, + { + "epoch": 0.81, + "learning_rate": 1.7164363995775458e-06, + "loss": 0.6459, + "step": 23401 + }, + { + "epoch": 0.81, + "learning_rate": 1.715826464984033e-06, + "loss": 0.6213, + "step": 23402 + }, + { + "epoch": 0.81, + "learning_rate": 1.7152166286098727e-06, + "loss": 0.6694, + "step": 23403 + }, + { + "epoch": 0.81, + "learning_rate": 1.7146068904623003e-06, + "loss": 0.6248, + "step": 23404 + }, + { + "epoch": 0.81, + "learning_rate": 1.7139972505485447e-06, + "loss": 0.6972, + "step": 23405 + }, + { + "epoch": 0.81, + "learning_rate": 1.7133877088758332e-06, + "loss": 0.6865, + "step": 23406 + }, + { + "epoch": 0.81, + "learning_rate": 1.7127782654513936e-06, + "loss": 0.6275, + "step": 23407 + }, + { + "epoch": 0.81, + "learning_rate": 1.712168920282453e-06, + "loss": 0.6445, + "step": 23408 + }, + { + "epoch": 0.81, + "learning_rate": 1.711559673376232e-06, + "loss": 0.6529, + "step": 23409 + }, + { + "epoch": 0.81, + "learning_rate": 1.710950524739955e-06, + "loss": 0.6333, + "step": 23410 + }, + { + "epoch": 0.81, + "learning_rate": 1.7103414743808455e-06, + "loss": 0.6718, + "step": 23411 + }, + { + "epoch": 0.81, + "learning_rate": 1.7097325223061257e-06, + "loss": 0.5986, + "step": 23412 + }, + { + "epoch": 0.81, + "learning_rate": 1.7091236685230127e-06, + "loss": 0.6067, + "step": 23413 + }, + { + "epoch": 0.81, + "learning_rate": 1.7085149130387291e-06, + "loss": 0.5752, + "step": 23414 + }, + { + "epoch": 0.81, + "learning_rate": 1.7079062558604876e-06, + "loss": 0.6023, + "step": 23415 + }, + { + "epoch": 0.81, + "learning_rate": 1.707297696995508e-06, + "loss": 0.6259, + "step": 23416 + }, + { + "epoch": 0.81, + "learning_rate": 1.7066892364510036e-06, + "loss": 0.6115, + "step": 23417 + }, + { + "epoch": 0.81, + "learning_rate": 1.7060808742341895e-06, + "loss": 0.5955, + "step": 23418 + }, + { + "epoch": 0.81, + "learning_rate": 1.7054726103522778e-06, + "loss": 0.6048, + "step": 23419 + }, + { + "epoch": 0.81, + "learning_rate": 1.7048644448124852e-06, + "loss": 0.6321, + "step": 23420 + }, + { + "epoch": 0.81, + "learning_rate": 1.7042563776220133e-06, + "loss": 0.6432, + "step": 23421 + }, + { + "epoch": 0.81, + "learning_rate": 1.703648408788078e-06, + "loss": 0.6495, + "step": 23422 + }, + { + "epoch": 0.81, + "learning_rate": 1.703040538317885e-06, + "loss": 0.6063, + "step": 23423 + }, + { + "epoch": 0.81, + "learning_rate": 1.7024327662186423e-06, + "loss": 0.5986, + "step": 23424 + }, + { + "epoch": 0.81, + "learning_rate": 1.7018250924975577e-06, + "loss": 0.6122, + "step": 23425 + }, + { + "epoch": 0.81, + "learning_rate": 1.7012175171618329e-06, + "loss": 0.6204, + "step": 23426 + }, + { + "epoch": 0.81, + "learning_rate": 1.700610040218671e-06, + "loss": 0.5719, + "step": 23427 + }, + { + "epoch": 0.81, + "learning_rate": 1.7000026616752763e-06, + "loss": 0.587, + "step": 23428 + }, + { + "epoch": 0.81, + "learning_rate": 1.6993953815388485e-06, + "loss": 0.6478, + "step": 23429 + }, + { + "epoch": 0.81, + "learning_rate": 1.69878819981659e-06, + "loss": 0.6032, + "step": 23430 + }, + { + "epoch": 0.81, + "learning_rate": 1.6981811165157014e-06, + "loss": 0.654, + "step": 23431 + }, + { + "epoch": 0.81, + "learning_rate": 1.6975741316433735e-06, + "loss": 0.5889, + "step": 23432 + }, + { + "epoch": 0.81, + "learning_rate": 1.6969672452068087e-06, + "loss": 0.6146, + "step": 23433 + }, + { + "epoch": 0.81, + "learning_rate": 1.6963604572131997e-06, + "loss": 0.6235, + "step": 23434 + }, + { + "epoch": 0.81, + "learning_rate": 1.6957537676697411e-06, + "loss": 0.6284, + "step": 23435 + }, + { + "epoch": 0.81, + "learning_rate": 1.695147176583627e-06, + "loss": 0.6589, + "step": 23436 + }, + { + "epoch": 0.81, + "learning_rate": 1.6945406839620515e-06, + "loss": 0.6027, + "step": 23437 + }, + { + "epoch": 0.81, + "learning_rate": 1.6939342898122002e-06, + "loss": 0.6693, + "step": 23438 + }, + { + "epoch": 0.81, + "learning_rate": 1.693327994141265e-06, + "loss": 0.6004, + "step": 23439 + }, + { + "epoch": 0.81, + "learning_rate": 1.6927217969564336e-06, + "loss": 0.6453, + "step": 23440 + }, + { + "epoch": 0.81, + "learning_rate": 1.6921156982648946e-06, + "loss": 0.6544, + "step": 23441 + }, + { + "epoch": 0.81, + "learning_rate": 1.6915096980738344e-06, + "loss": 0.5685, + "step": 23442 + }, + { + "epoch": 0.81, + "learning_rate": 1.6909037963904383e-06, + "loss": 0.609, + "step": 23443 + }, + { + "epoch": 0.81, + "learning_rate": 1.6902979932218866e-06, + "loss": 0.6029, + "step": 23444 + }, + { + "epoch": 0.81, + "learning_rate": 1.6896922885753641e-06, + "loss": 0.6121, + "step": 23445 + }, + { + "epoch": 0.81, + "learning_rate": 1.6890866824580532e-06, + "loss": 0.6431, + "step": 23446 + }, + { + "epoch": 0.81, + "learning_rate": 1.6884811748771313e-06, + "loss": 0.6744, + "step": 23447 + }, + { + "epoch": 0.81, + "learning_rate": 1.6878757658397805e-06, + "loss": 0.5633, + "step": 23448 + }, + { + "epoch": 0.81, + "learning_rate": 1.6872704553531793e-06, + "loss": 0.6833, + "step": 23449 + }, + { + "epoch": 0.81, + "learning_rate": 1.6866652434245002e-06, + "loss": 0.5688, + "step": 23450 + }, + { + "epoch": 0.81, + "learning_rate": 1.6860601300609203e-06, + "loss": 0.6955, + "step": 23451 + }, + { + "epoch": 0.81, + "learning_rate": 1.6854551152696152e-06, + "loss": 0.6736, + "step": 23452 + }, + { + "epoch": 0.81, + "learning_rate": 1.6848501990577582e-06, + "loss": 0.6064, + "step": 23453 + }, + { + "epoch": 0.81, + "learning_rate": 1.6842453814325199e-06, + "loss": 0.6413, + "step": 23454 + }, + { + "epoch": 0.81, + "learning_rate": 1.683640662401076e-06, + "loss": 0.643, + "step": 23455 + }, + { + "epoch": 0.81, + "learning_rate": 1.6830360419705882e-06, + "loss": 0.641, + "step": 23456 + }, + { + "epoch": 0.81, + "learning_rate": 1.6824315201482299e-06, + "loss": 0.6437, + "step": 23457 + }, + { + "epoch": 0.81, + "learning_rate": 1.6818270969411677e-06, + "loss": 0.6215, + "step": 23458 + }, + { + "epoch": 0.81, + "learning_rate": 1.6812227723565677e-06, + "loss": 0.5828, + "step": 23459 + }, + { + "epoch": 0.81, + "learning_rate": 1.6806185464015957e-06, + "loss": 0.6259, + "step": 23460 + }, + { + "epoch": 0.81, + "learning_rate": 1.6800144190834168e-06, + "loss": 0.6727, + "step": 23461 + }, + { + "epoch": 0.81, + "learning_rate": 1.6794103904091884e-06, + "loss": 0.672, + "step": 23462 + }, + { + "epoch": 0.81, + "learning_rate": 1.6788064603860766e-06, + "loss": 0.6426, + "step": 23463 + }, + { + "epoch": 0.81, + "learning_rate": 1.6782026290212406e-06, + "loss": 0.5593, + "step": 23464 + }, + { + "epoch": 0.81, + "learning_rate": 1.6775988963218393e-06, + "loss": 0.6126, + "step": 23465 + }, + { + "epoch": 0.81, + "learning_rate": 1.6769952622950302e-06, + "loss": 0.7035, + "step": 23466 + }, + { + "epoch": 0.81, + "learning_rate": 1.6763917269479745e-06, + "loss": 0.5812, + "step": 23467 + }, + { + "epoch": 0.81, + "learning_rate": 1.675788290287822e-06, + "loss": 0.6273, + "step": 23468 + }, + { + "epoch": 0.81, + "learning_rate": 1.6751849523217289e-06, + "loss": 0.6667, + "step": 23469 + }, + { + "epoch": 0.81, + "learning_rate": 1.6745817130568487e-06, + "loss": 0.6877, + "step": 23470 + }, + { + "epoch": 0.81, + "learning_rate": 1.6739785725003343e-06, + "loss": 0.641, + "step": 23471 + }, + { + "epoch": 0.81, + "learning_rate": 1.673375530659337e-06, + "loss": 0.6067, + "step": 23472 + }, + { + "epoch": 0.81, + "learning_rate": 1.6727725875410083e-06, + "loss": 0.6375, + "step": 23473 + }, + { + "epoch": 0.81, + "learning_rate": 1.6721697431524919e-06, + "loss": 0.6611, + "step": 23474 + }, + { + "epoch": 0.81, + "learning_rate": 1.6715669975009374e-06, + "loss": 0.5521, + "step": 23475 + }, + { + "epoch": 0.81, + "learning_rate": 1.6709643505934925e-06, + "loss": 0.6245, + "step": 23476 + }, + { + "epoch": 0.81, + "learning_rate": 1.6703618024373014e-06, + "loss": 0.7013, + "step": 23477 + }, + { + "epoch": 0.81, + "learning_rate": 1.6697593530395072e-06, + "loss": 0.651, + "step": 23478 + }, + { + "epoch": 0.81, + "learning_rate": 1.6691570024072578e-06, + "loss": 0.6488, + "step": 23479 + }, + { + "epoch": 0.81, + "learning_rate": 1.6685547505476872e-06, + "loss": 0.6362, + "step": 23480 + }, + { + "epoch": 0.81, + "learning_rate": 1.667952597467939e-06, + "loss": 0.5826, + "step": 23481 + }, + { + "epoch": 0.81, + "learning_rate": 1.6673505431751535e-06, + "loss": 0.6765, + "step": 23482 + }, + { + "epoch": 0.81, + "learning_rate": 1.666748587676469e-06, + "loss": 0.6205, + "step": 23483 + }, + { + "epoch": 0.81, + "learning_rate": 1.6661467309790224e-06, + "loss": 0.6304, + "step": 23484 + }, + { + "epoch": 0.81, + "learning_rate": 1.6655449730899477e-06, + "loss": 0.6802, + "step": 23485 + }, + { + "epoch": 0.81, + "learning_rate": 1.6649433140163796e-06, + "loss": 0.6496, + "step": 23486 + }, + { + "epoch": 0.81, + "learning_rate": 1.6643417537654548e-06, + "loss": 0.6672, + "step": 23487 + }, + { + "epoch": 0.81, + "learning_rate": 1.663740292344298e-06, + "loss": 0.6195, + "step": 23488 + }, + { + "epoch": 0.81, + "learning_rate": 1.6631389297600487e-06, + "loss": 0.564, + "step": 23489 + }, + { + "epoch": 0.81, + "learning_rate": 1.6625376660198356e-06, + "loss": 0.6709, + "step": 23490 + }, + { + "epoch": 0.81, + "learning_rate": 1.661936501130783e-06, + "loss": 0.6428, + "step": 23491 + }, + { + "epoch": 0.81, + "learning_rate": 1.661335435100021e-06, + "loss": 0.5832, + "step": 23492 + }, + { + "epoch": 0.81, + "learning_rate": 1.6607344679346782e-06, + "loss": 0.6303, + "step": 23493 + }, + { + "epoch": 0.81, + "learning_rate": 1.6601335996418733e-06, + "loss": 0.6052, + "step": 23494 + }, + { + "epoch": 0.81, + "learning_rate": 1.6595328302287362e-06, + "loss": 0.6183, + "step": 23495 + }, + { + "epoch": 0.81, + "learning_rate": 1.65893215970239e-06, + "loss": 0.6144, + "step": 23496 + }, + { + "epoch": 0.81, + "learning_rate": 1.6583315880699536e-06, + "loss": 0.6528, + "step": 23497 + }, + { + "epoch": 0.81, + "learning_rate": 1.6577311153385478e-06, + "loss": 0.7047, + "step": 23498 + }, + { + "epoch": 0.81, + "learning_rate": 1.6571307415152948e-06, + "loss": 0.6503, + "step": 23499 + }, + { + "epoch": 0.81, + "learning_rate": 1.6565304666073056e-06, + "loss": 0.5955, + "step": 23500 + }, + { + "epoch": 0.81, + "learning_rate": 1.6559302906217055e-06, + "loss": 0.6543, + "step": 23501 + }, + { + "epoch": 0.81, + "learning_rate": 1.655330213565609e-06, + "loss": 0.6552, + "step": 23502 + }, + { + "epoch": 0.81, + "learning_rate": 1.654730235446127e-06, + "loss": 0.6304, + "step": 23503 + }, + { + "epoch": 0.81, + "learning_rate": 1.6541303562703748e-06, + "loss": 0.6502, + "step": 23504 + }, + { + "epoch": 0.81, + "learning_rate": 1.6535305760454667e-06, + "loss": 0.6251, + "step": 23505 + }, + { + "epoch": 0.81, + "learning_rate": 1.6529308947785094e-06, + "loss": 0.6352, + "step": 23506 + }, + { + "epoch": 0.81, + "learning_rate": 1.652331312476614e-06, + "loss": 0.6412, + "step": 23507 + }, + { + "epoch": 0.81, + "learning_rate": 1.6517318291468954e-06, + "loss": 0.6676, + "step": 23508 + }, + { + "epoch": 0.81, + "learning_rate": 1.6511324447964527e-06, + "loss": 0.5901, + "step": 23509 + }, + { + "epoch": 0.81, + "learning_rate": 1.650533159432398e-06, + "loss": 0.651, + "step": 23510 + }, + { + "epoch": 0.81, + "learning_rate": 1.6499339730618357e-06, + "loss": 0.6044, + "step": 23511 + }, + { + "epoch": 0.81, + "learning_rate": 1.6493348856918678e-06, + "loss": 0.63, + "step": 23512 + }, + { + "epoch": 0.81, + "learning_rate": 1.6487358973295965e-06, + "loss": 0.6528, + "step": 23513 + }, + { + "epoch": 0.81, + "learning_rate": 1.648137007982129e-06, + "loss": 0.6498, + "step": 23514 + }, + { + "epoch": 0.81, + "learning_rate": 1.6475382176565602e-06, + "loss": 0.5843, + "step": 23515 + }, + { + "epoch": 0.81, + "learning_rate": 1.646939526359993e-06, + "loss": 0.6256, + "step": 23516 + }, + { + "epoch": 0.81, + "learning_rate": 1.6463409340995252e-06, + "loss": 0.6257, + "step": 23517 + }, + { + "epoch": 0.81, + "learning_rate": 1.645742440882252e-06, + "loss": 0.6223, + "step": 23518 + }, + { + "epoch": 0.81, + "learning_rate": 1.6451440467152668e-06, + "loss": 0.6072, + "step": 23519 + }, + { + "epoch": 0.81, + "learning_rate": 1.644545751605674e-06, + "loss": 0.6179, + "step": 23520 + }, + { + "epoch": 0.81, + "learning_rate": 1.6439475555605578e-06, + "loss": 0.6586, + "step": 23521 + }, + { + "epoch": 0.81, + "learning_rate": 1.6433494585870136e-06, + "loss": 0.6474, + "step": 23522 + }, + { + "epoch": 0.82, + "learning_rate": 1.6427514606921357e-06, + "loss": 0.5896, + "step": 23523 + }, + { + "epoch": 0.82, + "learning_rate": 1.6421535618830087e-06, + "loss": 0.6461, + "step": 23524 + }, + { + "epoch": 0.82, + "learning_rate": 1.641555762166721e-06, + "loss": 0.5805, + "step": 23525 + }, + { + "epoch": 0.82, + "learning_rate": 1.6409580615503684e-06, + "loss": 0.5799, + "step": 23526 + }, + { + "epoch": 0.82, + "learning_rate": 1.6403604600410294e-06, + "loss": 0.6826, + "step": 23527 + }, + { + "epoch": 0.82, + "learning_rate": 1.639762957645793e-06, + "loss": 0.6033, + "step": 23528 + }, + { + "epoch": 0.82, + "learning_rate": 1.6391655543717444e-06, + "loss": 0.6405, + "step": 23529 + }, + { + "epoch": 0.82, + "learning_rate": 1.6385682502259627e-06, + "loss": 0.6112, + "step": 23530 + }, + { + "epoch": 0.82, + "learning_rate": 1.6379710452155285e-06, + "loss": 0.5966, + "step": 23531 + }, + { + "epoch": 0.82, + "learning_rate": 1.6373739393475308e-06, + "loss": 0.6206, + "step": 23532 + }, + { + "epoch": 0.82, + "learning_rate": 1.6367769326290417e-06, + "loss": 0.6624, + "step": 23533 + }, + { + "epoch": 0.82, + "learning_rate": 1.636180025067141e-06, + "loss": 0.6724, + "step": 23534 + }, + { + "epoch": 0.82, + "learning_rate": 1.6355832166689089e-06, + "loss": 0.66, + "step": 23535 + }, + { + "epoch": 0.82, + "learning_rate": 1.6349865074414173e-06, + "loss": 0.6819, + "step": 23536 + }, + { + "epoch": 0.82, + "learning_rate": 1.6343898973917395e-06, + "loss": 0.653, + "step": 23537 + }, + { + "epoch": 0.82, + "learning_rate": 1.6337933865269562e-06, + "loss": 0.5999, + "step": 23538 + }, + { + "epoch": 0.82, + "learning_rate": 1.6331969748541331e-06, + "loss": 0.6149, + "step": 23539 + }, + { + "epoch": 0.82, + "learning_rate": 1.6326006623803448e-06, + "loss": 0.6407, + "step": 23540 + }, + { + "epoch": 0.82, + "learning_rate": 1.632004449112663e-06, + "loss": 0.6759, + "step": 23541 + }, + { + "epoch": 0.82, + "learning_rate": 1.6314083350581512e-06, + "loss": 0.5859, + "step": 23542 + }, + { + "epoch": 0.82, + "learning_rate": 1.6308123202238769e-06, + "loss": 0.6406, + "step": 23543 + }, + { + "epoch": 0.82, + "learning_rate": 1.6302164046169156e-06, + "loss": 0.6669, + "step": 23544 + }, + { + "epoch": 0.82, + "learning_rate": 1.6296205882443239e-06, + "loss": 0.6578, + "step": 23545 + }, + { + "epoch": 0.82, + "learning_rate": 1.6290248711131707e-06, + "loss": 0.6519, + "step": 23546 + }, + { + "epoch": 0.82, + "learning_rate": 1.6284292532305146e-06, + "loss": 0.6556, + "step": 23547 + }, + { + "epoch": 0.82, + "learning_rate": 1.62783373460342e-06, + "loss": 0.6341, + "step": 23548 + }, + { + "epoch": 0.82, + "learning_rate": 1.627238315238947e-06, + "loss": 0.6325, + "step": 23549 + }, + { + "epoch": 0.82, + "learning_rate": 1.6266429951441566e-06, + "loss": 0.6009, + "step": 23550 + }, + { + "epoch": 0.82, + "learning_rate": 1.626047774326104e-06, + "loss": 0.6543, + "step": 23551 + }, + { + "epoch": 0.82, + "learning_rate": 1.6254526527918512e-06, + "loss": 0.6506, + "step": 23552 + }, + { + "epoch": 0.82, + "learning_rate": 1.6248576305484497e-06, + "loss": 0.6187, + "step": 23553 + }, + { + "epoch": 0.82, + "learning_rate": 1.6242627076029549e-06, + "loss": 0.6205, + "step": 23554 + }, + { + "epoch": 0.82, + "learning_rate": 1.623667883962421e-06, + "loss": 0.6089, + "step": 23555 + }, + { + "epoch": 0.82, + "learning_rate": 1.6230731596339e-06, + "loss": 0.6579, + "step": 23556 + }, + { + "epoch": 0.82, + "learning_rate": 1.6224785346244443e-06, + "loss": 0.6057, + "step": 23557 + }, + { + "epoch": 0.82, + "learning_rate": 1.6218840089411047e-06, + "loss": 0.6406, + "step": 23558 + }, + { + "epoch": 0.82, + "learning_rate": 1.621289582590927e-06, + "loss": 0.5979, + "step": 23559 + }, + { + "epoch": 0.82, + "learning_rate": 1.6206952555809607e-06, + "loss": 0.6673, + "step": 23560 + }, + { + "epoch": 0.82, + "learning_rate": 1.6201010279182506e-06, + "loss": 0.6748, + "step": 23561 + }, + { + "epoch": 0.82, + "learning_rate": 1.6195068996098451e-06, + "loss": 0.6667, + "step": 23562 + }, + { + "epoch": 0.82, + "learning_rate": 1.6189128706627855e-06, + "loss": 0.641, + "step": 23563 + }, + { + "epoch": 0.82, + "learning_rate": 1.6183189410841193e-06, + "loss": 0.5954, + "step": 23564 + }, + { + "epoch": 0.82, + "learning_rate": 1.617725110880881e-06, + "loss": 0.5803, + "step": 23565 + }, + { + "epoch": 0.82, + "learning_rate": 1.6171313800601163e-06, + "loss": 0.5847, + "step": 23566 + }, + { + "epoch": 0.82, + "learning_rate": 1.6165377486288635e-06, + "loss": 0.5924, + "step": 23567 + }, + { + "epoch": 0.82, + "learning_rate": 1.6159442165941607e-06, + "loss": 0.6335, + "step": 23568 + }, + { + "epoch": 0.82, + "learning_rate": 1.6153507839630457e-06, + "loss": 0.6367, + "step": 23569 + }, + { + "epoch": 0.82, + "learning_rate": 1.6147574507425546e-06, + "loss": 0.5806, + "step": 23570 + }, + { + "epoch": 0.82, + "learning_rate": 1.6141642169397199e-06, + "loss": 0.6587, + "step": 23571 + }, + { + "epoch": 0.82, + "learning_rate": 1.613571082561577e-06, + "loss": 0.6439, + "step": 23572 + }, + { + "epoch": 0.82, + "learning_rate": 1.6129780476151568e-06, + "loss": 0.6831, + "step": 23573 + }, + { + "epoch": 0.82, + "learning_rate": 1.6123851121074919e-06, + "loss": 0.694, + "step": 23574 + }, + { + "epoch": 0.82, + "learning_rate": 1.6117922760456118e-06, + "loss": 0.6327, + "step": 23575 + }, + { + "epoch": 0.82, + "learning_rate": 1.6111995394365488e-06, + "loss": 0.6231, + "step": 23576 + }, + { + "epoch": 0.82, + "learning_rate": 1.6106069022873239e-06, + "loss": 0.6163, + "step": 23577 + }, + { + "epoch": 0.82, + "learning_rate": 1.610014364604966e-06, + "loss": 0.6103, + "step": 23578 + }, + { + "epoch": 0.82, + "learning_rate": 1.6094219263965028e-06, + "loss": 0.654, + "step": 23579 + }, + { + "epoch": 0.82, + "learning_rate": 1.6088295876689553e-06, + "loss": 0.6686, + "step": 23580 + }, + { + "epoch": 0.82, + "learning_rate": 1.608237348429349e-06, + "loss": 0.6139, + "step": 23581 + }, + { + "epoch": 0.82, + "learning_rate": 1.607645208684706e-06, + "loss": 0.648, + "step": 23582 + }, + { + "epoch": 0.82, + "learning_rate": 1.6070531684420442e-06, + "loss": 0.6881, + "step": 23583 + }, + { + "epoch": 0.82, + "learning_rate": 1.6064612277083835e-06, + "loss": 0.6412, + "step": 23584 + }, + { + "epoch": 0.82, + "learning_rate": 1.6058693864907426e-06, + "loss": 0.6359, + "step": 23585 + }, + { + "epoch": 0.82, + "learning_rate": 1.6052776447961393e-06, + "loss": 0.6111, + "step": 23586 + }, + { + "epoch": 0.82, + "learning_rate": 1.6046860026315892e-06, + "loss": 0.6415, + "step": 23587 + }, + { + "epoch": 0.82, + "learning_rate": 1.6040944600041086e-06, + "loss": 0.6397, + "step": 23588 + }, + { + "epoch": 0.82, + "learning_rate": 1.6035030169207067e-06, + "loss": 0.6682, + "step": 23589 + }, + { + "epoch": 0.82, + "learning_rate": 1.6029116733883977e-06, + "loss": 0.6274, + "step": 23590 + }, + { + "epoch": 0.82, + "learning_rate": 1.6023204294141936e-06, + "loss": 0.668, + "step": 23591 + }, + { + "epoch": 0.82, + "learning_rate": 1.6017292850051037e-06, + "loss": 0.5841, + "step": 23592 + }, + { + "epoch": 0.82, + "learning_rate": 1.6011382401681375e-06, + "loss": 0.6689, + "step": 23593 + }, + { + "epoch": 0.82, + "learning_rate": 1.600547294910304e-06, + "loss": 0.6302, + "step": 23594 + }, + { + "epoch": 0.82, + "learning_rate": 1.5999564492386054e-06, + "loss": 0.6923, + "step": 23595 + }, + { + "epoch": 0.82, + "learning_rate": 1.5993657031600495e-06, + "loss": 0.5981, + "step": 23596 + }, + { + "epoch": 0.82, + "learning_rate": 1.5987750566816396e-06, + "loss": 0.6102, + "step": 23597 + }, + { + "epoch": 0.82, + "learning_rate": 1.59818450981038e-06, + "loss": 0.6336, + "step": 23598 + }, + { + "epoch": 0.82, + "learning_rate": 1.5975940625532705e-06, + "loss": 0.6906, + "step": 23599 + }, + { + "epoch": 0.82, + "learning_rate": 1.5970037149173145e-06, + "loss": 0.6422, + "step": 23600 + }, + { + "epoch": 0.82, + "learning_rate": 1.5964134669095078e-06, + "loss": 0.6096, + "step": 23601 + }, + { + "epoch": 0.82, + "learning_rate": 1.5958233185368488e-06, + "loss": 0.6126, + "step": 23602 + }, + { + "epoch": 0.82, + "learning_rate": 1.5952332698063367e-06, + "loss": 0.6466, + "step": 23603 + }, + { + "epoch": 0.82, + "learning_rate": 1.5946433207249668e-06, + "loss": 0.6487, + "step": 23604 + }, + { + "epoch": 0.82, + "learning_rate": 1.5940534712997324e-06, + "loss": 0.6622, + "step": 23605 + }, + { + "epoch": 0.82, + "learning_rate": 1.5934637215376303e-06, + "loss": 0.6554, + "step": 23606 + }, + { + "epoch": 0.82, + "learning_rate": 1.592874071445647e-06, + "loss": 0.6332, + "step": 23607 + }, + { + "epoch": 0.82, + "learning_rate": 1.592284521030777e-06, + "loss": 0.5895, + "step": 23608 + }, + { + "epoch": 0.82, + "learning_rate": 1.59169507030001e-06, + "loss": 0.6393, + "step": 23609 + }, + { + "epoch": 0.82, + "learning_rate": 1.5911057192603351e-06, + "loss": 0.6511, + "step": 23610 + }, + { + "epoch": 0.82, + "learning_rate": 1.5905164679187412e-06, + "loss": 0.5737, + "step": 23611 + }, + { + "epoch": 0.82, + "learning_rate": 1.5899273162822094e-06, + "loss": 0.5967, + "step": 23612 + }, + { + "epoch": 0.82, + "learning_rate": 1.5893382643577294e-06, + "loss": 0.6198, + "step": 23613 + }, + { + "epoch": 0.82, + "learning_rate": 1.5887493121522824e-06, + "loss": 0.6306, + "step": 23614 + }, + { + "epoch": 0.82, + "learning_rate": 1.5881604596728539e-06, + "loss": 0.5959, + "step": 23615 + }, + { + "epoch": 0.82, + "learning_rate": 1.587571706926424e-06, + "loss": 0.5802, + "step": 23616 + }, + { + "epoch": 0.82, + "learning_rate": 1.5869830539199748e-06, + "loss": 0.6078, + "step": 23617 + }, + { + "epoch": 0.82, + "learning_rate": 1.586394500660482e-06, + "loss": 0.6116, + "step": 23618 + }, + { + "epoch": 0.82, + "learning_rate": 1.5858060471549263e-06, + "loss": 0.6744, + "step": 23619 + }, + { + "epoch": 0.82, + "learning_rate": 1.5852176934102824e-06, + "loss": 0.6588, + "step": 23620 + }, + { + "epoch": 0.82, + "learning_rate": 1.5846294394335292e-06, + "loss": 0.6082, + "step": 23621 + }, + { + "epoch": 0.82, + "learning_rate": 1.5840412852316389e-06, + "loss": 0.6195, + "step": 23622 + }, + { + "epoch": 0.82, + "learning_rate": 1.583453230811588e-06, + "loss": 0.657, + "step": 23623 + }, + { + "epoch": 0.82, + "learning_rate": 1.5828652761803432e-06, + "loss": 0.6051, + "step": 23624 + }, + { + "epoch": 0.82, + "learning_rate": 1.5822774213448777e-06, + "loss": 0.6245, + "step": 23625 + }, + { + "epoch": 0.82, + "learning_rate": 1.5816896663121628e-06, + "loss": 0.5916, + "step": 23626 + }, + { + "epoch": 0.82, + "learning_rate": 1.581102011089166e-06, + "loss": 0.6301, + "step": 23627 + }, + { + "epoch": 0.82, + "learning_rate": 1.5805144556828544e-06, + "loss": 0.6616, + "step": 23628 + }, + { + "epoch": 0.82, + "learning_rate": 1.5799270001001977e-06, + "loss": 0.7073, + "step": 23629 + }, + { + "epoch": 0.82, + "learning_rate": 1.5793396443481556e-06, + "loss": 0.6699, + "step": 23630 + }, + { + "epoch": 0.82, + "learning_rate": 1.578752388433693e-06, + "loss": 0.6478, + "step": 23631 + }, + { + "epoch": 0.82, + "learning_rate": 1.5781652323637753e-06, + "loss": 0.6287, + "step": 23632 + }, + { + "epoch": 0.82, + "learning_rate": 1.5775781761453612e-06, + "loss": 0.641, + "step": 23633 + }, + { + "epoch": 0.82, + "learning_rate": 1.5769912197854131e-06, + "loss": 0.6066, + "step": 23634 + }, + { + "epoch": 0.82, + "learning_rate": 1.576404363290891e-06, + "loss": 0.6342, + "step": 23635 + }, + { + "epoch": 0.82, + "learning_rate": 1.5758176066687492e-06, + "loss": 0.6001, + "step": 23636 + }, + { + "epoch": 0.82, + "learning_rate": 1.5752309499259454e-06, + "loss": 0.6428, + "step": 23637 + }, + { + "epoch": 0.82, + "learning_rate": 1.5746443930694367e-06, + "loss": 0.635, + "step": 23638 + }, + { + "epoch": 0.82, + "learning_rate": 1.574057936106177e-06, + "loss": 0.6811, + "step": 23639 + }, + { + "epoch": 0.82, + "learning_rate": 1.5734715790431188e-06, + "loss": 0.6526, + "step": 23640 + }, + { + "epoch": 0.82, + "learning_rate": 1.5728853218872175e-06, + "loss": 0.6562, + "step": 23641 + }, + { + "epoch": 0.82, + "learning_rate": 1.5722991646454189e-06, + "loss": 0.6003, + "step": 23642 + }, + { + "epoch": 0.82, + "learning_rate": 1.571713107324675e-06, + "loss": 0.6564, + "step": 23643 + }, + { + "epoch": 0.82, + "learning_rate": 1.5711271499319336e-06, + "loss": 0.6149, + "step": 23644 + }, + { + "epoch": 0.82, + "learning_rate": 1.5705412924741414e-06, + "loss": 0.6405, + "step": 23645 + }, + { + "epoch": 0.82, + "learning_rate": 1.5699555349582474e-06, + "loss": 0.6336, + "step": 23646 + }, + { + "epoch": 0.82, + "learning_rate": 1.5693698773911959e-06, + "loss": 0.6228, + "step": 23647 + }, + { + "epoch": 0.82, + "learning_rate": 1.5687843197799269e-06, + "loss": 0.5782, + "step": 23648 + }, + { + "epoch": 0.82, + "learning_rate": 1.5681988621313847e-06, + "loss": 0.615, + "step": 23649 + }, + { + "epoch": 0.82, + "learning_rate": 1.567613504452513e-06, + "loss": 0.6057, + "step": 23650 + }, + { + "epoch": 0.82, + "learning_rate": 1.5670282467502497e-06, + "loss": 0.5652, + "step": 23651 + }, + { + "epoch": 0.82, + "learning_rate": 1.566443089031533e-06, + "loss": 0.6017, + "step": 23652 + }, + { + "epoch": 0.82, + "learning_rate": 1.5658580313033056e-06, + "loss": 0.6231, + "step": 23653 + }, + { + "epoch": 0.82, + "learning_rate": 1.5652730735724974e-06, + "loss": 0.642, + "step": 23654 + }, + { + "epoch": 0.82, + "learning_rate": 1.5646882158460474e-06, + "loss": 0.6056, + "step": 23655 + }, + { + "epoch": 0.82, + "learning_rate": 1.5641034581308889e-06, + "loss": 0.61, + "step": 23656 + }, + { + "epoch": 0.82, + "learning_rate": 1.5635188004339563e-06, + "loss": 0.6932, + "step": 23657 + }, + { + "epoch": 0.82, + "learning_rate": 1.5629342427621797e-06, + "loss": 0.6384, + "step": 23658 + }, + { + "epoch": 0.82, + "learning_rate": 1.5623497851224934e-06, + "loss": 0.6259, + "step": 23659 + }, + { + "epoch": 0.82, + "learning_rate": 1.5617654275218209e-06, + "loss": 0.6066, + "step": 23660 + }, + { + "epoch": 0.82, + "learning_rate": 1.5611811699670943e-06, + "loss": 0.5846, + "step": 23661 + }, + { + "epoch": 0.82, + "learning_rate": 1.5605970124652404e-06, + "loss": 0.6158, + "step": 23662 + }, + { + "epoch": 0.82, + "learning_rate": 1.5600129550231845e-06, + "loss": 0.583, + "step": 23663 + }, + { + "epoch": 0.82, + "learning_rate": 1.5594289976478516e-06, + "loss": 0.655, + "step": 23664 + }, + { + "epoch": 0.82, + "learning_rate": 1.558845140346168e-06, + "loss": 0.6449, + "step": 23665 + }, + { + "epoch": 0.82, + "learning_rate": 1.5582613831250504e-06, + "loss": 0.659, + "step": 23666 + }, + { + "epoch": 0.82, + "learning_rate": 1.5576777259914234e-06, + "loss": 0.7006, + "step": 23667 + }, + { + "epoch": 0.82, + "learning_rate": 1.5570941689522058e-06, + "loss": 0.6724, + "step": 23668 + }, + { + "epoch": 0.82, + "learning_rate": 1.5565107120143186e-06, + "loss": 0.6869, + "step": 23669 + }, + { + "epoch": 0.82, + "learning_rate": 1.5559273551846788e-06, + "loss": 0.6285, + "step": 23670 + }, + { + "epoch": 0.82, + "learning_rate": 1.5553440984702005e-06, + "loss": 0.6602, + "step": 23671 + }, + { + "epoch": 0.82, + "learning_rate": 1.554760941877801e-06, + "loss": 0.6476, + "step": 23672 + }, + { + "epoch": 0.82, + "learning_rate": 1.5541778854143929e-06, + "loss": 0.6277, + "step": 23673 + }, + { + "epoch": 0.82, + "learning_rate": 1.55359492908689e-06, + "loss": 0.6888, + "step": 23674 + }, + { + "epoch": 0.82, + "learning_rate": 1.5530120729022035e-06, + "loss": 0.6759, + "step": 23675 + }, + { + "epoch": 0.82, + "learning_rate": 1.5524293168672478e-06, + "loss": 0.6746, + "step": 23676 + }, + { + "epoch": 0.82, + "learning_rate": 1.551846660988926e-06, + "loss": 0.6337, + "step": 23677 + }, + { + "epoch": 0.82, + "learning_rate": 1.5512641052741494e-06, + "loss": 0.6316, + "step": 23678 + }, + { + "epoch": 0.82, + "learning_rate": 1.5506816497298238e-06, + "loss": 0.6035, + "step": 23679 + }, + { + "epoch": 0.82, + "learning_rate": 1.5500992943628568e-06, + "loss": 0.6137, + "step": 23680 + }, + { + "epoch": 0.82, + "learning_rate": 1.5495170391801506e-06, + "loss": 0.6322, + "step": 23681 + }, + { + "epoch": 0.82, + "learning_rate": 1.548934884188613e-06, + "loss": 0.6366, + "step": 23682 + }, + { + "epoch": 0.82, + "learning_rate": 1.54835282939514e-06, + "loss": 0.6093, + "step": 23683 + }, + { + "epoch": 0.82, + "learning_rate": 1.5477708748066357e-06, + "loss": 0.6348, + "step": 23684 + }, + { + "epoch": 0.82, + "learning_rate": 1.54718902043e-06, + "loss": 0.6239, + "step": 23685 + }, + { + "epoch": 0.82, + "learning_rate": 1.546607266272132e-06, + "loss": 0.6207, + "step": 23686 + }, + { + "epoch": 0.82, + "learning_rate": 1.5460256123399275e-06, + "loss": 0.6295, + "step": 23687 + }, + { + "epoch": 0.82, + "learning_rate": 1.5454440586402864e-06, + "loss": 0.6147, + "step": 23688 + }, + { + "epoch": 0.82, + "learning_rate": 1.5448626051800985e-06, + "loss": 0.6226, + "step": 23689 + }, + { + "epoch": 0.82, + "learning_rate": 1.544281251966261e-06, + "loss": 0.5993, + "step": 23690 + }, + { + "epoch": 0.82, + "learning_rate": 1.5436999990056646e-06, + "loss": 0.5381, + "step": 23691 + }, + { + "epoch": 0.82, + "learning_rate": 1.5431188463052028e-06, + "loss": 0.6244, + "step": 23692 + }, + { + "epoch": 0.82, + "learning_rate": 1.5425377938717644e-06, + "loss": 0.6639, + "step": 23693 + }, + { + "epoch": 0.82, + "learning_rate": 1.5419568417122421e-06, + "loss": 0.6511, + "step": 23694 + }, + { + "epoch": 0.82, + "learning_rate": 1.541375989833519e-06, + "loss": 0.654, + "step": 23695 + }, + { + "epoch": 0.82, + "learning_rate": 1.5407952382424829e-06, + "loss": 0.6135, + "step": 23696 + }, + { + "epoch": 0.82, + "learning_rate": 1.5402145869460228e-06, + "loss": 0.6346, + "step": 23697 + }, + { + "epoch": 0.82, + "learning_rate": 1.5396340359510164e-06, + "loss": 0.6394, + "step": 23698 + }, + { + "epoch": 0.82, + "learning_rate": 1.539053585264353e-06, + "loss": 0.6086, + "step": 23699 + }, + { + "epoch": 0.82, + "learning_rate": 1.5384732348929143e-06, + "loss": 0.674, + "step": 23700 + }, + { + "epoch": 0.82, + "learning_rate": 1.5378929848435776e-06, + "loss": 0.6511, + "step": 23701 + }, + { + "epoch": 0.82, + "learning_rate": 1.5373128351232236e-06, + "loss": 0.6952, + "step": 23702 + }, + { + "epoch": 0.82, + "learning_rate": 1.5367327857387337e-06, + "loss": 0.6474, + "step": 23703 + }, + { + "epoch": 0.82, + "learning_rate": 1.5361528366969781e-06, + "loss": 0.6551, + "step": 23704 + }, + { + "epoch": 0.82, + "learning_rate": 1.5355729880048398e-06, + "loss": 0.5565, + "step": 23705 + }, + { + "epoch": 0.82, + "learning_rate": 1.5349932396691936e-06, + "loss": 0.6147, + "step": 23706 + }, + { + "epoch": 0.82, + "learning_rate": 1.5344135916969084e-06, + "loss": 0.6663, + "step": 23707 + }, + { + "epoch": 0.82, + "learning_rate": 1.5338340440948595e-06, + "loss": 0.6086, + "step": 23708 + }, + { + "epoch": 0.82, + "learning_rate": 1.5332545968699198e-06, + "loss": 0.6659, + "step": 23709 + }, + { + "epoch": 0.82, + "learning_rate": 1.5326752500289522e-06, + "loss": 0.6664, + "step": 23710 + }, + { + "epoch": 0.82, + "learning_rate": 1.5320960035788334e-06, + "loss": 0.6437, + "step": 23711 + }, + { + "epoch": 0.82, + "learning_rate": 1.5315168575264317e-06, + "loss": 0.5965, + "step": 23712 + }, + { + "epoch": 0.82, + "learning_rate": 1.5309378118786066e-06, + "loss": 0.5973, + "step": 23713 + }, + { + "epoch": 0.82, + "learning_rate": 1.5303588666422287e-06, + "loss": 0.6823, + "step": 23714 + }, + { + "epoch": 0.82, + "learning_rate": 1.529780021824162e-06, + "loss": 0.6205, + "step": 23715 + }, + { + "epoch": 0.82, + "learning_rate": 1.5292012774312626e-06, + "loss": 0.6395, + "step": 23716 + }, + { + "epoch": 0.82, + "learning_rate": 1.5286226334704013e-06, + "loss": 0.6278, + "step": 23717 + }, + { + "epoch": 0.82, + "learning_rate": 1.5280440899484372e-06, + "loss": 0.6048, + "step": 23718 + }, + { + "epoch": 0.82, + "learning_rate": 1.5274656468722249e-06, + "loss": 0.6379, + "step": 23719 + }, + { + "epoch": 0.82, + "learning_rate": 1.5268873042486243e-06, + "loss": 0.5879, + "step": 23720 + }, + { + "epoch": 0.82, + "learning_rate": 1.5263090620844968e-06, + "loss": 0.6561, + "step": 23721 + }, + { + "epoch": 0.82, + "learning_rate": 1.5257309203866898e-06, + "loss": 0.6062, + "step": 23722 + }, + { + "epoch": 0.82, + "learning_rate": 1.525152879162065e-06, + "loss": 0.621, + "step": 23723 + }, + { + "epoch": 0.82, + "learning_rate": 1.5245749384174758e-06, + "loss": 0.6752, + "step": 23724 + }, + { + "epoch": 0.82, + "learning_rate": 1.5239970981597697e-06, + "loss": 0.594, + "step": 23725 + }, + { + "epoch": 0.82, + "learning_rate": 1.5234193583958e-06, + "loss": 0.5786, + "step": 23726 + }, + { + "epoch": 0.82, + "learning_rate": 1.5228417191324197e-06, + "loss": 0.5866, + "step": 23727 + }, + { + "epoch": 0.82, + "learning_rate": 1.5222641803764692e-06, + "loss": 0.6572, + "step": 23728 + }, + { + "epoch": 0.82, + "learning_rate": 1.5216867421348035e-06, + "loss": 0.6192, + "step": 23729 + }, + { + "epoch": 0.82, + "learning_rate": 1.5211094044142694e-06, + "loss": 0.6454, + "step": 23730 + }, + { + "epoch": 0.82, + "learning_rate": 1.5205321672217066e-06, + "loss": 0.6553, + "step": 23731 + }, + { + "epoch": 0.82, + "learning_rate": 1.5199550305639621e-06, + "loss": 0.5977, + "step": 23732 + }, + { + "epoch": 0.82, + "learning_rate": 1.5193779944478793e-06, + "loss": 0.6001, + "step": 23733 + }, + { + "epoch": 0.82, + "learning_rate": 1.5188010588802949e-06, + "loss": 0.6895, + "step": 23734 + }, + { + "epoch": 0.82, + "learning_rate": 1.5182242238680567e-06, + "loss": 0.6318, + "step": 23735 + }, + { + "epoch": 0.82, + "learning_rate": 1.517647489417997e-06, + "loss": 0.6254, + "step": 23736 + }, + { + "epoch": 0.82, + "learning_rate": 1.5170708555369574e-06, + "loss": 0.5948, + "step": 23737 + }, + { + "epoch": 0.82, + "learning_rate": 1.5164943222317763e-06, + "loss": 0.6653, + "step": 23738 + }, + { + "epoch": 0.82, + "learning_rate": 1.515917889509283e-06, + "loss": 0.5969, + "step": 23739 + }, + { + "epoch": 0.82, + "learning_rate": 1.515341557376314e-06, + "loss": 0.5986, + "step": 23740 + }, + { + "epoch": 0.82, + "learning_rate": 1.51476532583971e-06, + "loss": 0.6857, + "step": 23741 + }, + { + "epoch": 0.82, + "learning_rate": 1.5141891949062927e-06, + "loss": 0.5995, + "step": 23742 + }, + { + "epoch": 0.82, + "learning_rate": 1.5136131645828977e-06, + "loss": 0.6712, + "step": 23743 + }, + { + "epoch": 0.82, + "learning_rate": 1.5130372348763567e-06, + "loss": 0.6457, + "step": 23744 + }, + { + "epoch": 0.82, + "learning_rate": 1.5124614057934928e-06, + "loss": 0.6262, + "step": 23745 + }, + { + "epoch": 0.82, + "learning_rate": 1.5118856773411327e-06, + "loss": 0.6713, + "step": 23746 + }, + { + "epoch": 0.82, + "learning_rate": 1.5113100495261112e-06, + "loss": 0.688, + "step": 23747 + }, + { + "epoch": 0.82, + "learning_rate": 1.5107345223552438e-06, + "loss": 0.6206, + "step": 23748 + }, + { + "epoch": 0.82, + "learning_rate": 1.5101590958353584e-06, + "loss": 0.6184, + "step": 23749 + }, + { + "epoch": 0.82, + "learning_rate": 1.5095837699732796e-06, + "loss": 0.6002, + "step": 23750 + }, + { + "epoch": 0.82, + "learning_rate": 1.5090085447758218e-06, + "loss": 0.5846, + "step": 23751 + }, + { + "epoch": 0.82, + "learning_rate": 1.5084334202498075e-06, + "loss": 0.6898, + "step": 23752 + }, + { + "epoch": 0.82, + "learning_rate": 1.507858396402061e-06, + "loss": 0.6131, + "step": 23753 + }, + { + "epoch": 0.82, + "learning_rate": 1.5072834732393938e-06, + "loss": 0.6614, + "step": 23754 + }, + { + "epoch": 0.82, + "learning_rate": 1.5067086507686245e-06, + "loss": 0.6736, + "step": 23755 + }, + { + "epoch": 0.82, + "learning_rate": 1.5061339289965704e-06, + "loss": 0.6, + "step": 23756 + }, + { + "epoch": 0.82, + "learning_rate": 1.5055593079300412e-06, + "loss": 0.6209, + "step": 23757 + }, + { + "epoch": 0.82, + "learning_rate": 1.5049847875758494e-06, + "loss": 0.6525, + "step": 23758 + }, + { + "epoch": 0.82, + "learning_rate": 1.504410367940814e-06, + "loss": 0.6448, + "step": 23759 + }, + { + "epoch": 0.82, + "learning_rate": 1.5038360490317382e-06, + "loss": 0.6132, + "step": 23760 + }, + { + "epoch": 0.82, + "learning_rate": 1.5032618308554337e-06, + "loss": 0.5856, + "step": 23761 + }, + { + "epoch": 0.82, + "learning_rate": 1.5026877134187113e-06, + "loss": 0.6666, + "step": 23762 + }, + { + "epoch": 0.82, + "learning_rate": 1.5021136967283722e-06, + "loss": 0.6277, + "step": 23763 + }, + { + "epoch": 0.82, + "learning_rate": 1.5015397807912235e-06, + "loss": 0.6237, + "step": 23764 + }, + { + "epoch": 0.82, + "learning_rate": 1.5009659656140762e-06, + "loss": 0.6412, + "step": 23765 + }, + { + "epoch": 0.82, + "learning_rate": 1.500392251203725e-06, + "loss": 0.597, + "step": 23766 + }, + { + "epoch": 0.82, + "learning_rate": 1.4998186375669765e-06, + "loss": 0.6139, + "step": 23767 + }, + { + "epoch": 0.82, + "learning_rate": 1.4992451247106344e-06, + "loss": 0.6434, + "step": 23768 + }, + { + "epoch": 0.82, + "learning_rate": 1.4986717126414907e-06, + "loss": 0.6179, + "step": 23769 + }, + { + "epoch": 0.82, + "learning_rate": 1.498098401366347e-06, + "loss": 0.5717, + "step": 23770 + }, + { + "epoch": 0.82, + "learning_rate": 1.4975251908920053e-06, + "loss": 0.6289, + "step": 23771 + }, + { + "epoch": 0.82, + "learning_rate": 1.4969520812252559e-06, + "loss": 0.6101, + "step": 23772 + }, + { + "epoch": 0.82, + "learning_rate": 1.4963790723728966e-06, + "loss": 0.6509, + "step": 23773 + }, + { + "epoch": 0.82, + "learning_rate": 1.4958061643417232e-06, + "loss": 0.6456, + "step": 23774 + }, + { + "epoch": 0.82, + "learning_rate": 1.4952333571385224e-06, + "loss": 0.6269, + "step": 23775 + }, + { + "epoch": 0.82, + "learning_rate": 1.4946606507700866e-06, + "loss": 0.5851, + "step": 23776 + }, + { + "epoch": 0.82, + "learning_rate": 1.4940880452432128e-06, + "loss": 0.7139, + "step": 23777 + }, + { + "epoch": 0.82, + "learning_rate": 1.4935155405646828e-06, + "loss": 0.645, + "step": 23778 + }, + { + "epoch": 0.82, + "learning_rate": 1.4929431367412872e-06, + "loss": 0.6499, + "step": 23779 + }, + { + "epoch": 0.82, + "learning_rate": 1.4923708337798148e-06, + "loss": 0.6637, + "step": 23780 + }, + { + "epoch": 0.82, + "learning_rate": 1.4917986316870459e-06, + "loss": 0.6143, + "step": 23781 + }, + { + "epoch": 0.82, + "learning_rate": 1.4912265304697637e-06, + "loss": 0.6482, + "step": 23782 + }, + { + "epoch": 0.82, + "learning_rate": 1.4906545301347608e-06, + "loss": 0.635, + "step": 23783 + }, + { + "epoch": 0.82, + "learning_rate": 1.4900826306888093e-06, + "loss": 0.6012, + "step": 23784 + }, + { + "epoch": 0.82, + "learning_rate": 1.4895108321386942e-06, + "loss": 0.6001, + "step": 23785 + }, + { + "epoch": 0.82, + "learning_rate": 1.4889391344911952e-06, + "loss": 0.6064, + "step": 23786 + }, + { + "epoch": 0.82, + "learning_rate": 1.4883675377530882e-06, + "loss": 0.5504, + "step": 23787 + }, + { + "epoch": 0.82, + "learning_rate": 1.4877960419311487e-06, + "loss": 0.6783, + "step": 23788 + }, + { + "epoch": 0.82, + "learning_rate": 1.4872246470321594e-06, + "loss": 0.6204, + "step": 23789 + }, + { + "epoch": 0.82, + "learning_rate": 1.486653353062889e-06, + "loss": 0.6794, + "step": 23790 + }, + { + "epoch": 0.82, + "learning_rate": 1.486082160030111e-06, + "loss": 0.6871, + "step": 23791 + }, + { + "epoch": 0.82, + "learning_rate": 1.4855110679406026e-06, + "loss": 0.6235, + "step": 23792 + }, + { + "epoch": 0.82, + "learning_rate": 1.4849400768011291e-06, + "loss": 0.6681, + "step": 23793 + }, + { + "epoch": 0.82, + "learning_rate": 1.4843691866184606e-06, + "loss": 0.6064, + "step": 23794 + }, + { + "epoch": 0.82, + "learning_rate": 1.483798397399372e-06, + "loss": 0.6501, + "step": 23795 + }, + { + "epoch": 0.82, + "learning_rate": 1.4832277091506241e-06, + "loss": 0.6305, + "step": 23796 + }, + { + "epoch": 0.82, + "learning_rate": 1.4826571218789875e-06, + "loss": 0.6688, + "step": 23797 + }, + { + "epoch": 0.82, + "learning_rate": 1.4820866355912234e-06, + "loss": 0.6817, + "step": 23798 + }, + { + "epoch": 0.82, + "learning_rate": 1.4815162502940972e-06, + "loss": 0.6536, + "step": 23799 + }, + { + "epoch": 0.82, + "learning_rate": 1.4809459659943714e-06, + "loss": 0.6768, + "step": 23800 + }, + { + "epoch": 0.82, + "learning_rate": 1.4803757826988086e-06, + "loss": 0.6491, + "step": 23801 + }, + { + "epoch": 0.82, + "learning_rate": 1.4798057004141675e-06, + "loss": 0.5981, + "step": 23802 + }, + { + "epoch": 0.82, + "learning_rate": 1.4792357191472106e-06, + "loss": 0.6165, + "step": 23803 + }, + { + "epoch": 0.82, + "learning_rate": 1.4786658389046904e-06, + "loss": 0.596, + "step": 23804 + }, + { + "epoch": 0.82, + "learning_rate": 1.4780960596933669e-06, + "loss": 0.6726, + "step": 23805 + }, + { + "epoch": 0.82, + "learning_rate": 1.4775263815199947e-06, + "loss": 0.6532, + "step": 23806 + }, + { + "epoch": 0.82, + "learning_rate": 1.4769568043913284e-06, + "loss": 0.6397, + "step": 23807 + }, + { + "epoch": 0.82, + "learning_rate": 1.4763873283141206e-06, + "loss": 0.6064, + "step": 23808 + }, + { + "epoch": 0.82, + "learning_rate": 1.4758179532951255e-06, + "loss": 0.6457, + "step": 23809 + }, + { + "epoch": 0.82, + "learning_rate": 1.4752486793410904e-06, + "loss": 0.5699, + "step": 23810 + }, + { + "epoch": 0.82, + "learning_rate": 1.474679506458765e-06, + "loss": 0.6715, + "step": 23811 + }, + { + "epoch": 0.83, + "learning_rate": 1.4741104346548985e-06, + "loss": 0.6092, + "step": 23812 + }, + { + "epoch": 0.83, + "learning_rate": 1.473541463936239e-06, + "loss": 0.5936, + "step": 23813 + }, + { + "epoch": 0.83, + "learning_rate": 1.4729725943095309e-06, + "loss": 0.6358, + "step": 23814 + }, + { + "epoch": 0.83, + "learning_rate": 1.472403825781522e-06, + "loss": 0.6156, + "step": 23815 + }, + { + "epoch": 0.83, + "learning_rate": 1.4718351583589508e-06, + "loss": 0.6447, + "step": 23816 + }, + { + "epoch": 0.83, + "learning_rate": 1.4712665920485614e-06, + "loss": 0.6522, + "step": 23817 + }, + { + "epoch": 0.83, + "learning_rate": 1.4706981268570963e-06, + "loss": 0.6, + "step": 23818 + }, + { + "epoch": 0.83, + "learning_rate": 1.4701297627912947e-06, + "loss": 0.6222, + "step": 23819 + }, + { + "epoch": 0.83, + "learning_rate": 1.4695614998578945e-06, + "loss": 0.6205, + "step": 23820 + }, + { + "epoch": 0.83, + "learning_rate": 1.4689933380636357e-06, + "loss": 0.6128, + "step": 23821 + }, + { + "epoch": 0.83, + "learning_rate": 1.4684252774152508e-06, + "loss": 0.6668, + "step": 23822 + }, + { + "epoch": 0.83, + "learning_rate": 1.4678573179194778e-06, + "loss": 0.6249, + "step": 23823 + }, + { + "epoch": 0.83, + "learning_rate": 1.4672894595830478e-06, + "loss": 0.6311, + "step": 23824 + }, + { + "epoch": 0.83, + "learning_rate": 1.4667217024126967e-06, + "loss": 0.5693, + "step": 23825 + }, + { + "epoch": 0.83, + "learning_rate": 1.4661540464151535e-06, + "loss": 0.6349, + "step": 23826 + }, + { + "epoch": 0.83, + "learning_rate": 1.4655864915971519e-06, + "loss": 0.64, + "step": 23827 + }, + { + "epoch": 0.83, + "learning_rate": 1.465019037965416e-06, + "loss": 0.6766, + "step": 23828 + }, + { + "epoch": 0.83, + "learning_rate": 1.4644516855266767e-06, + "loss": 0.6608, + "step": 23829 + }, + { + "epoch": 0.83, + "learning_rate": 1.4638844342876602e-06, + "loss": 0.612, + "step": 23830 + }, + { + "epoch": 0.83, + "learning_rate": 1.4633172842550914e-06, + "loss": 0.6715, + "step": 23831 + }, + { + "epoch": 0.83, + "learning_rate": 1.462750235435696e-06, + "loss": 0.7011, + "step": 23832 + }, + { + "epoch": 0.83, + "learning_rate": 1.4621832878361975e-06, + "loss": 0.6816, + "step": 23833 + }, + { + "epoch": 0.83, + "learning_rate": 1.4616164414633149e-06, + "loss": 0.6216, + "step": 23834 + }, + { + "epoch": 0.83, + "learning_rate": 1.4610496963237709e-06, + "loss": 0.6172, + "step": 23835 + }, + { + "epoch": 0.83, + "learning_rate": 1.460483052424284e-06, + "loss": 0.6496, + "step": 23836 + }, + { + "epoch": 0.83, + "learning_rate": 1.4599165097715727e-06, + "loss": 0.5721, + "step": 23837 + }, + { + "epoch": 0.83, + "learning_rate": 1.459350068372355e-06, + "loss": 0.6726, + "step": 23838 + }, + { + "epoch": 0.83, + "learning_rate": 1.4587837282333484e-06, + "loss": 0.6314, + "step": 23839 + }, + { + "epoch": 0.83, + "learning_rate": 1.4582174893612632e-06, + "loss": 0.5748, + "step": 23840 + }, + { + "epoch": 0.83, + "learning_rate": 1.4576513517628144e-06, + "loss": 0.6417, + "step": 23841 + }, + { + "epoch": 0.83, + "learning_rate": 1.4570853154447162e-06, + "loss": 0.6347, + "step": 23842 + }, + { + "epoch": 0.83, + "learning_rate": 1.4565193804136769e-06, + "loss": 0.6122, + "step": 23843 + }, + { + "epoch": 0.83, + "learning_rate": 1.4559535466764096e-06, + "loss": 0.6502, + "step": 23844 + }, + { + "epoch": 0.83, + "learning_rate": 1.4553878142396228e-06, + "loss": 0.6467, + "step": 23845 + }, + { + "epoch": 0.83, + "learning_rate": 1.4548221831100196e-06, + "loss": 0.6237, + "step": 23846 + }, + { + "epoch": 0.83, + "learning_rate": 1.4542566532943092e-06, + "loss": 0.6639, + "step": 23847 + }, + { + "epoch": 0.83, + "learning_rate": 1.4536912247991975e-06, + "loss": 0.6349, + "step": 23848 + }, + { + "epoch": 0.83, + "learning_rate": 1.4531258976313868e-06, + "loss": 0.5806, + "step": 23849 + }, + { + "epoch": 0.83, + "learning_rate": 1.4525606717975804e-06, + "loss": 0.6306, + "step": 23850 + }, + { + "epoch": 0.83, + "learning_rate": 1.4519955473044822e-06, + "loss": 0.6339, + "step": 23851 + }, + { + "epoch": 0.83, + "learning_rate": 1.4514305241587877e-06, + "loss": 0.5798, + "step": 23852 + }, + { + "epoch": 0.83, + "learning_rate": 1.4508656023671986e-06, + "loss": 0.6788, + "step": 23853 + }, + { + "epoch": 0.83, + "learning_rate": 1.4503007819364124e-06, + "loss": 0.6518, + "step": 23854 + }, + { + "epoch": 0.83, + "learning_rate": 1.449736062873126e-06, + "loss": 0.604, + "step": 23855 + }, + { + "epoch": 0.83, + "learning_rate": 1.4491714451840343e-06, + "loss": 0.6104, + "step": 23856 + }, + { + "epoch": 0.83, + "learning_rate": 1.4486069288758354e-06, + "loss": 0.6073, + "step": 23857 + }, + { + "epoch": 0.83, + "learning_rate": 1.4480425139552157e-06, + "loss": 0.6016, + "step": 23858 + }, + { + "epoch": 0.83, + "learning_rate": 1.4474782004288702e-06, + "loss": 0.6468, + "step": 23859 + }, + { + "epoch": 0.83, + "learning_rate": 1.44691398830349e-06, + "loss": 0.6607, + "step": 23860 + }, + { + "epoch": 0.83, + "learning_rate": 1.446349877585763e-06, + "loss": 0.5978, + "step": 23861 + }, + { + "epoch": 0.83, + "learning_rate": 1.4457858682823821e-06, + "loss": 0.6368, + "step": 23862 + }, + { + "epoch": 0.83, + "learning_rate": 1.4452219604000284e-06, + "loss": 0.6026, + "step": 23863 + }, + { + "epoch": 0.83, + "learning_rate": 1.4446581539453907e-06, + "loss": 0.6136, + "step": 23864 + }, + { + "epoch": 0.83, + "learning_rate": 1.4440944489251519e-06, + "loss": 0.6518, + "step": 23865 + }, + { + "epoch": 0.83, + "learning_rate": 1.4435308453459973e-06, + "loss": 0.6236, + "step": 23866 + }, + { + "epoch": 0.83, + "learning_rate": 1.4429673432146085e-06, + "loss": 0.6346, + "step": 23867 + }, + { + "epoch": 0.83, + "learning_rate": 1.442403942537669e-06, + "loss": 0.605, + "step": 23868 + }, + { + "epoch": 0.83, + "learning_rate": 1.4418406433218546e-06, + "loss": 0.6052, + "step": 23869 + }, + { + "epoch": 0.83, + "learning_rate": 1.4412774455738444e-06, + "loss": 0.6007, + "step": 23870 + }, + { + "epoch": 0.83, + "learning_rate": 1.4407143493003173e-06, + "loss": 0.6072, + "step": 23871 + }, + { + "epoch": 0.83, + "learning_rate": 1.4401513545079493e-06, + "loss": 0.6469, + "step": 23872 + }, + { + "epoch": 0.83, + "learning_rate": 1.439588461203415e-06, + "loss": 0.6599, + "step": 23873 + }, + { + "epoch": 0.83, + "learning_rate": 1.4390256693933902e-06, + "loss": 0.6373, + "step": 23874 + }, + { + "epoch": 0.83, + "learning_rate": 1.438462979084544e-06, + "loss": 0.5979, + "step": 23875 + }, + { + "epoch": 0.83, + "learning_rate": 1.4379003902835497e-06, + "loss": 0.6342, + "step": 23876 + }, + { + "epoch": 0.83, + "learning_rate": 1.4373379029970779e-06, + "loss": 0.5868, + "step": 23877 + }, + { + "epoch": 0.83, + "learning_rate": 1.4367755172317965e-06, + "loss": 0.6402, + "step": 23878 + }, + { + "epoch": 0.83, + "learning_rate": 1.4362132329943735e-06, + "loss": 0.6201, + "step": 23879 + }, + { + "epoch": 0.83, + "learning_rate": 1.4356510502914788e-06, + "loss": 0.6351, + "step": 23880 + }, + { + "epoch": 0.83, + "learning_rate": 1.435088969129772e-06, + "loss": 0.6594, + "step": 23881 + }, + { + "epoch": 0.83, + "learning_rate": 1.434526989515921e-06, + "loss": 0.6669, + "step": 23882 + }, + { + "epoch": 0.83, + "learning_rate": 1.4339651114565877e-06, + "loss": 0.7147, + "step": 23883 + }, + { + "epoch": 0.83, + "learning_rate": 1.4334033349584332e-06, + "loss": 0.5992, + "step": 23884 + }, + { + "epoch": 0.83, + "learning_rate": 1.4328416600281202e-06, + "loss": 0.6012, + "step": 23885 + }, + { + "epoch": 0.83, + "learning_rate": 1.4322800866723085e-06, + "loss": 0.6044, + "step": 23886 + }, + { + "epoch": 0.83, + "learning_rate": 1.4317186148976514e-06, + "loss": 0.6276, + "step": 23887 + }, + { + "epoch": 0.83, + "learning_rate": 1.4311572447108102e-06, + "loss": 0.6732, + "step": 23888 + }, + { + "epoch": 0.83, + "learning_rate": 1.4305959761184397e-06, + "loss": 0.6119, + "step": 23889 + }, + { + "epoch": 0.83, + "learning_rate": 1.4300348091271932e-06, + "loss": 0.6827, + "step": 23890 + }, + { + "epoch": 0.83, + "learning_rate": 1.4294737437437256e-06, + "loss": 0.6599, + "step": 23891 + }, + { + "epoch": 0.83, + "learning_rate": 1.4289127799746915e-06, + "loss": 0.6265, + "step": 23892 + }, + { + "epoch": 0.83, + "learning_rate": 1.4283519178267358e-06, + "loss": 0.6933, + "step": 23893 + }, + { + "epoch": 0.83, + "learning_rate": 1.4277911573065117e-06, + "loss": 0.641, + "step": 23894 + }, + { + "epoch": 0.83, + "learning_rate": 1.4272304984206674e-06, + "loss": 0.6369, + "step": 23895 + }, + { + "epoch": 0.83, + "learning_rate": 1.42666994117585e-06, + "loss": 0.6179, + "step": 23896 + }, + { + "epoch": 0.83, + "learning_rate": 1.426109485578705e-06, + "loss": 0.6336, + "step": 23897 + }, + { + "epoch": 0.83, + "learning_rate": 1.4255491316358816e-06, + "loss": 0.6582, + "step": 23898 + }, + { + "epoch": 0.83, + "learning_rate": 1.4249888793540167e-06, + "loss": 0.6414, + "step": 23899 + }, + { + "epoch": 0.83, + "learning_rate": 1.4244287287397563e-06, + "loss": 0.6386, + "step": 23900 + }, + { + "epoch": 0.83, + "learning_rate": 1.4238686797997425e-06, + "loss": 0.577, + "step": 23901 + }, + { + "epoch": 0.83, + "learning_rate": 1.4233087325406136e-06, + "loss": 0.6264, + "step": 23902 + }, + { + "epoch": 0.83, + "learning_rate": 1.4227488869690087e-06, + "loss": 0.5958, + "step": 23903 + }, + { + "epoch": 0.83, + "learning_rate": 1.4221891430915692e-06, + "loss": 0.6118, + "step": 23904 + }, + { + "epoch": 0.83, + "learning_rate": 1.4216295009149251e-06, + "loss": 0.6385, + "step": 23905 + }, + { + "epoch": 0.83, + "learning_rate": 1.4210699604457156e-06, + "loss": 0.6439, + "step": 23906 + }, + { + "epoch": 0.83, + "learning_rate": 1.4205105216905747e-06, + "loss": 0.6475, + "step": 23907 + }, + { + "epoch": 0.83, + "learning_rate": 1.4199511846561343e-06, + "loss": 0.6094, + "step": 23908 + }, + { + "epoch": 0.83, + "learning_rate": 1.419391949349026e-06, + "loss": 0.6234, + "step": 23909 + }, + { + "epoch": 0.83, + "learning_rate": 1.4188328157758824e-06, + "loss": 0.6629, + "step": 23910 + }, + { + "epoch": 0.83, + "learning_rate": 1.4182737839433303e-06, + "loss": 0.6034, + "step": 23911 + }, + { + "epoch": 0.83, + "learning_rate": 1.4177148538579978e-06, + "loss": 0.7097, + "step": 23912 + }, + { + "epoch": 0.83, + "learning_rate": 1.4171560255265114e-06, + "loss": 0.6545, + "step": 23913 + }, + { + "epoch": 0.83, + "learning_rate": 1.4165972989554988e-06, + "loss": 0.6249, + "step": 23914 + }, + { + "epoch": 0.83, + "learning_rate": 1.416038674151583e-06, + "loss": 0.7104, + "step": 23915 + }, + { + "epoch": 0.83, + "learning_rate": 1.4154801511213889e-06, + "loss": 0.609, + "step": 23916 + }, + { + "epoch": 0.83, + "learning_rate": 1.4149217298715356e-06, + "loss": 0.6843, + "step": 23917 + }, + { + "epoch": 0.83, + "learning_rate": 1.4143634104086458e-06, + "loss": 0.5758, + "step": 23918 + }, + { + "epoch": 0.83, + "learning_rate": 1.4138051927393381e-06, + "loss": 0.6432, + "step": 23919 + }, + { + "epoch": 0.83, + "learning_rate": 1.4132470768702323e-06, + "loss": 0.5854, + "step": 23920 + }, + { + "epoch": 0.83, + "learning_rate": 1.412689062807946e-06, + "loss": 0.6914, + "step": 23921 + }, + { + "epoch": 0.83, + "learning_rate": 1.4121311505590918e-06, + "loss": 0.5988, + "step": 23922 + }, + { + "epoch": 0.83, + "learning_rate": 1.4115733401302866e-06, + "loss": 0.6345, + "step": 23923 + }, + { + "epoch": 0.83, + "learning_rate": 1.4110156315281453e-06, + "loss": 0.5423, + "step": 23924 + }, + { + "epoch": 0.83, + "learning_rate": 1.4104580247592758e-06, + "loss": 0.6468, + "step": 23925 + }, + { + "epoch": 0.83, + "learning_rate": 1.409900519830293e-06, + "loss": 0.5911, + "step": 23926 + }, + { + "epoch": 0.83, + "learning_rate": 1.40934311674781e-06, + "loss": 0.5857, + "step": 23927 + }, + { + "epoch": 0.83, + "learning_rate": 1.4087858155184274e-06, + "loss": 0.6259, + "step": 23928 + }, + { + "epoch": 0.83, + "learning_rate": 1.408228616148758e-06, + "loss": 0.6565, + "step": 23929 + }, + { + "epoch": 0.83, + "learning_rate": 1.4076715186454094e-06, + "loss": 0.6777, + "step": 23930 + }, + { + "epoch": 0.83, + "learning_rate": 1.4071145230149797e-06, + "loss": 0.5936, + "step": 23931 + }, + { + "epoch": 0.83, + "learning_rate": 1.4065576292640792e-06, + "loss": 0.566, + "step": 23932 + }, + { + "epoch": 0.83, + "learning_rate": 1.4060008373993118e-06, + "loss": 0.5878, + "step": 23933 + }, + { + "epoch": 0.83, + "learning_rate": 1.405444147427273e-06, + "loss": 0.623, + "step": 23934 + }, + { + "epoch": 0.83, + "learning_rate": 1.4048875593545663e-06, + "loss": 0.6267, + "step": 23935 + }, + { + "epoch": 0.83, + "learning_rate": 1.4043310731877923e-06, + "loss": 0.579, + "step": 23936 + }, + { + "epoch": 0.83, + "learning_rate": 1.4037746889335435e-06, + "loss": 0.6399, + "step": 23937 + }, + { + "epoch": 0.83, + "learning_rate": 1.4032184065984212e-06, + "loss": 0.6092, + "step": 23938 + }, + { + "epoch": 0.83, + "learning_rate": 1.402662226189022e-06, + "loss": 0.6273, + "step": 23939 + }, + { + "epoch": 0.83, + "learning_rate": 1.4021061477119357e-06, + "loss": 0.6354, + "step": 23940 + }, + { + "epoch": 0.83, + "learning_rate": 1.4015501711737578e-06, + "loss": 0.6354, + "step": 23941 + }, + { + "epoch": 0.83, + "learning_rate": 1.4009942965810818e-06, + "loss": 0.624, + "step": 23942 + }, + { + "epoch": 0.83, + "learning_rate": 1.4004385239404917e-06, + "loss": 0.6455, + "step": 23943 + }, + { + "epoch": 0.83, + "learning_rate": 1.399882853258584e-06, + "loss": 0.6295, + "step": 23944 + }, + { + "epoch": 0.83, + "learning_rate": 1.3993272845419458e-06, + "loss": 0.6096, + "step": 23945 + }, + { + "epoch": 0.83, + "learning_rate": 1.398771817797161e-06, + "loss": 0.6596, + "step": 23946 + }, + { + "epoch": 0.83, + "learning_rate": 1.3982164530308162e-06, + "loss": 0.7171, + "step": 23947 + }, + { + "epoch": 0.83, + "learning_rate": 1.3976611902494997e-06, + "loss": 0.6215, + "step": 23948 + }, + { + "epoch": 0.83, + "learning_rate": 1.3971060294597872e-06, + "loss": 0.5899, + "step": 23949 + }, + { + "epoch": 0.83, + "learning_rate": 1.3965509706682668e-06, + "loss": 0.664, + "step": 23950 + }, + { + "epoch": 0.83, + "learning_rate": 1.395996013881521e-06, + "loss": 0.6226, + "step": 23951 + }, + { + "epoch": 0.83, + "learning_rate": 1.3954411591061245e-06, + "loss": 0.6868, + "step": 23952 + }, + { + "epoch": 0.83, + "learning_rate": 1.3948864063486578e-06, + "loss": 0.6, + "step": 23953 + }, + { + "epoch": 0.83, + "learning_rate": 1.3943317556156998e-06, + "loss": 0.651, + "step": 23954 + }, + { + "epoch": 0.83, + "learning_rate": 1.393777206913821e-06, + "loss": 0.6445, + "step": 23955 + }, + { + "epoch": 0.83, + "learning_rate": 1.3932227602496029e-06, + "loss": 0.6175, + "step": 23956 + }, + { + "epoch": 0.83, + "learning_rate": 1.3926684156296188e-06, + "loss": 0.6803, + "step": 23957 + }, + { + "epoch": 0.83, + "learning_rate": 1.392114173060436e-06, + "loss": 0.6467, + "step": 23958 + }, + { + "epoch": 0.83, + "learning_rate": 1.39156003254863e-06, + "loss": 0.6734, + "step": 23959 + }, + { + "epoch": 0.83, + "learning_rate": 1.3910059941007703e-06, + "loss": 0.671, + "step": 23960 + }, + { + "epoch": 0.83, + "learning_rate": 1.3904520577234215e-06, + "loss": 0.6077, + "step": 23961 + }, + { + "epoch": 0.83, + "learning_rate": 1.3898982234231574e-06, + "loss": 0.6415, + "step": 23962 + }, + { + "epoch": 0.83, + "learning_rate": 1.3893444912065423e-06, + "loss": 0.6408, + "step": 23963 + }, + { + "epoch": 0.83, + "learning_rate": 1.3887908610801392e-06, + "loss": 0.6176, + "step": 23964 + }, + { + "epoch": 0.83, + "learning_rate": 1.388237333050515e-06, + "loss": 0.6291, + "step": 23965 + }, + { + "epoch": 0.83, + "learning_rate": 1.387683907124232e-06, + "loss": 0.681, + "step": 23966 + }, + { + "epoch": 0.83, + "learning_rate": 1.3871305833078464e-06, + "loss": 0.5863, + "step": 23967 + }, + { + "epoch": 0.83, + "learning_rate": 1.3865773616079258e-06, + "loss": 0.5991, + "step": 23968 + }, + { + "epoch": 0.83, + "learning_rate": 1.3860242420310287e-06, + "loss": 0.632, + "step": 23969 + }, + { + "epoch": 0.83, + "learning_rate": 1.3854712245837087e-06, + "loss": 0.6289, + "step": 23970 + }, + { + "epoch": 0.83, + "learning_rate": 1.384918309272525e-06, + "loss": 0.6287, + "step": 23971 + }, + { + "epoch": 0.83, + "learning_rate": 1.3843654961040354e-06, + "loss": 0.5779, + "step": 23972 + }, + { + "epoch": 0.83, + "learning_rate": 1.383812785084786e-06, + "loss": 0.6499, + "step": 23973 + }, + { + "epoch": 0.83, + "learning_rate": 1.3832601762213383e-06, + "loss": 0.6553, + "step": 23974 + }, + { + "epoch": 0.83, + "learning_rate": 1.3827076695202446e-06, + "loss": 0.573, + "step": 23975 + }, + { + "epoch": 0.83, + "learning_rate": 1.3821552649880487e-06, + "loss": 0.6038, + "step": 23976 + }, + { + "epoch": 0.83, + "learning_rate": 1.3816029626313055e-06, + "loss": 0.6173, + "step": 23977 + }, + { + "epoch": 0.83, + "learning_rate": 1.3810507624565627e-06, + "loss": 0.6342, + "step": 23978 + }, + { + "epoch": 0.83, + "learning_rate": 1.380498664470361e-06, + "loss": 0.6678, + "step": 23979 + }, + { + "epoch": 0.83, + "learning_rate": 1.379946668679255e-06, + "loss": 0.591, + "step": 23980 + }, + { + "epoch": 0.83, + "learning_rate": 1.3793947750897873e-06, + "loss": 0.6592, + "step": 23981 + }, + { + "epoch": 0.83, + "learning_rate": 1.3788429837084971e-06, + "loss": 0.6339, + "step": 23982 + }, + { + "epoch": 0.83, + "learning_rate": 1.3782912945419314e-06, + "loss": 0.5841, + "step": 23983 + }, + { + "epoch": 0.83, + "learning_rate": 1.377739707596627e-06, + "loss": 0.6351, + "step": 23984 + }, + { + "epoch": 0.83, + "learning_rate": 1.3771882228791234e-06, + "loss": 0.6501, + "step": 23985 + }, + { + "epoch": 0.83, + "learning_rate": 1.3766368403959662e-06, + "loss": 0.6322, + "step": 23986 + }, + { + "epoch": 0.83, + "learning_rate": 1.3760855601536848e-06, + "loss": 0.637, + "step": 23987 + }, + { + "epoch": 0.83, + "learning_rate": 1.3755343821588185e-06, + "loss": 0.66, + "step": 23988 + }, + { + "epoch": 0.83, + "learning_rate": 1.3749833064179053e-06, + "loss": 0.6248, + "step": 23989 + }, + { + "epoch": 0.83, + "learning_rate": 1.374432332937472e-06, + "loss": 0.5907, + "step": 23990 + }, + { + "epoch": 0.83, + "learning_rate": 1.3738814617240536e-06, + "loss": 0.6078, + "step": 23991 + }, + { + "epoch": 0.83, + "learning_rate": 1.3733306927841871e-06, + "loss": 0.6284, + "step": 23992 + }, + { + "epoch": 0.83, + "learning_rate": 1.372780026124395e-06, + "loss": 0.5953, + "step": 23993 + }, + { + "epoch": 0.83, + "learning_rate": 1.37222946175121e-06, + "loss": 0.6653, + "step": 23994 + }, + { + "epoch": 0.83, + "learning_rate": 1.37167899967116e-06, + "loss": 0.6043, + "step": 23995 + }, + { + "epoch": 0.83, + "learning_rate": 1.3711286398907698e-06, + "loss": 0.6298, + "step": 23996 + }, + { + "epoch": 0.83, + "learning_rate": 1.370578382416562e-06, + "loss": 0.5899, + "step": 23997 + }, + { + "epoch": 0.83, + "learning_rate": 1.3700282272550681e-06, + "loss": 0.5905, + "step": 23998 + }, + { + "epoch": 0.83, + "learning_rate": 1.3694781744128038e-06, + "loss": 0.6117, + "step": 23999 + }, + { + "epoch": 0.83, + "learning_rate": 1.3689282238962942e-06, + "loss": 0.6275, + "step": 24000 + }, + { + "epoch": 0.83, + "learning_rate": 1.3683783757120605e-06, + "loss": 0.683, + "step": 24001 + }, + { + "epoch": 0.83, + "learning_rate": 1.3678286298666187e-06, + "loss": 0.5866, + "step": 24002 + }, + { + "epoch": 0.83, + "learning_rate": 1.367278986366486e-06, + "loss": 0.6688, + "step": 24003 + }, + { + "epoch": 0.83, + "learning_rate": 1.3667294452181857e-06, + "loss": 0.6468, + "step": 24004 + }, + { + "epoch": 0.83, + "learning_rate": 1.366180006428226e-06, + "loss": 0.6407, + "step": 24005 + }, + { + "epoch": 0.83, + "learning_rate": 1.3656306700031253e-06, + "loss": 0.5994, + "step": 24006 + }, + { + "epoch": 0.83, + "learning_rate": 1.3650814359493968e-06, + "loss": 0.6335, + "step": 24007 + }, + { + "epoch": 0.83, + "learning_rate": 1.3645323042735492e-06, + "loss": 0.572, + "step": 24008 + }, + { + "epoch": 0.83, + "learning_rate": 1.3639832749820935e-06, + "loss": 0.6543, + "step": 24009 + }, + { + "epoch": 0.83, + "learning_rate": 1.3634343480815437e-06, + "loss": 0.6924, + "step": 24010 + }, + { + "epoch": 0.83, + "learning_rate": 1.3628855235784045e-06, + "loss": 0.6178, + "step": 24011 + }, + { + "epoch": 0.83, + "learning_rate": 1.3623368014791827e-06, + "loss": 0.6865, + "step": 24012 + }, + { + "epoch": 0.83, + "learning_rate": 1.3617881817903866e-06, + "loss": 0.6684, + "step": 24013 + }, + { + "epoch": 0.83, + "learning_rate": 1.3612396645185166e-06, + "loss": 0.6224, + "step": 24014 + }, + { + "epoch": 0.83, + "learning_rate": 1.3606912496700775e-06, + "loss": 0.6825, + "step": 24015 + }, + { + "epoch": 0.83, + "learning_rate": 1.3601429372515761e-06, + "loss": 0.5939, + "step": 24016 + }, + { + "epoch": 0.83, + "learning_rate": 1.3595947272695076e-06, + "loss": 0.5982, + "step": 24017 + }, + { + "epoch": 0.83, + "learning_rate": 1.359046619730373e-06, + "loss": 0.5657, + "step": 24018 + }, + { + "epoch": 0.83, + "learning_rate": 1.3584986146406742e-06, + "loss": 0.6237, + "step": 24019 + }, + { + "epoch": 0.83, + "learning_rate": 1.3579507120069047e-06, + "loss": 0.6734, + "step": 24020 + }, + { + "epoch": 0.83, + "learning_rate": 1.357402911835558e-06, + "loss": 0.6667, + "step": 24021 + }, + { + "epoch": 0.83, + "learning_rate": 1.3568552141331382e-06, + "loss": 0.6495, + "step": 24022 + }, + { + "epoch": 0.83, + "learning_rate": 1.3563076189061308e-06, + "loss": 0.6277, + "step": 24023 + }, + { + "epoch": 0.83, + "learning_rate": 1.355760126161031e-06, + "loss": 0.6255, + "step": 24024 + }, + { + "epoch": 0.83, + "learning_rate": 1.355212735904332e-06, + "loss": 0.6471, + "step": 24025 + }, + { + "epoch": 0.83, + "learning_rate": 1.3546654481425202e-06, + "loss": 0.6007, + "step": 24026 + }, + { + "epoch": 0.83, + "learning_rate": 1.3541182628820826e-06, + "loss": 0.5953, + "step": 24027 + }, + { + "epoch": 0.83, + "learning_rate": 1.353571180129516e-06, + "loss": 0.6562, + "step": 24028 + }, + { + "epoch": 0.83, + "learning_rate": 1.3530241998912974e-06, + "loss": 0.6123, + "step": 24029 + }, + { + "epoch": 0.83, + "learning_rate": 1.3524773221739152e-06, + "loss": 0.6172, + "step": 24030 + }, + { + "epoch": 0.83, + "learning_rate": 1.3519305469838563e-06, + "loss": 0.6479, + "step": 24031 + }, + { + "epoch": 0.83, + "learning_rate": 1.3513838743275987e-06, + "loss": 0.6645, + "step": 24032 + }, + { + "epoch": 0.83, + "learning_rate": 1.350837304211623e-06, + "loss": 0.6712, + "step": 24033 + }, + { + "epoch": 0.83, + "learning_rate": 1.3502908366424171e-06, + "loss": 0.6343, + "step": 24034 + }, + { + "epoch": 0.83, + "learning_rate": 1.349744471626453e-06, + "loss": 0.6117, + "step": 24035 + }, + { + "epoch": 0.83, + "learning_rate": 1.3491982091702116e-06, + "loss": 0.5969, + "step": 24036 + }, + { + "epoch": 0.83, + "learning_rate": 1.3486520492801702e-06, + "loss": 0.6569, + "step": 24037 + }, + { + "epoch": 0.83, + "learning_rate": 1.3481059919628004e-06, + "loss": 0.6164, + "step": 24038 + }, + { + "epoch": 0.83, + "learning_rate": 1.3475600372245768e-06, + "loss": 0.6001, + "step": 24039 + }, + { + "epoch": 0.83, + "learning_rate": 1.3470141850719786e-06, + "loss": 0.6077, + "step": 24040 + }, + { + "epoch": 0.83, + "learning_rate": 1.346468435511471e-06, + "loss": 0.6492, + "step": 24041 + }, + { + "epoch": 0.83, + "learning_rate": 1.3459227885495274e-06, + "loss": 0.6075, + "step": 24042 + }, + { + "epoch": 0.83, + "learning_rate": 1.3453772441926184e-06, + "loss": 0.6518, + "step": 24043 + }, + { + "epoch": 0.83, + "learning_rate": 1.3448318024472073e-06, + "loss": 0.6082, + "step": 24044 + }, + { + "epoch": 0.83, + "learning_rate": 1.344286463319765e-06, + "loss": 0.6112, + "step": 24045 + }, + { + "epoch": 0.83, + "learning_rate": 1.343741226816756e-06, + "loss": 0.6213, + "step": 24046 + }, + { + "epoch": 0.83, + "learning_rate": 1.3431960929446454e-06, + "loss": 0.5726, + "step": 24047 + }, + { + "epoch": 0.83, + "learning_rate": 1.3426510617098976e-06, + "loss": 0.5874, + "step": 24048 + }, + { + "epoch": 0.83, + "learning_rate": 1.3421061331189723e-06, + "loss": 0.6225, + "step": 24049 + }, + { + "epoch": 0.83, + "learning_rate": 1.3415613071783296e-06, + "loss": 0.5861, + "step": 24050 + }, + { + "epoch": 0.83, + "learning_rate": 1.341016583894431e-06, + "loss": 0.5974, + "step": 24051 + }, + { + "epoch": 0.83, + "learning_rate": 1.340471963273734e-06, + "loss": 0.6161, + "step": 24052 + }, + { + "epoch": 0.83, + "learning_rate": 1.3399274453226973e-06, + "loss": 0.6179, + "step": 24053 + }, + { + "epoch": 0.83, + "learning_rate": 1.3393830300477772e-06, + "loss": 0.6366, + "step": 24054 + }, + { + "epoch": 0.83, + "learning_rate": 1.3388387174554252e-06, + "loss": 0.5865, + "step": 24055 + }, + { + "epoch": 0.83, + "learning_rate": 1.338294507552096e-06, + "loss": 0.6363, + "step": 24056 + }, + { + "epoch": 0.83, + "learning_rate": 1.3377504003442433e-06, + "loss": 0.6579, + "step": 24057 + }, + { + "epoch": 0.83, + "learning_rate": 1.3372063958383164e-06, + "loss": 0.7104, + "step": 24058 + }, + { + "epoch": 0.83, + "learning_rate": 1.3366624940407668e-06, + "loss": 0.6262, + "step": 24059 + }, + { + "epoch": 0.83, + "learning_rate": 1.3361186949580451e-06, + "loss": 0.6238, + "step": 24060 + }, + { + "epoch": 0.83, + "learning_rate": 1.3355749985965938e-06, + "loss": 0.6332, + "step": 24061 + }, + { + "epoch": 0.83, + "learning_rate": 1.335031404962861e-06, + "loss": 0.6359, + "step": 24062 + }, + { + "epoch": 0.83, + "learning_rate": 1.3344879140632917e-06, + "loss": 0.6407, + "step": 24063 + }, + { + "epoch": 0.83, + "learning_rate": 1.3339445259043314e-06, + "loss": 0.6144, + "step": 24064 + }, + { + "epoch": 0.83, + "learning_rate": 1.3334012404924201e-06, + "loss": 0.6593, + "step": 24065 + }, + { + "epoch": 0.83, + "learning_rate": 1.3328580578340034e-06, + "loss": 0.6607, + "step": 24066 + }, + { + "epoch": 0.83, + "learning_rate": 1.332314977935516e-06, + "loss": 0.6421, + "step": 24067 + }, + { + "epoch": 0.83, + "learning_rate": 1.3317720008033997e-06, + "loss": 0.6593, + "step": 24068 + }, + { + "epoch": 0.83, + "learning_rate": 1.3312291264440914e-06, + "loss": 0.5603, + "step": 24069 + }, + { + "epoch": 0.83, + "learning_rate": 1.330686354864027e-06, + "loss": 0.5601, + "step": 24070 + }, + { + "epoch": 0.83, + "learning_rate": 1.3301436860696437e-06, + "loss": 0.6238, + "step": 24071 + }, + { + "epoch": 0.83, + "learning_rate": 1.3296011200673764e-06, + "loss": 0.6351, + "step": 24072 + }, + { + "epoch": 0.83, + "learning_rate": 1.3290586568636533e-06, + "loss": 0.6159, + "step": 24073 + }, + { + "epoch": 0.83, + "learning_rate": 1.328516296464909e-06, + "loss": 0.6504, + "step": 24074 + }, + { + "epoch": 0.83, + "learning_rate": 1.327974038877573e-06, + "loss": 0.5933, + "step": 24075 + }, + { + "epoch": 0.83, + "learning_rate": 1.3274318841080757e-06, + "loss": 0.5915, + "step": 24076 + }, + { + "epoch": 0.83, + "learning_rate": 1.3268898321628433e-06, + "loss": 0.6404, + "step": 24077 + }, + { + "epoch": 0.83, + "learning_rate": 1.3263478830483068e-06, + "loss": 0.6502, + "step": 24078 + }, + { + "epoch": 0.83, + "learning_rate": 1.325806036770886e-06, + "loss": 0.6536, + "step": 24079 + }, + { + "epoch": 0.83, + "learning_rate": 1.3252642933370063e-06, + "loss": 0.6354, + "step": 24080 + }, + { + "epoch": 0.83, + "learning_rate": 1.3247226527530932e-06, + "loss": 0.641, + "step": 24081 + }, + { + "epoch": 0.83, + "learning_rate": 1.3241811150255668e-06, + "loss": 0.6313, + "step": 24082 + }, + { + "epoch": 0.83, + "learning_rate": 1.3236396801608487e-06, + "loss": 0.585, + "step": 24083 + }, + { + "epoch": 0.83, + "learning_rate": 1.3230983481653593e-06, + "loss": 0.625, + "step": 24084 + }, + { + "epoch": 0.83, + "learning_rate": 1.3225571190455145e-06, + "loss": 0.6111, + "step": 24085 + }, + { + "epoch": 0.83, + "learning_rate": 1.3220159928077304e-06, + "loss": 0.6475, + "step": 24086 + }, + { + "epoch": 0.83, + "learning_rate": 1.321474969458425e-06, + "loss": 0.6458, + "step": 24087 + }, + { + "epoch": 0.83, + "learning_rate": 1.3209340490040135e-06, + "loss": 0.6176, + "step": 24088 + }, + { + "epoch": 0.83, + "learning_rate": 1.3203932314509061e-06, + "loss": 0.6586, + "step": 24089 + }, + { + "epoch": 0.83, + "learning_rate": 1.3198525168055198e-06, + "loss": 0.6087, + "step": 24090 + }, + { + "epoch": 0.83, + "learning_rate": 1.3193119050742597e-06, + "loss": 0.6198, + "step": 24091 + }, + { + "epoch": 0.83, + "learning_rate": 1.3187713962635384e-06, + "loss": 0.6766, + "step": 24092 + }, + { + "epoch": 0.83, + "learning_rate": 1.3182309903797642e-06, + "loss": 0.6816, + "step": 24093 + }, + { + "epoch": 0.83, + "learning_rate": 1.3176906874293437e-06, + "loss": 0.5963, + "step": 24094 + }, + { + "epoch": 0.83, + "learning_rate": 1.3171504874186837e-06, + "loss": 0.6335, + "step": 24095 + }, + { + "epoch": 0.83, + "learning_rate": 1.3166103903541904e-06, + "loss": 0.6112, + "step": 24096 + }, + { + "epoch": 0.83, + "learning_rate": 1.3160703962422639e-06, + "loss": 0.6264, + "step": 24097 + }, + { + "epoch": 0.83, + "learning_rate": 1.3155305050893075e-06, + "loss": 0.6431, + "step": 24098 + }, + { + "epoch": 0.83, + "learning_rate": 1.3149907169017228e-06, + "loss": 0.5885, + "step": 24099 + }, + { + "epoch": 0.84, + "learning_rate": 1.3144510316859106e-06, + "loss": 0.5922, + "step": 24100 + }, + { + "epoch": 0.84, + "learning_rate": 1.3139114494482674e-06, + "loss": 0.6423, + "step": 24101 + }, + { + "epoch": 0.84, + "learning_rate": 1.3133719701951953e-06, + "loss": 0.6525, + "step": 24102 + }, + { + "epoch": 0.84, + "learning_rate": 1.3128325939330844e-06, + "loss": 0.6312, + "step": 24103 + }, + { + "epoch": 0.84, + "learning_rate": 1.312293320668332e-06, + "loss": 0.6247, + "step": 24104 + }, + { + "epoch": 0.84, + "learning_rate": 1.3117541504073328e-06, + "loss": 0.6198, + "step": 24105 + }, + { + "epoch": 0.84, + "learning_rate": 1.3112150831564786e-06, + "loss": 0.6484, + "step": 24106 + }, + { + "epoch": 0.84, + "learning_rate": 1.3106761189221628e-06, + "loss": 0.6171, + "step": 24107 + }, + { + "epoch": 0.84, + "learning_rate": 1.310137257710772e-06, + "loss": 0.6745, + "step": 24108 + }, + { + "epoch": 0.84, + "learning_rate": 1.309598499528697e-06, + "loss": 0.6922, + "step": 24109 + }, + { + "epoch": 0.84, + "learning_rate": 1.3090598443823243e-06, + "loss": 0.5624, + "step": 24110 + }, + { + "epoch": 0.84, + "learning_rate": 1.3085212922780422e-06, + "loss": 0.6379, + "step": 24111 + }, + { + "epoch": 0.84, + "learning_rate": 1.307982843222234e-06, + "loss": 0.6354, + "step": 24112 + }, + { + "epoch": 0.84, + "learning_rate": 1.3074444972212885e-06, + "loss": 0.6382, + "step": 24113 + }, + { + "epoch": 0.84, + "learning_rate": 1.3069062542815815e-06, + "loss": 0.6086, + "step": 24114 + }, + { + "epoch": 0.84, + "learning_rate": 1.3063681144094964e-06, + "loss": 0.6237, + "step": 24115 + }, + { + "epoch": 0.84, + "learning_rate": 1.3058300776114163e-06, + "loss": 0.6208, + "step": 24116 + }, + { + "epoch": 0.84, + "learning_rate": 1.3052921438937182e-06, + "loss": 0.6646, + "step": 24117 + }, + { + "epoch": 0.84, + "learning_rate": 1.3047543132627816e-06, + "loss": 0.6303, + "step": 24118 + }, + { + "epoch": 0.84, + "learning_rate": 1.3042165857249834e-06, + "loss": 0.6175, + "step": 24119 + }, + { + "epoch": 0.84, + "learning_rate": 1.3036789612866952e-06, + "loss": 0.6973, + "step": 24120 + }, + { + "epoch": 0.84, + "learning_rate": 1.3031414399542952e-06, + "loss": 0.6029, + "step": 24121 + }, + { + "epoch": 0.84, + "learning_rate": 1.302604021734154e-06, + "loss": 0.5859, + "step": 24122 + }, + { + "epoch": 0.84, + "learning_rate": 1.3020667066326442e-06, + "loss": 0.601, + "step": 24123 + }, + { + "epoch": 0.84, + "learning_rate": 1.3015294946561373e-06, + "loss": 0.6435, + "step": 24124 + }, + { + "epoch": 0.84, + "learning_rate": 1.3009923858110041e-06, + "loss": 0.6364, + "step": 24125 + }, + { + "epoch": 0.84, + "learning_rate": 1.300455380103608e-06, + "loss": 0.6487, + "step": 24126 + }, + { + "epoch": 0.84, + "learning_rate": 1.2999184775403173e-06, + "loss": 0.605, + "step": 24127 + }, + { + "epoch": 0.84, + "learning_rate": 1.2993816781275003e-06, + "loss": 0.6226, + "step": 24128 + }, + { + "epoch": 0.84, + "learning_rate": 1.2988449818715187e-06, + "loss": 0.6217, + "step": 24129 + }, + { + "epoch": 0.84, + "learning_rate": 1.2983083887787374e-06, + "loss": 0.6662, + "step": 24130 + }, + { + "epoch": 0.84, + "learning_rate": 1.2977718988555198e-06, + "loss": 0.627, + "step": 24131 + }, + { + "epoch": 0.84, + "learning_rate": 1.2972355121082226e-06, + "loss": 0.617, + "step": 24132 + }, + { + "epoch": 0.84, + "learning_rate": 1.296699228543208e-06, + "loss": 0.6768, + "step": 24133 + }, + { + "epoch": 0.84, + "learning_rate": 1.296163048166833e-06, + "loss": 0.6976, + "step": 24134 + }, + { + "epoch": 0.84, + "learning_rate": 1.2956269709854563e-06, + "loss": 0.6177, + "step": 24135 + }, + { + "epoch": 0.84, + "learning_rate": 1.2950909970054326e-06, + "loss": 0.623, + "step": 24136 + }, + { + "epoch": 0.84, + "learning_rate": 1.294555126233119e-06, + "loss": 0.6216, + "step": 24137 + }, + { + "epoch": 0.84, + "learning_rate": 1.294019358674864e-06, + "loss": 0.5928, + "step": 24138 + }, + { + "epoch": 0.84, + "learning_rate": 1.2934836943370233e-06, + "loss": 0.6104, + "step": 24139 + }, + { + "epoch": 0.84, + "learning_rate": 1.2929481332259475e-06, + "loss": 0.6164, + "step": 24140 + }, + { + "epoch": 0.84, + "learning_rate": 1.292412675347986e-06, + "loss": 0.6356, + "step": 24141 + }, + { + "epoch": 0.84, + "learning_rate": 1.291877320709487e-06, + "loss": 0.6709, + "step": 24142 + }, + { + "epoch": 0.84, + "learning_rate": 1.2913420693168e-06, + "loss": 0.6067, + "step": 24143 + }, + { + "epoch": 0.84, + "learning_rate": 1.2908069211762676e-06, + "loss": 0.5791, + "step": 24144 + }, + { + "epoch": 0.84, + "learning_rate": 1.2902718762942368e-06, + "loss": 0.6342, + "step": 24145 + }, + { + "epoch": 0.84, + "learning_rate": 1.2897369346770494e-06, + "loss": 0.6143, + "step": 24146 + }, + { + "epoch": 0.84, + "learning_rate": 1.2892020963310504e-06, + "loss": 0.6228, + "step": 24147 + }, + { + "epoch": 0.84, + "learning_rate": 1.2886673612625789e-06, + "loss": 0.6321, + "step": 24148 + }, + { + "epoch": 0.84, + "learning_rate": 1.2881327294779788e-06, + "loss": 0.7298, + "step": 24149 + }, + { + "epoch": 0.84, + "learning_rate": 1.287598200983583e-06, + "loss": 0.6665, + "step": 24150 + }, + { + "epoch": 0.84, + "learning_rate": 1.2870637757857318e-06, + "loss": 0.6324, + "step": 24151 + }, + { + "epoch": 0.84, + "learning_rate": 1.2865294538907624e-06, + "loss": 0.6768, + "step": 24152 + }, + { + "epoch": 0.84, + "learning_rate": 1.2859952353050075e-06, + "loss": 0.6274, + "step": 24153 + }, + { + "epoch": 0.84, + "learning_rate": 1.2854611200348033e-06, + "loss": 0.6117, + "step": 24154 + }, + { + "epoch": 0.84, + "learning_rate": 1.2849271080864834e-06, + "loss": 0.6248, + "step": 24155 + }, + { + "epoch": 0.84, + "learning_rate": 1.284393199466375e-06, + "loss": 0.6376, + "step": 24156 + }, + { + "epoch": 0.84, + "learning_rate": 1.2838593941808108e-06, + "loss": 0.6564, + "step": 24157 + }, + { + "epoch": 0.84, + "learning_rate": 1.2833256922361192e-06, + "loss": 0.6375, + "step": 24158 + }, + { + "epoch": 0.84, + "learning_rate": 1.2827920936386273e-06, + "loss": 0.6101, + "step": 24159 + }, + { + "epoch": 0.84, + "learning_rate": 1.2822585983946633e-06, + "loss": 0.6349, + "step": 24160 + }, + { + "epoch": 0.84, + "learning_rate": 1.2817252065105545e-06, + "loss": 0.6463, + "step": 24161 + }, + { + "epoch": 0.84, + "learning_rate": 1.2811919179926192e-06, + "loss": 0.5903, + "step": 24162 + }, + { + "epoch": 0.84, + "learning_rate": 1.2806587328471832e-06, + "loss": 0.6142, + "step": 24163 + }, + { + "epoch": 0.84, + "learning_rate": 1.280125651080567e-06, + "loss": 0.5856, + "step": 24164 + }, + { + "epoch": 0.84, + "learning_rate": 1.2795926726990926e-06, + "loss": 0.6336, + "step": 24165 + }, + { + "epoch": 0.84, + "learning_rate": 1.2790597977090792e-06, + "loss": 0.6582, + "step": 24166 + }, + { + "epoch": 0.84, + "learning_rate": 1.2785270261168458e-06, + "loss": 0.6093, + "step": 24167 + }, + { + "epoch": 0.84, + "learning_rate": 1.2779943579287046e-06, + "loss": 0.6256, + "step": 24168 + }, + { + "epoch": 0.84, + "learning_rate": 1.2774617931509758e-06, + "loss": 0.6292, + "step": 24169 + }, + { + "epoch": 0.84, + "learning_rate": 1.2769293317899666e-06, + "loss": 0.6364, + "step": 24170 + }, + { + "epoch": 0.84, + "learning_rate": 1.2763969738519988e-06, + "loss": 0.6025, + "step": 24171 + }, + { + "epoch": 0.84, + "learning_rate": 1.2758647193433816e-06, + "loss": 0.6516, + "step": 24172 + }, + { + "epoch": 0.84, + "learning_rate": 1.275332568270421e-06, + "loss": 0.6702, + "step": 24173 + }, + { + "epoch": 0.84, + "learning_rate": 1.274800520639431e-06, + "loss": 0.6061, + "step": 24174 + }, + { + "epoch": 0.84, + "learning_rate": 1.2742685764567197e-06, + "loss": 0.6196, + "step": 24175 + }, + { + "epoch": 0.84, + "learning_rate": 1.273736735728589e-06, + "loss": 0.7116, + "step": 24176 + }, + { + "epoch": 0.84, + "learning_rate": 1.2732049984613493e-06, + "loss": 0.596, + "step": 24177 + }, + { + "epoch": 0.84, + "learning_rate": 1.2726733646613066e-06, + "loss": 0.6513, + "step": 24178 + }, + { + "epoch": 0.84, + "learning_rate": 1.272141834334759e-06, + "loss": 0.6008, + "step": 24179 + }, + { + "epoch": 0.84, + "learning_rate": 1.2716104074880098e-06, + "loss": 0.6486, + "step": 24180 + }, + { + "epoch": 0.84, + "learning_rate": 1.2710790841273647e-06, + "loss": 0.6621, + "step": 24181 + }, + { + "epoch": 0.84, + "learning_rate": 1.2705478642591128e-06, + "loss": 0.6478, + "step": 24182 + }, + { + "epoch": 0.84, + "learning_rate": 1.270016747889562e-06, + "loss": 0.6252, + "step": 24183 + }, + { + "epoch": 0.84, + "learning_rate": 1.269485735025009e-06, + "loss": 0.596, + "step": 24184 + }, + { + "epoch": 0.84, + "learning_rate": 1.2689548256717433e-06, + "loss": 0.6365, + "step": 24185 + }, + { + "epoch": 0.84, + "learning_rate": 1.2684240198360643e-06, + "loss": 0.5932, + "step": 24186 + }, + { + "epoch": 0.84, + "learning_rate": 1.2678933175242647e-06, + "loss": 0.6631, + "step": 24187 + }, + { + "epoch": 0.84, + "learning_rate": 1.267362718742633e-06, + "loss": 0.6384, + "step": 24188 + }, + { + "epoch": 0.84, + "learning_rate": 1.266832223497465e-06, + "loss": 0.6468, + "step": 24189 + }, + { + "epoch": 0.84, + "learning_rate": 1.2663018317950504e-06, + "loss": 0.6469, + "step": 24190 + }, + { + "epoch": 0.84, + "learning_rate": 1.2657715436416728e-06, + "loss": 0.6464, + "step": 24191 + }, + { + "epoch": 0.84, + "learning_rate": 1.265241359043624e-06, + "loss": 0.6325, + "step": 24192 + }, + { + "epoch": 0.84, + "learning_rate": 1.2647112780071892e-06, + "loss": 0.6484, + "step": 24193 + }, + { + "epoch": 0.84, + "learning_rate": 1.2641813005386482e-06, + "loss": 0.577, + "step": 24194 + }, + { + "epoch": 0.84, + "learning_rate": 1.2636514266442923e-06, + "loss": 0.6816, + "step": 24195 + }, + { + "epoch": 0.84, + "learning_rate": 1.2631216563304015e-06, + "loss": 0.6269, + "step": 24196 + }, + { + "epoch": 0.84, + "learning_rate": 1.2625919896032535e-06, + "loss": 0.6393, + "step": 24197 + }, + { + "epoch": 0.84, + "learning_rate": 1.2620624264691305e-06, + "loss": 0.6259, + "step": 24198 + }, + { + "epoch": 0.84, + "learning_rate": 1.2615329669343123e-06, + "loss": 0.6132, + "step": 24199 + }, + { + "epoch": 0.84, + "learning_rate": 1.2610036110050716e-06, + "loss": 0.6031, + "step": 24200 + }, + { + "epoch": 0.84, + "learning_rate": 1.26047435868769e-06, + "loss": 0.5774, + "step": 24201 + }, + { + "epoch": 0.84, + "learning_rate": 1.2599452099884423e-06, + "loss": 0.6257, + "step": 24202 + }, + { + "epoch": 0.84, + "learning_rate": 1.2594161649135982e-06, + "loss": 0.6368, + "step": 24203 + }, + { + "epoch": 0.84, + "learning_rate": 1.2588872234694327e-06, + "loss": 0.6009, + "step": 24204 + }, + { + "epoch": 0.84, + "learning_rate": 1.2583583856622195e-06, + "loss": 0.6253, + "step": 24205 + }, + { + "epoch": 0.84, + "learning_rate": 1.2578296514982203e-06, + "loss": 0.5915, + "step": 24206 + }, + { + "epoch": 0.84, + "learning_rate": 1.2573010209837122e-06, + "loss": 0.6131, + "step": 24207 + }, + { + "epoch": 0.84, + "learning_rate": 1.2567724941249627e-06, + "loss": 0.5988, + "step": 24208 + }, + { + "epoch": 0.84, + "learning_rate": 1.256244070928232e-06, + "loss": 0.5841, + "step": 24209 + }, + { + "epoch": 0.84, + "learning_rate": 1.2557157513997898e-06, + "loss": 0.5967, + "step": 24210 + }, + { + "epoch": 0.84, + "learning_rate": 1.255187535545901e-06, + "loss": 0.6536, + "step": 24211 + }, + { + "epoch": 0.84, + "learning_rate": 1.2546594233728215e-06, + "loss": 0.6766, + "step": 24212 + }, + { + "epoch": 0.84, + "learning_rate": 1.25413141488682e-06, + "loss": 0.6127, + "step": 24213 + }, + { + "epoch": 0.84, + "learning_rate": 1.2536035100941568e-06, + "loss": 0.6303, + "step": 24214 + }, + { + "epoch": 0.84, + "learning_rate": 1.2530757090010848e-06, + "loss": 0.6264, + "step": 24215 + }, + { + "epoch": 0.84, + "learning_rate": 1.2525480116138667e-06, + "loss": 0.6147, + "step": 24216 + }, + { + "epoch": 0.84, + "learning_rate": 1.2520204179387585e-06, + "loss": 0.6423, + "step": 24217 + }, + { + "epoch": 0.84, + "learning_rate": 1.251492927982011e-06, + "loss": 0.5567, + "step": 24218 + }, + { + "epoch": 0.84, + "learning_rate": 1.2509655417498834e-06, + "loss": 0.5954, + "step": 24219 + }, + { + "epoch": 0.84, + "learning_rate": 1.2504382592486286e-06, + "loss": 0.6627, + "step": 24220 + }, + { + "epoch": 0.84, + "learning_rate": 1.2499110804844949e-06, + "loss": 0.6115, + "step": 24221 + }, + { + "epoch": 0.84, + "learning_rate": 1.249384005463734e-06, + "loss": 0.6733, + "step": 24222 + }, + { + "epoch": 0.84, + "learning_rate": 1.2488570341925977e-06, + "loss": 0.6746, + "step": 24223 + }, + { + "epoch": 0.84, + "learning_rate": 1.2483301666773273e-06, + "loss": 0.683, + "step": 24224 + }, + { + "epoch": 0.84, + "learning_rate": 1.2478034029241758e-06, + "loss": 0.6071, + "step": 24225 + }, + { + "epoch": 0.84, + "learning_rate": 1.2472767429393884e-06, + "loss": 0.6115, + "step": 24226 + }, + { + "epoch": 0.84, + "learning_rate": 1.2467501867292054e-06, + "loss": 0.6057, + "step": 24227 + }, + { + "epoch": 0.84, + "learning_rate": 1.2462237342998718e-06, + "loss": 0.6569, + "step": 24228 + }, + { + "epoch": 0.84, + "learning_rate": 1.2456973856576327e-06, + "loss": 0.631, + "step": 24229 + }, + { + "epoch": 0.84, + "learning_rate": 1.2451711408087196e-06, + "loss": 0.7085, + "step": 24230 + }, + { + "epoch": 0.84, + "learning_rate": 1.2446449997593824e-06, + "loss": 0.6308, + "step": 24231 + }, + { + "epoch": 0.84, + "learning_rate": 1.2441189625158522e-06, + "loss": 0.6157, + "step": 24232 + }, + { + "epoch": 0.84, + "learning_rate": 1.243593029084368e-06, + "loss": 0.6364, + "step": 24233 + }, + { + "epoch": 0.84, + "learning_rate": 1.2430671994711662e-06, + "loss": 0.6784, + "step": 24234 + }, + { + "epoch": 0.84, + "learning_rate": 1.2425414736824804e-06, + "loss": 0.6472, + "step": 24235 + }, + { + "epoch": 0.84, + "learning_rate": 1.2420158517245418e-06, + "loss": 0.617, + "step": 24236 + }, + { + "epoch": 0.84, + "learning_rate": 1.2414903336035856e-06, + "loss": 0.6311, + "step": 24237 + }, + { + "epoch": 0.84, + "learning_rate": 1.24096491932584e-06, + "loss": 0.6306, + "step": 24238 + }, + { + "epoch": 0.84, + "learning_rate": 1.2404396088975357e-06, + "loss": 0.6325, + "step": 24239 + }, + { + "epoch": 0.84, + "learning_rate": 1.2399144023249033e-06, + "loss": 0.6656, + "step": 24240 + }, + { + "epoch": 0.84, + "learning_rate": 1.2393892996141654e-06, + "loss": 0.6339, + "step": 24241 + }, + { + "epoch": 0.84, + "learning_rate": 1.2388643007715483e-06, + "loss": 0.6261, + "step": 24242 + }, + { + "epoch": 0.84, + "learning_rate": 1.2383394058032794e-06, + "loss": 0.6238, + "step": 24243 + }, + { + "epoch": 0.84, + "learning_rate": 1.237814614715579e-06, + "loss": 0.6203, + "step": 24244 + }, + { + "epoch": 0.84, + "learning_rate": 1.237289927514671e-06, + "loss": 0.5981, + "step": 24245 + }, + { + "epoch": 0.84, + "learning_rate": 1.2367653442067783e-06, + "loss": 0.6007, + "step": 24246 + }, + { + "epoch": 0.84, + "learning_rate": 1.236240864798116e-06, + "loss": 0.6212, + "step": 24247 + }, + { + "epoch": 0.84, + "learning_rate": 1.2357164892949037e-06, + "loss": 0.6594, + "step": 24248 + }, + { + "epoch": 0.84, + "learning_rate": 1.2351922177033604e-06, + "loss": 0.6131, + "step": 24249 + }, + { + "epoch": 0.84, + "learning_rate": 1.2346680500297003e-06, + "loss": 0.6472, + "step": 24250 + }, + { + "epoch": 0.84, + "learning_rate": 1.2341439862801386e-06, + "loss": 0.63, + "step": 24251 + }, + { + "epoch": 0.84, + "learning_rate": 1.23362002646089e-06, + "loss": 0.6635, + "step": 24252 + }, + { + "epoch": 0.84, + "learning_rate": 1.2330961705781652e-06, + "loss": 0.6523, + "step": 24253 + }, + { + "epoch": 0.84, + "learning_rate": 1.2325724186381739e-06, + "loss": 0.5973, + "step": 24254 + }, + { + "epoch": 0.84, + "learning_rate": 1.2320487706471284e-06, + "loss": 0.6923, + "step": 24255 + }, + { + "epoch": 0.84, + "learning_rate": 1.2315252266112355e-06, + "loss": 0.6819, + "step": 24256 + }, + { + "epoch": 0.84, + "learning_rate": 1.231001786536704e-06, + "loss": 0.693, + "step": 24257 + }, + { + "epoch": 0.84, + "learning_rate": 1.2304784504297408e-06, + "loss": 0.6584, + "step": 24258 + }, + { + "epoch": 0.84, + "learning_rate": 1.229955218296548e-06, + "loss": 0.6664, + "step": 24259 + }, + { + "epoch": 0.84, + "learning_rate": 1.2294320901433288e-06, + "loss": 0.6112, + "step": 24260 + }, + { + "epoch": 0.84, + "learning_rate": 1.228909065976287e-06, + "loss": 0.6616, + "step": 24261 + }, + { + "epoch": 0.84, + "learning_rate": 1.2283861458016244e-06, + "loss": 0.6654, + "step": 24262 + }, + { + "epoch": 0.84, + "learning_rate": 1.2278633296255404e-06, + "loss": 0.666, + "step": 24263 + }, + { + "epoch": 0.84, + "learning_rate": 1.2273406174542358e-06, + "loss": 0.6592, + "step": 24264 + }, + { + "epoch": 0.84, + "learning_rate": 1.2268180092939019e-06, + "loss": 0.6144, + "step": 24265 + }, + { + "epoch": 0.84, + "learning_rate": 1.2262955051507398e-06, + "loss": 0.69, + "step": 24266 + }, + { + "epoch": 0.84, + "learning_rate": 1.225773105030944e-06, + "loss": 0.6414, + "step": 24267 + }, + { + "epoch": 0.84, + "learning_rate": 1.2252508089407068e-06, + "loss": 0.6785, + "step": 24268 + }, + { + "epoch": 0.84, + "learning_rate": 1.2247286168862204e-06, + "loss": 0.6326, + "step": 24269 + }, + { + "epoch": 0.84, + "learning_rate": 1.2242065288736804e-06, + "loss": 0.6504, + "step": 24270 + }, + { + "epoch": 0.84, + "learning_rate": 1.2236845449092705e-06, + "loss": 0.6473, + "step": 24271 + }, + { + "epoch": 0.84, + "learning_rate": 1.2231626649991834e-06, + "loss": 0.6081, + "step": 24272 + }, + { + "epoch": 0.84, + "learning_rate": 1.2226408891496044e-06, + "loss": 0.6392, + "step": 24273 + }, + { + "epoch": 0.84, + "learning_rate": 1.2221192173667217e-06, + "loss": 0.5665, + "step": 24274 + }, + { + "epoch": 0.84, + "learning_rate": 1.2215976496567207e-06, + "loss": 0.6779, + "step": 24275 + }, + { + "epoch": 0.84, + "learning_rate": 1.2210761860257848e-06, + "loss": 0.6684, + "step": 24276 + }, + { + "epoch": 0.84, + "learning_rate": 1.2205548264800947e-06, + "loss": 0.6135, + "step": 24277 + }, + { + "epoch": 0.84, + "learning_rate": 1.2200335710258337e-06, + "loss": 0.6365, + "step": 24278 + }, + { + "epoch": 0.84, + "learning_rate": 1.219512419669181e-06, + "loss": 0.6069, + "step": 24279 + }, + { + "epoch": 0.84, + "learning_rate": 1.218991372416316e-06, + "loss": 0.6627, + "step": 24280 + }, + { + "epoch": 0.84, + "learning_rate": 1.2184704292734161e-06, + "loss": 0.6574, + "step": 24281 + }, + { + "epoch": 0.84, + "learning_rate": 1.2179495902466597e-06, + "loss": 0.6284, + "step": 24282 + }, + { + "epoch": 0.84, + "learning_rate": 1.2174288553422186e-06, + "loss": 0.5837, + "step": 24283 + }, + { + "epoch": 0.84, + "learning_rate": 1.216908224566269e-06, + "loss": 0.6678, + "step": 24284 + }, + { + "epoch": 0.84, + "learning_rate": 1.2163876979249823e-06, + "loss": 0.6662, + "step": 24285 + }, + { + "epoch": 0.84, + "learning_rate": 1.2158672754245304e-06, + "loss": 0.6495, + "step": 24286 + }, + { + "epoch": 0.84, + "learning_rate": 1.2153469570710851e-06, + "loss": 0.6541, + "step": 24287 + }, + { + "epoch": 0.84, + "learning_rate": 1.214826742870816e-06, + "loss": 0.6845, + "step": 24288 + }, + { + "epoch": 0.84, + "learning_rate": 1.214306632829887e-06, + "loss": 0.5556, + "step": 24289 + }, + { + "epoch": 0.84, + "learning_rate": 1.2137866269544663e-06, + "loss": 0.6915, + "step": 24290 + }, + { + "epoch": 0.84, + "learning_rate": 1.2132667252507203e-06, + "loss": 0.6715, + "step": 24291 + }, + { + "epoch": 0.84, + "learning_rate": 1.2127469277248115e-06, + "loss": 0.627, + "step": 24292 + }, + { + "epoch": 0.84, + "learning_rate": 1.2122272343829077e-06, + "loss": 0.6065, + "step": 24293 + }, + { + "epoch": 0.84, + "learning_rate": 1.2117076452311628e-06, + "loss": 0.6369, + "step": 24294 + }, + { + "epoch": 0.84, + "learning_rate": 1.2111881602757424e-06, + "loss": 0.6591, + "step": 24295 + }, + { + "epoch": 0.84, + "learning_rate": 1.2106687795228034e-06, + "loss": 0.6544, + "step": 24296 + }, + { + "epoch": 0.84, + "learning_rate": 1.2101495029785048e-06, + "loss": 0.6245, + "step": 24297 + }, + { + "epoch": 0.84, + "learning_rate": 1.2096303306490031e-06, + "loss": 0.682, + "step": 24298 + }, + { + "epoch": 0.84, + "learning_rate": 1.2091112625404555e-06, + "loss": 0.6259, + "step": 24299 + }, + { + "epoch": 0.84, + "learning_rate": 1.2085922986590126e-06, + "loss": 0.6446, + "step": 24300 + }, + { + "epoch": 0.84, + "learning_rate": 1.2080734390108296e-06, + "loss": 0.6684, + "step": 24301 + }, + { + "epoch": 0.84, + "learning_rate": 1.207554683602058e-06, + "loss": 0.6322, + "step": 24302 + }, + { + "epoch": 0.84, + "learning_rate": 1.2070360324388474e-06, + "loss": 0.628, + "step": 24303 + }, + { + "epoch": 0.84, + "learning_rate": 1.2065174855273477e-06, + "loss": 0.6356, + "step": 24304 + }, + { + "epoch": 0.84, + "learning_rate": 1.2059990428737101e-06, + "loss": 0.621, + "step": 24305 + }, + { + "epoch": 0.84, + "learning_rate": 1.2054807044840745e-06, + "loss": 0.6601, + "step": 24306 + }, + { + "epoch": 0.84, + "learning_rate": 1.2049624703645913e-06, + "loss": 0.6667, + "step": 24307 + }, + { + "epoch": 0.84, + "learning_rate": 1.2044443405214047e-06, + "loss": 0.553, + "step": 24308 + }, + { + "epoch": 0.84, + "learning_rate": 1.203926314960655e-06, + "loss": 0.5913, + "step": 24309 + }, + { + "epoch": 0.84, + "learning_rate": 1.2034083936884877e-06, + "loss": 0.6194, + "step": 24310 + }, + { + "epoch": 0.84, + "learning_rate": 1.202890576711042e-06, + "loss": 0.6099, + "step": 24311 + }, + { + "epoch": 0.84, + "learning_rate": 1.2023728640344568e-06, + "loss": 0.6694, + "step": 24312 + }, + { + "epoch": 0.84, + "learning_rate": 1.2018552556648689e-06, + "loss": 0.6734, + "step": 24313 + }, + { + "epoch": 0.84, + "learning_rate": 1.2013377516084169e-06, + "loss": 0.6533, + "step": 24314 + }, + { + "epoch": 0.84, + "learning_rate": 1.200820351871237e-06, + "loss": 0.6292, + "step": 24315 + }, + { + "epoch": 0.84, + "learning_rate": 1.200303056459462e-06, + "loss": 0.6261, + "step": 24316 + }, + { + "epoch": 0.84, + "learning_rate": 1.1997858653792283e-06, + "loss": 0.6386, + "step": 24317 + }, + { + "epoch": 0.84, + "learning_rate": 1.199268778636663e-06, + "loss": 0.6302, + "step": 24318 + }, + { + "epoch": 0.84, + "learning_rate": 1.198751796237899e-06, + "loss": 0.6069, + "step": 24319 + }, + { + "epoch": 0.84, + "learning_rate": 1.1982349181890673e-06, + "loss": 0.652, + "step": 24320 + }, + { + "epoch": 0.84, + "learning_rate": 1.1977181444962948e-06, + "loss": 0.6637, + "step": 24321 + }, + { + "epoch": 0.84, + "learning_rate": 1.197201475165708e-06, + "loss": 0.6174, + "step": 24322 + }, + { + "epoch": 0.84, + "learning_rate": 1.196684910203435e-06, + "loss": 0.6737, + "step": 24323 + }, + { + "epoch": 0.84, + "learning_rate": 1.1961684496155978e-06, + "loss": 0.584, + "step": 24324 + }, + { + "epoch": 0.84, + "learning_rate": 1.1956520934083192e-06, + "loss": 0.6653, + "step": 24325 + }, + { + "epoch": 0.84, + "learning_rate": 1.1951358415877234e-06, + "loss": 0.5839, + "step": 24326 + }, + { + "epoch": 0.84, + "learning_rate": 1.1946196941599309e-06, + "loss": 0.6845, + "step": 24327 + }, + { + "epoch": 0.84, + "learning_rate": 1.19410365113106e-06, + "loss": 0.6328, + "step": 24328 + }, + { + "epoch": 0.84, + "learning_rate": 1.1935877125072325e-06, + "loss": 0.672, + "step": 24329 + }, + { + "epoch": 0.84, + "learning_rate": 1.1930718782945605e-06, + "loss": 0.5969, + "step": 24330 + }, + { + "epoch": 0.84, + "learning_rate": 1.1925561484991622e-06, + "loss": 0.6471, + "step": 24331 + }, + { + "epoch": 0.84, + "learning_rate": 1.1920405231271514e-06, + "loss": 0.5968, + "step": 24332 + }, + { + "epoch": 0.84, + "learning_rate": 1.1915250021846437e-06, + "loss": 0.5953, + "step": 24333 + }, + { + "epoch": 0.84, + "learning_rate": 1.1910095856777492e-06, + "loss": 0.6057, + "step": 24334 + }, + { + "epoch": 0.84, + "learning_rate": 1.1904942736125814e-06, + "loss": 0.5979, + "step": 24335 + }, + { + "epoch": 0.84, + "learning_rate": 1.189979065995246e-06, + "loss": 0.64, + "step": 24336 + }, + { + "epoch": 0.84, + "learning_rate": 1.1894639628318538e-06, + "loss": 0.7045, + "step": 24337 + }, + { + "epoch": 0.84, + "learning_rate": 1.1889489641285113e-06, + "loss": 0.62, + "step": 24338 + }, + { + "epoch": 0.84, + "learning_rate": 1.1884340698913255e-06, + "loss": 0.6318, + "step": 24339 + }, + { + "epoch": 0.84, + "learning_rate": 1.1879192801264006e-06, + "loss": 0.6793, + "step": 24340 + }, + { + "epoch": 0.84, + "learning_rate": 1.1874045948398416e-06, + "loss": 0.6151, + "step": 24341 + }, + { + "epoch": 0.84, + "learning_rate": 1.186890014037747e-06, + "loss": 0.6295, + "step": 24342 + }, + { + "epoch": 0.84, + "learning_rate": 1.1863755377262199e-06, + "loss": 0.6488, + "step": 24343 + }, + { + "epoch": 0.84, + "learning_rate": 1.1858611659113594e-06, + "loss": 0.6703, + "step": 24344 + }, + { + "epoch": 0.84, + "learning_rate": 1.1853468985992656e-06, + "loss": 0.667, + "step": 24345 + }, + { + "epoch": 0.84, + "learning_rate": 1.1848327357960353e-06, + "loss": 0.6174, + "step": 24346 + }, + { + "epoch": 0.84, + "learning_rate": 1.1843186775077653e-06, + "loss": 0.6007, + "step": 24347 + }, + { + "epoch": 0.84, + "learning_rate": 1.183804723740548e-06, + "loss": 0.6228, + "step": 24348 + }, + { + "epoch": 0.84, + "learning_rate": 1.1832908745004778e-06, + "loss": 0.7143, + "step": 24349 + }, + { + "epoch": 0.84, + "learning_rate": 1.1827771297936475e-06, + "loss": 0.6188, + "step": 24350 + }, + { + "epoch": 0.84, + "learning_rate": 1.1822634896261487e-06, + "loss": 0.6232, + "step": 24351 + }, + { + "epoch": 0.84, + "learning_rate": 1.18174995400407e-06, + "loss": 0.607, + "step": 24352 + }, + { + "epoch": 0.84, + "learning_rate": 1.1812365229335033e-06, + "loss": 0.6471, + "step": 24353 + }, + { + "epoch": 0.84, + "learning_rate": 1.18072319642053e-06, + "loss": 0.6328, + "step": 24354 + }, + { + "epoch": 0.84, + "learning_rate": 1.1802099744712414e-06, + "loss": 0.6408, + "step": 24355 + }, + { + "epoch": 0.84, + "learning_rate": 1.17969685709172e-06, + "loss": 0.619, + "step": 24356 + }, + { + "epoch": 0.84, + "learning_rate": 1.17918384428805e-06, + "loss": 0.6372, + "step": 24357 + }, + { + "epoch": 0.84, + "learning_rate": 1.1786709360663162e-06, + "loss": 0.6508, + "step": 24358 + }, + { + "epoch": 0.84, + "learning_rate": 1.1781581324325954e-06, + "loss": 0.6657, + "step": 24359 + }, + { + "epoch": 0.84, + "learning_rate": 1.1776454333929698e-06, + "loss": 0.5927, + "step": 24360 + }, + { + "epoch": 0.84, + "learning_rate": 1.1771328389535175e-06, + "loss": 0.639, + "step": 24361 + }, + { + "epoch": 0.84, + "learning_rate": 1.1766203491203165e-06, + "loss": 0.6453, + "step": 24362 + }, + { + "epoch": 0.84, + "learning_rate": 1.1761079638994434e-06, + "loss": 0.6123, + "step": 24363 + }, + { + "epoch": 0.84, + "learning_rate": 1.175595683296974e-06, + "loss": 0.6614, + "step": 24364 + }, + { + "epoch": 0.84, + "learning_rate": 1.1750835073189782e-06, + "loss": 0.6309, + "step": 24365 + }, + { + "epoch": 0.84, + "learning_rate": 1.1745714359715322e-06, + "loss": 0.6478, + "step": 24366 + }, + { + "epoch": 0.84, + "learning_rate": 1.1740594692607055e-06, + "loss": 0.641, + "step": 24367 + }, + { + "epoch": 0.84, + "learning_rate": 1.1735476071925688e-06, + "loss": 0.6949, + "step": 24368 + }, + { + "epoch": 0.84, + "learning_rate": 1.173035849773191e-06, + "loss": 0.5463, + "step": 24369 + }, + { + "epoch": 0.84, + "learning_rate": 1.172524197008641e-06, + "loss": 0.7055, + "step": 24370 + }, + { + "epoch": 0.84, + "learning_rate": 1.1720126489049811e-06, + "loss": 0.5965, + "step": 24371 + }, + { + "epoch": 0.84, + "learning_rate": 1.1715012054682796e-06, + "loss": 0.6194, + "step": 24372 + }, + { + "epoch": 0.84, + "learning_rate": 1.1709898667045982e-06, + "loss": 0.686, + "step": 24373 + }, + { + "epoch": 0.84, + "learning_rate": 1.1704786326200013e-06, + "loss": 0.6096, + "step": 24374 + }, + { + "epoch": 0.84, + "learning_rate": 1.1699675032205504e-06, + "loss": 0.6329, + "step": 24375 + }, + { + "epoch": 0.84, + "learning_rate": 1.1694564785123064e-06, + "loss": 0.6715, + "step": 24376 + }, + { + "epoch": 0.84, + "learning_rate": 1.1689455585013243e-06, + "loss": 0.6317, + "step": 24377 + }, + { + "epoch": 0.84, + "learning_rate": 1.1684347431936637e-06, + "loss": 0.6296, + "step": 24378 + }, + { + "epoch": 0.84, + "learning_rate": 1.1679240325953812e-06, + "loss": 0.6317, + "step": 24379 + }, + { + "epoch": 0.84, + "learning_rate": 1.1674134267125314e-06, + "loss": 0.6614, + "step": 24380 + }, + { + "epoch": 0.84, + "learning_rate": 1.16690292555117e-06, + "loss": 0.5873, + "step": 24381 + }, + { + "epoch": 0.84, + "learning_rate": 1.1663925291173495e-06, + "loss": 0.6043, + "step": 24382 + }, + { + "epoch": 0.84, + "learning_rate": 1.1658822374171186e-06, + "loss": 0.6005, + "step": 24383 + }, + { + "epoch": 0.84, + "learning_rate": 1.165372050456529e-06, + "loss": 0.6612, + "step": 24384 + }, + { + "epoch": 0.84, + "learning_rate": 1.1648619682416297e-06, + "loss": 0.6257, + "step": 24385 + }, + { + "epoch": 0.84, + "learning_rate": 1.1643519907784673e-06, + "loss": 0.5986, + "step": 24386 + }, + { + "epoch": 0.84, + "learning_rate": 1.1638421180730908e-06, + "loss": 0.6452, + "step": 24387 + }, + { + "epoch": 0.84, + "learning_rate": 1.1633323501315442e-06, + "loss": 0.6528, + "step": 24388 + }, + { + "epoch": 0.85, + "learning_rate": 1.1628226869598703e-06, + "loss": 0.657, + "step": 24389 + }, + { + "epoch": 0.85, + "learning_rate": 1.1623131285641121e-06, + "loss": 0.6099, + "step": 24390 + }, + { + "epoch": 0.85, + "learning_rate": 1.1618036749503115e-06, + "loss": 0.648, + "step": 24391 + }, + { + "epoch": 0.85, + "learning_rate": 1.161294326124508e-06, + "loss": 0.664, + "step": 24392 + }, + { + "epoch": 0.85, + "learning_rate": 1.1607850820927413e-06, + "loss": 0.6387, + "step": 24393 + }, + { + "epoch": 0.85, + "learning_rate": 1.160275942861052e-06, + "loss": 0.6728, + "step": 24394 + }, + { + "epoch": 0.85, + "learning_rate": 1.1597669084354712e-06, + "loss": 0.6259, + "step": 24395 + }, + { + "epoch": 0.85, + "learning_rate": 1.159257978822037e-06, + "loss": 0.5875, + "step": 24396 + }, + { + "epoch": 0.85, + "learning_rate": 1.1587491540267836e-06, + "loss": 0.6532, + "step": 24397 + }, + { + "epoch": 0.85, + "learning_rate": 1.1582404340557419e-06, + "loss": 0.6229, + "step": 24398 + }, + { + "epoch": 0.85, + "learning_rate": 1.1577318189149457e-06, + "loss": 0.5809, + "step": 24399 + }, + { + "epoch": 0.85, + "learning_rate": 1.1572233086104257e-06, + "loss": 0.6778, + "step": 24400 + }, + { + "epoch": 0.85, + "learning_rate": 1.1567149031482084e-06, + "loss": 0.6216, + "step": 24401 + }, + { + "epoch": 0.85, + "learning_rate": 1.1562066025343222e-06, + "loss": 0.6753, + "step": 24402 + }, + { + "epoch": 0.85, + "learning_rate": 1.1556984067747935e-06, + "loss": 0.6153, + "step": 24403 + }, + { + "epoch": 0.85, + "learning_rate": 1.1551903158756494e-06, + "loss": 0.6401, + "step": 24404 + }, + { + "epoch": 0.85, + "learning_rate": 1.1546823298429122e-06, + "loss": 0.5983, + "step": 24405 + }, + { + "epoch": 0.85, + "learning_rate": 1.1541744486826067e-06, + "loss": 0.6501, + "step": 24406 + }, + { + "epoch": 0.85, + "learning_rate": 1.1536666724007528e-06, + "loss": 0.6371, + "step": 24407 + }, + { + "epoch": 0.85, + "learning_rate": 1.15315900100337e-06, + "loss": 0.6045, + "step": 24408 + }, + { + "epoch": 0.85, + "learning_rate": 1.152651434496479e-06, + "loss": 0.6419, + "step": 24409 + }, + { + "epoch": 0.85, + "learning_rate": 1.1521439728860973e-06, + "loss": 0.5726, + "step": 24410 + }, + { + "epoch": 0.85, + "learning_rate": 1.151636616178241e-06, + "loss": 0.6286, + "step": 24411 + }, + { + "epoch": 0.85, + "learning_rate": 1.151129364378928e-06, + "loss": 0.5647, + "step": 24412 + }, + { + "epoch": 0.85, + "learning_rate": 1.1506222174941684e-06, + "loss": 0.6896, + "step": 24413 + }, + { + "epoch": 0.85, + "learning_rate": 1.1501151755299765e-06, + "loss": 0.606, + "step": 24414 + }, + { + "epoch": 0.85, + "learning_rate": 1.1496082384923646e-06, + "loss": 0.6495, + "step": 24415 + }, + { + "epoch": 0.85, + "learning_rate": 1.1491014063873428e-06, + "loss": 0.65, + "step": 24416 + }, + { + "epoch": 0.85, + "learning_rate": 1.1485946792209225e-06, + "loss": 0.6386, + "step": 24417 + }, + { + "epoch": 0.85, + "learning_rate": 1.148088056999107e-06, + "loss": 0.6278, + "step": 24418 + }, + { + "epoch": 0.85, + "learning_rate": 1.1475815397279067e-06, + "loss": 0.5798, + "step": 24419 + }, + { + "epoch": 0.85, + "learning_rate": 1.1470751274133263e-06, + "loss": 0.6338, + "step": 24420 + }, + { + "epoch": 0.85, + "learning_rate": 1.1465688200613656e-06, + "loss": 0.6448, + "step": 24421 + }, + { + "epoch": 0.85, + "learning_rate": 1.146062617678032e-06, + "loss": 0.6705, + "step": 24422 + }, + { + "epoch": 0.85, + "learning_rate": 1.1455565202693297e-06, + "loss": 0.6488, + "step": 24423 + }, + { + "epoch": 0.85, + "learning_rate": 1.145050527841254e-06, + "loss": 0.5875, + "step": 24424 + }, + { + "epoch": 0.85, + "learning_rate": 1.144544640399805e-06, + "loss": 0.6534, + "step": 24425 + }, + { + "epoch": 0.85, + "learning_rate": 1.1440388579509842e-06, + "loss": 0.6113, + "step": 24426 + }, + { + "epoch": 0.85, + "learning_rate": 1.1435331805007833e-06, + "loss": 0.603, + "step": 24427 + }, + { + "epoch": 0.85, + "learning_rate": 1.1430276080551972e-06, + "loss": 0.615, + "step": 24428 + }, + { + "epoch": 0.85, + "learning_rate": 1.142522140620228e-06, + "loss": 0.6394, + "step": 24429 + }, + { + "epoch": 0.85, + "learning_rate": 1.142016778201861e-06, + "loss": 0.6682, + "step": 24430 + }, + { + "epoch": 0.85, + "learning_rate": 1.1415115208060913e-06, + "loss": 0.6223, + "step": 24431 + }, + { + "epoch": 0.85, + "learning_rate": 1.1410063684389106e-06, + "loss": 0.7128, + "step": 24432 + }, + { + "epoch": 0.85, + "learning_rate": 1.1405013211063032e-06, + "loss": 0.6352, + "step": 24433 + }, + { + "epoch": 0.85, + "learning_rate": 1.1399963788142575e-06, + "loss": 0.6275, + "step": 24434 + }, + { + "epoch": 0.85, + "learning_rate": 1.139491541568768e-06, + "loss": 0.5998, + "step": 24435 + }, + { + "epoch": 0.85, + "learning_rate": 1.1389868093758128e-06, + "loss": 0.7071, + "step": 24436 + }, + { + "epoch": 0.85, + "learning_rate": 1.1384821822413772e-06, + "loss": 0.6259, + "step": 24437 + }, + { + "epoch": 0.85, + "learning_rate": 1.1379776601714475e-06, + "loss": 0.6759, + "step": 24438 + }, + { + "epoch": 0.85, + "learning_rate": 1.1374732431720027e-06, + "loss": 0.636, + "step": 24439 + }, + { + "epoch": 0.85, + "learning_rate": 1.1369689312490196e-06, + "loss": 0.622, + "step": 24440 + }, + { + "epoch": 0.85, + "learning_rate": 1.136464724408487e-06, + "loss": 0.6424, + "step": 24441 + }, + { + "epoch": 0.85, + "learning_rate": 1.1359606226563746e-06, + "loss": 0.6208, + "step": 24442 + }, + { + "epoch": 0.85, + "learning_rate": 1.1354566259986631e-06, + "loss": 0.6118, + "step": 24443 + }, + { + "epoch": 0.85, + "learning_rate": 1.134952734441328e-06, + "loss": 0.6376, + "step": 24444 + }, + { + "epoch": 0.85, + "learning_rate": 1.1344489479903409e-06, + "loss": 0.6412, + "step": 24445 + }, + { + "epoch": 0.85, + "learning_rate": 1.133945266651675e-06, + "loss": 0.647, + "step": 24446 + }, + { + "epoch": 0.85, + "learning_rate": 1.1334416904313073e-06, + "loss": 0.5926, + "step": 24447 + }, + { + "epoch": 0.85, + "learning_rate": 1.1329382193352023e-06, + "loss": 0.6966, + "step": 24448 + }, + { + "epoch": 0.85, + "learning_rate": 1.1324348533693318e-06, + "loss": 0.6685, + "step": 24449 + }, + { + "epoch": 0.85, + "learning_rate": 1.1319315925396656e-06, + "loss": 0.5982, + "step": 24450 + }, + { + "epoch": 0.85, + "learning_rate": 1.1314284368521667e-06, + "loss": 0.6162, + "step": 24451 + }, + { + "epoch": 0.85, + "learning_rate": 1.1309253863128e-06, + "loss": 0.6702, + "step": 24452 + }, + { + "epoch": 0.85, + "learning_rate": 1.1304224409275365e-06, + "loss": 0.6361, + "step": 24453 + }, + { + "epoch": 0.85, + "learning_rate": 1.1299196007023338e-06, + "loss": 0.5743, + "step": 24454 + }, + { + "epoch": 0.85, + "learning_rate": 1.1294168656431536e-06, + "loss": 0.6174, + "step": 24455 + }, + { + "epoch": 0.85, + "learning_rate": 1.1289142357559612e-06, + "loss": 0.6173, + "step": 24456 + }, + { + "epoch": 0.85, + "learning_rate": 1.1284117110467097e-06, + "loss": 0.6423, + "step": 24457 + }, + { + "epoch": 0.85, + "learning_rate": 1.1279092915213585e-06, + "loss": 0.6446, + "step": 24458 + }, + { + "epoch": 0.85, + "learning_rate": 1.1274069771858697e-06, + "loss": 0.6442, + "step": 24459 + }, + { + "epoch": 0.85, + "learning_rate": 1.126904768046192e-06, + "loss": 0.6153, + "step": 24460 + }, + { + "epoch": 0.85, + "learning_rate": 1.1264026641082837e-06, + "loss": 0.6171, + "step": 24461 + }, + { + "epoch": 0.85, + "learning_rate": 1.125900665378099e-06, + "loss": 0.5959, + "step": 24462 + }, + { + "epoch": 0.85, + "learning_rate": 1.1253987718615866e-06, + "loss": 0.628, + "step": 24463 + }, + { + "epoch": 0.85, + "learning_rate": 1.124896983564695e-06, + "loss": 0.5986, + "step": 24464 + }, + { + "epoch": 0.85, + "learning_rate": 1.1243953004933805e-06, + "loss": 0.688, + "step": 24465 + }, + { + "epoch": 0.85, + "learning_rate": 1.1238937226535861e-06, + "loss": 0.6376, + "step": 24466 + }, + { + "epoch": 0.85, + "learning_rate": 1.1233922500512594e-06, + "loss": 0.5917, + "step": 24467 + }, + { + "epoch": 0.85, + "learning_rate": 1.122890882692349e-06, + "loss": 0.6242, + "step": 24468 + }, + { + "epoch": 0.85, + "learning_rate": 1.1223896205827956e-06, + "loss": 0.6678, + "step": 24469 + }, + { + "epoch": 0.85, + "learning_rate": 1.1218884637285398e-06, + "loss": 0.6484, + "step": 24470 + }, + { + "epoch": 0.85, + "learning_rate": 1.1213874121355327e-06, + "loss": 0.6509, + "step": 24471 + }, + { + "epoch": 0.85, + "learning_rate": 1.1208864658097062e-06, + "loss": 0.6309, + "step": 24472 + }, + { + "epoch": 0.85, + "learning_rate": 1.1203856247570033e-06, + "loss": 0.6094, + "step": 24473 + }, + { + "epoch": 0.85, + "learning_rate": 1.1198848889833636e-06, + "loss": 0.646, + "step": 24474 + }, + { + "epoch": 0.85, + "learning_rate": 1.119384258494719e-06, + "loss": 0.7011, + "step": 24475 + }, + { + "epoch": 0.85, + "learning_rate": 1.118883733297007e-06, + "loss": 0.6119, + "step": 24476 + }, + { + "epoch": 0.85, + "learning_rate": 1.1183833133961674e-06, + "loss": 0.5991, + "step": 24477 + }, + { + "epoch": 0.85, + "learning_rate": 1.1178829987981256e-06, + "loss": 0.6388, + "step": 24478 + }, + { + "epoch": 0.85, + "learning_rate": 1.1173827895088197e-06, + "loss": 0.6033, + "step": 24479 + }, + { + "epoch": 0.85, + "learning_rate": 1.1168826855341752e-06, + "loss": 0.6246, + "step": 24480 + }, + { + "epoch": 0.85, + "learning_rate": 1.116382686880124e-06, + "loss": 0.6179, + "step": 24481 + }, + { + "epoch": 0.85, + "learning_rate": 1.115882793552594e-06, + "loss": 0.6346, + "step": 24482 + }, + { + "epoch": 0.85, + "learning_rate": 1.115383005557511e-06, + "loss": 0.6547, + "step": 24483 + }, + { + "epoch": 0.85, + "learning_rate": 1.1148833229008028e-06, + "loss": 0.6308, + "step": 24484 + }, + { + "epoch": 0.85, + "learning_rate": 1.1143837455883932e-06, + "loss": 0.6337, + "step": 24485 + }, + { + "epoch": 0.85, + "learning_rate": 1.1138842736262035e-06, + "loss": 0.6816, + "step": 24486 + }, + { + "epoch": 0.85, + "learning_rate": 1.1133849070201564e-06, + "loss": 0.6544, + "step": 24487 + }, + { + "epoch": 0.85, + "learning_rate": 1.1128856457761728e-06, + "loss": 0.599, + "step": 24488 + }, + { + "epoch": 0.85, + "learning_rate": 1.1123864899001723e-06, + "loss": 0.6351, + "step": 24489 + }, + { + "epoch": 0.85, + "learning_rate": 1.1118874393980728e-06, + "loss": 0.6357, + "step": 24490 + }, + { + "epoch": 0.85, + "learning_rate": 1.1113884942757935e-06, + "loss": 0.6294, + "step": 24491 + }, + { + "epoch": 0.85, + "learning_rate": 1.1108896545392455e-06, + "loss": 0.6272, + "step": 24492 + }, + { + "epoch": 0.85, + "learning_rate": 1.1103909201943452e-06, + "loss": 0.6511, + "step": 24493 + }, + { + "epoch": 0.85, + "learning_rate": 1.1098922912470067e-06, + "loss": 0.622, + "step": 24494 + }, + { + "epoch": 0.85, + "learning_rate": 1.1093937677031408e-06, + "loss": 0.6951, + "step": 24495 + }, + { + "epoch": 0.85, + "learning_rate": 1.1088953495686584e-06, + "loss": 0.6238, + "step": 24496 + }, + { + "epoch": 0.85, + "learning_rate": 1.1083970368494702e-06, + "loss": 0.6061, + "step": 24497 + }, + { + "epoch": 0.85, + "learning_rate": 1.1078988295514825e-06, + "loss": 0.6148, + "step": 24498 + }, + { + "epoch": 0.85, + "learning_rate": 1.1074007276806009e-06, + "loss": 0.6568, + "step": 24499 + }, + { + "epoch": 0.85, + "learning_rate": 1.1069027312427349e-06, + "loss": 0.6871, + "step": 24500 + }, + { + "epoch": 0.85, + "learning_rate": 1.1064048402437855e-06, + "loss": 0.6704, + "step": 24501 + }, + { + "epoch": 0.85, + "learning_rate": 1.1059070546896577e-06, + "loss": 0.5918, + "step": 24502 + }, + { + "epoch": 0.85, + "learning_rate": 1.105409374586255e-06, + "loss": 0.6152, + "step": 24503 + }, + { + "epoch": 0.85, + "learning_rate": 1.1049117999394732e-06, + "loss": 0.5823, + "step": 24504 + }, + { + "epoch": 0.85, + "learning_rate": 1.1044143307552146e-06, + "loss": 0.6627, + "step": 24505 + }, + { + "epoch": 0.85, + "learning_rate": 1.1039169670393768e-06, + "loss": 0.6319, + "step": 24506 + }, + { + "epoch": 0.85, + "learning_rate": 1.1034197087978583e-06, + "loss": 0.6392, + "step": 24507 + }, + { + "epoch": 0.85, + "learning_rate": 1.102922556036552e-06, + "loss": 0.6188, + "step": 24508 + }, + { + "epoch": 0.85, + "learning_rate": 1.1024255087613566e-06, + "loss": 0.6802, + "step": 24509 + }, + { + "epoch": 0.85, + "learning_rate": 1.1019285669781598e-06, + "loss": 0.5946, + "step": 24510 + }, + { + "epoch": 0.85, + "learning_rate": 1.1014317306928557e-06, + "loss": 0.6112, + "step": 24511 + }, + { + "epoch": 0.85, + "learning_rate": 1.100934999911335e-06, + "loss": 0.594, + "step": 24512 + }, + { + "epoch": 0.85, + "learning_rate": 1.1004383746394876e-06, + "loss": 0.6558, + "step": 24513 + }, + { + "epoch": 0.85, + "learning_rate": 1.099941854883202e-06, + "loss": 0.6509, + "step": 24514 + }, + { + "epoch": 0.85, + "learning_rate": 1.0994454406483657e-06, + "loss": 0.6438, + "step": 24515 + }, + { + "epoch": 0.85, + "learning_rate": 1.0989491319408607e-06, + "loss": 0.6633, + "step": 24516 + }, + { + "epoch": 0.85, + "learning_rate": 1.0984529287665736e-06, + "loss": 0.6165, + "step": 24517 + }, + { + "epoch": 0.85, + "learning_rate": 1.0979568311313883e-06, + "loss": 0.6392, + "step": 24518 + }, + { + "epoch": 0.85, + "learning_rate": 1.0974608390411857e-06, + "loss": 0.6905, + "step": 24519 + }, + { + "epoch": 0.85, + "learning_rate": 1.0969649525018456e-06, + "loss": 0.5623, + "step": 24520 + }, + { + "epoch": 0.85, + "learning_rate": 1.096469171519252e-06, + "loss": 0.609, + "step": 24521 + }, + { + "epoch": 0.85, + "learning_rate": 1.0959734960992762e-06, + "loss": 0.6139, + "step": 24522 + }, + { + "epoch": 0.85, + "learning_rate": 1.0954779262477988e-06, + "loss": 0.5772, + "step": 24523 + }, + { + "epoch": 0.85, + "learning_rate": 1.094982461970695e-06, + "loss": 0.6264, + "step": 24524 + }, + { + "epoch": 0.85, + "learning_rate": 1.094487103273838e-06, + "loss": 0.7355, + "step": 24525 + }, + { + "epoch": 0.85, + "learning_rate": 1.093991850163103e-06, + "loss": 0.6183, + "step": 24526 + }, + { + "epoch": 0.85, + "learning_rate": 1.0934967026443622e-06, + "loss": 0.6673, + "step": 24527 + }, + { + "epoch": 0.85, + "learning_rate": 1.0930016607234829e-06, + "loss": 0.6095, + "step": 24528 + }, + { + "epoch": 0.85, + "learning_rate": 1.092506724406337e-06, + "loss": 0.6568, + "step": 24529 + }, + { + "epoch": 0.85, + "learning_rate": 1.092011893698791e-06, + "loss": 0.5843, + "step": 24530 + }, + { + "epoch": 0.85, + "learning_rate": 1.0915171686067128e-06, + "loss": 0.6277, + "step": 24531 + }, + { + "epoch": 0.85, + "learning_rate": 1.0910225491359682e-06, + "loss": 0.5909, + "step": 24532 + }, + { + "epoch": 0.85, + "learning_rate": 1.090528035292423e-06, + "loss": 0.5951, + "step": 24533 + }, + { + "epoch": 0.85, + "learning_rate": 1.0900336270819367e-06, + "loss": 0.6377, + "step": 24534 + }, + { + "epoch": 0.85, + "learning_rate": 1.0895393245103725e-06, + "loss": 0.6266, + "step": 24535 + }, + { + "epoch": 0.85, + "learning_rate": 1.089045127583591e-06, + "loss": 0.6611, + "step": 24536 + }, + { + "epoch": 0.85, + "learning_rate": 1.0885510363074536e-06, + "loss": 0.6333, + "step": 24537 + }, + { + "epoch": 0.85, + "learning_rate": 1.0880570506878152e-06, + "loss": 0.529, + "step": 24538 + }, + { + "epoch": 0.85, + "learning_rate": 1.0875631707305367e-06, + "loss": 0.6005, + "step": 24539 + }, + { + "epoch": 0.85, + "learning_rate": 1.0870693964414692e-06, + "loss": 0.6401, + "step": 24540 + }, + { + "epoch": 0.85, + "learning_rate": 1.0865757278264687e-06, + "loss": 0.6387, + "step": 24541 + }, + { + "epoch": 0.85, + "learning_rate": 1.0860821648913888e-06, + "loss": 0.6824, + "step": 24542 + }, + { + "epoch": 0.85, + "learning_rate": 1.08558870764208e-06, + "loss": 0.6772, + "step": 24543 + }, + { + "epoch": 0.85, + "learning_rate": 1.085095356084397e-06, + "loss": 0.6862, + "step": 24544 + }, + { + "epoch": 0.85, + "learning_rate": 1.0846021102241834e-06, + "loss": 0.653, + "step": 24545 + }, + { + "epoch": 0.85, + "learning_rate": 1.0841089700672903e-06, + "loss": 0.6314, + "step": 24546 + }, + { + "epoch": 0.85, + "learning_rate": 1.083615935619563e-06, + "loss": 0.6826, + "step": 24547 + }, + { + "epoch": 0.85, + "learning_rate": 1.0831230068868493e-06, + "loss": 0.6069, + "step": 24548 + }, + { + "epoch": 0.85, + "learning_rate": 1.082630183874992e-06, + "loss": 0.6578, + "step": 24549 + }, + { + "epoch": 0.85, + "learning_rate": 1.0821374665898354e-06, + "loss": 0.6193, + "step": 24550 + }, + { + "epoch": 0.85, + "learning_rate": 1.0816448550372194e-06, + "loss": 0.645, + "step": 24551 + }, + { + "epoch": 0.85, + "learning_rate": 1.0811523492229848e-06, + "loss": 0.6194, + "step": 24552 + }, + { + "epoch": 0.85, + "learning_rate": 1.0806599491529711e-06, + "loss": 0.6536, + "step": 24553 + }, + { + "epoch": 0.85, + "learning_rate": 1.0801676548330175e-06, + "loss": 0.6539, + "step": 24554 + }, + { + "epoch": 0.85, + "learning_rate": 1.0796754662689602e-06, + "loss": 0.6531, + "step": 24555 + }, + { + "epoch": 0.85, + "learning_rate": 1.0791833834666365e-06, + "loss": 0.6559, + "step": 24556 + }, + { + "epoch": 0.85, + "learning_rate": 1.0786914064318766e-06, + "loss": 0.5959, + "step": 24557 + }, + { + "epoch": 0.85, + "learning_rate": 1.0781995351705143e-06, + "loss": 0.5987, + "step": 24558 + }, + { + "epoch": 0.85, + "learning_rate": 1.0777077696883843e-06, + "loss": 0.5774, + "step": 24559 + }, + { + "epoch": 0.85, + "learning_rate": 1.0772161099913148e-06, + "loss": 0.5961, + "step": 24560 + }, + { + "epoch": 0.85, + "learning_rate": 1.0767245560851358e-06, + "loss": 0.6437, + "step": 24561 + }, + { + "epoch": 0.85, + "learning_rate": 1.0762331079756772e-06, + "loss": 0.6177, + "step": 24562 + }, + { + "epoch": 0.85, + "learning_rate": 1.0757417656687619e-06, + "loss": 0.6387, + "step": 24563 + }, + { + "epoch": 0.85, + "learning_rate": 1.0752505291702165e-06, + "loss": 0.6174, + "step": 24564 + }, + { + "epoch": 0.85, + "learning_rate": 1.074759398485866e-06, + "loss": 0.6329, + "step": 24565 + }, + { + "epoch": 0.85, + "learning_rate": 1.0742683736215343e-06, + "loss": 0.6712, + "step": 24566 + }, + { + "epoch": 0.85, + "learning_rate": 1.0737774545830415e-06, + "loss": 0.594, + "step": 24567 + }, + { + "epoch": 0.85, + "learning_rate": 1.073286641376211e-06, + "loss": 0.6578, + "step": 24568 + }, + { + "epoch": 0.85, + "learning_rate": 1.0727959340068571e-06, + "loss": 0.6227, + "step": 24569 + }, + { + "epoch": 0.85, + "learning_rate": 1.0723053324808008e-06, + "loss": 0.6311, + "step": 24570 + }, + { + "epoch": 0.85, + "learning_rate": 1.0718148368038583e-06, + "loss": 0.5826, + "step": 24571 + }, + { + "epoch": 0.85, + "learning_rate": 1.0713244469818452e-06, + "loss": 0.6384, + "step": 24572 + }, + { + "epoch": 0.85, + "learning_rate": 1.0708341630205754e-06, + "loss": 0.6424, + "step": 24573 + }, + { + "epoch": 0.85, + "learning_rate": 1.0703439849258646e-06, + "loss": 0.6213, + "step": 24574 + }, + { + "epoch": 0.85, + "learning_rate": 1.0698539127035191e-06, + "loss": 0.6498, + "step": 24575 + }, + { + "epoch": 0.85, + "learning_rate": 1.069363946359353e-06, + "loss": 0.6561, + "step": 24576 + }, + { + "epoch": 0.85, + "learning_rate": 1.0688740858991741e-06, + "loss": 0.6696, + "step": 24577 + }, + { + "epoch": 0.85, + "learning_rate": 1.0683843313287911e-06, + "loss": 0.655, + "step": 24578 + }, + { + "epoch": 0.85, + "learning_rate": 1.0678946826540104e-06, + "loss": 0.6576, + "step": 24579 + }, + { + "epoch": 0.85, + "learning_rate": 1.0674051398806395e-06, + "loss": 0.6544, + "step": 24580 + }, + { + "epoch": 0.85, + "learning_rate": 1.0669157030144773e-06, + "loss": 0.6531, + "step": 24581 + }, + { + "epoch": 0.85, + "learning_rate": 1.0664263720613311e-06, + "loss": 0.5799, + "step": 24582 + }, + { + "epoch": 0.85, + "learning_rate": 1.0659371470270009e-06, + "loss": 0.6567, + "step": 24583 + }, + { + "epoch": 0.85, + "learning_rate": 1.0654480279172874e-06, + "loss": 0.6409, + "step": 24584 + }, + { + "epoch": 0.85, + "learning_rate": 1.0649590147379907e-06, + "loss": 0.6347, + "step": 24585 + }, + { + "epoch": 0.85, + "learning_rate": 1.0644701074949082e-06, + "loss": 0.6511, + "step": 24586 + }, + { + "epoch": 0.85, + "learning_rate": 1.0639813061938353e-06, + "loss": 0.6914, + "step": 24587 + }, + { + "epoch": 0.85, + "learning_rate": 1.0634926108405675e-06, + "loss": 0.5978, + "step": 24588 + }, + { + "epoch": 0.85, + "learning_rate": 1.0630040214408998e-06, + "loss": 0.6573, + "step": 24589 + }, + { + "epoch": 0.85, + "learning_rate": 1.0625155380006247e-06, + "loss": 0.614, + "step": 24590 + }, + { + "epoch": 0.85, + "learning_rate": 1.062027160525534e-06, + "loss": 0.6257, + "step": 24591 + }, + { + "epoch": 0.85, + "learning_rate": 1.0615388890214207e-06, + "loss": 0.6225, + "step": 24592 + }, + { + "epoch": 0.85, + "learning_rate": 1.0610507234940681e-06, + "loss": 0.6153, + "step": 24593 + }, + { + "epoch": 0.85, + "learning_rate": 1.0605626639492671e-06, + "loss": 0.6396, + "step": 24594 + }, + { + "epoch": 0.85, + "learning_rate": 1.0600747103928043e-06, + "loss": 0.6472, + "step": 24595 + }, + { + "epoch": 0.85, + "learning_rate": 1.059586862830464e-06, + "loss": 0.6471, + "step": 24596 + }, + { + "epoch": 0.85, + "learning_rate": 1.0590991212680324e-06, + "loss": 0.6259, + "step": 24597 + }, + { + "epoch": 0.85, + "learning_rate": 1.0586114857112927e-06, + "loss": 0.6876, + "step": 24598 + }, + { + "epoch": 0.85, + "learning_rate": 1.0581239561660218e-06, + "loss": 0.6027, + "step": 24599 + }, + { + "epoch": 0.85, + "learning_rate": 1.0576365326380045e-06, + "loss": 0.6007, + "step": 24600 + }, + { + "epoch": 0.85, + "learning_rate": 1.0571492151330165e-06, + "loss": 0.6338, + "step": 24601 + }, + { + "epoch": 0.85, + "learning_rate": 1.0566620036568386e-06, + "loss": 0.6256, + "step": 24602 + }, + { + "epoch": 0.85, + "learning_rate": 1.0561748982152475e-06, + "loss": 0.6481, + "step": 24603 + }, + { + "epoch": 0.85, + "learning_rate": 1.055687898814015e-06, + "loss": 0.6068, + "step": 24604 + }, + { + "epoch": 0.85, + "learning_rate": 1.0552010054589178e-06, + "loss": 0.5791, + "step": 24605 + }, + { + "epoch": 0.85, + "learning_rate": 1.0547142181557267e-06, + "loss": 0.6076, + "step": 24606 + }, + { + "epoch": 0.85, + "learning_rate": 1.0542275369102163e-06, + "loss": 0.6163, + "step": 24607 + }, + { + "epoch": 0.85, + "learning_rate": 1.0537409617281536e-06, + "loss": 0.6922, + "step": 24608 + }, + { + "epoch": 0.85, + "learning_rate": 1.05325449261531e-06, + "loss": 0.6833, + "step": 24609 + }, + { + "epoch": 0.85, + "learning_rate": 1.0527681295774516e-06, + "loss": 0.6535, + "step": 24610 + }, + { + "epoch": 0.85, + "learning_rate": 1.0522818726203442e-06, + "loss": 0.6351, + "step": 24611 + }, + { + "epoch": 0.85, + "learning_rate": 1.0517957217497553e-06, + "loss": 0.5835, + "step": 24612 + }, + { + "epoch": 0.85, + "learning_rate": 1.051309676971447e-06, + "loss": 0.6092, + "step": 24613 + }, + { + "epoch": 0.85, + "learning_rate": 1.0508237382911823e-06, + "loss": 0.6421, + "step": 24614 + }, + { + "epoch": 0.85, + "learning_rate": 1.0503379057147257e-06, + "loss": 0.6326, + "step": 24615 + }, + { + "epoch": 0.85, + "learning_rate": 1.0498521792478323e-06, + "loss": 0.6562, + "step": 24616 + }, + { + "epoch": 0.85, + "learning_rate": 1.0493665588962632e-06, + "loss": 0.6085, + "step": 24617 + }, + { + "epoch": 0.85, + "learning_rate": 1.048881044665776e-06, + "loss": 0.6981, + "step": 24618 + }, + { + "epoch": 0.85, + "learning_rate": 1.0483956365621273e-06, + "loss": 0.6968, + "step": 24619 + }, + { + "epoch": 0.85, + "learning_rate": 1.0479103345910725e-06, + "loss": 0.6678, + "step": 24620 + }, + { + "epoch": 0.85, + "learning_rate": 1.0474251387583666e-06, + "loss": 0.5955, + "step": 24621 + }, + { + "epoch": 0.85, + "learning_rate": 1.046940049069759e-06, + "loss": 0.597, + "step": 24622 + }, + { + "epoch": 0.85, + "learning_rate": 1.0464550655310035e-06, + "loss": 0.6051, + "step": 24623 + }, + { + "epoch": 0.85, + "learning_rate": 1.0459701881478501e-06, + "loss": 0.6117, + "step": 24624 + }, + { + "epoch": 0.85, + "learning_rate": 1.0454854169260442e-06, + "loss": 0.6265, + "step": 24625 + }, + { + "epoch": 0.85, + "learning_rate": 1.045000751871338e-06, + "loss": 0.6347, + "step": 24626 + }, + { + "epoch": 0.85, + "learning_rate": 1.0445161929894776e-06, + "loss": 0.6262, + "step": 24627 + }, + { + "epoch": 0.85, + "learning_rate": 1.0440317402862044e-06, + "loss": 0.6042, + "step": 24628 + }, + { + "epoch": 0.85, + "learning_rate": 1.0435473937672646e-06, + "loss": 0.6401, + "step": 24629 + }, + { + "epoch": 0.85, + "learning_rate": 1.0430631534384027e-06, + "loss": 0.662, + "step": 24630 + }, + { + "epoch": 0.85, + "learning_rate": 1.042579019305353e-06, + "loss": 0.635, + "step": 24631 + }, + { + "epoch": 0.85, + "learning_rate": 1.042094991373863e-06, + "loss": 0.5887, + "step": 24632 + }, + { + "epoch": 0.85, + "learning_rate": 1.0416110696496695e-06, + "loss": 0.5704, + "step": 24633 + }, + { + "epoch": 0.85, + "learning_rate": 1.0411272541385088e-06, + "loss": 0.6269, + "step": 24634 + }, + { + "epoch": 0.85, + "learning_rate": 1.040643544846116e-06, + "loss": 0.6071, + "step": 24635 + }, + { + "epoch": 0.85, + "learning_rate": 1.0401599417782304e-06, + "loss": 0.6603, + "step": 24636 + }, + { + "epoch": 0.85, + "learning_rate": 1.0396764449405793e-06, + "loss": 0.6782, + "step": 24637 + }, + { + "epoch": 0.85, + "learning_rate": 1.0391930543389006e-06, + "loss": 0.6556, + "step": 24638 + }, + { + "epoch": 0.85, + "learning_rate": 1.038709769978925e-06, + "loss": 0.6953, + "step": 24639 + }, + { + "epoch": 0.85, + "learning_rate": 1.0382265918663803e-06, + "loss": 0.6648, + "step": 24640 + }, + { + "epoch": 0.85, + "learning_rate": 1.0377435200069952e-06, + "loss": 0.6035, + "step": 24641 + }, + { + "epoch": 0.85, + "learning_rate": 1.0372605544064994e-06, + "loss": 0.587, + "step": 24642 + }, + { + "epoch": 0.85, + "learning_rate": 1.0367776950706155e-06, + "loss": 0.7101, + "step": 24643 + }, + { + "epoch": 0.85, + "learning_rate": 1.0362949420050716e-06, + "loss": 0.5753, + "step": 24644 + }, + { + "epoch": 0.85, + "learning_rate": 1.0358122952155914e-06, + "loss": 0.578, + "step": 24645 + }, + { + "epoch": 0.85, + "learning_rate": 1.0353297547078955e-06, + "loss": 0.6242, + "step": 24646 + }, + { + "epoch": 0.85, + "learning_rate": 1.0348473204877052e-06, + "loss": 0.5931, + "step": 24647 + }, + { + "epoch": 0.85, + "learning_rate": 1.0343649925607424e-06, + "loss": 0.6402, + "step": 24648 + }, + { + "epoch": 0.85, + "learning_rate": 1.0338827709327215e-06, + "loss": 0.6013, + "step": 24649 + }, + { + "epoch": 0.85, + "learning_rate": 1.0334006556093634e-06, + "loss": 0.6386, + "step": 24650 + }, + { + "epoch": 0.85, + "learning_rate": 1.032918646596386e-06, + "loss": 0.603, + "step": 24651 + }, + { + "epoch": 0.85, + "learning_rate": 1.0324367438994986e-06, + "loss": 0.6616, + "step": 24652 + }, + { + "epoch": 0.85, + "learning_rate": 1.0319549475244184e-06, + "loss": 0.6507, + "step": 24653 + }, + { + "epoch": 0.85, + "learning_rate": 1.0314732574768593e-06, + "loss": 0.5625, + "step": 24654 + }, + { + "epoch": 0.85, + "learning_rate": 1.0309916737625248e-06, + "loss": 0.6469, + "step": 24655 + }, + { + "epoch": 0.85, + "learning_rate": 1.0305101963871333e-06, + "loss": 0.5889, + "step": 24656 + }, + { + "epoch": 0.85, + "learning_rate": 1.0300288253563905e-06, + "loss": 0.6173, + "step": 24657 + }, + { + "epoch": 0.85, + "learning_rate": 1.029547560676002e-06, + "loss": 0.6953, + "step": 24658 + }, + { + "epoch": 0.85, + "learning_rate": 1.0290664023516738e-06, + "loss": 0.6424, + "step": 24659 + }, + { + "epoch": 0.85, + "learning_rate": 1.0285853503891153e-06, + "loss": 0.602, + "step": 24660 + }, + { + "epoch": 0.85, + "learning_rate": 1.0281044047940214e-06, + "loss": 0.5939, + "step": 24661 + }, + { + "epoch": 0.85, + "learning_rate": 1.0276235655721012e-06, + "loss": 0.6664, + "step": 24662 + }, + { + "epoch": 0.85, + "learning_rate": 1.0271428327290555e-06, + "loss": 0.6034, + "step": 24663 + }, + { + "epoch": 0.85, + "learning_rate": 1.026662206270581e-06, + "loss": 0.6349, + "step": 24664 + }, + { + "epoch": 0.85, + "learning_rate": 1.0261816862023787e-06, + "loss": 0.6811, + "step": 24665 + }, + { + "epoch": 0.85, + "learning_rate": 1.025701272530143e-06, + "loss": 0.6411, + "step": 24666 + }, + { + "epoch": 0.85, + "learning_rate": 1.025220965259569e-06, + "loss": 0.5957, + "step": 24667 + }, + { + "epoch": 0.85, + "learning_rate": 1.024740764396357e-06, + "loss": 0.6948, + "step": 24668 + }, + { + "epoch": 0.85, + "learning_rate": 1.0242606699461966e-06, + "loss": 0.6325, + "step": 24669 + }, + { + "epoch": 0.85, + "learning_rate": 1.0237806819147788e-06, + "loss": 0.6294, + "step": 24670 + }, + { + "epoch": 0.85, + "learning_rate": 1.0233008003077982e-06, + "loss": 0.6661, + "step": 24671 + }, + { + "epoch": 0.85, + "learning_rate": 1.0228210251309412e-06, + "loss": 0.7067, + "step": 24672 + }, + { + "epoch": 0.85, + "learning_rate": 1.0223413563898944e-06, + "loss": 0.6416, + "step": 24673 + }, + { + "epoch": 0.85, + "learning_rate": 1.021861794090352e-06, + "loss": 0.6408, + "step": 24674 + }, + { + "epoch": 0.85, + "learning_rate": 1.0213823382379927e-06, + "loss": 0.6439, + "step": 24675 + }, + { + "epoch": 0.85, + "learning_rate": 1.0209029888385036e-06, + "loss": 0.6761, + "step": 24676 + }, + { + "epoch": 0.85, + "learning_rate": 1.0204237458975708e-06, + "loss": 0.6445, + "step": 24677 + }, + { + "epoch": 0.86, + "learning_rate": 1.019944609420872e-06, + "loss": 0.642, + "step": 24678 + }, + { + "epoch": 0.86, + "learning_rate": 1.0194655794140872e-06, + "loss": 0.6181, + "step": 24679 + }, + { + "epoch": 0.86, + "learning_rate": 1.0189866558829032e-06, + "loss": 0.6033, + "step": 24680 + }, + { + "epoch": 0.86, + "learning_rate": 1.0185078388329905e-06, + "loss": 0.6798, + "step": 24681 + }, + { + "epoch": 0.86, + "learning_rate": 1.0180291282700295e-06, + "loss": 0.6445, + "step": 24682 + }, + { + "epoch": 0.86, + "learning_rate": 1.0175505241996974e-06, + "loss": 0.6625, + "step": 24683 + }, + { + "epoch": 0.86, + "learning_rate": 1.0170720266276647e-06, + "loss": 0.6793, + "step": 24684 + }, + { + "epoch": 0.86, + "learning_rate": 1.016593635559604e-06, + "loss": 0.6188, + "step": 24685 + }, + { + "epoch": 0.86, + "learning_rate": 1.0161153510011945e-06, + "loss": 0.6853, + "step": 24686 + }, + { + "epoch": 0.86, + "learning_rate": 1.0156371729580993e-06, + "loss": 0.6328, + "step": 24687 + }, + { + "epoch": 0.86, + "learning_rate": 1.0151591014359918e-06, + "loss": 0.6266, + "step": 24688 + }, + { + "epoch": 0.86, + "learning_rate": 1.0146811364405407e-06, + "loss": 0.6113, + "step": 24689 + }, + { + "epoch": 0.86, + "learning_rate": 1.0142032779774092e-06, + "loss": 0.6583, + "step": 24690 + }, + { + "epoch": 0.86, + "learning_rate": 1.0137255260522628e-06, + "loss": 0.5799, + "step": 24691 + }, + { + "epoch": 0.86, + "learning_rate": 1.0132478806707713e-06, + "loss": 0.6683, + "step": 24692 + }, + { + "epoch": 0.86, + "learning_rate": 1.0127703418385937e-06, + "loss": 0.6094, + "step": 24693 + }, + { + "epoch": 0.86, + "learning_rate": 1.012292909561392e-06, + "loss": 0.614, + "step": 24694 + }, + { + "epoch": 0.86, + "learning_rate": 1.0118155838448297e-06, + "loss": 0.6435, + "step": 24695 + }, + { + "epoch": 0.86, + "learning_rate": 1.0113383646945617e-06, + "loss": 0.6533, + "step": 24696 + }, + { + "epoch": 0.86, + "learning_rate": 1.0108612521162453e-06, + "loss": 0.6248, + "step": 24697 + }, + { + "epoch": 0.86, + "learning_rate": 1.0103842461155456e-06, + "loss": 0.6321, + "step": 24698 + }, + { + "epoch": 0.86, + "learning_rate": 1.0099073466981091e-06, + "loss": 0.635, + "step": 24699 + }, + { + "epoch": 0.86, + "learning_rate": 1.0094305538695937e-06, + "loss": 0.6395, + "step": 24700 + }, + { + "epoch": 0.86, + "learning_rate": 1.0089538676356546e-06, + "loss": 0.6475, + "step": 24701 + }, + { + "epoch": 0.86, + "learning_rate": 1.00847728800194e-06, + "loss": 0.5902, + "step": 24702 + }, + { + "epoch": 0.86, + "learning_rate": 1.0080008149740984e-06, + "loss": 0.5833, + "step": 24703 + }, + { + "epoch": 0.86, + "learning_rate": 1.0075244485577863e-06, + "loss": 0.6404, + "step": 24704 + }, + { + "epoch": 0.86, + "learning_rate": 1.0070481887586459e-06, + "loss": 0.63, + "step": 24705 + }, + { + "epoch": 0.86, + "learning_rate": 1.0065720355823238e-06, + "loss": 0.6058, + "step": 24706 + }, + { + "epoch": 0.86, + "learning_rate": 1.0060959890344702e-06, + "loss": 0.6549, + "step": 24707 + }, + { + "epoch": 0.86, + "learning_rate": 1.0056200491207246e-06, + "loss": 0.6045, + "step": 24708 + }, + { + "epoch": 0.86, + "learning_rate": 1.0051442158467283e-06, + "loss": 0.6337, + "step": 24709 + }, + { + "epoch": 0.86, + "learning_rate": 1.0046684892181303e-06, + "loss": 0.6135, + "step": 24710 + }, + { + "epoch": 0.86, + "learning_rate": 1.0041928692405645e-06, + "loss": 0.6157, + "step": 24711 + }, + { + "epoch": 0.86, + "learning_rate": 1.003717355919671e-06, + "loss": 0.7028, + "step": 24712 + }, + { + "epoch": 0.86, + "learning_rate": 1.0032419492610911e-06, + "loss": 0.6539, + "step": 24713 + }, + { + "epoch": 0.86, + "learning_rate": 1.002766649270458e-06, + "loss": 0.6621, + "step": 24714 + }, + { + "epoch": 0.86, + "learning_rate": 1.0022914559534048e-06, + "loss": 0.5894, + "step": 24715 + }, + { + "epoch": 0.86, + "learning_rate": 1.0018163693155726e-06, + "loss": 0.6183, + "step": 24716 + }, + { + "epoch": 0.86, + "learning_rate": 1.0013413893625879e-06, + "loss": 0.6104, + "step": 24717 + }, + { + "epoch": 0.86, + "learning_rate": 1.0008665161000853e-06, + "loss": 0.6171, + "step": 24718 + }, + { + "epoch": 0.86, + "learning_rate": 1.0003917495336956e-06, + "loss": 0.6826, + "step": 24719 + }, + { + "epoch": 0.86, + "learning_rate": 9.999170896690436e-07, + "loss": 0.6284, + "step": 24720 + }, + { + "epoch": 0.86, + "learning_rate": 9.994425365117587e-07, + "loss": 0.614, + "step": 24721 + }, + { + "epoch": 0.86, + "learning_rate": 9.989680900674714e-07, + "loss": 0.65, + "step": 24722 + }, + { + "epoch": 0.86, + "learning_rate": 9.984937503418024e-07, + "loss": 0.6198, + "step": 24723 + }, + { + "epoch": 0.86, + "learning_rate": 9.980195173403772e-07, + "loss": 0.6285, + "step": 24724 + }, + { + "epoch": 0.86, + "learning_rate": 9.975453910688193e-07, + "loss": 0.6635, + "step": 24725 + }, + { + "epoch": 0.86, + "learning_rate": 9.970713715327473e-07, + "loss": 0.6579, + "step": 24726 + }, + { + "epoch": 0.86, + "learning_rate": 9.965974587377835e-07, + "loss": 0.6057, + "step": 24727 + }, + { + "epoch": 0.86, + "learning_rate": 9.961236526895457e-07, + "loss": 0.6665, + "step": 24728 + }, + { + "epoch": 0.86, + "learning_rate": 9.956499533936525e-07, + "loss": 0.6508, + "step": 24729 + }, + { + "epoch": 0.86, + "learning_rate": 9.951763608557208e-07, + "loss": 0.5992, + "step": 24730 + }, + { + "epoch": 0.86, + "learning_rate": 9.947028750813625e-07, + "loss": 0.6486, + "step": 24731 + }, + { + "epoch": 0.86, + "learning_rate": 9.942294960761944e-07, + "loss": 0.7002, + "step": 24732 + }, + { + "epoch": 0.86, + "learning_rate": 9.937562238458277e-07, + "loss": 0.6117, + "step": 24733 + }, + { + "epoch": 0.86, + "learning_rate": 9.93283058395873e-07, + "loss": 0.6867, + "step": 24734 + }, + { + "epoch": 0.86, + "learning_rate": 9.928099997319417e-07, + "loss": 0.6499, + "step": 24735 + }, + { + "epoch": 0.86, + "learning_rate": 9.923370478596438e-07, + "loss": 0.6031, + "step": 24736 + }, + { + "epoch": 0.86, + "learning_rate": 9.918642027845837e-07, + "loss": 0.5838, + "step": 24737 + }, + { + "epoch": 0.86, + "learning_rate": 9.913914645123678e-07, + "loss": 0.6402, + "step": 24738 + }, + { + "epoch": 0.86, + "learning_rate": 9.90918833048603e-07, + "loss": 0.676, + "step": 24739 + }, + { + "epoch": 0.86, + "learning_rate": 9.904463083988912e-07, + "loss": 0.649, + "step": 24740 + }, + { + "epoch": 0.86, + "learning_rate": 9.89973890568836e-07, + "loss": 0.593, + "step": 24741 + }, + { + "epoch": 0.86, + "learning_rate": 9.895015795640406e-07, + "loss": 0.6527, + "step": 24742 + }, + { + "epoch": 0.86, + "learning_rate": 9.890293753900992e-07, + "loss": 0.6249, + "step": 24743 + }, + { + "epoch": 0.86, + "learning_rate": 9.885572780526143e-07, + "loss": 0.5923, + "step": 24744 + }, + { + "epoch": 0.86, + "learning_rate": 9.880852875571823e-07, + "loss": 0.6317, + "step": 24745 + }, + { + "epoch": 0.86, + "learning_rate": 9.876134039093988e-07, + "loss": 0.6503, + "step": 24746 + }, + { + "epoch": 0.86, + "learning_rate": 9.871416271148604e-07, + "loss": 0.615, + "step": 24747 + }, + { + "epoch": 0.86, + "learning_rate": 9.866699571791593e-07, + "loss": 0.6838, + "step": 24748 + }, + { + "epoch": 0.86, + "learning_rate": 9.86198394107888e-07, + "loss": 0.6344, + "step": 24749 + }, + { + "epoch": 0.86, + "learning_rate": 9.857269379066358e-07, + "loss": 0.5869, + "step": 24750 + }, + { + "epoch": 0.86, + "learning_rate": 9.852555885809945e-07, + "loss": 0.6226, + "step": 24751 + }, + { + "epoch": 0.86, + "learning_rate": 9.847843461365513e-07, + "loss": 0.6232, + "step": 24752 + }, + { + "epoch": 0.86, + "learning_rate": 9.843132105788944e-07, + "loss": 0.6656, + "step": 24753 + }, + { + "epoch": 0.86, + "learning_rate": 9.838421819136112e-07, + "loss": 0.6217, + "step": 24754 + }, + { + "epoch": 0.86, + "learning_rate": 9.833712601462819e-07, + "loss": 0.657, + "step": 24755 + }, + { + "epoch": 0.86, + "learning_rate": 9.82900445282493e-07, + "loss": 0.6254, + "step": 24756 + }, + { + "epoch": 0.86, + "learning_rate": 9.824297373278268e-07, + "loss": 0.6456, + "step": 24757 + }, + { + "epoch": 0.86, + "learning_rate": 9.819591362878621e-07, + "loss": 0.6188, + "step": 24758 + }, + { + "epoch": 0.86, + "learning_rate": 9.814886421681802e-07, + "loss": 0.5853, + "step": 24759 + }, + { + "epoch": 0.86, + "learning_rate": 9.810182549743608e-07, + "loss": 0.6454, + "step": 24760 + }, + { + "epoch": 0.86, + "learning_rate": 9.805479747119773e-07, + "loss": 0.6098, + "step": 24761 + }, + { + "epoch": 0.86, + "learning_rate": 9.800778013866064e-07, + "loss": 0.5959, + "step": 24762 + }, + { + "epoch": 0.86, + "learning_rate": 9.796077350038247e-07, + "loss": 0.6043, + "step": 24763 + }, + { + "epoch": 0.86, + "learning_rate": 9.791377755692034e-07, + "loss": 0.6433, + "step": 24764 + }, + { + "epoch": 0.86, + "learning_rate": 9.786679230883155e-07, + "loss": 0.6613, + "step": 24765 + }, + { + "epoch": 0.86, + "learning_rate": 9.781981775667327e-07, + "loss": 0.6245, + "step": 24766 + }, + { + "epoch": 0.86, + "learning_rate": 9.777285390100221e-07, + "loss": 0.6693, + "step": 24767 + }, + { + "epoch": 0.86, + "learning_rate": 9.77259007423752e-07, + "loss": 0.6291, + "step": 24768 + }, + { + "epoch": 0.86, + "learning_rate": 9.76789582813491e-07, + "loss": 0.6254, + "step": 24769 + }, + { + "epoch": 0.86, + "learning_rate": 9.763202651848035e-07, + "loss": 0.6232, + "step": 24770 + }, + { + "epoch": 0.86, + "learning_rate": 9.758510545432543e-07, + "loss": 0.6308, + "step": 24771 + }, + { + "epoch": 0.86, + "learning_rate": 9.753819508944085e-07, + "loss": 0.6005, + "step": 24772 + }, + { + "epoch": 0.86, + "learning_rate": 9.749129542438241e-07, + "loss": 0.6421, + "step": 24773 + }, + { + "epoch": 0.86, + "learning_rate": 9.744440645970633e-07, + "loss": 0.7088, + "step": 24774 + }, + { + "epoch": 0.86, + "learning_rate": 9.73975281959686e-07, + "loss": 0.5766, + "step": 24775 + }, + { + "epoch": 0.86, + "learning_rate": 9.735066063372488e-07, + "loss": 0.7131, + "step": 24776 + }, + { + "epoch": 0.86, + "learning_rate": 9.7303803773531e-07, + "loss": 0.6393, + "step": 24777 + }, + { + "epoch": 0.86, + "learning_rate": 9.725695761594256e-07, + "loss": 0.5966, + "step": 24778 + }, + { + "epoch": 0.86, + "learning_rate": 9.721012216151472e-07, + "loss": 0.64, + "step": 24779 + }, + { + "epoch": 0.86, + "learning_rate": 9.716329741080288e-07, + "loss": 0.5694, + "step": 24780 + }, + { + "epoch": 0.86, + "learning_rate": 9.71164833643623e-07, + "loss": 0.6466, + "step": 24781 + }, + { + "epoch": 0.86, + "learning_rate": 9.706968002274797e-07, + "loss": 0.6149, + "step": 24782 + }, + { + "epoch": 0.86, + "learning_rate": 9.702288738651477e-07, + "loss": 0.6745, + "step": 24783 + }, + { + "epoch": 0.86, + "learning_rate": 9.697610545621772e-07, + "loss": 0.5783, + "step": 24784 + }, + { + "epoch": 0.86, + "learning_rate": 9.692933423241101e-07, + "loss": 0.6206, + "step": 24785 + }, + { + "epoch": 0.86, + "learning_rate": 9.688257371564947e-07, + "loss": 0.6281, + "step": 24786 + }, + { + "epoch": 0.86, + "learning_rate": 9.683582390648748e-07, + "loss": 0.5873, + "step": 24787 + }, + { + "epoch": 0.86, + "learning_rate": 9.678908480547932e-07, + "loss": 0.5923, + "step": 24788 + }, + { + "epoch": 0.86, + "learning_rate": 9.67423564131792e-07, + "loss": 0.6038, + "step": 24789 + }, + { + "epoch": 0.86, + "learning_rate": 9.669563873014108e-07, + "loss": 0.6748, + "step": 24790 + }, + { + "epoch": 0.86, + "learning_rate": 9.66489317569188e-07, + "loss": 0.6127, + "step": 24791 + }, + { + "epoch": 0.86, + "learning_rate": 9.660223549406611e-07, + "loss": 0.572, + "step": 24792 + }, + { + "epoch": 0.86, + "learning_rate": 9.65555499421368e-07, + "loss": 0.6837, + "step": 24793 + }, + { + "epoch": 0.86, + "learning_rate": 9.650887510168427e-07, + "loss": 0.6368, + "step": 24794 + }, + { + "epoch": 0.86, + "learning_rate": 9.646221097326213e-07, + "loss": 0.6059, + "step": 24795 + }, + { + "epoch": 0.86, + "learning_rate": 9.641555755742328e-07, + "loss": 0.688, + "step": 24796 + }, + { + "epoch": 0.86, + "learning_rate": 9.6368914854721e-07, + "loss": 0.5705, + "step": 24797 + }, + { + "epoch": 0.86, + "learning_rate": 9.632228286570832e-07, + "loss": 0.6962, + "step": 24798 + }, + { + "epoch": 0.86, + "learning_rate": 9.627566159093815e-07, + "loss": 0.659, + "step": 24799 + }, + { + "epoch": 0.86, + "learning_rate": 9.622905103096324e-07, + "loss": 0.6544, + "step": 24800 + }, + { + "epoch": 0.86, + "learning_rate": 9.61824511863364e-07, + "loss": 0.6332, + "step": 24801 + }, + { + "epoch": 0.86, + "learning_rate": 9.613586205760983e-07, + "loss": 0.6164, + "step": 24802 + }, + { + "epoch": 0.86, + "learning_rate": 9.608928364533588e-07, + "loss": 0.6495, + "step": 24803 + }, + { + "epoch": 0.86, + "learning_rate": 9.604271595006698e-07, + "loss": 0.6028, + "step": 24804 + }, + { + "epoch": 0.86, + "learning_rate": 9.599615897235514e-07, + "loss": 0.6201, + "step": 24805 + }, + { + "epoch": 0.86, + "learning_rate": 9.59496127127525e-07, + "loss": 0.6444, + "step": 24806 + }, + { + "epoch": 0.86, + "learning_rate": 9.590307717181103e-07, + "loss": 0.6652, + "step": 24807 + }, + { + "epoch": 0.86, + "learning_rate": 9.585655235008195e-07, + "loss": 0.6052, + "step": 24808 + }, + { + "epoch": 0.86, + "learning_rate": 9.58100382481173e-07, + "loss": 0.6792, + "step": 24809 + }, + { + "epoch": 0.86, + "learning_rate": 9.57635348664684e-07, + "loss": 0.6157, + "step": 24810 + }, + { + "epoch": 0.86, + "learning_rate": 9.571704220568668e-07, + "loss": 0.6536, + "step": 24811 + }, + { + "epoch": 0.86, + "learning_rate": 9.567056026632337e-07, + "loss": 0.5903, + "step": 24812 + }, + { + "epoch": 0.86, + "learning_rate": 9.562408904892972e-07, + "loss": 0.635, + "step": 24813 + }, + { + "epoch": 0.86, + "learning_rate": 9.557762855405627e-07, + "loss": 0.6585, + "step": 24814 + }, + { + "epoch": 0.86, + "learning_rate": 9.553117878225425e-07, + "loss": 0.6012, + "step": 24815 + }, + { + "epoch": 0.86, + "learning_rate": 9.548473973407423e-07, + "loss": 0.6168, + "step": 24816 + }, + { + "epoch": 0.86, + "learning_rate": 9.543831141006676e-07, + "loss": 0.6199, + "step": 24817 + }, + { + "epoch": 0.86, + "learning_rate": 9.539189381078251e-07, + "loss": 0.7044, + "step": 24818 + }, + { + "epoch": 0.86, + "learning_rate": 9.534548693677181e-07, + "loss": 0.6862, + "step": 24819 + }, + { + "epoch": 0.86, + "learning_rate": 9.529909078858457e-07, + "loss": 0.6173, + "step": 24820 + }, + { + "epoch": 0.86, + "learning_rate": 9.525270536677112e-07, + "loss": 0.5814, + "step": 24821 + }, + { + "epoch": 0.86, + "learning_rate": 9.520633067188134e-07, + "loss": 0.5801, + "step": 24822 + }, + { + "epoch": 0.86, + "learning_rate": 9.515996670446504e-07, + "loss": 0.5689, + "step": 24823 + }, + { + "epoch": 0.86, + "learning_rate": 9.511361346507197e-07, + "loss": 0.6329, + "step": 24824 + }, + { + "epoch": 0.86, + "learning_rate": 9.506727095425183e-07, + "loss": 0.5842, + "step": 24825 + }, + { + "epoch": 0.86, + "learning_rate": 9.502093917255384e-07, + "loss": 0.6392, + "step": 24826 + }, + { + "epoch": 0.86, + "learning_rate": 9.497461812052744e-07, + "loss": 0.6374, + "step": 24827 + }, + { + "epoch": 0.86, + "learning_rate": 9.492830779872175e-07, + "loss": 0.6544, + "step": 24828 + }, + { + "epoch": 0.86, + "learning_rate": 9.48820082076859e-07, + "loss": 0.6234, + "step": 24829 + }, + { + "epoch": 0.86, + "learning_rate": 9.483571934796887e-07, + "loss": 0.6569, + "step": 24830 + }, + { + "epoch": 0.86, + "learning_rate": 9.478944122011958e-07, + "loss": 0.6063, + "step": 24831 + }, + { + "epoch": 0.86, + "learning_rate": 9.474317382468634e-07, + "loss": 0.6362, + "step": 24832 + }, + { + "epoch": 0.86, + "learning_rate": 9.469691716221796e-07, + "loss": 0.6422, + "step": 24833 + }, + { + "epoch": 0.86, + "learning_rate": 9.465067123326277e-07, + "loss": 0.6035, + "step": 24834 + }, + { + "epoch": 0.86, + "learning_rate": 9.460443603836922e-07, + "loss": 0.6547, + "step": 24835 + }, + { + "epoch": 0.86, + "learning_rate": 9.455821157808543e-07, + "loss": 0.6446, + "step": 24836 + }, + { + "epoch": 0.86, + "learning_rate": 9.451199785295961e-07, + "loss": 0.634, + "step": 24837 + }, + { + "epoch": 0.86, + "learning_rate": 9.446579486353924e-07, + "loss": 0.6555, + "step": 24838 + }, + { + "epoch": 0.86, + "learning_rate": 9.441960261037241e-07, + "loss": 0.7614, + "step": 24839 + }, + { + "epoch": 0.86, + "learning_rate": 9.437342109400683e-07, + "loss": 0.6125, + "step": 24840 + }, + { + "epoch": 0.86, + "learning_rate": 9.43272503149899e-07, + "loss": 0.6599, + "step": 24841 + }, + { + "epoch": 0.86, + "learning_rate": 9.428109027386911e-07, + "loss": 0.6323, + "step": 24842 + }, + { + "epoch": 0.86, + "learning_rate": 9.423494097119201e-07, + "loss": 0.6153, + "step": 24843 + }, + { + "epoch": 0.86, + "learning_rate": 9.418880240750517e-07, + "loss": 0.6267, + "step": 24844 + }, + { + "epoch": 0.86, + "learning_rate": 9.414267458335602e-07, + "loss": 0.7123, + "step": 24845 + }, + { + "epoch": 0.86, + "learning_rate": 9.409655749929136e-07, + "loss": 0.6401, + "step": 24846 + }, + { + "epoch": 0.86, + "learning_rate": 9.405045115585787e-07, + "loss": 0.6278, + "step": 24847 + }, + { + "epoch": 0.86, + "learning_rate": 9.400435555360243e-07, + "loss": 0.6758, + "step": 24848 + }, + { + "epoch": 0.86, + "learning_rate": 9.395827069307162e-07, + "loss": 0.6275, + "step": 24849 + }, + { + "epoch": 0.86, + "learning_rate": 9.391219657481143e-07, + "loss": 0.6014, + "step": 24850 + }, + { + "epoch": 0.86, + "learning_rate": 9.386613319936843e-07, + "loss": 0.6534, + "step": 24851 + }, + { + "epoch": 0.86, + "learning_rate": 9.382008056728864e-07, + "loss": 0.6633, + "step": 24852 + }, + { + "epoch": 0.86, + "learning_rate": 9.377403867911816e-07, + "loss": 0.6669, + "step": 24853 + }, + { + "epoch": 0.86, + "learning_rate": 9.372800753540301e-07, + "loss": 0.6029, + "step": 24854 + }, + { + "epoch": 0.86, + "learning_rate": 9.368198713668853e-07, + "loss": 0.6159, + "step": 24855 + }, + { + "epoch": 0.86, + "learning_rate": 9.363597748352061e-07, + "loss": 0.5878, + "step": 24856 + }, + { + "epoch": 0.86, + "learning_rate": 9.358997857644492e-07, + "loss": 0.6076, + "step": 24857 + }, + { + "epoch": 0.86, + "learning_rate": 9.354399041600625e-07, + "loss": 0.6283, + "step": 24858 + }, + { + "epoch": 0.86, + "learning_rate": 9.349801300275052e-07, + "loss": 0.6752, + "step": 24859 + }, + { + "epoch": 0.86, + "learning_rate": 9.345204633722272e-07, + "loss": 0.6388, + "step": 24860 + }, + { + "epoch": 0.86, + "learning_rate": 9.340609041996751e-07, + "loss": 0.5739, + "step": 24861 + }, + { + "epoch": 0.86, + "learning_rate": 9.336014525152992e-07, + "loss": 0.5939, + "step": 24862 + }, + { + "epoch": 0.86, + "learning_rate": 9.331421083245495e-07, + "loss": 0.5901, + "step": 24863 + }, + { + "epoch": 0.86, + "learning_rate": 9.326828716328651e-07, + "loss": 0.5933, + "step": 24864 + }, + { + "epoch": 0.86, + "learning_rate": 9.322237424456981e-07, + "loss": 0.6254, + "step": 24865 + }, + { + "epoch": 0.86, + "learning_rate": 9.31764720768491e-07, + "loss": 0.67, + "step": 24866 + }, + { + "epoch": 0.86, + "learning_rate": 9.313058066066827e-07, + "loss": 0.6047, + "step": 24867 + }, + { + "epoch": 0.86, + "learning_rate": 9.308469999657166e-07, + "loss": 0.7025, + "step": 24868 + }, + { + "epoch": 0.86, + "learning_rate": 9.303883008510328e-07, + "loss": 0.6381, + "step": 24869 + }, + { + "epoch": 0.86, + "learning_rate": 9.299297092680659e-07, + "loss": 0.7041, + "step": 24870 + }, + { + "epoch": 0.86, + "learning_rate": 9.294712252222571e-07, + "loss": 0.6592, + "step": 24871 + }, + { + "epoch": 0.86, + "learning_rate": 9.290128487190442e-07, + "loss": 0.663, + "step": 24872 + }, + { + "epoch": 0.86, + "learning_rate": 9.285545797638562e-07, + "loss": 0.6241, + "step": 24873 + }, + { + "epoch": 0.86, + "learning_rate": 9.280964183621288e-07, + "loss": 0.606, + "step": 24874 + }, + { + "epoch": 0.86, + "learning_rate": 9.276383645192966e-07, + "loss": 0.613, + "step": 24875 + }, + { + "epoch": 0.86, + "learning_rate": 9.271804182407839e-07, + "loss": 0.6152, + "step": 24876 + }, + { + "epoch": 0.86, + "learning_rate": 9.267225795320279e-07, + "loss": 0.6245, + "step": 24877 + }, + { + "epoch": 0.86, + "learning_rate": 9.262648483984537e-07, + "loss": 0.5919, + "step": 24878 + }, + { + "epoch": 0.86, + "learning_rate": 9.258072248454875e-07, + "loss": 0.649, + "step": 24879 + }, + { + "epoch": 0.86, + "learning_rate": 9.253497088785546e-07, + "loss": 0.6416, + "step": 24880 + }, + { + "epoch": 0.86, + "learning_rate": 9.248923005030818e-07, + "loss": 0.6618, + "step": 24881 + }, + { + "epoch": 0.86, + "learning_rate": 9.244349997244884e-07, + "loss": 0.5935, + "step": 24882 + }, + { + "epoch": 0.86, + "learning_rate": 9.239778065481996e-07, + "loss": 0.6683, + "step": 24883 + }, + { + "epoch": 0.86, + "learning_rate": 9.235207209796382e-07, + "loss": 0.5927, + "step": 24884 + }, + { + "epoch": 0.86, + "learning_rate": 9.230637430242173e-07, + "loss": 0.6856, + "step": 24885 + }, + { + "epoch": 0.86, + "learning_rate": 9.226068726873594e-07, + "loss": 0.6318, + "step": 24886 + }, + { + "epoch": 0.86, + "learning_rate": 9.221501099744801e-07, + "loss": 0.6119, + "step": 24887 + }, + { + "epoch": 0.86, + "learning_rate": 9.216934548909929e-07, + "loss": 0.6372, + "step": 24888 + }, + { + "epoch": 0.86, + "learning_rate": 9.212369074423144e-07, + "loss": 0.6559, + "step": 24889 + }, + { + "epoch": 0.86, + "learning_rate": 9.207804676338594e-07, + "loss": 0.6547, + "step": 24890 + }, + { + "epoch": 0.86, + "learning_rate": 9.203241354710358e-07, + "loss": 0.6487, + "step": 24891 + }, + { + "epoch": 0.86, + "learning_rate": 9.198679109592546e-07, + "loss": 0.6435, + "step": 24892 + }, + { + "epoch": 0.86, + "learning_rate": 9.194117941039282e-07, + "loss": 0.5671, + "step": 24893 + }, + { + "epoch": 0.86, + "learning_rate": 9.189557849104581e-07, + "loss": 0.6577, + "step": 24894 + }, + { + "epoch": 0.86, + "learning_rate": 9.184998833842573e-07, + "loss": 0.626, + "step": 24895 + }, + { + "epoch": 0.86, + "learning_rate": 9.180440895307297e-07, + "loss": 0.6486, + "step": 24896 + }, + { + "epoch": 0.86, + "learning_rate": 9.175884033552762e-07, + "loss": 0.5795, + "step": 24897 + }, + { + "epoch": 0.86, + "learning_rate": 9.171328248633016e-07, + "loss": 0.6355, + "step": 24898 + }, + { + "epoch": 0.86, + "learning_rate": 9.166773540602092e-07, + "loss": 0.6748, + "step": 24899 + }, + { + "epoch": 0.86, + "learning_rate": 9.162219909513925e-07, + "loss": 0.6142, + "step": 24900 + }, + { + "epoch": 0.86, + "learning_rate": 9.157667355422583e-07, + "loss": 0.6656, + "step": 24901 + }, + { + "epoch": 0.86, + "learning_rate": 9.153115878382024e-07, + "loss": 0.6306, + "step": 24902 + }, + { + "epoch": 0.86, + "learning_rate": 9.148565478446181e-07, + "loss": 0.619, + "step": 24903 + }, + { + "epoch": 0.86, + "learning_rate": 9.144016155669022e-07, + "loss": 0.6145, + "step": 24904 + }, + { + "epoch": 0.86, + "learning_rate": 9.139467910104504e-07, + "loss": 0.62, + "step": 24905 + }, + { + "epoch": 0.86, + "learning_rate": 9.134920741806496e-07, + "loss": 0.643, + "step": 24906 + }, + { + "epoch": 0.86, + "learning_rate": 9.130374650828966e-07, + "loss": 0.6093, + "step": 24907 + }, + { + "epoch": 0.86, + "learning_rate": 9.125829637225813e-07, + "loss": 0.6492, + "step": 24908 + }, + { + "epoch": 0.86, + "learning_rate": 9.121285701050886e-07, + "loss": 0.581, + "step": 24909 + }, + { + "epoch": 0.86, + "learning_rate": 9.116742842358083e-07, + "loss": 0.627, + "step": 24910 + }, + { + "epoch": 0.86, + "learning_rate": 9.112201061201275e-07, + "loss": 0.6625, + "step": 24911 + }, + { + "epoch": 0.86, + "learning_rate": 9.107660357634263e-07, + "loss": 0.6339, + "step": 24912 + }, + { + "epoch": 0.86, + "learning_rate": 9.103120731710935e-07, + "loss": 0.6172, + "step": 24913 + }, + { + "epoch": 0.86, + "learning_rate": 9.098582183485116e-07, + "loss": 0.6596, + "step": 24914 + }, + { + "epoch": 0.86, + "learning_rate": 9.094044713010585e-07, + "loss": 0.5722, + "step": 24915 + }, + { + "epoch": 0.86, + "learning_rate": 9.089508320341156e-07, + "loss": 0.5972, + "step": 24916 + }, + { + "epoch": 0.86, + "learning_rate": 9.084973005530595e-07, + "loss": 0.6518, + "step": 24917 + }, + { + "epoch": 0.86, + "learning_rate": 9.080438768632671e-07, + "loss": 0.6384, + "step": 24918 + }, + { + "epoch": 0.86, + "learning_rate": 9.075905609701185e-07, + "loss": 0.658, + "step": 24919 + }, + { + "epoch": 0.86, + "learning_rate": 9.071373528789851e-07, + "loss": 0.6392, + "step": 24920 + }, + { + "epoch": 0.86, + "learning_rate": 9.066842525952402e-07, + "loss": 0.6498, + "step": 24921 + }, + { + "epoch": 0.86, + "learning_rate": 9.062312601242595e-07, + "loss": 0.6379, + "step": 24922 + }, + { + "epoch": 0.86, + "learning_rate": 9.057783754714078e-07, + "loss": 0.6462, + "step": 24923 + }, + { + "epoch": 0.86, + "learning_rate": 9.053255986420562e-07, + "loss": 0.6505, + "step": 24924 + }, + { + "epoch": 0.86, + "learning_rate": 9.048729296415782e-07, + "loss": 0.621, + "step": 24925 + }, + { + "epoch": 0.86, + "learning_rate": 9.044203684753361e-07, + "loss": 0.6278, + "step": 24926 + }, + { + "epoch": 0.86, + "learning_rate": 9.039679151486957e-07, + "loss": 0.6161, + "step": 24927 + }, + { + "epoch": 0.86, + "learning_rate": 9.035155696670239e-07, + "loss": 0.6355, + "step": 24928 + }, + { + "epoch": 0.86, + "learning_rate": 9.030633320356796e-07, + "loss": 0.6624, + "step": 24929 + }, + { + "epoch": 0.86, + "learning_rate": 9.026112022600264e-07, + "loss": 0.5683, + "step": 24930 + }, + { + "epoch": 0.86, + "learning_rate": 9.0215918034543e-07, + "loss": 0.6385, + "step": 24931 + }, + { + "epoch": 0.86, + "learning_rate": 9.017072662972415e-07, + "loss": 0.6657, + "step": 24932 + }, + { + "epoch": 0.86, + "learning_rate": 9.012554601208245e-07, + "loss": 0.6846, + "step": 24933 + }, + { + "epoch": 0.86, + "learning_rate": 9.008037618215348e-07, + "loss": 0.6362, + "step": 24934 + }, + { + "epoch": 0.86, + "learning_rate": 9.003521714047258e-07, + "loss": 0.6102, + "step": 24935 + }, + { + "epoch": 0.86, + "learning_rate": 8.999006888757511e-07, + "loss": 0.637, + "step": 24936 + }, + { + "epoch": 0.86, + "learning_rate": 8.994493142399685e-07, + "loss": 0.6456, + "step": 24937 + }, + { + "epoch": 0.86, + "learning_rate": 8.989980475027249e-07, + "loss": 0.666, + "step": 24938 + }, + { + "epoch": 0.86, + "learning_rate": 8.985468886693727e-07, + "loss": 0.6331, + "step": 24939 + }, + { + "epoch": 0.86, + "learning_rate": 8.98095837745262e-07, + "loss": 0.6271, + "step": 24940 + }, + { + "epoch": 0.86, + "learning_rate": 8.976448947357375e-07, + "loss": 0.6294, + "step": 24941 + }, + { + "epoch": 0.86, + "learning_rate": 8.97194059646146e-07, + "loss": 0.6304, + "step": 24942 + }, + { + "epoch": 0.86, + "learning_rate": 8.967433324818365e-07, + "loss": 0.6623, + "step": 24943 + }, + { + "epoch": 0.86, + "learning_rate": 8.962927132481491e-07, + "loss": 0.611, + "step": 24944 + }, + { + "epoch": 0.86, + "learning_rate": 8.958422019504287e-07, + "loss": 0.6263, + "step": 24945 + }, + { + "epoch": 0.86, + "learning_rate": 8.953917985940164e-07, + "loss": 0.6769, + "step": 24946 + }, + { + "epoch": 0.86, + "learning_rate": 8.949415031842501e-07, + "loss": 0.6752, + "step": 24947 + }, + { + "epoch": 0.86, + "learning_rate": 8.944913157264689e-07, + "loss": 0.5851, + "step": 24948 + }, + { + "epoch": 0.86, + "learning_rate": 8.940412362260154e-07, + "loss": 0.6686, + "step": 24949 + }, + { + "epoch": 0.86, + "learning_rate": 8.935912646882194e-07, + "loss": 0.6401, + "step": 24950 + }, + { + "epoch": 0.86, + "learning_rate": 8.931414011184191e-07, + "loss": 0.6909, + "step": 24951 + }, + { + "epoch": 0.86, + "learning_rate": 8.926916455219503e-07, + "loss": 0.6821, + "step": 24952 + }, + { + "epoch": 0.86, + "learning_rate": 8.922419979041407e-07, + "loss": 0.6601, + "step": 24953 + }, + { + "epoch": 0.86, + "learning_rate": 8.917924582703208e-07, + "loss": 0.5935, + "step": 24954 + }, + { + "epoch": 0.86, + "learning_rate": 8.913430266258282e-07, + "loss": 0.6604, + "step": 24955 + }, + { + "epoch": 0.86, + "learning_rate": 8.908937029759835e-07, + "loss": 0.6088, + "step": 24956 + }, + { + "epoch": 0.86, + "learning_rate": 8.904444873261175e-07, + "loss": 0.616, + "step": 24957 + }, + { + "epoch": 0.86, + "learning_rate": 8.899953796815586e-07, + "loss": 0.6563, + "step": 24958 + }, + { + "epoch": 0.86, + "learning_rate": 8.895463800476256e-07, + "loss": 0.6766, + "step": 24959 + }, + { + "epoch": 0.86, + "learning_rate": 8.890974884296433e-07, + "loss": 0.6338, + "step": 24960 + }, + { + "epoch": 0.86, + "learning_rate": 8.886487048329395e-07, + "loss": 0.609, + "step": 24961 + }, + { + "epoch": 0.86, + "learning_rate": 8.882000292628301e-07, + "loss": 0.648, + "step": 24962 + }, + { + "epoch": 0.86, + "learning_rate": 8.877514617246352e-07, + "loss": 0.656, + "step": 24963 + }, + { + "epoch": 0.86, + "learning_rate": 8.873030022236751e-07, + "loss": 0.6718, + "step": 24964 + }, + { + "epoch": 0.86, + "learning_rate": 8.868546507652643e-07, + "loss": 0.6469, + "step": 24965 + }, + { + "epoch": 0.87, + "learning_rate": 8.864064073547197e-07, + "loss": 0.6463, + "step": 24966 + }, + { + "epoch": 0.87, + "learning_rate": 8.859582719973559e-07, + "loss": 0.6759, + "step": 24967 + }, + { + "epoch": 0.87, + "learning_rate": 8.855102446984865e-07, + "loss": 0.6238, + "step": 24968 + }, + { + "epoch": 0.87, + "learning_rate": 8.850623254634228e-07, + "loss": 0.6112, + "step": 24969 + }, + { + "epoch": 0.87, + "learning_rate": 8.846145142974771e-07, + "loss": 0.6518, + "step": 24970 + }, + { + "epoch": 0.87, + "learning_rate": 8.841668112059565e-07, + "loss": 0.6046, + "step": 24971 + }, + { + "epoch": 0.87, + "learning_rate": 8.837192161941688e-07, + "loss": 0.6574, + "step": 24972 + }, + { + "epoch": 0.87, + "learning_rate": 8.83271729267422e-07, + "loss": 0.6662, + "step": 24973 + }, + { + "epoch": 0.87, + "learning_rate": 8.828243504310219e-07, + "loss": 0.6637, + "step": 24974 + }, + { + "epoch": 0.87, + "learning_rate": 8.823770796902731e-07, + "loss": 0.6704, + "step": 24975 + }, + { + "epoch": 0.87, + "learning_rate": 8.819299170504791e-07, + "loss": 0.5545, + "step": 24976 + }, + { + "epoch": 0.87, + "learning_rate": 8.81482862516938e-07, + "loss": 0.6091, + "step": 24977 + }, + { + "epoch": 0.87, + "learning_rate": 8.810359160949533e-07, + "loss": 0.6455, + "step": 24978 + }, + { + "epoch": 0.87, + "learning_rate": 8.805890777898229e-07, + "loss": 0.5674, + "step": 24979 + }, + { + "epoch": 0.87, + "learning_rate": 8.80142347606846e-07, + "loss": 0.5538, + "step": 24980 + }, + { + "epoch": 0.87, + "learning_rate": 8.796957255513194e-07, + "loss": 0.6661, + "step": 24981 + }, + { + "epoch": 0.87, + "learning_rate": 8.792492116285345e-07, + "loss": 0.6252, + "step": 24982 + }, + { + "epoch": 0.87, + "learning_rate": 8.788028058437892e-07, + "loss": 0.633, + "step": 24983 + }, + { + "epoch": 0.87, + "learning_rate": 8.783565082023748e-07, + "loss": 0.5778, + "step": 24984 + }, + { + "epoch": 0.87, + "learning_rate": 8.779103187095827e-07, + "loss": 0.632, + "step": 24985 + }, + { + "epoch": 0.87, + "learning_rate": 8.774642373707032e-07, + "loss": 0.6629, + "step": 24986 + }, + { + "epoch": 0.87, + "learning_rate": 8.770182641910274e-07, + "loss": 0.5808, + "step": 24987 + }, + { + "epoch": 0.87, + "learning_rate": 8.76572399175839e-07, + "loss": 0.6566, + "step": 24988 + }, + { + "epoch": 0.87, + "learning_rate": 8.76126642330426e-07, + "loss": 0.6869, + "step": 24989 + }, + { + "epoch": 0.87, + "learning_rate": 8.75680993660073e-07, + "loss": 0.6672, + "step": 24990 + }, + { + "epoch": 0.87, + "learning_rate": 8.752354531700646e-07, + "loss": 0.5979, + "step": 24991 + }, + { + "epoch": 0.87, + "learning_rate": 8.747900208656824e-07, + "loss": 0.6236, + "step": 24992 + }, + { + "epoch": 0.87, + "learning_rate": 8.743446967522096e-07, + "loss": 0.6779, + "step": 24993 + }, + { + "epoch": 0.87, + "learning_rate": 8.738994808349233e-07, + "loss": 0.6514, + "step": 24994 + }, + { + "epoch": 0.87, + "learning_rate": 8.734543731191025e-07, + "loss": 0.6153, + "step": 24995 + }, + { + "epoch": 0.87, + "learning_rate": 8.730093736100254e-07, + "loss": 0.6583, + "step": 24996 + }, + { + "epoch": 0.87, + "learning_rate": 8.725644823129686e-07, + "loss": 0.6381, + "step": 24997 + }, + { + "epoch": 0.87, + "learning_rate": 8.721196992332049e-07, + "loss": 0.6132, + "step": 24998 + }, + { + "epoch": 0.87, + "learning_rate": 8.716750243760119e-07, + "loss": 0.5923, + "step": 24999 + }, + { + "epoch": 0.87, + "learning_rate": 8.712304577466569e-07, + "loss": 0.5515, + "step": 25000 + }, + { + "epoch": 0.87, + "learning_rate": 8.707859993504119e-07, + "loss": 0.6451, + "step": 25001 + }, + { + "epoch": 0.87, + "learning_rate": 8.703416491925487e-07, + "loss": 0.6219, + "step": 25002 + }, + { + "epoch": 0.87, + "learning_rate": 8.698974072783328e-07, + "loss": 0.5886, + "step": 25003 + }, + { + "epoch": 0.87, + "learning_rate": 8.694532736130346e-07, + "loss": 0.6472, + "step": 25004 + }, + { + "epoch": 0.87, + "learning_rate": 8.690092482019185e-07, + "loss": 0.6062, + "step": 25005 + }, + { + "epoch": 0.87, + "learning_rate": 8.685653310502473e-07, + "loss": 0.629, + "step": 25006 + }, + { + "epoch": 0.87, + "learning_rate": 8.681215221632855e-07, + "loss": 0.607, + "step": 25007 + }, + { + "epoch": 0.87, + "learning_rate": 8.676778215462944e-07, + "loss": 0.5592, + "step": 25008 + }, + { + "epoch": 0.87, + "learning_rate": 8.672342292045355e-07, + "loss": 0.5845, + "step": 25009 + }, + { + "epoch": 0.87, + "learning_rate": 8.667907451432678e-07, + "loss": 0.6381, + "step": 25010 + }, + { + "epoch": 0.87, + "learning_rate": 8.663473693677504e-07, + "loss": 0.6267, + "step": 25011 + }, + { + "epoch": 0.87, + "learning_rate": 8.659041018832382e-07, + "loss": 0.5758, + "step": 25012 + }, + { + "epoch": 0.87, + "learning_rate": 8.654609426949878e-07, + "loss": 0.5656, + "step": 25013 + }, + { + "epoch": 0.87, + "learning_rate": 8.65017891808253e-07, + "loss": 0.6451, + "step": 25014 + }, + { + "epoch": 0.87, + "learning_rate": 8.645749492282862e-07, + "loss": 0.6114, + "step": 25015 + }, + { + "epoch": 0.87, + "learning_rate": 8.641321149603398e-07, + "loss": 0.6722, + "step": 25016 + }, + { + "epoch": 0.87, + "learning_rate": 8.636893890096665e-07, + "loss": 0.5704, + "step": 25017 + }, + { + "epoch": 0.87, + "learning_rate": 8.632467713815107e-07, + "loss": 0.6619, + "step": 25018 + }, + { + "epoch": 0.87, + "learning_rate": 8.628042620811228e-07, + "loss": 0.6538, + "step": 25019 + }, + { + "epoch": 0.87, + "learning_rate": 8.623618611137497e-07, + "loss": 0.6012, + "step": 25020 + }, + { + "epoch": 0.87, + "learning_rate": 8.619195684846349e-07, + "loss": 0.5902, + "step": 25021 + }, + { + "epoch": 0.87, + "learning_rate": 8.614773841990231e-07, + "loss": 0.6305, + "step": 25022 + }, + { + "epoch": 0.87, + "learning_rate": 8.610353082621603e-07, + "loss": 0.6401, + "step": 25023 + }, + { + "epoch": 0.87, + "learning_rate": 8.605933406792821e-07, + "loss": 0.6158, + "step": 25024 + }, + { + "epoch": 0.87, + "learning_rate": 8.601514814556311e-07, + "loss": 0.6135, + "step": 25025 + }, + { + "epoch": 0.87, + "learning_rate": 8.597097305964463e-07, + "loss": 0.6397, + "step": 25026 + }, + { + "epoch": 0.87, + "learning_rate": 8.592680881069659e-07, + "loss": 0.6637, + "step": 25027 + }, + { + "epoch": 0.87, + "learning_rate": 8.588265539924246e-07, + "loss": 0.6453, + "step": 25028 + }, + { + "epoch": 0.87, + "learning_rate": 8.583851282580602e-07, + "loss": 0.6535, + "step": 25029 + }, + { + "epoch": 0.87, + "learning_rate": 8.579438109091032e-07, + "loss": 0.6189, + "step": 25030 + }, + { + "epoch": 0.87, + "learning_rate": 8.57502601950786e-07, + "loss": 0.6237, + "step": 25031 + }, + { + "epoch": 0.87, + "learning_rate": 8.57061501388341e-07, + "loss": 0.6141, + "step": 25032 + }, + { + "epoch": 0.87, + "learning_rate": 8.566205092269985e-07, + "loss": 0.6429, + "step": 25033 + }, + { + "epoch": 0.87, + "learning_rate": 8.561796254719857e-07, + "loss": 0.6893, + "step": 25034 + }, + { + "epoch": 0.87, + "learning_rate": 8.557388501285324e-07, + "loss": 0.6605, + "step": 25035 + }, + { + "epoch": 0.87, + "learning_rate": 8.552981832018603e-07, + "loss": 0.7093, + "step": 25036 + }, + { + "epoch": 0.87, + "learning_rate": 8.548576246971963e-07, + "loss": 0.6666, + "step": 25037 + }, + { + "epoch": 0.87, + "learning_rate": 8.54417174619765e-07, + "loss": 0.6197, + "step": 25038 + }, + { + "epoch": 0.87, + "learning_rate": 8.539768329747866e-07, + "loss": 0.5966, + "step": 25039 + }, + { + "epoch": 0.87, + "learning_rate": 8.535365997674838e-07, + "loss": 0.619, + "step": 25040 + }, + { + "epoch": 0.87, + "learning_rate": 8.530964750030734e-07, + "loss": 0.6568, + "step": 25041 + }, + { + "epoch": 0.87, + "learning_rate": 8.526564586867758e-07, + "loss": 0.6589, + "step": 25042 + }, + { + "epoch": 0.87, + "learning_rate": 8.522165508238078e-07, + "loss": 0.6382, + "step": 25043 + }, + { + "epoch": 0.87, + "learning_rate": 8.51776751419383e-07, + "loss": 0.5796, + "step": 25044 + }, + { + "epoch": 0.87, + "learning_rate": 8.513370604787185e-07, + "loss": 0.6832, + "step": 25045 + }, + { + "epoch": 0.87, + "learning_rate": 8.508974780070279e-07, + "loss": 0.6729, + "step": 25046 + }, + { + "epoch": 0.87, + "learning_rate": 8.504580040095189e-07, + "loss": 0.6405, + "step": 25047 + }, + { + "epoch": 0.87, + "learning_rate": 8.500186384914055e-07, + "loss": 0.7035, + "step": 25048 + }, + { + "epoch": 0.87, + "learning_rate": 8.495793814578957e-07, + "loss": 0.6242, + "step": 25049 + }, + { + "epoch": 0.87, + "learning_rate": 8.491402329141974e-07, + "loss": 0.6884, + "step": 25050 + }, + { + "epoch": 0.87, + "learning_rate": 8.487011928655175e-07, + "loss": 0.6446, + "step": 25051 + }, + { + "epoch": 0.87, + "learning_rate": 8.482622613170633e-07, + "loss": 0.6178, + "step": 25052 + }, + { + "epoch": 0.87, + "learning_rate": 8.478234382740358e-07, + "loss": 0.5501, + "step": 25053 + }, + { + "epoch": 0.87, + "learning_rate": 8.473847237416377e-07, + "loss": 0.6608, + "step": 25054 + }, + { + "epoch": 0.87, + "learning_rate": 8.469461177250726e-07, + "loss": 0.6319, + "step": 25055 + }, + { + "epoch": 0.87, + "learning_rate": 8.465076202295397e-07, + "loss": 0.6414, + "step": 25056 + }, + { + "epoch": 0.87, + "learning_rate": 8.460692312602392e-07, + "loss": 0.607, + "step": 25057 + }, + { + "epoch": 0.87, + "learning_rate": 8.456309508223681e-07, + "loss": 0.6304, + "step": 25058 + }, + { + "epoch": 0.87, + "learning_rate": 8.451927789211212e-07, + "loss": 0.6205, + "step": 25059 + }, + { + "epoch": 0.87, + "learning_rate": 8.447547155616953e-07, + "loss": 0.6247, + "step": 25060 + }, + { + "epoch": 0.87, + "learning_rate": 8.44316760749283e-07, + "loss": 0.5837, + "step": 25061 + }, + { + "epoch": 0.87, + "learning_rate": 8.43878914489078e-07, + "loss": 0.6429, + "step": 25062 + }, + { + "epoch": 0.87, + "learning_rate": 8.434411767862704e-07, + "loss": 0.5877, + "step": 25063 + }, + { + "epoch": 0.87, + "learning_rate": 8.43003547646053e-07, + "loss": 0.6482, + "step": 25064 + }, + { + "epoch": 0.87, + "learning_rate": 8.425660270736102e-07, + "loss": 0.5694, + "step": 25065 + }, + { + "epoch": 0.87, + "learning_rate": 8.421286150741315e-07, + "loss": 0.5995, + "step": 25066 + }, + { + "epoch": 0.87, + "learning_rate": 8.416913116528025e-07, + "loss": 0.6286, + "step": 25067 + }, + { + "epoch": 0.87, + "learning_rate": 8.412541168148092e-07, + "loss": 0.6224, + "step": 25068 + }, + { + "epoch": 0.87, + "learning_rate": 8.408170305653329e-07, + "loss": 0.6168, + "step": 25069 + }, + { + "epoch": 0.87, + "learning_rate": 8.403800529095596e-07, + "loss": 0.6521, + "step": 25070 + }, + { + "epoch": 0.87, + "learning_rate": 8.399431838526662e-07, + "loss": 0.6353, + "step": 25071 + }, + { + "epoch": 0.87, + "learning_rate": 8.39506423399834e-07, + "loss": 0.5859, + "step": 25072 + }, + { + "epoch": 0.87, + "learning_rate": 8.390697715562412e-07, + "loss": 0.6193, + "step": 25073 + }, + { + "epoch": 0.87, + "learning_rate": 8.386332283270649e-07, + "loss": 0.6533, + "step": 25074 + }, + { + "epoch": 0.87, + "learning_rate": 8.381967937174796e-07, + "loss": 0.605, + "step": 25075 + }, + { + "epoch": 0.87, + "learning_rate": 8.377604677326646e-07, + "loss": 0.6159, + "step": 25076 + }, + { + "epoch": 0.87, + "learning_rate": 8.373242503777867e-07, + "loss": 0.5921, + "step": 25077 + }, + { + "epoch": 0.87, + "learning_rate": 8.36888141658021e-07, + "loss": 0.6104, + "step": 25078 + }, + { + "epoch": 0.87, + "learning_rate": 8.364521415785376e-07, + "loss": 0.6436, + "step": 25079 + }, + { + "epoch": 0.87, + "learning_rate": 8.360162501445068e-07, + "loss": 0.6892, + "step": 25080 + }, + { + "epoch": 0.87, + "learning_rate": 8.355804673610946e-07, + "loss": 0.6223, + "step": 25081 + }, + { + "epoch": 0.87, + "learning_rate": 8.351447932334711e-07, + "loss": 0.6489, + "step": 25082 + }, + { + "epoch": 0.87, + "learning_rate": 8.34709227766799e-07, + "loss": 0.5965, + "step": 25083 + }, + { + "epoch": 0.87, + "learning_rate": 8.342737709662419e-07, + "loss": 0.6367, + "step": 25084 + }, + { + "epoch": 0.87, + "learning_rate": 8.338384228369645e-07, + "loss": 0.6298, + "step": 25085 + }, + { + "epoch": 0.87, + "learning_rate": 8.334031833841272e-07, + "loss": 0.5768, + "step": 25086 + }, + { + "epoch": 0.87, + "learning_rate": 8.329680526128924e-07, + "loss": 0.6514, + "step": 25087 + }, + { + "epoch": 0.87, + "learning_rate": 8.325330305284185e-07, + "loss": 0.6857, + "step": 25088 + }, + { + "epoch": 0.87, + "learning_rate": 8.3209811713586e-07, + "loss": 0.6577, + "step": 25089 + }, + { + "epoch": 0.87, + "learning_rate": 8.316633124403772e-07, + "loss": 0.6127, + "step": 25090 + }, + { + "epoch": 0.87, + "learning_rate": 8.312286164471229e-07, + "loss": 0.601, + "step": 25091 + }, + { + "epoch": 0.87, + "learning_rate": 8.307940291612526e-07, + "loss": 0.638, + "step": 25092 + }, + { + "epoch": 0.87, + "learning_rate": 8.303595505879169e-07, + "loss": 0.6285, + "step": 25093 + }, + { + "epoch": 0.87, + "learning_rate": 8.299251807322717e-07, + "loss": 0.5812, + "step": 25094 + }, + { + "epoch": 0.87, + "learning_rate": 8.294909195994605e-07, + "loss": 0.6381, + "step": 25095 + }, + { + "epoch": 0.87, + "learning_rate": 8.290567671946359e-07, + "loss": 0.6628, + "step": 25096 + }, + { + "epoch": 0.87, + "learning_rate": 8.28622723522945e-07, + "loss": 0.6111, + "step": 25097 + }, + { + "epoch": 0.87, + "learning_rate": 8.281887885895334e-07, + "loss": 0.648, + "step": 25098 + }, + { + "epoch": 0.87, + "learning_rate": 8.277549623995462e-07, + "loss": 0.6887, + "step": 25099 + }, + { + "epoch": 0.87, + "learning_rate": 8.273212449581281e-07, + "loss": 0.5723, + "step": 25100 + }, + { + "epoch": 0.87, + "learning_rate": 8.268876362704192e-07, + "loss": 0.639, + "step": 25101 + }, + { + "epoch": 0.87, + "learning_rate": 8.264541363415623e-07, + "loss": 0.6027, + "step": 25102 + }, + { + "epoch": 0.87, + "learning_rate": 8.260207451766933e-07, + "loss": 0.6149, + "step": 25103 + }, + { + "epoch": 0.87, + "learning_rate": 8.255874627809546e-07, + "loss": 0.6611, + "step": 25104 + }, + { + "epoch": 0.87, + "learning_rate": 8.251542891594844e-07, + "loss": 0.6033, + "step": 25105 + }, + { + "epoch": 0.87, + "learning_rate": 8.247212243174141e-07, + "loss": 0.5807, + "step": 25106 + }, + { + "epoch": 0.87, + "learning_rate": 8.242882682598819e-07, + "loss": 0.6043, + "step": 25107 + }, + { + "epoch": 0.87, + "learning_rate": 8.238554209920202e-07, + "loss": 0.6343, + "step": 25108 + }, + { + "epoch": 0.87, + "learning_rate": 8.234226825189562e-07, + "loss": 0.6343, + "step": 25109 + }, + { + "epoch": 0.87, + "learning_rate": 8.229900528458278e-07, + "loss": 0.6375, + "step": 25110 + }, + { + "epoch": 0.87, + "learning_rate": 8.225575319777623e-07, + "loss": 0.6125, + "step": 25111 + }, + { + "epoch": 0.87, + "learning_rate": 8.221251199198854e-07, + "loss": 0.5819, + "step": 25112 + }, + { + "epoch": 0.87, + "learning_rate": 8.216928166773252e-07, + "loss": 0.6463, + "step": 25113 + }, + { + "epoch": 0.87, + "learning_rate": 8.212606222552089e-07, + "loss": 0.6699, + "step": 25114 + }, + { + "epoch": 0.87, + "learning_rate": 8.208285366586565e-07, + "loss": 0.6629, + "step": 25115 + }, + { + "epoch": 0.87, + "learning_rate": 8.203965598927944e-07, + "loss": 0.6577, + "step": 25116 + }, + { + "epoch": 0.87, + "learning_rate": 8.199646919627447e-07, + "loss": 0.6059, + "step": 25117 + }, + { + "epoch": 0.87, + "learning_rate": 8.195329328736256e-07, + "loss": 0.6655, + "step": 25118 + }, + { + "epoch": 0.87, + "learning_rate": 8.191012826305556e-07, + "loss": 0.6755, + "step": 25119 + }, + { + "epoch": 0.87, + "learning_rate": 8.186697412386569e-07, + "loss": 0.6269, + "step": 25120 + }, + { + "epoch": 0.87, + "learning_rate": 8.182383087030387e-07, + "loss": 0.6176, + "step": 25121 + }, + { + "epoch": 0.87, + "learning_rate": 8.178069850288217e-07, + "loss": 0.6211, + "step": 25122 + }, + { + "epoch": 0.87, + "learning_rate": 8.173757702211215e-07, + "loss": 0.6472, + "step": 25123 + }, + { + "epoch": 0.87, + "learning_rate": 8.169446642850454e-07, + "loss": 0.6214, + "step": 25124 + }, + { + "epoch": 0.87, + "learning_rate": 8.165136672257057e-07, + "loss": 0.5915, + "step": 25125 + }, + { + "epoch": 0.87, + "learning_rate": 8.160827790482162e-07, + "loss": 0.649, + "step": 25126 + }, + { + "epoch": 0.87, + "learning_rate": 8.156519997576806e-07, + "loss": 0.6471, + "step": 25127 + }, + { + "epoch": 0.87, + "learning_rate": 8.152213293592093e-07, + "loss": 0.6641, + "step": 25128 + }, + { + "epoch": 0.87, + "learning_rate": 8.147907678579103e-07, + "loss": 0.6264, + "step": 25129 + }, + { + "epoch": 0.87, + "learning_rate": 8.143603152588841e-07, + "loss": 0.6599, + "step": 25130 + }, + { + "epoch": 0.87, + "learning_rate": 8.139299715672356e-07, + "loss": 0.6275, + "step": 25131 + }, + { + "epoch": 0.87, + "learning_rate": 8.134997367880704e-07, + "loss": 0.6257, + "step": 25132 + }, + { + "epoch": 0.87, + "learning_rate": 8.130696109264824e-07, + "loss": 0.6194, + "step": 25133 + }, + { + "epoch": 0.87, + "learning_rate": 8.126395939875786e-07, + "loss": 0.581, + "step": 25134 + }, + { + "epoch": 0.87, + "learning_rate": 8.12209685976455e-07, + "loss": 0.6307, + "step": 25135 + }, + { + "epoch": 0.87, + "learning_rate": 8.117798868982074e-07, + "loss": 0.6455, + "step": 25136 + }, + { + "epoch": 0.87, + "learning_rate": 8.11350196757933e-07, + "loss": 0.6057, + "step": 25137 + }, + { + "epoch": 0.87, + "learning_rate": 8.109206155607264e-07, + "loss": 0.6437, + "step": 25138 + }, + { + "epoch": 0.87, + "learning_rate": 8.104911433116769e-07, + "loss": 0.6504, + "step": 25139 + }, + { + "epoch": 0.87, + "learning_rate": 8.100617800158805e-07, + "loss": 0.6328, + "step": 25140 + }, + { + "epoch": 0.87, + "learning_rate": 8.096325256784299e-07, + "loss": 0.6191, + "step": 25141 + }, + { + "epoch": 0.87, + "learning_rate": 8.092033803044097e-07, + "loss": 0.6558, + "step": 25142 + }, + { + "epoch": 0.87, + "learning_rate": 8.087743438989093e-07, + "loss": 0.625, + "step": 25143 + }, + { + "epoch": 0.87, + "learning_rate": 8.08345416467019e-07, + "loss": 0.6744, + "step": 25144 + }, + { + "epoch": 0.87, + "learning_rate": 8.07916598013817e-07, + "loss": 0.6331, + "step": 25145 + }, + { + "epoch": 0.87, + "learning_rate": 8.074878885443926e-07, + "loss": 0.5944, + "step": 25146 + }, + { + "epoch": 0.87, + "learning_rate": 8.070592880638306e-07, + "loss": 0.6305, + "step": 25147 + }, + { + "epoch": 0.87, + "learning_rate": 8.06630796577208e-07, + "loss": 0.6192, + "step": 25148 + }, + { + "epoch": 0.87, + "learning_rate": 8.062024140896074e-07, + "loss": 0.6607, + "step": 25149 + }, + { + "epoch": 0.87, + "learning_rate": 8.057741406061092e-07, + "loss": 0.6934, + "step": 25150 + }, + { + "epoch": 0.87, + "learning_rate": 8.05345976131785e-07, + "loss": 0.5944, + "step": 25151 + }, + { + "epoch": 0.87, + "learning_rate": 8.049179206717173e-07, + "loss": 0.6061, + "step": 25152 + }, + { + "epoch": 0.87, + "learning_rate": 8.04489974230982e-07, + "loss": 0.5696, + "step": 25153 + }, + { + "epoch": 0.87, + "learning_rate": 8.040621368146484e-07, + "loss": 0.6676, + "step": 25154 + }, + { + "epoch": 0.87, + "learning_rate": 8.036344084277913e-07, + "loss": 0.5923, + "step": 25155 + }, + { + "epoch": 0.87, + "learning_rate": 8.032067890754824e-07, + "loss": 0.6105, + "step": 25156 + }, + { + "epoch": 0.87, + "learning_rate": 8.027792787627886e-07, + "loss": 0.5836, + "step": 25157 + }, + { + "epoch": 0.87, + "learning_rate": 8.023518774947825e-07, + "loss": 0.6127, + "step": 25158 + }, + { + "epoch": 0.87, + "learning_rate": 8.019245852765323e-07, + "loss": 0.6118, + "step": 25159 + }, + { + "epoch": 0.87, + "learning_rate": 8.014974021130994e-07, + "loss": 0.6202, + "step": 25160 + }, + { + "epoch": 0.87, + "learning_rate": 8.010703280095511e-07, + "loss": 0.6098, + "step": 25161 + }, + { + "epoch": 0.87, + "learning_rate": 8.00643362970952e-07, + "loss": 0.6309, + "step": 25162 + }, + { + "epoch": 0.87, + "learning_rate": 8.002165070023616e-07, + "loss": 0.6879, + "step": 25163 + }, + { + "epoch": 0.87, + "learning_rate": 7.997897601088422e-07, + "loss": 0.5789, + "step": 25164 + }, + { + "epoch": 0.87, + "learning_rate": 7.993631222954545e-07, + "loss": 0.6417, + "step": 25165 + }, + { + "epoch": 0.87, + "learning_rate": 7.989365935672544e-07, + "loss": 0.6435, + "step": 25166 + }, + { + "epoch": 0.87, + "learning_rate": 7.985101739293033e-07, + "loss": 0.6607, + "step": 25167 + }, + { + "epoch": 0.87, + "learning_rate": 7.980838633866516e-07, + "loss": 0.6613, + "step": 25168 + }, + { + "epoch": 0.87, + "learning_rate": 7.976576619443566e-07, + "loss": 0.6407, + "step": 25169 + }, + { + "epoch": 0.87, + "learning_rate": 7.972315696074706e-07, + "loss": 0.6247, + "step": 25170 + }, + { + "epoch": 0.87, + "learning_rate": 7.968055863810464e-07, + "loss": 0.6345, + "step": 25171 + }, + { + "epoch": 0.87, + "learning_rate": 7.963797122701333e-07, + "loss": 0.6539, + "step": 25172 + }, + { + "epoch": 0.87, + "learning_rate": 7.959539472797839e-07, + "loss": 0.6481, + "step": 25173 + }, + { + "epoch": 0.87, + "learning_rate": 7.95528291415042e-07, + "loss": 0.6351, + "step": 25174 + }, + { + "epoch": 0.87, + "learning_rate": 7.951027446809556e-07, + "loss": 0.6697, + "step": 25175 + }, + { + "epoch": 0.87, + "learning_rate": 7.946773070825698e-07, + "loss": 0.6293, + "step": 25176 + }, + { + "epoch": 0.87, + "learning_rate": 7.942519786249304e-07, + "loss": 0.6168, + "step": 25177 + }, + { + "epoch": 0.87, + "learning_rate": 7.938267593130778e-07, + "loss": 0.5963, + "step": 25178 + }, + { + "epoch": 0.87, + "learning_rate": 7.934016491520579e-07, + "loss": 0.6633, + "step": 25179 + }, + { + "epoch": 0.87, + "learning_rate": 7.929766481469059e-07, + "loss": 0.7079, + "step": 25180 + }, + { + "epoch": 0.87, + "learning_rate": 7.925517563026619e-07, + "loss": 0.6099, + "step": 25181 + }, + { + "epoch": 0.87, + "learning_rate": 7.921269736243642e-07, + "loss": 0.6792, + "step": 25182 + }, + { + "epoch": 0.87, + "learning_rate": 7.917023001170498e-07, + "loss": 0.5728, + "step": 25183 + }, + { + "epoch": 0.87, + "learning_rate": 7.912777357857537e-07, + "loss": 0.6483, + "step": 25184 + }, + { + "epoch": 0.87, + "learning_rate": 7.908532806355107e-07, + "loss": 0.6523, + "step": 25185 + }, + { + "epoch": 0.87, + "learning_rate": 7.904289346713489e-07, + "loss": 0.6449, + "step": 25186 + }, + { + "epoch": 0.87, + "learning_rate": 7.900046978983034e-07, + "loss": 0.6838, + "step": 25187 + }, + { + "epoch": 0.87, + "learning_rate": 7.895805703214022e-07, + "loss": 0.6281, + "step": 25188 + }, + { + "epoch": 0.87, + "learning_rate": 7.891565519456757e-07, + "loss": 0.6858, + "step": 25189 + }, + { + "epoch": 0.87, + "learning_rate": 7.887326427761488e-07, + "loss": 0.6153, + "step": 25190 + }, + { + "epoch": 0.87, + "learning_rate": 7.883088428178509e-07, + "loss": 0.6537, + "step": 25191 + }, + { + "epoch": 0.87, + "learning_rate": 7.878851520758024e-07, + "loss": 0.6767, + "step": 25192 + }, + { + "epoch": 0.87, + "learning_rate": 7.874615705550293e-07, + "loss": 0.5937, + "step": 25193 + }, + { + "epoch": 0.87, + "learning_rate": 7.87038098260553e-07, + "loss": 0.6836, + "step": 25194 + }, + { + "epoch": 0.87, + "learning_rate": 7.866147351973952e-07, + "loss": 0.5687, + "step": 25195 + }, + { + "epoch": 0.87, + "learning_rate": 7.86191481370574e-07, + "loss": 0.6158, + "step": 25196 + }, + { + "epoch": 0.87, + "learning_rate": 7.857683367851098e-07, + "loss": 0.6281, + "step": 25197 + }, + { + "epoch": 0.87, + "learning_rate": 7.853453014460167e-07, + "loss": 0.6258, + "step": 25198 + }, + { + "epoch": 0.87, + "learning_rate": 7.849223753583113e-07, + "loss": 0.62, + "step": 25199 + }, + { + "epoch": 0.87, + "learning_rate": 7.844995585270088e-07, + "loss": 0.6267, + "step": 25200 + }, + { + "epoch": 0.87, + "learning_rate": 7.840768509571217e-07, + "loss": 0.6152, + "step": 25201 + }, + { + "epoch": 0.87, + "learning_rate": 7.836542526536616e-07, + "loss": 0.6474, + "step": 25202 + }, + { + "epoch": 0.87, + "learning_rate": 7.832317636216402e-07, + "loss": 0.6597, + "step": 25203 + }, + { + "epoch": 0.87, + "learning_rate": 7.828093838660644e-07, + "loss": 0.6673, + "step": 25204 + }, + { + "epoch": 0.87, + "learning_rate": 7.823871133919436e-07, + "loss": 0.6923, + "step": 25205 + }, + { + "epoch": 0.87, + "learning_rate": 7.819649522042838e-07, + "loss": 0.666, + "step": 25206 + }, + { + "epoch": 0.87, + "learning_rate": 7.815429003080898e-07, + "loss": 0.6004, + "step": 25207 + }, + { + "epoch": 0.87, + "learning_rate": 7.811209577083656e-07, + "loss": 0.5576, + "step": 25208 + }, + { + "epoch": 0.87, + "learning_rate": 7.806991244101169e-07, + "loss": 0.6444, + "step": 25209 + }, + { + "epoch": 0.87, + "learning_rate": 7.802774004183411e-07, + "loss": 0.5508, + "step": 25210 + }, + { + "epoch": 0.87, + "learning_rate": 7.798557857380396e-07, + "loss": 0.6161, + "step": 25211 + }, + { + "epoch": 0.87, + "learning_rate": 7.794342803742105e-07, + "loss": 0.6578, + "step": 25212 + }, + { + "epoch": 0.87, + "learning_rate": 7.790128843318523e-07, + "loss": 0.6675, + "step": 25213 + }, + { + "epoch": 0.87, + "learning_rate": 7.785915976159619e-07, + "loss": 0.6069, + "step": 25214 + }, + { + "epoch": 0.87, + "learning_rate": 7.781704202315343e-07, + "loss": 0.6435, + "step": 25215 + }, + { + "epoch": 0.87, + "learning_rate": 7.777493521835599e-07, + "loss": 0.6043, + "step": 25216 + }, + { + "epoch": 0.87, + "learning_rate": 7.773283934770337e-07, + "loss": 0.6411, + "step": 25217 + }, + { + "epoch": 0.87, + "learning_rate": 7.76907544116946e-07, + "loss": 0.6698, + "step": 25218 + }, + { + "epoch": 0.87, + "learning_rate": 7.764868041082873e-07, + "loss": 0.6098, + "step": 25219 + }, + { + "epoch": 0.87, + "learning_rate": 7.760661734560448e-07, + "loss": 0.6202, + "step": 25220 + }, + { + "epoch": 0.87, + "learning_rate": 7.756456521652078e-07, + "loss": 0.6261, + "step": 25221 + }, + { + "epoch": 0.87, + "learning_rate": 7.752252402407589e-07, + "loss": 0.6168, + "step": 25222 + }, + { + "epoch": 0.87, + "learning_rate": 7.748049376876832e-07, + "loss": 0.625, + "step": 25223 + }, + { + "epoch": 0.87, + "learning_rate": 7.743847445109665e-07, + "loss": 0.6034, + "step": 25224 + }, + { + "epoch": 0.87, + "learning_rate": 7.739646607155882e-07, + "loss": 0.6537, + "step": 25225 + }, + { + "epoch": 0.87, + "learning_rate": 7.73544686306531e-07, + "loss": 0.6655, + "step": 25226 + }, + { + "epoch": 0.87, + "learning_rate": 7.731248212887721e-07, + "loss": 0.6324, + "step": 25227 + }, + { + "epoch": 0.87, + "learning_rate": 7.727050656672907e-07, + "loss": 0.6346, + "step": 25228 + }, + { + "epoch": 0.87, + "learning_rate": 7.722854194470631e-07, + "loss": 0.6243, + "step": 25229 + }, + { + "epoch": 0.87, + "learning_rate": 7.71865882633065e-07, + "loss": 0.6397, + "step": 25230 + }, + { + "epoch": 0.87, + "learning_rate": 7.714464552302702e-07, + "loss": 0.6153, + "step": 25231 + }, + { + "epoch": 0.87, + "learning_rate": 7.71027137243654e-07, + "loss": 0.6178, + "step": 25232 + }, + { + "epoch": 0.87, + "learning_rate": 7.706079286781843e-07, + "loss": 0.6097, + "step": 25233 + }, + { + "epoch": 0.87, + "learning_rate": 7.701888295388327e-07, + "loss": 0.6208, + "step": 25234 + }, + { + "epoch": 0.87, + "learning_rate": 7.697698398305676e-07, + "loss": 0.6297, + "step": 25235 + }, + { + "epoch": 0.87, + "learning_rate": 7.693509595583582e-07, + "loss": 0.6134, + "step": 25236 + }, + { + "epoch": 0.87, + "learning_rate": 7.689321887271695e-07, + "loss": 0.6103, + "step": 25237 + }, + { + "epoch": 0.87, + "learning_rate": 7.685135273419686e-07, + "loss": 0.5886, + "step": 25238 + }, + { + "epoch": 0.87, + "learning_rate": 7.68094975407716e-07, + "loss": 0.6477, + "step": 25239 + }, + { + "epoch": 0.87, + "learning_rate": 7.676765329293767e-07, + "loss": 0.5875, + "step": 25240 + }, + { + "epoch": 0.87, + "learning_rate": 7.67258199911911e-07, + "loss": 0.6517, + "step": 25241 + }, + { + "epoch": 0.87, + "learning_rate": 7.668399763602786e-07, + "loss": 0.6786, + "step": 25242 + }, + { + "epoch": 0.87, + "learning_rate": 7.664218622794373e-07, + "loss": 0.6363, + "step": 25243 + }, + { + "epoch": 0.87, + "learning_rate": 7.660038576743478e-07, + "loss": 0.6558, + "step": 25244 + }, + { + "epoch": 0.87, + "learning_rate": 7.655859625499618e-07, + "loss": 0.6178, + "step": 25245 + }, + { + "epoch": 0.87, + "learning_rate": 7.651681769112362e-07, + "loss": 0.6464, + "step": 25246 + }, + { + "epoch": 0.87, + "learning_rate": 7.647505007631239e-07, + "loss": 0.6369, + "step": 25247 + }, + { + "epoch": 0.87, + "learning_rate": 7.643329341105765e-07, + "loss": 0.6511, + "step": 25248 + }, + { + "epoch": 0.87, + "learning_rate": 7.639154769585467e-07, + "loss": 0.6505, + "step": 25249 + }, + { + "epoch": 0.87, + "learning_rate": 7.634981293119825e-07, + "loss": 0.6679, + "step": 25250 + }, + { + "epoch": 0.87, + "learning_rate": 7.630808911758314e-07, + "loss": 0.5803, + "step": 25251 + }, + { + "epoch": 0.87, + "learning_rate": 7.626637625550415e-07, + "loss": 0.6194, + "step": 25252 + }, + { + "epoch": 0.87, + "learning_rate": 7.622467434545577e-07, + "loss": 0.6578, + "step": 25253 + }, + { + "epoch": 0.87, + "learning_rate": 7.618298338793239e-07, + "loss": 0.6176, + "step": 25254 + }, + { + "epoch": 0.88, + "learning_rate": 7.614130338342851e-07, + "loss": 0.6479, + "step": 25255 + }, + { + "epoch": 0.88, + "learning_rate": 7.609963433243828e-07, + "loss": 0.6065, + "step": 25256 + }, + { + "epoch": 0.88, + "learning_rate": 7.605797623545542e-07, + "loss": 0.6396, + "step": 25257 + }, + { + "epoch": 0.88, + "learning_rate": 7.601632909297407e-07, + "loss": 0.6185, + "step": 25258 + }, + { + "epoch": 0.88, + "learning_rate": 7.597469290548798e-07, + "loss": 0.6201, + "step": 25259 + }, + { + "epoch": 0.88, + "learning_rate": 7.593306767349074e-07, + "loss": 0.6409, + "step": 25260 + }, + { + "epoch": 0.88, + "learning_rate": 7.589145339747606e-07, + "loss": 0.6447, + "step": 25261 + }, + { + "epoch": 0.88, + "learning_rate": 7.584985007793721e-07, + "loss": 0.6925, + "step": 25262 + }, + { + "epoch": 0.88, + "learning_rate": 7.580825771536737e-07, + "loss": 0.6702, + "step": 25263 + }, + { + "epoch": 0.88, + "learning_rate": 7.57666763102598e-07, + "loss": 0.6366, + "step": 25264 + }, + { + "epoch": 0.88, + "learning_rate": 7.572510586310733e-07, + "loss": 0.6176, + "step": 25265 + }, + { + "epoch": 0.88, + "learning_rate": 7.5683546374403e-07, + "loss": 0.5864, + "step": 25266 + }, + { + "epoch": 0.88, + "learning_rate": 7.564199784463955e-07, + "loss": 0.6644, + "step": 25267 + }, + { + "epoch": 0.88, + "learning_rate": 7.560046027430957e-07, + "loss": 0.5989, + "step": 25268 + }, + { + "epoch": 0.88, + "learning_rate": 7.555893366390544e-07, + "loss": 0.6826, + "step": 25269 + }, + { + "epoch": 0.88, + "learning_rate": 7.551741801391954e-07, + "loss": 0.5797, + "step": 25270 + }, + { + "epoch": 0.88, + "learning_rate": 7.547591332484416e-07, + "loss": 0.6075, + "step": 25271 + }, + { + "epoch": 0.88, + "learning_rate": 7.543441959717135e-07, + "loss": 0.6056, + "step": 25272 + }, + { + "epoch": 0.88, + "learning_rate": 7.539293683139303e-07, + "loss": 0.6551, + "step": 25273 + }, + { + "epoch": 0.88, + "learning_rate": 7.535146502800128e-07, + "loss": 0.6214, + "step": 25274 + }, + { + "epoch": 0.88, + "learning_rate": 7.531000418748746e-07, + "loss": 0.6454, + "step": 25275 + }, + { + "epoch": 0.88, + "learning_rate": 7.526855431034319e-07, + "loss": 0.586, + "step": 25276 + }, + { + "epoch": 0.88, + "learning_rate": 7.522711539706007e-07, + "loss": 0.6408, + "step": 25277 + }, + { + "epoch": 0.88, + "learning_rate": 7.518568744812926e-07, + "loss": 0.7003, + "step": 25278 + }, + { + "epoch": 0.88, + "learning_rate": 7.514427046404215e-07, + "loss": 0.665, + "step": 25279 + }, + { + "epoch": 0.88, + "learning_rate": 7.510286444528981e-07, + "loss": 0.5687, + "step": 25280 + }, + { + "epoch": 0.88, + "learning_rate": 7.50614693923627e-07, + "loss": 0.6593, + "step": 25281 + }, + { + "epoch": 0.88, + "learning_rate": 7.502008530575211e-07, + "loss": 0.6218, + "step": 25282 + }, + { + "epoch": 0.88, + "learning_rate": 7.497871218594843e-07, + "loss": 0.6276, + "step": 25283 + }, + { + "epoch": 0.88, + "learning_rate": 7.493735003344227e-07, + "loss": 0.6337, + "step": 25284 + }, + { + "epoch": 0.88, + "learning_rate": 7.489599884872401e-07, + "loss": 0.6311, + "step": 25285 + }, + { + "epoch": 0.88, + "learning_rate": 7.485465863228413e-07, + "loss": 0.5871, + "step": 25286 + }, + { + "epoch": 0.88, + "learning_rate": 7.481332938461239e-07, + "loss": 0.6304, + "step": 25287 + }, + { + "epoch": 0.88, + "learning_rate": 7.477201110619903e-07, + "loss": 0.6163, + "step": 25288 + }, + { + "epoch": 0.88, + "learning_rate": 7.4730703797534e-07, + "loss": 0.6905, + "step": 25289 + }, + { + "epoch": 0.88, + "learning_rate": 7.46894074591068e-07, + "loss": 0.6095, + "step": 25290 + }, + { + "epoch": 0.88, + "learning_rate": 7.464812209140748e-07, + "loss": 0.5589, + "step": 25291 + }, + { + "epoch": 0.88, + "learning_rate": 7.460684769492499e-07, + "loss": 0.6495, + "step": 25292 + }, + { + "epoch": 0.88, + "learning_rate": 7.456558427014893e-07, + "loss": 0.6564, + "step": 25293 + }, + { + "epoch": 0.88, + "learning_rate": 7.452433181756868e-07, + "loss": 0.5753, + "step": 25294 + }, + { + "epoch": 0.88, + "learning_rate": 7.44830903376731e-07, + "loss": 0.6532, + "step": 25295 + }, + { + "epoch": 0.88, + "learning_rate": 7.444185983095131e-07, + "loss": 0.6639, + "step": 25296 + }, + { + "epoch": 0.88, + "learning_rate": 7.440064029789229e-07, + "loss": 0.6038, + "step": 25297 + }, + { + "epoch": 0.88, + "learning_rate": 7.43594317389843e-07, + "loss": 0.6368, + "step": 25298 + }, + { + "epoch": 0.88, + "learning_rate": 7.431823415471629e-07, + "loss": 0.6058, + "step": 25299 + }, + { + "epoch": 0.88, + "learning_rate": 7.427704754557664e-07, + "loss": 0.5832, + "step": 25300 + }, + { + "epoch": 0.88, + "learning_rate": 7.423587191205351e-07, + "loss": 0.6794, + "step": 25301 + }, + { + "epoch": 0.88, + "learning_rate": 7.419470725463529e-07, + "loss": 0.587, + "step": 25302 + }, + { + "epoch": 0.88, + "learning_rate": 7.415355357381015e-07, + "loss": 0.6108, + "step": 25303 + }, + { + "epoch": 0.88, + "learning_rate": 7.41124108700656e-07, + "loss": 0.6335, + "step": 25304 + }, + { + "epoch": 0.88, + "learning_rate": 7.407127914388978e-07, + "loss": 0.669, + "step": 25305 + }, + { + "epoch": 0.88, + "learning_rate": 7.40301583957701e-07, + "loss": 0.6228, + "step": 25306 + }, + { + "epoch": 0.88, + "learning_rate": 7.398904862619438e-07, + "loss": 0.6263, + "step": 25307 + }, + { + "epoch": 0.88, + "learning_rate": 7.39479498356499e-07, + "loss": 0.6384, + "step": 25308 + }, + { + "epoch": 0.88, + "learning_rate": 7.390686202462405e-07, + "loss": 0.6965, + "step": 25309 + }, + { + "epoch": 0.88, + "learning_rate": 7.386578519360365e-07, + "loss": 0.6049, + "step": 25310 + }, + { + "epoch": 0.88, + "learning_rate": 7.3824719343076e-07, + "loss": 0.6332, + "step": 25311 + }, + { + "epoch": 0.88, + "learning_rate": 7.378366447352791e-07, + "loss": 0.6093, + "step": 25312 + }, + { + "epoch": 0.88, + "learning_rate": 7.374262058544624e-07, + "loss": 0.6289, + "step": 25313 + }, + { + "epoch": 0.88, + "learning_rate": 7.370158767931734e-07, + "loss": 0.5854, + "step": 25314 + }, + { + "epoch": 0.88, + "learning_rate": 7.366056575562818e-07, + "loss": 0.6186, + "step": 25315 + }, + { + "epoch": 0.88, + "learning_rate": 7.36195548148646e-07, + "loss": 0.6248, + "step": 25316 + }, + { + "epoch": 0.88, + "learning_rate": 7.35785548575132e-07, + "loss": 0.6425, + "step": 25317 + }, + { + "epoch": 0.88, + "learning_rate": 7.35375658840598e-07, + "loss": 0.6006, + "step": 25318 + }, + { + "epoch": 0.88, + "learning_rate": 7.349658789499071e-07, + "loss": 0.6572, + "step": 25319 + }, + { + "epoch": 0.88, + "learning_rate": 7.34556208907915e-07, + "loss": 0.6185, + "step": 25320 + }, + { + "epoch": 0.88, + "learning_rate": 7.341466487194814e-07, + "loss": 0.6708, + "step": 25321 + }, + { + "epoch": 0.88, + "learning_rate": 7.337371983894592e-07, + "loss": 0.6205, + "step": 25322 + }, + { + "epoch": 0.88, + "learning_rate": 7.333278579227043e-07, + "loss": 0.6085, + "step": 25323 + }, + { + "epoch": 0.88, + "learning_rate": 7.329186273240707e-07, + "loss": 0.6054, + "step": 25324 + }, + { + "epoch": 0.88, + "learning_rate": 7.325095065984089e-07, + "loss": 0.6508, + "step": 25325 + }, + { + "epoch": 0.88, + "learning_rate": 7.321004957505707e-07, + "loss": 0.65, + "step": 25326 + }, + { + "epoch": 0.88, + "learning_rate": 7.316915947854065e-07, + "loss": 0.5879, + "step": 25327 + }, + { + "epoch": 0.88, + "learning_rate": 7.312828037077613e-07, + "loss": 0.654, + "step": 25328 + }, + { + "epoch": 0.88, + "learning_rate": 7.308741225224836e-07, + "loss": 0.6919, + "step": 25329 + }, + { + "epoch": 0.88, + "learning_rate": 7.304655512344183e-07, + "loss": 0.6122, + "step": 25330 + }, + { + "epoch": 0.88, + "learning_rate": 7.300570898484105e-07, + "loss": 0.6359, + "step": 25331 + }, + { + "epoch": 0.88, + "learning_rate": 7.296487383693019e-07, + "loss": 0.6624, + "step": 25332 + }, + { + "epoch": 0.88, + "learning_rate": 7.292404968019373e-07, + "loss": 0.6562, + "step": 25333 + }, + { + "epoch": 0.88, + "learning_rate": 7.288323651511508e-07, + "loss": 0.6117, + "step": 25334 + }, + { + "epoch": 0.88, + "learning_rate": 7.284243434217864e-07, + "loss": 0.6415, + "step": 25335 + }, + { + "epoch": 0.88, + "learning_rate": 7.280164316186788e-07, + "loss": 0.6217, + "step": 25336 + }, + { + "epoch": 0.88, + "learning_rate": 7.276086297466667e-07, + "loss": 0.6462, + "step": 25337 + }, + { + "epoch": 0.88, + "learning_rate": 7.272009378105827e-07, + "loss": 0.6697, + "step": 25338 + }, + { + "epoch": 0.88, + "learning_rate": 7.26793355815264e-07, + "loss": 0.62, + "step": 25339 + }, + { + "epoch": 0.88, + "learning_rate": 7.263858837655391e-07, + "loss": 0.6, + "step": 25340 + }, + { + "epoch": 0.88, + "learning_rate": 7.259785216662407e-07, + "loss": 0.5916, + "step": 25341 + }, + { + "epoch": 0.88, + "learning_rate": 7.255712695221984e-07, + "loss": 0.6026, + "step": 25342 + }, + { + "epoch": 0.88, + "learning_rate": 7.251641273382403e-07, + "loss": 0.6168, + "step": 25343 + }, + { + "epoch": 0.88, + "learning_rate": 7.247570951191951e-07, + "loss": 0.6255, + "step": 25344 + }, + { + "epoch": 0.88, + "learning_rate": 7.243501728698898e-07, + "loss": 0.6344, + "step": 25345 + }, + { + "epoch": 0.88, + "learning_rate": 7.239433605951452e-07, + "loss": 0.6092, + "step": 25346 + }, + { + "epoch": 0.88, + "learning_rate": 7.235366582997849e-07, + "loss": 0.6411, + "step": 25347 + }, + { + "epoch": 0.88, + "learning_rate": 7.231300659886342e-07, + "loss": 0.6395, + "step": 25348 + }, + { + "epoch": 0.88, + "learning_rate": 7.227235836665103e-07, + "loss": 0.6543, + "step": 25349 + }, + { + "epoch": 0.88, + "learning_rate": 7.223172113382371e-07, + "loss": 0.6039, + "step": 25350 + }, + { + "epoch": 0.88, + "learning_rate": 7.219109490086274e-07, + "loss": 0.6118, + "step": 25351 + }, + { + "epoch": 0.88, + "learning_rate": 7.215047966824995e-07, + "loss": 0.6329, + "step": 25352 + }, + { + "epoch": 0.88, + "learning_rate": 7.210987543646719e-07, + "loss": 0.6406, + "step": 25353 + }, + { + "epoch": 0.88, + "learning_rate": 7.206928220599552e-07, + "loss": 0.6692, + "step": 25354 + }, + { + "epoch": 0.88, + "learning_rate": 7.202869997731621e-07, + "loss": 0.6125, + "step": 25355 + }, + { + "epoch": 0.88, + "learning_rate": 7.198812875091076e-07, + "loss": 0.6458, + "step": 25356 + }, + { + "epoch": 0.88, + "learning_rate": 7.194756852725993e-07, + "loss": 0.5764, + "step": 25357 + }, + { + "epoch": 0.88, + "learning_rate": 7.190701930684463e-07, + "loss": 0.6592, + "step": 25358 + }, + { + "epoch": 0.88, + "learning_rate": 7.186648109014571e-07, + "loss": 0.6523, + "step": 25359 + }, + { + "epoch": 0.88, + "learning_rate": 7.18259538776438e-07, + "loss": 0.6091, + "step": 25360 + }, + { + "epoch": 0.88, + "learning_rate": 7.178543766981904e-07, + "loss": 0.6077, + "step": 25361 + }, + { + "epoch": 0.88, + "learning_rate": 7.174493246715242e-07, + "loss": 0.6243, + "step": 25362 + }, + { + "epoch": 0.88, + "learning_rate": 7.170443827012386e-07, + "loss": 0.6727, + "step": 25363 + }, + { + "epoch": 0.88, + "learning_rate": 7.166395507921331e-07, + "loss": 0.6038, + "step": 25364 + }, + { + "epoch": 0.88, + "learning_rate": 7.162348289490117e-07, + "loss": 0.6368, + "step": 25365 + }, + { + "epoch": 0.88, + "learning_rate": 7.158302171766696e-07, + "loss": 0.6606, + "step": 25366 + }, + { + "epoch": 0.88, + "learning_rate": 7.154257154799016e-07, + "loss": 0.5698, + "step": 25367 + }, + { + "epoch": 0.88, + "learning_rate": 7.150213238635117e-07, + "loss": 0.6292, + "step": 25368 + }, + { + "epoch": 0.88, + "learning_rate": 7.146170423322873e-07, + "loss": 0.6535, + "step": 25369 + }, + { + "epoch": 0.88, + "learning_rate": 7.142128708910235e-07, + "loss": 0.6701, + "step": 25370 + }, + { + "epoch": 0.88, + "learning_rate": 7.138088095445139e-07, + "loss": 0.6426, + "step": 25371 + }, + { + "epoch": 0.88, + "learning_rate": 7.134048582975473e-07, + "loss": 0.6177, + "step": 25372 + }, + { + "epoch": 0.88, + "learning_rate": 7.130010171549118e-07, + "loss": 0.6341, + "step": 25373 + }, + { + "epoch": 0.88, + "learning_rate": 7.125972861214003e-07, + "loss": 0.6274, + "step": 25374 + }, + { + "epoch": 0.88, + "learning_rate": 7.121936652017958e-07, + "loss": 0.6221, + "step": 25375 + }, + { + "epoch": 0.88, + "learning_rate": 7.117901544008843e-07, + "loss": 0.6285, + "step": 25376 + }, + { + "epoch": 0.88, + "learning_rate": 7.113867537234509e-07, + "loss": 0.6404, + "step": 25377 + }, + { + "epoch": 0.88, + "learning_rate": 7.109834631742763e-07, + "loss": 0.6486, + "step": 25378 + }, + { + "epoch": 0.88, + "learning_rate": 7.105802827581421e-07, + "loss": 0.6785, + "step": 25379 + }, + { + "epoch": 0.88, + "learning_rate": 7.101772124798334e-07, + "loss": 0.6438, + "step": 25380 + }, + { + "epoch": 0.88, + "learning_rate": 7.097742523441242e-07, + "loss": 0.6868, + "step": 25381 + }, + { + "epoch": 0.88, + "learning_rate": 7.093714023557918e-07, + "loss": 0.6337, + "step": 25382 + }, + { + "epoch": 0.88, + "learning_rate": 7.089686625196169e-07, + "loss": 0.6283, + "step": 25383 + }, + { + "epoch": 0.88, + "learning_rate": 7.085660328403709e-07, + "loss": 0.6459, + "step": 25384 + }, + { + "epoch": 0.88, + "learning_rate": 7.081635133228248e-07, + "loss": 0.6438, + "step": 25385 + }, + { + "epoch": 0.88, + "learning_rate": 7.077611039717591e-07, + "loss": 0.5878, + "step": 25386 + }, + { + "epoch": 0.88, + "learning_rate": 7.073588047919388e-07, + "loss": 0.6468, + "step": 25387 + }, + { + "epoch": 0.88, + "learning_rate": 7.069566157881346e-07, + "loss": 0.6258, + "step": 25388 + }, + { + "epoch": 0.88, + "learning_rate": 7.065545369651161e-07, + "loss": 0.6656, + "step": 25389 + }, + { + "epoch": 0.88, + "learning_rate": 7.061525683276493e-07, + "loss": 0.5662, + "step": 25390 + }, + { + "epoch": 0.88, + "learning_rate": 7.057507098804994e-07, + "loss": 0.6464, + "step": 25391 + }, + { + "epoch": 0.88, + "learning_rate": 7.053489616284348e-07, + "loss": 0.5951, + "step": 25392 + }, + { + "epoch": 0.88, + "learning_rate": 7.049473235762139e-07, + "loss": 0.6562, + "step": 25393 + }, + { + "epoch": 0.88, + "learning_rate": 7.045457957286017e-07, + "loss": 0.633, + "step": 25394 + }, + { + "epoch": 0.88, + "learning_rate": 7.041443780903589e-07, + "loss": 0.6297, + "step": 25395 + }, + { + "epoch": 0.88, + "learning_rate": 7.03743070666243e-07, + "loss": 0.6434, + "step": 25396 + }, + { + "epoch": 0.88, + "learning_rate": 7.033418734610098e-07, + "loss": 0.6031, + "step": 25397 + }, + { + "epoch": 0.88, + "learning_rate": 7.029407864794235e-07, + "loss": 0.6155, + "step": 25398 + }, + { + "epoch": 0.88, + "learning_rate": 7.025398097262326e-07, + "loss": 0.6106, + "step": 25399 + }, + { + "epoch": 0.88, + "learning_rate": 7.021389432061942e-07, + "loss": 0.638, + "step": 25400 + }, + { + "epoch": 0.88, + "learning_rate": 7.017381869240625e-07, + "loss": 0.6377, + "step": 25401 + }, + { + "epoch": 0.88, + "learning_rate": 7.013375408845846e-07, + "loss": 0.6761, + "step": 25402 + }, + { + "epoch": 0.88, + "learning_rate": 7.009370050925113e-07, + "loss": 0.6484, + "step": 25403 + }, + { + "epoch": 0.88, + "learning_rate": 7.005365795525965e-07, + "loss": 0.6598, + "step": 25404 + }, + { + "epoch": 0.88, + "learning_rate": 7.001362642695831e-07, + "loss": 0.6475, + "step": 25405 + }, + { + "epoch": 0.88, + "learning_rate": 6.997360592482183e-07, + "loss": 0.6376, + "step": 25406 + }, + { + "epoch": 0.88, + "learning_rate": 6.993359644932496e-07, + "loss": 0.6503, + "step": 25407 + }, + { + "epoch": 0.88, + "learning_rate": 6.989359800094164e-07, + "loss": 0.611, + "step": 25408 + }, + { + "epoch": 0.88, + "learning_rate": 6.985361058014617e-07, + "loss": 0.6331, + "step": 25409 + }, + { + "epoch": 0.88, + "learning_rate": 6.981363418741316e-07, + "loss": 0.6645, + "step": 25410 + }, + { + "epoch": 0.88, + "learning_rate": 6.97736688232159e-07, + "loss": 0.6241, + "step": 25411 + }, + { + "epoch": 0.88, + "learning_rate": 6.973371448802879e-07, + "loss": 0.6673, + "step": 25412 + }, + { + "epoch": 0.88, + "learning_rate": 6.969377118232512e-07, + "loss": 0.6293, + "step": 25413 + }, + { + "epoch": 0.88, + "learning_rate": 6.965383890657862e-07, + "loss": 0.6476, + "step": 25414 + }, + { + "epoch": 0.88, + "learning_rate": 6.96139176612628e-07, + "loss": 0.6804, + "step": 25415 + }, + { + "epoch": 0.88, + "learning_rate": 6.957400744685094e-07, + "loss": 0.6382, + "step": 25416 + }, + { + "epoch": 0.88, + "learning_rate": 6.953410826381613e-07, + "loss": 0.6284, + "step": 25417 + }, + { + "epoch": 0.88, + "learning_rate": 6.949422011263174e-07, + "loss": 0.6353, + "step": 25418 + }, + { + "epoch": 0.88, + "learning_rate": 6.945434299377029e-07, + "loss": 0.6476, + "step": 25419 + }, + { + "epoch": 0.88, + "learning_rate": 6.941447690770475e-07, + "loss": 0.6453, + "step": 25420 + }, + { + "epoch": 0.88, + "learning_rate": 6.937462185490773e-07, + "loss": 0.5936, + "step": 25421 + }, + { + "epoch": 0.88, + "learning_rate": 6.933477783585185e-07, + "loss": 0.6392, + "step": 25422 + }, + { + "epoch": 0.88, + "learning_rate": 6.929494485100952e-07, + "loss": 0.6715, + "step": 25423 + }, + { + "epoch": 0.88, + "learning_rate": 6.925512290085313e-07, + "loss": 0.6459, + "step": 25424 + }, + { + "epoch": 0.88, + "learning_rate": 6.92153119858544e-07, + "loss": 0.6378, + "step": 25425 + }, + { + "epoch": 0.88, + "learning_rate": 6.917551210648577e-07, + "loss": 0.5975, + "step": 25426 + }, + { + "epoch": 0.88, + "learning_rate": 6.913572326321883e-07, + "loss": 0.5736, + "step": 25427 + }, + { + "epoch": 0.88, + "learning_rate": 6.909594545652542e-07, + "loss": 0.685, + "step": 25428 + }, + { + "epoch": 0.88, + "learning_rate": 6.905617868687719e-07, + "loss": 0.5336, + "step": 25429 + }, + { + "epoch": 0.88, + "learning_rate": 6.901642295474575e-07, + "loss": 0.6161, + "step": 25430 + }, + { + "epoch": 0.88, + "learning_rate": 6.897667826060217e-07, + "loss": 0.6303, + "step": 25431 + }, + { + "epoch": 0.88, + "learning_rate": 6.893694460491785e-07, + "loss": 0.6201, + "step": 25432 + }, + { + "epoch": 0.88, + "learning_rate": 6.889722198816384e-07, + "loss": 0.5966, + "step": 25433 + }, + { + "epoch": 0.88, + "learning_rate": 6.885751041081112e-07, + "loss": 0.6443, + "step": 25434 + }, + { + "epoch": 0.88, + "learning_rate": 6.881780987333053e-07, + "loss": 0.6133, + "step": 25435 + }, + { + "epoch": 0.88, + "learning_rate": 6.877812037619291e-07, + "loss": 0.6374, + "step": 25436 + }, + { + "epoch": 0.88, + "learning_rate": 6.873844191986845e-07, + "loss": 0.6635, + "step": 25437 + }, + { + "epoch": 0.88, + "learning_rate": 6.869877450482787e-07, + "loss": 0.6174, + "step": 25438 + }, + { + "epoch": 0.88, + "learning_rate": 6.865911813154146e-07, + "loss": 0.6038, + "step": 25439 + }, + { + "epoch": 0.88, + "learning_rate": 6.861947280047932e-07, + "loss": 0.5863, + "step": 25440 + }, + { + "epoch": 0.88, + "learning_rate": 6.857983851211147e-07, + "loss": 0.6292, + "step": 25441 + }, + { + "epoch": 0.88, + "learning_rate": 6.854021526690813e-07, + "loss": 0.6945, + "step": 25442 + }, + { + "epoch": 0.88, + "learning_rate": 6.850060306533868e-07, + "loss": 0.6125, + "step": 25443 + }, + { + "epoch": 0.88, + "learning_rate": 6.846100190787286e-07, + "loss": 0.6702, + "step": 25444 + }, + { + "epoch": 0.88, + "learning_rate": 6.842141179498029e-07, + "loss": 0.6351, + "step": 25445 + }, + { + "epoch": 0.88, + "learning_rate": 6.838183272713039e-07, + "loss": 0.6194, + "step": 25446 + }, + { + "epoch": 0.88, + "learning_rate": 6.834226470479233e-07, + "loss": 0.5707, + "step": 25447 + }, + { + "epoch": 0.88, + "learning_rate": 6.830270772843539e-07, + "loss": 0.577, + "step": 25448 + }, + { + "epoch": 0.88, + "learning_rate": 6.826316179852832e-07, + "loss": 0.6552, + "step": 25449 + }, + { + "epoch": 0.88, + "learning_rate": 6.822362691554018e-07, + "loss": 0.6449, + "step": 25450 + }, + { + "epoch": 0.88, + "learning_rate": 6.818410307993961e-07, + "loss": 0.6328, + "step": 25451 + }, + { + "epoch": 0.88, + "learning_rate": 6.814459029219522e-07, + "loss": 0.6422, + "step": 25452 + }, + { + "epoch": 0.88, + "learning_rate": 6.810508855277554e-07, + "loss": 0.593, + "step": 25453 + }, + { + "epoch": 0.88, + "learning_rate": 6.806559786214906e-07, + "loss": 0.6255, + "step": 25454 + }, + { + "epoch": 0.88, + "learning_rate": 6.802611822078365e-07, + "loss": 0.6442, + "step": 25455 + }, + { + "epoch": 0.88, + "learning_rate": 6.798664962914758e-07, + "loss": 0.6278, + "step": 25456 + }, + { + "epoch": 0.88, + "learning_rate": 6.794719208770873e-07, + "loss": 0.6156, + "step": 25457 + }, + { + "epoch": 0.88, + "learning_rate": 6.790774559693503e-07, + "loss": 0.6372, + "step": 25458 + }, + { + "epoch": 0.88, + "learning_rate": 6.786831015729412e-07, + "loss": 0.5904, + "step": 25459 + }, + { + "epoch": 0.88, + "learning_rate": 6.782888576925362e-07, + "loss": 0.6616, + "step": 25460 + }, + { + "epoch": 0.88, + "learning_rate": 6.778947243328083e-07, + "loss": 0.6802, + "step": 25461 + }, + { + "epoch": 0.88, + "learning_rate": 6.775007014984303e-07, + "loss": 0.6573, + "step": 25462 + }, + { + "epoch": 0.88, + "learning_rate": 6.771067891940741e-07, + "loss": 0.6932, + "step": 25463 + }, + { + "epoch": 0.88, + "learning_rate": 6.767129874244105e-07, + "loss": 0.6367, + "step": 25464 + }, + { + "epoch": 0.88, + "learning_rate": 6.763192961941089e-07, + "loss": 0.6109, + "step": 25465 + }, + { + "epoch": 0.88, + "learning_rate": 6.759257155078391e-07, + "loss": 0.6112, + "step": 25466 + }, + { + "epoch": 0.88, + "learning_rate": 6.755322453702617e-07, + "loss": 0.6235, + "step": 25467 + }, + { + "epoch": 0.88, + "learning_rate": 6.751388857860464e-07, + "loss": 0.6054, + "step": 25468 + }, + { + "epoch": 0.88, + "learning_rate": 6.747456367598549e-07, + "loss": 0.683, + "step": 25469 + }, + { + "epoch": 0.88, + "learning_rate": 6.7435249829635e-07, + "loss": 0.652, + "step": 25470 + }, + { + "epoch": 0.88, + "learning_rate": 6.739594704001939e-07, + "loss": 0.6328, + "step": 25471 + }, + { + "epoch": 0.88, + "learning_rate": 6.735665530760472e-07, + "loss": 0.6368, + "step": 25472 + }, + { + "epoch": 0.88, + "learning_rate": 6.731737463285648e-07, + "loss": 0.658, + "step": 25473 + }, + { + "epoch": 0.88, + "learning_rate": 6.727810501624066e-07, + "loss": 0.6112, + "step": 25474 + }, + { + "epoch": 0.88, + "learning_rate": 6.723884645822287e-07, + "loss": 0.6177, + "step": 25475 + }, + { + "epoch": 0.88, + "learning_rate": 6.719959895926842e-07, + "loss": 0.6016, + "step": 25476 + }, + { + "epoch": 0.88, + "learning_rate": 6.716036251984293e-07, + "loss": 0.6077, + "step": 25477 + }, + { + "epoch": 0.88, + "learning_rate": 6.712113714041124e-07, + "loss": 0.6403, + "step": 25478 + }, + { + "epoch": 0.88, + "learning_rate": 6.708192282143855e-07, + "loss": 0.5909, + "step": 25479 + }, + { + "epoch": 0.88, + "learning_rate": 6.704271956338981e-07, + "loss": 0.6898, + "step": 25480 + }, + { + "epoch": 0.88, + "learning_rate": 6.700352736672977e-07, + "loss": 0.6364, + "step": 25481 + }, + { + "epoch": 0.88, + "learning_rate": 6.696434623192328e-07, + "loss": 0.5972, + "step": 25482 + }, + { + "epoch": 0.88, + "learning_rate": 6.692517615943483e-07, + "loss": 0.7274, + "step": 25483 + }, + { + "epoch": 0.88, + "learning_rate": 6.688601714972853e-07, + "loss": 0.6349, + "step": 25484 + }, + { + "epoch": 0.88, + "learning_rate": 6.684686920326899e-07, + "loss": 0.6564, + "step": 25485 + }, + { + "epoch": 0.88, + "learning_rate": 6.68077323205203e-07, + "loss": 0.6546, + "step": 25486 + }, + { + "epoch": 0.88, + "learning_rate": 6.676860650194639e-07, + "loss": 0.6683, + "step": 25487 + }, + { + "epoch": 0.88, + "learning_rate": 6.672949174801124e-07, + "loss": 0.6095, + "step": 25488 + }, + { + "epoch": 0.88, + "learning_rate": 6.66903880591786e-07, + "loss": 0.7046, + "step": 25489 + }, + { + "epoch": 0.88, + "learning_rate": 6.665129543591198e-07, + "loss": 0.6077, + "step": 25490 + }, + { + "epoch": 0.88, + "learning_rate": 6.6612213878675e-07, + "loss": 0.6212, + "step": 25491 + }, + { + "epoch": 0.88, + "learning_rate": 6.657314338793086e-07, + "loss": 0.6436, + "step": 25492 + }, + { + "epoch": 0.88, + "learning_rate": 6.653408396414296e-07, + "loss": 0.6633, + "step": 25493 + }, + { + "epoch": 0.88, + "learning_rate": 6.649503560777426e-07, + "loss": 0.6053, + "step": 25494 + }, + { + "epoch": 0.88, + "learning_rate": 6.645599831928806e-07, + "loss": 0.6186, + "step": 25495 + }, + { + "epoch": 0.88, + "learning_rate": 6.641697209914666e-07, + "loss": 0.6357, + "step": 25496 + }, + { + "epoch": 0.88, + "learning_rate": 6.637795694781313e-07, + "loss": 0.6388, + "step": 25497 + }, + { + "epoch": 0.88, + "learning_rate": 6.633895286574998e-07, + "loss": 0.6143, + "step": 25498 + }, + { + "epoch": 0.88, + "learning_rate": 6.629995985341963e-07, + "loss": 0.6055, + "step": 25499 + }, + { + "epoch": 0.88, + "learning_rate": 6.626097791128427e-07, + "loss": 0.7086, + "step": 25500 + }, + { + "epoch": 0.88, + "learning_rate": 6.622200703980652e-07, + "loss": 0.5988, + "step": 25501 + }, + { + "epoch": 0.88, + "learning_rate": 6.618304723944791e-07, + "loss": 0.5994, + "step": 25502 + }, + { + "epoch": 0.88, + "learning_rate": 6.614409851067049e-07, + "loss": 0.6405, + "step": 25503 + }, + { + "epoch": 0.88, + "learning_rate": 6.610516085393615e-07, + "loss": 0.6429, + "step": 25504 + }, + { + "epoch": 0.88, + "learning_rate": 6.606623426970649e-07, + "loss": 0.6141, + "step": 25505 + }, + { + "epoch": 0.88, + "learning_rate": 6.602731875844314e-07, + "loss": 0.618, + "step": 25506 + }, + { + "epoch": 0.88, + "learning_rate": 6.598841432060754e-07, + "loss": 0.5665, + "step": 25507 + }, + { + "epoch": 0.88, + "learning_rate": 6.594952095666063e-07, + "loss": 0.6809, + "step": 25508 + }, + { + "epoch": 0.88, + "learning_rate": 6.591063866706371e-07, + "loss": 0.6431, + "step": 25509 + }, + { + "epoch": 0.88, + "learning_rate": 6.587176745227775e-07, + "loss": 0.6217, + "step": 25510 + }, + { + "epoch": 0.88, + "learning_rate": 6.583290731276381e-07, + "loss": 0.6589, + "step": 25511 + }, + { + "epoch": 0.88, + "learning_rate": 6.579405824898233e-07, + "loss": 0.5732, + "step": 25512 + }, + { + "epoch": 0.88, + "learning_rate": 6.575522026139436e-07, + "loss": 0.6722, + "step": 25513 + }, + { + "epoch": 0.88, + "learning_rate": 6.571639335045988e-07, + "loss": 0.6035, + "step": 25514 + }, + { + "epoch": 0.88, + "learning_rate": 6.567757751663939e-07, + "loss": 0.6306, + "step": 25515 + }, + { + "epoch": 0.88, + "learning_rate": 6.563877276039321e-07, + "loss": 0.6491, + "step": 25516 + }, + { + "epoch": 0.88, + "learning_rate": 6.55999790821813e-07, + "loss": 0.6308, + "step": 25517 + }, + { + "epoch": 0.88, + "learning_rate": 6.556119648246361e-07, + "loss": 0.6262, + "step": 25518 + }, + { + "epoch": 0.88, + "learning_rate": 6.552242496170025e-07, + "loss": 0.6523, + "step": 25519 + }, + { + "epoch": 0.88, + "learning_rate": 6.548366452035049e-07, + "loss": 0.6355, + "step": 25520 + }, + { + "epoch": 0.88, + "learning_rate": 6.544491515887397e-07, + "loss": 0.6362, + "step": 25521 + }, + { + "epoch": 0.88, + "learning_rate": 6.540617687773032e-07, + "loss": 0.6181, + "step": 25522 + }, + { + "epoch": 0.88, + "learning_rate": 6.536744967737862e-07, + "loss": 0.6326, + "step": 25523 + }, + { + "epoch": 0.88, + "learning_rate": 6.532873355827818e-07, + "loss": 0.6098, + "step": 25524 + }, + { + "epoch": 0.88, + "learning_rate": 6.529002852088817e-07, + "loss": 0.6403, + "step": 25525 + }, + { + "epoch": 0.88, + "learning_rate": 6.525133456566701e-07, + "loss": 0.5951, + "step": 25526 + }, + { + "epoch": 0.88, + "learning_rate": 6.521265169307378e-07, + "loss": 0.6179, + "step": 25527 + }, + { + "epoch": 0.88, + "learning_rate": 6.517397990356711e-07, + "loss": 0.6134, + "step": 25528 + }, + { + "epoch": 0.88, + "learning_rate": 6.513531919760552e-07, + "loss": 0.6513, + "step": 25529 + }, + { + "epoch": 0.88, + "learning_rate": 6.50966695756472e-07, + "loss": 0.6279, + "step": 25530 + }, + { + "epoch": 0.88, + "learning_rate": 6.505803103815078e-07, + "loss": 0.6543, + "step": 25531 + }, + { + "epoch": 0.88, + "learning_rate": 6.501940358557391e-07, + "loss": 0.6039, + "step": 25532 + }, + { + "epoch": 0.88, + "learning_rate": 6.498078721837476e-07, + "loss": 0.6489, + "step": 25533 + }, + { + "epoch": 0.88, + "learning_rate": 6.494218193701118e-07, + "loss": 0.6329, + "step": 25534 + }, + { + "epoch": 0.88, + "learning_rate": 6.490358774194094e-07, + "loss": 0.638, + "step": 25535 + }, + { + "epoch": 0.88, + "learning_rate": 6.486500463362167e-07, + "loss": 0.6725, + "step": 25536 + }, + { + "epoch": 0.88, + "learning_rate": 6.482643261251064e-07, + "loss": 0.5998, + "step": 25537 + }, + { + "epoch": 0.88, + "learning_rate": 6.47878716790652e-07, + "loss": 0.6821, + "step": 25538 + }, + { + "epoch": 0.88, + "learning_rate": 6.474932183374261e-07, + "loss": 0.6144, + "step": 25539 + }, + { + "epoch": 0.88, + "learning_rate": 6.471078307699985e-07, + "loss": 0.5891, + "step": 25540 + }, + { + "epoch": 0.88, + "learning_rate": 6.46722554092939e-07, + "loss": 0.6116, + "step": 25541 + }, + { + "epoch": 0.88, + "learning_rate": 6.463373883108182e-07, + "loss": 0.661, + "step": 25542 + }, + { + "epoch": 0.88, + "learning_rate": 6.459523334281981e-07, + "loss": 0.6156, + "step": 25543 + }, + { + "epoch": 0.89, + "learning_rate": 6.45567389449645e-07, + "loss": 0.626, + "step": 25544 + }, + { + "epoch": 0.89, + "learning_rate": 6.451825563797254e-07, + "loss": 0.6142, + "step": 25545 + }, + { + "epoch": 0.89, + "learning_rate": 6.447978342229999e-07, + "loss": 0.6231, + "step": 25546 + }, + { + "epoch": 0.89, + "learning_rate": 6.444132229840305e-07, + "loss": 0.6124, + "step": 25547 + }, + { + "epoch": 0.89, + "learning_rate": 6.44028722667378e-07, + "loss": 0.6476, + "step": 25548 + }, + { + "epoch": 0.89, + "learning_rate": 6.436443332775999e-07, + "loss": 0.6307, + "step": 25549 + }, + { + "epoch": 0.89, + "learning_rate": 6.432600548192535e-07, + "loss": 0.6217, + "step": 25550 + }, + { + "epoch": 0.89, + "learning_rate": 6.428758872968977e-07, + "loss": 0.5846, + "step": 25551 + }, + { + "epoch": 0.89, + "learning_rate": 6.424918307150807e-07, + "loss": 0.6698, + "step": 25552 + }, + { + "epoch": 0.89, + "learning_rate": 6.421078850783635e-07, + "loss": 0.6117, + "step": 25553 + }, + { + "epoch": 0.89, + "learning_rate": 6.417240503912958e-07, + "loss": 0.5705, + "step": 25554 + }, + { + "epoch": 0.89, + "learning_rate": 6.413403266584262e-07, + "loss": 0.5795, + "step": 25555 + }, + { + "epoch": 0.89, + "learning_rate": 6.409567138843053e-07, + "loss": 0.6509, + "step": 25556 + }, + { + "epoch": 0.89, + "learning_rate": 6.405732120734842e-07, + "loss": 0.6448, + "step": 25557 + }, + { + "epoch": 0.89, + "learning_rate": 6.401898212305036e-07, + "loss": 0.6788, + "step": 25558 + }, + { + "epoch": 0.89, + "learning_rate": 6.398065413599153e-07, + "loss": 0.6242, + "step": 25559 + }, + { + "epoch": 0.89, + "learning_rate": 6.394233724662624e-07, + "loss": 0.6168, + "step": 25560 + }, + { + "epoch": 0.89, + "learning_rate": 6.390403145540847e-07, + "loss": 0.6373, + "step": 25561 + }, + { + "epoch": 0.89, + "learning_rate": 6.386573676279262e-07, + "loss": 0.6205, + "step": 25562 + }, + { + "epoch": 0.89, + "learning_rate": 6.382745316923278e-07, + "loss": 0.5781, + "step": 25563 + }, + { + "epoch": 0.89, + "learning_rate": 6.378918067518247e-07, + "loss": 0.6388, + "step": 25564 + }, + { + "epoch": 0.89, + "learning_rate": 6.375091928109589e-07, + "loss": 0.6197, + "step": 25565 + }, + { + "epoch": 0.89, + "learning_rate": 6.371266898742667e-07, + "loss": 0.6916, + "step": 25566 + }, + { + "epoch": 0.89, + "learning_rate": 6.367442979462802e-07, + "loss": 0.6022, + "step": 25567 + }, + { + "epoch": 0.89, + "learning_rate": 6.363620170315355e-07, + "loss": 0.6557, + "step": 25568 + }, + { + "epoch": 0.89, + "learning_rate": 6.359798471345646e-07, + "loss": 0.6249, + "step": 25569 + }, + { + "epoch": 0.89, + "learning_rate": 6.355977882598951e-07, + "loss": 0.6427, + "step": 25570 + }, + { + "epoch": 0.89, + "learning_rate": 6.352158404120612e-07, + "loss": 0.6462, + "step": 25571 + }, + { + "epoch": 0.89, + "learning_rate": 6.348340035955924e-07, + "loss": 0.6797, + "step": 25572 + }, + { + "epoch": 0.89, + "learning_rate": 6.344522778150109e-07, + "loss": 0.6377, + "step": 25573 + }, + { + "epoch": 0.89, + "learning_rate": 6.340706630748461e-07, + "loss": 0.6811, + "step": 25574 + }, + { + "epoch": 0.89, + "learning_rate": 6.336891593796224e-07, + "loss": 0.6222, + "step": 25575 + }, + { + "epoch": 0.89, + "learning_rate": 6.333077667338594e-07, + "loss": 0.6685, + "step": 25576 + }, + { + "epoch": 0.89, + "learning_rate": 6.329264851420836e-07, + "loss": 0.7011, + "step": 25577 + }, + { + "epoch": 0.89, + "learning_rate": 6.325453146088145e-07, + "loss": 0.6288, + "step": 25578 + }, + { + "epoch": 0.89, + "learning_rate": 6.321642551385698e-07, + "loss": 0.6253, + "step": 25579 + }, + { + "epoch": 0.89, + "learning_rate": 6.317833067358681e-07, + "loss": 0.6067, + "step": 25580 + }, + { + "epoch": 0.89, + "learning_rate": 6.314024694052278e-07, + "loss": 0.5988, + "step": 25581 + }, + { + "epoch": 0.89, + "learning_rate": 6.310217431511589e-07, + "loss": 0.5846, + "step": 25582 + }, + { + "epoch": 0.89, + "learning_rate": 6.30641127978181e-07, + "loss": 0.6613, + "step": 25583 + }, + { + "epoch": 0.89, + "learning_rate": 6.30260623890806e-07, + "loss": 0.6265, + "step": 25584 + }, + { + "epoch": 0.89, + "learning_rate": 6.298802308935437e-07, + "loss": 0.576, + "step": 25585 + }, + { + "epoch": 0.89, + "learning_rate": 6.294999489909026e-07, + "loss": 0.6367, + "step": 25586 + }, + { + "epoch": 0.89, + "learning_rate": 6.29119778187397e-07, + "loss": 0.6185, + "step": 25587 + }, + { + "epoch": 0.89, + "learning_rate": 6.287397184875255e-07, + "loss": 0.5698, + "step": 25588 + }, + { + "epoch": 0.89, + "learning_rate": 6.283597698958022e-07, + "loss": 0.6336, + "step": 25589 + }, + { + "epoch": 0.89, + "learning_rate": 6.279799324167302e-07, + "loss": 0.6633, + "step": 25590 + }, + { + "epoch": 0.89, + "learning_rate": 6.276002060548103e-07, + "loss": 0.6295, + "step": 25591 + }, + { + "epoch": 0.89, + "learning_rate": 6.272205908145467e-07, + "loss": 0.621, + "step": 25592 + }, + { + "epoch": 0.89, + "learning_rate": 6.268410867004404e-07, + "loss": 0.6016, + "step": 25593 + }, + { + "epoch": 0.89, + "learning_rate": 6.264616937169865e-07, + "loss": 0.5446, + "step": 25594 + }, + { + "epoch": 0.89, + "learning_rate": 6.260824118686892e-07, + "loss": 0.6492, + "step": 25595 + }, + { + "epoch": 0.89, + "learning_rate": 6.25703241160045e-07, + "loss": 0.6336, + "step": 25596 + }, + { + "epoch": 0.89, + "learning_rate": 6.253241815955446e-07, + "loss": 0.6413, + "step": 25597 + }, + { + "epoch": 0.89, + "learning_rate": 6.249452331796879e-07, + "loss": 0.6397, + "step": 25598 + }, + { + "epoch": 0.89, + "learning_rate": 6.245663959169623e-07, + "loss": 0.6143, + "step": 25599 + }, + { + "epoch": 0.89, + "learning_rate": 6.24187669811861e-07, + "loss": 0.6001, + "step": 25600 + }, + { + "epoch": 0.89, + "learning_rate": 6.23809054868878e-07, + "loss": 0.6252, + "step": 25601 + }, + { + "epoch": 0.89, + "learning_rate": 6.234305510924988e-07, + "loss": 0.627, + "step": 25602 + }, + { + "epoch": 0.89, + "learning_rate": 6.230521584872118e-07, + "loss": 0.6637, + "step": 25603 + }, + { + "epoch": 0.89, + "learning_rate": 6.226738770575047e-07, + "loss": 0.6092, + "step": 25604 + }, + { + "epoch": 0.89, + "learning_rate": 6.222957068078594e-07, + "loss": 0.6382, + "step": 25605 + }, + { + "epoch": 0.89, + "learning_rate": 6.219176477427602e-07, + "loss": 0.6132, + "step": 25606 + }, + { + "epoch": 0.89, + "learning_rate": 6.215396998666933e-07, + "loss": 0.5941, + "step": 25607 + }, + { + "epoch": 0.89, + "learning_rate": 6.211618631841355e-07, + "loss": 0.6484, + "step": 25608 + }, + { + "epoch": 0.89, + "learning_rate": 6.207841376995682e-07, + "loss": 0.6089, + "step": 25609 + }, + { + "epoch": 0.89, + "learning_rate": 6.204065234174717e-07, + "loss": 0.6589, + "step": 25610 + }, + { + "epoch": 0.89, + "learning_rate": 6.200290203423187e-07, + "loss": 0.6246, + "step": 25611 + }, + { + "epoch": 0.89, + "learning_rate": 6.19651628478587e-07, + "loss": 0.597, + "step": 25612 + }, + { + "epoch": 0.89, + "learning_rate": 6.192743478307528e-07, + "loss": 0.6214, + "step": 25613 + }, + { + "epoch": 0.89, + "learning_rate": 6.188971784032882e-07, + "loss": 0.6313, + "step": 25614 + }, + { + "epoch": 0.89, + "learning_rate": 6.185201202006641e-07, + "loss": 0.6344, + "step": 25615 + }, + { + "epoch": 0.89, + "learning_rate": 6.181431732273524e-07, + "loss": 0.6452, + "step": 25616 + }, + { + "epoch": 0.89, + "learning_rate": 6.177663374878207e-07, + "loss": 0.5987, + "step": 25617 + }, + { + "epoch": 0.89, + "learning_rate": 6.173896129865364e-07, + "loss": 0.6005, + "step": 25618 + }, + { + "epoch": 0.89, + "learning_rate": 6.170129997279695e-07, + "loss": 0.6408, + "step": 25619 + }, + { + "epoch": 0.89, + "learning_rate": 6.166364977165817e-07, + "loss": 0.6019, + "step": 25620 + }, + { + "epoch": 0.89, + "learning_rate": 6.162601069568385e-07, + "loss": 0.7069, + "step": 25621 + }, + { + "epoch": 0.89, + "learning_rate": 6.158838274532042e-07, + "loss": 0.6628, + "step": 25622 + }, + { + "epoch": 0.89, + "learning_rate": 6.155076592101361e-07, + "loss": 0.6185, + "step": 25623 + }, + { + "epoch": 0.89, + "learning_rate": 6.151316022320941e-07, + "loss": 0.6093, + "step": 25624 + }, + { + "epoch": 0.89, + "learning_rate": 6.147556565235424e-07, + "loss": 0.6802, + "step": 25625 + }, + { + "epoch": 0.89, + "learning_rate": 6.14379822088933e-07, + "loss": 0.6757, + "step": 25626 + }, + { + "epoch": 0.89, + "learning_rate": 6.140040989327245e-07, + "loss": 0.6332, + "step": 25627 + }, + { + "epoch": 0.89, + "learning_rate": 6.136284870593711e-07, + "loss": 0.6657, + "step": 25628 + }, + { + "epoch": 0.89, + "learning_rate": 6.13252986473325e-07, + "loss": 0.5919, + "step": 25629 + }, + { + "epoch": 0.89, + "learning_rate": 6.128775971790379e-07, + "loss": 0.6482, + "step": 25630 + }, + { + "epoch": 0.89, + "learning_rate": 6.125023191809643e-07, + "loss": 0.5886, + "step": 25631 + }, + { + "epoch": 0.89, + "learning_rate": 6.121271524835493e-07, + "loss": 0.6969, + "step": 25632 + }, + { + "epoch": 0.89, + "learning_rate": 6.117520970912427e-07, + "loss": 0.6723, + "step": 25633 + }, + { + "epoch": 0.89, + "learning_rate": 6.113771530084933e-07, + "loss": 0.6055, + "step": 25634 + }, + { + "epoch": 0.89, + "learning_rate": 6.110023202397419e-07, + "loss": 0.6506, + "step": 25635 + }, + { + "epoch": 0.89, + "learning_rate": 6.106275987894339e-07, + "loss": 0.6429, + "step": 25636 + }, + { + "epoch": 0.89, + "learning_rate": 6.102529886620167e-07, + "loss": 0.6118, + "step": 25637 + }, + { + "epoch": 0.89, + "learning_rate": 6.098784898619269e-07, + "loss": 0.6479, + "step": 25638 + }, + { + "epoch": 0.89, + "learning_rate": 6.095041023936055e-07, + "loss": 0.6124, + "step": 25639 + }, + { + "epoch": 0.89, + "learning_rate": 6.091298262614942e-07, + "loss": 0.6558, + "step": 25640 + }, + { + "epoch": 0.89, + "learning_rate": 6.087556614700263e-07, + "loss": 0.6401, + "step": 25641 + }, + { + "epoch": 0.89, + "learning_rate": 6.083816080236394e-07, + "loss": 0.6129, + "step": 25642 + }, + { + "epoch": 0.89, + "learning_rate": 6.080076659267708e-07, + "loss": 0.6294, + "step": 25643 + }, + { + "epoch": 0.89, + "learning_rate": 6.076338351838518e-07, + "loss": 0.6335, + "step": 25644 + }, + { + "epoch": 0.89, + "learning_rate": 6.072601157993141e-07, + "loss": 0.6726, + "step": 25645 + }, + { + "epoch": 0.89, + "learning_rate": 6.068865077775921e-07, + "loss": 0.6426, + "step": 25646 + }, + { + "epoch": 0.89, + "learning_rate": 6.06513011123111e-07, + "loss": 0.6364, + "step": 25647 + }, + { + "epoch": 0.89, + "learning_rate": 6.061396258402996e-07, + "loss": 0.6206, + "step": 25648 + }, + { + "epoch": 0.89, + "learning_rate": 6.057663519335888e-07, + "loss": 0.607, + "step": 25649 + }, + { + "epoch": 0.89, + "learning_rate": 6.053931894074005e-07, + "loss": 0.6324, + "step": 25650 + }, + { + "epoch": 0.89, + "learning_rate": 6.050201382661602e-07, + "loss": 0.6237, + "step": 25651 + }, + { + "epoch": 0.89, + "learning_rate": 6.046471985142922e-07, + "loss": 0.6848, + "step": 25652 + }, + { + "epoch": 0.89, + "learning_rate": 6.042743701562149e-07, + "loss": 0.6383, + "step": 25653 + }, + { + "epoch": 0.89, + "learning_rate": 6.039016531963504e-07, + "loss": 0.6536, + "step": 25654 + }, + { + "epoch": 0.89, + "learning_rate": 6.035290476391198e-07, + "loss": 0.6592, + "step": 25655 + }, + { + "epoch": 0.89, + "learning_rate": 6.031565534889372e-07, + "loss": 0.61, + "step": 25656 + }, + { + "epoch": 0.89, + "learning_rate": 6.027841707502214e-07, + "loss": 0.6253, + "step": 25657 + }, + { + "epoch": 0.89, + "learning_rate": 6.024118994273887e-07, + "loss": 0.6435, + "step": 25658 + }, + { + "epoch": 0.89, + "learning_rate": 6.02039739524849e-07, + "loss": 0.6429, + "step": 25659 + }, + { + "epoch": 0.89, + "learning_rate": 6.016676910470165e-07, + "loss": 0.648, + "step": 25660 + }, + { + "epoch": 0.89, + "learning_rate": 6.012957539983022e-07, + "loss": 0.628, + "step": 25661 + }, + { + "epoch": 0.89, + "learning_rate": 6.009239283831169e-07, + "loss": 0.6271, + "step": 25662 + }, + { + "epoch": 0.89, + "learning_rate": 6.005522142058696e-07, + "loss": 0.6378, + "step": 25663 + }, + { + "epoch": 0.89, + "learning_rate": 6.00180611470964e-07, + "loss": 0.63, + "step": 25664 + }, + { + "epoch": 0.89, + "learning_rate": 5.998091201828093e-07, + "loss": 0.6611, + "step": 25665 + }, + { + "epoch": 0.89, + "learning_rate": 5.994377403458084e-07, + "loss": 0.6444, + "step": 25666 + }, + { + "epoch": 0.89, + "learning_rate": 5.990664719643646e-07, + "loss": 0.6645, + "step": 25667 + }, + { + "epoch": 0.89, + "learning_rate": 5.986953150428798e-07, + "loss": 0.6516, + "step": 25668 + }, + { + "epoch": 0.89, + "learning_rate": 5.983242695857561e-07, + "loss": 0.6347, + "step": 25669 + }, + { + "epoch": 0.89, + "learning_rate": 5.979533355973898e-07, + "loss": 0.6057, + "step": 25670 + }, + { + "epoch": 0.89, + "learning_rate": 5.97582513082181e-07, + "loss": 0.6338, + "step": 25671 + }, + { + "epoch": 0.89, + "learning_rate": 5.972118020445261e-07, + "loss": 0.5813, + "step": 25672 + }, + { + "epoch": 0.89, + "learning_rate": 5.968412024888182e-07, + "loss": 0.6765, + "step": 25673 + }, + { + "epoch": 0.89, + "learning_rate": 5.964707144194548e-07, + "loss": 0.6371, + "step": 25674 + }, + { + "epoch": 0.89, + "learning_rate": 5.96100337840827e-07, + "loss": 0.6045, + "step": 25675 + }, + { + "epoch": 0.89, + "learning_rate": 5.957300727573245e-07, + "loss": 0.6486, + "step": 25676 + }, + { + "epoch": 0.89, + "learning_rate": 5.953599191733383e-07, + "loss": 0.6571, + "step": 25677 + }, + { + "epoch": 0.89, + "learning_rate": 5.949898770932572e-07, + "loss": 0.6265, + "step": 25678 + }, + { + "epoch": 0.89, + "learning_rate": 5.946199465214686e-07, + "loss": 0.6543, + "step": 25679 + }, + { + "epoch": 0.89, + "learning_rate": 5.94250127462358e-07, + "loss": 0.6711, + "step": 25680 + }, + { + "epoch": 0.89, + "learning_rate": 5.938804199203118e-07, + "loss": 0.5772, + "step": 25681 + }, + { + "epoch": 0.89, + "learning_rate": 5.935108238997112e-07, + "loss": 0.6391, + "step": 25682 + }, + { + "epoch": 0.89, + "learning_rate": 5.93141339404939e-07, + "loss": 0.6228, + "step": 25683 + }, + { + "epoch": 0.89, + "learning_rate": 5.927719664403753e-07, + "loss": 0.6256, + "step": 25684 + }, + { + "epoch": 0.89, + "learning_rate": 5.924027050104008e-07, + "loss": 0.6207, + "step": 25685 + }, + { + "epoch": 0.89, + "learning_rate": 5.920335551193934e-07, + "loss": 0.6405, + "step": 25686 + }, + { + "epoch": 0.89, + "learning_rate": 5.916645167717294e-07, + "loss": 0.6877, + "step": 25687 + }, + { + "epoch": 0.89, + "learning_rate": 5.912955899717842e-07, + "loss": 0.6397, + "step": 25688 + }, + { + "epoch": 0.89, + "learning_rate": 5.909267747239312e-07, + "loss": 0.6398, + "step": 25689 + }, + { + "epoch": 0.89, + "learning_rate": 5.905580710325432e-07, + "loss": 0.6513, + "step": 25690 + }, + { + "epoch": 0.89, + "learning_rate": 5.901894789019936e-07, + "loss": 0.605, + "step": 25691 + }, + { + "epoch": 0.89, + "learning_rate": 5.898209983366498e-07, + "loss": 0.636, + "step": 25692 + }, + { + "epoch": 0.89, + "learning_rate": 5.894526293408842e-07, + "loss": 0.6234, + "step": 25693 + }, + { + "epoch": 0.89, + "learning_rate": 5.890843719190609e-07, + "loss": 0.5711, + "step": 25694 + }, + { + "epoch": 0.89, + "learning_rate": 5.887162260755463e-07, + "loss": 0.624, + "step": 25695 + }, + { + "epoch": 0.89, + "learning_rate": 5.883481918147072e-07, + "loss": 0.6634, + "step": 25696 + }, + { + "epoch": 0.89, + "learning_rate": 5.879802691409053e-07, + "loss": 0.6539, + "step": 25697 + }, + { + "epoch": 0.89, + "learning_rate": 5.876124580585041e-07, + "loss": 0.6227, + "step": 25698 + }, + { + "epoch": 0.89, + "learning_rate": 5.872447585718655e-07, + "loss": 0.6575, + "step": 25699 + }, + { + "epoch": 0.89, + "learning_rate": 5.868771706853449e-07, + "loss": 0.6261, + "step": 25700 + }, + { + "epoch": 0.89, + "learning_rate": 5.865096944033044e-07, + "loss": 0.6546, + "step": 25701 + }, + { + "epoch": 0.89, + "learning_rate": 5.861423297300994e-07, + "loss": 0.6566, + "step": 25702 + }, + { + "epoch": 0.89, + "learning_rate": 5.857750766700854e-07, + "loss": 0.6151, + "step": 25703 + }, + { + "epoch": 0.89, + "learning_rate": 5.854079352276165e-07, + "loss": 0.6379, + "step": 25704 + }, + { + "epoch": 0.89, + "learning_rate": 5.850409054070483e-07, + "loss": 0.6048, + "step": 25705 + }, + { + "epoch": 0.89, + "learning_rate": 5.846739872127283e-07, + "loss": 0.6045, + "step": 25706 + }, + { + "epoch": 0.89, + "learning_rate": 5.843071806490086e-07, + "loss": 0.6652, + "step": 25707 + }, + { + "epoch": 0.89, + "learning_rate": 5.83940485720238e-07, + "loss": 0.6398, + "step": 25708 + }, + { + "epoch": 0.89, + "learning_rate": 5.835739024307652e-07, + "loss": 0.645, + "step": 25709 + }, + { + "epoch": 0.89, + "learning_rate": 5.832074307849345e-07, + "loss": 0.6685, + "step": 25710 + }, + { + "epoch": 0.89, + "learning_rate": 5.828410707870935e-07, + "loss": 0.675, + "step": 25711 + }, + { + "epoch": 0.89, + "learning_rate": 5.824748224415832e-07, + "loss": 0.6159, + "step": 25712 + }, + { + "epoch": 0.89, + "learning_rate": 5.821086857527481e-07, + "loss": 0.6534, + "step": 25713 + }, + { + "epoch": 0.89, + "learning_rate": 5.817426607249277e-07, + "loss": 0.6677, + "step": 25714 + }, + { + "epoch": 0.89, + "learning_rate": 5.81376747362461e-07, + "loss": 0.6827, + "step": 25715 + }, + { + "epoch": 0.89, + "learning_rate": 5.810109456696888e-07, + "loss": 0.6538, + "step": 25716 + }, + { + "epoch": 0.89, + "learning_rate": 5.806452556509478e-07, + "loss": 0.679, + "step": 25717 + }, + { + "epoch": 0.89, + "learning_rate": 5.802796773105723e-07, + "loss": 0.6429, + "step": 25718 + }, + { + "epoch": 0.89, + "learning_rate": 5.799142106528965e-07, + "loss": 0.6861, + "step": 25719 + }, + { + "epoch": 0.89, + "learning_rate": 5.795488556822537e-07, + "loss": 0.6155, + "step": 25720 + }, + { + "epoch": 0.89, + "learning_rate": 5.79183612402977e-07, + "loss": 0.6601, + "step": 25721 + }, + { + "epoch": 0.89, + "learning_rate": 5.788184808193975e-07, + "loss": 0.6607, + "step": 25722 + }, + { + "epoch": 0.89, + "learning_rate": 5.784534609358405e-07, + "loss": 0.6316, + "step": 25723 + }, + { + "epoch": 0.89, + "learning_rate": 5.780885527566371e-07, + "loss": 0.6394, + "step": 25724 + }, + { + "epoch": 0.89, + "learning_rate": 5.777237562861115e-07, + "loss": 0.6111, + "step": 25725 + }, + { + "epoch": 0.89, + "learning_rate": 5.773590715285915e-07, + "loss": 0.5919, + "step": 25726 + }, + { + "epoch": 0.89, + "learning_rate": 5.769944984883979e-07, + "loss": 0.6492, + "step": 25727 + }, + { + "epoch": 0.89, + "learning_rate": 5.766300371698574e-07, + "loss": 0.6121, + "step": 25728 + }, + { + "epoch": 0.89, + "learning_rate": 5.762656875772866e-07, + "loss": 0.5878, + "step": 25729 + }, + { + "epoch": 0.89, + "learning_rate": 5.759014497150062e-07, + "loss": 0.6208, + "step": 25730 + }, + { + "epoch": 0.89, + "learning_rate": 5.755373235873363e-07, + "loss": 0.6682, + "step": 25731 + }, + { + "epoch": 0.89, + "learning_rate": 5.751733091985934e-07, + "loss": 0.6901, + "step": 25732 + }, + { + "epoch": 0.89, + "learning_rate": 5.74809406553094e-07, + "loss": 0.6075, + "step": 25733 + }, + { + "epoch": 0.89, + "learning_rate": 5.744456156551526e-07, + "loss": 0.6428, + "step": 25734 + }, + { + "epoch": 0.89, + "learning_rate": 5.74081936509081e-07, + "loss": 0.616, + "step": 25735 + }, + { + "epoch": 0.89, + "learning_rate": 5.737183691191917e-07, + "loss": 0.5731, + "step": 25736 + }, + { + "epoch": 0.89, + "learning_rate": 5.733549134897953e-07, + "loss": 0.6594, + "step": 25737 + }, + { + "epoch": 0.89, + "learning_rate": 5.729915696252008e-07, + "loss": 0.6627, + "step": 25738 + }, + { + "epoch": 0.89, + "learning_rate": 5.726283375297171e-07, + "loss": 0.6037, + "step": 25739 + }, + { + "epoch": 0.89, + "learning_rate": 5.722652172076514e-07, + "loss": 0.634, + "step": 25740 + }, + { + "epoch": 0.89, + "learning_rate": 5.719022086633064e-07, + "loss": 0.6092, + "step": 25741 + }, + { + "epoch": 0.89, + "learning_rate": 5.715393119009871e-07, + "loss": 0.6555, + "step": 25742 + }, + { + "epoch": 0.89, + "learning_rate": 5.711765269249969e-07, + "loss": 0.6827, + "step": 25743 + }, + { + "epoch": 0.89, + "learning_rate": 5.708138537396357e-07, + "loss": 0.6405, + "step": 25744 + }, + { + "epoch": 0.89, + "learning_rate": 5.704512923492045e-07, + "loss": 0.5995, + "step": 25745 + }, + { + "epoch": 0.89, + "learning_rate": 5.700888427580031e-07, + "loss": 0.7173, + "step": 25746 + }, + { + "epoch": 0.89, + "learning_rate": 5.69726504970326e-07, + "loss": 0.6303, + "step": 25747 + }, + { + "epoch": 0.89, + "learning_rate": 5.693642789904708e-07, + "loss": 0.5947, + "step": 25748 + }, + { + "epoch": 0.89, + "learning_rate": 5.690021648227306e-07, + "loss": 0.599, + "step": 25749 + }, + { + "epoch": 0.89, + "learning_rate": 5.686401624714011e-07, + "loss": 0.6534, + "step": 25750 + }, + { + "epoch": 0.89, + "learning_rate": 5.682782719407731e-07, + "loss": 0.652, + "step": 25751 + }, + { + "epoch": 0.89, + "learning_rate": 5.679164932351389e-07, + "loss": 0.5661, + "step": 25752 + }, + { + "epoch": 0.89, + "learning_rate": 5.675548263587848e-07, + "loss": 0.6345, + "step": 25753 + }, + { + "epoch": 0.89, + "learning_rate": 5.671932713160011e-07, + "loss": 0.5846, + "step": 25754 + }, + { + "epoch": 0.89, + "learning_rate": 5.66831828111073e-07, + "loss": 0.6441, + "step": 25755 + }, + { + "epoch": 0.89, + "learning_rate": 5.664704967482859e-07, + "loss": 0.6204, + "step": 25756 + }, + { + "epoch": 0.89, + "learning_rate": 5.661092772319254e-07, + "loss": 0.627, + "step": 25757 + }, + { + "epoch": 0.89, + "learning_rate": 5.657481695662747e-07, + "loss": 0.5896, + "step": 25758 + }, + { + "epoch": 0.89, + "learning_rate": 5.653871737556127e-07, + "loss": 0.6036, + "step": 25759 + }, + { + "epoch": 0.89, + "learning_rate": 5.650262898042203e-07, + "loss": 0.6066, + "step": 25760 + }, + { + "epoch": 0.89, + "learning_rate": 5.646655177163762e-07, + "loss": 0.6562, + "step": 25761 + }, + { + "epoch": 0.89, + "learning_rate": 5.643048574963583e-07, + "loss": 0.6378, + "step": 25762 + }, + { + "epoch": 0.89, + "learning_rate": 5.63944309148442e-07, + "loss": 0.6386, + "step": 25763 + }, + { + "epoch": 0.89, + "learning_rate": 5.635838726769049e-07, + "loss": 0.6051, + "step": 25764 + }, + { + "epoch": 0.89, + "learning_rate": 5.632235480860171e-07, + "loss": 0.6179, + "step": 25765 + }, + { + "epoch": 0.89, + "learning_rate": 5.628633353800506e-07, + "loss": 0.6142, + "step": 25766 + }, + { + "epoch": 0.89, + "learning_rate": 5.625032345632775e-07, + "loss": 0.6284, + "step": 25767 + }, + { + "epoch": 0.89, + "learning_rate": 5.621432456399679e-07, + "loss": 0.6, + "step": 25768 + }, + { + "epoch": 0.89, + "learning_rate": 5.617833686143881e-07, + "loss": 0.5961, + "step": 25769 + }, + { + "epoch": 0.89, + "learning_rate": 5.614236034908083e-07, + "loss": 0.6551, + "step": 25770 + }, + { + "epoch": 0.89, + "learning_rate": 5.610639502734894e-07, + "loss": 0.6023, + "step": 25771 + }, + { + "epoch": 0.89, + "learning_rate": 5.607044089666969e-07, + "loss": 0.6196, + "step": 25772 + }, + { + "epoch": 0.89, + "learning_rate": 5.603449795746962e-07, + "loss": 0.6608, + "step": 25773 + }, + { + "epoch": 0.89, + "learning_rate": 5.599856621017452e-07, + "loss": 0.6432, + "step": 25774 + }, + { + "epoch": 0.89, + "learning_rate": 5.59626456552107e-07, + "loss": 0.6241, + "step": 25775 + }, + { + "epoch": 0.89, + "learning_rate": 5.592673629300404e-07, + "loss": 0.6158, + "step": 25776 + }, + { + "epoch": 0.89, + "learning_rate": 5.58908381239801e-07, + "loss": 0.6005, + "step": 25777 + }, + { + "epoch": 0.89, + "learning_rate": 5.585495114856443e-07, + "loss": 0.6726, + "step": 25778 + }, + { + "epoch": 0.89, + "learning_rate": 5.581907536718278e-07, + "loss": 0.6558, + "step": 25779 + }, + { + "epoch": 0.89, + "learning_rate": 5.578321078026039e-07, + "loss": 0.6445, + "step": 25780 + }, + { + "epoch": 0.89, + "learning_rate": 5.574735738822245e-07, + "loss": 0.6431, + "step": 25781 + }, + { + "epoch": 0.89, + "learning_rate": 5.571151519149421e-07, + "loss": 0.6116, + "step": 25782 + }, + { + "epoch": 0.89, + "learning_rate": 5.56756841905004e-07, + "loss": 0.6036, + "step": 25783 + }, + { + "epoch": 0.89, + "learning_rate": 5.563986438566582e-07, + "loss": 0.6106, + "step": 25784 + }, + { + "epoch": 0.89, + "learning_rate": 5.560405577741535e-07, + "loss": 0.6708, + "step": 25785 + }, + { + "epoch": 0.89, + "learning_rate": 5.556825836617341e-07, + "loss": 0.6378, + "step": 25786 + }, + { + "epoch": 0.89, + "learning_rate": 5.553247215236468e-07, + "loss": 0.6977, + "step": 25787 + }, + { + "epoch": 0.89, + "learning_rate": 5.549669713641314e-07, + "loss": 0.6068, + "step": 25788 + }, + { + "epoch": 0.89, + "learning_rate": 5.546093331874292e-07, + "loss": 0.6238, + "step": 25789 + }, + { + "epoch": 0.89, + "learning_rate": 5.542518069977843e-07, + "loss": 0.6401, + "step": 25790 + }, + { + "epoch": 0.89, + "learning_rate": 5.5389439279943e-07, + "loss": 0.5721, + "step": 25791 + }, + { + "epoch": 0.89, + "learning_rate": 5.535370905966087e-07, + "loss": 0.6449, + "step": 25792 + }, + { + "epoch": 0.89, + "learning_rate": 5.531799003935567e-07, + "loss": 0.6515, + "step": 25793 + }, + { + "epoch": 0.89, + "learning_rate": 5.528228221945054e-07, + "loss": 0.5563, + "step": 25794 + }, + { + "epoch": 0.89, + "learning_rate": 5.524658560036899e-07, + "loss": 0.6255, + "step": 25795 + }, + { + "epoch": 0.89, + "learning_rate": 5.52109001825345e-07, + "loss": 0.599, + "step": 25796 + }, + { + "epoch": 0.89, + "learning_rate": 5.517522596636971e-07, + "loss": 0.6201, + "step": 25797 + }, + { + "epoch": 0.89, + "learning_rate": 5.513956295229783e-07, + "loss": 0.5871, + "step": 25798 + }, + { + "epoch": 0.89, + "learning_rate": 5.510391114074199e-07, + "loss": 0.6519, + "step": 25799 + }, + { + "epoch": 0.89, + "learning_rate": 5.506827053212427e-07, + "loss": 0.6491, + "step": 25800 + }, + { + "epoch": 0.89, + "learning_rate": 5.503264112686768e-07, + "loss": 0.6689, + "step": 25801 + }, + { + "epoch": 0.89, + "learning_rate": 5.499702292539455e-07, + "loss": 0.6641, + "step": 25802 + }, + { + "epoch": 0.89, + "learning_rate": 5.496141592812698e-07, + "loss": 0.6166, + "step": 25803 + }, + { + "epoch": 0.89, + "learning_rate": 5.492582013548742e-07, + "loss": 0.6044, + "step": 25804 + }, + { + "epoch": 0.89, + "learning_rate": 5.489023554789785e-07, + "loss": 0.6845, + "step": 25805 + }, + { + "epoch": 0.89, + "learning_rate": 5.485466216578005e-07, + "loss": 0.6799, + "step": 25806 + }, + { + "epoch": 0.89, + "learning_rate": 5.481909998955582e-07, + "loss": 0.7005, + "step": 25807 + }, + { + "epoch": 0.89, + "learning_rate": 5.478354901964688e-07, + "loss": 0.6456, + "step": 25808 + }, + { + "epoch": 0.89, + "learning_rate": 5.47480092564745e-07, + "loss": 0.6083, + "step": 25809 + }, + { + "epoch": 0.89, + "learning_rate": 5.471248070046031e-07, + "loss": 0.632, + "step": 25810 + }, + { + "epoch": 0.89, + "learning_rate": 5.467696335202566e-07, + "loss": 0.6711, + "step": 25811 + }, + { + "epoch": 0.89, + "learning_rate": 5.46414572115912e-07, + "loss": 0.7065, + "step": 25812 + }, + { + "epoch": 0.89, + "learning_rate": 5.460596227957826e-07, + "loss": 0.5789, + "step": 25813 + }, + { + "epoch": 0.89, + "learning_rate": 5.457047855640762e-07, + "loss": 0.6269, + "step": 25814 + }, + { + "epoch": 0.89, + "learning_rate": 5.453500604249973e-07, + "loss": 0.5582, + "step": 25815 + }, + { + "epoch": 0.89, + "learning_rate": 5.449954473827546e-07, + "loss": 0.6377, + "step": 25816 + }, + { + "epoch": 0.89, + "learning_rate": 5.446409464415525e-07, + "loss": 0.6085, + "step": 25817 + }, + { + "epoch": 0.89, + "learning_rate": 5.442865576055922e-07, + "loss": 0.618, + "step": 25818 + }, + { + "epoch": 0.89, + "learning_rate": 5.439322808790759e-07, + "loss": 0.5865, + "step": 25819 + }, + { + "epoch": 0.89, + "learning_rate": 5.435781162662068e-07, + "loss": 0.6773, + "step": 25820 + }, + { + "epoch": 0.89, + "learning_rate": 5.432240637711772e-07, + "loss": 0.6191, + "step": 25821 + }, + { + "epoch": 0.89, + "learning_rate": 5.428701233981914e-07, + "loss": 0.6437, + "step": 25822 + }, + { + "epoch": 0.89, + "learning_rate": 5.425162951514451e-07, + "loss": 0.6074, + "step": 25823 + }, + { + "epoch": 0.89, + "learning_rate": 5.421625790351303e-07, + "loss": 0.6124, + "step": 25824 + }, + { + "epoch": 0.89, + "learning_rate": 5.418089750534428e-07, + "loss": 0.6045, + "step": 25825 + }, + { + "epoch": 0.89, + "learning_rate": 5.414554832105756e-07, + "loss": 0.6393, + "step": 25826 + }, + { + "epoch": 0.89, + "learning_rate": 5.411021035107167e-07, + "loss": 0.6986, + "step": 25827 + }, + { + "epoch": 0.89, + "learning_rate": 5.407488359580582e-07, + "loss": 0.6447, + "step": 25828 + }, + { + "epoch": 0.89, + "learning_rate": 5.403956805567901e-07, + "loss": 0.63, + "step": 25829 + }, + { + "epoch": 0.89, + "learning_rate": 5.400426373110968e-07, + "loss": 0.6441, + "step": 25830 + }, + { + "epoch": 0.89, + "learning_rate": 5.396897062251638e-07, + "loss": 0.5785, + "step": 25831 + }, + { + "epoch": 0.9, + "learning_rate": 5.39336887303179e-07, + "loss": 0.6232, + "step": 25832 + }, + { + "epoch": 0.9, + "learning_rate": 5.389841805493201e-07, + "loss": 0.5984, + "step": 25833 + }, + { + "epoch": 0.9, + "learning_rate": 5.386315859677737e-07, + "loss": 0.6177, + "step": 25834 + }, + { + "epoch": 0.9, + "learning_rate": 5.3827910356272e-07, + "loss": 0.6214, + "step": 25835 + }, + { + "epoch": 0.9, + "learning_rate": 5.379267333383342e-07, + "loss": 0.594, + "step": 25836 + }, + { + "epoch": 0.9, + "learning_rate": 5.375744752987976e-07, + "loss": 0.6069, + "step": 25837 + }, + { + "epoch": 0.9, + "learning_rate": 5.37222329448287e-07, + "loss": 0.6467, + "step": 25838 + }, + { + "epoch": 0.9, + "learning_rate": 5.368702957909733e-07, + "loss": 0.6284, + "step": 25839 + }, + { + "epoch": 0.9, + "learning_rate": 5.365183743310343e-07, + "loss": 0.6555, + "step": 25840 + }, + { + "epoch": 0.9, + "learning_rate": 5.361665650726422e-07, + "loss": 0.6459, + "step": 25841 + }, + { + "epoch": 0.9, + "learning_rate": 5.358148680199671e-07, + "loss": 0.6609, + "step": 25842 + }, + { + "epoch": 0.9, + "learning_rate": 5.354632831771778e-07, + "loss": 0.6621, + "step": 25843 + }, + { + "epoch": 0.9, + "learning_rate": 5.351118105484466e-07, + "loss": 0.6544, + "step": 25844 + }, + { + "epoch": 0.9, + "learning_rate": 5.347604501379344e-07, + "loss": 0.6457, + "step": 25845 + }, + { + "epoch": 0.9, + "learning_rate": 5.344092019498126e-07, + "loss": 0.6619, + "step": 25846 + }, + { + "epoch": 0.9, + "learning_rate": 5.340580659882444e-07, + "loss": 0.6587, + "step": 25847 + }, + { + "epoch": 0.9, + "learning_rate": 5.337070422573909e-07, + "loss": 0.6156, + "step": 25848 + }, + { + "epoch": 0.9, + "learning_rate": 5.333561307614177e-07, + "loss": 0.6508, + "step": 25849 + }, + { + "epoch": 0.9, + "learning_rate": 5.330053315044814e-07, + "loss": 0.6379, + "step": 25850 + }, + { + "epoch": 0.9, + "learning_rate": 5.326546444907399e-07, + "loss": 0.6842, + "step": 25851 + }, + { + "epoch": 0.9, + "learning_rate": 5.323040697243587e-07, + "loss": 0.6065, + "step": 25852 + }, + { + "epoch": 0.9, + "learning_rate": 5.319536072094866e-07, + "loss": 0.683, + "step": 25853 + }, + { + "epoch": 0.9, + "learning_rate": 5.316032569502816e-07, + "loss": 0.6893, + "step": 25854 + }, + { + "epoch": 0.9, + "learning_rate": 5.312530189508991e-07, + "loss": 0.6259, + "step": 25855 + }, + { + "epoch": 0.9, + "learning_rate": 5.309028932154892e-07, + "loss": 0.6945, + "step": 25856 + }, + { + "epoch": 0.9, + "learning_rate": 5.30552879748203e-07, + "loss": 0.6038, + "step": 25857 + }, + { + "epoch": 0.9, + "learning_rate": 5.302029785531926e-07, + "loss": 0.576, + "step": 25858 + }, + { + "epoch": 0.9, + "learning_rate": 5.298531896346048e-07, + "loss": 0.5775, + "step": 25859 + }, + { + "epoch": 0.9, + "learning_rate": 5.295035129965875e-07, + "loss": 0.6178, + "step": 25860 + }, + { + "epoch": 0.9, + "learning_rate": 5.291539486432873e-07, + "loss": 0.5827, + "step": 25861 + }, + { + "epoch": 0.9, + "learning_rate": 5.288044965788464e-07, + "loss": 0.5917, + "step": 25862 + }, + { + "epoch": 0.9, + "learning_rate": 5.284551568074081e-07, + "loss": 0.7071, + "step": 25863 + }, + { + "epoch": 0.9, + "learning_rate": 5.281059293331181e-07, + "loss": 0.6477, + "step": 25864 + }, + { + "epoch": 0.9, + "learning_rate": 5.27756814160113e-07, + "loss": 0.6174, + "step": 25865 + }, + { + "epoch": 0.9, + "learning_rate": 5.27407811292533e-07, + "loss": 0.6139, + "step": 25866 + }, + { + "epoch": 0.9, + "learning_rate": 5.270589207345178e-07, + "loss": 0.5989, + "step": 25867 + }, + { + "epoch": 0.9, + "learning_rate": 5.267101424902011e-07, + "loss": 0.6232, + "step": 25868 + }, + { + "epoch": 0.9, + "learning_rate": 5.263614765637182e-07, + "loss": 0.6566, + "step": 25869 + }, + { + "epoch": 0.9, + "learning_rate": 5.26012922959207e-07, + "loss": 0.657, + "step": 25870 + }, + { + "epoch": 0.9, + "learning_rate": 5.256644816807954e-07, + "loss": 0.6106, + "step": 25871 + }, + { + "epoch": 0.9, + "learning_rate": 5.253161527326167e-07, + "loss": 0.6589, + "step": 25872 + }, + { + "epoch": 0.9, + "learning_rate": 5.249679361188021e-07, + "loss": 0.6046, + "step": 25873 + }, + { + "epoch": 0.9, + "learning_rate": 5.24619831843477e-07, + "loss": 0.624, + "step": 25874 + }, + { + "epoch": 0.9, + "learning_rate": 5.242718399107693e-07, + "loss": 0.6633, + "step": 25875 + }, + { + "epoch": 0.9, + "learning_rate": 5.239239603248081e-07, + "loss": 0.7111, + "step": 25876 + }, + { + "epoch": 0.9, + "learning_rate": 5.235761930897143e-07, + "loss": 0.6289, + "step": 25877 + }, + { + "epoch": 0.9, + "learning_rate": 5.232285382096125e-07, + "loss": 0.6401, + "step": 25878 + }, + { + "epoch": 0.9, + "learning_rate": 5.22880995688626e-07, + "loss": 0.6317, + "step": 25879 + }, + { + "epoch": 0.9, + "learning_rate": 5.225335655308728e-07, + "loss": 0.6217, + "step": 25880 + }, + { + "epoch": 0.9, + "learning_rate": 5.221862477404716e-07, + "loss": 0.5649, + "step": 25881 + }, + { + "epoch": 0.9, + "learning_rate": 5.218390423215435e-07, + "loss": 0.6446, + "step": 25882 + }, + { + "epoch": 0.9, + "learning_rate": 5.214919492782033e-07, + "loss": 0.6733, + "step": 25883 + }, + { + "epoch": 0.9, + "learning_rate": 5.211449686145664e-07, + "loss": 0.6524, + "step": 25884 + }, + { + "epoch": 0.9, + "learning_rate": 5.207981003347484e-07, + "loss": 0.6319, + "step": 25885 + }, + { + "epoch": 0.9, + "learning_rate": 5.204513444428583e-07, + "loss": 0.5774, + "step": 25886 + }, + { + "epoch": 0.9, + "learning_rate": 5.201047009430082e-07, + "loss": 0.593, + "step": 25887 + }, + { + "epoch": 0.9, + "learning_rate": 5.197581698393117e-07, + "loss": 0.6107, + "step": 25888 + }, + { + "epoch": 0.9, + "learning_rate": 5.194117511358732e-07, + "loss": 0.6313, + "step": 25889 + }, + { + "epoch": 0.9, + "learning_rate": 5.190654448368016e-07, + "loss": 0.6795, + "step": 25890 + }, + { + "epoch": 0.9, + "learning_rate": 5.187192509462035e-07, + "loss": 0.6542, + "step": 25891 + }, + { + "epoch": 0.9, + "learning_rate": 5.183731694681815e-07, + "loss": 0.5801, + "step": 25892 + }, + { + "epoch": 0.9, + "learning_rate": 5.180272004068398e-07, + "loss": 0.5815, + "step": 25893 + }, + { + "epoch": 0.9, + "learning_rate": 5.176813437662798e-07, + "loss": 0.6143, + "step": 25894 + }, + { + "epoch": 0.9, + "learning_rate": 5.173355995506036e-07, + "loss": 0.62, + "step": 25895 + }, + { + "epoch": 0.9, + "learning_rate": 5.16989967763909e-07, + "loss": 0.606, + "step": 25896 + }, + { + "epoch": 0.9, + "learning_rate": 5.166444484102961e-07, + "loss": 0.6287, + "step": 25897 + }, + { + "epoch": 0.9, + "learning_rate": 5.162990414938585e-07, + "loss": 0.6178, + "step": 25898 + }, + { + "epoch": 0.9, + "learning_rate": 5.159537470186926e-07, + "loss": 0.6546, + "step": 25899 + }, + { + "epoch": 0.9, + "learning_rate": 5.15608564988892e-07, + "loss": 0.632, + "step": 25900 + }, + { + "epoch": 0.9, + "learning_rate": 5.1526349540855e-07, + "loss": 0.6231, + "step": 25901 + }, + { + "epoch": 0.9, + "learning_rate": 5.149185382817568e-07, + "loss": 0.6766, + "step": 25902 + }, + { + "epoch": 0.9, + "learning_rate": 5.145736936126056e-07, + "loss": 0.6426, + "step": 25903 + }, + { + "epoch": 0.9, + "learning_rate": 5.142289614051799e-07, + "loss": 0.6058, + "step": 25904 + }, + { + "epoch": 0.9, + "learning_rate": 5.138843416635708e-07, + "loss": 0.596, + "step": 25905 + }, + { + "epoch": 0.9, + "learning_rate": 5.135398343918618e-07, + "loss": 0.6186, + "step": 25906 + }, + { + "epoch": 0.9, + "learning_rate": 5.131954395941385e-07, + "loss": 0.6078, + "step": 25907 + }, + { + "epoch": 0.9, + "learning_rate": 5.128511572744843e-07, + "loss": 0.6287, + "step": 25908 + }, + { + "epoch": 0.9, + "learning_rate": 5.125069874369826e-07, + "loss": 0.6661, + "step": 25909 + }, + { + "epoch": 0.9, + "learning_rate": 5.1216293008571e-07, + "loss": 0.6739, + "step": 25910 + }, + { + "epoch": 0.9, + "learning_rate": 5.11818985224749e-07, + "loss": 0.5998, + "step": 25911 + }, + { + "epoch": 0.9, + "learning_rate": 5.114751528581763e-07, + "loss": 0.6331, + "step": 25912 + }, + { + "epoch": 0.9, + "learning_rate": 5.111314329900685e-07, + "loss": 0.6766, + "step": 25913 + }, + { + "epoch": 0.9, + "learning_rate": 5.107878256245025e-07, + "loss": 0.628, + "step": 25914 + }, + { + "epoch": 0.9, + "learning_rate": 5.104443307655493e-07, + "loss": 0.62, + "step": 25915 + }, + { + "epoch": 0.9, + "learning_rate": 5.101009484172836e-07, + "loss": 0.6053, + "step": 25916 + }, + { + "epoch": 0.9, + "learning_rate": 5.097576785837754e-07, + "loss": 0.6443, + "step": 25917 + }, + { + "epoch": 0.9, + "learning_rate": 5.094145212690948e-07, + "loss": 0.6495, + "step": 25918 + }, + { + "epoch": 0.9, + "learning_rate": 5.090714764773108e-07, + "loss": 0.6481, + "step": 25919 + }, + { + "epoch": 0.9, + "learning_rate": 5.087285442124923e-07, + "loss": 0.6156, + "step": 25920 + }, + { + "epoch": 0.9, + "learning_rate": 5.083857244787027e-07, + "loss": 0.6313, + "step": 25921 + }, + { + "epoch": 0.9, + "learning_rate": 5.080430172800066e-07, + "loss": 0.6426, + "step": 25922 + }, + { + "epoch": 0.9, + "learning_rate": 5.077004226204674e-07, + "loss": 0.6538, + "step": 25923 + }, + { + "epoch": 0.9, + "learning_rate": 5.073579405041473e-07, + "loss": 0.5875, + "step": 25924 + }, + { + "epoch": 0.9, + "learning_rate": 5.070155709351077e-07, + "loss": 0.6243, + "step": 25925 + }, + { + "epoch": 0.9, + "learning_rate": 5.066733139174096e-07, + "loss": 0.6149, + "step": 25926 + }, + { + "epoch": 0.9, + "learning_rate": 5.063311694551054e-07, + "loss": 0.6435, + "step": 25927 + }, + { + "epoch": 0.9, + "learning_rate": 5.059891375522552e-07, + "loss": 0.5963, + "step": 25928 + }, + { + "epoch": 0.9, + "learning_rate": 5.056472182129146e-07, + "loss": 0.6334, + "step": 25929 + }, + { + "epoch": 0.9, + "learning_rate": 5.05305411441136e-07, + "loss": 0.6883, + "step": 25930 + }, + { + "epoch": 0.9, + "learning_rate": 5.049637172409727e-07, + "loss": 0.6271, + "step": 25931 + }, + { + "epoch": 0.9, + "learning_rate": 5.046221356164771e-07, + "loss": 0.6193, + "step": 25932 + }, + { + "epoch": 0.9, + "learning_rate": 5.042806665716959e-07, + "loss": 0.6527, + "step": 25933 + }, + { + "epoch": 0.9, + "learning_rate": 5.039393101106805e-07, + "loss": 0.6341, + "step": 25934 + }, + { + "epoch": 0.9, + "learning_rate": 5.035980662374762e-07, + "loss": 0.648, + "step": 25935 + }, + { + "epoch": 0.9, + "learning_rate": 5.032569349561312e-07, + "loss": 0.6398, + "step": 25936 + }, + { + "epoch": 0.9, + "learning_rate": 5.029159162706876e-07, + "loss": 0.6415, + "step": 25937 + }, + { + "epoch": 0.9, + "learning_rate": 5.025750101851912e-07, + "loss": 0.6441, + "step": 25938 + }, + { + "epoch": 0.9, + "learning_rate": 5.022342167036808e-07, + "loss": 0.6274, + "step": 25939 + }, + { + "epoch": 0.9, + "learning_rate": 5.018935358301991e-07, + "loss": 0.6244, + "step": 25940 + }, + { + "epoch": 0.9, + "learning_rate": 5.015529675687847e-07, + "loss": 0.6527, + "step": 25941 + }, + { + "epoch": 0.9, + "learning_rate": 5.012125119234745e-07, + "loss": 0.652, + "step": 25942 + }, + { + "epoch": 0.9, + "learning_rate": 5.008721688983065e-07, + "loss": 0.63, + "step": 25943 + }, + { + "epoch": 0.9, + "learning_rate": 5.005319384973173e-07, + "loss": 0.6343, + "step": 25944 + }, + { + "epoch": 0.9, + "learning_rate": 5.001918207245371e-07, + "loss": 0.6338, + "step": 25945 + }, + { + "epoch": 0.9, + "learning_rate": 4.998518155840004e-07, + "loss": 0.6252, + "step": 25946 + }, + { + "epoch": 0.9, + "learning_rate": 4.995119230797373e-07, + "loss": 0.639, + "step": 25947 + }, + { + "epoch": 0.9, + "learning_rate": 4.991721432157792e-07, + "loss": 0.6532, + "step": 25948 + }, + { + "epoch": 0.9, + "learning_rate": 4.98832475996155e-07, + "loss": 0.6263, + "step": 25949 + }, + { + "epoch": 0.9, + "learning_rate": 4.984929214248902e-07, + "loss": 0.6179, + "step": 25950 + }, + { + "epoch": 0.9, + "learning_rate": 4.981534795060116e-07, + "loss": 0.5916, + "step": 25951 + }, + { + "epoch": 0.9, + "learning_rate": 4.978141502435419e-07, + "loss": 0.6373, + "step": 25952 + }, + { + "epoch": 0.9, + "learning_rate": 4.974749336415074e-07, + "loss": 0.6314, + "step": 25953 + }, + { + "epoch": 0.9, + "learning_rate": 4.971358297039275e-07, + "loss": 0.6063, + "step": 25954 + }, + { + "epoch": 0.9, + "learning_rate": 4.967968384348232e-07, + "loss": 0.6739, + "step": 25955 + }, + { + "epoch": 0.9, + "learning_rate": 4.964579598382158e-07, + "loss": 0.6466, + "step": 25956 + }, + { + "epoch": 0.9, + "learning_rate": 4.961191939181198e-07, + "loss": 0.641, + "step": 25957 + }, + { + "epoch": 0.9, + "learning_rate": 4.957805406785532e-07, + "loss": 0.6582, + "step": 25958 + }, + { + "epoch": 0.9, + "learning_rate": 4.954420001235305e-07, + "loss": 0.6234, + "step": 25959 + }, + { + "epoch": 0.9, + "learning_rate": 4.951035722570674e-07, + "loss": 0.595, + "step": 25960 + }, + { + "epoch": 0.9, + "learning_rate": 4.947652570831751e-07, + "loss": 0.6229, + "step": 25961 + }, + { + "epoch": 0.9, + "learning_rate": 4.94427054605866e-07, + "loss": 0.595, + "step": 25962 + }, + { + "epoch": 0.9, + "learning_rate": 4.940889648291469e-07, + "loss": 0.6242, + "step": 25963 + }, + { + "epoch": 0.9, + "learning_rate": 4.93750987757029e-07, + "loss": 0.6121, + "step": 25964 + }, + { + "epoch": 0.9, + "learning_rate": 4.93413123393518e-07, + "loss": 0.5855, + "step": 25965 + }, + { + "epoch": 0.9, + "learning_rate": 4.930753717426207e-07, + "loss": 0.6697, + "step": 25966 + }, + { + "epoch": 0.9, + "learning_rate": 4.927377328083405e-07, + "loss": 0.6569, + "step": 25967 + }, + { + "epoch": 0.9, + "learning_rate": 4.924002065946831e-07, + "loss": 0.5902, + "step": 25968 + }, + { + "epoch": 0.9, + "learning_rate": 4.920627931056465e-07, + "loss": 0.6626, + "step": 25969 + }, + { + "epoch": 0.9, + "learning_rate": 4.917254923452341e-07, + "loss": 0.6213, + "step": 25970 + }, + { + "epoch": 0.9, + "learning_rate": 4.913883043174439e-07, + "loss": 0.6977, + "step": 25971 + }, + { + "epoch": 0.9, + "learning_rate": 4.910512290262736e-07, + "loss": 0.6007, + "step": 25972 + }, + { + "epoch": 0.9, + "learning_rate": 4.907142664757203e-07, + "loss": 0.6285, + "step": 25973 + }, + { + "epoch": 0.9, + "learning_rate": 4.903774166697783e-07, + "loss": 0.6039, + "step": 25974 + }, + { + "epoch": 0.9, + "learning_rate": 4.900406796124413e-07, + "loss": 0.6344, + "step": 25975 + }, + { + "epoch": 0.9, + "learning_rate": 4.897040553077025e-07, + "loss": 0.587, + "step": 25976 + }, + { + "epoch": 0.9, + "learning_rate": 4.893675437595535e-07, + "loss": 0.6184, + "step": 25977 + }, + { + "epoch": 0.9, + "learning_rate": 4.890311449719821e-07, + "loss": 0.6023, + "step": 25978 + }, + { + "epoch": 0.9, + "learning_rate": 4.886948589489792e-07, + "loss": 0.5906, + "step": 25979 + }, + { + "epoch": 0.9, + "learning_rate": 4.8835868569453e-07, + "loss": 0.6377, + "step": 25980 + }, + { + "epoch": 0.9, + "learning_rate": 4.880226252126208e-07, + "loss": 0.6366, + "step": 25981 + }, + { + "epoch": 0.9, + "learning_rate": 4.876866775072353e-07, + "loss": 0.6026, + "step": 25982 + }, + { + "epoch": 0.9, + "learning_rate": 4.873508425823581e-07, + "loss": 0.6318, + "step": 25983 + }, + { + "epoch": 0.9, + "learning_rate": 4.870151204419704e-07, + "loss": 0.6481, + "step": 25984 + }, + { + "epoch": 0.9, + "learning_rate": 4.866795110900535e-07, + "loss": 0.681, + "step": 25985 + }, + { + "epoch": 0.9, + "learning_rate": 4.863440145305842e-07, + "loss": 0.6472, + "step": 25986 + }, + { + "epoch": 0.9, + "learning_rate": 4.860086307675404e-07, + "loss": 0.6813, + "step": 25987 + }, + { + "epoch": 0.9, + "learning_rate": 4.856733598049013e-07, + "loss": 0.5799, + "step": 25988 + }, + { + "epoch": 0.9, + "learning_rate": 4.85338201646639e-07, + "loss": 0.6093, + "step": 25989 + }, + { + "epoch": 0.9, + "learning_rate": 4.850031562967284e-07, + "loss": 0.6121, + "step": 25990 + }, + { + "epoch": 0.9, + "learning_rate": 4.846682237591438e-07, + "loss": 0.6422, + "step": 25991 + }, + { + "epoch": 0.9, + "learning_rate": 4.843334040378522e-07, + "loss": 0.6109, + "step": 25992 + }, + { + "epoch": 0.9, + "learning_rate": 4.83998697136826e-07, + "loss": 0.7125, + "step": 25993 + }, + { + "epoch": 0.9, + "learning_rate": 4.836641030600331e-07, + "loss": 0.6657, + "step": 25994 + }, + { + "epoch": 0.9, + "learning_rate": 4.833296218114413e-07, + "loss": 0.5976, + "step": 25995 + }, + { + "epoch": 0.9, + "learning_rate": 4.829952533950145e-07, + "loss": 0.6774, + "step": 25996 + }, + { + "epoch": 0.9, + "learning_rate": 4.82660997814719e-07, + "loss": 0.6188, + "step": 25997 + }, + { + "epoch": 0.9, + "learning_rate": 4.823268550745164e-07, + "loss": 0.6209, + "step": 25998 + }, + { + "epoch": 0.9, + "learning_rate": 4.81992825178369e-07, + "loss": 0.5847, + "step": 25999 + }, + { + "epoch": 0.9, + "learning_rate": 4.816589081302359e-07, + "loss": 0.6949, + "step": 26000 + }, + { + "epoch": 0.9, + "learning_rate": 4.813251039340782e-07, + "loss": 0.6546, + "step": 26001 + }, + { + "epoch": 0.9, + "learning_rate": 4.80991412593852e-07, + "loss": 0.6301, + "step": 26002 + }, + { + "epoch": 0.9, + "learning_rate": 4.80657834113516e-07, + "loss": 0.65, + "step": 26003 + }, + { + "epoch": 0.9, + "learning_rate": 4.803243684970215e-07, + "loss": 0.6604, + "step": 26004 + }, + { + "epoch": 0.9, + "learning_rate": 4.799910157483245e-07, + "loss": 0.658, + "step": 26005 + }, + { + "epoch": 0.9, + "learning_rate": 4.796577758713772e-07, + "loss": 0.6242, + "step": 26006 + }, + { + "epoch": 0.9, + "learning_rate": 4.793246488701298e-07, + "loss": 0.6295, + "step": 26007 + }, + { + "epoch": 0.9, + "learning_rate": 4.789916347485324e-07, + "loss": 0.6457, + "step": 26008 + }, + { + "epoch": 0.9, + "learning_rate": 4.786587335105352e-07, + "loss": 0.6313, + "step": 26009 + }, + { + "epoch": 0.9, + "learning_rate": 4.783259451600808e-07, + "loss": 0.5967, + "step": 26010 + }, + { + "epoch": 0.9, + "learning_rate": 4.77993269701118e-07, + "loss": 0.5775, + "step": 26011 + }, + { + "epoch": 0.9, + "learning_rate": 4.776607071375905e-07, + "loss": 0.6347, + "step": 26012 + }, + { + "epoch": 0.9, + "learning_rate": 4.773282574734406e-07, + "loss": 0.6917, + "step": 26013 + }, + { + "epoch": 0.9, + "learning_rate": 4.769959207126119e-07, + "loss": 0.6135, + "step": 26014 + }, + { + "epoch": 0.9, + "learning_rate": 4.7666369685904323e-07, + "loss": 0.669, + "step": 26015 + }, + { + "epoch": 0.9, + "learning_rate": 4.763315859166717e-07, + "loss": 0.6239, + "step": 26016 + }, + { + "epoch": 0.9, + "learning_rate": 4.7599958788943744e-07, + "loss": 0.6696, + "step": 26017 + }, + { + "epoch": 0.9, + "learning_rate": 4.7566770278127614e-07, + "loss": 0.6637, + "step": 26018 + }, + { + "epoch": 0.9, + "learning_rate": 4.753359305961225e-07, + "loss": 0.5719, + "step": 26019 + }, + { + "epoch": 0.9, + "learning_rate": 4.7500427133790996e-07, + "loss": 0.614, + "step": 26020 + }, + { + "epoch": 0.9, + "learning_rate": 4.7467272501057313e-07, + "loss": 0.6729, + "step": 26021 + }, + { + "epoch": 0.9, + "learning_rate": 4.743412916180379e-07, + "loss": 0.6429, + "step": 26022 + }, + { + "epoch": 0.9, + "learning_rate": 4.740099711642376e-07, + "loss": 0.6319, + "step": 26023 + }, + { + "epoch": 0.9, + "learning_rate": 4.736787636531004e-07, + "loss": 0.6015, + "step": 26024 + }, + { + "epoch": 0.9, + "learning_rate": 4.733476690885508e-07, + "loss": 0.6392, + "step": 26025 + }, + { + "epoch": 0.9, + "learning_rate": 4.730166874745168e-07, + "loss": 0.6467, + "step": 26026 + }, + { + "epoch": 0.9, + "learning_rate": 4.7268581881492193e-07, + "loss": 0.6301, + "step": 26027 + }, + { + "epoch": 0.9, + "learning_rate": 4.723550631136886e-07, + "loss": 0.5268, + "step": 26028 + }, + { + "epoch": 0.9, + "learning_rate": 4.720244203747382e-07, + "loss": 0.647, + "step": 26029 + }, + { + "epoch": 0.9, + "learning_rate": 4.716938906019908e-07, + "loss": 0.6664, + "step": 26030 + }, + { + "epoch": 0.9, + "learning_rate": 4.7136347379936554e-07, + "loss": 0.5911, + "step": 26031 + }, + { + "epoch": 0.9, + "learning_rate": 4.710331699707815e-07, + "loss": 0.625, + "step": 26032 + }, + { + "epoch": 0.9, + "learning_rate": 4.707029791201534e-07, + "loss": 0.6309, + "step": 26033 + }, + { + "epoch": 0.9, + "learning_rate": 4.7037290125139576e-07, + "loss": 0.6814, + "step": 26034 + }, + { + "epoch": 0.9, + "learning_rate": 4.700429363684222e-07, + "loss": 0.6777, + "step": 26035 + }, + { + "epoch": 0.9, + "learning_rate": 4.697130844751441e-07, + "loss": 0.661, + "step": 26036 + }, + { + "epoch": 0.9, + "learning_rate": 4.693833455754737e-07, + "loss": 0.6226, + "step": 26037 + }, + { + "epoch": 0.9, + "learning_rate": 4.6905371967332134e-07, + "loss": 0.6413, + "step": 26038 + }, + { + "epoch": 0.9, + "learning_rate": 4.6872420677259277e-07, + "loss": 0.6491, + "step": 26039 + }, + { + "epoch": 0.9, + "learning_rate": 4.6839480687719594e-07, + "loss": 0.6532, + "step": 26040 + }, + { + "epoch": 0.9, + "learning_rate": 4.680655199910378e-07, + "loss": 0.6301, + "step": 26041 + }, + { + "epoch": 0.9, + "learning_rate": 4.677363461180173e-07, + "loss": 0.6364, + "step": 26042 + }, + { + "epoch": 0.9, + "learning_rate": 4.674072852620426e-07, + "loss": 0.6424, + "step": 26043 + }, + { + "epoch": 0.9, + "learning_rate": 4.670783374270149e-07, + "loss": 0.6032, + "step": 26044 + }, + { + "epoch": 0.9, + "learning_rate": 4.6674950261683116e-07, + "loss": 0.6223, + "step": 26045 + }, + { + "epoch": 0.9, + "learning_rate": 4.664207808353915e-07, + "loss": 0.6086, + "step": 26046 + }, + { + "epoch": 0.9, + "learning_rate": 4.660921720865952e-07, + "loss": 0.6481, + "step": 26047 + }, + { + "epoch": 0.9, + "learning_rate": 4.657636763743345e-07, + "loss": 0.5807, + "step": 26048 + }, + { + "epoch": 0.9, + "learning_rate": 4.654352937025064e-07, + "loss": 0.5928, + "step": 26049 + }, + { + "epoch": 0.9, + "learning_rate": 4.6510702407500664e-07, + "loss": 0.6348, + "step": 26050 + }, + { + "epoch": 0.9, + "learning_rate": 4.647788674957232e-07, + "loss": 0.697, + "step": 26051 + }, + { + "epoch": 0.9, + "learning_rate": 4.644508239685475e-07, + "loss": 0.6346, + "step": 26052 + }, + { + "epoch": 0.9, + "learning_rate": 4.6412289349737183e-07, + "loss": 0.7038, + "step": 26053 + }, + { + "epoch": 0.9, + "learning_rate": 4.6379507608607987e-07, + "loss": 0.643, + "step": 26054 + }, + { + "epoch": 0.9, + "learning_rate": 4.634673717385618e-07, + "loss": 0.6324, + "step": 26055 + }, + { + "epoch": 0.9, + "learning_rate": 4.6313978045870344e-07, + "loss": 0.605, + "step": 26056 + }, + { + "epoch": 0.9, + "learning_rate": 4.62812302250385e-07, + "loss": 0.6522, + "step": 26057 + }, + { + "epoch": 0.9, + "learning_rate": 4.624849371174911e-07, + "loss": 0.6324, + "step": 26058 + }, + { + "epoch": 0.9, + "learning_rate": 4.621576850639053e-07, + "loss": 0.683, + "step": 26059 + }, + { + "epoch": 0.9, + "learning_rate": 4.618305460935035e-07, + "loss": 0.6379, + "step": 26060 + }, + { + "epoch": 0.9, + "learning_rate": 4.61503520210167e-07, + "loss": 0.6659, + "step": 26061 + }, + { + "epoch": 0.9, + "learning_rate": 4.6117660741777373e-07, + "loss": 0.6174, + "step": 26062 + }, + { + "epoch": 0.9, + "learning_rate": 4.6084980772019727e-07, + "loss": 0.6123, + "step": 26063 + }, + { + "epoch": 0.9, + "learning_rate": 4.605231211213135e-07, + "loss": 0.6239, + "step": 26064 + }, + { + "epoch": 0.9, + "learning_rate": 4.60196547624997e-07, + "loss": 0.6603, + "step": 26065 + }, + { + "epoch": 0.9, + "learning_rate": 4.5987008723511586e-07, + "loss": 0.6569, + "step": 26066 + }, + { + "epoch": 0.9, + "learning_rate": 4.595437399555447e-07, + "loss": 0.5961, + "step": 26067 + }, + { + "epoch": 0.9, + "learning_rate": 4.5921750579015157e-07, + "loss": 0.6286, + "step": 26068 + }, + { + "epoch": 0.9, + "learning_rate": 4.5889138474280337e-07, + "loss": 0.6561, + "step": 26069 + }, + { + "epoch": 0.9, + "learning_rate": 4.58565376817367e-07, + "loss": 0.6507, + "step": 26070 + }, + { + "epoch": 0.9, + "learning_rate": 4.5823948201771054e-07, + "loss": 0.6226, + "step": 26071 + }, + { + "epoch": 0.9, + "learning_rate": 4.579137003476919e-07, + "loss": 0.6882, + "step": 26072 + }, + { + "epoch": 0.9, + "learning_rate": 4.5758803181117806e-07, + "loss": 0.6202, + "step": 26073 + }, + { + "epoch": 0.9, + "learning_rate": 4.572624764120315e-07, + "loss": 0.6363, + "step": 26074 + }, + { + "epoch": 0.9, + "learning_rate": 4.5693703415410796e-07, + "loss": 0.6261, + "step": 26075 + }, + { + "epoch": 0.9, + "learning_rate": 4.566117050412677e-07, + "loss": 0.5893, + "step": 26076 + }, + { + "epoch": 0.9, + "learning_rate": 4.5628648907736994e-07, + "loss": 0.603, + "step": 26077 + }, + { + "epoch": 0.9, + "learning_rate": 4.55961386266266e-07, + "loss": 0.6046, + "step": 26078 + }, + { + "epoch": 0.9, + "learning_rate": 4.556363966118149e-07, + "loss": 0.6597, + "step": 26079 + }, + { + "epoch": 0.9, + "learning_rate": 4.5531152011786816e-07, + "loss": 0.6509, + "step": 26080 + }, + { + "epoch": 0.9, + "learning_rate": 4.549867567882771e-07, + "loss": 0.6815, + "step": 26081 + }, + { + "epoch": 0.9, + "learning_rate": 4.5466210662689193e-07, + "loss": 0.6346, + "step": 26082 + }, + { + "epoch": 0.9, + "learning_rate": 4.5433756963756403e-07, + "loss": 0.621, + "step": 26083 + }, + { + "epoch": 0.9, + "learning_rate": 4.54013145824137e-07, + "loss": 0.6451, + "step": 26084 + }, + { + "epoch": 0.9, + "learning_rate": 4.536888351904611e-07, + "loss": 0.5863, + "step": 26085 + }, + { + "epoch": 0.9, + "learning_rate": 4.533646377403822e-07, + "loss": 0.5907, + "step": 26086 + }, + { + "epoch": 0.9, + "learning_rate": 4.530405534777393e-07, + "loss": 0.5878, + "step": 26087 + }, + { + "epoch": 0.9, + "learning_rate": 4.527165824063784e-07, + "loss": 0.6315, + "step": 26088 + }, + { + "epoch": 0.9, + "learning_rate": 4.523927245301418e-07, + "loss": 0.649, + "step": 26089 + }, + { + "epoch": 0.9, + "learning_rate": 4.5206897985286546e-07, + "loss": 0.6253, + "step": 26090 + }, + { + "epoch": 0.9, + "learning_rate": 4.5174534837838737e-07, + "loss": 0.6031, + "step": 26091 + }, + { + "epoch": 0.9, + "learning_rate": 4.5142183011054995e-07, + "loss": 0.6257, + "step": 26092 + }, + { + "epoch": 0.9, + "learning_rate": 4.510984250531847e-07, + "loss": 0.689, + "step": 26093 + }, + { + "epoch": 0.9, + "learning_rate": 4.507751332101273e-07, + "loss": 0.6789, + "step": 26094 + }, + { + "epoch": 0.9, + "learning_rate": 4.504519545852115e-07, + "loss": 0.5909, + "step": 26095 + }, + { + "epoch": 0.9, + "learning_rate": 4.5012888918226636e-07, + "loss": 0.6073, + "step": 26096 + }, + { + "epoch": 0.9, + "learning_rate": 4.4980593700512445e-07, + "loss": 0.5325, + "step": 26097 + }, + { + "epoch": 0.9, + "learning_rate": 4.494830980576137e-07, + "loss": 0.6092, + "step": 26098 + }, + { + "epoch": 0.9, + "learning_rate": 4.4916037234356223e-07, + "loss": 0.5915, + "step": 26099 + }, + { + "epoch": 0.9, + "learning_rate": 4.488377598667981e-07, + "loss": 0.5763, + "step": 26100 + }, + { + "epoch": 0.9, + "learning_rate": 4.485152606311427e-07, + "loss": 0.6411, + "step": 26101 + }, + { + "epoch": 0.9, + "learning_rate": 4.481928746404229e-07, + "loss": 0.6008, + "step": 26102 + }, + { + "epoch": 0.9, + "learning_rate": 4.478706018984591e-07, + "loss": 0.6613, + "step": 26103 + }, + { + "epoch": 0.9, + "learning_rate": 4.4754844240907257e-07, + "loss": 0.6284, + "step": 26104 + }, + { + "epoch": 0.9, + "learning_rate": 4.4722639617608255e-07, + "loss": 0.6349, + "step": 26105 + }, + { + "epoch": 0.9, + "learning_rate": 4.4690446320331036e-07, + "loss": 0.6349, + "step": 26106 + }, + { + "epoch": 0.9, + "learning_rate": 4.465826434945686e-07, + "loss": 0.6489, + "step": 26107 + }, + { + "epoch": 0.9, + "learning_rate": 4.4626093705367413e-07, + "loss": 0.5967, + "step": 26108 + }, + { + "epoch": 0.9, + "learning_rate": 4.459393438844428e-07, + "loss": 0.6525, + "step": 26109 + }, + { + "epoch": 0.9, + "learning_rate": 4.4561786399068605e-07, + "loss": 0.6474, + "step": 26110 + }, + { + "epoch": 0.9, + "learning_rate": 4.452964973762164e-07, + "loss": 0.5917, + "step": 26111 + }, + { + "epoch": 0.9, + "learning_rate": 4.4497524404484405e-07, + "loss": 0.6287, + "step": 26112 + }, + { + "epoch": 0.9, + "learning_rate": 4.446541040003771e-07, + "loss": 0.6456, + "step": 26113 + }, + { + "epoch": 0.9, + "learning_rate": 4.4433307724662254e-07, + "loss": 0.675, + "step": 26114 + }, + { + "epoch": 0.9, + "learning_rate": 4.440121637873873e-07, + "loss": 0.647, + "step": 26115 + }, + { + "epoch": 0.9, + "learning_rate": 4.4369136362647615e-07, + "loss": 0.6517, + "step": 26116 + }, + { + "epoch": 0.9, + "learning_rate": 4.4337067676769264e-07, + "loss": 0.6493, + "step": 26117 + }, + { + "epoch": 0.9, + "learning_rate": 4.430501032148404e-07, + "loss": 0.5956, + "step": 26118 + }, + { + "epoch": 0.9, + "learning_rate": 4.427296429717187e-07, + "loss": 0.6276, + "step": 26119 + }, + { + "epoch": 0.9, + "learning_rate": 4.424092960421256e-07, + "loss": 0.6157, + "step": 26120 + }, + { + "epoch": 0.91, + "learning_rate": 4.420890624298613e-07, + "loss": 0.6878, + "step": 26121 + }, + { + "epoch": 0.91, + "learning_rate": 4.417689421387217e-07, + "loss": 0.6193, + "step": 26122 + }, + { + "epoch": 0.91, + "learning_rate": 4.4144893517250263e-07, + "loss": 0.6384, + "step": 26123 + }, + { + "epoch": 0.91, + "learning_rate": 4.411290415349989e-07, + "loss": 0.5376, + "step": 26124 + }, + { + "epoch": 0.91, + "learning_rate": 4.408092612300019e-07, + "loss": 0.6022, + "step": 26125 + }, + { + "epoch": 0.91, + "learning_rate": 4.40489594261303e-07, + "loss": 0.6504, + "step": 26126 + }, + { + "epoch": 0.91, + "learning_rate": 4.4017004063269363e-07, + "loss": 0.6593, + "step": 26127 + }, + { + "epoch": 0.91, + "learning_rate": 4.398506003479608e-07, + "loss": 0.6593, + "step": 26128 + }, + { + "epoch": 0.91, + "learning_rate": 4.3953127341089365e-07, + "loss": 0.5569, + "step": 26129 + }, + { + "epoch": 0.91, + "learning_rate": 4.3921205982527694e-07, + "loss": 0.5248, + "step": 26130 + }, + { + "epoch": 0.91, + "learning_rate": 4.388929595948965e-07, + "loss": 0.5579, + "step": 26131 + }, + { + "epoch": 0.91, + "learning_rate": 4.3857397272353385e-07, + "loss": 0.596, + "step": 26132 + }, + { + "epoch": 0.91, + "learning_rate": 4.382550992149714e-07, + "loss": 0.6473, + "step": 26133 + }, + { + "epoch": 0.91, + "learning_rate": 4.379363390729907e-07, + "loss": 0.6896, + "step": 26134 + }, + { + "epoch": 0.91, + "learning_rate": 4.3761769230137196e-07, + "loss": 0.6224, + "step": 26135 + }, + { + "epoch": 0.91, + "learning_rate": 4.372991589038922e-07, + "loss": 0.6449, + "step": 26136 + }, + { + "epoch": 0.91, + "learning_rate": 4.3698073888432613e-07, + "loss": 0.642, + "step": 26137 + }, + { + "epoch": 0.91, + "learning_rate": 4.366624322464519e-07, + "loss": 0.5853, + "step": 26138 + }, + { + "epoch": 0.91, + "learning_rate": 4.36344238994042e-07, + "loss": 0.6575, + "step": 26139 + }, + { + "epoch": 0.91, + "learning_rate": 4.3602615913086787e-07, + "loss": 0.6435, + "step": 26140 + }, + { + "epoch": 0.91, + "learning_rate": 4.357081926607032e-07, + "loss": 0.6588, + "step": 26141 + }, + { + "epoch": 0.91, + "learning_rate": 4.3539033958731824e-07, + "loss": 0.6189, + "step": 26142 + }, + { + "epoch": 0.91, + "learning_rate": 4.3507259991447895e-07, + "loss": 0.6029, + "step": 26143 + }, + { + "epoch": 0.91, + "learning_rate": 4.347549736459533e-07, + "loss": 0.5914, + "step": 26144 + }, + { + "epoch": 0.91, + "learning_rate": 4.344374607855073e-07, + "loss": 0.6323, + "step": 26145 + }, + { + "epoch": 0.91, + "learning_rate": 4.3412006133690564e-07, + "loss": 0.5856, + "step": 26146 + }, + { + "epoch": 0.91, + "learning_rate": 4.33802775303912e-07, + "loss": 0.6373, + "step": 26147 + }, + { + "epoch": 0.91, + "learning_rate": 4.3348560269028895e-07, + "loss": 0.6509, + "step": 26148 + }, + { + "epoch": 0.91, + "learning_rate": 4.3316854349979456e-07, + "loss": 0.5958, + "step": 26149 + }, + { + "epoch": 0.91, + "learning_rate": 4.3285159773618914e-07, + "loss": 0.6604, + "step": 26150 + }, + { + "epoch": 0.91, + "learning_rate": 4.325347654032297e-07, + "loss": 0.613, + "step": 26151 + }, + { + "epoch": 0.91, + "learning_rate": 4.3221804650467435e-07, + "loss": 0.653, + "step": 26152 + }, + { + "epoch": 0.91, + "learning_rate": 4.319014410442779e-07, + "loss": 0.6276, + "step": 26153 + }, + { + "epoch": 0.91, + "learning_rate": 4.3158494902579396e-07, + "loss": 0.6407, + "step": 26154 + }, + { + "epoch": 0.91, + "learning_rate": 4.3126857045297286e-07, + "loss": 0.6389, + "step": 26155 + }, + { + "epoch": 0.91, + "learning_rate": 4.309523053295683e-07, + "loss": 0.6639, + "step": 26156 + }, + { + "epoch": 0.91, + "learning_rate": 4.306361536593295e-07, + "loss": 0.7004, + "step": 26157 + }, + { + "epoch": 0.91, + "learning_rate": 4.303201154460035e-07, + "loss": 0.6358, + "step": 26158 + }, + { + "epoch": 0.91, + "learning_rate": 4.300041906933394e-07, + "loss": 0.6593, + "step": 26159 + }, + { + "epoch": 0.91, + "learning_rate": 4.29688379405081e-07, + "loss": 0.7056, + "step": 26160 + }, + { + "epoch": 0.91, + "learning_rate": 4.2937268158497305e-07, + "loss": 0.6298, + "step": 26161 + }, + { + "epoch": 0.91, + "learning_rate": 4.2905709723675916e-07, + "loss": 0.6651, + "step": 26162 + }, + { + "epoch": 0.91, + "learning_rate": 4.2874162636418084e-07, + "loss": 0.6124, + "step": 26163 + }, + { + "epoch": 0.91, + "learning_rate": 4.2842626897097726e-07, + "loss": 0.6376, + "step": 26164 + }, + { + "epoch": 0.91, + "learning_rate": 4.2811102506088997e-07, + "loss": 0.6313, + "step": 26165 + }, + { + "epoch": 0.91, + "learning_rate": 4.277958946376548e-07, + "loss": 0.6273, + "step": 26166 + }, + { + "epoch": 0.91, + "learning_rate": 4.2748087770500767e-07, + "loss": 0.6447, + "step": 26167 + }, + { + "epoch": 0.91, + "learning_rate": 4.271659742666834e-07, + "loss": 0.6499, + "step": 26168 + }, + { + "epoch": 0.91, + "learning_rate": 4.268511843264167e-07, + "loss": 0.6281, + "step": 26169 + }, + { + "epoch": 0.91, + "learning_rate": 4.265365078879391e-07, + "loss": 0.5999, + "step": 26170 + }, + { + "epoch": 0.91, + "learning_rate": 4.2622194495498314e-07, + "loss": 0.6391, + "step": 26171 + }, + { + "epoch": 0.91, + "learning_rate": 4.2590749553127585e-07, + "loss": 0.6163, + "step": 26172 + }, + { + "epoch": 0.91, + "learning_rate": 4.2559315962054535e-07, + "loss": 0.667, + "step": 26173 + }, + { + "epoch": 0.91, + "learning_rate": 4.252789372265209e-07, + "loss": 0.6121, + "step": 26174 + }, + { + "epoch": 0.91, + "learning_rate": 4.249648283529262e-07, + "loss": 0.6311, + "step": 26175 + }, + { + "epoch": 0.91, + "learning_rate": 4.2465083300348595e-07, + "loss": 0.6486, + "step": 26176 + }, + { + "epoch": 0.91, + "learning_rate": 4.243369511819251e-07, + "loss": 0.6774, + "step": 26177 + }, + { + "epoch": 0.91, + "learning_rate": 4.2402318289196054e-07, + "loss": 0.6065, + "step": 26178 + }, + { + "epoch": 0.91, + "learning_rate": 4.237095281373149e-07, + "loss": 0.6765, + "step": 26179 + }, + { + "epoch": 0.91, + "learning_rate": 4.2339598692170747e-07, + "loss": 0.5784, + "step": 26180 + }, + { + "epoch": 0.91, + "learning_rate": 4.2308255924885523e-07, + "loss": 0.6098, + "step": 26181 + }, + { + "epoch": 0.91, + "learning_rate": 4.2276924512247295e-07, + "loss": 0.5878, + "step": 26182 + }, + { + "epoch": 0.91, + "learning_rate": 4.2245604454627885e-07, + "loss": 0.6469, + "step": 26183 + }, + { + "epoch": 0.91, + "learning_rate": 4.221429575239822e-07, + "loss": 0.6727, + "step": 26184 + }, + { + "epoch": 0.91, + "learning_rate": 4.2182998405929766e-07, + "loss": 0.5908, + "step": 26185 + }, + { + "epoch": 0.91, + "learning_rate": 4.215171241559346e-07, + "loss": 0.6718, + "step": 26186 + }, + { + "epoch": 0.91, + "learning_rate": 4.2120437781760224e-07, + "loss": 0.6561, + "step": 26187 + }, + { + "epoch": 0.91, + "learning_rate": 4.208917450480099e-07, + "loss": 0.6477, + "step": 26188 + }, + { + "epoch": 0.91, + "learning_rate": 4.205792258508645e-07, + "loss": 0.6199, + "step": 26189 + }, + { + "epoch": 0.91, + "learning_rate": 4.2026682022986986e-07, + "loss": 0.6612, + "step": 26190 + }, + { + "epoch": 0.91, + "learning_rate": 4.199545281887296e-07, + "loss": 0.6075, + "step": 26191 + }, + { + "epoch": 0.91, + "learning_rate": 4.1964234973114747e-07, + "loss": 0.6273, + "step": 26192 + }, + { + "epoch": 0.91, + "learning_rate": 4.1933028486082493e-07, + "loss": 0.6429, + "step": 26193 + }, + { + "epoch": 0.91, + "learning_rate": 4.1901833358146127e-07, + "loss": 0.5855, + "step": 26194 + }, + { + "epoch": 0.91, + "learning_rate": 4.187064958967557e-07, + "loss": 0.6312, + "step": 26195 + }, + { + "epoch": 0.91, + "learning_rate": 4.183947718104053e-07, + "loss": 0.612, + "step": 26196 + }, + { + "epoch": 0.91, + "learning_rate": 4.1808316132610385e-07, + "loss": 0.6066, + "step": 26197 + }, + { + "epoch": 0.91, + "learning_rate": 4.1777166444754936e-07, + "loss": 0.6914, + "step": 26198 + }, + { + "epoch": 0.91, + "learning_rate": 4.174602811784323e-07, + "loss": 0.6173, + "step": 26199 + }, + { + "epoch": 0.91, + "learning_rate": 4.1714901152244633e-07, + "loss": 0.6498, + "step": 26200 + }, + { + "epoch": 0.91, + "learning_rate": 4.168378554832819e-07, + "loss": 0.6211, + "step": 26201 + }, + { + "epoch": 0.91, + "learning_rate": 4.1652681306462715e-07, + "loss": 0.6686, + "step": 26202 + }, + { + "epoch": 0.91, + "learning_rate": 4.162158842701691e-07, + "loss": 0.6535, + "step": 26203 + }, + { + "epoch": 0.91, + "learning_rate": 4.1590506910359597e-07, + "loss": 0.6439, + "step": 26204 + }, + { + "epoch": 0.91, + "learning_rate": 4.155943675685914e-07, + "loss": 0.6581, + "step": 26205 + }, + { + "epoch": 0.91, + "learning_rate": 4.1528377966884024e-07, + "loss": 0.6183, + "step": 26206 + }, + { + "epoch": 0.91, + "learning_rate": 4.149733054080263e-07, + "loss": 0.5764, + "step": 26207 + }, + { + "epoch": 0.91, + "learning_rate": 4.146629447898276e-07, + "loss": 0.618, + "step": 26208 + }, + { + "epoch": 0.91, + "learning_rate": 4.1435269781792465e-07, + "loss": 0.6761, + "step": 26209 + }, + { + "epoch": 0.91, + "learning_rate": 4.1404256449599666e-07, + "loss": 0.6742, + "step": 26210 + }, + { + "epoch": 0.91, + "learning_rate": 4.1373254482772076e-07, + "loss": 0.6274, + "step": 26211 + }, + { + "epoch": 0.91, + "learning_rate": 4.134226388167717e-07, + "loss": 0.6661, + "step": 26212 + }, + { + "epoch": 0.91, + "learning_rate": 4.1311284646682656e-07, + "loss": 0.6609, + "step": 26213 + }, + { + "epoch": 0.91, + "learning_rate": 4.128031677815536e-07, + "loss": 0.6303, + "step": 26214 + }, + { + "epoch": 0.91, + "learning_rate": 4.124936027646276e-07, + "loss": 0.6062, + "step": 26215 + }, + { + "epoch": 0.91, + "learning_rate": 4.121841514197178e-07, + "loss": 0.6162, + "step": 26216 + }, + { + "epoch": 0.91, + "learning_rate": 4.118748137504935e-07, + "loss": 0.5954, + "step": 26217 + }, + { + "epoch": 0.91, + "learning_rate": 4.11565589760623e-07, + "loss": 0.6014, + "step": 26218 + }, + { + "epoch": 0.91, + "learning_rate": 4.112564794537732e-07, + "loss": 0.6263, + "step": 26219 + }, + { + "epoch": 0.91, + "learning_rate": 4.1094748283360576e-07, + "loss": 0.6445, + "step": 26220 + }, + { + "epoch": 0.91, + "learning_rate": 4.106385999037865e-07, + "loss": 0.651, + "step": 26221 + }, + { + "epoch": 0.91, + "learning_rate": 4.10329830667977e-07, + "loss": 0.6167, + "step": 26222 + }, + { + "epoch": 0.91, + "learning_rate": 4.1002117512983775e-07, + "loss": 0.6838, + "step": 26223 + }, + { + "epoch": 0.91, + "learning_rate": 4.0971263329303126e-07, + "loss": 0.646, + "step": 26224 + }, + { + "epoch": 0.91, + "learning_rate": 4.094042051612113e-07, + "loss": 0.6508, + "step": 26225 + }, + { + "epoch": 0.91, + "learning_rate": 4.090958907380371e-07, + "loss": 0.6625, + "step": 26226 + }, + { + "epoch": 0.91, + "learning_rate": 4.087876900271637e-07, + "loss": 0.6663, + "step": 26227 + }, + { + "epoch": 0.91, + "learning_rate": 4.0847960303224464e-07, + "loss": 0.6514, + "step": 26228 + }, + { + "epoch": 0.91, + "learning_rate": 4.081716297569338e-07, + "loss": 0.6369, + "step": 26229 + }, + { + "epoch": 0.91, + "learning_rate": 4.078637702048827e-07, + "loss": 0.6357, + "step": 26230 + }, + { + "epoch": 0.91, + "learning_rate": 4.075560243797394e-07, + "loss": 0.5953, + "step": 26231 + }, + { + "epoch": 0.91, + "learning_rate": 4.072483922851544e-07, + "loss": 0.5998, + "step": 26232 + }, + { + "epoch": 0.91, + "learning_rate": 4.0694087392477486e-07, + "loss": 0.6476, + "step": 26233 + }, + { + "epoch": 0.91, + "learning_rate": 4.0663346930224557e-07, + "loss": 0.6482, + "step": 26234 + }, + { + "epoch": 0.91, + "learning_rate": 4.0632617842121357e-07, + "loss": 0.5975, + "step": 26235 + }, + { + "epoch": 0.91, + "learning_rate": 4.0601900128532046e-07, + "loss": 0.6345, + "step": 26236 + }, + { + "epoch": 0.91, + "learning_rate": 4.0571193789820886e-07, + "loss": 0.6464, + "step": 26237 + }, + { + "epoch": 0.91, + "learning_rate": 4.0540498826351804e-07, + "loss": 0.6824, + "step": 26238 + }, + { + "epoch": 0.91, + "learning_rate": 4.050981523848885e-07, + "loss": 0.6819, + "step": 26239 + }, + { + "epoch": 0.91, + "learning_rate": 4.0479143026595835e-07, + "loss": 0.6122, + "step": 26240 + }, + { + "epoch": 0.91, + "learning_rate": 4.0448482191036364e-07, + "loss": 0.6505, + "step": 26241 + }, + { + "epoch": 0.91, + "learning_rate": 4.0417832732174036e-07, + "loss": 0.6749, + "step": 26242 + }, + { + "epoch": 0.91, + "learning_rate": 4.0387194650372106e-07, + "loss": 0.6615, + "step": 26243 + }, + { + "epoch": 0.91, + "learning_rate": 4.035656794599385e-07, + "loss": 0.6348, + "step": 26244 + }, + { + "epoch": 0.91, + "learning_rate": 4.032595261940253e-07, + "loss": 0.5794, + "step": 26245 + }, + { + "epoch": 0.91, + "learning_rate": 4.0295348670960967e-07, + "loss": 0.6618, + "step": 26246 + }, + { + "epoch": 0.91, + "learning_rate": 4.026475610103209e-07, + "loss": 0.5858, + "step": 26247 + }, + { + "epoch": 0.91, + "learning_rate": 4.023417490997883e-07, + "loss": 0.6105, + "step": 26248 + }, + { + "epoch": 0.91, + "learning_rate": 4.0203605098163234e-07, + "loss": 0.6227, + "step": 26249 + }, + { + "epoch": 0.91, + "learning_rate": 4.0173046665948125e-07, + "loss": 0.6369, + "step": 26250 + }, + { + "epoch": 0.91, + "learning_rate": 4.014249961369576e-07, + "loss": 0.6398, + "step": 26251 + }, + { + "epoch": 0.91, + "learning_rate": 4.0111963941768306e-07, + "loss": 0.6647, + "step": 26252 + }, + { + "epoch": 0.91, + "learning_rate": 4.0081439650527687e-07, + "loss": 0.5924, + "step": 26253 + }, + { + "epoch": 0.91, + "learning_rate": 4.005092674033617e-07, + "loss": 0.6291, + "step": 26254 + }, + { + "epoch": 0.91, + "learning_rate": 4.0020425211555024e-07, + "loss": 0.6161, + "step": 26255 + }, + { + "epoch": 0.91, + "learning_rate": 3.998993506454618e-07, + "loss": 0.6671, + "step": 26256 + }, + { + "epoch": 0.91, + "learning_rate": 3.9959456299671015e-07, + "loss": 0.6602, + "step": 26257 + }, + { + "epoch": 0.91, + "learning_rate": 3.9928988917291023e-07, + "loss": 0.6052, + "step": 26258 + }, + { + "epoch": 0.91, + "learning_rate": 3.989853291776724e-07, + "loss": 0.6745, + "step": 26259 + }, + { + "epoch": 0.91, + "learning_rate": 3.9868088301461163e-07, + "loss": 0.6006, + "step": 26260 + }, + { + "epoch": 0.91, + "learning_rate": 3.983765506873327e-07, + "loss": 0.6425, + "step": 26261 + }, + { + "epoch": 0.91, + "learning_rate": 3.980723321994451e-07, + "loss": 0.6014, + "step": 26262 + }, + { + "epoch": 0.91, + "learning_rate": 3.97768227554558e-07, + "loss": 0.6349, + "step": 26263 + }, + { + "epoch": 0.91, + "learning_rate": 3.974642367562742e-07, + "loss": 0.666, + "step": 26264 + }, + { + "epoch": 0.91, + "learning_rate": 3.971603598081997e-07, + "loss": 0.6166, + "step": 26265 + }, + { + "epoch": 0.91, + "learning_rate": 3.968565967139382e-07, + "loss": 0.6666, + "step": 26266 + }, + { + "epoch": 0.91, + "learning_rate": 3.9655294747708907e-07, + "loss": 0.6768, + "step": 26267 + }, + { + "epoch": 0.91, + "learning_rate": 3.962494121012517e-07, + "loss": 0.6948, + "step": 26268 + }, + { + "epoch": 0.91, + "learning_rate": 3.959459905900276e-07, + "loss": 0.5998, + "step": 26269 + }, + { + "epoch": 0.91, + "learning_rate": 3.956426829470128e-07, + "loss": 0.6254, + "step": 26270 + }, + { + "epoch": 0.91, + "learning_rate": 3.953394891758033e-07, + "loss": 0.6633, + "step": 26271 + }, + { + "epoch": 0.91, + "learning_rate": 3.950364092799952e-07, + "loss": 0.5759, + "step": 26272 + }, + { + "epoch": 0.91, + "learning_rate": 3.9473344326317995e-07, + "loss": 0.6157, + "step": 26273 + }, + { + "epoch": 0.91, + "learning_rate": 3.944305911289492e-07, + "loss": 0.596, + "step": 26274 + }, + { + "epoch": 0.91, + "learning_rate": 3.9412785288089673e-07, + "loss": 0.6307, + "step": 26275 + }, + { + "epoch": 0.91, + "learning_rate": 3.938252285226085e-07, + "loss": 0.6765, + "step": 26276 + }, + { + "epoch": 0.91, + "learning_rate": 3.9352271805767506e-07, + "loss": 0.6054, + "step": 26277 + }, + { + "epoch": 0.91, + "learning_rate": 3.932203214896835e-07, + "loss": 0.6173, + "step": 26278 + }, + { + "epoch": 0.91, + "learning_rate": 3.9291803882221534e-07, + "loss": 0.6335, + "step": 26279 + }, + { + "epoch": 0.91, + "learning_rate": 3.926158700588578e-07, + "loss": 0.6159, + "step": 26280 + }, + { + "epoch": 0.91, + "learning_rate": 3.9231381520319353e-07, + "loss": 0.5929, + "step": 26281 + }, + { + "epoch": 0.91, + "learning_rate": 3.9201187425879974e-07, + "loss": 0.6394, + "step": 26282 + }, + { + "epoch": 0.91, + "learning_rate": 3.917100472292623e-07, + "loss": 0.6251, + "step": 26283 + }, + { + "epoch": 0.91, + "learning_rate": 3.9140833411815625e-07, + "loss": 0.6534, + "step": 26284 + }, + { + "epoch": 0.91, + "learning_rate": 3.911067349290587e-07, + "loss": 0.6412, + "step": 26285 + }, + { + "epoch": 0.91, + "learning_rate": 3.908052496655468e-07, + "loss": 0.6292, + "step": 26286 + }, + { + "epoch": 0.91, + "learning_rate": 3.9050387833119427e-07, + "loss": 0.5879, + "step": 26287 + }, + { + "epoch": 0.91, + "learning_rate": 3.902026209295717e-07, + "loss": 0.6604, + "step": 26288 + }, + { + "epoch": 0.91, + "learning_rate": 3.899014774642573e-07, + "loss": 0.6404, + "step": 26289 + }, + { + "epoch": 0.91, + "learning_rate": 3.8960044793881604e-07, + "loss": 0.5972, + "step": 26290 + }, + { + "epoch": 0.91, + "learning_rate": 3.8929953235681826e-07, + "loss": 0.5746, + "step": 26291 + }, + { + "epoch": 0.91, + "learning_rate": 3.889987307218335e-07, + "loss": 0.6593, + "step": 26292 + }, + { + "epoch": 0.91, + "learning_rate": 3.8869804303742544e-07, + "loss": 0.6416, + "step": 26293 + }, + { + "epoch": 0.91, + "learning_rate": 3.883974693071602e-07, + "loss": 0.619, + "step": 26294 + }, + { + "epoch": 0.91, + "learning_rate": 3.880970095346026e-07, + "loss": 0.6229, + "step": 26295 + }, + { + "epoch": 0.91, + "learning_rate": 3.8779666372331435e-07, + "loss": 0.5669, + "step": 26296 + }, + { + "epoch": 0.91, + "learning_rate": 3.874964318768548e-07, + "loss": 0.598, + "step": 26297 + }, + { + "epoch": 0.91, + "learning_rate": 3.871963139987878e-07, + "loss": 0.6268, + "step": 26298 + }, + { + "epoch": 0.91, + "learning_rate": 3.8689631009266595e-07, + "loss": 0.7189, + "step": 26299 + }, + { + "epoch": 0.91, + "learning_rate": 3.865964201620487e-07, + "loss": 0.5905, + "step": 26300 + }, + { + "epoch": 0.91, + "learning_rate": 3.8629664421049427e-07, + "loss": 0.6493, + "step": 26301 + }, + { + "epoch": 0.91, + "learning_rate": 3.8599698224155214e-07, + "loss": 0.6619, + "step": 26302 + }, + { + "epoch": 0.91, + "learning_rate": 3.856974342587794e-07, + "loss": 0.5718, + "step": 26303 + }, + { + "epoch": 0.91, + "learning_rate": 3.853980002657254e-07, + "loss": 0.68, + "step": 26304 + }, + { + "epoch": 0.91, + "learning_rate": 3.8509868026594066e-07, + "loss": 0.6571, + "step": 26305 + }, + { + "epoch": 0.91, + "learning_rate": 3.847994742629713e-07, + "loss": 0.6918, + "step": 26306 + }, + { + "epoch": 0.91, + "learning_rate": 3.84500382260371e-07, + "loss": 0.6698, + "step": 26307 + }, + { + "epoch": 0.91, + "learning_rate": 3.8420140426168153e-07, + "loss": 0.6203, + "step": 26308 + }, + { + "epoch": 0.91, + "learning_rate": 3.839025402704477e-07, + "loss": 0.6275, + "step": 26309 + }, + { + "epoch": 0.91, + "learning_rate": 3.8360379029021456e-07, + "loss": 0.6217, + "step": 26310 + }, + { + "epoch": 0.91, + "learning_rate": 3.833051543245225e-07, + "loss": 0.6863, + "step": 26311 + }, + { + "epoch": 0.91, + "learning_rate": 3.8300663237691214e-07, + "loss": 0.6353, + "step": 26312 + }, + { + "epoch": 0.91, + "learning_rate": 3.827082244509261e-07, + "loss": 0.6622, + "step": 26313 + }, + { + "epoch": 0.91, + "learning_rate": 3.8240993055009835e-07, + "loss": 0.644, + "step": 26314 + }, + { + "epoch": 0.91, + "learning_rate": 3.8211175067796704e-07, + "loss": 0.6915, + "step": 26315 + }, + { + "epoch": 0.91, + "learning_rate": 3.8181368483806935e-07, + "loss": 0.6246, + "step": 26316 + }, + { + "epoch": 0.91, + "learning_rate": 3.8151573303393587e-07, + "loss": 0.663, + "step": 26317 + }, + { + "epoch": 0.91, + "learning_rate": 3.8121789526910036e-07, + "loss": 0.6726, + "step": 26318 + }, + { + "epoch": 0.91, + "learning_rate": 3.809201715470956e-07, + "loss": 0.6494, + "step": 26319 + }, + { + "epoch": 0.91, + "learning_rate": 3.8062256187144984e-07, + "loss": 0.5864, + "step": 26320 + }, + { + "epoch": 0.91, + "learning_rate": 3.8032506624569256e-07, + "loss": 0.6826, + "step": 26321 + }, + { + "epoch": 0.91, + "learning_rate": 3.800276846733519e-07, + "loss": 0.5707, + "step": 26322 + }, + { + "epoch": 0.91, + "learning_rate": 3.797304171579508e-07, + "loss": 0.652, + "step": 26323 + }, + { + "epoch": 0.91, + "learning_rate": 3.7943326370301403e-07, + "loss": 0.6774, + "step": 26324 + }, + { + "epoch": 0.91, + "learning_rate": 3.7913622431206886e-07, + "loss": 0.6347, + "step": 26325 + }, + { + "epoch": 0.91, + "learning_rate": 3.7883929898863247e-07, + "loss": 0.6359, + "step": 26326 + }, + { + "epoch": 0.91, + "learning_rate": 3.785424877362265e-07, + "loss": 0.5802, + "step": 26327 + }, + { + "epoch": 0.91, + "learning_rate": 3.782457905583725e-07, + "loss": 0.6411, + "step": 26328 + }, + { + "epoch": 0.91, + "learning_rate": 3.7794920745858554e-07, + "loss": 0.6357, + "step": 26329 + }, + { + "epoch": 0.91, + "learning_rate": 3.776527384403805e-07, + "loss": 0.5923, + "step": 26330 + }, + { + "epoch": 0.91, + "learning_rate": 3.7735638350727797e-07, + "loss": 0.588, + "step": 26331 + }, + { + "epoch": 0.91, + "learning_rate": 3.7706014266278624e-07, + "loss": 0.6356, + "step": 26332 + }, + { + "epoch": 0.91, + "learning_rate": 3.767640159104191e-07, + "loss": 0.6373, + "step": 26333 + }, + { + "epoch": 0.91, + "learning_rate": 3.764680032536905e-07, + "loss": 0.6159, + "step": 26334 + }, + { + "epoch": 0.91, + "learning_rate": 3.761721046961053e-07, + "loss": 0.6258, + "step": 26335 + }, + { + "epoch": 0.91, + "learning_rate": 3.7587632024117415e-07, + "loss": 0.6504, + "step": 26336 + }, + { + "epoch": 0.91, + "learning_rate": 3.755806498924053e-07, + "loss": 0.6074, + "step": 26337 + }, + { + "epoch": 0.91, + "learning_rate": 3.7528509365330143e-07, + "loss": 0.7038, + "step": 26338 + }, + { + "epoch": 0.91, + "learning_rate": 3.7498965152736764e-07, + "loss": 0.6513, + "step": 26339 + }, + { + "epoch": 0.91, + "learning_rate": 3.7469432351811e-07, + "loss": 0.6483, + "step": 26340 + }, + { + "epoch": 0.91, + "learning_rate": 3.7439910962902447e-07, + "loss": 0.6841, + "step": 26341 + }, + { + "epoch": 0.91, + "learning_rate": 3.7410400986361397e-07, + "loss": 0.6158, + "step": 26342 + }, + { + "epoch": 0.91, + "learning_rate": 3.738090242253789e-07, + "loss": 0.6116, + "step": 26343 + }, + { + "epoch": 0.91, + "learning_rate": 3.7351415271781435e-07, + "loss": 0.6639, + "step": 26344 + }, + { + "epoch": 0.91, + "learning_rate": 3.7321939534441745e-07, + "loss": 0.6282, + "step": 26345 + }, + { + "epoch": 0.91, + "learning_rate": 3.7292475210868207e-07, + "loss": 0.6212, + "step": 26346 + }, + { + "epoch": 0.91, + "learning_rate": 3.7263022301410213e-07, + "loss": 0.6342, + "step": 26347 + }, + { + "epoch": 0.91, + "learning_rate": 3.7233580806416926e-07, + "loss": 0.6511, + "step": 26348 + }, + { + "epoch": 0.91, + "learning_rate": 3.7204150726237396e-07, + "loss": 0.6217, + "step": 26349 + }, + { + "epoch": 0.91, + "learning_rate": 3.717473206122069e-07, + "loss": 0.5933, + "step": 26350 + }, + { + "epoch": 0.91, + "learning_rate": 3.7145324811715623e-07, + "loss": 0.6438, + "step": 26351 + }, + { + "epoch": 0.91, + "learning_rate": 3.7115928978070594e-07, + "loss": 0.6759, + "step": 26352 + }, + { + "epoch": 0.91, + "learning_rate": 3.7086544560634206e-07, + "loss": 0.6254, + "step": 26353 + }, + { + "epoch": 0.91, + "learning_rate": 3.7057171559755076e-07, + "loss": 0.616, + "step": 26354 + }, + { + "epoch": 0.91, + "learning_rate": 3.702780997578126e-07, + "loss": 0.6275, + "step": 26355 + }, + { + "epoch": 0.91, + "learning_rate": 3.6998459809060916e-07, + "loss": 0.6298, + "step": 26356 + }, + { + "epoch": 0.91, + "learning_rate": 3.6969121059942104e-07, + "loss": 0.6215, + "step": 26357 + }, + { + "epoch": 0.91, + "learning_rate": 3.6939793728772544e-07, + "loss": 0.6743, + "step": 26358 + }, + { + "epoch": 0.91, + "learning_rate": 3.691047781589996e-07, + "loss": 0.6457, + "step": 26359 + }, + { + "epoch": 0.91, + "learning_rate": 3.688117332167196e-07, + "loss": 0.6377, + "step": 26360 + }, + { + "epoch": 0.91, + "learning_rate": 3.6851880246436047e-07, + "loss": 0.6816, + "step": 26361 + }, + { + "epoch": 0.91, + "learning_rate": 3.6822598590539495e-07, + "loss": 0.6377, + "step": 26362 + }, + { + "epoch": 0.91, + "learning_rate": 3.679332835432958e-07, + "loss": 0.612, + "step": 26363 + }, + { + "epoch": 0.91, + "learning_rate": 3.6764069538153144e-07, + "loss": 0.6404, + "step": 26364 + }, + { + "epoch": 0.91, + "learning_rate": 3.673482214235702e-07, + "loss": 0.6001, + "step": 26365 + }, + { + "epoch": 0.91, + "learning_rate": 3.670558616728825e-07, + "loss": 0.6378, + "step": 26366 + }, + { + "epoch": 0.91, + "learning_rate": 3.667636161329324e-07, + "loss": 0.6525, + "step": 26367 + }, + { + "epoch": 0.91, + "learning_rate": 3.66471484807186e-07, + "loss": 0.6749, + "step": 26368 + }, + { + "epoch": 0.91, + "learning_rate": 3.6617946769910816e-07, + "loss": 0.6415, + "step": 26369 + }, + { + "epoch": 0.91, + "learning_rate": 3.658875648121585e-07, + "loss": 0.5854, + "step": 26370 + }, + { + "epoch": 0.91, + "learning_rate": 3.655957761497986e-07, + "loss": 0.6333, + "step": 26371 + }, + { + "epoch": 0.91, + "learning_rate": 3.653041017154879e-07, + "loss": 0.6264, + "step": 26372 + }, + { + "epoch": 0.91, + "learning_rate": 3.650125415126859e-07, + "loss": 0.6503, + "step": 26373 + }, + { + "epoch": 0.91, + "learning_rate": 3.647210955448488e-07, + "loss": 0.61, + "step": 26374 + }, + { + "epoch": 0.91, + "learning_rate": 3.644297638154315e-07, + "loss": 0.5688, + "step": 26375 + }, + { + "epoch": 0.91, + "learning_rate": 3.6413854632788904e-07, + "loss": 0.6819, + "step": 26376 + }, + { + "epoch": 0.91, + "learning_rate": 3.63847443085672e-07, + "loss": 0.6398, + "step": 26377 + }, + { + "epoch": 0.91, + "learning_rate": 3.6355645409223427e-07, + "loss": 0.5934, + "step": 26378 + }, + { + "epoch": 0.91, + "learning_rate": 3.6326557935102427e-07, + "loss": 0.653, + "step": 26379 + }, + { + "epoch": 0.91, + "learning_rate": 3.6297481886549136e-07, + "loss": 0.6227, + "step": 26380 + }, + { + "epoch": 0.91, + "learning_rate": 3.6268417263908504e-07, + "loss": 0.6221, + "step": 26381 + }, + { + "epoch": 0.91, + "learning_rate": 3.6239364067524707e-07, + "loss": 0.5897, + "step": 26382 + }, + { + "epoch": 0.91, + "learning_rate": 3.621032229774246e-07, + "loss": 0.6301, + "step": 26383 + }, + { + "epoch": 0.91, + "learning_rate": 3.618129195490594e-07, + "loss": 0.609, + "step": 26384 + }, + { + "epoch": 0.91, + "learning_rate": 3.6152273039359533e-07, + "loss": 0.6408, + "step": 26385 + }, + { + "epoch": 0.91, + "learning_rate": 3.6123265551447183e-07, + "loss": 0.6451, + "step": 26386 + }, + { + "epoch": 0.91, + "learning_rate": 3.6094269491512956e-07, + "loss": 0.6122, + "step": 26387 + }, + { + "epoch": 0.91, + "learning_rate": 3.606528485990046e-07, + "loss": 0.5782, + "step": 26388 + }, + { + "epoch": 0.91, + "learning_rate": 3.6036311656953315e-07, + "loss": 0.5995, + "step": 26389 + }, + { + "epoch": 0.91, + "learning_rate": 3.600734988301513e-07, + "loss": 0.6458, + "step": 26390 + }, + { + "epoch": 0.91, + "learning_rate": 3.5978399538429186e-07, + "loss": 0.5397, + "step": 26391 + }, + { + "epoch": 0.91, + "learning_rate": 3.594946062353888e-07, + "loss": 0.6117, + "step": 26392 + }, + { + "epoch": 0.91, + "learning_rate": 3.592053313868737e-07, + "loss": 0.6688, + "step": 26393 + }, + { + "epoch": 0.91, + "learning_rate": 3.58916170842174e-07, + "loss": 0.6618, + "step": 26394 + }, + { + "epoch": 0.91, + "learning_rate": 3.5862712460471903e-07, + "loss": 0.6407, + "step": 26395 + }, + { + "epoch": 0.91, + "learning_rate": 3.5833819267793613e-07, + "loss": 0.6591, + "step": 26396 + }, + { + "epoch": 0.91, + "learning_rate": 3.580493750652514e-07, + "loss": 0.6225, + "step": 26397 + }, + { + "epoch": 0.91, + "learning_rate": 3.5776067177008656e-07, + "loss": 0.6193, + "step": 26398 + }, + { + "epoch": 0.91, + "learning_rate": 3.574720827958689e-07, + "loss": 0.6768, + "step": 26399 + }, + { + "epoch": 0.91, + "learning_rate": 3.571836081460167e-07, + "loss": 0.6045, + "step": 26400 + }, + { + "epoch": 0.91, + "learning_rate": 3.568952478239507e-07, + "loss": 0.5935, + "step": 26401 + }, + { + "epoch": 0.91, + "learning_rate": 3.566070018330892e-07, + "loss": 0.6265, + "step": 26402 + }, + { + "epoch": 0.91, + "learning_rate": 3.563188701768516e-07, + "loss": 0.5644, + "step": 26403 + }, + { + "epoch": 0.91, + "learning_rate": 3.5603085285865314e-07, + "loss": 0.6633, + "step": 26404 + }, + { + "epoch": 0.91, + "learning_rate": 3.557429498819087e-07, + "loss": 0.6867, + "step": 26405 + }, + { + "epoch": 0.91, + "learning_rate": 3.554551612500323e-07, + "loss": 0.6589, + "step": 26406 + }, + { + "epoch": 0.91, + "learning_rate": 3.551674869664334e-07, + "loss": 0.6103, + "step": 26407 + }, + { + "epoch": 0.91, + "learning_rate": 3.5487992703452603e-07, + "loss": 0.6194, + "step": 26408 + }, + { + "epoch": 0.92, + "learning_rate": 3.545924814577184e-07, + "loss": 0.6843, + "step": 26409 + }, + { + "epoch": 0.92, + "learning_rate": 3.5430515023941903e-07, + "loss": 0.6244, + "step": 26410 + }, + { + "epoch": 0.92, + "learning_rate": 3.540179333830329e-07, + "loss": 0.5972, + "step": 26411 + }, + { + "epoch": 0.92, + "learning_rate": 3.5373083089196627e-07, + "loss": 0.6641, + "step": 26412 + }, + { + "epoch": 0.92, + "learning_rate": 3.5344384276962296e-07, + "loss": 0.5931, + "step": 26413 + }, + { + "epoch": 0.92, + "learning_rate": 3.531569690194059e-07, + "loss": 0.6219, + "step": 26414 + }, + { + "epoch": 0.92, + "learning_rate": 3.528702096447167e-07, + "loss": 0.7088, + "step": 26415 + }, + { + "epoch": 0.92, + "learning_rate": 3.5258356464895615e-07, + "loss": 0.6013, + "step": 26416 + }, + { + "epoch": 0.92, + "learning_rate": 3.522970340355203e-07, + "loss": 0.6063, + "step": 26417 + }, + { + "epoch": 0.92, + "learning_rate": 3.5201061780780754e-07, + "loss": 0.6035, + "step": 26418 + }, + { + "epoch": 0.92, + "learning_rate": 3.5172431596921296e-07, + "loss": 0.5984, + "step": 26419 + }, + { + "epoch": 0.92, + "learning_rate": 3.5143812852313275e-07, + "loss": 0.6302, + "step": 26420 + }, + { + "epoch": 0.92, + "learning_rate": 3.511520554729575e-07, + "loss": 0.6432, + "step": 26421 + }, + { + "epoch": 0.92, + "learning_rate": 3.5086609682208337e-07, + "loss": 0.6577, + "step": 26422 + }, + { + "epoch": 0.92, + "learning_rate": 3.505802525738955e-07, + "loss": 0.6082, + "step": 26423 + }, + { + "epoch": 0.92, + "learning_rate": 3.5029452273178664e-07, + "loss": 0.5632, + "step": 26424 + }, + { + "epoch": 0.92, + "learning_rate": 3.5000890729914197e-07, + "loss": 0.6318, + "step": 26425 + }, + { + "epoch": 0.92, + "learning_rate": 3.4972340627934866e-07, + "loss": 0.6185, + "step": 26426 + }, + { + "epoch": 0.92, + "learning_rate": 3.4943801967579295e-07, + "loss": 0.6409, + "step": 26427 + }, + { + "epoch": 0.92, + "learning_rate": 3.491527474918588e-07, + "loss": 0.595, + "step": 26428 + }, + { + "epoch": 0.92, + "learning_rate": 3.488675897309257e-07, + "loss": 0.6569, + "step": 26429 + }, + { + "epoch": 0.92, + "learning_rate": 3.4858254639637657e-07, + "loss": 0.6346, + "step": 26430 + }, + { + "epoch": 0.92, + "learning_rate": 3.4829761749158976e-07, + "loss": 0.6559, + "step": 26431 + }, + { + "epoch": 0.92, + "learning_rate": 3.4801280301994366e-07, + "loss": 0.6497, + "step": 26432 + }, + { + "epoch": 0.92, + "learning_rate": 3.4772810298481673e-07, + "loss": 0.6513, + "step": 26433 + }, + { + "epoch": 0.92, + "learning_rate": 3.4744351738958406e-07, + "loss": 0.664, + "step": 26434 + }, + { + "epoch": 0.92, + "learning_rate": 3.4715904623761844e-07, + "loss": 0.6267, + "step": 26435 + }, + { + "epoch": 0.92, + "learning_rate": 3.4687468953229276e-07, + "loss": 0.6092, + "step": 26436 + }, + { + "epoch": 0.92, + "learning_rate": 3.465904472769788e-07, + "loss": 0.6136, + "step": 26437 + }, + { + "epoch": 0.92, + "learning_rate": 3.46306319475046e-07, + "loss": 0.597, + "step": 26438 + }, + { + "epoch": 0.92, + "learning_rate": 3.460223061298651e-07, + "loss": 0.5952, + "step": 26439 + }, + { + "epoch": 0.92, + "learning_rate": 3.457384072448022e-07, + "loss": 0.5924, + "step": 26440 + }, + { + "epoch": 0.92, + "learning_rate": 3.4545462282322253e-07, + "loss": 0.6215, + "step": 26441 + }, + { + "epoch": 0.92, + "learning_rate": 3.4517095286849213e-07, + "loss": 0.6317, + "step": 26442 + }, + { + "epoch": 0.92, + "learning_rate": 3.448873973839728e-07, + "loss": 0.6327, + "step": 26443 + }, + { + "epoch": 0.92, + "learning_rate": 3.4460395637302633e-07, + "loss": 0.5581, + "step": 26444 + }, + { + "epoch": 0.92, + "learning_rate": 3.443206298390156e-07, + "loss": 0.6499, + "step": 26445 + }, + { + "epoch": 0.92, + "learning_rate": 3.4403741778529785e-07, + "loss": 0.6325, + "step": 26446 + }, + { + "epoch": 0.92, + "learning_rate": 3.437543202152316e-07, + "loss": 0.6022, + "step": 26447 + }, + { + "epoch": 0.92, + "learning_rate": 3.4347133713217295e-07, + "loss": 0.6037, + "step": 26448 + }, + { + "epoch": 0.92, + "learning_rate": 3.4318846853947596e-07, + "loss": 0.661, + "step": 26449 + }, + { + "epoch": 0.92, + "learning_rate": 3.429057144404968e-07, + "loss": 0.609, + "step": 26450 + }, + { + "epoch": 0.92, + "learning_rate": 3.4262307483858614e-07, + "loss": 0.588, + "step": 26451 + }, + { + "epoch": 0.92, + "learning_rate": 3.4234054973709687e-07, + "loss": 0.5837, + "step": 26452 + }, + { + "epoch": 0.92, + "learning_rate": 3.4205813913937626e-07, + "loss": 0.6199, + "step": 26453 + }, + { + "epoch": 0.92, + "learning_rate": 3.417758430487739e-07, + "loss": 0.6347, + "step": 26454 + }, + { + "epoch": 0.92, + "learning_rate": 3.4149366146863703e-07, + "loss": 0.6195, + "step": 26455 + }, + { + "epoch": 0.92, + "learning_rate": 3.4121159440230977e-07, + "loss": 0.651, + "step": 26456 + }, + { + "epoch": 0.92, + "learning_rate": 3.4092964185313825e-07, + "loss": 0.6153, + "step": 26457 + }, + { + "epoch": 0.92, + "learning_rate": 3.406478038244665e-07, + "loss": 0.6265, + "step": 26458 + }, + { + "epoch": 0.92, + "learning_rate": 3.403660803196318e-07, + "loss": 0.6422, + "step": 26459 + }, + { + "epoch": 0.92, + "learning_rate": 3.400844713419771e-07, + "loss": 0.5482, + "step": 26460 + }, + { + "epoch": 0.92, + "learning_rate": 3.3980297689484077e-07, + "loss": 0.6197, + "step": 26461 + }, + { + "epoch": 0.92, + "learning_rate": 3.395215969815602e-07, + "loss": 0.6553, + "step": 26462 + }, + { + "epoch": 0.92, + "learning_rate": 3.3924033160547153e-07, + "loss": 0.6172, + "step": 26463 + }, + { + "epoch": 0.92, + "learning_rate": 3.389591807699111e-07, + "loss": 0.6213, + "step": 26464 + }, + { + "epoch": 0.92, + "learning_rate": 3.3867814447821056e-07, + "loss": 0.606, + "step": 26465 + }, + { + "epoch": 0.92, + "learning_rate": 3.383972227337007e-07, + "loss": 0.6701, + "step": 26466 + }, + { + "epoch": 0.92, + "learning_rate": 3.381164155397143e-07, + "loss": 0.5846, + "step": 26467 + }, + { + "epoch": 0.92, + "learning_rate": 3.37835722899581e-07, + "loss": 0.6495, + "step": 26468 + }, + { + "epoch": 0.92, + "learning_rate": 3.375551448166281e-07, + "loss": 0.6407, + "step": 26469 + }, + { + "epoch": 0.92, + "learning_rate": 3.3727468129418184e-07, + "loss": 0.6008, + "step": 26470 + }, + { + "epoch": 0.92, + "learning_rate": 3.3699433233556623e-07, + "loss": 0.6486, + "step": 26471 + }, + { + "epoch": 0.92, + "learning_rate": 3.367140979441086e-07, + "loss": 0.6241, + "step": 26472 + }, + { + "epoch": 0.92, + "learning_rate": 3.364339781231274e-07, + "loss": 0.6879, + "step": 26473 + }, + { + "epoch": 0.92, + "learning_rate": 3.3615397287594664e-07, + "loss": 0.6547, + "step": 26474 + }, + { + "epoch": 0.92, + "learning_rate": 3.358740822058859e-07, + "loss": 0.593, + "step": 26475 + }, + { + "epoch": 0.92, + "learning_rate": 3.3559430611626253e-07, + "loss": 0.6321, + "step": 26476 + }, + { + "epoch": 0.92, + "learning_rate": 3.35314644610395e-07, + "loss": 0.6495, + "step": 26477 + }, + { + "epoch": 0.92, + "learning_rate": 3.3503509769159834e-07, + "loss": 0.611, + "step": 26478 + }, + { + "epoch": 0.92, + "learning_rate": 3.347556653631845e-07, + "loss": 0.6296, + "step": 26479 + }, + { + "epoch": 0.92, + "learning_rate": 3.344763476284707e-07, + "loss": 0.6485, + "step": 26480 + }, + { + "epoch": 0.92, + "learning_rate": 3.341971444907677e-07, + "loss": 0.6056, + "step": 26481 + }, + { + "epoch": 0.92, + "learning_rate": 3.339180559533828e-07, + "loss": 0.5849, + "step": 26482 + }, + { + "epoch": 0.92, + "learning_rate": 3.336390820196278e-07, + "loss": 0.6441, + "step": 26483 + }, + { + "epoch": 0.92, + "learning_rate": 3.333602226928112e-07, + "loss": 0.6613, + "step": 26484 + }, + { + "epoch": 0.92, + "learning_rate": 3.330814779762348e-07, + "loss": 0.6042, + "step": 26485 + }, + { + "epoch": 0.92, + "learning_rate": 3.32802847873207e-07, + "loss": 0.6277, + "step": 26486 + }, + { + "epoch": 0.92, + "learning_rate": 3.3252433238703085e-07, + "loss": 0.6067, + "step": 26487 + }, + { + "epoch": 0.92, + "learning_rate": 3.3224593152100804e-07, + "loss": 0.6244, + "step": 26488 + }, + { + "epoch": 0.92, + "learning_rate": 3.319676452784404e-07, + "loss": 0.6499, + "step": 26489 + }, + { + "epoch": 0.92, + "learning_rate": 3.316894736626264e-07, + "loss": 0.6456, + "step": 26490 + }, + { + "epoch": 0.92, + "learning_rate": 3.3141141667686226e-07, + "loss": 0.612, + "step": 26491 + }, + { + "epoch": 0.92, + "learning_rate": 3.311334743244465e-07, + "loss": 0.6147, + "step": 26492 + }, + { + "epoch": 0.92, + "learning_rate": 3.3085564660867763e-07, + "loss": 0.6149, + "step": 26493 + }, + { + "epoch": 0.92, + "learning_rate": 3.305779335328441e-07, + "loss": 0.5989, + "step": 26494 + }, + { + "epoch": 0.92, + "learning_rate": 3.3030033510024205e-07, + "loss": 0.6729, + "step": 26495 + }, + { + "epoch": 0.92, + "learning_rate": 3.3002285131416235e-07, + "loss": 0.6057, + "step": 26496 + }, + { + "epoch": 0.92, + "learning_rate": 3.2974548217789224e-07, + "loss": 0.6412, + "step": 26497 + }, + { + "epoch": 0.92, + "learning_rate": 3.294682276947225e-07, + "loss": 0.6087, + "step": 26498 + }, + { + "epoch": 0.92, + "learning_rate": 3.291910878679427e-07, + "loss": 0.6466, + "step": 26499 + }, + { + "epoch": 0.92, + "learning_rate": 3.289140627008347e-07, + "loss": 0.5982, + "step": 26500 + }, + { + "epoch": 0.92, + "learning_rate": 3.286371521966847e-07, + "loss": 0.6764, + "step": 26501 + }, + { + "epoch": 0.92, + "learning_rate": 3.283603563587756e-07, + "loss": 0.6277, + "step": 26502 + }, + { + "epoch": 0.92, + "learning_rate": 3.280836751903882e-07, + "loss": 0.67, + "step": 26503 + }, + { + "epoch": 0.92, + "learning_rate": 3.2780710869480425e-07, + "loss": 0.6702, + "step": 26504 + }, + { + "epoch": 0.92, + "learning_rate": 3.275306568753034e-07, + "loss": 0.6206, + "step": 26505 + }, + { + "epoch": 0.92, + "learning_rate": 3.272543197351619e-07, + "loss": 0.6344, + "step": 26506 + }, + { + "epoch": 0.92, + "learning_rate": 3.2697809727765593e-07, + "loss": 0.6395, + "step": 26507 + }, + { + "epoch": 0.92, + "learning_rate": 3.26701989506063e-07, + "loss": 0.6425, + "step": 26508 + }, + { + "epoch": 0.92, + "learning_rate": 3.264259964236516e-07, + "loss": 0.6594, + "step": 26509 + }, + { + "epoch": 0.92, + "learning_rate": 3.26150118033699e-07, + "loss": 0.6464, + "step": 26510 + }, + { + "epoch": 0.92, + "learning_rate": 3.258743543394749e-07, + "loss": 0.6457, + "step": 26511 + }, + { + "epoch": 0.92, + "learning_rate": 3.2559870534424776e-07, + "loss": 0.6055, + "step": 26512 + }, + { + "epoch": 0.92, + "learning_rate": 3.2532317105128495e-07, + "loss": 0.6559, + "step": 26513 + }, + { + "epoch": 0.92, + "learning_rate": 3.2504775146385616e-07, + "loss": 0.5936, + "step": 26514 + }, + { + "epoch": 0.92, + "learning_rate": 3.247724465852231e-07, + "loss": 0.633, + "step": 26515 + }, + { + "epoch": 0.92, + "learning_rate": 3.2449725641865326e-07, + "loss": 0.6382, + "step": 26516 + }, + { + "epoch": 0.92, + "learning_rate": 3.2422218096740845e-07, + "loss": 0.6428, + "step": 26517 + }, + { + "epoch": 0.92, + "learning_rate": 3.239472202347493e-07, + "loss": 0.6112, + "step": 26518 + }, + { + "epoch": 0.92, + "learning_rate": 3.2367237422393563e-07, + "loss": 0.6363, + "step": 26519 + }, + { + "epoch": 0.92, + "learning_rate": 3.2339764293822686e-07, + "loss": 0.666, + "step": 26520 + }, + { + "epoch": 0.92, + "learning_rate": 3.2312302638087934e-07, + "loss": 0.6838, + "step": 26521 + }, + { + "epoch": 0.92, + "learning_rate": 3.2284852455514937e-07, + "loss": 0.6085, + "step": 26522 + }, + { + "epoch": 0.92, + "learning_rate": 3.225741374642943e-07, + "loss": 0.6571, + "step": 26523 + }, + { + "epoch": 0.92, + "learning_rate": 3.2229986511156277e-07, + "loss": 0.7027, + "step": 26524 + }, + { + "epoch": 0.92, + "learning_rate": 3.2202570750020866e-07, + "loss": 0.632, + "step": 26525 + }, + { + "epoch": 0.92, + "learning_rate": 3.2175166463348396e-07, + "loss": 0.7007, + "step": 26526 + }, + { + "epoch": 0.92, + "learning_rate": 3.2147773651463375e-07, + "loss": 0.6358, + "step": 26527 + }, + { + "epoch": 0.92, + "learning_rate": 3.2120392314690996e-07, + "loss": 0.6207, + "step": 26528 + }, + { + "epoch": 0.92, + "learning_rate": 3.2093022453355883e-07, + "loss": 0.6765, + "step": 26529 + }, + { + "epoch": 0.92, + "learning_rate": 3.206566406778222e-07, + "loss": 0.6182, + "step": 26530 + }, + { + "epoch": 0.92, + "learning_rate": 3.203831715829464e-07, + "loss": 0.6144, + "step": 26531 + }, + { + "epoch": 0.92, + "learning_rate": 3.201098172521722e-07, + "loss": 0.6329, + "step": 26532 + }, + { + "epoch": 0.92, + "learning_rate": 3.1983657768874023e-07, + "loss": 0.6391, + "step": 26533 + }, + { + "epoch": 0.92, + "learning_rate": 3.195634528958935e-07, + "loss": 0.6459, + "step": 26534 + }, + { + "epoch": 0.92, + "learning_rate": 3.1929044287686615e-07, + "loss": 0.6254, + "step": 26535 + }, + { + "epoch": 0.92, + "learning_rate": 3.1901754763489667e-07, + "loss": 0.6439, + "step": 26536 + }, + { + "epoch": 0.92, + "learning_rate": 3.1874476717322246e-07, + "loss": 0.6943, + "step": 26537 + }, + { + "epoch": 0.92, + "learning_rate": 3.1847210149507426e-07, + "loss": 0.6413, + "step": 26538 + }, + { + "epoch": 0.92, + "learning_rate": 3.1819955060368614e-07, + "loss": 0.613, + "step": 26539 + }, + { + "epoch": 0.92, + "learning_rate": 3.1792711450229107e-07, + "loss": 0.6296, + "step": 26540 + }, + { + "epoch": 0.92, + "learning_rate": 3.176547931941176e-07, + "loss": 0.5829, + "step": 26541 + }, + { + "epoch": 0.92, + "learning_rate": 3.173825866823943e-07, + "loss": 0.6327, + "step": 26542 + }, + { + "epoch": 0.92, + "learning_rate": 3.171104949703496e-07, + "loss": 0.6358, + "step": 26543 + }, + { + "epoch": 0.92, + "learning_rate": 3.168385180612088e-07, + "loss": 0.6658, + "step": 26544 + }, + { + "epoch": 0.92, + "learning_rate": 3.1656665595819593e-07, + "loss": 0.6801, + "step": 26545 + }, + { + "epoch": 0.92, + "learning_rate": 3.1629490866453615e-07, + "loss": 0.5962, + "step": 26546 + }, + { + "epoch": 0.92, + "learning_rate": 3.160232761834492e-07, + "loss": 0.6187, + "step": 26547 + }, + { + "epoch": 0.92, + "learning_rate": 3.1575175851815687e-07, + "loss": 0.6456, + "step": 26548 + }, + { + "epoch": 0.92, + "learning_rate": 3.1548035567187885e-07, + "loss": 0.516, + "step": 26549 + }, + { + "epoch": 0.92, + "learning_rate": 3.152090676478314e-07, + "loss": 0.6668, + "step": 26550 + }, + { + "epoch": 0.92, + "learning_rate": 3.1493789444923093e-07, + "loss": 0.6219, + "step": 26551 + }, + { + "epoch": 0.92, + "learning_rate": 3.1466683607929484e-07, + "loss": 0.6216, + "step": 26552 + }, + { + "epoch": 0.92, + "learning_rate": 3.143958925412349e-07, + "loss": 0.6091, + "step": 26553 + }, + { + "epoch": 0.92, + "learning_rate": 3.1412506383826426e-07, + "loss": 0.6441, + "step": 26554 + }, + { + "epoch": 0.92, + "learning_rate": 3.1385434997359356e-07, + "loss": 0.6287, + "step": 26555 + }, + { + "epoch": 0.92, + "learning_rate": 3.1358375095043246e-07, + "loss": 0.6597, + "step": 26556 + }, + { + "epoch": 0.92, + "learning_rate": 3.1331326677198846e-07, + "loss": 0.6694, + "step": 26557 + }, + { + "epoch": 0.92, + "learning_rate": 3.130428974414712e-07, + "loss": 0.6378, + "step": 26558 + }, + { + "epoch": 0.92, + "learning_rate": 3.1277264296208365e-07, + "loss": 0.6622, + "step": 26559 + }, + { + "epoch": 0.92, + "learning_rate": 3.125025033370299e-07, + "loss": 0.6154, + "step": 26560 + }, + { + "epoch": 0.92, + "learning_rate": 3.1223247856951634e-07, + "loss": 0.6249, + "step": 26561 + }, + { + "epoch": 0.92, + "learning_rate": 3.119625686627392e-07, + "loss": 0.5727, + "step": 26562 + }, + { + "epoch": 0.92, + "learning_rate": 3.116927736199016e-07, + "loss": 0.6344, + "step": 26563 + }, + { + "epoch": 0.92, + "learning_rate": 3.114230934442031e-07, + "loss": 0.6423, + "step": 26564 + }, + { + "epoch": 0.92, + "learning_rate": 3.1115352813883893e-07, + "loss": 0.652, + "step": 26565 + }, + { + "epoch": 0.92, + "learning_rate": 3.1088407770700655e-07, + "loss": 0.6464, + "step": 26566 + }, + { + "epoch": 0.92, + "learning_rate": 3.106147421519012e-07, + "loss": 0.6524, + "step": 26567 + }, + { + "epoch": 0.92, + "learning_rate": 3.103455214767137e-07, + "loss": 0.6278, + "step": 26568 + }, + { + "epoch": 0.92, + "learning_rate": 3.10076415684637e-07, + "loss": 0.5889, + "step": 26569 + }, + { + "epoch": 0.92, + "learning_rate": 3.0980742477886407e-07, + "loss": 0.5839, + "step": 26570 + }, + { + "epoch": 0.92, + "learning_rate": 3.0953854876258125e-07, + "loss": 0.6355, + "step": 26571 + }, + { + "epoch": 0.92, + "learning_rate": 3.092697876389772e-07, + "loss": 0.6243, + "step": 26572 + }, + { + "epoch": 0.92, + "learning_rate": 3.0900114141124036e-07, + "loss": 0.6303, + "step": 26573 + }, + { + "epoch": 0.92, + "learning_rate": 3.087326100825527e-07, + "loss": 0.595, + "step": 26574 + }, + { + "epoch": 0.92, + "learning_rate": 3.0846419365609834e-07, + "loss": 0.6682, + "step": 26575 + }, + { + "epoch": 0.92, + "learning_rate": 3.081958921350625e-07, + "loss": 0.6323, + "step": 26576 + }, + { + "epoch": 0.92, + "learning_rate": 3.0792770552262485e-07, + "loss": 0.6462, + "step": 26577 + }, + { + "epoch": 0.92, + "learning_rate": 3.0765963382196393e-07, + "loss": 0.6807, + "step": 26578 + }, + { + "epoch": 0.92, + "learning_rate": 3.073916770362595e-07, + "loss": 0.6351, + "step": 26579 + }, + { + "epoch": 0.92, + "learning_rate": 3.0712383516868783e-07, + "loss": 0.582, + "step": 26580 + }, + { + "epoch": 0.92, + "learning_rate": 3.0685610822242307e-07, + "loss": 0.6259, + "step": 26581 + }, + { + "epoch": 0.92, + "learning_rate": 3.0658849620064267e-07, + "loss": 0.6517, + "step": 26582 + }, + { + "epoch": 0.92, + "learning_rate": 3.063209991065175e-07, + "loss": 0.6286, + "step": 26583 + }, + { + "epoch": 0.92, + "learning_rate": 3.060536169432193e-07, + "loss": 0.6361, + "step": 26584 + }, + { + "epoch": 0.92, + "learning_rate": 3.0578634971392016e-07, + "loss": 0.6789, + "step": 26585 + }, + { + "epoch": 0.92, + "learning_rate": 3.0551919742178524e-07, + "loss": 0.6024, + "step": 26586 + }, + { + "epoch": 0.92, + "learning_rate": 3.0525216006998314e-07, + "loss": 0.65, + "step": 26587 + }, + { + "epoch": 0.92, + "learning_rate": 3.049852376616824e-07, + "loss": 0.6463, + "step": 26588 + }, + { + "epoch": 0.92, + "learning_rate": 3.04718430200045e-07, + "loss": 0.6303, + "step": 26589 + }, + { + "epoch": 0.92, + "learning_rate": 3.0445173768823497e-07, + "loss": 0.6284, + "step": 26590 + }, + { + "epoch": 0.92, + "learning_rate": 3.0418516012941546e-07, + "loss": 0.6005, + "step": 26591 + }, + { + "epoch": 0.92, + "learning_rate": 3.03918697526745e-07, + "loss": 0.6259, + "step": 26592 + }, + { + "epoch": 0.92, + "learning_rate": 3.036523498833843e-07, + "loss": 0.6414, + "step": 26593 + }, + { + "epoch": 0.92, + "learning_rate": 3.03386117202491e-07, + "loss": 0.6459, + "step": 26594 + }, + { + "epoch": 0.92, + "learning_rate": 3.0311999948722137e-07, + "loss": 0.6122, + "step": 26595 + }, + { + "epoch": 0.92, + "learning_rate": 3.028539967407329e-07, + "loss": 0.6243, + "step": 26596 + }, + { + "epoch": 0.92, + "learning_rate": 3.025881089661753e-07, + "loss": 0.6361, + "step": 26597 + }, + { + "epoch": 0.92, + "learning_rate": 3.023223361667027e-07, + "loss": 0.6259, + "step": 26598 + }, + { + "epoch": 0.92, + "learning_rate": 3.0205667834546706e-07, + "loss": 0.6101, + "step": 26599 + }, + { + "epoch": 0.92, + "learning_rate": 3.017911355056169e-07, + "loss": 0.5891, + "step": 26600 + }, + { + "epoch": 0.92, + "learning_rate": 3.015257076503009e-07, + "loss": 0.6347, + "step": 26601 + }, + { + "epoch": 0.92, + "learning_rate": 3.0126039478266753e-07, + "loss": 0.66, + "step": 26602 + }, + { + "epoch": 0.92, + "learning_rate": 3.0099519690585997e-07, + "loss": 0.6103, + "step": 26603 + }, + { + "epoch": 0.92, + "learning_rate": 3.0073011402302454e-07, + "loss": 0.6281, + "step": 26604 + }, + { + "epoch": 0.92, + "learning_rate": 3.0046514613730315e-07, + "loss": 0.6588, + "step": 26605 + }, + { + "epoch": 0.92, + "learning_rate": 3.0020029325183667e-07, + "loss": 0.6593, + "step": 26606 + }, + { + "epoch": 0.92, + "learning_rate": 2.999355553697658e-07, + "loss": 0.6484, + "step": 26607 + }, + { + "epoch": 0.92, + "learning_rate": 2.996709324942315e-07, + "loss": 0.6576, + "step": 26608 + }, + { + "epoch": 0.92, + "learning_rate": 2.994064246283679e-07, + "loss": 0.6112, + "step": 26609 + }, + { + "epoch": 0.92, + "learning_rate": 2.991420317753124e-07, + "loss": 0.6243, + "step": 26610 + }, + { + "epoch": 0.92, + "learning_rate": 2.988777539381993e-07, + "loss": 0.6611, + "step": 26611 + }, + { + "epoch": 0.92, + "learning_rate": 2.9861359112016375e-07, + "loss": 0.6046, + "step": 26612 + }, + { + "epoch": 0.92, + "learning_rate": 2.9834954332433554e-07, + "loss": 0.62, + "step": 26613 + }, + { + "epoch": 0.92, + "learning_rate": 2.980856105538466e-07, + "loss": 0.597, + "step": 26614 + }, + { + "epoch": 0.92, + "learning_rate": 2.9782179281182543e-07, + "loss": 0.6455, + "step": 26615 + }, + { + "epoch": 0.92, + "learning_rate": 2.9755809010139967e-07, + "loss": 0.6715, + "step": 26616 + }, + { + "epoch": 0.92, + "learning_rate": 2.972945024256968e-07, + "loss": 0.6389, + "step": 26617 + }, + { + "epoch": 0.92, + "learning_rate": 2.9703102978784205e-07, + "loss": 0.6372, + "step": 26618 + }, + { + "epoch": 0.92, + "learning_rate": 2.967676721909585e-07, + "loss": 0.6323, + "step": 26619 + }, + { + "epoch": 0.92, + "learning_rate": 2.9650442963816914e-07, + "loss": 0.5856, + "step": 26620 + }, + { + "epoch": 0.92, + "learning_rate": 2.9624130213259493e-07, + "loss": 0.6003, + "step": 26621 + }, + { + "epoch": 0.92, + "learning_rate": 2.9597828967735443e-07, + "loss": 0.633, + "step": 26622 + }, + { + "epoch": 0.92, + "learning_rate": 2.957153922755673e-07, + "loss": 0.6261, + "step": 26623 + }, + { + "epoch": 0.92, + "learning_rate": 2.954526099303501e-07, + "loss": 0.6773, + "step": 26624 + }, + { + "epoch": 0.92, + "learning_rate": 2.9518994264481795e-07, + "loss": 0.5909, + "step": 26625 + }, + { + "epoch": 0.92, + "learning_rate": 2.949273904220873e-07, + "loss": 0.6213, + "step": 26626 + }, + { + "epoch": 0.92, + "learning_rate": 2.94664953265269e-07, + "loss": 0.6663, + "step": 26627 + }, + { + "epoch": 0.92, + "learning_rate": 2.944026311774739e-07, + "loss": 0.6098, + "step": 26628 + }, + { + "epoch": 0.92, + "learning_rate": 2.94140424161814e-07, + "loss": 0.6756, + "step": 26629 + }, + { + "epoch": 0.92, + "learning_rate": 2.938783322213967e-07, + "loss": 0.6671, + "step": 26630 + }, + { + "epoch": 0.92, + "learning_rate": 2.9361635535933077e-07, + "loss": 0.6221, + "step": 26631 + }, + { + "epoch": 0.92, + "learning_rate": 2.9335449357872246e-07, + "loss": 0.5555, + "step": 26632 + }, + { + "epoch": 0.92, + "learning_rate": 2.93092746882675e-07, + "loss": 0.6573, + "step": 26633 + }, + { + "epoch": 0.92, + "learning_rate": 2.928311152742913e-07, + "loss": 0.6227, + "step": 26634 + }, + { + "epoch": 0.92, + "learning_rate": 2.9256959875667455e-07, + "loss": 0.602, + "step": 26635 + }, + { + "epoch": 0.92, + "learning_rate": 2.923081973329256e-07, + "loss": 0.641, + "step": 26636 + }, + { + "epoch": 0.92, + "learning_rate": 2.9204691100614304e-07, + "loss": 0.6271, + "step": 26637 + }, + { + "epoch": 0.92, + "learning_rate": 2.917857397794266e-07, + "loss": 0.6959, + "step": 26638 + }, + { + "epoch": 0.92, + "learning_rate": 2.9152468365586936e-07, + "loss": 0.7219, + "step": 26639 + }, + { + "epoch": 0.92, + "learning_rate": 2.912637426385678e-07, + "loss": 0.6439, + "step": 26640 + }, + { + "epoch": 0.92, + "learning_rate": 2.910029167306172e-07, + "loss": 0.6569, + "step": 26641 + }, + { + "epoch": 0.92, + "learning_rate": 2.9074220593510947e-07, + "loss": 0.6005, + "step": 26642 + }, + { + "epoch": 0.92, + "learning_rate": 2.904816102551333e-07, + "loss": 0.6412, + "step": 26643 + }, + { + "epoch": 0.92, + "learning_rate": 2.902211296937829e-07, + "loss": 0.6062, + "step": 26644 + }, + { + "epoch": 0.92, + "learning_rate": 2.8996076425414244e-07, + "loss": 0.5877, + "step": 26645 + }, + { + "epoch": 0.92, + "learning_rate": 2.897005139393005e-07, + "loss": 0.6274, + "step": 26646 + }, + { + "epoch": 0.92, + "learning_rate": 2.894403787523425e-07, + "loss": 0.652, + "step": 26647 + }, + { + "epoch": 0.92, + "learning_rate": 2.8918035869635264e-07, + "loss": 0.5843, + "step": 26648 + }, + { + "epoch": 0.92, + "learning_rate": 2.889204537744139e-07, + "loss": 0.6328, + "step": 26649 + }, + { + "epoch": 0.92, + "learning_rate": 2.8866066398960835e-07, + "loss": 0.6359, + "step": 26650 + }, + { + "epoch": 0.92, + "learning_rate": 2.884009893450146e-07, + "loss": 0.6184, + "step": 26651 + }, + { + "epoch": 0.92, + "learning_rate": 2.881414298437124e-07, + "loss": 0.5781, + "step": 26652 + }, + { + "epoch": 0.92, + "learning_rate": 2.878819854887793e-07, + "loss": 0.6125, + "step": 26653 + }, + { + "epoch": 0.92, + "learning_rate": 2.876226562832918e-07, + "loss": 0.6428, + "step": 26654 + }, + { + "epoch": 0.92, + "learning_rate": 2.87363442230324e-07, + "loss": 0.588, + "step": 26655 + }, + { + "epoch": 0.92, + "learning_rate": 2.87104343332949e-07, + "loss": 0.5938, + "step": 26656 + }, + { + "epoch": 0.92, + "learning_rate": 2.8684535959423777e-07, + "loss": 0.6228, + "step": 26657 + }, + { + "epoch": 0.92, + "learning_rate": 2.8658649101726333e-07, + "loss": 0.6356, + "step": 26658 + }, + { + "epoch": 0.92, + "learning_rate": 2.863277376050921e-07, + "loss": 0.589, + "step": 26659 + }, + { + "epoch": 0.92, + "learning_rate": 2.86069099360794e-07, + "loss": 0.6389, + "step": 26660 + }, + { + "epoch": 0.92, + "learning_rate": 2.8581057628743636e-07, + "loss": 0.6473, + "step": 26661 + }, + { + "epoch": 0.92, + "learning_rate": 2.855521683880813e-07, + "loss": 0.6556, + "step": 26662 + }, + { + "epoch": 0.92, + "learning_rate": 2.852938756657953e-07, + "loss": 0.6493, + "step": 26663 + }, + { + "epoch": 0.92, + "learning_rate": 2.85035698123638e-07, + "loss": 0.5576, + "step": 26664 + }, + { + "epoch": 0.92, + "learning_rate": 2.8477763576467253e-07, + "loss": 0.6742, + "step": 26665 + }, + { + "epoch": 0.92, + "learning_rate": 2.8451968859195876e-07, + "loss": 0.6564, + "step": 26666 + }, + { + "epoch": 0.92, + "learning_rate": 2.842618566085542e-07, + "loss": 0.6267, + "step": 26667 + }, + { + "epoch": 0.92, + "learning_rate": 2.840041398175153e-07, + "loss": 0.6289, + "step": 26668 + }, + { + "epoch": 0.92, + "learning_rate": 2.8374653822189846e-07, + "loss": 0.5885, + "step": 26669 + }, + { + "epoch": 0.92, + "learning_rate": 2.8348905182475683e-07, + "loss": 0.5788, + "step": 26670 + }, + { + "epoch": 0.92, + "learning_rate": 2.8323168062914355e-07, + "loss": 0.6056, + "step": 26671 + }, + { + "epoch": 0.92, + "learning_rate": 2.8297442463811164e-07, + "loss": 0.6601, + "step": 26672 + }, + { + "epoch": 0.92, + "learning_rate": 2.8271728385471095e-07, + "loss": 0.6374, + "step": 26673 + }, + { + "epoch": 0.92, + "learning_rate": 2.824602582819869e-07, + "loss": 0.621, + "step": 26674 + }, + { + "epoch": 0.92, + "learning_rate": 2.822033479229902e-07, + "loss": 0.5917, + "step": 26675 + }, + { + "epoch": 0.92, + "learning_rate": 2.819465527807663e-07, + "loss": 0.6079, + "step": 26676 + }, + { + "epoch": 0.92, + "learning_rate": 2.8168987285835946e-07, + "loss": 0.6069, + "step": 26677 + }, + { + "epoch": 0.92, + "learning_rate": 2.8143330815881167e-07, + "loss": 0.6219, + "step": 26678 + }, + { + "epoch": 0.92, + "learning_rate": 2.811768586851682e-07, + "loss": 0.6055, + "step": 26679 + }, + { + "epoch": 0.92, + "learning_rate": 2.809205244404656e-07, + "loss": 0.6294, + "step": 26680 + }, + { + "epoch": 0.92, + "learning_rate": 2.806643054277458e-07, + "loss": 0.6368, + "step": 26681 + }, + { + "epoch": 0.92, + "learning_rate": 2.804082016500453e-07, + "loss": 0.6043, + "step": 26682 + }, + { + "epoch": 0.92, + "learning_rate": 2.8015221311040064e-07, + "loss": 0.6253, + "step": 26683 + }, + { + "epoch": 0.92, + "learning_rate": 2.7989633981184706e-07, + "loss": 0.652, + "step": 26684 + }, + { + "epoch": 0.92, + "learning_rate": 2.796405817574199e-07, + "loss": 0.6438, + "step": 26685 + }, + { + "epoch": 0.92, + "learning_rate": 2.7938493895014907e-07, + "loss": 0.6544, + "step": 26686 + }, + { + "epoch": 0.92, + "learning_rate": 2.791294113930665e-07, + "loss": 0.6349, + "step": 26687 + }, + { + "epoch": 0.92, + "learning_rate": 2.788739990892009e-07, + "loss": 0.6423, + "step": 26688 + }, + { + "epoch": 0.92, + "learning_rate": 2.7861870204158206e-07, + "loss": 0.6426, + "step": 26689 + }, + { + "epoch": 0.92, + "learning_rate": 2.7836352025323535e-07, + "loss": 0.6695, + "step": 26690 + }, + { + "epoch": 0.92, + "learning_rate": 2.781084537271883e-07, + "loss": 0.6016, + "step": 26691 + }, + { + "epoch": 0.92, + "learning_rate": 2.77853502466463e-07, + "loss": 0.6199, + "step": 26692 + }, + { + "epoch": 0.92, + "learning_rate": 2.7759866647408373e-07, + "loss": 0.5942, + "step": 26693 + }, + { + "epoch": 0.92, + "learning_rate": 2.7734394575307024e-07, + "loss": 0.6206, + "step": 26694 + }, + { + "epoch": 0.92, + "learning_rate": 2.7708934030644343e-07, + "loss": 0.5986, + "step": 26695 + }, + { + "epoch": 0.92, + "learning_rate": 2.76834850137222e-07, + "loss": 0.6177, + "step": 26696 + }, + { + "epoch": 0.92, + "learning_rate": 2.765804752484247e-07, + "loss": 0.5922, + "step": 26697 + }, + { + "epoch": 0.93, + "learning_rate": 2.7632621564306463e-07, + "loss": 0.6503, + "step": 26698 + }, + { + "epoch": 0.93, + "learning_rate": 2.7607207132415824e-07, + "loss": 0.6137, + "step": 26699 + }, + { + "epoch": 0.93, + "learning_rate": 2.7581804229471874e-07, + "loss": 0.6298, + "step": 26700 + }, + { + "epoch": 0.93, + "learning_rate": 2.7556412855775707e-07, + "loss": 0.5922, + "step": 26701 + }, + { + "epoch": 0.93, + "learning_rate": 2.7531033011628405e-07, + "loss": 0.6168, + "step": 26702 + }, + { + "epoch": 0.93, + "learning_rate": 2.7505664697330956e-07, + "loss": 0.6349, + "step": 26703 + }, + { + "epoch": 0.93, + "learning_rate": 2.7480307913184015e-07, + "loss": 0.5508, + "step": 26704 + }, + { + "epoch": 0.93, + "learning_rate": 2.7454962659488214e-07, + "loss": 0.6183, + "step": 26705 + }, + { + "epoch": 0.93, + "learning_rate": 2.7429628936544104e-07, + "loss": 0.6545, + "step": 26706 + }, + { + "epoch": 0.93, + "learning_rate": 2.740430674465211e-07, + "loss": 0.6798, + "step": 26707 + }, + { + "epoch": 0.93, + "learning_rate": 2.737899608411232e-07, + "loss": 0.6476, + "step": 26708 + }, + { + "epoch": 0.93, + "learning_rate": 2.735369695522505e-07, + "loss": 0.6015, + "step": 26709 + }, + { + "epoch": 0.93, + "learning_rate": 2.7328409358290065e-07, + "loss": 0.5936, + "step": 26710 + }, + { + "epoch": 0.93, + "learning_rate": 2.730313329360712e-07, + "loss": 0.5695, + "step": 26711 + }, + { + "epoch": 0.93, + "learning_rate": 2.727786876147609e-07, + "loss": 0.6225, + "step": 26712 + }, + { + "epoch": 0.93, + "learning_rate": 2.725261576219629e-07, + "loss": 0.6565, + "step": 26713 + }, + { + "epoch": 0.93, + "learning_rate": 2.7227374296067365e-07, + "loss": 0.6155, + "step": 26714 + }, + { + "epoch": 0.93, + "learning_rate": 2.720214436338864e-07, + "loss": 0.6238, + "step": 26715 + }, + { + "epoch": 0.93, + "learning_rate": 2.7176925964458865e-07, + "loss": 0.5993, + "step": 26716 + }, + { + "epoch": 0.93, + "learning_rate": 2.715171909957737e-07, + "loss": 0.674, + "step": 26717 + }, + { + "epoch": 0.93, + "learning_rate": 2.712652376904279e-07, + "loss": 0.6038, + "step": 26718 + }, + { + "epoch": 0.93, + "learning_rate": 2.7101339973154004e-07, + "loss": 0.686, + "step": 26719 + }, + { + "epoch": 0.93, + "learning_rate": 2.7076167712209664e-07, + "loss": 0.6362, + "step": 26720 + }, + { + "epoch": 0.93, + "learning_rate": 2.705100698650809e-07, + "loss": 0.6282, + "step": 26721 + }, + { + "epoch": 0.93, + "learning_rate": 2.702585779634748e-07, + "loss": 0.6564, + "step": 26722 + }, + { + "epoch": 0.93, + "learning_rate": 2.700072014202637e-07, + "loss": 0.6727, + "step": 26723 + }, + { + "epoch": 0.93, + "learning_rate": 2.697559402384231e-07, + "loss": 0.6192, + "step": 26724 + }, + { + "epoch": 0.93, + "learning_rate": 2.6950479442093503e-07, + "loss": 0.6596, + "step": 26725 + }, + { + "epoch": 0.93, + "learning_rate": 2.6925376397077816e-07, + "loss": 0.6289, + "step": 26726 + }, + { + "epoch": 0.93, + "learning_rate": 2.690028488909269e-07, + "loss": 0.6985, + "step": 26727 + }, + { + "epoch": 0.93, + "learning_rate": 2.687520491843565e-07, + "loss": 0.6098, + "step": 26728 + }, + { + "epoch": 0.93, + "learning_rate": 2.685013648540413e-07, + "loss": 0.5937, + "step": 26729 + }, + { + "epoch": 0.93, + "learning_rate": 2.682507959029512e-07, + "loss": 0.6792, + "step": 26730 + }, + { + "epoch": 0.93, + "learning_rate": 2.6800034233405935e-07, + "loss": 0.6434, + "step": 26731 + }, + { + "epoch": 0.93, + "learning_rate": 2.677500041503356e-07, + "loss": 0.6107, + "step": 26732 + }, + { + "epoch": 0.93, + "learning_rate": 2.6749978135474643e-07, + "loss": 0.5445, + "step": 26733 + }, + { + "epoch": 0.93, + "learning_rate": 2.6724967395025836e-07, + "loss": 0.6218, + "step": 26734 + }, + { + "epoch": 0.93, + "learning_rate": 2.6699968193983796e-07, + "loss": 0.6062, + "step": 26735 + }, + { + "epoch": 0.93, + "learning_rate": 2.6674980532644725e-07, + "loss": 0.5972, + "step": 26736 + }, + { + "epoch": 0.93, + "learning_rate": 2.6650004411305165e-07, + "loss": 0.634, + "step": 26737 + }, + { + "epoch": 0.93, + "learning_rate": 2.66250398302611e-07, + "loss": 0.6357, + "step": 26738 + }, + { + "epoch": 0.93, + "learning_rate": 2.660008678980852e-07, + "loss": 0.6695, + "step": 26739 + }, + { + "epoch": 0.93, + "learning_rate": 2.6575145290243185e-07, + "loss": 0.6125, + "step": 26740 + }, + { + "epoch": 0.93, + "learning_rate": 2.655021533186097e-07, + "loss": 0.6438, + "step": 26741 + }, + { + "epoch": 0.93, + "learning_rate": 2.652529691495731e-07, + "loss": 0.6118, + "step": 26742 + }, + { + "epoch": 0.93, + "learning_rate": 2.650039003982763e-07, + "loss": 0.6336, + "step": 26743 + }, + { + "epoch": 0.93, + "learning_rate": 2.647549470676758e-07, + "loss": 0.667, + "step": 26744 + }, + { + "epoch": 0.93, + "learning_rate": 2.6450610916071815e-07, + "loss": 0.6449, + "step": 26745 + }, + { + "epoch": 0.93, + "learning_rate": 2.642573866803566e-07, + "loss": 0.5996, + "step": 26746 + }, + { + "epoch": 0.93, + "learning_rate": 2.6400877962954094e-07, + "loss": 0.6919, + "step": 26747 + }, + { + "epoch": 0.93, + "learning_rate": 2.6376028801121446e-07, + "loss": 0.6542, + "step": 26748 + }, + { + "epoch": 0.93, + "learning_rate": 2.6351191182832803e-07, + "loss": 0.5726, + "step": 26749 + }, + { + "epoch": 0.93, + "learning_rate": 2.632636510838249e-07, + "loss": 0.6262, + "step": 26750 + }, + { + "epoch": 0.93, + "learning_rate": 2.6301550578064715e-07, + "loss": 0.6271, + "step": 26751 + }, + { + "epoch": 0.93, + "learning_rate": 2.627674759217391e-07, + "loss": 0.6293, + "step": 26752 + }, + { + "epoch": 0.93, + "learning_rate": 2.6251956151003956e-07, + "loss": 0.6618, + "step": 26753 + }, + { + "epoch": 0.93, + "learning_rate": 2.622717625484883e-07, + "loss": 0.6871, + "step": 26754 + }, + { + "epoch": 0.93, + "learning_rate": 2.6202407904002303e-07, + "loss": 0.6293, + "step": 26755 + }, + { + "epoch": 0.93, + "learning_rate": 2.617765109875836e-07, + "loss": 0.6337, + "step": 26756 + }, + { + "epoch": 0.93, + "learning_rate": 2.6152905839409993e-07, + "loss": 0.6018, + "step": 26757 + }, + { + "epoch": 0.93, + "learning_rate": 2.612817212625096e-07, + "loss": 0.6325, + "step": 26758 + }, + { + "epoch": 0.93, + "learning_rate": 2.6103449959574476e-07, + "loss": 0.5942, + "step": 26759 + }, + { + "epoch": 0.93, + "learning_rate": 2.607873933967331e-07, + "loss": 0.6508, + "step": 26760 + }, + { + "epoch": 0.93, + "learning_rate": 2.6054040266840884e-07, + "loss": 0.6323, + "step": 26761 + }, + { + "epoch": 0.93, + "learning_rate": 2.602935274136997e-07, + "loss": 0.6102, + "step": 26762 + }, + { + "epoch": 0.93, + "learning_rate": 2.6004676763553007e-07, + "loss": 0.666, + "step": 26763 + }, + { + "epoch": 0.93, + "learning_rate": 2.5980012333682636e-07, + "loss": 0.6129, + "step": 26764 + }, + { + "epoch": 0.93, + "learning_rate": 2.5955359452051634e-07, + "loss": 0.6224, + "step": 26765 + }, + { + "epoch": 0.93, + "learning_rate": 2.593071811895165e-07, + "loss": 0.6344, + "step": 26766 + }, + { + "epoch": 0.93, + "learning_rate": 2.590608833467545e-07, + "loss": 0.5977, + "step": 26767 + }, + { + "epoch": 0.93, + "learning_rate": 2.5881470099514807e-07, + "loss": 0.6106, + "step": 26768 + }, + { + "epoch": 0.93, + "learning_rate": 2.585686341376159e-07, + "loss": 0.6064, + "step": 26769 + }, + { + "epoch": 0.93, + "learning_rate": 2.5832268277707463e-07, + "loss": 0.6446, + "step": 26770 + }, + { + "epoch": 0.93, + "learning_rate": 2.58076846916443e-07, + "loss": 0.6207, + "step": 26771 + }, + { + "epoch": 0.93, + "learning_rate": 2.57831126558632e-07, + "loss": 0.6571, + "step": 26772 + }, + { + "epoch": 0.93, + "learning_rate": 2.5758552170655706e-07, + "loss": 0.5959, + "step": 26773 + }, + { + "epoch": 0.93, + "learning_rate": 2.5734003236313145e-07, + "loss": 0.6187, + "step": 26774 + }, + { + "epoch": 0.93, + "learning_rate": 2.570946585312639e-07, + "loss": 0.5932, + "step": 26775 + }, + { + "epoch": 0.93, + "learning_rate": 2.568494002138633e-07, + "loss": 0.6123, + "step": 26776 + }, + { + "epoch": 0.93, + "learning_rate": 2.5660425741383943e-07, + "loss": 0.6655, + "step": 26777 + }, + { + "epoch": 0.93, + "learning_rate": 2.563592301340945e-07, + "loss": 0.6069, + "step": 26778 + }, + { + "epoch": 0.93, + "learning_rate": 2.561143183775405e-07, + "loss": 0.5975, + "step": 26779 + }, + { + "epoch": 0.93, + "learning_rate": 2.558695221470753e-07, + "loss": 0.6653, + "step": 26780 + }, + { + "epoch": 0.93, + "learning_rate": 2.5562484144560306e-07, + "loss": 0.6121, + "step": 26781 + }, + { + "epoch": 0.93, + "learning_rate": 2.55380276276026e-07, + "loss": 0.667, + "step": 26782 + }, + { + "epoch": 0.93, + "learning_rate": 2.551358266412429e-07, + "loss": 0.6695, + "step": 26783 + }, + { + "epoch": 0.93, + "learning_rate": 2.5489149254415036e-07, + "loss": 0.6468, + "step": 26784 + }, + { + "epoch": 0.93, + "learning_rate": 2.5464727398764823e-07, + "loss": 0.6121, + "step": 26785 + }, + { + "epoch": 0.93, + "learning_rate": 2.5440317097462974e-07, + "loss": 0.6088, + "step": 26786 + }, + { + "epoch": 0.93, + "learning_rate": 2.5415918350799043e-07, + "loss": 0.6309, + "step": 26787 + }, + { + "epoch": 0.93, + "learning_rate": 2.5391531159062345e-07, + "loss": 0.6985, + "step": 26788 + }, + { + "epoch": 0.93, + "learning_rate": 2.5367155522541765e-07, + "loss": 0.6558, + "step": 26789 + }, + { + "epoch": 0.93, + "learning_rate": 2.5342791441526406e-07, + "loss": 0.7036, + "step": 26790 + }, + { + "epoch": 0.93, + "learning_rate": 2.531843891630548e-07, + "loss": 0.658, + "step": 26791 + }, + { + "epoch": 0.93, + "learning_rate": 2.5294097947167304e-07, + "loss": 0.6679, + "step": 26792 + }, + { + "epoch": 0.93, + "learning_rate": 2.526976853440055e-07, + "loss": 0.5742, + "step": 26793 + }, + { + "epoch": 0.93, + "learning_rate": 2.524545067829387e-07, + "loss": 0.6039, + "step": 26794 + }, + { + "epoch": 0.93, + "learning_rate": 2.5221144379135255e-07, + "loss": 0.5983, + "step": 26795 + }, + { + "epoch": 0.93, + "learning_rate": 2.519684963721314e-07, + "loss": 0.6353, + "step": 26796 + }, + { + "epoch": 0.93, + "learning_rate": 2.5172566452815626e-07, + "loss": 0.7335, + "step": 26797 + }, + { + "epoch": 0.93, + "learning_rate": 2.514829482623038e-07, + "loss": 0.6161, + "step": 26798 + }, + { + "epoch": 0.93, + "learning_rate": 2.5124034757745275e-07, + "loss": 0.6488, + "step": 26799 + }, + { + "epoch": 0.93, + "learning_rate": 2.5099786247648085e-07, + "loss": 0.6491, + "step": 26800 + }, + { + "epoch": 0.93, + "learning_rate": 2.507554929622613e-07, + "loss": 0.6393, + "step": 26801 + }, + { + "epoch": 0.93, + "learning_rate": 2.505132390376663e-07, + "loss": 0.647, + "step": 26802 + }, + { + "epoch": 0.93, + "learning_rate": 2.5027110070557246e-07, + "loss": 0.6696, + "step": 26803 + }, + { + "epoch": 0.93, + "learning_rate": 2.5002907796884747e-07, + "loss": 0.6266, + "step": 26804 + }, + { + "epoch": 0.93, + "learning_rate": 2.497871708303612e-07, + "loss": 0.6285, + "step": 26805 + }, + { + "epoch": 0.93, + "learning_rate": 2.495453792929836e-07, + "loss": 0.662, + "step": 26806 + }, + { + "epoch": 0.93, + "learning_rate": 2.49303703359578e-07, + "loss": 0.6136, + "step": 26807 + }, + { + "epoch": 0.93, + "learning_rate": 2.49062143033012e-07, + "loss": 0.6073, + "step": 26808 + }, + { + "epoch": 0.93, + "learning_rate": 2.488206983161501e-07, + "loss": 0.7008, + "step": 26809 + }, + { + "epoch": 0.93, + "learning_rate": 2.4857936921185433e-07, + "loss": 0.6218, + "step": 26810 + }, + { + "epoch": 0.93, + "learning_rate": 2.483381557229847e-07, + "loss": 0.6173, + "step": 26811 + }, + { + "epoch": 0.93, + "learning_rate": 2.4809705785240337e-07, + "loss": 0.6468, + "step": 26812 + }, + { + "epoch": 0.93, + "learning_rate": 2.4785607560296686e-07, + "loss": 0.6412, + "step": 26813 + }, + { + "epoch": 0.93, + "learning_rate": 2.476152089775319e-07, + "loss": 0.6466, + "step": 26814 + }, + { + "epoch": 0.93, + "learning_rate": 2.473744579789572e-07, + "loss": 0.6159, + "step": 26815 + }, + { + "epoch": 0.93, + "learning_rate": 2.4713382261009497e-07, + "loss": 0.6424, + "step": 26816 + }, + { + "epoch": 0.93, + "learning_rate": 2.468933028737985e-07, + "loss": 0.6636, + "step": 26817 + }, + { + "epoch": 0.93, + "learning_rate": 2.466528987729211e-07, + "loss": 0.6288, + "step": 26818 + }, + { + "epoch": 0.93, + "learning_rate": 2.464126103103104e-07, + "loss": 0.6525, + "step": 26819 + }, + { + "epoch": 0.93, + "learning_rate": 2.4617243748881635e-07, + "loss": 0.6741, + "step": 26820 + }, + { + "epoch": 0.93, + "learning_rate": 2.4593238031128676e-07, + "loss": 0.5968, + "step": 26821 + }, + { + "epoch": 0.93, + "learning_rate": 2.4569243878056704e-07, + "loss": 0.6463, + "step": 26822 + }, + { + "epoch": 0.93, + "learning_rate": 2.4545261289950385e-07, + "loss": 0.6297, + "step": 26823 + }, + { + "epoch": 0.93, + "learning_rate": 2.4521290267093935e-07, + "loss": 0.6368, + "step": 26824 + }, + { + "epoch": 0.93, + "learning_rate": 2.4497330809771566e-07, + "loss": 0.5876, + "step": 26825 + }, + { + "epoch": 0.93, + "learning_rate": 2.4473382918267395e-07, + "loss": 0.6188, + "step": 26826 + }, + { + "epoch": 0.93, + "learning_rate": 2.444944659286519e-07, + "loss": 0.5795, + "step": 26827 + }, + { + "epoch": 0.93, + "learning_rate": 2.442552183384894e-07, + "loss": 0.584, + "step": 26828 + }, + { + "epoch": 0.93, + "learning_rate": 2.4401608641502314e-07, + "loss": 0.6807, + "step": 26829 + }, + { + "epoch": 0.93, + "learning_rate": 2.4377707016108755e-07, + "loss": 0.6376, + "step": 26830 + }, + { + "epoch": 0.93, + "learning_rate": 2.435381695795158e-07, + "loss": 0.6491, + "step": 26831 + }, + { + "epoch": 0.93, + "learning_rate": 2.4329938467314127e-07, + "loss": 0.608, + "step": 26832 + }, + { + "epoch": 0.93, + "learning_rate": 2.4306071544479395e-07, + "loss": 0.5697, + "step": 26833 + }, + { + "epoch": 0.93, + "learning_rate": 2.428221618973059e-07, + "loss": 0.611, + "step": 26834 + }, + { + "epoch": 0.93, + "learning_rate": 2.425837240335027e-07, + "loss": 0.6687, + "step": 26835 + }, + { + "epoch": 0.93, + "learning_rate": 2.4234540185621435e-07, + "loss": 0.6758, + "step": 26836 + }, + { + "epoch": 0.93, + "learning_rate": 2.42107195368263e-07, + "loss": 0.6176, + "step": 26837 + }, + { + "epoch": 0.93, + "learning_rate": 2.418691045724753e-07, + "loss": 0.6547, + "step": 26838 + }, + { + "epoch": 0.93, + "learning_rate": 2.416311294716733e-07, + "loss": 0.6126, + "step": 26839 + }, + { + "epoch": 0.93, + "learning_rate": 2.413932700686794e-07, + "loss": 0.605, + "step": 26840 + }, + { + "epoch": 0.93, + "learning_rate": 2.4115552636631236e-07, + "loss": 0.6131, + "step": 26841 + }, + { + "epoch": 0.93, + "learning_rate": 2.409178983673921e-07, + "loss": 0.6462, + "step": 26842 + }, + { + "epoch": 0.93, + "learning_rate": 2.406803860747342e-07, + "loss": 0.6185, + "step": 26843 + }, + { + "epoch": 0.93, + "learning_rate": 2.404429894911575e-07, + "loss": 0.6374, + "step": 26844 + }, + { + "epoch": 0.93, + "learning_rate": 2.402057086194731e-07, + "loss": 0.6336, + "step": 26845 + }, + { + "epoch": 0.93, + "learning_rate": 2.399685434624976e-07, + "loss": 0.6307, + "step": 26846 + }, + { + "epoch": 0.93, + "learning_rate": 2.3973149402304216e-07, + "loss": 0.6556, + "step": 26847 + }, + { + "epoch": 0.93, + "learning_rate": 2.394945603039156e-07, + "loss": 0.6059, + "step": 26848 + }, + { + "epoch": 0.93, + "learning_rate": 2.39257742307929e-07, + "loss": 0.6043, + "step": 26849 + }, + { + "epoch": 0.93, + "learning_rate": 2.3902104003788783e-07, + "loss": 0.6397, + "step": 26850 + }, + { + "epoch": 0.93, + "learning_rate": 2.3878445349660105e-07, + "loss": 0.6487, + "step": 26851 + }, + { + "epoch": 0.93, + "learning_rate": 2.3854798268687195e-07, + "loss": 0.6391, + "step": 26852 + }, + { + "epoch": 0.93, + "learning_rate": 2.3831162761150606e-07, + "loss": 0.6218, + "step": 26853 + }, + { + "epoch": 0.93, + "learning_rate": 2.3807538827330333e-07, + "loss": 0.6737, + "step": 26854 + }, + { + "epoch": 0.93, + "learning_rate": 2.37839264675066e-07, + "loss": 0.5954, + "step": 26855 + }, + { + "epoch": 0.93, + "learning_rate": 2.3760325681959296e-07, + "loss": 0.6044, + "step": 26856 + }, + { + "epoch": 0.93, + "learning_rate": 2.3736736470968302e-07, + "loss": 0.6436, + "step": 26857 + }, + { + "epoch": 0.93, + "learning_rate": 2.3713158834813287e-07, + "loss": 0.6449, + "step": 26858 + }, + { + "epoch": 0.93, + "learning_rate": 2.3689592773773807e-07, + "loss": 0.5965, + "step": 26859 + }, + { + "epoch": 0.93, + "learning_rate": 2.366603828812919e-07, + "loss": 0.6692, + "step": 26860 + }, + { + "epoch": 0.93, + "learning_rate": 2.364249537815877e-07, + "loss": 0.6626, + "step": 26861 + }, + { + "epoch": 0.93, + "learning_rate": 2.3618964044141768e-07, + "loss": 0.648, + "step": 26862 + }, + { + "epoch": 0.93, + "learning_rate": 2.359544428635696e-07, + "loss": 0.6762, + "step": 26863 + }, + { + "epoch": 0.93, + "learning_rate": 2.3571936105083347e-07, + "loss": 0.6461, + "step": 26864 + }, + { + "epoch": 0.93, + "learning_rate": 2.3548439500599707e-07, + "loss": 0.6155, + "step": 26865 + }, + { + "epoch": 0.93, + "learning_rate": 2.352495447318437e-07, + "loss": 0.6418, + "step": 26866 + }, + { + "epoch": 0.93, + "learning_rate": 2.3501481023116002e-07, + "loss": 0.6292, + "step": 26867 + }, + { + "epoch": 0.93, + "learning_rate": 2.3478019150672938e-07, + "loss": 0.6745, + "step": 26868 + }, + { + "epoch": 0.93, + "learning_rate": 2.3454568856133175e-07, + "loss": 0.6146, + "step": 26869 + }, + { + "epoch": 0.93, + "learning_rate": 2.3431130139774827e-07, + "loss": 0.5839, + "step": 26870 + }, + { + "epoch": 0.93, + "learning_rate": 2.340770300187589e-07, + "loss": 0.5825, + "step": 26871 + }, + { + "epoch": 0.93, + "learning_rate": 2.3384287442714038e-07, + "loss": 0.6219, + "step": 26872 + }, + { + "epoch": 0.93, + "learning_rate": 2.3360883462566818e-07, + "loss": 0.6576, + "step": 26873 + }, + { + "epoch": 0.93, + "learning_rate": 2.3337491061711681e-07, + "loss": 0.6364, + "step": 26874 + }, + { + "epoch": 0.93, + "learning_rate": 2.331411024042618e-07, + "loss": 0.6429, + "step": 26875 + }, + { + "epoch": 0.93, + "learning_rate": 2.3290740998987426e-07, + "loss": 0.6403, + "step": 26876 + }, + { + "epoch": 0.93, + "learning_rate": 2.3267383337672533e-07, + "loss": 0.6687, + "step": 26877 + }, + { + "epoch": 0.93, + "learning_rate": 2.3244037256758278e-07, + "loss": 0.6589, + "step": 26878 + }, + { + "epoch": 0.93, + "learning_rate": 2.3220702756521662e-07, + "loss": 0.631, + "step": 26879 + }, + { + "epoch": 0.93, + "learning_rate": 2.319737983723913e-07, + "loss": 0.5994, + "step": 26880 + }, + { + "epoch": 0.93, + "learning_rate": 2.3174068499187352e-07, + "loss": 0.6647, + "step": 26881 + }, + { + "epoch": 0.93, + "learning_rate": 2.315076874264266e-07, + "loss": 0.6655, + "step": 26882 + }, + { + "epoch": 0.93, + "learning_rate": 2.31274805678815e-07, + "loss": 0.6032, + "step": 26883 + }, + { + "epoch": 0.93, + "learning_rate": 2.310420397517965e-07, + "loss": 0.6236, + "step": 26884 + }, + { + "epoch": 0.93, + "learning_rate": 2.3080938964813227e-07, + "loss": 0.6266, + "step": 26885 + }, + { + "epoch": 0.93, + "learning_rate": 2.3057685537058117e-07, + "loss": 0.6369, + "step": 26886 + }, + { + "epoch": 0.93, + "learning_rate": 2.303444369218999e-07, + "loss": 0.5797, + "step": 26887 + }, + { + "epoch": 0.93, + "learning_rate": 2.3011213430484403e-07, + "loss": 0.6665, + "step": 26888 + }, + { + "epoch": 0.93, + "learning_rate": 2.2987994752216914e-07, + "loss": 0.641, + "step": 26889 + }, + { + "epoch": 0.93, + "learning_rate": 2.2964787657662524e-07, + "loss": 0.6547, + "step": 26890 + }, + { + "epoch": 0.93, + "learning_rate": 2.2941592147096458e-07, + "loss": 0.6916, + "step": 26891 + }, + { + "epoch": 0.93, + "learning_rate": 2.2918408220793942e-07, + "loss": 0.6543, + "step": 26892 + }, + { + "epoch": 0.93, + "learning_rate": 2.2895235879029643e-07, + "loss": 0.6217, + "step": 26893 + }, + { + "epoch": 0.93, + "learning_rate": 2.2872075122078342e-07, + "loss": 0.6334, + "step": 26894 + }, + { + "epoch": 0.93, + "learning_rate": 2.2848925950214817e-07, + "loss": 0.6395, + "step": 26895 + }, + { + "epoch": 0.93, + "learning_rate": 2.2825788363713186e-07, + "loss": 0.7169, + "step": 26896 + }, + { + "epoch": 0.93, + "learning_rate": 2.2802662362848115e-07, + "loss": 0.638, + "step": 26897 + }, + { + "epoch": 0.93, + "learning_rate": 2.2779547947893498e-07, + "loss": 0.6254, + "step": 26898 + }, + { + "epoch": 0.93, + "learning_rate": 2.275644511912367e-07, + "loss": 0.6243, + "step": 26899 + }, + { + "epoch": 0.93, + "learning_rate": 2.2733353876812302e-07, + "loss": 0.6861, + "step": 26900 + }, + { + "epoch": 0.93, + "learning_rate": 2.2710274221233396e-07, + "loss": 0.7436, + "step": 26901 + }, + { + "epoch": 0.93, + "learning_rate": 2.2687206152660401e-07, + "loss": 0.6301, + "step": 26902 + }, + { + "epoch": 0.93, + "learning_rate": 2.2664149671366763e-07, + "loss": 0.5994, + "step": 26903 + }, + { + "epoch": 0.93, + "learning_rate": 2.2641104777626045e-07, + "loss": 0.6289, + "step": 26904 + }, + { + "epoch": 0.93, + "learning_rate": 2.2618071471711466e-07, + "loss": 0.684, + "step": 26905 + }, + { + "epoch": 0.93, + "learning_rate": 2.2595049753896038e-07, + "loss": 0.7002, + "step": 26906 + }, + { + "epoch": 0.93, + "learning_rate": 2.2572039624452647e-07, + "loss": 0.6177, + "step": 26907 + }, + { + "epoch": 0.93, + "learning_rate": 2.25490410836543e-07, + "loss": 0.5911, + "step": 26908 + }, + { + "epoch": 0.93, + "learning_rate": 2.2526054131773444e-07, + "loss": 0.6797, + "step": 26909 + }, + { + "epoch": 0.93, + "learning_rate": 2.2503078769082643e-07, + "loss": 0.6294, + "step": 26910 + }, + { + "epoch": 0.93, + "learning_rate": 2.2480114995854562e-07, + "loss": 0.6211, + "step": 26911 + }, + { + "epoch": 0.93, + "learning_rate": 2.245716281236121e-07, + "loss": 0.6256, + "step": 26912 + }, + { + "epoch": 0.93, + "learning_rate": 2.2434222218874813e-07, + "loss": 0.6675, + "step": 26913 + }, + { + "epoch": 0.93, + "learning_rate": 2.2411293215667373e-07, + "loss": 0.6022, + "step": 26914 + }, + { + "epoch": 0.93, + "learning_rate": 2.2388375803010566e-07, + "loss": 0.6582, + "step": 26915 + }, + { + "epoch": 0.93, + "learning_rate": 2.2365469981176392e-07, + "loss": 0.5902, + "step": 26916 + }, + { + "epoch": 0.93, + "learning_rate": 2.234257575043619e-07, + "loss": 0.617, + "step": 26917 + }, + { + "epoch": 0.93, + "learning_rate": 2.2319693111061636e-07, + "loss": 0.6936, + "step": 26918 + }, + { + "epoch": 0.93, + "learning_rate": 2.229682206332373e-07, + "loss": 0.6328, + "step": 26919 + }, + { + "epoch": 0.93, + "learning_rate": 2.2273962607493816e-07, + "loss": 0.6664, + "step": 26920 + }, + { + "epoch": 0.93, + "learning_rate": 2.2251114743843005e-07, + "loss": 0.5389, + "step": 26921 + }, + { + "epoch": 0.93, + "learning_rate": 2.2228278472641973e-07, + "loss": 0.6833, + "step": 26922 + }, + { + "epoch": 0.93, + "learning_rate": 2.2205453794161614e-07, + "loss": 0.6395, + "step": 26923 + }, + { + "epoch": 0.93, + "learning_rate": 2.2182640708672708e-07, + "loss": 0.6548, + "step": 26924 + }, + { + "epoch": 0.93, + "learning_rate": 2.215983921644538e-07, + "loss": 0.671, + "step": 26925 + }, + { + "epoch": 0.93, + "learning_rate": 2.213704931775007e-07, + "loss": 0.6475, + "step": 26926 + }, + { + "epoch": 0.93, + "learning_rate": 2.2114271012857125e-07, + "loss": 0.6099, + "step": 26927 + }, + { + "epoch": 0.93, + "learning_rate": 2.2091504302036438e-07, + "loss": 0.6035, + "step": 26928 + }, + { + "epoch": 0.93, + "learning_rate": 2.2068749185558126e-07, + "loss": 0.6153, + "step": 26929 + }, + { + "epoch": 0.93, + "learning_rate": 2.2046005663691972e-07, + "loss": 0.6293, + "step": 26930 + }, + { + "epoch": 0.93, + "learning_rate": 2.2023273736707428e-07, + "loss": 0.6776, + "step": 26931 + }, + { + "epoch": 0.93, + "learning_rate": 2.200055340487406e-07, + "loss": 0.6453, + "step": 26932 + }, + { + "epoch": 0.93, + "learning_rate": 2.1977844668461422e-07, + "loss": 0.6395, + "step": 26933 + }, + { + "epoch": 0.93, + "learning_rate": 2.195514752773853e-07, + "loss": 0.6808, + "step": 26934 + }, + { + "epoch": 0.93, + "learning_rate": 2.1932461982974607e-07, + "loss": 0.6673, + "step": 26935 + }, + { + "epoch": 0.93, + "learning_rate": 2.1909788034438772e-07, + "loss": 0.6076, + "step": 26936 + }, + { + "epoch": 0.93, + "learning_rate": 2.188712568239959e-07, + "loss": 0.6604, + "step": 26937 + }, + { + "epoch": 0.93, + "learning_rate": 2.1864474927125735e-07, + "loss": 0.6053, + "step": 26938 + }, + { + "epoch": 0.93, + "learning_rate": 2.1841835768885988e-07, + "loss": 0.6168, + "step": 26939 + }, + { + "epoch": 0.93, + "learning_rate": 2.1819208207948695e-07, + "loss": 0.5862, + "step": 26940 + }, + { + "epoch": 0.93, + "learning_rate": 2.1796592244581971e-07, + "loss": 0.6213, + "step": 26941 + }, + { + "epoch": 0.93, + "learning_rate": 2.177398787905427e-07, + "loss": 0.6094, + "step": 26942 + }, + { + "epoch": 0.93, + "learning_rate": 2.1751395111633268e-07, + "loss": 0.5953, + "step": 26943 + }, + { + "epoch": 0.93, + "learning_rate": 2.1728813942586967e-07, + "loss": 0.5967, + "step": 26944 + }, + { + "epoch": 0.93, + "learning_rate": 2.170624437218305e-07, + "loss": 0.6129, + "step": 26945 + }, + { + "epoch": 0.93, + "learning_rate": 2.1683686400689298e-07, + "loss": 0.6197, + "step": 26946 + }, + { + "epoch": 0.93, + "learning_rate": 2.166114002837283e-07, + "loss": 0.6668, + "step": 26947 + }, + { + "epoch": 0.93, + "learning_rate": 2.1638605255501433e-07, + "loss": 0.6237, + "step": 26948 + }, + { + "epoch": 0.93, + "learning_rate": 2.1616082082341784e-07, + "loss": 0.5887, + "step": 26949 + }, + { + "epoch": 0.93, + "learning_rate": 2.1593570509161222e-07, + "loss": 0.6021, + "step": 26950 + }, + { + "epoch": 0.93, + "learning_rate": 2.1571070536226536e-07, + "loss": 0.6427, + "step": 26951 + }, + { + "epoch": 0.93, + "learning_rate": 2.154858216380451e-07, + "loss": 0.6088, + "step": 26952 + }, + { + "epoch": 0.93, + "learning_rate": 2.152610539216182e-07, + "loss": 0.651, + "step": 26953 + }, + { + "epoch": 0.93, + "learning_rate": 2.1503640221564926e-07, + "loss": 0.6357, + "step": 26954 + }, + { + "epoch": 0.93, + "learning_rate": 2.1481186652280162e-07, + "loss": 0.6302, + "step": 26955 + }, + { + "epoch": 0.93, + "learning_rate": 2.145874468457376e-07, + "loss": 0.5978, + "step": 26956 + }, + { + "epoch": 0.93, + "learning_rate": 2.1436314318711849e-07, + "loss": 0.6152, + "step": 26957 + }, + { + "epoch": 0.93, + "learning_rate": 2.1413895554960318e-07, + "loss": 0.6505, + "step": 26958 + }, + { + "epoch": 0.93, + "learning_rate": 2.1391488393584959e-07, + "loss": 0.6299, + "step": 26959 + }, + { + "epoch": 0.93, + "learning_rate": 2.1369092834851447e-07, + "loss": 0.7024, + "step": 26960 + }, + { + "epoch": 0.93, + "learning_rate": 2.1346708879025346e-07, + "loss": 0.5895, + "step": 26961 + }, + { + "epoch": 0.93, + "learning_rate": 2.1324336526371892e-07, + "loss": 0.6285, + "step": 26962 + }, + { + "epoch": 0.93, + "learning_rate": 2.1301975777156536e-07, + "loss": 0.6615, + "step": 26963 + }, + { + "epoch": 0.93, + "learning_rate": 2.12796266316444e-07, + "loss": 0.6175, + "step": 26964 + }, + { + "epoch": 0.93, + "learning_rate": 2.1257289090100274e-07, + "loss": 0.6688, + "step": 26965 + }, + { + "epoch": 0.93, + "learning_rate": 2.1234963152789166e-07, + "loss": 0.6085, + "step": 26966 + }, + { + "epoch": 0.93, + "learning_rate": 2.1212648819975644e-07, + "loss": 0.644, + "step": 26967 + }, + { + "epoch": 0.93, + "learning_rate": 2.1190346091924496e-07, + "loss": 0.6186, + "step": 26968 + }, + { + "epoch": 0.93, + "learning_rate": 2.116805496889973e-07, + "loss": 0.6887, + "step": 26969 + }, + { + "epoch": 0.93, + "learning_rate": 2.1145775451166028e-07, + "loss": 0.6066, + "step": 26970 + }, + { + "epoch": 0.93, + "learning_rate": 2.1123507538987508e-07, + "loss": 0.6109, + "step": 26971 + }, + { + "epoch": 0.93, + "learning_rate": 2.1101251232628073e-07, + "loss": 0.6297, + "step": 26972 + }, + { + "epoch": 0.93, + "learning_rate": 2.107900653235151e-07, + "loss": 0.6575, + "step": 26973 + }, + { + "epoch": 0.93, + "learning_rate": 2.105677343842183e-07, + "loss": 0.6304, + "step": 26974 + }, + { + "epoch": 0.93, + "learning_rate": 2.1034551951102268e-07, + "loss": 0.6037, + "step": 26975 + }, + { + "epoch": 0.93, + "learning_rate": 2.10123420706565e-07, + "loss": 0.7023, + "step": 26976 + }, + { + "epoch": 0.93, + "learning_rate": 2.0990143797347984e-07, + "loss": 0.5515, + "step": 26977 + }, + { + "epoch": 0.93, + "learning_rate": 2.096795713143973e-07, + "loss": 0.6801, + "step": 26978 + }, + { + "epoch": 0.93, + "learning_rate": 2.0945782073194754e-07, + "loss": 0.5708, + "step": 26979 + }, + { + "epoch": 0.93, + "learning_rate": 2.0923618622876173e-07, + "loss": 0.6239, + "step": 26980 + }, + { + "epoch": 0.93, + "learning_rate": 2.090146678074645e-07, + "loss": 0.6256, + "step": 26981 + }, + { + "epoch": 0.93, + "learning_rate": 2.087932654706859e-07, + "loss": 0.638, + "step": 26982 + }, + { + "epoch": 0.93, + "learning_rate": 2.0857197922104834e-07, + "loss": 0.6223, + "step": 26983 + }, + { + "epoch": 0.93, + "learning_rate": 2.0835080906117633e-07, + "loss": 0.6265, + "step": 26984 + }, + { + "epoch": 0.93, + "learning_rate": 2.0812975499369115e-07, + "loss": 0.6262, + "step": 26985 + }, + { + "epoch": 0.93, + "learning_rate": 2.0790881702121623e-07, + "loss": 0.6839, + "step": 26986 + }, + { + "epoch": 0.94, + "learning_rate": 2.0768799514636728e-07, + "loss": 0.6646, + "step": 26987 + }, + { + "epoch": 0.94, + "learning_rate": 2.074672893717644e-07, + "loss": 0.6784, + "step": 26988 + }, + { + "epoch": 0.94, + "learning_rate": 2.0724669970002664e-07, + "loss": 0.6259, + "step": 26989 + }, + { + "epoch": 0.94, + "learning_rate": 2.0702622613376632e-07, + "loss": 0.6441, + "step": 26990 + }, + { + "epoch": 0.94, + "learning_rate": 2.0680586867559692e-07, + "loss": 0.6272, + "step": 26991 + }, + { + "epoch": 0.94, + "learning_rate": 2.0658562732813415e-07, + "loss": 0.6434, + "step": 26992 + }, + { + "epoch": 0.94, + "learning_rate": 2.0636550209398588e-07, + "loss": 0.66, + "step": 26993 + }, + { + "epoch": 0.94, + "learning_rate": 2.0614549297576447e-07, + "loss": 0.6333, + "step": 26994 + }, + { + "epoch": 0.94, + "learning_rate": 2.0592559997607785e-07, + "loss": 0.6611, + "step": 26995 + }, + { + "epoch": 0.94, + "learning_rate": 2.0570582309753285e-07, + "loss": 0.6519, + "step": 26996 + }, + { + "epoch": 0.94, + "learning_rate": 2.0548616234273399e-07, + "loss": 0.6135, + "step": 26997 + }, + { + "epoch": 0.94, + "learning_rate": 2.0526661771428925e-07, + "loss": 0.6424, + "step": 26998 + }, + { + "epoch": 0.94, + "learning_rate": 2.0504718921479648e-07, + "loss": 0.6502, + "step": 26999 + }, + { + "epoch": 0.94, + "learning_rate": 2.0482787684686035e-07, + "loss": 0.6301, + "step": 27000 + }, + { + "epoch": 0.94, + "learning_rate": 2.0460868061308203e-07, + "loss": 0.6161, + "step": 27001 + }, + { + "epoch": 0.94, + "learning_rate": 2.043896005160584e-07, + "loss": 0.5902, + "step": 27002 + }, + { + "epoch": 0.94, + "learning_rate": 2.0417063655838732e-07, + "loss": 0.662, + "step": 27003 + }, + { + "epoch": 0.94, + "learning_rate": 2.0395178874266565e-07, + "loss": 0.573, + "step": 27004 + }, + { + "epoch": 0.94, + "learning_rate": 2.0373305707148684e-07, + "loss": 0.6433, + "step": 27005 + }, + { + "epoch": 0.94, + "learning_rate": 2.0351444154744437e-07, + "loss": 0.6237, + "step": 27006 + }, + { + "epoch": 0.94, + "learning_rate": 2.0329594217313287e-07, + "loss": 0.6391, + "step": 27007 + }, + { + "epoch": 0.94, + "learning_rate": 2.0307755895114023e-07, + "loss": 0.6767, + "step": 27008 + }, + { + "epoch": 0.94, + "learning_rate": 2.0285929188405551e-07, + "loss": 0.6403, + "step": 27009 + }, + { + "epoch": 0.94, + "learning_rate": 2.0264114097446884e-07, + "loss": 0.6763, + "step": 27010 + }, + { + "epoch": 0.94, + "learning_rate": 2.0242310622496374e-07, + "loss": 0.5961, + "step": 27011 + }, + { + "epoch": 0.94, + "learning_rate": 2.0220518763812592e-07, + "loss": 0.6442, + "step": 27012 + }, + { + "epoch": 0.94, + "learning_rate": 2.0198738521654105e-07, + "loss": 0.6475, + "step": 27013 + }, + { + "epoch": 0.94, + "learning_rate": 2.017696989627904e-07, + "loss": 0.6161, + "step": 27014 + }, + { + "epoch": 0.94, + "learning_rate": 2.0155212887945418e-07, + "loss": 0.6449, + "step": 27015 + }, + { + "epoch": 0.94, + "learning_rate": 2.0133467496911364e-07, + "loss": 0.6335, + "step": 27016 + }, + { + "epoch": 0.94, + "learning_rate": 2.0111733723434555e-07, + "loss": 0.6338, + "step": 27017 + }, + { + "epoch": 0.94, + "learning_rate": 2.0090011567772572e-07, + "loss": 0.6334, + "step": 27018 + }, + { + "epoch": 0.94, + "learning_rate": 2.0068301030183313e-07, + "loss": 0.6204, + "step": 27019 + }, + { + "epoch": 0.94, + "learning_rate": 2.0046602110923796e-07, + "loss": 0.6652, + "step": 27020 + }, + { + "epoch": 0.94, + "learning_rate": 2.0024914810251483e-07, + "loss": 0.6553, + "step": 27021 + }, + { + "epoch": 0.94, + "learning_rate": 2.0003239128423614e-07, + "loss": 0.6311, + "step": 27022 + }, + { + "epoch": 0.94, + "learning_rate": 1.9981575065696978e-07, + "loss": 0.6656, + "step": 27023 + }, + { + "epoch": 0.94, + "learning_rate": 1.9959922622328375e-07, + "loss": 0.6516, + "step": 27024 + }, + { + "epoch": 0.94, + "learning_rate": 1.993828179857471e-07, + "loss": 0.65, + "step": 27025 + }, + { + "epoch": 0.94, + "learning_rate": 1.9916652594692552e-07, + "loss": 0.6146, + "step": 27026 + }, + { + "epoch": 0.94, + "learning_rate": 1.9895035010938257e-07, + "loss": 0.6671, + "step": 27027 + }, + { + "epoch": 0.94, + "learning_rate": 1.9873429047568283e-07, + "loss": 0.7014, + "step": 27028 + }, + { + "epoch": 0.94, + "learning_rate": 1.9851834704838535e-07, + "loss": 0.6532, + "step": 27029 + }, + { + "epoch": 0.94, + "learning_rate": 1.9830251983005145e-07, + "loss": 0.5848, + "step": 27030 + }, + { + "epoch": 0.94, + "learning_rate": 1.9808680882324128e-07, + "loss": 0.6328, + "step": 27031 + }, + { + "epoch": 0.94, + "learning_rate": 1.9787121403051057e-07, + "loss": 0.6906, + "step": 27032 + }, + { + "epoch": 0.94, + "learning_rate": 1.976557354544184e-07, + "loss": 0.6437, + "step": 27033 + }, + { + "epoch": 0.94, + "learning_rate": 1.9744037309751607e-07, + "loss": 0.623, + "step": 27034 + }, + { + "epoch": 0.94, + "learning_rate": 1.9722512696235818e-07, + "loss": 0.6588, + "step": 27035 + }, + { + "epoch": 0.94, + "learning_rate": 1.9700999705149715e-07, + "loss": 0.6625, + "step": 27036 + }, + { + "epoch": 0.94, + "learning_rate": 1.9679498336748315e-07, + "loss": 0.6704, + "step": 27037 + }, + { + "epoch": 0.94, + "learning_rate": 1.9658008591286638e-07, + "loss": 0.6504, + "step": 27038 + }, + { + "epoch": 0.94, + "learning_rate": 1.9636530469019478e-07, + "loss": 0.583, + "step": 27039 + }, + { + "epoch": 0.94, + "learning_rate": 1.9615063970201297e-07, + "loss": 0.5704, + "step": 27040 + }, + { + "epoch": 0.94, + "learning_rate": 1.9593609095086674e-07, + "loss": 0.6224, + "step": 27041 + }, + { + "epoch": 0.94, + "learning_rate": 1.957216584393018e-07, + "loss": 0.5598, + "step": 27042 + }, + { + "epoch": 0.94, + "learning_rate": 1.9550734216985724e-07, + "loss": 0.6289, + "step": 27043 + }, + { + "epoch": 0.94, + "learning_rate": 1.9529314214507767e-07, + "loss": 0.6635, + "step": 27044 + }, + { + "epoch": 0.94, + "learning_rate": 1.9507905836750107e-07, + "loss": 0.6803, + "step": 27045 + }, + { + "epoch": 0.94, + "learning_rate": 1.9486509083966432e-07, + "loss": 0.6682, + "step": 27046 + }, + { + "epoch": 0.94, + "learning_rate": 1.9465123956410537e-07, + "loss": 0.6021, + "step": 27047 + }, + { + "epoch": 0.94, + "learning_rate": 1.9443750454336109e-07, + "loss": 0.6452, + "step": 27048 + }, + { + "epoch": 0.94, + "learning_rate": 1.9422388577996277e-07, + "loss": 0.5757, + "step": 27049 + }, + { + "epoch": 0.94, + "learning_rate": 1.9401038327644505e-07, + "loss": 0.6353, + "step": 27050 + }, + { + "epoch": 0.94, + "learning_rate": 1.9379699703534037e-07, + "loss": 0.6546, + "step": 27051 + }, + { + "epoch": 0.94, + "learning_rate": 1.935837270591756e-07, + "loss": 0.6855, + "step": 27052 + }, + { + "epoch": 0.94, + "learning_rate": 1.9337057335048204e-07, + "loss": 0.6499, + "step": 27053 + }, + { + "epoch": 0.94, + "learning_rate": 1.9315753591178432e-07, + "loss": 0.6378, + "step": 27054 + }, + { + "epoch": 0.94, + "learning_rate": 1.9294461474561043e-07, + "loss": 0.6129, + "step": 27055 + }, + { + "epoch": 0.94, + "learning_rate": 1.9273180985448504e-07, + "loss": 0.6851, + "step": 27056 + }, + { + "epoch": 0.94, + "learning_rate": 1.925191212409294e-07, + "loss": 0.6541, + "step": 27057 + }, + { + "epoch": 0.94, + "learning_rate": 1.9230654890746714e-07, + "loss": 0.646, + "step": 27058 + }, + { + "epoch": 0.94, + "learning_rate": 1.920940928566162e-07, + "loss": 0.6338, + "step": 27059 + }, + { + "epoch": 0.94, + "learning_rate": 1.9188175309089675e-07, + "loss": 0.6227, + "step": 27060 + }, + { + "epoch": 0.94, + "learning_rate": 1.916695296128268e-07, + "loss": 0.6132, + "step": 27061 + }, + { + "epoch": 0.94, + "learning_rate": 1.9145742242492217e-07, + "loss": 0.6594, + "step": 27062 + }, + { + "epoch": 0.94, + "learning_rate": 1.9124543152969856e-07, + "loss": 0.6672, + "step": 27063 + }, + { + "epoch": 0.94, + "learning_rate": 1.9103355692966842e-07, + "loss": 0.6569, + "step": 27064 + }, + { + "epoch": 0.94, + "learning_rate": 1.9082179862734306e-07, + "loss": 0.6397, + "step": 27065 + }, + { + "epoch": 0.94, + "learning_rate": 1.9061015662523384e-07, + "loss": 0.6418, + "step": 27066 + }, + { + "epoch": 0.94, + "learning_rate": 1.9039863092584986e-07, + "loss": 0.6358, + "step": 27067 + }, + { + "epoch": 0.94, + "learning_rate": 1.9018722153170023e-07, + "loss": 0.611, + "step": 27068 + }, + { + "epoch": 0.94, + "learning_rate": 1.8997592844529066e-07, + "loss": 0.6204, + "step": 27069 + }, + { + "epoch": 0.94, + "learning_rate": 1.8976475166912588e-07, + "loss": 0.6439, + "step": 27070 + }, + { + "epoch": 0.94, + "learning_rate": 1.8955369120570944e-07, + "loss": 0.6767, + "step": 27071 + }, + { + "epoch": 0.94, + "learning_rate": 1.8934274705754486e-07, + "loss": 0.6247, + "step": 27072 + }, + { + "epoch": 0.94, + "learning_rate": 1.8913191922713236e-07, + "loss": 0.6255, + "step": 27073 + }, + { + "epoch": 0.94, + "learning_rate": 1.889212077169722e-07, + "loss": 0.6324, + "step": 27074 + }, + { + "epoch": 0.94, + "learning_rate": 1.8871061252956235e-07, + "loss": 0.6628, + "step": 27075 + }, + { + "epoch": 0.94, + "learning_rate": 1.885001336673986e-07, + "loss": 0.6699, + "step": 27076 + }, + { + "epoch": 0.94, + "learning_rate": 1.8828977113297786e-07, + "loss": 0.6003, + "step": 27077 + }, + { + "epoch": 0.94, + "learning_rate": 1.8807952492879367e-07, + "loss": 0.6901, + "step": 27078 + }, + { + "epoch": 0.94, + "learning_rate": 1.8786939505733847e-07, + "loss": 0.6563, + "step": 27079 + }, + { + "epoch": 0.94, + "learning_rate": 1.8765938152110473e-07, + "loss": 0.6391, + "step": 27080 + }, + { + "epoch": 0.94, + "learning_rate": 1.8744948432258157e-07, + "loss": 0.6457, + "step": 27081 + }, + { + "epoch": 0.94, + "learning_rate": 1.8723970346425813e-07, + "loss": 0.6387, + "step": 27082 + }, + { + "epoch": 0.94, + "learning_rate": 1.8703003894862016e-07, + "loss": 0.6628, + "step": 27083 + }, + { + "epoch": 0.94, + "learning_rate": 1.8682049077815456e-07, + "loss": 0.6258, + "step": 27084 + }, + { + "epoch": 0.94, + "learning_rate": 1.8661105895534604e-07, + "loss": 0.6408, + "step": 27085 + }, + { + "epoch": 0.94, + "learning_rate": 1.8640174348267815e-07, + "loss": 0.6082, + "step": 27086 + }, + { + "epoch": 0.94, + "learning_rate": 1.8619254436263224e-07, + "loss": 0.6373, + "step": 27087 + }, + { + "epoch": 0.94, + "learning_rate": 1.8598346159768742e-07, + "loss": 0.6652, + "step": 27088 + }, + { + "epoch": 0.94, + "learning_rate": 1.8577449519032288e-07, + "loss": 0.6102, + "step": 27089 + }, + { + "epoch": 0.94, + "learning_rate": 1.8556564514301655e-07, + "loss": 0.6014, + "step": 27090 + }, + { + "epoch": 0.94, + "learning_rate": 1.853569114582454e-07, + "loss": 0.6043, + "step": 27091 + }, + { + "epoch": 0.94, + "learning_rate": 1.8514829413848522e-07, + "loss": 0.6143, + "step": 27092 + }, + { + "epoch": 0.94, + "learning_rate": 1.8493979318620625e-07, + "loss": 0.6365, + "step": 27093 + }, + { + "epoch": 0.94, + "learning_rate": 1.8473140860388207e-07, + "loss": 0.628, + "step": 27094 + }, + { + "epoch": 0.94, + "learning_rate": 1.845231403939829e-07, + "loss": 0.686, + "step": 27095 + }, + { + "epoch": 0.94, + "learning_rate": 1.843149885589801e-07, + "loss": 0.5894, + "step": 27096 + }, + { + "epoch": 0.94, + "learning_rate": 1.8410695310133842e-07, + "loss": 0.6882, + "step": 27097 + }, + { + "epoch": 0.94, + "learning_rate": 1.8389903402352805e-07, + "loss": 0.6768, + "step": 27098 + }, + { + "epoch": 0.94, + "learning_rate": 1.8369123132801038e-07, + "loss": 0.6689, + "step": 27099 + }, + { + "epoch": 0.94, + "learning_rate": 1.834835450172512e-07, + "loss": 0.6243, + "step": 27100 + }, + { + "epoch": 0.94, + "learning_rate": 1.8327597509371186e-07, + "loss": 0.6193, + "step": 27101 + }, + { + "epoch": 0.94, + "learning_rate": 1.830685215598549e-07, + "loss": 0.6533, + "step": 27102 + }, + { + "epoch": 0.94, + "learning_rate": 1.828611844181394e-07, + "loss": 0.6124, + "step": 27103 + }, + { + "epoch": 0.94, + "learning_rate": 1.826539636710234e-07, + "loss": 0.6242, + "step": 27104 + }, + { + "epoch": 0.94, + "learning_rate": 1.8244685932096274e-07, + "loss": 0.6526, + "step": 27105 + }, + { + "epoch": 0.94, + "learning_rate": 1.8223987137041432e-07, + "loss": 0.6344, + "step": 27106 + }, + { + "epoch": 0.94, + "learning_rate": 1.8203299982183175e-07, + "loss": 0.6873, + "step": 27107 + }, + { + "epoch": 0.94, + "learning_rate": 1.818262446776675e-07, + "loss": 0.5985, + "step": 27108 + }, + { + "epoch": 0.94, + "learning_rate": 1.81619605940373e-07, + "loss": 0.588, + "step": 27109 + }, + { + "epoch": 0.94, + "learning_rate": 1.8141308361239952e-07, + "loss": 0.6808, + "step": 27110 + }, + { + "epoch": 0.94, + "learning_rate": 1.8120667769619404e-07, + "loss": 0.6546, + "step": 27111 + }, + { + "epoch": 0.94, + "learning_rate": 1.810003881942035e-07, + "loss": 0.6812, + "step": 27112 + }, + { + "epoch": 0.94, + "learning_rate": 1.8079421510887485e-07, + "loss": 0.6135, + "step": 27113 + }, + { + "epoch": 0.94, + "learning_rate": 1.8058815844265277e-07, + "loss": 0.6309, + "step": 27114 + }, + { + "epoch": 0.94, + "learning_rate": 1.8038221819797863e-07, + "loss": 0.6346, + "step": 27115 + }, + { + "epoch": 0.94, + "learning_rate": 1.8017639437729607e-07, + "loss": 0.6544, + "step": 27116 + }, + { + "epoch": 0.94, + "learning_rate": 1.7997068698304422e-07, + "loss": 0.6369, + "step": 27117 + }, + { + "epoch": 0.94, + "learning_rate": 1.7976509601766222e-07, + "loss": 0.6052, + "step": 27118 + }, + { + "epoch": 0.94, + "learning_rate": 1.7955962148358707e-07, + "loss": 0.6245, + "step": 27119 + }, + { + "epoch": 0.94, + "learning_rate": 1.793542633832568e-07, + "loss": 0.6059, + "step": 27120 + }, + { + "epoch": 0.94, + "learning_rate": 1.7914902171910388e-07, + "loss": 0.6406, + "step": 27121 + }, + { + "epoch": 0.94, + "learning_rate": 1.7894389649356304e-07, + "loss": 0.6664, + "step": 27122 + }, + { + "epoch": 0.94, + "learning_rate": 1.7873888770906678e-07, + "loss": 0.6745, + "step": 27123 + }, + { + "epoch": 0.94, + "learning_rate": 1.7853399536804427e-07, + "loss": 0.7024, + "step": 27124 + }, + { + "epoch": 0.94, + "learning_rate": 1.783292194729247e-07, + "loss": 0.6356, + "step": 27125 + }, + { + "epoch": 0.94, + "learning_rate": 1.781245600261372e-07, + "loss": 0.622, + "step": 27126 + }, + { + "epoch": 0.94, + "learning_rate": 1.7792001703010763e-07, + "loss": 0.5979, + "step": 27127 + }, + { + "epoch": 0.94, + "learning_rate": 1.7771559048726295e-07, + "loss": 0.6256, + "step": 27128 + }, + { + "epoch": 0.94, + "learning_rate": 1.7751128040002342e-07, + "loss": 0.7081, + "step": 27129 + }, + { + "epoch": 0.94, + "learning_rate": 1.7730708677081375e-07, + "loss": 0.6026, + "step": 27130 + }, + { + "epoch": 0.94, + "learning_rate": 1.771030096020543e-07, + "loss": 0.6616, + "step": 27131 + }, + { + "epoch": 0.94, + "learning_rate": 1.7689904889616416e-07, + "loss": 0.6405, + "step": 27132 + }, + { + "epoch": 0.94, + "learning_rate": 1.7669520465556256e-07, + "loss": 0.5755, + "step": 27133 + }, + { + "epoch": 0.94, + "learning_rate": 1.7649147688266643e-07, + "loss": 0.6344, + "step": 27134 + }, + { + "epoch": 0.94, + "learning_rate": 1.762878655798894e-07, + "loss": 0.6504, + "step": 27135 + }, + { + "epoch": 0.94, + "learning_rate": 1.7608437074964734e-07, + "loss": 0.6176, + "step": 27136 + }, + { + "epoch": 0.94, + "learning_rate": 1.7588099239435274e-07, + "loss": 0.641, + "step": 27137 + }, + { + "epoch": 0.94, + "learning_rate": 1.756777305164159e-07, + "loss": 0.6233, + "step": 27138 + }, + { + "epoch": 0.94, + "learning_rate": 1.754745851182482e-07, + "loss": 0.6308, + "step": 27139 + }, + { + "epoch": 0.94, + "learning_rate": 1.7527155620225777e-07, + "loss": 0.6213, + "step": 27140 + }, + { + "epoch": 0.94, + "learning_rate": 1.7506864377085043e-07, + "loss": 0.6299, + "step": 27141 + }, + { + "epoch": 0.94, + "learning_rate": 1.7486584782643313e-07, + "loss": 0.5855, + "step": 27142 + }, + { + "epoch": 0.94, + "learning_rate": 1.746631683714095e-07, + "loss": 0.6606, + "step": 27143 + }, + { + "epoch": 0.94, + "learning_rate": 1.744606054081832e-07, + "loss": 0.6496, + "step": 27144 + }, + { + "epoch": 0.94, + "learning_rate": 1.7425815893915677e-07, + "loss": 0.6083, + "step": 27145 + }, + { + "epoch": 0.94, + "learning_rate": 1.7405582896672934e-07, + "loss": 0.6436, + "step": 27146 + }, + { + "epoch": 0.94, + "learning_rate": 1.7385361549329904e-07, + "loss": 0.6592, + "step": 27147 + }, + { + "epoch": 0.94, + "learning_rate": 1.7365151852126505e-07, + "loss": 0.6565, + "step": 27148 + }, + { + "epoch": 0.94, + "learning_rate": 1.7344953805302212e-07, + "loss": 0.6507, + "step": 27149 + }, + { + "epoch": 0.94, + "learning_rate": 1.732476740909661e-07, + "loss": 0.5943, + "step": 27150 + }, + { + "epoch": 0.94, + "learning_rate": 1.7304592663748954e-07, + "loss": 0.6802, + "step": 27151 + }, + { + "epoch": 0.94, + "learning_rate": 1.7284429569498494e-07, + "loss": 0.6924, + "step": 27152 + }, + { + "epoch": 0.94, + "learning_rate": 1.7264278126584266e-07, + "loss": 0.6353, + "step": 27153 + }, + { + "epoch": 0.94, + "learning_rate": 1.7244138335245185e-07, + "loss": 0.6904, + "step": 27154 + }, + { + "epoch": 0.94, + "learning_rate": 1.7224010195719954e-07, + "loss": 0.6203, + "step": 27155 + }, + { + "epoch": 0.94, + "learning_rate": 1.7203893708247378e-07, + "loss": 0.6341, + "step": 27156 + }, + { + "epoch": 0.94, + "learning_rate": 1.7183788873065933e-07, + "loss": 0.6365, + "step": 27157 + }, + { + "epoch": 0.94, + "learning_rate": 1.7163695690413873e-07, + "loss": 0.6268, + "step": 27158 + }, + { + "epoch": 0.94, + "learning_rate": 1.7143614160529454e-07, + "loss": 0.5908, + "step": 27159 + }, + { + "epoch": 0.94, + "learning_rate": 1.7123544283650817e-07, + "loss": 0.6028, + "step": 27160 + }, + { + "epoch": 0.94, + "learning_rate": 1.7103486060015994e-07, + "loss": 0.6124, + "step": 27161 + }, + { + "epoch": 0.94, + "learning_rate": 1.7083439489862576e-07, + "loss": 0.6355, + "step": 27162 + }, + { + "epoch": 0.94, + "learning_rate": 1.7063404573428587e-07, + "loss": 0.6299, + "step": 27163 + }, + { + "epoch": 0.94, + "learning_rate": 1.704338131095118e-07, + "loss": 0.611, + "step": 27164 + }, + { + "epoch": 0.94, + "learning_rate": 1.7023369702668048e-07, + "loss": 0.662, + "step": 27165 + }, + { + "epoch": 0.94, + "learning_rate": 1.7003369748816223e-07, + "loss": 0.5802, + "step": 27166 + }, + { + "epoch": 0.94, + "learning_rate": 1.6983381449632962e-07, + "loss": 0.637, + "step": 27167 + }, + { + "epoch": 0.94, + "learning_rate": 1.6963404805355298e-07, + "loss": 0.625, + "step": 27168 + }, + { + "epoch": 0.94, + "learning_rate": 1.6943439816220154e-07, + "loss": 0.6617, + "step": 27169 + }, + { + "epoch": 0.94, + "learning_rate": 1.692348648246389e-07, + "loss": 0.6198, + "step": 27170 + }, + { + "epoch": 0.94, + "learning_rate": 1.6903544804323324e-07, + "loss": 0.6363, + "step": 27171 + }, + { + "epoch": 0.94, + "learning_rate": 1.6883614782034929e-07, + "loss": 0.6004, + "step": 27172 + }, + { + "epoch": 0.94, + "learning_rate": 1.6863696415834853e-07, + "loss": 0.6482, + "step": 27173 + }, + { + "epoch": 0.94, + "learning_rate": 1.6843789705959347e-07, + "loss": 0.6265, + "step": 27174 + }, + { + "epoch": 0.94, + "learning_rate": 1.6823894652644447e-07, + "loss": 0.5618, + "step": 27175 + }, + { + "epoch": 0.94, + "learning_rate": 1.6804011256125962e-07, + "loss": 0.6205, + "step": 27176 + }, + { + "epoch": 0.94, + "learning_rate": 1.6784139516639709e-07, + "loss": 0.5948, + "step": 27177 + }, + { + "epoch": 0.94, + "learning_rate": 1.676427943442127e-07, + "loss": 0.6202, + "step": 27178 + }, + { + "epoch": 0.94, + "learning_rate": 1.674443100970602e-07, + "loss": 0.5855, + "step": 27179 + }, + { + "epoch": 0.94, + "learning_rate": 1.672459424272943e-07, + "loss": 0.6094, + "step": 27180 + }, + { + "epoch": 0.94, + "learning_rate": 1.6704769133726652e-07, + "loss": 0.6777, + "step": 27181 + }, + { + "epoch": 0.94, + "learning_rate": 1.6684955682932712e-07, + "loss": 0.6543, + "step": 27182 + }, + { + "epoch": 0.94, + "learning_rate": 1.666515389058243e-07, + "loss": 0.6209, + "step": 27183 + }, + { + "epoch": 0.94, + "learning_rate": 1.6645363756910727e-07, + "loss": 0.5951, + "step": 27184 + }, + { + "epoch": 0.94, + "learning_rate": 1.662558528215219e-07, + "loss": 0.6956, + "step": 27185 + }, + { + "epoch": 0.94, + "learning_rate": 1.66058184665413e-07, + "loss": 0.6261, + "step": 27186 + }, + { + "epoch": 0.94, + "learning_rate": 1.6586063310312539e-07, + "loss": 0.6013, + "step": 27187 + }, + { + "epoch": 0.94, + "learning_rate": 1.6566319813699826e-07, + "loss": 0.627, + "step": 27188 + }, + { + "epoch": 0.94, + "learning_rate": 1.6546587976937534e-07, + "loss": 0.6702, + "step": 27189 + }, + { + "epoch": 0.94, + "learning_rate": 1.6526867800259583e-07, + "loss": 0.6515, + "step": 27190 + }, + { + "epoch": 0.94, + "learning_rate": 1.6507159283899565e-07, + "loss": 0.6645, + "step": 27191 + }, + { + "epoch": 0.94, + "learning_rate": 1.6487462428091404e-07, + "loss": 0.6428, + "step": 27192 + }, + { + "epoch": 0.94, + "learning_rate": 1.6467777233068583e-07, + "loss": 0.6434, + "step": 27193 + }, + { + "epoch": 0.94, + "learning_rate": 1.6448103699064355e-07, + "loss": 0.6489, + "step": 27194 + }, + { + "epoch": 0.94, + "learning_rate": 1.642844182631209e-07, + "loss": 0.652, + "step": 27195 + }, + { + "epoch": 0.94, + "learning_rate": 1.640879161504483e-07, + "loss": 0.5956, + "step": 27196 + }, + { + "epoch": 0.94, + "learning_rate": 1.63891530654956e-07, + "loss": 0.6962, + "step": 27197 + }, + { + "epoch": 0.94, + "learning_rate": 1.6369526177897221e-07, + "loss": 0.5834, + "step": 27198 + }, + { + "epoch": 0.94, + "learning_rate": 1.6349910952482505e-07, + "loss": 0.6568, + "step": 27199 + }, + { + "epoch": 0.94, + "learning_rate": 1.6330307389483823e-07, + "loss": 0.6465, + "step": 27200 + }, + { + "epoch": 0.94, + "learning_rate": 1.6310715489133654e-07, + "loss": 0.6778, + "step": 27201 + }, + { + "epoch": 0.94, + "learning_rate": 1.629113525166448e-07, + "loss": 0.6174, + "step": 27202 + }, + { + "epoch": 0.94, + "learning_rate": 1.6271566677308114e-07, + "loss": 0.6324, + "step": 27203 + }, + { + "epoch": 0.94, + "learning_rate": 1.6252009766296817e-07, + "loss": 0.619, + "step": 27204 + }, + { + "epoch": 0.94, + "learning_rate": 1.623246451886251e-07, + "loss": 0.6056, + "step": 27205 + }, + { + "epoch": 0.94, + "learning_rate": 1.621293093523668e-07, + "loss": 0.6755, + "step": 27206 + }, + { + "epoch": 0.94, + "learning_rate": 1.619340901565114e-07, + "loss": 0.6331, + "step": 27207 + }, + { + "epoch": 0.94, + "learning_rate": 1.6173898760337259e-07, + "loss": 0.592, + "step": 27208 + }, + { + "epoch": 0.94, + "learning_rate": 1.6154400169526186e-07, + "loss": 0.634, + "step": 27209 + }, + { + "epoch": 0.94, + "learning_rate": 1.6134913243449402e-07, + "loss": 0.6402, + "step": 27210 + }, + { + "epoch": 0.94, + "learning_rate": 1.6115437982337835e-07, + "loss": 0.6033, + "step": 27211 + }, + { + "epoch": 0.94, + "learning_rate": 1.6095974386422298e-07, + "loss": 0.6465, + "step": 27212 + }, + { + "epoch": 0.94, + "learning_rate": 1.607652245593372e-07, + "loss": 0.6555, + "step": 27213 + }, + { + "epoch": 0.94, + "learning_rate": 1.605708219110269e-07, + "loss": 0.6737, + "step": 27214 + }, + { + "epoch": 0.94, + "learning_rate": 1.6037653592159365e-07, + "loss": 0.6569, + "step": 27215 + }, + { + "epoch": 0.94, + "learning_rate": 1.6018236659334663e-07, + "loss": 0.6554, + "step": 27216 + }, + { + "epoch": 0.94, + "learning_rate": 1.5998831392858405e-07, + "loss": 0.6476, + "step": 27217 + }, + { + "epoch": 0.94, + "learning_rate": 1.5979437792960738e-07, + "loss": 0.5886, + "step": 27218 + }, + { + "epoch": 0.94, + "learning_rate": 1.5960055859871705e-07, + "loss": 0.6029, + "step": 27219 + }, + { + "epoch": 0.94, + "learning_rate": 1.5940685593821003e-07, + "loss": 0.666, + "step": 27220 + }, + { + "epoch": 0.94, + "learning_rate": 1.5921326995038122e-07, + "loss": 0.626, + "step": 27221 + }, + { + "epoch": 0.94, + "learning_rate": 1.5901980063752988e-07, + "loss": 0.6524, + "step": 27222 + }, + { + "epoch": 0.94, + "learning_rate": 1.5882644800194747e-07, + "loss": 0.6342, + "step": 27223 + }, + { + "epoch": 0.94, + "learning_rate": 1.5863321204592662e-07, + "loss": 0.6523, + "step": 27224 + }, + { + "epoch": 0.94, + "learning_rate": 1.5844009277175887e-07, + "loss": 0.5684, + "step": 27225 + }, + { + "epoch": 0.94, + "learning_rate": 1.5824709018173233e-07, + "loss": 0.72, + "step": 27226 + }, + { + "epoch": 0.94, + "learning_rate": 1.5805420427813634e-07, + "loss": 0.6342, + "step": 27227 + }, + { + "epoch": 0.94, + "learning_rate": 1.5786143506325902e-07, + "loss": 0.6208, + "step": 27228 + }, + { + "epoch": 0.94, + "learning_rate": 1.576687825393841e-07, + "loss": 0.6587, + "step": 27229 + }, + { + "epoch": 0.94, + "learning_rate": 1.5747624670879647e-07, + "loss": 0.652, + "step": 27230 + }, + { + "epoch": 0.94, + "learning_rate": 1.572838275737787e-07, + "loss": 0.6413, + "step": 27231 + }, + { + "epoch": 0.94, + "learning_rate": 1.570915251366123e-07, + "loss": 0.6232, + "step": 27232 + }, + { + "epoch": 0.94, + "learning_rate": 1.568993393995766e-07, + "loss": 0.684, + "step": 27233 + }, + { + "epoch": 0.94, + "learning_rate": 1.5670727036495193e-07, + "loss": 0.6378, + "step": 27234 + }, + { + "epoch": 0.94, + "learning_rate": 1.565153180350143e-07, + "loss": 0.6868, + "step": 27235 + }, + { + "epoch": 0.94, + "learning_rate": 1.5632348241203853e-07, + "loss": 0.5763, + "step": 27236 + }, + { + "epoch": 0.94, + "learning_rate": 1.5613176349830173e-07, + "loss": 0.656, + "step": 27237 + }, + { + "epoch": 0.94, + "learning_rate": 1.5594016129607426e-07, + "loss": 0.6258, + "step": 27238 + }, + { + "epoch": 0.94, + "learning_rate": 1.5574867580762875e-07, + "loss": 0.6556, + "step": 27239 + }, + { + "epoch": 0.94, + "learning_rate": 1.5555730703523675e-07, + "loss": 0.638, + "step": 27240 + }, + { + "epoch": 0.94, + "learning_rate": 1.553660549811664e-07, + "loss": 0.6066, + "step": 27241 + }, + { + "epoch": 0.94, + "learning_rate": 1.5517491964768373e-07, + "loss": 0.6234, + "step": 27242 + }, + { + "epoch": 0.94, + "learning_rate": 1.5498390103705795e-07, + "loss": 0.6709, + "step": 27243 + }, + { + "epoch": 0.94, + "learning_rate": 1.5479299915155066e-07, + "loss": 0.5819, + "step": 27244 + }, + { + "epoch": 0.94, + "learning_rate": 1.5460221399342557e-07, + "loss": 0.6269, + "step": 27245 + }, + { + "epoch": 0.94, + "learning_rate": 1.5441154556494753e-07, + "loss": 0.6293, + "step": 27246 + }, + { + "epoch": 0.94, + "learning_rate": 1.5422099386837475e-07, + "loss": 0.6502, + "step": 27247 + }, + { + "epoch": 0.94, + "learning_rate": 1.5403055890596764e-07, + "loss": 0.6474, + "step": 27248 + }, + { + "epoch": 0.94, + "learning_rate": 1.5384024067998326e-07, + "loss": 0.6467, + "step": 27249 + }, + { + "epoch": 0.94, + "learning_rate": 1.5365003919267761e-07, + "loss": 0.6418, + "step": 27250 + }, + { + "epoch": 0.94, + "learning_rate": 1.5345995444630557e-07, + "loss": 0.6646, + "step": 27251 + }, + { + "epoch": 0.94, + "learning_rate": 1.532699864431242e-07, + "loss": 0.6483, + "step": 27252 + }, + { + "epoch": 0.94, + "learning_rate": 1.5308013518538166e-07, + "loss": 0.7064, + "step": 27253 + }, + { + "epoch": 0.94, + "learning_rate": 1.5289040067533067e-07, + "loss": 0.6146, + "step": 27254 + }, + { + "epoch": 0.94, + "learning_rate": 1.527007829152216e-07, + "loss": 0.6221, + "step": 27255 + }, + { + "epoch": 0.94, + "learning_rate": 1.5251128190730047e-07, + "loss": 0.6285, + "step": 27256 + }, + { + "epoch": 0.94, + "learning_rate": 1.5232189765381544e-07, + "loss": 0.6242, + "step": 27257 + }, + { + "epoch": 0.94, + "learning_rate": 1.5213263015701252e-07, + "loss": 0.6706, + "step": 27258 + }, + { + "epoch": 0.94, + "learning_rate": 1.5194347941913434e-07, + "loss": 0.609, + "step": 27259 + }, + { + "epoch": 0.94, + "learning_rate": 1.5175444544242357e-07, + "loss": 0.6515, + "step": 27260 + }, + { + "epoch": 0.94, + "learning_rate": 1.5156552822912284e-07, + "loss": 0.6144, + "step": 27261 + }, + { + "epoch": 0.94, + "learning_rate": 1.513767277814715e-07, + "loss": 0.5802, + "step": 27262 + }, + { + "epoch": 0.94, + "learning_rate": 1.5118804410170551e-07, + "loss": 0.6577, + "step": 27263 + }, + { + "epoch": 0.94, + "learning_rate": 1.509994771920664e-07, + "loss": 0.6093, + "step": 27264 + }, + { + "epoch": 0.94, + "learning_rate": 1.5081102705478578e-07, + "loss": 0.6797, + "step": 27265 + }, + { + "epoch": 0.94, + "learning_rate": 1.506226936921007e-07, + "loss": 0.6231, + "step": 27266 + }, + { + "epoch": 0.94, + "learning_rate": 1.504344771062438e-07, + "loss": 0.6018, + "step": 27267 + }, + { + "epoch": 0.94, + "learning_rate": 1.5024637729944446e-07, + "loss": 0.6071, + "step": 27268 + }, + { + "epoch": 0.94, + "learning_rate": 1.500583942739342e-07, + "loss": 0.624, + "step": 27269 + }, + { + "epoch": 0.94, + "learning_rate": 1.4987052803194345e-07, + "loss": 0.548, + "step": 27270 + }, + { + "epoch": 0.94, + "learning_rate": 1.4968277857569713e-07, + "loss": 0.6405, + "step": 27271 + }, + { + "epoch": 0.94, + "learning_rate": 1.494951459074212e-07, + "loss": 0.6323, + "step": 27272 + }, + { + "epoch": 0.94, + "learning_rate": 1.493076300293439e-07, + "loss": 0.6614, + "step": 27273 + }, + { + "epoch": 0.94, + "learning_rate": 1.4912023094368344e-07, + "loss": 0.6907, + "step": 27274 + }, + { + "epoch": 0.95, + "learning_rate": 1.4893294865266472e-07, + "loss": 0.5816, + "step": 27275 + }, + { + "epoch": 0.95, + "learning_rate": 1.487457831585082e-07, + "loss": 0.6111, + "step": 27276 + }, + { + "epoch": 0.95, + "learning_rate": 1.4855873446343093e-07, + "loss": 0.6537, + "step": 27277 + }, + { + "epoch": 0.95, + "learning_rate": 1.4837180256965456e-07, + "loss": 0.6658, + "step": 27278 + }, + { + "epoch": 0.95, + "learning_rate": 1.4818498747939058e-07, + "loss": 0.588, + "step": 27279 + }, + { + "epoch": 0.95, + "learning_rate": 1.4799828919485616e-07, + "loss": 0.6767, + "step": 27280 + }, + { + "epoch": 0.95, + "learning_rate": 1.4781170771826615e-07, + "loss": 0.5846, + "step": 27281 + }, + { + "epoch": 0.95, + "learning_rate": 1.47625243051831e-07, + "loss": 0.6786, + "step": 27282 + }, + { + "epoch": 0.95, + "learning_rate": 1.4743889519776122e-07, + "loss": 0.6055, + "step": 27283 + }, + { + "epoch": 0.95, + "learning_rate": 1.4725266415826834e-07, + "loss": 0.5877, + "step": 27284 + }, + { + "epoch": 0.95, + "learning_rate": 1.4706654993555724e-07, + "loss": 0.5401, + "step": 27285 + }, + { + "epoch": 0.95, + "learning_rate": 1.4688055253183732e-07, + "loss": 0.5993, + "step": 27286 + }, + { + "epoch": 0.95, + "learning_rate": 1.466946719493123e-07, + "loss": 0.663, + "step": 27287 + }, + { + "epoch": 0.95, + "learning_rate": 1.4650890819018604e-07, + "loss": 0.6753, + "step": 27288 + }, + { + "epoch": 0.95, + "learning_rate": 1.4632326125666117e-07, + "loss": 0.5775, + "step": 27289 + }, + { + "epoch": 0.95, + "learning_rate": 1.4613773115094044e-07, + "loss": 0.6325, + "step": 27290 + }, + { + "epoch": 0.95, + "learning_rate": 1.45952317875222e-07, + "loss": 0.6512, + "step": 27291 + }, + { + "epoch": 0.95, + "learning_rate": 1.4576702143170308e-07, + "loss": 0.6038, + "step": 27292 + }, + { + "epoch": 0.95, + "learning_rate": 1.4558184182258182e-07, + "loss": 0.6331, + "step": 27293 + }, + { + "epoch": 0.95, + "learning_rate": 1.4539677905005433e-07, + "loss": 0.6402, + "step": 27294 + }, + { + "epoch": 0.95, + "learning_rate": 1.4521183311631437e-07, + "loss": 0.639, + "step": 27295 + }, + { + "epoch": 0.95, + "learning_rate": 1.4502700402355462e-07, + "loss": 0.6705, + "step": 27296 + }, + { + "epoch": 0.95, + "learning_rate": 1.4484229177396557e-07, + "loss": 0.6322, + "step": 27297 + }, + { + "epoch": 0.95, + "learning_rate": 1.446576963697388e-07, + "loss": 0.6149, + "step": 27298 + }, + { + "epoch": 0.95, + "learning_rate": 1.4447321781306144e-07, + "loss": 0.6857, + "step": 27299 + }, + { + "epoch": 0.95, + "learning_rate": 1.4428885610612064e-07, + "loss": 0.6348, + "step": 27300 + }, + { + "epoch": 0.95, + "learning_rate": 1.4410461125110464e-07, + "loss": 0.6341, + "step": 27301 + }, + { + "epoch": 0.95, + "learning_rate": 1.4392048325019613e-07, + "loss": 0.6715, + "step": 27302 + }, + { + "epoch": 0.95, + "learning_rate": 1.4373647210557673e-07, + "loss": 0.6265, + "step": 27303 + }, + { + "epoch": 0.95, + "learning_rate": 1.4355257781943134e-07, + "loss": 0.5706, + "step": 27304 + }, + { + "epoch": 0.95, + "learning_rate": 1.4336880039393708e-07, + "loss": 0.589, + "step": 27305 + }, + { + "epoch": 0.95, + "learning_rate": 1.431851398312756e-07, + "loss": 0.6401, + "step": 27306 + }, + { + "epoch": 0.95, + "learning_rate": 1.4300159613362285e-07, + "loss": 0.6098, + "step": 27307 + }, + { + "epoch": 0.95, + "learning_rate": 1.4281816930315606e-07, + "loss": 0.6313, + "step": 27308 + }, + { + "epoch": 0.95, + "learning_rate": 1.4263485934204792e-07, + "loss": 0.6509, + "step": 27309 + }, + { + "epoch": 0.95, + "learning_rate": 1.424516662524744e-07, + "loss": 0.5734, + "step": 27310 + }, + { + "epoch": 0.95, + "learning_rate": 1.42268590036605e-07, + "loss": 0.573, + "step": 27311 + }, + { + "epoch": 0.95, + "learning_rate": 1.420856306966123e-07, + "loss": 0.6241, + "step": 27312 + }, + { + "epoch": 0.95, + "learning_rate": 1.4190278823466462e-07, + "loss": 0.5688, + "step": 27313 + }, + { + "epoch": 0.95, + "learning_rate": 1.4172006265293025e-07, + "loss": 0.644, + "step": 27314 + }, + { + "epoch": 0.95, + "learning_rate": 1.4153745395357522e-07, + "loss": 0.633, + "step": 27315 + }, + { + "epoch": 0.95, + "learning_rate": 1.4135496213876444e-07, + "loss": 0.6838, + "step": 27316 + }, + { + "epoch": 0.95, + "learning_rate": 1.4117258721066173e-07, + "loss": 0.6167, + "step": 27317 + }, + { + "epoch": 0.95, + "learning_rate": 1.4099032917142986e-07, + "loss": 0.6181, + "step": 27318 + }, + { + "epoch": 0.95, + "learning_rate": 1.4080818802322926e-07, + "loss": 0.6397, + "step": 27319 + }, + { + "epoch": 0.95, + "learning_rate": 1.4062616376822046e-07, + "loss": 0.5975, + "step": 27320 + }, + { + "epoch": 0.95, + "learning_rate": 1.4044425640855953e-07, + "loss": 0.6546, + "step": 27321 + }, + { + "epoch": 0.95, + "learning_rate": 1.4026246594640358e-07, + "loss": 0.6763, + "step": 27322 + }, + { + "epoch": 0.95, + "learning_rate": 1.400807923839098e-07, + "loss": 0.6162, + "step": 27323 + }, + { + "epoch": 0.95, + "learning_rate": 1.3989923572323094e-07, + "loss": 0.5743, + "step": 27324 + }, + { + "epoch": 0.95, + "learning_rate": 1.3971779596651968e-07, + "loss": 0.6318, + "step": 27325 + }, + { + "epoch": 0.95, + "learning_rate": 1.3953647311592766e-07, + "loss": 0.5899, + "step": 27326 + }, + { + "epoch": 0.95, + "learning_rate": 1.3935526717360425e-07, + "loss": 0.6955, + "step": 27327 + }, + { + "epoch": 0.95, + "learning_rate": 1.3917417814169777e-07, + "loss": 0.641, + "step": 27328 + }, + { + "epoch": 0.95, + "learning_rate": 1.3899320602235422e-07, + "loss": 0.6392, + "step": 27329 + }, + { + "epoch": 0.95, + "learning_rate": 1.3881235081772194e-07, + "loss": 0.6097, + "step": 27330 + }, + { + "epoch": 0.95, + "learning_rate": 1.386316125299436e-07, + "loss": 0.5944, + "step": 27331 + }, + { + "epoch": 0.95, + "learning_rate": 1.3845099116116201e-07, + "loss": 0.6228, + "step": 27332 + }, + { + "epoch": 0.95, + "learning_rate": 1.3827048671351871e-07, + "loss": 0.6339, + "step": 27333 + }, + { + "epoch": 0.95, + "learning_rate": 1.3809009918915318e-07, + "loss": 0.6396, + "step": 27334 + }, + { + "epoch": 0.95, + "learning_rate": 1.3790982859020584e-07, + "loss": 0.6403, + "step": 27335 + }, + { + "epoch": 0.95, + "learning_rate": 1.3772967491881283e-07, + "loss": 0.6664, + "step": 27336 + }, + { + "epoch": 0.95, + "learning_rate": 1.375496381771102e-07, + "loss": 0.6611, + "step": 27337 + }, + { + "epoch": 0.95, + "learning_rate": 1.37369718367234e-07, + "loss": 0.6218, + "step": 27338 + }, + { + "epoch": 0.95, + "learning_rate": 1.3718991549131477e-07, + "loss": 0.616, + "step": 27339 + }, + { + "epoch": 0.95, + "learning_rate": 1.3701022955148525e-07, + "loss": 0.6777, + "step": 27340 + }, + { + "epoch": 0.95, + "learning_rate": 1.3683066054987703e-07, + "loss": 0.6556, + "step": 27341 + }, + { + "epoch": 0.95, + "learning_rate": 1.3665120848861846e-07, + "loss": 0.654, + "step": 27342 + }, + { + "epoch": 0.95, + "learning_rate": 1.3647187336983668e-07, + "loss": 0.6312, + "step": 27343 + }, + { + "epoch": 0.95, + "learning_rate": 1.3629265519565782e-07, + "loss": 0.5841, + "step": 27344 + }, + { + "epoch": 0.95, + "learning_rate": 1.361135539682079e-07, + "loss": 0.6948, + "step": 27345 + }, + { + "epoch": 0.95, + "learning_rate": 1.359345696896097e-07, + "loss": 0.6234, + "step": 27346 + }, + { + "epoch": 0.95, + "learning_rate": 1.3575570236198487e-07, + "loss": 0.6146, + "step": 27347 + }, + { + "epoch": 0.95, + "learning_rate": 1.3557695198745391e-07, + "loss": 0.5771, + "step": 27348 + }, + { + "epoch": 0.95, + "learning_rate": 1.3539831856813845e-07, + "loss": 0.5985, + "step": 27349 + }, + { + "epoch": 0.95, + "learning_rate": 1.352198021061535e-07, + "loss": 0.6075, + "step": 27350 + }, + { + "epoch": 0.95, + "learning_rate": 1.350414026036162e-07, + "loss": 0.6573, + "step": 27351 + }, + { + "epoch": 0.95, + "learning_rate": 1.348631200626438e-07, + "loss": 0.5941, + "step": 27352 + }, + { + "epoch": 0.95, + "learning_rate": 1.346849544853479e-07, + "loss": 0.604, + "step": 27353 + }, + { + "epoch": 0.95, + "learning_rate": 1.345069058738413e-07, + "loss": 0.5983, + "step": 27354 + }, + { + "epoch": 0.95, + "learning_rate": 1.3432897423023562e-07, + "loss": 0.6616, + "step": 27355 + }, + { + "epoch": 0.95, + "learning_rate": 1.3415115955664026e-07, + "loss": 0.5747, + "step": 27356 + }, + { + "epoch": 0.95, + "learning_rate": 1.3397346185516246e-07, + "loss": 0.6284, + "step": 27357 + }, + { + "epoch": 0.95, + "learning_rate": 1.3379588112791053e-07, + "loss": 0.6057, + "step": 27358 + }, + { + "epoch": 0.95, + "learning_rate": 1.3361841737698832e-07, + "loss": 0.6002, + "step": 27359 + }, + { + "epoch": 0.95, + "learning_rate": 1.3344107060450195e-07, + "loss": 0.6241, + "step": 27360 + }, + { + "epoch": 0.95, + "learning_rate": 1.3326384081255306e-07, + "loss": 0.6599, + "step": 27361 + }, + { + "epoch": 0.95, + "learning_rate": 1.3308672800324218e-07, + "loss": 0.594, + "step": 27362 + }, + { + "epoch": 0.95, + "learning_rate": 1.3290973217866987e-07, + "loss": 0.6246, + "step": 27363 + }, + { + "epoch": 0.95, + "learning_rate": 1.3273285334093444e-07, + "loss": 0.631, + "step": 27364 + }, + { + "epoch": 0.95, + "learning_rate": 1.325560914921331e-07, + "loss": 0.6736, + "step": 27365 + }, + { + "epoch": 0.95, + "learning_rate": 1.3237944663436198e-07, + "loss": 0.6446, + "step": 27366 + }, + { + "epoch": 0.95, + "learning_rate": 1.3220291876971602e-07, + "loss": 0.5744, + "step": 27367 + }, + { + "epoch": 0.95, + "learning_rate": 1.3202650790028692e-07, + "loss": 0.6221, + "step": 27368 + }, + { + "epoch": 0.95, + "learning_rate": 1.3185021402816524e-07, + "loss": 0.6923, + "step": 27369 + }, + { + "epoch": 0.95, + "learning_rate": 1.316740371554437e-07, + "loss": 0.661, + "step": 27370 + }, + { + "epoch": 0.95, + "learning_rate": 1.3149797728420954e-07, + "loss": 0.6555, + "step": 27371 + }, + { + "epoch": 0.95, + "learning_rate": 1.3132203441655112e-07, + "loss": 0.6419, + "step": 27372 + }, + { + "epoch": 0.95, + "learning_rate": 1.311462085545534e-07, + "loss": 0.6625, + "step": 27373 + }, + { + "epoch": 0.95, + "learning_rate": 1.309704997003025e-07, + "loss": 0.6675, + "step": 27374 + }, + { + "epoch": 0.95, + "learning_rate": 1.30794907855879e-07, + "loss": 0.5569, + "step": 27375 + }, + { + "epoch": 0.95, + "learning_rate": 1.306194330233679e-07, + "loss": 0.6538, + "step": 27376 + }, + { + "epoch": 0.95, + "learning_rate": 1.304440752048475e-07, + "loss": 0.6899, + "step": 27377 + }, + { + "epoch": 0.95, + "learning_rate": 1.3026883440239724e-07, + "loss": 0.6805, + "step": 27378 + }, + { + "epoch": 0.95, + "learning_rate": 1.3009371061809662e-07, + "loss": 0.5782, + "step": 27379 + }, + { + "epoch": 0.95, + "learning_rate": 1.2991870385402062e-07, + "loss": 0.6331, + "step": 27380 + }, + { + "epoch": 0.95, + "learning_rate": 1.2974381411224313e-07, + "loss": 0.6164, + "step": 27381 + }, + { + "epoch": 0.95, + "learning_rate": 1.2956904139483806e-07, + "loss": 0.577, + "step": 27382 + }, + { + "epoch": 0.95, + "learning_rate": 1.293943857038793e-07, + "loss": 0.6226, + "step": 27383 + }, + { + "epoch": 0.95, + "learning_rate": 1.292198470414352e-07, + "loss": 0.6171, + "step": 27384 + }, + { + "epoch": 0.95, + "learning_rate": 1.2904542540957853e-07, + "loss": 0.5969, + "step": 27385 + }, + { + "epoch": 0.95, + "learning_rate": 1.2887112081037434e-07, + "loss": 0.5821, + "step": 27386 + }, + { + "epoch": 0.95, + "learning_rate": 1.2869693324588871e-07, + "loss": 0.6242, + "step": 27387 + }, + { + "epoch": 0.95, + "learning_rate": 1.2852286271818893e-07, + "loss": 0.6292, + "step": 27388 + }, + { + "epoch": 0.95, + "learning_rate": 1.2834890922933885e-07, + "loss": 0.654, + "step": 27389 + }, + { + "epoch": 0.95, + "learning_rate": 1.2817507278139906e-07, + "loss": 0.6717, + "step": 27390 + }, + { + "epoch": 0.95, + "learning_rate": 1.2800135337643348e-07, + "loss": 0.636, + "step": 27391 + }, + { + "epoch": 0.95, + "learning_rate": 1.2782775101649824e-07, + "loss": 0.6451, + "step": 27392 + }, + { + "epoch": 0.95, + "learning_rate": 1.276542657036539e-07, + "loss": 0.6184, + "step": 27393 + }, + { + "epoch": 0.95, + "learning_rate": 1.2748089743995661e-07, + "loss": 0.6174, + "step": 27394 + }, + { + "epoch": 0.95, + "learning_rate": 1.273076462274625e-07, + "loss": 0.6491, + "step": 27395 + }, + { + "epoch": 0.95, + "learning_rate": 1.2713451206822547e-07, + "loss": 0.5982, + "step": 27396 + }, + { + "epoch": 0.95, + "learning_rate": 1.269614949642972e-07, + "loss": 0.5853, + "step": 27397 + }, + { + "epoch": 0.95, + "learning_rate": 1.2678859491773055e-07, + "loss": 0.6209, + "step": 27398 + }, + { + "epoch": 0.95, + "learning_rate": 1.2661581193057494e-07, + "loss": 0.6495, + "step": 27399 + }, + { + "epoch": 0.95, + "learning_rate": 1.264431460048776e-07, + "loss": 0.604, + "step": 27400 + }, + { + "epoch": 0.95, + "learning_rate": 1.2627059714268807e-07, + "loss": 0.5604, + "step": 27401 + }, + { + "epoch": 0.95, + "learning_rate": 1.2609816534605135e-07, + "loss": 0.5694, + "step": 27402 + }, + { + "epoch": 0.95, + "learning_rate": 1.2592585061701024e-07, + "loss": 0.6444, + "step": 27403 + }, + { + "epoch": 0.95, + "learning_rate": 1.2575365295760977e-07, + "loss": 0.6154, + "step": 27404 + }, + { + "epoch": 0.95, + "learning_rate": 1.2558157236989055e-07, + "loss": 0.6483, + "step": 27405 + }, + { + "epoch": 0.95, + "learning_rate": 1.2540960885589203e-07, + "loss": 0.5934, + "step": 27406 + }, + { + "epoch": 0.95, + "learning_rate": 1.2523776241765483e-07, + "loss": 0.675, + "step": 27407 + }, + { + "epoch": 0.95, + "learning_rate": 1.250660330572151e-07, + "loss": 0.6075, + "step": 27408 + }, + { + "epoch": 0.95, + "learning_rate": 1.2489442077661007e-07, + "loss": 0.6159, + "step": 27409 + }, + { + "epoch": 0.95, + "learning_rate": 1.247229255778737e-07, + "loss": 0.6658, + "step": 27410 + }, + { + "epoch": 0.95, + "learning_rate": 1.245515474630399e-07, + "loss": 0.6498, + "step": 27411 + }, + { + "epoch": 0.95, + "learning_rate": 1.2438028643413812e-07, + "loss": 0.6079, + "step": 27412 + }, + { + "epoch": 0.95, + "learning_rate": 1.2420914249320127e-07, + "loss": 0.6277, + "step": 27413 + }, + { + "epoch": 0.95, + "learning_rate": 1.2403811564225988e-07, + "loss": 0.5776, + "step": 27414 + }, + { + "epoch": 0.95, + "learning_rate": 1.238672058833379e-07, + "loss": 0.642, + "step": 27415 + }, + { + "epoch": 0.95, + "learning_rate": 1.2369641321846482e-07, + "loss": 0.6389, + "step": 27416 + }, + { + "epoch": 0.95, + "learning_rate": 1.2352573764966346e-07, + "loss": 0.6467, + "step": 27417 + }, + { + "epoch": 0.95, + "learning_rate": 1.2335517917895778e-07, + "loss": 0.5883, + "step": 27418 + }, + { + "epoch": 0.95, + "learning_rate": 1.231847378083717e-07, + "loss": 0.6859, + "step": 27419 + }, + { + "epoch": 0.95, + "learning_rate": 1.2301441353992472e-07, + "loss": 0.6549, + "step": 27420 + }, + { + "epoch": 0.95, + "learning_rate": 1.228442063756352e-07, + "loss": 0.6006, + "step": 27421 + }, + { + "epoch": 0.95, + "learning_rate": 1.226741163175238e-07, + "loss": 0.6373, + "step": 27422 + }, + { + "epoch": 0.95, + "learning_rate": 1.2250414336760442e-07, + "loss": 0.6215, + "step": 27423 + }, + { + "epoch": 0.95, + "learning_rate": 1.2233428752789322e-07, + "loss": 0.6529, + "step": 27424 + }, + { + "epoch": 0.95, + "learning_rate": 1.221645488004053e-07, + "loss": 0.5862, + "step": 27425 + }, + { + "epoch": 0.95, + "learning_rate": 1.2199492718715233e-07, + "loss": 0.6405, + "step": 27426 + }, + { + "epoch": 0.95, + "learning_rate": 1.2182542269014496e-07, + "loss": 0.6722, + "step": 27427 + }, + { + "epoch": 0.95, + "learning_rate": 1.216560353113927e-07, + "loss": 0.6299, + "step": 27428 + }, + { + "epoch": 0.95, + "learning_rate": 1.2148676505290502e-07, + "loss": 0.6224, + "step": 27429 + }, + { + "epoch": 0.95, + "learning_rate": 1.21317611916687e-07, + "loss": 0.6487, + "step": 27430 + }, + { + "epoch": 0.95, + "learning_rate": 1.2114857590474592e-07, + "loss": 0.5789, + "step": 27431 + }, + { + "epoch": 0.95, + "learning_rate": 1.2097965701908576e-07, + "loss": 0.6338, + "step": 27432 + }, + { + "epoch": 0.95, + "learning_rate": 1.2081085526170932e-07, + "loss": 0.6359, + "step": 27433 + }, + { + "epoch": 0.95, + "learning_rate": 1.2064217063461615e-07, + "loss": 0.6406, + "step": 27434 + }, + { + "epoch": 0.95, + "learning_rate": 1.2047360313980794e-07, + "loss": 0.6244, + "step": 27435 + }, + { + "epoch": 0.95, + "learning_rate": 1.20305152779282e-07, + "loss": 0.6436, + "step": 27436 + }, + { + "epoch": 0.95, + "learning_rate": 1.2013681955503786e-07, + "loss": 0.5753, + "step": 27437 + }, + { + "epoch": 0.95, + "learning_rate": 1.1996860346906948e-07, + "loss": 0.5927, + "step": 27438 + }, + { + "epoch": 0.95, + "learning_rate": 1.1980050452337078e-07, + "loss": 0.6866, + "step": 27439 + }, + { + "epoch": 0.95, + "learning_rate": 1.1963252271993574e-07, + "loss": 0.6499, + "step": 27440 + }, + { + "epoch": 0.95, + "learning_rate": 1.1946465806075724e-07, + "loss": 0.6138, + "step": 27441 + }, + { + "epoch": 0.95, + "learning_rate": 1.1929691054782256e-07, + "loss": 0.6724, + "step": 27442 + }, + { + "epoch": 0.95, + "learning_rate": 1.1912928018312231e-07, + "loss": 0.6525, + "step": 27443 + }, + { + "epoch": 0.95, + "learning_rate": 1.1896176696864492e-07, + "loss": 0.6677, + "step": 27444 + }, + { + "epoch": 0.95, + "learning_rate": 1.1879437090637436e-07, + "loss": 0.5987, + "step": 27445 + }, + { + "epoch": 0.95, + "learning_rate": 1.1862709199829681e-07, + "loss": 0.6263, + "step": 27446 + }, + { + "epoch": 0.95, + "learning_rate": 1.1845993024639512e-07, + "loss": 0.6326, + "step": 27447 + }, + { + "epoch": 0.95, + "learning_rate": 1.1829288565264996e-07, + "loss": 0.5902, + "step": 27448 + }, + { + "epoch": 0.95, + "learning_rate": 1.1812595821904415e-07, + "loss": 0.6388, + "step": 27449 + }, + { + "epoch": 0.95, + "learning_rate": 1.1795914794755614e-07, + "loss": 0.6471, + "step": 27450 + }, + { + "epoch": 0.95, + "learning_rate": 1.1779245484016321e-07, + "loss": 0.6141, + "step": 27451 + }, + { + "epoch": 0.95, + "learning_rate": 1.1762587889884048e-07, + "loss": 0.6608, + "step": 27452 + }, + { + "epoch": 0.95, + "learning_rate": 1.1745942012556633e-07, + "loss": 0.6909, + "step": 27453 + }, + { + "epoch": 0.95, + "learning_rate": 1.1729307852231032e-07, + "loss": 0.6531, + "step": 27454 + }, + { + "epoch": 0.95, + "learning_rate": 1.1712685409104641e-07, + "loss": 0.6078, + "step": 27455 + }, + { + "epoch": 0.95, + "learning_rate": 1.1696074683374748e-07, + "loss": 0.6757, + "step": 27456 + }, + { + "epoch": 0.95, + "learning_rate": 1.1679475675237972e-07, + "loss": 0.6374, + "step": 27457 + }, + { + "epoch": 0.95, + "learning_rate": 1.1662888384891269e-07, + "loss": 0.6258, + "step": 27458 + }, + { + "epoch": 0.95, + "learning_rate": 1.1646312812531257e-07, + "loss": 0.6221, + "step": 27459 + }, + { + "epoch": 0.95, + "learning_rate": 1.1629748958354448e-07, + "loss": 0.6418, + "step": 27460 + }, + { + "epoch": 0.95, + "learning_rate": 1.1613196822557238e-07, + "loss": 0.64, + "step": 27461 + }, + { + "epoch": 0.95, + "learning_rate": 1.1596656405336026e-07, + "loss": 0.607, + "step": 27462 + }, + { + "epoch": 0.95, + "learning_rate": 1.1580127706886767e-07, + "loss": 0.6184, + "step": 27463 + }, + { + "epoch": 0.95, + "learning_rate": 1.1563610727405417e-07, + "loss": 0.6843, + "step": 27464 + }, + { + "epoch": 0.95, + "learning_rate": 1.1547105467087815e-07, + "loss": 0.5965, + "step": 27465 + }, + { + "epoch": 0.95, + "learning_rate": 1.1530611926129698e-07, + "loss": 0.5925, + "step": 27466 + }, + { + "epoch": 0.95, + "learning_rate": 1.1514130104726573e-07, + "loss": 0.633, + "step": 27467 + }, + { + "epoch": 0.95, + "learning_rate": 1.1497660003073952e-07, + "loss": 0.6137, + "step": 27468 + }, + { + "epoch": 0.95, + "learning_rate": 1.14812016213669e-07, + "loss": 0.6052, + "step": 27469 + }, + { + "epoch": 0.95, + "learning_rate": 1.1464754959800817e-07, + "loss": 0.6549, + "step": 27470 + }, + { + "epoch": 0.95, + "learning_rate": 1.1448320018570547e-07, + "loss": 0.6085, + "step": 27471 + }, + { + "epoch": 0.95, + "learning_rate": 1.1431896797870823e-07, + "loss": 0.58, + "step": 27472 + }, + { + "epoch": 0.95, + "learning_rate": 1.1415485297896711e-07, + "loss": 0.6481, + "step": 27473 + }, + { + "epoch": 0.95, + "learning_rate": 1.1399085518842502e-07, + "loss": 0.6199, + "step": 27474 + }, + { + "epoch": 0.95, + "learning_rate": 1.1382697460902703e-07, + "loss": 0.6577, + "step": 27475 + }, + { + "epoch": 0.95, + "learning_rate": 1.1366321124271717e-07, + "loss": 0.6114, + "step": 27476 + }, + { + "epoch": 0.95, + "learning_rate": 1.1349956509143501e-07, + "loss": 0.6347, + "step": 27477 + }, + { + "epoch": 0.95, + "learning_rate": 1.133360361571223e-07, + "loss": 0.6431, + "step": 27478 + }, + { + "epoch": 0.95, + "learning_rate": 1.1317262444171751e-07, + "loss": 0.6424, + "step": 27479 + }, + { + "epoch": 0.95, + "learning_rate": 1.1300932994715908e-07, + "loss": 0.6216, + "step": 27480 + }, + { + "epoch": 0.95, + "learning_rate": 1.1284615267538102e-07, + "loss": 0.583, + "step": 27481 + }, + { + "epoch": 0.95, + "learning_rate": 1.1268309262832067e-07, + "loss": 0.6307, + "step": 27482 + }, + { + "epoch": 0.95, + "learning_rate": 1.125201498079076e-07, + "loss": 0.6861, + "step": 27483 + }, + { + "epoch": 0.95, + "learning_rate": 1.1235732421607693e-07, + "loss": 0.6337, + "step": 27484 + }, + { + "epoch": 0.95, + "learning_rate": 1.1219461585475822e-07, + "loss": 0.6282, + "step": 27485 + }, + { + "epoch": 0.95, + "learning_rate": 1.1203202472588105e-07, + "loss": 0.6172, + "step": 27486 + }, + { + "epoch": 0.95, + "learning_rate": 1.1186955083137163e-07, + "loss": 0.6509, + "step": 27487 + }, + { + "epoch": 0.95, + "learning_rate": 1.1170719417315845e-07, + "loss": 0.6664, + "step": 27488 + }, + { + "epoch": 0.95, + "learning_rate": 1.1154495475316329e-07, + "loss": 0.6402, + "step": 27489 + }, + { + "epoch": 0.95, + "learning_rate": 1.113828325733124e-07, + "loss": 0.6236, + "step": 27490 + }, + { + "epoch": 0.95, + "learning_rate": 1.1122082763552754e-07, + "loss": 0.6631, + "step": 27491 + }, + { + "epoch": 0.95, + "learning_rate": 1.1105893994172945e-07, + "loss": 0.6075, + "step": 27492 + }, + { + "epoch": 0.95, + "learning_rate": 1.1089716949383655e-07, + "loss": 0.6035, + "step": 27493 + }, + { + "epoch": 0.95, + "learning_rate": 1.1073551629376844e-07, + "loss": 0.6421, + "step": 27494 + }, + { + "epoch": 0.95, + "learning_rate": 1.1057398034344024e-07, + "loss": 0.6694, + "step": 27495 + }, + { + "epoch": 0.95, + "learning_rate": 1.104125616447671e-07, + "loss": 0.6461, + "step": 27496 + }, + { + "epoch": 0.95, + "learning_rate": 1.1025126019966414e-07, + "loss": 0.6592, + "step": 27497 + }, + { + "epoch": 0.95, + "learning_rate": 1.1009007601004318e-07, + "loss": 0.5916, + "step": 27498 + }, + { + "epoch": 0.95, + "learning_rate": 1.0992900907781379e-07, + "loss": 0.6134, + "step": 27499 + }, + { + "epoch": 0.95, + "learning_rate": 1.0976805940488888e-07, + "loss": 0.685, + "step": 27500 + }, + { + "epoch": 0.95, + "learning_rate": 1.0960722699317362e-07, + "loss": 0.6375, + "step": 27501 + }, + { + "epoch": 0.95, + "learning_rate": 1.0944651184457645e-07, + "loss": 0.6422, + "step": 27502 + }, + { + "epoch": 0.95, + "learning_rate": 1.0928591396100252e-07, + "loss": 0.6527, + "step": 27503 + }, + { + "epoch": 0.95, + "learning_rate": 1.0912543334435589e-07, + "loss": 0.5891, + "step": 27504 + }, + { + "epoch": 0.95, + "learning_rate": 1.0896506999653945e-07, + "loss": 0.6963, + "step": 27505 + }, + { + "epoch": 0.95, + "learning_rate": 1.0880482391945501e-07, + "loss": 0.6222, + "step": 27506 + }, + { + "epoch": 0.95, + "learning_rate": 1.0864469511500109e-07, + "loss": 0.6603, + "step": 27507 + }, + { + "epoch": 0.95, + "learning_rate": 1.0848468358507613e-07, + "loss": 0.6343, + "step": 27508 + }, + { + "epoch": 0.95, + "learning_rate": 1.0832478933157865e-07, + "loss": 0.5697, + "step": 27509 + }, + { + "epoch": 0.95, + "learning_rate": 1.0816501235640376e-07, + "loss": 0.6164, + "step": 27510 + }, + { + "epoch": 0.95, + "learning_rate": 1.0800535266144663e-07, + "loss": 0.6759, + "step": 27511 + }, + { + "epoch": 0.95, + "learning_rate": 1.0784581024859909e-07, + "loss": 0.6823, + "step": 27512 + }, + { + "epoch": 0.95, + "learning_rate": 1.0768638511975293e-07, + "loss": 0.6146, + "step": 27513 + }, + { + "epoch": 0.95, + "learning_rate": 1.0752707727679779e-07, + "loss": 0.5619, + "step": 27514 + }, + { + "epoch": 0.95, + "learning_rate": 1.0736788672162434e-07, + "loss": 0.6709, + "step": 27515 + }, + { + "epoch": 0.95, + "learning_rate": 1.0720881345611778e-07, + "loss": 0.6381, + "step": 27516 + }, + { + "epoch": 0.95, + "learning_rate": 1.0704985748216656e-07, + "loss": 0.6076, + "step": 27517 + }, + { + "epoch": 0.95, + "learning_rate": 1.0689101880165365e-07, + "loss": 0.5543, + "step": 27518 + }, + { + "epoch": 0.95, + "learning_rate": 1.0673229741646196e-07, + "loss": 0.6856, + "step": 27519 + }, + { + "epoch": 0.95, + "learning_rate": 1.0657369332847334e-07, + "loss": 0.566, + "step": 27520 + }, + { + "epoch": 0.95, + "learning_rate": 1.064152065395696e-07, + "loss": 0.7188, + "step": 27521 + }, + { + "epoch": 0.95, + "learning_rate": 1.0625683705162925e-07, + "loss": 0.5428, + "step": 27522 + }, + { + "epoch": 0.95, + "learning_rate": 1.0609858486652969e-07, + "loss": 0.6742, + "step": 27523 + }, + { + "epoch": 0.95, + "learning_rate": 1.0594044998614716e-07, + "loss": 0.6181, + "step": 27524 + }, + { + "epoch": 0.95, + "learning_rate": 1.0578243241235686e-07, + "loss": 0.6794, + "step": 27525 + }, + { + "epoch": 0.95, + "learning_rate": 1.0562453214703172e-07, + "loss": 0.6508, + "step": 27526 + }, + { + "epoch": 0.95, + "learning_rate": 1.0546674919204359e-07, + "loss": 0.623, + "step": 27527 + }, + { + "epoch": 0.95, + "learning_rate": 1.0530908354926428e-07, + "loss": 0.6509, + "step": 27528 + }, + { + "epoch": 0.95, + "learning_rate": 1.0515153522056343e-07, + "loss": 0.6695, + "step": 27529 + }, + { + "epoch": 0.95, + "learning_rate": 1.0499410420780732e-07, + "loss": 0.6277, + "step": 27530 + }, + { + "epoch": 0.95, + "learning_rate": 1.0483679051286333e-07, + "loss": 0.6483, + "step": 27531 + }, + { + "epoch": 0.95, + "learning_rate": 1.0467959413759777e-07, + "loss": 0.6523, + "step": 27532 + }, + { + "epoch": 0.95, + "learning_rate": 1.0452251508387134e-07, + "loss": 0.6293, + "step": 27533 + }, + { + "epoch": 0.95, + "learning_rate": 1.0436555335355036e-07, + "loss": 0.6271, + "step": 27534 + }, + { + "epoch": 0.95, + "learning_rate": 1.0420870894849334e-07, + "loss": 0.6332, + "step": 27535 + }, + { + "epoch": 0.95, + "learning_rate": 1.0405198187055877e-07, + "loss": 0.6012, + "step": 27536 + }, + { + "epoch": 0.95, + "learning_rate": 1.0389537212160739e-07, + "loss": 0.6757, + "step": 27537 + }, + { + "epoch": 0.95, + "learning_rate": 1.037388797034955e-07, + "loss": 0.6706, + "step": 27538 + }, + { + "epoch": 0.95, + "learning_rate": 1.0358250461807717e-07, + "loss": 0.6177, + "step": 27539 + }, + { + "epoch": 0.95, + "learning_rate": 1.0342624686720759e-07, + "loss": 0.6072, + "step": 27540 + }, + { + "epoch": 0.95, + "learning_rate": 1.0327010645273972e-07, + "loss": 0.6566, + "step": 27541 + }, + { + "epoch": 0.95, + "learning_rate": 1.0311408337652318e-07, + "loss": 0.6214, + "step": 27542 + }, + { + "epoch": 0.95, + "learning_rate": 1.0295817764040983e-07, + "loss": 0.7029, + "step": 27543 + }, + { + "epoch": 0.95, + "learning_rate": 1.0280238924624597e-07, + "loss": 0.6777, + "step": 27544 + }, + { + "epoch": 0.95, + "learning_rate": 1.0264671819588013e-07, + "loss": 0.6872, + "step": 27545 + }, + { + "epoch": 0.95, + "learning_rate": 1.0249116449115859e-07, + "loss": 0.6245, + "step": 27546 + }, + { + "epoch": 0.95, + "learning_rate": 1.0233572813392434e-07, + "loss": 0.6265, + "step": 27547 + }, + { + "epoch": 0.95, + "learning_rate": 1.0218040912602034e-07, + "loss": 0.6811, + "step": 27548 + }, + { + "epoch": 0.95, + "learning_rate": 1.0202520746928734e-07, + "loss": 0.6041, + "step": 27549 + }, + { + "epoch": 0.95, + "learning_rate": 1.0187012316556832e-07, + "loss": 0.6141, + "step": 27550 + }, + { + "epoch": 0.95, + "learning_rate": 1.0171515621669847e-07, + "loss": 0.6282, + "step": 27551 + }, + { + "epoch": 0.95, + "learning_rate": 1.0156030662451855e-07, + "loss": 0.6066, + "step": 27552 + }, + { + "epoch": 0.95, + "learning_rate": 1.0140557439086263e-07, + "loss": 0.6526, + "step": 27553 + }, + { + "epoch": 0.95, + "learning_rate": 1.0125095951756481e-07, + "loss": 0.6038, + "step": 27554 + }, + { + "epoch": 0.95, + "learning_rate": 1.0109646200645806e-07, + "loss": 0.6267, + "step": 27555 + }, + { + "epoch": 0.95, + "learning_rate": 1.0094208185937538e-07, + "loss": 0.6647, + "step": 27556 + }, + { + "epoch": 0.95, + "learning_rate": 1.0078781907814749e-07, + "loss": 0.5978, + "step": 27557 + }, + { + "epoch": 0.95, + "learning_rate": 1.0063367366460185e-07, + "loss": 0.6751, + "step": 27558 + }, + { + "epoch": 0.95, + "learning_rate": 1.00479645620567e-07, + "loss": 0.6393, + "step": 27559 + }, + { + "epoch": 0.95, + "learning_rate": 1.0032573494786924e-07, + "loss": 0.6052, + "step": 27560 + }, + { + "epoch": 0.95, + "learning_rate": 1.0017194164833267e-07, + "loss": 0.6141, + "step": 27561 + }, + { + "epoch": 0.95, + "learning_rate": 1.0001826572378137e-07, + "loss": 0.6364, + "step": 27562 + }, + { + "epoch": 0.95, + "learning_rate": 9.986470717603614e-08, + "loss": 0.67, + "step": 27563 + }, + { + "epoch": 0.96, + "learning_rate": 9.971126600691994e-08, + "loss": 0.6098, + "step": 27564 + }, + { + "epoch": 0.96, + "learning_rate": 9.955794221825021e-08, + "loss": 0.6425, + "step": 27565 + }, + { + "epoch": 0.96, + "learning_rate": 9.94047358118444e-08, + "loss": 0.6395, + "step": 27566 + }, + { + "epoch": 0.96, + "learning_rate": 9.925164678951993e-08, + "loss": 0.5767, + "step": 27567 + }, + { + "epoch": 0.96, + "learning_rate": 9.909867515309201e-08, + "loss": 0.6115, + "step": 27568 + }, + { + "epoch": 0.96, + "learning_rate": 9.894582090437476e-08, + "loss": 0.6314, + "step": 27569 + }, + { + "epoch": 0.96, + "learning_rate": 9.879308404517895e-08, + "loss": 0.6374, + "step": 27570 + }, + { + "epoch": 0.96, + "learning_rate": 9.864046457731646e-08, + "loss": 0.6751, + "step": 27571 + }, + { + "epoch": 0.96, + "learning_rate": 9.848796250259585e-08, + "loss": 0.6296, + "step": 27572 + }, + { + "epoch": 0.96, + "learning_rate": 9.833557782282677e-08, + "loss": 0.6064, + "step": 27573 + }, + { + "epoch": 0.96, + "learning_rate": 9.818331053981444e-08, + "loss": 0.6054, + "step": 27574 + }, + { + "epoch": 0.96, + "learning_rate": 9.803116065536522e-08, + "loss": 0.622, + "step": 27575 + }, + { + "epoch": 0.96, + "learning_rate": 9.787912817128209e-08, + "loss": 0.6282, + "step": 27576 + }, + { + "epoch": 0.96, + "learning_rate": 9.772721308936917e-08, + "loss": 0.6444, + "step": 27577 + }, + { + "epoch": 0.96, + "learning_rate": 9.757541541142612e-08, + "loss": 0.6282, + "step": 27578 + }, + { + "epoch": 0.96, + "learning_rate": 9.742373513925263e-08, + "loss": 0.6222, + "step": 27579 + }, + { + "epoch": 0.96, + "learning_rate": 9.727217227464836e-08, + "loss": 0.6567, + "step": 27580 + }, + { + "epoch": 0.96, + "learning_rate": 9.712072681940854e-08, + "loss": 0.6602, + "step": 27581 + }, + { + "epoch": 0.96, + "learning_rate": 9.696939877533063e-08, + "loss": 0.6543, + "step": 27582 + }, + { + "epoch": 0.96, + "learning_rate": 9.681818814420763e-08, + "loss": 0.6453, + "step": 27583 + }, + { + "epoch": 0.96, + "learning_rate": 9.666709492783256e-08, + "loss": 0.6829, + "step": 27584 + }, + { + "epoch": 0.96, + "learning_rate": 9.65161191279973e-08, + "loss": 0.6063, + "step": 27585 + }, + { + "epoch": 0.96, + "learning_rate": 9.636526074649045e-08, + "loss": 0.6979, + "step": 27586 + }, + { + "epoch": 0.96, + "learning_rate": 9.621451978510165e-08, + "loss": 0.6438, + "step": 27587 + }, + { + "epoch": 0.96, + "learning_rate": 9.606389624561952e-08, + "loss": 0.6621, + "step": 27588 + }, + { + "epoch": 0.96, + "learning_rate": 9.591339012982703e-08, + "loss": 0.6441, + "step": 27589 + }, + { + "epoch": 0.96, + "learning_rate": 9.576300143951056e-08, + "loss": 0.6975, + "step": 27590 + }, + { + "epoch": 0.96, + "learning_rate": 9.561273017645201e-08, + "loss": 0.578, + "step": 27591 + }, + { + "epoch": 0.96, + "learning_rate": 9.546257634243439e-08, + "loss": 0.6463, + "step": 27592 + }, + { + "epoch": 0.96, + "learning_rate": 9.531253993923739e-08, + "loss": 0.67, + "step": 27593 + }, + { + "epoch": 0.96, + "learning_rate": 9.51626209686396e-08, + "loss": 0.6662, + "step": 27594 + }, + { + "epoch": 0.96, + "learning_rate": 9.501281943241847e-08, + "loss": 0.6501, + "step": 27595 + }, + { + "epoch": 0.96, + "learning_rate": 9.486313533234925e-08, + "loss": 0.6162, + "step": 27596 + }, + { + "epoch": 0.96, + "learning_rate": 9.471356867020942e-08, + "loss": 0.6011, + "step": 27597 + }, + { + "epoch": 0.96, + "learning_rate": 9.456411944776866e-08, + "loss": 0.6438, + "step": 27598 + }, + { + "epoch": 0.96, + "learning_rate": 9.441478766680223e-08, + "loss": 0.6272, + "step": 27599 + }, + { + "epoch": 0.96, + "learning_rate": 9.426557332907871e-08, + "loss": 0.6357, + "step": 27600 + }, + { + "epoch": 0.96, + "learning_rate": 9.411647643636779e-08, + "loss": 0.6237, + "step": 27601 + }, + { + "epoch": 0.96, + "learning_rate": 9.396749699043583e-08, + "loss": 0.5898, + "step": 27602 + }, + { + "epoch": 0.96, + "learning_rate": 9.381863499305143e-08, + "loss": 0.6243, + "step": 27603 + }, + { + "epoch": 0.96, + "learning_rate": 9.366989044597874e-08, + "loss": 0.6118, + "step": 27604 + }, + { + "epoch": 0.96, + "learning_rate": 9.352126335097966e-08, + "loss": 0.5948, + "step": 27605 + }, + { + "epoch": 0.96, + "learning_rate": 9.337275370981946e-08, + "loss": 0.5545, + "step": 27606 + }, + { + "epoch": 0.96, + "learning_rate": 9.322436152425674e-08, + "loss": 0.6371, + "step": 27607 + }, + { + "epoch": 0.96, + "learning_rate": 9.307608679605119e-08, + "loss": 0.6376, + "step": 27608 + }, + { + "epoch": 0.96, + "learning_rate": 9.292792952696028e-08, + "loss": 0.6559, + "step": 27609 + }, + { + "epoch": 0.96, + "learning_rate": 9.277988971874263e-08, + "loss": 0.6231, + "step": 27610 + }, + { + "epoch": 0.96, + "learning_rate": 9.263196737315128e-08, + "loss": 0.6022, + "step": 27611 + }, + { + "epoch": 0.96, + "learning_rate": 9.248416249194148e-08, + "loss": 0.6135, + "step": 27612 + }, + { + "epoch": 0.96, + "learning_rate": 9.233647507686405e-08, + "loss": 0.5879, + "step": 27613 + }, + { + "epoch": 0.96, + "learning_rate": 9.218890512967094e-08, + "loss": 0.6402, + "step": 27614 + }, + { + "epoch": 0.96, + "learning_rate": 9.204145265211184e-08, + "loss": 0.6571, + "step": 27615 + }, + { + "epoch": 0.96, + "learning_rate": 9.189411764593536e-08, + "loss": 0.6137, + "step": 27616 + }, + { + "epoch": 0.96, + "learning_rate": 9.17469001128879e-08, + "loss": 0.6014, + "step": 27617 + }, + { + "epoch": 0.96, + "learning_rate": 9.15998000547158e-08, + "loss": 0.6027, + "step": 27618 + }, + { + "epoch": 0.96, + "learning_rate": 9.145281747316104e-08, + "loss": 0.6362, + "step": 27619 + }, + { + "epoch": 0.96, + "learning_rate": 9.130595236996776e-08, + "loss": 0.6243, + "step": 27620 + }, + { + "epoch": 0.96, + "learning_rate": 9.115920474687678e-08, + "loss": 0.6755, + "step": 27621 + }, + { + "epoch": 0.96, + "learning_rate": 9.101257460562895e-08, + "loss": 0.6403, + "step": 27622 + }, + { + "epoch": 0.96, + "learning_rate": 9.086606194796176e-08, + "loss": 0.6367, + "step": 27623 + }, + { + "epoch": 0.96, + "learning_rate": 9.071966677561273e-08, + "loss": 0.6083, + "step": 27624 + }, + { + "epoch": 0.96, + "learning_rate": 9.0573389090316e-08, + "loss": 0.6934, + "step": 27625 + }, + { + "epoch": 0.96, + "learning_rate": 9.042722889380795e-08, + "loss": 0.639, + "step": 27626 + }, + { + "epoch": 0.96, + "learning_rate": 9.028118618782167e-08, + "loss": 0.5551, + "step": 27627 + }, + { + "epoch": 0.96, + "learning_rate": 9.013526097408687e-08, + "loss": 0.6433, + "step": 27628 + }, + { + "epoch": 0.96, + "learning_rate": 8.998945325433439e-08, + "loss": 0.6025, + "step": 27629 + }, + { + "epoch": 0.96, + "learning_rate": 8.984376303029397e-08, + "loss": 0.6284, + "step": 27630 + }, + { + "epoch": 0.96, + "learning_rate": 8.969819030369198e-08, + "loss": 0.5856, + "step": 27631 + }, + { + "epoch": 0.96, + "learning_rate": 8.955273507625484e-08, + "loss": 0.6303, + "step": 27632 + }, + { + "epoch": 0.96, + "learning_rate": 8.940739734970561e-08, + "loss": 0.6419, + "step": 27633 + }, + { + "epoch": 0.96, + "learning_rate": 8.926217712576957e-08, + "loss": 0.6055, + "step": 27634 + }, + { + "epoch": 0.96, + "learning_rate": 8.911707440616756e-08, + "loss": 0.6779, + "step": 27635 + }, + { + "epoch": 0.96, + "learning_rate": 8.897208919261934e-08, + "loss": 0.6186, + "step": 27636 + }, + { + "epoch": 0.96, + "learning_rate": 8.882722148684575e-08, + "loss": 0.5826, + "step": 27637 + }, + { + "epoch": 0.96, + "learning_rate": 8.868247129056207e-08, + "loss": 0.6795, + "step": 27638 + }, + { + "epoch": 0.96, + "learning_rate": 8.853783860548581e-08, + "loss": 0.6276, + "step": 27639 + }, + { + "epoch": 0.96, + "learning_rate": 8.839332343333117e-08, + "loss": 0.6055, + "step": 27640 + }, + { + "epoch": 0.96, + "learning_rate": 8.824892577581234e-08, + "loss": 0.6729, + "step": 27641 + }, + { + "epoch": 0.96, + "learning_rate": 8.810464563464128e-08, + "loss": 0.6687, + "step": 27642 + }, + { + "epoch": 0.96, + "learning_rate": 8.796048301152771e-08, + "loss": 0.6291, + "step": 27643 + }, + { + "epoch": 0.96, + "learning_rate": 8.78164379081814e-08, + "loss": 0.5719, + "step": 27644 + }, + { + "epoch": 0.96, + "learning_rate": 8.767251032630985e-08, + "loss": 0.6111, + "step": 27645 + }, + { + "epoch": 0.96, + "learning_rate": 8.752870026762062e-08, + "loss": 0.6218, + "step": 27646 + }, + { + "epoch": 0.96, + "learning_rate": 8.738500773381786e-08, + "loss": 0.6449, + "step": 27647 + }, + { + "epoch": 0.96, + "learning_rate": 8.724143272660579e-08, + "loss": 0.5905, + "step": 27648 + }, + { + "epoch": 0.96, + "learning_rate": 8.709797524768526e-08, + "loss": 0.6221, + "step": 27649 + }, + { + "epoch": 0.96, + "learning_rate": 8.695463529875936e-08, + "loss": 0.5964, + "step": 27650 + }, + { + "epoch": 0.96, + "learning_rate": 8.681141288152451e-08, + "loss": 0.6294, + "step": 27651 + }, + { + "epoch": 0.96, + "learning_rate": 8.666830799768155e-08, + "loss": 0.6132, + "step": 27652 + }, + { + "epoch": 0.96, + "learning_rate": 8.652532064892693e-08, + "loss": 0.6809, + "step": 27653 + }, + { + "epoch": 0.96, + "learning_rate": 8.638245083695485e-08, + "loss": 0.6442, + "step": 27654 + }, + { + "epoch": 0.96, + "learning_rate": 8.623969856345948e-08, + "loss": 0.625, + "step": 27655 + }, + { + "epoch": 0.96, + "learning_rate": 8.609706383013395e-08, + "loss": 0.6053, + "step": 27656 + }, + { + "epoch": 0.96, + "learning_rate": 8.595454663866686e-08, + "loss": 0.6028, + "step": 27657 + }, + { + "epoch": 0.96, + "learning_rate": 8.581214699075136e-08, + "loss": 0.6602, + "step": 27658 + }, + { + "epoch": 0.96, + "learning_rate": 8.566986488807494e-08, + "loss": 0.6227, + "step": 27659 + }, + { + "epoch": 0.96, + "learning_rate": 8.552770033232294e-08, + "loss": 0.6028, + "step": 27660 + }, + { + "epoch": 0.96, + "learning_rate": 8.538565332518289e-08, + "loss": 0.6322, + "step": 27661 + }, + { + "epoch": 0.96, + "learning_rate": 8.52437238683379e-08, + "loss": 0.6119, + "step": 27662 + }, + { + "epoch": 0.96, + "learning_rate": 8.510191196346995e-08, + "loss": 0.6192, + "step": 27663 + }, + { + "epoch": 0.96, + "learning_rate": 8.496021761226103e-08, + "loss": 0.6326, + "step": 27664 + }, + { + "epoch": 0.96, + "learning_rate": 8.481864081639312e-08, + "loss": 0.6016, + "step": 27665 + }, + { + "epoch": 0.96, + "learning_rate": 8.467718157754157e-08, + "loss": 0.6499, + "step": 27666 + }, + { + "epoch": 0.96, + "learning_rate": 8.453583989738501e-08, + "loss": 0.6105, + "step": 27667 + }, + { + "epoch": 0.96, + "learning_rate": 8.439461577759989e-08, + "loss": 0.6364, + "step": 27668 + }, + { + "epoch": 0.96, + "learning_rate": 8.42535092198582e-08, + "loss": 0.64, + "step": 27669 + }, + { + "epoch": 0.96, + "learning_rate": 8.411252022583639e-08, + "loss": 0.6286, + "step": 27670 + }, + { + "epoch": 0.96, + "learning_rate": 8.397164879720421e-08, + "loss": 0.6371, + "step": 27671 + }, + { + "epoch": 0.96, + "learning_rate": 8.383089493563146e-08, + "loss": 0.6102, + "step": 27672 + }, + { + "epoch": 0.96, + "learning_rate": 8.36902586427868e-08, + "loss": 0.6001, + "step": 27673 + }, + { + "epoch": 0.96, + "learning_rate": 8.354973992033999e-08, + "loss": 0.6725, + "step": 27674 + }, + { + "epoch": 0.96, + "learning_rate": 8.340933876995416e-08, + "loss": 0.6085, + "step": 27675 + }, + { + "epoch": 0.96, + "learning_rate": 8.326905519329575e-08, + "loss": 0.6408, + "step": 27676 + }, + { + "epoch": 0.96, + "learning_rate": 8.312888919202677e-08, + "loss": 0.6356, + "step": 27677 + }, + { + "epoch": 0.96, + "learning_rate": 8.298884076781033e-08, + "loss": 0.6165, + "step": 27678 + }, + { + "epoch": 0.96, + "learning_rate": 8.284890992230621e-08, + "loss": 0.6519, + "step": 27679 + }, + { + "epoch": 0.96, + "learning_rate": 8.27090966571742e-08, + "loss": 0.6105, + "step": 27680 + }, + { + "epoch": 0.96, + "learning_rate": 8.256940097406962e-08, + "loss": 0.6436, + "step": 27681 + }, + { + "epoch": 0.96, + "learning_rate": 8.242982287465118e-08, + "loss": 0.607, + "step": 27682 + }, + { + "epoch": 0.96, + "learning_rate": 8.229036236057308e-08, + "loss": 0.6014, + "step": 27683 + }, + { + "epoch": 0.96, + "learning_rate": 8.215101943348847e-08, + "loss": 0.652, + "step": 27684 + }, + { + "epoch": 0.96, + "learning_rate": 8.201179409505045e-08, + "loss": 0.6247, + "step": 27685 + }, + { + "epoch": 0.96, + "learning_rate": 8.187268634690881e-08, + "loss": 0.6242, + "step": 27686 + }, + { + "epoch": 0.96, + "learning_rate": 8.173369619071114e-08, + "loss": 0.5815, + "step": 27687 + }, + { + "epoch": 0.96, + "learning_rate": 8.159482362810834e-08, + "loss": 0.6416, + "step": 27688 + }, + { + "epoch": 0.96, + "learning_rate": 8.145606866074685e-08, + "loss": 0.6042, + "step": 27689 + }, + { + "epoch": 0.96, + "learning_rate": 8.131743129026981e-08, + "loss": 0.6412, + "step": 27690 + }, + { + "epoch": 0.96, + "learning_rate": 8.117891151832147e-08, + "loss": 0.6514, + "step": 27691 + }, + { + "epoch": 0.96, + "learning_rate": 8.104050934654495e-08, + "loss": 0.6766, + "step": 27692 + }, + { + "epoch": 0.96, + "learning_rate": 8.090222477658005e-08, + "loss": 0.622, + "step": 27693 + }, + { + "epoch": 0.96, + "learning_rate": 8.076405781006769e-08, + "loss": 0.6005, + "step": 27694 + }, + { + "epoch": 0.96, + "learning_rate": 8.062600844864543e-08, + "loss": 0.5978, + "step": 27695 + }, + { + "epoch": 0.96, + "learning_rate": 8.048807669394975e-08, + "loss": 0.6614, + "step": 27696 + }, + { + "epoch": 0.96, + "learning_rate": 8.035026254761602e-08, + "loss": 0.6136, + "step": 27697 + }, + { + "epoch": 0.96, + "learning_rate": 8.021256601127959e-08, + "loss": 0.6329, + "step": 27698 + }, + { + "epoch": 0.96, + "learning_rate": 8.007498708657025e-08, + "loss": 0.6313, + "step": 27699 + }, + { + "epoch": 0.96, + "learning_rate": 7.993752577512004e-08, + "loss": 0.6616, + "step": 27700 + }, + { + "epoch": 0.96, + "learning_rate": 7.9800182078561e-08, + "loss": 0.6608, + "step": 27701 + }, + { + "epoch": 0.96, + "learning_rate": 7.966295599851959e-08, + "loss": 0.6703, + "step": 27702 + }, + { + "epoch": 0.96, + "learning_rate": 7.95258475366234e-08, + "loss": 0.666, + "step": 27703 + }, + { + "epoch": 0.96, + "learning_rate": 7.93888566944978e-08, + "loss": 0.589, + "step": 27704 + }, + { + "epoch": 0.96, + "learning_rate": 7.925198347376484e-08, + "loss": 0.6703, + "step": 27705 + }, + { + "epoch": 0.96, + "learning_rate": 7.911522787605097e-08, + "loss": 0.6399, + "step": 27706 + }, + { + "epoch": 0.96, + "learning_rate": 7.897858990297713e-08, + "loss": 0.6285, + "step": 27707 + }, + { + "epoch": 0.96, + "learning_rate": 7.884206955616092e-08, + "loss": 0.6306, + "step": 27708 + }, + { + "epoch": 0.96, + "learning_rate": 7.870566683722214e-08, + "loss": 0.623, + "step": 27709 + }, + { + "epoch": 0.96, + "learning_rate": 7.85693817477795e-08, + "loss": 0.6556, + "step": 27710 + }, + { + "epoch": 0.96, + "learning_rate": 7.843321428944617e-08, + "loss": 0.6339, + "step": 27711 + }, + { + "epoch": 0.96, + "learning_rate": 7.829716446383862e-08, + "loss": 0.6729, + "step": 27712 + }, + { + "epoch": 0.96, + "learning_rate": 7.816123227256889e-08, + "loss": 0.5872, + "step": 27713 + }, + { + "epoch": 0.96, + "learning_rate": 7.802541771724903e-08, + "loss": 0.5997, + "step": 27714 + }, + { + "epoch": 0.96, + "learning_rate": 7.788972079948998e-08, + "loss": 0.5869, + "step": 27715 + }, + { + "epoch": 0.96, + "learning_rate": 7.775414152089933e-08, + "loss": 0.6283, + "step": 27716 + }, + { + "epoch": 0.96, + "learning_rate": 7.761867988308358e-08, + "loss": 0.6275, + "step": 27717 + }, + { + "epoch": 0.96, + "learning_rate": 7.748333588765256e-08, + "loss": 0.6191, + "step": 27718 + }, + { + "epoch": 0.96, + "learning_rate": 7.734810953620719e-08, + "loss": 0.6369, + "step": 27719 + }, + { + "epoch": 0.96, + "learning_rate": 7.721300083035287e-08, + "loss": 0.6188, + "step": 27720 + }, + { + "epoch": 0.96, + "learning_rate": 7.707800977169055e-08, + "loss": 0.5962, + "step": 27721 + }, + { + "epoch": 0.96, + "learning_rate": 7.694313636182115e-08, + "loss": 0.6763, + "step": 27722 + }, + { + "epoch": 0.96, + "learning_rate": 7.68083806023423e-08, + "loss": 0.5901, + "step": 27723 + }, + { + "epoch": 0.96, + "learning_rate": 7.667374249485493e-08, + "loss": 0.6276, + "step": 27724 + }, + { + "epoch": 0.96, + "learning_rate": 7.653922204095221e-08, + "loss": 0.6472, + "step": 27725 + }, + { + "epoch": 0.96, + "learning_rate": 7.640481924223064e-08, + "loss": 0.6295, + "step": 27726 + }, + { + "epoch": 0.96, + "learning_rate": 7.62705341002834e-08, + "loss": 0.6553, + "step": 27727 + }, + { + "epoch": 0.96, + "learning_rate": 7.613636661670254e-08, + "loss": 0.6314, + "step": 27728 + }, + { + "epoch": 0.96, + "learning_rate": 7.60023167930779e-08, + "loss": 0.6229, + "step": 27729 + }, + { + "epoch": 0.96, + "learning_rate": 7.586838463100154e-08, + "loss": 0.6244, + "step": 27730 + }, + { + "epoch": 0.96, + "learning_rate": 7.573457013205887e-08, + "loss": 0.6701, + "step": 27731 + }, + { + "epoch": 0.96, + "learning_rate": 7.560087329783639e-08, + "loss": 0.6029, + "step": 27732 + }, + { + "epoch": 0.96, + "learning_rate": 7.54672941299206e-08, + "loss": 0.6341, + "step": 27733 + }, + { + "epoch": 0.96, + "learning_rate": 7.533383262989469e-08, + "loss": 0.6428, + "step": 27734 + }, + { + "epoch": 0.96, + "learning_rate": 7.520048879934073e-08, + "loss": 0.6069, + "step": 27735 + }, + { + "epoch": 0.96, + "learning_rate": 7.506726263983965e-08, + "loss": 0.6354, + "step": 27736 + }, + { + "epoch": 0.96, + "learning_rate": 7.493415415297245e-08, + "loss": 0.6342, + "step": 27737 + }, + { + "epoch": 0.96, + "learning_rate": 7.480116334031451e-08, + "loss": 0.6289, + "step": 27738 + }, + { + "epoch": 0.96, + "learning_rate": 7.466829020344568e-08, + "loss": 0.6341, + "step": 27739 + }, + { + "epoch": 0.96, + "learning_rate": 7.453553474393915e-08, + "loss": 0.6326, + "step": 27740 + }, + { + "epoch": 0.96, + "learning_rate": 7.440289696336922e-08, + "loss": 0.6709, + "step": 27741 + }, + { + "epoch": 0.96, + "learning_rate": 7.427037686330907e-08, + "loss": 0.6312, + "step": 27742 + }, + { + "epoch": 0.96, + "learning_rate": 7.413797444533077e-08, + "loss": 0.6623, + "step": 27743 + }, + { + "epoch": 0.96, + "learning_rate": 7.400568971100198e-08, + "loss": 0.5829, + "step": 27744 + }, + { + "epoch": 0.96, + "learning_rate": 7.387352266189251e-08, + "loss": 0.6524, + "step": 27745 + }, + { + "epoch": 0.96, + "learning_rate": 7.374147329956893e-08, + "loss": 0.5741, + "step": 27746 + }, + { + "epoch": 0.96, + "learning_rate": 7.360954162559774e-08, + "loss": 0.664, + "step": 27747 + }, + { + "epoch": 0.96, + "learning_rate": 7.347772764154104e-08, + "loss": 0.6565, + "step": 27748 + }, + { + "epoch": 0.96, + "learning_rate": 7.334603134896312e-08, + "loss": 0.5974, + "step": 27749 + }, + { + "epoch": 0.96, + "learning_rate": 7.321445274942607e-08, + "loss": 0.5768, + "step": 27750 + }, + { + "epoch": 0.96, + "learning_rate": 7.308299184448974e-08, + "loss": 0.6469, + "step": 27751 + }, + { + "epoch": 0.96, + "learning_rate": 7.295164863571069e-08, + "loss": 0.6068, + "step": 27752 + }, + { + "epoch": 0.96, + "learning_rate": 7.282042312464876e-08, + "loss": 0.624, + "step": 27753 + }, + { + "epoch": 0.96, + "learning_rate": 7.268931531285828e-08, + "loss": 0.5857, + "step": 27754 + }, + { + "epoch": 0.96, + "learning_rate": 7.255832520189354e-08, + "loss": 0.6361, + "step": 27755 + }, + { + "epoch": 0.96, + "learning_rate": 7.242745279330777e-08, + "loss": 0.6607, + "step": 27756 + }, + { + "epoch": 0.96, + "learning_rate": 7.229669808865414e-08, + "loss": 0.6263, + "step": 27757 + }, + { + "epoch": 0.96, + "learning_rate": 7.216606108948143e-08, + "loss": 0.6764, + "step": 27758 + }, + { + "epoch": 0.96, + "learning_rate": 7.203554179733951e-08, + "loss": 0.6554, + "step": 27759 + }, + { + "epoch": 0.96, + "learning_rate": 7.190514021377382e-08, + "loss": 0.5833, + "step": 27760 + }, + { + "epoch": 0.96, + "learning_rate": 7.177485634033199e-08, + "loss": 0.6634, + "step": 27761 + }, + { + "epoch": 0.96, + "learning_rate": 7.164469017855946e-08, + "loss": 0.6152, + "step": 27762 + }, + { + "epoch": 0.96, + "learning_rate": 7.151464172999834e-08, + "loss": 0.6073, + "step": 27763 + }, + { + "epoch": 0.96, + "learning_rate": 7.13847109961907e-08, + "loss": 0.6942, + "step": 27764 + }, + { + "epoch": 0.96, + "learning_rate": 7.125489797867646e-08, + "loss": 0.6175, + "step": 27765 + }, + { + "epoch": 0.96, + "learning_rate": 7.112520267899547e-08, + "loss": 0.6224, + "step": 27766 + }, + { + "epoch": 0.96, + "learning_rate": 7.099562509868541e-08, + "loss": 0.6187, + "step": 27767 + }, + { + "epoch": 0.96, + "learning_rate": 7.086616523928281e-08, + "loss": 0.6042, + "step": 27768 + }, + { + "epoch": 0.96, + "learning_rate": 7.073682310232199e-08, + "loss": 0.5683, + "step": 27769 + }, + { + "epoch": 0.96, + "learning_rate": 7.06075986893373e-08, + "loss": 0.6399, + "step": 27770 + }, + { + "epoch": 0.96, + "learning_rate": 7.047849200185974e-08, + "loss": 0.6067, + "step": 27771 + }, + { + "epoch": 0.96, + "learning_rate": 7.03495030414203e-08, + "loss": 0.6455, + "step": 27772 + }, + { + "epoch": 0.96, + "learning_rate": 7.022063180954886e-08, + "loss": 0.6301, + "step": 27773 + }, + { + "epoch": 0.96, + "learning_rate": 7.009187830777308e-08, + "loss": 0.6163, + "step": 27774 + }, + { + "epoch": 0.96, + "learning_rate": 6.996324253761955e-08, + "loss": 0.624, + "step": 27775 + }, + { + "epoch": 0.96, + "learning_rate": 6.983472450061257e-08, + "loss": 0.656, + "step": 27776 + }, + { + "epoch": 0.96, + "learning_rate": 6.970632419827761e-08, + "loss": 0.6433, + "step": 27777 + }, + { + "epoch": 0.96, + "learning_rate": 6.957804163213567e-08, + "loss": 0.6012, + "step": 27778 + }, + { + "epoch": 0.96, + "learning_rate": 6.944987680370774e-08, + "loss": 0.6604, + "step": 27779 + }, + { + "epoch": 0.96, + "learning_rate": 6.932182971451485e-08, + "loss": 0.5883, + "step": 27780 + }, + { + "epoch": 0.96, + "learning_rate": 6.919390036607354e-08, + "loss": 0.6369, + "step": 27781 + }, + { + "epoch": 0.96, + "learning_rate": 6.90660887599004e-08, + "loss": 0.6559, + "step": 27782 + }, + { + "epoch": 0.96, + "learning_rate": 6.893839489751197e-08, + "loss": 0.6328, + "step": 27783 + }, + { + "epoch": 0.96, + "learning_rate": 6.88108187804215e-08, + "loss": 0.6194, + "step": 27784 + }, + { + "epoch": 0.96, + "learning_rate": 6.868336041014224e-08, + "loss": 0.6739, + "step": 27785 + }, + { + "epoch": 0.96, + "learning_rate": 6.855601978818516e-08, + "loss": 0.6719, + "step": 27786 + }, + { + "epoch": 0.96, + "learning_rate": 6.842879691605908e-08, + "loss": 0.6187, + "step": 27787 + }, + { + "epoch": 0.96, + "learning_rate": 6.83016917952739e-08, + "loss": 0.6645, + "step": 27788 + }, + { + "epoch": 0.96, + "learning_rate": 6.81747044273351e-08, + "loss": 0.6075, + "step": 27789 + }, + { + "epoch": 0.96, + "learning_rate": 6.804783481374922e-08, + "loss": 0.6154, + "step": 27790 + }, + { + "epoch": 0.96, + "learning_rate": 6.792108295601951e-08, + "loss": 0.6569, + "step": 27791 + }, + { + "epoch": 0.96, + "learning_rate": 6.779444885565146e-08, + "loss": 0.6866, + "step": 27792 + }, + { + "epoch": 0.96, + "learning_rate": 6.766793251414272e-08, + "loss": 0.6301, + "step": 27793 + }, + { + "epoch": 0.96, + "learning_rate": 6.754153393299545e-08, + "loss": 0.6299, + "step": 27794 + }, + { + "epoch": 0.96, + "learning_rate": 6.741525311370845e-08, + "loss": 0.6557, + "step": 27795 + }, + { + "epoch": 0.96, + "learning_rate": 6.728909005777828e-08, + "loss": 0.6161, + "step": 27796 + }, + { + "epoch": 0.96, + "learning_rate": 6.716304476670044e-08, + "loss": 0.577, + "step": 27797 + }, + { + "epoch": 0.96, + "learning_rate": 6.703711724197037e-08, + "loss": 0.5468, + "step": 27798 + }, + { + "epoch": 0.96, + "learning_rate": 6.691130748508023e-08, + "loss": 0.6421, + "step": 27799 + }, + { + "epoch": 0.96, + "learning_rate": 6.678561549752216e-08, + "loss": 0.5799, + "step": 27800 + }, + { + "epoch": 0.96, + "learning_rate": 6.666004128078607e-08, + "loss": 0.6488, + "step": 27801 + }, + { + "epoch": 0.96, + "learning_rate": 6.653458483636078e-08, + "loss": 0.6466, + "step": 27802 + }, + { + "epoch": 0.96, + "learning_rate": 6.640924616573396e-08, + "loss": 0.6426, + "step": 27803 + }, + { + "epoch": 0.96, + "learning_rate": 6.628402527039224e-08, + "loss": 0.6157, + "step": 27804 + }, + { + "epoch": 0.96, + "learning_rate": 6.615892215181885e-08, + "loss": 0.6487, + "step": 27805 + }, + { + "epoch": 0.96, + "learning_rate": 6.603393681149706e-08, + "loss": 0.7066, + "step": 27806 + }, + { + "epoch": 0.96, + "learning_rate": 6.590906925091123e-08, + "loss": 0.6318, + "step": 27807 + }, + { + "epoch": 0.96, + "learning_rate": 6.578431947153907e-08, + "loss": 0.6091, + "step": 27808 + }, + { + "epoch": 0.96, + "learning_rate": 6.565968747486051e-08, + "loss": 0.6729, + "step": 27809 + }, + { + "epoch": 0.96, + "learning_rate": 6.553517326235436e-08, + "loss": 0.6339, + "step": 27810 + }, + { + "epoch": 0.96, + "learning_rate": 6.541077683549502e-08, + "loss": 0.6493, + "step": 27811 + }, + { + "epoch": 0.96, + "learning_rate": 6.528649819575794e-08, + "loss": 0.6002, + "step": 27812 + }, + { + "epoch": 0.96, + "learning_rate": 6.516233734461751e-08, + "loss": 0.6804, + "step": 27813 + }, + { + "epoch": 0.96, + "learning_rate": 6.50382942835448e-08, + "loss": 0.651, + "step": 27814 + }, + { + "epoch": 0.96, + "learning_rate": 6.491436901401082e-08, + "loss": 0.6848, + "step": 27815 + }, + { + "epoch": 0.96, + "learning_rate": 6.479056153748665e-08, + "loss": 0.6349, + "step": 27816 + }, + { + "epoch": 0.96, + "learning_rate": 6.466687185543663e-08, + "loss": 0.6171, + "step": 27817 + }, + { + "epoch": 0.96, + "learning_rate": 6.454329996932963e-08, + "loss": 0.6191, + "step": 27818 + }, + { + "epoch": 0.96, + "learning_rate": 6.441984588062999e-08, + "loss": 0.6452, + "step": 27819 + }, + { + "epoch": 0.96, + "learning_rate": 6.429650959080213e-08, + "loss": 0.6121, + "step": 27820 + }, + { + "epoch": 0.96, + "learning_rate": 6.41732911013071e-08, + "loss": 0.6119, + "step": 27821 + }, + { + "epoch": 0.96, + "learning_rate": 6.405019041360816e-08, + "loss": 0.6616, + "step": 27822 + }, + { + "epoch": 0.96, + "learning_rate": 6.392720752916193e-08, + "loss": 0.682, + "step": 27823 + }, + { + "epoch": 0.96, + "learning_rate": 6.380434244942724e-08, + "loss": 0.6596, + "step": 27824 + }, + { + "epoch": 0.96, + "learning_rate": 6.368159517586293e-08, + "loss": 0.6342, + "step": 27825 + }, + { + "epoch": 0.96, + "learning_rate": 6.355896570992225e-08, + "loss": 0.646, + "step": 27826 + }, + { + "epoch": 0.96, + "learning_rate": 6.343645405305964e-08, + "loss": 0.6303, + "step": 27827 + }, + { + "epoch": 0.96, + "learning_rate": 6.331406020672726e-08, + "loss": 0.694, + "step": 27828 + }, + { + "epoch": 0.96, + "learning_rate": 6.319178417237725e-08, + "loss": 0.6623, + "step": 27829 + }, + { + "epoch": 0.96, + "learning_rate": 6.306962595145849e-08, + "loss": 0.5928, + "step": 27830 + }, + { + "epoch": 0.96, + "learning_rate": 6.29475855454198e-08, + "loss": 0.6202, + "step": 27831 + }, + { + "epoch": 0.96, + "learning_rate": 6.28256629557078e-08, + "loss": 0.6772, + "step": 27832 + }, + { + "epoch": 0.96, + "learning_rate": 6.270385818376801e-08, + "loss": 0.5809, + "step": 27833 + }, + { + "epoch": 0.96, + "learning_rate": 6.258217123104593e-08, + "loss": 0.6494, + "step": 27834 + }, + { + "epoch": 0.96, + "learning_rate": 6.246060209898152e-08, + "loss": 0.6418, + "step": 27835 + }, + { + "epoch": 0.96, + "learning_rate": 6.233915078901809e-08, + "loss": 0.6065, + "step": 27836 + }, + { + "epoch": 0.96, + "learning_rate": 6.221781730259558e-08, + "loss": 0.6626, + "step": 27837 + }, + { + "epoch": 0.96, + "learning_rate": 6.209660164115171e-08, + "loss": 0.6148, + "step": 27838 + }, + { + "epoch": 0.96, + "learning_rate": 6.197550380612538e-08, + "loss": 0.6152, + "step": 27839 + }, + { + "epoch": 0.96, + "learning_rate": 6.185452379894985e-08, + "loss": 0.6555, + "step": 27840 + }, + { + "epoch": 0.96, + "learning_rate": 6.173366162106175e-08, + "loss": 0.6241, + "step": 27841 + }, + { + "epoch": 0.96, + "learning_rate": 6.161291727389218e-08, + "loss": 0.6548, + "step": 27842 + }, + { + "epoch": 0.96, + "learning_rate": 6.149229075887331e-08, + "loss": 0.6023, + "step": 27843 + }, + { + "epoch": 0.96, + "learning_rate": 6.137178207743622e-08, + "loss": 0.5622, + "step": 27844 + }, + { + "epoch": 0.96, + "learning_rate": 6.125139123100976e-08, + "loss": 0.5847, + "step": 27845 + }, + { + "epoch": 0.96, + "learning_rate": 6.113111822101947e-08, + "loss": 0.6975, + "step": 27846 + }, + { + "epoch": 0.96, + "learning_rate": 6.101096304889309e-08, + "loss": 0.6282, + "step": 27847 + }, + { + "epoch": 0.96, + "learning_rate": 6.089092571605393e-08, + "loss": 0.5718, + "step": 27848 + }, + { + "epoch": 0.96, + "learning_rate": 6.07710062239264e-08, + "loss": 0.6025, + "step": 27849 + }, + { + "epoch": 0.96, + "learning_rate": 6.065120457393158e-08, + "loss": 0.7128, + "step": 27850 + }, + { + "epoch": 0.96, + "learning_rate": 6.053152076749169e-08, + "loss": 0.6363, + "step": 27851 + }, + { + "epoch": 0.96, + "learning_rate": 6.041195480602225e-08, + "loss": 0.6046, + "step": 27852 + }, + { + "epoch": 0.97, + "learning_rate": 6.029250669094322e-08, + "loss": 0.5973, + "step": 27853 + }, + { + "epoch": 0.97, + "learning_rate": 6.017317642367015e-08, + "loss": 0.6702, + "step": 27854 + }, + { + "epoch": 0.97, + "learning_rate": 6.005396400561859e-08, + "loss": 0.613, + "step": 27855 + }, + { + "epoch": 0.97, + "learning_rate": 5.99348694382007e-08, + "loss": 0.6198, + "step": 27856 + }, + { + "epoch": 0.97, + "learning_rate": 5.981589272282984e-08, + "loss": 0.6126, + "step": 27857 + }, + { + "epoch": 0.97, + "learning_rate": 5.969703386091486e-08, + "loss": 0.6202, + "step": 27858 + }, + { + "epoch": 0.97, + "learning_rate": 5.957829285386685e-08, + "loss": 0.5952, + "step": 27859 + }, + { + "epoch": 0.97, + "learning_rate": 5.945966970309358e-08, + "loss": 0.6021, + "step": 27860 + }, + { + "epoch": 0.97, + "learning_rate": 5.934116440999948e-08, + "loss": 0.6287, + "step": 27861 + }, + { + "epoch": 0.97, + "learning_rate": 5.9222776975991214e-08, + "loss": 0.6727, + "step": 27862 + }, + { + "epoch": 0.97, + "learning_rate": 5.91045074024732e-08, + "loss": 0.637, + "step": 27863 + }, + { + "epoch": 0.97, + "learning_rate": 5.898635569084543e-08, + "loss": 0.5125, + "step": 27864 + }, + { + "epoch": 0.97, + "learning_rate": 5.8868321842510123e-08, + "loss": 0.6381, + "step": 27865 + }, + { + "epoch": 0.97, + "learning_rate": 5.8750405858866156e-08, + "loss": 0.6512, + "step": 27866 + }, + { + "epoch": 0.97, + "learning_rate": 5.8632607741312406e-08, + "loss": 0.6651, + "step": 27867 + }, + { + "epoch": 0.97, + "learning_rate": 5.851492749124443e-08, + "loss": 0.6756, + "step": 27868 + }, + { + "epoch": 0.97, + "learning_rate": 5.839736511005889e-08, + "loss": 0.6477, + "step": 27869 + }, + { + "epoch": 0.97, + "learning_rate": 5.8279920599148e-08, + "loss": 0.6073, + "step": 27870 + }, + { + "epoch": 0.97, + "learning_rate": 5.816259395990509e-08, + "loss": 0.5935, + "step": 27871 + }, + { + "epoch": 0.97, + "learning_rate": 5.8045385193721274e-08, + "loss": 0.6186, + "step": 27872 + }, + { + "epoch": 0.97, + "learning_rate": 5.792829430198543e-08, + "loss": 0.5859, + "step": 27873 + }, + { + "epoch": 0.97, + "learning_rate": 5.7811321286087575e-08, + "loss": 0.5552, + "step": 27874 + }, + { + "epoch": 0.97, + "learning_rate": 5.769446614741325e-08, + "loss": 0.5935, + "step": 27875 + }, + { + "epoch": 0.97, + "learning_rate": 5.757772888734803e-08, + "loss": 0.6643, + "step": 27876 + }, + { + "epoch": 0.97, + "learning_rate": 5.746110950727524e-08, + "loss": 0.6505, + "step": 27877 + }, + { + "epoch": 0.97, + "learning_rate": 5.734460800857933e-08, + "loss": 0.6557, + "step": 27878 + }, + { + "epoch": 0.97, + "learning_rate": 5.72282243926392e-08, + "loss": 0.6055, + "step": 27879 + }, + { + "epoch": 0.97, + "learning_rate": 5.7111958660837075e-08, + "loss": 0.5953, + "step": 27880 + }, + { + "epoch": 0.97, + "learning_rate": 5.6995810814551856e-08, + "loss": 0.6402, + "step": 27881 + }, + { + "epoch": 0.97, + "learning_rate": 5.6879780855158e-08, + "loss": 0.612, + "step": 27882 + }, + { + "epoch": 0.97, + "learning_rate": 5.6763868784032174e-08, + "loss": 0.5903, + "step": 27883 + }, + { + "epoch": 0.97, + "learning_rate": 5.664807460254884e-08, + "loss": 0.638, + "step": 27884 + }, + { + "epoch": 0.97, + "learning_rate": 5.653239831208135e-08, + "loss": 0.6077, + "step": 27885 + }, + { + "epoch": 0.97, + "learning_rate": 5.641683991400082e-08, + "loss": 0.6085, + "step": 27886 + }, + { + "epoch": 0.97, + "learning_rate": 5.630139940967727e-08, + "loss": 0.612, + "step": 27887 + }, + { + "epoch": 0.97, + "learning_rate": 5.618607680047961e-08, + "loss": 0.6271, + "step": 27888 + }, + { + "epoch": 0.97, + "learning_rate": 5.607087208777562e-08, + "loss": 0.6411, + "step": 27889 + }, + { + "epoch": 0.97, + "learning_rate": 5.5955785272929774e-08, + "loss": 0.6178, + "step": 27890 + }, + { + "epoch": 0.97, + "learning_rate": 5.584081635730654e-08, + "loss": 0.6116, + "step": 27891 + }, + { + "epoch": 0.97, + "learning_rate": 5.572596534227148e-08, + "loss": 0.6452, + "step": 27892 + }, + { + "epoch": 0.97, + "learning_rate": 5.561123222918463e-08, + "loss": 0.617, + "step": 27893 + }, + { + "epoch": 0.97, + "learning_rate": 5.5496617019404894e-08, + "loss": 0.6126, + "step": 27894 + }, + { + "epoch": 0.97, + "learning_rate": 5.5382119714293416e-08, + "loss": 0.623, + "step": 27895 + }, + { + "epoch": 0.97, + "learning_rate": 5.526774031520687e-08, + "loss": 0.6193, + "step": 27896 + }, + { + "epoch": 0.97, + "learning_rate": 5.515347882350197e-08, + "loss": 0.642, + "step": 27897 + }, + { + "epoch": 0.97, + "learning_rate": 5.5039335240532063e-08, + "loss": 0.6984, + "step": 27898 + }, + { + "epoch": 0.97, + "learning_rate": 5.492530956765163e-08, + "loss": 0.6223, + "step": 27899 + }, + { + "epoch": 0.97, + "learning_rate": 5.481140180621291e-08, + "loss": 0.6056, + "step": 27900 + }, + { + "epoch": 0.97, + "learning_rate": 5.469761195756485e-08, + "loss": 0.6412, + "step": 27901 + }, + { + "epoch": 0.97, + "learning_rate": 5.458394002305745e-08, + "loss": 0.6875, + "step": 27902 + }, + { + "epoch": 0.97, + "learning_rate": 5.4470386004038535e-08, + "loss": 0.6032, + "step": 27903 + }, + { + "epoch": 0.97, + "learning_rate": 5.435694990185481e-08, + "loss": 0.6533, + "step": 27904 + }, + { + "epoch": 0.97, + "learning_rate": 5.424363171785074e-08, + "loss": 0.6665, + "step": 27905 + }, + { + "epoch": 0.97, + "learning_rate": 5.413043145336972e-08, + "loss": 0.64, + "step": 27906 + }, + { + "epoch": 0.97, + "learning_rate": 5.401734910975398e-08, + "loss": 0.6549, + "step": 27907 + }, + { + "epoch": 0.97, + "learning_rate": 5.390438468834358e-08, + "loss": 0.6611, + "step": 27908 + }, + { + "epoch": 0.97, + "learning_rate": 5.3791538190479665e-08, + "loss": 0.6075, + "step": 27909 + }, + { + "epoch": 0.97, + "learning_rate": 5.367880961749894e-08, + "loss": 0.6104, + "step": 27910 + }, + { + "epoch": 0.97, + "learning_rate": 5.3566198970737e-08, + "loss": 0.6571, + "step": 27911 + }, + { + "epoch": 0.97, + "learning_rate": 5.345370625153168e-08, + "loss": 0.6592, + "step": 27912 + }, + { + "epoch": 0.97, + "learning_rate": 5.3341331461214116e-08, + "loss": 0.6909, + "step": 27913 + }, + { + "epoch": 0.97, + "learning_rate": 5.32290746011177e-08, + "loss": 0.5804, + "step": 27914 + }, + { + "epoch": 0.97, + "learning_rate": 5.311693567257248e-08, + "loss": 0.6735, + "step": 27915 + }, + { + "epoch": 0.97, + "learning_rate": 5.300491467691071e-08, + "loss": 0.624, + "step": 27916 + }, + { + "epoch": 0.97, + "learning_rate": 5.2893011615458013e-08, + "loss": 0.6425, + "step": 27917 + }, + { + "epoch": 0.97, + "learning_rate": 5.278122648954109e-08, + "loss": 0.6372, + "step": 27918 + }, + { + "epoch": 0.97, + "learning_rate": 5.266955930048778e-08, + "loss": 0.6081, + "step": 27919 + }, + { + "epoch": 0.97, + "learning_rate": 5.2558010049618134e-08, + "loss": 0.617, + "step": 27920 + }, + { + "epoch": 0.97, + "learning_rate": 5.244657873825776e-08, + "loss": 0.5647, + "step": 27921 + }, + { + "epoch": 0.97, + "learning_rate": 5.233526536772671e-08, + "loss": 0.6838, + "step": 27922 + }, + { + "epoch": 0.97, + "learning_rate": 5.222406993934504e-08, + "loss": 0.6281, + "step": 27923 + }, + { + "epoch": 0.97, + "learning_rate": 5.211299245443169e-08, + "loss": 0.6079, + "step": 27924 + }, + { + "epoch": 0.97, + "learning_rate": 5.200203291430228e-08, + "loss": 0.5762, + "step": 27925 + }, + { + "epoch": 0.97, + "learning_rate": 5.1891191320273536e-08, + "loss": 0.5933, + "step": 27926 + }, + { + "epoch": 0.97, + "learning_rate": 5.178046767365885e-08, + "loss": 0.6546, + "step": 27927 + }, + { + "epoch": 0.97, + "learning_rate": 5.1669861975771616e-08, + "loss": 0.6169, + "step": 27928 + }, + { + "epoch": 0.97, + "learning_rate": 5.15593742279219e-08, + "loss": 0.6008, + "step": 27929 + }, + { + "epoch": 0.97, + "learning_rate": 5.144900443142087e-08, + "loss": 0.6376, + "step": 27930 + }, + { + "epoch": 0.97, + "learning_rate": 5.133875258757748e-08, + "loss": 0.6372, + "step": 27931 + }, + { + "epoch": 0.97, + "learning_rate": 5.1228618697698463e-08, + "loss": 0.5421, + "step": 27932 + }, + { + "epoch": 0.97, + "learning_rate": 5.111860276308833e-08, + "loss": 0.6869, + "step": 27933 + }, + { + "epoch": 0.97, + "learning_rate": 5.100870478505382e-08, + "loss": 0.5973, + "step": 27934 + }, + { + "epoch": 0.97, + "learning_rate": 5.089892476489611e-08, + "loss": 0.6478, + "step": 27935 + }, + { + "epoch": 0.97, + "learning_rate": 5.078926270391748e-08, + "loss": 0.6287, + "step": 27936 + }, + { + "epoch": 0.97, + "learning_rate": 5.0679718603418024e-08, + "loss": 0.5933, + "step": 27937 + }, + { + "epoch": 0.97, + "learning_rate": 5.057029246469669e-08, + "loss": 0.6301, + "step": 27938 + }, + { + "epoch": 0.97, + "learning_rate": 5.0460984289049106e-08, + "loss": 0.664, + "step": 27939 + }, + { + "epoch": 0.97, + "learning_rate": 5.035179407777424e-08, + "loss": 0.6587, + "step": 27940 + }, + { + "epoch": 0.97, + "learning_rate": 5.0242721832164385e-08, + "loss": 0.6424, + "step": 27941 + }, + { + "epoch": 0.97, + "learning_rate": 5.013376755351407e-08, + "loss": 0.6562, + "step": 27942 + }, + { + "epoch": 0.97, + "learning_rate": 5.002493124311558e-08, + "loss": 0.6795, + "step": 27943 + }, + { + "epoch": 0.97, + "learning_rate": 4.991621290225679e-08, + "loss": 0.63, + "step": 27944 + }, + { + "epoch": 0.97, + "learning_rate": 4.9807612532227766e-08, + "loss": 0.5794, + "step": 27945 + }, + { + "epoch": 0.97, + "learning_rate": 4.9699130134318596e-08, + "loss": 0.613, + "step": 27946 + }, + { + "epoch": 0.97, + "learning_rate": 4.959076570981158e-08, + "loss": 0.6235, + "step": 27947 + }, + { + "epoch": 0.97, + "learning_rate": 4.948251925999459e-08, + "loss": 0.6557, + "step": 27948 + }, + { + "epoch": 0.97, + "learning_rate": 4.9374390786149914e-08, + "loss": 0.6571, + "step": 27949 + }, + { + "epoch": 0.97, + "learning_rate": 4.926638028955877e-08, + "loss": 0.619, + "step": 27950 + }, + { + "epoch": 0.97, + "learning_rate": 4.915848777150234e-08, + "loss": 0.6253, + "step": 27951 + }, + { + "epoch": 0.97, + "learning_rate": 4.9050713233259604e-08, + "loss": 0.601, + "step": 27952 + }, + { + "epoch": 0.97, + "learning_rate": 4.894305667610955e-08, + "loss": 0.6529, + "step": 27953 + }, + { + "epoch": 0.97, + "learning_rate": 4.8835518101326693e-08, + "loss": 0.6586, + "step": 27954 + }, + { + "epoch": 0.97, + "learning_rate": 4.872809751018892e-08, + "loss": 0.6297, + "step": 27955 + }, + { + "epoch": 0.97, + "learning_rate": 4.8620794903966316e-08, + "loss": 0.6246, + "step": 27956 + }, + { + "epoch": 0.97, + "learning_rate": 4.851361028393231e-08, + "loss": 0.6794, + "step": 27957 + }, + { + "epoch": 0.97, + "learning_rate": 4.8406543651360324e-08, + "loss": 0.6395, + "step": 27958 + }, + { + "epoch": 0.97, + "learning_rate": 4.8299595007516023e-08, + "loss": 0.6243, + "step": 27959 + }, + { + "epoch": 0.97, + "learning_rate": 4.8192764353668374e-08, + "loss": 0.6119, + "step": 27960 + }, + { + "epoch": 0.97, + "learning_rate": 4.808605169108638e-08, + "loss": 0.5834, + "step": 27961 + }, + { + "epoch": 0.97, + "learning_rate": 4.797945702103235e-08, + "loss": 0.634, + "step": 27962 + }, + { + "epoch": 0.97, + "learning_rate": 4.7872980344771945e-08, + "loss": 0.6923, + "step": 27963 + }, + { + "epoch": 0.97, + "learning_rate": 4.776662166356638e-08, + "loss": 0.6475, + "step": 27964 + }, + { + "epoch": 0.97, + "learning_rate": 4.766038097867687e-08, + "loss": 0.5735, + "step": 27965 + }, + { + "epoch": 0.97, + "learning_rate": 4.755425829136351e-08, + "loss": 0.639, + "step": 27966 + }, + { + "epoch": 0.97, + "learning_rate": 4.7448253602885296e-08, + "loss": 0.6549, + "step": 27967 + }, + { + "epoch": 0.97, + "learning_rate": 4.7342366914496784e-08, + "loss": 0.6488, + "step": 27968 + }, + { + "epoch": 0.97, + "learning_rate": 4.723659822745474e-08, + "loss": 0.6723, + "step": 27969 + }, + { + "epoch": 0.97, + "learning_rate": 4.7130947543013724e-08, + "loss": 0.5904, + "step": 27970 + }, + { + "epoch": 0.97, + "learning_rate": 4.702541486242496e-08, + "loss": 0.633, + "step": 27971 + }, + { + "epoch": 0.97, + "learning_rate": 4.692000018694187e-08, + "loss": 0.64, + "step": 27972 + }, + { + "epoch": 0.97, + "learning_rate": 4.6814703517812364e-08, + "loss": 0.6184, + "step": 27973 + }, + { + "epoch": 0.97, + "learning_rate": 4.670952485628433e-08, + "loss": 0.6437, + "step": 27974 + }, + { + "epoch": 0.97, + "learning_rate": 4.6604464203606756e-08, + "loss": 0.5621, + "step": 27975 + }, + { + "epoch": 0.97, + "learning_rate": 4.649952156102422e-08, + "loss": 0.5994, + "step": 27976 + }, + { + "epoch": 0.97, + "learning_rate": 4.639469692978127e-08, + "loss": 0.6075, + "step": 27977 + }, + { + "epoch": 0.97, + "learning_rate": 4.628999031112136e-08, + "loss": 0.6286, + "step": 27978 + }, + { + "epoch": 0.97, + "learning_rate": 4.618540170628349e-08, + "loss": 0.6564, + "step": 27979 + }, + { + "epoch": 0.97, + "learning_rate": 4.608093111651002e-08, + "loss": 0.5915, + "step": 27980 + }, + { + "epoch": 0.97, + "learning_rate": 4.597657854303883e-08, + "loss": 0.6829, + "step": 27981 + }, + { + "epoch": 0.97, + "learning_rate": 4.587234398710783e-08, + "loss": 0.6298, + "step": 27982 + }, + { + "epoch": 0.97, + "learning_rate": 4.576822744995158e-08, + "loss": 0.606, + "step": 27983 + }, + { + "epoch": 0.97, + "learning_rate": 4.566422893280575e-08, + "loss": 0.6504, + "step": 27984 + }, + { + "epoch": 0.97, + "learning_rate": 4.5560348436901603e-08, + "loss": 0.603, + "step": 27985 + }, + { + "epoch": 0.97, + "learning_rate": 4.545658596347258e-08, + "loss": 0.6325, + "step": 27986 + }, + { + "epoch": 0.97, + "learning_rate": 4.53529415137488e-08, + "loss": 0.6283, + "step": 27987 + }, + { + "epoch": 0.97, + "learning_rate": 4.524941508895819e-08, + "loss": 0.6052, + "step": 27988 + }, + { + "epoch": 0.97, + "learning_rate": 4.514600669032865e-08, + "loss": 0.6607, + "step": 27989 + }, + { + "epoch": 0.97, + "learning_rate": 4.504271631908586e-08, + "loss": 0.5756, + "step": 27990 + }, + { + "epoch": 0.97, + "learning_rate": 4.49395439764555e-08, + "loss": 0.6097, + "step": 27991 + }, + { + "epoch": 0.97, + "learning_rate": 4.4836489663658836e-08, + "loss": 0.6691, + "step": 27992 + }, + { + "epoch": 0.97, + "learning_rate": 4.4733553381919316e-08, + "loss": 0.613, + "step": 27993 + }, + { + "epoch": 0.97, + "learning_rate": 4.463073513245708e-08, + "loss": 0.6267, + "step": 27994 + }, + { + "epoch": 0.97, + "learning_rate": 4.452803491649227e-08, + "loss": 0.6372, + "step": 27995 + }, + { + "epoch": 0.97, + "learning_rate": 4.4425452735240574e-08, + "loss": 0.6244, + "step": 27996 + }, + { + "epoch": 0.97, + "learning_rate": 4.432298858991879e-08, + "loss": 0.6316, + "step": 27997 + }, + { + "epoch": 0.97, + "learning_rate": 4.422064248174151e-08, + "loss": 0.6934, + "step": 27998 + }, + { + "epoch": 0.97, + "learning_rate": 4.411841441192333e-08, + "loss": 0.6313, + "step": 27999 + }, + { + "epoch": 0.97, + "learning_rate": 4.401630438167548e-08, + "loss": 0.6593, + "step": 28000 + }, + { + "epoch": 0.97, + "learning_rate": 4.3914312392208116e-08, + "loss": 0.5834, + "step": 28001 + }, + { + "epoch": 0.97, + "learning_rate": 4.381243844473249e-08, + "loss": 0.6082, + "step": 28002 + }, + { + "epoch": 0.97, + "learning_rate": 4.37106825404543e-08, + "loss": 0.6565, + "step": 28003 + }, + { + "epoch": 0.97, + "learning_rate": 4.3609044680580356e-08, + "loss": 0.6597, + "step": 28004 + }, + { + "epoch": 0.97, + "learning_rate": 4.3507524866316376e-08, + "loss": 0.6416, + "step": 28005 + }, + { + "epoch": 0.97, + "learning_rate": 4.3406123098864714e-08, + "loss": 0.6556, + "step": 28006 + }, + { + "epoch": 0.97, + "learning_rate": 4.330483937942997e-08, + "loss": 0.681, + "step": 28007 + }, + { + "epoch": 0.97, + "learning_rate": 4.320367370921119e-08, + "loss": 0.6184, + "step": 28008 + }, + { + "epoch": 0.97, + "learning_rate": 4.3102626089408515e-08, + "loss": 0.6215, + "step": 28009 + }, + { + "epoch": 0.97, + "learning_rate": 4.3001696521219884e-08, + "loss": 0.6856, + "step": 28010 + }, + { + "epoch": 0.97, + "learning_rate": 4.2900885005840995e-08, + "loss": 0.6326, + "step": 28011 + }, + { + "epoch": 0.97, + "learning_rate": 4.2800191544468686e-08, + "loss": 0.6804, + "step": 28012 + }, + { + "epoch": 0.97, + "learning_rate": 4.2699616138295316e-08, + "loss": 0.6491, + "step": 28013 + }, + { + "epoch": 0.97, + "learning_rate": 4.2599158788515505e-08, + "loss": 0.6594, + "step": 28014 + }, + { + "epoch": 0.97, + "learning_rate": 4.2498819496317176e-08, + "loss": 0.6196, + "step": 28015 + }, + { + "epoch": 0.97, + "learning_rate": 4.239859826289272e-08, + "loss": 0.6553, + "step": 28016 + }, + { + "epoch": 0.97, + "learning_rate": 4.229849508942896e-08, + "loss": 0.6362, + "step": 28017 + }, + { + "epoch": 0.97, + "learning_rate": 4.219850997711272e-08, + "loss": 0.6584, + "step": 28018 + }, + { + "epoch": 0.97, + "learning_rate": 4.209864292712973e-08, + "loss": 0.6153, + "step": 28019 + }, + { + "epoch": 0.97, + "learning_rate": 4.1998893940665696e-08, + "loss": 0.6541, + "step": 28020 + }, + { + "epoch": 0.97, + "learning_rate": 4.1899263018899685e-08, + "loss": 0.6139, + "step": 28021 + }, + { + "epoch": 0.97, + "learning_rate": 4.179975016301629e-08, + "loss": 0.6004, + "step": 28022 + }, + { + "epoch": 0.97, + "learning_rate": 4.170035537419348e-08, + "loss": 0.6588, + "step": 28023 + }, + { + "epoch": 0.97, + "learning_rate": 4.1601078653610295e-08, + "loss": 0.6467, + "step": 28024 + }, + { + "epoch": 0.97, + "learning_rate": 4.150192000244469e-08, + "loss": 0.6285, + "step": 28025 + }, + { + "epoch": 0.97, + "learning_rate": 4.1402879421870154e-08, + "loss": 0.6561, + "step": 28026 + }, + { + "epoch": 0.97, + "learning_rate": 4.130395691306244e-08, + "loss": 0.6889, + "step": 28027 + }, + { + "epoch": 0.97, + "learning_rate": 4.1205152477193924e-08, + "loss": 0.6133, + "step": 28028 + }, + { + "epoch": 0.97, + "learning_rate": 4.1106466115437006e-08, + "loss": 0.6648, + "step": 28029 + }, + { + "epoch": 0.97, + "learning_rate": 4.1007897828960754e-08, + "loss": 0.7149, + "step": 28030 + }, + { + "epoch": 0.97, + "learning_rate": 4.090944761893423e-08, + "loss": 0.6398, + "step": 28031 + }, + { + "epoch": 0.97, + "learning_rate": 4.081111548652428e-08, + "loss": 0.634, + "step": 28032 + }, + { + "epoch": 0.97, + "learning_rate": 4.0712901432896636e-08, + "loss": 0.6297, + "step": 28033 + }, + { + "epoch": 0.97, + "learning_rate": 4.0614805459215925e-08, + "loss": 0.5892, + "step": 28034 + }, + { + "epoch": 0.97, + "learning_rate": 4.0516827566646764e-08, + "loss": 0.62, + "step": 28035 + }, + { + "epoch": 0.97, + "learning_rate": 4.0418967756348236e-08, + "loss": 0.6094, + "step": 28036 + }, + { + "epoch": 0.97, + "learning_rate": 4.032122602948163e-08, + "loss": 0.6546, + "step": 28037 + }, + { + "epoch": 0.97, + "learning_rate": 4.0223602387207125e-08, + "loss": 0.6542, + "step": 28038 + }, + { + "epoch": 0.97, + "learning_rate": 4.012609683068047e-08, + "loss": 0.603, + "step": 28039 + }, + { + "epoch": 0.97, + "learning_rate": 4.0028709361057406e-08, + "loss": 0.606, + "step": 28040 + }, + { + "epoch": 0.97, + "learning_rate": 3.9931439979493667e-08, + "loss": 0.6178, + "step": 28041 + }, + { + "epoch": 0.97, + "learning_rate": 3.983428868714278e-08, + "loss": 0.6587, + "step": 28042 + }, + { + "epoch": 0.97, + "learning_rate": 3.973725548515606e-08, + "loss": 0.6033, + "step": 28043 + }, + { + "epoch": 0.97, + "learning_rate": 3.964034037468367e-08, + "loss": 0.644, + "step": 28044 + }, + { + "epoch": 0.97, + "learning_rate": 3.954354335687582e-08, + "loss": 0.6112, + "step": 28045 + }, + { + "epoch": 0.97, + "learning_rate": 3.9446864432878264e-08, + "loss": 0.707, + "step": 28046 + }, + { + "epoch": 0.97, + "learning_rate": 3.9350303603838954e-08, + "loss": 0.6319, + "step": 28047 + }, + { + "epoch": 0.97, + "learning_rate": 3.925386087090144e-08, + "loss": 0.6231, + "step": 28048 + }, + { + "epoch": 0.97, + "learning_rate": 3.9157536235210346e-08, + "loss": 0.6581, + "step": 28049 + }, + { + "epoch": 0.97, + "learning_rate": 3.906132969790699e-08, + "loss": 0.6171, + "step": 28050 + }, + { + "epoch": 0.97, + "learning_rate": 3.896524126013268e-08, + "loss": 0.6901, + "step": 28051 + }, + { + "epoch": 0.97, + "learning_rate": 3.886927092302539e-08, + "loss": 0.6054, + "step": 28052 + }, + { + "epoch": 0.97, + "learning_rate": 3.8773418687724215e-08, + "loss": 0.6684, + "step": 28053 + }, + { + "epoch": 0.97, + "learning_rate": 3.8677684555364917e-08, + "loss": 0.6433, + "step": 28054 + }, + { + "epoch": 0.97, + "learning_rate": 3.858206852708324e-08, + "loss": 0.7306, + "step": 28055 + }, + { + "epoch": 0.97, + "learning_rate": 3.848657060401273e-08, + "loss": 0.6014, + "step": 28056 + }, + { + "epoch": 0.97, + "learning_rate": 3.83911907872847e-08, + "loss": 0.5954, + "step": 28057 + }, + { + "epoch": 0.97, + "learning_rate": 3.829592907803048e-08, + "loss": 0.5734, + "step": 28058 + }, + { + "epoch": 0.97, + "learning_rate": 3.820078547737915e-08, + "loss": 0.6428, + "step": 28059 + }, + { + "epoch": 0.97, + "learning_rate": 3.810575998645982e-08, + "loss": 0.6075, + "step": 28060 + }, + { + "epoch": 0.97, + "learning_rate": 3.8010852606399365e-08, + "loss": 0.6521, + "step": 28061 + }, + { + "epoch": 0.97, + "learning_rate": 3.791606333832132e-08, + "loss": 0.6249, + "step": 28062 + }, + { + "epoch": 0.97, + "learning_rate": 3.7821392183350344e-08, + "loss": 0.6241, + "step": 28063 + }, + { + "epoch": 0.97, + "learning_rate": 3.7726839142609997e-08, + "loss": 0.6429, + "step": 28064 + }, + { + "epoch": 0.97, + "learning_rate": 3.763240421721937e-08, + "loss": 0.6431, + "step": 28065 + }, + { + "epoch": 0.97, + "learning_rate": 3.7538087408299784e-08, + "loss": 0.6297, + "step": 28066 + }, + { + "epoch": 0.97, + "learning_rate": 3.744388871696814e-08, + "loss": 0.6198, + "step": 28067 + }, + { + "epoch": 0.97, + "learning_rate": 3.7349808144342413e-08, + "loss": 0.6143, + "step": 28068 + }, + { + "epoch": 0.97, + "learning_rate": 3.7255845691536174e-08, + "loss": 0.6496, + "step": 28069 + }, + { + "epoch": 0.97, + "learning_rate": 3.71620013596663e-08, + "loss": 0.6039, + "step": 28070 + }, + { + "epoch": 0.97, + "learning_rate": 3.7068275149843017e-08, + "loss": 0.6474, + "step": 28071 + }, + { + "epoch": 0.97, + "learning_rate": 3.697466706317876e-08, + "loss": 0.5835, + "step": 28072 + }, + { + "epoch": 0.97, + "learning_rate": 3.688117710078376e-08, + "loss": 0.6108, + "step": 28073 + }, + { + "epoch": 0.97, + "learning_rate": 3.678780526376602e-08, + "loss": 0.6638, + "step": 28074 + }, + { + "epoch": 0.97, + "learning_rate": 3.6694551553231315e-08, + "loss": 0.6495, + "step": 28075 + }, + { + "epoch": 0.97, + "learning_rate": 3.6601415970286546e-08, + "loss": 0.6149, + "step": 28076 + }, + { + "epoch": 0.97, + "learning_rate": 3.650839851603638e-08, + "loss": 0.6211, + "step": 28077 + }, + { + "epoch": 0.97, + "learning_rate": 3.641549919158216e-08, + "loss": 0.5779, + "step": 28078 + }, + { + "epoch": 0.97, + "learning_rate": 3.632271799802634e-08, + "loss": 0.6317, + "step": 28079 + }, + { + "epoch": 0.97, + "learning_rate": 3.6230054936469136e-08, + "loss": 0.6456, + "step": 28080 + }, + { + "epoch": 0.97, + "learning_rate": 3.613751000800969e-08, + "loss": 0.5978, + "step": 28081 + }, + { + "epoch": 0.97, + "learning_rate": 3.604508321374267e-08, + "loss": 0.5957, + "step": 28082 + }, + { + "epoch": 0.97, + "learning_rate": 3.59527745547672e-08, + "loss": 0.6236, + "step": 28083 + }, + { + "epoch": 0.97, + "learning_rate": 3.586058403217574e-08, + "loss": 0.6278, + "step": 28084 + }, + { + "epoch": 0.97, + "learning_rate": 3.5768511647061856e-08, + "loss": 0.631, + "step": 28085 + }, + { + "epoch": 0.97, + "learning_rate": 3.567655740051579e-08, + "loss": 0.6197, + "step": 28086 + }, + { + "epoch": 0.97, + "learning_rate": 3.558472129363e-08, + "loss": 0.599, + "step": 28087 + }, + { + "epoch": 0.97, + "learning_rate": 3.54930033274925e-08, + "loss": 0.6759, + "step": 28088 + }, + { + "epoch": 0.97, + "learning_rate": 3.5401403503191324e-08, + "loss": 0.693, + "step": 28089 + }, + { + "epoch": 0.97, + "learning_rate": 3.5309921821811146e-08, + "loss": 0.6258, + "step": 28090 + }, + { + "epoch": 0.97, + "learning_rate": 3.521855828443665e-08, + "loss": 0.6131, + "step": 28091 + }, + { + "epoch": 0.97, + "learning_rate": 3.512731289215254e-08, + "loss": 0.613, + "step": 28092 + }, + { + "epoch": 0.97, + "learning_rate": 3.5036185646039056e-08, + "loss": 0.6357, + "step": 28093 + }, + { + "epoch": 0.97, + "learning_rate": 3.494517654717755e-08, + "loss": 0.559, + "step": 28094 + }, + { + "epoch": 0.97, + "learning_rate": 3.4854285596647166e-08, + "loss": 0.656, + "step": 28095 + }, + { + "epoch": 0.97, + "learning_rate": 3.476351279552481e-08, + "loss": 0.6059, + "step": 28096 + }, + { + "epoch": 0.97, + "learning_rate": 3.467285814488741e-08, + "loss": 0.6555, + "step": 28097 + }, + { + "epoch": 0.97, + "learning_rate": 3.458232164580966e-08, + "loss": 0.618, + "step": 28098 + }, + { + "epoch": 0.97, + "learning_rate": 3.449190329936403e-08, + "loss": 0.6266, + "step": 28099 + }, + { + "epoch": 0.97, + "learning_rate": 3.4401603106624106e-08, + "loss": 0.6288, + "step": 28100 + }, + { + "epoch": 0.97, + "learning_rate": 3.4311421068659035e-08, + "loss": 0.6979, + "step": 28101 + }, + { + "epoch": 0.97, + "learning_rate": 3.422135718653907e-08, + "loss": 0.6442, + "step": 28102 + }, + { + "epoch": 0.97, + "learning_rate": 3.413141146133225e-08, + "loss": 0.5877, + "step": 28103 + }, + { + "epoch": 0.97, + "learning_rate": 3.404158389410328e-08, + "loss": 0.6353, + "step": 28104 + }, + { + "epoch": 0.97, + "learning_rate": 3.3951874485919076e-08, + "loss": 0.6046, + "step": 28105 + }, + { + "epoch": 0.97, + "learning_rate": 3.386228323784213e-08, + "loss": 0.6332, + "step": 28106 + }, + { + "epoch": 0.97, + "learning_rate": 3.377281015093492e-08, + "loss": 0.5879, + "step": 28107 + }, + { + "epoch": 0.97, + "learning_rate": 3.368345522625993e-08, + "loss": 0.6426, + "step": 28108 + }, + { + "epoch": 0.97, + "learning_rate": 3.359421846487298e-08, + "loss": 0.6429, + "step": 28109 + }, + { + "epoch": 0.97, + "learning_rate": 3.350509986783546e-08, + "loss": 0.6812, + "step": 28110 + }, + { + "epoch": 0.97, + "learning_rate": 3.341609943620206e-08, + "loss": 0.6233, + "step": 28111 + }, + { + "epoch": 0.97, + "learning_rate": 3.33272171710286e-08, + "loss": 0.6389, + "step": 28112 + }, + { + "epoch": 0.97, + "learning_rate": 3.32384530733687e-08, + "loss": 0.5806, + "step": 28113 + }, + { + "epoch": 0.97, + "learning_rate": 3.314980714427596e-08, + "loss": 0.6903, + "step": 28114 + }, + { + "epoch": 0.97, + "learning_rate": 3.3061279384799524e-08, + "loss": 0.6197, + "step": 28115 + }, + { + "epoch": 0.97, + "learning_rate": 3.2972869795989684e-08, + "loss": 0.6441, + "step": 28116 + }, + { + "epoch": 0.97, + "learning_rate": 3.288457837889558e-08, + "loss": 0.6756, + "step": 28117 + }, + { + "epoch": 0.97, + "learning_rate": 3.279640513456306e-08, + "loss": 0.6547, + "step": 28118 + }, + { + "epoch": 0.97, + "learning_rate": 3.270835006403683e-08, + "loss": 0.639, + "step": 28119 + }, + { + "epoch": 0.97, + "learning_rate": 3.262041316836384e-08, + "loss": 0.557, + "step": 28120 + }, + { + "epoch": 0.97, + "learning_rate": 3.2532594448583256e-08, + "loss": 0.5904, + "step": 28121 + }, + { + "epoch": 0.97, + "learning_rate": 3.244489390573757e-08, + "loss": 0.5806, + "step": 28122 + }, + { + "epoch": 0.97, + "learning_rate": 3.235731154086708e-08, + "loss": 0.6929, + "step": 28123 + }, + { + "epoch": 0.97, + "learning_rate": 3.226984735500871e-08, + "loss": 0.6341, + "step": 28124 + }, + { + "epoch": 0.97, + "learning_rate": 3.218250134920164e-08, + "loss": 0.6335, + "step": 28125 + }, + { + "epoch": 0.97, + "learning_rate": 3.2095273524480605e-08, + "loss": 0.6005, + "step": 28126 + }, + { + "epoch": 0.97, + "learning_rate": 3.2008163881879215e-08, + "loss": 0.6604, + "step": 28127 + }, + { + "epoch": 0.97, + "learning_rate": 3.192117242242998e-08, + "loss": 0.6241, + "step": 28128 + }, + { + "epoch": 0.97, + "learning_rate": 3.18342991471654e-08, + "loss": 0.56, + "step": 28129 + }, + { + "epoch": 0.97, + "learning_rate": 3.174754405711578e-08, + "loss": 0.625, + "step": 28130 + }, + { + "epoch": 0.97, + "learning_rate": 3.166090715330805e-08, + "loss": 0.6351, + "step": 28131 + }, + { + "epoch": 0.97, + "learning_rate": 3.1574388436770296e-08, + "loss": 0.5887, + "step": 28132 + }, + { + "epoch": 0.97, + "learning_rate": 3.148798790852836e-08, + "loss": 0.614, + "step": 28133 + }, + { + "epoch": 0.97, + "learning_rate": 3.140170556960698e-08, + "loss": 0.6372, + "step": 28134 + }, + { + "epoch": 0.97, + "learning_rate": 3.131554142102866e-08, + "loss": 0.5924, + "step": 28135 + }, + { + "epoch": 0.97, + "learning_rate": 3.122949546381482e-08, + "loss": 0.6266, + "step": 28136 + }, + { + "epoch": 0.97, + "learning_rate": 3.1143567698985745e-08, + "loss": 0.6004, + "step": 28137 + }, + { + "epoch": 0.97, + "learning_rate": 3.105775812756062e-08, + "loss": 0.6235, + "step": 28138 + }, + { + "epoch": 0.97, + "learning_rate": 3.097206675055642e-08, + "loss": 0.5666, + "step": 28139 + }, + { + "epoch": 0.97, + "learning_rate": 3.088649356898899e-08, + "loss": 0.6149, + "step": 28140 + }, + { + "epoch": 0.98, + "learning_rate": 3.080103858387306e-08, + "loss": 0.6079, + "step": 28141 + }, + { + "epoch": 0.98, + "learning_rate": 3.0715701796222295e-08, + "loss": 0.6331, + "step": 28142 + }, + { + "epoch": 0.98, + "learning_rate": 3.063048320704809e-08, + "loss": 0.6403, + "step": 28143 + }, + { + "epoch": 0.98, + "learning_rate": 3.0545382817360744e-08, + "loss": 0.5923, + "step": 28144 + }, + { + "epoch": 0.98, + "learning_rate": 3.0460400628169465e-08, + "loss": 0.6324, + "step": 28145 + }, + { + "epoch": 0.98, + "learning_rate": 3.037553664048121e-08, + "loss": 0.6284, + "step": 28146 + }, + { + "epoch": 0.98, + "learning_rate": 3.029079085530407e-08, + "loss": 0.6388, + "step": 28147 + }, + { + "epoch": 0.98, + "learning_rate": 3.0206163273639455e-08, + "loss": 0.5888, + "step": 28148 + }, + { + "epoch": 0.98, + "learning_rate": 3.012165389649435e-08, + "loss": 0.6667, + "step": 28149 + }, + { + "epoch": 0.98, + "learning_rate": 3.0037262724867957e-08, + "loss": 0.6239, + "step": 28150 + }, + { + "epoch": 0.98, + "learning_rate": 2.9952989759761684e-08, + "loss": 0.651, + "step": 28151 + }, + { + "epoch": 0.98, + "learning_rate": 2.986883500217475e-08, + "loss": 0.6098, + "step": 28152 + }, + { + "epoch": 0.98, + "learning_rate": 2.9784798453106332e-08, + "loss": 0.5797, + "step": 28153 + }, + { + "epoch": 0.98, + "learning_rate": 2.97008801135501e-08, + "loss": 0.6528, + "step": 28154 + }, + { + "epoch": 0.98, + "learning_rate": 2.9617079984503028e-08, + "loss": 0.6272, + "step": 28155 + }, + { + "epoch": 0.98, + "learning_rate": 2.9533398066957652e-08, + "loss": 0.6359, + "step": 28156 + }, + { + "epoch": 0.98, + "learning_rate": 2.9449834361907624e-08, + "loss": 0.6321, + "step": 28157 + }, + { + "epoch": 0.98, + "learning_rate": 2.9366388870342157e-08, + "loss": 0.6392, + "step": 28158 + }, + { + "epoch": 0.98, + "learning_rate": 2.928306159325045e-08, + "loss": 0.6362, + "step": 28159 + }, + { + "epoch": 0.98, + "learning_rate": 2.919985253162172e-08, + "loss": 0.5915, + "step": 28160 + }, + { + "epoch": 0.98, + "learning_rate": 2.9116761686441842e-08, + "loss": 0.6651, + "step": 28161 + }, + { + "epoch": 0.98, + "learning_rate": 2.9033789058695584e-08, + "loss": 0.5789, + "step": 28162 + }, + { + "epoch": 0.98, + "learning_rate": 2.8950934649366603e-08, + "loss": 0.6223, + "step": 28163 + }, + { + "epoch": 0.98, + "learning_rate": 2.8868198459439668e-08, + "loss": 0.6748, + "step": 28164 + }, + { + "epoch": 0.98, + "learning_rate": 2.8785580489891774e-08, + "loss": 0.5843, + "step": 28165 + }, + { + "epoch": 0.98, + "learning_rate": 2.870308074170547e-08, + "loss": 0.6524, + "step": 28166 + }, + { + "epoch": 0.98, + "learning_rate": 2.862069921585775e-08, + "loss": 0.5715, + "step": 28167 + }, + { + "epoch": 0.98, + "learning_rate": 2.8538435913325614e-08, + "loss": 0.6201, + "step": 28168 + }, + { + "epoch": 0.98, + "learning_rate": 2.8456290835083834e-08, + "loss": 0.6673, + "step": 28169 + }, + { + "epoch": 0.98, + "learning_rate": 2.8374263982107188e-08, + "loss": 0.6236, + "step": 28170 + }, + { + "epoch": 0.98, + "learning_rate": 2.8292355355367118e-08, + "loss": 0.6176, + "step": 28171 + }, + { + "epoch": 0.98, + "learning_rate": 2.8210564955836182e-08, + "loss": 0.6415, + "step": 28172 + }, + { + "epoch": 0.98, + "learning_rate": 2.812889278448361e-08, + "loss": 0.578, + "step": 28173 + }, + { + "epoch": 0.98, + "learning_rate": 2.8047338842276396e-08, + "loss": 0.6248, + "step": 28174 + }, + { + "epoch": 0.98, + "learning_rate": 2.796590313018377e-08, + "loss": 0.6093, + "step": 28175 + }, + { + "epoch": 0.98, + "learning_rate": 2.7884585649169404e-08, + "loss": 0.6385, + "step": 28176 + }, + { + "epoch": 0.98, + "learning_rate": 2.7803386400198085e-08, + "loss": 0.6322, + "step": 28177 + }, + { + "epoch": 0.98, + "learning_rate": 2.7722305384232372e-08, + "loss": 0.6489, + "step": 28178 + }, + { + "epoch": 0.98, + "learning_rate": 2.7641342602234833e-08, + "loss": 0.5864, + "step": 28179 + }, + { + "epoch": 0.98, + "learning_rate": 2.7560498055163586e-08, + "loss": 0.6309, + "step": 28180 + }, + { + "epoch": 0.98, + "learning_rate": 2.7479771743976756e-08, + "loss": 0.5959, + "step": 28181 + }, + { + "epoch": 0.98, + "learning_rate": 2.7399163669634686e-08, + "loss": 0.5952, + "step": 28182 + }, + { + "epoch": 0.98, + "learning_rate": 2.731867383308884e-08, + "loss": 0.5874, + "step": 28183 + }, + { + "epoch": 0.98, + "learning_rate": 2.7238302235296223e-08, + "loss": 0.6611, + "step": 28184 + }, + { + "epoch": 0.98, + "learning_rate": 2.715804887720941e-08, + "loss": 0.5486, + "step": 28185 + }, + { + "epoch": 0.98, + "learning_rate": 2.707791375977986e-08, + "loss": 0.642, + "step": 28186 + }, + { + "epoch": 0.98, + "learning_rate": 2.699789688395793e-08, + "loss": 0.6064, + "step": 28187 + }, + { + "epoch": 0.98, + "learning_rate": 2.6917998250690636e-08, + "loss": 0.6259, + "step": 28188 + }, + { + "epoch": 0.98, + "learning_rate": 2.6838217860927217e-08, + "loss": 0.6322, + "step": 28189 + }, + { + "epoch": 0.98, + "learning_rate": 2.675855571561248e-08, + "loss": 0.6303, + "step": 28190 + }, + { + "epoch": 0.98, + "learning_rate": 2.6679011815691213e-08, + "loss": 0.6373, + "step": 28191 + }, + { + "epoch": 0.98, + "learning_rate": 2.6599586162107115e-08, + "loss": 0.6035, + "step": 28192 + }, + { + "epoch": 0.98, + "learning_rate": 2.6520278755800545e-08, + "loss": 0.6698, + "step": 28193 + }, + { + "epoch": 0.98, + "learning_rate": 2.6441089597714077e-08, + "loss": 0.6287, + "step": 28194 + }, + { + "epoch": 0.98, + "learning_rate": 2.6362018688783632e-08, + "loss": 0.5971, + "step": 28195 + }, + { + "epoch": 0.98, + "learning_rate": 2.6283066029948457e-08, + "loss": 0.5887, + "step": 28196 + }, + { + "epoch": 0.98, + "learning_rate": 2.620423162214447e-08, + "loss": 0.6369, + "step": 28197 + }, + { + "epoch": 0.98, + "learning_rate": 2.6125515466306483e-08, + "loss": 0.6916, + "step": 28198 + }, + { + "epoch": 0.98, + "learning_rate": 2.604691756336708e-08, + "loss": 0.6508, + "step": 28199 + }, + { + "epoch": 0.98, + "learning_rate": 2.5968437914258847e-08, + "loss": 0.6292, + "step": 28200 + }, + { + "epoch": 0.98, + "learning_rate": 2.5890076519912155e-08, + "loss": 0.5955, + "step": 28201 + }, + { + "epoch": 0.98, + "learning_rate": 2.5811833381256256e-08, + "loss": 0.5989, + "step": 28202 + }, + { + "epoch": 0.98, + "learning_rate": 2.573370849921819e-08, + "loss": 0.6607, + "step": 28203 + }, + { + "epoch": 0.98, + "learning_rate": 2.5655701874723883e-08, + "loss": 0.6538, + "step": 28204 + }, + { + "epoch": 0.98, + "learning_rate": 2.5577813508699258e-08, + "loss": 0.6581, + "step": 28205 + }, + { + "epoch": 0.98, + "learning_rate": 2.5500043402068018e-08, + "loss": 0.6811, + "step": 28206 + }, + { + "epoch": 0.98, + "learning_rate": 2.542239155575055e-08, + "loss": 0.6678, + "step": 28207 + }, + { + "epoch": 0.98, + "learning_rate": 2.5344857970668325e-08, + "loss": 0.6011, + "step": 28208 + }, + { + "epoch": 0.98, + "learning_rate": 2.5267442647741724e-08, + "loss": 0.6624, + "step": 28209 + }, + { + "epoch": 0.98, + "learning_rate": 2.5190145587887792e-08, + "loss": 0.6347, + "step": 28210 + }, + { + "epoch": 0.98, + "learning_rate": 2.5112966792022466e-08, + "loss": 0.6316, + "step": 28211 + }, + { + "epoch": 0.98, + "learning_rate": 2.503590626106056e-08, + "loss": 0.6581, + "step": 28212 + }, + { + "epoch": 0.98, + "learning_rate": 2.4958963995918016e-08, + "loss": 0.6597, + "step": 28213 + }, + { + "epoch": 0.98, + "learning_rate": 2.4882139997504107e-08, + "loss": 0.6303, + "step": 28214 + }, + { + "epoch": 0.98, + "learning_rate": 2.480543426673143e-08, + "loss": 0.6101, + "step": 28215 + }, + { + "epoch": 0.98, + "learning_rate": 2.4728846804508154e-08, + "loss": 0.5769, + "step": 28216 + }, + { + "epoch": 0.98, + "learning_rate": 2.465237761174466e-08, + "loss": 0.5982, + "step": 28217 + }, + { + "epoch": 0.98, + "learning_rate": 2.4576026689345776e-08, + "loss": 0.6865, + "step": 28218 + }, + { + "epoch": 0.98, + "learning_rate": 2.449979403821634e-08, + "loss": 0.6093, + "step": 28219 + }, + { + "epoch": 0.98, + "learning_rate": 2.442367965926118e-08, + "loss": 0.6093, + "step": 28220 + }, + { + "epoch": 0.98, + "learning_rate": 2.4347683553382906e-08, + "loss": 0.6699, + "step": 28221 + }, + { + "epoch": 0.98, + "learning_rate": 2.427180572148191e-08, + "loss": 0.6841, + "step": 28222 + }, + { + "epoch": 0.98, + "learning_rate": 2.4196046164457477e-08, + "loss": 0.5661, + "step": 28223 + }, + { + "epoch": 0.98, + "learning_rate": 2.412040488320888e-08, + "loss": 0.6354, + "step": 28224 + }, + { + "epoch": 0.98, + "learning_rate": 2.4044881878633185e-08, + "loss": 0.6161, + "step": 28225 + }, + { + "epoch": 0.98, + "learning_rate": 2.396947715162412e-08, + "loss": 0.6634, + "step": 28226 + }, + { + "epoch": 0.98, + "learning_rate": 2.3894190703076525e-08, + "loss": 0.5843, + "step": 28227 + }, + { + "epoch": 0.98, + "learning_rate": 2.3819022533883017e-08, + "loss": 0.6183, + "step": 28228 + }, + { + "epoch": 0.98, + "learning_rate": 2.3743972644936218e-08, + "loss": 0.6369, + "step": 28229 + }, + { + "epoch": 0.98, + "learning_rate": 2.3669041037123196e-08, + "loss": 0.6155, + "step": 28230 + }, + { + "epoch": 0.98, + "learning_rate": 2.359422771133435e-08, + "loss": 0.6255, + "step": 28231 + }, + { + "epoch": 0.98, + "learning_rate": 2.3519532668456748e-08, + "loss": 0.5967, + "step": 28232 + }, + { + "epoch": 0.98, + "learning_rate": 2.3444955909374124e-08, + "loss": 0.6319, + "step": 28233 + }, + { + "epoch": 0.98, + "learning_rate": 2.337049743497244e-08, + "loss": 0.6119, + "step": 28234 + }, + { + "epoch": 0.98, + "learning_rate": 2.329615724613432e-08, + "loss": 0.6175, + "step": 28235 + }, + { + "epoch": 0.98, + "learning_rate": 2.3221935343741286e-08, + "loss": 0.5878, + "step": 28236 + }, + { + "epoch": 0.98, + "learning_rate": 2.3147831728672632e-08, + "loss": 0.5933, + "step": 28237 + }, + { + "epoch": 0.98, + "learning_rate": 2.3073846401806542e-08, + "loss": 0.6492, + "step": 28238 + }, + { + "epoch": 0.98, + "learning_rate": 2.2999979364021208e-08, + "loss": 0.5737, + "step": 28239 + }, + { + "epoch": 0.98, + "learning_rate": 2.292623061619259e-08, + "loss": 0.5918, + "step": 28240 + }, + { + "epoch": 0.98, + "learning_rate": 2.2852600159194437e-08, + "loss": 0.6253, + "step": 28241 + }, + { + "epoch": 0.98, + "learning_rate": 2.2779087993899384e-08, + "loss": 0.6438, + "step": 28242 + }, + { + "epoch": 0.98, + "learning_rate": 2.2705694121178955e-08, + "loss": 0.6781, + "step": 28243 + }, + { + "epoch": 0.98, + "learning_rate": 2.263241854190468e-08, + "loss": 0.6094, + "step": 28244 + }, + { + "epoch": 0.98, + "learning_rate": 2.2559261256944742e-08, + "loss": 0.5883, + "step": 28245 + }, + { + "epoch": 0.98, + "learning_rate": 2.2486222267166237e-08, + "loss": 0.6497, + "step": 28246 + }, + { + "epoch": 0.98, + "learning_rate": 2.241330157343513e-08, + "loss": 0.6007, + "step": 28247 + }, + { + "epoch": 0.98, + "learning_rate": 2.234049917661518e-08, + "loss": 0.5793, + "step": 28248 + }, + { + "epoch": 0.98, + "learning_rate": 2.2267815077571253e-08, + "loss": 0.646, + "step": 28249 + }, + { + "epoch": 0.98, + "learning_rate": 2.2195249277163766e-08, + "loss": 0.6486, + "step": 28250 + }, + { + "epoch": 0.98, + "learning_rate": 2.2122801776254254e-08, + "loss": 0.6219, + "step": 28251 + }, + { + "epoch": 0.98, + "learning_rate": 2.2050472575700922e-08, + "loss": 0.6404, + "step": 28252 + }, + { + "epoch": 0.98, + "learning_rate": 2.1978261676360858e-08, + "loss": 0.6614, + "step": 28253 + }, + { + "epoch": 0.98, + "learning_rate": 2.1906169079091154e-08, + "loss": 0.6267, + "step": 28254 + }, + { + "epoch": 0.98, + "learning_rate": 2.1834194784746688e-08, + "loss": 0.6183, + "step": 28255 + }, + { + "epoch": 0.98, + "learning_rate": 2.1762338794178993e-08, + "loss": 0.6172, + "step": 28256 + }, + { + "epoch": 0.98, + "learning_rate": 2.1690601108241838e-08, + "loss": 0.5989, + "step": 28257 + }, + { + "epoch": 0.98, + "learning_rate": 2.1618981727785648e-08, + "loss": 0.6468, + "step": 28258 + }, + { + "epoch": 0.98, + "learning_rate": 2.1547480653659748e-08, + "loss": 0.5957, + "step": 28259 + }, + { + "epoch": 0.98, + "learning_rate": 2.1476097886710122e-08, + "loss": 0.6419, + "step": 28260 + }, + { + "epoch": 0.98, + "learning_rate": 2.140483342778499e-08, + "loss": 0.5833, + "step": 28261 + }, + { + "epoch": 0.98, + "learning_rate": 2.1333687277727e-08, + "loss": 0.6629, + "step": 28262 + }, + { + "epoch": 0.98, + "learning_rate": 2.126265943738326e-08, + "loss": 0.6332, + "step": 28263 + }, + { + "epoch": 0.98, + "learning_rate": 2.1191749907591986e-08, + "loss": 0.6001, + "step": 28264 + }, + { + "epoch": 0.98, + "learning_rate": 2.1120958689196948e-08, + "loss": 0.6187, + "step": 28265 + }, + { + "epoch": 0.98, + "learning_rate": 2.105028578303636e-08, + "loss": 0.669, + "step": 28266 + }, + { + "epoch": 0.98, + "learning_rate": 2.097973118994845e-08, + "loss": 0.6471, + "step": 28267 + }, + { + "epoch": 0.98, + "learning_rate": 2.0909294910768097e-08, + "loss": 0.6517, + "step": 28268 + }, + { + "epoch": 0.98, + "learning_rate": 2.083897694633241e-08, + "loss": 0.631, + "step": 28269 + }, + { + "epoch": 0.98, + "learning_rate": 2.0768777297474064e-08, + "loss": 0.6601, + "step": 28270 + }, + { + "epoch": 0.98, + "learning_rate": 2.0698695965025716e-08, + "loss": 0.6119, + "step": 28271 + }, + { + "epoch": 0.98, + "learning_rate": 2.062873294981893e-08, + "loss": 0.592, + "step": 28272 + }, + { + "epoch": 0.98, + "learning_rate": 2.055888825268193e-08, + "loss": 0.6639, + "step": 28273 + }, + { + "epoch": 0.98, + "learning_rate": 2.048916187444294e-08, + "loss": 0.6188, + "step": 28274 + }, + { + "epoch": 0.98, + "learning_rate": 2.0419553815929083e-08, + "loss": 0.642, + "step": 28275 + }, + { + "epoch": 0.98, + "learning_rate": 2.035006407796636e-08, + "loss": 0.6065, + "step": 28276 + }, + { + "epoch": 0.98, + "learning_rate": 2.0280692661377443e-08, + "loss": 0.6581, + "step": 28277 + }, + { + "epoch": 0.98, + "learning_rate": 2.0211439566986123e-08, + "loss": 0.6707, + "step": 28278 + }, + { + "epoch": 0.98, + "learning_rate": 2.0142304795611745e-08, + "loss": 0.6306, + "step": 28279 + }, + { + "epoch": 0.98, + "learning_rate": 2.007328834807476e-08, + "loss": 0.6442, + "step": 28280 + }, + { + "epoch": 0.98, + "learning_rate": 2.0004390225194516e-08, + "loss": 0.6149, + "step": 28281 + }, + { + "epoch": 0.98, + "learning_rate": 1.993561042778702e-08, + "loss": 0.7116, + "step": 28282 + }, + { + "epoch": 0.98, + "learning_rate": 1.9866948956667186e-08, + "loss": 0.5911, + "step": 28283 + }, + { + "epoch": 0.98, + "learning_rate": 1.9798405812648803e-08, + "loss": 0.6028, + "step": 28284 + }, + { + "epoch": 0.98, + "learning_rate": 1.972998099654677e-08, + "loss": 0.6076, + "step": 28285 + }, + { + "epoch": 0.98, + "learning_rate": 1.9661674509170447e-08, + "loss": 0.6745, + "step": 28286 + }, + { + "epoch": 0.98, + "learning_rate": 1.9593486351329184e-08, + "loss": 0.6041, + "step": 28287 + }, + { + "epoch": 0.98, + "learning_rate": 1.952541652383344e-08, + "loss": 0.6608, + "step": 28288 + }, + { + "epoch": 0.98, + "learning_rate": 1.9457465027489243e-08, + "loss": 0.5779, + "step": 28289 + }, + { + "epoch": 0.98, + "learning_rate": 1.938963186310261e-08, + "loss": 0.5874, + "step": 28290 + }, + { + "epoch": 0.98, + "learning_rate": 1.9321917031476233e-08, + "loss": 0.6641, + "step": 28291 + }, + { + "epoch": 0.98, + "learning_rate": 1.9254320533415026e-08, + "loss": 0.6896, + "step": 28292 + }, + { + "epoch": 0.98, + "learning_rate": 1.918684236971946e-08, + "loss": 0.6146, + "step": 28293 + }, + { + "epoch": 0.98, + "learning_rate": 1.9119482541190005e-08, + "loss": 0.6478, + "step": 28294 + }, + { + "epoch": 0.98, + "learning_rate": 1.9052241048624907e-08, + "loss": 0.6505, + "step": 28295 + }, + { + "epoch": 0.98, + "learning_rate": 1.8985117892820205e-08, + "loss": 0.5918, + "step": 28296 + }, + { + "epoch": 0.98, + "learning_rate": 1.891811307457414e-08, + "loss": 0.5845, + "step": 28297 + }, + { + "epoch": 0.98, + "learning_rate": 1.8851226594679416e-08, + "loss": 0.6209, + "step": 28298 + }, + { + "epoch": 0.98, + "learning_rate": 1.8784458453929845e-08, + "loss": 0.6682, + "step": 28299 + }, + { + "epoch": 0.98, + "learning_rate": 1.871780865311812e-08, + "loss": 0.6415, + "step": 28300 + }, + { + "epoch": 0.98, + "learning_rate": 1.8651277193031392e-08, + "loss": 0.6546, + "step": 28301 + }, + { + "epoch": 0.98, + "learning_rate": 1.858486407446125e-08, + "loss": 0.5951, + "step": 28302 + }, + { + "epoch": 0.98, + "learning_rate": 1.8518569298192622e-08, + "loss": 0.6298, + "step": 28303 + }, + { + "epoch": 0.98, + "learning_rate": 1.845239286501488e-08, + "loss": 0.6364, + "step": 28304 + }, + { + "epoch": 0.98, + "learning_rate": 1.8386334775709614e-08, + "loss": 0.5829, + "step": 28305 + }, + { + "epoch": 0.98, + "learning_rate": 1.8320395031061755e-08, + "loss": 0.6717, + "step": 28306 + }, + { + "epoch": 0.98, + "learning_rate": 1.825457363185179e-08, + "loss": 0.7132, + "step": 28307 + }, + { + "epoch": 0.98, + "learning_rate": 1.8188870578861317e-08, + "loss": 0.661, + "step": 28308 + }, + { + "epoch": 0.98, + "learning_rate": 1.81232858728686e-08, + "loss": 0.6154, + "step": 28309 + }, + { + "epoch": 0.98, + "learning_rate": 1.805781951465191e-08, + "loss": 0.6504, + "step": 28310 + }, + { + "epoch": 0.98, + "learning_rate": 1.7992471504986175e-08, + "loss": 0.6004, + "step": 28311 + }, + { + "epoch": 0.98, + "learning_rate": 1.7927241844647447e-08, + "loss": 0.6056, + "step": 28312 + }, + { + "epoch": 0.98, + "learning_rate": 1.786213053440955e-08, + "loss": 0.5955, + "step": 28313 + }, + { + "epoch": 0.98, + "learning_rate": 1.7797137575041868e-08, + "loss": 0.6749, + "step": 28314 + }, + { + "epoch": 0.98, + "learning_rate": 1.7732262967318227e-08, + "loss": 0.6553, + "step": 28315 + }, + { + "epoch": 0.98, + "learning_rate": 1.766750671200468e-08, + "loss": 0.6761, + "step": 28316 + }, + { + "epoch": 0.98, + "learning_rate": 1.760286880987172e-08, + "loss": 0.5783, + "step": 28317 + }, + { + "epoch": 0.98, + "learning_rate": 1.7538349261684294e-08, + "loss": 0.6433, + "step": 28318 + }, + { + "epoch": 0.98, + "learning_rate": 1.7473948068207346e-08, + "loss": 0.6567, + "step": 28319 + }, + { + "epoch": 0.98, + "learning_rate": 1.7409665230205818e-08, + "loss": 0.5975, + "step": 28320 + }, + { + "epoch": 0.98, + "learning_rate": 1.7345500748439104e-08, + "loss": 0.6318, + "step": 28321 + }, + { + "epoch": 0.98, + "learning_rate": 1.7281454623671034e-08, + "loss": 0.6654, + "step": 28322 + }, + { + "epoch": 0.98, + "learning_rate": 1.7217526856658785e-08, + "loss": 0.5984, + "step": 28323 + }, + { + "epoch": 0.98, + "learning_rate": 1.7153717448160634e-08, + "loss": 0.5916, + "step": 28324 + }, + { + "epoch": 0.98, + "learning_rate": 1.7090026398933756e-08, + "loss": 0.6907, + "step": 28325 + }, + { + "epoch": 0.98, + "learning_rate": 1.7026453709734216e-08, + "loss": 0.6716, + "step": 28326 + }, + { + "epoch": 0.98, + "learning_rate": 1.6962999381313627e-08, + "loss": 0.5919, + "step": 28327 + }, + { + "epoch": 0.98, + "learning_rate": 1.6899663414424727e-08, + "loss": 0.6743, + "step": 28328 + }, + { + "epoch": 0.98, + "learning_rate": 1.6836445809820244e-08, + "loss": 0.6611, + "step": 28329 + }, + { + "epoch": 0.98, + "learning_rate": 1.677334656824736e-08, + "loss": 0.6144, + "step": 28330 + }, + { + "epoch": 0.98, + "learning_rate": 1.6710365690455475e-08, + "loss": 0.574, + "step": 28331 + }, + { + "epoch": 0.98, + "learning_rate": 1.664750317719177e-08, + "loss": 0.6406, + "step": 28332 + }, + { + "epoch": 0.98, + "learning_rate": 1.65847590292012e-08, + "loss": 0.6129, + "step": 28333 + }, + { + "epoch": 0.98, + "learning_rate": 1.6522133247226514e-08, + "loss": 0.6183, + "step": 28334 + }, + { + "epoch": 0.98, + "learning_rate": 1.645962583201155e-08, + "loss": 0.6566, + "step": 28335 + }, + { + "epoch": 0.98, + "learning_rate": 1.6397236784296834e-08, + "loss": 0.6053, + "step": 28336 + }, + { + "epoch": 0.98, + "learning_rate": 1.633496610482177e-08, + "loss": 0.5867, + "step": 28337 + }, + { + "epoch": 0.98, + "learning_rate": 1.627281379432577e-08, + "loss": 0.62, + "step": 28338 + }, + { + "epoch": 0.98, + "learning_rate": 1.621077985354491e-08, + "loss": 0.6214, + "step": 28339 + }, + { + "epoch": 0.98, + "learning_rate": 1.6148864283214162e-08, + "loss": 0.654, + "step": 28340 + }, + { + "epoch": 0.98, + "learning_rate": 1.6087067084068485e-08, + "loss": 0.5842, + "step": 28341 + }, + { + "epoch": 0.98, + "learning_rate": 1.6025388256840637e-08, + "loss": 0.6561, + "step": 28342 + }, + { + "epoch": 0.98, + "learning_rate": 1.5963827802262244e-08, + "loss": 0.5718, + "step": 28343 + }, + { + "epoch": 0.98, + "learning_rate": 1.590238572106162e-08, + "loss": 0.6059, + "step": 28344 + }, + { + "epoch": 0.98, + "learning_rate": 1.5841062013968178e-08, + "loss": 0.6731, + "step": 28345 + }, + { + "epoch": 0.98, + "learning_rate": 1.5779856681709116e-08, + "loss": 0.6346, + "step": 28346 + }, + { + "epoch": 0.98, + "learning_rate": 1.5718769725010518e-08, + "loss": 0.6199, + "step": 28347 + }, + { + "epoch": 0.98, + "learning_rate": 1.565780114459514e-08, + "loss": 0.6037, + "step": 28348 + }, + { + "epoch": 0.98, + "learning_rate": 1.559695094118796e-08, + "loss": 0.6799, + "step": 28349 + }, + { + "epoch": 0.98, + "learning_rate": 1.55362191155084e-08, + "loss": 0.6496, + "step": 28350 + }, + { + "epoch": 0.98, + "learning_rate": 1.5475605668276992e-08, + "loss": 0.6223, + "step": 28351 + }, + { + "epoch": 0.98, + "learning_rate": 1.541511060021317e-08, + "loss": 0.5902, + "step": 28352 + }, + { + "epoch": 0.98, + "learning_rate": 1.5354733912035237e-08, + "loss": 0.6326, + "step": 28353 + }, + { + "epoch": 0.98, + "learning_rate": 1.529447560445596e-08, + "loss": 0.6131, + "step": 28354 + }, + { + "epoch": 0.98, + "learning_rate": 1.5234335678191435e-08, + "loss": 0.5918, + "step": 28355 + }, + { + "epoch": 0.98, + "learning_rate": 1.5174314133955536e-08, + "loss": 0.6246, + "step": 28356 + }, + { + "epoch": 0.98, + "learning_rate": 1.5114410972457692e-08, + "loss": 0.6214, + "step": 28357 + }, + { + "epoch": 0.98, + "learning_rate": 1.505462619441067e-08, + "loss": 0.6603, + "step": 28358 + }, + { + "epoch": 0.98, + "learning_rate": 1.499495980052168e-08, + "loss": 0.6727, + "step": 28359 + }, + { + "epoch": 0.98, + "learning_rate": 1.4935411791497933e-08, + "loss": 0.6372, + "step": 28360 + }, + { + "epoch": 0.98, + "learning_rate": 1.4875982168046643e-08, + "loss": 0.6553, + "step": 28361 + }, + { + "epoch": 0.98, + "learning_rate": 1.4816670930871691e-08, + "loss": 0.6398, + "step": 28362 + }, + { + "epoch": 0.98, + "learning_rate": 1.4757478080675846e-08, + "loss": 0.6283, + "step": 28363 + }, + { + "epoch": 0.98, + "learning_rate": 1.4698403618162994e-08, + "loss": 0.6309, + "step": 28364 + }, + { + "epoch": 0.98, + "learning_rate": 1.463944754403146e-08, + "loss": 0.5699, + "step": 28365 + }, + { + "epoch": 0.98, + "learning_rate": 1.4580609858979577e-08, + "loss": 0.6547, + "step": 28366 + }, + { + "epoch": 0.98, + "learning_rate": 1.4521890563707896e-08, + "loss": 0.6059, + "step": 28367 + }, + { + "epoch": 0.98, + "learning_rate": 1.4463289658910306e-08, + "loss": 0.6154, + "step": 28368 + }, + { + "epoch": 0.98, + "learning_rate": 1.4404807145281808e-08, + "loss": 0.603, + "step": 28369 + }, + { + "epoch": 0.98, + "learning_rate": 1.4346443023516287e-08, + "loss": 0.6367, + "step": 28370 + }, + { + "epoch": 0.98, + "learning_rate": 1.4288197294305418e-08, + "loss": 0.6105, + "step": 28371 + }, + { + "epoch": 0.98, + "learning_rate": 1.4230069958340865e-08, + "loss": 0.6117, + "step": 28372 + }, + { + "epoch": 0.98, + "learning_rate": 1.4172061016309857e-08, + "loss": 0.6797, + "step": 28373 + }, + { + "epoch": 0.98, + "learning_rate": 1.4114170468901845e-08, + "loss": 0.6099, + "step": 28374 + }, + { + "epoch": 0.98, + "learning_rate": 1.4056398316801833e-08, + "loss": 0.5442, + "step": 28375 + }, + { + "epoch": 0.98, + "learning_rate": 1.3998744560695942e-08, + "loss": 0.5611, + "step": 28376 + }, + { + "epoch": 0.98, + "learning_rate": 1.3941209201268069e-08, + "loss": 0.6712, + "step": 28377 + }, + { + "epoch": 0.98, + "learning_rate": 1.388379223919878e-08, + "loss": 0.6357, + "step": 28378 + }, + { + "epoch": 0.98, + "learning_rate": 1.382649367516975e-08, + "loss": 0.6748, + "step": 28379 + }, + { + "epoch": 0.98, + "learning_rate": 1.3769313509860438e-08, + "loss": 0.6127, + "step": 28380 + }, + { + "epoch": 0.98, + "learning_rate": 1.371225174394808e-08, + "loss": 0.6596, + "step": 28381 + }, + { + "epoch": 0.98, + "learning_rate": 1.36553083781088e-08, + "loss": 0.5797, + "step": 28382 + }, + { + "epoch": 0.98, + "learning_rate": 1.3598483413020947e-08, + "loss": 0.6329, + "step": 28383 + }, + { + "epoch": 0.98, + "learning_rate": 1.3541776849353982e-08, + "loss": 0.6609, + "step": 28384 + }, + { + "epoch": 0.98, + "learning_rate": 1.3485188687782925e-08, + "loss": 0.6355, + "step": 28385 + }, + { + "epoch": 0.98, + "learning_rate": 1.3428718928978346e-08, + "loss": 0.5823, + "step": 28386 + }, + { + "epoch": 0.98, + "learning_rate": 1.3372367573608603e-08, + "loss": 0.6316, + "step": 28387 + }, + { + "epoch": 0.98, + "learning_rate": 1.3316134622343157e-08, + "loss": 0.5929, + "step": 28388 + }, + { + "epoch": 0.98, + "learning_rate": 1.3260020075848145e-08, + "loss": 0.5873, + "step": 28389 + }, + { + "epoch": 0.98, + "learning_rate": 1.320402393478859e-08, + "loss": 0.6726, + "step": 28390 + }, + { + "epoch": 0.98, + "learning_rate": 1.3148146199829515e-08, + "loss": 0.6671, + "step": 28391 + }, + { + "epoch": 0.98, + "learning_rate": 1.3092386871631502e-08, + "loss": 0.6697, + "step": 28392 + }, + { + "epoch": 0.98, + "learning_rate": 1.3036745950857355e-08, + "loss": 0.654, + "step": 28393 + }, + { + "epoch": 0.98, + "learning_rate": 1.2981223438165436e-08, + "loss": 0.592, + "step": 28394 + }, + { + "epoch": 0.98, + "learning_rate": 1.2925819334216327e-08, + "loss": 0.6436, + "step": 28395 + }, + { + "epoch": 0.98, + "learning_rate": 1.287053363966395e-08, + "loss": 0.6043, + "step": 28396 + }, + { + "epoch": 0.98, + "learning_rate": 1.2815366355165559e-08, + "loss": 0.6192, + "step": 28397 + }, + { + "epoch": 0.98, + "learning_rate": 1.2760317481375072e-08, + "loss": 0.6514, + "step": 28398 + }, + { + "epoch": 0.98, + "learning_rate": 1.2705387018944193e-08, + "loss": 0.6532, + "step": 28399 + }, + { + "epoch": 0.98, + "learning_rate": 1.265057496852573e-08, + "loss": 0.6437, + "step": 28400 + }, + { + "epoch": 0.98, + "learning_rate": 1.2595881330768056e-08, + "loss": 0.5935, + "step": 28401 + }, + { + "epoch": 0.98, + "learning_rate": 1.254130610632176e-08, + "loss": 0.6027, + "step": 28402 + }, + { + "epoch": 0.98, + "learning_rate": 1.2486849295830773e-08, + "loss": 0.6469, + "step": 28403 + }, + { + "epoch": 0.98, + "learning_rate": 1.2432510899943461e-08, + "loss": 0.6122, + "step": 28404 + }, + { + "epoch": 0.98, + "learning_rate": 1.2378290919302649e-08, + "loss": 0.6037, + "step": 28405 + }, + { + "epoch": 0.98, + "learning_rate": 1.2324189354552263e-08, + "loss": 0.6983, + "step": 28406 + }, + { + "epoch": 0.98, + "learning_rate": 1.2270206206331791e-08, + "loss": 0.6443, + "step": 28407 + }, + { + "epoch": 0.98, + "learning_rate": 1.2216341475284055e-08, + "loss": 0.5957, + "step": 28408 + }, + { + "epoch": 0.98, + "learning_rate": 1.2162595162045209e-08, + "loss": 0.6354, + "step": 28409 + }, + { + "epoch": 0.98, + "learning_rate": 1.2108967267253636e-08, + "loss": 0.6387, + "step": 28410 + }, + { + "epoch": 0.98, + "learning_rate": 1.2055457791545488e-08, + "loss": 0.6473, + "step": 28411 + }, + { + "epoch": 0.98, + "learning_rate": 1.2002066735554708e-08, + "loss": 0.692, + "step": 28412 + }, + { + "epoch": 0.98, + "learning_rate": 1.1948794099914118e-08, + "loss": 0.6302, + "step": 28413 + }, + { + "epoch": 0.98, + "learning_rate": 1.1895639885254328e-08, + "loss": 0.6444, + "step": 28414 + }, + { + "epoch": 0.98, + "learning_rate": 1.1842604092208166e-08, + "loss": 0.6533, + "step": 28415 + }, + { + "epoch": 0.98, + "learning_rate": 1.1789686721402904e-08, + "loss": 0.5641, + "step": 28416 + }, + { + "epoch": 0.98, + "learning_rate": 1.1736887773465821e-08, + "loss": 0.6041, + "step": 28417 + }, + { + "epoch": 0.98, + "learning_rate": 1.1684207249023083e-08, + "loss": 0.6452, + "step": 28418 + }, + { + "epoch": 0.98, + "learning_rate": 1.1631645148699745e-08, + "loss": 0.6316, + "step": 28419 + }, + { + "epoch": 0.98, + "learning_rate": 1.1579201473117529e-08, + "loss": 0.6548, + "step": 28420 + }, + { + "epoch": 0.98, + "learning_rate": 1.1526876222900384e-08, + "loss": 0.666, + "step": 28421 + }, + { + "epoch": 0.98, + "learning_rate": 1.1474669398667815e-08, + "loss": 0.6517, + "step": 28422 + }, + { + "epoch": 0.98, + "learning_rate": 1.1422581001037104e-08, + "loss": 0.6103, + "step": 28423 + }, + { + "epoch": 0.98, + "learning_rate": 1.1370611030628863e-08, + "loss": 0.6297, + "step": 28424 + }, + { + "epoch": 0.98, + "learning_rate": 1.1318759488057052e-08, + "loss": 0.6349, + "step": 28425 + }, + { + "epoch": 0.98, + "learning_rate": 1.126702637393673e-08, + "loss": 0.601, + "step": 28426 + }, + { + "epoch": 0.98, + "learning_rate": 1.121541168888296e-08, + "loss": 0.6587, + "step": 28427 + }, + { + "epoch": 0.98, + "learning_rate": 1.1163915433505256e-08, + "loss": 0.6372, + "step": 28428 + }, + { + "epoch": 0.98, + "learning_rate": 1.1112537608415353e-08, + "loss": 0.6093, + "step": 28429 + }, + { + "epoch": 0.99, + "learning_rate": 1.1061278214221648e-08, + "loss": 0.6176, + "step": 28430 + }, + { + "epoch": 0.99, + "learning_rate": 1.101013725153366e-08, + "loss": 0.6362, + "step": 28431 + }, + { + "epoch": 0.99, + "learning_rate": 1.0959114720956455e-08, + "loss": 0.6633, + "step": 28432 + }, + { + "epoch": 0.99, + "learning_rate": 1.0908210623095106e-08, + "loss": 0.5725, + "step": 28433 + }, + { + "epoch": 0.99, + "learning_rate": 1.0857424958552465e-08, + "loss": 0.6476, + "step": 28434 + }, + { + "epoch": 0.99, + "learning_rate": 1.0806757727932492e-08, + "loss": 0.6465, + "step": 28435 + }, + { + "epoch": 0.99, + "learning_rate": 1.075620893183471e-08, + "loss": 0.591, + "step": 28436 + }, + { + "epoch": 0.99, + "learning_rate": 1.0705778570857528e-08, + "loss": 0.6364, + "step": 28437 + }, + { + "epoch": 0.99, + "learning_rate": 1.0655466645600465e-08, + "loss": 0.5904, + "step": 28438 + }, + { + "epoch": 0.99, + "learning_rate": 1.0605273156659712e-08, + "loss": 0.6101, + "step": 28439 + }, + { + "epoch": 0.99, + "learning_rate": 1.0555198104629238e-08, + "loss": 0.6134, + "step": 28440 + }, + { + "epoch": 0.99, + "learning_rate": 1.0505241490104124e-08, + "loss": 0.6702, + "step": 28441 + }, + { + "epoch": 0.99, + "learning_rate": 1.0455403313677226e-08, + "loss": 0.6621, + "step": 28442 + }, + { + "epoch": 0.99, + "learning_rate": 1.0405683575936964e-08, + "loss": 0.653, + "step": 28443 + }, + { + "epoch": 0.99, + "learning_rate": 1.0356082277473978e-08, + "loss": 0.6502, + "step": 28444 + }, + { + "epoch": 0.99, + "learning_rate": 1.0306599418877794e-08, + "loss": 0.5884, + "step": 28445 + }, + { + "epoch": 0.99, + "learning_rate": 1.0257235000733502e-08, + "loss": 0.5735, + "step": 28446 + }, + { + "epoch": 0.99, + "learning_rate": 1.0207989023626185e-08, + "loss": 0.6047, + "step": 28447 + }, + { + "epoch": 0.99, + "learning_rate": 1.0158861488140937e-08, + "loss": 0.5816, + "step": 28448 + }, + { + "epoch": 0.99, + "learning_rate": 1.010985239485951e-08, + "loss": 0.6137, + "step": 28449 + }, + { + "epoch": 0.99, + "learning_rate": 1.0060961744362552e-08, + "loss": 0.6513, + "step": 28450 + }, + { + "epoch": 0.99, + "learning_rate": 1.001218953723071e-08, + "loss": 0.5989, + "step": 28451 + }, + { + "epoch": 0.99, + "learning_rate": 9.96353577404241e-09, + "loss": 0.6278, + "step": 28452 + }, + { + "epoch": 0.99, + "learning_rate": 9.915000455372747e-09, + "loss": 0.6385, + "step": 28453 + }, + { + "epoch": 0.99, + "learning_rate": 9.866583581797928e-09, + "loss": 0.6278, + "step": 28454 + }, + { + "epoch": 0.99, + "learning_rate": 9.818285153893048e-09, + "loss": 0.6273, + "step": 28455 + }, + { + "epoch": 0.99, + "learning_rate": 9.77010517223098e-09, + "loss": 0.6738, + "step": 28456 + }, + { + "epoch": 0.99, + "learning_rate": 9.722043637381273e-09, + "loss": 0.6673, + "step": 28457 + }, + { + "epoch": 0.99, + "learning_rate": 9.674100549913468e-09, + "loss": 0.6325, + "step": 28458 + }, + { + "epoch": 0.99, + "learning_rate": 9.62627591039822e-09, + "loss": 0.6233, + "step": 28459 + }, + { + "epoch": 0.99, + "learning_rate": 9.578569719400632e-09, + "loss": 0.691, + "step": 28460 + }, + { + "epoch": 0.99, + "learning_rate": 9.53098197748803e-09, + "loss": 0.6054, + "step": 28461 + }, + { + "epoch": 0.99, + "learning_rate": 9.483512685223294e-09, + "loss": 0.5654, + "step": 28462 + }, + { + "epoch": 0.99, + "learning_rate": 9.436161843169312e-09, + "loss": 0.6365, + "step": 28463 + }, + { + "epoch": 0.99, + "learning_rate": 9.388929451887852e-09, + "loss": 0.6672, + "step": 28464 + }, + { + "epoch": 0.99, + "learning_rate": 9.341815511938467e-09, + "loss": 0.5744, + "step": 28465 + }, + { + "epoch": 0.99, + "learning_rate": 9.294820023880713e-09, + "loss": 0.6426, + "step": 28466 + }, + { + "epoch": 0.99, + "learning_rate": 9.247942988270808e-09, + "loss": 0.6044, + "step": 28467 + }, + { + "epoch": 0.99, + "learning_rate": 9.201184405664976e-09, + "loss": 0.6365, + "step": 28468 + }, + { + "epoch": 0.99, + "learning_rate": 9.154544276617217e-09, + "loss": 0.5471, + "step": 28469 + }, + { + "epoch": 0.99, + "learning_rate": 9.108022601681533e-09, + "loss": 0.6986, + "step": 28470 + }, + { + "epoch": 0.99, + "learning_rate": 9.061619381408593e-09, + "loss": 0.6622, + "step": 28471 + }, + { + "epoch": 0.99, + "learning_rate": 9.01533461634796e-09, + "loss": 0.584, + "step": 28472 + }, + { + "epoch": 0.99, + "learning_rate": 8.969168307050302e-09, + "loss": 0.649, + "step": 28473 + }, + { + "epoch": 0.99, + "learning_rate": 8.923120454060742e-09, + "loss": 0.6319, + "step": 28474 + }, + { + "epoch": 0.99, + "learning_rate": 8.877191057927725e-09, + "loss": 0.5914, + "step": 28475 + }, + { + "epoch": 0.99, + "learning_rate": 8.831380119193045e-09, + "loss": 0.5833, + "step": 28476 + }, + { + "epoch": 0.99, + "learning_rate": 8.785687638401818e-09, + "loss": 0.6956, + "step": 28477 + }, + { + "epoch": 0.99, + "learning_rate": 8.740113616095835e-09, + "loss": 0.5905, + "step": 28478 + }, + { + "epoch": 0.99, + "learning_rate": 8.694658052813554e-09, + "loss": 0.6448, + "step": 28479 + }, + { + "epoch": 0.99, + "learning_rate": 8.649320949096763e-09, + "loss": 0.659, + "step": 28480 + }, + { + "epoch": 0.99, + "learning_rate": 8.604102305480588e-09, + "loss": 0.5929, + "step": 28481 + }, + { + "epoch": 0.99, + "learning_rate": 8.55900212250127e-09, + "loss": 0.6072, + "step": 28482 + }, + { + "epoch": 0.99, + "learning_rate": 8.514020400695044e-09, + "loss": 0.6375, + "step": 28483 + }, + { + "epoch": 0.99, + "learning_rate": 8.469157140593708e-09, + "loss": 0.6021, + "step": 28484 + }, + { + "epoch": 0.99, + "learning_rate": 8.424412342731281e-09, + "loss": 0.7119, + "step": 28485 + }, + { + "epoch": 0.99, + "learning_rate": 8.379786007635116e-09, + "loss": 0.5886, + "step": 28486 + }, + { + "epoch": 0.99, + "learning_rate": 8.33527813583701e-09, + "loss": 0.6677, + "step": 28487 + }, + { + "epoch": 0.99, + "learning_rate": 8.29088872786432e-09, + "loss": 0.6196, + "step": 28488 + }, + { + "epoch": 0.99, + "learning_rate": 8.246617784241073e-09, + "loss": 0.6259, + "step": 28489 + }, + { + "epoch": 0.99, + "learning_rate": 8.202465305494622e-09, + "loss": 0.5653, + "step": 28490 + }, + { + "epoch": 0.99, + "learning_rate": 8.158431292147883e-09, + "loss": 0.6389, + "step": 28491 + }, + { + "epoch": 0.99, + "learning_rate": 8.114515744722663e-09, + "loss": 0.6559, + "step": 28492 + }, + { + "epoch": 0.99, + "learning_rate": 8.070718663739652e-09, + "loss": 0.6219, + "step": 28493 + }, + { + "epoch": 0.99, + "learning_rate": 8.027040049718438e-09, + "loss": 0.6306, + "step": 28494 + }, + { + "epoch": 0.99, + "learning_rate": 7.983479903176384e-09, + "loss": 0.6344, + "step": 28495 + }, + { + "epoch": 0.99, + "learning_rate": 7.940038224629742e-09, + "loss": 0.5985, + "step": 28496 + }, + { + "epoch": 0.99, + "learning_rate": 7.89671501459366e-09, + "loss": 0.6606, + "step": 28497 + }, + { + "epoch": 0.99, + "learning_rate": 7.853510273583276e-09, + "loss": 0.667, + "step": 28498 + }, + { + "epoch": 0.99, + "learning_rate": 7.810424002108185e-09, + "loss": 0.6514, + "step": 28499 + }, + { + "epoch": 0.99, + "learning_rate": 7.767456200681311e-09, + "loss": 0.6523, + "step": 28500 + }, + { + "epoch": 0.99, + "learning_rate": 7.724606869812245e-09, + "loss": 0.6321, + "step": 28501 + }, + { + "epoch": 0.99, + "learning_rate": 7.68187601000725e-09, + "loss": 0.5889, + "step": 28502 + }, + { + "epoch": 0.99, + "learning_rate": 7.639263621774806e-09, + "loss": 0.643, + "step": 28503 + }, + { + "epoch": 0.99, + "learning_rate": 7.596769705618956e-09, + "loss": 0.6249, + "step": 28504 + }, + { + "epoch": 0.99, + "learning_rate": 7.55439426204374e-09, + "loss": 0.6627, + "step": 28505 + }, + { + "epoch": 0.99, + "learning_rate": 7.51213729155098e-09, + "loss": 0.5699, + "step": 28506 + }, + { + "epoch": 0.99, + "learning_rate": 7.469998794643607e-09, + "loss": 0.6144, + "step": 28507 + }, + { + "epoch": 0.99, + "learning_rate": 7.427978771819e-09, + "loss": 0.5973, + "step": 28508 + }, + { + "epoch": 0.99, + "learning_rate": 7.38607722357676e-09, + "loss": 0.6161, + "step": 28509 + }, + { + "epoch": 0.99, + "learning_rate": 7.344294150414266e-09, + "loss": 0.6234, + "step": 28510 + }, + { + "epoch": 0.99, + "learning_rate": 7.302629552824458e-09, + "loss": 0.5813, + "step": 28511 + }, + { + "epoch": 0.99, + "learning_rate": 7.261083431303606e-09, + "loss": 0.6375, + "step": 28512 + }, + { + "epoch": 0.99, + "learning_rate": 7.219655786343538e-09, + "loss": 0.6223, + "step": 28513 + }, + { + "epoch": 0.99, + "learning_rate": 7.178346618434973e-09, + "loss": 0.6338, + "step": 28514 + }, + { + "epoch": 0.99, + "learning_rate": 7.1371559280686285e-09, + "loss": 0.6116, + "step": 28515 + }, + { + "epoch": 0.99, + "learning_rate": 7.096083715731894e-09, + "loss": 0.6955, + "step": 28516 + }, + { + "epoch": 0.99, + "learning_rate": 7.055129981912157e-09, + "loss": 0.5827, + "step": 28517 + }, + { + "epoch": 0.99, + "learning_rate": 7.014294727095694e-09, + "loss": 0.6374, + "step": 28518 + }, + { + "epoch": 0.99, + "learning_rate": 6.9735779517643436e-09, + "loss": 0.6246, + "step": 28519 + }, + { + "epoch": 0.99, + "learning_rate": 6.9329796564043814e-09, + "loss": 0.6136, + "step": 28520 + }, + { + "epoch": 0.99, + "learning_rate": 6.8924998414943155e-09, + "loss": 0.6548, + "step": 28521 + }, + { + "epoch": 0.99, + "learning_rate": 6.8521385075148716e-09, + "loss": 0.6128, + "step": 28522 + }, + { + "epoch": 0.99, + "learning_rate": 6.8118956549445555e-09, + "loss": 0.606, + "step": 28523 + }, + { + "epoch": 0.99, + "learning_rate": 6.771771284261874e-09, + "loss": 0.6236, + "step": 28524 + }, + { + "epoch": 0.99, + "learning_rate": 6.731765395939782e-09, + "loss": 0.696, + "step": 28525 + }, + { + "epoch": 0.99, + "learning_rate": 6.691877990454565e-09, + "loss": 0.6131, + "step": 28526 + }, + { + "epoch": 0.99, + "learning_rate": 6.652109068279178e-09, + "loss": 0.6248, + "step": 28527 + }, + { + "epoch": 0.99, + "learning_rate": 6.612458629885465e-09, + "loss": 0.5928, + "step": 28528 + }, + { + "epoch": 0.99, + "learning_rate": 6.572926675741942e-09, + "loss": 0.6532, + "step": 28529 + }, + { + "epoch": 0.99, + "learning_rate": 6.5335132063171216e-09, + "loss": 0.6587, + "step": 28530 + }, + { + "epoch": 0.99, + "learning_rate": 6.494218222080628e-09, + "loss": 0.6133, + "step": 28531 + }, + { + "epoch": 0.99, + "learning_rate": 6.455041723496536e-09, + "loss": 0.62, + "step": 28532 + }, + { + "epoch": 0.99, + "learning_rate": 6.4159837110300274e-09, + "loss": 0.6456, + "step": 28533 + }, + { + "epoch": 0.99, + "learning_rate": 6.377044185144066e-09, + "loss": 0.7008, + "step": 28534 + }, + { + "epoch": 0.99, + "learning_rate": 6.3382231462993935e-09, + "loss": 0.5842, + "step": 28535 + }, + { + "epoch": 0.99, + "learning_rate": 6.299520594957864e-09, + "loss": 0.6262, + "step": 28536 + }, + { + "epoch": 0.99, + "learning_rate": 6.260936531577999e-09, + "loss": 0.6123, + "step": 28537 + }, + { + "epoch": 0.99, + "learning_rate": 6.2224709566161e-09, + "loss": 0.6397, + "step": 28538 + }, + { + "epoch": 0.99, + "learning_rate": 6.184123870529579e-09, + "loss": 0.5864, + "step": 28539 + }, + { + "epoch": 0.99, + "learning_rate": 6.145895273772517e-09, + "loss": 0.5948, + "step": 28540 + }, + { + "epoch": 0.99, + "learning_rate": 6.107785166797886e-09, + "loss": 0.6085, + "step": 28541 + }, + { + "epoch": 0.99, + "learning_rate": 6.069793550057546e-09, + "loss": 0.6461, + "step": 28542 + }, + { + "epoch": 0.99, + "learning_rate": 6.031920424002247e-09, + "loss": 0.6111, + "step": 28543 + }, + { + "epoch": 0.99, + "learning_rate": 5.994165789081629e-09, + "loss": 0.6773, + "step": 28544 + }, + { + "epoch": 0.99, + "learning_rate": 5.956529645742004e-09, + "loss": 0.6717, + "step": 28545 + }, + { + "epoch": 0.99, + "learning_rate": 5.91901199443079e-09, + "loss": 0.6506, + "step": 28546 + }, + { + "epoch": 0.99, + "learning_rate": 5.881612835590966e-09, + "loss": 0.6277, + "step": 28547 + }, + { + "epoch": 0.99, + "learning_rate": 5.844332169668843e-09, + "loss": 0.6311, + "step": 28548 + }, + { + "epoch": 0.99, + "learning_rate": 5.807169997104067e-09, + "loss": 0.6407, + "step": 28549 + }, + { + "epoch": 0.99, + "learning_rate": 5.770126318338509e-09, + "loss": 0.5476, + "step": 28550 + }, + { + "epoch": 0.99, + "learning_rate": 5.733201133810706e-09, + "loss": 0.6124, + "step": 28551 + }, + { + "epoch": 0.99, + "learning_rate": 5.696394443958087e-09, + "loss": 0.6276, + "step": 28552 + }, + { + "epoch": 0.99, + "learning_rate": 5.6597062492180775e-09, + "loss": 0.6335, + "step": 28553 + }, + { + "epoch": 0.99, + "learning_rate": 5.623136550024777e-09, + "loss": 0.6818, + "step": 28554 + }, + { + "epoch": 0.99, + "learning_rate": 5.586685346812281e-09, + "loss": 0.6185, + "step": 28555 + }, + { + "epoch": 0.99, + "learning_rate": 5.550352640012468e-09, + "loss": 0.5974, + "step": 28556 + }, + { + "epoch": 0.99, + "learning_rate": 5.514138430056104e-09, + "loss": 0.6019, + "step": 28557 + }, + { + "epoch": 0.99, + "learning_rate": 5.478042717373955e-09, + "loss": 0.6146, + "step": 28558 + }, + { + "epoch": 0.99, + "learning_rate": 5.442065502391236e-09, + "loss": 0.6531, + "step": 28559 + }, + { + "epoch": 0.99, + "learning_rate": 5.406206785536494e-09, + "loss": 0.5844, + "step": 28560 + }, + { + "epoch": 0.99, + "learning_rate": 5.370466567234944e-09, + "loss": 0.6434, + "step": 28561 + }, + { + "epoch": 0.99, + "learning_rate": 5.334844847909582e-09, + "loss": 0.6174, + "step": 28562 + }, + { + "epoch": 0.99, + "learning_rate": 5.299341627982291e-09, + "loss": 0.6235, + "step": 28563 + }, + { + "epoch": 0.99, + "learning_rate": 5.263956907876067e-09, + "loss": 0.6161, + "step": 28564 + }, + { + "epoch": 0.99, + "learning_rate": 5.228690688007243e-09, + "loss": 0.6418, + "step": 28565 + }, + { + "epoch": 0.99, + "learning_rate": 5.193542968796594e-09, + "loss": 0.6165, + "step": 28566 + }, + { + "epoch": 0.99, + "learning_rate": 5.158513750660455e-09, + "loss": 0.6049, + "step": 28567 + }, + { + "epoch": 0.99, + "learning_rate": 5.1236030340129365e-09, + "loss": 0.7095, + "step": 28568 + }, + { + "epoch": 0.99, + "learning_rate": 5.088810819269263e-09, + "loss": 0.5931, + "step": 28569 + }, + { + "epoch": 0.99, + "learning_rate": 5.054137106841328e-09, + "loss": 0.6026, + "step": 28570 + }, + { + "epoch": 0.99, + "learning_rate": 5.019581897139913e-09, + "loss": 0.631, + "step": 28571 + }, + { + "epoch": 0.99, + "learning_rate": 4.985145190574692e-09, + "loss": 0.6307, + "step": 28572 + }, + { + "epoch": 0.99, + "learning_rate": 4.950826987555335e-09, + "loss": 0.6616, + "step": 28573 + }, + { + "epoch": 0.99, + "learning_rate": 4.916627288487075e-09, + "loss": 0.6727, + "step": 28574 + }, + { + "epoch": 0.99, + "learning_rate": 4.882546093776252e-09, + "loss": 0.6269, + "step": 28575 + }, + { + "epoch": 0.99, + "learning_rate": 4.84858340382699e-09, + "loss": 0.6522, + "step": 28576 + }, + { + "epoch": 0.99, + "learning_rate": 4.8147392190411865e-09, + "loss": 0.6094, + "step": 28577 + }, + { + "epoch": 0.99, + "learning_rate": 4.7810135398207444e-09, + "loss": 0.6305, + "step": 28578 + }, + { + "epoch": 0.99, + "learning_rate": 4.747406366565344e-09, + "loss": 0.6214, + "step": 28579 + }, + { + "epoch": 0.99, + "learning_rate": 4.7139176996735535e-09, + "loss": 0.6174, + "step": 28580 + }, + { + "epoch": 0.99, + "learning_rate": 4.680547539542834e-09, + "loss": 0.6193, + "step": 28581 + }, + { + "epoch": 0.99, + "learning_rate": 4.647295886568426e-09, + "loss": 0.5999, + "step": 28582 + }, + { + "epoch": 0.99, + "learning_rate": 4.614162741143346e-09, + "loss": 0.6143, + "step": 28583 + }, + { + "epoch": 0.99, + "learning_rate": 4.581148103662836e-09, + "loss": 0.7111, + "step": 28584 + }, + { + "epoch": 0.99, + "learning_rate": 4.548251974516582e-09, + "loss": 0.6237, + "step": 28585 + }, + { + "epoch": 0.99, + "learning_rate": 4.515474354095384e-09, + "loss": 0.6208, + "step": 28586 + }, + { + "epoch": 0.99, + "learning_rate": 4.482815242786709e-09, + "loss": 0.5909, + "step": 28587 + }, + { + "epoch": 0.99, + "learning_rate": 4.4502746409791355e-09, + "loss": 0.6381, + "step": 28588 + }, + { + "epoch": 0.99, + "learning_rate": 4.4178525490590204e-09, + "loss": 0.598, + "step": 28589 + }, + { + "epoch": 0.99, + "learning_rate": 4.385548967408282e-09, + "loss": 0.6797, + "step": 28590 + }, + { + "epoch": 0.99, + "learning_rate": 4.353363896412166e-09, + "loss": 0.6255, + "step": 28591 + }, + { + "epoch": 0.99, + "learning_rate": 4.32129733645148e-09, + "loss": 0.6151, + "step": 28592 + }, + { + "epoch": 0.99, + "learning_rate": 4.28934928790592e-09, + "loss": 0.6652, + "step": 28593 + }, + { + "epoch": 0.99, + "learning_rate": 4.257519751155182e-09, + "loss": 0.6358, + "step": 28594 + }, + { + "epoch": 0.99, + "learning_rate": 4.225808726575631e-09, + "loss": 0.596, + "step": 28595 + }, + { + "epoch": 0.99, + "learning_rate": 4.194216214544744e-09, + "loss": 0.6228, + "step": 28596 + }, + { + "epoch": 0.99, + "learning_rate": 4.162742215435555e-09, + "loss": 0.654, + "step": 28597 + }, + { + "epoch": 0.99, + "learning_rate": 4.131386729622211e-09, + "loss": 0.6188, + "step": 28598 + }, + { + "epoch": 0.99, + "learning_rate": 4.100149757475524e-09, + "loss": 0.6751, + "step": 28599 + }, + { + "epoch": 0.99, + "learning_rate": 4.069031299367421e-09, + "loss": 0.6582, + "step": 28600 + }, + { + "epoch": 0.99, + "learning_rate": 4.0380313556653836e-09, + "loss": 0.5732, + "step": 28601 + }, + { + "epoch": 0.99, + "learning_rate": 4.0071499267368975e-09, + "loss": 0.6465, + "step": 28602 + }, + { + "epoch": 0.99, + "learning_rate": 3.976387012949445e-09, + "loss": 0.6191, + "step": 28603 + }, + { + "epoch": 0.99, + "learning_rate": 3.94574261466607e-09, + "loss": 0.6245, + "step": 28604 + }, + { + "epoch": 0.99, + "learning_rate": 3.915216732252036e-09, + "loss": 0.614, + "step": 28605 + }, + { + "epoch": 0.99, + "learning_rate": 3.8848093660681655e-09, + "loss": 0.5709, + "step": 28606 + }, + { + "epoch": 0.99, + "learning_rate": 3.854520516474169e-09, + "loss": 0.6392, + "step": 28607 + }, + { + "epoch": 0.99, + "learning_rate": 3.824350183829761e-09, + "loss": 0.5395, + "step": 28608 + }, + { + "epoch": 0.99, + "learning_rate": 3.794298368494653e-09, + "loss": 0.675, + "step": 28609 + }, + { + "epoch": 0.99, + "learning_rate": 3.764365070821896e-09, + "loss": 0.692, + "step": 28610 + }, + { + "epoch": 0.99, + "learning_rate": 3.7345502911678714e-09, + "loss": 0.6121, + "step": 28611 + }, + { + "epoch": 0.99, + "learning_rate": 3.7048540298867396e-09, + "loss": 0.5862, + "step": 28612 + }, + { + "epoch": 0.99, + "learning_rate": 3.6752762873304425e-09, + "loss": 0.6142, + "step": 28613 + }, + { + "epoch": 0.99, + "learning_rate": 3.64581706384759e-09, + "loss": 0.6963, + "step": 28614 + }, + { + "epoch": 0.99, + "learning_rate": 3.616476359790122e-09, + "loss": 0.5877, + "step": 28615 + }, + { + "epoch": 0.99, + "learning_rate": 3.587254175505539e-09, + "loss": 0.6714, + "step": 28616 + }, + { + "epoch": 0.99, + "learning_rate": 3.55815051133801e-09, + "loss": 0.6902, + "step": 28617 + }, + { + "epoch": 0.99, + "learning_rate": 3.5291653676350348e-09, + "loss": 0.6493, + "step": 28618 + }, + { + "epoch": 0.99, + "learning_rate": 3.500298744739672e-09, + "loss": 0.6612, + "step": 28619 + }, + { + "epoch": 0.99, + "learning_rate": 3.47155064299276e-09, + "loss": 0.6021, + "step": 28620 + }, + { + "epoch": 0.99, + "learning_rate": 3.4429210627373587e-09, + "loss": 0.6461, + "step": 28621 + }, + { + "epoch": 0.99, + "learning_rate": 3.414410004310975e-09, + "loss": 0.5731, + "step": 28622 + }, + { + "epoch": 0.99, + "learning_rate": 3.3860174680533375e-09, + "loss": 0.5746, + "step": 28623 + }, + { + "epoch": 0.99, + "learning_rate": 3.3577434542997335e-09, + "loss": 0.6081, + "step": 28624 + }, + { + "epoch": 0.99, + "learning_rate": 3.32958796338656e-09, + "loss": 0.623, + "step": 28625 + }, + { + "epoch": 0.99, + "learning_rate": 3.3015509956457746e-09, + "loss": 0.6713, + "step": 28626 + }, + { + "epoch": 0.99, + "learning_rate": 3.273632551411554e-09, + "loss": 0.5934, + "step": 28627 + }, + { + "epoch": 0.99, + "learning_rate": 3.2458326310147447e-09, + "loss": 0.6637, + "step": 28628 + }, + { + "epoch": 0.99, + "learning_rate": 3.2181512347839726e-09, + "loss": 0.6706, + "step": 28629 + }, + { + "epoch": 0.99, + "learning_rate": 3.190588363048974e-09, + "loss": 0.6112, + "step": 28630 + }, + { + "epoch": 0.99, + "learning_rate": 3.1631440161350445e-09, + "loss": 0.5838, + "step": 28631 + }, + { + "epoch": 0.99, + "learning_rate": 3.1358181943674793e-09, + "loss": 0.6212, + "step": 28632 + }, + { + "epoch": 0.99, + "learning_rate": 3.1086108980715735e-09, + "loss": 0.6271, + "step": 28633 + }, + { + "epoch": 0.99, + "learning_rate": 3.081522127569292e-09, + "loss": 0.6253, + "step": 28634 + }, + { + "epoch": 0.99, + "learning_rate": 3.054551883181489e-09, + "loss": 0.6663, + "step": 28635 + }, + { + "epoch": 0.99, + "learning_rate": 3.0277001652279094e-09, + "loss": 0.6728, + "step": 28636 + }, + { + "epoch": 0.99, + "learning_rate": 3.0009669740271865e-09, + "loss": 0.6655, + "step": 28637 + }, + { + "epoch": 0.99, + "learning_rate": 2.9743523098968443e-09, + "loss": 0.608, + "step": 28638 + }, + { + "epoch": 0.99, + "learning_rate": 2.9478561731510758e-09, + "loss": 0.6169, + "step": 28639 + }, + { + "epoch": 0.99, + "learning_rate": 2.921478564106295e-09, + "loss": 0.6687, + "step": 28640 + }, + { + "epoch": 0.99, + "learning_rate": 2.8952194830722535e-09, + "loss": 0.6502, + "step": 28641 + }, + { + "epoch": 0.99, + "learning_rate": 2.869078930362035e-09, + "loss": 0.646, + "step": 28642 + }, + { + "epoch": 0.99, + "learning_rate": 2.8430569062853908e-09, + "loss": 0.6432, + "step": 28643 + }, + { + "epoch": 0.99, + "learning_rate": 2.8171534111509635e-09, + "loss": 0.6218, + "step": 28644 + }, + { + "epoch": 0.99, + "learning_rate": 2.7913684452662848e-09, + "loss": 0.6199, + "step": 28645 + }, + { + "epoch": 0.99, + "learning_rate": 2.7657020089355556e-09, + "loss": 0.6383, + "step": 28646 + }, + { + "epoch": 0.99, + "learning_rate": 2.7401541024640875e-09, + "loss": 0.6576, + "step": 28647 + }, + { + "epoch": 0.99, + "learning_rate": 2.7147247261549714e-09, + "loss": 0.6248, + "step": 28648 + }, + { + "epoch": 0.99, + "learning_rate": 2.6894138803090773e-09, + "loss": 0.6772, + "step": 28649 + }, + { + "epoch": 0.99, + "learning_rate": 2.664221565227276e-09, + "loss": 0.6666, + "step": 28650 + }, + { + "epoch": 0.99, + "learning_rate": 2.6391477812082176e-09, + "loss": 0.6641, + "step": 28651 + }, + { + "epoch": 0.99, + "learning_rate": 2.6141925285483315e-09, + "loss": 0.6788, + "step": 28652 + }, + { + "epoch": 0.99, + "learning_rate": 2.5893558075440474e-09, + "loss": 0.6388, + "step": 28653 + }, + { + "epoch": 0.99, + "learning_rate": 2.5646376184895737e-09, + "loss": 0.6209, + "step": 28654 + }, + { + "epoch": 0.99, + "learning_rate": 2.54003796167801e-09, + "loss": 0.6283, + "step": 28655 + }, + { + "epoch": 0.99, + "learning_rate": 2.515556837400235e-09, + "loss": 0.6351, + "step": 28656 + }, + { + "epoch": 0.99, + "learning_rate": 2.4911942459493467e-09, + "loss": 0.5735, + "step": 28657 + }, + { + "epoch": 0.99, + "learning_rate": 2.4669501876106725e-09, + "loss": 0.5949, + "step": 28658 + }, + { + "epoch": 0.99, + "learning_rate": 2.4428246626739814e-09, + "loss": 0.6183, + "step": 28659 + }, + { + "epoch": 0.99, + "learning_rate": 2.4188176714246005e-09, + "loss": 0.5981, + "step": 28660 + }, + { + "epoch": 0.99, + "learning_rate": 2.3949292141478564e-09, + "loss": 0.6508, + "step": 28661 + }, + { + "epoch": 0.99, + "learning_rate": 2.3711592911246363e-09, + "loss": 0.6371, + "step": 28662 + }, + { + "epoch": 0.99, + "learning_rate": 2.3475079026391566e-09, + "loss": 0.6085, + "step": 28663 + }, + { + "epoch": 0.99, + "learning_rate": 2.3239750489711943e-09, + "loss": 0.6187, + "step": 28664 + }, + { + "epoch": 0.99, + "learning_rate": 2.300560730399415e-09, + "loss": 0.606, + "step": 28665 + }, + { + "epoch": 0.99, + "learning_rate": 2.2772649472024842e-09, + "loss": 0.6011, + "step": 28666 + }, + { + "epoch": 0.99, + "learning_rate": 2.254087699654628e-09, + "loss": 0.6457, + "step": 28667 + }, + { + "epoch": 0.99, + "learning_rate": 2.231028988032291e-09, + "loss": 0.6428, + "step": 28668 + }, + { + "epoch": 0.99, + "learning_rate": 2.2080888126085888e-09, + "loss": 0.6482, + "step": 28669 + }, + { + "epoch": 0.99, + "learning_rate": 2.185267173654415e-09, + "loss": 0.6547, + "step": 28670 + }, + { + "epoch": 0.99, + "learning_rate": 2.162564071441775e-09, + "loss": 0.5887, + "step": 28671 + }, + { + "epoch": 0.99, + "learning_rate": 2.1399795062393424e-09, + "loss": 0.6694, + "step": 28672 + }, + { + "epoch": 0.99, + "learning_rate": 2.117513478314681e-09, + "loss": 0.5973, + "step": 28673 + }, + { + "epoch": 0.99, + "learning_rate": 2.0951659879342447e-09, + "loss": 0.6609, + "step": 28674 + }, + { + "epoch": 0.99, + "learning_rate": 2.072937035363376e-09, + "loss": 0.655, + "step": 28675 + }, + { + "epoch": 0.99, + "learning_rate": 2.0508266208651985e-09, + "loss": 0.6723, + "step": 28676 + }, + { + "epoch": 0.99, + "learning_rate": 2.0288347447017243e-09, + "loss": 0.6416, + "step": 28677 + }, + { + "epoch": 0.99, + "learning_rate": 2.006961407133856e-09, + "loss": 0.6365, + "step": 28678 + }, + { + "epoch": 0.99, + "learning_rate": 1.985206608421386e-09, + "loss": 0.6049, + "step": 28679 + }, + { + "epoch": 0.99, + "learning_rate": 1.963570348821886e-09, + "loss": 0.6399, + "step": 28680 + }, + { + "epoch": 0.99, + "learning_rate": 1.942052628590707e-09, + "loss": 0.693, + "step": 28681 + }, + { + "epoch": 0.99, + "learning_rate": 1.920653447985421e-09, + "loss": 0.6242, + "step": 28682 + }, + { + "epoch": 0.99, + "learning_rate": 1.8993728072580486e-09, + "loss": 0.6172, + "step": 28683 + }, + { + "epoch": 0.99, + "learning_rate": 1.87821070666061e-09, + "loss": 0.5951, + "step": 28684 + }, + { + "epoch": 0.99, + "learning_rate": 1.8571671464451268e-09, + "loss": 0.6157, + "step": 28685 + }, + { + "epoch": 0.99, + "learning_rate": 1.8362421268613984e-09, + "loss": 0.6534, + "step": 28686 + }, + { + "epoch": 0.99, + "learning_rate": 1.8154356481558944e-09, + "loss": 0.6181, + "step": 28687 + }, + { + "epoch": 0.99, + "learning_rate": 1.7947477105761945e-09, + "loss": 0.6849, + "step": 28688 + }, + { + "epoch": 0.99, + "learning_rate": 1.7741783143676583e-09, + "loss": 0.6354, + "step": 28689 + }, + { + "epoch": 0.99, + "learning_rate": 1.7537274597745347e-09, + "loss": 0.6414, + "step": 28690 + }, + { + "epoch": 0.99, + "learning_rate": 1.7333951470377419e-09, + "loss": 0.5934, + "step": 28691 + }, + { + "epoch": 0.99, + "learning_rate": 1.713181376400419e-09, + "loss": 0.6266, + "step": 28692 + }, + { + "epoch": 0.99, + "learning_rate": 1.6930861481001537e-09, + "loss": 0.6248, + "step": 28693 + }, + { + "epoch": 0.99, + "learning_rate": 1.6731094623778644e-09, + "loss": 0.6811, + "step": 28694 + }, + { + "epoch": 0.99, + "learning_rate": 1.6532513194678079e-09, + "loss": 0.6344, + "step": 28695 + }, + { + "epoch": 0.99, + "learning_rate": 1.633511719606462e-09, + "loss": 0.626, + "step": 28696 + }, + { + "epoch": 0.99, + "learning_rate": 1.6138906630280838e-09, + "loss": 0.6582, + "step": 28697 + }, + { + "epoch": 0.99, + "learning_rate": 1.5943881499647095e-09, + "loss": 0.5711, + "step": 28698 + }, + { + "epoch": 0.99, + "learning_rate": 1.5750041806483763e-09, + "loss": 0.6322, + "step": 28699 + }, + { + "epoch": 0.99, + "learning_rate": 1.5557387553077895e-09, + "loss": 0.601, + "step": 28700 + }, + { + "epoch": 0.99, + "learning_rate": 1.536591874172766e-09, + "loss": 0.6372, + "step": 28701 + }, + { + "epoch": 0.99, + "learning_rate": 1.5175635374686804e-09, + "loss": 0.6818, + "step": 28702 + }, + { + "epoch": 0.99, + "learning_rate": 1.4986537454231288e-09, + "loss": 0.5859, + "step": 28703 + }, + { + "epoch": 0.99, + "learning_rate": 1.4798624982581556e-09, + "loss": 0.6722, + "step": 28704 + }, + { + "epoch": 0.99, + "learning_rate": 1.461189796198026e-09, + "loss": 0.5881, + "step": 28705 + }, + { + "epoch": 0.99, + "learning_rate": 1.4426356394636742e-09, + "loss": 0.6628, + "step": 28706 + }, + { + "epoch": 0.99, + "learning_rate": 1.4242000282760349e-09, + "loss": 0.6286, + "step": 28707 + }, + { + "epoch": 0.99, + "learning_rate": 1.4058829628516012e-09, + "loss": 0.6182, + "step": 28708 + }, + { + "epoch": 0.99, + "learning_rate": 1.3876844434090874e-09, + "loss": 0.6701, + "step": 28709 + }, + { + "epoch": 0.99, + "learning_rate": 1.3696044701638766e-09, + "loss": 0.6355, + "step": 28710 + }, + { + "epoch": 0.99, + "learning_rate": 1.351643043330242e-09, + "loss": 0.6449, + "step": 28711 + }, + { + "epoch": 0.99, + "learning_rate": 1.333800163121346e-09, + "loss": 0.6292, + "step": 28712 + }, + { + "epoch": 0.99, + "learning_rate": 1.3160758297481313e-09, + "loss": 0.6979, + "step": 28713 + }, + { + "epoch": 0.99, + "learning_rate": 1.2984700434215403e-09, + "loss": 0.6725, + "step": 28714 + }, + { + "epoch": 0.99, + "learning_rate": 1.2809828043502948e-09, + "loss": 0.6442, + "step": 28715 + }, + { + "epoch": 0.99, + "learning_rate": 1.2636141127420066e-09, + "loss": 0.6123, + "step": 28716 + }, + { + "epoch": 0.99, + "learning_rate": 1.2463639688009565e-09, + "loss": 0.5718, + "step": 28717 + }, + { + "epoch": 1.0, + "learning_rate": 1.2292323727336463e-09, + "loss": 0.6361, + "step": 28718 + }, + { + "epoch": 1.0, + "learning_rate": 1.2122193247410263e-09, + "loss": 0.6426, + "step": 28719 + }, + { + "epoch": 1.0, + "learning_rate": 1.1953248250273775e-09, + "loss": 0.6524, + "step": 28720 + }, + { + "epoch": 1.0, + "learning_rate": 1.1785488737914297e-09, + "loss": 0.6431, + "step": 28721 + }, + { + "epoch": 1.0, + "learning_rate": 1.161891471231913e-09, + "loss": 0.6966, + "step": 28722 + }, + { + "epoch": 1.0, + "learning_rate": 1.145352617546447e-09, + "loss": 0.5618, + "step": 28723 + }, + { + "epoch": 1.0, + "learning_rate": 1.1289323129326513e-09, + "loss": 0.5374, + "step": 28724 + }, + { + "epoch": 1.0, + "learning_rate": 1.1126305575825946e-09, + "loss": 0.6334, + "step": 28725 + }, + { + "epoch": 1.0, + "learning_rate": 1.0964473516916762e-09, + "loss": 0.6645, + "step": 28726 + }, + { + "epoch": 1.0, + "learning_rate": 1.0803826954508544e-09, + "loss": 0.6324, + "step": 28727 + }, + { + "epoch": 1.0, + "learning_rate": 1.0644365890510878e-09, + "loss": 0.599, + "step": 28728 + }, + { + "epoch": 1.0, + "learning_rate": 1.0486090326811138e-09, + "loss": 0.7716, + "step": 28729 + }, + { + "epoch": 1.0, + "learning_rate": 1.0329000265285605e-09, + "loss": 0.6405, + "step": 28730 + }, + { + "epoch": 1.0, + "learning_rate": 1.0173095707799451e-09, + "loss": 0.5958, + "step": 28731 + }, + { + "epoch": 1.0, + "learning_rate": 1.001837665619565e-09, + "loss": 0.6329, + "step": 28732 + }, + { + "epoch": 1.0, + "learning_rate": 9.864843112317169e-10, + "loss": 0.642, + "step": 28733 + }, + { + "epoch": 1.0, + "learning_rate": 9.712495077973671e-10, + "loss": 0.6313, + "step": 28734 + }, + { + "epoch": 1.0, + "learning_rate": 9.561332554974824e-10, + "loss": 0.5864, + "step": 28735 + }, + { + "epoch": 1.0, + "learning_rate": 9.411355545119182e-10, + "loss": 0.6124, + "step": 28736 + }, + { + "epoch": 1.0, + "learning_rate": 9.26256405018311e-10, + "loss": 0.6473, + "step": 28737 + }, + { + "epoch": 1.0, + "learning_rate": 9.114958071920754e-10, + "loss": 0.6214, + "step": 28738 + }, + { + "epoch": 1.0, + "learning_rate": 8.968537612097372e-10, + "loss": 0.664, + "step": 28739 + }, + { + "epoch": 1.0, + "learning_rate": 8.823302672433809e-10, + "loss": 0.6402, + "step": 28740 + }, + { + "epoch": 1.0, + "learning_rate": 8.679253254673114e-10, + "loss": 0.6387, + "step": 28741 + }, + { + "epoch": 1.0, + "learning_rate": 8.536389360491726e-10, + "loss": 0.5808, + "step": 28742 + }, + { + "epoch": 1.0, + "learning_rate": 8.394710991610489e-10, + "loss": 0.5806, + "step": 28743 + }, + { + "epoch": 1.0, + "learning_rate": 8.25421814970584e-10, + "loss": 0.5862, + "step": 28744 + }, + { + "epoch": 1.0, + "learning_rate": 8.114910836432011e-10, + "loss": 0.6365, + "step": 28745 + }, + { + "epoch": 1.0, + "learning_rate": 7.976789053443235e-10, + "loss": 0.611, + "step": 28746 + }, + { + "epoch": 1.0, + "learning_rate": 7.839852802382642e-10, + "loss": 0.6484, + "step": 28747 + }, + { + "epoch": 1.0, + "learning_rate": 7.704102084871156e-10, + "loss": 0.6471, + "step": 28748 + }, + { + "epoch": 1.0, + "learning_rate": 7.569536902518604e-10, + "loss": 0.6016, + "step": 28749 + }, + { + "epoch": 1.0, + "learning_rate": 7.436157256912602e-10, + "loss": 0.6156, + "step": 28750 + }, + { + "epoch": 1.0, + "learning_rate": 7.303963149651872e-10, + "loss": 0.6755, + "step": 28751 + }, + { + "epoch": 1.0, + "learning_rate": 7.172954582290725e-10, + "loss": 0.6814, + "step": 28752 + }, + { + "epoch": 1.0, + "learning_rate": 7.043131556383476e-10, + "loss": 0.5977, + "step": 28753 + }, + { + "epoch": 1.0, + "learning_rate": 6.914494073484435e-10, + "loss": 0.5721, + "step": 28754 + }, + { + "epoch": 1.0, + "learning_rate": 6.787042135092403e-10, + "loss": 0.6453, + "step": 28755 + }, + { + "epoch": 1.0, + "learning_rate": 6.660775742739489e-10, + "loss": 0.6442, + "step": 28756 + }, + { + "epoch": 1.0, + "learning_rate": 6.535694897913392e-10, + "loss": 0.6279, + "step": 28757 + }, + { + "epoch": 1.0, + "learning_rate": 6.411799602090707e-10, + "loss": 0.6535, + "step": 28758 + }, + { + "epoch": 1.0, + "learning_rate": 6.289089856759135e-10, + "loss": 0.6782, + "step": 28759 + }, + { + "epoch": 1.0, + "learning_rate": 6.167565663361963e-10, + "loss": 0.5885, + "step": 28760 + }, + { + "epoch": 1.0, + "learning_rate": 6.047227023331381e-10, + "loss": 0.6498, + "step": 28761 + }, + { + "epoch": 1.0, + "learning_rate": 5.928073938110679e-10, + "loss": 0.6681, + "step": 28762 + }, + { + "epoch": 1.0, + "learning_rate": 5.810106409109839e-10, + "loss": 0.6478, + "step": 28763 + }, + { + "epoch": 1.0, + "learning_rate": 5.693324437716641e-10, + "loss": 0.6136, + "step": 28764 + }, + { + "epoch": 1.0, + "learning_rate": 5.577728025329965e-10, + "loss": 0.5998, + "step": 28765 + }, + { + "epoch": 1.0, + "learning_rate": 5.463317173304284e-10, + "loss": 0.6426, + "step": 28766 + }, + { + "epoch": 1.0, + "learning_rate": 5.350091883016273e-10, + "loss": 0.6322, + "step": 28767 + }, + { + "epoch": 1.0, + "learning_rate": 5.238052155787099e-10, + "loss": 0.5805, + "step": 28768 + }, + { + "epoch": 1.0, + "learning_rate": 5.127197992960132e-10, + "loss": 0.5958, + "step": 28769 + }, + { + "epoch": 1.0, + "learning_rate": 5.017529395845433e-10, + "loss": 0.6706, + "step": 28770 + }, + { + "epoch": 1.0, + "learning_rate": 4.909046365730863e-10, + "loss": 0.5906, + "step": 28771 + }, + { + "epoch": 1.0, + "learning_rate": 4.801748903926484e-10, + "loss": 0.6555, + "step": 28772 + }, + { + "epoch": 1.0, + "learning_rate": 4.695637011686848e-10, + "loss": 0.6681, + "step": 28773 + }, + { + "epoch": 1.0, + "learning_rate": 4.590710690277611e-10, + "loss": 0.6782, + "step": 28774 + }, + { + "epoch": 1.0, + "learning_rate": 4.4869699409311187e-10, + "loss": 0.6125, + "step": 28775 + }, + { + "epoch": 1.0, + "learning_rate": 4.384414764901923e-10, + "loss": 0.6571, + "step": 28776 + }, + { + "epoch": 1.0, + "learning_rate": 4.2830451633779637e-10, + "loss": 0.6149, + "step": 28777 + }, + { + "epoch": 1.0, + "learning_rate": 4.182861137580485e-10, + "loss": 0.6139, + "step": 28778 + }, + { + "epoch": 1.0, + "learning_rate": 4.083862688686324e-10, + "loss": 0.6196, + "step": 28779 + }, + { + "epoch": 1.0, + "learning_rate": 3.986049817872317e-10, + "loss": 0.6527, + "step": 28780 + }, + { + "epoch": 1.0, + "learning_rate": 3.8894225263041987e-10, + "loss": 0.6965, + "step": 28781 + }, + { + "epoch": 1.0, + "learning_rate": 3.793980815125498e-10, + "loss": 0.5885, + "step": 28782 + }, + { + "epoch": 1.0, + "learning_rate": 3.69972468545754e-10, + "loss": 0.6283, + "step": 28783 + }, + { + "epoch": 1.0, + "learning_rate": 3.6066541384327524e-10, + "loss": 0.6303, + "step": 28784 + }, + { + "epoch": 1.0, + "learning_rate": 3.5147691751391543e-10, + "loss": 0.6404, + "step": 28785 + }, + { + "epoch": 1.0, + "learning_rate": 3.424069796675866e-10, + "loss": 0.6848, + "step": 28786 + }, + { + "epoch": 1.0, + "learning_rate": 3.3345560041198046e-10, + "loss": 0.6464, + "step": 28787 + }, + { + "epoch": 1.0, + "learning_rate": 3.2462277985256807e-10, + "loss": 0.6492, + "step": 28788 + }, + { + "epoch": 1.0, + "learning_rate": 3.159085180948207e-10, + "loss": 0.6338, + "step": 28789 + }, + { + "epoch": 1.0, + "learning_rate": 3.073128152419891e-10, + "loss": 0.6349, + "step": 28790 + }, + { + "epoch": 1.0, + "learning_rate": 2.988356713951035e-10, + "loss": 0.6242, + "step": 28791 + }, + { + "epoch": 1.0, + "learning_rate": 2.9047708665519425e-10, + "loss": 0.6125, + "step": 28792 + }, + { + "epoch": 1.0, + "learning_rate": 2.822370611210712e-10, + "loss": 0.5709, + "step": 28793 + }, + { + "epoch": 1.0, + "learning_rate": 2.7411559489043393e-10, + "loss": 0.667, + "step": 28794 + }, + { + "epoch": 1.0, + "learning_rate": 2.661126880609821e-10, + "loss": 0.625, + "step": 28795 + }, + { + "epoch": 1.0, + "learning_rate": 2.582283407259745e-10, + "loss": 0.6663, + "step": 28796 + }, + { + "epoch": 1.0, + "learning_rate": 2.5046255297977993e-10, + "loss": 0.6069, + "step": 28797 + }, + { + "epoch": 1.0, + "learning_rate": 2.4281532491343685e-10, + "loss": 0.6668, + "step": 28798 + }, + { + "epoch": 1.0, + "learning_rate": 2.3528665661909367e-10, + "loss": 0.6523, + "step": 28799 + }, + { + "epoch": 1.0, + "learning_rate": 2.2787654818445804e-10, + "loss": 0.6314, + "step": 28800 + }, + { + "epoch": 1.0, + "learning_rate": 2.205849996983478e-10, + "loss": 0.6234, + "step": 28801 + }, + { + "epoch": 1.0, + "learning_rate": 2.134120112462501e-10, + "loss": 0.6408, + "step": 28802 + }, + { + "epoch": 1.0, + "learning_rate": 2.0635758291476238e-10, + "loss": 0.5751, + "step": 28803 + }, + { + "epoch": 1.0, + "learning_rate": 1.9942171478715134e-10, + "loss": 0.5748, + "step": 28804 + }, + { + "epoch": 1.0, + "learning_rate": 1.9260440694446325e-10, + "loss": 0.6396, + "step": 28805 + }, + { + "epoch": 1.0, + "learning_rate": 1.8590565946885465e-10, + "loss": 0.6516, + "step": 28806 + }, + { + "epoch": 1.0, + "learning_rate": 1.793254724380411e-10, + "loss": 0.6594, + "step": 28807 + }, + { + "epoch": 1.0, + "learning_rate": 1.728638459319587e-10, + "loss": 0.6384, + "step": 28808 + }, + { + "epoch": 1.0, + "learning_rate": 1.6652078002721284e-10, + "loss": 0.6512, + "step": 28809 + }, + { + "epoch": 1.0, + "learning_rate": 1.602962747970782e-10, + "loss": 0.6262, + "step": 28810 + }, + { + "epoch": 1.0, + "learning_rate": 1.5419033031705e-10, + "loss": 0.6943, + "step": 28811 + }, + { + "epoch": 1.0, + "learning_rate": 1.4820294665818247e-10, + "loss": 0.7248, + "step": 28812 + }, + { + "epoch": 1.0, + "learning_rate": 1.4233412389264012e-10, + "loss": 0.6348, + "step": 28813 + }, + { + "epoch": 1.0, + "learning_rate": 1.36583862090367e-10, + "loss": 0.6072, + "step": 28814 + }, + { + "epoch": 1.0, + "learning_rate": 1.309521613179765e-10, + "loss": 0.5981, + "step": 28815 + }, + { + "epoch": 1.0, + "learning_rate": 1.254390216431922e-10, + "loss": 0.593, + "step": 28816 + }, + { + "epoch": 1.0, + "learning_rate": 1.2004444313151732e-10, + "loss": 0.638, + "step": 28817 + }, + { + "epoch": 1.0, + "learning_rate": 1.1476842584623448e-10, + "loss": 0.6279, + "step": 28818 + }, + { + "epoch": 1.0, + "learning_rate": 1.0961096985062647e-10, + "loss": 0.655, + "step": 28819 + }, + { + "epoch": 1.0, + "learning_rate": 1.0457207520575551e-10, + "loss": 0.5785, + "step": 28820 + }, + { + "epoch": 1.0, + "learning_rate": 9.965174197046346e-11, + "loss": 0.6772, + "step": 28821 + }, + { + "epoch": 1.0, + "learning_rate": 9.48499702035921e-11, + "loss": 0.6137, + "step": 28822 + }, + { + "epoch": 1.0, + "learning_rate": 9.016675996287305e-11, + "loss": 0.6692, + "step": 28823 + }, + { + "epoch": 1.0, + "learning_rate": 8.560211130270724e-11, + "loss": 0.662, + "step": 28824 + }, + { + "epoch": 1.0, + "learning_rate": 8.11560242786058e-11, + "loss": 0.6618, + "step": 28825 + }, + { + "epoch": 1.0, + "learning_rate": 7.682849894163902e-11, + "loss": 0.6765, + "step": 28826 + }, + { + "epoch": 1.0, + "learning_rate": 7.261953534398736e-11, + "loss": 0.6334, + "step": 28827 + }, + { + "epoch": 1.0, + "learning_rate": 6.852913353450063e-11, + "loss": 0.6774, + "step": 28828 + }, + { + "epoch": 1.0, + "learning_rate": 6.455729356424911e-11, + "loss": 0.6406, + "step": 28829 + }, + { + "epoch": 1.0, + "learning_rate": 6.070401547764171e-11, + "loss": 0.6408, + "step": 28830 + }, + { + "epoch": 1.0, + "learning_rate": 5.696929932130779e-11, + "loss": 0.6537, + "step": 28831 + }, + { + "epoch": 1.0, + "learning_rate": 5.3353145139656284e-11, + "loss": 0.6322, + "step": 28832 + }, + { + "epoch": 1.0, + "learning_rate": 4.9855552975985875e-11, + "loss": 0.669, + "step": 28833 + }, + { + "epoch": 1.0, + "learning_rate": 4.6476522870264605e-11, + "loss": 0.6104, + "step": 28834 + }, + { + "epoch": 1.0, + "learning_rate": 4.3216054864680946e-11, + "loss": 0.6696, + "step": 28835 + }, + { + "epoch": 1.0, + "learning_rate": 4.0074148995872254e-11, + "loss": 0.6365, + "step": 28836 + }, + { + "epoch": 1.0, + "learning_rate": 3.705080530269634e-11, + "loss": 0.657, + "step": 28837 + }, + { + "epoch": 1.0, + "learning_rate": 3.414602382068033e-11, + "loss": 0.66, + "step": 28838 + }, + { + "epoch": 1.0, + "learning_rate": 3.1359804583130924e-11, + "loss": 0.5967, + "step": 28839 + }, + { + "epoch": 1.0, + "learning_rate": 2.8692147623354817e-11, + "loss": 0.5877, + "step": 28840 + }, + { + "epoch": 1.0, + "learning_rate": 2.614305297465869e-11, + "loss": 0.6345, + "step": 28841 + }, + { + "epoch": 1.0, + "learning_rate": 2.3712520664798123e-11, + "loss": 0.6491, + "step": 28842 + }, + { + "epoch": 1.0, + "learning_rate": 2.140055072485936e-11, + "loss": 0.6044, + "step": 28843 + }, + { + "epoch": 1.0, + "learning_rate": 1.9207143181487752e-11, + "loss": 0.608, + "step": 28844 + }, + { + "epoch": 1.0, + "learning_rate": 1.713229805910821e-11, + "loss": 0.6408, + "step": 28845 + }, + { + "epoch": 1.0, + "learning_rate": 1.5176015384366083e-11, + "loss": 0.6499, + "step": 28846 + }, + { + "epoch": 1.0, + "learning_rate": 1.3338295180576055e-11, + "loss": 0.6278, + "step": 28847 + }, + { + "epoch": 1.0, + "learning_rate": 1.1619137467722142e-11, + "loss": 0.6448, + "step": 28848 + }, + { + "epoch": 1.0, + "learning_rate": 1.0018542268008801e-11, + "loss": 0.6321, + "step": 28849 + }, + { + "epoch": 1.0, + "learning_rate": 8.536509598089383e-12, + "loss": 0.6547, + "step": 28850 + }, + { + "epoch": 1.0, + "learning_rate": 7.1730394790581194e-12, + "loss": 0.6632, + "step": 28851 + }, + { + "epoch": 1.0, + "learning_rate": 5.928131923127467e-12, + "loss": 0.6338, + "step": 28852 + }, + { + "epoch": 1.0, + "learning_rate": 4.801786948060994e-12, + "loss": 0.6432, + "step": 28853 + }, + { + "epoch": 1.0, + "learning_rate": 3.794004566071152e-12, + "loss": 0.5524, + "step": 28854 + }, + { + "epoch": 1.0, + "learning_rate": 2.9047847893703963e-12, + "loss": 0.664, + "step": 28855 + }, + { + "epoch": 1.0, + "learning_rate": 2.1341276268405097e-12, + "loss": 0.5892, + "step": 28856 + }, + { + "epoch": 1.0, + "learning_rate": 1.4820330906939462e-12, + "loss": 0.6121, + "step": 28857 + }, + { + "epoch": 1.0, + "learning_rate": 9.485011864818206e-13, + "loss": 0.6341, + "step": 28858 + }, + { + "epoch": 1.0, + "learning_rate": 5.33531920865471e-13, + "loss": 0.6557, + "step": 28859 + }, + { + "epoch": 1.0, + "learning_rate": 2.371252993960127e-13, + "loss": 0.5615, + "step": 28860 + }, + { + "epoch": 1.0, + "eval_loss": 0.5751461982727051, + "eval_runtime": 4924.422, + "eval_samples_per_second": 112.021, + "eval_steps_per_second": 37.341, + "step": 28860 + }, + { + "epoch": 1.0, + "learning_rate": 5.928132540411468e-14, + "loss": 0.6164, + "step": 28861 + }, + { + "epoch": 1.0, + "learning_rate": 0.0, + "loss": 0.599, + "step": 28862 + }, + { + "epoch": 1.0, + "step": 28862, + "total_flos": 1.3321809067702747e+19, + "train_loss": 0.6358378202117544, + "train_runtime": 173828.4743, + "train_samples_per_second": 23.91, + "train_steps_per_second": 0.166 + } + ], + "logging_steps": 1.0, + "max_steps": 28862, + "num_train_epochs": 1, + "save_steps": 5772, + "total_flos": 1.3321809067702747e+19, + "trial_name": null, + "trial_params": null +}